Skip to content

Commit

Permalink
Merge pull request #438 from kokkos/iamax
Browse files Browse the repository at this point in the history
BLAS IAMAX support
  • Loading branch information
srajama1 authored Jul 30, 2019
2 parents 5765b47 + bf1346d commit 624ee31
Show file tree
Hide file tree
Showing 144 changed files with 11,207 additions and 1 deletion.
4 changes: 4 additions & 0 deletions scripts/generate_specialization.bash
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,10 @@ ${KOKKOSKERNELS_PATH}/scripts/generate_specialization_function.bash axpby Kokkos
${KOKKOSKERNELS_PATH}/scripts/generate_specialization_function.bash dot KokkosBlas1_dot KokkosBlas1_dot_spec.hpp KokkosBlas ${KOKKOSKERNELS_PATH}
${KOKKOSKERNELS_PATH}/scripts/generate_specialization_function.bash dot KokkosBlas1_dot_mv KokkosBlas1_dot_spec.hpp KokkosBlas ${KOKKOSKERNELS_PATH}

#iamax
${KOKKOSKERNELS_PATH}/scripts/generate_specialization_function.bash iamax KokkosBlas1_iamax KokkosBlas1_iamax_spec.hpp KokkosBlas ${KOKKOSKERNELS_PATH}
${KOKKOSKERNELS_PATH}/scripts/generate_specialization_function.bash iamax KokkosBlas1_iamax_mv KokkosBlas1_iamax_spec.hpp KokkosBlas ${KOKKOSKERNELS_PATH}

#mult
${KOKKOSKERNELS_PATH}/scripts/generate_specialization_function.bash mult KokkosBlas1_mult KokkosBlas1_mult_spec.hpp KokkosBlas ${KOKKOSKERNELS_PATH}
${KOKKOSKERNELS_PATH}/scripts/generate_specialization_function.bash mult KokkosBlas1_mult_mv KokkosBlas1_mult_spec.hpp KokkosBlas ${KOKKOSKERNELS_PATH}
Expand Down
163 changes: 163 additions & 0 deletions src/blas/KokkosBlas1_iamax.hpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,163 @@
/*
//@HEADER
// ************************************************************************
//
// KokkosKernels 0.9: Linear Algebra and Graph Kernels
// Copyright 2017 Sandia Corporation
//
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
// the U.S. Government retains certain rights in this software.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// 1. Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
//
// 3. Neither the name of the Corporation nor the names of the
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
// Questions? Contact Siva Rajamanickam (srajama@sandia.gov)
//
// ************************************************************************
//@HEADER
*/

#ifndef KOKKOSBLAS1_IAMAX_HPP_
#define KOKKOSBLAS1_IAMAX_HPP_

#include<KokkosBlas1_iamax_spec.hpp>
#include<KokkosKernels_helpers.hpp>

namespace KokkosBlas {

/// \brief Return the (smallest) index of the element of the maximum magnitude of the vector x.
///
/// \tparam XVector Type of the first vector x; a 1-D Kokkos::View.
///
/// \param x [in] Input 1-D View.
///
/// \return The (smallest) index of the element of the maximum magnitude; a single value.
/// Note: Returned index is 1-based for compatibility with Fortran.
template<class XVector>
typename XVector::size_type iamax (const XVector& x)
{
static_assert (Kokkos::Impl::is_view<XVector>::value,
"KokkosBlas::iamax: XVector must be a Kokkos::View.");
static_assert (XVector::rank == 1, "KokkosBlas::iamax: "
"Both Vector inputs must have rank 1.");

typedef typename XVector::size_type index_type;

typedef Kokkos::View<typename XVector::const_value_type*,
typename KokkosKernels::Impl::GetUnifiedLayout<XVector>::array_layout,
typename XVector::device_type,
Kokkos::MemoryTraits<Kokkos::Unmanaged> > XVector_Internal;

typedef Kokkos::View<index_type,
Kokkos::LayoutLeft,
Kokkos::HostSpace,
Kokkos::MemoryTraits<Kokkos::Unmanaged> > RVector_Internal;

index_type result;
RVector_Internal R = RVector_Internal(&result);
XVector_Internal X = x;

Impl::Iamax<RVector_Internal,XVector_Internal>::iamax (R,X);
Kokkos::fence();
return result;
}

/// \brief R(j) = iamax(X(i,j))
///
/// Replace each entry in R with the (smallest) index of the element of the maximum magnitude of the
/// corresponding entry in X.
///
/// \tparam RMV 0-D or 1-D Kokkos::View specialization.
/// \tparam XMV 1-D or 2-D Kokkos::View specialization.
///
/// Note for TPL cuBLAS: When TPL cuBLAS iamax is used and returns result to a view, RMV must be 0-D view and XMV must be 1-D view.
template<class RV, class XMV>
void
iamax (const RV& R, const XMV& X,
typename std::enable_if<Kokkos::Impl::is_view<RV>::value, int>::type = 0)
{
static_assert (Kokkos::Impl::is_view<RV>::value, "KokkosBlas::iamax: "
"R is not a Kokkos::View.");
static_assert (Kokkos::Impl::is_view<XMV>::value, "KokkosBlas::iamax: "
"X is not a Kokkos::View.");
static_assert (Kokkos::Impl::is_same<typename RV::value_type,
typename RV::non_const_value_type>::value,
"KokkosBlas::iamax: R is const. "
"It must be nonconst, because it is an output argument "
"(we have to be able to write to its entries).");
static_assert (((RV::rank == 0) && (XMV::rank == 1)) ||
((RV::rank == 1) && (XMV::rank == 2)), "KokkosBlas::iamax: "
"RV and XMV must either have rank 0 and 1 or rank 1 and 2.");

typedef typename XMV::size_type index_type;
static_assert (Kokkos::Impl::is_same<typename RV::value_type,
index_type>::value,
"KokkosBlas::iamax: R must have the type of"
"the Xvectors size_type it is an output argument "
"(we have to be able to write to its entries).");

// Check compatibility of dimensions at run time.
if (X.extent(1) != R.extent(0)) {
std::ostringstream os;
os << "KokkosBlas::iamax (MV): Dimensions of R and X do not match: "
<< "R: " << R.extent(0)
<< ", X: " << X.extent(0) << " x " << X.extent(1);
Kokkos::Impl::throw_runtime_exception (os.str ());
}

// Create unmanaged versions of the input Views. RV may be rank 0 or rank 2.
// XMV may be rank 1 or rank 2.
typedef Kokkos::View<
typename std::conditional<
RV::rank == 0,
typename RV::non_const_value_type,
typename RV::non_const_value_type* >::type,
typename KokkosKernels::Impl::GetUnifiedLayout<RV>::array_layout,
typename std::conditional<
std::is_same<typename RV::device_type::memory_space, Kokkos::HostSpace>::value,
Kokkos::HostSpace,
typename RV::device_type >::type,
Kokkos::MemoryTraits<Kokkos::Unmanaged> > RV_Internal;
typedef Kokkos::View<
typename std::conditional<
XMV::rank == 1,
typename XMV::const_value_type*,
typename XMV::const_value_type** >::type,
typename KokkosKernels::Impl::GetUnifiedLayout<XMV>::array_layout,
typename XMV::device_type,
Kokkos::MemoryTraits<Kokkos::Unmanaged> > XMV_Internal;

RV_Internal R_internal = R;
XMV_Internal X_internal = X;

Impl::Iamax<RV_Internal, XMV_Internal>::iamax (R_internal, X_internal);
}

}

#endif // KOKKOSBLAS1_IAMAX_HPP_

Loading

0 comments on commit 624ee31

Please sign in to comment.