Skip to content

Commit

Permalink
#5635: Add test for parallel_scan with return value for ThreadVectorR…
Browse files Browse the repository at this point in the history
…ange
  • Loading branch information
thearusable committed Jul 24, 2023
1 parent 7ee8bbb commit d2a3b91
Showing 1 changed file with 81 additions and 0 deletions.
81 changes: 81 additions & 0 deletions core/unit_test/TestTeamVector.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -605,6 +605,71 @@ struct functor_vec_scan {
}
};

// Temporary: This condition will progressively be reduced when parallel_scan
// with return value will be implemented for more backends.
#if defined(KOKKOS_ENABLE_CUDA)
#if !defined(KOKKOS_ENABLE_HIP) && !defined(KOKKOS_ENABLE_OPENACC) && \
!defined(KOKKOS_ENABLE_SYCL) && !defined(KOKKOS_ENABLE_THREADS) && \
!defined(KOKKOS_ENABLE_OPENMPTARGET) && !defined(KOKKOS_ENABLE_HPX) && \
!defined(KOKKOS_ENABLE_SERIAL) && !defined(KOKKOS_ENABLE_OPENMP)
template <typename Scalar, class ExecutionSpace>
struct functor_vec_scan_ret_val {
using policy_type = Kokkos::TeamPolicy<ExecutionSpace>;
using execution_space = ExecutionSpace;
using view_type = Kokkos::View<Scalar **, execution_space>;

Kokkos::View<int, Kokkos::LayoutLeft, ExecutionSpace> flag;
view_type return_values;
int team_size;

functor_vec_scan_ret_val(
Kokkos::View<int, Kokkos::LayoutLeft, ExecutionSpace> flag_, int nteams,
int tsize)
: flag(flag_), team_size(tsize) {
return_values = view_type("return_values", nteams, tsize);
}

KOKKOS_INLINE_FUNCTION
void operator()(typename policy_type::member_type team) const {
Scalar return_val;

Kokkos::parallel_scan(
Kokkos::ThreadVectorRange(team, 13),
[&](int i, Scalar &val, bool final) {
val += i;

if (final) {
Scalar test = 0;
for (int k = 0; k <= i; k++) test += k;
return_values(team.league_rank(), team.team_rank()) = test;

if (test != val) {
Kokkos::printf("FAILED vector_par_scan %i %i %lf %lf\n",
team.league_rank(), team.team_rank(),
static_cast<double>(test),
static_cast<double>(val));

flag() = 1;
}
}
},
return_val);

if (flag() == 0 &&
return_values(team.league_rank(), team.team_rank()) != return_val) {
Kokkos::printf("FAILED vector_scan_ret_val %i %i %lf %lf\n",
team.league_rank(), team.team_rank(),
static_cast<double>(
return_values(team.league_rank(), team.team_rank())),
static_cast<double>(return_val));

flag() = 1;
}
}
};
#endif
#endif

template <typename Scalar, class ExecutionSpace>
struct functor_reduce {
using value_type = double;
Expand Down Expand Up @@ -676,6 +741,21 @@ bool test_scalar(int nteams, int team_size, int test) {
Kokkos::parallel_for(
"B", Kokkos::TeamPolicy<ExecutionSpace>(nteams, team_size, 8),
functor_vec_single<Scalar, ExecutionSpace>(d_flag, 4, 13));
} else if (test == 12) {
// Temporary: This condition will progressively be reduced when
// parallel_scan
// with return value will be implemented for more backends.
#if defined(KOKKOS_ENABLE_CUDA)
#if !defined(KOKKOS_ENABLE_HIP) && !defined(KOKKOS_ENABLE_OPENACC) && \
!defined(KOKKOS_ENABLE_SYCL) && !defined(KOKKOS_ENABLE_THREADS) && \
!defined(KOKKOS_ENABLE_OPENMPTARGET) && !defined(KOKKOS_ENABLE_HPX) && \
!defined(KOKKOS_ENABLE_SERIAL) && !defined(KOKKOS_ENABLE_OPENMP)
Kokkos::parallel_for(
Kokkos::TeamPolicy<ExecutionSpace>(nteams, team_size, 8),
functor_vec_scan_ret_val<Scalar, ExecutionSpace>(d_flag, nteams,
team_size));
#endif
#endif
}

Kokkos::deep_copy(h_flag, d_flag);
Expand Down Expand Up @@ -965,6 +1045,7 @@ TEST(TEST_CATEGORY, team_vector) {
ASSERT_TRUE((TestTeamVector::Test<TEST_EXECSPACE>(9)));
ASSERT_TRUE((TestTeamVector::Test<TEST_EXECSPACE>(10)));
ASSERT_TRUE((TestTeamVector::Test<TEST_EXECSPACE>(11)));
ASSERT_TRUE((TestTeamVector::Test<TEST_EXECSPACE>(12)));
}
#endif

Expand Down

0 comments on commit d2a3b91

Please sign in to comment.