Files
lammps/lib/kokkos/algorithms/unit_tests/TestStdAlgorithmsTeamTransformReduce.cpp
2024-09-11 09:20:36 -06:00

324 lines
11 KiB
C++

//@HEADER
// ************************************************************************
//
// Kokkos v. 4.0
// Copyright (2022) National Technology & Engineering
// Solutions of Sandia, LLC (NTESS).
//
// Under the terms of Contract DE-NA0003525 with NTESS,
// the U.S. Government retains certain rights in this software.
//
// Part of Kokkos, under the Apache License v2.0 with LLVM Exceptions.
// See https://kokkos.org/LICENSE for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//@HEADER
#include <TestStdAlgorithmsCommon.hpp>
#ifndef KOKKOS_ENABLE_OPENMPTARGET
namespace Test {
namespace stdalgos {
namespace TeamTransformReduce {
namespace KE = Kokkos::Experimental;
template <class ValueType>
struct PlusFunctor {
KOKKOS_INLINE_FUNCTION
ValueType operator()(const ValueType& lhs, const ValueType& rhs) const {
return lhs + rhs;
}
};
template <class ValueType>
struct MultipliesFunctor {
KOKKOS_INLINE_FUNCTION
ValueType operator()(const ValueType& lhs, const ValueType& rhs) const {
return lhs * rhs;
}
};
template <class ValueType>
struct PlusOneFunctor {
KOKKOS_INLINE_FUNCTION
ValueType operator()(const ValueType& val) const { return val + 1; };
};
template <class FirstDataViewType, class SecondDataViewType,
class InitValuesViewType, class ResultsViewType,
class IntraTeamSentinelView, class BinaryJoinerType,
class BinaryTransformType, class UnaryTransformType>
struct TestFunctorA {
FirstDataViewType m_firstDataView;
SecondDataViewType m_secondDataView;
InitValuesViewType m_initValuesView;
ResultsViewType m_resultsView;
IntraTeamSentinelView m_intraTeamSentinelView;
BinaryJoinerType m_binaryJoiner;
BinaryTransformType m_binaryTransform;
UnaryTransformType m_unaryTransform;
int m_apiPick;
TestFunctorA(const FirstDataViewType firstDataView,
const SecondDataViewType secondDataview,
const InitValuesViewType initValuesView,
const ResultsViewType resultsView,
const IntraTeamSentinelView intraTeamSentinelView,
BinaryJoinerType binaryJoiner,
BinaryTransformType binaryTransform,
UnaryTransformType unaryTransform, int apiPick)
: m_firstDataView(firstDataView),
m_secondDataView(secondDataview),
m_initValuesView(initValuesView),
m_resultsView(resultsView),
m_intraTeamSentinelView(intraTeamSentinelView),
m_binaryJoiner(binaryJoiner),
m_binaryTransform(binaryTransform),
m_unaryTransform(unaryTransform),
m_apiPick(apiPick) {}
template <class MemberType>
KOKKOS_INLINE_FUNCTION void operator()(const MemberType& member) const {
const int rowIndex = member.league_rank();
auto firstDataRow =
Kokkos::subview(m_firstDataView, rowIndex, Kokkos::ALL());
auto firstDataRowBegin = KE::cbegin(firstDataRow);
auto firstDataRowEnd = KE::cend(firstDataRow);
auto secondDataRow =
Kokkos::subview(m_secondDataView, rowIndex, Kokkos::ALL());
auto secondDataRowBegin = KE::cbegin(secondDataRow);
const auto initVal = m_initValuesView(rowIndex);
typename InitValuesViewType::non_const_value_type result = 0;
switch (m_apiPick) {
case 0: {
result =
KE::transform_reduce(member, firstDataRowBegin, firstDataRowEnd,
secondDataRowBegin, initVal);
Kokkos::single(Kokkos::PerTeam(member),
[=, *this]() { m_resultsView(rowIndex) = result; });
break;
}
case 1: {
result =
KE::transform_reduce(member, firstDataRow, secondDataRow, initVal);
Kokkos::single(Kokkos::PerTeam(member),
[=, *this]() { m_resultsView(rowIndex) = result; });
break;
}
case 2: {
result = KE::transform_reduce(
member, firstDataRowBegin, firstDataRowEnd, secondDataRowBegin,
initVal, m_binaryJoiner, m_binaryTransform);
Kokkos::single(Kokkos::PerTeam(member),
[=, *this]() { m_resultsView(rowIndex) = result; });
break;
}
case 3: {
result =
KE::transform_reduce(member, firstDataRow, secondDataRow, initVal,
m_binaryJoiner, m_binaryTransform);
Kokkos::single(Kokkos::PerTeam(member),
[=, *this]() { m_resultsView(rowIndex) = result; });
break;
}
case 4: {
result =
KE::transform_reduce(member, firstDataRowBegin, firstDataRowEnd,
initVal, m_binaryJoiner, m_unaryTransform);
Kokkos::single(Kokkos::PerTeam(member),
[=, *this]() { m_resultsView(rowIndex) = result; });
break;
}
case 5: {
result = KE::transform_reduce(member, firstDataRow, initVal,
m_binaryJoiner, m_unaryTransform);
Kokkos::single(Kokkos::PerTeam(member),
[=, *this]() { m_resultsView(rowIndex) = result; });
break;
}
}
// store result of checking if all members have their local
// values matching the one stored in m_distancesView
member.team_barrier();
const bool intraTeamCheck = team_members_have_matching_result(
member, result, m_resultsView(rowIndex));
Kokkos::single(Kokkos::PerTeam(member), [=, *this]() {
m_intraTeamSentinelView(rowIndex) = intraTeamCheck;
});
}
};
template <class LayoutTag, class ValueType>
void test_A(std::size_t numTeams, std::size_t numCols, int apiId) {
/* description:
use a rank-2 view randomly filled with values,
and run a team-level transform_reduce
*/
// -----------------------------------------------
// prepare data
// -----------------------------------------------
// create a view in the memory space associated with default exespace
// with as many rows as the number of teams and fill it with random
// values from an arbitrary range.
constexpr ValueType lowerBound = 5;
constexpr ValueType upperBound = 523;
const auto bounds = make_bounds(lowerBound, upperBound);
auto [firstDataView, firstDataViewBeforeOp_h] =
create_random_view_and_host_clone(LayoutTag{}, numTeams, numCols, bounds,
"firstDataView");
auto [secondDataView, secondDataViewBeforeOp_h] =
create_random_view_and_host_clone(LayoutTag{}, numTeams, numCols, bounds,
"secondDataView");
// Create view of init values to be used by test cases
Kokkos::View<ValueType*, Kokkos::DefaultHostExecutionSpace> initValuesView_h(
"initValuesView_h", numTeams);
using rand_pool =
Kokkos::Random_XorShift64_Pool<Kokkos::DefaultHostExecutionSpace>;
rand_pool pool(lowerBound * upperBound);
Kokkos::fill_random(initValuesView_h, pool, lowerBound, upperBound);
// -----------------------------------------------
// launch kokkos kernel
// -----------------------------------------------
using space_t = Kokkos::DefaultExecutionSpace;
Kokkos::TeamPolicy<space_t> policy(numTeams, Kokkos::AUTO());
// to verify that things work, each team stores the result of its
// transform_reduce call, and then we check that these match what we expect
Kokkos::View<ValueType*> resultsView("resultsView", numTeams);
// sentinel to check if all members of the team compute the same result
Kokkos::View<bool*> intraTeamSentinelView("intraTeamSameResult", numTeams);
PlusFunctor<ValueType> binaryJoiner;
MultipliesFunctor<ValueType> binaryTransform;
PlusOneFunctor<ValueType> unaryTransform;
// use CTAD for functor
auto initValuesView =
Kokkos::create_mirror_view_and_copy(space_t(), initValuesView_h);
TestFunctorA fnc(firstDataView, secondDataView, initValuesView, resultsView,
intraTeamSentinelView, binaryJoiner, binaryTransform,
unaryTransform, apiId);
Kokkos::parallel_for(policy, fnc);
// -----------------------------------------------
// run cpp-std kernel and check
// -----------------------------------------------
auto resultsView_h = create_host_space_copy(resultsView);
auto intraTeamSentinelView_h = create_host_space_copy(intraTeamSentinelView);
for (std::size_t i = 0; i < firstDataView.extent(0); ++i) {
auto firstDataRow =
Kokkos::subview(firstDataViewBeforeOp_h, i, Kokkos::ALL());
const auto firstDataRowBegin = KE::cbegin(firstDataRow);
const auto firstDataRowEnd = KE::cend(firstDataRow);
auto secondDataRow =
Kokkos::subview(secondDataViewBeforeOp_h, i, Kokkos::ALL());
const auto secondDataRowBegin = KE::cbegin(secondDataRow);
const auto initVal = initValuesView_h(i);
ASSERT_TRUE(intraTeamSentinelView_h(i));
// libstdc++ as provided by GCC 8 does not have reduce, transform_reduce,
// exclusive_scan, inclusive_scan, transform_exclusive_scan,
// transform_inclusive_scan and for GCC 9.1, 9.2 fails to compile them for
// missing overload not accepting policy
#if defined(_GLIBCXX_RELEASE) && (_GLIBCXX_RELEASE <= 9)
#define transform_reduce testing_transform_reduce
#else
#define transform_reduce std::transform_reduce
#endif
switch (apiId) {
case 0:
case 1: {
const auto result = transform_reduce(firstDataRowBegin, firstDataRowEnd,
secondDataRowBegin, initVal);
if constexpr (std::is_floating_point_v<ValueType>) {
EXPECT_FLOAT_EQ(result, resultsView_h(i));
} else {
ASSERT_EQ(result, resultsView_h(i));
}
break;
}
case 2:
case 3: {
const ValueType result = transform_reduce(
firstDataRowBegin, firstDataRowEnd, secondDataRowBegin, initVal,
binaryJoiner, binaryTransform);
if constexpr (std::is_floating_point_v<ValueType>) {
EXPECT_FLOAT_EQ(result, resultsView_h(i));
} else {
ASSERT_EQ(result, resultsView_h(i));
}
break;
}
case 4:
case 5: {
const ValueType result =
transform_reduce(firstDataRowBegin, firstDataRowEnd, initVal,
binaryJoiner, unaryTransform);
if constexpr (std::is_floating_point_v<ValueType>) {
EXPECT_FLOAT_EQ(result, resultsView_h(i));
} else {
ASSERT_EQ(result, resultsView_h(i));
}
break;
}
}
#undef transform_reduce
}
}
template <class LayoutTag, class ValueType>
void run_all_scenarios() {
for (int numTeams : teamSizesToTest) {
for (const auto& numCols : {0, 1, 2, 13, 101, 1444, 8153}) {
for (int apiId : {0, 1, 2, 3, 4, 5}) {
test_A<LayoutTag, ValueType>(numTeams, numCols, apiId);
}
}
}
}
TEST(std_algorithms_transform_reduce_team_test, test) {
run_all_scenarios<DynamicTag, double>();
run_all_scenarios<StridedTwoRowsTag, int>();
run_all_scenarios<StridedThreeRowsTag, unsigned>();
}
} // namespace TeamTransformReduce
} // namespace stdalgos
} // namespace Test
#endif