Files
lammps/lib/kokkos/core/unit_test/TestExecSpacePartitioning.hpp
2023-06-29 10:42:42 -06:00

141 lines
4.1 KiB
C++

//@HEADER
// ************************************************************************
//
// Kokkos v. 4.0
// Copyright (2022) National Technology & Engineering
// Solutions of Sandia, LLC (NTESS).
//
// Under the terms of Contract DE-NA0003525 with NTESS,
// the U.S. Government retains certain rights in this software.
//
// Part of Kokkos, under the Apache License v2.0 with LLVM Exceptions.
// See https://kokkos.org/LICENSE for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//@HEADER
#include <cstdio>
#include <sstream>
#include <iostream>
#include <thread>
#include <Kokkos_Core.hpp>
namespace Test {
namespace {
struct SumFunctor {
KOKKOS_INLINE_FUNCTION
void operator()(int i, int& lsum) const { lsum += i; }
};
template <class ExecSpace>
void check_distinctive(ExecSpace, ExecSpace) {}
#ifdef KOKKOS_ENABLE_CUDA
void check_distinctive(Kokkos::Cuda exec1, Kokkos::Cuda exec2) {
ASSERT_NE(exec1.cuda_stream(), exec2.cuda_stream());
}
#endif
#ifdef KOKKOS_ENABLE_HIP
void check_distinctive(Kokkos::HIP exec1, Kokkos::HIP exec2) {
ASSERT_NE(exec1.hip_stream(), exec2.hip_stream());
}
#endif
#ifdef KOKKOS_ENABLE_SYCL
void check_distinctive(Kokkos::Experimental::SYCL exec1,
Kokkos::Experimental::SYCL exec2) {
ASSERT_NE(*exec1.impl_internal_space_instance()->m_queue,
*exec2.impl_internal_space_instance()->m_queue);
}
#endif
#ifdef KOKKOS_ENABLE_OPENMP
void check_distinctive(Kokkos::OpenMP exec1, Kokkos::OpenMP exec2) {
ASSERT_NE(exec1, exec2);
}
#endif
} // namespace
#ifdef KOKKOS_ENABLE_OPENMP
template <class Lambda1, class Lambda2>
void run_threaded_test(const Lambda1 l1, const Lambda2 l2) {
#pragma omp parallel num_threads(2)
{
if (omp_get_thread_num() == 0) l1();
if (omp_get_thread_num() == 1) l2();
}
}
// We cannot run the multithreaded test when threads or HPX is enabled because
// we cannot launch a thread from inside another thread
#elif !defined(KOKKOS_ENABLE_THREADS) && !defined(KOKKOS_ENABLE_HPX)
template <class Lambda1, class Lambda2>
void run_threaded_test(const Lambda1 l1, const Lambda2 l2) {
std::thread t1(std::move(l1));
std::thread t2(std::move(l2));
t1.join();
t2.join();
}
#else
template <class Lambda1, class Lambda2>
void run_threaded_test(const Lambda1 l1, const Lambda2 l2) {
l1();
l2();
}
#endif
void test_partitioning(std::vector<TEST_EXECSPACE>& instances) {
check_distinctive(instances[0], instances[1]);
int sum1, sum2;
int N = 3910;
run_threaded_test(
[&]() {
Kokkos::parallel_reduce(
Kokkos::RangePolicy<TEST_EXECSPACE>(instances[0], 0, N),
SumFunctor(), sum1);
},
[&]() {
Kokkos::parallel_reduce(
Kokkos::RangePolicy<TEST_EXECSPACE>(instances[1], 0, N),
SumFunctor(), sum2);
});
ASSERT_EQ(sum1, sum2);
ASSERT_EQ(sum1, N * (N - 1) / 2);
#if defined(KOKKOS_ENABLE_CUDA) || defined(KOKKOS_ENABLE_HIP) || \
defined(KOKKOS_ENABLE_SYCL) || defined(KOKKOS_ENABLE_OPENMP)
// Eliminate unused function warning
// (i.e. when compiling for Serial and CUDA, during Serial compilation the
// Cuda overload is unused ...)
if (sum1 != sum2) {
#ifdef KOKKOS_ENABLE_CUDA
check_distinctive(Kokkos::Cuda(), Kokkos::Cuda());
#endif
#ifdef KOKKOS_ENABLE_HIP
check_distinctive(Kokkos::HIP(), Kokkos::HIP());
#endif
#ifdef KOKKOS_ENABLE_SYCL
check_distinctive(Kokkos::Experimental::SYCL(),
Kokkos::Experimental::SYCL());
#endif
#ifdef KOKKOS_ENABLE_OPENMP
check_distinctive(Kokkos::OpenMP(), Kokkos::OpenMP());
#endif
}
#endif
}
TEST(TEST_CATEGORY, partitioning_by_args) {
auto instances =
Kokkos::Experimental::partition_space(TEST_EXECSPACE(), 1, 1);
ASSERT_EQ(int(instances.size()), 2);
test_partitioning(instances);
}
TEST(TEST_CATEGORY, partitioning_by_vector) {
// Make sure we can use a temporary as argument for weights
auto instances = Kokkos::Experimental::partition_space(
TEST_EXECSPACE(), std::vector<int> /*weights*/ {1, 1});
ASSERT_EQ(int(instances.size()), 2);
test_partitioning(instances);
}
} // namespace Test