git-svn-id: svn://svn.icms.temple.edu/lammps-ro/trunk@13583 f3b2605a-c512-4ea7-a41b-209d697bcdaa
This commit is contained in:
81
lib/kokkos/containers/performance_tests/Makefile
Executable file
81
lib/kokkos/containers/performance_tests/Makefile
Executable file
@ -0,0 +1,81 @@
|
||||
# Build and run the Kokkos containers performance tests.
#
# One test executable is produced per enabled back end (Cuda, Threads,
# OpenMP).  Which back ends are enabled is decided by the
# KOKKOS_INTERNAL_USE_* variables, which are expected to come from the
# included Makefile.kokkos.

# Root of the Kokkos source tree, relative to this directory.
KOKKOS_PATH = ../..

# Directory containing the bundled Google Test sources (gtest/gtest-all.cc).
GTEST_PATH = ../../TPL/gtest

# Let the pattern rule below find the test sources.
vpath %.cpp ${KOKKOS_PATH}/containers/performance_tests

# Declared ahead of the include so that it is the first rule make sees and
# therefore the default goal.
default: build_all
	echo "End Build"

include $(KOKKOS_PATH)/Makefile.kokkos

# Tool selection: the CUDA build forces nvcc_wrapper for compiling and linking;
# otherwise the user's CXX/LINK (default g++) are honoured.
ifeq ($(KOKKOS_INTERNAL_USE_CUDA), 1)
  CXX = nvcc_wrapper
  CXXFLAGS ?= -O3
  LINK = $(CXX)
  LDFLAGS ?= -lpthread
else
  CXX ?= g++
  CXXFLAGS ?= -O3
  LINK ?= $(CXX)
  LDFLAGS ?= -lpthread
endif

KOKKOS_CXXFLAGS += -I$(GTEST_PATH) -I${KOKKOS_PATH}/containers/performance_tests

# Executables to build and "run" targets to execute; filled in per back end.
TEST_TARGETS =
TARGETS =

ifeq ($(KOKKOS_INTERNAL_USE_CUDA), 1)
  OBJ_CUDA = TestCuda.o TestMain.o gtest-all.o
  TARGETS += KokkosContainers_PerformanceTest_Cuda
  TEST_TARGETS += test-cuda
endif

ifeq ($(KOKKOS_INTERNAL_USE_PTHREADS), 1)
  OBJ_THREADS = TestThreads.o TestMain.o gtest-all.o
  TARGETS += KokkosContainers_PerformanceTest_Threads
  TEST_TARGETS += test-threads
endif

ifeq ($(KOKKOS_INTERNAL_USE_OPENMP), 1)
  OBJ_OPENMP = TestOpenMP.o TestMain.o gtest-all.o
  TARGETS += KokkosContainers_PerformanceTest_OpenMP
  TEST_TARGETS += test-openmp
endif

# None of these targets produce a file with their own name.  Declaring them
# phony keeps them working even if a file called e.g. "test" or "clean"
# appears in this directory.
.PHONY: default build_all test test-cuda test-threads test-openmp clean

# Link rules, one per back end.
KokkosContainers_PerformanceTest_Cuda: $(OBJ_CUDA) $(KOKKOS_LINK_DEPENDS)
	$(LINK) $(KOKKOS_LDFLAGS) $(LDFLAGS) $(EXTRA_PATH) $(OBJ_CUDA) $(KOKKOS_LIBS) $(LIB) -o KokkosContainers_PerformanceTest_Cuda

KokkosContainers_PerformanceTest_Threads: $(OBJ_THREADS) $(KOKKOS_LINK_DEPENDS)
	$(LINK) $(KOKKOS_LDFLAGS) $(LDFLAGS) $(EXTRA_PATH) $(OBJ_THREADS) $(KOKKOS_LIBS) $(LIB) -o KokkosContainers_PerformanceTest_Threads

KokkosContainers_PerformanceTest_OpenMP: $(OBJ_OPENMP) $(KOKKOS_LINK_DEPENDS)
	$(LINK) $(KOKKOS_LDFLAGS) $(LDFLAGS) $(EXTRA_PATH) $(OBJ_OPENMP) $(KOKKOS_LIBS) $(LIB) -o KokkosContainers_PerformanceTest_OpenMP

# Run rules, one per back end.
test-cuda: KokkosContainers_PerformanceTest_Cuda
	./KokkosContainers_PerformanceTest_Cuda

test-threads: KokkosContainers_PerformanceTest_Threads
	./KokkosContainers_PerformanceTest_Threads

test-openmp: KokkosContainers_PerformanceTest_OpenMP
	./KokkosContainers_PerformanceTest_OpenMP

# Aggregate targets.
build_all: $(TARGETS)

test: $(TEST_TARGETS)

clean: kokkos-clean
	rm -f *.o $(TARGETS)

# Compilation rules

%.o:%.cpp $(KOKKOS_CPP_DEPENDS)
	$(CXX) $(KOKKOS_CPPFLAGS) $(KOKKOS_CXXFLAGS) $(CXXFLAGS) $(EXTRA_INC) -c $<

# Google Test is compiled from its single fused source file.
gtest-all.o:$(GTEST_PATH)/gtest/gtest-all.cc
	$(CXX) $(KOKKOS_CPPFLAGS) $(KOKKOS_CXXFLAGS) $(CXXFLAGS) $(EXTRA_INC) -c $(GTEST_PATH)/gtest/gtest-all.cc
|
||||
|
||||
100
lib/kokkos/containers/performance_tests/TestCuda.cpp
Executable file
100
lib/kokkos/containers/performance_tests/TestCuda.cpp
Executable file
@ -0,0 +1,100 @@
|
||||
/*
|
||||
//@HEADER
|
||||
// ************************************************************************
|
||||
//
|
||||
// Kokkos v. 2.0
|
||||
// Copyright (2014) Sandia Corporation
|
||||
//
|
||||
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
|
||||
// the U.S. Government retains certain rights in this software.
|
||||
//
|
||||
// Redistribution and use in source and binary forms, with or without
|
||||
// modification, are permitted provided that the following conditions are
|
||||
// met:
|
||||
//
|
||||
// 1. Redistributions of source code must retain the above copyright
|
||||
// notice, this list of conditions and the following disclaimer.
|
||||
//
|
||||
// 2. Redistributions in binary form must reproduce the above copyright
|
||||
// notice, this list of conditions and the following disclaimer in the
|
||||
// documentation and/or other materials provided with the distribution.
|
||||
//
|
||||
// 3. Neither the name of the Corporation nor the names of the
|
||||
// contributors may be used to endorse or promote products derived from
|
||||
// this software without specific prior written permission.
|
||||
//
|
||||
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
|
||||
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
||||
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
|
||||
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
//
|
||||
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
|
||||
//
|
||||
// ************************************************************************
|
||||
//@HEADER
|
||||
*/
|
||||
|
||||
#include <stdint.h>
|
||||
#include <string>
|
||||
#include <iostream>
|
||||
#include <iomanip>
|
||||
#include <sstream>
|
||||
#include <fstream>
|
||||
|
||||
#include <gtest/gtest.h>
|
||||
|
||||
#include <Kokkos_Core.hpp>
|
||||
|
||||
#if defined( KOKKOS_HAVE_CUDA )
|
||||
|
||||
#include <Kokkos_UnorderedMap.hpp>
|
||||
|
||||
#include <TestGlobal2LocalIds.hpp>
|
||||
|
||||
#include <TestUnorderedMapPerformance.hpp>
|
||||
|
||||
namespace Performance {
|
||||
|
||||
class cuda : public ::testing::Test {
|
||||
protected:
|
||||
static void SetUpTestCase()
|
||||
{
|
||||
std::cout << std::setprecision(5) << std::scientific;
|
||||
Kokkos::HostSpace::execution_space::initialize();
|
||||
Kokkos::Cuda::initialize( Kokkos::Cuda::SelectDevice(0) );
|
||||
}
|
||||
static void TearDownTestCase()
|
||||
{
|
||||
Kokkos::Cuda::finalize();
|
||||
Kokkos::HostSpace::execution_space::finalize();
|
||||
}
|
||||
};
|
||||
|
||||
// Sweep the global-to-local id test over every problem size from
// begin_id_size to end_id_size (inclusive), multiplying by id_step each time.
// One CSV row is printed per size under the header emitted here.
TEST_F( cuda, global_2_local)
{
  std::cout << "Cuda" << std::endl
            << "size, create, generate, fill, find" << std::endl;

  unsigned num_ids = Performance::begin_id_size;
  while (num_ids <= Performance::end_id_size) {
    test_global_to_local_ids<Kokkos::Cuda>(num_ids);
    num_ids *= Performance::id_step;
  }
}
|
||||
|
||||
// Run the UnorderedMap performance suite on CUDA with the Near=true key
// pattern.  The string is presumably the base name of the result files --
// confirm against Perf::run_performance_tests.
TEST_F( cuda, unordered_map_performance_near)
{
  const std::string base_file_name("cuda-near");
  Perf::run_performance_tests<Kokkos::Cuda,true>(base_file_name);
}
|
||||
|
||||
// Run the UnorderedMap performance suite on CUDA with the Near=false key
// pattern.  The string is presumably the base name of the result files --
// confirm against Perf::run_performance_tests.
TEST_F( cuda, unordered_map_performance_far)
{
  const std::string base_file_name("cuda-far");
  Perf::run_performance_tests<Kokkos::Cuda,false>(base_file_name);
}
|
||||
|
||||
}
|
||||
|
||||
#endif /* #if defined( KOKKOS_HAVE_CUDA ) */
|
||||
231
lib/kokkos/containers/performance_tests/TestGlobal2LocalIds.hpp
Executable file
231
lib/kokkos/containers/performance_tests/TestGlobal2LocalIds.hpp
Executable file
@ -0,0 +1,231 @@
|
||||
//@HEADER
|
||||
// ************************************************************************
|
||||
//
|
||||
// Kokkos v. 2.0
|
||||
// Copyright (2014) Sandia Corporation
|
||||
//
|
||||
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
|
||||
// the U.S. Government retains certain rights in this software.
|
||||
//
|
||||
// Redistribution and use in source and binary forms, with or without
|
||||
// modification, are permitted provided that the following conditions are
|
||||
// met:
|
||||
//
|
||||
// 1. Redistributions of source code must retain the above copyright
|
||||
// notice, this list of conditions and the following disclaimer.
|
||||
//
|
||||
// 2. Redistributions in binary form must reproduce the above copyright
|
||||
// notice, this list of conditions and the following disclaimer in the
|
||||
// documentation and/or other materials provided with the distribution.
|
||||
//
|
||||
// 3. Neither the name of the Corporation nor the names of the
|
||||
// contributors may be used to endorse or promote products derived from
|
||||
// this software without specific prior written permission.
|
||||
//
|
||||
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
|
||||
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
||||
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
|
||||
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
//
|
||||
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
|
||||
//
|
||||
// ************************************************************************
|
||||
//@HEADER
|
||||
|
||||
#ifndef KOKKOS_TEST_GLOBAL_TO_LOCAL_IDS_HPP
|
||||
#define KOKKOS_TEST_GLOBAL_TO_LOCAL_IDS_HPP
|
||||
|
||||
#include <Kokkos_Core.hpp>
|
||||
#include <Kokkos_UnorderedMap.hpp>
|
||||
#include <vector>
|
||||
#include <algorithm>
|
||||
|
||||
#include <impl/Kokkos_Timer.hpp>
|
||||
|
||||
// This test will simulate global ids
|
||||
|
||||
namespace Performance {
|
||||
|
||||
// Problem sizes swept by the global_2_local tests: the id count starts at
// begin_id_size and is multiplied by id_step while it is <= end_id_size.
static unsigned const begin_id_size = 256u;
static unsigned const end_id_size   = 1u << 22;
static unsigned const id_step       = 2u;

// Overlay of one 32-bit word and its four constituent bytes.
union helper
{
  uint32_t word;     // the value viewed as a whole
  uint8_t  byte[4];  // the same storage viewed byte by byte
};
|
||||
|
||||
|
||||
template <typename Device>
|
||||
struct generate_ids
|
||||
{
|
||||
typedef Device execution_space;
|
||||
typedef typename execution_space::size_type size_type;
|
||||
typedef Kokkos::View<uint32_t*,execution_space> local_id_view;
|
||||
|
||||
local_id_view local_2_global;
|
||||
|
||||
generate_ids( local_id_view & ids)
|
||||
: local_2_global(ids)
|
||||
{
|
||||
Kokkos::parallel_for(local_2_global.dimension_0(), *this);
|
||||
}
|
||||
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void operator()(size_type i) const
|
||||
{
|
||||
|
||||
helper x = {static_cast<uint32_t>(i)};
|
||||
|
||||
// shuffle the bytes of i to create a unique, semi-random global_id
|
||||
x.word = ~x.word;
|
||||
|
||||
uint8_t tmp = x.byte[3];
|
||||
x.byte[3] = x.byte[1];
|
||||
x.byte[1] = tmp;
|
||||
|
||||
tmp = x.byte[2];
|
||||
x.byte[2] = x.byte[0];
|
||||
x.byte[0] = tmp;
|
||||
|
||||
local_2_global[i] = x.word;
|
||||
}
|
||||
|
||||
};
|
||||
|
||||
template <typename Device>
|
||||
struct fill_map
|
||||
{
|
||||
typedef Device execution_space;
|
||||
typedef typename execution_space::size_type size_type;
|
||||
typedef Kokkos::View<const uint32_t*,execution_space, Kokkos::MemoryRandomAccess> local_id_view;
|
||||
typedef Kokkos::UnorderedMap<uint32_t,size_type,execution_space> global_id_view;
|
||||
|
||||
global_id_view global_2_local;
|
||||
local_id_view local_2_global;
|
||||
|
||||
fill_map( global_id_view gIds, local_id_view lIds)
|
||||
: global_2_local(gIds) , local_2_global(lIds)
|
||||
{
|
||||
Kokkos::parallel_for(local_2_global.dimension_0(), *this);
|
||||
}
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void operator()(size_type i) const
|
||||
{
|
||||
global_2_local.insert( local_2_global[i], i);
|
||||
}
|
||||
|
||||
};
|
||||
|
||||
template <typename Device>
|
||||
struct find_test
|
||||
{
|
||||
typedef Device execution_space;
|
||||
typedef typename execution_space::size_type size_type;
|
||||
typedef Kokkos::View<const uint32_t*,execution_space, Kokkos::MemoryRandomAccess> local_id_view;
|
||||
typedef Kokkos::UnorderedMap<const uint32_t, const size_type,execution_space> global_id_view;
|
||||
|
||||
global_id_view global_2_local;
|
||||
local_id_view local_2_global;
|
||||
|
||||
typedef size_t value_type;
|
||||
|
||||
find_test( global_id_view gIds, local_id_view lIds, value_type & num_errors)
|
||||
: global_2_local(gIds) , local_2_global(lIds)
|
||||
{
|
||||
Kokkos::parallel_reduce(local_2_global.dimension_0(), *this, num_errors);
|
||||
}
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void init(value_type & v) const
|
||||
{ v = 0; }
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void join(volatile value_type & dst, volatile value_type const & src) const
|
||||
{ dst += src; }
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void operator()(size_type i, value_type & num_errors) const
|
||||
{
|
||||
uint32_t index = global_2_local.find( local_2_global[i] );
|
||||
|
||||
if ( global_2_local.value_at(index) != i) ++num_errors;
|
||||
}
|
||||
|
||||
};
|
||||
|
||||
template <typename Device>
|
||||
void test_global_to_local_ids(unsigned num_ids)
|
||||
{
|
||||
|
||||
typedef Device execution_space;
|
||||
typedef typename execution_space::size_type size_type;
|
||||
|
||||
typedef Kokkos::View<uint32_t*,execution_space> local_id_view;
|
||||
typedef Kokkos::UnorderedMap<uint32_t,size_type,execution_space> global_id_view;
|
||||
|
||||
//size
|
||||
std::cout << num_ids << ", ";
|
||||
|
||||
double elasped_time = 0;
|
||||
Kokkos::Impl::Timer timer;
|
||||
|
||||
local_id_view local_2_global("local_ids", num_ids);
|
||||
global_id_view global_2_local((3u*num_ids)/2u);
|
||||
|
||||
//create
|
||||
elasped_time = timer.seconds();
|
||||
std::cout << elasped_time << ", ";
|
||||
timer.reset();
|
||||
|
||||
// generate unique ids
|
||||
{
|
||||
generate_ids<Device> gen(local_2_global);
|
||||
}
|
||||
Device::fence();
|
||||
// generate
|
||||
elasped_time = timer.seconds();
|
||||
std::cout << elasped_time << ", ";
|
||||
timer.reset();
|
||||
|
||||
{
|
||||
fill_map<Device> fill(global_2_local, local_2_global);
|
||||
}
|
||||
Device::fence();
|
||||
|
||||
// fill
|
||||
elasped_time = timer.seconds();
|
||||
std::cout << elasped_time << ", ";
|
||||
timer.reset();
|
||||
|
||||
|
||||
size_t num_errors = 0;
|
||||
for (int i=0; i<100; ++i)
|
||||
{
|
||||
find_test<Device> find(global_2_local, local_2_global,num_errors);
|
||||
}
|
||||
Device::fence();
|
||||
|
||||
// find
|
||||
elasped_time = timer.seconds();
|
||||
std::cout << elasped_time << std::endl;
|
||||
|
||||
ASSERT_EQ( num_errors, 0u);
|
||||
}
|
||||
|
||||
|
||||
} // namespace Performance
|
||||
|
||||
|
||||
#endif //KOKKOS_TEST_GLOBAL_TO_LOCAL_IDS_HPP
|
||||
|
||||
50
lib/kokkos/containers/performance_tests/TestMain.cpp
Executable file
50
lib/kokkos/containers/performance_tests/TestMain.cpp
Executable file
@ -0,0 +1,50 @@
|
||||
/*
|
||||
//@HEADER
|
||||
// ************************************************************************
|
||||
//
|
||||
// Kokkos v. 2.0
|
||||
// Copyright (2014) Sandia Corporation
|
||||
//
|
||||
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
|
||||
// the U.S. Government retains certain rights in this software.
|
||||
//
|
||||
// Redistribution and use in source and binary forms, with or without
|
||||
// modification, are permitted provided that the following conditions are
|
||||
// met:
|
||||
//
|
||||
// 1. Redistributions of source code must retain the above copyright
|
||||
// notice, this list of conditions and the following disclaimer.
|
||||
//
|
||||
// 2. Redistributions in binary form must reproduce the above copyright
|
||||
// notice, this list of conditions and the following disclaimer in the
|
||||
// documentation and/or other materials provided with the distribution.
|
||||
//
|
||||
// 3. Neither the name of the Corporation nor the names of the
|
||||
// contributors may be used to endorse or promote products derived from
|
||||
// this software without specific prior written permission.
|
||||
//
|
||||
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
|
||||
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
||||
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
|
||||
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
//
|
||||
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
|
||||
//
|
||||
// ************************************************************************
|
||||
//@HEADER
|
||||
*/
|
||||
|
||||
#include <gtest/gtest.h>
|
||||
|
||||
int main(int argc, char *argv[]) {
|
||||
::testing::InitGoogleTest(&argc,argv);
|
||||
return RUN_ALL_TESTS();
|
||||
}
|
||||
|
||||
131
lib/kokkos/containers/performance_tests/TestOpenMP.cpp
Executable file
131
lib/kokkos/containers/performance_tests/TestOpenMP.cpp
Executable file
@ -0,0 +1,131 @@
|
||||
/*
|
||||
//@HEADER
|
||||
// ************************************************************************
|
||||
//
|
||||
// Kokkos v. 2.0
|
||||
// Copyright (2014) Sandia Corporation
|
||||
//
|
||||
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
|
||||
// the U.S. Government retains certain rights in this software.
|
||||
//
|
||||
// Redistribution and use in source and binary forms, with or without
|
||||
// modification, are permitted provided that the following conditions are
|
||||
// met:
|
||||
//
|
||||
// 1. Redistributions of source code must retain the above copyright
|
||||
// notice, this list of conditions and the following disclaimer.
|
||||
//
|
||||
// 2. Redistributions in binary form must reproduce the above copyright
|
||||
// notice, this list of conditions and the following disclaimer in the
|
||||
// documentation and/or other materials provided with the distribution.
|
||||
//
|
||||
// 3. Neither the name of the Corporation nor the names of the
|
||||
// contributors may be used to endorse or promote products derived from
|
||||
// this software without specific prior written permission.
|
||||
//
|
||||
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
|
||||
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
||||
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
|
||||
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
//
|
||||
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
|
||||
//
|
||||
// ************************************************************************
|
||||
//@HEADER
|
||||
*/
|
||||
|
||||
#include <gtest/gtest.h>
|
||||
|
||||
#include <Kokkos_Core.hpp>
|
||||
|
||||
#include <Kokkos_UnorderedMap.hpp>
|
||||
|
||||
#include <TestGlobal2LocalIds.hpp>
|
||||
#include <TestUnorderedMapPerformance.hpp>
|
||||
|
||||
#include <iomanip>
|
||||
#include <sstream>
|
||||
#include <string>
|
||||
#include <fstream>
|
||||
|
||||
|
||||
namespace Performance {
|
||||
|
||||
class openmp : public ::testing::Test {
|
||||
protected:
|
||||
static void SetUpTestCase()
|
||||
{
|
||||
std::cout << std::setprecision(5) << std::scientific;
|
||||
|
||||
unsigned num_threads = 4;
|
||||
|
||||
if (Kokkos::hwloc::available()) {
|
||||
num_threads = Kokkos::hwloc::get_available_numa_count()
|
||||
* Kokkos::hwloc::get_available_cores_per_numa()
|
||||
* Kokkos::hwloc::get_available_threads_per_core()
|
||||
;
|
||||
|
||||
}
|
||||
|
||||
std::cout << "OpenMP: " << num_threads << std::endl;
|
||||
|
||||
Kokkos::OpenMP::initialize( num_threads );
|
||||
|
||||
std::cout << "available threads: " << omp_get_max_threads() << std::endl;
|
||||
}
|
||||
|
||||
static void TearDownTestCase()
|
||||
{
|
||||
Kokkos::OpenMP::finalize();
|
||||
|
||||
omp_set_num_threads(1);
|
||||
|
||||
ASSERT_EQ( 1 , omp_get_max_threads() );
|
||||
}
|
||||
};
|
||||
|
||||
// Sweep the global-to-local id test over every problem size from
// begin_id_size to end_id_size (inclusive), multiplying by id_step each time.
// One CSV row is printed per size under the header emitted here.
TEST_F( openmp, global_2_local)
{
  std::cout << "OpenMP" << std::endl
            << "size, create, generate, fill, find" << std::endl;

  unsigned num_ids = Performance::begin_id_size;
  while (num_ids <= Performance::end_id_size) {
    test_global_to_local_ids<Kokkos::OpenMP>(num_ids);
    num_ids *= Performance::id_step;
  }
}
|
||||
|
||||
// Run the UnorderedMap performance suite on OpenMP with the Near=true key
// pattern.  The run is labelled "openmp-<threads>-near", where <threads> is
// the hwloc-derived thread count (4 when hwloc is unavailable).
TEST_F( openmp, unordered_map_performance_near)
{
  const unsigned num_openmp =
    Kokkos::hwloc::available()
      ? Kokkos::hwloc::get_available_numa_count() *
        Kokkos::hwloc::get_available_cores_per_numa() *
        Kokkos::hwloc::get_available_threads_per_core()
      : 4u;

  std::ostringstream label;
  label << "openmp-" << num_openmp << "-near";

  const std::string base_file_name = label.str();
  Perf::run_performance_tests<Kokkos::OpenMP,true>(base_file_name);
}
|
||||
|
||||
// Run the UnorderedMap performance suite on OpenMP with the Near=false key
// pattern.  The run is labelled "openmp-<threads>-far", where <threads> is
// the hwloc-derived thread count (4 when hwloc is unavailable).
TEST_F( openmp, unordered_map_performance_far)
{
  const unsigned num_openmp =
    Kokkos::hwloc::available()
      ? Kokkos::hwloc::get_available_numa_count() *
        Kokkos::hwloc::get_available_cores_per_numa() *
        Kokkos::hwloc::get_available_threads_per_core()
      : 4u;

  std::ostringstream label;
  label << "openmp-" << num_openmp << "-far";

  const std::string base_file_name = label.str();
  Perf::run_performance_tests<Kokkos::OpenMP,false>(base_file_name);
}
|
||||
|
||||
} // namespace Performance
|
||||
|
||||
126
lib/kokkos/containers/performance_tests/TestThreads.cpp
Executable file
126
lib/kokkos/containers/performance_tests/TestThreads.cpp
Executable file
@ -0,0 +1,126 @@
|
||||
/*
|
||||
//@HEADER
|
||||
// ************************************************************************
|
||||
//
|
||||
// Kokkos v. 2.0
|
||||
// Copyright (2014) Sandia Corporation
|
||||
//
|
||||
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
|
||||
// the U.S. Government retains certain rights in this software.
|
||||
//
|
||||
// Redistribution and use in source and binary forms, with or without
|
||||
// modification, are permitted provided that the following conditions are
|
||||
// met:
|
||||
//
|
||||
// 1. Redistributions of source code must retain the above copyright
|
||||
// notice, this list of conditions and the following disclaimer.
|
||||
//
|
||||
// 2. Redistributions in binary form must reproduce the above copyright
|
||||
// notice, this list of conditions and the following disclaimer in the
|
||||
// documentation and/or other materials provided with the distribution.
|
||||
//
|
||||
// 3. Neither the name of the Corporation nor the names of the
|
||||
// contributors may be used to endorse or promote products derived from
|
||||
// this software without specific prior written permission.
|
||||
//
|
||||
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
|
||||
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
||||
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
|
||||
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
//
|
||||
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
|
||||
//
|
||||
// ************************************************************************
|
||||
//@HEADER
|
||||
*/
|
||||
|
||||
#include <gtest/gtest.h>
|
||||
|
||||
#include <Kokkos_Core.hpp>
|
||||
|
||||
#include <Kokkos_UnorderedMap.hpp>
|
||||
|
||||
#include <iomanip>
|
||||
|
||||
#include <TestGlobal2LocalIds.hpp>
|
||||
#include <TestUnorderedMapPerformance.hpp>
|
||||
|
||||
#include <iomanip>
|
||||
#include <sstream>
|
||||
#include <string>
|
||||
#include <fstream>
|
||||
|
||||
namespace Performance {
|
||||
|
||||
class threads : public ::testing::Test {
|
||||
protected:
|
||||
static void SetUpTestCase()
|
||||
{
|
||||
std::cout << std::setprecision(5) << std::scientific;
|
||||
|
||||
unsigned num_threads = 4;
|
||||
|
||||
if (Kokkos::hwloc::available()) {
|
||||
num_threads = Kokkos::hwloc::get_available_numa_count() *
|
||||
Kokkos::hwloc::get_available_cores_per_numa() *
|
||||
Kokkos::hwloc::get_available_threads_per_core();
|
||||
|
||||
}
|
||||
|
||||
std::cout << "Threads: " << num_threads << std::endl;
|
||||
|
||||
Kokkos::Threads::initialize( num_threads );
|
||||
}
|
||||
|
||||
static void TearDownTestCase()
|
||||
{
|
||||
Kokkos::Threads::finalize();
|
||||
}
|
||||
};
|
||||
|
||||
// Sweep the global-to-local id test over every problem size from
// begin_id_size to end_id_size (inclusive), multiplying by id_step each time.
// One CSV row is printed per size under the header emitted here.
TEST_F( threads, global_2_local)
{
  std::cout << "Threads" << std::endl
            << "size, create, generate, fill, find" << std::endl;

  unsigned num_ids = Performance::begin_id_size;
  while (num_ids <= Performance::end_id_size) {
    test_global_to_local_ids<Kokkos::Threads>(num_ids);
    num_ids *= Performance::id_step;
  }
}
|
||||
|
||||
// Run the UnorderedMap performance suite on Threads with the Near=true key
// pattern.  The run is labelled "threads-<threads>-near", where <threads> is
// the hwloc-derived thread count (4 when hwloc is unavailable).
TEST_F( threads, unordered_map_performance_near)
{
  const unsigned num_threads =
    Kokkos::hwloc::available()
      ? Kokkos::hwloc::get_available_numa_count() *
        Kokkos::hwloc::get_available_cores_per_numa() *
        Kokkos::hwloc::get_available_threads_per_core()
      : 4u;

  std::ostringstream label;
  label << "threads-" << num_threads << "-near";

  const std::string base_file_name = label.str();
  Perf::run_performance_tests<Kokkos::Threads,true>(base_file_name);
}
|
||||
|
||||
// Run the UnorderedMap performance suite on Threads with the Near=false key
// pattern.  The run is labelled "threads-<threads>-far", where <threads> is
// the hwloc-derived thread count (4 when hwloc is unavailable).
TEST_F( threads, unordered_map_performance_far)
{
  const unsigned num_threads =
    Kokkos::hwloc::available()
      ? Kokkos::hwloc::get_available_numa_count() *
        Kokkos::hwloc::get_available_cores_per_numa() *
        Kokkos::hwloc::get_available_threads_per_core()
      : 4u;

  std::ostringstream label;
  label << "threads-" << num_threads << "-far";

  const std::string base_file_name = label.str();
  Perf::run_performance_tests<Kokkos::Threads,false>(base_file_name);
}
|
||||
|
||||
} // namespace Performance
|
||||
|
||||
|
||||
262
lib/kokkos/containers/performance_tests/TestUnorderedMapPerformance.hpp
Executable file
262
lib/kokkos/containers/performance_tests/TestUnorderedMapPerformance.hpp
Executable file
@ -0,0 +1,262 @@
|
||||
//@HEADER
|
||||
// ************************************************************************
|
||||
//
|
||||
// Kokkos v. 2.0
|
||||
// Copyright (2014) Sandia Corporation
|
||||
//
|
||||
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
|
||||
// the U.S. Government retains certain rights in this software.
|
||||
//
|
||||
// Redistribution and use in source and binary forms, with or without
|
||||
// modification, are permitted provided that the following conditions are
|
||||
// met:
|
||||
//
|
||||
// 1. Redistributions of source code must retain the above copyright
|
||||
// notice, this list of conditions and the following disclaimer.
|
||||
//
|
||||
// 2. Redistributions in binary form must reproduce the above copyright
|
||||
// notice, this list of conditions and the following disclaimer in the
|
||||
// documentation and/or other materials provided with the distribution.
|
||||
//
|
||||
// 3. Neither the name of the Corporation nor the names of the
|
||||
// contributors may be used to endorse or promote products derived from
|
||||
// this software without specific prior written permission.
|
||||
//
|
||||
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
|
||||
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
||||
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
|
||||
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
//
|
||||
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
|
||||
//
|
||||
// ************************************************************************
|
||||
//@HEADER
|
||||
|
||||
#ifndef KOKKOS_TEST_UNORDERED_MAP_PERFORMANCE_HPP
|
||||
#define KOKKOS_TEST_UNORDERED_MAP_PERFORMANCE_HPP
|
||||
|
||||
#include <impl/Kokkos_Timer.hpp>
|
||||
|
||||
#include <iostream>
|
||||
#include <iomanip>
|
||||
#include <fstream>
|
||||
#include <string>
|
||||
#include <sstream>
|
||||
|
||||
|
||||
namespace Perf {
|
||||
|
||||
template <typename Device, bool Near>
|
||||
struct UnorderedMapTest
|
||||
{
|
||||
typedef Device execution_space;
|
||||
typedef Kokkos::UnorderedMap<uint32_t, uint32_t, execution_space> map_type;
|
||||
typedef typename map_type::histogram_type histogram_type;
|
||||
|
||||
struct value_type {
|
||||
uint32_t failed_count;
|
||||
uint32_t max_list;
|
||||
};
|
||||
|
||||
uint32_t capacity;
|
||||
uint32_t inserts;
|
||||
uint32_t collisions;
|
||||
double seconds;
|
||||
map_type map;
|
||||
histogram_type histogram;
|
||||
|
||||
UnorderedMapTest( uint32_t arg_capacity, uint32_t arg_inserts, uint32_t arg_collisions)
|
||||
: capacity(arg_capacity)
|
||||
, inserts(arg_inserts)
|
||||
, collisions(arg_collisions)
|
||||
, seconds(0)
|
||||
, map(capacity)
|
||||
, histogram(map.get_histogram())
|
||||
{
|
||||
Kokkos::Impl::Timer wall_clock ;
|
||||
wall_clock.reset();
|
||||
|
||||
value_type v = {};
|
||||
int loop_count = 0;
|
||||
do {
|
||||
++loop_count;
|
||||
|
||||
v = value_type();
|
||||
Kokkos::parallel_reduce(inserts, *this, v);
|
||||
|
||||
if (v.failed_count > 0u) {
|
||||
const uint32_t new_capacity = map.capacity() + ((map.capacity()*3ull)/20u) + v.failed_count/collisions ;
|
||||
map.rehash( new_capacity );
|
||||
}
|
||||
} while (v.failed_count > 0u);
|
||||
|
||||
seconds = wall_clock.seconds();
|
||||
|
||||
switch (loop_count)
|
||||
{
|
||||
case 1u: std::cout << " \033[0;32m" << loop_count << "\033[0m "; break;
|
||||
case 2u: std::cout << " \033[1;31m" << loop_count << "\033[0m "; break;
|
||||
default: std::cout << " \033[0;31m" << loop_count << "\033[0m "; break;
|
||||
}
|
||||
std::cout << std::setprecision(2) << std::fixed << std::setw(5) << (1e9*(seconds/(inserts))) << "; " << std::flush;
|
||||
|
||||
histogram.calculate();
|
||||
Device::fence();
|
||||
}
|
||||
|
||||
void print(std::ostream & metrics_out, std::ostream & length_out, std::ostream & distance_out, std::ostream & block_distance_out)
|
||||
{
|
||||
metrics_out << map.capacity() << " , ";
|
||||
metrics_out << inserts/collisions << " , ";
|
||||
metrics_out << (100.0 * inserts/collisions) / map.capacity() << " , ";
|
||||
metrics_out << inserts << " , ";
|
||||
metrics_out << (map.failed_insert() ? "true" : "false") << " , ";
|
||||
metrics_out << collisions << " , ";
|
||||
metrics_out << 1e9*(seconds/inserts) << " , ";
|
||||
metrics_out << seconds << std::endl;
|
||||
|
||||
length_out << map.capacity() << " , ";
|
||||
length_out << ((100.0 *inserts/collisions) / map.capacity()) << " , ";
|
||||
length_out << collisions << " , ";
|
||||
histogram.print_length(length_out);
|
||||
|
||||
distance_out << map.capacity() << " , ";
|
||||
distance_out << ((100.0 *inserts/collisions) / map.capacity()) << " , ";
|
||||
distance_out << collisions << " , ";
|
||||
histogram.print_distance(distance_out);
|
||||
|
||||
block_distance_out << map.capacity() << " , ";
|
||||
block_distance_out << ((100.0 *inserts/collisions) / map.capacity()) << " , ";
|
||||
block_distance_out << collisions << " , ";
|
||||
histogram.print_block_distance(block_distance_out);
|
||||
}
|
||||
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void init( value_type & v ) const
|
||||
{
|
||||
v.failed_count = 0;
|
||||
v.max_list = 0;
|
||||
}
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void join( volatile value_type & dst, const volatile value_type & src ) const
|
||||
{
|
||||
dst.failed_count += src.failed_count;
|
||||
dst.max_list = src.max_list < dst.max_list ? dst.max_list : src.max_list;
|
||||
}
|
||||
|
||||
KOKKOS_INLINE_FUNCTION
|
||||
void operator()(uint32_t i, value_type & v) const
|
||||
{
|
||||
const uint32_t key = Near ? i/collisions : i%(inserts/collisions);
|
||||
typename map_type::insert_result result = map.insert(key,i);
|
||||
v.failed_count += !result.failed() ? 0 : 1;
|
||||
v.max_list = result.list_position() < v.max_list ? v.max_list : result.list_position();
|
||||
}
|
||||
|
||||
};
|
||||
|
||||
//#define KOKKOS_COLLECT_UNORDERED_MAP_METRICS
|
||||
|
||||
/// Sweeps UnorderedMapTest<Device, Near> over a range of capacities and
/// writes the results to four CSV files.
///
/// The sweep is only compiled when KOKKOS_COLLECT_UNORDERED_MAP_METRICS is
/// defined; otherwise the function just prints "skipping test".
///
/// Output files (when enabled), all derived from `base_file_name`:
///   <base>-metrics.csv         one summary row per test
///   <base>-length.csv          histogram.print_length() per test
///   <base>-distance.csv        histogram.print_distance() per test
///   <base>-block_distance.csv  histogram.print_block_distance() per test
///
/// @param base_file_name  path prefix for the CSV files; unused when the
///                        metrics macro is not defined
template <typename Device, bool Near>
void run_performance_tests(std::string const & base_file_name)
{
#if defined(KOKKOS_COLLECT_UNORDERED_MAP_METRICS)
  const std::string metrics_file_name = base_file_name + std::string("-metrics.csv");
  const std::string length_file_name = base_file_name + std::string("-length.csv");
  const std::string distance_file_name = base_file_name + std::string("-distance.csv");
  const std::string block_distance_file_name = base_file_name + std::string("-block_distance.csv");

  // The streams are closed by their destructors when the function returns.
  std::ofstream metrics_out( metrics_file_name.c_str(), std::ofstream::out );
  std::ofstream length_out( length_file_name.c_str(), std::ofstream::out );
  std::ofstream distance_out( distance_file_name.c_str(), std::ofstream::out );
  std::ofstream block_distance_out( block_distance_file_name.c_str(), std::ofstream::out );

  // Ratio of unique keys to initial capacity.
  // Full sweep, currently disabled:
  //   0.50, 0.75, 0.80, 0.85, 0.90, 0.95, 1.00, 1.25, 2.00
  const double test_ratios[] = { 1.00 };
  const int num_ratios = sizeof(test_ratios) / sizeof(test_ratios[0]);

  // Number of inserts attempted per unique key.
  // Full sweep, currently disabled:
  //   1, 4, 16, 64
  const uint32_t collisions[] = { 16 };
  const int num_collisions = sizeof(collisions) / sizeof(collisions[0]);

  // set up file headers
  metrics_out << "Capacity , Unique , Percent Full , Attempted Inserts , Failed Inserts , Collision Ratio , Nanoseconds/Inserts, Seconds" << std::endl;

  // Every histogram row produced by UnorderedMapTest::print starts with
  // capacity, percent full and the collision count, so the header has to name
  // all three before the numbered histogram bins.
  const char * const histogram_prefix = "Capacity , Percent Full , Collision Ratio";
  length_out << histogram_prefix;
  distance_out << histogram_prefix;
  block_distance_out << histogram_prefix;

  // The separator goes in front of each bin label so the line ends cleanly.
  // Backspace characters cannot be used to trim a trailing separator here:
  // in a file they are stored as literal bytes.
  const int num_header_bins = 100;
  for (int bin = 0; bin < num_header_bins; ++bin) {
    length_out << " , " << bin;
    distance_out << " , " << bin;
    block_distance_out << " , " << bin;
  }

  length_out << std::endl;
  distance_out << std::endl;
  block_distance_out << std::endl;

  Kokkos::Impl::Timer wall_clock ;
  for (int i=0; i < num_collisions ; ++i) {
    wall_clock.reset();
    std::cout << "Collisions: " << collisions[i] << std::endl;
    for (int j = 0; j < num_ratios; ++j) {
      std::cout << std::setprecision(1) << std::fixed << std::setw(5) << (100.0*test_ratios[j]) << "% " << std::flush;

      // Capacities 2^14 .. 2^24, doubling each step. Unsigned literals keep
      // the shift and the comparison in the same type as `capacity`.
      for (uint32_t capacity = 1u<<14; capacity < (1u<<25); capacity <<= 1) {
        // Unique keys for this run; each one is inserted collisions[i] times.
        const uint32_t inserts = static_cast<uint32_t>(test_ratios[j]*(capacity));
        std::cout << capacity << std::flush;

        // The constructor performs (and times) the insertion.
        UnorderedMapTest<Device, Near> test(capacity, inserts*collisions[i], collisions[i]);
        Device::fence();
        test.print(metrics_out, length_out, distance_out, block_distance_out);
      }
      // Progress output goes to the terminal, where backspaces do erase.
      std::cout << "\b\b " << std::endl;
    }
    std::cout << " " << wall_clock.seconds() << " secs" << std::endl;
  }
#else
  (void)base_file_name;
  std::cout << "skipping test" << std::endl;
#endif
}
|
||||
|
||||
|
||||
} // namespace Perf
|
||||
|
||||
#endif //KOKKOS_TEST_UNORDERED_MAP_PERFORMANCE_HPP
|
||||
Reference in New Issue
Block a user