Files
lammps-gran-kokkos/lib/kokkos/core/unit_test/TestCuda.cpp

496 lines
15 KiB
C++
Executable File

/*
//@HEADER
// ************************************************************************
//
// Kokkos v. 2.0
// Copyright (2014) Sandia Corporation
//
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
// the U.S. Government retains certain rights in this software.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// 1. Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
//
// 3. Neither the name of the Corporation nor the names of the
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
//
// ************************************************************************
//@HEADER
*/
#include <gtest/gtest.h>
#include <iostream>
#include <Kokkos_Core.hpp>
//----------------------------------------------------------------------------
#include <impl/Kokkos_ViewTileLeft.hpp>
//----------------------------------------------------------------------------
#include <TestSharedAlloc.hpp>
#include <TestViewMapping.hpp>
#include <TestViewImpl.hpp>
#include <TestAtomic.hpp>
#include <TestViewAPI.hpp>
#include <TestViewSubview.hpp>
#include <TestTile.hpp>
#include <TestReduce.hpp>
#include <TestScan.hpp>
#include <TestRange.hpp>
#include <TestTeam.hpp>
#include <TestAggregate.hpp>
#include <TestAggregateReduction.hpp>
#include <TestCompilerMacros.hpp>
#include <TestMemorySpaceTracking.hpp>
#include <TestTeamVector.hpp>
#include <TestTemplateMetaFunctions.hpp>
#include <TestCXX11Deduction.hpp>
//----------------------------------------------------------------------------
class cuda : public ::testing::Test {
protected:
static void SetUpTestCase()
{
Kokkos::Cuda::print_configuration( std::cout );
Kokkos::HostSpace::execution_space::initialize();
Kokkos::Cuda::initialize( Kokkos::Cuda::SelectDevice(0) );
}
static void TearDownTestCase()
{
Kokkos::Cuda::finalize();
Kokkos::HostSpace::execution_space::finalize();
}
};
//----------------------------------------------------------------------------
namespace Test {
__global__
void test_abort()
{
Kokkos::Impl::VerifyExecutionCanAccessMemorySpace<
Kokkos::CudaSpace ,
Kokkos::HostSpace >::verify();
}
__global__
void test_cuda_spaces_int_value( int * ptr )
{
if ( *ptr == 42 ) { *ptr = 2 * 42 ; }
}
TEST_F( cuda , compiler_macros )
{
ASSERT_TRUE( ( TestCompilerMacros::Test< Kokkos::Cuda >() ) );
}
TEST_F( cuda , memory_space )
{
TestMemorySpace< Kokkos::Cuda >();
}
TEST_F( cuda, spaces )
{
if ( Kokkos::CudaUVMSpace::available() ) {
Kokkos::Impl::AllocationTracker tracker = Kokkos::CudaUVMSpace::allocate_and_track("uvm_ptr",sizeof(int));
int * uvm_ptr = (int*) tracker.alloc_ptr();
*uvm_ptr = 42 ;
Kokkos::Cuda::fence();
test_cuda_spaces_int_value<<<1,1>>>(uvm_ptr);
Kokkos::Cuda::fence();
EXPECT_EQ( *uvm_ptr, int(2*42) );
}
}
//----------------------------------------------------------------------------
TEST_F( cuda , impl_shared_alloc )
{
test_shared_alloc< Kokkos::CudaSpace , Kokkos::HostSpace::execution_space >();
test_shared_alloc< Kokkos::CudaUVMSpace , Kokkos::HostSpace::execution_space >();
test_shared_alloc< Kokkos::CudaHostPinnedSpace , Kokkos::HostSpace::execution_space >();
}
TEST_F( cuda , impl_view_mapping )
{
test_view_mapping< Kokkos::Cuda >();
test_view_mapping_subview< Kokkos::Cuda >();
test_view_mapping_operator< Kokkos::Cuda >();
TestViewMappingAtomic< Kokkos::Cuda >::run();
}
template< class MemSpace >
struct TestViewCudaTexture {
enum { N = 1000 };
using V = Kokkos::Experimental::View<double*,MemSpace> ;
using T = Kokkos::Experimental::View<const double*, MemSpace, Kokkos::MemoryRandomAccess > ;
V m_base ;
T m_tex ;
struct TagInit {};
struct TagTest {};
KOKKOS_INLINE_FUNCTION
void operator()( const TagInit & , const int i ) const { m_base[i] = i + 1 ; }
KOKKOS_INLINE_FUNCTION
void operator()( const TagTest & , const int i , long & error_count ) const
{ if ( m_tex[i] != i + 1 ) ++error_count ; }
TestViewCudaTexture()
: m_base("base",N)
, m_tex( m_base )
{}
static void run()
{
EXPECT_TRUE( ( std::is_same< typename V::reference_type
, double &
>::value ) );
EXPECT_TRUE( ( std::is_same< typename T::reference_type
, const double
>::value ) );
EXPECT_TRUE( V::reference_type_is_lvalue_reference ); // An ordinary view
EXPECT_FALSE( T::reference_type_is_lvalue_reference ); // Texture fetch returns by value
TestViewCudaTexture self ;
Kokkos::parallel_for( Kokkos::RangePolicy< Kokkos::Cuda , TagInit >(0,N) , self );
long error_count = -1 ;
Kokkos::parallel_reduce( Kokkos::RangePolicy< Kokkos::Cuda , TagTest >(0,N) , self , error_count );
EXPECT_EQ( error_count , 0 );
}
};
TEST_F( cuda , impl_view_texture )
{
TestViewCudaTexture< Kokkos::CudaSpace >::run();
TestViewCudaTexture< Kokkos::CudaUVMSpace >::run();
}
template< class MemSpace , class ExecSpace >
struct TestViewCudaAccessible {
enum { N = 1000 };
using V = Kokkos::Experimental::View<double*,MemSpace> ;
V m_base ;
struct TagInit {};
struct TagTest {};
KOKKOS_INLINE_FUNCTION
void operator()( const TagInit & , const int i ) const { m_base[i] = i + 1 ; }
KOKKOS_INLINE_FUNCTION
void operator()( const TagTest & , const int i , long & error_count ) const
{ if ( m_base[i] != i + 1 ) ++error_count ; }
TestViewCudaAccessible()
: m_base("base",N)
{}
static void run()
{
TestViewCudaAccessible self ;
Kokkos::parallel_for( Kokkos::RangePolicy< typename MemSpace::execution_space , TagInit >(0,N) , self );
MemSpace::execution_space::fence();
// Next access is a different execution space, must complete prior kernel.
long error_count = -1 ;
Kokkos::parallel_reduce( Kokkos::RangePolicy< ExecSpace , TagTest >(0,N) , self , error_count );
EXPECT_EQ( error_count , 0 );
}
};
TEST_F( cuda , impl_view_accessible )
{
TestViewCudaAccessible< Kokkos::CudaSpace , Kokkos::Cuda >::run();
TestViewCudaAccessible< Kokkos::CudaUVMSpace , Kokkos::Cuda >::run();
TestViewCudaAccessible< Kokkos::CudaUVMSpace , Kokkos::HostSpace::execution_space >::run();
TestViewCudaAccessible< Kokkos::CudaHostPinnedSpace , Kokkos::Cuda >::run();
TestViewCudaAccessible< Kokkos::CudaHostPinnedSpace , Kokkos::HostSpace::execution_space >::run();
}
//----------------------------------------------------------------------------
TEST_F( cuda, view_impl )
{
// test_abort<<<32,32>>>(); // Aborts the kernel with CUDA version 4.1 or greater
test_view_impl< Kokkos::Cuda >();
}
TEST_F( cuda, view_api )
{
typedef Kokkos::View< const int * , Kokkos::Cuda , Kokkos::MemoryTraits< Kokkos::RandomAccess > > view_texture_managed ;
typedef Kokkos::View< const int * , Kokkos::Cuda , Kokkos::MemoryTraits< Kokkos::RandomAccess | Kokkos::Unmanaged > > view_texture_unmanaged ;
TestViewAPI< double , Kokkos::Cuda >();
#if 0
Kokkos::View<double, Kokkos::Cuda > x("x");
Kokkos::View<double[1], Kokkos::Cuda > y("y");
// *x = 10 ;
// x() = 10 ;
// y[0] = 10 ;
// y(0) = 10 ;
#endif
}
TEST_F( cuda, view_subview_auto_1d_left ) {
TestViewSubview::test_auto_1d< Kokkos::LayoutLeft,Kokkos::Cuda >();
}
TEST_F( cuda, view_subview_auto_1d_right ) {
TestViewSubview::test_auto_1d< Kokkos::LayoutRight,Kokkos::Cuda >();
}
TEST_F( cuda, view_subview_auto_1d_stride ) {
TestViewSubview::test_auto_1d< Kokkos::LayoutStride,Kokkos::Cuda >();
}
TEST_F( cuda, view_subview_assign_strided ) {
TestViewSubview::test_1d_strided_assignment< Kokkos::Cuda >();
}
TEST_F( cuda, view_subview_left_0 ) {
TestViewSubview::test_left_0< Kokkos::CudaUVMSpace >();
}
TEST_F( cuda, view_subview_left_1 ) {
TestViewSubview::test_left_1< Kokkos::CudaUVMSpace >();
}
TEST_F( cuda, view_subview_left_2 ) {
TestViewSubview::test_left_2< Kokkos::CudaUVMSpace >();
}
TEST_F( cuda, view_subview_left_3 ) {
TestViewSubview::test_left_3< Kokkos::CudaUVMSpace >();
}
TEST_F( cuda, view_subview_right_0 ) {
TestViewSubview::test_right_0< Kokkos::CudaUVMSpace >();
}
TEST_F( cuda, view_subview_right_1 ) {
TestViewSubview::test_right_1< Kokkos::CudaUVMSpace >();
}
TEST_F( cuda, view_subview_right_3 ) {
TestViewSubview::test_right_3< Kokkos::CudaUVMSpace >();
}
TEST_F( cuda, range_tag )
{
TestRange< Kokkos::Cuda >::test_for(1000);
TestRange< Kokkos::Cuda >::test_reduce(1000);
TestRange< Kokkos::Cuda >::test_scan(1000);
}
TEST_F( cuda, team_tag )
{
TestTeamPolicy< Kokkos::Cuda >::test_for(1000);
TestTeamPolicy< Kokkos::Cuda >::test_reduce(1000);
}
TEST_F( cuda, reduce )
{
TestReduce< long , Kokkos::Cuda >( 10000000 );
TestReduce< double , Kokkos::Cuda >( 1000000 );
}
TEST_F( cuda, reduce_team )
{
TestReduceTeam< long , Kokkos::Cuda >( 10000000 );
TestReduceTeam< double , Kokkos::Cuda >( 1000000 );
}
TEST_F( cuda, shared_team )
{
TestSharedTeam< Kokkos::Cuda >();
}
TEST_F( cuda, reduce_dynamic )
{
TestReduceDynamic< long , Kokkos::Cuda >( 10000000 );
TestReduceDynamic< double , Kokkos::Cuda >( 1000000 );
}
TEST_F( cuda, reduce_dynamic_view )
{
TestReduceDynamicView< long , Kokkos::Cuda >( 10000000 );
TestReduceDynamicView< double , Kokkos::Cuda >( 1000000 );
}
TEST_F( cuda, atomic )
{
const int loop_count = 1e3 ;
ASSERT_TRUE( ( TestAtomic::Loop<int,Kokkos::Cuda>(loop_count,1) ) );
ASSERT_TRUE( ( TestAtomic::Loop<int,Kokkos::Cuda>(loop_count,2) ) );
ASSERT_TRUE( ( TestAtomic::Loop<int,Kokkos::Cuda>(loop_count,3) ) );
ASSERT_TRUE( ( TestAtomic::Loop<unsigned int,Kokkos::Cuda>(loop_count,1) ) );
ASSERT_TRUE( ( TestAtomic::Loop<unsigned int,Kokkos::Cuda>(loop_count,2) ) );
ASSERT_TRUE( ( TestAtomic::Loop<unsigned int,Kokkos::Cuda>(loop_count,3) ) );
ASSERT_TRUE( ( TestAtomic::Loop<long int,Kokkos::Cuda>(loop_count,1) ) );
ASSERT_TRUE( ( TestAtomic::Loop<long int,Kokkos::Cuda>(loop_count,2) ) );
ASSERT_TRUE( ( TestAtomic::Loop<long int,Kokkos::Cuda>(loop_count,3) ) );
ASSERT_TRUE( ( TestAtomic::Loop<unsigned long int,Kokkos::Cuda>(loop_count,1) ) );
ASSERT_TRUE( ( TestAtomic::Loop<unsigned long int,Kokkos::Cuda>(loop_count,2) ) );
ASSERT_TRUE( ( TestAtomic::Loop<unsigned long int,Kokkos::Cuda>(loop_count,3) ) );
ASSERT_TRUE( ( TestAtomic::Loop<long long int,Kokkos::Cuda>(loop_count,1) ) );
ASSERT_TRUE( ( TestAtomic::Loop<long long int,Kokkos::Cuda>(loop_count,2) ) );
ASSERT_TRUE( ( TestAtomic::Loop<long long int,Kokkos::Cuda>(loop_count,3) ) );
ASSERT_TRUE( ( TestAtomic::Loop<double,Kokkos::Cuda>(loop_count,1) ) );
ASSERT_TRUE( ( TestAtomic::Loop<double,Kokkos::Cuda>(loop_count,2) ) );
ASSERT_TRUE( ( TestAtomic::Loop<double,Kokkos::Cuda>(loop_count,3) ) );
ASSERT_TRUE( ( TestAtomic::Loop<float,Kokkos::Cuda>(100,1) ) );
ASSERT_TRUE( ( TestAtomic::Loop<float,Kokkos::Cuda>(100,2) ) );
ASSERT_TRUE( ( TestAtomic::Loop<float,Kokkos::Cuda>(100,3) ) );
}
//----------------------------------------------------------------------------
TEST_F( cuda, tile_layout)
{
TestTile::test< Kokkos::Cuda , 1 , 1 >( 1 , 1 );
TestTile::test< Kokkos::Cuda , 1 , 1 >( 2 , 3 );
TestTile::test< Kokkos::Cuda , 1 , 1 >( 9 , 10 );
TestTile::test< Kokkos::Cuda , 2 , 2 >( 1 , 1 );
TestTile::test< Kokkos::Cuda , 2 , 2 >( 2 , 3 );
TestTile::test< Kokkos::Cuda , 2 , 2 >( 4 , 4 );
TestTile::test< Kokkos::Cuda , 2 , 2 >( 9 , 9 );
TestTile::test< Kokkos::Cuda , 2 , 4 >( 9 , 9 );
TestTile::test< Kokkos::Cuda , 4 , 4 >( 9 , 9 );
TestTile::test< Kokkos::Cuda , 4 , 4 >( 1 , 1 );
TestTile::test< Kokkos::Cuda , 4 , 4 >( 4 , 4 );
TestTile::test< Kokkos::Cuda , 4 , 4 >( 9 , 9 );
TestTile::test< Kokkos::Cuda , 4 , 4 >( 9 , 11 );
TestTile::test< Kokkos::Cuda , 8 , 8 >( 1 , 1 );
TestTile::test< Kokkos::Cuda , 8 , 8 >( 4 , 4 );
TestTile::test< Kokkos::Cuda , 8 , 8 >( 9 , 9 );
TestTile::test< Kokkos::Cuda , 8 , 8 >( 9 , 11 );
}
TEST_F( cuda , view_aggregate )
{
TestViewAggregate< Kokkos::Cuda >();
TestViewAggregateReduction< Kokkos::Cuda >();
}
TEST_F( cuda , scan )
{
TestScan< Kokkos::Cuda >::test_range( 1 , 1000 );
TestScan< Kokkos::Cuda >( 1000000 );
TestScan< Kokkos::Cuda >( 10000000 );
Kokkos::Cuda::fence();
}
TEST_F( cuda , team_scan )
{
TestScanTeam< Kokkos::Cuda >( 10 );
TestScanTeam< Kokkos::Cuda >( 10000 );
}
}
//----------------------------------------------------------------------------
TEST_F( cuda , template_meta_functions )
{
TestTemplateMetaFunctions<int, Kokkos::Cuda >();
}
//----------------------------------------------------------------------------
#ifdef KOKKOS_HAVE_CXX11
namespace Test {
TEST_F( cuda , reduction_deduction )
{
TestCXX11::test_reduction_deduction< Kokkos::Cuda >();
}
TEST_F( cuda , team_vector )
{
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(0) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(1) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(2) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(3) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(4) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(5) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(6) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(7) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(8) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(9) ) );
ASSERT_TRUE( ( TestTeamVector::Test< Kokkos::Cuda >(10) ) );
}
}
#endif