Files
lammps/lib/kokkos/core/unit_test/TestMDRange.hpp

2518 lines
80 KiB
C++

/*
//@HEADER
// ************************************************************************
//
// Kokkos v. 2.0
// Copyright (2014) Sandia Corporation
//
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
// the U.S. Government retains certain rights in this software.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// 1. Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
//
// 3. Neither the name of the Corporation nor the names of the
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
//
// ************************************************************************
//@HEADER
*/
#include <cstdio>
#include <gtest/gtest.h>
#include <Kokkos_Core.hpp>
namespace Test {
namespace {
template <typename ExecSpace >
struct TestMDRange_ReduceArray_2D {
using DataType = int;
using ViewType_2 = typename Kokkos::View< DataType**, ExecSpace >;
using HostViewType_2 = typename ViewType_2::HostMirror;
ViewType_2 input_view;
using scalar_type = double;
using value_type = scalar_type[];
const unsigned value_count;
TestMDRange_ReduceArray_2D( const int N0, const int N1, const unsigned array_size )
: input_view( "input_view", N0, N1 )
, value_count( array_size )
{}
KOKKOS_INLINE_FUNCTION
void init( scalar_type dst[] ) const
{
for ( unsigned i = 0; i < value_count; ++i ) {
dst[i] = 0.0;
}
}
KOKKOS_INLINE_FUNCTION
void join( volatile scalar_type dst[],
const volatile scalar_type src[] ) const
{
for ( unsigned i = 0; i < value_count; ++i ) {
dst[i] += src[i];
}
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j ) const
{
input_view( i, j ) = 1;
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, value_type lsum ) const
{
lsum[0] += input_view( i, j ) * 2; //+=6 each time if InitTag => N0*N1*6
lsum[1] += input_view( i, j ) ; //+=3 each time if InitTag => N0*N1*3
}
// tagged operators
struct InitTag {};
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j ) const
{
input_view( i, j ) = 3;
}
static void test_arrayreduce2( const int N0, const int N1 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, Kokkos::IndexType<int>, InitTag > range_type_init;
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type_init range_init( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 3, 3 } } );
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 3, 3 } } );
const unsigned array_size = 2;
TestMDRange_ReduceArray_2D functor( N0, N1, array_size );
parallel_for( range_init, functor ); // Init the view to 3's
double sums[ array_size ];
parallel_reduce( range, functor, sums );
// Check output
//printf("Array Reduce result. N0 = %d N1 = %d N0*N1 = %d sums[0] = %lf sums[1] = %lf \n", N0, N1, N0*N1, sums[0], sums[1]);
ASSERT_EQ( sums[0], 6 * N0 * N1 );
ASSERT_EQ( sums[1], 3 * N0 * N1 );
}
}
};
template <typename ExecSpace >
struct TestMDRange_ReduceArray_3D {
using DataType = int;
using ViewType_3 = typename Kokkos::View< DataType***, ExecSpace >;
using HostViewType_3 = typename ViewType_3::HostMirror;
ViewType_3 input_view;
using scalar_type = double;
using value_type = scalar_type[];
const unsigned value_count;
TestMDRange_ReduceArray_3D( const int N0, const int N1, const int N2, const unsigned array_size )
: input_view( "input_view", N0, N1, N2 )
, value_count( array_size )
{}
KOKKOS_INLINE_FUNCTION
void init( scalar_type dst[] ) const
{
for ( unsigned i = 0; i < value_count; ++i ) {
dst[i] = 0.0;
}
}
KOKKOS_INLINE_FUNCTION
void join( volatile scalar_type dst[],
const volatile scalar_type src[] ) const
{
for ( unsigned i = 0; i < value_count; ++i ) {
dst[i] += src[i];
}
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k ) const
{
input_view( i, j, k ) = 1;
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, value_type lsum ) const
{
lsum[0] += input_view( i, j, k ) * 2; //+=6 each time if InitTag => N0*N1*N2*6
lsum[1] += input_view( i, j, k ) ; //+=3 each time if InitTag => N0*N1*N2*3
}
// tagged operators
struct InitTag {};
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k ) const
{
input_view( i, j, k ) = 3;
}
static void test_arrayreduce3( const int N0, const int N1, const int N2 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3>, Kokkos::IndexType<int>, InitTag > range_type_init;
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type_init range_init( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 3, 3, 3 } } );
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 3, 3, 3 } } );
const unsigned array_size = 2;
TestMDRange_ReduceArray_3D functor( N0, N1, N2, array_size );
parallel_for( range_init, functor ); // Init the view to 3's
double sums[ array_size ];
parallel_reduce( range, functor, sums );
ASSERT_EQ( sums[0], 6 * N0 * N1 * N2 );
ASSERT_EQ( sums[1], 3 * N0 * N1 * N2 );
}
}
};
template <typename ExecSpace >
struct TestMDRange_2D {
using DataType = int;
using ViewType = typename Kokkos::View< DataType**, ExecSpace >;
using HostViewType = typename ViewType::HostMirror;
ViewType input_view;
using value_type = double;
TestMDRange_2D( const DataType N0, const DataType N1 ) : input_view( "input_view", N0, N1 ) {}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j ) const
{
input_view( i, j ) = 1;
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, value_type &lsum ) const
{
lsum += input_view( i, j ) * 2;
}
// tagged operators
struct InitTag {};
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j ) const
{
input_view( i, j ) = 3;
}
// reduction tagged operators
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, value_type &lsum ) const
{
lsum += input_view( i, j ) * 3;
}
static void test_reduce2( const int N0, const int N1 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 3, 3 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 );
}
// Test with reducers - scalar
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, Kokkos::IndexType<int> > range_type;
int s0 = 1;
int s1 = 1;
range_type range( {{ s0, s1 }}, {{ N0, N1 }}, {{ 3, 3 }} );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::Experimental::Sum< value_type > reducer_scalar( sum );
parallel_reduce( range, functor, reducer_scalar );
ASSERT_EQ( sum, 2 * (N0 - s0) * (N1 - s1) );
}
// Test with reducers - scalar view
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0 }}, {{ N0, N1 }}, {{ 3, 3 }} );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::View< value_type, Kokkos::HostSpace > sum_view("sum_view");
sum_view() = sum;
Kokkos::Experimental::Sum< value_type > reducer_view( sum_view );
parallel_reduce( range, functor, reducer_view);
sum = sum_view();
ASSERT_EQ( sum, 2 * N0 * N1 );
}
// Tagged operator test
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Default, Iterate::Default >, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 2, 4 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
// check parallel_for results correct with InitTag
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + InitTag op(): Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 9 * N0 * N1 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Default, Iterate::Default>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 2, 6 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 2, 6 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 2, 6 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 2, 6 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 2, 6 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 );
}
} // end test_reduce2
static void test_for2( const int N0, const int N1 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
const int s0 = 1;
const int s1 = 1;
range_type range( point_type{ { s0, s1 } }, point_type{ { N0, N1 } }, tile_type{ { 3, 3 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = s0; i < N0; ++i )
for ( int j = s1; j < N1; ++j )
{
if ( h_view( i, j ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Offset Start + Default Layouts + InitTag op(): Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 3, 3 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Default Layouts + InitTag op(): Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, InitTag > range_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Default Layouts + InitTag op() + Default Tile: Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 3, 3 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "No info: Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Default, Iterate::Default>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 4, 4 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "D D: Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 3, 3 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "L L: Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 7, 7 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "L R: Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 16, 16 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "R L: Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<2, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0 } }, point_type{ { N0, N1 } }, tile_type{ { 5, 16 } } );
TestMDRange_2D functor( N0, N1 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
{
if ( h_view( i, j ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "R R: Errors in test_for2; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
} // end test_for2
}; // MDRange_2D
template <typename ExecSpace >
struct TestMDRange_3D {
using DataType = int;
using ViewType = typename Kokkos::View< DataType***, ExecSpace >;
using HostViewType = typename ViewType::HostMirror;
ViewType input_view;
using value_type = double;
TestMDRange_3D( const DataType N0, const DataType N1, const DataType N2 ) : input_view( "input_view", N0, N1, N2 ) {}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k ) const
{
input_view( i, j, k ) = 1;
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, double &lsum ) const
{
lsum += input_view( i, j, k ) * 2;
}
// tagged operators
struct InitTag {};
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k ) const
{
input_view( i, j, k ) = 3;
}
// reduction tagged operators
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k, value_type &lsum ) const
{
lsum += input_view( i, j, k ) * 3;
}
static void test_reduce3( const int N0, const int N1, const int N2 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
range_type range( point_type{ { s0, s1, s2 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 3, 3, 3 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * (N0 - s0) * (N1 - s1) * (N2 - s2) );
}
// Test with reducers - scalar
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0 }}, {{ N0, N1, N2 }}, {{ 3, 3, 3 }} );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::Experimental::Sum< value_type > reducer_scalar( sum );
parallel_reduce( range, functor, reducer_scalar );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 );
}
// Test with reducers - scalar view
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0 }}, {{ N0, N1, N2 }}, {{ 3, 3, 3 }} );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::View< value_type, Kokkos::HostSpace > sum_view("sum_view");
sum_view() = sum;
Kokkos::Experimental::Sum< value_type > reducer_view( sum_view );
parallel_reduce( range, functor, reducer_view);
sum = sum_view();
ASSERT_EQ( sum, 2 * N0 * N1 * N2 );
}
// Tagged operator test
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Default, Iterate::Default >, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 6 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
// check parallel_for results correct with InitTag
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + InitTag op(): Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 9 * N0 * N1 * N2 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Default, Iterate::Default >, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 6 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 6 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 6 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 6 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 6 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 );
}
} // end test_reduce3
static void test_for3( const int N0, const int N1, const int N2 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3> > range_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + No Tile: Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3>, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
range_type range( point_type{ { s0, s1, s2 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 3, 3, 3 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = s0; i < N0; ++i )
for ( int j = s1; j < N1; ++j )
for ( int k = s2; k < N2; ++k )
{
if ( h_view( i, j, k ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Offset Start + Defaults + InitTag op(): Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 3, 3, 3 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Default, Iterate::Default>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 3, 3, 3 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 2 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 3, 5, 7 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 8, 8, 8 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<3, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0 } }, point_type{ { N0, N1, N2 } }, tile_type{ { 2, 4, 2 } } );
TestMDRange_3D functor( N0, N1, N2 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
{
if ( h_view( i, j, k ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for3; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
} // end test_for3
};
template <typename ExecSpace >
struct TestMDRange_4D {
using DataType = int;
using ViewType = typename Kokkos::View< DataType****, ExecSpace >;
using HostViewType = typename ViewType::HostMirror;
ViewType input_view;
using value_type = double;
TestMDRange_4D( const DataType N0, const DataType N1, const DataType N2, const DataType N3 ) : input_view( "input_view", N0, N1, N2, N3 ) {}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, const int l ) const
{
input_view( i, j, k, l ) = 1;
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, const int l, double &lsum ) const
{
lsum += input_view( i, j, k, l ) * 2;
}
// tagged operators
struct InitTag {};
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k, const int l ) const
{
input_view( i, j, k, l ) = 3;
}
// reduction tagged operators
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k, const int l, value_type &lsum ) const
{
lsum += input_view( i, j, k, l ) * 3;
}
static void test_reduce4( const int N0, const int N1, const int N2, const int N3 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
int s3 = 1;
range_type range( point_type{ { s0, s1, s2, s3 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 3, 3, 3, 3 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * (N0 - s0) * (N1 - s1) * (N2 - s2) * (N3 - s3) );
}
// Test with reducers - scalar
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0, 0 }}, {{ N0, N1, N2, N3 }}, {{ 3, 3, 3, 3 }} );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::Experimental::Sum< value_type > reducer_scalar( sum );
parallel_reduce( range, functor, reducer_scalar );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 );
}
// Test with reducers - scalar view
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0, 0 }}, {{ N0, N1, N2, N3 }}, {{ 3, 3, 3, 3 }} );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::View< value_type, Kokkos::HostSpace > sum_view("sum_view");
sum_view() = sum;
Kokkos::Experimental::Sum< value_type > reducer_view( sum_view );
parallel_reduce( range, functor, reducer_view);
sum = sum_view();
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 );
}
// Tagged operator test
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Default, Iterate::Default >, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 2, 4, 6, 2 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
// check parallel_for results correct with InitTag
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + InitTag op(): Errors in test_reduce4 parallel_for init; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 9 * N0 * N1 * N2 * N3 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Default, Iterate::Default >, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 2, 4, 6, 2 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 2, 4, 6, 2 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 2, 4, 6, 2 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 2, 4, 6, 2 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 2, 4, 6, 2 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 );
}
} // end test_reduce
static void test_for4( const int N0, const int N1, const int N2, const int N3 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4> > range_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + No Tile: Errors in test_for4; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4>, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
int s3 = 1;
range_type range( point_type{ { s0, s1, s2, s3 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 3, 11, 3, 3 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = s0; i < N0; ++i )
for ( int j = s1; j < N1; ++j )
for ( int k = s2; k < N2; ++k )
for ( int l = s3; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf("Offset Start + Defaults +m_tile > m_upper dim2 InitTag op(): Errors in test_for4; mismatches = %d\n\n",counter);
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 4, 4, 4, 4 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for4; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Default, Iterate::Default>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 4, 4, 4, 4 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for4; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 4, 4, 4, 4 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for4; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 4, 4, 4, 4 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for4; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 4, 4, 4, 4 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for4; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<4, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3 } }, tile_type{ { 4, 4, 4, 4 } } );
TestMDRange_4D functor( N0, N1, N2, N3 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
{
if ( h_view( i, j, k, l ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for4; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
} // end test_for4
};
template <typename ExecSpace >
struct TestMDRange_5D {
using DataType = int;
using ViewType = typename Kokkos::View< DataType*****, ExecSpace >;
using HostViewType = typename ViewType::HostMirror;
ViewType input_view;
using value_type = double;
TestMDRange_5D( const DataType N0, const DataType N1, const DataType N2, const DataType N3, const DataType N4 ) : input_view( "input_view", N0, N1, N2, N3, N4 ) {}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, const int l, const int m ) const
{
input_view( i, j, k, l, m ) = 1;
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, const int l, const int m, value_type &lsum ) const
{
lsum += input_view( i, j, k, l, m ) * 2;
}
// tagged operators
struct InitTag {};
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k, const int l, const int m ) const
{
input_view( i, j, k, l, m ) = 3;
}
// reduction tagged operators
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k, const int l, const int m, value_type &lsum ) const
{
lsum += input_view( i, j, k, l, m ) * 3;
}
static void test_reduce5( const int N0, const int N1, const int N2, const int N3, const int N4 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
int s3 = 1;
int s4 = 1;
range_type range( point_type{ { s0, s1, s2, s3, s4 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 3, 3, 3, 3, 3 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * (N0 - s0) * (N1 - s1) * (N2 - s2) * (N3 - s3) * (N4 - s4) );
}
// Test with reducers - scalar
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0, 0, 0 }}, {{ N0, N1, N2, N3, N4 }}, {{ 3, 3, 3, 3, 3 }} );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::Experimental::Sum< value_type > reducer_scalar( sum );
parallel_reduce( range, functor, reducer_scalar );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 * N4 );
}
// Test with reducers - scalar view
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0, 0, 0 }}, {{ N0, N1, N2, N3, N4 }}, {{ 3, 3, 3, 3, 3 }} );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::View< value_type, Kokkos::HostSpace > sum_view("sum_view");
sum_view() = sum;
Kokkos::Experimental::Sum< value_type > reducer_view( sum_view );
parallel_reduce( range, functor, reducer_view);
sum = sum_view();
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 * N4 );
}
// Tagged operator test
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5, Iterate::Default, Iterate::Default >, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 2, 4, 6, 2, 2 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
// check parallel_for results correct with InitTag
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + InitTag op(): Errors in test_reduce5 parallel_for init; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 9 * N0 * N1 * N2 * N3 * N4 );
}
}
static void test_for5( const int N0, const int N1, const int N2, const int N3, const int N4 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5> > range_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + No Tile: Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5>, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
int s3 = 1;
int s4 = 1;
range_type range( point_type{ { s0, s1, s2, s3, s4 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 3, 3, 3, 3, 5 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = s0; i < N0; ++i )
for ( int j = s1; j < N1; ++j )
for ( int k = s2; k < N2; ++k )
for ( int l = s3; l < N3; ++l )
for ( int m = s4; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Offset Start + Defaults + InitTag op(): Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 4, 4, 4, 2, 2 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5, Iterate::Default, Iterate::Default>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 4, 4, 4, 2, 2 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 4, 4, 4, 2, 2 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 4, 4, 4, 2, 2 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 4, 4, 4, 2, 2 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<5, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4 } }, tile_type{ { 4, 4, 4, 2, 2 } } );
TestMDRange_5D functor( N0, N1, N2, N3, N4 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
{
if ( h_view( i, j, k, l, m ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for5; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
}
};
template <typename ExecSpace >
struct TestMDRange_6D {
using DataType = int;
using ViewType = typename Kokkos::View< DataType******, ExecSpace >;
using HostViewType = typename ViewType::HostMirror;
ViewType input_view;
using value_type = double;
TestMDRange_6D( const DataType N0, const DataType N1, const DataType N2, const DataType N3, const DataType N4, const DataType N5 ) : input_view( "input_view", N0, N1, N2, N3, N4, N5 ) {}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, const int l, const int m, const int n ) const
{
input_view( i, j, k, l, m, n ) = 1;
}
KOKKOS_INLINE_FUNCTION
void operator()( const int i, const int j, const int k, const int l, const int m, const int n, value_type &lsum ) const
{
lsum += input_view( i, j, k, l, m, n ) * 2;
}
// tagged operators
struct InitTag {};
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k, const int l, const int m, const int n ) const
{
input_view( i, j, k, l, m, n ) = 3;
}
// reduction tagged operators
KOKKOS_INLINE_FUNCTION
void operator()( const InitTag &, const int i, const int j, const int k, const int l, const int m, const int n, value_type &lsum ) const
{
lsum += input_view( i, j, k, l, m, n ) * 3;
}
static void test_reduce6( const int N0, const int N1, const int N2, const int N3, const int N4, const int N5 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
int s3 = 1;
int s4 = 1;
int s5 = 1;
range_type range( point_type{ { s0, s1, s2, s3, s4, s5 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 3, 3, 3, 3, 3, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 2 * (N0 - s0) * (N1 - s1) * (N2 - s2) * (N3 - s3) * (N4 - s4) * (N5 - s5) );
}
// Test with reducers - scalar
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0, 0, 0, 0 }}, {{ N0, N1, N2, N3, N4, N5 }}, {{ 3, 3, 3, 3, 3, 2 }} );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::Experimental::Sum< value_type > reducer_scalar( sum );
parallel_reduce( range, functor, reducer_scalar );
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 * N4 * N5 );
}
// Test with reducers - scalar view
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6>, Kokkos::IndexType<int> > range_type;
range_type range( {{ 0, 0, 0, 0, 0, 0 }}, {{ N0, N1, N2, N3, N4, N5 }}, {{ 3, 3, 3, 3, 3, 2 }} );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
value_type sum = 0.0;
Kokkos::View< value_type, Kokkos::HostSpace > sum_view("sum_view");
sum_view() = sum;
Kokkos::Experimental::Sum< value_type > reducer_view( sum_view );
parallel_reduce( range, functor, reducer_view);
sum = sum_view();
ASSERT_EQ( sum, 2 * N0 * N1 * N2 * N3 * N4 * N5 );
}
// Tagged operator test
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6, Iterate::Default, Iterate::Default >, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 2, 4, 6, 2, 2, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
// check parallel_for results correct with InitTag
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + InitTag op(): Errors in test_reduce6 parallel_for init; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
double sum = 0.0;
parallel_reduce( range, functor, sum );
ASSERT_EQ( sum, 9 * N0 * N1 * N2 * N3 * N4 * N5 );
}
}
static void test_for6( const int N0, const int N1, const int N2, const int N3, const int N4, const int N5 )
{
using namespace Kokkos::Experimental;
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6> > range_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Defaults + No Tile: Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6>, Kokkos::IndexType<int>, InitTag > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
int s0 = 1;
int s1 = 1;
int s2 = 1;
int s3 = 1;
int s4 = 1;
int s5 = 1;
range_type range( point_type{ { s0, s1, s2, s3, s4, s5 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 3, 3, 3, 3, 2, 3 } } ); //tile dims 3,3,3,3,3,3 more than cuda can handle with debugging
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = s0; i < N0; ++i )
for ( int j = s1; j < N1; ++j )
for ( int k = s2; k < N2; ++k )
for ( int l = s3; l < N3; ++l )
for ( int m = s4; m < N4; ++m )
for ( int n = s5; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 3 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( "Offset Start + Defaults + InitTag op(): Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 4, 4, 4, 2, 2, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6, Iterate::Default, Iterate::Default>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 4, 4, 4, 2, 2, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6, Iterate::Left, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 4, 4, 4, 2, 2, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6, Iterate::Left, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 4, 4, 4, 2, 2, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6, Iterate::Right, Iterate::Left>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 4, 4, 4, 2, 2, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
{
typedef typename Kokkos::Experimental::MDRangePolicy< ExecSpace, Rank<6, Iterate::Right, Iterate::Right>, Kokkos::IndexType<int> > range_type;
typedef typename range_type::tile_type tile_type;
typedef typename range_type::point_type point_type;
range_type range( point_type{ { 0, 0, 0, 0, 0, 0 } }, point_type{ { N0, N1, N2, N3, N4, N5 } }, tile_type{ { 4, 4, 4, 2, 2, 2 } } );
TestMDRange_6D functor( N0, N1, N2, N3, N4, N5 );
parallel_for( range, functor );
HostViewType h_view = Kokkos::create_mirror_view( functor.input_view );
Kokkos::deep_copy( h_view, functor.input_view );
int counter = 0;
for ( int i = 0; i < N0; ++i )
for ( int j = 0; j < N1; ++j )
for ( int k = 0; k < N2; ++k )
for ( int l = 0; l < N3; ++l )
for ( int m = 0; m < N4; ++m )
for ( int n = 0; n < N5; ++n )
{
if ( h_view( i, j, k, l, m, n ) != 1 ) {
++counter;
}
}
if ( counter != 0 ) {
printf( " Errors in test_for6; mismatches = %d\n\n", counter );
}
ASSERT_EQ( counter, 0 );
}
}
};
} // namespace
TEST_F( TEST_CATEGORY , mdrange_for ) {
TestMDRange_2D< TEST_EXECSPACE >::test_for2( 100, 100 );
TestMDRange_3D< TEST_EXECSPACE >::test_for3( 100, 10, 100 );
TestMDRange_4D< TEST_EXECSPACE >::test_for4( 100, 10, 10, 10 );
TestMDRange_5D< TEST_EXECSPACE >::test_for5( 100, 10, 10, 10, 5 );
TestMDRange_6D< TEST_EXECSPACE >::test_for6( 10, 10, 10, 10, 5, 5 );
}
TEST_F( TEST_CATEGORY , mdrange_reduce ) {
TestMDRange_2D< TEST_EXECSPACE >::test_reduce2( 100, 100 );
TestMDRange_3D< TEST_EXECSPACE >::test_reduce3( 100, 10, 100 );
TestMDRange_4D< TEST_EXECSPACE >::test_reduce4( 100, 10, 10, 10 );
TestMDRange_5D< TEST_EXECSPACE >::test_reduce5( 100, 10, 10, 10, 5 );
TestMDRange_6D< TEST_EXECSPACE >::test_reduce6( 100, 10, 10, 10, 5, 5 );
}
//#ifndef KOKKOS_ENABLE_CUDA
TEST_F( TEST_CATEGORY , mdrange_array_reduce ) {
TestMDRange_ReduceArray_2D< TEST_EXECSPACE >::test_arrayreduce2( 4, 5 );
TestMDRange_ReduceArray_3D< TEST_EXECSPACE >::test_arrayreduce3( 4, 5, 10 );
}
//#endif
} // namespace Test