git-svn-id: svn://svn.icms.temple.edu/lammps-ro/trunk@14919 f3b2605a-c512-4ea7-a41b-209d697bcdaa
983 lines
37 KiB
C++
983 lines
37 KiB
C++
/*
|
|
//@HEADER
|
|
// ************************************************************************
|
|
//
|
|
// Kokkos v. 2.0
|
|
// Copyright (2014) Sandia Corporation
|
|
//
|
|
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
|
|
// the U.S. Government retains certain rights in this software.
|
|
//
|
|
// Redistribution and use in source and binary forms, with or without
|
|
// modification, are permitted provided that the following conditions are
|
|
// met:
|
|
//
|
|
// 1. Redistributions of source code must retain the above copyright
|
|
// notice, this list of conditions and the following disclaimer.
|
|
//
|
|
// 2. Redistributions in binary form must reproduce the above copyright
|
|
// notice, this list of conditions and the following disclaimer in the
|
|
// documentation and/or other materials provided with the distribution.
|
|
//
|
|
// 3. Neither the name of the Corporation nor the names of the
|
|
// contributors may be used to endorse or promote products derived from
|
|
// this software without specific prior written permission.
|
|
//
|
|
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
|
|
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
|
|
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
|
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
|
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
//
|
|
// Questions? Contact H. Carter Edwards (hcedwar@sandia.gov)
|
|
//
|
|
// ************************************************************************
|
|
//@HEADER
|
|
*/
|
|
|
|
/// \file Kokkos_DualView.hpp
|
|
/// \brief Declaration and definition of Kokkos::DualView.
|
|
///
|
|
/// This header file declares and defines Kokkos::DualView and its
|
|
/// related nonmember functions.
|
|
|
|
#ifndef KOKKOS_DUALVIEW_HPP
|
|
#define KOKKOS_DUALVIEW_HPP
|
|
|
|
#include <Kokkos_Core.hpp>
|
|
#include <impl/Kokkos_Error.hpp>
|
|
|
|
namespace Kokkos {
|
|
|
|
/* \class DualView
|
|
* \brief Container to manage mirroring a Kokkos::View that lives
|
|
* in device memory with a Kokkos::View that lives in host memory.
|
|
*
|
|
* This class provides capabilities to manage data which exists in two
|
|
* memory spaces at the same time. It keeps views of the same layout
|
|
* on two memory spaces as well as modified flags for both
|
|
* allocations. Users are responsible for setting the modified flags
|
|
* manually if they change the data in either memory space, by calling
|
|
* the sync() method templated on the device where they modified the
|
|
* data. Users may synchronize data by calling the modify() function,
|
|
* templated on the device towards which they want to synchronize
|
|
* (i.e., the target of the one-way copy operation).
|
|
*
|
|
* The DualView class also provides convenience methods such as
|
|
* realloc, resize and capacity which call the appropriate methods of
|
|
* the underlying Kokkos::View objects.
|
|
*
|
|
* The four template arguments are the same as those of Kokkos::View.
|
|
* (Please refer to that class' documentation for a detailed
|
|
* description.)
|
|
*
|
|
* \tparam DataType The type of the entries stored in the container.
|
|
*
|
|
* \tparam Layout The array's layout in memory.
|
|
*
|
|
* \tparam Device The Kokkos Device type. If its memory space is
|
|
* not the same as the host's memory space, then DualView will
|
|
* contain two separate Views: one in device memory, and one in
|
|
* host memory. Otherwise, DualView will only store one View.
|
|
*
|
|
* \tparam MemoryTraits (optional) The user's intended memory access
|
|
* behavior. Please see the documentation of Kokkos::View for
|
|
* examples. The default suffices for most users.
|
|
*/
|
|
template< class DataType ,
|
|
class Arg1Type = void ,
|
|
class Arg2Type = void ,
|
|
class Arg3Type = void>
|
|
class DualView : public ViewTraits< DataType , Arg1Type , Arg2Type, Arg3Type >
|
|
{
|
|
public:
|
|
//! \name Typedefs for device types and various Kokkos::View specializations.
|
|
//@{
|
|
typedef ViewTraits< DataType , Arg1Type , Arg2Type, Arg3Type > traits ;
|
|
|
|
//! The Kokkos Host Device type;
|
|
typedef typename traits::host_mirror_space host_mirror_space ;
|
|
|
|
//! The type of a Kokkos::View on the device.
|
|
typedef View< typename traits::data_type ,
|
|
Arg1Type ,
|
|
Arg2Type ,
|
|
Arg3Type > t_dev ;
|
|
|
|
/// \typedef t_host
|
|
/// \brief The type of a Kokkos::View host mirror of \c t_dev.
|
|
typedef typename t_dev::HostMirror t_host ;
|
|
|
|
//! The type of a const View on the device.
|
|
//! The type of a Kokkos::View on the device.
|
|
typedef View< typename traits::const_data_type ,
|
|
Arg1Type ,
|
|
Arg2Type ,
|
|
Arg3Type > t_dev_const ;
|
|
|
|
/// \typedef t_host_const
|
|
/// \brief The type of a const View host mirror of \c t_dev_const.
|
|
typedef typename t_dev_const::HostMirror t_host_const;
|
|
|
|
//! The type of a const, random-access View on the device.
|
|
typedef View< typename traits::const_data_type ,
|
|
typename traits::array_layout ,
|
|
typename traits::device_type ,
|
|
Kokkos::MemoryTraits<Kokkos::RandomAccess> > t_dev_const_randomread ;
|
|
|
|
/// \typedef t_host_const_randomread
|
|
/// \brief The type of a const, random-access View host mirror of
|
|
/// \c t_dev_const_randomread.
|
|
typedef typename t_dev_const_randomread::HostMirror t_host_const_randomread;
|
|
|
|
//! The type of an unmanaged View on the device.
|
|
typedef View< typename traits::data_type ,
|
|
typename traits::array_layout ,
|
|
typename traits::device_type ,
|
|
MemoryUnmanaged> t_dev_um;
|
|
|
|
//! The type of an unmanaged View host mirror of \c t_dev_um.
|
|
typedef View< typename t_host::data_type ,
|
|
typename t_host::array_layout ,
|
|
typename t_host::device_type ,
|
|
MemoryUnmanaged> t_host_um;
|
|
|
|
//! The type of a const unmanaged View on the device.
|
|
typedef View< typename traits::const_data_type ,
|
|
typename traits::array_layout ,
|
|
typename traits::device_type ,
|
|
MemoryUnmanaged> t_dev_const_um;
|
|
|
|
//! The type of a const unmanaged View host mirror of \c t_dev_const_um.
|
|
typedef View<typename t_host::const_data_type,
|
|
typename t_host::array_layout,
|
|
typename t_host::device_type,
|
|
MemoryUnmanaged> t_host_const_um;
|
|
|
|
//! The type of a const, random-access View on the device.
|
|
typedef View< typename t_host::const_data_type ,
|
|
typename t_host::array_layout ,
|
|
typename t_host::device_type ,
|
|
Kokkos::MemoryTraits<Kokkos::Unmanaged|Kokkos::RandomAccess> > t_dev_const_randomread_um ;
|
|
|
|
/// \typedef t_host_const_randomread
|
|
/// \brief The type of a const, random-access View host mirror of
|
|
/// \c t_dev_const_randomread.
|
|
typedef typename t_dev_const_randomread::HostMirror t_host_const_randomread_um;
|
|
|
|
//@}
|
|
//! \name The two View instances.
|
|
//@{
|
|
|
|
t_dev d_view;
|
|
t_host h_view;
|
|
|
|
//@}
|
|
//! \name Counters to keep track of changes ("modified" flags)
|
|
//@{
|
|
|
|
View<unsigned int,LayoutLeft,typename t_host::execution_space> modified_device;
|
|
View<unsigned int,LayoutLeft,typename t_host::execution_space> modified_host;
|
|
|
|
//@}
|
|
//! \name Constructors
|
|
//@{
|
|
|
|
/// \brief Empty constructor.
|
|
///
|
|
/// Both device and host View objects are constructed using their
|
|
/// default constructors. The "modified" flags are both initialized
|
|
/// to "unmodified."
|
|
DualView () :
|
|
modified_device (View<unsigned int,LayoutLeft,typename t_host::execution_space> ("DualView::modified_device")),
|
|
modified_host (View<unsigned int,LayoutLeft,typename t_host::execution_space> ("DualView::modified_host"))
|
|
{}
|
|
|
|
/// \brief Constructor that allocates View objects on both host and device.
|
|
///
|
|
/// This constructor works like the analogous constructor of View.
|
|
/// The first argument is a string label, which is entirely for your
|
|
/// benefit. (Different DualView objects may have the same label if
|
|
/// you like.) The arguments that follow are the dimensions of the
|
|
/// View objects. For example, if the View has three dimensions,
|
|
/// the first three integer arguments will be nonzero, and you may
|
|
/// omit the integer arguments that follow.
|
|
DualView (const std::string& label,
|
|
const size_t n0 = 0,
|
|
const size_t n1 = 0,
|
|
const size_t n2 = 0,
|
|
const size_t n3 = 0,
|
|
const size_t n4 = 0,
|
|
const size_t n5 = 0,
|
|
const size_t n6 = 0,
|
|
const size_t n7 = 0)
|
|
: d_view (label, n0, n1, n2, n3, n4, n5, n6, n7)
|
|
, h_view (create_mirror_view (d_view)) // without UVM, host View mirrors
|
|
, modified_device (View<unsigned int,LayoutLeft,typename t_host::execution_space> ("DualView::modified_device"))
|
|
, modified_host (View<unsigned int,LayoutLeft,typename t_host::execution_space> ("DualView::modified_host"))
|
|
{}
|
|
|
|
//! Copy constructor (shallow copy)
|
|
template<class SS, class LS, class DS, class MS>
|
|
DualView (const DualView<SS,LS,DS,MS>& src) :
|
|
d_view (src.d_view),
|
|
h_view (src.h_view),
|
|
modified_device (src.modified_device),
|
|
modified_host (src.modified_host)
|
|
{}
|
|
|
|
//! Subview constructor
|
|
template< class SD, class S1 , class S2 , class S3
|
|
, class Arg0 , class ... Args >
|
|
DualView( const DualView<SD,S1,S2,S3> & src
|
|
, const Arg0 & arg0
|
|
, Args ... args
|
|
)
|
|
: d_view( Kokkos::subview( src.d_view , arg0 , args ... ) )
|
|
, h_view( Kokkos::subview( src.h_view , arg0 , args ... ) )
|
|
, modified_device (src.modified_device)
|
|
, modified_host (src.modified_host)
|
|
{}
|
|
|
|
/// \brief Create DualView from existing device and host View objects.
|
|
///
|
|
/// This constructor assumes that the device and host View objects
|
|
/// are synchronized. You, the caller, are responsible for making
|
|
/// sure this is the case before calling this constructor. After
|
|
/// this constructor returns, you may use DualView's sync() and
|
|
/// modify() methods to ensure synchronization of the View objects.
|
|
///
|
|
/// \param d_view_ Device View
|
|
/// \param h_view_ Host View (must have type t_host = t_dev::HostMirror)
|
|
DualView (const t_dev& d_view_, const t_host& h_view_) :
|
|
d_view (d_view_),
|
|
h_view (h_view_),
|
|
modified_device (View<unsigned int,LayoutLeft,typename t_host::execution_space> ("DualView::modified_device")),
|
|
modified_host (View<unsigned int,LayoutLeft,typename t_host::execution_space> ("DualView::modified_host"))
|
|
{
|
|
#if ! KOKKOS_USING_EXP_VIEW
|
|
Impl::assert_shapes_are_equal (d_view.shape (), h_view.shape ());
|
|
#else
|
|
if ( int(d_view.rank) != int(h_view.rank) ||
|
|
d_view.dimension_0() != h_view.dimension_0() ||
|
|
d_view.dimension_1() != h_view.dimension_1() ||
|
|
d_view.dimension_2() != h_view.dimension_2() ||
|
|
d_view.dimension_3() != h_view.dimension_3() ||
|
|
d_view.dimension_4() != h_view.dimension_4() ||
|
|
d_view.dimension_5() != h_view.dimension_5() ||
|
|
d_view.dimension_6() != h_view.dimension_6() ||
|
|
d_view.dimension_7() != h_view.dimension_7() ||
|
|
d_view.stride_0() != h_view.stride_0() ||
|
|
d_view.stride_1() != h_view.stride_1() ||
|
|
d_view.stride_2() != h_view.stride_2() ||
|
|
d_view.stride_3() != h_view.stride_3() ||
|
|
d_view.stride_4() != h_view.stride_4() ||
|
|
d_view.stride_5() != h_view.stride_5() ||
|
|
d_view.stride_6() != h_view.stride_6() ||
|
|
d_view.stride_7() != h_view.stride_7() ||
|
|
d_view.span() != h_view.span() ) {
|
|
Kokkos::Impl::throw_runtime_exception("DualView constructed with incompatible views");
|
|
}
|
|
#endif
|
|
}
|
|
|
|
//@}
|
|
//! \name Methods for synchronizing, marking as modified, and getting Views.
|
|
//@{
|
|
|
|
/// \brief Return a View on a specific device \c Device.
|
|
///
|
|
/// Please don't be afraid of the if_c expression in the return
|
|
/// value's type. That just tells the method what the return type
|
|
/// should be: t_dev if the \c Device template parameter matches
|
|
/// this DualView's device type, else t_host.
|
|
///
|
|
/// For example, suppose you create a DualView on Cuda, like this:
|
|
/// \code
|
|
/// typedef Kokkos::DualView<float, Kokkos::LayoutRight, Kokkos::Cuda> dual_view_type;
|
|
/// dual_view_type DV ("my dual view", 100);
|
|
/// \endcode
|
|
/// If you want to get the CUDA device View, do this:
|
|
/// \code
|
|
/// typename dual_view_type::t_dev cudaView = DV.view<Kokkos::Cuda> ();
|
|
/// \endcode
|
|
/// and if you want to get the host mirror of that View, do this:
|
|
/// \code
|
|
/// typedef typename Kokkos::HostSpace::execution_space host_device_type;
|
|
/// typename dual_view_type::t_host hostView = DV.view<host_device_type> ();
|
|
/// \endcode
|
|
template< class Device >
|
|
KOKKOS_INLINE_FUNCTION
|
|
const typename Impl::if_c<
|
|
Impl::is_same<typename t_dev::memory_space,
|
|
typename Device::memory_space>::value,
|
|
t_dev,
|
|
t_host>::type& view () const
|
|
{
|
|
return Impl::if_c<
|
|
Impl::is_same<
|
|
typename t_dev::memory_space,
|
|
typename Device::memory_space>::value,
|
|
t_dev,
|
|
t_host >::select (d_view , h_view);
|
|
}
|
|
|
|
/// \brief Update data on device or host only if data in the other
|
|
/// space has been marked as modified.
|
|
///
|
|
/// If \c Device is the same as this DualView's device type, then
|
|
/// copy data from host to device. Otherwise, copy data from device
|
|
/// to host. In either case, only copy if the source of the copy
|
|
/// has been modified.
|
|
///
|
|
/// This is a one-way synchronization only. If the target of the
|
|
/// copy has been modified, this operation will discard those
|
|
/// modifications. It will also reset both device and host modified
|
|
/// flags.
|
|
///
|
|
/// \note This method doesn't know on its own whether you modified
|
|
/// the data in either View. You must manually mark modified data
|
|
/// as modified, by calling the modify() method with the
|
|
/// appropriate template parameter.
|
|
template<class Device>
|
|
void sync( const typename Impl::enable_if<
|
|
( Impl::is_same< typename traits::data_type , typename traits::non_const_data_type>::value) ||
|
|
( Impl::is_same< Device , int>::value)
|
|
, int >::type& = 0)
|
|
{
|
|
const unsigned int dev =
|
|
Impl::if_c<
|
|
Impl::is_same<
|
|
typename t_dev::memory_space,
|
|
typename Device::memory_space>::value ,
|
|
unsigned int,
|
|
unsigned int>::select (1, 0);
|
|
|
|
if (dev) { // if Device is the same as DualView's device type
|
|
if ((modified_host () > 0) && (modified_host () >= modified_device ())) {
|
|
deep_copy (d_view, h_view);
|
|
modified_host() = modified_device() = 0;
|
|
}
|
|
} else { // hopefully Device is the same as DualView's host type
|
|
if ((modified_device () > 0) && (modified_device () >= modified_host ())) {
|
|
deep_copy (h_view, d_view);
|
|
modified_host() = modified_device() = 0;
|
|
}
|
|
}
|
|
if(Impl::is_same<typename t_host::memory_space,typename t_dev::memory_space>::value) {
|
|
t_dev::execution_space::fence();
|
|
t_host::execution_space::fence();
|
|
}
|
|
}
|
|
|
|
template<class Device>
|
|
void sync ( const typename Impl::enable_if<
|
|
( ! Impl::is_same< typename traits::data_type , typename traits::non_const_data_type>::value ) ||
|
|
( Impl::is_same< Device , int>::value)
|
|
, int >::type& = 0 )
|
|
{
|
|
const unsigned int dev =
|
|
Impl::if_c<
|
|
Impl::is_same<
|
|
typename t_dev::memory_space,
|
|
typename Device::memory_space>::value,
|
|
unsigned int,
|
|
unsigned int>::select (1, 0);
|
|
if (dev) { // if Device is the same as DualView's device type
|
|
if ((modified_host () > 0) && (modified_host () >= modified_device ())) {
|
|
Impl::throw_runtime_exception("Calling sync on a DualView with a const datatype.");
|
|
}
|
|
} else { // hopefully Device is the same as DualView's host type
|
|
if ((modified_device () > 0) && (modified_device () >= modified_host ())) {
|
|
Impl::throw_runtime_exception("Calling sync on a DualView with a const datatype.");
|
|
}
|
|
}
|
|
}
|
|
|
|
template<class Device>
|
|
bool need_sync() const
|
|
{
|
|
const unsigned int dev =
|
|
Impl::if_c<
|
|
Impl::is_same<
|
|
typename t_dev::memory_space,
|
|
typename Device::memory_space>::value ,
|
|
unsigned int,
|
|
unsigned int>::select (1, 0);
|
|
|
|
if (dev) { // if Device is the same as DualView's device type
|
|
if ((modified_host () > 0) && (modified_host () >= modified_device ())) {
|
|
return true;
|
|
}
|
|
} else { // hopefully Device is the same as DualView's host type
|
|
if ((modified_device () > 0) && (modified_device () >= modified_host ())) {
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
/// \brief Mark data as modified on the given device \c Device.
|
|
///
|
|
/// If \c Device is the same as this DualView's device type, then
|
|
/// mark the device's data as modified. Otherwise, mark the host's
|
|
/// data as modified.
|
|
template<class Device>
|
|
void modify () {
|
|
const unsigned int dev =
|
|
Impl::if_c<
|
|
Impl::is_same<
|
|
typename t_dev::memory_space,
|
|
typename Device::memory_space>::value,
|
|
unsigned int,
|
|
unsigned int>::select (1, 0);
|
|
|
|
if (dev) { // if Device is the same as DualView's device type
|
|
// Increment the device's modified count.
|
|
modified_device () = (modified_device () > modified_host () ?
|
|
modified_device () : modified_host ()) + 1;
|
|
} else { // hopefully Device is the same as DualView's host type
|
|
// Increment the host's modified count.
|
|
modified_host () = (modified_device () > modified_host () ?
|
|
modified_device () : modified_host ()) + 1;
|
|
}
|
|
}
|
|
|
|
//@}
|
|
//! \name Methods for reallocating or resizing the View objects.
|
|
//@{
|
|
|
|
/// \brief Reallocate both View objects.
|
|
///
|
|
/// This discards any existing contents of the objects, and resets
|
|
/// their modified flags. It does <i>not</i> copy the old contents
|
|
/// of either View into the new View objects.
|
|
void realloc( const size_t n0 = 0 ,
|
|
const size_t n1 = 0 ,
|
|
const size_t n2 = 0 ,
|
|
const size_t n3 = 0 ,
|
|
const size_t n4 = 0 ,
|
|
const size_t n5 = 0 ,
|
|
const size_t n6 = 0 ,
|
|
const size_t n7 = 0 ) {
|
|
::Kokkos::realloc(d_view,n0,n1,n2,n3,n4,n5,n6,n7);
|
|
h_view = create_mirror_view( d_view );
|
|
|
|
/* Reset dirty flags */
|
|
modified_device() = modified_host() = 0;
|
|
}
|
|
|
|
/// \brief Resize both views, copying old contents into new if necessary.
|
|
///
|
|
/// This method only copies the old contents into the new View
|
|
/// objects for the device which was last marked as modified.
|
|
void resize( const size_t n0 = 0 ,
|
|
const size_t n1 = 0 ,
|
|
const size_t n2 = 0 ,
|
|
const size_t n3 = 0 ,
|
|
const size_t n4 = 0 ,
|
|
const size_t n5 = 0 ,
|
|
const size_t n6 = 0 ,
|
|
const size_t n7 = 0 ) {
|
|
if(modified_device() >= modified_host()) {
|
|
/* Resize on Device */
|
|
::Kokkos::resize(d_view,n0,n1,n2,n3,n4,n5,n6,n7);
|
|
h_view = create_mirror_view( d_view );
|
|
|
|
/* Mark Device copy as modified */
|
|
modified_device() = modified_device()+1;
|
|
|
|
} else {
|
|
/* Realloc on Device */
|
|
|
|
::Kokkos::realloc(d_view,n0,n1,n2,n3,n4,n5,n6,n7);
|
|
t_host temp_view = create_mirror_view( d_view );
|
|
|
|
/* Remap on Host */
|
|
Kokkos::deep_copy( temp_view , h_view );
|
|
|
|
h_view = temp_view;
|
|
|
|
/* Mark Host copy as modified */
|
|
modified_host() = modified_host()+1;
|
|
}
|
|
}
|
|
|
|
//@}
|
|
//! \name Methods for getting capacity, stride, or dimension(s).
|
|
//@{
|
|
|
|
//! The allocation size (same as Kokkos::View::capacity).
|
|
size_t capacity() const {
|
|
#if KOKKOS_USING_EXP_VIEW
|
|
return d_view.span();
|
|
#else
|
|
return d_view.capacity();
|
|
#endif
|
|
}
|
|
|
|
//! Get stride(s) for each dimension.
|
|
template< typename iType>
|
|
void stride(iType* stride_) const {
|
|
d_view.stride(stride_);
|
|
}
|
|
|
|
/* \brief return size of dimension 0 */
|
|
size_t dimension_0() const {return d_view.dimension_0();}
|
|
/* \brief return size of dimension 1 */
|
|
size_t dimension_1() const {return d_view.dimension_1();}
|
|
/* \brief return size of dimension 2 */
|
|
size_t dimension_2() const {return d_view.dimension_2();}
|
|
/* \brief return size of dimension 3 */
|
|
size_t dimension_3() const {return d_view.dimension_3();}
|
|
/* \brief return size of dimension 4 */
|
|
size_t dimension_4() const {return d_view.dimension_4();}
|
|
/* \brief return size of dimension 5 */
|
|
size_t dimension_5() const {return d_view.dimension_5();}
|
|
/* \brief return size of dimension 6 */
|
|
size_t dimension_6() const {return d_view.dimension_6();}
|
|
/* \brief return size of dimension 7 */
|
|
size_t dimension_7() const {return d_view.dimension_7();}
|
|
|
|
//@}
|
|
};
|
|
|
|
} // namespace Kokkos
|
|
|
|
//----------------------------------------------------------------------------
|
|
//----------------------------------------------------------------------------
|
|
//
|
|
// Partial specializations of Kokkos::subview() for DualView objects.
|
|
//
|
|
|
|
#if KOKKOS_USING_EXP_VIEW
|
|
|
|
namespace Kokkos {
|
|
namespace Impl {
|
|
|
|
template< class D, class A1, class A2, class A3, class ... Args >
|
|
struct DualViewSubview {
|
|
|
|
typedef typename Kokkos::Experimental::Impl::ViewMapping
|
|
< void
|
|
, Kokkos::ViewTraits< D, A1, A2, A3 >
|
|
, Args ...
|
|
>::traits_type dst_traits ;
|
|
|
|
typedef Kokkos::DualView
|
|
< typename dst_traits::data_type
|
|
, typename dst_traits::array_layout
|
|
, typename dst_traits::device_type
|
|
, typename dst_traits::memory_traits
|
|
> type ;
|
|
};
|
|
|
|
} /* namespace Impl */
|
|
|
|
|
|
template< class D , class A1 , class A2 , class A3 , class ... Args >
|
|
typename Impl::DualViewSubview<D,A1,A2,A3,Args...>::type
|
|
subview( const DualView<D,A1,A2,A3> & src , Args ... args )
|
|
{
|
|
return typename
|
|
Impl::DualViewSubview<D,A1,A2,A3,Args...>::type( src , args ... );
|
|
}
|
|
|
|
} /* namespace Kokkos */
|
|
|
|
#else
|
|
|
|
//----------------------------------------------------------------------------
|
|
//----------------------------------------------------------------------------
|
|
//
|
|
// Partial specializations of Kokkos::subview() for DualView objects.
|
|
//
|
|
|
|
namespace Kokkos {
|
|
namespace Impl {
|
|
|
|
template< class SrcDataType , class SrcArg1Type , class SrcArg2Type , class SrcArg3Type
|
|
, class SubArg0_type , class SubArg1_type , class SubArg2_type , class SubArg3_type
|
|
, class SubArg4_type , class SubArg5_type , class SubArg6_type , class SubArg7_type
|
|
>
|
|
struct ViewSubview< DualView< SrcDataType , SrcArg1Type , SrcArg2Type , SrcArg3Type >
|
|
, SubArg0_type , SubArg1_type , SubArg2_type , SubArg3_type
|
|
, SubArg4_type , SubArg5_type , SubArg6_type , SubArg7_type >
|
|
{
|
|
private:
|
|
|
|
typedef DualView< SrcDataType , SrcArg1Type , SrcArg2Type , SrcArg3Type > SrcViewType ;
|
|
|
|
enum { V0 = Impl::is_same< SubArg0_type , void >::value ? 1 : 0 };
|
|
enum { V1 = Impl::is_same< SubArg1_type , void >::value ? 1 : 0 };
|
|
enum { V2 = Impl::is_same< SubArg2_type , void >::value ? 1 : 0 };
|
|
enum { V3 = Impl::is_same< SubArg3_type , void >::value ? 1 : 0 };
|
|
enum { V4 = Impl::is_same< SubArg4_type , void >::value ? 1 : 0 };
|
|
enum { V5 = Impl::is_same< SubArg5_type , void >::value ? 1 : 0 };
|
|
enum { V6 = Impl::is_same< SubArg6_type , void >::value ? 1 : 0 };
|
|
enum { V7 = Impl::is_same< SubArg7_type , void >::value ? 1 : 0 };
|
|
|
|
// The source view rank must be equal to the input argument rank
|
|
// Once a void argument is encountered all subsequent arguments must be void.
|
|
enum { InputRank =
|
|
Impl::StaticAssert<( SrcViewType::rank ==
|
|
( V0 ? 0 : (
|
|
V1 ? 1 : (
|
|
V2 ? 2 : (
|
|
V3 ? 3 : (
|
|
V4 ? 4 : (
|
|
V5 ? 5 : (
|
|
V6 ? 6 : (
|
|
V7 ? 7 : 8 ))))))) ))
|
|
&&
|
|
( SrcViewType::rank ==
|
|
( 8 - ( V0 + V1 + V2 + V3 + V4 + V5 + V6 + V7 ) ) )
|
|
>::value ? SrcViewType::rank : 0 };
|
|
|
|
enum { R0 = Impl::ViewOffsetRange< SubArg0_type >::is_range ? 1 : 0 };
|
|
enum { R1 = Impl::ViewOffsetRange< SubArg1_type >::is_range ? 1 : 0 };
|
|
enum { R2 = Impl::ViewOffsetRange< SubArg2_type >::is_range ? 1 : 0 };
|
|
enum { R3 = Impl::ViewOffsetRange< SubArg3_type >::is_range ? 1 : 0 };
|
|
enum { R4 = Impl::ViewOffsetRange< SubArg4_type >::is_range ? 1 : 0 };
|
|
enum { R5 = Impl::ViewOffsetRange< SubArg5_type >::is_range ? 1 : 0 };
|
|
enum { R6 = Impl::ViewOffsetRange< SubArg6_type >::is_range ? 1 : 0 };
|
|
enum { R7 = Impl::ViewOffsetRange< SubArg7_type >::is_range ? 1 : 0 };
|
|
|
|
enum { OutputRank = unsigned(R0) + unsigned(R1) + unsigned(R2) + unsigned(R3)
|
|
+ unsigned(R4) + unsigned(R5) + unsigned(R6) + unsigned(R7) };
|
|
|
|
// Reverse
|
|
enum { R0_rev = 0 == InputRank ? 0u : (
|
|
1 == InputRank ? unsigned(R0) : (
|
|
2 == InputRank ? unsigned(R1) : (
|
|
3 == InputRank ? unsigned(R2) : (
|
|
4 == InputRank ? unsigned(R3) : (
|
|
5 == InputRank ? unsigned(R4) : (
|
|
6 == InputRank ? unsigned(R5) : (
|
|
7 == InputRank ? unsigned(R6) : unsigned(R7) ))))))) };
|
|
|
|
typedef typename SrcViewType::array_layout SrcViewLayout ;
|
|
|
|
// Choose array layout, attempting to preserve original layout if at all possible.
|
|
typedef typename Impl::if_c<
|
|
( // Same Layout IF
|
|
// OutputRank 0
|
|
( OutputRank == 0 )
|
|
||
|
|
// OutputRank 1 or 2, InputLayout Left, Interval 0
|
|
// because single stride one or second index has a stride.
|
|
( OutputRank <= 2 && R0 && Impl::is_same<SrcViewLayout,LayoutLeft>::value )
|
|
||
|
|
// OutputRank 1 or 2, InputLayout Right, Interval [InputRank-1]
|
|
// because single stride one or second index has a stride.
|
|
( OutputRank <= 2 && R0_rev && Impl::is_same<SrcViewLayout,LayoutRight>::value )
|
|
), SrcViewLayout , Kokkos::LayoutStride >::type OutputViewLayout ;
|
|
|
|
// Choose data type as a purely dynamic rank array to accomodate a runtime range.
|
|
typedef typename Impl::if_c< OutputRank == 0 , typename SrcViewType::value_type ,
|
|
typename Impl::if_c< OutputRank == 1 , typename SrcViewType::value_type *,
|
|
typename Impl::if_c< OutputRank == 2 , typename SrcViewType::value_type **,
|
|
typename Impl::if_c< OutputRank == 3 , typename SrcViewType::value_type ***,
|
|
typename Impl::if_c< OutputRank == 4 , typename SrcViewType::value_type ****,
|
|
typename Impl::if_c< OutputRank == 5 , typename SrcViewType::value_type *****,
|
|
typename Impl::if_c< OutputRank == 6 , typename SrcViewType::value_type ******,
|
|
typename Impl::if_c< OutputRank == 7 , typename SrcViewType::value_type *******,
|
|
typename SrcViewType::value_type ********
|
|
>::type >::type >::type >::type >::type >::type >::type >::type OutputData ;
|
|
|
|
// Choose space.
|
|
// If the source view's template arg1 or arg2 is a space then use it,
|
|
// otherwise use the source view's execution space.
|
|
|
|
typedef typename Impl::if_c< Impl::is_space< SrcArg1Type >::value , SrcArg1Type ,
|
|
typename Impl::if_c< Impl::is_space< SrcArg2Type >::value , SrcArg2Type , typename SrcViewType::execution_space
|
|
>::type >::type OutputSpace ;
|
|
|
|
public:
|
|
|
|
// If keeping the layout then match non-data type arguments
|
|
// else keep execution space and memory traits.
|
|
typedef typename
|
|
Impl::if_c< Impl::is_same< SrcViewLayout , OutputViewLayout >::value
|
|
, Kokkos::DualView< OutputData , SrcArg1Type , SrcArg2Type , SrcArg3Type >
|
|
, Kokkos::DualView< OutputData , OutputViewLayout , OutputSpace
|
|
, typename SrcViewType::memory_traits >
|
|
>::type type ;
|
|
};
|
|
|
|
} /* namespace Impl */
|
|
} /* namespace Kokkos */
|
|
|
|
namespace Kokkos {
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , void , void , void
|
|
, void , void , void , void
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , void , void , void
|
|
, void , void , void , void
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0);
|
|
sub_view.h_view = subview(src.h_view,arg0);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 , class ArgType1 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , void , void
|
|
, void , void , void , void
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 ,
|
|
const ArgType1 & arg1 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , void , void
|
|
, void , void , void , void
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0,arg1);
|
|
sub_view.h_view = subview(src.h_view,arg0,arg1);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 , class ArgType1 , class ArgType2 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , void
|
|
, void , void , void , void
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 ,
|
|
const ArgType1 & arg1 ,
|
|
const ArgType2 & arg2 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , void
|
|
, void , void , void , void
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0,arg1,arg2);
|
|
sub_view.h_view = subview(src.h_view,arg0,arg1,arg2);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 , class ArgType1 , class ArgType2 , class ArgType3 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, void , void , void , void
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 ,
|
|
const ArgType1 & arg1 ,
|
|
const ArgType2 & arg2 ,
|
|
const ArgType3 & arg3 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, void , void , void , void
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0,arg1,arg2,arg3);
|
|
sub_view.h_view = subview(src.h_view,arg0,arg1,arg2,arg3);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 , class ArgType1 , class ArgType2 , class ArgType3 ,
|
|
class ArgType4 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , void , void , void
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 ,
|
|
const ArgType1 & arg1 ,
|
|
const ArgType2 & arg2 ,
|
|
const ArgType3 & arg3 ,
|
|
const ArgType4 & arg4 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , void , void ,void
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0,arg1,arg2,arg3,arg4);
|
|
sub_view.h_view = subview(src.h_view,arg0,arg1,arg2,arg3,arg4);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 , class ArgType1 , class ArgType2 , class ArgType3 ,
|
|
class ArgType4 , class ArgType5 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , ArgType5 , void , void
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 ,
|
|
const ArgType1 & arg1 ,
|
|
const ArgType2 & arg2 ,
|
|
const ArgType3 & arg3 ,
|
|
const ArgType4 & arg4 ,
|
|
const ArgType5 & arg5 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , ArgType5 , void , void
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0,arg1,arg2,arg3,arg4,arg5);
|
|
sub_view.h_view = subview(src.h_view,arg0,arg1,arg2,arg3,arg4,arg5);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 , class ArgType1 , class ArgType2 , class ArgType3 ,
|
|
class ArgType4 , class ArgType5 , class ArgType6 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , ArgType5 , ArgType6 , void
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 ,
|
|
const ArgType1 & arg1 ,
|
|
const ArgType2 & arg2 ,
|
|
const ArgType3 & arg3 ,
|
|
const ArgType4 & arg4 ,
|
|
const ArgType5 & arg5 ,
|
|
const ArgType6 & arg6 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , ArgType5 , ArgType6 , void
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0,arg1,arg2,arg3,arg4,arg5,arg6);
|
|
sub_view.h_view = subview(src.h_view,arg0,arg1,arg2,arg3,arg4,arg5,arg6);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
template< class D , class A1 , class A2 , class A3 ,
|
|
class ArgType0 , class ArgType1 , class ArgType2 , class ArgType3 ,
|
|
class ArgType4 , class ArgType5 , class ArgType6 , class ArgType7 >
|
|
typename Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , ArgType5 , ArgType6 , ArgType7
|
|
>::type
|
|
subview( const DualView<D,A1,A2,A3> & src ,
|
|
const ArgType0 & arg0 ,
|
|
const ArgType1 & arg1 ,
|
|
const ArgType2 & arg2 ,
|
|
const ArgType3 & arg3 ,
|
|
const ArgType4 & arg4 ,
|
|
const ArgType5 & arg5 ,
|
|
const ArgType6 & arg6 ,
|
|
const ArgType7 & arg7 )
|
|
{
|
|
typedef typename
|
|
Impl::ViewSubview< DualView<D,A1,A2,A3>
|
|
, ArgType0 , ArgType1 , ArgType2 , ArgType3
|
|
, ArgType4 , ArgType5 , ArgType6 , ArgType7
|
|
>::type
|
|
DstViewType ;
|
|
DstViewType sub_view;
|
|
sub_view.d_view = subview(src.d_view,arg0,arg1,arg2,arg3,arg4,arg5,arg6,arg7);
|
|
sub_view.h_view = subview(src.h_view,arg0,arg1,arg2,arg3,arg4,arg5,arg6,arg7);
|
|
sub_view.modified_device = src.modified_device;
|
|
sub_view.modified_host = src.modified_host;
|
|
return sub_view;
|
|
}
|
|
|
|
} // namespace Kokkos
|
|
|
|
#endif /* KOKKOS_USING_EXP_VIEW */
|
|
|
|
//----------------------------------------------------------------------------
|
|
//----------------------------------------------------------------------------
|
|
|
|
namespace Kokkos {
|
|
|
|
//
|
|
// Partial specialization of Kokkos::deep_copy() for DualView objects.
|
|
//
|
|
|
|
template< class DT , class DL , class DD , class DM ,
|
|
class ST , class SL , class SD , class SM >
|
|
void
|
|
deep_copy (DualView<DT,DL,DD,DM> dst, // trust me, this must not be a reference
|
|
const DualView<ST,SL,SD,SM>& src )
|
|
{
|
|
if (src.modified_device () >= src.modified_host ()) {
|
|
deep_copy (dst.d_view, src.d_view);
|
|
dst.template modify<typename DualView<DT,DL,DD,DM>::device_type> ();
|
|
} else {
|
|
deep_copy (dst.h_view, src.h_view);
|
|
dst.template modify<typename DualView<DT,DL,DD,DM>::host_mirror_space> ();
|
|
}
|
|
}
|
|
|
|
template< class ExecutionSpace ,
|
|
class DT , class DL , class DD , class DM ,
|
|
class ST , class SL , class SD , class SM >
|
|
void
|
|
deep_copy (const ExecutionSpace& exec ,
|
|
DualView<DT,DL,DD,DM> dst, // trust me, this must not be a reference
|
|
const DualView<ST,SL,SD,SM>& src )
|
|
{
|
|
if (src.modified_device () >= src.modified_host ()) {
|
|
deep_copy (exec, dst.d_view, src.d_view);
|
|
dst.template modify<typename DualView<DT,DL,DD,DM>::device_type> ();
|
|
} else {
|
|
deep_copy (exec, dst.h_view, src.h_view);
|
|
dst.template modify<typename DualView<DT,DL,DD,DM>::host_mirror_space> ();
|
|
}
|
|
}
|
|
|
|
} // namespace Kokkos
|
|
|
|
#endif
|