Files
lammps/src/KOKKOS/atom_vec_sphere_kokkos.cpp
2022-12-12 17:34:18 -07:00

1735 lines
63 KiB
C++

// clang-format off
/* ----------------------------------------------------------------------
LAMMPS - Large-scale Atomic/Molecular Massively Parallel Simulator
https://www.lammps.org/, Sandia National Laboratories
LAMMPS development team: developers@lammps.org
Copyright (2003) Sandia Corporation. Under the terms of Contract
DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains
certain rights in this software. This software is distributed under
the GNU General Public License.
See the README file in the top-level LAMMPS directory.
------------------------------------------------------------------------- */
#include "atom_vec_sphere_kokkos.h"
#include "atom_kokkos.h"
#include "atom_masks.h"
#include "comm_kokkos.h"
#include "domain.h"
#include "error.h"
#include "fix.h"
#include "fix_adapt.h"
#include "math_const.h"
#include "memory.h"
#include "memory_kokkos.h"
#include "modify.h"
#include <cstring>
using namespace LAMMPS_NS;
using namespace MathConst;
/* ---------------------------------------------------------------------- */
AtomVecSphereKokkos::AtomVecSphereKokkos(LAMMPS *lmp) : AtomVec(lmp),
AtomVecKokkos(lmp), AtomVecSphere(lmp)
{
no_border_vel_flag = 0;
}
/* ----------------------------------------------------------------------
grow atom arrays
n = 0 grows arrays by a chunk
n > 0 allocates arrays to size n
------------------------------------------------------------------------- */
void AtomVecSphereKokkos::grow(int n)
{
auto DELTA = LMP_KOKKOS_AV_DELTA;
int step = MAX(DELTA,nmax*0.01);
if (n == 0) nmax += step;
else nmax = n;
atom->nmax = nmax;
if (nmax < 0 || nmax > MAXSMALLINT)
error->one(FLERR,"Per-processor system is too big");
atomKK->sync(Device,ALL_MASK);
atomKK->modified(Device,ALL_MASK);
memoryKK->grow_kokkos(atomKK->k_tag,atomKK->tag,nmax,"atom:tag");
memoryKK->grow_kokkos(atomKK->k_type,atomKK->type,nmax,"atom:type");
memoryKK->grow_kokkos(atomKK->k_mask,atomKK->mask,nmax,"atom:mask");
memoryKK->grow_kokkos(atomKK->k_image,atomKK->image,nmax,"atom:image");
memoryKK->grow_kokkos(atomKK->k_x,atomKK->x,nmax,"atom:x");
memoryKK->grow_kokkos(atomKK->k_v,atomKK->v,nmax,"atom:v");
memoryKK->grow_kokkos(atomKK->k_f,atomKK->f,nmax,"atom:f");
memoryKK->grow_kokkos(atomKK->k_radius,atomKK->radius,nmax,"atom:radius");
memoryKK->grow_kokkos(atomKK->k_rmass,atomKK->rmass,nmax,"atom:rmass");
memoryKK->grow_kokkos(atomKK->k_omega,atomKK->omega,nmax,"atom:omega");
memoryKK->grow_kokkos(atomKK->k_torque,atomKK->torque,nmax,"atom:torque");
if (atom->nextra_grow)
for (int iextra = 0; iextra < atom->nextra_grow; iextra++)
modify->fix[atom->extra_grow[iextra]]->grow_arrays(nmax);
grow_pointers();
atomKK->sync(Host,ALL_MASK);
}
/* ----------------------------------------------------------------------
reset local array ptrs
------------------------------------------------------------------------- */
void AtomVecSphereKokkos::grow_pointers()
{
tag = atomKK->tag;
d_tag = atomKK->k_tag.d_view;
h_tag = atomKK->k_tag.h_view;
type = atomKK->type;
d_type = atomKK->k_type.d_view;
h_type = atomKK->k_type.h_view;
mask = atomKK->mask;
d_mask = atomKK->k_mask.d_view;
h_mask = atomKK->k_mask.h_view;
image = atomKK->image;
d_image = atomKK->k_image.d_view;
h_image = atomKK->k_image.h_view;
x = atomKK->x;
d_x = atomKK->k_x.d_view;
h_x = atomKK->k_x.h_view;
v = atomKK->v;
d_v = atomKK->k_v.d_view;
h_v = atomKK->k_v.h_view;
f = atomKK->f;
d_f = atomKK->k_f.d_view;
h_f = atomKK->k_f.h_view;
radius = atomKK->radius;
d_radius = atomKK->k_radius.d_view;
h_radius = atomKK->k_radius.h_view;
rmass = atomKK->rmass;
d_rmass = atomKK->k_rmass.d_view;
h_rmass = atomKK->k_rmass.h_view;
omega = atomKK->omega;
d_omega = atomKK->k_omega.d_view;
h_omega = atomKK->k_omega.h_view;
torque = atomKK->torque;
d_torque = atomKK->k_torque.d_view;
h_torque = atomKK->k_torque.h_view;
}
/* ---------------------------------------------------------------------- */
template<class DeviceType,int PBC_FLAG,int TRICLINIC>
struct AtomVecSphereKokkos_PackComm {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_x_array_randomread _x;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
typename ArrayTypes<DeviceType>::t_xfloat_2d_um _buf;
typename ArrayTypes<DeviceType>::t_int_2d_const _list;
const int _iswap;
X_FLOAT _xprd,_yprd,_zprd,_xy,_xz,_yz;
X_FLOAT _pbc[6];
AtomVecSphereKokkos_PackComm(
const typename DAT::tdual_x_array &x,
const typename DAT::tdual_float_1d &radius,
const typename DAT::tdual_float_1d &rmass,
const typename DAT::tdual_xfloat_2d &buf,
const typename DAT::tdual_int_2d &list,
const int & iswap,
const X_FLOAT &xprd, const X_FLOAT &yprd, const X_FLOAT &zprd,
const X_FLOAT &xy, const X_FLOAT &xz, const X_FLOAT &yz, const int* const pbc):
_x(x.view<DeviceType>()),
_radius(radius.view<DeviceType>()),
_rmass(rmass.view<DeviceType>()),
_list(list.view<DeviceType>()),_iswap(iswap),
_xprd(xprd),_yprd(yprd),_zprd(zprd),
_xy(xy),_xz(xz),_yz(yz) {
const size_t elements = 5;
const size_t maxsend = (buf.view<DeviceType>().extent(0)*buf.view<DeviceType>().extent(1))/elements;
_buf = typename ArrayTypes<DeviceType>::t_xfloat_2d_um(buf.view<DeviceType>().data(),maxsend,elements);
_pbc[0] = pbc[0]; _pbc[1] = pbc[1]; _pbc[2] = pbc[2];
_pbc[3] = pbc[3]; _pbc[4] = pbc[4]; _pbc[5] = pbc[5];
}
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
const int j = _list(_iswap,i);
if (PBC_FLAG == 0) {
_buf(i,0) = _x(j,0);
_buf(i,1) = _x(j,1);
_buf(i,2) = _x(j,2);
} else {
if (TRICLINIC == 0) {
_buf(i,0) = _x(j,0) + _pbc[0]*_xprd;
_buf(i,1) = _x(j,1) + _pbc[1]*_yprd;
_buf(i,2) = _x(j,2) + _pbc[2]*_zprd;
} else {
_buf(i,0) = _x(j,0) + _pbc[0]*_xprd + _pbc[5]*_xy + _pbc[4]*_xz;
_buf(i,1) = _x(j,1) + _pbc[1]*_yprd + _pbc[3]*_yz;
_buf(i,2) = _x(j,2) + _pbc[2]*_zprd;
}
}
_buf(i,3) = _radius(j);
_buf(i,4) = _rmass(j);
}
};
/* ---------------------------------------------------------------------- */
int AtomVecSphereKokkos::pack_comm_kokkos(
const int &n,
const DAT::tdual_int_2d &list,
const int & iswap,
const DAT::tdual_xfloat_2d &buf,
const int &pbc_flag,
const int* const pbc)
{
// Fallback to AtomVecKokkos if radvary == 0
if (radvary == 0)
return AtomVecKokkos::pack_comm_kokkos(n,list,iswap,buf,pbc_flag,pbc);
// Check whether to always run forward communication on the host
// Choose correct forward PackComm kernel
if (commKK->forward_comm_on_host) {
atomKK->sync(Host,X_MASK|RADIUS_MASK|RMASS_MASK);
if (pbc_flag) {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackComm<LMPHostType,1,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackComm<LMPHostType,1,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
} else {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackComm<LMPHostType,0,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackComm<LMPHostType,0,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
}
} else {
atomKK->sync(Device,X_MASK|RADIUS_MASK|RMASS_MASK);
if (pbc_flag) {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackComm<LMPDeviceType,1,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackComm<LMPDeviceType,1,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
} else {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackComm<LMPDeviceType,0,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackComm<LMPDeviceType,0,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
}
}
return n*size_forward;
}
/* ---------------------------------------------------------------------- */
template<class DeviceType,int RADVARY,int PBC_FLAG,int TRICLINIC,int DEFORM_VREMAP>
struct AtomVecSphereKokkos_PackCommVel {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_x_array_randomread _x;
typename ArrayTypes<DeviceType>::t_int_1d _mask;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
typename ArrayTypes<DeviceType>::t_v_array _v, _omega;
typename ArrayTypes<DeviceType>::t_xfloat_2d_um _buf;
typename ArrayTypes<DeviceType>::t_int_2d_const _list;
const int _iswap;
X_FLOAT _xprd,_yprd,_zprd,_xy,_xz,_yz;
X_FLOAT _pbc[6];
X_FLOAT _h_rate[6];
const int _deform_vremap;
AtomVecSphereKokkos_PackCommVel(
const typename DAT::tdual_x_array &x,
const typename DAT::tdual_int_1d &mask,
const typename DAT::tdual_float_1d &radius,
const typename DAT::tdual_float_1d &rmass,
const typename DAT::tdual_v_array &v,
const typename DAT::tdual_v_array &omega,
const typename DAT::tdual_xfloat_2d &buf,
const typename DAT::tdual_int_2d &list,
const int &iswap,
const X_FLOAT &xprd, const X_FLOAT &yprd, const X_FLOAT &zprd,
const X_FLOAT &xy, const X_FLOAT &xz, const X_FLOAT &yz, const int* const pbc,
const double * const h_rate,
const int &deform_vremap):
_x(x.view<DeviceType>()),
_mask(mask.view<DeviceType>()),
_radius(radius.view<DeviceType>()),
_rmass(rmass.view<DeviceType>()),
_v(v.view<DeviceType>()),
_omega(omega.view<DeviceType>()),
_list(list.view<DeviceType>()),_iswap(iswap),
_xprd(xprd),_yprd(yprd),_zprd(zprd),
_xy(xy),_xz(xz),_yz(yz),
_deform_vremap(deform_vremap)
{
const size_t elements = 9 + 2 * RADVARY;
const int maxsend = (buf.template view<DeviceType>().extent(0)*buf.template view<DeviceType>().extent(1))/elements;
_buf = typename ArrayTypes<DeviceType>::t_xfloat_2d_um(buf.view<DeviceType>().data(),maxsend,elements);
_pbc[0] = pbc[0]; _pbc[1] = pbc[1]; _pbc[2] = pbc[2];
_pbc[3] = pbc[3]; _pbc[4] = pbc[4]; _pbc[5] = pbc[5];
_h_rate[0] = h_rate[0]; _h_rate[1] = h_rate[1]; _h_rate[2] = h_rate[2];
_h_rate[3] = h_rate[3]; _h_rate[4] = h_rate[4]; _h_rate[5] = h_rate[5];
}
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
const int j = _list(_iswap,i);
if (PBC_FLAG == 0) {
_buf(i,0) = _x(j,0);
_buf(i,1) = _x(j,1);
_buf(i,2) = _x(j,2);
} else {
if (TRICLINIC == 0) {
_buf(i,0) = _x(j,0) + _pbc[0]*_xprd;
_buf(i,1) = _x(j,1) + _pbc[1]*_yprd;
_buf(i,2) = _x(j,2) + _pbc[2]*_zprd;
} else {
_buf(i,0) = _x(j,0) + _pbc[0]*_xprd + _pbc[5]*_xy + _pbc[4]*_xz;
_buf(i,1) = _x(j,1) + _pbc[1]*_yprd + _pbc[3]*_yz;
_buf(i,2) = _x(j,2) + _pbc[2]*_zprd;
}
}
if (DEFORM_VREMAP == 0) {
_buf(i,3) = _v(j,0);
_buf(i,4) = _v(j,1);
_buf(i,5) = _v(j,2);
} else {
if (_mask(i) & _deform_vremap) {
_buf(i,3) = _v(j,0) + _pbc[0]*_h_rate[0] + _pbc[5]*_h_rate[5] + _pbc[4]*_h_rate[4];
_buf(i,4) = _v(j,1) + _pbc[1]*_h_rate[1] + _pbc[3]*_h_rate[3];
_buf(i,5) = _v(j,2) + _pbc[2]*_h_rate[2];
} else {
_buf(i,3) = _v(j,0);
_buf(i,4) = _v(j,1);
_buf(i,5) = _v(j,2);
}
}
_buf(i,6) = _omega(j,0);
_buf(i,7) = _omega(j,1);
_buf(i,8) = _omega(j,2);
if (RADVARY) {
_buf(i,9) = _radius(j);
_buf(i,10) = _rmass(j);
}
}
};
/* ---------------------------------------------------------------------- */
int AtomVecSphereKokkos::pack_comm_vel_kokkos(
const int &n,
const DAT::tdual_int_2d &list,
const int & iswap,
const DAT::tdual_xfloat_2d &buf,
const int &pbc_flag,
const int* const pbc)
{
if (commKK->forward_comm_on_host) {
atomKK->sync(Host,X_MASK|RADIUS_MASK|RMASS_MASK|V_MASK|OMEGA_MASK);
if (pbc_flag) {
if (deform_vremap) {
if (domain->triclinic) {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,0,1,1,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,1,1,1,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
} else {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,0,1,0,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,1,1,0,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
}
} else {
if (domain->triclinic) {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,0,1,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,1,1,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
} else {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,0,1,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,1,1,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
}
}
} else {
if (domain->triclinic) {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,0,0,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,1,0,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
} else {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,0,0,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPHostType,1,0,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
}
}
} else {
atomKK->sync(Device,X_MASK|RADIUS_MASK|RMASS_MASK|V_MASK|OMEGA_MASK);
if (pbc_flag) {
if (deform_vremap) {
if (domain->triclinic) {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,0,1,1,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,1,1,1,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
} else {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,0,1,0,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,1,1,0,1> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
}
} else {
if (domain->triclinic) {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,0,1,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,1,1,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
} else {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,0,1,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,1,1,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
}
}
} else {
if (domain->triclinic) {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,0,0,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,1,0,1,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
} else {
if (radvary == 0) {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,0,0,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommVel<LMPDeviceType,1,0,0,0> f(
atomKK->k_x,atomKK->k_mask,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc,h_rate,deform_vremap);
Kokkos::parallel_for(n,f);
}
}
}
}
return n*(size_forward+size_velocity);
}
/* ---------------------------------------------------------------------- */
template<class DeviceType,int PBC_FLAG,int TRICLINIC>
struct AtomVecSphereKokkos_PackCommSelf {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_x_array_randomread _x;
typename ArrayTypes<DeviceType>::t_x_array _xw;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
int _nfirst;
typename ArrayTypes<DeviceType>::t_int_2d_const _list;
const int _iswap;
X_FLOAT _xprd,_yprd,_zprd,_xy,_xz,_yz;
X_FLOAT _pbc[6];
AtomVecSphereKokkos_PackCommSelf(
const typename DAT::tdual_x_array &x,
const typename DAT::tdual_float_1d &radius,
const typename DAT::tdual_float_1d &rmass,
const int &nfirst,
const typename DAT::tdual_int_2d &list,
const int & iswap,
const X_FLOAT &xprd, const X_FLOAT &yprd, const X_FLOAT &zprd,
const X_FLOAT &xy, const X_FLOAT &xz, const X_FLOAT &yz, const int* const pbc):
_x(x.view<DeviceType>()),_xw(x.view<DeviceType>()),
_radius(radius.view<DeviceType>()),
_rmass(rmass.view<DeviceType>()),
_nfirst(nfirst),_list(list.view<DeviceType>()),_iswap(iswap),
_xprd(xprd),_yprd(yprd),_zprd(zprd),
_xy(xy),_xz(xz),_yz(yz) {
_pbc[0] = pbc[0]; _pbc[1] = pbc[1]; _pbc[2] = pbc[2];
_pbc[3] = pbc[3]; _pbc[4] = pbc[4]; _pbc[5] = pbc[5];
};
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
const int j = _list(_iswap,i);
if (PBC_FLAG == 0) {
_xw(i+_nfirst,0) = _x(j,0);
_xw(i+_nfirst,1) = _x(j,1);
_xw(i+_nfirst,2) = _x(j,2);
} else {
if (TRICLINIC == 0) {
_xw(i+_nfirst,0) = _x(j,0) + _pbc[0]*_xprd;
_xw(i+_nfirst,1) = _x(j,1) + _pbc[1]*_yprd;
_xw(i+_nfirst,2) = _x(j,2) + _pbc[2]*_zprd;
} else {
_xw(i+_nfirst,0) = _x(j,0) + _pbc[0]*_xprd + _pbc[5]*_xy + _pbc[4]*_xz;
_xw(i+_nfirst,1) = _x(j,1) + _pbc[1]*_yprd + _pbc[3]*_yz;
_xw(i+_nfirst,2) = _x(j,2) + _pbc[2]*_zprd;
}
}
_radius(i+_nfirst) = _radius(j);
_rmass(i+_nfirst) = _rmass(j);
}
};
/* ---------------------------------------------------------------------- */
int AtomVecSphereKokkos::pack_comm_self(
const int &n, const DAT::tdual_int_2d &list, const int &iswap,
const int nfirst, const int &pbc_flag, const int* const pbc) {
// Fallback to AtomVecKokkos if radvary == 0
if (radvary == 0)
return AtomVecKokkos::pack_comm_self(n,list,iswap,nfirst,pbc_flag,pbc);
if (commKK->forward_comm_on_host) {
atomKK->sync(Host,X_MASK|RADIUS_MASK|RMASS_MASK);
atomKK->modified(Host,X_MASK|RADIUS_MASK|RMASS_MASK);
if (pbc_flag) {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackCommSelf<LMPHostType,1,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommSelf<LMPHostType,1,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
} else {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackCommSelf<LMPHostType,0,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommSelf<LMPHostType,0,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
}
} else {
atomKK->sync(Device,X_MASK|RADIUS_MASK|RMASS_MASK);
atomKK->modified(Device,X_MASK|RADIUS_MASK|RMASS_MASK);
if (pbc_flag) {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackCommSelf<LMPDeviceType,1,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommSelf<LMPDeviceType,1,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
} else {
if (domain->triclinic) {
struct AtomVecSphereKokkos_PackCommSelf<LMPDeviceType,0,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_PackCommSelf<LMPDeviceType,0,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
nfirst,list,iswap,
domain->xprd,domain->yprd,domain->zprd,
domain->xy,domain->xz,domain->yz,pbc);
Kokkos::parallel_for(n,f);
}
}
}
return n*size_forward;
}
/* ---------------------------------------------------------------------- */
template<class DeviceType>
struct AtomVecSphereKokkos_UnpackComm {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_x_array _x;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
typename ArrayTypes<DeviceType>::t_xfloat_2d_const_um _buf;
int _first;
AtomVecSphereKokkos_UnpackComm(
const typename DAT::tdual_x_array &x,
const typename DAT::tdual_float_1d &radius,
const typename DAT::tdual_float_1d &rmass,
const typename DAT::tdual_xfloat_2d &buf,
const int& first):
_x(x.view<DeviceType>()),
_radius(radius.view<DeviceType>()),
_rmass(rmass.view<DeviceType>()),
_first(first)
{
const size_t elements = 5;
const size_t maxsend = (buf.view<DeviceType>().extent(0)*buf.view<DeviceType>().extent(1))/elements;
_buf = typename ArrayTypes<DeviceType>::t_xfloat_2d_const_um(buf.view<DeviceType>().data(),maxsend,elements);
};
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
_x(i+_first,0) = _buf(i,0);
_x(i+_first,1) = _buf(i,1);
_x(i+_first,2) = _buf(i,2);
_radius(i+_first) = _buf(i,3);
_rmass(i+_first) = _buf(i,4);
}
};
/* ---------------------------------------------------------------------- */
void AtomVecSphereKokkos::unpack_comm_kokkos(
const int &n, const int &first,
const DAT::tdual_xfloat_2d &buf) {
// Fallback to AtomVecKokkos if radvary == 0
if (radvary == 0) {
AtomVecKokkos::unpack_comm_kokkos(n,first,buf);
return;
}
if (commKK->forward_comm_on_host) {
atomKK->modified(Host,X_MASK|RADIUS_MASK|RMASS_MASK);
struct AtomVecSphereKokkos_UnpackComm<LMPHostType> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,first);
Kokkos::parallel_for(n,f);
} else {
atomKK->modified(Device,X_MASK|RADIUS_MASK|RMASS_MASK);
struct AtomVecSphereKokkos_UnpackComm<LMPDeviceType> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
buf,first);
Kokkos::parallel_for(n,f);
}
}
/* ---------------------------------------------------------------------- */
template<class DeviceType,int RADVARY>
struct AtomVecSphereKokkos_UnpackCommVel {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_x_array _x;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
typename ArrayTypes<DeviceType>::t_v_array _v, _omega;
typename ArrayTypes<DeviceType>::t_xfloat_2d_const _buf;
int _first;
AtomVecSphereKokkos_UnpackCommVel(
const typename DAT::tdual_x_array &x,
const typename DAT::tdual_float_1d &radius,
const typename DAT::tdual_float_1d &rmass,
const typename DAT::tdual_v_array &v,
const typename DAT::tdual_v_array &omega,
const typename DAT::tdual_xfloat_2d &buf,
const int& first):
_x(x.view<DeviceType>()),
_radius(radius.view<DeviceType>()),
_rmass(rmass.view<DeviceType>()),
_v(v.view<DeviceType>()),
_omega(omega.view<DeviceType>()),
_first(first)
{
const size_t elements = 9 + 2 * RADVARY;
const int maxsend = (buf.template view<DeviceType>().extent(0)*buf.template view<DeviceType>().extent(1))/elements;
buffer_view<DeviceType>(_buf,buf,maxsend,elements);
};
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
_x(i+_first,0) = _buf(i,0);
_x(i+_first,1) = _buf(i,1);
_x(i+_first,2) = _buf(i,2);
_v(i+_first,0) = _buf(i,3);
_v(i+_first,1) = _buf(i,4);
_v(i+_first,2) = _buf(i,5);
_omega(i+_first,0) = _buf(i,6);
_omega(i+_first,1) = _buf(i,7);
_omega(i+_first,2) = _buf(i,8);
if (RADVARY) {
_radius(i+_first) = _buf(i,9);
_rmass(i+_first) = _buf(i,10);
}
}
};
/* ---------------------------------------------------------------------- */
void AtomVecSphereKokkos::unpack_comm_vel_kokkos(
const int &n, const int &first,
const DAT::tdual_xfloat_2d &buf) {
if (commKK->forward_comm_on_host) {
atomKK->modified(Host,X_MASK|RADIUS_MASK|RMASS_MASK|V_MASK|OMEGA_MASK);
if (radvary == 0) {
struct AtomVecSphereKokkos_UnpackCommVel<LMPHostType,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,first);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_UnpackCommVel<LMPHostType,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,first);
Kokkos::parallel_for(n,f);
}
} else {
atomKK->modified(Device,X_MASK|RADIUS_MASK|RMASS_MASK|V_MASK|OMEGA_MASK);
if (radvary == 0) {
struct AtomVecSphereKokkos_UnpackCommVel<LMPDeviceType,0> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,first);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_UnpackCommVel<LMPDeviceType,1> f(
atomKK->k_x,
atomKK->k_radius,atomKK->k_rmass,
atomKK->k_v,atomKK->k_omega,
buf,first);
Kokkos::parallel_for(n,f);
}
}
}
/* ---------------------------------------------------------------------- */
template<class DeviceType,int PBC_FLAG>
struct AtomVecSphereKokkos_PackBorder {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_xfloat_2d_um _buf;
const typename ArrayTypes<DeviceType>::t_int_2d_const _list;
const int _iswap;
const typename ArrayTypes<DeviceType>::t_x_array_randomread _x;
const typename ArrayTypes<DeviceType>::t_tagint_1d _tag;
const typename ArrayTypes<DeviceType>::t_int_1d _type;
const typename ArrayTypes<DeviceType>::t_int_1d _mask;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
X_FLOAT _dx,_dy,_dz;
AtomVecSphereKokkos_PackBorder(
const typename ArrayTypes<DeviceType>::t_xfloat_2d &buf,
const typename ArrayTypes<DeviceType>::t_int_2d_const &list,
const int &iswap,
const typename ArrayTypes<DeviceType>::t_x_array &x,
const typename ArrayTypes<DeviceType>::t_tagint_1d &tag,
const typename ArrayTypes<DeviceType>::t_int_1d &type,
const typename ArrayTypes<DeviceType>::t_int_1d &mask,
const typename ArrayTypes<DeviceType>::t_float_1d &radius,
const typename ArrayTypes<DeviceType>::t_float_1d &rmass,
const X_FLOAT &dx, const X_FLOAT &dy, const X_FLOAT &dz):
_list(list),_iswap(iswap),
_x(x),_tag(tag),_type(type),_mask(mask),
_radius(radius),
_rmass(rmass),
_dx(dx),_dy(dy),_dz(dz)
{
const size_t elements = 8;
const int maxsend = (buf.extent(0)*buf.extent(1))/elements;
_buf = typename ArrayTypes<DeviceType>::t_xfloat_2d_um(buf.data(),maxsend,elements);
}
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
const int j = _list(_iswap,i);
if (PBC_FLAG == 0) {
_buf(i,0) = _x(j,0);
_buf(i,1) = _x(j,1);
_buf(i,2) = _x(j,2);
} else {
_buf(i,0) = _x(j,0) + _dx;
_buf(i,1) = _x(j,1) + _dy;
_buf(i,2) = _x(j,2) + _dz;
}
_buf(i,3) = d_ubuf(_tag(j)).d;
_buf(i,4) = d_ubuf(_type(j)).d;
_buf(i,5) = d_ubuf(_mask(j)).d;
_buf(i,6) = _radius(j);
_buf(i,7) = _rmass(j);
}
};
/* ---------------------------------------------------------------------- */
int AtomVecSphereKokkos::pack_border_kokkos(
int n, DAT::tdual_int_2d k_sendlist, DAT::tdual_xfloat_2d buf,int iswap,
int pbc_flag, int *pbc, ExecutionSpace space)
{
X_FLOAT dx,dy,dz;
// This was in atom_vec_dpd_kokkos but doesn't appear in any other atom_vec
atomKK->sync(space,ALL_MASK);
if (pbc_flag != 0) {
if (domain->triclinic == 0) {
dx = pbc[0]*domain->xprd;
dy = pbc[1]*domain->yprd;
dz = pbc[2]*domain->zprd;
} else {
dx = pbc[0];
dy = pbc[1];
dz = pbc[2];
}
if (space==Host) {
AtomVecSphereKokkos_PackBorder<LMPHostType,1> f(
buf.view<LMPHostType>(), k_sendlist.view<LMPHostType>(),
iswap,h_x,h_tag,h_type,h_mask,
h_radius,h_rmass,
dx,dy,dz);
Kokkos::parallel_for(n,f);
} else {
AtomVecSphereKokkos_PackBorder<LMPDeviceType,1> f(
buf.view<LMPDeviceType>(), k_sendlist.view<LMPDeviceType>(),
iswap,d_x,d_tag,d_type,d_mask,
d_radius,d_rmass,
dx,dy,dz);
Kokkos::parallel_for(n,f);
}
} else {
dx = dy = dz = 0;
if (space==Host) {
AtomVecSphereKokkos_PackBorder<LMPHostType,0> f(
buf.view<LMPHostType>(), k_sendlist.view<LMPHostType>(),
iswap,h_x,h_tag,h_type,h_mask,
h_radius,h_rmass,
dx,dy,dz);
Kokkos::parallel_for(n,f);
} else {
AtomVecSphereKokkos_PackBorder<LMPDeviceType,0> f(
buf.view<LMPDeviceType>(), k_sendlist.view<LMPDeviceType>(),
iswap,d_x,d_tag,d_type,d_mask,
d_radius,d_rmass,
dx,dy,dz);
Kokkos::parallel_for(n,f);
}
}
return n*size_border;
}
/* ---------------------------------------------------------------------- */
template<class DeviceType,int PBC_FLAG,int DEFORM_VREMAP>
struct AtomVecSphereKokkos_PackBorderVel {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_xfloat_2d_um _buf;
const typename ArrayTypes<DeviceType>::t_int_2d_const _list;
const int _iswap;
const typename ArrayTypes<DeviceType>::t_x_array_randomread _x;
const typename ArrayTypes<DeviceType>::t_tagint_1d _tag;
const typename ArrayTypes<DeviceType>::t_int_1d _type;
const typename ArrayTypes<DeviceType>::t_int_1d _mask;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
typename ArrayTypes<DeviceType>::t_v_array _v, _omega;
X_FLOAT _dx,_dy,_dz, _dvx, _dvy, _dvz;
const int _deform_groupbit;
AtomVecSphereKokkos_PackBorderVel(
const typename ArrayTypes<DeviceType>::t_xfloat_2d &buf,
const typename ArrayTypes<DeviceType>::t_int_2d_const &list,
const int &iswap,
const typename ArrayTypes<DeviceType>::t_x_array &x,
const typename ArrayTypes<DeviceType>::t_tagint_1d &tag,
const typename ArrayTypes<DeviceType>::t_int_1d &type,
const typename ArrayTypes<DeviceType>::t_int_1d &mask,
const typename ArrayTypes<DeviceType>::t_float_1d &radius,
const typename ArrayTypes<DeviceType>::t_float_1d &rmass,
const typename ArrayTypes<DeviceType>::t_v_array &v,
const typename ArrayTypes<DeviceType>::t_v_array &omega,
const X_FLOAT &dx, const X_FLOAT &dy, const X_FLOAT &dz,
const X_FLOAT &dvx, const X_FLOAT &dvy, const X_FLOAT &dvz,
const int &deform_groupbit):
_buf(buf),_list(list),_iswap(iswap),
_x(x),_tag(tag),_type(type),_mask(mask),
_radius(radius),
_rmass(rmass),
_v(v), _omega(omega),
_dx(dx),_dy(dy),_dz(dz),
_dvx(dvx),_dvy(dvy),_dvz(dvz),
_deform_groupbit(deform_groupbit)
{
const size_t elements = 14;
const int maxsend = (buf.extent(0)*buf.extent(1))/elements;
_buf = typename ArrayTypes<DeviceType>::t_xfloat_2d_um(buf.data(),maxsend,elements);
}
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
const int j = _list(_iswap,i);
if (PBC_FLAG == 0) {
_buf(i,0) = _x(j,0);
_buf(i,1) = _x(j,1);
_buf(i,2) = _x(j,2);
} else {
_buf(i,0) = _x(j,0) + _dx;
_buf(i,1) = _x(j,1) + _dy;
_buf(i,2) = _x(j,2) + _dz;
}
_buf(i,3) = d_ubuf(_tag(j)).d;
_buf(i,4) = d_ubuf(_type(j)).d;
_buf(i,5) = d_ubuf(_mask(j)).d;
_buf(i,6) = _radius(j);
_buf(i,7) = _rmass(j);
if (DEFORM_VREMAP) {
if (_mask(i) & _deform_groupbit) {
_buf(i,8) = _v(j,0) + _dvx;
_buf(i,9) = _v(j,1) + _dvy;
_buf(i,10) = _v(j,2) + _dvz;
}
}
else {
_buf(i,8) = _v(j,0);
_buf(i,9) = _v(j,1);
_buf(i,10) = _v(j,2);
}
_buf(i,11) = _omega(j,0);
_buf(i,12) = _omega(j,1);
_buf(i,13) = _omega(j,2);
}
};
/* ---------------------------------------------------------------------- */
int AtomVecSphereKokkos::pack_border_vel_kokkos(
int n, DAT::tdual_int_2d k_sendlist, DAT::tdual_xfloat_2d buf,int iswap,
int pbc_flag, int *pbc, ExecutionSpace space)
{
X_FLOAT dx=0,dy=0,dz=0;
X_FLOAT dvx=0,dvy=0,dvz=0;
// This was in atom_vec_dpd_kokkos but doesn't appear in any other atom_vec
atomKK->sync(space,ALL_MASK);
if (pbc_flag != 0) {
if (domain->triclinic == 0) {
dx = pbc[0]*domain->xprd;
dy = pbc[1]*domain->yprd;
dz = pbc[2]*domain->zprd;
} else {
dx = pbc[0];
dy = pbc[1];
dz = pbc[2];
}
if (!deform_vremap) {
if (space==Host) {
AtomVecSphereKokkos_PackBorderVel<LMPHostType,1,0> f(
buf.view<LMPHostType>(), k_sendlist.view<LMPHostType>(),
iswap,h_x,h_tag,h_type,h_mask,
h_radius,h_rmass,
h_v, h_omega,
dx,dy,dz,dvx,dvy,dvz,
deform_groupbit);
Kokkos::parallel_for(n,f);
} else {
AtomVecSphereKokkos_PackBorderVel<LMPDeviceType,1,0> f(
buf.view<LMPDeviceType>(), k_sendlist.view<LMPDeviceType>(),
iswap,d_x,d_tag,d_type,d_mask,
d_radius,d_rmass,
d_v, d_omega,
dx,dy,dz,dvx,dvy,dvz,
deform_groupbit);
Kokkos::parallel_for(n,f);
}
}
else {
dvx = pbc[0]*h_rate[0] + pbc[5]*h_rate[5] + pbc[4]*h_rate[4];
dvy = pbc[1]*h_rate[1] + pbc[3]*h_rate[3];
dvz = pbc[2]*h_rate[2];
if (space==Host) {
AtomVecSphereKokkos_PackBorderVel<LMPHostType,1,1> f(
buf.view<LMPHostType>(), k_sendlist.view<LMPHostType>(),
iswap,h_x,h_tag,h_type,h_mask,
h_radius,h_rmass,
h_v, h_omega,
dx,dy,dz,dvx,dvy,dvz,
deform_groupbit);
Kokkos::parallel_for(n,f);
} else {
AtomVecSphereKokkos_PackBorderVel<LMPDeviceType,1,1> f(
buf.view<LMPDeviceType>(), k_sendlist.view<LMPDeviceType>(),
iswap,d_x,d_tag,d_type,d_mask,
d_radius,d_rmass,
d_v, d_omega,
dx,dy,dz,dvx,dvy,dvz,
deform_groupbit);
Kokkos::parallel_for(n,f);
}
}
} else {
if (space==Host) {
AtomVecSphereKokkos_PackBorderVel<LMPHostType,0,0> f(
buf.view<LMPHostType>(), k_sendlist.view<LMPHostType>(),
iswap,h_x,h_tag,h_type,h_mask,
h_radius,h_rmass,
h_v, h_omega,
dx,dy,dz,dvx,dvy,dvz,
deform_groupbit);
Kokkos::parallel_for(n,f);
} else {
AtomVecSphereKokkos_PackBorderVel<LMPDeviceType,0,0> f(
buf.view<LMPDeviceType>(), k_sendlist.view<LMPDeviceType>(),
iswap,d_x,d_tag,d_type,d_mask,
d_radius,d_rmass,
d_v, d_omega,
dx,dy,dz,dvx,dvy,dvz,
deform_groupbit);
Kokkos::parallel_for(n,f);
}
}
return n*(size_border + size_velocity);
}
/* ---------------------------------------------------------------------- */
template<class DeviceType>
struct AtomVecSphereKokkos_UnpackBorder {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_xfloat_2d_const_um _buf;
typename ArrayTypes<DeviceType>::t_x_array _x;
typename ArrayTypes<DeviceType>::t_tagint_1d _tag;
typename ArrayTypes<DeviceType>::t_int_1d _type;
typename ArrayTypes<DeviceType>::t_int_1d _mask;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
int _first;
AtomVecSphereKokkos_UnpackBorder(
const typename ArrayTypes<DeviceType>::t_xfloat_2d &buf,
const typename ArrayTypes<DeviceType>::t_x_array &x,
const typename ArrayTypes<DeviceType>::t_tagint_1d &tag,
const typename ArrayTypes<DeviceType>::t_int_1d &type,
const typename ArrayTypes<DeviceType>::t_int_1d &mask,
const typename ArrayTypes<DeviceType>::t_float_1d &radius,
const typename ArrayTypes<DeviceType>::t_float_1d &rmass,
const int& first):
_buf(buf),_x(x),_tag(tag),_type(type),_mask(mask),
_radius(radius),
_rmass(rmass),
_first(first)
{
const size_t elements = 8;
const int maxsend = (buf.extent(0)*buf.extent(1))/elements;
_buf = typename ArrayTypes<DeviceType>::t_xfloat_2d_const_um(buf.data(),maxsend,elements);
};
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
_x(i+_first,0) = _buf(i,0);
_x(i+_first,1) = _buf(i,1);
_x(i+_first,2) = _buf(i,2);
_tag(i+_first) = static_cast<tagint> (d_ubuf(_buf(i,3)).i);
_type(i+_first) = static_cast<int> (d_ubuf(_buf(i,4)).i);
_mask(i+_first) = static_cast<int> (d_ubuf(_buf(i,5)).i);
_radius(i+_first) = _buf(i,6);
_rmass(i+_first) = _buf(i,7);
}
};
/* ---------------------------------------------------------------------- */
void AtomVecSphereKokkos::unpack_border_kokkos(const int &n, const int &first,
const DAT::tdual_xfloat_2d &buf,ExecutionSpace space) {
while (first+n >= nmax) grow(0);
if (space==Host) {
struct AtomVecSphereKokkos_UnpackBorder<LMPHostType> f(buf.view<LMPHostType>(),
h_x,h_tag,h_type,h_mask,
h_radius,h_rmass,
first);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_UnpackBorder<LMPDeviceType> f(buf.view<LMPDeviceType>(),
d_x,d_tag,d_type,d_mask,
d_radius,d_rmass,
first);
Kokkos::parallel_for(n,f);
}
atomKK->modified(space,X_MASK|TAG_MASK|TYPE_MASK|MASK_MASK|
RADIUS_MASK|RMASS_MASK);
}
/* ---------------------------------------------------------------------- */
template<class DeviceType>
struct AtomVecSphereKokkos_UnpackBorderVel {
typedef DeviceType device_type;
typename ArrayTypes<DeviceType>::t_xfloat_2d_const_um _buf;
typename ArrayTypes<DeviceType>::t_x_array _x;
typename ArrayTypes<DeviceType>::t_tagint_1d _tag;
typename ArrayTypes<DeviceType>::t_int_1d _type;
typename ArrayTypes<DeviceType>::t_int_1d _mask;
typename ArrayTypes<DeviceType>::t_float_1d _radius,_rmass;
typename ArrayTypes<DeviceType>::t_v_array _v;
typename ArrayTypes<DeviceType>::t_v_array _omega;
int _first;
AtomVecSphereKokkos_UnpackBorderVel(
const typename ArrayTypes<DeviceType>::t_xfloat_2d_const &buf,
const typename ArrayTypes<DeviceType>::t_x_array &x,
const typename ArrayTypes<DeviceType>::t_tagint_1d &tag,
const typename ArrayTypes<DeviceType>::t_int_1d &type,
const typename ArrayTypes<DeviceType>::t_int_1d &mask,
const typename ArrayTypes<DeviceType>::t_float_1d &radius,
const typename ArrayTypes<DeviceType>::t_float_1d &rmass,
const typename ArrayTypes<DeviceType>::t_v_array &v,
const typename ArrayTypes<DeviceType>::t_v_array &omega,
const int& first):
_buf(buf),_x(x),_tag(tag),_type(type),_mask(mask),
_radius(radius),
_rmass(rmass),
_v(v), _omega(omega),
_first(first)
{
const size_t elements = 14;
const int maxsend = (buf.extent(0)*buf.extent(1))/elements;
_buf = typename ArrayTypes<DeviceType>::t_xfloat_2d_const_um(buf.data(),maxsend,elements);
};
KOKKOS_INLINE_FUNCTION
void operator() (const int& i) const {
_x(i+_first,0) = _buf(i,0);
_x(i+_first,1) = _buf(i,1);
_x(i+_first,2) = _buf(i,2);
_tag(i+_first) = static_cast<tagint> (d_ubuf(_buf(i,3)).i);
_type(i+_first) = static_cast<int> (d_ubuf(_buf(i,4)).i);
_mask(i+_first) = static_cast<int> (d_ubuf(_buf(i,5)).i);
_radius(i+_first) = _buf(i,6);
_rmass(i+_first) = _buf(i,7);
_v(i+_first,0) = _buf(i,8);
_v(i+_first,1) = _buf(i,9);
_v(i+_first,2) = _buf(i,10);
_omega(i+_first,0) = _buf(i,11);
_omega(i+_first,1) = _buf(i,12);
_omega(i+_first,2) = _buf(i,13);
}
};
/* ---------------------------------------------------------------------- */
void AtomVecSphereKokkos::unpack_border_vel_kokkos(
const int &n, const int &first,
const DAT::tdual_xfloat_2d &buf,ExecutionSpace space) {
while (first+n >= nmax) grow(0);
if (space==Host) {
struct AtomVecSphereKokkos_UnpackBorderVel<LMPHostType> f(buf.view<LMPHostType>(),
h_x,h_tag,h_type,h_mask,
h_radius,h_rmass,
h_v, h_omega,
first);
Kokkos::parallel_for(n,f);
} else {
struct AtomVecSphereKokkos_UnpackBorderVel<LMPDeviceType> f(buf.view<LMPDeviceType>(),
d_x,d_tag,d_type,d_mask,
d_radius,d_rmass,
d_v, d_omega,
first);
Kokkos::parallel_for(n,f);
}
atomKK->modified(space,X_MASK|TAG_MASK|TYPE_MASK|MASK_MASK|
RADIUS_MASK|RMASS_MASK|V_MASK|OMEGA_MASK);
}
/* ---------------------------------------------------------------------- */
template<class DeviceType>
struct AtomVecSphereKokkos_PackExchangeFunctor {
typedef DeviceType device_type;
typedef ArrayTypes<DeviceType> AT;
typename AT::t_x_array_randomread _x;
typename AT::t_v_array_randomread _v;
typename AT::t_tagint_1d_randomread _tag;
typename AT::t_int_1d_randomread _type;
typename AT::t_int_1d_randomread _mask;
typename AT::t_imageint_1d_randomread _image;
typename AT::t_float_1d_randomread _radius,_rmass;
typename AT::t_v_array_randomread _omega;
typename AT::t_x_array _xw;
typename AT::t_v_array _vw;
typename AT::t_tagint_1d _tagw;
typename AT::t_int_1d _typew;
typename AT::t_int_1d _maskw;
typename AT::t_imageint_1d _imagew;
typename AT::t_float_1d _radiusw,_rmassw;
typename AT::t_v_array _omegaw;
typename AT::t_xfloat_2d_um _buf;
typename AT::t_int_1d_const _sendlist;
typename AT::t_int_1d_const _copylist;
int _nlocal,_dim;
X_FLOAT _lo,_hi;
AtomVecSphereKokkos_PackExchangeFunctor(
const AtomKokkos* atom,
const typename AT::tdual_xfloat_2d buf,
typename AT::tdual_int_1d sendlist,
typename AT::tdual_int_1d copylist,int nlocal, int dim,X_FLOAT lo, X_FLOAT hi):
_x(atom->k_x.view<DeviceType>()),
_v(atom->k_v.view<DeviceType>()),
_tag(atom->k_tag.view<DeviceType>()),
_type(atom->k_type.view<DeviceType>()),
_mask(atom->k_mask.view<DeviceType>()),
_image(atom->k_image.view<DeviceType>()),
_radius(atom->k_radius.view<DeviceType>()),
_rmass(atom->k_rmass.view<DeviceType>()),
_omega(atom->k_omega.view<DeviceType>()),
_xw(atom->k_x.view<DeviceType>()),
_vw(atom->k_v.view<DeviceType>()),
_tagw(atom->k_tag.view<DeviceType>()),
_typew(atom->k_type.view<DeviceType>()),
_maskw(atom->k_mask.view<DeviceType>()),
_imagew(atom->k_image.view<DeviceType>()),
_radiusw(atom->k_radius.view<DeviceType>()),
_rmassw(atom->k_rmass.view<DeviceType>()),
_omegaw(atom->k_omega.view<DeviceType>()),
_sendlist(sendlist.template view<DeviceType>()),
_copylist(copylist.template view<DeviceType>()),
_nlocal(nlocal),_dim(dim),
_lo(lo),_hi(hi)
{
const size_t elements = 16;
const int maxsend = (buf.template view<DeviceType>().extent(0)*buf.template view<DeviceType>().extent(1))/elements;
_buf = typename AT::t_xfloat_2d_um(buf.template view<DeviceType>().data(),maxsend,elements);
}
KOKKOS_INLINE_FUNCTION
void operator() (const int &mysend) const {
const int i = _sendlist(mysend);
_buf(mysend,0) = 16;
_buf(mysend,1) = _x(i,0);
_buf(mysend,2) = _x(i,1);
_buf(mysend,3) = _x(i,2);
_buf(mysend,4) = _v(i,0);
_buf(mysend,5) = _v(i,1);
_buf(mysend,6) = _v(i,2);
_buf(mysend,7) = d_ubuf(_tag[i]).d;
_buf(mysend,8) = d_ubuf(_type[i]).d;
_buf(mysend,9) = d_ubuf(_mask[i]).d;
_buf(mysend,10) = d_ubuf(_image[i]).d;
_buf(mysend,11) = _radius[i];
_buf(mysend,12) = _rmass[i];
_buf(mysend,13) = _omega(i,0);
_buf(mysend,14) = _omega(i,1);
_buf(mysend,15) = _omega(i,2);
const int j = _copylist(mysend);
if (j>-1) {
_xw(i,0) = _x(j,0);
_xw(i,1) = _x(j,1);
_xw(i,2) = _x(j,2);
_vw(i,0) = _v(j,0);
_vw(i,1) = _v(j,1);
_vw(i,2) = _v(j,2);
_tagw[i] = _tag(j);
_typew[i] = _type(j);
_maskw[i] = _mask(j);
_imagew[i] = _image(j);
_radiusw[i] = _radius(j);
_rmassw[i] = _rmass(j);
_omegaw(i,0) = _omega(j,0);
_omegaw(i,1) = _omega(j,1);
_omegaw(i,2) = _omega(j,2);
}
}
};
/* ---------------------------------------------------------------------- */
int AtomVecSphereKokkos::pack_exchange_kokkos(
const int &nsend,
DAT::tdual_xfloat_2d &k_buf,
DAT::tdual_int_1d k_sendlist,
DAT::tdual_int_1d k_copylist,
ExecutionSpace space,int dim,X_FLOAT lo,X_FLOAT hi)
{
if (nsend > (int) (k_buf.view<LMPHostType>().extent(0)*k_buf.view<LMPHostType>().extent(1))/16) {
int newsize = nsend*17/k_buf.view<LMPHostType>().extent(1)+1;
k_buf.resize(newsize,k_buf.view<LMPHostType>().extent(1));
}
atomKK->sync(space,X_MASK | V_MASK | TAG_MASK | TYPE_MASK |
MASK_MASK | IMAGE_MASK| RADIUS_MASK | RMASS_MASK |
OMEGA_MASK);
if (space == Host) {
AtomVecSphereKokkos_PackExchangeFunctor<LMPHostType> f(atomKK,k_buf,k_sendlist,k_copylist,atom->nlocal,dim,lo,hi);
Kokkos::parallel_for(nsend,f);
} else {
AtomVecSphereKokkos_PackExchangeFunctor<LMPDeviceType> f(atomKK,k_buf,k_sendlist,k_copylist,atom->nlocal,dim,lo,hi);
Kokkos::parallel_for(nsend,f);
}
return nsend*16;
}
/* ---------------------------------------------------------------------- */
template<class DeviceType>
struct AtomVecSphereKokkos_UnpackExchangeFunctor {
typedef DeviceType device_type;
typedef ArrayTypes<DeviceType> AT;
typename AT::t_x_array _x;
typename AT::t_v_array _v;
typename AT::t_tagint_1d _tag;
typename AT::t_int_1d _type;
typename AT::t_int_1d _mask;
typename AT::t_imageint_1d _image;
typename AT::t_float_1d _radius;
typename AT::t_float_1d _rmass;
typename AT::t_v_array _omega;
typename AT::t_xfloat_2d_um _buf;
typename AT::t_int_1d _nlocal;
int _dim;
X_FLOAT _lo,_hi;
AtomVecSphereKokkos_UnpackExchangeFunctor(
const AtomKokkos* atom,
const typename AT::tdual_xfloat_2d buf,
typename AT::tdual_int_1d nlocal,
int dim, X_FLOAT lo, X_FLOAT hi):
_x(atom->k_x.view<DeviceType>()),
_v(atom->k_v.view<DeviceType>()),
_tag(atom->k_tag.view<DeviceType>()),
_type(atom->k_type.view<DeviceType>()),
_mask(atom->k_mask.view<DeviceType>()),
_image(atom->k_image.view<DeviceType>()),
_radius(atom->k_radius.view<DeviceType>()),
_rmass(atom->k_rmass.view<DeviceType>()),
_omega(atom->k_omega.view<DeviceType>()),
_nlocal(nlocal.template view<DeviceType>()),_dim(dim),
_lo(lo),_hi(hi)
{
const size_t elements = 16;
const int maxsendlist = (buf.template view<DeviceType>().extent(0)*buf.template view<DeviceType>().extent(1))/elements;
buffer_view<DeviceType>(_buf,buf,maxsendlist,elements);
}
KOKKOS_INLINE_FUNCTION
void operator() (const int &myrecv) const {
X_FLOAT x = _buf(myrecv,_dim+1);
if (x >= _lo && x < _hi) {
int i = Kokkos::atomic_fetch_add(&_nlocal(0),1);
_x(i,0) = _buf(myrecv,1);
_x(i,1) = _buf(myrecv,2);
_x(i,2) = _buf(myrecv,3);
_v(i,0) = _buf(myrecv,4);
_v(i,1) = _buf(myrecv,5);
_v(i,2) = _buf(myrecv,6);
_tag[i] = (tagint) d_ubuf(_buf(myrecv,7)).i;
_type[i] = (int) d_ubuf(_buf(myrecv,8)).i;
_mask[i] = (int) d_ubuf(_buf(myrecv,9)).i;
_image[i] = (imageint) d_ubuf(_buf(myrecv,10)).i;
_radius[i] = _buf(myrecv,11);
_rmass[i] = _buf(myrecv,12);
_omega(i,0) = _buf(myrecv,13);
_omega(i,1) = _buf(myrecv,14);
_omega(i,2) = _buf(myrecv,15);
}
}
};
/* ---------------------------------------------------------------------- */
int AtomVecSphereKokkos::unpack_exchange_kokkos(DAT::tdual_xfloat_2d &k_buf,int nrecv,int nlocal,int dim,X_FLOAT lo,X_FLOAT hi,ExecutionSpace space) {
while (nlocal + nrecv/16 >= nmax) grow(0);
if (space == Host) {
k_count.h_view(0) = nlocal;
AtomVecSphereKokkos_UnpackExchangeFunctor<LMPHostType> f(atomKK,k_buf,k_count,dim,lo,hi);
Kokkos::parallel_for(nrecv/16,f);
} else {
k_count.h_view(0) = nlocal;
k_count.modify<LMPHostType>();
k_count.sync<LMPDeviceType>();
AtomVecSphereKokkos_UnpackExchangeFunctor<LMPDeviceType> f(atomKK,k_buf,k_count,dim,lo,hi);
Kokkos::parallel_for(nrecv/16,f);
k_count.modify<LMPDeviceType>();
k_count.sync<LMPHostType>();
}
atomKK->modified(space,X_MASK | V_MASK | TAG_MASK | TYPE_MASK |
MASK_MASK | IMAGE_MASK| RADIUS_MASK | RMASS_MASK |
OMEGA_MASK);
return k_count.h_view(0);
}
/* ---------------------------------------------------------------------- */
void AtomVecSphereKokkos::sync(ExecutionSpace space, unsigned int mask)
{
if (space == Device) {
if (mask & X_MASK) atomKK->k_x.sync<LMPDeviceType>();
if (mask & V_MASK) atomKK->k_v.sync<LMPDeviceType>();
if (mask & F_MASK) atomKK->k_f.sync<LMPDeviceType>();
if (mask & TAG_MASK) atomKK->k_tag.sync<LMPDeviceType>();
if (mask & TYPE_MASK) atomKK->k_type.sync<LMPDeviceType>();
if (mask & MASK_MASK) atomKK->k_mask.sync<LMPDeviceType>();
if (mask & IMAGE_MASK) atomKK->k_image.sync<LMPDeviceType>();
if (mask & RADIUS_MASK) atomKK->k_radius.sync<LMPDeviceType>();
if (mask & RMASS_MASK) atomKK->k_rmass.sync<LMPDeviceType>();
if (mask & OMEGA_MASK) atomKK->k_omega.sync<LMPDeviceType>();
if (mask & TORQUE_MASK) atomKK->k_torque.sync<LMPDeviceType>();
} else {
if (mask & X_MASK) atomKK->k_x.sync<LMPHostType>();
if (mask & V_MASK) atomKK->k_v.sync<LMPHostType>();
if (mask & F_MASK) atomKK->k_f.sync<LMPHostType>();
if (mask & TAG_MASK) atomKK->k_tag.sync<LMPHostType>();
if (mask & TYPE_MASK) atomKK->k_type.sync<LMPHostType>();
if (mask & MASK_MASK) atomKK->k_mask.sync<LMPHostType>();
if (mask & IMAGE_MASK) atomKK->k_image.sync<LMPHostType>();
if (mask & RADIUS_MASK) atomKK->k_radius.sync<LMPHostType>();
if (mask & RMASS_MASK) atomKK->k_rmass.sync<LMPHostType>();
if (mask & OMEGA_MASK) atomKK->k_omega.sync<LMPHostType>();
if (mask & TORQUE_MASK) atomKK->k_torque.sync<LMPHostType>();
}
}
/* ---------------------------------------------------------------------- */
void AtomVecSphereKokkos::sync_overlapping_device(ExecutionSpace space, unsigned int mask)
{
if (space == Device) {
if ((mask & X_MASK) && atomKK->k_x.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_x_array>(atomKK->k_x,space);
if ((mask & V_MASK) && atomKK->k_v.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_v_array>(atomKK->k_v,space);
if ((mask & F_MASK) && atomKK->k_f.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_f_array>(atomKK->k_f,space);
if ((mask & TAG_MASK) && atomKK->k_tag.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_tagint_1d>(atomKK->k_tag,space);
if ((mask & TYPE_MASK) && atomKK->k_type.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_int_1d>(atomKK->k_type,space);
if ((mask & MASK_MASK) && atomKK->k_mask.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_int_1d>(atomKK->k_mask,space);
if ((mask & IMAGE_MASK) && atomKK->k_image.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_imageint_1d>(atomKK->k_image,space);
if ((mask & RADIUS_MASK) && atomKK->k_radius.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_float_1d>(atomKK->k_radius,space);
if ((mask & RMASS_MASK) && atomKK->k_rmass.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_float_1d>(atomKK->k_rmass,space);
if ((mask & OMEGA_MASK) && atomKK->k_omega.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_v_array>(atomKK->k_omega,space);
if ((mask & TORQUE_MASK) && atomKK->k_torque.need_sync<LMPDeviceType>())
perform_async_copy<DAT::tdual_f_array>(atomKK->k_torque,space);
} else {
if ((mask & X_MASK) && atomKK->k_x.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_x_array>(atomKK->k_x,space);
if ((mask & V_MASK) && atomKK->k_v.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_v_array>(atomKK->k_v,space);
if ((mask & F_MASK) && atomKK->k_f.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_f_array>(atomKK->k_f,space);
if ((mask & TAG_MASK) && atomKK->k_tag.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_tagint_1d>(atomKK->k_tag,space);
if ((mask & TYPE_MASK) && atomKK->k_type.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_int_1d>(atomKK->k_type,space);
if ((mask & MASK_MASK) && atomKK->k_mask.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_int_1d>(atomKK->k_mask,space);
if ((mask & IMAGE_MASK) && atomKK->k_image.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_imageint_1d>(atomKK->k_image,space);
if ((mask & RADIUS_MASK) && atomKK->k_radius.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_float_1d>(atomKK->k_radius,space);
if ((mask & RMASS_MASK) && atomKK->k_rmass.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_float_1d>(atomKK->k_rmass,space);
if ((mask & OMEGA_MASK) && atomKK->k_omega.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_v_array>(atomKK->k_omega,space);
if ((mask & TORQUE_MASK) && atomKK->k_torque.need_sync<LMPHostType>())
perform_async_copy<DAT::tdual_f_array>(atomKK->k_torque,space);
}
}
/* ---------------------------------------------------------------------- */
void AtomVecSphereKokkos::modified(ExecutionSpace space, unsigned int mask)
{
if (space == Device) {
if (mask & X_MASK) atomKK->k_x.modify<LMPDeviceType>();
if (mask & V_MASK) atomKK->k_v.modify<LMPDeviceType>();
if (mask & F_MASK) atomKK->k_f.modify<LMPDeviceType>();
if (mask & TAG_MASK) atomKK->k_tag.modify<LMPDeviceType>();
if (mask & TYPE_MASK) atomKK->k_type.modify<LMPDeviceType>();
if (mask & MASK_MASK) atomKK->k_mask.modify<LMPDeviceType>();
if (mask & IMAGE_MASK) atomKK->k_image.modify<LMPDeviceType>();
if (mask & RADIUS_MASK) atomKK->k_radius.modify<LMPDeviceType>();
if (mask & RMASS_MASK) atomKK->k_rmass.modify<LMPDeviceType>();
if (mask & OMEGA_MASK) atomKK->k_omega.modify<LMPDeviceType>();
if (mask & TORQUE_MASK) atomKK->k_torque.modify<LMPDeviceType>();
} else {
if (mask & X_MASK) atomKK->k_x.modify<LMPHostType>();
if (mask & V_MASK) atomKK->k_v.modify<LMPHostType>();
if (mask & F_MASK) atomKK->k_f.modify<LMPHostType>();
if (mask & TAG_MASK) atomKK->k_tag.modify<LMPHostType>();
if (mask & TYPE_MASK) atomKK->k_type.modify<LMPHostType>();
if (mask & MASK_MASK) atomKK->k_mask.modify<LMPHostType>();
if (mask & IMAGE_MASK) atomKK->k_image.modify<LMPHostType>();
if (mask & RADIUS_MASK) atomKK->k_radius.modify<LMPHostType>();
if (mask & RMASS_MASK) atomKK->k_rmass.modify<LMPHostType>();
if (mask & OMEGA_MASK) atomKK->k_omega.modify<LMPHostType>();
if (mask & TORQUE_MASK) atomKK->k_torque.modify<LMPHostType>();
}
}