Misc Improvements to GPU Package
- Optimizations for molecular systems - Improved kernel performance and greater CPU overlap - Reduced GPU to CPU communications for discrete devices - Switch classic Intel makefiles to use LLVM-based compilers - Prefetch optimizations supported for OpenCL - Optimized data repack for quaternions
This commit is contained in:
@ -105,28 +105,32 @@ void re_gpu_clear() {
|
||||
tagint **special, const bool eflag, const bool vflag,
|
||||
const bool eatom, const bool vatom, int &host_start,
|
||||
int **ilist, int **numj, const double cpu_time, bool &success,
|
||||
double **host_quat);
|
||||
const int *ellipsoid, const EllipsoidBonus *bonus);
|
||||
|
||||
int** re_gpu_compute_n(const int ago, const int inum_full, const int nall,
|
||||
double **host_x, int *host_type, double *sublo,
|
||||
double *subhi, tagint *tag, int **nspecial, tagint **special,
|
||||
const bool eflag, const bool vflag, const bool eatom,
|
||||
const bool vatom, int &host_start, int **ilist,
|
||||
int **jnum, const double cpu_time, bool &success,
|
||||
double **host_quat) {
|
||||
double *subhi, tagint *tag, int **nspecial,
|
||||
tagint **special, const bool eflag, const bool vflag,
|
||||
const bool eatom, const bool vatom, int &host_start,
|
||||
int **ilist, int **jnum, const double cpu_time,
|
||||
bool &success, const int *ellipsoid,
|
||||
const void *bonus) {
|
||||
return REMF.compute(ago, inum_full, nall, host_x, host_type, sublo, subhi,
|
||||
tag, nspecial, special, eflag, vflag, eatom, vatom,
|
||||
host_start, ilist, jnum, cpu_time, success, host_quat);
|
||||
host_start, ilist, jnum, cpu_time, success, ellipsoid,
|
||||
static_cast<const EllipsoidBonus *>(bonus));
|
||||
}
|
||||
|
||||
int * re_gpu_compute(const int ago, const int inum_full, const int nall,
|
||||
double **host_x, int *host_type, int *ilist, int *numj,
|
||||
int **firstneigh, const bool eflag, const bool vflag,
|
||||
const bool eatom, const bool vatom, int &host_start,
|
||||
const double cpu_time, bool &success, double **host_quat) {
|
||||
const double cpu_time, bool &success,
|
||||
const int *ellipsoid, const void *bonus) {
|
||||
return REMF.compute(ago, inum_full, nall, host_x, host_type, ilist,
|
||||
numj, firstneigh, eflag, vflag, eatom, vatom, host_start,
|
||||
cpu_time, success, host_quat);
|
||||
cpu_time, success, ellipsoid,
|
||||
static_cast<const EllipsoidBonus *>(bonus));
|
||||
}
|
||||
|
||||
// ---------------------------------------------------------------------------
|
||||
@ -135,4 +139,3 @@ int * re_gpu_compute(const int ago, const int inum_full, const int nall,
|
||||
double re_gpu_bytes() {
|
||||
return REMF.host_memory_usage();
|
||||
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user