Merge pull request #2692 from arghdos/master

Porting to new default platform for AMD/HIP in ROCm 4.1
2021-04-06 14:39:30 -04:00
parent 0b4d3588b5 160f2cc630
commit 00e4bdb2b7
7 changed files with 33 additions and 17 deletions
--- a/lib/gpu/Makefile.hip
+++ b/lib/gpu/Makefile.hip
@ -1,6 +1,6 @@
 # /* ----------------------------------------------------------------------
 #  Generic Linux Makefile for HIP
-#     - export HIP_PLATFORM=hcc (or nvcc) before execution
+#     - export HIP_PLATFORM=amd (or nvcc) before execution
 #     - change HIP_ARCH for your GPU
 # ------------------------------------------------------------------------- */

@ -42,6 +42,10 @@ ifeq (hcc,$(HIP_PLATFORM))
 	HIP_OPTS  += -ffast-math
 	# possible values: gfx803,gfx900,gfx906
 	HIP_ARCH = gfx906
+else ifeq (amd,$(HIP_PLATFORM))
+	HIP_OPTS  += -ffast-math
+	# possible values: gfx803,gfx900,gfx906
+	HIP_ARCH = gfx906
 else ifeq (nvcc,$(HIP_PLATFORM))
 	HIP_OPTS  += --use_fast_math
 	HIP_ARCH = -gencode arch=compute_30,code=[sm_30,compute_30] -gencode arch=compute_32,code=[sm_32,compute_32] -gencode arch=compute_35,code=[sm_35,compute_35] \
--- a/lib/gpu/README
+++ b/lib/gpu/README
@ -212,8 +212,8 @@ additionally requires cub (https://nvlabs.github.io/cub). Download and
 extract the cub directory to lammps/lib/gpu/ or specify an appropriate
 path in lammps/lib/gpu/Makefile.hip.
 2. In Makefile.hip it is possible to specify the target platform via
-export HIP_PLATFORM=hcc or HIP_PLATFORM=nvcc as well as the target
-architecture (gfx803, gfx900, gfx906 etc.)
+export HIP_PLATFORM=amd (ROCm >= 4.1), HIP_PLATFORM=hcc (ROCm <= 4.0)
+or HIP_PLATFORM=nvcc as well as the target architecture (gfx803, gfx900, gfx906 etc.)
 3. If your MPI implementation does not support `mpicxx --showme` command,
 it is required to specify the corresponding MPI compiler and linker flags
 in lammps/lib/gpu/Makefile.hip and in lammps/src/MAKE/OPTIONS/Makefile.hip.
@ -278,4 +278,3 @@ and
 Brown, W.M., Masako, Y. Implementing Molecular Dynamics on Hybrid High
 Performance Computers - Three-Body Potentials. Computer Physics Communications.
 2013. 184: p. 2785–2793.
-
--- a/lib/gpu/lal_pre_cuda_hip.h
+++ b/lib/gpu/lal_pre_cuda_hip.h
@ -30,7 +30,7 @@
 // -------------------------------------------------------------------------


-#ifdef __HIP_PLATFORM_HCC__
+#if defined(__HIP_PLATFORM_HCC__) || defined(__HIP_PLATFORM_AMD__)
 #define CONFIG_ID 303
 #define SIMD_SIZE 64
 #else
@ -161,7 +161,7 @@
 //                         KERNEL MACROS - TEXTURES
 // -------------------------------------------------------------------------

-#ifdef __HIP_PLATFORM_HCC__
+#if defined(__HIP_PLATFORM_HCC__) || defined(__HIP_PLATFORM_AMD__)
 #define _texture(name, type)  __device__ type* name
 #define _texture_2d(name, type)  __device__ type* name
 #else
@ -201,7 +201,7 @@
  #define mu_tex mu_
 #endif

-#ifdef __HIP_PLATFORM_HCC__
+#if defined(__HIP_PLATFORM_HCC__) || defined(__HIP_PLATFORM_AMD__)

 #undef fetch4
 #undef fetch
@ -266,7 +266,7 @@ typedef struct _double4 double4;
 #endif
 #endif

-#if defined(CUDA_PRE_NINE) || defined(__HIP_PLATFORM_HCC__)
+#if defined(CUDA_PRE_NINE) || defined(__HIP_PLATFORM_HCC__) || defined(__HIP_PLATFORM_AMD__)

  #ifdef _SINGLE_SINGLE
    #define shfl_down __shfl_down