Merge pull request #3069 from Vsevak/fix-hip-ffast-math
Fix HIP Makefile under lib/gpu
This commit is contained in:
@@ -306,12 +306,12 @@ elseif(GPU_API STREQUAL "HIP")
|
|||||||
|
|
||||||
if(HIP_COMPILER STREQUAL "clang")
|
if(HIP_COMPILER STREQUAL "clang")
|
||||||
add_custom_command(OUTPUT ${CUBIN_FILE}
|
add_custom_command(OUTPUT ${CUBIN_FILE}
|
||||||
VERBATIM COMMAND ${HIP_HIPCC_EXECUTABLE} --genco --offload-arch=${HIP_ARCH} -O3 -ffast-math -DUSE_HIP -D_${GPU_PREC_SETTING} -DLAMMPS_${LAMMPS_SIZES} -I${LAMMPS_LIB_SOURCE_DIR}/gpu -o ${CUBIN_FILE} ${CU_CPP_FILE}
|
VERBATIM COMMAND ${HIP_HIPCC_EXECUTABLE} --genco --offload-arch=${HIP_ARCH} -O3 -DUSE_HIP -D_${GPU_PREC_SETTING} -DLAMMPS_${LAMMPS_SIZES} -I${LAMMPS_LIB_SOURCE_DIR}/gpu -o ${CUBIN_FILE} ${CU_CPP_FILE}
|
||||||
DEPENDS ${CU_CPP_FILE}
|
DEPENDS ${CU_CPP_FILE}
|
||||||
COMMENT "Generating ${CU_NAME}.cubin")
|
COMMENT "Generating ${CU_NAME}.cubin")
|
||||||
else()
|
else()
|
||||||
add_custom_command(OUTPUT ${CUBIN_FILE}
|
add_custom_command(OUTPUT ${CUBIN_FILE}
|
||||||
VERBATIM COMMAND ${HIP_HIPCC_EXECUTABLE} --genco -t="${HIP_ARCH}" -f=\"-O3 -ffast-math -DUSE_HIP -D_${GPU_PREC_SETTING} -DLAMMPS_${LAMMPS_SIZES} -I${LAMMPS_LIB_SOURCE_DIR}/gpu\" -o ${CUBIN_FILE} ${CU_CPP_FILE}
|
VERBATIM COMMAND ${HIP_HIPCC_EXECUTABLE} --genco -t="${HIP_ARCH}" -f=\"-O3 -DUSE_HIP -D_${GPU_PREC_SETTING} -DLAMMPS_${LAMMPS_SIZES} -I${LAMMPS_LIB_SOURCE_DIR}/gpu\" -o ${CUBIN_FILE} ${CU_CPP_FILE}
|
||||||
DEPENDS ${CU_CPP_FILE}
|
DEPENDS ${CU_CPP_FILE}
|
||||||
COMMENT "Generating ${CU_NAME}.cubin")
|
COMMENT "Generating ${CU_NAME}.cubin")
|
||||||
endif()
|
endif()
|
||||||
|
|||||||
@@ -39,11 +39,9 @@ HIP_PLATFORM=$(shell $(HIP_PATH)/bin/hipconfig --platform)
|
|||||||
HIP_COMPILER=$(shell $(HIP_PATH)/bin/hipconfig --compiler)
|
HIP_COMPILER=$(shell $(HIP_PATH)/bin/hipconfig --compiler)
|
||||||
|
|
||||||
ifeq (hcc,$(HIP_PLATFORM))
|
ifeq (hcc,$(HIP_PLATFORM))
|
||||||
HIP_OPTS += -ffast-math
|
|
||||||
# possible values: gfx803,gfx900,gfx906
|
# possible values: gfx803,gfx900,gfx906
|
||||||
HIP_ARCH = gfx906
|
HIP_ARCH = gfx906
|
||||||
else ifeq (amd,$(HIP_PLATFORM))
|
else ifeq (amd,$(HIP_PLATFORM))
|
||||||
HIP_OPTS += -ffast-math
|
|
||||||
# possible values: gfx803,gfx900,gfx906
|
# possible values: gfx803,gfx900,gfx906
|
||||||
HIP_ARCH = gfx906
|
HIP_ARCH = gfx906
|
||||||
else ifeq (nvcc,$(HIP_PLATFORM))
|
else ifeq (nvcc,$(HIP_PLATFORM))
|
||||||
|
|||||||
Reference in New Issue
Block a user