Files
lammps/lib/gpu/device_ptx.h

89 lines
2.2 KiB
C

/*
 * PTX assembly text for two GPU entry points, stored as one C string built
 * from adjacent string literals (one PTX line per literal, each ending in
 * "\n").  The module header declares PTX ISA version 2.3, target sm_20 and
 * 64-bit addressing.
 *
 * Entry points contained in the text:
 *   kernel_zero(mem, numel) - every thread whose x-dimension global index is
 *                             below numel stores a 32-bit zero to global
 *                             memory at mem + 4 * index.
 *   kernel_info(info)       - stores fourteen 32-bit constants to global
 *                             memory at byte offsets 0, 4, ..., 52 from info.
 *
 * The ".loc 16 <line> 0" lines are source-location debug directives (file
 * index 16, lines 20 through 42); they do not generate instructions.
 *
 * NOTE(review): the text looks compiler-generated (__cudaparm_ parameter
 * names, $LDW/$Lt labels), so it should presumably be regenerated from its
 * originating source rather than edited by hand - confirm against the build.
 * NOTE(review): this is a definition with external linkage, not a mere
 * declaration; including it from more than one translation unit would
 * produce duplicate definitions of `device` - confirm it is included once.
 */
const char * device =
/* Module header: PTX version, target architecture, address width. */
" .version 2.3\n"
" .target sm_20\n"
" .address_size 64\n"
/* kernel_zero: takes a 64-bit address (mem) and a signed 32-bit count (numel). */
" .entry kernel_zero (\n"
" .param .u64 __cudaparm_kernel_zero_mem,\n"
" .param .s32 __cudaparm_kernel_zero_numel)\n"
" {\n"
/* Register declarations: 32-bit, 64-bit and predicate registers. */
" .reg .u32 %r<9>;\n"
" .reg .u64 %rd<6>;\n"
" .reg .pred %p<3>;\n"
" .loc 16 20 0\n"
"$LDWbegin_kernel_zero:\n"
/* Global index: %r5 = ctaid.x * ntid.x + tid.x (mul24 uses the low 24 bits of each factor). */
" cvt.s32.u32 %r1, %ctaid.x;\n"
" cvt.s32.u32 %r2, %ntid.x;\n"
" mul24.lo.s32 %r3, %r1, %r2;\n"
" mov.u32 %r4, %tid.x;\n"
" add.u32 %r5, %r3, %r4;\n"
/* Bounds guard: branch past the store when numel <= index. */
" ld.param.s32 %r6, [__cudaparm_kernel_zero_numel];\n"
" setp.le.s32 %p1, %r6, %r5;\n"
" @%p1 bra $Lt_0_1026;\n"
" .loc 16 24 0\n"
/* Store 0 at mem + 4 * index.  %rd2 is written here but not read by any later instruction. */
" mov.s32 %r7, 0;\n"
" ld.param.u64 %rd1, [__cudaparm_kernel_zero_mem];\n"
" cvt.s64.s32 %rd2, %r5;\n"
" mul.wide.s32 %rd3, %r5, 4;\n"
" add.u64 %rd4, %rd1, %rd3;\n"
" st.global.s32 [%rd4+0], %r7;\n"
"$Lt_0_1026:\n"
" .loc 16 25 0\n"
" exit;\n"
"$LDWend_kernel_zero:\n"
" }\n"
/* kernel_info: takes one 64-bit address (info) and fills 14 consecutive 32-bit slots. */
" .entry kernel_info (\n"
" .param .u64 __cudaparm_kernel_info_info)\n"
" {\n"
" .reg .u32 %r<16>;\n"
" .reg .u64 %rd<3>;\n"
" .loc 16 27 0\n"
"$LDWbegin_kernel_info:\n"
" .loc 16 28 0\n"
/*
 * Each mov/st pair below writes one constant to info + offset.  Values in
 * offset order: 200, 32, 32, 4, 8, 64, 128, 11, 8, 128, 128, 128, 128, 8.
 * What each slot means is not visible in this file - presumably
 * configuration values from the originating source; TODO confirm there.
 */
" ld.param.u64 %rd1, [__cudaparm_kernel_info_info];\n"
" mov.s32 %r1, 200;\n"
" st.global.s32 [%rd1+0], %r1;\n"
" .loc 16 29 0\n"
" mov.s32 %r2, 32;\n"
" st.global.s32 [%rd1+4], %r2;\n"
" .loc 16 30 0\n"
" mov.s32 %r3, 32;\n"
" st.global.s32 [%rd1+8], %r3;\n"
" .loc 16 31 0\n"
" mov.s32 %r4, 4;\n"
" st.global.s32 [%rd1+12], %r4;\n"
" .loc 16 32 0\n"
" mov.s32 %r5, 8;\n"
" st.global.s32 [%rd1+16], %r5;\n"
" .loc 16 33 0\n"
" mov.s32 %r6, 64;\n"
" st.global.s32 [%rd1+20], %r6;\n"
" .loc 16 34 0\n"
" mov.s32 %r7, 128;\n"
" st.global.s32 [%rd1+24], %r7;\n"
" .loc 16 35 0\n"
" mov.s32 %r8, 11;\n"
" st.global.s32 [%rd1+28], %r8;\n"
" .loc 16 36 0\n"
" mov.s32 %r9, 8;\n"
" st.global.s32 [%rd1+32], %r9;\n"
" .loc 16 37 0\n"
" mov.s32 %r10, 128;\n"
" st.global.s32 [%rd1+36], %r10;\n"
" .loc 16 38 0\n"
" mov.s32 %r11, 128;\n"
" st.global.s32 [%rd1+40], %r11;\n"
" .loc 16 39 0\n"
" mov.s32 %r12, 128;\n"
" st.global.s32 [%rd1+44], %r12;\n"
" .loc 16 40 0\n"
" mov.s32 %r13, 128;\n"
" st.global.s32 [%rd1+48], %r13;\n"
" .loc 16 41 0\n"
" mov.s32 %r14, 8;\n"
" st.global.s32 [%rd1+52], %r14;\n"
" .loc 16 42 0\n"
" exit;\n"
"$LDWend_kernel_info:\n"
" }\n"
;