Page Menu
Home
c4science
Search
Configure Global Search
Log In
Files
F96436292
device.ptx
No One
Temporary
Actions
Download File
Edit File
Delete File
View Transforms
Subscribe
Mute Notifications
Award Token
Subscribers
None
File Metadata
Details
File Info
Storage
Attached
Created
Thu, Dec 26, 18:14
Size
3 KB
Mime Type
text/x-asm
Expires
Sat, Dec 28, 18:14 (1 d, 23 h)
Engine
blob
Format
Raw Data
Handle
23170371
Attached To
rLAMMPS lammps
device.ptx
View Options
.version 2.3
.target sm_20
.address_size 64
// compiled with /usr/local/cuda/open64/lib//be
// nvopencc 4.0 built on 2011-05-12
//-----------------------------------------------------------
// Compiling /tmp/tmpxft_00009a81_00000000-9_lal_device.cpp3.i (/home/sjplimp/ccBI#.zwVkZj)
//-----------------------------------------------------------
//-----------------------------------------------------------
// Options:
//-----------------------------------------------------------
// Target:ptx, ISA:sm_20, Endian:little, Pointer Size:64
// -O3 (Optimization level)
// -g0 (Debug level)
// -m2 (Report advisories)
//-----------------------------------------------------------
.file 1 "<command-line>"
.file 2 "/tmp/tmpxft_00009a81_00000000-8_lal_device.cudafe2.gpu"
.file 3 "/usr/lib/gcc/x86_64-redhat-linux/4.4.5/include/stddef.h"
.file 4 "/usr/local/cuda/include/crt/device_runtime.h"
.file 5 "/usr/local/cuda/include/host_defines.h"
.file 6 "/usr/local/cuda/include/builtin_types.h"
.file 7 "/usr/local/cuda/include/device_types.h"
.file 8 "/usr/local/cuda/include/driver_types.h"
.file 9 "/usr/local/cuda/include/surface_types.h"
.file 10 "/usr/local/cuda/include/texture_types.h"
.file 11 "/usr/local/cuda/include/vector_types.h"
.file 12 "/usr/local/cuda/include/device_launch_parameters.h"
.file 13 "/usr/local/cuda/include/crt/storage_class.h"
.file 14 "/usr/include/bits/types.h"
.file 15 "/usr/include/time.h"
.file 16 "lal_device.cu"
.file 17 "/usr/local/cuda/include/common_functions.h"
.file 18 "/usr/local/cuda/include/math_functions.h"
.file 19 "/usr/local/cuda/include/math_constants.h"
.file 20 "/usr/local/cuda/include/device_functions.h"
.file 21 "/usr/local/cuda/include/sm_11_atomic_functions.h"
.file 22 "/usr/local/cuda/include/sm_12_atomic_functions.h"
.file 23 "/usr/local/cuda/include/sm_13_double_functions.h"
.file 24 "/usr/local/cuda/include/sm_20_atomic_functions.h"
.file 25 "/usr/local/cuda/include/sm_20_intrinsics.h"
.file 26 "/usr/local/cuda/include/surface_functions.h"
.file 27 "/usr/local/cuda/include/texture_fetch_functions.h"
.file 28 "/usr/local/cuda/include/math_functions_dbl_ptx3.h"
//-----------------------------------------------------------
// kernel_zero(mem, numel)
//   mem   : 64-bit address, accessed through the .global state space
//   numel : signed 32-bit element count
// Each thread computes idx = mul24(ctaid.x, ntid.x) + tid.x and, when
// idx < numel, stores a 32-bit zero at byte address mem + 4*idx.
// Threads with idx >= numel exit without touching memory.
// Source mapping: lal_device.cu (file 16), lines 20-25.
//-----------------------------------------------------------
.entry kernel_zero (
.param .u64 __cudaparm_kernel_zero_mem,
.param .s32 __cudaparm_kernel_zero_numel)
{
.reg .u32 %r<8>;
.reg .u64 %rd<4>;
.reg .pred %p<2>;
.loc 16 20 0
$LDWbegin_kernel_zero:
// idx (%r5) = ctaid.x * ntid.x + tid.x.
// mul24.lo multiplies the low 24 bits of each operand and keeps the low
// 32 bits of the product.
cvt.s32.u32 %r1, %ctaid.x;
cvt.s32.u32 %r2, %ntid.x;
mul24.lo.s32 %r3, %r1, %r2;
mov.u32 %r4, %tid.x;
add.u32 %r5, %r3, %r4;
// Bounds guard: branch past the store when numel <= idx (signed compare).
ld.param.s32 %r6, [__cudaparm_kernel_zero_numel];
setp.le.s32 %p1, %r6, %r5;
@%p1 bra $Lt_0_1026;
.loc 16 24 0
mov.s32 %r7, 0;
ld.param.u64 %rd1, [__cudaparm_kernel_zero_mem];
// mul.wide.s32 sign-extends idx while scaling by 4 (the store width), so no
// separate 32->64 conversion of idx is needed.
mul.wide.s32 %rd2, %r5, 4;
add.u64 %rd3, %rd1, %rd2;
st.global.s32 [%rd3+0], %r7;
$Lt_0_1026:
.loc 16 25 0
exit;
$LDWend_kernel_zero:
} // kernel_zero
//-----------------------------------------------------------
// kernel_info(info)
//   info : 64-bit address, accessed through the .global state space
// Writes fourteen 32-bit constants to consecutive words at byte offsets
// 0, 4, ..., 52 from info. There is no thread-index guard: every thread
// that runs this entry performs the same fourteen stores.
// Each store is tagged by a .loc marker pointing at lines 28-41 of
// lal_device.cu (file 16); the meaning of each constant is defined there
// and is not visible in this file.
//-----------------------------------------------------------
.entry kernel_info (
.param .u64 __cudaparm_kernel_info_info)
{
.reg .s32 %val;     // scratch: the constant about to be stored
.reg .u64 %info;    // base address loaded from the info parameter
.loc 16 27 0
$LDWbegin_kernel_info:
.loc 16 28 0
ld.param.u64 %info, [__cudaparm_kernel_info_info];
mov.s32 %val, 200;
st.global.s32 [%info+0], %val;      // word 0
.loc 16 29 0
mov.s32 %val, 32;
st.global.s32 [%info+4], %val;      // word 1
.loc 16 30 0
mov.s32 %val, 32;
st.global.s32 [%info+8], %val;      // word 2
.loc 16 31 0
mov.s32 %val, 4;
st.global.s32 [%info+12], %val;     // word 3
.loc 16 32 0
mov.s32 %val, 8;
st.global.s32 [%info+16], %val;     // word 4
.loc 16 33 0
mov.s32 %val, 64;
st.global.s32 [%info+20], %val;     // word 5
.loc 16 34 0
mov.s32 %val, 128;
st.global.s32 [%info+24], %val;     // word 6
.loc 16 35 0
mov.s32 %val, 11;
st.global.s32 [%info+28], %val;     // word 7
.loc 16 36 0
mov.s32 %val, 8;
st.global.s32 [%info+32], %val;     // word 8
.loc 16 37 0
mov.s32 %val, 128;
st.global.s32 [%info+36], %val;     // word 9
.loc 16 38 0
mov.s32 %val, 128;
st.global.s32 [%info+40], %val;     // word 10
.loc 16 39 0
mov.s32 %val, 128;
st.global.s32 [%info+44], %val;     // word 11
.loc 16 40 0
mov.s32 %val, 128;
st.global.s32 [%info+48], %val;     // word 12
.loc 16 41 0
mov.s32 %val, 8;
st.global.s32 [%info+52], %val;     // word 13
.loc 16 42 0
exit;
$LDWend_kernel_info:
} // kernel_info
Event Timeline
Log In to Comment