//
// Generated by LLVM NVPTX Back-End
//
// Module-level directives. The trailing "| |" column residue that followed
// every line was removed: it is not PTX syntax and prevents assembly.

.version 8.2                            // PTX ISA version of this module
.target sm_89                           // target architecture
.address_size 64                        // 64-bit addresses

    // .globl triton__0d1de
// ---------------------------------------------------------------------------
// triton__0d1de(param_0 : .u64, param_1 : .u32)
//
// Writes 32-bit zeros through the address passed in param_0.
// Each thread covers two consecutive 32-bit elements starting at
//     idx = (%ctaid.x << 9) | ((%tid.x << 1) & 510)
// and issues a single predicated 8-byte vector store when
//     idx < 12865792            (signed 32-bit compare).
// idx is always even, so the one predicate guards both stored elements.
//
// param_0 : base address; used as a global-space address by st.global.
// param_1 : declared but never loaded in this body.
// Launch  : .maxntid 256,1,1; only %tid.x and %ctaid.x are read.
//
// NOTE(review): 12865792 is a literal bound - presumably the element count
//               folded in by the generator; confirm against the .py source.
// NOTE(review): st.global.v2.b32 needs an 8-byte aligned address; this holds
//               if param_0 is at least 8-byte aligned - confirm with the caller.
// NOTE(review): idx is computed in 32 bits and compared as signed, so a
//               %ctaid.x large enough to make (ctaid.x << 9) negative would
//               pass the predicate - confirm the launch grid rules this out.
//
// The trailing "| |" residue that followed every line was removed; it is not
// PTX syntax. Instructions, registers and .loc directives are unchanged.
// ---------------------------------------------------------------------------
.visible .entry triton__0d1de(
    .param .u64 triton__0d1de_param_0,
    .param .u32 triton__0d1de_param_1
)
.maxntid 256, 1, 1
{
    .reg .pred %p<2>;
    .reg .b32 %r<9>;
    .reg .b64 %rd<4>;
    .loc 1 18 0
$L__func_begin0:
    .loc 1 18 0
    ld.param.u64 %rd2, [triton__0d1de_param_0];    // %rd2 = base address
$L__tmp0:
    .loc 1 21 36
    mov.u32 %r4, %tid.x;
    shl.b32 %r5, %r4, 1;                           // two elements per thread
    and.b32 %r6, %r5, 510;                         // %r6 = even offset within the 512-element tile
    .loc 1 20 28
    mov.u32 %r1, %ctaid.x;
    .loc 1 20 33
    shl.b32 %r7, %r1, 9;                           // %r7 = ctaid.x * 512 (tile start)
    .loc 1 21 23
    or.b32 %r8, %r7, %r6;                          // %r8 = idx; OR acts as ADD since low 9 bits of %r7 are 0
    .loc 1 22 21
    setp.lt.s32 %p1, %r8, 12865792;                // %p1 = idx in bounds
    .loc 1 25 25
    mul.wide.s32 %rd3, %r8, 4;                     // byte offset = idx * 4, sign-extended to 64 bits
    add.s64 %rd1, %rd2, %rd3;                      // %rd1 = address of element idx
    mov.b32 %r2, 0;                                // value to store
    .loc 1 25 36
    @%p1 st.global.v2.b32 [ %rd1 + 0 ], { %r2, %r2 };    // zero elements idx and idx+1
    .loc 1 25 4
    ret;
$L__tmp1:
$L__func_end0:
}
// Source file referenced as file index 1 by the .loc directives.
// (Trailing "| |" residue removed; it is not PTX syntax.)
.file 1 "/tmp/torchinductor_root/4y/c4yseldwmu3to52pbh2md2oeufrq3fcdmapkt4nxdzmyqtgd2ysp.py"
// DWARF abbreviation table: two abbreviations (compile unit, subprogram).
// Byte values are unchanged; the trailing "| |" residue on every line was
// removed because it is not valid inside a PTX .section body.
.section .debug_abbrev
{
.b8 1                                   // Abbreviation code 1
.b8 17                                  // DW_TAG_compile_unit
.b8 1                                   // DW_CHILDREN_yes
.b8 37                                  // DW_AT_producer
.b8 8                                   // DW_FORM_string
.b8 19                                  // DW_AT_language
.b8 5                                   // DW_FORM_data2
.b8 3                                   // DW_AT_name
.b8 8                                   // DW_FORM_string
.b8 16                                  // DW_AT_stmt_list
.b8 6                                   // DW_FORM_data4
.b8 27                                  // DW_AT_comp_dir
.b8 8                                   // DW_FORM_string
.b8 180                                 // DW_AT_GNU_pubnames (0x2134), ULEB128 byte 1 of 2
.b8 66                                  //   ULEB128 byte 2 of 2
.b8 12                                  // DW_FORM_flag
.b8 17                                  // DW_AT_low_pc
.b8 1                                   // DW_FORM_addr
.b8 18                                  // DW_AT_high_pc
.b8 1                                   // DW_FORM_addr
.b8 0                                   // end of attributes (name)
.b8 0                                   // end of attributes (form)
.b8 2                                   // Abbreviation code 2
.b8 46                                  // DW_TAG_subprogram
.b8 0                                   // DW_CHILDREN_no
.b8 17                                  // DW_AT_low_pc
.b8 1                                   // DW_FORM_addr
.b8 18                                  // DW_AT_high_pc
.b8 1                                   // DW_FORM_addr
.b8 64                                  // DW_AT_frame_base
.b8 10                                  // DW_FORM_block1
.b8 135                                 // DW_AT_MIPS_linkage_name (0x2007), ULEB128 byte 1 of 2
.b8 64                                  //   ULEB128 byte 2 of 2
.b8 8                                   // DW_FORM_string
.b8 3                                   // DW_AT_name
.b8 8                                   // DW_FORM_string
.b8 58                                  // DW_AT_decl_file
.b8 11                                  // DW_FORM_data1
.b8 59                                  // DW_AT_decl_line
.b8 11                                  // DW_FORM_data1
.b8 63                                  // DW_AT_external
.b8 12                                  // DW_FORM_flag
.b8 0                                   // end of attributes (name)
.b8 0                                   // end of attributes (form)
.b8 0                                   // end of abbreviation table
}
// DWARF version 2 compile unit with one child subprogram DIE.
// Layout check: 7 header bytes + 114 (compile-unit DIE) + 50 (subprogram DIE)
// + 1 (children terminator) = 172, matching the unit length below.
// Byte values are unchanged; the trailing "| |" residue on every line was
// removed because it is not valid inside a PTX .section body.
.section .debug_info
{
.b32 172                                // unit length (bytes following this field)
.b8 2                                   // DWARF version = 2 (16-bit, low byte)
.b8 0                                   //   (high byte)
.b32 .debug_abbrev                      // offset into .debug_abbrev
.b8 8                                   // address size in bytes
.b8 1                                   // abbrev 1: DW_TAG_compile_unit
// DW_AT_producer = "triton"
.b8 116
.b8 114
.b8 105
.b8 116
.b8 111
.b8 110
.b8 0
.b8 2                                   // DW_AT_language = 2 (DW_LANG_C), low byte
.b8 0                                   //   (high byte)
// DW_AT_name = "c4yseldwmu3to52pbh2md2oeufrq3fcdmapkt4nxdzmyqtgd2ysp.py"
.b8 99
.b8 52
.b8 121
.b8 115
.b8 101
.b8 108
.b8 100
.b8 119
.b8 109
.b8 117
.b8 51
.b8 116
.b8 111
.b8 53
.b8 50
.b8 112
.b8 98
.b8 104
.b8 50
.b8 109
.b8 100
.b8 50
.b8 111
.b8 101
.b8 117
.b8 102
.b8 114
.b8 113
.b8 51
.b8 102
.b8 99
.b8 100
.b8 109
.b8 97
.b8 112
.b8 107
.b8 116
.b8 52
.b8 110
.b8 120
.b8 100
.b8 122
.b8 109
.b8 121
.b8 113
.b8 116
.b8 103
.b8 100
.b8 50
.b8 121
.b8 115
.b8 112
.b8 46
.b8 112
.b8 121
.b8 0
.b32 .debug_line                        // DW_AT_stmt_list
// DW_AT_comp_dir = "/tmp/torchinductor_root/4y"
.b8 47
.b8 116
.b8 109
.b8 112
.b8 47
.b8 116
.b8 111
.b8 114
.b8 99
.b8 104
.b8 105
.b8 110
.b8 100
.b8 117
.b8 99
.b8 116
.b8 111
.b8 114
.b8 95
.b8 114
.b8 111
.b8 111
.b8 116
.b8 47
.b8 52
.b8 121
.b8 0
.b8 1                                   // DW_AT_GNU_pubnames = true
.b64 $L__func_begin0                    // DW_AT_low_pc
.b64 $L__func_end0                      // DW_AT_high_pc
.b8 2                                   // abbrev 2: DW_TAG_subprogram (unit offset 125)
.b64 $L__func_begin0                    // DW_AT_low_pc
.b64 $L__func_end0                      // DW_AT_high_pc
.b8 1                                   // DW_AT_frame_base: block length 1
.b8 156                                 //   DW_OP_call_frame_cfa (0x9c)
// DW_AT_MIPS_linkage_name = "triton__0d1de"
.b8 116
.b8 114
.b8 105
.b8 116
.b8 111
.b8 110
.b8 95
.b8 95
.b8 48
.b8 100
.b8 49
.b8 100
.b8 101
.b8 0
// DW_AT_name = "triton__0d1de"
.b8 116
.b8 114
.b8 105
.b8 116
.b8 111
.b8 110
.b8 95
.b8 95
.b8 48
.b8 100
.b8 49
.b8 100
.b8 101
.b8 0
.b8 1                                   // DW_AT_decl_file = 1
.b8 18                                  // DW_AT_decl_line = 18
.b8 1                                   // DW_AT_external = true
.b8 0                                   // end of compile unit's children
}
// Public-names lookup table: one entry mapping "triton__0d1de" to its DIE.
// Byte values are unchanged; the trailing "| |" residue on every line was
// removed because it is not valid inside a PTX .section body.
.section .debug_pubnames
{
.b32 $L__pubNames_end0-$L__pubNames_start0      // length of the table that follows
$L__pubNames_start0:
.b8 2                                   // version = 2 (16-bit, low byte)
.b8 0                                   //   (high byte)
.b32 .debug_info                        // offset of the compile unit
.b32 176                                // compile unit size: 172 + 4-byte length field
.b32 125                                // DIE offset of the subprogram within the unit
// name = "triton__0d1de"
.b8 116
.b8 114
.b8 105
.b8 116
.b8 111
.b8 110
.b8 95
.b8 95
.b8 48
.b8 100
.b8 49
.b8 100
.b8 101
.b8 0
.b32 0                                  // end of table
$L__pubNames_end0:
}
// Public-types lookup table: header only, no entries.
// Byte values are unchanged; the trailing "| |" residue on every line was
// removed because it is not valid inside a PTX .section body.
.section .debug_pubtypes
{
.b32 $L__pubTypes_end0-$L__pubTypes_start0      // length of the table that follows
$L__pubTypes_start0:
.b8 2                                   // version = 2 (16-bit, low byte)
.b8 0                                   //   (high byte)
.b32 .debug_info                        // offset of the compile unit
.b32 176                                // compile unit size: 172 + 4-byte length field
.b32 0                                  // end of table (no type entries)
$L__pubTypes_end0:
}
// Empty location-list section. (Trailing "| |" residue removed; not PTX syntax.)
.section .debug_loc { }