//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-27506705
// Cuda compilation tools, release 10.2, V10.2.89
// Based on LLVM 3.4svn
//
.version 6.5
.target sm_30
.address_size 64
// .globl _Z3subPKiS0_Pi
.visible .entry _Z3subPKiS0_Pi(
.param .u64 _Z3subPKiS0_Pi_param_0,
.param .u64 _Z3subPKiS0_Pi_param_1,
.param .u64 _Z3subPKiS0_Pi_param_2
)
{
.reg .b32 %r<8>;
.reg .b64 %rd<11>;
ld.param.u64 %rd1, [_Z3subPKiS0_Pi_param_0];
ld.param.u64 %rd2, [_Z3subPKiS0_Pi_param_1];
ld.param.u64 %rd3, [_Z3subPKiS0_Pi_param_2];
cvta.to.global.u64 %rd4, %rd3;
cvta.to.global.u64 %rd5, %rd2;
cvta.to.global.u64 %rd6, %rd1;
mov.u32 %r1, %ntid.x;
mov.u32 %r2, %ctaid.x;
mov.u32 %r3, %tid.x;
mad.lo.s32 %r4, %r2, %r1, %r3;
mul.wide.s32 %rd7, %r4, 4;
add.s64 %rd8, %rd6, %rd7;
ld.global.u32 %r5, [%rd8];
add.s64 %rd9, %rd5, %rd7;
ld.global.u32 %r6, [%rd9];
sub.s32 %r7, %r5, %r6;
add.s64 %rd10, %rd4, %rd7;
st.global.u32 [%rd10], %r7;
ret;
}