accel 0.3.1

GPGPU Framework for Rust
Documentation
//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-27506705
// Cuda compilation tools, release 10.2, V10.2.89
// Based on LLVM 3.4svn
//

.version 6.5
.target sm_30
.address_size 64

	// .globl	_Z3subPKiS0_Pi

.visible .entry _Z3subPKiS0_Pi(
	.param .u64 _Z3subPKiS0_Pi_param_0,
	.param .u64 _Z3subPKiS0_Pi_param_1,
	.param .u64 _Z3subPKiS0_Pi_param_2
)
{
	.reg .b32 	%r<8>;
	.reg .b64 	%rd<11>;


	ld.param.u64 	%rd1, [_Z3subPKiS0_Pi_param_0];
	ld.param.u64 	%rd2, [_Z3subPKiS0_Pi_param_1];
	ld.param.u64 	%rd3, [_Z3subPKiS0_Pi_param_2];
	cvta.to.global.u64 	%rd4, %rd3;
	cvta.to.global.u64 	%rd5, %rd2;
	cvta.to.global.u64 	%rd6, %rd1;
	mov.u32 	%r1, %ntid.x;
	mov.u32 	%r2, %ctaid.x;
	mov.u32 	%r3, %tid.x;
	mad.lo.s32 	%r4, %r2, %r1, %r3;
	mul.wide.s32 	%rd7, %r4, 4;
	add.s64 	%rd8, %rd6, %rd7;
	ld.global.u32 	%r5, [%rd8];
	add.s64 	%rd9, %rd5, %rd7;
	ld.global.u32 	%r6, [%rd9];
	sub.s32 	%r7, %r5, %r6;
	add.s64 	%rd10, %rd4, %rd7;
	st.global.u32 	[%rd10], %r7;
	ret;
}