// ArabDesert/Assets/Editor/x64/Bakery/fixPos12_notrimark.ptx
//
// 647 lines
// 22 KiB
// Plaintext

//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-23083092
// Cuda compilation tools, release 9.1, V9.1.85
// Based on LLVM 3.4svn
//
.version 6.1
.target sm_30
.address_size 64
// .globl _Z6oxMainv
.global .align 8 .b8 pixelID[8];
.global .align 8 .b8 resolution[8];
.global .align 4 .b8 normal[12];
.global .align 4 .b8 camPos[12];
.global .align 4 .b8 root[4];
.global .align 4 .u32 imageEnabled;
.global .texref lightmap;
.global .align 16 .b8 tileInfo[16];
.global .align 4 .u32 additive;
.global .align 1 .b8 image_HDR[1];
.global .align 1 .b8 image_HDR2[1];
.global .align 1 .b8 uvfacenormal[1];
.global .align 1 .b8 uvpos[1];
.global .align 1 .b8 uvsmoothpos[1];
.global .align 1 .b8 triangleMarks[1];
.global .align 1 .b8 image_Mask[1];
.global .align 4 .f32 fakeBias;
.global .align 4 .b8 _ZN21rti_internal_typeinfo7pixelIDE[8] = {82, 97, 121, 0, 8, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo10resolutionE[8] = {82, 97, 121, 0, 8, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo6normalE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo6camPosE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo4rootE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo12imageEnabledE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo8tileInfoE[8] = {82, 97, 121, 0, 16, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo8additiveE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo8fakeBiasE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 8 .u64 _ZN21rti_internal_register20reg_bitness_detectorE;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail0E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail1E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail2E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail3E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail4E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail5E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail6E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail7E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail8E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail9E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail0E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail1E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail2E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail3E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail4E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail5E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail6E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail7E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail8E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail9E;
.global .align 4 .u32 _ZN21rti_internal_register14reg_rayIndex_xE;
.global .align 4 .u32 _ZN21rti_internal_register14reg_rayIndex_yE;
.global .align 4 .u32 _ZN21rti_internal_register14reg_rayIndex_zE;
.global .align 8 .b8 _ZN21rti_internal_typename7pixelIDE[6] = {117, 105, 110, 116, 50, 0};
.global .align 8 .b8 _ZN21rti_internal_typename10resolutionE[6] = {117, 105, 110, 116, 50, 0};
.global .align 8 .b8 _ZN21rti_internal_typename6normalE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 8 .b8 _ZN21rti_internal_typename6camPosE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 16 .b8 _ZN21rti_internal_typename4rootE[9] = {114, 116, 79, 98, 106, 101, 99, 116, 0};
.global .align 4 .b8 _ZN21rti_internal_typename12imageEnabledE[4] = {105, 110, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename8tileInfoE[6] = {117, 105, 110, 116, 52, 0};
.global .align 4 .b8 _ZN21rti_internal_typename8additiveE[4] = {105, 110, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename8fakeBiasE[6] = {102, 108, 111, 97, 116, 0};
.global .align 4 .u32 _ZN21rti_internal_typeenum7pixelIDE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum10resolutionE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum6normalE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum6camPosE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum4rootE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum12imageEnabledE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum8tileInfoE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum8additiveE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum8fakeBiasE = 4919;
.global .align 16 .b8 _ZN21rti_internal_semantic7pixelIDE[14] = {114, 116, 76, 97, 117, 110, 99, 104, 73, 110, 100, 101, 120, 0};
.global .align 16 .b8 _ZN21rti_internal_semantic10resolutionE[12] = {114, 116, 76, 97, 117, 110, 99, 104, 68, 105, 109, 0};
.global .align 16 .b8 _ZN21rti_internal_semantic6normalE[17] = {97, 116, 116, 114, 105, 98, 117, 116, 101, 32, 110, 111, 114, 109, 97, 108, 0};
.global .align 1 .b8 _ZN21rti_internal_semantic6camPosE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic4rootE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic12imageEnabledE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic8tileInfoE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic8additiveE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic8fakeBiasE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation7pixelIDE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation10resolutionE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation6normalE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation6camPosE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation4rootE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation12imageEnabledE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation8tileInfoE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation8additiveE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation8fakeBiasE[1];
.visible .entry _Z6oxMainv(
)
{
.local .align 4 .b8 __local_depot0[24];
.reg .b64 %SP;
.reg .b64 %SPL;
.reg .pred %p<28>;
.reg .b16 %rs<11>;
.reg .f32 %f<360>;
.reg .b32 %r<109>;
.reg .b64 %rd<101>;
mov.u64 %rd100, __local_depot0;
cvta.local.u64 %SP, %rd100;
ld.global.v2.u32 {%r6, %r7}, [pixelID];
cvt.u64.u32 %rd7, %r6;
cvt.u64.u32 %rd8, %r7;
mov.u64 %rd11, uvfacenormal;
cvta.global.u64 %rd6, %rd11;
mov.u32 %r4, 2;
mov.u32 %r5, 4;
mov.u64 %rd10, 0;
// inline asm
call (%rd5), _rt_buffer_get_64, (%rd6, %r4, %r5, %rd7, %rd8, %rd10, %rd10);
// inline asm
ld.u32 %r1, [%rd5];
shr.u32 %r10, %r1, 16;
cvt.u16.u32 %rs1, %r10;
and.b16 %rs2, %rs1, 255;
cvt.u16.u32 %rs3, %r1;
or.b16 %rs4, %rs3, %rs2;
setp.eq.s16 %p1, %rs4, 0;
mov.f32 %f338, 0f00000000;
mov.f32 %f339, %f338;
mov.f32 %f340, %f338;
@%p1 bra BB0_2;
ld.u8 %rs5, [%rd5+1];
and.b16 %rs7, %rs3, 255;
cvt.rn.f32.u16 %f103, %rs7;
div.rn.f32 %f104, %f103, 0f437F0000;
fma.rn.f32 %f105, %f104, 0f40000000, 0fBF800000;
cvt.rn.f32.u16 %f106, %rs5;
div.rn.f32 %f107, %f106, 0f437F0000;
fma.rn.f32 %f108, %f107, 0f40000000, 0fBF800000;
cvt.rn.f32.u16 %f109, %rs2;
div.rn.f32 %f110, %f109, 0f437F0000;
fma.rn.f32 %f111, %f110, 0f40000000, 0fBF800000;
mul.f32 %f112, %f108, %f108;
fma.rn.f32 %f113, %f105, %f105, %f112;
fma.rn.f32 %f114, %f111, %f111, %f113;
sqrt.rn.f32 %f115, %f114;
rcp.rn.f32 %f116, %f115;
mul.f32 %f338, %f105, %f116;
mul.f32 %f339, %f108, %f116;
mul.f32 %f340, %f111, %f116;
BB0_2:
ld.global.v2.u32 {%r11, %r12}, [pixelID];
ld.global.v2.u32 {%r14, %r15}, [tileInfo];
add.s32 %r2, %r11, %r14;
add.s32 %r3, %r12, %r15;
setp.eq.f32 %p2, %f339, 0f00000000;
setp.eq.f32 %p3, %f338, 0f00000000;
and.pred %p4, %p3, %p2;
setp.eq.f32 %p5, %f340, 0f00000000;
and.pred %p6, %p4, %p5;
@%p6 bra BB0_24;
bra.uni BB0_3;
BB0_24:
cvt.u64.u32 %rd84, %r2;
cvt.u64.u32 %rd85, %r3;
mov.u64 %rd88, image_HDR;
cvta.global.u64 %rd83, %rd88;
mov.u32 %r91, 16;
// inline asm
call (%rd82), _rt_buffer_get_64, (%rd83, %r4, %r91, %rd84, %rd85, %rd10, %rd10);
// inline asm
mov.f32 %f326, 0f00000000;
st.v4.f32 [%rd82], {%f326, %f326, %f326, %f326};
bra.uni BB0_25;
BB0_3:
ld.global.v2.u32 {%r36, %r37}, [pixelID];
cvt.u64.u32 %rd14, %r36;
cvt.u64.u32 %rd15, %r37;
mov.u64 %rd55, uvpos;
cvta.global.u64 %rd13, %rd55;
mov.u32 %r32, 16;
// inline asm
call (%rd12), _rt_buffer_get_64, (%rd13, %r4, %r32, %rd14, %rd15, %rd10, %rd10);
// inline asm
ld.f32 %f126, [%rd12];
ld.global.v2.u32 {%r40, %r41}, [pixelID];
cvt.u64.u32 %rd20, %r40;
cvt.u64.u32 %rd21, %r41;
// inline asm
call (%rd18), _rt_buffer_get_64, (%rd13, %r4, %r32, %rd20, %rd21, %rd10, %rd10);
// inline asm
ld.f32 %f127, [%rd18+4];
ld.global.v2.u32 {%r44, %r45}, [pixelID];
cvt.u64.u32 %rd26, %r44;
cvt.u64.u32 %rd27, %r45;
// inline asm
call (%rd24), _rt_buffer_get_64, (%rd13, %r4, %r32, %rd26, %rd27, %rd10, %rd10);
// inline asm
abs.f32 %f128, %f126;
setp.gtu.f32 %p7, %f128, 0f7F800000;
abs.f32 %f129, %f127;
setp.gtu.f32 %p8, %f129, 0f7F800000;
ld.f32 %f130, [%rd24+8];
abs.f32 %f131, %f130;
setp.gtu.f32 %p9, %f131, 0f7F800000;
ld.global.v2.u32 {%r48, %r49}, [pixelID];
cvt.u64.u32 %rd32, %r48;
cvt.u64.u32 %rd33, %r49;
// inline asm
call (%rd30), _rt_buffer_get_64, (%rd13, %r4, %r32, %rd32, %rd33, %rd10, %rd10);
// inline asm
ld.f32 %f132, [%rd30+12];
add.f32 %f7, %f132, 0f38D1B717;
mul.f32 %f133, %f126, 0f3456BF95;
selp.f32 %f134, 0f00000000, %f133, %p7;
mul.f32 %f135, %f127, 0f3456BF95;
selp.f32 %f136, 0f00000000, %f135, %p8;
mul.f32 %f137, %f130, 0f3456BF95;
selp.f32 %f138, 0f00000000, %f137, %p9;
abs.f32 %f139, %f338;
div.rn.f32 %f140, %f134, %f139;
abs.f32 %f141, %f339;
div.rn.f32 %f142, %f136, %f141;
abs.f32 %f143, %f340;
div.rn.f32 %f144, %f138, %f143;
abs.f32 %f145, %f140;
abs.f32 %f146, %f142;
abs.f32 %f147, %f144;
mov.f32 %f148, 0f38D1B717;
max.f32 %f149, %f145, %f148;
max.f32 %f150, %f146, %f148;
max.f32 %f151, %f147, %f148;
ld.global.v2.u32 {%r52, %r53}, [pixelID];
cvt.u64.u32 %rd38, %r52;
cvt.u64.u32 %rd39, %r53;
mov.u64 %rd56, uvsmoothpos;
cvta.global.u64 %rd37, %rd56;
// inline asm
call (%rd36), _rt_buffer_get_64, (%rd37, %r4, %r32, %rd38, %rd39, %rd10, %rd10);
// inline asm
ld.f32 %f345, [%rd36];
ld.global.v2.u32 {%r56, %r57}, [pixelID];
cvt.u64.u32 %rd44, %r56;
cvt.u64.u32 %rd45, %r57;
// inline asm
call (%rd42), _rt_buffer_get_64, (%rd37, %r4, %r32, %rd44, %rd45, %rd10, %rd10);
// inline asm
ld.f32 %f346, [%rd42+4];
ld.global.v2.u32 {%r60, %r61}, [pixelID];
cvt.u64.u32 %rd50, %r60;
cvt.u64.u32 %rd51, %r61;
// inline asm
call (%rd48), _rt_buffer_get_64, (%rd37, %r4, %r32, %rd50, %rd51, %rd10, %rd10);
// inline asm
fma.rn.f32 %f10, %f338, %f149, %f345;
fma.rn.f32 %f11, %f339, %f150, %f346;
ld.f32 %f347, [%rd48+8];
fma.rn.f32 %f13, %f340, %f151, %f347;
setp.gt.f32 %p10, %f139, %f143;
neg.f32 %f152, %f339;
selp.f32 %f153, %f152, 0f00000000, %p10;
neg.f32 %f154, %f340;
selp.f32 %f155, %f338, %f154, %p10;
selp.f32 %f156, 0f00000000, %f339, %p10;
mul.f32 %f157, %f155, %f155;
fma.rn.f32 %f158, %f153, %f153, %f157;
fma.rn.f32 %f159, %f156, %f156, %f158;
sqrt.rn.f32 %f160, %f159;
rcp.rn.f32 %f161, %f160;
mul.f32 %f14, %f153, %f161;
mul.f32 %f15, %f155, %f161;
mul.f32 %f16, %f156, %f161;
mul.f32 %f162, %f340, %f15;
mul.f32 %f163, %f339, %f16;
sub.f32 %f17, %f162, %f163;
mul.f32 %f164, %f338, %f16;
mul.f32 %f165, %f340, %f14;
sub.f32 %f18, %f164, %f165;
mul.f32 %f166, %f339, %f14;
mul.f32 %f167, %f338, %f15;
sub.f32 %f19, %f166, %f167;
mov.f32 %f168, 0f3F8147AE;
sqrt.rn.f32 %f169, %f168;
rcp.rn.f32 %f20, %f169;
neg.f32 %f21, %f20;
mul.f32 %f22, %f20, 0f00000000;
mul.f32 %f170, %f20, 0f3DCCCCCD;
mul.f32 %f171, %f10, 0f3456BF95;
mul.f32 %f172, %f11, 0f3456BF95;
mul.f32 %f173, %f13, 0f3456BF95;
abs.f32 %f174, %f171;
abs.f32 %f175, %f172;
abs.f32 %f176, %f173;
max.f32 %f177, %f174, %f175;
max.f32 %f178, %f177, %f176;
max.f32 %f23, %f178, %f148;
mul.f32 %f124, %f7, 0f3FB504F3;
mul.f32 %f25, %f14, %f22;
mul.f32 %f26, %f15, %f22;
mul.f32 %f27, %f16, %f22;
fma.rn.f32 %f179, %f17, %f21, %f25;
fma.rn.f32 %f180, %f18, %f21, %f26;
fma.rn.f32 %f181, %f19, %f21, %f27;
mul.f32 %f28, %f338, %f170;
mul.f32 %f29, %f339, %f170;
mul.f32 %f30, %f340, %f170;
add.f32 %f120, %f179, %f28;
add.f32 %f121, %f180, %f29;
add.f32 %f122, %f181, %f30;
add.u64 %rd54, %SP, 12;
cvta.to.local.u64 %rd57, %rd54;
mov.u32 %r34, 0;
st.local.u32 [%rd57+8], %r34;
st.local.u32 [%rd57+4], %r34;
st.local.u32 [%rd57], %r34;
ld.global.u32 %r33, [root];
mov.f32 %f123, 0f00000000;
mov.u32 %r35, 12;
// inline asm
call _rt_trace_64, (%r33, %f10, %f11, %f13, %f120, %f121, %f122, %r34, %f123, %f124, %rd54, %r35);
// inline asm
ld.local.f32 %f34, [%rd57+4];
ld.local.f32 %f35, [%rd57];
add.f32 %f182, %f35, %f34;
ld.local.f32 %f36, [%rd57+8];
add.f32 %f183, %f182, %f36;
mov.f32 %f348, 0f47C34F80;
setp.eq.f32 %p11, %f183, 0f00000000;
@%p11 bra BB0_6;
mul.f32 %f185, %f34, %f34;
fma.rn.f32 %f186, %f35, %f35, %f185;
fma.rn.f32 %f187, %f36, %f36, %f186;
sqrt.rn.f32 %f37, %f187;
rcp.rn.f32 %f188, %f37;
mul.f32 %f189, %f188, %f35;
mul.f32 %f190, %f188, %f34;
mul.f32 %f191, %f188, %f36;
fma.rn.f32 %f192, %f23, %f189, %f10;
fma.rn.f32 %f193, %f23, %f190, %f11;
fma.rn.f32 %f194, %f23, %f191, %f13;
fma.rn.f32 %f38, %f37, %f120, %f192;
fma.rn.f32 %f39, %f37, %f121, %f193;
fma.rn.f32 %f40, %f37, %f122, %f194;
setp.geu.f32 %p12, %f37, 0f47C34F80;
@%p12 bra BB0_6;
mov.f32 %f345, %f38;
mov.f32 %f346, %f39;
mov.f32 %f347, %f40;
mov.f32 %f348, %f37;
BB0_6:
mov.u32 %r93, 12;
mov.f32 %f327, 0f00000000;
add.u64 %rd90, %SP, 12;
cvta.to.local.u64 %rd89, %rd90;
mov.u32 %r92, 0;
fma.rn.f32 %f203, %f17, %f20, %f25;
fma.rn.f32 %f204, %f18, %f20, %f26;
fma.rn.f32 %f205, %f19, %f20, %f27;
add.f32 %f198, %f203, %f28;
add.f32 %f199, %f204, %f29;
add.f32 %f200, %f205, %f30;
st.local.u32 [%rd89+8], %r92;
st.local.u32 [%rd89+4], %r92;
st.local.u32 [%rd89], %r92;
ld.global.u32 %r64, [root];
// inline asm
call _rt_trace_64, (%r64, %f10, %f11, %f13, %f198, %f199, %f200, %r92, %f327, %f124, %rd90, %r93);
// inline asm
ld.local.f32 %f48, [%rd89+4];
ld.local.f32 %f49, [%rd89];
add.f32 %f206, %f49, %f48;
ld.local.f32 %f50, [%rd89+8];
add.f32 %f207, %f206, %f50;
setp.eq.f32 %p13, %f207, 0f00000000;
@%p13 bra BB0_9;
mul.f32 %f208, %f48, %f48;
fma.rn.f32 %f209, %f49, %f49, %f208;
fma.rn.f32 %f210, %f50, %f50, %f209;
sqrt.rn.f32 %f51, %f210;
rcp.rn.f32 %f211, %f51;
mul.f32 %f212, %f211, %f49;
mul.f32 %f213, %f211, %f48;
mul.f32 %f214, %f211, %f50;
fma.rn.f32 %f215, %f23, %f212, %f10;
fma.rn.f32 %f216, %f23, %f213, %f11;
fma.rn.f32 %f217, %f23, %f214, %f13;
fma.rn.f32 %f52, %f51, %f198, %f215;
fma.rn.f32 %f53, %f51, %f199, %f216;
fma.rn.f32 %f54, %f51, %f200, %f217;
setp.geu.f32 %p14, %f51, %f348;
@%p14 bra BB0_9;
mov.f32 %f345, %f52;
mov.f32 %f346, %f53;
mov.f32 %f347, %f54;
mov.f32 %f348, %f51;
BB0_9:
neg.f32 %f330, %f20;
mul.f32 %f329, %f20, 0f00000000;
mov.u32 %r95, 12;
mov.f32 %f328, 0f00000000;
add.u64 %rd93, %SP, 12;
cvta.to.local.u64 %rd92, %rd93;
mov.u32 %r94, 0;
mul.f32 %f59, %f17, %f329;
fma.rn.f32 %f226, %f14, %f330, %f59;
mul.f32 %f60, %f18, %f329;
fma.rn.f32 %f227, %f15, %f330, %f60;
mul.f32 %f61, %f19, %f329;
fma.rn.f32 %f228, %f16, %f330, %f61;
add.f32 %f221, %f226, %f28;
add.f32 %f222, %f227, %f29;
add.f32 %f223, %f228, %f30;
st.local.u32 [%rd92+8], %r94;
st.local.u32 [%rd92+4], %r94;
st.local.u32 [%rd92], %r94;
ld.global.u32 %r67, [root];
// inline asm
call _rt_trace_64, (%r67, %f10, %f11, %f13, %f221, %f222, %f223, %r94, %f328, %f124, %rd93, %r95);
// inline asm
ld.local.f32 %f65, [%rd92+4];
ld.local.f32 %f66, [%rd92];
add.f32 %f229, %f66, %f65;
ld.local.f32 %f67, [%rd92+8];
add.f32 %f230, %f229, %f67;
setp.eq.f32 %p15, %f230, 0f00000000;
@%p15 bra BB0_12;
mul.f32 %f231, %f65, %f65;
fma.rn.f32 %f232, %f66, %f66, %f231;
fma.rn.f32 %f233, %f67, %f67, %f232;
sqrt.rn.f32 %f68, %f233;
rcp.rn.f32 %f234, %f68;
mul.f32 %f235, %f234, %f66;
mul.f32 %f236, %f234, %f65;
mul.f32 %f237, %f234, %f67;
fma.rn.f32 %f238, %f23, %f235, %f10;
fma.rn.f32 %f239, %f23, %f236, %f11;
fma.rn.f32 %f240, %f23, %f237, %f13;
fma.rn.f32 %f69, %f68, %f221, %f238;
fma.rn.f32 %f70, %f68, %f222, %f239;
fma.rn.f32 %f71, %f68, %f223, %f240;
setp.geu.f32 %p16, %f68, %f348;
@%p16 bra BB0_12;
mov.f32 %f345, %f69;
mov.f32 %f346, %f70;
mov.f32 %f347, %f71;
mov.f32 %f348, %f68;
BB0_12:
mov.u32 %r97, 12;
mov.f32 %f331, 0f00000000;
add.u64 %rd96, %SP, 12;
cvta.to.local.u64 %rd95, %rd96;
mov.u32 %r96, 0;
fma.rn.f32 %f249, %f14, %f20, %f59;
fma.rn.f32 %f250, %f15, %f20, %f60;
fma.rn.f32 %f251, %f16, %f20, %f61;
add.f32 %f244, %f249, %f28;
add.f32 %f245, %f250, %f29;
add.f32 %f246, %f251, %f30;
st.local.u32 [%rd95+8], %r96;
st.local.u32 [%rd95+4], %r96;
st.local.u32 [%rd95], %r96;
ld.global.u32 %r70, [root];
// inline asm
call _rt_trace_64, (%r70, %f10, %f11, %f13, %f244, %f245, %f246, %r96, %f331, %f124, %rd96, %r97);
// inline asm
ld.local.f32 %f79, [%rd95+4];
ld.local.f32 %f80, [%rd95];
add.f32 %f252, %f80, %f79;
ld.local.f32 %f81, [%rd95+8];
add.f32 %f253, %f252, %f81;
setp.eq.f32 %p17, %f253, 0f00000000;
@%p17 bra BB0_15;
mul.f32 %f254, %f79, %f79;
fma.rn.f32 %f255, %f80, %f80, %f254;
fma.rn.f32 %f256, %f81, %f81, %f255;
sqrt.rn.f32 %f257, %f256;
rcp.rn.f32 %f258, %f257;
mul.f32 %f259, %f258, %f80;
mul.f32 %f260, %f258, %f79;
mul.f32 %f261, %f258, %f81;
fma.rn.f32 %f262, %f23, %f259, %f10;
fma.rn.f32 %f263, %f23, %f260, %f11;
fma.rn.f32 %f264, %f23, %f261, %f13;
fma.rn.f32 %f82, %f257, %f244, %f262;
fma.rn.f32 %f83, %f257, %f245, %f263;
fma.rn.f32 %f84, %f257, %f246, %f264;
setp.geu.f32 %p18, %f257, %f348;
@%p18 bra BB0_15;
mov.f32 %f345, %f82;
mov.f32 %f346, %f83;
mov.f32 %f347, %f84;
BB0_15:
abs.f32 %f265, %f345;
setp.gtu.f32 %p19, %f265, 0f7F800000;
selp.f32 %f356, 0f00000000, %f345, %p19;
abs.f32 %f266, %f346;
setp.gtu.f32 %p20, %f266, 0f7F800000;
selp.f32 %f357, 0f00000000, %f346, %p20;
abs.f32 %f267, %f347;
setp.gtu.f32 %p21, %f267, 0f7F800000;
selp.f32 %f358, 0f00000000, %f347, %p21;
ld.global.f32 %f91, [fakeBias];
setp.eq.f32 %p22, %f91, 0f00000000;
@%p22 bra BB0_17;
fma.rn.f32 %f356, %f338, %f91, %f356;
fma.rn.f32 %f357, %f339, %f91, %f357;
fma.rn.f32 %f358, %f340, %f91, %f358;
BB0_17:
mov.u32 %r99, 16;
mov.u64 %rd98, 0;
mov.u32 %r98, 2;
cvt.u64.u32 %rd67, %r3;
cvt.u64.u32 %rd66, %r2;
mov.u64 %rd70, image_HDR;
cvta.global.u64 %rd65, %rd70;
// inline asm
call (%rd64), _rt_buffer_get_64, (%rd65, %r98, %r99, %rd66, %rd67, %rd98, %rd98);
// inline asm
mov.f32 %f268, 0f3F800000;
st.v4.f32 [%rd64], {%f356, %f357, %f358, %f268};
ld.global.u8 %rs9, [imageEnabled];
and.b16 %rs10, %rs9, 32;
setp.eq.s16 %p23, %rs10, 0;
@%p23 bra BB0_25;
add.f32 %f333, %f132, 0f38D1B717;
mov.f32 %f332, 0f38D1B717;
mov.u32 %r101, 12;
mov.u32 %r100, 0;
mul.f32 %f276, %f333, 0f41000000;
add.u64 %rd71, %SP, 0;
cvta.to.local.u64 %rd4, %rd71;
st.local.u32 [%rd4+8], %r100;
st.local.u32 [%rd4+4], %r100;
st.local.u32 [%rd4], %r100;
ld.global.u32 %r75, [root];
// inline asm
call _rt_trace_64, (%r75, %f10, %f11, %f13, %f120, %f121, %f122, %r100, %f332, %f276, %rd71, %r101);
// inline asm
ld.local.f32 %f278, [%rd4+4];
ld.local.f32 %f279, [%rd4];
add.f32 %f280, %f279, %f278;
ld.local.f32 %f281, [%rd4+8];
add.f32 %f282, %f280, %f281;
setp.neu.f32 %p24, %f282, 0f00000000;
mov.f32 %f359, 0f437F0000;
@%p24 bra BB0_23;
mov.f32 %f334, 0f38D1B717;
mov.u32 %r103, 12;
mov.u32 %r102, 0;
st.local.u32 [%rd4+8], %r102;
st.local.u32 [%rd4+4], %r102;
st.local.u32 [%rd4], %r102;
ld.global.u32 %r78, [root];
// inline asm
call _rt_trace_64, (%r78, %f10, %f11, %f13, %f198, %f199, %f200, %r102, %f334, %f276, %rd71, %r103);
// inline asm
ld.local.f32 %f292, [%rd4+4];
ld.local.f32 %f293, [%rd4];
add.f32 %f294, %f293, %f292;
ld.local.f32 %f295, [%rd4+8];
add.f32 %f296, %f294, %f295;
setp.neu.f32 %p25, %f296, 0f00000000;
@%p25 bra BB0_23;
mov.f32 %f335, 0f38D1B717;
mov.u32 %r105, 12;
mov.u32 %r104, 0;
st.local.u32 [%rd4+8], %r104;
st.local.u32 [%rd4+4], %r104;
st.local.u32 [%rd4], %r104;
ld.global.u32 %r81, [root];
// inline asm
call _rt_trace_64, (%r81, %f10, %f11, %f13, %f221, %f222, %f223, %r104, %f335, %f276, %rd71, %r105);
// inline asm
ld.local.f32 %f306, [%rd4+4];
ld.local.f32 %f307, [%rd4];
add.f32 %f308, %f307, %f306;
ld.local.f32 %f309, [%rd4+8];
add.f32 %f310, %f308, %f309;
setp.neu.f32 %p26, %f310, 0f00000000;
@%p26 bra BB0_23;
mov.f32 %f336, 0f38D1B717;
mov.u32 %r107, 12;
mov.u32 %r106, 0;
st.local.u32 [%rd4+8], %r106;
st.local.u32 [%rd4+4], %r106;
st.local.u32 [%rd4], %r106;
ld.global.u32 %r84, [root];
// inline asm
call _rt_trace_64, (%r84, %f10, %f11, %f13, %f244, %f245, %f246, %r106, %f336, %f276, %rd71, %r107);
// inline asm
ld.local.f32 %f320, [%rd4+4];
ld.local.f32 %f321, [%rd4];
add.f32 %f322, %f321, %f320;
ld.local.f32 %f323, [%rd4+8];
add.f32 %f324, %f322, %f323;
setp.neu.f32 %p27, %f324, 0f00000000;
@%p27 bra BB0_23;
mov.f32 %f359, 0f00000000;
BB0_23:
mov.u64 %rd99, 0;
mov.u32 %r108, 2;
mov.u64 %rd81, image_Mask;
cvta.global.u64 %rd76, %rd81;
mov.u32 %r88, 1;
// inline asm
call (%rd75), _rt_buffer_get_64, (%rd76, %r108, %r88, %rd66, %rd67, %rd99, %rd99);
// inline asm
cvt.rzi.u32.f32 %r89, %f359;
st.u8 [%rd75], %r89;
BB0_25:
ret;
}