Files
PrinceOfGlory/Assets/Editor/x64/Bakery/lmPreview.ptx
kridoo 6e91a0c7f0 111
2025-09-15 17:32:08 +08:00

2898 lines
86 KiB
Plaintext

//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-23083092
// Cuda compilation tools, release 9.1, V9.1.85
// Based on LLVM 3.4svn
//
// PTX ISA version this module is written against.
.version 6.1
// Target architecture the module is generated for.
.target sm_30
// Addresses in this module are 64 bits wide.
.address_size 64
// .globl _Z6oxMainv
// ---------------------------------------------------------------------------
// Module-scope program variables.
// The quoted type names and semantics below are decoded from the
// rti_internal_typename / rti_internal_semantic byte strings declared later
// in this file for the variable of the same name.
// ---------------------------------------------------------------------------
// "uint2", semantic "rtLaunchIndex". Loaded as a v2.u32 pair by the entry point.
.global .align 8 .b8 pixelID[8];
// "uint2", semantic "rtLaunchDim".
.global .align 8 .b8 resolution[8];
// "float3", semantic "attribute normal".
.global .align 4 .b8 normal[12];
// "float3".
.global .align 4 .b8 camPos[12];
// "rtObject". Loaded as a u32 and passed as the first argument of _rt_trace_64.
.global .align 4 .b8 root[4];
// "int".
.global .align 4 .u32 imageEnabled;
// Texture reference.
.global .texref lightmap;
// "uint4".
.global .align 16 .b8 tileInfo[16];
// "int".
.global .align 4 .u32 additive;
// One-byte placeholder symbols. The entry point takes the generic address of
// rnd_seeds, GBufferPos, GBufferNormal, GBufferAtten and globalLights
// (cvta.global) and passes it as the first argument of _rt_buffer_get_64 /
// _rt_buffer_get_size_64, so the declared size of 1 is not the size of the
// data that is actually accessed.
// NOTE(review): the other symbols in this group are presumably used the same
// way further down in the entry point -- confirm.
.global .align 1 .b8 accumBufferAdd[1];
.global .align 1 .b8 accumBufferLerp[1];
.global .align 1 .b8 GBufferPos[1];
.global .align 1 .b8 GBufferNormal[1];
.global .align 1 .b8 GBufferAtten[1];
.global .align 1 .b8 colorOutput[1];
.global .align 1 .b8 rnd_seeds[1];
.global .align 1 .b8 globalLights[1];
.global .align 1 .b8 localLights[1];
.global .align 1 .b8 localLightIndices[1];
// "int".
.global .align 4 .u32 tileCubemap;
// Camera description, each "float3". When bounceFlag == 0 the entry point
// builds the ray origin from cameraPos and the ray direction from
// cameraRht / cameraUp / cameraFwd scaled by cameraFov.
.global .align 4 .b8 cameraRht[12];
.global .align 4 .b8 cameraUp[12];
.global .align 4 .b8 cameraFwd[12];
.global .align 4 .b8 cameraPos[12];
// Scalars, each "float".
.global .align 4 .f32 cameraFov;
.global .align 4 .f32 cameraExp;
.global .align 4 .f32 integration;
// Flags, each "int". bounceFlag is compared against 0 by the entry point to
// choose between the camera-ray path and the G-buffer based path.
.global .align 4 .u32 finalBounceFlag;
.global .align 4 .u32 bounceFlag;
// "uint4". Its components are added to pixelID and masked with 255 to form
// the 2D index used to read rnd_seeds.
.global .align 16 .b8 rndOffset[16];
// "int".
.global .align 4 .u32 firstSkylight;
// "float". Selected as the weight when the hit payload value tested by the
// entry point is negative (otherwise 1.0 is used).
.global .align 4 .f32 backFaceWeight;
// ---------------------------------------------------------------------------
// rti_internal_typeinfo::<variable> -- one 8-byte record per program variable.
//   bytes 0-3: the ASCII characters 'R', 'a', 'y' followed by 0
//   bytes 4-7: read as a little-endian u32, the declared byte size of the
//              variable of the same name (4, 8, 12 or 16)
// NOTE(review): presumably OptiX's variable-kind tag plus sizeof(type) --
// confirm against the OptiX headers.
// ---------------------------------------------------------------------------
.global .align 4 .b8 _ZN21rti_internal_typeinfo7pixelIDE[8] = {82, 97, 121, 0, 8, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo10resolutionE[8] = {82, 97, 121, 0, 8, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo6normalE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo6camPosE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo4rootE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo12imageEnabledE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo8tileInfoE[8] = {82, 97, 121, 0, 16, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo8additiveE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo11tileCubemapE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo9cameraRhtE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo8cameraUpE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo9cameraFwdE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo9cameraPosE[8] = {82, 97, 121, 0, 12, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo9cameraFovE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo9cameraExpE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo11integrationE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo15finalBounceFlagE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo10bounceFlagE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo9rndOffsetE[8] = {82, 97, 121, 0, 16, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo13firstSkylightE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
.global .align 4 .b8 _ZN21rti_internal_typeinfo14backFaceWeightE[8] = {82, 97, 121, 0, 4, 0, 0, 0};
// ---------------------------------------------------------------------------
// rti_internal_register::* -- globals declared without an initializer:
//   - reg_bitness_detector            (one u64)
//   - reg_exception_64_detail0 .. 9   (ten u64 slots)
//   - reg_exception_detail0 .. 9      (ten u32 slots)
//   - reg_rayIndex_x / _y / _z        (three u32 components)
// NOTE(review): presumably populated and consumed by the OptiX runtime rather
// than by this module -- confirm.
// ---------------------------------------------------------------------------
.global .align 8 .u64 _ZN21rti_internal_register20reg_bitness_detectorE;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail0E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail1E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail2E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail3E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail4E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail5E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail6E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail7E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail8E;
.global .align 8 .u64 _ZN21rti_internal_register24reg_exception_64_detail9E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail0E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail1E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail2E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail3E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail4E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail5E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail6E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail7E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail8E;
.global .align 4 .u32 _ZN21rti_internal_register21reg_exception_detail9E;
.global .align 4 .u32 _ZN21rti_internal_register14reg_rayIndex_xE;
.global .align 4 .u32 _ZN21rti_internal_register14reg_rayIndex_yE;
.global .align 4 .u32 _ZN21rti_internal_register14reg_rayIndex_zE;
// ---------------------------------------------------------------------------
// rti_internal_typename::<variable> -- NUL-terminated ASCII type-name string
// for each program variable. The byte lists used below decode as:
//   {117, 105, 110, 116, 50, 0}               "uint2"
//   {117, 105, 110, 116, 52, 0}               "uint4"
//   {102, 108, 111, 97, 116, 51, 0}           "float3"
//   {102, 108, 111, 97, 116, 0}               "float"
//   {105, 110, 116, 0}                        "int"
//   {114, 116, 79, 98, 106, 101, 99, 116, 0}  "rtObject"
// ---------------------------------------------------------------------------
.global .align 8 .b8 _ZN21rti_internal_typename7pixelIDE[6] = {117, 105, 110, 116, 50, 0};
.global .align 8 .b8 _ZN21rti_internal_typename10resolutionE[6] = {117, 105, 110, 116, 50, 0};
.global .align 8 .b8 _ZN21rti_internal_typename6normalE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 8 .b8 _ZN21rti_internal_typename6camPosE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 16 .b8 _ZN21rti_internal_typename4rootE[9] = {114, 116, 79, 98, 106, 101, 99, 116, 0};
.global .align 4 .b8 _ZN21rti_internal_typename12imageEnabledE[4] = {105, 110, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename8tileInfoE[6] = {117, 105, 110, 116, 52, 0};
.global .align 4 .b8 _ZN21rti_internal_typename8additiveE[4] = {105, 110, 116, 0};
.global .align 4 .b8 _ZN21rti_internal_typename11tileCubemapE[4] = {105, 110, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename9cameraRhtE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 8 .b8 _ZN21rti_internal_typename8cameraUpE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 8 .b8 _ZN21rti_internal_typename9cameraFwdE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 8 .b8 _ZN21rti_internal_typename9cameraPosE[7] = {102, 108, 111, 97, 116, 51, 0};
.global .align 8 .b8 _ZN21rti_internal_typename9cameraFovE[6] = {102, 108, 111, 97, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename9cameraExpE[6] = {102, 108, 111, 97, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename11integrationE[6] = {102, 108, 111, 97, 116, 0};
.global .align 4 .b8 _ZN21rti_internal_typename15finalBounceFlagE[4] = {105, 110, 116, 0};
.global .align 4 .b8 _ZN21rti_internal_typename10bounceFlagE[4] = {105, 110, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename9rndOffsetE[6] = {117, 105, 110, 116, 52, 0};
.global .align 4 .b8 _ZN21rti_internal_typename13firstSkylightE[4] = {105, 110, 116, 0};
.global .align 8 .b8 _ZN21rti_internal_typename14backFaceWeightE[6] = {102, 108, 111, 97, 116, 0};
// ---------------------------------------------------------------------------
// rti_internal_typeenum::<variable> -- one u32 per program variable. Every
// entry holds the same value, 4919 (0x1337), regardless of the variable type.
// NOTE(review): presumably OptiX's "unknown / not specified" type-enum
// sentinel -- confirm against the OptiX headers.
// ---------------------------------------------------------------------------
.global .align 4 .u32 _ZN21rti_internal_typeenum7pixelIDE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum10resolutionE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum6normalE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum6camPosE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum4rootE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum12imageEnabledE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum8tileInfoE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum8additiveE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum11tileCubemapE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum9cameraRhtE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum8cameraUpE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum9cameraFwdE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum9cameraPosE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum9cameraFovE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum9cameraExpE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum11integrationE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum15finalBounceFlagE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum10bounceFlagE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum9rndOffsetE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum13firstSkylightE = 4919;
.global .align 4 .u32 _ZN21rti_internal_typeenum14backFaceWeightE = 4919;
// ---------------------------------------------------------------------------
// rti_internal_semantic::<variable> -- NUL-terminated ASCII semantic string
// for each program variable. Only the first three carry text:
//   pixelID     "rtLaunchIndex"
//   resolution  "rtLaunchDim"
//   normal      "attribute normal"
// All remaining entries are one-byte arrays with no initializer.
// ---------------------------------------------------------------------------
.global .align 16 .b8 _ZN21rti_internal_semantic7pixelIDE[14] = {114, 116, 76, 97, 117, 110, 99, 104, 73, 110, 100, 101, 120, 0};
.global .align 16 .b8 _ZN21rti_internal_semantic10resolutionE[12] = {114, 116, 76, 97, 117, 110, 99, 104, 68, 105, 109, 0};
.global .align 16 .b8 _ZN21rti_internal_semantic6normalE[17] = {97, 116, 116, 114, 105, 98, 117, 116, 101, 32, 110, 111, 114, 109, 97, 108, 0};
.global .align 1 .b8 _ZN21rti_internal_semantic6camPosE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic4rootE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic12imageEnabledE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic8tileInfoE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic8additiveE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic11tileCubemapE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic9cameraRhtE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic8cameraUpE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic9cameraFwdE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic9cameraPosE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic9cameraFovE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic9cameraExpE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic11integrationE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic15finalBounceFlagE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic10bounceFlagE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic9rndOffsetE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic13firstSkylightE[1];
.global .align 1 .b8 _ZN21rti_internal_semantic14backFaceWeightE[1];
// ---------------------------------------------------------------------------
// rti_internal_annotation::<variable> -- one entry per program variable.
// Every entry is a one-byte array with no initializer; none carries text.
// ---------------------------------------------------------------------------
.global .align 1 .b8 _ZN23rti_internal_annotation7pixelIDE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation10resolutionE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation6normalE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation6camPosE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation4rootE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation12imageEnabledE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation8tileInfoE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation8additiveE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation11tileCubemapE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation9cameraRhtE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation8cameraUpE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation9cameraFwdE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation9cameraPosE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation9cameraFovE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation9cameraExpE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation11integrationE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation15finalBounceFlagE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation10bounceFlagE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation9rndOffsetE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation13firstSkylightE[1];
.global .align 1 .b8 _ZN23rti_internal_annotation14backFaceWeightE[1];
// ---------------------------------------------------------------------------
// __cudart_i2opi_f -- 24 constant bytes that the entry point reads as six
// 32-bit words with ld.const.u32. As little-endian words, from index 0 to 5:
//   0x3C439041 0xDB629599 0xF534DDC0 0xFC2757D1 0x4E441529 0xA2F9836E
// Read from the last word to the first, this is the hexadecimal fraction
// 0.A2F9836E 4E441529 FC2757D1 F534DDC0 DB629599 3C439041, the leading 192
// fractional bits of 2/pi, stored least-significant word first.
// The entry point walks the table in six-iteration loops, multiply-
// accumulating each word (mad.lo.cc / madc.hi) with a 32-bit value built from
// the argument's float bits; those loops run only when the argument's
// magnitude exceeds 0f47CE4780 (105615.0).
// ---------------------------------------------------------------------------
.const .align 4 .b8 __cudart_i2opi_f[24] = {65, 144, 67, 60, 153, 149, 98, 219, 192, 221, 52, 245, 209, 87, 39, 252, 41, 21, 68, 78, 110, 131, 249, 162};
.visible .entry _Z6oxMainv(
)
{
.local .align 4 .b8 __local_depot0[60];
.reg .b64 %SP;
.reg .b64 %SPL;
.reg .pred %p<197>;
.reg .b16 %rs<18>;
.reg .f32 %f<1537>;
.reg .b32 %r<777>;
.reg .b64 %rd<259>;
mov.u64 %rd258, __local_depot0;
cvta.local.u64 %SP, %rd258;
ld.global.v2.u32 {%r227, %r228}, [pixelID];
ld.global.v4.u32 {%r230, %r231, %r232, %r233}, [rndOffset];
add.s32 %r235, %r230, %r227;
and.b32 %r236, %r235, 255;
add.s32 %r239, %r231, %r228;
and.b32 %r240, %r239, 255;
add.s32 %r242, %r232, %r227;
and.b32 %r243, %r242, 255;
add.s32 %r245, %r233, %r228;
and.b32 %r246, %r245, 255;
cvt.u64.u32 %rd59, %r236;
cvt.u64.u32 %rd60, %r240;
mov.u64 %rd75, rnd_seeds;
cvta.global.u64 %rd46, %rd75;
mov.u32 %r225, 2;
mov.u32 %r226, 3;
mov.u64 %rd253, 0;
// inline asm
call (%rd45), _rt_buffer_get_64, (%rd46, %r225, %r226, %rd59, %rd60, %rd253, %rd253);
// inline asm
ld.u8 %rs4, [%rd45];
cvt.rn.f32.u16 %f416, %rs4;
div.rn.f32 %f1, %f416, 0f437F0000;
// inline asm
call (%rd51), _rt_buffer_get_64, (%rd46, %r225, %r226, %rd59, %rd60, %rd253, %rd253);
// inline asm
ld.u8 %rs5, [%rd51+1];
cvt.rn.f32.u16 %f417, %rs5;
div.rn.f32 %f2, %f417, 0f437F0000;
// inline asm
call (%rd57), _rt_buffer_get_64, (%rd46, %r225, %r226, %rd59, %rd60, %rd253, %rd253);
// inline asm
ld.u8 %rs6, [%rd57+2];
cvt.rn.f32.u16 %f418, %rs6;
div.rn.f32 %f3, %f418, 0f437F0000;
cvt.u64.u32 %rd71, %r243;
cvt.u64.u32 %rd72, %r246;
// inline asm
call (%rd63), _rt_buffer_get_64, (%rd46, %r225, %r226, %rd71, %rd72, %rd253, %rd253);
// inline asm
ld.u8 %rs1, [%rd63];
// inline asm
call (%rd69), _rt_buffer_get_64, (%rd46, %r225, %r226, %rd71, %rd72, %rd253, %rd253);
// inline asm
ld.global.u32 %r247, [bounceFlag];
setp.eq.s32 %p6, %r247, 0;
@%p6 bra BB0_48;
ld.u8 %rs7, [%rd69+1];
cvt.rn.f32.u16 %f419, %rs7;
div.rn.f32 %f420, %f419, 0f437F0000;
cvt.rn.f32.u16 %f421, %rs1;
div.rn.f32 %f422, %f421, 0f437F0000;
ld.global.v2.u32 {%r252, %r253}, [pixelID];
cvt.u64.u32 %rd78, %r252;
cvt.u64.u32 %rd79, %r253;
mov.u64 %rd88, GBufferPos;
cvta.global.u64 %rd77, %rd88;
mov.u32 %r251, 12;
// inline asm
call (%rd76), _rt_buffer_get_64, (%rd77, %r225, %r251, %rd78, %rd79, %rd253, %rd253);
// inline asm
ld.f32 %f1454, [%rd76+8];
ld.f32 %f1453, [%rd76+4];
ld.f32 %f1452, [%rd76];
ld.global.v2.u32 {%r256, %r257}, [pixelID];
cvt.u64.u32 %rd84, %r256;
cvt.u64.u32 %rd85, %r257;
mov.u64 %rd89, GBufferNormal;
cvta.global.u64 %rd83, %rd89;
// inline asm
call (%rd82), _rt_buffer_get_64, (%rd83, %r225, %r251, %rd84, %rd85, %rd253, %rd253);
// inline asm
ld.f32 %f9, [%rd82+4];
ld.f32 %f8, [%rd82+8];
ld.f32 %f7, [%rd82];
abs.f32 %f423, %f7;
abs.f32 %f424, %f8;
setp.gt.f32 %p7, %f423, %f424;
neg.f32 %f425, %f9;
neg.f32 %f426, %f8;
selp.f32 %f427, %f425, 0f00000000, %p7;
selp.f32 %f428, %f7, %f426, %p7;
selp.f32 %f429, 0f00000000, %f9, %p7;
mul.f32 %f430, %f428, %f428;
fma.rn.f32 %f431, %f427, %f427, %f430;
fma.rn.f32 %f432, %f429, %f429, %f431;
sqrt.rn.f32 %f433, %f432;
rcp.rn.f32 %f434, %f433;
mul.f32 %f10, %f427, %f434;
mul.f32 %f11, %f428, %f434;
mul.f32 %f12, %f429, %f434;
sqrt.rn.f32 %f13, %f422;
mul.f32 %f1443, %f420, 0f40C90FDB;
add.u64 %rd90, %SP, 32;
cvta.to.local.u64 %rd2, %rd90;
abs.f32 %f15, %f1443;
setp.neu.f32 %p8, %f15, 0f7F800000;
mov.f32 %f1437, %f1443;
@%p8 bra BB0_3;
mov.f32 %f435, 0f00000000;
mul.rn.f32 %f1437, %f1443, %f435;
BB0_3:
mul.f32 %f436, %f1437, 0f3F22F983;
cvt.rni.s32.f32 %r726, %f436;
cvt.rn.f32.s32 %f437, %r726;
neg.f32 %f438, %f437;
mov.f32 %f439, 0f3FC90FDA;
fma.rn.f32 %f440, %f438, %f439, %f1437;
mov.f32 %f441, 0f33A22168;
fma.rn.f32 %f442, %f438, %f441, %f440;
mov.f32 %f443, 0f27C234C5;
fma.rn.f32 %f1438, %f438, %f443, %f442;
abs.f32 %f444, %f1437;
add.s64 %rd3, %rd2, 24;
setp.leu.f32 %p9, %f444, 0f47CE4780;
@%p9 bra BB0_14;
mov.b32 %r2, %f1437;
shr.u32 %r3, %r2, 23;
shl.b32 %r262, %r2, 8;
or.b32 %r4, %r262, -2147483648;
mov.u32 %r718, 0;
mov.u64 %rd246, __cudart_i2opi_f;
mov.u32 %r717, -6;
mov.u64 %rd247, %rd2;
BB0_5:
.pragma "nounroll";
ld.const.u32 %r265, [%rd246];
// inline asm
{
mad.lo.cc.u32 %r263, %r265, %r4, %r718;
madc.hi.u32 %r718, %r265, %r4, 0;
}
// inline asm
st.local.u32 [%rd247], %r263;
add.s64 %rd247, %rd247, 4;
add.s64 %rd246, %rd246, 4;
add.s32 %r717, %r717, 1;
setp.ne.s32 %p10, %r717, 0;
@%p10 bra BB0_5;
and.b32 %r268, %r3, 255;
add.s32 %r269, %r268, -128;
shr.u32 %r270, %r269, 5;
and.b32 %r9, %r2, -2147483648;
st.local.u32 [%rd3], %r718;
mov.u32 %r271, 6;
sub.s32 %r272, %r271, %r270;
mul.wide.s32 %rd92, %r272, 4;
add.s64 %rd8, %rd2, %rd92;
ld.local.u32 %r719, [%rd8];
ld.local.u32 %r720, [%rd8+-4];
and.b32 %r12, %r3, 31;
setp.eq.s32 %p11, %r12, 0;
@%p11 bra BB0_8;
mov.u32 %r273, 32;
sub.s32 %r274, %r273, %r12;
shr.u32 %r275, %r720, %r274;
shl.b32 %r276, %r719, %r12;
add.s32 %r719, %r275, %r276;
ld.local.u32 %r277, [%rd8+-8];
shr.u32 %r278, %r277, %r274;
shl.b32 %r279, %r720, %r12;
add.s32 %r720, %r278, %r279;
BB0_8:
shr.u32 %r280, %r720, 30;
shl.b32 %r281, %r719, 2;
add.s32 %r721, %r280, %r281;
shl.b32 %r18, %r720, 2;
shr.u32 %r282, %r721, 31;
shr.u32 %r283, %r719, 30;
add.s32 %r19, %r282, %r283;
setp.eq.s32 %p12, %r282, 0;
@%p12 bra BB0_9;
not.b32 %r284, %r721;
neg.s32 %r723, %r18;
setp.eq.s32 %p13, %r18, 0;
selp.u32 %r285, 1, 0, %p13;
add.s32 %r721, %r285, %r284;
xor.b32 %r722, %r9, -2147483648;
bra.uni BB0_11;
BB0_48:
ld.global.f32 %f1452, [cameraPos];
ld.global.f32 %f1453, [cameraPos+4];
ld.global.f32 %f1454, [cameraPos+8];
ld.global.v2.u32 {%r352, %r353}, [resolution];
cvt.rn.f32.u32 %f506, %r352;
cvt.rn.f32.u32 %f507, %r353;
div.rn.f32 %f508, %f506, %f507;
ld.global.v2.u32 {%r356, %r357}, [pixelID];
cvt.rn.f32.u32 %f509, %r356;
add.f32 %f510, %f1, %f509;
div.rn.f32 %f511, %f510, %f506;
cvt.rn.f32.u32 %f512, %r357;
add.f32 %f513, %f2, %f512;
div.rn.f32 %f514, %f513, %f507;
fma.rn.f32 %f515, %f511, 0f40000000, 0fBF800000;
fma.rn.f32 %f516, %f514, 0f40000000, 0fBF800000;
ld.global.f32 %f517, [cameraFov];
mul.f32 %f518, %f508, %f517;
ld.global.f32 %f519, [cameraRht];
mul.f32 %f520, %f515, %f519;
ld.global.f32 %f521, [cameraRht+4];
mul.f32 %f522, %f515, %f521;
ld.global.f32 %f523, [cameraRht+8];
mul.f32 %f524, %f515, %f523;
ld.global.f32 %f525, [cameraFwd];
fma.rn.f32 %f526, %f518, %f520, %f525;
ld.global.f32 %f527, [cameraFwd+4];
fma.rn.f32 %f528, %f518, %f522, %f527;
ld.global.f32 %f529, [cameraFwd+8];
fma.rn.f32 %f530, %f518, %f524, %f529;
ld.global.f32 %f531, [cameraUp];
mul.f32 %f532, %f516, %f531;
ld.global.f32 %f533, [cameraUp+4];
mul.f32 %f534, %f516, %f533;
ld.global.f32 %f535, [cameraUp+8];
mul.f32 %f536, %f516, %f535;
fma.rn.f32 %f537, %f517, %f532, %f526;
fma.rn.f32 %f538, %f517, %f534, %f528;
fma.rn.f32 %f539, %f517, %f536, %f530;
mul.f32 %f540, %f538, %f538;
fma.rn.f32 %f541, %f537, %f537, %f540;
fma.rn.f32 %f542, %f539, %f539, %f541;
sqrt.rn.f32 %f543, %f542;
rcp.rn.f32 %f544, %f543;
mul.f32 %f62, %f537, %f544;
mul.f32 %f63, %f538, %f544;
mul.f32 %f64, %f544, %f539;
bra.uni BB0_49;
BB0_9:
mov.u32 %r722, %r9;
mov.u32 %r723, %r18;
BB0_11:
clz.b32 %r725, %r721;
setp.eq.s32 %p14, %r725, 0;
shl.b32 %r286, %r721, %r725;
mov.u32 %r287, 32;
sub.s32 %r288, %r287, %r725;
shr.u32 %r289, %r723, %r288;
add.s32 %r290, %r289, %r286;
selp.b32 %r27, %r721, %r290, %p14;
mov.u32 %r291, -921707870;
mul.hi.u32 %r724, %r27, %r291;
setp.eq.s32 %p15, %r9, 0;
neg.s32 %r292, %r19;
selp.b32 %r726, %r19, %r292, %p15;
setp.lt.s32 %p16, %r724, 1;
@%p16 bra BB0_13;
mul.lo.s32 %r293, %r27, -921707870;
shr.u32 %r294, %r293, 31;
shl.b32 %r295, %r724, 1;
add.s32 %r724, %r294, %r295;
add.s32 %r725, %r725, 1;
BB0_13:
mov.u32 %r296, 126;
sub.s32 %r297, %r296, %r725;
shl.b32 %r298, %r297, 23;
add.s32 %r299, %r724, 1;
shr.u32 %r300, %r299, 7;
add.s32 %r301, %r300, 1;
shr.u32 %r302, %r301, 1;
add.s32 %r303, %r302, %r298;
or.b32 %r304, %r303, %r722;
mov.b32 %f1438, %r304;
BB0_14:
mul.rn.f32 %f21, %f1438, %f1438;
add.s32 %r35, %r726, 1;
and.b32 %r36, %r35, 1;
setp.eq.s32 %p17, %r36, 0;
@%p17 bra BB0_16;
mov.f32 %f445, 0fBAB6061A;
mov.f32 %f446, 0f37CCF5CE;
fma.rn.f32 %f1439, %f446, %f21, %f445;
bra.uni BB0_17;
BB0_16:
mov.f32 %f447, 0f3C08839E;
mov.f32 %f448, 0fB94CA1F9;
fma.rn.f32 %f1439, %f448, %f21, %f447;
BB0_17:
@%p17 bra BB0_19;
mov.f32 %f449, 0f3D2AAAA5;
fma.rn.f32 %f450, %f1439, %f21, %f449;
mov.f32 %f451, 0fBF000000;
fma.rn.f32 %f1440, %f450, %f21, %f451;
bra.uni BB0_20;
BB0_19:
mov.f32 %f452, 0fBE2AAAA3;
fma.rn.f32 %f453, %f1439, %f21, %f452;
mov.f32 %f454, 0f00000000;
fma.rn.f32 %f1440, %f453, %f21, %f454;
BB0_20:
fma.rn.f32 %f1441, %f1440, %f1438, %f1438;
@%p17 bra BB0_22;
mov.f32 %f455, 0f3F800000;
fma.rn.f32 %f1441, %f1440, %f21, %f455;
BB0_22:
and.b32 %r305, %r35, 2;
setp.eq.s32 %p20, %r305, 0;
@%p20 bra BB0_24;
mov.f32 %f456, 0f00000000;
mov.f32 %f457, 0fBF800000;
fma.rn.f32 %f1441, %f1441, %f457, %f456;
BB0_24:
@%p8 bra BB0_26;
mov.f32 %f458, 0f00000000;
mul.rn.f32 %f1443, %f1443, %f458;
BB0_26:
mul.f32 %f459, %f1443, 0f3F22F983;
cvt.rni.s32.f32 %r736, %f459;
cvt.rn.f32.s32 %f460, %r736;
neg.f32 %f461, %f460;
fma.rn.f32 %f463, %f461, %f439, %f1443;
fma.rn.f32 %f465, %f461, %f441, %f463;
fma.rn.f32 %f1444, %f461, %f443, %f465;
abs.f32 %f467, %f1443;
setp.leu.f32 %p22, %f467, 0f47CE4780;
@%p22 bra BB0_37;
mov.b32 %r38, %f1443;
shr.u32 %r39, %r38, 23;
shl.b32 %r308, %r38, 8;
or.b32 %r40, %r308, -2147483648;
mov.u32 %r728, 0;
mov.u64 %rd248, __cudart_i2opi_f;
mov.u32 %r727, -6;
mov.u64 %rd249, %rd2;
BB0_28:
.pragma "nounroll";
ld.const.u32 %r311, [%rd248];
// inline asm
{
mad.lo.cc.u32 %r309, %r311, %r40, %r728;
madc.hi.u32 %r728, %r311, %r40, 0;
}
// inline asm
st.local.u32 [%rd249], %r309;
add.s64 %rd249, %rd249, 4;
add.s64 %rd248, %rd248, 4;
add.s32 %r727, %r727, 1;
setp.ne.s32 %p23, %r727, 0;
@%p23 bra BB0_28;
and.b32 %r314, %r39, 255;
add.s32 %r315, %r314, -128;
shr.u32 %r316, %r315, 5;
and.b32 %r45, %r38, -2147483648;
st.local.u32 [%rd3], %r728;
mov.u32 %r317, 6;
sub.s32 %r318, %r317, %r316;
mul.wide.s32 %rd94, %r318, 4;
add.s64 %rd13, %rd2, %rd94;
ld.local.u32 %r729, [%rd13];
ld.local.u32 %r730, [%rd13+-4];
and.b32 %r48, %r39, 31;
setp.eq.s32 %p24, %r48, 0;
@%p24 bra BB0_31;
mov.u32 %r319, 32;
sub.s32 %r320, %r319, %r48;
shr.u32 %r321, %r730, %r320;
shl.b32 %r322, %r729, %r48;
add.s32 %r729, %r321, %r322;
ld.local.u32 %r323, [%rd13+-8];
shr.u32 %r324, %r323, %r320;
shl.b32 %r325, %r730, %r48;
add.s32 %r730, %r324, %r325;
BB0_31:
shr.u32 %r326, %r730, 30;
shl.b32 %r327, %r729, 2;
add.s32 %r731, %r326, %r327;
shl.b32 %r54, %r730, 2;
shr.u32 %r328, %r731, 31;
shr.u32 %r329, %r729, 30;
add.s32 %r55, %r328, %r329;
setp.eq.s32 %p25, %r328, 0;
@%p25 bra BB0_32;
not.b32 %r330, %r731;
neg.s32 %r733, %r54;
setp.eq.s32 %p26, %r54, 0;
selp.u32 %r331, 1, 0, %p26;
add.s32 %r731, %r331, %r330;
xor.b32 %r732, %r45, -2147483648;
bra.uni BB0_34;
BB0_32:
mov.u32 %r732, %r45;
mov.u32 %r733, %r54;
BB0_34:
clz.b32 %r735, %r731;
setp.eq.s32 %p27, %r735, 0;
shl.b32 %r332, %r731, %r735;
mov.u32 %r333, 32;
sub.s32 %r334, %r333, %r735;
shr.u32 %r335, %r733, %r334;
add.s32 %r336, %r335, %r332;
selp.b32 %r63, %r731, %r336, %p27;
mov.u32 %r337, -921707870;
mul.hi.u32 %r734, %r63, %r337;
setp.eq.s32 %p28, %r45, 0;
neg.s32 %r338, %r55;
selp.b32 %r736, %r55, %r338, %p28;
setp.lt.s32 %p29, %r734, 1;
@%p29 bra BB0_36;
mul.lo.s32 %r339, %r63, -921707870;
shr.u32 %r340, %r339, 31;
shl.b32 %r341, %r734, 1;
add.s32 %r734, %r340, %r341;
add.s32 %r735, %r735, 1;
BB0_36:
mov.u32 %r342, 126;
sub.s32 %r343, %r342, %r735;
shl.b32 %r344, %r343, 23;
add.s32 %r345, %r734, 1;
shr.u32 %r346, %r345, 7;
add.s32 %r347, %r346, 1;
shr.u32 %r348, %r347, 1;
add.s32 %r349, %r348, %r344;
or.b32 %r350, %r349, %r732;
mov.b32 %f1444, %r350;
BB0_37:
mul.rn.f32 %f38, %f1444, %f1444;
and.b32 %r71, %r736, 1;
setp.eq.s32 %p30, %r71, 0;
@%p30 bra BB0_39;
mov.f32 %f468, 0fBAB6061A;
mov.f32 %f469, 0f37CCF5CE;
fma.rn.f32 %f1445, %f469, %f38, %f468;
bra.uni BB0_40;
BB0_39:
mov.f32 %f470, 0f3C08839E;
mov.f32 %f471, 0fB94CA1F9;
fma.rn.f32 %f1445, %f471, %f38, %f470;
BB0_40:
@%p30 bra BB0_42;
mov.f32 %f472, 0f3D2AAAA5;
fma.rn.f32 %f473, %f1445, %f38, %f472;
mov.f32 %f474, 0fBF000000;
fma.rn.f32 %f1446, %f473, %f38, %f474;
bra.uni BB0_43;
BB0_42:
mov.f32 %f475, 0fBE2AAAA3;
fma.rn.f32 %f476, %f1445, %f38, %f475;
mov.f32 %f477, 0f00000000;
fma.rn.f32 %f1446, %f476, %f38, %f477;
BB0_43:
fma.rn.f32 %f1447, %f1446, %f1444, %f1444;
@%p30 bra BB0_45;
mov.f32 %f478, 0f3F800000;
fma.rn.f32 %f1447, %f1446, %f38, %f478;
BB0_45:
and.b32 %r351, %r736, 2;
setp.eq.s32 %p33, %r351, 0;
@%p33 bra BB0_47;
mov.f32 %f479, 0f00000000;
mov.f32 %f480, 0fBF800000;
fma.rn.f32 %f1447, %f1447, %f480, %f479;
BB0_47:
mul.f32 %f481, %f13, %f1441;
mul.f32 %f482, %f481, %f481;
mov.f32 %f483, 0f3F800000;
sub.f32 %f484, %f483, %f482;
mul.f32 %f485, %f13, %f1447;
mul.f32 %f486, %f485, %f485;
sub.f32 %f487, %f484, %f486;
mov.f32 %f488, 0f00000000;
max.f32 %f489, %f488, %f487;
sqrt.rn.f32 %f490, %f489;
mul.f32 %f491, %f10, %f485;
mul.f32 %f492, %f11, %f485;
mul.f32 %f493, %f12, %f485;
mul.f32 %f494, %f8, %f11;
mul.f32 %f495, %f9, %f12;
sub.f32 %f496, %f494, %f495;
fma.rn.f32 %f497, %f496, %f481, %f491;
mul.f32 %f498, %f7, %f12;
mul.f32 %f499, %f8, %f10;
sub.f32 %f500, %f498, %f499;
fma.rn.f32 %f501, %f500, %f481, %f492;
mul.f32 %f502, %f9, %f10;
mul.f32 %f503, %f7, %f11;
sub.f32 %f504, %f502, %f503;
fma.rn.f32 %f505, %f504, %f481, %f493;
fma.rn.f32 %f62, %f7, %f490, %f497;
fma.rn.f32 %f63, %f9, %f490, %f501;
fma.rn.f32 %f64, %f8, %f490, %f505;
BB0_49:
add.u64 %rd101, %SP, 0;
cvta.to.local.u64 %rd102, %rd101;
add.s64 %rd14, %rd102, 12;
mov.u32 %r362, -1082130432;
st.local.u32 [%rd102+12], %r362;
mov.u32 %r363, 0;
st.local.u32 [%rd102], %r363;
st.local.u32 [%rd102+4], %r363;
st.local.u32 [%rd102+8], %r363;
st.local.u32 [%rd102+16], %r363;
st.local.u32 [%rd102+20], %r363;
st.local.u32 [%rd102+24], %r363;
ld.global.v2.u32 {%r364, %r365}, [pixelID];
cvt.u64.u32 %rd97, %r364;
cvt.u64.u32 %rd98, %r365;
mov.u64 %rd103, GBufferAtten;
cvta.global.u64 %rd96, %rd103;
mov.u32 %r361, 12;
// inline asm
call (%rd95), _rt_buffer_get_64, (%rd96, %r225, %r361, %rd97, %rd98, %rd253, %rd253);
// inline asm
ld.f32 %f70, [%rd95+8];
ld.f32 %f68, [%rd95+4];
ld.f32 %f69, [%rd95];
add.f32 %f545, %f69, %f68;
add.f32 %f546, %f70, %f545;
ld.global.u32 %r368, [bounceFlag];
setp.ne.s32 %p34, %r368, 0;
setp.eq.f32 %p35, %f546, 0f00000000;
and.pred %p36, %p34, %p35;
@%p36 bra BB0_51;
ld.global.u32 %r369, [root];
mov.u32 %r370, 0;
mov.f32 %f553, 0f00000000;
mov.f32 %f554, 0f6C4ECB8F;
mov.u32 %r371, 28;
// inline asm
call _rt_trace_64, (%r369, %f1452, %f1453, %f1454, %f62, %f63, %f64, %r370, %f553, %f554, %rd101, %r371);
// inline asm
BB0_51:
ld.local.f32 %f71, [%rd14];
setp.ltu.f32 %p37, %f71, 0f00000000;
@%p37 bra BB0_188;
bra.uni BB0_52;
BB0_188:
ld.global.u32 %r629, [bounceFlag];
setp.eq.s32 %p136, %r629, 0;
selp.u16 %rs17, 1, 0, %p136;
mov.f32 %f1513, 0f00000000;
mov.f32 %f1514, %f1513;
mov.f32 %f1515, %f1513;
mov.f32 %f1516, %f1513;
mov.f32 %f1517, %f1513;
mov.f32 %f1518, %f1513;
mov.f32 %f1499, %f1513;
mov.f32 %f1500, %f1513;
mov.f32 %f1501, %f1513;
bra.uni BB0_189;
BB0_52:
fma.rn.f32 %f555, %f62, %f71, %f1452;
fma.rn.f32 %f556, %f63, %f71, %f1453;
fma.rn.f32 %f557, %f64, %f71, %f1454;
mul.f32 %f558, %f555, 0f3456BF95;
mul.f32 %f559, %f556, 0f3456BF95;
mul.f32 %f560, %f557, 0f3456BF95;
abs.f32 %f561, %f558;
abs.f32 %f562, %f559;
abs.f32 %f563, %f560;
max.f32 %f564, %f561, %f562;
max.f32 %f565, %f564, %f563;
mov.f32 %f566, 0f38D1B717;
max.f32 %f567, %f565, %f566;
ld.local.f32 %f568, [%rd14+-12];
ld.local.f32 %f569, [%rd14+-8];
ld.local.f32 %f570, [%rd14+-4];
fma.rn.f32 %f72, %f567, %f568, %f555;
fma.rn.f32 %f73, %f567, %f569, %f556;
fma.rn.f32 %f74, %f567, %f570, %f557;
ld.global.v2.u32 {%r376, %r377}, [pixelID];
cvt.u64.u32 %rd107, %r376;
cvt.u64.u32 %rd108, %r377;
mov.u64 %rd117, GBufferPos;
cvta.global.u64 %rd106, %rd117;
// inline asm
call (%rd105), _rt_buffer_get_64, (%rd106, %r225, %r361, %rd107, %rd108, %rd253, %rd253);
// inline asm
st.f32 [%rd105+8], %f74;
st.f32 [%rd105+4], %f73;
st.f32 [%rd105], %f72;
ld.global.v2.u32 {%r380, %r381}, [pixelID];
cvt.u64.u32 %rd113, %r380;
cvt.u64.u32 %rd114, %r381;
mov.u64 %rd118, GBufferNormal;
cvta.global.u64 %rd112, %rd118;
// inline asm
call (%rd111), _rt_buffer_get_64, (%rd112, %r225, %r361, %rd113, %rd114, %rd253, %rd253);
// inline asm
ld.local.f32 %f571, [%rd14+-12];
ld.local.f32 %f572, [%rd14+-8];
ld.local.f32 %f573, [%rd14+-4];
st.f32 [%rd111+8], %f573;
st.f32 [%rd111+4], %f572;
st.f32 [%rd111], %f571;
ld.local.f32 %f574, [%rd14+12];
ld.local.f32 %f575, [%rd14+8];
ld.local.f32 %f576, [%rd14+4];
setp.lt.f32 %p38, %f576, 0f00000000;
neg.f32 %f577, %f576;
selp.f32 %f578, %f577, %f576, %p38;
ld.global.f32 %f579, [backFaceWeight];
selp.f32 %f580, %f579, 0f3F800000, %p38;
cvt.rmi.f32.f32 %f581, %f578;
cvt.rmi.f32.f32 %f582, %f575;
cvt.rmi.f32.f32 %f583, %f574;
sub.f32 %f584, %f578, %f581;
sub.f32 %f585, %f575, %f582;
sub.f32 %f586, %f574, %f583;
mul.f32 %f1516, %f580, %f584;
mul.f32 %f1517, %f580, %f585;
mul.f32 %f1518, %f580, %f586;
mul.f32 %f1513, %f581, 0f3B808081;
mul.f32 %f1514, %f582, 0f3B808081;
mul.f32 %f1515, %f583, 0f3B808081;
ld.global.u32 %r384, [bounceFlag];
setp.lt.s32 %p39, %r384, 1;
@%p39 bra BB0_54;
mul.f32 %f1516, %f69, %f1516;
mul.f32 %f1517, %f68, %f1517;
mul.f32 %f1518, %f70, %f1518;
mul.f32 %f1513, %f69, %f1513;
mul.f32 %f1514, %f68, %f1514;
mul.f32 %f1515, %f70, %f1515;
BB0_54:
mov.u64 %rd124, globalLights;
cvta.global.u64 %rd123, %rd124;
mov.u32 %r385, 1;
mov.u32 %r386, 48;
// inline asm
call (%rd119, %rd120, %rd121, %rd122), _rt_buffer_get_size_64, (%rd123, %r385, %r386);
// inline asm
cvt.u32.u64 %r72, %rd119;
setp.eq.s32 %p40, %r72, 0;
mov.f32 %f1499, 0f00000000;
mov.f32 %f1500, %f1499;
mov.f32 %f1501, %f1499;
@%p40 bra BB0_162;
// inline asm
call (%rd125, %rd126, %rd127, %rd128), _rt_buffer_get_size_64, (%rd123, %r385, %r386);
// inline asm
cvt.u32.u64 %r391, %rd125;
cvt.rn.f32.u32 %f590, %r391;
mul.f32 %f591, %f3, %f590;
cvt.rzi.u32.f32 %r392, %f591;
add.s32 %r393, %r391, -1;
min.u32 %r394, %r392, %r393;
cvt.u64.u32 %rd132, %r394;
// inline asm
call (%rd130), _rt_buffer_get_64, (%rd123, %r385, %r386, %rd132, %rd253, %rd253, %rd253);
// inline asm
ld.v4.f32 {%f592, %f593, %f594, %f595}, [%rd130+32];
ld.v4.f32 {%f596, %f597, %f598, %f599}, [%rd130+16];
ld.v4.f32 {%f600, %f601, %f602, %f603}, [%rd130];
setp.lt.f32 %p41, %f600, 0f3F800000;
@%p41 bra BB0_109;
bra.uni BB0_56;
BB0_109:
fma.rn.f32 %f723, %f601, 0f40000000, 0fBF800000;
fma.rn.f32 %f724, %f602, 0f40000000, 0fBF800000;
abs.f32 %f725, %f723;
mov.f32 %f1495, 0f3F800000;
sub.f32 %f727, %f1495, %f725;
abs.f32 %f728, %f724;
sub.f32 %f729, %f727, %f728;
neg.f32 %f730, %f729;
cvt.sat.f32.f32 %f731, %f730;
setp.ltu.f32 %p74, %f723, 0f00000000;
neg.f32 %f732, %f731;
selp.f32 %f733, %f731, %f732, %p74;
add.f32 %f734, %f723, %f733;
setp.ltu.f32 %p75, %f724, 0f00000000;
selp.f32 %f735, %f731, %f732, %p75;
add.f32 %f736, %f724, %f735;
mul.f32 %f737, %f736, %f736;
fma.rn.f32 %f738, %f734, %f734, %f737;
fma.rn.f32 %f739, %f729, %f729, %f738;
sqrt.rn.f32 %f740, %f739;
rcp.rn.f32 %f741, %f740;
mul.f32 %f180, %f741, %f734;
mul.f32 %f181, %f741, %f736;
mul.f32 %f182, %f729, %f741;
ld.local.f32 %f742, [%rd14+-12];
mul.f32 %f743, %f742, %f180;
ld.local.f32 %f744, [%rd14+-8];
mul.f32 %f745, %f181, %f744;
neg.f32 %f746, %f745;
sub.f32 %f747, %f746, %f743;
ld.local.f32 %f748, [%rd14+-4];
mul.f32 %f749, %f182, %f748;
sub.f32 %f1482, %f747, %f749;
setp.gt.f32 %p76, %f1482, 0f00000000;
setp.neu.f32 %p77, %f603, 0f00000000;
and.pred %p78, %p76, %p77;
@!%p78 bra BB0_111;
bra.uni BB0_110;
// BB0_110: scale %f1482 by one channel of a 2D texture sample.
// Entered only when %p78 is true (%f1482 > 0 and %f603 != 0, see the
// predicates computed immediately before this label).
BB0_110:
// Choose a vector perpendicular to N = (%f180, %f181, %f182):
//   |%f180| > |%f182| ? (-%f181, %f180, 0) : (0, -%f182, %f181)
abs.f32 %f758, %f180;
abs.f32 %f759, %f182;
setp.gt.f32 %p79, %f758, %f759;
neg.f32 %f760, %f181;
selp.f32 %f761, %f760, 0f00000000, %p79;
neg.f32 %f762, %f182;
selp.f32 %f763, %f180, %f762, %p79;
selp.f32 %f764, 0f00000000, %f181, %p79;
// Normalise it: T = (%f770, %f771, %f772).
mul.f32 %f765, %f763, %f763;
fma.rn.f32 %f766, %f761, %f761, %f765;
fma.rn.f32 %f767, %f764, %f764, %f766;
sqrt.rn.f32 %f768, %f767;
rcp.rn.f32 %f769, %f768;
mul.f32 %f770, %f761, %f769;
mul.f32 %f771, %f763, %f769;
mul.f32 %f772, %f764, %f769;
// B = T x N = (%f775, %f778, %f781).
mul.f32 %f773, %f182, %f771;
mul.f32 %f774, %f181, %f772;
sub.f32 %f775, %f773, %f774;
mul.f32 %f776, %f180, %f772;
mul.f32 %f777, %f182, %f770;
sub.f32 %f778, %f776, %f777;
mul.f32 %f779, %f181, %f770;
mul.f32 %f780, %f180, %f771;
sub.f32 %f781, %f779, %f780;
// First texture coordinate: %f754 = %f592 * dot((%f72,%f73,%f74), B) + %f594.
mul.f32 %f782, %f73, %f778;
fma.rn.f32 %f783, %f72, %f775, %f782;
fma.rn.f32 %f784, %f74, %f781, %f783;
fma.rn.f32 %f754, %f592, %f784, %f594;
// Second texture coordinate: %f755 = %f593 * dot((%f72,%f73,%f74), T) + %f595.
mul.f32 %f785, %f73, %f771;
fma.rn.f32 %f786, %f72, %f770, %f785;
fma.rn.f32 %f787, %f74, %f772, %f786;
fma.rn.f32 %f755, %f593, %f787, %f595;
// Texture id is %f603 truncated toward zero; the two remaining coordinates are 0.
// NOTE(review): %r225 (second argument) is defined outside this block.
cvt.rzi.s32.f32 %r496, %f603;
mov.f32 %f757, 0f00000000;
// inline asm
call (%f750, %f751, %f752, %f753), _rt_texture_get_f_id, (%r496, %r225, %f754, %f755, %f757, %f757);
// inline asm
// Only the first returned component is used.
mul.f32 %f1482, %f1482, %f750;
// BB0_111: join point after the optional texture modulation of %f1482.
BB0_111:
// Default (%f1496, %f1497, %f1498) to 0 and skip to BB0_161 when %f1482 <= 0.
mov.f32 %f1496, 0f00000000;
setp.le.f32 %p80, %f1482, 0f00000000;
mov.f32 %f1497, %f1496;
mov.f32 %f1498, %f1496;
@%p80 bra BB0_161;
// Vector perpendicular to (%f180, %f181, %f182):
//   |%f180| > |%f182| ? (-%f181, %f180, 0) : (0, -%f182, %f181)
abs.f32 %f792, %f180;
abs.f32 %f793, %f182;
setp.gt.f32 %p81, %f792, %f793;
neg.f32 %f794, %f181;
selp.f32 %f795, %f794, 0f00000000, %p81;
neg.f32 %f796, %f182;
selp.f32 %f797, %f180, %f796, %p81;
selp.f32 %f798, 0f00000000, %f181, %p81;
// Normalise it into (%f186, %f187, %f188).
mul.f32 %f799, %f797, %f797;
fma.rn.f32 %f800, %f795, %f795, %f799;
fma.rn.f32 %f801, %f798, %f798, %f800;
sqrt.rn.f32 %f802, %f801;
rcp.rn.f32 %f803, %f802;
mul.f32 %f186, %f795, %f803;
mul.f32 %f187, %f797, %f803;
mul.f32 %f188, %f798, %f803;
// ltu = "less than or unordered": jump straight to BB0_160 when %f596 < 0 or is NaN.
// NOTE(review): BB0_160 reads %f1495, which is not written on this path within
// the visible code - confirm it is initialised earlier in the function.
setp.ltu.f32 %p82, %f596, 0f00000000;
@%p82 bra BB0_160;
sqrt.rn.f32 %f189, %f1;
add.u64 %rd159, %SP, 32;
cvta.to.local.u64 %rd29, %rd159;
mul.f32 %f1489, %f2, 0f40C90FDB;
abs.f32 %f191, %f1489;
setp.neu.f32 %p83, %f191, 0f7F800000;
mov.f32 %f1483, %f1489;
@%p83 bra BB0_115;
mov.f32 %f804, 0f00000000;
mul.rn.f32 %f1483, %f1489, %f804;
BB0_115:
mul.f32 %f805, %f1483, 0f3F22F983;
cvt.rni.s32.f32 %r766, %f805;
cvt.rn.f32.s32 %f806, %r766;
neg.f32 %f807, %f806;
mov.f32 %f808, 0f3FC90FDA;
fma.rn.f32 %f809, %f807, %f808, %f1483;
mov.f32 %f810, 0f33A22168;
fma.rn.f32 %f811, %f807, %f810, %f809;
mov.f32 %f812, 0f27C234C5;
fma.rn.f32 %f1484, %f807, %f812, %f811;
abs.f32 %f813, %f1483;
add.s64 %rd30, %rd29, 24;
setp.leu.f32 %p84, %f813, 0f47CE4780;
@%p84 bra BB0_126;
mov.b32 %r144, %f1483;
shr.u32 %r145, %r144, 23;
shl.b32 %r500, %r144, 8;
or.b32 %r146, %r500, -2147483648;
mov.u32 %r757, 0;
mov.u64 %rd255, 0;
mov.u64 %rd254, %rd29;
mov.u32 %r758, %r757;
BB0_117:
.pragma "nounroll";
shl.b64 %rd161, %rd255, 2;
mov.u64 %rd162, __cudart_i2opi_f;
add.s64 %rd163, %rd162, %rd161;
ld.const.u32 %r503, [%rd163];
// inline asm
{
mad.lo.cc.u32 %r501, %r503, %r146, %r758;
madc.hi.u32 %r758, %r503, %r146, 0;
}
// inline asm
st.local.u32 [%rd254], %r501;
add.s32 %r757, %r757, 1;
cvt.s64.s32 %rd255, %r757;
mul.wide.s32 %rd164, %r757, 4;
add.s64 %rd254, %rd29, %rd164;
setp.ne.s32 %p85, %r757, 6;
@%p85 bra BB0_117;
and.b32 %r506, %r145, 255;
add.s32 %r507, %r506, -128;
shr.u32 %r508, %r507, 5;
and.b32 %r151, %r144, -2147483648;
st.local.u32 [%rd30], %r758;
mov.u32 %r509, 6;
sub.s32 %r510, %r509, %r508;
mul.wide.s32 %rd165, %r510, 4;
add.s64 %rd36, %rd29, %rd165;
ld.local.u32 %r759, [%rd36];
ld.local.u32 %r760, [%rd36+-4];
and.b32 %r154, %r145, 31;
setp.eq.s32 %p86, %r154, 0;
@%p86 bra BB0_120;
mov.u32 %r511, 32;
sub.s32 %r512, %r511, %r154;
shr.u32 %r513, %r760, %r512;
shl.b32 %r514, %r759, %r154;
add.s32 %r759, %r513, %r514;
ld.local.u32 %r515, [%rd36+-8];
shr.u32 %r516, %r515, %r512;
shl.b32 %r517, %r760, %r154;
add.s32 %r760, %r516, %r517;
BB0_120:
shr.u32 %r518, %r760, 30;
shl.b32 %r519, %r759, 2;
add.s32 %r761, %r518, %r519;
shl.b32 %r160, %r760, 2;
shr.u32 %r520, %r761, 31;
shr.u32 %r521, %r759, 30;
add.s32 %r161, %r520, %r521;
setp.eq.s32 %p87, %r520, 0;
@%p87 bra BB0_121;
not.b32 %r522, %r761;
neg.s32 %r763, %r160;
setp.eq.s32 %p88, %r160, 0;
selp.u32 %r523, 1, 0, %p88;
add.s32 %r761, %r523, %r522;
xor.b32 %r762, %r151, -2147483648;
bra.uni BB0_123;
BB0_56:
ld.local.f32 %f114, [%rd14+-8];
ld.local.f32 %f113, [%rd14+-4];
ld.local.f32 %f112, [%rd14+-12];
abs.f32 %f604, %f112;
abs.f32 %f605, %f113;
setp.gt.f32 %p42, %f604, %f605;
neg.f32 %f606, %f114;
neg.f32 %f607, %f113;
selp.f32 %f608, %f606, 0f00000000, %p42;
selp.f32 %f609, %f112, %f607, %p42;
selp.f32 %f610, 0f00000000, %f114, %p42;
mul.f32 %f611, %f609, %f609;
fma.rn.f32 %f612, %f608, %f608, %f611;
fma.rn.f32 %f613, %f610, %f610, %f612;
sqrt.rn.f32 %f614, %f613;
rcp.rn.f32 %f615, %f614;
mul.f32 %f115, %f608, %f615;
mul.f32 %f116, %f609, %f615;
mul.f32 %f117, %f610, %f615;
sqrt.rn.f32 %f118, %f1;
mul.f32 %f1467, %f2, 0f40C90FDB;
abs.f32 %f120, %f1467;
setp.neu.f32 %p43, %f120, 0f7F800000;
mov.f32 %f1461, %f1467;
@%p43 bra BB0_58;
mov.f32 %f616, 0f00000000;
mul.rn.f32 %f1461, %f1467, %f616;
BB0_58:
mul.f32 %f617, %f1461, 0f3F22F983;
cvt.rni.s32.f32 %r746, %f617;
cvt.rn.f32.s32 %f618, %r746;
neg.f32 %f619, %f618;
mov.f32 %f620, 0f3FC90FDA;
fma.rn.f32 %f621, %f619, %f620, %f1461;
mov.f32 %f622, 0f33A22168;
fma.rn.f32 %f623, %f619, %f622, %f621;
mov.f32 %f624, 0f27C234C5;
fma.rn.f32 %f1462, %f619, %f624, %f623;
abs.f32 %f625, %f1461;
setp.leu.f32 %p44, %f625, 0f47CE4780;
@%p44 bra BB0_69;
mov.b32 %r74, %f1461;
shl.b32 %r397, %r74, 8;
or.b32 %r75, %r397, -2147483648;
add.u64 %rd138, %SP, 32;
cvta.to.local.u64 %rd15, %rd138;
mov.u32 %r737, 0;
mov.u64 %rd251, 0;
mov.u64 %rd250, %rd15;
mov.u32 %r738, %r737;
BB0_60:
.pragma "nounroll";
shl.b64 %rd139, %rd251, 2;
mov.u64 %rd140, __cudart_i2opi_f;
add.s64 %rd141, %rd140, %rd139;
ld.const.u32 %r400, [%rd141];
// inline asm
{
mad.lo.cc.u32 %r398, %r400, %r75, %r738;
madc.hi.u32 %r738, %r400, %r75, 0;
}
// inline asm
st.local.u32 [%rd250], %r398;
add.s32 %r737, %r737, 1;
cvt.s64.s32 %rd251, %r737;
mul.wide.s32 %rd144, %r737, 4;
add.s64 %rd250, %rd15, %rd144;
setp.ne.s32 %p45, %r737, 6;
@%p45 bra BB0_60;
bfe.u32 %r403, %r74, 23, 8;
add.s32 %r404, %r403, -128;
shr.u32 %r405, %r404, 5;
and.b32 %r80, %r74, -2147483648;
cvta.to.local.u64 %rd146, %rd138;
st.local.u32 [%rd146+24], %r738;
bfe.u32 %r81, %r74, 23, 5;
mov.u32 %r406, 6;
sub.s32 %r407, %r406, %r405;
mul.wide.s32 %rd147, %r407, 4;
add.s64 %rd20, %rd146, %rd147;
ld.local.u32 %r739, [%rd20];
ld.local.u32 %r740, [%rd20+-4];
setp.eq.s32 %p46, %r81, 0;
@%p46 bra BB0_63;
mov.u32 %r408, 32;
sub.s32 %r409, %r408, %r81;
shr.u32 %r410, %r740, %r409;
shl.b32 %r411, %r739, %r81;
add.s32 %r739, %r410, %r411;
ld.local.u32 %r412, [%rd20+-8];
shr.u32 %r413, %r412, %r409;
shl.b32 %r414, %r740, %r81;
add.s32 %r740, %r413, %r414;
BB0_63:
shr.u32 %r415, %r740, 30;
shl.b32 %r416, %r739, 2;
add.s32 %r741, %r415, %r416;
shl.b32 %r89, %r740, 2;
shr.u32 %r417, %r741, 31;
shr.u32 %r418, %r739, 30;
add.s32 %r90, %r417, %r418;
setp.eq.s32 %p47, %r417, 0;
@%p47 bra BB0_64;
not.b32 %r419, %r741;
neg.s32 %r743, %r89;
setp.eq.s32 %p48, %r89, 0;
selp.u32 %r420, 1, 0, %p48;
add.s32 %r741, %r420, %r419;
xor.b32 %r742, %r80, -2147483648;
bra.uni BB0_66;
BB0_64:
mov.u32 %r742, %r80;
mov.u32 %r743, %r89;
BB0_66:
clz.b32 %r745, %r741;
setp.eq.s32 %p49, %r745, 0;
shl.b32 %r421, %r741, %r745;
mov.u32 %r422, 32;
sub.s32 %r423, %r422, %r745;
shr.u32 %r424, %r743, %r423;
add.s32 %r425, %r424, %r421;
selp.b32 %r98, %r741, %r425, %p49;
mov.u32 %r426, -921707870;
mul.hi.u32 %r744, %r98, %r426;
setp.eq.s32 %p50, %r80, 0;
neg.s32 %r427, %r90;
selp.b32 %r746, %r90, %r427, %p50;
setp.lt.s32 %p51, %r744, 1;
@%p51 bra BB0_68;
mul.lo.s32 %r428, %r98, -921707870;
shr.u32 %r429, %r428, 31;
shl.b32 %r430, %r744, 1;
add.s32 %r744, %r429, %r430;
add.s32 %r745, %r745, 1;
BB0_68:
mov.u32 %r431, 126;
sub.s32 %r432, %r431, %r745;
shl.b32 %r433, %r432, 23;
add.s32 %r434, %r744, 1;
shr.u32 %r435, %r434, 7;
add.s32 %r436, %r435, 1;
shr.u32 %r437, %r436, 1;
add.s32 %r438, %r437, %r433;
or.b32 %r439, %r438, %r742;
mov.b32 %f1462, %r439;
BB0_69:
mul.rn.f32 %f126, %f1462, %f1462;
add.s32 %r106, %r746, 1;
and.b32 %r107, %r106, 1;
setp.eq.s32 %p52, %r107, 0;
@%p52 bra BB0_71;
mov.f32 %f626, 0fBAB6061A;
mov.f32 %f627, 0f37CCF5CE;
fma.rn.f32 %f1463, %f627, %f126, %f626;
bra.uni BB0_72;
BB0_71:
mov.f32 %f628, 0f3C08839E;
mov.f32 %f629, 0fB94CA1F9;
fma.rn.f32 %f1463, %f629, %f126, %f628;
BB0_72:
@%p52 bra BB0_74;
mov.f32 %f630, 0f3D2AAAA5;
fma.rn.f32 %f631, %f1463, %f126, %f630;
mov.f32 %f632, 0fBF000000;
fma.rn.f32 %f1464, %f631, %f126, %f632;
bra.uni BB0_75;
BB0_74:
mov.f32 %f633, 0fBE2AAAA3;
fma.rn.f32 %f634, %f1463, %f126, %f633;
mov.f32 %f635, 0f00000000;
fma.rn.f32 %f1464, %f634, %f126, %f635;
BB0_75:
fma.rn.f32 %f1465, %f1464, %f1462, %f1462;
@%p52 bra BB0_77;
mov.f32 %f636, 0f3F800000;
fma.rn.f32 %f1465, %f1464, %f126, %f636;
BB0_77:
and.b32 %r440, %r106, 2;
setp.eq.s32 %p55, %r440, 0;
@%p55 bra BB0_79;
mov.f32 %f637, 0f00000000;
mov.f32 %f638, 0fBF800000;
fma.rn.f32 %f1465, %f1465, %f638, %f637;
BB0_79:
@%p43 bra BB0_81;
mov.f32 %f639, 0f00000000;
mul.rn.f32 %f1467, %f1467, %f639;
BB0_81:
mul.f32 %f640, %f1467, 0f3F22F983;
cvt.rni.s32.f32 %r756, %f640;
cvt.rn.f32.s32 %f641, %r756;
neg.f32 %f642, %f641;
fma.rn.f32 %f644, %f642, %f620, %f1467;
fma.rn.f32 %f646, %f642, %f622, %f644;
fma.rn.f32 %f1468, %f642, %f624, %f646;
abs.f32 %f648, %f1467;
setp.leu.f32 %p57, %f648, 0f47CE4780;
@%p57 bra BB0_92;
mov.b32 %r109, %f1467;
shr.u32 %r110, %r109, 23;
shl.b32 %r443, %r109, 8;
or.b32 %r111, %r443, -2147483648;
add.u64 %rd149, %SP, 32;
cvta.to.local.u64 %rd21, %rd149;
mov.u64 %rd252, %rd21;
mov.u32 %r747, %r363;
mov.u32 %r748, %r363;
BB0_83:
.pragma "nounroll";
shl.b64 %rd150, %rd253, 2;
mov.u64 %rd151, __cudart_i2opi_f;
add.s64 %rd152, %rd151, %rd150;
ld.const.u32 %r446, [%rd152];
// inline asm
{
mad.lo.cc.u32 %r444, %r446, %r111, %r748;
madc.hi.u32 %r748, %r446, %r111, 0;
}
// inline asm
st.local.u32 [%rd252], %r444;
add.s32 %r747, %r747, 1;
cvt.s64.s32 %rd253, %r747;
mul.wide.s32 %rd153, %r747, 4;
add.s64 %rd252, %rd21, %rd153;
setp.ne.s32 %p58, %r747, 6;
@%p58 bra BB0_83;
and.b32 %r449, %r110, 255;
add.s32 %r450, %r449, -128;
shr.u32 %r451, %r450, 5;
and.b32 %r116, %r109, -2147483648;
cvta.to.local.u64 %rd155, %rd149;
st.local.u32 [%rd155+24], %r748;
mov.u32 %r452, 6;
sub.s32 %r453, %r452, %r451;
mul.wide.s32 %rd156, %r453, 4;
add.s64 %rd27, %rd155, %rd156;
ld.local.u32 %r749, [%rd27];
ld.local.u32 %r750, [%rd27+-4];
and.b32 %r119, %r110, 31;
setp.eq.s32 %p59, %r119, 0;
@%p59 bra BB0_86;
mov.u32 %r454, 32;
sub.s32 %r455, %r454, %r119;
shr.u32 %r456, %r750, %r455;
shl.b32 %r457, %r749, %r119;
add.s32 %r749, %r456, %r457;
ld.local.u32 %r458, [%rd27+-8];
shr.u32 %r459, %r458, %r455;
shl.b32 %r460, %r750, %r119;
add.s32 %r750, %r459, %r460;
BB0_86:
shr.u32 %r461, %r750, 30;
shl.b32 %r462, %r749, 2;
add.s32 %r751, %r461, %r462;
shl.b32 %r125, %r750, 2;
shr.u32 %r463, %r751, 31;
shr.u32 %r464, %r749, 30;
add.s32 %r126, %r463, %r464;
setp.eq.s32 %p60, %r463, 0;
@%p60 bra BB0_87;
not.b32 %r465, %r751;
neg.s32 %r753, %r125;
setp.eq.s32 %p61, %r125, 0;
selp.u32 %r466, 1, 0, %p61;
add.s32 %r751, %r466, %r465;
xor.b32 %r752, %r116, -2147483648;
bra.uni BB0_89;
BB0_87:
mov.u32 %r752, %r116;
mov.u32 %r753, %r125;
BB0_89:
clz.b32 %r755, %r751;
setp.eq.s32 %p62, %r755, 0;
shl.b32 %r467, %r751, %r755;
mov.u32 %r468, 32;
sub.s32 %r469, %r468, %r755;
shr.u32 %r470, %r753, %r469;
add.s32 %r471, %r470, %r467;
selp.b32 %r134, %r751, %r471, %p62;
mov.u32 %r472, -921707870;
mul.hi.u32 %r754, %r134, %r472;
setp.eq.s32 %p63, %r116, 0;
neg.s32 %r473, %r126;
selp.b32 %r756, %r126, %r473, %p63;
setp.lt.s32 %p64, %r754, 1;
@%p64 bra BB0_91;
mul.lo.s32 %r474, %r134, -921707870;
shr.u32 %r475, %r474, 31;
shl.b32 %r476, %r754, 1;
add.s32 %r754, %r475, %r476;
add.s32 %r755, %r755, 1;
BB0_91:
mov.u32 %r477, 126;
sub.s32 %r478, %r477, %r755;
shl.b32 %r479, %r478, 23;
add.s32 %r480, %r754, 1;
shr.u32 %r481, %r480, 7;
add.s32 %r482, %r481, 1;
shr.u32 %r483, %r482, 1;
add.s32 %r484, %r483, %r479;
or.b32 %r485, %r484, %r752;
mov.b32 %f1468, %r485;
BB0_92:
mul.rn.f32 %f143, %f1468, %f1468;
and.b32 %r142, %r756, 1;
setp.eq.s32 %p65, %r142, 0;
@%p65 bra BB0_94;
mov.f32 %f649, 0fBAB6061A;
mov.f32 %f650, 0f37CCF5CE;
fma.rn.f32 %f1469, %f650, %f143, %f649;
bra.uni BB0_95;
BB0_94:
mov.f32 %f651, 0f3C08839E;
mov.f32 %f652, 0fB94CA1F9;
fma.rn.f32 %f1469, %f652, %f143, %f651;
BB0_95:
@%p65 bra BB0_97;
mov.f32 %f653, 0f3D2AAAA5;
fma.rn.f32 %f654, %f1469, %f143, %f653;
mov.f32 %f655, 0fBF000000;
fma.rn.f32 %f1470, %f654, %f143, %f655;
bra.uni BB0_98;
BB0_97:
mov.f32 %f656, 0fBE2AAAA3;
fma.rn.f32 %f657, %f1469, %f143, %f656;
mov.f32 %f658, 0f00000000;
fma.rn.f32 %f1470, %f657, %f143, %f658;
BB0_98:
fma.rn.f32 %f1471, %f1470, %f1468, %f1468;
@%p65 bra BB0_100;
mov.f32 %f659, 0f3F800000;
fma.rn.f32 %f1471, %f1470, %f143, %f659;
BB0_100:
and.b32 %r486, %r756, 2;
setp.eq.s32 %p68, %r486, 0;
@%p68 bra BB0_102;
mov.f32 %f660, 0f00000000;
mov.f32 %f661, 0fBF800000;
fma.rn.f32 %f1471, %f1471, %f661, %f660;
BB0_102:
mul.f32 %f665, %f118, %f1465;
mul.f32 %f666, %f665, %f665;
mov.f32 %f1473, 0f3F800000;
sub.f32 %f668, %f1473, %f666;
mul.f32 %f669, %f118, %f1471;
mul.f32 %f670, %f669, %f669;
sub.f32 %f671, %f668, %f670;
mov.f32 %f1476, 0f00000000;
max.f32 %f672, %f1476, %f671;
sqrt.rn.f32 %f673, %f672;
mul.f32 %f674, %f115, %f669;
mul.f32 %f675, %f116, %f669;
mul.f32 %f676, %f117, %f669;
mul.f32 %f677, %f113, %f116;
mul.f32 %f678, %f114, %f117;
sub.f32 %f679, %f677, %f678;
fma.rn.f32 %f680, %f679, %f665, %f674;
mul.f32 %f681, %f112, %f117;
mul.f32 %f682, %f113, %f115;
sub.f32 %f683, %f681, %f682;
fma.rn.f32 %f684, %f683, %f665, %f675;
mul.f32 %f685, %f114, %f115;
mul.f32 %f686, %f112, %f116;
sub.f32 %f687, %f685, %f686;
fma.rn.f32 %f688, %f687, %f665, %f676;
fma.rn.f32 %f155, %f112, %f673, %f680;
fma.rn.f32 %f156, %f114, %f673, %f684;
fma.rn.f32 %f157, %f113, %f673, %f688;
add.u64 %rd157, %SP, 28;
cvta.to.local.u64 %rd28, %rd157;
st.local.u32 [%rd28], %r363;
setp.gt.f32 %p69, %f156, 0f00000000;
setp.eq.f32 %p70, %f596, 0f00000000;
or.pred %p71, %p70, %p69;
mov.f32 %f1477, %f1476;
mov.f32 %f1478, %f1476;
@!%p71 bra BB0_106;
bra.uni BB0_103;
// BB0_103: trace a ray along (%f155, %f156, %f157) and optionally fetch a colour
// from a texture. Entered when %p71 is true (%f596 == 0 or %f156 > 0).
BB0_103:
// Overwrite the local word at %rd28 (SP+28) with the bit pattern of 1.0f
// (1065353216 = 0x3F800000); its address %rd157 is handed to the trace call.
mov.u32 %r491, 1065353216;
st.local.u32 [%rd28], %r491;
// %f695 = max(|%f72|, |%f73|, |%f74|) * 0f3456BF95 (about 2e-7), floored at %f566.
// presumably a position-scaled ray epsilon - confirm against the CUDA source.
mul.f32 %f700, %f72, 0f3456BF95;
abs.f32 %f701, %f700;
mul.f32 %f702, %f73, 0f3456BF95;
abs.f32 %f703, %f702;
mul.f32 %f704, %f74, 0f3456BF95;
abs.f32 %f705, %f704;
max.f32 %f706, %f701, %f703;
max.f32 %f707, %f706, %f705;
max.f32 %f695, %f707, %f566;
ld.global.u32 %r488, [root];
// 0f6C4ECB8F is about 1e27.
mov.f32 %f696, 0f6C4ECB8F;
mov.u32 %r490, 4;
// NOTE(review): argument roles (top object, origin, direction, ray type, tmin,
// tmax, payload pointer, payload size) are assumed from the operand pattern;
// verify against the OptiX _rt_trace_64 intrinsic.
// inline asm
call _rt_trace_64, (%r488, %f72, %f73, %f74, %f155, %f156, %f157, %r385, %f695, %f696, %rd157, %r490);
// inline asm
// leu = "less-or-equal or unordered": skip the texture fetch when %f601 <= 0 or NaN.
// In that case all three colour registers keep %f1473 (set to 1.0 before this block).
setp.leu.f32 %p72, %f601, 0f00000000;
mov.f32 %f1474, %f1473;
mov.f32 %f1475, %f1473;
@%p72 bra BB0_105;
// Texture id = %f602 truncated toward zero. The coordinates are the negated
// direction passed in the order (%f157, %f156, %f155).
cvt.rzi.s32.f32 %r492, %f602;
neg.f32 %f715, %f155;
neg.f32 %f714, %f156;
neg.f32 %f713, %f157;
mov.u32 %r493, 6;
// inline asm
call (%f1473, %f1474, %f1475, %f712), _rt_texture_get_base_id, (%r492, %r493, %f713, %f714, %f715, %r363);
// inline asm
BB0_105:
// Scale the colour by the float now stored at %rd28 (read back after the trace call).
ld.local.f32 %f716, [%rd28];
fma.rn.f32 %f1476, %f1473, %f716, 0f00000000;
fma.rn.f32 %f1477, %f1474, %f716, 0f00000000;
fma.rn.f32 %f1478, %f1475, %f716, 0f00000000;
// BB0_106: apply the bounceFlag-dependent scale to (%f1476, %f1477, %f1478).
BB0_106:
ld.global.u32 %r495, [bounceFlag];
setp.lt.s32 %p73, %r495, 1;
@%p73 bra BB0_108;
// bounceFlag >= 1: multiply by (%f600 - 1.0) * 100.0.
// NOTE(review): the sibling path at BB0_160 uses %f600 * 100.0 without the -1.0;
// confirm the difference is intended in the original CUDA source.
add.f32 %f717, %f600, 0fBF800000;
mul.f32 %f718, %f717, 0f42C80000;
mul.f32 %f1476, %f718, %f1476;
mul.f32 %f1477, %f718, %f1477;
mul.f32 %f1478, %f718, %f1478;
BB0_108:
// (%f1499, %f1500, %f1501) = float(%r72) * (%f597, %f598, %f599) * (%f1476, %f1477, %f1478),
// with %r72 converted as an unsigned integer.
cvt.rn.f32.u32 %f719, %r72;
mul.f32 %f720, %f597, %f1476;
mul.f32 %f1499, %f719, %f720;
mul.f32 %f721, %f598, %f1477;
mul.f32 %f1500, %f719, %f721;
mul.f32 %f722, %f599, %f1478;
mul.f32 %f1501, %f719, %f722;
bra.uni BB0_162;
BB0_121:
mov.u32 %r762, %r151;
mov.u32 %r763, %r160;
BB0_123:
clz.b32 %r765, %r761;
setp.eq.s32 %p89, %r765, 0;
shl.b32 %r524, %r761, %r765;
mov.u32 %r525, 32;
sub.s32 %r526, %r525, %r765;
shr.u32 %r527, %r763, %r526;
add.s32 %r528, %r527, %r524;
selp.b32 %r169, %r761, %r528, %p89;
mov.u32 %r529, -921707870;
mul.hi.u32 %r764, %r169, %r529;
setp.eq.s32 %p90, %r151, 0;
neg.s32 %r530, %r161;
selp.b32 %r766, %r161, %r530, %p90;
setp.lt.s32 %p91, %r764, 1;
@%p91 bra BB0_125;
mul.lo.s32 %r531, %r169, -921707870;
shr.u32 %r532, %r531, 31;
shl.b32 %r533, %r764, 1;
add.s32 %r764, %r532, %r533;
add.s32 %r765, %r765, 1;
BB0_125:
mov.u32 %r534, 126;
sub.s32 %r535, %r534, %r765;
shl.b32 %r536, %r535, 23;
add.s32 %r537, %r764, 1;
shr.u32 %r538, %r537, 7;
add.s32 %r539, %r538, 1;
shr.u32 %r540, %r539, 1;
add.s32 %r541, %r540, %r536;
or.b32 %r542, %r541, %r762;
mov.b32 %f1484, %r542;
BB0_126:
mul.rn.f32 %f197, %f1484, %f1484;
add.s32 %r177, %r766, 1;
and.b32 %r178, %r177, 1;
setp.eq.s32 %p92, %r178, 0;
@%p92 bra BB0_128;
mov.f32 %f814, 0fBAB6061A;
mov.f32 %f815, 0f37CCF5CE;
fma.rn.f32 %f1485, %f815, %f197, %f814;
bra.uni BB0_129;
BB0_128:
mov.f32 %f816, 0f3C08839E;
mov.f32 %f817, 0fB94CA1F9;
fma.rn.f32 %f1485, %f817, %f197, %f816;
BB0_129:
@%p92 bra BB0_131;
mov.f32 %f818, 0f3D2AAAA5;
fma.rn.f32 %f819, %f1485, %f197, %f818;
mov.f32 %f820, 0fBF000000;
fma.rn.f32 %f1486, %f819, %f197, %f820;
bra.uni BB0_132;
BB0_131:
mov.f32 %f821, 0fBE2AAAA3;
fma.rn.f32 %f822, %f1485, %f197, %f821;
mov.f32 %f823, 0f00000000;
fma.rn.f32 %f1486, %f822, %f197, %f823;
BB0_132:
fma.rn.f32 %f1487, %f1486, %f1484, %f1484;
@%p92 bra BB0_134;
mov.f32 %f824, 0f3F800000;
fma.rn.f32 %f1487, %f1486, %f197, %f824;
BB0_134:
and.b32 %r543, %r177, 2;
setp.eq.s32 %p95, %r543, 0;
@%p95 bra BB0_136;
mov.f32 %f825, 0f00000000;
mov.f32 %f826, 0fBF800000;
fma.rn.f32 %f1487, %f1487, %f826, %f825;
BB0_136:
@%p83 bra BB0_138;
mov.f32 %f827, 0f00000000;
mul.rn.f32 %f1489, %f1489, %f827;
BB0_138:
mul.f32 %f828, %f1489, 0f3F22F983;
cvt.rni.s32.f32 %r776, %f828;
cvt.rn.f32.s32 %f829, %r776;
neg.f32 %f830, %f829;
fma.rn.f32 %f832, %f830, %f808, %f1489;
fma.rn.f32 %f834, %f830, %f810, %f832;
fma.rn.f32 %f1490, %f830, %f812, %f834;
abs.f32 %f836, %f1489;
setp.leu.f32 %p97, %f836, 0f47CE4780;
@%p97 bra BB0_149;
mov.b32 %r180, %f1489;
shr.u32 %r181, %r180, 23;
shl.b32 %r546, %r180, 8;
or.b32 %r182, %r546, -2147483648;
mov.u32 %r768, 0;
mov.u64 %rd256, __cudart_i2opi_f;
mov.u32 %r767, -6;
mov.u64 %rd257, %rd29;
BB0_140:
.pragma "nounroll";
ld.const.u32 %r549, [%rd256];
// inline asm
{
mad.lo.cc.u32 %r547, %r549, %r182, %r768;
madc.hi.u32 %r768, %r549, %r182, 0;
}
// inline asm
st.local.u32 [%rd257], %r547;
add.s64 %rd257, %rd257, 4;
add.s64 %rd256, %rd256, 4;
add.s32 %r767, %r767, 1;
setp.ne.s32 %p98, %r767, 0;
@%p98 bra BB0_140;
and.b32 %r552, %r181, 255;
add.s32 %r553, %r552, -128;
shr.u32 %r554, %r553, 5;
and.b32 %r187, %r180, -2147483648;
st.local.u32 [%rd30], %r768;
mov.u32 %r555, 6;
sub.s32 %r556, %r555, %r554;
mul.wide.s32 %rd167, %r556, 4;
add.s64 %rd41, %rd29, %rd167;
ld.local.u32 %r769, [%rd41];
ld.local.u32 %r770, [%rd41+-4];
and.b32 %r190, %r181, 31;
setp.eq.s32 %p99, %r190, 0;
@%p99 bra BB0_143;
mov.u32 %r557, 32;
sub.s32 %r558, %r557, %r190;
shr.u32 %r559, %r770, %r558;
shl.b32 %r560, %r769, %r190;
add.s32 %r769, %r559, %r560;
ld.local.u32 %r561, [%rd41+-8];
shr.u32 %r562, %r561, %r558;
shl.b32 %r563, %r770, %r190;
add.s32 %r770, %r562, %r563;
BB0_143:
shr.u32 %r564, %r770, 30;
shl.b32 %r565, %r769, 2;
add.s32 %r771, %r564, %r565;
shl.b32 %r196, %r770, 2;
shr.u32 %r566, %r771, 31;
shr.u32 %r567, %r769, 30;
add.s32 %r197, %r566, %r567;
setp.eq.s32 %p100, %r566, 0;
@%p100 bra BB0_144;
not.b32 %r568, %r771;
neg.s32 %r773, %r196;
setp.eq.s32 %p101, %r196, 0;
selp.u32 %r569, 1, 0, %p101;
add.s32 %r771, %r569, %r568;
xor.b32 %r772, %r187, -2147483648;
bra.uni BB0_146;
BB0_144:
mov.u32 %r772, %r187;
mov.u32 %r773, %r196;
BB0_146:
clz.b32 %r775, %r771;
setp.eq.s32 %p102, %r775, 0;
shl.b32 %r570, %r771, %r775;
mov.u32 %r571, 32;
sub.s32 %r572, %r571, %r775;
shr.u32 %r573, %r773, %r572;
add.s32 %r574, %r573, %r570;
selp.b32 %r205, %r771, %r574, %p102;
mov.u32 %r575, -921707870;
mul.hi.u32 %r774, %r205, %r575;
setp.eq.s32 %p103, %r187, 0;
neg.s32 %r576, %r197;
selp.b32 %r776, %r197, %r576, %p103;
setp.lt.s32 %p104, %r774, 1;
@%p104 bra BB0_148;
mul.lo.s32 %r577, %r205, -921707870;
shr.u32 %r578, %r577, 31;
shl.b32 %r579, %r774, 1;
add.s32 %r774, %r578, %r579;
add.s32 %r775, %r775, 1;
BB0_148:
mov.u32 %r580, 126;
sub.s32 %r581, %r580, %r775;
shl.b32 %r582, %r581, 23;
add.s32 %r583, %r774, 1;
shr.u32 %r584, %r583, 7;
add.s32 %r585, %r584, 1;
shr.u32 %r586, %r585, 1;
add.s32 %r587, %r586, %r582;
or.b32 %r588, %r587, %r772;
mov.b32 %f1490, %r588;
BB0_149:
mul.rn.f32 %f214, %f1490, %f1490;
and.b32 %r213, %r776, 1;
setp.eq.s32 %p105, %r213, 0;
@%p105 bra BB0_151;
mov.f32 %f837, 0fBAB6061A;
mov.f32 %f838, 0f37CCF5CE;
fma.rn.f32 %f1491, %f838, %f214, %f837;
bra.uni BB0_152;
BB0_151:
mov.f32 %f839, 0f3C08839E;
mov.f32 %f840, 0fB94CA1F9;
fma.rn.f32 %f1491, %f840, %f214, %f839;
BB0_152:
@%p105 bra BB0_154;
mov.f32 %f841, 0f3D2AAAA5;
fma.rn.f32 %f842, %f1491, %f214, %f841;
mov.f32 %f843, 0fBF000000;
fma.rn.f32 %f1492, %f842, %f214, %f843;
bra.uni BB0_155;
BB0_154:
mov.f32 %f844, 0fBE2AAAA3;
fma.rn.f32 %f845, %f1491, %f214, %f844;
mov.f32 %f846, 0f00000000;
fma.rn.f32 %f1492, %f845, %f214, %f846;
BB0_155:
fma.rn.f32 %f1493, %f1492, %f1490, %f1490;
@%p105 bra BB0_157;
mov.f32 %f847, 0f3F800000;
fma.rn.f32 %f1493, %f1492, %f214, %f847;
BB0_157:
and.b32 %r589, %r776, 2;
setp.eq.s32 %p108, %r589, 0;
@%p108 bra BB0_159;
mov.f32 %f848, 0f00000000;
mov.f32 %f849, 0fBF800000;
fma.rn.f32 %f1493, %f1493, %f849, %f848;
BB0_159:
mul.f32 %f858, %f189, %f1487;
mul.f32 %f859, %f858, %f858;
mov.f32 %f860, 0f3F800000;
sub.f32 %f861, %f860, %f859;
mul.f32 %f862, %f189, %f1493;
mul.f32 %f863, %f862, %f862;
sub.f32 %f864, %f861, %f863;
mov.f32 %f865, 0f00000000;
max.f32 %f866, %f865, %f864;
sqrt.rn.f32 %f867, %f866;
mul.f32 %f868, %f186, %f862;
mul.f32 %f869, %f187, %f862;
mul.f32 %f870, %f188, %f862;
mul.f32 %f871, %f181, %f188;
mul.f32 %f872, %f182, %f187;
sub.f32 %f873, %f872, %f871;
fma.rn.f32 %f874, %f873, %f858, %f868;
mul.f32 %f875, %f182, %f186;
mul.f32 %f876, %f180, %f188;
sub.f32 %f877, %f876, %f875;
fma.rn.f32 %f878, %f877, %f858, %f869;
mul.f32 %f879, %f180, %f187;
mul.f32 %f880, %f181, %f186;
sub.f32 %f881, %f880, %f879;
fma.rn.f32 %f882, %f881, %f858, %f870;
fma.rn.f32 %f883, %f180, %f867, %f874;
fma.rn.f32 %f884, %f181, %f867, %f878;
fma.rn.f32 %f885, %f182, %f867, %f882;
add.f32 %f886, %f180, %f883;
add.f32 %f887, %f181, %f884;
add.f32 %f888, %f182, %f885;
mul.f32 %f889, %f596, %f886;
mul.f32 %f890, %f596, %f887;
mul.f32 %f891, %f596, %f888;
sub.f32 %f892, %f889, %f180;
sub.f32 %f893, %f890, %f181;
sub.f32 %f894, %f891, %f182;
mul.f32 %f895, %f893, %f893;
fma.rn.f32 %f896, %f892, %f892, %f895;
fma.rn.f32 %f897, %f894, %f894, %f896;
sqrt.rn.f32 %f898, %f897;
rcp.rn.f32 %f899, %f898;
mul.f32 %f853, %f899, %f892;
mul.f32 %f854, %f899, %f893;
mul.f32 %f855, %f899, %f894;
mul.f32 %f900, %f72, 0f3456BF95;
abs.f32 %f901, %f900;
mul.f32 %f902, %f73, 0f3456BF95;
abs.f32 %f903, %f902;
mul.f32 %f904, %f74, 0f3456BF95;
abs.f32 %f905, %f904;
max.f32 %f906, %f901, %f903;
max.f32 %f907, %f906, %f905;
max.f32 %f856, %f907, %f566;
add.u64 %rd168, %SP, 28;
cvta.to.local.u64 %rd169, %rd168;
mov.u32 %r593, 1065353216;
st.local.u32 [%rd169], %r593;
ld.global.u32 %r590, [root];
mov.f32 %f857, 0f6C4ECB8F;
mov.u32 %r592, 4;
// inline asm
call _rt_trace_64, (%r590, %f72, %f73, %f74, %f853, %f854, %f855, %r385, %f856, %f857, %rd168, %r592);
// inline asm
ld.local.f32 %f1495, [%rd169];
// BB0_160: combine %f1482 with %f1495 and the bounceFlag-dependent scale.
BB0_160:
ld.global.u32 %r594, [bounceFlag];
setp.gt.s32 %p109, %r594, 0;
// %f912 = %f1482 * %f1495, additionally multiplied by %f600 * 100.0 when bounceFlag > 0.
mul.f32 %f909, %f600, 0f42C80000;
mul.f32 %f910, %f1482, %f1495;
mul.f32 %f911, %f909, %f910;
selp.f32 %f912, %f911, %f910, %p109;
// Per-channel product with (%f597, %f598, %f599).
mul.f32 %f1496, %f597, %f912;
mul.f32 %f1497, %f598, %f912;
mul.f32 %f1498, %f599, %f912;
BB0_161:
// (%f1499, %f1500, %f1501) = float(%r72) * (%f1496, %f1497, %f1498), with %r72
// converted as unsigned. When reached from the %f1482 <= 0 early exit the
// inputs are all 0.
cvt.rn.f32.u32 %f913, %r72;
mul.f32 %f1499, %f913, %f1496;
mul.f32 %f1500, %f913, %f1497;
mul.f32 %f1501, %f913, %f1498;
// BB0_162: start of the localLights stage. Bails out to BB0_189 when the
// localLights buffer is empty or the tileCubemap lookup returns a zero count.
BB0_162:
// Query the size of the localLights buffer; 96 is passed as the third argument
// (presumably the element size in bytes - the element is later read up to offset 80+16).
mov.u64 %rd175, localLights;
cvta.global.u64 %rd174, %rd175;
mov.u32 %r596, 96;
// inline asm
call (%rd170, %rd171, %rd172, %rd173), _rt_buffer_get_size_64, (%rd174, %r385, %r596);
// inline asm
// Only the low 32 bits of the first returned size are tested.
cvt.u32.u64 %r597, %rd170;
setp.eq.s32 %p110, %r597, 0;
mov.u16 %rs17, 0;
@%p110 bra BB0_189;
// Lookup direction = (%f72, %f73, %f74) - cameraPos.
ld.global.f32 %f921, [cameraPos];
sub.f32 %f918, %f72, %f921;
ld.global.f32 %f922, [cameraPos+4];
sub.f32 %f919, %f73, %f922;
ld.global.f32 %f923, [cameraPos+8];
sub.f32 %f920, %f74, %f923;
ld.global.u32 %r598, [tileCubemap];
mov.u32 %r599, 6;
mov.u32 %r600, 0;
// inline asm
call (%f914, %f915, %f916, %f917), _rt_texture_get_base_id, (%r598, %r599, %f918, %f919, %f920, %r600);
// inline asm
// The second returned component is reinterpreted bit-for-bit as an integer
// (mov.b32, no conversion); a value of 0 skips the stage.
mov.b32 %r214, %f915;
setp.eq.s32 %p111, %r214, 0;
@%p111 bra BB0_189;
mov.b32 %r605, %f914;
cvt.rn.f32.u32 %f244, %r214;
mul.f32 %f926, %f3, %f244;
cvt.rzi.u32.f32 %r606, %f926;
add.s32 %r607, %r214, -1;
min.u32 %r608, %r606, %r607;
add.s32 %r609, %r608, %r605;
cvt.u64.u32 %rd178, %r609;
mov.u64 %rd188, localLightIndices;
cvta.global.u64 %rd177, %rd188;
mov.u32 %r602, 4;
mov.u64 %rd187, 0;
// inline asm
call (%rd176), _rt_buffer_get_64, (%rd177, %r385, %r602, %rd178, %rd187, %rd187, %rd187);
// inline asm
ld.u32 %rd184, [%rd176];
// inline asm
call (%rd182), _rt_buffer_get_64, (%rd174, %r385, %r596, %rd184, %rd187, %rd187, %rd187);
// inline asm
ld.v4.f32 {%f927, %f928, %f929, %f930}, [%rd182+80];
ld.v4.f32 {%f931, %f932, %f933, %f934}, [%rd182+64];
ld.v4.f32 {%f935, %f936, %f937, %f938}, [%rd182+48];
ld.v4.f32 {%f1505, %f1506, %f1507, %f942}, [%rd182+32];
ld.v4.f32 {%f943, %f944, %f945, %f946}, [%rd182+16];
ld.v4.f32 {%f947, %f948, %f949, %f950}, [%rd182];
sub.f32 %f951, %f948, %f72;
sub.f32 %f952, %f949, %f73;
sub.f32 %f953, %f950, %f74;
mul.f32 %f954, %f952, %f952;
fma.rn.f32 %f955, %f951, %f951, %f954;
fma.rn.f32 %f956, %f953, %f953, %f955;
sqrt.rn.f32 %f272, %f956;
rcp.rn.f32 %f957, %f272;
mul.f32 %f273, %f951, %f957;
mul.f32 %f274, %f952, %f957;
mul.f32 %f275, %f953, %f957;
mul.f32 %f276, %f946, %f272;
mov.f32 %f961, 0f40800000;
abs.f32 %f278, %f276;
setp.lt.f32 %p112, %f278, 0f00800000;
mul.f32 %f963, %f278, 0f4B800000;
selp.f32 %f964, 0fC3170000, 0fC2FE0000, %p112;
selp.f32 %f965, %f963, %f278, %p112;
mov.b32 %r610, %f965;
and.b32 %r611, %r610, 8388607;
or.b32 %r612, %r611, 1065353216;
mov.b32 %f966, %r612;
shr.u32 %r613, %r610, 23;
cvt.rn.f32.u32 %f967, %r613;
add.f32 %f968, %f964, %f967;
setp.gt.f32 %p113, %f966, 0f3FB504F3;
mul.f32 %f969, %f966, 0f3F000000;
add.f32 %f970, %f968, 0f3F800000;
selp.f32 %f971, %f969, %f966, %p113;
selp.f32 %f972, %f970, %f968, %p113;
add.f32 %f973, %f971, 0fBF800000;
add.f32 %f925, %f971, 0f3F800000;
// inline asm
rcp.approx.ftz.f32 %f924,%f925;
// inline asm
add.f32 %f974, %f973, %f973;
mul.f32 %f975, %f924, %f974;
mul.f32 %f976, %f975, %f975;
mov.f32 %f977, 0f3C4CAF63;
mov.f32 %f978, 0f3B18F0FE;
fma.rn.f32 %f979, %f978, %f976, %f977;
mov.f32 %f980, 0f3DAAAABD;
fma.rn.f32 %f981, %f979, %f976, %f980;
mul.rn.f32 %f982, %f981, %f976;
mul.rn.f32 %f983, %f982, %f975;
sub.f32 %f984, %f973, %f975;
neg.f32 %f985, %f975;
add.f32 %f986, %f984, %f984;
fma.rn.f32 %f987, %f985, %f973, %f986;
mul.rn.f32 %f988, %f924, %f987;
add.f32 %f989, %f983, %f975;
sub.f32 %f990, %f975, %f989;
add.f32 %f991, %f983, %f990;
add.f32 %f992, %f988, %f991;
add.f32 %f993, %f989, %f992;
sub.f32 %f994, %f989, %f993;
add.f32 %f995, %f992, %f994;
mov.f32 %f996, 0f3F317200;
mul.rn.f32 %f997, %f972, %f996;
mov.f32 %f998, 0f35BFBE8E;
mul.rn.f32 %f999, %f972, %f998;
add.f32 %f1000, %f997, %f993;
sub.f32 %f1001, %f997, %f1000;
add.f32 %f1002, %f993, %f1001;
add.f32 %f1003, %f995, %f1002;
add.f32 %f1004, %f999, %f1003;
add.f32 %f1005, %f1000, %f1004;
sub.f32 %f1006, %f1000, %f1005;
add.f32 %f1007, %f1004, %f1006;
mul.rn.f32 %f279, %f961, %f1005;
neg.f32 %f1008, %f279;
fma.rn.f32 %f1009, %f961, %f1005, %f1008;
fma.rn.f32 %f1010, %f961, %f1007, %f1009;
mov.f32 %f1011, 0f00000000;
fma.rn.f32 %f280, %f1011, %f1005, %f1010;
add.rn.f32 %f281, %f279, %f280;
mov.b32 %r614, %f281;
setp.eq.s32 %p1, %r614, 1118925336;
add.s32 %r615, %r614, -1;
mov.b32 %f1012, %r615;
selp.f32 %f1013, %f1012, %f281, %p1;
mul.f32 %f1014, %f1013, 0f3FB8AA3B;
cvt.rzi.f32.f32 %f1015, %f1014;
mov.f32 %f1016, 0fBF317200;
fma.rn.f32 %f1017, %f1015, %f1016, %f1013;
mov.f32 %f1018, 0fB5BFBE8E;
fma.rn.f32 %f1019, %f1015, %f1018, %f1017;
mul.f32 %f1020, %f1019, 0f3FB8AA3B;
ex2.approx.ftz.f32 %f1021, %f1020;
add.f32 %f1022, %f1015, 0f00000000;
ex2.approx.f32 %f1023, %f1022;
mul.f32 %f1024, %f1021, %f1023;
setp.lt.f32 %p114, %f1013, 0fC2D20000;
selp.f32 %f1025, 0f00000000, %f1024, %p114;
setp.gt.f32 %p115, %f1013, 0f42D20000;
selp.f32 %f1502, 0f7F800000, %f1025, %p115;
setp.eq.f32 %p116, %f1502, 0f7F800000;
@%p116 bra BB0_166;
neg.f32 %f1026, %f281;
add.rn.f32 %f1027, %f279, %f1026;
add.rn.f32 %f1028, %f1027, %f280;
add.f32 %f1029, %f1028, 0f37000000;
selp.f32 %f1030, %f1029, %f1028, %p1;
fma.rn.f32 %f1502, %f1502, %f1030, %f1502;
BB0_166:
mov.f32 %f1433, 0f40000000;
cvt.rzi.f32.f32 %f1432, %f1433;
add.f32 %f1431, %f1432, %f1432;
mov.f32 %f1430, 0f40800000;
sub.f32 %f1429, %f1430, %f1431;
abs.f32 %f1428, %f1429;
setp.lt.f32 %p117, %f276, 0f00000000;
setp.eq.f32 %p118, %f1428, 0f3F800000;
and.pred %p2, %p117, %p118;
mov.b32 %r616, %f1502;
xor.b32 %r617, %r616, -2147483648;
mov.b32 %f1031, %r617;
selp.f32 %f1504, %f1031, %f1502, %p2;
setp.eq.f32 %p119, %f276, 0f00000000;
@%p119 bra BB0_169;
bra.uni BB0_167;
BB0_169:
add.f32 %f1034, %f276, %f276;
selp.f32 %f1504, %f1034, 0f00000000, %p118;
bra.uni BB0_170;
BB0_167:
setp.geu.f32 %p120, %f276, 0f00000000;
@%p120 bra BB0_170;
mov.f32 %f1436, 0f40800000;
cvt.rzi.f32.f32 %f1033, %f1436;
setp.neu.f32 %p121, %f1033, 0f40800000;
selp.f32 %f1504, 0f7FFFFFFF, %f1504, %p121;
BB0_170:
add.f32 %f1035, %f278, 0f40800000;
mov.b32 %r618, %f1035;
setp.lt.s32 %p123, %r618, 2139095040;
@%p123 bra BB0_175;
setp.gtu.f32 %p124, %f278, 0f7F800000;
@%p124 bra BB0_174;
bra.uni BB0_172;
BB0_174:
add.f32 %f1504, %f276, 0f40800000;
bra.uni BB0_175;
BB0_172:
setp.neu.f32 %p125, %f278, 0f7F800000;
@%p125 bra BB0_175;
selp.f32 %f1504, 0fFF800000, 0f7F800000, %p2;
BB0_175:
add.u64 %rd243, %SP, 0;
cvta.to.local.u64 %rd242, %rd243;
add.s64 %rd241, %rd242, 12;
mul.f32 %f1036, %f944, %f272;
mov.f32 %f1509, 0f3F800000;
sub.f32 %f1038, %f1509, %f1504;
setp.eq.f32 %p126, %f276, 0f3F800000;
selp.f32 %f1039, 0f00000000, %f1038, %p126;
cvt.sat.f32.f32 %f1040, %f1039;
fma.rn.f32 %f1041, %f1036, %f1036, %f945;
div.rn.f32 %f1508, %f1040, %f1041;
ld.local.f32 %f1042, [%rd241+-12];
ld.local.f32 %f1043, [%rd241+-8];
mul.f32 %f1044, %f274, %f1043;
fma.rn.f32 %f1045, %f273, %f1042, %f1044;
ld.local.f32 %f1046, [%rd241+-4];
fma.rn.f32 %f1047, %f275, %f1046, %f1045;
cvt.sat.f32.f32 %f308, %f1047;
setp.eq.f32 %p127, %f947, 0f3F800000;
@%p127 bra BB0_181;
bra.uni BB0_176;
// BB0_181: branch taken when %f947 == 1.0, where %f947 is the first float of the
// 96-byte localLights element loaded from [%rd182].
// NOTE(review): %f947 looks like a light-type tag - confirm against the host-side layout.
BB0_181:
// No texture modulation when %f942 <= 0 (or NaN).
setp.leu.f32 %p131, %f942, 0f00000000;
@%p131 bra BB0_183;
mov.u32 %r716, 2;
// %f1083 = -dot((%f927, %f928, %f929), (%f273, %f274, %f275));
// %f1084 = 1.0 when that is > 0, else 0.0.
mul.f32 %f1078, %f927, %f273;
mul.f32 %f1079, %f928, %f274;
neg.f32 %f1080, %f1079;
sub.f32 %f1081, %f1080, %f1078;
mul.f32 %f1082, %f929, %f275;
sub.f32 %f1083, %f1081, %f1082;
setp.gt.f32 %p132, %f1083, 0f00000000;
selp.f32 %f1084, 0f3F800000, 0f00000000, %p132;
// %f1089 = dot((%f935, %f936, %f937), D) and %f1090 = dot((%f931, %f932, %f933), D),
// with D = (%f273, %f274, %f275).
mul.f32 %f1085, %f936, %f274;
fma.rn.f32 %f1086, %f935, %f273, %f1085;
mul.f32 %f1087, %f932, %f274;
fma.rn.f32 %f1088, %f931, %f273, %f1087;
fma.rn.f32 %f1089, %f937, %f275, %f1086;
fma.rn.f32 %f1090, %f933, %f275, %f1088;
// Texture coordinates: %f1074 = 1 - (%f938 * %f1089 + 0.5), %f1075 = %f938 * %f1090 + 0.5.
fma.rn.f32 %f1091, %f938, %f1089, 0f3F000000;
mov.f32 %f1092, 0f3F800000;
sub.f32 %f1074, %f1092, %f1091;
fma.rn.f32 %f1075, %f938, %f1090, 0f3F000000;
// Texture id = %f942 truncated toward zero.
cvt.rzi.s32.f32 %r622, %f942;
mov.f32 %f1077, 0f00000000;
// inline asm
call (%f1070, %f1071, %f1072, %f1073), _rt_texture_get_f_id, (%r622, %r716, %f1074, %f1075, %f1077, %f1077);
// inline asm
// Multiply (%f1505, %f1506, %f1507) by the first three sample components,
// gated by the 0/1 factor %f1084.
mul.f32 %f1093, %f1084, %f1070;
mul.f32 %f1094, %f1084, %f1071;
mul.f32 %f1095, %f1084, %f1072;
mul.f32 %f1505, %f1505, %f1093;
mul.f32 %f1506, %f1506, %f1094;
mul.f32 %f1507, %f1507, %f1095;
bra.uni BB0_183;
// BB0_176: %f947 was not 1.0; dispatch on %f947 == 2.0 (BB0_179) versus the rest (BB0_177).
BB0_176:
setp.eq.f32 %p128, %f947, 0f40000000;
@%p128 bra BB0_179;
bra.uni BB0_177;
BB0_179:
// No texture modulation when %f942 <= 0 (or NaN).
setp.leu.f32 %p130, %f942, 0f00000000;
@%p130 bra BB0_183;
mov.u32 %r715, 0;
mov.u32 %r714, 6;
// Lookup vector (%f1061, %f1062, %f1063): dot products of D = (%f273, %f274, %f275)
// with (%f935, %f936, %f937), (%f931, %f932, %f933) and (%f927, %f928, %f929).
mul.f32 %f1064, %f936, %f274;
fma.rn.f32 %f1065, %f935, %f273, %f1064;
mul.f32 %f1066, %f932, %f274;
fma.rn.f32 %f1067, %f931, %f273, %f1066;
mul.f32 %f1068, %f928, %f274;
fma.rn.f32 %f1069, %f927, %f273, %f1068;
fma.rn.f32 %f1061, %f937, %f275, %f1065;
fma.rn.f32 %f1062, %f933, %f275, %f1067;
fma.rn.f32 %f1063, %f929, %f275, %f1069;
// Texture id = %f942 truncated toward zero.
cvt.rzi.s32.f32 %r619, %f942;
// inline asm
call (%f1057, %f1058, %f1059, %f1060), _rt_texture_get_base_id, (%r619, %r714, %f1061, %f1062, %f1063, %r715);
// inline asm
// Multiply (%f1505, %f1506, %f1507) by the first three sample components.
mul.f32 %f1505, %f1505, %f1057;
mul.f32 %f1506, %f1506, %f1058;
mul.f32 %f1507, %f1507, %f1059;
bra.uni BB0_183;
// BB0_177: only acts when %f947 == 4.0; neu = "not equal or unordered", so any
// other value (including NaN) falls through to BB0_183 unchanged.
BB0_177:
setp.neu.f32 %p129, %f947, 0f40800000;
@%p129 bra BB0_183;
// %f1053 = -dot((%f927, %f928, %f929), (%f273, %f274, %f275)).
mul.f32 %f1048, %f927, %f273;
mul.f32 %f1049, %f928, %f274;
neg.f32 %f1050, %f1049;
sub.f32 %f1051, %f1050, %f1048;
mul.f32 %f1052, %f929, %f275;
sub.f32 %f1053, %f1051, %f1052;
// %f1508 *= saturate(%f942 * %f1053 + %f938)^2.
// presumably a cone falloff term - confirm against the CUDA source.
fma.rn.f32 %f1054, %f942, %f1053, %f938;
cvt.sat.f32.f32 %f1055, %f1054;
mul.f32 %f1056, %f1055, %f1055;
mul.f32 %f1508, %f1508, %f1056;
BB0_183:
mov.f32 %f1510, 0f00000000;
max.f32 %f1099, %f1505, %f1506;
max.f32 %f1100, %f1099, %f1507;
mul.f32 %f320, %f308, %f1508;
mul.f32 %f1101, %f320, %f1100;
setp.lt.f32 %p133, %f1101, 0f3727C5AC;
mov.f32 %f1511, %f1510;
mov.f32 %f1512, %f1510;
@%p133 bra BB0_187;
add.u64 %rd190, %SP, 32;
cvta.to.local.u64 %rd42, %rd190;
mov.u32 %r624, 1065353216;
st.local.u32 [%rd42], %r624;
setp.leu.f32 %p134, %f930, 0f00000000;
@%p134 bra BB0_186;
mov.u32 %r706, 4;
mov.f32 %f1435, 0f38D1B717;
mov.u32 %r705, 1;
fma.rn.f32 %f1111, %f1, 0f40000000, 0fBF800000;
fma.rn.f32 %f1112, %f2, 0f40000000, 0fBF800000;
fma.rn.f32 %f1113, %f3, 0f40000000, 0fBF800000;
fma.rn.f32 %f1114, %f1111, %f943, %f948;
fma.rn.f32 %f1115, %f1112, %f943, %f949;
fma.rn.f32 %f1116, %f1113, %f943, %f950;
sub.f32 %f1117, %f1114, %f72;
sub.f32 %f1118, %f1115, %f73;
sub.f32 %f1119, %f1116, %f74;
mul.f32 %f1120, %f1118, %f1118;
fma.rn.f32 %f1121, %f1117, %f1117, %f1120;
fma.rn.f32 %f1122, %f1119, %f1119, %f1121;
sqrt.rn.f32 %f1110, %f1122;
rcp.rn.f32 %f1123, %f1110;
mul.f32 %f1106, %f1117, %f1123;
mul.f32 %f1107, %f1118, %f1123;
mul.f32 %f1108, %f1119, %f1123;
mul.f32 %f1124, %f72, 0f3456BF95;
abs.f32 %f1125, %f1124;
mul.f32 %f1126, %f73, 0f3456BF95;
abs.f32 %f1127, %f1126;
mul.f32 %f1128, %f74, 0f3456BF95;
abs.f32 %f1129, %f1128;
max.f32 %f1130, %f1125, %f1127;
max.f32 %f1131, %f1130, %f1129;
max.f32 %f1109, %f1131, %f1435;
ld.global.u32 %r625, [root];
// inline asm
call _rt_trace_64, (%r625, %f72, %f73, %f74, %f1106, %f1107, %f1108, %r705, %f1109, %f1110, %rd190, %r706);
// inline asm
ld.local.f32 %f1509, [%rd42];
BB0_186:
ld.global.u32 %r628, [bounceFlag];
setp.gt.s32 %p135, %r628, 0;
mul.f32 %f1133, %f320, %f1509;
mul.f32 %f1134, %f934, %f1133;
selp.f32 %f1135, %f1134, %f1133, %p135;
mul.f32 %f1510, %f1505, %f1135;
mul.f32 %f1511, %f1506, %f1135;
mul.f32 %f1512, %f1507, %f1135;
BB0_187:
mov.u16 %rs17, 0;
fma.rn.f32 %f1499, %f244, %f1510, %f1499;
fma.rn.f32 %f1500, %f244, %f1511, %f1500;
fma.rn.f32 %f1501, %f244, %f1512, %f1501;
BB0_189:
mov.u64 %rd245, GBufferAtten;
cvta.global.u64 %rd244, %rd245;
mov.u32 %r708, 12;
mov.u32 %r707, 2;
abs.f32 %f1145, %f1499;
setp.gtu.f32 %p137, %f1145, 0f7F800000;
selp.f32 %f1146, 0f00000000, %f1499, %p137;
abs.f32 %f1147, %f1500;
setp.gtu.f32 %p138, %f1147, 0f7F800000;
selp.f32 %f1148, 0f00000000, %f1500, %p138;
abs.f32 %f1149, %f1501;
setp.gtu.f32 %p139, %f1149, 0f7F800000;
selp.f32 %f1150, 0f00000000, %f1501, %p139;
fma.rn.f32 %f1525, %f1516, %f1146, %f1513;
fma.rn.f32 %f1526, %f1517, %f1148, %f1514;
fma.rn.f32 %f1527, %f1518, %f1150, %f1515;
ld.global.v2.u32 {%r634, %r635}, [pixelID];
cvt.u64.u32 %rd194, %r634;
cvt.u64.u32 %rd195, %r635;
mov.u64 %rd203, 0;
// inline asm
call (%rd192), _rt_buffer_get_64, (%rd244, %r707, %r708, %rd194, %rd195, %rd203, %rd203);
// inline asm
st.f32 [%rd192+8], %f1518;
st.f32 [%rd192+4], %f1517;
st.f32 [%rd192], %f1516;
ld.global.v2.u32 {%r638, %r639}, [pixelID];
cvt.u64.u32 %rd200, %r638;
cvt.u64.u32 %rd201, %r639;
mov.u64 %rd205, accumBufferAdd;
cvta.global.u64 %rd199, %rd205;
// inline asm
call (%rd198), _rt_buffer_get_64, (%rd199, %r707, %r708, %rd200, %rd201, %rd203, %rd203);
// inline asm
ld.global.u32 %r642, [bounceFlag];
setp.eq.s32 %p140, %r642, 0;
@%p140 bra BB0_191;
ld.f32 %f1151, [%rd198+8];
ld.f32 %f1152, [%rd198+4];
ld.f32 %f1153, [%rd198];
add.f32 %f1525, %f1525, %f1153;
add.f32 %f1526, %f1526, %f1152;
add.f32 %f1527, %f1527, %f1151;
bra.uni BB0_196;
BB0_191:
ld.global.u32 %r215, [firstSkylight];
setp.lt.s32 %p141, %r215, 0;
setp.eq.s16 %p142, %rs17, 0;
or.pred %p143, %p141, %p142;
@%p143 bra BB0_196;
cvt.s64.s32 %rd208, %r215;
mov.u64 %rd212, globalLights;
cvta.global.u64 %rd207, %rd212;
mov.u32 %r643, 1;
mov.u32 %r644, 48;
// inline asm
call (%rd206), _rt_buffer_get_64, (%rd207, %r643, %r644, %rd208, %rd203, %rd203, %rd203);
// inline asm
ld.v4.f32 {%f1158, %f1159, %f1160, %f1161}, [%rd206+16];
ld.v4.f32 {%f1162, %f1163, %f1164, %f1165}, [%rd206];
setp.neu.f32 %p144, %f1158, 0f00000000;
setp.leu.f32 %p145, %f63, 0f00000000;
and.pred %p146, %p144, %p145;
@%p146 bra BB0_196;
mov.f32 %f1522, 0f3F800000;
setp.leu.f32 %p147, %f1163, 0f00000000;
mov.f32 %f1523, %f1522;
mov.f32 %f1524, %f1522;
@%p147 bra BB0_195;
cvt.rzi.s32.f32 %r645, %f1164;
neg.f32 %f1175, %f62;
neg.f32 %f1174, %f63;
neg.f32 %f1173, %f64;
mov.u32 %r646, 6;
mov.u32 %r647, 0;
// inline asm
call (%f1524, %f1523, %f1522, %f1172), _rt_texture_get_base_id, (%r645, %r646, %f1173, %f1174, %f1175, %r647);
// inline asm
BB0_195:
mul.f32 %f1525, %f1159, %f1524;
mul.f32 %f1526, %f1160, %f1523;
mul.f32 %f1527, %f1161, %f1522;
BB0_196:
mov.u32 %r710, 12;
mov.u32 %r709, 2;
ld.global.v2.u32 {%r652, %r653}, [pixelID];
cvt.u64.u32 %rd215, %r652;
cvt.u64.u32 %rd216, %r653;
// inline asm
call (%rd213), _rt_buffer_get_64, (%rd199, %r709, %r710, %rd215, %rd216, %rd203, %rd203);
// inline asm
st.f32 [%rd213+8], %f1527;
st.f32 [%rd213+4], %f1526;
st.f32 [%rd213], %f1525;
ld.global.v2.u32 {%r656, %r657}, [pixelID];
cvt.u64.u32 %rd221, %r656;
cvt.u64.u32 %rd222, %r657;
mov.u64 %rd226, accumBufferLerp;
cvta.global.u64 %rd220, %rd226;
// inline asm
call (%rd219), _rt_buffer_get_64, (%rd220, %r709, %r710, %rd221, %rd222, %rd203, %rd203);
// inline asm
ld.f32 %f1176, [%rd219+8];
ld.f32 %f1177, [%rd219+4];
ld.f32 %f1178, [%rd219];
sub.f32 %f1179, %f1525, %f1178;
sub.f32 %f1180, %f1526, %f1177;
sub.f32 %f1181, %f1527, %f1176;
ld.global.f32 %f1182, [integration];
fma.rn.f32 %f371, %f1182, %f1179, %f1178;
fma.rn.f32 %f372, %f1182, %f1180, %f1177;
fma.rn.f32 %f373, %f1182, %f1181, %f1176;
ld.global.u32 %r660, [finalBounceFlag];
setp.eq.s32 %p148, %r660, 0;
@%p148 bra BB0_198;
mov.u32 %r712, 12;
mov.u32 %r711, 2;
ld.global.v2.u32 {%r663, %r664}, [pixelID];
cvt.u64.u32 %rd229, %r663;
cvt.u64.u32 %rd230, %r664;
// inline asm
call (%rd227), _rt_buffer_get_64, (%rd220, %r711, %r712, %rd229, %rd230, %rd203, %rd203);
// inline asm
st.f32 [%rd227+8], %f373;
st.f32 [%rd227+4], %f372;
st.f32 [%rd227], %f371;
BB0_198:
ld.global.v2.u32 {%r667, %r668}, [pixelID];
cvt.u64.u32 %rd44, %r667;
ld.global.u32 %r670, [resolution+4];
add.s32 %r671, %r670, -1;
sub.s32 %r216, %r671, %r668;
ld.global.f32 %f1185, [cameraExp];
mul.f32 %f374, %f371, %f1185;
mul.f32 %f375, %f372, %f1185;
mul.f32 %f376, %f373, %f1185;
mov.f32 %f1186, 0f3E68BA2E;
cvt.rzi.f32.f32 %f1187, %f1186;
fma.rn.f32 %f1188, %f1187, 0fC0000000, 0f3EE8BA2E;
abs.f32 %f377, %f1188;
abs.f32 %f378, %f374;
setp.lt.f32 %p149, %f378, 0f00800000;
mul.f32 %f1189, %f378, 0f4B800000;
selp.f32 %f1190, 0fC3170000, 0fC2FE0000, %p149;
selp.f32 %f1191, %f1189, %f378, %p149;
mov.b32 %r673, %f1191;
and.b32 %r674, %r673, 8388607;
or.b32 %r675, %r674, 1065353216;
mov.b32 %f1192, %r675;
shr.u32 %r676, %r673, 23;
cvt.rn.f32.u32 %f1193, %r676;
add.f32 %f1194, %f1190, %f1193;
setp.gt.f32 %p150, %f1192, 0f3FB504F3;
mul.f32 %f1195, %f1192, 0f3F000000;
add.f32 %f1196, %f1194, 0f3F800000;
selp.f32 %f1197, %f1195, %f1192, %p150;
selp.f32 %f1198, %f1196, %f1194, %p150;
add.f32 %f1199, %f1197, 0fBF800000;
add.f32 %f1184, %f1197, 0f3F800000;
// inline asm
rcp.approx.ftz.f32 %f1183,%f1184;
// inline asm
add.f32 %f1200, %f1199, %f1199;
mul.f32 %f1201, %f1183, %f1200;
mul.f32 %f1202, %f1201, %f1201;
mov.f32 %f1203, 0f3C4CAF63;
mov.f32 %f1204, 0f3B18F0FE;
fma.rn.f32 %f1205, %f1204, %f1202, %f1203;
mov.f32 %f1206, 0f3DAAAABD;
fma.rn.f32 %f1207, %f1205, %f1202, %f1206;
mul.rn.f32 %f1208, %f1207, %f1202;
mul.rn.f32 %f1209, %f1208, %f1201;
sub.f32 %f1210, %f1199, %f1201;
neg.f32 %f1211, %f1201;
add.f32 %f1212, %f1210, %f1210;
fma.rn.f32 %f1213, %f1211, %f1199, %f1212;
mul.rn.f32 %f1214, %f1183, %f1213;
add.f32 %f1215, %f1209, %f1201;
sub.f32 %f1216, %f1201, %f1215;
add.f32 %f1217, %f1209, %f1216;
add.f32 %f1218, %f1214, %f1217;
add.f32 %f1219, %f1215, %f1218;
sub.f32 %f1220, %f1215, %f1219;
add.f32 %f1221, %f1218, %f1220;
mov.f32 %f1222, 0f3F317200;
mul.rn.f32 %f1223, %f1198, %f1222;
mov.f32 %f1224, 0f35BFBE8E;
mul.rn.f32 %f1225, %f1198, %f1224;
add.f32 %f1226, %f1223, %f1219;
sub.f32 %f1227, %f1223, %f1226;
add.f32 %f1228, %f1219, %f1227;
add.f32 %f1229, %f1221, %f1228;
add.f32 %f1230, %f1225, %f1229;
add.f32 %f1231, %f1226, %f1230;
sub.f32 %f1232, %f1226, %f1231;
add.f32 %f1233, %f1230, %f1232;
mov.f32 %f1234, 0f3EE8BA2E;
mul.rn.f32 %f1235, %f1234, %f1231;
neg.f32 %f1236, %f1235;
fma.rn.f32 %f1237, %f1234, %f1231, %f1236;
fma.rn.f32 %f1238, %f1234, %f1233, %f1237;
mov.f32 %f1239, 0f00000000;
fma.rn.f32 %f1240, %f1239, %f1231, %f1238;
add.rn.f32 %f1241, %f1235, %f1240;
neg.f32 %f1242, %f1241;
add.rn.f32 %f1243, %f1235, %f1242;
add.rn.f32 %f1244, %f1243, %f1240;
mov.b32 %r677, %f1241;
setp.eq.s32 %p151, %r677, 1118925336;
add.s32 %r678, %r677, -1;
mov.b32 %f1245, %r678;
add.f32 %f1246, %f1244, 0f37000000;
selp.f32 %f1247, %f1245, %f1241, %p151;
selp.f32 %f379, %f1246, %f1244, %p151;
mul.f32 %f1248, %f1247, 0f3FB8AA3B;
cvt.rzi.f32.f32 %f1249, %f1248;
mov.f32 %f1250, 0fBF317200;
fma.rn.f32 %f1251, %f1249, %f1250, %f1247;
mov.f32 %f1252, 0fB5BFBE8E;
fma.rn.f32 %f1253, %f1249, %f1252, %f1251;
mul.f32 %f1254, %f1253, 0f3FB8AA3B;
ex2.approx.ftz.f32 %f1255, %f1254;
add.f32 %f1256, %f1249, 0f00000000;
ex2.approx.f32 %f1257, %f1256;
mul.f32 %f1258, %f1255, %f1257;
setp.lt.f32 %p152, %f1247, 0fC2D20000;
selp.f32 %f1259, 0f00000000, %f1258, %p152;
setp.gt.f32 %p153, %f1247, 0f42D20000;
selp.f32 %f1528, 0f7F800000, %f1259, %p153;
setp.eq.f32 %p154, %f1528, 0f7F800000;
@%p154 bra BB0_200;
fma.rn.f32 %f1528, %f1528, %f379, %f1528;
BB0_200:
setp.lt.f32 %p155, %f374, 0f00000000;
setp.eq.f32 %p156, %f377, 0f3F800000;
and.pred %p3, %p155, %p156;
mov.b32 %r679, %f1528;
xor.b32 %r680, %r679, -2147483648;
mov.b32 %f1260, %r680;
selp.f32 %f1530, %f1260, %f1528, %p3;
setp.eq.f32 %p157, %f374, 0f00000000;
@%p157 bra BB0_203;
bra.uni BB0_201;
BB0_203:
add.f32 %f1263, %f374, %f374;
selp.f32 %f1530, %f1263, 0f00000000, %p156;
bra.uni BB0_204;
BB0_201:
setp.geu.f32 %p158, %f374, 0f00000000;
@%p158 bra BB0_204;
cvt.rzi.f32.f32 %f1262, %f1234;
setp.neu.f32 %p159, %f1262, 0f3EE8BA2E;
selp.f32 %f1530, 0f7FFFFFFF, %f1530, %p159;
BB0_204:
add.f32 %f1264, %f378, 0f3EE8BA2E;
mov.b32 %r681, %f1264;
setp.lt.s32 %p161, %r681, 2139095040;
@%p161 bra BB0_209;
setp.gtu.f32 %p162, %f378, 0f7F800000;
@%p162 bra BB0_208;
bra.uni BB0_206;
BB0_208:
add.f32 %f1530, %f374, 0f3EE8BA2E;
bra.uni BB0_209;
BB0_206:
setp.neu.f32 %p163, %f378, 0f7F800000;
@%p163 bra BB0_209;
selp.f32 %f1530, 0fFF800000, 0f7F800000, %p3;
BB0_209:
setp.eq.f32 %p164, %f374, 0f3F800000;
selp.f32 %f1267, 0f3F800000, %f1530, %p164;
cvt.sat.f32.f32 %f390, %f1267;
abs.f32 %f391, %f375;
setp.lt.f32 %p165, %f391, 0f00800000;
mul.f32 %f1268, %f391, 0f4B800000;
selp.f32 %f1269, 0fC3170000, 0fC2FE0000, %p165;
selp.f32 %f1270, %f1268, %f391, %p165;
mov.b32 %r682, %f1270;
and.b32 %r683, %r682, 8388607;
or.b32 %r684, %r683, 1065353216;
mov.b32 %f1271, %r684;
shr.u32 %r685, %r682, 23;
cvt.rn.f32.u32 %f1272, %r685;
add.f32 %f1273, %f1269, %f1272;
setp.gt.f32 %p166, %f1271, 0f3FB504F3;
mul.f32 %f1274, %f1271, 0f3F000000;
add.f32 %f1275, %f1273, 0f3F800000;
selp.f32 %f1276, %f1274, %f1271, %p166;
selp.f32 %f1277, %f1275, %f1273, %p166;
add.f32 %f1278, %f1276, 0fBF800000;
add.f32 %f1266, %f1276, 0f3F800000;
// inline asm
rcp.approx.ftz.f32 %f1265,%f1266;
// inline asm
add.f32 %f1279, %f1278, %f1278;
mul.f32 %f1280, %f1265, %f1279;
mul.f32 %f1281, %f1280, %f1280;
fma.rn.f32 %f1284, %f1204, %f1281, %f1203;
fma.rn.f32 %f1286, %f1284, %f1281, %f1206;
mul.rn.f32 %f1287, %f1286, %f1281;
mul.rn.f32 %f1288, %f1287, %f1280;
sub.f32 %f1289, %f1278, %f1280;
neg.f32 %f1290, %f1280;
add.f32 %f1291, %f1289, %f1289;
fma.rn.f32 %f1292, %f1290, %f1278, %f1291;
mul.rn.f32 %f1293, %f1265, %f1292;
add.f32 %f1294, %f1288, %f1280;
sub.f32 %f1295, %f1280, %f1294;
add.f32 %f1296, %f1288, %f1295;
add.f32 %f1297, %f1293, %f1296;
add.f32 %f1298, %f1294, %f1297;
sub.f32 %f1299, %f1294, %f1298;
add.f32 %f1300, %f1297, %f1299;
mul.rn.f32 %f1302, %f1277, %f1222;
mul.rn.f32 %f1304, %f1277, %f1224;
add.f32 %f1305, %f1302, %f1298;
sub.f32 %f1306, %f1302, %f1305;
add.f32 %f1307, %f1298, %f1306;
add.f32 %f1308, %f1300, %f1307;
add.f32 %f1309, %f1304, %f1308;
add.f32 %f1310, %f1305, %f1309;
sub.f32 %f1311, %f1305, %f1310;
add.f32 %f1312, %f1309, %f1311;
mul.rn.f32 %f1314, %f1234, %f1310;
neg.f32 %f1315, %f1314;
fma.rn.f32 %f1316, %f1234, %f1310, %f1315;
fma.rn.f32 %f1317, %f1234, %f1312, %f1316;
fma.rn.f32 %f1319, %f1239, %f1310, %f1317;
add.rn.f32 %f1320, %f1314, %f1319;
neg.f32 %f1321, %f1320;
add.rn.f32 %f1322, %f1314, %f1321;
add.rn.f32 %f1323, %f1322, %f1319;
mov.b32 %r686, %f1320;
setp.eq.s32 %p167, %r686, 1118925336;
add.s32 %r687, %r686, -1;
mov.b32 %f1324, %r687;
add.f32 %f1325, %f1323, 0f37000000;
selp.f32 %f1326, %f1324, %f1320, %p167;
selp.f32 %f392, %f1325, %f1323, %p167;
mul.f32 %f1327, %f1326, 0f3FB8AA3B;
cvt.rzi.f32.f32 %f1328, %f1327;
fma.rn.f32 %f1330, %f1328, %f1250, %f1326;
fma.rn.f32 %f1332, %f1328, %f1252, %f1330;
mul.f32 %f1333, %f1332, 0f3FB8AA3B;
ex2.approx.ftz.f32 %f1334, %f1333;
add.f32 %f1335, %f1328, 0f00000000;
ex2.approx.f32 %f1336, %f1335;
mul.f32 %f1337, %f1334, %f1336;
setp.lt.f32 %p168, %f1326, 0fC2D20000;
selp.f32 %f1338, 0f00000000, %f1337, %p168;
setp.gt.f32 %p169, %f1326, 0f42D20000;
selp.f32 %f1531, 0f7F800000, %f1338, %p169;
setp.eq.f32 %p170, %f1531, 0f7F800000;
@%p170 bra BB0_211;
fma.rn.f32 %f1531, %f1531, %f392, %f1531;
BB0_211:
setp.lt.f32 %p171, %f375, 0f00000000;
and.pred %p4, %p171, %p156;
mov.b32 %r688, %f1531;
xor.b32 %r689, %r688, -2147483648;
mov.b32 %f1339, %r689;
selp.f32 %f1533, %f1339, %f1531, %p4;
setp.eq.f32 %p173, %f375, 0f00000000;
@%p173 bra BB0_214;
bra.uni BB0_212;
BB0_214:
add.f32 %f1342, %f375, %f375;
selp.f32 %f1533, %f1342, 0f00000000, %p156;
bra.uni BB0_215;
BB0_212:
setp.geu.f32 %p174, %f375, 0f00000000;
@%p174 bra BB0_215;
cvt.rzi.f32.f32 %f1341, %f1234;
setp.neu.f32 %p175, %f1341, 0f3EE8BA2E;
selp.f32 %f1533, 0f7FFFFFFF, %f1533, %p175;
BB0_215:
add.f32 %f1343, %f391, 0f3EE8BA2E;
mov.b32 %r690, %f1343;
setp.lt.s32 %p177, %r690, 2139095040;
@%p177 bra BB0_220;
setp.gtu.f32 %p178, %f391, 0f7F800000;
@%p178 bra BB0_219;
bra.uni BB0_217;
BB0_219:
add.f32 %f1533, %f375, 0f3EE8BA2E;
bra.uni BB0_220;
BB0_217:
setp.neu.f32 %p179, %f391, 0f7F800000;
@%p179 bra BB0_220;
selp.f32 %f1533, 0fFF800000, 0f7F800000, %p4;
BB0_220:
setp.eq.f32 %p180, %f375, 0f3F800000;
selp.f32 %f1346, 0f3F800000, %f1533, %p180;
cvt.sat.f32.f32 %f403, %f1346;
abs.f32 %f404, %f376;
setp.lt.f32 %p181, %f404, 0f00800000;
mul.f32 %f1347, %f404, 0f4B800000;
selp.f32 %f1348, 0fC3170000, 0fC2FE0000, %p181;
selp.f32 %f1349, %f1347, %f404, %p181;
mov.b32 %r691, %f1349;
and.b32 %r692, %r691, 8388607;
or.b32 %r693, %r692, 1065353216;
mov.b32 %f1350, %r693;
shr.u32 %r694, %r691, 23;
cvt.rn.f32.u32 %f1351, %r694;
add.f32 %f1352, %f1348, %f1351;
setp.gt.f32 %p182, %f1350, 0f3FB504F3;
mul.f32 %f1353, %f1350, 0f3F000000;
add.f32 %f1354, %f1352, 0f3F800000;
selp.f32 %f1355, %f1353, %f1350, %p182;
selp.f32 %f1356, %f1354, %f1352, %p182;
add.f32 %f1357, %f1355, 0fBF800000;
add.f32 %f1345, %f1355, 0f3F800000;
// inline asm
rcp.approx.ftz.f32 %f1344,%f1345;
// inline asm
add.f32 %f1358, %f1357, %f1357;
mul.f32 %f1359, %f1344, %f1358;
mul.f32 %f1360, %f1359, %f1359;
fma.rn.f32 %f1363, %f1204, %f1360, %f1203;
fma.rn.f32 %f1365, %f1363, %f1360, %f1206;
mul.rn.f32 %f1366, %f1365, %f1360;
mul.rn.f32 %f1367, %f1366, %f1359;
sub.f32 %f1368, %f1357, %f1359;
neg.f32 %f1369, %f1359;
add.f32 %f1370, %f1368, %f1368;
fma.rn.f32 %f1371, %f1369, %f1357, %f1370;
mul.rn.f32 %f1372, %f1344, %f1371;
add.f32 %f1373, %f1367, %f1359;
sub.f32 %f1374, %f1359, %f1373;
add.f32 %f1375, %f1367, %f1374;
add.f32 %f1376, %f1372, %f1375;
add.f32 %f1377, %f1373, %f1376;
sub.f32 %f1378, %f1373, %f1377;
add.f32 %f1379, %f1376, %f1378;
mul.rn.f32 %f1381, %f1356, %f1222;
mul.rn.f32 %f1383, %f1356, %f1224;
add.f32 %f1384, %f1381, %f1377;
sub.f32 %f1385, %f1381, %f1384;
add.f32 %f1386, %f1377, %f1385;
add.f32 %f1387, %f1379, %f1386;
add.f32 %f1388, %f1383, %f1387;
add.f32 %f1389, %f1384, %f1388;
sub.f32 %f1390, %f1384, %f1389;
add.f32 %f1391, %f1388, %f1390;
mul.rn.f32 %f1393, %f1234, %f1389;
neg.f32 %f1394, %f1393;
fma.rn.f32 %f1395, %f1234, %f1389, %f1394;
fma.rn.f32 %f1396, %f1234, %f1391, %f1395;
fma.rn.f32 %f1398, %f1239, %f1389, %f1396;
add.rn.f32 %f1399, %f1393, %f1398;
neg.f32 %f1400, %f1399;
add.rn.f32 %f1401, %f1393, %f1400;
add.rn.f32 %f1402, %f1401, %f1398;
mov.b32 %r695, %f1399;
setp.eq.s32 %p183, %r695, 1118925336;
add.s32 %r696, %r695, -1;
mov.b32 %f1403, %r696;
add.f32 %f1404, %f1402, 0f37000000;
selp.f32 %f1405, %f1403, %f1399, %p183;
selp.f32 %f405, %f1404, %f1402, %p183;
mul.f32 %f1406, %f1405, 0f3FB8AA3B;
cvt.rzi.f32.f32 %f1407, %f1406;
fma.rn.f32 %f1409, %f1407, %f1250, %f1405;
fma.rn.f32 %f1411, %f1407, %f1252, %f1409;
mul.f32 %f1412, %f1411, 0f3FB8AA3B;
ex2.approx.ftz.f32 %f1413, %f1412;
add.f32 %f1414, %f1407, 0f00000000;
ex2.approx.f32 %f1415, %f1414;
mul.f32 %f1416, %f1413, %f1415;
setp.lt.f32 %p184, %f1405, 0fC2D20000;
selp.f32 %f1417, 0f00000000, %f1416, %p184;
setp.gt.f32 %p185, %f1405, 0f42D20000;
selp.f32 %f1534, 0f7F800000, %f1417, %p185;
setp.eq.f32 %p186, %f1534, 0f7F800000;
@%p186 bra BB0_222;
fma.rn.f32 %f1534, %f1534, %f405, %f1534;
BB0_222:
setp.lt.f32 %p187, %f376, 0f00000000;
and.pred %p5, %p187, %p156;
mov.b32 %r697, %f1534;
xor.b32 %r698, %r697, -2147483648;
mov.b32 %f1418, %r698;
selp.f32 %f1536, %f1418, %f1534, %p5;
setp.eq.f32 %p189, %f376, 0f00000000;
@%p189 bra BB0_225;
bra.uni BB0_223;
BB0_225:
add.f32 %f1421, %f376, %f376;
selp.f32 %f1536, %f1421, 0f00000000, %p156;
bra.uni BB0_226;
BB0_223:
setp.geu.f32 %p190, %f376, 0f00000000;
@%p190 bra BB0_226;
cvt.rzi.f32.f32 %f1420, %f1234;
setp.neu.f32 %p191, %f1420, 0f3EE8BA2E;
selp.f32 %f1536, 0f7FFFFFFF, %f1536, %p191;
BB0_226:
add.f32 %f1422, %f404, 0f3EE8BA2E;
mov.b32 %r699, %f1422;
setp.lt.s32 %p193, %r699, 2139095040;
@%p193 bra BB0_231;
setp.gtu.f32 %p194, %f404, 0f7F800000;
@%p194 bra BB0_230;
bra.uni BB0_228;
BB0_230:
add.f32 %f1536, %f376, 0f3EE8BA2E;
bra.uni BB0_231;
BB0_228:
setp.neu.f32 %p195, %f404, 0f7F800000;
@%p195 bra BB0_231;
selp.f32 %f1536, 0fFF800000, 0f7F800000, %p5;
BB0_231:
mov.u32 %r713, 2;
setp.eq.f32 %p196, %f376, 0f3F800000;
selp.f32 %f1423, 0f3F800000, %f1536, %p196;
cvt.sat.f32.f32 %f1424, %f1423;
cvt.u64.u32 %rd237, %r216;
mov.u64 %rd240, colorOutput;
cvta.global.u64 %rd235, %rd240;
mov.u32 %r701, 4;
// inline asm
call (%rd234), _rt_buffer_get_64, (%rd235, %r713, %r701, %rd44, %rd237, %rd203, %rd203);
// inline asm
mul.f32 %f1425, %f390, 0f437F0000;
cvt.rzi.u32.f32 %r702, %f1425;
mul.f32 %f1426, %f403, 0f437F0000;
cvt.rzi.u32.f32 %r703, %f1426;
mul.f32 %f1427, %f1424, 0f437F0000;
cvt.rzi.u32.f32 %r704, %f1427;
cvt.u16.u32 %rs12, %r704;
cvt.u16.u32 %rs13, %r703;
cvt.u16.u32 %rs14, %r702;
mov.u16 %rs15, 255;
st.v4.u8 [%rd234], {%rs14, %rs13, %rs12, %rs15};
ret;
}