summaryrefslogtreecommitdiff
path: root/reference/webgl-water/webgl-water-40.asm
diff options
context:
space:
mode:
Diffstat (limited to 'reference/webgl-water/webgl-water-40.asm')
-rw-r--r--reference/webgl-water/webgl-water-40.asm3525
1 files changed, 1277 insertions, 2248 deletions
diff --git a/reference/webgl-water/webgl-water-40.asm b/reference/webgl-water/webgl-water-40.asm
index 1a0f09e..323714f 100644
--- a/reference/webgl-water/webgl-water-40.asm
+++ b/reference/webgl-water/webgl-water-40.asm
@@ -6,2331 +6,1360 @@
@out(r1.y) out1
@out(r1.z) out2
@out(r1.w) out3
+@const(c7.x) 0x3f000000, 0x3ba3d70a, 0x3f800000, 0x40000000
+@const(c8.x) 0x3f1013a9, 0x00000000, 0x3f400d1b, 0x3e800000
+@const(c9.x) 0x40400000, 0x40800000, 0x49742400, 0x3f666666
+@const(c10.x) 0x00000000, 0x3f800000, 0x3ec00000, 0xbf800000
+@const(c11.x) 0x3f7fbe77, 0xc39044fe, 0xbe2ab368, 0x41200000
+@const(c12.x) 0x3e2ab368, 0x459c4000, 0x3e800000, 0x3f800000
+@const(c13.x) 0x41200000, 0x41000000, 0x40c00000, 0x3e800000
+@const(c14.x) 0x3e800000, 0x3f800000, 0x3fa00000, 0x00000000
+@const(c15.x) 0x00000000, 0x3f800000, 0x43000000, 0x00000000
(sy)(ss)bary.f r0.z, 0, r0.x
absneg.f r0.w, (neg)c0.y
absneg.f r1.x, (neg)c0.y
absneg.f r1.y, (neg)c0.y
mad.f32 r1.z, c7.x, r0.z, c7.x
-mul.f r1.w, r0.w, r0.w
-mul.f r2.x, r1.x, r1.x
-mul.f r2.y, r1.y, r1.y
-mov.f32f32 r2.z, r1.z
-add.f r1.w, c7.z, (neg)r1.w
-add.f r2.x, c7.z, (neg)r2.x
+bary.f r2.x, 2, r0.x
+mul.f r2.y, r0.w, r0.w
+mul.f r2.z, r1.x, r1.x
+mul.f r2.w, r1.y, r1.y
+mad.f32 r1.w, c7.x, r2.x, c7.x
add.f r2.y, c7.z, (neg)r2.y
-mov.f32f32 r2.z, r2.z
-bary.f r3.x, 2, r0.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r2.y, r2.y
-mad.f32 r3.y, c7.x, r3.x, c7.x
-mul.f r1.w, r1.w, c8.x
-mul.f r2.x, r2.x, c8.x
+add.f r2.z, c7.z, (neg)r2.z
+add.f r2.w, c7.z, (neg)r2.w
+absneg.f r3.x, (neg)c0.y
mul.f r2.y, r2.y, c8.x
-mov.f32f32 r2.w, r3.y
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r2.w, r2.w
-add.f r1.w, c7.z, (neg)r1.w
-add.f r2.x, c7.z, (neg)r2.x
+mul.f r2.z, r2.z, c8.x
+sam (f32)(zw)r3.y, r1.z, s#2, t#2
+(sy)mad.f32 r3.y, c7.y, r3.w, r1.z
+mad.f32 r3.z, c7.y, r4.x, r1.w
+(ss)add.f r1.z, c7.z, (neg)r2.y
+add.f r1.w, c7.z, (neg)r2.z
+mul.f r2.y, r2.w, c8.x
+mul.f r2.z, r3.x, r3.x
+mov.f32f32 r2.w, r1.z
+mov.f32f32 r3.w, r1.w
+sam (f32)(zw)r4.x, r3.y, s#2, t#2
+(ss)mov.f32f32 r3.y, r3.y
add.f r2.y, c7.z, (neg)r2.y
-absneg.f r3.z, (neg)c0.y
-absneg.f r3.w, (neg)c0.y
-absneg.f r4.x, (neg)c0.y
-sam (f32)(zw)r4.y, r2.z, s#2, t#2
-(sy)mad.f32 r1.z, c7.y, r4.w, r1.z
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r1.z, r1.z
-(ss)mov.f32f32 r2.z, r1.w
-mov.f32f32 r2.w, r2.x
-mov.f32f32 r4.y, r2.y
-mov.f32f32 r4.z, r1.z
-mul.f r4.w, r3.z, r3.z
-mul.f r5.y, r3.w, r3.w
-mul.f r5.z, r4.x, r4.x
-mov.f32f32 r5.w, r4.z
-mad.f32 r3.y, c7.y, r5.x, r3.y
-sqrt r2.z, r2.z
-(ss)mov.f32f32 r2.z, r2.z
-mov.f32f32 r4.z, r0.w
+(sy)mad.f32 r4.x, c7.y, r4.z, r3.y
+mov.f32f32 r3.y, r3.z
+add.f r2.z, c7.z, (neg)r2.z
+mad.f32 r4.y, c7.y, r4.w, r3.y
sqrt r2.w, r2.w
-(ss)mov.f32f32 r2.w, r2.w
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r5.x, r1.x
-sqrt r4.y, r4.y
-(ss)mov.f32f32 r4.y, r4.y
-mad.f32 r2.z, c8.z, r4.z, r2.z
-mov.f32f32 r4.z, r3.y
-mad.f32 r2.w, c8.z, r5.x, r2.w
-mov.f32f32 r5.x, r1.y
-add.f r4.w, c7.z, (neg)r4.w
-mov.f32f32 r6.x, r4.z
-mov.f32f32 r2.z, r2.z
+(ss)mad.f32 r2.w, c8.z, r0.w, r2.w
+sqrt r3.y, r3.w
+(ss)mad.f32 r3.y, c8.z, r1.x, r3.y
+mov.f32f32 r3.z, r2.y
+mul.f r2.z, r2.z, c8.x
+(ss)mul.f r3.w, r2.w, c10.x
+absneg.f r4.z, (neg)c0.z
+sam (f32)(zw)r4.w, r4.x, s#2, t#2
+(ss)mov.f32f32 r4.x, r4.x
mov.f32f32 r2.w, r2.w
-mad.f32 r4.y, c8.z, r5.x, r4.y
-mov.f32f32 r4.z, r4.w
-add.f r4.w, c7.z, (neg)r5.y
-add.f r5.x, c7.z, (neg)r5.z
-sam (f32)(zw)r5.y, r5.w, s#2, t#2
-(sy)mad.f32 r1.z, c7.y, r5.w, r1.z
-mul.f r5.y, r2.z, c10.x
-mul.f r5.z, r2.z, c10.y
-mul.f r2.z, r2.z, c10.x
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r5.y, r5.y
-(ss)absneg.f r5.w, (neg)c0.z
-mov.f32f32 r5.z, r5.z
-mov.f32f32 r6.y, r1.z
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r2.z, r2.z
-absneg.f r6.z, (neg)c0.x
-mov.f32f32 r6.w, r6.y
-mad.f32 r3.y, c7.y, r6.x, r3.y
-mov.f32f32 r5.w, r5.w
-mad.f32 r0.w, c8.z, r0.w, (neg)r5.z
+(sy)mad.f32 r4.w, c7.y, r5.y, r4.x
+mov.f32f32 r4.x, r4.y
+mov.f32f32 r4.y, r3.y
+mad.f32 r5.x, c7.y, r5.z, r4.x
+mul.f r4.x, r2.w, c10.y
+mul.f r2.w, r2.w, c10.x
+absneg.f r5.y, (neg)c0.x
+mad.f32 r0.w, c8.z, r0.w, (neg)r4.x
+cmps.f.lt r1.z, r1.z, c8.y
+mul.f r4.x, r4.y, c10.y
+sam (f32)(zw)r5.z, r4.w, s#2, t#2
+(ss)mov.f32f32 r4.w, r4.w
+mad.f32 r2.w, c8.z, r5.y, (neg)r2.w
+(sy)mad.f32 r5.y, c7.y, r6.x, r4.w
+mov.f32f32 r4.w, r5.x
+cov.u32f32 r1.z, r1.z
+mad.f32 r5.z, c7.y, r6.y, r4.w
+mad.f32 r1.x, c8.z, r1.x, (neg)r4.x
cmps.f.lt r1.w, r1.w, c8.y
-mov.f32f32 r3.y, r3.y
-mad.f32 r5.y, c8.z, r5.w, (neg)r5.y
-mov.f32f32 r5.z, r6.z
+mul.f r4.x, r4.y, c10.x
+cmps.f.ne r1.z, r1.z, c8.y
+mov.f32f32 r4.y, c8.y
+mov.f32f32 r4.w, c8.y
+sam (f32)(zw)r5.w, r5.y, s#2, t#2
+mov.f32f32 r5.x, r5.y
cov.u32f32 r1.w, r1.w
-mov.f32f32 r5.w, r3.y
-mul.f r6.x, r2.w, c10.x
-mul.f r6.y, r2.w, c10.y
-mul.f r2.w, r2.w, c10.x
-mov.f32f32 r7.x, r5.w
+(sy)mad.f32 r5.x, c7.y, r6.y, r5.x
+(ss)mov.f32f32 r5.y, r5.z
+sel.b32 r0.w, r4.y, r1.z, r0.w
+mad.f32 r5.y, c7.y, r6.z, r5.y
+sel.b32 r2.w, r4.w, r1.z, r2.w
cmps.f.ne r1.w, r1.w, c8.y
-mov.f32f32 r5.w, c8.y
-mov.f32f32 r6.z, c8.y
-mad.f32 r2.z, c8.z, r5.z, (neg)r2.z
-mov.f32f32 r5.z, c8.y
-mov.f32f32 r6.x, r6.x
-sam (f32)(zw)r6.w, r6.w, s#2, t#2
-(sy)mad.f32 r1.z, c7.y, r7.y, r1.z
-sel.b32 r5.y, r5.w, r1.w, r5.y
-sel.b32 r0.w, r6.z, r1.w, r0.w
-sel.b32 r1.w, r5.z, r1.w, r2.z
-mov.f32f32 r1.z, r1.z
-absneg.f r2.z, (neg)r5.y
+mov.f32f32 r4.y, c8.y
absneg.f r0.w, (neg)r0.w
-absneg.f r1.w, (neg)r1.w
-mov.f32f32 r5.y, r1.z
-mov.f32f32 r5.z, r2.z
-mov.f32f32 r5.w, r2.z
-mov.f32f32 r6.z, r0.w
-(ss)mov.f32f32 r6.w, r5.y
-mad.f32 r3.y, c7.y, r7.z, r3.y
-mov.f32f32 r5.y, r0.w
-mov.f32f32 r7.x, r1.w
-mov.f32f32 r7.y, r1.w
-mov.f32f32 r3.y, r3.y
-rcp r5.z, r5.z
+absneg.f r2.w, (neg)r2.w
+absneg.f r4.w, (neg)c0.x
+sam (f32)(zw)r5.x, r5.x, s#2, t#2
+(sy)(ss)mul.f r5.x, r5.z, r5.z
+sel.b32 r1.x, r4.y, r1.w, r1.x
+mad.f32 r4.y, r5.w, r5.w, r5.x
+mad.f32 r4.x, c8.z, r4.w, (neg)r4.x
+mov.f32f32 r4.w, c8.y
+absneg.f r1.x, (neg)r1.x
+add.f r4.y, c7.z, (neg)r4.y
+rcp r5.x, r0.w
nop
-rcp r5.w, r5.w
+rcp r5.y, r0.w
nop
-rcp r6.z, r6.z
-mov.f32f32 r7.z, r0.w
-mov.f32f32 r7.w, r3.y
-rcp r5.y, r5.y
+rcp r6.x, r2.w
nop
-rcp r8.x, r7.x
+rcp r6.y, r2.w
nop
-rcp r7.y, r7.y
-absneg.f r8.y, (neg)c0.z
-(ss)mov.f32f32 r7.x, r7.w
-mov.f32f32 r6.y, r6.y
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r2.w, r2.w
-rcp r7.z, r7.z
-mov.f32f32 r7.w, r8.y
-absneg.f r8.y, (neg)c0.x
-mad.f32 r1.x, c8.z, r1.x, (neg)r6.y
-sam (f32)(zw)r8.z, r6.w, s#2, t#2
-(sy)mad.f32 r1.z, c7.y, r9.x, r1.z
-mad.f32 r3.y, c7.y, r9.y, r3.y
-mad.f32 r6.x, c8.z, r7.w, (neg)r6.x
-cmps.f.lt r2.x, r2.x, c8.y
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r6.y, r8.y
-cov.u32f32 r2.x, r2.x
-(ss)mov.f32f32 r6.w, r1.z
-mov.f32f32 r7.x, r3.y
-mad.f32 r2.w, c8.z, r6.y, (neg)r2.w
-cmps.f.ne r2.x, r2.x, c8.y
-mov.f32f32 r8.y, r6.w
-mov.f32f32 r8.z, r7.x
-mov.f32f32 r6.y, c8.y
-mov.f32f32 r6.w, c8.y
-mov.f32f32 r7.x, c8.y
-mov.f32f32 r4.y, r4.y
-mul.f r4.z, r4.z, c8.x
-mov.f32f32 r4.w, r4.w
-sam (f32)(zw)r8.y, r8.y, s#2, t#2
-(sy)mad.f32 r1.z, c7.y, r8.w, r1.z
-mad.f32 r3.y, c7.y, r9.x, r3.y
-sel.b32 r6.x, r6.y, r2.x, r6.x
-sel.b32 r1.x, r6.w, r2.x, r1.x
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r3.y, r3.y
-absneg.f r6.x, (neg)r6.x
-absneg.f r1.x, (neg)r1.x
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r6.y, r6.x
-mov.f32f32 r6.w, r6.x
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r7.w, r1.x
-(ss)mov.f32f32 r8.y, r1.x
-mov.f32f32 r8.z, r1.z
-mov.f32f32 r8.w, r3.y
-rcp r1.z, r6.y
+rcp r6.z, r0.w
+sel.b32 r4.x, r4.w, r1.w, r4.x
+rcp r4.w, r1.x
nop
-rcp r3.y, r6.w
-sel.b32 r2.x, r7.x, r2.x, r2.w
-mov.f32f32 r2.w, r1.x
-(ss)rcp r6.y, r7.w
-mul.f r6.w, r4.y, c10.x
-mul.f r7.x, r4.y, c10.y
-(ss)rcp r7.w, r8.y
-absneg.f r2.x, (neg)r2.x
-sam (f32)(zw)r8.y, r8.z, s#2, t#2
-(sy)(ss)mul.f r8.y, r8.w, r8.w
-mov.f32f32 r8.z, r9.x
-mad.f32 r8.y, r9.x, r9.x, r8.y
-mov.f32f32 r8.w, r8.w
-add.f r9.x, r0.z, (neg)c6.x
-mov.f32f32 r9.y, r2.x
-add.f r8.y, c7.z, (neg)r8.y
-mov.f32f32 r9.z, r8.z
-mov.f32f32 r9.w, r8.w
-mul.f r10.x, r9.x, r9.x
-mov.f32f32 r8.y, r8.y
-bary.f (ei)r0.x, 1, r0.x
-rcp r0.y, r9.y
-(ss)mov.f32f32 r9.y, r2.x
-rcp r2.w, r2.w
-mov.f32f32 r6.w, r6.w
-absneg.f r10.y, (neg)c0.z
-add.f r10.z, r0.x, (neg)c6.y
+rcp r6.w, r1.x
+nop
+sqrt r4.y, r4.y
+(ss)mov.f32f32 r7.x, r4.y
+add.f r7.y, r0.z, (neg)c6.x
+absneg.f r4.x, (neg)r4.x
+rcp r7.z, r1.x
+nop
+sqrt r3.z, r3.z
mov.f32f32 r7.x, r7.x
-sqrt r8.y, r8.y
-(ss)mov.f32f32 r8.y, r8.y
-mov.f32f32 r10.y, r10.y
-mov.f32f32 r1.y, r1.y
-mul.f r4.y, r4.y, c10.x
-mov.f32f32 r8.y, r8.y
-mad.f32 r10.x, r10.z, r10.z, r10.x
-rcp r9.y, r9.y
-mad.f32 r6.w, c8.z, r10.y, (neg)r6.w
+mov.f32f32 r7.w, r5.z
+mul.f r8.x, r7.y, r7.y
+bary.f (ei)r0.x, 1, r0.x
+(ss)mad.f32 r0.y, c8.z, r1.y, r3.z
+add.f r2.z, c7.z, (neg)r2.z
+(ss)mad.f32 r3.z, c8.z, r4.z, (neg)r3.w
+add.f r3.w, r0.x, (neg)c6.y
+rcp r4.z, r4.x
+nop
+rcp r8.y, r4.x
+mov.f32f32 r8.z, r0.y
+mov.f32f32 r8.w, r2.z
+mad.f32 r8.x, r3.w, r3.w, r8.x
+add.f r9.x, r2.x, (neg)c6.z
+mul.f r9.y, r8.z, c10.y
+mul.f r8.z, r8.z, c10.x
+absneg.f r9.z, (neg)c0.x
+mad.f32 r8.x, r9.x, r9.x, r8.x
+mad.f32 r1.y, c8.z, r1.y, (neg)r9.y
cmps.f.lt r2.y, r2.y, c8.y
-mov.f32f32 r10.y, r8.y
-mov.f32f32 r10.x, r10.x
-add.f r10.w, r3.x, (neg)c6.z
+mad.f32 r8.z, c8.z, r9.z, (neg)r8.z
+sqrt r8.w, r8.w
+(ss)mad.f32 r8.w, c8.z, r3.x, r8.w
+mov.f32f32 r9.y, c8.y
cov.u32f32 r2.y, r2.y
-mad.f32 r1.y, c8.z, r1.y, (neg)r7.x
-mov.f32f32 r4.y, r4.y
-mad.f32 r7.x, r10.w, r10.w, r10.x
+rsq r8.x, r8.x
+(ss)mov.f32f32 r9.z, r8.x
+mov.f32f32 r9.w, r8.w
+sel.b32 r1.z, r9.y, r1.z, r3.z
+mul.f r3.y, r3.y, c10.x
+mul.f r3.z, r7.y, r9.z
cmps.f.ne r2.y, r2.y, c8.y
-mov.f32f32 r10.x, c8.y
-mov.f32f32 r11.x, c8.y
-absneg.f r11.y, (neg)c0.x
-mov.f32f32 r4.z, r4.z
-mul.f r4.w, r4.w, c8.x
-rsq r7.x, r7.x
-(ss)mov.f32f32 r7.x, r7.x
-sel.b32 r6.w, r10.x, r2.y, r6.w
-sel.b32 r1.y, r11.x, r2.y, r1.y
-mov.f32f32 r10.x, r11.y
-mul.f r9.x, r9.x, r7.x
-absneg.f r6.w, (neg)r6.w
+mov.f32f32 r7.y, c8.y
+mov.f32f32 r9.y, c8.y
+mov.f32f32 r10.x, r3.z
+mul.f r3.z, r5.z, (neg)r3.z
+mul.f r3.w, r3.w, r9.z
+sel.b32 r1.y, r7.y, r2.y, r1.y
+mul.f r5.z, r7.w, r10.x
+mul.f r7.y, r7.w, r10.x
+mov.f32f32 r9.z, r3.w
+mad.f32 r3.z, r4.y, (neg)r3.w, r3.z
+mul.f r3.w, r9.x, r8.x
absneg.f r1.y, (neg)r1.y
+mad.f32 r4.y, r7.x, r9.z, r5.z
+mov.f32f32 r5.z, r5.w
+(ss)mov.f32f32 r8.x, r3.w
+mad.f32 r7.y, r7.x, r9.z, r7.y
+mad.f32 r3.z, r5.w, (neg)r3.w, r3.z
+sel.b32 r3.w, r9.y, r2.y, r8.z
+mad.f32 r4.y, r5.z, r8.x, r4.y
+mad.f32 r5.w, r5.z, r8.x, r7.y
+add.f r3.z, c7.z, (neg)r3.z
+rcp r7.y, r1.y
+nop
+rcp r8.z, r1.y
+mul.f r9.x, r4.y, r4.y
+mul.f r9.y, r5.w, r7.w
+mul.f r10.y, r5.w, r5.z
+mul.f r5.w, r5.w, r7.x
+add.f r9.x, c7.z, (neg)r9.x
+mul.f r9.y, c7.w, r9.y
+mul.f r10.y, c7.w, r10.y
+mul.f r5.w, c7.w, r5.w
+mul.f r9.x, r9.x, c8.x
+add.f r9.y, r10.x, (neg)r9.y
+add.f r10.y, r8.x, (neg)r10.y
+add.f r5.w, r9.z, (neg)r5.w
+add.f r9.x, c7.z, (neg)r9.x
+mov.f32f32 r10.z, r9.y
+add.f r10.w, r0.z, (neg)c1.x
+mov.f32f32 r11.x, r10.y
+mov.f32f32 r11.y, r9.x
+mov.f32f32 r11.z, r10.z
+mul.f r11.w, r10.w, r10.z
+add.f r12.x, r0.x, (neg)c1.y
+mov.f32f32 r12.y, r10.z
+mul.f r12.z, c0.x, r11.z
+mov.f32f32 r12.w, r5.w
+sqrt r11.y, r11.y
+(ss)mad.f32 r4.y, c8.z, r4.y, r11.y
+mad.f32 r5.w, r12.x, r5.w, r11.w
+(ss)add.f r11.y, r2.x, (neg)c1.z
+rcp r11.w, r11.z
+absneg.f r13.x, (neg)r0.z
+mov.f32f32 r13.y, r4.y
+rcp r13.z, r12.y
+absneg.f r13.w, (neg)r0.z
+mad.f32 r5.w, r11.y, r10.y, r5.w
+add.f r10.y, c7.z, r13.x
+mul.f r7.x, r13.y, r7.x
+add.f r14.x, c7.z, r13.w
+mad.f32 r7.x, c8.z, r9.z, (neg)r7.x
+cmps.f.lt r9.x, r9.x, c8.y
+mul.f r5.w, c7.w, r5.w
+(ss)mul.f r9.z, r10.y, r11.w
+rcp r10.y, r10.z
+add.f r11.w, c10.w, r13.x
+cov.u32f32 r9.x, r9.x
+mov.f32f32 r13.x, r5.w
+mul.f r14.y, r10.z, r10.z
+(ss)mul.f r10.y, r11.w, r10.y
+cmps.f.ne r9.x, r9.x, c8.y
+mov.f32f32 r11.w, c8.y
+mad.f32 r14.y, r12.w, r12.w, r14.y
+max.f r9.z, r10.y, r9.z
+mad.f32 r10.y, r11.x, r11.x, r14.y
+sel.b32 r7.x, r11.w, r9.x, r7.x
+mul.f r4.y, r4.y, r7.w
+mov.f32f32 r7.w, r12.w
mad.f32 r4.y, c8.z, r10.x, (neg)r4.y
-mov.f32f32 r9.x, r9.x
-mov.f32f32 r10.x, r6.w
-mov.f32f32 r11.x, r6.w
-mov.f32f32 r11.y, r1.y
-mul.f r11.z, r8.w, r9.x
-mul.f r10.z, r10.z, r7.x
-mul.f r11.w, r8.w, r9.x
-mul.f r12.x, r8.w, (neg)r9.x
-rcp r10.x, r10.x
-mov.f32f32 r12.y, r1.y
-mov.f32f32 r10.z, r10.z
-rcp r11.x, r11.x
+mov.f32f32 r10.x, r7.x
+mov.f32f32 r11.w, c8.y
+mul.f r14.y, c9.y, r10.y
+mul.f r10.w, r10.w, r10.w
+mov.f32f32 r14.z, r7.x
+sel.b32 r4.y, r11.w, r9.x, r4.y
+mad.f32 r10.w, r12.x, r12.x, r10.w
+rcp r11.w, r10.x
+absneg.f r12.x, (neg)r0.x
+add.f r14.w, r0.z, (neg)c1.x
+mad.f32 r10.w, r11.y, r11.y, r10.w
+mov.f32f32 r11.y, c2.x
+add.f r15.x, c10.w, r12.x
+mul.f r15.y, r14.w, r4.y
+add.f r15.z, r0.x, (neg)c1.y
+mul.f r11.y, r11.y, c2.x
+(ss)mul.f r11.w, r15.x, r11.w
+rcp r15.x, r10.x
+add.f r12.x, c7.w, r12.x
+mad.f32 r15.y, r15.z, r7.x, r15.y
+mul.f r5.z, r13.y, r5.z
+add.f r10.w, r10.w, (neg)r11.y
+(ss)mul.f r11.y, r12.x, r15.x
+mad.f32 r5.z, c8.z, r8.x, (neg)r5.z
+mov.f32f32 r8.x, c8.y
+mul.f r10.w, r14.y, r10.w
+max.f r11.y, r11.w, r11.y
+mov.f32f32 r11.w, r4.y
+sel.b32 r5.z, r8.x, r9.x, r5.z
+add.f r8.x, r2.x, (neg)c1.z
+mad.f32 r9.x, r13.x, r13.x, (neg)r10.w
+rcp r10.w, r7.w
nop
-rcp r11.y, r11.y
-mov.f32f32 r12.z, c8.y
-mov.f32f32 r12.w, r1.y
-mad.f32 r11.z, r8.y, r10.z, r11.z
-mad.f32 r11.w, r8.y, r10.z, r11.w
-mad.f32 r12.x, r8.y, (neg)r10.z, r12.x
-rcp r12.y, r12.y
-sel.b32 r2.y, r12.z, r2.y, r4.y
-mov.f32f32 r4.y, r11.z
-mul.f r7.x, r10.w, r7.x
-mov.f32f32 r10.w, r11.w
-mov.f32f32 r11.z, r12.x
-absneg.f r2.y, (neg)r2.y
-mov.f32f32 r7.x, r7.x
-rcp r11.w, r12.w
-add.f r4.z, c7.z, (neg)r4.z
-mov.f32f32 r4.w, r4.w
-mov.f32f32 r12.x, r2.y
-mad.f32 r4.y, r8.z, r7.x, r4.y
-mad.f32 r10.w, r8.z, r7.x, r10.w
-mad.f32 r11.z, r8.z, (neg)r7.x, r11.z
-mov.f32f32 r12.z, r2.y
-(ss)mul.f r12.w, r4.y, r4.y
-mul.f r8.w, r10.w, r8.w
-mul.f r8.z, r10.w, r8.z
-mul.f r8.y, r10.w, r8.y
-add.f r10.w, c7.z, (neg)r12.w
-mov.f32f32 r8.w, r8.w
-mov.f32f32 r8.z, r8.z
-mov.f32f32 r8.y, r8.y
-mov.f32f32 r10.w, r10.w
-mul.f r8.w, c7.w, r8.w
-mul.f r8.z, c7.w, r8.z
-mul.f r8.y, c7.w, r8.y
-mul.f r10.w, r10.w, c8.x
-mov.f32f32 r8.w, r8.w
-mov.f32f32 r8.z, r8.z
-mov.f32f32 r8.y, r8.y
-mov.f32f32 r10.w, r10.w
-add.f r8.w, r9.x, (neg)r8.w
-add.f r8.z, r7.x, (neg)r8.z
-add.f r8.y, r10.z, (neg)r8.y
-add.f r10.w, c7.z, (neg)r10.w
-mov.f32f32 r8.w, r8.w
-mov.f32f32 r8.z, r8.z
-mov.f32f32 r8.y, r8.y
-mov.f32f32 r10.w, r10.w
-mul.f r12.w, r8.w, r8.w
-mov.f32f32 r13.x, r8.w
-mad.f32 r12.w, r8.y, r8.y, r12.w
-mov.f32f32 r13.y, r10.w
-mov.f32f32 r13.z, r8.w
-mov.f32f32 r13.w, r13.x
-mov.f32f32 r12.w, r12.w
-mov.f32f32 r14.x, r13.x
-mov.f32f32 r14.y, r13.z
-mad.f32 r12.w, r8.z, r8.z, r12.w
-sqrt r13.y, r13.y
-(ss)mov.f32f32 r13.y, r13.y
-mov.f32f32 r4.y, r4.y
-rcp r13.w, r13.w
-absneg.f r14.z, (neg)r0.z
-mul.f r14.w, c9.y, r12.w
-add.f r15.x, r0.z, (neg)c1.x
-mad.f32 r4.y, c8.z, r4.y, r13.y
-add.f r13.y, c10.w, r14.z
-rcp r14.y, r14.y
-absneg.f r15.y, (neg)r0.z
-mul.f r15.z, r15.x, r15.x
-mov.f32f32 r4.y, r4.y
-add.f r15.w, r0.x, (neg)c1.y
-(ss)mul.f r13.y, r13.y, r13.w
-(ss)add.f r13.w, c10.w, r15.y
-mul.f r9.w, r4.y, r9.w
-mad.f32 r15.z, r15.w, r15.w, r15.z
-mov.f32f32 r13.y, r13.y
-mov.f32f32 r16.x, r13.x
-mov.f32f32 r9.w, r9.w
-mov.f32f32 r9.x, r9.x
-mov.f32f32 r15.z, r15.z
-add.f r16.y, r3.x, (neg)c1.z
-mul.f r13.w, r13.w, r14.y
-mad.f32 r9.x, c8.z, r9.x, (neg)r9.w
-cmps.f.lt r9.w, r10.w, c8.y
-mad.f32 r10.w, r16.y, r16.y, r15.z
-rcp r14.y, r16.x
-add.f r14.z, c7.z, r14.z
-mov.f32f32 r13.w, r13.w
-cov.u32f32 r9.w, r9.w
-mov.f32f32 r10.w, r10.w
-mov.f32f32 r15.z, c2.x
-mov.f32f32 r14.z, r14.z
-cmps.f.ne r9.w, r9.w, c8.y
-(ss)mov.f32f32 r16.x, c8.y
-mul.f r15.z, r15.z, c2.x
-(ss)mul.f r14.y, r14.z, r14.y
-mov.f32f32 r14.z, r13.z
-sel.b32 r9.x, r16.x, r9.w, r9.x
-add.f r10.w, r10.w, (neg)r15.z
-mov.f32f32 r14.y, r14.y
-mul.f r9.z, r4.y, r9.z
-mul.f r15.z, r9.x, r9.x
-mul.f r4.y, r4.y, r10.y
-mov.f32f32 r10.y, r9.x
-mov.f32f32 r10.w, r10.w
-mov.f32f32 r16.x, r9.x
-mov.f32f32 r4.y, r4.y
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r16.z, r10.y
-mul.f r10.w, r14.w, r10.w
-mov.f32f32 r14.w, r16.x
-mad.f32 r4.y, c8.z, r10.z, (neg)r4.y
-mov.f32f32 r10.z, c8.y
-mov.f32f32 r10.w, r10.w
-mul.f r15.x, r15.x, r8.w
-rcp r16.z, r16.z
-absneg.f r16.w, (neg)r0.z
-sel.b32 r4.y, r10.z, r9.w, r4.y
-mad.f32 r10.z, r15.w, r8.y, r15.x
-rcp r14.w, r14.w
+rcp r12.x, r14.z
+absneg.f r13.x, (neg)r0.x
+absneg.f r13.y, (neg)r0.x
+rcp r14.y, r11.w
absneg.f r15.x, (neg)r0.z
-add.f r15.w, c10.w, r16.w
-mad.f32 r15.z, r4.y, r4.y, r15.z
-mov.f32f32 r10.z, r10.z
-add.f r17.x, c10.w, r15.x
-(ss)mul.f r15.w, r15.w, r16.z
-mov.f32f32 r15.z, r15.z
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r7.x, r7.x
-mov.f32f32 r15.w, r15.w
-(ss)mov.f32f32 r16.z, r10.y
-mad.f32 r10.z, r16.y, r8.z, r10.z
-mad.f32 r7.x, c8.z, r7.x, (neg)r9.z
-mov.f32f32 r9.z, c8.y
+mad.f32 r15.y, r8.x, r5.z, r15.y
+add.f r15.w, c10.w, r13.x
+add.f r16.x, c10.w, r13.y
+add.f r16.y, c7.z, r15.x
+mul.f r15.y, c7.w, r15.y
+sqrt r16.z, r9.x
+(ss)add.f r5.w, (neg)r5.w, (neg)r16.z
+mul.f r10.y, c7.w, r10.y
+mul.f r14.y, r16.y, r14.y
+rcp r16.y, r4.y
+add.f r15.x, c10.w, r15.x
+mov.f32f32 r16.z, r15.y
+mul.f r16.w, r4.y, r4.y
+mul.f r10.w, r15.w, r10.w
+(ss)mul.f r15.x, r15.x, r16.y
+mad.f32 r15.w, r7.x, r7.x, r16.w
+rcp r10.y, r10.y
+(ss)mul.f r5.w, r5.w, r10.y
+(ss)mad.f32 r10.y, r5.z, r5.z, r15.w
+max.f r14.y, r15.x, r14.y
+rcp r15.x, r7.w
+mul.f r12.x, r16.x, r12.x
+rcp r14.z, r14.z
+cmps.f.lt r15.w, c8.y, r5.w
+mul.f r16.x, c9.y, r10.y
+min.f r11.y, r14.y, r11.y
+mov.f32f32 r14.y, r5.z
+mul.f r14.w, r14.w, r14.w
+cov.u32f32 r15.w, r15.w
+mad.f32 r14.w, r15.z, r15.z, r14.w
+add.f r13.x, c7.w, r13.x
+add.f r13.y, c7.w, r13.y
+mad.f32 r8.x, r8.x, r8.x, r14.w
+rcp r14.w, r14.y
+absneg.f r15.z, (neg)r2.x
+mov.f32f32 r16.y, c2.x
+cmps.f.ne r15.w, r15.w, c8.y
+mov.f32f32 r16.w, c8.y
+add.f r17.x, c7.z, r15.z
+mul.f r16.y, r16.y, c2.x
+mov.f32f32 r17.y, c7.z
+(ss)mul.f r13.x, r13.x, r15.x
mul.f r14.w, r17.x, r14.w
-mul.f r10.z, c7.w, r10.z
-max.f r13.y, r13.y, r14.y
-sel.b32 r7.x, r9.z, r9.w, r7.x
-rcp r9.z, r16.z
-add.f r9.w, c7.z, r16.w
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r14.y, r14.w
-mad.f32 r14.w, r7.x, r7.x, r15.z
-mov.f32f32 r9.w, r9.w
-mad.f32 r10.w, r10.z, r10.z, (neg)r10.w
-mov.f32f32 r15.z, r16.x
-mul.f r16.y, c9.y, r14.w
-(ss)add.f r16.z, r0.z, (neg)c1.x
-(ss)mul.f r9.z, r9.w, r9.z
-mov.f32f32 r9.w, r10.w
-mov.f32f32 r10.w, r13.y
-mul.f r13.y, r16.z, r16.z
-add.f r16.w, r0.x, (neg)c1.y
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r17.x, r9.w
-rcp r15.z, r15.z
-add.f r15.x, c7.z, r15.x
-mad.f32 r13.y, r16.w, r16.w, r13.y
-max.f r9.z, r15.w, r9.z
-mov.f32f32 r15.w, r8.y
-mov.f32f32 r15.x, r15.x
-mov.f32f32 r13.y, r13.y
-add.f r17.y, r3.x, (neg)c1.z
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r17.z, r4.y
-sqrt r17.x, r17.x
-(ss)mov.f32f32 r17.x, r17.x
-mad.f32 r13.y, r17.y, r17.y, r13.y
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r17.w, r17.z
-mul.f r15.x, r15.x, r15.z
-mov.f32f32 r13.y, r13.y
-mov.f32f32 r15.z, c2.x
-add.f r10.z, (neg)r10.z, (neg)r17.x
-mov.f32f32 r15.x, r15.x
-mov.f32f32 r17.x, r15.w
-mul.f r15.z, r15.z, c2.x
-rcp r17.w, r17.w
-absneg.f r18.x, (neg)r0.x
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r12.w, r12.w
-add.f r13.y, r13.y, (neg)r15.z
-add.f r15.z, c10.w, r18.x
-max.f r14.y, r14.y, r15.x
-mul.f r12.w, c7.w, r12.w
-mov.f32f32 r13.y, r13.y
-(ss)mul.f r15.x, r15.z, r17.w
-mov.f32f32 r14.y, r14.y
-mov.f32f32 r15.z, r4.y
-mul.f r13.y, r16.y, r13.y
-mov.f32f32 r15.x, r15.x
-mov.f32f32 r16.y, r17.z
-mov.f32f32 r12.w, r12.w
-mov.f32f32 r13.y, r13.y
-mul.f r16.z, r16.z, r9.x
-(ss)mov.f32f32 r17.w, r15.z
-mad.f32 r16.z, r16.w, r4.y, r16.z
-rcp r16.w, r17.x
-(ss)absneg.f r17.x, (neg)r0.x
-rcp r16.y, r16.y
-add.f r18.x, c7.w, r18.x
-rcp r12.w, r12.w
-(ss)mov.f32f32 r12.w, r12.w
-mov.f32f32 r16.z, r16.z
-add.f r18.y, c10.w, r17.x
-mad.f32 r16.z, r17.y, r7.x, r16.z
-mov.f32f32 r17.y, r18.x
-mul.f r10.z, r10.z, r12.w
-rcp r12.w, r17.w
-(ss)absneg.f r17.w, (neg)r0.x
-mul.f r16.z, c7.w, r16.z
-mul.f r16.y, r17.y, r16.y
-mov.f32f32 r10.z, r10.z
-add.f r17.y, c10.w, r17.w
-mov.f32f32 r16.z, r16.z
-mov.f32f32 r16.y, r16.y
-cmps.f.lt r18.x, c8.y, r10.z
-(ss)mul.f r12.w, r17.y, r12.w
-mad.f32 r13.y, r16.z, r16.z, (neg)r13.y
-max.f r15.x, r15.x, r16.y
-cov.u32f32 r16.y, r18.x
-mov.f32f32 r12.w, r12.w
-mov.f32f32 r13.y, r13.y
-mov.f32f32 r15.x, r15.x
+rcp r15.x, r5.z
+add.f r15.z, c10.w, r15.z
+add.f r8.x, r8.x, (neg)r16.y
+sel.b32 r16.y, r16.w, r15.w, r17.y
+mov.f32f32 r9.x, r9.x
+(ss)mul.f r15.x, r15.z, r15.x
+mul.f r8.x, r16.x, r8.x
+max.f r10.w, r10.w, r13.x
+mul.f r13.x, r13.y, r14.z
+max.f r13.y, r15.x, r14.w
+mad.f32 r8.x, r16.z, r16.z, (neg)r8.x
+(ss)cmps.f.lt r14.z, c8.y, r9.x
+min.f r9.z, r9.z, r10.w
+min.f r10.w, r11.y, r13.y
+mov.f32f32 r11.y, r11.x
+max.f r12.x, r12.x, r13.x
+mov.f32f32 r13.x, r4.y
+mov.f32f32 r13.y, r10.w
+sqrt r14.w, r8.x
+(ss)add.f r14.w, (neg)r15.y, (neg)r14.w
+mul.f r10.y, c7.w, r10.y
+cov.u32f32 r14.z, r14.z
+mad.f32 r15.x, r11.w, r13.y, r0.z
+rcp r15.y, r11.y
+absneg.f r15.z, (neg)r2.x
+rcp r16.x, r13.x
+absneg.f r16.z, (neg)r0.z
+cmps.f.ne r14.z, r14.z, c8.y
+mov.f32f32 r16.w, r15.x
+rcp r10.y, r10.y
+(ss)mul.f r10.y, r14.w, r10.y
+add.f r14.w, c7.z, r15.z
+sel.b32 r16.y, r16.y, r14.z, r17.y
+mov.f32f32 r17.x, r16.w
+cmps.f.lt r17.y, c8.y, r10.y
+mul.f r14.w, r14.w, r15.y
+add.f r15.y, c7.z, r16.z
+add.f r17.x, c7.z, (neg)r17.x
+cov.u32f32 r17.y, r17.y
cmps.f.ne r16.y, r16.y, c8.y
-mov.f32f32 r17.y, c8.y
-mov.f32f32 r18.x, r13.y
-min.f r9.z, r9.z, r15.x
-mov.f32f32 r15.x, r7.x
-mov.f32f32 r18.z, c7.z
-mov.f32f32 r18.w, r15.z
-mul.f r16.w, r18.y, r16.w
-mov.f32f32 r18.y, r15.x
-sqrt r18.x, r18.x
-(ss)mov.f32f32 r18.x, r18.x
-mov.f32f32 r16.z, r16.z
-sel.b32 r17.y, r17.y, r16.y, r18.z
-cmps.f.lt r19.x, c8.y, r9.w
-rcp r18.w, r18.w
-add.f r17.w, c7.w, r17.w
-add.f r16.z, (neg)r16.z, (neg)r18.x
-rcp r18.x, r18.y
-(ss)absneg.f r18.y, (neg)r3.x
-cov.u32f32 r19.x, r19.x
-mov.f32f32 r17.w, r17.w
-mov.f32f32 r16.z, r16.z
-mov.f32f32 r14.w, r14.w
-add.f r19.y, c10.w, r18.y
-cmps.f.ne r19.x, r19.x, c8.y
-(ss)mul.f r17.w, r17.w, r18.w
-mul.f r14.w, c7.w, r14.w
-mul.f r18.x, r19.y, r18.x
-sel.b32 r17.y, r17.y, r19.x, r18.z
-mov.f32f32 r17.w, r17.w
-mov.f32f32 r14.w, r14.w
-mov.f32f32 r18.x, r18.x
-mov.f32f32 r18.z, r15.x
+mov.f32f32 r5.w, r5.w
+mul.f r6.x, r17.x, r6.x
+add.f r17.x, c10.w, (neg)r16.w
cmps.f.ne r17.y, r17.y, c8.y
-mov.f32f32 r18.w, r10.z
-max.f r12.w, r12.w, r17.w
-mov.f32f32 r16.w, r16.w
-rcp r14.w, r14.w
-(ss)mov.f32f32 r14.w, r14.w
-mov.f32f32 r17.w, r18.w
-rcp r18.z, r18.z
-add.f r18.y, c7.z, r18.y
-mov.f32f32 r12.w, r12.w
-mul.f r14.w, r16.z, r14.w
-mov.f32f32 r16.z, r17.w
-mov.f32f32 r17.w, r18.y
-min.f r12.w, r14.y, r12.w
-mov.f32f32 r14.y, r14.w
-sel.b32 r10.z, r16.z, r16.y, r10.z
-(ss)mul.f r14.w, r17.w, r18.z
-mov.f32f32 r16.y, r7.x
-cmps.f.lt r16.z, c8.y, r14.y
-sel.b32 r9.w, r10.z, r19.x, r9.w
-mov.f32f32 r10.z, c9.z
-mov.f32f32 r14.w, r14.w
-cov.u32f32 r16.z, r16.z
-mov.f32f32 r17.w, r16.y
-sel.b32 r9.w, r10.z, r17.y, r9.w
-max.f r10.z, r18.x, r14.w
-cmps.f.ne r14.w, r16.z, c8.y
-mov.f32f32 r16.z, c8.y
-mov.f32f32 r17.y, c7.z
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r18.x, r9.w
-mov.f32f32 r8.w, r8.w
-sel.b32 r16.z, r16.z, r14.w, r17.y
-cmps.f.lt r18.y, c8.y, r13.y
-min.f r9.z, r9.z, r10.z
-mad.f32 r8.w, r8.w, r18.x, r0.z
-rcp r10.z, r17.w
-(ss)absneg.f r17.w, (neg)r3.x
-cov.u32f32 r18.x, r18.y
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r18.y, r10.y
-absneg.f r18.z, (abs)r8.w
-cmps.f.ne r18.x, r18.x, c8.y
-mov.f32f32 r18.w, c7.z
-mad.f32 r18.y, r18.y, r9.z, r0.z
-add.f r19.x, c10.w, r17.w
-sel.b32 r16.z, r16.z, r18.x, r17.y
-add.f r17.y, r18.w, c2.x
-mov.f32f32 r18.y, r18.y
-(ss)mul.f r10.z, r19.x, r10.z
-cmps.f.ne r16.z, r16.z, c8.y
-mov.f32f32 r18.w, r14.y
-mov.f32f32 r19.x, r18.y
-add.f r18.z, r17.y, (neg)r18.z
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r18.w, r18.w
-mov.f32f32 r19.y, r19.x
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r19.z, c2.x
-mov.f32f32 r18.w, r18.w
-add.f r19.y, c10.w, (neg)r19.y
-mov.f32f32 r19.w, r16.y
-mov.f32f32 r20.x, r18.y
-sel.b32 r14.y, r18.w, r14.w, r14.y
-mul.f r7.y, r19.y, r7.y
-rcp r14.w, r19.z
-(ss)mul.f r18.z, r18.z, r14.w
-add.f r18.w, r20.x, (neg)c1.x
-sel.b32 r13.y, r14.y, r18.x, r13.y
-mov.f32f32 r14.y, c9.z
-mov.f32f32 r7.y, r7.y
-mov.f32f32 r18.x, r19.x
-mov.f32f32 r18.z, r18.z
-sel.b32 r13.y, r14.y, r16.z, r13.y
-rcp r14.y, r19.w
-add.f r16.z, c7.z, r17.w
-add.f r17.w, c7.z, (neg)r18.x
-mul.f r18.x, r18.w, r18.w
-mov.f32f32 r18.w, r13.y
-mov.f32f32 r9.x, r9.x
-mul.f r8.x, r17.w, r8.x
-log2 r17.w, r18.z
-(ss)mul.f r17.w, c9.x, r17.w
-mov.f32f32 r16.z, r16.z
-mad.f32 r9.x, r9.x, r18.w, r0.z
+mov.f32f32 r17.z, c8.y
+mov.f32f32 r17.w, c7.z
+mul.f r6.y, r17.x, r6.y
+sel.b32 r5.w, r5.w, r15.w, r5.w
+rcp r15.w, r11.x
+mul.f r15.y, r15.y, r16.x
+sel.b32 r16.x, r17.z, r17.y, r17.w
+max.f r17.x, r6.y, r6.x
+mad.f32 r10.w, r7.x, r10.w, r0.x
mov.f32f32 r8.x, r8.x
-mov.f32f32 r17.w, r17.w
-mul.f r14.y, r16.z, r14.y
-absneg.f r16.z, (abs)r9.x
-(ss)mov.f32f32 r18.z, c7.z
-max.f r18.w, r7.y, r8.x
-mov.f32f32 r14.y, r14.y
-mov.f32f32 r19.x, r13.y
-add.f r18.z, r18.z, c2.x
-mov.f32f32 r18.w, r18.w
-mov.f32f32 r19.y, r17.z
-exp2 r17.w, r17.w
+sel.b32 r5.w, r5.w, r14.z, r9.x
+mov.f32f32 r9.x, c9.z
+mov.f32f32 r14.z, r10.w
+cmps.f.lt r17.z, c8.y, r8.x
+add.f r15.z, c10.w, r15.z
+rcp r18.x, r4.y
+sel.b32 r5.w, r9.x, r16.y, r5.w
+mov.f32f32 r9.x, r14.z
+cov.u32f32 r16.y, r17.z
+(ss)mul.f r15.z, r15.z, r15.w
+add.f r15.w, c10.w, r16.z
+add.f r16.z, c7.w, (neg)r9.x
+cmps.f.ne r16.y, r16.y, c8.y
+mad.f32 r9.y, r9.y, r5.w, r0.z
+max.f r14.w, r15.z, r14.w
+mul.f r5.x, r16.z, r5.x
+add.f r15.z, c10.w, (neg)r14.z
+sel.b32 r16.x, r16.x, r16.y, r17.w
+absneg.f r16.z, (abs)r9.y
+mov.f32f32 r17.z, c7.z
+mul.f r5.y, r15.z, r5.y
+cmps.f.ne r15.z, r16.x, c8.y
+mov.f32f32 r10.y, r10.y
+add.f r16.x, r17.z, c2.x
+max.f r17.z, r5.y, r5.x
+min.f r9.z, r9.z, r14.w
+mul.f r14.w, r15.w, r18.x
+sel.b32 r10.y, r10.y, r17.y, r10.y
+min.f r15.w, r17.x, r17.z
+mad.f32 r13.y, r14.y, r13.y, r2.x
+add.f r16.z, r16.x, (neg)r16.z
+sel.b32 r8.x, r10.y, r16.y, r8.x
+mov.f32f32 r10.y, c2.x
+mov.f32f32 r16.y, r13.y
+mov.f32f32 r17.x, c9.z
+mov.f32f32 r17.y, r9.z
+max.f r14.w, r14.w, r15.y
+mov.f32f32 r15.y, r16.y
+sel.b32 r8.x, r17.x, r15.z, r8.x
+rcp r10.y, r10.y
+(ss)mul.f r15.z, r16.z, r10.y
+mad.f32 r16.z, r11.z, r17.y, r0.z
+add.f r15.y, c7.z, (neg)r15.y
+absneg.f r1.z, (neg)r1.z
+(ss)mad.f32 r4.y, r4.y, r8.x, r0.z
+mov.f32f32 r17.x, r16.z
+min.f r12.x, r14.w, r12.x
+mov.f32f32 r14.w, r5.z
+absneg.f r17.z, (abs)r4.y
+log2 r15.z, r15.z
+mov.f32f32 r17.w, c7.z
+rcp r18.x, r1.z
+(ss)mul.f r15.y, r15.y, r18.x
+add.f r18.x, c10.w, (neg)r16.y
+rcp r18.y, r1.z
+(ss)mul.f r15.z, c9.x, r15.z
+add.f r17.w, r17.w, c2.x
+mov.f32f32 r18.z, r17.x
+(ss)mul.f r18.x, r18.x, r18.y
+rcp r18.y, r14.w
+absneg.f r18.w, (neg)r2.x
+add.f r17.z, r17.w, (neg)r17.z
+mov.f32f32 r19.x, c2.x
+max.f r19.y, r18.x, r15.y
+exp2 r15.z, r15.z
nop
-(ss)rcp r17.w, r17.w
-add.f r16.z, r18.z, (neg)r16.z
-(ss)mov.f32f32 r17.w, r17.w
-mad.f32 r19.y, r19.y, r9.z, r0.x
-max.f r10.z, r10.z, r14.y
-mov.f32f32 r14.y, r16.z
-mov.f32f32 r16.z, c2.x
-mov.f32f32 r19.y, r19.y
-mul.f r17.w, c9.w, r17.w
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r19.z, r4.y
-mov.f32f32 r19.w, r19.y
-mov.f32f32 r17.w, r17.w
-rcp r16.z, r16.z
-(ss)mul.f r14.y, r14.y, r16.z
-min.f r10.z, r12.w, r10.z
-mov.f32f32 r12.w, r19.w
-add.f r17.w, c7.z, (neg)r17.w
-mov.f32f32 r14.y, r14.y
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r16.x, r16.x
-add.f r12.w, c10.w, (neg)r12.w
-mov.f32f32 r17.w, r17.w
-mad.f32 r19.x, r19.z, r19.x, r0.x
-mad.f32 r16.x, r16.x, r10.z, r0.z
-log2 r14.y, r14.y
-(ss)mul.f r14.y, c9.x, r14.y
-mul.f r5.y, r12.w, r5.y
-mul.f r12.w, c7.x, r17.w
-mul.f r19.z, c7.x, r17.w
-mov.f32f32 r14.y, r14.y
+(ss)rcp r15.z, r15.z
+(ss)mul.f r15.z, c9.w, r15.z
+add.f r18.z, c7.z, (neg)r18.z
+min.f r15.w, r15.w, r19.y
+absneg.f r3.w, (neg)r3.w
+add.f r19.y, c7.z, r18.w
+rcp r19.x, r19.x
+(ss)mul.f r17.z, r17.z, r19.x
+mov.f32f32 r19.z, r15.w
+mov.f32f32 r6.x, r6.x
+mov.f32f32 r6.y, r6.y
+add.f r15.z, c7.z, (neg)r15.z
+rcp r19.w, r3.w
+mul.f r18.y, r19.y, r18.y
+(ss)mul.f r18.z, r18.z, r19.w
+min.f r6.x, r6.y, r6.x
+mov.f32f32 r5.x, r5.x
mov.f32f32 r5.y, r5.y
-mov.f32f32 r20.x, r19.w
-mov.f32f32 r12.w, r12.w
-mov.f32f32 r19.z, r19.z
-mul.f r17.w, c7.x, r17.w
-add.f r20.x, c7.w, (neg)r20.x
-exp2 r14.y, r14.y
+log2 r6.y, r17.z
+(ss)mul.f r6.y, c9.x, r6.y
+(ss)mov.f32f32 r17.z, r15.z
+add.f r19.y, c10.w, (neg)r17.x
+min.f r5.x, r5.y, r5.x
+rcp r5.y, r3.w
nop
-(ss)rcp r14.y, r14.y
-(ss)mov.f32f32 r14.y, r14.y
-mov.f32f32 r20.y, r9.w
-mov.f32f32 r20.z, r8.z
-mov.f32f32 r17.w, r17.w
-mul.f r14.y, c9.w, r14.y
-mul.f r6.z, r20.x, r6.z
-mad.f32 r20.x, r20.z, r20.y, r3.x
-mov.f32f32 r16.x, r16.x
-mov.f32f32 r14.y, r14.y
-mov.f32f32 r6.z, r6.z
-absneg.f r20.y, (abs)r20.x
-mov.f32f32 r20.z, r16.x
-add.f r14.y, c7.z, (neg)r14.y
-max.f r20.w, r5.y, r6.z
-add.f r17.y, r17.y, (neg)r20.y
-add.f r20.y, c10.w, (neg)r20.z
-mov.f32f32 r14.y, r14.y
-mov.f32f32 r20.z, r20.w
-mov.f32f32 r17.y, r17.y
-mul.f r9.y, r20.y, r9.y
-mul.f r20.y, c7.x, r14.y
-mul.f r20.w, c7.x, r14.y
-mul.f r14.y, c7.x, r14.y
-min.f r18.w, r18.w, r20.z
-mov.f32f32 r20.y, r20.y
-mov.f32f32 r20.z, r13.y
-mov.f32f32 r7.x, r7.x
-mov.f32f32 r20.w, r20.w
-mov.f32f32 r14.y, r14.y
-mov.f32f32 r21.x, r15.x
-mad.f32 r7.x, r7.x, r20.z, r3.x
-mul.f r17.y, r17.y, r14.w
-mov.f32f32 r9.y, r9.y
-mov.f32f32 r20.z, r16.x
-absneg.f r21.y, (abs)r7.x
-mad.f32 r9.z, r21.x, r9.z, r3.x
-mov.f32f32 r17.y, r17.y
-add.f r20.z, c7.z, (neg)r20.z
-add.f r18.z, r18.z, (neg)r21.y
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r21.x, r19.x
-mul.f r0.y, r20.z, r0.y
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r20.z, r9.z
-log2 r17.y, r17.y
-(ss)mul.f r17.y, c9.x, r17.y
-mov.f32f32 r0.y, r0.y
-mul.f r18.z, r18.z, r16.z
-mov.f32f32 r21.y, r20.z
-mov.f32f32 r17.y, r17.y
-max.f r21.z, r9.y, r0.y
-mov.f32f32 r18.z, r18.z
-add.f r21.y, c10.w, (neg)r21.y
-add.f r4.w, c7.z, (neg)r4.w
-mov.f32f32 r21.z, r21.z
-mov.f32f32 r15.z, r15.z
-exp2 r17.y, r17.y
+rcp r19.w, r5.z
+mul.f r20.x, c7.x, r17.z
+mul.f r17.z, c7.x, r17.z
+max.f r5.x, r6.x, r5.x
+mov.f32f32 r6.x, r15.y
+mov.f32f32 r15.y, r18.x
+exp2 r6.y, r6.y
nop
-(ss)rcp r17.y, r17.y
-mul.f r5.w, r21.y, r5.w
-log2 r18.z, r18.z
-(ss)mul.f r18.z, c9.x, r18.z
-mov.f32f32 r17.y, r17.y
-mad.f32 r15.z, r15.z, r10.z, r0.x
-mov.f32f32 r5.w, r5.w
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r20.z, r20.z
-mul.f r17.y, c9.w, r17.y
-mov.f32f32 r15.z, r15.z
-mov.f32f32 r4.w, r4.w
-add.f r20.z, c7.z, (neg)r20.z
-mov.f32f32 r17.y, r17.y
-exp2 r18.z, r18.z
+(ss)rcp r6.y, r6.y
+(ss)mul.f r6.y, c9.w, r6.y
+mad.f32 r18.x, r11.x, r5.w, r2.x
+min.f r6.x, r15.y, r6.x
+mul.f r5.y, r19.y, r5.y
+add.f r15.y, c10.w, r18.w
+add.f r6.y, c7.z, (neg)r6.y
+max.f r5.x, r5.x, r6.x
+absneg.f r6.x, (abs)r18.x
+max.f r18.w, r5.y, r18.z
+mul.f r15.y, r15.y, r19.w
+add.f r5.x, r19.z, (neg)r5.x
+mov.f32f32 r19.y, r6.y
+mul.f r6.y, c7.x, r6.y
+add.f r6.x, r16.x, (neg)r6.x
+mad.f32 r5.x, c11.w, r5.x, c7.z
+mul.f r16.x, c7.x, r19.y
+mul.f r19.y, c7.x, r19.y
+mad.f32 r5.z, r5.z, r8.x, r2.x
+mul.f r6.x, r6.x, r10.y
+mad.f32 r9.z, r12.w, r9.z, r0.x
+max.f r15.y, r15.y, r18.y
+rcp r5.x, r5.x
+mad.f32 r9.x, r0.w, r15.w, r9.x
+absneg.f r15.w, (abs)r5.z
+mov.f32f32 r18.y, r9.z
+min.f r12.x, r12.x, r15.y
+add.f r9.x, r9.x, c11.z
+add.f r15.y, r17.w, (neg)r15.w
+log2 r6.x, r6.x
+(ss)mul.f r6.x, c9.x, r6.x
+mov.f32f32 r15.w, r18.y
+mul.f r9.x, c11.y, r9.x
+mul.f r15.y, r15.y, r19.x
+mov.f32f32 r17.w, r12.x
+add.f r19.z, c7.w, (neg)r15.w
+mul.f r5.x, r9.x, r5.x
+exp2 r6.x, r6.x
nop
-(ss)rcp r18.z, r18.z
-(ss)mov.f32f32 r18.z, r18.z
-mul.f r5.z, r20.z, r5.z
-add.f r17.y, c7.z, (neg)r17.y
-mov.f32f32 r20.z, r15.z
-mul.f r18.z, c9.w, r18.z
-mov.f32f32 r5.z, r5.z
-mov.f32f32 r17.y, r17.y
-add.f r20.z, c10.w, (neg)r20.z
-mov.f32f32 r18.z, r18.z
-max.f r21.y, r5.w, r5.z
-mul.f r12.w, r12.w, r17.y
-mul.f r19.z, r19.z, r17.y
-add.f r18.z, c7.z, (neg)r18.z
-mov.f32f32 r21.y, r21.y
-mov.f32f32 r12.w, r12.w
-mov.f32f32 r19.z, r19.z
-mov.f32f32 r18.z, r18.z
+(ss)rcp r6.x, r6.x
+mad.f32 r9.x, r13.x, r17.w, r0.z
+(ss)mul.f r6.x, c9.w, r6.x
+log2 r13.x, r15.y
+(ss)mul.f r13.x, c9.x, r13.x
+mul.f r7.y, r19.z, r7.y
+(ss)mov.f32f32 r15.y, r9.x
+exp2 r5.x, r5.x
+(ss)add.f r5.x, c7.z, r5.x
+add.f r6.x, c7.z, (neg)r6.x
+add.f r19.z, c10.w, (neg)r18.y
+add.f r19.w, c10.w, (neg)r15.y
+exp2 r13.x, r13.x
+mad.f32 r20.y, r7.x, r8.x, r0.x
+(ss)rcp r13.x, r13.x
+(ss)mul.f r13.x, c9.w, r13.x
+mov.f32f32 r20.z, r6.x
+rcp r5.x, r5.x
+absneg.f r20.w, (abs)r16.y
+mul.f r8.z, r19.z, r8.z
+mul.f r8.y, r19.w, r8.y
+add.f r19.z, c7.z, (neg)r15.y
+cmps.f.lt r19.w, c11.x, r20.w
+add.f r13.x, c7.z, (neg)r13.x
+mul.f r20.x, r20.x, r20.z
+mul.f r17.z, r17.z, r20.z
+cov.u32f32 r19.w, r19.w
+mov.f32f32 r20.z, r13.x
+mul.f r6.y, r6.y, r13.x
+mad.f32 r13.x, r12.w, r5.w, r0.x
+cmps.f.ne r19.w, r19.w, c8.y
+mov.f32f32 r20.w, c8.y
+mov.f32f32 r21.x, c10.x
+mul.f r16.x, r16.x, r20.z
+mul.f r19.y, r19.y, r20.z
+add.f r20.z, r20.y, c7.z
+sel.b32 r20.w, r20.w, r19.w, r21.x
+absneg.f r15.x, (abs)r15.x
+add.f r21.x, r13.x, c7.z
+add.f r20.z, r20.z, c2.x
+max.f r21.y, r8.z, r7.y
+cmps.f.lt r15.x, c11.x, r15.x
+add.f r21.x, r21.x, c2.x
+mul.f r20.z, r20.z, r19.x
min.f r18.w, r18.w, r21.y
-mov.f32f32 r21.y, r9.w
-mov.f32f32 r21.w, r8.y
-mul.f r20.y, r20.y, r18.z
-mul.f r20.w, r20.w, r18.z
-mul.f r14.y, r14.y, r18.z
-mov.f32f32 r18.z, r18.w
-mov.f32f32 r18.w, r20.y
-add.f r20.y, r19.x, c7.z
-mov.f32f32 r20.w, r20.w
-mov.f32f32 r14.y, r14.y
-mov.f32f32 r19.w, r19.w
-add.f r20.y, r20.y, c2.x
-mov.f32f32 r22.x, r0.w
-mad.f32 r21.y, r21.w, r21.y, r0.x
-mul.f r17.y, r17.w, r17.y
-mov.f32f32 r17.w, r20.y
-mad.f32 r19.w, r22.x, r18.z, r19.w
-add.f r20.y, r21.y, c7.z
-mov.f32f32 r17.y, r17.y
-mul.f r17.w, r17.w, r16.z
-mov.f32f32 r19.w, r19.w
-add.f r20.y, r20.y, c2.x
-mul.f r7.w, r20.z, r7.w
-mov.f32f32 r17.w, r17.w
-add.f r19.w, r19.w, c11.z
-mov.f32f32 r20.y, r20.y
-mov.f32f32 r7.w, r7.w
-mov.f32f32 r20.z, r15.z
-mov.f32f32 r19.w, r19.w
-mul.f r20.y, r20.y, r14.w
-log2 r17.w, r17.w
-(ss)mul.f r17.w, c9.x, r17.w
-add.f r20.z, c7.w, (neg)r20.z
-mul.f r19.w, c11.y, r19.w
-mov.f32f32 r20.y, r20.y
-mov.f32f32 r17.w, r17.w
-mul.f r6.y, r20.z, r6.y
-mov.f32f32 r19.w, r19.w
-min.f r7.y, r7.y, r8.x
-mov.f32f32 r8.x, r4.w
-min.f r5.y, r5.y, r6.z
-mov.f32f32 r6.y, r6.y
-exp2 r6.z, r17.w
+cov.u32f32 r15.x, r15.x
+mul.f r21.x, r21.x, r10.y
+mad.f32 r17.y, r11.y, r17.y, r2.x
+mul.f r4.z, r19.z, r4.z
+cmps.f.ne r15.x, r15.x, c8.y
+absneg.f r19.z, (neg)r16.w
+log2 r20.z, r20.z
+(ss)mul.f r20.z, c9.x, r20.z
+mov.f32f32 r21.y, r17.y
+log2 r21.x, r21.x
+(ss)mul.f r21.x, c9.x, r21.x
+sel.b32 r19.z, r19.z, r15.x, r20.w
+max.f r20.w, r8.y, r4.z
+mad.f32 r12.x, r7.x, r12.x, r0.x
+mov.f32f32 r21.z, r21.y
+mul.f r19.z, r2.w, r19.z
+mov.f32f32 r21.w, c8.y
+mov.f32f32 r22.x, c10.y
+exp2 r20.z, r20.z
nop
-(ss)rcp r6.z, r6.z
-(ss)mov.f32f32 r6.z, r6.z
-max.f r5.y, r7.y, r5.y
-min.f r5.z, r5.w, r5.z
-log2 r5.w, r20.y
-(ss)mul.f r5.w, c9.x, r5.w
-mul.f r6.z, c9.w, r6.z
-max.f r7.y, r7.w, r6.y
-max.f r5.y, r5.y, r5.z
-mov.f32f32 r5.z, r5.w
-mov.f32f32 r5.w, r6.z
-mov.f32f32 r6.z, r7.y
-mov.f32f32 r5.y, r5.y
-sqrt r7.y, r8.x
-(ss)mov.f32f32 r7.y, r7.y
-add.f r5.w, c7.z, (neg)r5.w
-min.f r6.z, r21.z, r6.z
-(ss)mov.f32f32 r8.x, r16.y
-add.f r5.y, r18.z, (neg)r5.y
-mov.f32f32 r5.w, r5.w
-exp2 r5.z, r5.z
+(ss)rcp r20.z, r20.z
+(ss)mul.f r20.z, c9.w, r20.z
+exp2 r21.x, r21.x
nop
-(ss)rcp r5.z, r5.z
-(ss)mov.f32f32 r5.z, r5.z
-mov.f32f32 r5.y, r5.y
-mul.f r16.y, r18.w, r5.w
-mul.f r17.w, r20.w, r5.w
-mul.f r5.w, r14.y, r5.w
-mad.f32 r5.y, c11.w, r5.y, c7.z
-mov.f32f32 r14.y, r16.y
-mov.f32f32 r16.y, r3.w
-mov.f32f32 r17.w, r17.w
-mov.f32f32 r5.w, r5.w
-mov.f32f32 r5.y, r5.y
-mad.f32 r7.y, c8.z, r16.y, r7.y
-mul.f r5.z, c9.w, r5.z
-mad.f32 r8.x, r8.x, r10.z, r3.x
-mov.f32f32 r10.z, r19.y
-mov.f32f32 r7.y, r7.y
-mov.f32f32 r5.z, r5.z
-rcp r5.y, r5.y
-(ss)mov.f32f32 r5.y, r5.y
-mov.f32f32 r8.x, r8.x
-mul.f r16.y, r7.y, c10.x
-add.f r5.z, c7.z, (neg)r5.z
-mul.f r5.y, r19.w, r5.y
-mov.f32f32 r18.z, r8.x
-mov.f32f32 r16.y, r16.y
-absneg.f r18.w, (neg)c0.x
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r5.z, r5.z
-add.f r18.z, c10.w, (neg)r18.z
-mov.f32f32 r18.w, r18.w
-add.f r10.z, r10.z, (neg)c1.y
-mul.f r17.y, r17.y, r5.z
-add.f r19.w, r9.x, (neg)c1.x
-mad.f32 r16.y, c8.z, r18.w, (neg)r16.y
-cmps.f.lt r4.w, r4.w, c8.y
-exp2 r5.y, r5.y
-(ss)mov.f32f32 r5.y, r5.y
-mul.f r12.w, r12.w, r5.z
-mul.f r5.z, r19.z, r5.z
-cov.u32f32 r4.w, r4.w
-add.f r5.y, c7.z, r5.y
-mov.f32f32 r12.w, r12.w
-mov.f32f32 r5.z, r5.z
-cmps.f.ne r4.w, r4.w, c8.y
-mov.f32f32 r18.w, c8.y
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r19.z, r21.y
-mov.f32f32 r5.x, r5.x
-sel.b32 r16.y, r18.w, r4.w, r16.y
-mov.f32f32 r17.y, r17.y
-mul.f r3.y, r18.z, r3.y
-mul.f r5.x, r5.x, c8.x
-mov.f32f32 r18.z, r16.y
-rcp r5.y, r5.y
-(ss)mov.f32f32 r5.y, r5.y
-mov.f32f32 r18.w, r9.z
-mov.f32f32 r5.x, r5.x
-mul.f r18.z, r21.x, r18.z
-mul.f r20.y, r7.y, c10.y
-mov.f32f32 r20.z, r18.w
-add.f r5.x, c7.z, (neg)r5.x
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r20.y, r20.y
-mov.f32f32 r3.w, r3.w
-absneg.f r20.z, (abs)r20.z
-mov.f32f32 r5.x, r5.x
-mov.f32f32 r20.w, r8.x
-mad.f32 r3.w, c8.z, r3.w, (neg)r20.y
-mov.f32f32 r20.y, c8.y
-cmps.f.lt r20.z, c11.x, r20.z
-mov.f32f32 r21.x, r5.x
-add.f r20.w, c7.z, (neg)r20.w
-sel.b32 r3.w, r20.y, r4.w, r3.w
-cov.u32f32 r20.y, r20.z
-mad.f32 r10.z, r10.z, r10.z, r18.x
-mul.f r18.x, r19.w, r16.z
-mov.f32f32 r19.w, r3.w
-mov.f32f32 r20.y, r20.y
-sqrt r20.z, r21.x
-(ss)mov.f32f32 r20.z, r20.z
-(ss)mov.f32f32 r21.x, r4.x
-mul.f r1.z, r20.w, r1.z
-cmps.f.ne r20.y, r20.y, c8.y
-mov.f32f32 r20.w, c8.y
-rcp r19.w, r19.w
-(ss)mul.f r18.z, r18.z, r19.w
-mad.f32 r20.z, c8.z, r21.x, r20.z
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r20.w, r20.w
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r21.x, r9.x
-mov.f32f32 r21.z, c10.x
-mov.f32f32 r20.z, r20.z
-max.f r21.w, r3.y, r1.z
-add.f r18.z, r21.x, (neg)r18.z
-sel.b32 r20.w, r20.w, r20.y, r21.z
-mov.f32f32 r21.x, r18.y
-mul.f r21.z, r20.z, c10.x
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r21.w, r21.w
-absneg.f r21.x, (abs)r21.x
-mov.f32f32 r21.z, r21.z
-mad.f32 r18.z, c10.z, r18.z, c7.x
-absneg.f r22.x, (neg)c0.x
-cmps.f.lt r21.x, c11.x, r21.x
-min.f r6.z, r6.z, r21.w
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r21.w, r22.x
-cov.u32f32 r21.x, r21.x
-mov.f32f32 r6.z, r6.z
-mov.f32f32 r18.z, r18.z
-mad.f32 r21.z, c8.z, r21.w, (neg)r21.z
-cmps.f.lt r5.x, r5.x, c8.y
-mov.f32f32 r21.x, r21.x
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r21.w, r15.z
-mov.f32f32 r22.x, r1.x
-cmps.f.ne r21.x, r21.x, c8.y
-mov.f32f32 r22.y, r18.z
-mov.f32f32 r18.z, r19.x
-mul.f r7.y, r7.y, c10.x
-mov.f32f32 r22.z, r18.y
-cov.u32f32 r5.x, r5.x
-mad.f32 r21.w, r22.x, r6.z, r21.w
-mov.f32f32 r7.y, r7.y
-absneg.f r22.x, (neg)c0.z
-mov.f32f32 r22.z, r22.z
-cmps.f.ne r5.x, r5.x, c8.y
-mov.f32f32 r22.w, c8.y
-mov.f32f32 r22.x, r22.x
-absneg.f r22.z, (neg)r22.z
-mov.f32f32 r21.w, r21.w
-sel.b32 r21.z, r22.w, r5.x, r21.z
-mad.f32 r7.y, c8.z, r22.x, (neg)r7.y
+(ss)rcp r21.x, r21.x
+sel.b32 r21.w, r21.w, r19.w, r22.x
mov.f32f32 r22.x, c8.y
-mov.f32f32 r22.z, r22.z
-mov.f32f32 r22.w, r21.z
-add.f r21.w, r21.w, c11.z
-sel.b32 r4.w, r22.x, r4.w, r7.y
-mov.f32f32 r7.y, r22.z
-mul.f r19.z, r19.z, r22.w
-mul.f r22.x, r20.z, c10.y
-mov.f32f32 r22.z, r4.w
-sel.b32 r7.y, r7.y, r21.x, r20.w
-mov.f32f32 r20.w, r21.w
-mov.f32f32 r21.w, r22.x
-mul.f r18.z, r18.z, r22.z
-mul.f r7.y, r1.w, r7.y
+add.f r20.z, c7.z, (neg)r20.z
+(ss)mul.f r21.x, c9.w, r21.x
+add.f r21.z, c7.z, (neg)r21.z
+sel.b32 r21.w, r22.x, r15.x, r21.w
+mov.f32f32 r22.x, r20.z
+mul.f r6.y, r6.y, r20.z
+add.f r20.z, c7.z, (neg)r21.x
+mad.f32 r0.w, r0.w, r21.w, r19.z
+mov.f32f32 r19.z, r16.y
+mul.f r16.x, r16.x, r22.x
+mul.f r19.y, r19.y, r22.x
+add.f r21.x, r4.y, (neg)c1.x
+absneg.f r21.w, (neg)r19.z
+mov.f32f32 r22.x, c10.x
+mov.f32f32 r22.y, r20.z
+mul.f r0.y, r0.y, c10.x
+mov.f32f32 r22.z, r12.x
+sel.b32 r21.w, r21.w, r19.w, r22.x
mov.f32f32 r22.x, c8.y
-mov.f32f32 r4.x, r4.x
-mul.f r18.z, r18.z, r19.w
-(ss)mul.f r19.w, c11.y, r20.w
-mov.f32f32 r20.w, r22.x
-mad.f32 r4.x, c8.z, r4.x, (neg)r21.w
-mov.f32f32 r18.z, r18.z
-mov.f32f32 r21.w, r7.x
-mov.f32f32 r22.x, c10.y
-mov.f32f32 r22.z, c8.y
-mov.f32f32 r19.w, r19.w
-add.f r18.z, r21.w, (neg)r18.z
-sel.b32 r20.w, r20.w, r20.y, r22.x
-mov.f32f32 r21.w, c8.y
-sel.b32 r4.x, r22.z, r5.x, r4.x
-mov.f32f32 r18.z, r18.z
-min.f r0.y, r9.y, r0.y
-min.f r6.y, r7.w, r6.y
-mov.f32f32 r7.w, r21.w
-mad.f32 r9.y, c10.z, r18.z, c7.x
-mov.f32f32 r18.z, r4.x
-max.f r0.y, r0.y, r6.y
-min.f r1.z, r3.y, r1.z
-mov.f32f32 r3.y, r9.y
-mov.f32f32 r6.y, r7.w
-mov.f32f32 r7.w, r10.z
-mov.f32f32 r9.y, r18.x
-mov.f32f32 r3.y, r3.y
-sel.b32 r6.y, r6.y, r21.x, r20.w
-rcp r10.z, r18.z
-(ss)mul.f r18.x, r19.z, r10.z
-max.f r0.y, r0.y, r1.z
-mov.f32f32 r1.z, r3.y
-mad.f32 r0.w, r0.w, r6.y, r7.y
-mov.f32f32 r3.y, r18.x
-mov.f32f32 r6.y, r8.w
-mov.f32f32 r22.z, r1.z
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r1.z, r18.w
-add.f r3.y, r6.y, (neg)r3.y
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r6.y, r9.z
-mul.f r7.y, (neg)r16.y, r9.y
-sam (f32)(x)r21.w, r22.y, s#1, t#1
-(sy)mul.f r9.y, r21.w, c9.y
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r3.y, r3.y
-add.f r0.y, r6.z, (neg)r0.y
-mov.f32f32 r6.z, r9.y
-add.f r9.y, r19.x, (neg)c1.y
-absneg.f r1.z, (neg)r1.z
-mad.f32 r3.y, c10.z, r3.y, c7.x
-mov.f32f32 r0.y, r0.y
-mul.f r9.y, r9.y, r16.z
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r16.y, c10.x
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r9.y, r9.y
-mad.f32 r0.y, c11.w, r0.y, c7.z
-sel.b32 r1.z, r1.z, r20.y, r16.y
-mov.f32f32 r3.y, r3.y
-mad.f32 r3.w, (neg)r3.w, r9.y, r7.y
-mov.f32f32 r7.y, c8.y
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r3.w, r3.w
-add.f r9.y, r7.x, (neg)c1.z
-mov.f32f32 r7.y, r7.y
-mov.f32f32 r21.w, r3.y
-mov.f32f32 r3.y, r21.y
-mul.f r9.y, r9.y, r16.z
-mov.f32f32 r7.y, r7.y
-mul.f r16.y, r20.z, c10.x
-rcp r0.y, r0.y
-(ss)mov.f32f32 r0.y, r0.y
-mov.f32f32 r9.y, r9.y
-sel.b32 r1.z, r7.y, r21.x, r1.z
-mov.f32f32 r7.y, r16.y
-absneg.f r16.y, (neg)c0.z
-mad.f32 r3.w, (neg)r4.w, r9.y, r3.w
-mad.f32 r0.w, r2.z, r1.z, r0.w
-mul.f r0.y, r19.w, r0.y
-mov.f32f32 r1.z, r16.y
-mov.f32f32 r3.w, r3.w
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r0.y, r0.y
-mad.f32 r1.z, c8.z, r1.z, (neg)r7.y
-max.f r3.w, c8.y, r3.w
+mul.f r21.x, r21.x, r19.x
+absneg.f r22.w, (neg)c0.y
+mul.f r20.x, r20.x, r22.y
+sel.b32 r21.w, r22.x, r15.x, r21.w
+add.f r22.x, r9.y, (neg)c1.x
+mul.f r17.z, r17.z, r22.y
+absneg.f r22.y, (neg)c0.z
+mad.f32 r0.w, r1.z, r21.w, r0.w
+mul.f r21.w, r22.w, r22.w
+mul.f r22.x, r22.x, r10.y
+absneg.f r23.x, (neg)c0.y
max.f r0.w, c8.y, r0.w
-mov.f32f32 r4.w, c8.y
-add.f r6.y, r6.y, (neg)c1.z
-mov.f32f32 r3.w, r3.w
-mov.f32f32 r0.w, r0.w
-sel.b32 r1.z, r4.w, r5.x, r1.z
-exp2 r0.y, r0.y
-(ss)mov.f32f32 r0.y, r0.y
-mul.f r3.w, r3.w, c7.x
-mov.f32f32 r4.w, r0.w
-mov.f32f32 r5.x, r1.z
-add.f r0.y, c7.z, r0.y
-mov.f32f32 r3.w, r3.w
-mul.f r4.w, r4.w, r5.y
-mul.f r3.y, r3.y, r5.x
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r5.x, r3.w
-mov.f32f32 r4.w, r4.w
-mad.f32 r5.y, r6.y, r6.y, r7.w
-mul.f r3.y, r3.y, r10.z
-mul.f r5.x, r5.x, r6.z
-mov.f32f32 r6.y, r15.w
-rcp r0.y, r0.y
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r5.x, r5.x
-mad.f32 r6.z, c7.x, r9.x, c7.x
-mov.f32f32 r7.y, r20.x
-(ss)mov.f32f32 r0.y, r0.y
-mov.f32f32 r7.w, r8.x
-mov.f32f32 r6.z, r6.z
-sqrt r5.y, r5.y
-(ss)mov.f32f32 r5.y, r5.y
-mov.f32f32 r9.x, c2.x
-add.f r3.y, r7.y, (neg)r3.y
-mov.f32f32 r6.z, r6.z
-absneg.f r7.y, (abs)r7.w
-rcp r6.y, r6.y
-add.f r7.w, c7.w, r17.x
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r16.y, r6.z
-mad.f32 r6.z, c7.x, r7.x, c7.x
-rcp r7.x, r9.x
-(ss)mul.f r5.y, r5.y, r7.x
-mad.f32 r3.y, c10.z, r3.y, c7.x
-cmps.f.lt r7.x, c11.x, r7.y
-mov.f32f32 r6.z, r6.z
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r3.y, r3.y
-cov.u32f32 r7.x, r7.x
-mov.f32f32 r6.z, r6.z
-mov.f32f32 r7.y, r7.w
-add.f r7.w, r16.x, (neg)c1.x
-(ss)rcp r9.x, r14.z
-mov.f32f32 r3.y, r3.y
-mov.f32f32 r16.z, r6.z
-log2 r5.y, r5.y
-(ss)mul.f r5.y, c9.y, r5.y
-mov.f32f32 r6.z, r7.x
-mov.f32f32 r3.y, r3.y
-mul.f r6.y, r7.y, r6.y
-mov.f32f32 r5.y, r5.y
-mul.f r7.x, r7.w, r7.w
-sam (f32)(x)r22.x, r16.y, s#2, t#2
-(sy)cmps.f.lt r7.y, r19.x, r22.x
-mov.f32f32 r22.x, r3.y
-cmps.f.ne r3.y, r6.z, c8.y
-mov.f32f32 r6.z, c8.y
-cov.u32f32 r7.y, r7.y
-exp2 r5.y, r5.y
+add.f r21.w, c7.z, (neg)r21.w
+mad.f32 r0.y, c8.z, r22.y, (neg)r0.y
+add.f r22.y, c10.w, (neg)r22.z
+mov.f32f32 r23.y, r0.w
+mul.f r21.w, r21.w, c8.x
+mul.f r23.z, r23.x, r23.x
+mov.f32f32 r23.w, c8.y
+mul.f r5.x, r23.y, r5.x
+add.f r23.y, r16.w, (neg)c1.x
+add.f r21.w, c7.z, (neg)r21.w
+add.f r23.z, c7.z, (neg)r23.z
+sel.b32 r0.y, r23.w, r2.y, r0.y
+mul.f r2.y, r23.y, r23.y
+add.f r23.y, r14.z, (neg)c1.y
+mov.f32f32 r23.w, r21.w
+mul.f r23.z, r23.z, c8.x
+absneg.f r0.y, (neg)r0.y
+mad.f32 r2.y, r23.y, r23.y, r2.y
+add.f r23.y, r16.y, (neg)c1.z
+add.f r23.z, c7.z, (neg)r23.z
+mul.f r6.w, r22.y, r6.w
+add.f r22.y, c7.w, (neg)r22.z
+mad.f32 r2.y, r23.y, r23.y, r2.y
+sqrt r23.y, r23.w
+(ss)mad.f32 r23.y, c8.z, r22.w, r23.y
+(ss)mov.f32f32 r23.w, r23.z
+rcp r24.x, r0.y
+mul.f r4.w, r22.y, r4.w
+(ss)mul.f r21.z, r21.z, r24.x
+mov.f32f32 r22.y, r23.y
+add.f r24.x, c10.w, (neg)r21.y
+sqrt r2.y, r2.y
+mov.f32f32 r24.y, c2.x
+rcp r24.z, r0.y
+max.f r24.w, r6.w, r4.w
+sqrt r23.w, r23.w
+(ss)mad.f32 r23.w, c8.z, r23.x, r23.w
+mul.f r24.x, r24.x, r24.z
+mul.f r24.z, r22.y, c10.x
+absneg.f r25.x, (neg)c0.x
+mov.f32f32 r25.y, r23.w
+rcp r24.y, r24.y
+(ss)mul.f r2.y, r2.y, r24.y
+(ss)max.f r24.y, r24.x, r21.z
+min.f r20.w, r20.w, r24.w
+mad.f32 r14.w, r14.w, r17.w, r2.x
+mul.f r17.w, r25.y, c10.x
+absneg.f r24.w, (neg)c0.x
+min.f r18.w, r18.w, r24.y
+log2 r2.y, r2.y
+(ss)mul.f r2.y, c9.y, r2.y
+mad.f32 r24.y, c8.z, r25.x, (neg)r24.z
+cmps.f.lt r21.w, r21.w, c8.y
+mad.f32 r17.w, c8.z, r24.w, (neg)r17.w
+cmps.f.lt r23.z, r23.z, c8.y
+mov.f32f32 r24.z, r18.w
+mov.f32f32 r24.w, r14.w
+exp2 r2.y, r2.y
nop
-(ss)rcp r5.y, r5.y
-(ss)mov.f32f32 r5.y, r5.y
-mov.f32f32 r6.z, r6.z
-mov.f32f32 r7.y, r7.y
-sam (f32)(x)r21.w, r21.w, s#1, t#1
-(sy)mul.f r7.w, r21.w, c9.y
-mul.f r5.y, c9.w, r5.y
-mov.f32f32 r9.y, c10.x
-cmps.f.ne r7.y, r7.y, c8.y
-mov.f32f32 r7.w, r7.w
-add.f r10.z, r8.w, (neg)c1.x
-mov.f32f32 r5.y, r5.y
-sel.b32 r3.w, r5.x, r7.y, r3.w
-sel.b32 r5.x, r6.z, r3.y, r9.y
-absneg.f r6.z, (abs)r16.x
-add.f r5.y, c7.z, (neg)r5.y
-add.f r7.y, r14.y, r3.w
-add.f r9.y, r17.w, r3.w
-add.f r3.w, r5.w, r3.w
+(ss)rcp r2.y, r2.y
+(ss)mul.f r2.y, c9.w, r2.y
+cov.u32f32 r21.w, r21.w
+cov.u32f32 r23.z, r23.z
+mov.f32f32 r18.z, r18.z
+add.f r2.y, c7.z, (neg)r2.y
+mul.f r25.x, r16.w, r16.w
+cmps.f.ne r21.w, r21.w, c8.y
+mad.f32 r25.x, r14.z, r14.z, r25.x
+mov.f32f32 r25.z, c8.y
+mad.f32 r25.x, r16.y, r16.y, r25.x
+cmps.f.ne r23.z, r23.z, c8.y
+mov.f32f32 r25.w, c8.y
mov.f32f32 r5.y, r5.y
-mov.f32f32 r5.w, r7.y
-mov.f32f32 r7.y, r9.y
-mov.f32f32 r3.w, r3.w
-mov.f32f32 r9.y, r18.y
-mov.f32f32 r5.w, r5.w
-mov.f32f32 r14.y, r18.y
+add.f r26.x, c10.w, (neg)r24.w
+absneg.f r26.y, (neg)c0.z
+sel.b32 r17.w, r25.w, r23.z, r17.w
+rsq r25.x, r25.x
+(ss)mul.f r25.x, c7.x, r25.x
+sel.b32 r24.y, r25.z, r21.w, r24.y
+min.f r5.y, r5.y, r18.z
+mad.f32 r3.y, c8.z, r26.y, (neg)r3.y
+mul.f r2.y, r25.x, r2.y
+mul.f r18.z, (neg)r24.y, r21.x
+add.f r21.x, r20.y, (neg)c1.y
+mul.f r22.x, (neg)r17.w, r22.x
+mov.f32f32 r25.x, r2.y
+add.f r25.z, r13.x, (neg)c1.y
+mad.f32 r5.x, c7.x, r5.x, r25.x
+mov.f32f32 r25.x, r14.z
+mul.f r21.x, r21.x, r19.x
+mul.f r22.y, r22.y, c10.y
+mul.f r25.z, r25.z, r10.y
+mul.f r1.z, r25.x, r1.z
+mad.f32 r22.y, c8.z, r22.w, (neg)r22.y
+mov.f32f32 r22.w, c8.y
+mul.f r25.x, r25.y, c10.y
+mul.f r1.z, r1.z, r6.z
+mad.f32 r23.x, c8.z, r23.x, (neg)r25.x
+mov.f32f32 r25.x, c8.y
mov.f32f32 r7.y, r7.y
-mov.f32f32 r3.w, r3.w
-mul.f r10.z, r10.z, r14.w
-mul.f r9.y, r9.y, r14.y
-mov.f32f32 r14.y, r19.y
-mov.f32f32 r14.z, r19.y
-mov.f32f32 r10.z, r10.z
-cmps.f.lt r6.z, c11.x, r6.z
-mov.f32f32 r6.y, r6.y
-mad.f32 r9.y, r14.y, r14.z, r9.y
-mul.f r10.z, (neg)r21.z, r10.z
-add.f r14.y, r21.y, (neg)c1.y
-cov.u32f32 r6.z, r6.z
-mov.f32f32 r9.y, r9.y
-mov.f32f32 r14.z, r9.z
-mov.f32f32 r16.y, r9.z
-mul.f r14.y, r14.y, r14.w
-mov.f32f32 r6.z, r6.z
-max.f r6.y, r16.w, r6.y
-mad.f32 r9.y, r14.z, r16.y, r9.y
-mov.f32f32 r14.y, r14.y
-cmps.f.ne r6.z, r6.z, c8.y
-mov.f32f32 r14.z, r16.x
-mov.f32f32 r6.y, r6.y
-add.f r16.y, r15.z, (neg)c1.y
-add.f r15.y, c7.z, r15.y
-rsq r9.y, r9.y
-(ss)mov.f32f32 r9.y, r9.y
-mad.f32 r4.x, (neg)r4.x, r14.y, r10.z
-absneg.f r10.z, (neg)r14.z
-min.f r6.y, r10.w, r6.y
-mul.f r9.y, c7.x, r9.y
-mov.f32f32 r4.x, r4.x
-add.f r10.w, r20.x, (neg)c1.z
-mov.f32f32 r10.z, r10.z
-mul.f r5.y, r9.y, r5.y
-mov.f32f32 r9.y, r8.z
-mad.f32 r7.x, r16.y, r16.y, r7.x
-mov.f32f32 r14.y, r15.y
-mov.f32f32 r5.y, r5.y
-mul.f r10.w, r10.w, r14.w
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r14.z, r9.y
-mov.f32f32 r14.w, r5.y
-mov.f32f32 r10.w, r10.w
-mad.f32 r4.w, c7.x, r4.w, r14.w
-sel.b32 r5.x, r10.z, r6.z, r5.x
-mov.f32f32 r5.y, r5.y
-mad.f32 r1.z, (neg)r1.z, r10.w, r4.x
-mov.f32f32 r4.x, r4.w
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r4.w, r19.y
-mov.f32f32 r1.z, r1.z
-mul.f r5.x, r2.x, r5.x
-mov.f32f32 r10.z, c8.y
-mov.f32f32 r10.w, r4.w
-mov.f32f32 r1.w, r1.w
+add.f r1.z, r16.y, (neg)r1.z
+sel.b32 r22.y, r22.w, r21.w, r22.y
+sel.b32 r22.w, r25.x, r23.z, r23.x
+mov.f32f32 r8.z, r8.z
+mad.f32 r25.y, c10.z, r1.z, c7.x
+mul.f r1.z, r14.z, r2.w
+mad.f32 r2.w, (neg)r22.y, r21.x, r18.z
+add.f r18.z, r5.z, (neg)c1.z
+mad.f32 r21.x, (neg)r22.w, r25.z, r22.x
+mul.f r1.z, r1.z, r6.z
+add.f r6.z, r18.x, (neg)c1.z
+min.f r7.y, r8.z, r7.y
+mov.f32f32 r8.z, c8.y
+add.f r1.z, r16.w, (neg)r1.z
+mul.f r18.z, r18.z, r19.x
+mul.f r19.x, r23.y, c10.x
+absneg.f r22.x, (neg)c0.z
+mad.f32 r25.x, c10.z, r1.z, c7.x
+mul.f r1.z, r6.z, r10.y
+mul.f r6.z, r23.w, c10.x
+max.f r5.y, r5.y, r7.y
+mad.f32 r7.y, c8.z, r22.x, (neg)r19.x
+mov.f32f32 r10.y, c8.y
+absneg.f r19.x, (neg)c0.z
+sam (f32)(xy)r25.x, r25.x, s#1, t#1
+(sy)mul.f r0.w, r0.w, r25.x
+mov.f32f32 r21.z, r21.z
+sel.b32 r1.w, r8.z, r1.w, r3.y
+mad.f32 r3.y, c8.z, r19.x, (neg)r6.z
+mul.f r0.w, r0.w, c7.w
+sel.b32 r6.z, r10.y, r21.w, r7.y
+mov.f32f32 r7.y, c8.y
+mov.f32f32 r8.z, r24.x
+mad.f32 r0.w, r0.w, r25.y, r2.y
+mad.f32 r21.w, c7.x, r16.w, c7.x
+mad.f32 r22.x, c7.x, r16.y, c7.x
+mad.f32 r2.y, (neg)r6.z, r18.z, r2.w
+sel.b32 r2.w, r7.y, r23.z, r3.y
+min.f r3.y, r8.z, r21.z
+absneg.f r1.w, (neg)r1.w
+max.f r2.y, c8.y, r2.y
+mad.f32 r1.z, (neg)r2.w, r1.z, r21.x
+sam (f32)(x)r23.x, r21.w, s#2, t#2
+(sy)cmps.f.lt r7.y, r14.z, r23.x
+max.f r3.y, r5.y, r3.y
+mul.f r2.y, r2.y, c7.x
max.f r1.z, c8.y, r1.z
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r14.w, c10.y
-mul.f r1.w, r10.w, r1.w
-mov.f32f32 r1.z, r1.z
-rcp r10.w, r14.z
-(ss)absneg.f r14.z, (neg)r3.x
-sel.b32 r10.z, r10.z, r3.y, r14.w
-mul.f r1.w, r1.w, r7.z
+cov.u32f32 r5.y, r7.y
+mul.f r7.y, r20.y, r24.y
+rcp r8.z, r22.y
+add.f r3.y, r24.z, (neg)r3.y
mul.f r1.z, r1.z, c7.x
-mov.f32f32 r14.w, c8.y
-add.f r15.y, c10.w, r14.z
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r16.y, r18.y
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r14.w, r14.w
-(ss)mul.f r10.w, r15.y, r10.w
-mov.f32f32 r15.y, r16.y
-mov.f32f32 r16.y, r1.z
-mov.f32f32 r14.w, r14.w
-mov.f32f32 r10.w, r10.w
-add.f r1.w, r15.y, (neg)r1.w
-mul.f r7.w, r16.y, r7.w
-sel.b32 r10.z, r14.w, r6.z, r10.z
-mov.f32f32 r14.w, r9.y
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r7.w, r7.w
-mad.f32 r8.w, c7.x, r8.w, c7.x
-mad.f32 r1.x, r1.x, r10.z, r5.x
-mad.f32 r1.w, c10.z, r1.w, c7.x
-mov.f32f32 r5.x, r7.x
-rcp r7.x, r14.w
-add.f r10.z, c7.z, r14.z
-mov.f32f32 r8.w, r8.w
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r14.z, r8.x
-mov.f32f32 r8.w, r8.w
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r10.z, r10.z
-(ss)add.f r14.w, r8.x, (neg)c1.z
-mul.f r9.x, r14.y, r9.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r16.y, r8.w
-mad.f32 r8.w, c7.x, r20.x, c7.x
-mov.f32f32 r14.y, r14.z
-mov.f32f32 r16.w, r1.w
-mov.f32f32 r1.w, r4.w
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r4.w, r8.w
-absneg.f r8.w, (neg)r14.y
-(ss)mul.f r7.x, r10.z, r7.x
-mul.f r1.w, r1.w, r2.z
-mov.f32f32 r2.z, r4.w
-mov.f32f32 r4.w, r8.w
-mov.f32f32 r8.w, c10.x
-mul.f r1.w, r1.w, r7.z
-mov.f32f32 r16.z, r2.z
-mov.f32f32 r2.z, r7.x
-mad.f32 r5.x, r14.w, r14.w, r5.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r7.x, r9.z
-sel.b32 r4.w, r4.w, r3.y, r8.w
-mov.f32f32 r7.z, c8.y
-sam (f32)(x)r21.z, r16.y, s#2, t#2
-(sy)cmps.f.lt r8.w, r21.y, r21.z
-mov.f32f32 r7.x, r7.x
-max.f r2.z, r10.w, r2.z
-mov.f32f32 r5.x, r5.x
-mov.f32f32 r9.x, r9.x
-add.f r1.w, r7.x, (neg)r1.w
-cov.u32f32 r7.x, r8.w
-mov.f32f32 r7.z, r7.z
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r7.x, r7.x
-mov.f32f32 r7.z, r7.z
-min.f r2.z, r6.y, r2.z
-mad.f32 r1.w, c10.z, r1.w, c7.x
-cmps.f.ne r6.y, r7.x, c8.y
-sel.b32 r4.w, r7.z, r6.z, r4.w
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r1.w, r1.w
-sel.b32 r1.z, r7.w, r6.y, r1.z
-mad.f32 r1.x, r6.x, r4.w, r1.x
-mov.f32f32 r4.w, r13.x
-mov.f32f32 r1.w, r1.w
-add.f r6.y, r12.w, r1.z
-add.f r5.z, r5.z, r1.z
-add.f r1.z, r17.y, r1.z
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r6.y, r6.y
-mov.f32f32 r5.z, r5.z
-mov.f32f32 r1.z, r1.z
-mov.f32f32 r17.x, r1.w
-mov.f32f32 r6.y, r6.y
-mov.f32f32 r5.z, r5.z
+cmps.f.ne r5.y, r5.y, c8.y
+(ss)mul.f r7.y, r7.y, r8.z
+mul.f r10.y, r13.x, r17.w
+rcp r16.y, r22.w
+mad.f32 r3.y, c11.w, r3.y, c7.z
+sel.b32 r0.w, r0.w, r5.y, r5.x
+mov.f32f32 r5.x, r16.w
+add.f r5.y, r4.y, (neg)r7.y
+(ss)mul.f r7.y, r10.y, r16.y
+rcp r10.y, r1.w
+(ss)mul.f r10.y, r26.x, r10.y
+mad.f32 r21.z, c7.x, r5.x, c7.x
+(ss)mad.f32 r21.w, c7.x, r19.z, c7.x
+mad.f32 r5.x, c10.z, r5.y, c7.x
+mul.f r5.y, r20.y, r6.z
+add.f r6.z, r9.y, (neg)r7.y
+rcp r3.y, r3.y
+add.f r7.y, c7.z, (neg)r24.w
+rcp r17.w, r1.w
+mad.f32 r15.w, r1.y, r18.w, r15.w
+mul.f r5.y, r5.y, r8.z
+sam (f32)(xyz)r21.z, r21.z, s#0, t#0
+mad.f32 r18.w, c7.x, r16.w, c7.x
+mad.f32 r18.z, c7.x, r14.z, c7.z
+mad.f32 r22.w, c10.z, r6.z, c7.x
+add.f r5.y, r5.z, (neg)r5.y
+mul.f r2.w, r13.x, r2.w
+add.f r6.z, r15.w, c11.z
+(ss)mul.f r7.y, r7.y, r17.w
+mad.f32 r5.y, c10.z, r5.y, c7.x
+sam (f32)(xyz)r23.x, r18.z, s#0, t#0
+(sy)sel.b32 r8.z, r23.z, r19.w, r22.x
+(ss)mad.f32 r18.w, c7.x, r13.y, c7.x
+mad.f32 r18.z, c7.x, r10.w, c7.z
+sel.b32 r10.w, r23.y, r19.w, r21.w
+sel.b32 r13.y, r23.x, r19.w, r21.z
+mul.f r2.w, r2.w, r16.y
+sam (f32)(x)r21.z, r5.x, s#1, t#1
+(sy)(ss)mul.f r5.x, r21.z, c9.y
+mul.f r5.y, c11.y, r6.z
+max.f r6.z, r10.y, r7.y
+sam (f32)(xyz)r21.z, r18.z, s#0, t#0
+(sy)sel.b32 r8.z, r22.x, r15.x, r8.z
+sel.b32 r10.w, r21.w, r15.x, r10.w
+sel.b32 r13.y, r21.z, r15.x, r13.y
+mul.f r5.x, r2.y, r5.x
+mul.f r8.z, r8.z, r0.w
+cmps.f.lt r14.z, r14.z, c12.x
+mul.f r10.w, r10.w, r0.w
+mul.f r0.w, r13.y, r0.w
+mov.f32f32 r2.y, r2.y
+cov.u32f32 r13.y, r14.z
+(ss)mad.f32 r18.z, c7.x, r4.y, c7.x
+mad.f32 r18.w, c7.x, r5.z, c7.x
+add.f r2.w, r18.x, (neg)r2.w
+cmps.f.ne r4.y, r13.y, c8.y
+mul.f r5.z, c0.x, r11.w
+mul.f r3.y, r5.y, r3.y
+mad.f32 r5.y, c0.y, r10.x, r5.z
+mad.f32 r23.x, c10.z, r2.w, c7.x
+mad.f32 r2.w, c0.z, r14.y, r5.y
+sam (f32)(x)r21.z, r18.z, s#2, t#2
+(sy)cmps.f.lt r5.y, r20.y, r21.z
+min.f r5.z, r20.w, r6.z
+mul.f r6.z, c7.x, r15.z
+max.f r2.w, c8.y, r2.w
+cov.u32f32 r5.y, r5.y
+sam (f32)(x)r21.z, r22.w, s#1, t#1
+(sy)mul.f r13.y, r21.z, c9.y
+exp2 r3.y, r3.y
+mov.f32f32 r14.z, r5.z
+mov.f32f32 r8.y, r8.y
+cmps.f.ne r5.y, r5.y, c8.y
+mul.f r13.y, r1.z, r13.y
+log2 r2.w, r2.w
+(ss)mul.f r2.w, c12.y, r2.w
mov.f32f32 r1.z, r1.z
-mad.f32 r1.w, r4.w, r2.z, r0.z
-mov.f32f32 r1.x, r1.x
-sqrt r4.w, r5.x
-(ss)mov.f32f32 r4.w, r4.w
+mad.f32 r15.z, c7.x, r9.y, c7.x
+add.f r3.y, c7.z, r3.y
+mov.f32f32 r4.z, r4.z
+mad.f32 r15.w, c7.x, r18.x, c7.x
+sel.b32 r2.y, r5.x, r5.y, r2.y
+exp2 r2.w, r2.w
+mov.f32f32 r18.w, r10.x
+mov.f32f32 r19.x, r14.y
+mov.f32f32 r18.z, r11.w
+add.f r5.x, r16.x, r2.y
+add.f r5.y, r19.y, r2.y
+add.f r2.y, r6.y, r2.y
+sam (f32)(x)r15.z, r15.z, s#2, t#2
+rcp r3.y, r3.y
+(sy)cmps.f.lt r6.y, r13.x, r15.z
+absneg.f r9.y, (abs)r21.y
+min.f r4.z, r8.y, r4.z
(ss)nop
-sam (f32)(xy)r16.y, r16.w, s#1, t#1
-(sy)mul.f r0.w, r0.w, r16.y
-mov.f32f32 r1.w, r1.w
-max.f r1.x, c8.y, r1.x
-mov.f32f32 r5.x, c2.x
-mul.f r0.w, r0.w, c7.w
-mov.f32f32 r7.x, r1.w
-mov.f32f32 r1.x, r1.x
-max.f r7.z, r13.w, r9.x
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r7.w, r7.x
-mov.f32f32 r8.w, r1.x
-rcp r5.x, r5.x
-(ss)mul.f r4.w, r4.w, r5.x
-mad.f32 r0.w, r0.w, r16.z, r5.y
-(ss)add.f r5.x, c10.w, (neg)r7.w
-rcp r5.y, r12.z
-mul.f r0.y, r8.w, r0.y
+sam.3d (f32)(xyz)r15.z, r18.z, s#3, t#3
+(sy)(ss)mad.f32 r8.y, c13.z, r2.w, r16.x
+mad.f32 r10.x, c13.y, r2.w, r15.w
+mad.f32 r2.w, c13.x, r2.w, r15.z
+cov.u32f32 r6.y, r6.y
+sel.b32 r8.y, r8.z, r4.y, r8.y
+mov.f32f32 r6.w, r6.w
mov.f32f32 r4.w, r4.w
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r7.w, r18.y
-(ss)mul.f r5.x, r5.x, r5.y
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r5.y, r7.z
-mad.f32 r7.z, c7.x, r7.w, c7.x
-mov.f32f32 r5.x, r5.x
-mov.f32f32 r7.x, r7.x
+sel.b32 r8.z, r10.w, r4.y, r10.x
+sel.b32 r0.w, r0.w, r4.y, r2.w
+cmps.f.ne r2.w, r6.y, c8.y
+min.f r4.y, r6.w, r4.w
+cmps.f.lt r4.w, c11.x, r9.y
+mul.f r6.x, r6.z, r6.x
+add.f r6.y, r15.y, (neg)c1.x
+max.f r4.y, r4.z, r4.y
+mov.f32f32 r4.z, r10.y
+mov.f32f32 r6.z, r7.y
+sel.b32 r1.z, r13.y, r2.w, r1.z
+cov.u32f32 r2.w, r4.w
+mul.f r4.w, r6.x, r20.z
+min.f r4.z, r4.z, r6.z
+add.f r6.x, r20.x, r1.z
+add.f r6.z, r17.z, r1.z
+cmps.f.ne r2.w, r2.w, c8.y
+max.f r4.y, r4.y, r4.z
+mov.f32f32 r4.z, c8.y
+mov.f32f32 r6.w, c10.x
+add.f r1.z, r4.w, r1.z
+add.f r4.y, r14.z, (neg)r4.y
+mul.f r4.w, r6.y, r6.y
+add.f r6.y, r22.z, (neg)c1.y
+sel.b32 r4.z, r4.z, r2.w, r6.w
+mad.f32 r4.y, c11.w, r4.y, c7.z
+absneg.f r6.w, (abs)r16.z
+mad.f32 r4.w, r6.y, r6.y, r4.w
+add.f r6.y, r24.w, (neg)c1.z
+absneg.f r7.y, (abs)r24.w
+mul.f r9.y, r14.x, r13.z
+rcp r10.x, r10.z
+cmps.f.lt r6.w, c11.x, r6.w
+rcp r4.y, r4.y
+mad.f32 r5.z, r1.x, r5.z, r22.z
+mad.f32 r4.w, r6.y, r6.y, r4.w
+cmps.f.lt r6.y, c11.x, r7.y
+add.f r7.y, c10.w, r13.w
+add.f r5.z, r5.z, c11.z
+cov.u32f32 r6.w, r6.w
+cov.u32f32 r6.y, r6.y
+(ss)mul.f r7.y, r7.y, r10.x
+mul.f r5.z, c11.y, r5.z
+cmps.f.ne r6.w, r6.w, c8.y
+absneg.f r10.x, (neg)r17.x
+sqrt r4.w, r4.w
+mov.f32f32 r10.y, c2.x
+(ss)mul.f r4.y, r5.z, r4.y
+cmps.f.ne r5.z, r6.y, c8.y
+max.f r6.y, r7.y, r9.y
+mov.f32f32 r7.y, r12.w
+sel.b32 r4.z, r10.x, r6.w, r4.z
+mov.f32f32 r9.y, c8.y
+mov.f32f32 r10.x, c10.x
+exp2 r4.y, r4.y
+(ss)add.f r4.y, c7.z, r4.y
+mul.f r4.z, r3.w, r4.z
+mov.f32f32 r10.z, c8.y
+mov.f32f32 r10.w, c10.y
+rcp r10.y, r10.y
+(ss)mul.f r4.w, r4.w, r10.y
+sel.b32 r9.y, r9.y, r5.z, r10.x
+absneg.f r9.x, (abs)r9.x
+rcp r4.y, r4.y
+sel.b32 r10.x, r10.z, r2.w, r10.w
+(ss)mov.f32f32 r10.y, c8.y
+rcp r10.z, r7.y
+absneg.f r10.w, (neg)r0.x
+cmps.f.lt r9.x, c11.x, r9.x
log2 r4.w, r4.w
(ss)mul.f r4.w, c9.y, r4.w
-mov.f32f32 r7.z, r7.z
-mov.f32f32 r7.w, r8.y
-add.f r7.x, c7.z, (neg)r7.x
-mov.f32f32 r4.w, r4.w
-mov.f32f32 r7.z, r7.z
-rcp r8.w, r12.x
-mov.f32f32 r9.x, r7.w
-(ss)mul.f r7.x, r7.x, r8.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r10.z, r7.z
-mov.f32f32 r7.z, r9.z
-mov.f32f32 r7.x, r7.x
+sel.b32 r10.x, r10.y, r6.w, r10.x
+add.f r10.y, c10.w, r10.w
+cov.u32f32 r9.x, r9.x
+cmps.f.lt r8.x, r8.x, c9.z
+mad.f32 r4.z, r1.y, r10.x, r4.z
+mul.f r10.x, r10.y, r10.z
+cmps.f.ne r9.x, r9.x, c8.y
+absneg.f r10.y, (neg)r15.y
+mov.f32f32 r10.z, r21.y
exp2 r4.w, r4.w
nop
(ss)rcp r4.w, r4.w
-(ss)mov.f32f32 r4.w, r4.w
-mad.f32 r7.z, c7.x, r7.z, c7.x
-max.f r8.w, r5.x, r7.x
-rcp r9.x, r9.x
-absneg.f r12.x, (neg)r0.x
-mul.f r4.w, c9.w, r4.w
-mov.f32f32 r7.z, r7.z
-mov.f32f32 r8.w, r8.w
-mov.f32f32 r10.w, r15.w
-mov.f32f32 r4.w, r4.w
-mov.f32f32 r7.z, r7.z
-add.f r12.z, c10.w, r12.x
-mad.f32 r12.w, r10.w, r2.z, r0.x
+(ss)mul.f r4.w, c9.w, r4.w
+sel.b32 r9.y, r10.y, r9.x, r9.y
+absneg.f r10.y, (neg)r10.z
+mov.f32f32 r11.w, c10.x
add.f r4.w, c7.z, (neg)r4.w
-mov.f32f32 r10.w, r7.z
-(ss)mul.f r7.z, r12.z, r9.x
-(ss)mov.f32f32 r9.x, r12.w
-mov.f32f32 r4.w, r4.w
-mul.f r12.z, r16.x, r16.x
-mov.f32f32 r7.z, r7.z
-mov.f32f32 r12.w, r7.w
-sam (f32)(x)r16.y, r10.z, s#2, t#2
-(ss)mov.f32f32 r10.z, r19.y
-mov.f32f32 r10.w, r9.x
-mad.f32 r12.z, r15.z, r15.z, r12.z
-mov.f32f32 r13.x, r15.z
-(sy)cmps.f.lt r10.z, r10.z, r16.y
-mov.f32f32 r13.w, r10.w
-mov.f32f32 r12.z, r12.z
-rcp r12.w, r12.w
-add.f r12.x, c7.w, r12.x
-cov.u32f32 r10.z, r10.z
-add.f r13.w, c10.w, (neg)r13.w
-mad.f32 r12.z, r8.x, r8.x, r12.z
-mov.f32f32 r12.x, r12.x
-mov.f32f32 r10.z, r10.z
-mul.f r12.y, r13.w, r12.y
-mov.f32f32 r2.x, r2.x
-(ss)mul.f r12.x, r12.x, r12.w
-cmps.f.ne r10.z, r10.z, c8.y
-mov.f32f32 r12.y, r12.y
-(ss)mov.f32f32 r12.w, r10.w
-rsq r12.z, r12.z
-(ss)mov.f32f32 r12.z, r12.z
-sel.b32 r0.w, r0.w, r10.z, r4.x
-mov.f32f32 r4.x, r19.y
-add.f r10.z, c7.w, (neg)r12.w
-mul.f r12.z, c7.x, r12.z
-mov.f32f32 r12.x, r12.x
-mov.f32f32 r4.x, r4.x
-mul.f r10.z, r10.z, r11.y
-mul.f r4.w, r12.z, r4.w
-max.f r7.z, r7.z, r12.x
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r10.z, r10.z
-mov.f32f32 r4.w, r4.w
-mov.f32f32 r7.z, r7.z
-mad.f32 r4.x, c7.x, r4.x, c7.z
-max.f r11.y, r12.y, r10.z
-mov.f32f32 r12.x, r4.w
-mov.f32f32 r4.w, r4.w
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r11.y, r11.y
-mad.f32 r0.y, c7.x, r0.y, r12.x
-mul.f r2.x, r13.x, r2.x
-mov.f32f32 r4.x, r4.x
-min.f r8.w, r8.w, r11.y
-mov.f32f32 r11.y, r9.y
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r12.z, r4.x
-mov.f32f32 r4.x, r18.y
-mad.f32 r2.z, r11.y, r2.z, r3.x
-mul.f r2.x, r2.x, r2.w
-min.f r5.y, r5.y, r7.z
-mov.f32f32 r7.z, r4.x
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r11.y, r16.x
-mov.f32f32 r7.z, r7.z
-mov.f32f32 r12.x, r2.z
-mov.f32f32 r8.z, r8.z
-add.f r2.x, r11.y, (neg)r2.x
-mad.f32 r7.z, c7.x, r7.z, c7.x
-mov.f32f32 r11.y, r12.x
-mov.f32f32 r12.w, r8.z
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r7.z, r7.z
-add.f r11.y, c10.w, (neg)r11.y
-mov.f32f32 r13.x, r1.w
-cmps.f.lt r13.y, r13.y, c9.z
-mov.f32f32 r7.z, r7.z
-mul.f r11.x, r11.y, r11.x
-mad.f32 r2.x, c10.z, r2.x, c7.x
-rcp r11.y, r12.w
-absneg.f r13.w, (neg)r3.x
-(ss)mov.f32f32 r12.w, r7.z
-mov.f32f32 r7.z, r11.x
-mov.f32f32 r11.x, r12.x
-mov.f32f32 r2.x, r2.x
-add.f r12.x, c10.w, r13.w
-add.f r13.x, r13.x, (neg)c1.x
-add.f r11.x, c7.z, (neg)r11.x
-sam (f32)(xyz)r16.y, r12.z, s#0, t#0
-(sy)(ss)mov.f32f32 r12.z, r16.w
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r12.w, r16.z
-mov.f32f32 r14.y, r16.y
-mul.f r10.x, r11.x, r10.x
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r2.x, r2.x
-(ss)mul.f r11.x, r12.x, r11.y
-mov.f32f32 r10.x, r10.x
-mad.f32 r4.x, c7.x, r4.x, c7.x
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r11.x, r11.x
-mov.f32f32 r11.y, r8.z
-mov.f32f32 r4.x, r4.x
-max.f r12.x, r7.z, r10.x
-mov.f32f32 r14.z, r2.x
-mov.f32f32 r2.x, r15.z
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r12.x, r12.x
-mov.f32f32 r6.x, r6.x
-rcp r11.y, r11.y
-add.f r13.w, c7.z, r13.w
-mov.f32f32 r16.y, r4.x
-mov.f32f32 r4.x, r18.w
-min.f r8.w, r8.w, r12.x
-mul.f r2.x, r2.x, r6.x
-mov.f32f32 r6.x, r13.w
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r8.w, r8.w
-mov.f32f32 r10.w, r10.w
-mov.f32f32 r12.x, r1.y
-mad.f32 r4.x, c7.x, r4.x, c7.x
-mul.f r2.x, r2.x, r2.w
-(ss)mul.f r2.w, r6.x, r11.y
-mad.f32 r6.x, r12.x, r8.w, r10.w
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r10.w, r8.x
-mov.f32f32 r6.x, r6.x
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r2.w, r2.w
-add.f r2.x, r10.w, (neg)r2.x
-add.f r6.x, r6.x, c11.z
-mov.f32f32 r16.z, r4.x
-max.f r2.w, r11.x, r2.w
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r4.x, r6.x
-mul.f r6.x, r13.x, r13.x
-mov.f32f32 r2.w, r2.w
-mov.f32f32 r10.w, r9.x
-sam (f32)(xyz)r16.y, r16.y, s#0, t#0
-(sy)mov.f32f32 r11.x, r16.w
-(ss)mov.f32f32 r11.y, r16.z
-mov.f32f32 r12.x, r16.y
-mul.f r4.x, c11.y, r4.x
-sel.b32 r11.x, r12.z, r20.y, r11.x
-mov.f32f32 r12.z, r19.y
-sel.b32 r11.y, r12.w, r20.y, r11.y
-sel.b32 r12.x, r14.y, r20.y, r12.x
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r12.z, r12.z
-min.f r5.x, r5.x, r7.x
-min.f r7.x, r12.y, r10.z
-mad.f32 r2.x, c10.z, r2.x, c7.x
-mad.f32 r10.z, c7.x, r12.z, c7.z
-min.f r2.w, r5.y, r2.w
-max.f r5.x, r5.x, r7.x
-min.f r5.y, r7.z, r10.x
-mov.f32f32 r7.x, r10.z
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r2.w, r2.w
-mov.f32f32 r7.z, r13.z
-mov.f32f32 r7.x, r7.x
-max.f r5.x, r5.x, r5.y
-mov.f32f32 r2.x, r2.x
-mad.f32 r0.z, r7.z, r2.w, r0.z
-mov.f32f32 r12.y, r7.x
-mov.f32f32 r5.y, r9.z
-mov.f32f32 r5.x, r5.x
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r0.z, r0.z
-mov.f32f32 r5.y, r5.y
-add.f r5.x, r8.w, (neg)r5.x
-mov.f32f32 r14.w, r2.x
-mov.f32f32 r2.x, r0.z
-mad.f32 r5.y, c7.x, r5.y, c7.x
-mov.f32f32 r5.x, r5.x
-add.f r7.x, r10.w, (neg)c1.y
-add.f r2.x, c10.w, (neg)r2.x
-mov.f32f32 r5.y, r5.y
-mad.f32 r5.x, c11.w, r5.x, c7.z
-sam (f32)(xy)r16.y, r14.z, s#1, t#1
-(sy)mul.f r1.x, r1.x, r16.y
-mov.f32f32 r4.z, r4.z
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r5.x, r5.x
+mul.f r9.y, r4.x, r9.y
+mov.f32f32 r13.x, c8.y
+mov.f32f32 r13.y, c10.y
+sel.b32 r10.y, r10.y, r2.w, r11.w
+mov.f32f32 r11.w, c8.y
+mul.f r13.z, r15.y, r15.y
+sel.b32 r13.x, r13.x, r5.z, r13.y
+mov.f32f32 r13.y, c8.y
+sel.b32 r10.y, r11.w, r6.w, r10.y
+mad.f32 r11.w, r22.z, r22.z, r13.z
+rcp r7.y, r7.y
+add.f r10.w, c7.w, r10.w
+sel.b32 r13.x, r13.y, r9.x, r13.x
+mad.f32 r4.z, r0.y, r10.y, r4.z
+mad.f32 r10.y, r24.w, r24.w, r11.w
+(ss)mul.f r7.y, r10.w, r7.y
+mad.f32 r1.x, r1.x, r13.x, r9.y
+absneg.f r9.y, (neg)r24.w
+mov.f32f32 r10.w, c10.x
+max.f r4.z, c8.y, r4.z
+max.f r7.y, r10.x, r7.y
+cov.u32f32 r8.x, r8.x
+sel.b32 r9.y, r9.y, r5.z, r10.w
+mov.f32f32 r10.x, c8.y
+mov.f32f32 r10.w, r4.z
+rsq r10.y, r10.y
+(ss)mul.f r10.y, c7.x, r10.y
+min.f r6.y, r6.y, r7.y
+sel.b32 r7.y, r10.x, r9.x, r9.y
+mul.f r3.y, r10.w, r3.y
+add.f r9.y, r17.x, (neg)c1.x
+mul.f r4.w, r10.y, r4.w
+mad.f32 r1.x, r1.w, r7.y, r1.x
+mov.f32f32 r7.y, r11.x
+mul.f r9.y, r9.y, r9.y
+add.f r10.x, r18.y, (neg)c1.y
+max.f r1.x, c8.y, r1.x
+mov.f32f32 r10.y, r4.w
+mul.f r4.x, r22.z, r4.x
+mad.f32 r9.y, r10.x, r10.x, r9.y
+mov.f32f32 r10.x, r1.x
+add.f r10.w, r21.y, (neg)c1.z
+mul.f r4.x, r4.x, r7.z
+rcp r11.w, r7.y
+absneg.f r13.x, (neg)r2.x
+mul.f r4.y, r10.x, r4.y
+mad.f32 r9.y, r10.w, r10.w, r9.y
+add.f r4.x, r15.y, (neg)r4.x
+add.f r10.x, c7.z, r13.x
+mad.f32 r4.y, c7.x, r4.y, r10.y
+cmps.f.ne r8.x, r8.x, c8.y
+mad.f32 r13.y, c10.z, r4.x, c7.x
+mul.f r1.w, r22.z, r1.w
+sqrt r4.x, r9.y
+(ss)mov.f32f32 r9.y, c2.x
+(ss)mul.f r10.x, r10.x, r11.w
+rcp r10.y, r11.x
+add.f r10.w, c10.w, r13.x
+mul.f r1.w, r1.w, r7.z
+mad.f32 r14.x, c7.x, r15.y, c7.x
+mad.f32 r13.w, c7.x, r22.z, c7.z
+(ss)mul.f r7.z, r10.w, r10.y
+add.f r1.w, r24.w, (neg)r1.w
+rcp r9.y, r9.y
+(ss)mul.f r4.x, r4.x, r9.y
+(ss)mov.f32f32 r9.y, r18.y
+max.f r7.z, r7.z, r10.x
+mad.f32 r13.z, c10.z, r1.w, c7.x
+sam (f32)(xyz)r13.w, r13.w, s#0, t#0
+mad.f32 r10.x, c7.x, r15.y, c7.x
+mad.f32 r10.y, c7.x, r24.w, c7.x
+min.f r1.w, r6.y, r7.z
+log2 r4.x, r4.x
+(ss)mul.f r4.x, c9.y, r4.x
+mul.f r0.y, r9.y, r0.y
+rcp r1.y, r1.y
+mad.f32 r10.w, c7.x, r15.y, c7.x
+sam (f32)(xy)r15.x, r13.y, s#1, t#1
+(sy)mul.f r1.x, r1.x, r15.x
+mov.f32f32 r6.y, r1.w
+sam (f32)(xyz)r15.z, r10.x, s#0, t#0
+(sy)sel.b32 r7.z, r14.x, r5.z, r15.w
+sel.b32 r9.y, r14.y, r5.z, r16.x
mul.f r1.x, r1.x, c7.w
-mov.f32f32 r7.z, r4.z
-mov.f32f32 r12.z, r5.y
-mad.f32 r5.y, r7.x, r7.x, r6.x
-add.f r6.x, r0.z, (neg)c1.x
-cov.u32f32 r7.x, r13.y
-rcp r5.x, r5.x
-(ss)mov.f32f32 r5.x, r5.x
-mov.f32f32 r1.x, r1.x
-sqrt r7.z, r7.z
-(ss)mov.f32f32 r7.z, r7.z
-sam (f32)(xyz)r12.y, r12.y, s#0, t#0
-(sy)mov.f32f32 r8.w, r12.w
-mov.f32f32 r9.z, r12.z
-mov.f32f32 r10.x, r12.y
-mul.f r4.x, r4.x, r5.x
-mov.f32f32 r5.x, r8.w
-mov.f32f32 r8.w, r9.z
-mov.f32f32 r9.z, r10.x
-mov.f32f32 r4.x, r4.x
-sel.b32 r5.x, r5.x, r21.x, r11.x
-sel.b32 r8.w, r8.w, r21.x, r11.y
-sel.b32 r9.z, r9.z, r21.x, r12.x
-mad.f32 r1.x, r1.x, r16.z, r4.w
-mul.f r4.w, r5.x, r0.w
-cmps.f.lt r5.x, r19.y, c12.x
-mul.f r8.w, r8.w, r0.w
-mul.f r0.w, r9.z, r0.w
exp2 r4.x, r4.x
-(ss)mov.f32f32 r4.x, r4.x
+nop
+(ss)rcp r4.x, r4.x
+(ss)mul.f r4.x, c9.w, r4.x
+mad.f32 r0.z, r12.y, r6.y, r0.z
+mad.f32 r1.x, r1.x, r15.y, r4.w
+mad.f32 r11.x, c7.x, r24.w, c7.x
+add.f r4.x, c7.z, (neg)r4.x
+mul.f r4.w, r17.x, r17.x
+mov.f32f32 r10.x, r0.z
+mad.f32 r4.w, r18.y, r18.y, r4.w
+mad.f32 r13.y, c7.x, r14.w, c7.x
+mad.f32 r13.x, c7.x, r12.x, c7.z
+sam (f32)(x)r14.x, r10.w, s#2, t#2
+(sy)cmps.f.lt r10.y, r22.z, r14.x
+mad.f32 r4.w, r21.y, r21.y, r4.w
+(ss)add.f r10.w, c10.w, (neg)r10.x
+mul.f r11.x, r9.w, c10.x
+cov.u32f32 r10.y, r10.y
+absneg.f r11.w, (neg)c0.x
+sam (f32)(xyz)r14.x, r13.x, s#0, t#0
+(sy)sel.b32 r9.y, r14.z, r9.x, r9.y
+sel.b32 r7.z, r14.y, r9.x, r7.z
+cmps.f.ne r10.y, r10.y, c8.y
+rsq r4.w, r4.w
+(ss)mul.f r4.w, c7.x, r4.w
+mad.f32 r11.x, c8.z, r11.w, (neg)r11.x
+cmps.f.lt r2.z, r2.z, c8.y
+sel.b32 r1.x, r1.x, r10.y, r4.y
+sel.b32 r4.y, r13.w, r5.z, r15.z
+mul.f r4.x, r4.w, r4.x
+cov.u32f32 r2.z, r2.z
+mul.f r4.w, r9.y, r1.x
+cmps.f.lt r5.z, r7.x, c8.y
+mul.f r7.z, r7.z, r1.x
+sel.b32 r4.y, r14.x, r9.x, r4.y
+mov.f32f32 r9.x, r4.x
+cov.u32f32 r5.z, r5.z
+mad.f32 r3.y, c7.x, r3.y, r9.x
+mul.f r0.y, r0.y, r1.y
+mul.f r1.x, r4.y, r1.x
+cmps.f.ne r4.y, r5.z, c8.y
+cmps.f.ne r2.z, r2.z, c8.y
+mov.f32f32 r5.z, c8.y
+add.f r0.y, r21.y, (neg)r0.y
+sel.b32 r4.w, r4.w, r4.y, r8.y
+sel.b32 r7.z, r7.z, r4.y, r8.z
+sel.b32 r0.w, r1.x, r4.y, r0.w
+mad.f32 r8.z, c10.z, r0.y, c7.x
+sel.b32 r0.y, r5.x, r8.x, r4.w
+sel.b32 r1.x, r5.y, r8.x, r7.z
+sel.b32 r0.w, r2.y, r8.x, r0.w
+mul.f r2.y, r18.y, r3.w
+mul.f r3.w, r0.y, c14.z
+cmps.f.lt r4.y, r7.x, c8.y
+mul.f r4.w, r1.x, c14.y
+mul.f r5.x, r0.w, c14.x
+mul.f r1.y, r2.y, r1.y
+cov.u32f32 r2.y, r4.y
+sel.b32 r4.y, r5.z, r2.z, r11.x
+add.f r5.y, r10.x, (neg)c1.x
+add.f r1.y, r17.x, (neg)r1.y
+cmps.f.ne r2.y, r2.y, c8.y
+absneg.f r4.y, (neg)r4.y
+mul.f r5.y, r5.y, r5.y
+mad.f32 r8.y, c10.z, r1.y, c7.x
+sel.b32 r0.y, r3.w, r2.y, r0.y
+log2 r1.y, r3.z
+(ss)mul.f r1.y, c9.x, r1.y
+sel.b32 r1.x, r4.w, r2.y, r1.x
+sel.b32 r0.w, r5.x, r2.y, r0.w
+rcp r2.y, r4.y
+(ss)mul.f r2.y, r10.w, r2.y
+(ss)add.f r3.z, c7.z, (neg)r10.x
+sam (f32)(xy)r13.x, r8.y, s#1, t#1
+(sy)mul.f r3.w, r4.z, r13.x
+rcp r4.z, r4.y
+mad.f32 r0.x, r12.w, r1.w, r0.x
+exp2 r1.y, r1.y
+(ss)add.f r1.w, c15.y, (neg)r1.y
+mul.f r3.z, r3.z, r4.z
+mul.f r3.w, r3.w, c7.w
+mov.f32f32 r4.z, r0.x
+mul.f r1.w, r1.w, c8.w
+(ss)mul.f r1.y, r1.y, c7.z
+mad.f32 r3.w, r3.w, r13.y, r4.x
+mad.f32 r4.w, c7.x, r17.x, c7.x
+mad.f32 r5.x, c7.x, r21.y, c7.x
+add.f r1.y, r1.y, r1.w
+max.f r1.w, r2.y, r3.z
+add.f r4.x, c10.w, (neg)r4.z
+mul.f r5.z, r9.w, c10.y
+add.f r7.x, c15.y, (neg)r1.y
+add.f r7.z, c15.y, (neg)r1.y
+add.f r8.x, c15.y, (neg)r1.y
+sam (f32)(x)r13.x, r4.w, s#2, t#2
+(sy)(ss)cmps.f.lt r4.w, r18.y, r13.x
+mul.f r0.y, r7.x, r0.y
+mul.f r1.x, r7.z, r1.x
+mul.f r0.w, r8.x, r0.w
+cov.u32f32 r4.w, r4.w
+mad.f32 r3.x, c8.z, r3.x, (neg)r5.z
+mov.f32f32 r5.x, c8.y
+add.f r5.z, r4.z, (neg)c1.y
+cmps.f.ne r4.w, r4.w, c8.y
+mad.f32 r2.x, r7.y, r6.y, r2.x
+sel.b32 r3.x, r5.x, r2.z, r3.x
+mad.f32 r5.x, r5.z, r5.z, r5.y
+sel.b32 r3.y, r3.w, r4.w, r3.y
+mov.f32f32 r3.w, r17.x
+absneg.f r3.x, (neg)r3.x
+mov.f32f32 r4.w, r2.x
+cmps.f.lt r5.y, r5.w, c9.z
+mad.f32 r5.z, c7.x, r3.w, c7.x
+mad.f32 r5.w, c7.x, r10.z, c7.x
+add.f r3.w, r4.w, (neg)c1.z
+absneg.f r6.y, (abs)r4.w
+rcp r7.x, r3.x
+(ss)mul.f r4.x, r4.x, r7.x
+add.f r7.x, c7.w, (neg)r4.z
+rcp r7.y, r3.x
+mad.f32 r3.w, r3.w, r3.w, r5.x
+cmps.f.lt r5.x, c11.x, r6.y
+sam (f32)(xyz)r10.y, r5.z, s#0, t#0
+(ss)mad.f32 r5.w, c7.x, r17.x, c7.x
+mad.f32 r5.z, c7.x, r18.y, c7.z
+(ss)mul.f r6.y, r7.x, r7.y
cov.u32f32 r5.x, r5.x
-mov.f32f32 r1.x, r1.x
-mad.f32 r9.z, c7.x, r16.x, c7.x
-add.f r4.x, c7.z, r4.x
+cov.u32f32 r5.y, r5.y
+sqrt r3.w, r3.w
+mov.f32f32 r7.x, c2.x
+max.f r7.y, r4.x, r6.y
cmps.f.ne r5.x, r5.x, c8.y
-mov.f32f32 r10.x, r10.y
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r10.y, r3.z
-mov.f32f32 r10.z, r10.x
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r5.y, r5.y
-mad.f32 r7.z, c8.z, r10.y, r7.z
-mul.f r10.y, c0.x, r10.z
-mov.f32f32 r10.z, r17.z
-rcp r4.x, r4.x
-(ss)mov.f32f32 r4.x, r4.x
-mov.f32f32 r10.w, r2.z
-mov.f32f32 r11.x, r9.z
-mov.f32f32 r9.z, r10.z
-mad.f32 r11.y, c7.x, r8.x, c7.x
-mov.f32f32 r12.x, r10.w
-mov.f32f32 r7.z, r7.z
-mad.f32 r9.z, c0.y, r9.z, r10.y
-mov.f32f32 r10.y, r11.y
-absneg.f r11.y, (abs)r12.x
-mul.f r12.x, r7.z, c10.x
-mov.f32f32 r9.z, r9.z
-mov.f32f32 r12.y, r15.x
-cmps.f.lt r11.y, c11.x, r11.y
-mov.f32f32 r10.y, r10.y
-mov.f32f32 r12.x, r12.x
-mov.f32f32 r12.z, r12.y
-cov.u32f32 r12.w, r11.y
-mov.f32f32 r11.y, r10.y
-absneg.f r10.y, (neg)c0.x
-mad.f32 r9.z, c0.z, r12.z, r9.z
-mov.f32f32 r12.z, r12.w
-mov.f32f32 r12.w, r2.z
-mov.f32f32 r10.y, r10.y
-max.f r9.z, c8.y, r9.z
-cmps.f.ne r12.z, r12.z, c8.y
-mov.f32f32 r13.x, c8.y
-sam (f32)(x)r14.y, r11.x, s#2, t#2
-(sy)(ss)cmps.f.lt r11.x, r15.z, r14.y
-mov.f32f32 r9.z, r9.z
-mad.f32 r10.y, c8.z, r10.y, (neg)r12.x
-cmps.f.lt r4.z, r4.z, c8.y
-mov.f32f32 r11.y, r13.x
-mov.f32f32 r12.x, c10.x
-add.f r12.w, r12.w, (neg)c1.z
-cov.u32f32 r4.z, r4.z
-log2 r9.z, r9.z
-(ss)mul.f r9.z, c12.y, r9.z
-sel.b32 r11.y, r11.y, r12.z, r12.x
-mov.f32f32 r12.x, r1.w
-cov.u32f32 r11.x, r11.x
-mov.f32f32 r9.z, r9.z
-cmps.f.ne r4.z, r4.z, c8.y
-mov.f32f32 r13.x, c8.y
-absneg.f r12.x, (abs)r12.x
-mad.f32 r5.y, r12.w, r12.w, r5.y
-mul.f r6.x, r6.x, r6.x
-mov.f32f32 r7.w, r7.w
-exp2 r9.z, r9.z
-mov.f32f32 r10.x, r10.x
-cmps.f.lt r12.x, c11.x, r12.x
-mov.f32f32 r11.x, r11.x
-sel.b32 r10.y, r13.x, r4.z, r10.y
-mov.f32f32 r10.x, r10.x
-cov.u32f32 r12.x, r12.x
-cmps.f.ne r11.x, r11.x, c8.y
-absneg.f r10.y, (neg)r10.y
-mov.f32f32 r12.w, r10.x
-mov.f32f32 r10.x, r10.z
-mov.f32f32 r10.z, r12.x
-sel.b32 r0.y, r1.x, r11.x, r0.y
-mov.f32f32 r1.x, r15.z
-mov.f32f32 r10.x, r10.x
-cmps.f.ne r10.z, r10.z, c8.y
-mov.f32f32 r11.x, r1.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r13.x, r10.x
-mov.f32f32 r10.x, r12.y
-mov.f32f32 r11.x, r11.x
-mad.f32 r1.x, c7.x, r1.x, c7.z
-mov.f32f32 r12.x, r10.y
-mov.f32f32 r10.x, r10.x
-absneg.f r11.x, (neg)r11.x
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r13.y, r10.x
-mov.f32f32 r10.x, r11.x
-mov.f32f32 r1.x, r1.x
-rcp r11.x, r12.x
-(ss)mul.f r2.x, r2.x, r11.x
-mad.f32 r0.x, r7.w, r2.w, r0.x
-cmps.f.ne r7.x, r7.x, c8.y
-sqrt r5.y, r5.y
-mov.f32f32 r7.w, r10.x
-sam.3d (f32)(xyz)r12.w, r12.w, s#3, t#3
-(sy)mad.f32 r10.x, c13.z, r9.z, r13.y
-mad.f32 r11.x, c13.y, r9.z, r13.x
-(ss)mad.f32 r9.z, c13.x, r9.z, r12.w
-sel.b32 r7.w, r7.w, r10.z, r11.y
-sel.b32 r4.w, r4.w, r5.x, r10.x
-mov.f32f32 r12.x, r1.x
-mov.f32f32 r1.x, r16.x
-sel.b32 r8.w, r8.w, r5.x, r11.x
-sel.b32 r0.w, r0.w, r5.x, r9.z
-mul.f r5.x, r2.y, r7.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r7.w, c8.y
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r9.z, r0.z
-mad.f32 r1.x, c7.x, r1.x, c7.x
-mov.f32f32 r7.w, r7.w
-mov.f32f32 r10.x, c10.y
-add.f r9.z, c7.z, (neg)r9.z
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r11.x, r10.y
-sel.b32 r7.w, r7.w, r12.z, r10.x
-mov.f32f32 r10.x, c8.y
-mov.f32f32 r1.x, r1.x
-(ss)mov.f32f32 r5.y, r5.y
-mov.f32f32 r11.y, c2.x
-mov.f32f32 r0.x, r0.x
-mov.f32f32 r12.y, r1.x
-mov.f32f32 r1.x, r10.x
-rcp r10.x, r11.x
-(ss)mul.f r9.z, r9.z, r10.x
-add.f r10.x, r0.x, (neg)c1.y
-mov.f32f32 r8.z, r8.z
-(ss)rcp r11.x, r11.y
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r9.z, r9.z
-sam (f32)(xyz)r12.w, r12.x, s#0, t#0
-(sy)(ss)mov.f32f32 r11.y, r13.y
-mov.f32f32 r12.x, r16.x
-mov.f32f32 r12.y, r13.x
-mov.f32f32 r12.w, r12.w
-sel.b32 r1.x, r1.x, r10.z, r7.w
-mov.f32f32 r7.w, r12.x
-max.f r12.x, r2.x, r9.z
-(ss)mul.f r5.y, r5.y, r11.x
-mad.f32 r6.x, r10.x, r10.x, r6.x
-mad.f32 r7.w, c7.x, r7.w, c7.x
-mad.f32 r1.x, r1.y, r1.x, r5.x
-mov.f32f32 r1.y, r12.x
-mov.f32f32 r5.x, r0.x
-mov.f32f32 r7.w, r7.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r10.x, r10.w
-add.f r5.x, c10.w, (neg)r5.x
-mov.f32f32 r7.w, r7.w
-mul.f r11.x, r7.z, c10.y
-mov.f32f32 r10.x, r10.x
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r13.x, r7.w
-mov.f32f32 r7.w, r8.x
-absneg.f r10.x, (neg)r10.x
-mov.f32f32 r11.x, r11.x
-mov.f32f32 r3.z, r3.z
-mov.f32f32 r7.w, r7.w
-mov.f32f32 r10.x, r10.x
-mov.f32f32 r12.x, c10.x
-mad.f32 r3.z, c8.z, r3.z, (neg)r11.x
-mad.f32 r7.w, c7.x, r7.w, c7.x
-mov.f32f32 r11.x, c8.y
-sel.b32 r10.x, r10.x, r12.z, r12.x
-mov.f32f32 r12.x, c8.y
-mov.f32f32 r7.w, r7.w
-sel.b32 r3.z, r11.x, r4.z, r3.z
-log2 r5.y, r5.y
-(ss)mul.f r5.y, c9.y, r5.y
-mov.f32f32 r11.x, r12.x
-mov.f32f32 r7.w, r7.w
-absneg.f r3.z, (neg)r3.z
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r6.x, r6.x
-mov.f32f32 r13.y, r7.w
-mov.f32f32 r7.w, r11.x
-mov.f32f32 r11.x, r3.z
-mad.f32 r2.w, r8.z, r2.w, r3.x
-mov.f32f32 r3.x, r15.z
-exp2 r5.y, r5.y
-sel.b32 r7.w, r7.w, r10.z, r10.x
-(ss)rcp r5.y, r5.y
-(ss)mov.f32f32 r5.y, r5.y
-sam (f32)(xyz)r13.x, r13.x, s#0, t#0
-(sy)mov.f32f32 r8.z, r13.z
-mov.f32f32 r10.x, r13.y
-mov.f32f32 r12.x, r13.x
-mad.f32 r1.x, r6.w, r7.w, r1.x
-sel.b32 r7.w, r11.y, r3.y, r8.z
-mad.f32 r3.x, c7.x, r3.x, c7.z
-sel.b32 r8.z, r12.y, r3.y, r10.x
-sel.b32 r3.y, r12.w, r3.y, r12.x
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r3.x, r3.x
-rcp r10.x, r11.x
-(ss)mul.f r5.x, r5.x, r10.x
-mul.f r5.y, c9.w, r5.y
-max.f r1.x, c8.y, r1.x
-mov.f32f32 r3.x, r3.x
-mov.f32f32 r5.x, r5.x
-mov.f32f32 r10.x, r0.x
-mov.f32f32 r1.x, r1.x
-(ss)mov.f32f32 r11.x, r3.x
-mov.f32f32 r3.x, r8.x
-add.f r8.x, c7.w, (neg)r10.x
-mov.f32f32 r10.x, r3.z
-mov.f32f32 r11.y, r1.x
-mad.f32 r3.x, c7.x, r3.x, c7.x
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r2.w, r2.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r3.x, r3.x
-mul.f r4.x, r11.y, r4.x
-rcp r10.x, r10.x
-(ss)mul.f r8.x, r8.x, r10.x
-add.f r5.y, c7.z, (neg)r5.y
-mov.f32f32 r3.x, r3.x
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r8.x, r8.x
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r11.y, r3.x
-mov.f32f32 r3.x, r1.w
-(ss)mov.f32f32 r10.x, r1.w
-max.f r12.x, r5.x, r8.x
-add.f r12.y, r2.w, (neg)c1.z
-mov.f32f32 r12.w, r9.x
-mov.f32f32 r13.x, r2.w
-sam (f32)(xyz)r14.y, r11.x, s#0, t#0
-(sy)(ss)mov.f32f32 r11.x, r14.w
-mov.f32f32 r11.y, r14.z
-mov.f32f32 r13.y, r14.y
-mul.f r3.x, r3.x, r10.x
-mov.f32f32 r10.x, r11.x
-mov.f32f32 r11.x, r11.y
-mov.f32f32 r11.y, r13.y
-mov.f32f32 r13.y, r9.x
-sel.b32 r7.w, r10.x, r6.z, r7.w
-sel.b32 r8.z, r11.x, r6.z, r8.z
-sel.b32 r3.y, r11.y, r6.z, r3.y
-mov.f32f32 r6.z, r9.x
-mul.f r7.w, r7.w, r0.y
-mov.f32f32 r10.x, r4.y
-mul.f r8.z, r8.z, r0.y
-mul.f r0.y, r3.y, r0.y
-mad.f32 r3.x, r13.y, r6.z, r3.x
-cmps.f.lt r3.y, r10.x, c8.y
-mov.f32f32 r6.z, r12.x
-mad.f32 r6.x, r12.y, r12.y, r6.x
-mov.f32f32 r3.x, r3.x
-cov.u32f32 r3.y, r3.y
-mov.f32f32 r10.x, r2.z
-mov.f32f32 r11.x, r2.z
-min.f r1.y, r1.y, r6.z
-cmps.f.ne r3.y, r3.y, c8.y
-mov.f32f32 r6.z, r2.w
-mad.f32 r3.x, r10.x, r11.x, r3.x
-mov.f32f32 r6.x, r6.x
-sel.b32 r4.w, r7.w, r3.y, r4.w
-sel.b32 r7.w, r8.z, r3.y, r8.w
-sel.b32 r0.y, r0.y, r3.y, r0.w
-add.f r0.w, c10.w, (neg)r6.z
-sel.b32 r3.y, r5.w, r7.x, r4.w
-sel.b32 r4.w, r7.y, r7.x, r7.w
-sel.b32 r0.y, r3.w, r7.x, r0.y
-rsq r3.x, r3.x
-(ss)mov.f32f32 r3.x, r3.x
-mov.f32f32 r3.w, r3.y
-mov.f32f32 r5.w, r4.w
-mov.f32f32 r6.z, r0.y
-mul.f r3.x, c7.x, r3.x
-mul.f r3.w, r3.w, c14.z
-mul.f r5.w, r5.w, c14.y
-mul.f r6.z, r6.z, c14.x
-mul.f r3.x, r3.x, r5.y
-mov.f32f32 r3.w, r3.w
-cmps.f.lt r4.y, r4.y, c8.y
-mov.f32f32 r5.y, r5.w
-mov.f32f32 r5.w, r6.z
-mov.f32f32 r3.x, r3.x
-cov.u32f32 r4.y, r4.y
-mul.f r6.z, r7.z, c10.x
-sqrt r6.x, r6.x
-(ss)mov.f32f32 r6.x, r6.x
-mov.f32f32 r7.x, r3.x
-cmps.f.ne r4.y, r4.y, c8.y
-mad.f32 r4.x, c7.x, r4.x, r7.x
-mov.f32f32 r6.z, r6.z
-absneg.f r7.x, (neg)c0.z
-sel.b32 r3.y, r3.w, r4.y, r3.y
-mov.f32f32 r3.w, r11.z
-sel.b32 r4.w, r5.y, r4.y, r4.w
-sel.b32 r0.y, r5.w, r4.y, r0.y
-mov.f32f32 r4.x, r4.x
-add.f r3.w, c7.z, (neg)r3.w
-mov.f32f32 r3.x, r3.x
-mov.f32f32 r4.y, r12.w
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r3.w, r3.w
-mov.f32f32 r5.y, r7.x
-mov.f32f32 r5.w, c2.x
-mul.f r2.y, r4.y, r2.y
-absneg.f r4.y, (abs)r13.x
-mad.f32 r5.y, c8.z, r5.y, (neg)r6.z
-mov.f32f32 r6.z, c8.y
+sam (f32)(xyz)r13.x, r5.z, s#0, t#0
+(sy)(ss)sel.b32 r5.z, r13.z, r2.w, r10.w
+mad.f32 r8.y, c7.x, r17.y, c7.x
+mad.f32 r8.x, c7.x, r9.z, c7.z
+sel.b32 r5.w, r13.y, r2.w, r10.z
+sel.b32 r2.w, r13.x, r2.w, r10.y
+min.f r1.w, r1.w, r7.y
+add.f r7.y, c10.w, (neg)r4.w
+mul.f r7.z, r8.w, c10.x
+absneg.f r8.z, (neg)c0.z
+sam (f32)(xyz)r8.w, r8.x, s#0, t#0
+(sy)sel.b32 r5.z, r9.y, r6.w, r5.z
+sel.b32 r5.w, r9.x, r6.w, r5.w
+sel.b32 r2.w, r8.w, r6.w, r2.w
+mad.f32 r6.w, c8.z, r8.z, (neg)r7.z
+mul.f r5.z, r5.z, r3.y
+cmps.f.lt r7.z, r18.y, c12.x
+mul.f r5.w, r5.w, r3.y
+mul.f r2.w, r2.w, r3.y
+mov.f32f32 r3.y, c8.y
+cov.u32f32 r7.z, r7.z
+rcp r7.x, r7.x
+(ss)mul.f r3.w, r3.w, r7.x
+(ss)mov.f32f32 r7.x, c8.y
+sel.b32 r2.z, r3.y, r2.z, r6.w
+cmps.f.ne r3.y, r7.z, c8.y
+mad.f32 r6.w, c0.y, r7.w, r12.z
+mov.f32f32 r7.z, c10.x
+mad.f32 r6.w, c0.z, r11.y, r6.w
+absneg.f r2.z, (neg)r2.z
log2 r3.w, r3.w
-(ss)mul.f r3.w, c9.x, r3.w
-mul.f r2.y, r2.y, r11.w
-rcp r5.w, r5.w
-(ss)mul.f r5.w, r6.x, r5.w
-sel.b32 r4.z, r6.z, r4.z, r5.y
-mov.f32f32 r3.w, r3.w
+(ss)mul.f r3.w, c9.y, r3.w
+sel.b32 r7.x, r7.x, r5.x, r7.z
+max.f r6.w, c8.y, r6.w
+absneg.f r0.z, (abs)r0.z
+cmps.f.ne r5.y, r5.y, c8.y
+mad.f32 r8.y, c7.x, r10.x, c7.x
+mad.f32 r8.x, c7.x, r4.z, c7.z
mov.f32f32 r2.y, r2.y
-mov.f32f32 r5.y, r1.w
-absneg.f r4.z, (neg)r4.z
-mov.f32f32 r5.w, r5.w
-cmps.f.lt r4.y, c11.x, r4.y
-mov.f32f32 r5.y, r5.y
+rcp r7.z, r2.z
+(ss)mul.f r7.y, r7.y, r7.z
+log2 r6.w, r6.w
+(ss)mul.f r6.w, c12.y, r6.w
+add.f r7.z, c7.z, (neg)r4.w
+rcp r8.z, r2.z
+nop
exp2 r3.w, r3.w
-(ss)add.f r6.x, c15.y, (neg)r3.w
-mov.f32f32 r6.z, r4.z
-cov.u32f32 r4.y, r4.y
-add.f r2.y, r5.y, (neg)r2.y
-mul.f r5.y, r6.x, c8.w
-(ss)mul.f r3.w, r3.w, c7.z
-log2 r5.w, r5.w
-(ss)mul.f r5.w, c9.y, r5.w
-mov.f32f32 r2.y, r2.y
-rcp r6.x, r6.z
-(ss)mul.f r0.w, r0.w, r6.x
-add.f r3.w, r3.w, r5.y
-mov.f32f32 r5.y, r5.w
-mad.f32 r2.y, c10.z, r2.y, c7.x
-mov.f32f32 r0.w, r0.w
-add.f r5.w, c15.y, (neg)r3.w
-add.f r6.x, c15.y, (neg)r3.w
-(ss)add.f r6.z, c15.y, (neg)r3.w
-mov.f32f32 r2.y, r2.y
-mul.f r3.y, r5.w, r3.y
-mul.f r4.w, r6.x, r4.w
-mul.f r0.y, r6.z, r0.y
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r5.w, r2.w
-exp2 r5.y, r5.y
nop
-(ss)rcp r5.y, r5.y
-(ss)mov.f32f32 r5.y, r5.y
-mov.f32f32 r2.y, r2.y
-add.f r5.w, c7.z, (neg)r5.w
-mov.f32f32 r6.x, r4.z
-mul.f r5.y, c9.w, r5.y
-mov.f32f32 r7.x, r2.y
-mov.f32f32 r2.y, r12.w
-mov.f32f32 r6.z, r6.w
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r4.y, r4.y
-rcp r6.x, r6.x
-(ss)mul.f r5.w, r5.w, r6.x
-mul.f r2.y, r2.y, r6.z
-add.f r5.y, c7.z, (neg)r5.y
-cmps.f.ne r4.y, r4.y, c8.y
-mov.f32f32 r5.w, r5.w
-mul.f r2.y, r2.y, r11.w
-mov.f32f32 r5.y, r5.y
-(ss)mul.f r6.x, r0.z, r0.z
-max.f r6.z, r0.w, r5.w
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r6.w, r2.z
-mad.f32 r6.x, r0.x, r0.x, r6.x
-mov.f32f32 r6.z, r6.z
-mov.f32f32 r7.y, c8.y
-mov.f32f32 r6.w, r6.w
-mov.f32f32 r6.x, r6.x
-min.f r1.y, r1.y, r6.z
-mad.f32 r6.x, r2.w, r2.w, r6.x
-add.f r2.y, r6.w, (neg)r2.y
-mov.f32f32 r6.z, r7.y
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r6.w, c10.x
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r7.y, r0.x
-mov.f32f32 r7.z, r3.z
-rsq r6.x, r6.x
-(ss)mov.f32f32 r6.x, r6.x
-mad.f32 r2.y, c10.z, r2.y, c7.x
-sel.b32 r6.z, r6.z, r4.y, r6.w
-mad.f32 r6.w, r7.z, r1.y, r7.y
-absneg.f r7.y, (abs)r0.z
-mov.f32f32 r2.y, r2.y
-mul.f r6.x, c7.x, r6.x
-mov.f32f32 r6.w, r6.w
-cmps.f.lt r7.y, c11.x, r7.y
-mov.f32f32 r2.y, r2.y
-mul.f r5.y, r6.x, r5.y
-add.f r6.x, r6.w, c11.z
-cov.u32f32 r6.w, r7.y
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r5.y, r5.y
-mov.f32f32 r6.x, r6.x
-mov.f32f32 r6.w, r6.w
-mov.f32f32 r7.y, r2.y
-mov.f32f32 r2.y, r5.y
-mov.f32f32 r5.y, r5.y
-mul.f r6.x, c11.y, r6.x
-cmps.f.ne r6.w, r6.w, c8.y
-mov.f32f32 r7.z, r0.z
-min.f r2.x, r2.x, r9.z
-sam (f32)(xy)r11.x, r7.x, s#1, t#1
-(sy)mul.f r1.x, r1.x, r11.x
-mov.f32f32 r6.x, r6.x
-min.f r5.x, r5.x, r8.x
-(ss)absneg.f r7.x, (neg)r7.z
-mul.f r1.x, r1.x, c7.w
-cmps.f.lt r7.y, r9.w, c9.z
-max.f r2.x, r2.x, r5.x
-min.f r0.w, r0.w, r5.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r5.x, r7.x
-cov.u32f32 r5.w, r7.y
-max.f r0.w, r2.x, r0.w
-mad.f32 r1.x, r1.x, r11.y, r3.x
-mov.f32f32 r2.x, r5.x
-cmps.f.ne r3.x, r5.w, c8.y
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r5.x, r1.w
-sel.b32 r2.x, r2.x, r6.w, r6.z
-add.f r0.w, r1.y, (neg)r0.w
-mov.f32f32 r1.y, r0.x
-mad.f32 r5.x, c7.x, r5.x, c7.x
-mul.f r2.x, r10.y, r2.x
-mov.f32f32 r5.w, c8.y
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r5.x, r5.x
-mov.f32f32 r6.z, r10.y
-mov.f32f32 r5.w, r5.w
-mov.f32f32 r7.x, r0.x
-mov.f32f32 r5.x, r5.x
-mad.f32 r0.w, c11.w, r0.w, c7.z
-mov.f32f32 r7.y, c10.y
-mul.f r1.y, r1.y, r6.z
-mov.f32f32 r7.z, r5.x
-mov.f32f32 r5.x, r2.z
-mov.f32f32 r0.w, r0.w
-sel.b32 r5.w, r5.w, r4.y, r7.y
-mov.f32f32 r6.z, c8.y
-mad.f32 r5.x, c7.x, r5.x, c7.x
-mov.f32f32 r7.y, r3.z
-mov.f32f32 r7.w, r4.z
-mov.f32f32 r6.z, r6.z
-mov.f32f32 r5.x, r5.x
-rcp r0.w, r0.w
-(ss)mov.f32f32 r0.w, r0.w
-mul.f r7.x, r7.x, r7.w
-mov.f32f32 r6.z, r6.z
-mov.f32f32 r5.x, r5.x
-mul.f r0.w, r6.x, r0.w
-rcp r6.x, r7.y
-(ss)mul.f r1.y, r1.y, r6.x
-sel.b32 r5.w, r6.z, r6.w, r5.w
-mov.f32f32 r7.w, r5.x
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r5.x, r0.z
-mad.f32 r2.x, r3.z, r5.w, r2.x
-mul.f r3.z, r7.x, r6.x
-mov.f32f32 r5.w, r9.x
-sam (f32)(x)r7.x, r7.z, s#2, t#2
-mov.f32f32 r6.x, r9.x
-exp2 r0.w, r0.w
-(ss)mov.f32f32 r0.w, r0.w
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r6.z, r2.w
-(sy)cmps.f.lt r6.x, r6.x, r7.x
-add.f r0.w, c7.z, r0.w
-add.f r1.y, r5.x, (neg)r1.y
-mov.f32f32 r5.x, r6.z
-cov.u32f32 r6.x, r6.x
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r1.y, r1.y
-absneg.f r5.x, (neg)r5.x
-mov.f32f32 r6.x, r6.x
-mov.f32f32 r3.z, r3.z
-mad.f32 r1.y, c10.z, r1.y, c7.x
-mov.f32f32 r5.x, r5.x
-cmps.f.ne r6.x, r6.x, c8.y
-rcp r0.w, r0.w
-(ss)mov.f32f32 r0.w, r0.w
-mov.f32f32 r6.z, c10.x
-mov.f32f32 r1.y, r1.y
-sel.b32 r1.x, r1.x, r6.x, r4.x
-mov.f32f32 r4.x, r5.w
-sel.b32 r5.x, r5.x, r4.y, r6.z
-mov.f32f32 r5.w, c8.y
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r6.x, r2.w
-mov.f32f32 r5.w, r5.w
-mov.f32f32 r1.y, r1.y
-mad.f32 r4.x, c7.x, r4.x, c7.z
-add.f r3.z, r6.x, (neg)r3.z
-mov.f32f32 r5.w, r5.w
-mov.f32f32 r6.x, r0.x
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r7.x, r1.y
-mov.f32f32 r1.y, r3.z
-sel.b32 r3.z, r5.w, r6.w, r5.x
-mov.f32f32 r4.x, r4.x
-mov.f32f32 r5.x, r6.x
-mad.f32 r1.y, c10.z, r1.y, c7.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r5.w, r4.x
-mad.f32 r2.x, r4.z, r3.z, r2.x
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r3.z, r1.w
-mad.f32 r4.x, c7.x, r5.x, c7.z
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r4.z, r9.x
-mov.f32f32 r3.z, r3.z
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r4.x, r4.x
-mad.f32 r3.z, c7.x, r3.z, c7.x
-max.f r2.x, c8.y, r2.x
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r4.x, r4.x
+(ss)rcp r3.w, r3.w
+(ss)mul.f r3.w, c9.w, r3.w
+mul.f r7.z, r7.z, r8.z
+cmps.f.lt r0.z, c11.x, r0.z
+exp2 r6.w, r6.w
+mov.f32f32 r8.z, r11.z
+mov.f32f32 r8.w, r7.w
+mov.f32f32 r9.x, r11.y
+max.f r7.w, r7.y, r7.z
+add.f r3.w, c7.z, (neg)r3.w
+mul.f r9.y, r10.x, r10.x
+cov.u32f32 r0.z, r0.z
+min.f r1.w, r1.w, r7.w
+mad.f32 r7.w, r4.z, r4.z, r9.y
+sam.3d (f32)(xyz)r8.z, r8.z, s#3, t#3
+(sy)(ss)mad.f32 r9.x, c13.z, r6.w, r9.x
+mad.f32 r8.w, c13.y, r6.w, r8.w
+mad.f32 r6.w, c13.x, r6.w, r8.z
+mov.f32f32 r8.z, r1.w
+sel.b32 r5.z, r5.z, r3.y, r9.x
mov.f32f32 r3.z, r3.z
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r7.y, r1.y
-mov.f32f32 r7.z, r4.x
-mov.f32f32 r1.y, r3.z
-mov.f32f32 r3.z, r2.x
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r4.x, r0.z
-mov.f32f32 r6.x, r1.y
-mul.f r0.w, r3.z, r0.w
-sam (f32)(xy)r9.z, r7.x, s#1, t#1
-(sy)mul.f r1.y, r2.x, r9.z
-mov.f32f32 r2.x, r4.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r3.z, r4.z
-mad.f32 r4.x, c7.x, r0.z, c7.x
-sam (f32)(xyz)r11.x, r5.w, s#0, t#0
-(sy)mov.f32f32 r4.z, r11.z
-mad.f32 r1.w, c7.x, r1.w, c7.x
-mov.f32f32 r5.x, r11.y
-(ss)mov.f32f32 r5.w, r11.x
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r1.w, r1.w
-mul.f r1.y, r1.y, c7.w
-mad.f32 r2.x, c7.x, r2.x, c7.x
-mad.f32 r3.z, c7.x, r3.z, c7.z
-mov.f32f32 r1.w, r1.w
-mad.f32 r0.w, c7.x, r0.w, r5.y
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r7.x, r1.w
-mov.f32f32 r1.w, r10.w
-mov.f32f32 r0.w, r0.w
-mad.f32 r1.y, r1.y, r9.w, r2.y
-mov.f32f32 r2.x, r2.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r2.y, r3.z
+sel.b32 r5.w, r5.w, r3.y, r8.w
+sel.b32 r2.w, r2.w, r3.y, r6.w
+mad.f32 r3.y, r4.w, r4.w, r7.w
+min.f r2.y, r2.y, r3.z
mov.f32f32 r3.z, r4.x
-mov.f32f32 r7.w, r2.x
-mad.f32 r1.w, c7.x, r1.w, c7.x
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r2.x, r3.z
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r0.z, r0.z
-sam (f32)(xyz)r9.z, r7.z, s#0, t#0
-mov.f32f32 r3.z, r0.x
-(ss)mov.f32f32 r7.z, r2.x
-mov.f32f32 r1.w, r1.w
-mad.f32 r2.x, c7.x, r2.w, c7.x
-(sy)mov.f32f32 r4.x, r10.x
-mov.f32f32 r5.y, r9.w
-mov.f32f32 r7.y, r1.w
-mov.f32f32 r1.w, r2.x
-mov.f32f32 r0.z, r0.z
-mov.f32f32 r2.x, r9.z
-mov.f32f32 r8.z, r2.y
-mov.f32f32 r2.y, r2.z
-mad.f32 r0.z, c7.x, r0.z, c7.x
-sam (f32)(xyz)r9.z, r7.x, s#0, t#0
-(sy)mov.f32f32 r2.z, r10.x
-mov.f32f32 r6.x, r9.w
-mov.f32f32 r6.z, r9.z
-mov.f32f32 r1.w, r1.w
-sel.b32 r2.z, r4.z, r12.z, r2.z
-mov.f32f32 r2.y, r2.y
-sel.b32 r4.z, r5.x, r12.z, r6.x
-sel.b32 r5.x, r5.w, r12.z, r6.z
-mov.f32f32 r7.w, r1.w
-mad.f32 r1.w, c7.x, r2.y, c7.x
-mov.f32f32 r0.z, r0.z
-mad.f32 r2.y, c7.x, r3.z, c7.z
-mov.f32f32 r3.z, r2.w
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r0.z, r0.z
-(ss)nop
-sam (f32)(x)r7.x, r7.z, s#2, t#2
-mov.f32f32 r2.y, r2.y
-(sy)cmps.f.lt r0.x, r0.x, r7.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r5.w, r0.z
-mov.f32f32 r0.z, r3.z
-cov.u32f32 r0.x, r0.x
-mov.f32f32 r8.w, r1.w
-mov.f32f32 r1.w, r2.y
-mad.f32 r0.z, c7.x, r0.z, c7.x
-mov.f32f32 r0.x, r0.x
-mov.f32f32 r2.y, r2.w
-mov.f32f32 r7.x, r1.w
-mov.f32f32 r0.z, r0.z
-(ss)nop
-sam (f32)(xyz)r7.y, r8.z, s#0, t#0
-(sy)mov.f32f32 r1.w, r7.w
-mov.f32f32 r2.w, r7.z
-mov.f32f32 r3.z, r7.y
-cmps.f.ne r0.x, r0.x, c8.y
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r2.w, r2.w
-mov.f32f32 r3.z, r3.z
-sel.b32 r0.x, r1.y, r0.x, r0.w
-sel.b32 r0.w, r1.w, r10.z, r2.z
-sel.b32 r1.y, r2.w, r10.z, r4.z
-sel.b32 r1.w, r3.z, r10.z, r5.x
-mov.f32f32 r0.z, r0.z
-mul.f r0.w, r0.w, r1.x
-cmps.f.lt r2.z, r9.x, c12.x
-mul.f r1.y, r1.y, r1.x
-mul.f r1.x, r1.w, r1.x
-mov.f32f32 r6.x, r0.z
-cov.u32f32 r0.z, r2.z
-mad.f32 r1.w, c7.x, r2.y, c7.x
-mov.f32f32 r2.y, r14.x
-mov.f32f32 r2.z, r14.x
+mov.f32f32 r4.x, r6.y
cmps.f.ne r0.z, r0.z, c8.y
-mov.f32f32 r1.w, r1.w
-mul.f r2.y, c0.x, r2.y
-mov.f32f32 r2.w, r15.w
-sam (f32)(xyz)r7.y, r5.w, s#0, t#0
-(sy)mov.f32f32 r3.z, r7.z
-mov.f32f32 r4.z, r7.y
-mov.f32f32 r5.x, r7.w
-(ss)mov.f32f32 r5.w, r2.w
-sel.b32 r3.z, r5.y, r4.y, r3.z
-sel.b32 r2.x, r2.x, r4.y, r4.z
-sel.b32 r4.x, r4.x, r4.y, r5.x
-mad.f32 r2.y, c0.y, r5.w, r2.y
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r4.y, r9.y
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r7.y, r1.w
-mov.f32f32 r7.z, r2.z
-mov.f32f32 r1.w, r4.y
-mov.f32f32 r2.z, r2.w
-mov.f32f32 r2.w, r4.y
-cmps.f.lt r4.y, r8.y, c8.y
-mad.f32 r1.w, c0.z, r1.w, r2.y
-sam (f32)(xyz)r8.z, r7.x, s#0, t#0
-(sy)mov.f32f32 r2.y, r8.z
-mov.f32f32 r4.z, r9.x
-mov.f32f32 r5.x, r8.w
-max.f r1.w, c8.y, r1.w
-mov.f32f32 r2.y, r2.y
-mov.f32f32 r4.z, r4.z
-mov.f32f32 r5.x, r5.x
-mov.f32f32 r1.w, r1.w
-sel.b32 r2.x, r2.y, r6.w, r2.x
-sel.b32 r2.y, r4.z, r6.w, r4.x
-sel.b32 r3.z, r5.x, r6.w, r3.z
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r2.w, r2.w
-cov.u32f32 r4.x, r4.y
-log2 r1.w, r1.w
-(ss)mul.f r1.w, c12.y, r1.w
-mul.f r2.y, r2.y, r0.x
-mul.f r3.z, r3.z, r0.x
-mul.f r0.x, r2.x, r0.x
-mov.f32f32 r1.w, r1.w
-mov.f32f32 r7.w, r2.z
-mov.f32f32 r8.x, r2.w
-mov.f32f32 r2.x, r4.x
-mov.f32f32 r2.z, r8.y
-mov.f32f32 r2.w, c7.z
-nop
+absneg.f r6.y, (neg)r10.x
+mad.f32 r1.w, r3.x, r1.w, r4.z
+min.f r3.z, r3.z, r4.x
+rsq r3.y, r3.y
+(ss)mul.f r3.y, c7.x, r3.y
+sel.b32 r4.x, r6.y, r0.z, r7.x
+add.f r1.w, r1.w, c11.z
+max.f r2.y, r2.y, r3.z
+mov.f32f32 r3.z, r7.y
+mov.f32f32 r6.y, r7.z
+mul.f r3.y, r3.y, r3.w
+mul.f r3.w, r4.y, r4.x
+mov.f32f32 r4.x, c8.y
+min.f r3.z, r3.z, r6.y
+mov.f32f32 r6.y, r3.y
+mov.f32f32 r6.w, c10.y
+mul.f r1.w, c11.y, r1.w
+max.f r2.y, r2.y, r3.z
+sam (f32)(xyz)r7.x, r8.x, s#0, t#0
+absneg.f r3.z, (neg)r4.w
+sel.b32 r4.x, r4.x, r5.x, r6.w
+mov.f32f32 r6.w, c8.y
+add.f r2.y, r8.z, (neg)r2.y
+mad.f32 r7.w, c7.x, r10.x, c7.x
+(ss)mov.f32f32 r8.y, c10.x
+sel.b32 r4.x, r6.w, r0.z, r4.x
+mad.f32 r2.y, c11.w, r2.y, c7.z
+mad.f32 r8.x, c7.x, r4.w, c7.x
+sel.b32 r3.z, r3.z, r5.x, r8.y
+mad.f32 r8.y, c7.x, r10.x, c7.x
+mul.f r4.y, r4.z, r4.y
+rcp r6.w, r3.x
+(ss)mad.f32 r3.x, r3.x, r4.x, r3.w
+mov.f32f32 r3.w, c8.y
+rcp r2.y, r2.y
+(ss)mul.f r1.w, r1.w, r2.y
+sam (f32)(xyz)r8.z, r7.w, s#0, t#0
+(sy)(ss)sel.b32 r2.y, r7.x, r5.x, r8.z
+sel.b32 r4.x, r7.z, r5.x, r9.x
+sel.b32 r5.x, r7.y, r5.x, r8.w
+sel.b32 r3.z, r3.w, r0.z, r3.z
+mad.f32 r7.y, c7.x, r2.x, c7.x
+mad.f32 r8.z, c7.x, r4.w, c7.x
exp2 r1.w, r1.w
-cmps.f.ne r2.x, r2.x, c8.y
-cmps.f.lt r2.z, r2.z, c8.y
-sam.3d (f32)(xyz)r6.z, r7.z, s#3, t#3
-(sy)(ss)mad.f32 r4.x, c13.z, r1.w, r7.x
-mad.f32 r4.y, c13.y, r1.w, r6.w
-(ss)mad.f32 r1.w, c13.x, r1.w, r6.z
-cov.u32f32 r2.z, r2.z
-sel.b32 r0.w, r0.w, r0.z, r4.x
-sel.b32 r1.y, r1.y, r0.z, r4.y
-sel.b32 r0.z, r1.x, r0.z, r1.w
-cmps.f.ne r1.x, r2.z, c8.y
-mov.f32f32 r1.w, r2.w
-(rpt1)nop
-sel.b32 r0.w, r2.y, r1.x, r0.w
-sel.b32 r1.y, r3.z, r1.x, r1.y
-sel.b32 r0.x, r0.x, r1.x, r0.z
+(ss)add.f r1.w, c7.z, r1.w
+mad.f32 r2.x, r2.z, r3.z, r3.x
+mad.f32 r7.x, c7.x, r0.x, c7.z
+mul.f r0.x, r4.y, r6.w
+mul.f r2.z, r4.z, r2.z
+cmps.f.lt r3.x, r12.w, c8.y
+max.f r2.x, c8.y, r2.x
+rcp r1.w, r1.w
+add.f r0.x, r10.x, (neg)r0.x
+sam (f32)(x)r7.z, r8.y, s#2, t#2
+(sy)cmps.f.lt r3.z, r4.z, r7.z
+mul.f r2.z, r2.z, r6.w
+mov.f32f32 r3.w, r2.x
+mad.f32 r4.y, c10.z, r0.x, c7.x
+sam (f32)(xyz)r6.w, r7.x, s#0, t#0
+(sy)sel.b32 r0.x, r7.x, r0.z, r5.x
+add.f r2.z, r4.w, (neg)r2.z
+(ss)mul.f r1.w, r3.w, r1.w
+sel.b32 r3.w, r7.y, r0.z, r4.x
+cov.u32f32 r3.z, r3.z
+mad.f32 r4.z, c10.z, r2.z, c7.x
+mad.f32 r2.z, c7.x, r1.w, r6.y
+sel.b32 r0.z, r6.w, r0.z, r2.y
+cmps.f.ne r2.y, r3.z, c8.y
+cov.u32f32 r3.x, r3.x
+cmps.f.lt r3.z, r12.w, c8.y
+mov.f32f32 r1.w, c7.z
+sam (f32)(xy)r4.x, r4.y, s#1, t#1
+(sy)mul.f r2.x, r2.x, r4.x
+cmps.f.ne r3.x, r3.x, c8.y
+cov.u32f32 r3.z, r3.z
nop
-sel.b32 r0.z, r6.y, r3.x, r0.w
-sel.b32 r0.w, r5.z, r3.x, r1.y
-sel.b32 r0.x, r1.z, r3.x, r0.x
+mul.f r2.x, r2.x, c7.w
+(rpt2)nop
+mad.f32 r2.x, r2.x, r4.y, r3.y
+cmps.f.ne r3.y, r3.z, c8.y
+(rpt1)nop
+sel.b32 r2.x, r2.x, r2.y, r2.z
+(rpt2)nop
+mul.f r2.y, r3.w, r2.x
+mul.f r0.x, r0.x, r2.x
+mul.f r0.z, r0.z, r2.x
nop
-mov.f32f32 r1.x, r0.z
-mov.f32f32 r1.y, r0.w
-mov.f32f32 r1.z, r0.x
+sel.b32 r2.x, r2.y, r3.y, r5.z
+sel.b32 r0.x, r0.x, r3.y, r5.w
+sel.b32 r0.z, r0.z, r3.y, r2.w
nop
-mul.f r1.x, r1.x, c14.z
-mul.f r1.y, r1.y, c14.y
-mul.f r1.z, r1.z, c14.x
+sel.b32 r2.x, r6.x, r5.y, r2.x
+sel.b32 r0.x, r6.z, r5.y, r0.x
+sel.b32 r0.z, r1.z, r5.y, r0.z
nop
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r1.y, r1.y
-mov.f32f32 r1.z, r1.z
+mul.f r1.z, r2.x, c14.z
+mul.f r2.y, r0.x, c14.y
+mul.f r2.z, r0.z, c14.x
nop
-sel.b32 r0.z, r1.x, r2.x, r0.z
-sel.b32 r0.w, r1.y, r2.x, r0.w
-sel.b32 r0.x, r1.z, r2.x, r0.x
+sel.b32 r1.z, r1.z, r3.x, r2.x
+sel.b32 r0.x, r2.y, r3.x, r0.x
+sel.b32 r0.z, r2.z, r3.x, r0.z
nop
-mul.f r0.z, r3.w, r0.z
-mul.f r0.w, r3.w, r0.w
-mul.f r0.x, r3.w, r0.x
+mul.f r1.z, r1.y, r1.z
+mul.f r0.x, r1.y, r0.x
+mul.f r0.z, r1.y, r0.z
nop
-add.f r0.z, r0.z, r3.y
-add.f r0.w, r0.w, r4.w
-add.f r0.x, r0.x, r0.y
-nop
-mov.f32f32 r1.z, r0.z
-mov.f32f32 r1.y, r0.w
-mov.f32f32 r1.x, r0.x
+add.f r1.z, r1.z, r0.y
+add.f r1.y, r0.x, r1.x
+add.f r1.x, r0.z, r0.w
end
nop
-nop
; FRAG: outputs: r1.x (1:0)
; FRAG: inputs: r0.x (5:20,cm=f,il=8,b=1)
-; FRAG: 2323 instructions, 0 half, 23 full
+; FRAG: 1348 instructions, 0 half, 27 full