diff options
Diffstat (limited to 'reference/webgl-water/webgl-water-38.asm')
-rw-r--r-- | reference/webgl-water/webgl-water-38.asm | 484 |
1 files changed, 173 insertions, 311 deletions
diff --git a/reference/webgl-water/webgl-water-38.asm b/reference/webgl-water/webgl-water-38.asm index 015bad5..a32e656 100644 --- a/reference/webgl-water/webgl-water-38.asm +++ b/reference/webgl-water/webgl-water-38.asm @@ -6,351 +6,213 @@ @out(r1.y) out1 @out(r1.z) out2 @out(r1.w) out3 +@const(c3.x) 0x3f000000, 0x3f7fbe77, 0x3f800000, 0x00000000 +@const(c4.x) 0x3f666666, 0x40800000, 0x3f1013a9, 0x3f400d1b +@const(c5.x) 0x3ec00000, 0x40000000, 0xbf800000, 0x3f800000 +@const(c6.x) 0xc39044fe, 0xbe2ab368, 0x41200000, 0x3ef5c28f +@const(c7.x) 0x3ef5c28f, 0x3f8a3d71, 0x3f99999a, 0x00000000 +@const(c8.x) 0x00000000, 0x3f800000, 0x43000000, 0x00000000 (sy)(ss)absneg.f r0.z, (neg)c0.y bary.f r0.w, 0, r0.x -bary.f r1.x, 1, r0.x -bary.f (ei)r0.x, 2, r0.x +bary.f r1.x, 2, r0.x +bary.f (ei)r0.x, 1, r0.x mul.f r0.y, r0.z, r0.z add.f r1.y, r0.w, (neg)c1.x -mad.f32 r1.z, c3.x, r0.w, c3.x +absneg.f r1.z, (abs)r1.x mad.f32 r1.w, c3.x, r0.w, c3.x add.f r0.y, c3.z, (neg)r0.y mul.f r1.y, r1.y, r1.y -add.f r2.x, r1.x, (neg)c1.y -mov.f32f32 r1.z, r1.z -mov.f32f32 r0.y, r0.y -mov.f32f32 r1.w, r1.w -mad.f32 r1.y, r2.x, r2.x, r1.y -mad.f32 r2.x, c3.x, r1.x, c3.z +add.f r2.y, r0.x, (neg)c1.y +cmps.f.lt r1.z, c3.y, r1.z mul.f r0.y, r0.y, c4.z -mov.f32f32 r1.z, r1.z -mov.f32f32 r1.w, r1.w -mov.f32f32 r1.y, r1.y -mov.f32f32 r0.y, r0.y -add.f r2.y, r0.x, (neg)c1.z -mov.f32f32 r2.z, r1.z -mov.f32f32 r1.z, r1.w +mad.f32 r2.x, c3.x, r1.x, c3.x +mad.f32 r2.z, c3.x, r0.w, c3.x +mul.f r2.w, r0.w, r0.w add.f r0.y, c3.z, (neg)r0.y mad.f32 r1.y, r2.y, r2.y, r1.y -mad.f32 r1.w, c3.x, r0.x, c3.x -mad.f32 r2.y, c3.x, r0.x, c3.x -mov.f32f32 r0.y, r0.y -mov.f32f32 r1.y, r1.y -mov.f32f32 r1.w, r1.w -mov.f32f32 r2.y, r2.y -mov.f32f32 r2.w, r0.y +add.f r2.y, r1.x, (neg)c1.z +cov.u32f32 r1.z, r1.z +mov.f32f32 r3.x, r0.y cmps.f.lt r0.y, r0.y, c3.w -mov.f32f32 r1.w, r1.w -mov.f32f32 r2.y, r2.y -sqrt r1.y, r1.y -mov.f32f32 r2.x, r2.x -(ss)mov.f32f32 r1.y, r1.y -mov.f32f32 r3.x, c2.x -sqrt r2.w, r2.w -(ss)mov.f32f32 r3.y, r2.w -mov.f32f32 r3.z, r0.z +mad.f32 r1.y, r2.y, r2.y, r1.y +cmps.f.ne r1.z, r1.z, c3.w +mad.f32 r3.y, c3.x, r0.x, c3.z +mov.f32f32 r2.y, c3.w +mov.f32f32 r3.w, c3.w +sqrt r3.x, r3.x +(ss)mad.f32 r3.x, c4.w, r0.z, r3.x cov.u32f32 r0.y, r0.y -(ss)mov.f32f32 r2.w, r1.w -mov.f32f32 r1.w, r2.y -mad.f32 r2.y, c4.w, r3.z, r3.y -rcp r3.x, r3.x -(ss)mul.f r1.y, r1.y, r3.x +sqrt r1.y, r1.y +mad.f32 r3.z, c3.x, r0.w, c3.x +mov.f32f32 r4.x, c2.x +mov.f32f32 r4.y, r3.x +mul.f r3.x, r3.x, c3.w +absneg.f r4.z, (neg)c0.z cmps.f.ne r0.y, r0.y, c3.w -mov.f32f32 r2.x, r2.x -mov.f32f32 r2.y, r2.y -mov.f32f32 r1.y, r1.y -sam (f32)(x)r2.z, r2.z, s#2, t#2 -(ss)nop -sam (f32)(x)r2.w, r1.z, s#2, t#2 -(sy)(ss)cmps.f.lt r1.z, r1.x, r2.z -cmps.f.lt r1.w, r1.x, r2.w -mul.f r2.z, r2.y, c3.w -mul.f r2.w, r2.y, c3.z -mul.f r2.y, r2.y, c3.w -cov.u32f32 r1.z, r1.z -mov.f32f32 r2.z, r2.z -absneg.f r3.x, (neg)c0.x -mov.f32f32 r2.w, r2.w -mov.f32f32 r0.z, r0.z -mov.f32f32 r2.y, r2.y -mov.f32f32 r3.x, r3.x -absneg.f r3.y, (neg)c0.z -mad.f32 r0.z, c4.w, r0.z, (neg)r2.w -mov.f32f32 r2.w, c3.w -mad.f32 r2.z, c4.w, r3.x, (neg)r2.z -mov.f32f32 r3.x, c3.w -mov.f32f32 r3.y, r3.y -sel.b32 r0.z, r2.w, r0.y, r0.z +mul.f r4.w, r4.y, c3.w +absneg.f r5.x, (neg)c0.x +mul.f r4.y, r4.y, c3.z +mad.f32 r3.x, c4.w, r4.z, (neg)r3.x +mad.f32 r0.z, c4.w, r0.z, (neg)r4.y +mad.f32 r4.y, c4.w, r5.x, (neg)r4.w +mov.f32f32 r4.z, c3.w +mov.f32f32 r4.w, c3.w +mov.f32f32 r5.x, c3.w +rcp r4.x, r4.x +(ss)mul.f r1.y, r1.y, r4.x +sel.b32 r4.x, r4.z, r0.y, r4.y +sel.b32 r0.z, r4.w, r0.y, r0.z +sel.b32 r0.y, r5.x, r0.y, r3.x +sam (f32)(xyz)r4.y, r3.y, s#0, t#0 +mad.f32 r3.x, c3.x, r0.w, c3.x +(ss)absneg.f r3.y, (neg)r4.x +absneg.f r0.z, (neg)r0.z +mov.f32f32 r3.z, c3.w +absneg.f r0.y, (neg)r0.y +mul.f r4.x, r0.x, r3.y log2 r1.y, r1.y (ss)mul.f r1.y, c4.y, r1.y -sel.b32 r2.z, r3.x, r0.y, r2.z -mad.f32 r2.y, c4.w, r3.y, (neg)r2.y -absneg.f r0.z, (neg)r0.z -mov.f32f32 r1.y, r1.y -absneg.f r2.z, (neg)r2.z -absneg.f r2.w, (abs)r0.x -mov.f32f32 r3.x, r0.z -mov.f32f32 r3.y, c3.w -mov.f32f32 r3.z, r2.z -cmps.f.lt r2.w, c3.y, r2.w -mov.f32f32 r3.w, r0.z +sel.b32 r2.y, r2.y, r1.z, r3.z +rcp r3.z, r3.y +absneg.f r5.x, (neg)r0.w +rcp r5.y, r0.z +(ss)mul.f r4.x, r4.x, r5.y +rcp r5.z, r0.z +absneg.f r5.w, (neg)r0.x +absneg.f r6.x, (abs)r0.w +add.f r6.y, c5.z, r5.x +add.f r4.x, r0.w, (neg)r4.x +add.f r6.z, c5.z, r5.w +cmps.f.lt r6.x, c3.y, r6.x +mul.f r3.z, r6.y, r3.z +rcp r6.y, r3.y +add.f r5.x, c5.w, r5.x +mad.f32 r6.w, c5.x, r4.x, c3.x +mul.f r4.x, r0.x, r0.y +mov.f32f32 r7.x, r3.z +(ss)mul.f r5.x, r5.x, r6.y +mul.f r5.z, r6.z, r5.z +cov.u32f32 r6.x, r6.x +mul.f r4.x, r4.x, r5.y +max.f r3.z, r3.z, r5.x +rcp r5.y, r0.z +add.f r5.w, c5.y, r5.w +mov.f32f32 r5.x, r5.x +add.f r4.x, r1.x, (neg)r4.x +mov.f32f32 r6.y, r5.z +(ss)mul.f r5.y, r5.w, r5.y +min.f r5.x, r7.x, r5.x +mad.f32 r7.x, c5.x, r4.x, c3.x +cmps.f.ne r4.x, r6.x, c3.w +max.f r5.z, r5.z, r5.y +mov.f32f32 r5.y, r5.y +absneg.f r0.w, (neg)r0.w +rcp r5.w, r0.y +absneg.f r6.x, (neg)r1.x +min.f r3.z, r3.z, r5.z +sam (f32)(xy)r6.z, r6.w, s#1, t#1 +min.f r5.y, r6.y, r5.y +sel.b32 r0.w, r0.w, r4.x, r2.y +add.f r2.y, c5.z, r6.x +rcp r5.z, r0.y +add.f r6.x, c5.w, r6.x +max.f r5.x, r5.x, r5.y +mul.f r0.w, r3.y, r0.w +(ss)mul.f r2.y, r2.y, r5.w +(ss)mul.f r3.y, r6.x, r5.z +mov.f32f32 r5.y, c3.z exp2 r1.y, r1.y nop (ss)rcp r1.y, r1.y -sel.b32 r0.y, r3.y, r0.y, r2.y -rcp r2.y, r3.x -(ss)mov.f32f32 r3.x, r2.z -cov.u32f32 r2.w, r2.w -rcp r3.y, r3.z -(ss)absneg.f r3.z, (neg)r0.w -absneg.f r0.y, (neg)r0.y -mul.f r3.x, r1.x, r3.x -mov.f32f32 r2.w, r2.w -add.f r4.x, c5.z, r3.z -mov.f32f32 r4.y, r0.y -(ss)mul.f r3.x, r3.x, r2.y -cmps.f.ne r2.w, r2.w, c3.w -mul.f r3.y, r4.x, r3.y -mul.f r4.x, r1.x, r4.y -mov.f32f32 r3.x, r3.x -mov.f32f32 r4.y, c3.w -mov.f32f32 r3.y, r3.y -mov.f32f32 r4.z, r2.z -add.f r3.x, r0.w, (neg)r3.x -mul.f r2.y, r4.x, r2.y -mov.f32f32 r4.x, r4.y -mov.f32f32 r4.y, c3.w -mov.f32f32 r4.w, r0.y -rcp r3.w, r3.w -mov.f32f32 r3.x, r3.x -rcp r4.z, r4.z -add.f r3.z, c5.w, r3.z -mov.f32f32 r2.y, r2.y -sel.b32 r4.x, r4.x, r2.w, r4.y -mad.f32 r3.x, c5.x, r3.x, c3.x -mov.f32f32 r3.z, r3.z -add.f r2.y, r0.x, (neg)r2.y -absneg.f r4.y, (abs)r0.w -rcp r4.w, r4.w -mov.f32f32 r3.x, r3.x -(ss)mul.f r3.z, r3.z, r4.z -mov.f32f32 r2.y, r2.y -cmps.f.lt r4.y, c3.y, r4.y -(ss)absneg.f r4.z, (neg)r0.x -mov.f32f32 r3.z, r3.z -mov.f32f32 r3.x, r3.x -mad.f32 r2.y, c5.x, r2.y, c3.x -cov.u32f32 r4.y, r4.y -max.f r5.x, r3.y, r3.z -mov.f32f32 r3.x, r3.x -mov.f32f32 r2.y, r2.y -min.f r3.y, r3.y, r3.z -mov.f32f32 r3.z, r5.x -absneg.f r5.x, (neg)r1.x -mov.f32f32 r5.y, r3.x -mov.f32f32 r2.y, r2.y -cmps.f.ne r3.x, r4.y, c3.w -add.f r4.y, c5.z, r5.x -absneg.f r5.z, (neg)r0.w -add.f r5.w, c5.z, r4.z -mov.f32f32 r1.y, r1.y -mul.f r3.w, r4.y, r3.w -mov.f32f32 r2.y, r2.y -mov.f32f32 r4.y, r5.z -mul.f r4.w, r5.w, r4.w -mov.f32f32 r3.w, r3.w -mov.f32f32 r5.w, r0.z mov.f32f32 r5.z, r2.y -mov.f32f32 r2.y, r4.y -mov.f32f32 r4.y, r4.w -mul.f r1.y, c4.x, r1.y -mov.f32f32 r4.w, r0.y -sel.b32 r2.y, r2.y, r3.x, r4.x -rcp r4.x, r5.w -add.f r5.x, c5.y, r5.x -sam (f32)(xy)r5.y, r5.y, s#1, t#1 -mov.f32f32 r1.y, r1.y -(ss)mov.f32f32 r5.w, r0.z -mul.f r2.y, r2.z, r2.y -mov.f32f32 r2.z, r5.x +max.f r2.y, r2.y, r3.y +sel.b32 r3.w, r3.w, r1.z, r5.y +mov.f32f32 r5.y, c3.w +mov.f32f32 r5.w, r3.y +min.f r2.y, r3.z, r2.y +(ss)mul.f r1.y, c4.x, r1.y +mad.f32 r3.y, c3.x, r1.x, c3.x +sel.b32 r3.z, r5.y, r4.x, r3.w +mov.f32f32 r3.w, r2.y +min.f r5.y, r5.z, r5.w +mad.f32 r2.y, r0.z, r2.y, r0.x +mad.f32 r0.z, r0.z, r3.z, r0.w +absneg.f r0.w, (neg)r1.x +max.f r3.z, r5.x, r5.y +add.f r2.y, r2.y, c6.y mov.f32f32 r5.x, c3.w -rcp r4.w, r4.w add.f r1.y, c3.z, (neg)r1.y -add.f r4.z, c5.w, r4.z -(ss)mul.f r2.z, r2.z, r4.x -mov.f32f32 r4.x, r5.x -mov.f32f32 r5.x, c3.z -mov.f32f32 r4.z, r4.z -mov.f32f32 r2.z, r2.z -mov.f32f32 r1.y, r1.y -mul.f r6.x, r0.w, r0.w -mul.f r4.z, r4.z, r4.w -(ss)max.f r4.w, r3.w, r2.z -sel.b32 r4.x, r4.x, r2.w, r5.x -mov.f32f32 r5.x, c3.w -min.f r2.z, r3.w, r2.z -mov.f32f32 r3.w, r4.w -mov.f32f32 r4.z, r4.z -mov.f32f32 r4.w, r5.x -mad.f32 r5.x, r1.x, r1.x, r6.x -min.f r3.z, r3.z, r3.w -max.f r3.w, r4.y, r4.z -mov.f32f32 r4.w, r4.w -max.f r2.z, r3.y, r2.z -min.f r3.y, r4.y, r4.z -mov.f32f32 r3.w, r3.w -sel.b32 r4.x, r4.w, r3.x, r4.x -mov.f32f32 r4.y, r5.x -mov.f32f32 r1.z, r1.z -min.f r3.z, r3.z, r3.w -mad.f32 r0.z, r0.z, r4.x, r2.y -max.f r2.y, r2.z, r3.y -nop -mov.f32f32 r2.z, r3.z -mov.f32f32 r0.z, r0.z -absneg.f r3.y, (neg)r0.x -mov.f32f32 r2.y, r2.y -mad.f32 r3.z, r5.w, r2.z, r1.x -mad.f32 r3.w, r0.x, r0.x, r4.y -mov.f32f32 r3.y, r3.y -mov.f32f32 r4.x, c3.w -mov.f32f32 r3.z, r3.z -add.f r2.y, r2.z, (neg)r2.y -cmps.f.ne r2.z, r1.z, c3.w -cov.u32f32 r1.z, r1.w -add.f r1.w, r3.z, c6.y -sel.b32 r3.y, r3.y, r2.w, r4.x -mov.f32f32 r3.z, c3.w -mov.f32f32 r2.y, r2.y -mov.f32f32 r1.w, r1.w -rsq r3.w, r3.w -(ss)mov.f32f32 r3.w, r3.w -mov.f32f32 r3.z, r3.z -mad.f32 r2.y, c6.z, r2.y, c3.z -mul.f r1.w, c6.x, r1.w -mul.f r3.w, c3.x, r3.w -mov.f32f32 r3.z, r3.z -mov.f32f32 r1.z, r1.z -mov.f32f32 r1.w, r1.w -mov.f32f32 r2.y, r2.y -sel.b32 r3.y, r3.z, r3.x, r3.y -mul.f r1.y, r3.w, r1.y -cmps.f.ne r1.z, r1.z, c3.w -mov.f32f32 r3.z, r2.x -mad.f32 r2.x, c3.x, r0.x, c3.x -mad.f32 r1.x, c3.x, r1.x, c3.z -rcp r2.y, r2.y -(ss)mov.f32f32 r2.y, r2.y -mad.f32 r0.y, r0.y, r3.y, r0.z -mov.f32f32 r0.z, r1.y -mov.f32f32 r1.y, r2.x -mul.f r1.w, r1.w, r2.y -mov.f32f32 r0.y, r0.y -mov.f32f32 r2.x, r0.z -mov.f32f32 r0.z, r0.z -mov.f32f32 r1.w, r1.w +add.f r3.z, r3.w, (neg)r3.z +mul.f r2.y, c6.x, r2.y +sel.b32 r0.w, r0.w, r1.z, r5.x +mov.f32f32 r3.w, c3.w +mad.f32 r3.z, c6.z, r3.z, c3.z +mad.f32 r2.w, r0.x, r0.x, r2.w +sam (f32)(xyz)r5.x, r3.x, s#0, t#0 +(sy)(ss)sel.b32 r3.x, r4.w, r1.z, r5.z +sel.b32 r3.y, r4.z, r1.z, r5.y +sel.b32 r0.w, r3.w, r4.x, r0.w +sel.b32 r1.z, r4.y, r1.z, r5.x +mad.f32 r3.w, r1.x, r1.x, r2.w +rcp r2.w, r3.z +(ss)mul.f r2.y, r2.y, r2.w +mad.f32 r0.y, r0.y, r0.w, r0.z +mad.f32 r0.z, c3.x, r0.x, c3.z +mad.f32 r0.w, c3.x, r1.x, c3.x +mad.f32 r2.w, c3.x, r1.x, c3.x +sam (f32)(x)r4.y, r1.w, s#2, t#2 max.f r0.y, c3.w, r0.y -mov.f32f32 r1.y, r1.y -mov.f32f32 r1.x, r1.x -mad.f32 r2.y, c3.x, r0.w, c3.x -mad.f32 r0.x, c3.x, r0.x, c3.x -mad.f32 r0.w, c3.x, r0.w, c3.x -exp2 r1.w, r1.w -(ss)mov.f32f32 r1.w, r1.w -mov.f32f32 r0.y, r0.y -mov.f32f32 r3.w, r1.y -mov.f32f32 r1.x, r1.x -add.f r1.y, c3.z, r1.w -mov.f32f32 r1.w, r0.y -mov.f32f32 r0.y, r0.y -mov.f32f32 r4.x, r1.x -mov.f32f32 r1.x, r1.y -(sy)mul.f r1.y, r1.w, r5.y -sam (f32)(xyz)r4.y, r3.z, s#0, t#0 -mov.f32f32 r0.w, r0.w -(sy)mov.f32f32 r1.w, r4.w -mov.f32f32 r3.y, r4.z -(ss)mov.f32f32 r3.z, r4.y -mov.f32f32 r0.w, r0.w -rcp r1.x, r1.x -(ss)mov.f32f32 r1.x, r1.x -mul.f r1.y, r1.y, c5.y -mov.f32f32 r3.w, r1.w -mov.f32f32 r3.y, r3.y -mul.f r0.y, r0.y, r1.x -mov.f32f32 r1.x, r1.y -mov.f32f32 r4.y, r0.w -mov.f32f32 r0.w, r3.z -mov.f32f32 r0.y, r0.y -mad.f32 r0.z, r1.x, r5.z, r0.z +rsq r1.x, r3.w +(ss)mul.f r1.x, c3.x, r1.x +(ss)exp2 r1.w, r2.y +(ss)add.f r2.x, c3.z, r1.w +(sy)(ss)cmps.f.lt r2.y, r0.x, r4.y +mov.f32f32 r1.w, c3.z (rpt1)nop -mad.f32 r0.y, c3.x, r0.y, r2.x -mov.f32f32 r0.z, r0.z -sam (f32)(xyz)r4.x, r4.x, s#0, t#0 -(sy)mov.f32f32 r1.x, r4.z -mov.f32f32 r1.y, r4.y +mul.f r3.z, r0.y, r6.z mov.f32f32 r0.y, r0.y -mov.f32f32 r1.w, r2.y -mov.f32f32 r2.x, r4.x -mov.f32f32 r0.x, r0.x -sel.b32 r0.y, r0.z, r1.z, r0.y -mov.f32f32 r0.z, r1.w -mov.f32f32 r1.z, c3.z +rcp r2.x, r2.x +mul.f r1.x, r1.x, r1.y (rpt1)nop -(ss)mov.f32f32 r4.x, r0.z -mov.f32f32 r0.x, r0.x -mov.f32f32 r0.z, r1.z -(rpt1)nop -mov.f32f32 r4.y, r0.x -mov.f32f32 r1.w, r0.z -(rpt4)nop -sam (f32)(xyz)r4.x, r4.x, s#0, t#0 -(sy)mov.f32f32 r0.x, r4.z -mov.f32f32 r0.z, r4.y -mov.f32f32 r1.z, r4.x -nop -sel.b32 r0.x, r1.x, r2.w, r0.x -sel.b32 r0.z, r1.y, r2.w, r0.z -sel.b32 r1.x, r2.x, r2.w, r1.z +(ss)mul.f r0.y, r0.y, r2.x +mov.f32f32 r1.y, r1.x +(ss)mul.f r2.x, r3.z, c5.y nop -sel.b32 r0.x, r3.w, r3.x, r0.x -sel.b32 r0.z, r3.y, r3.x, r0.z -sel.b32 r0.w, r0.w, r3.x, r1.x -nop -mul.f r0.x, r0.x, r0.y -mul.f r0.z, r0.z, r0.y -mul.f r0.y, r0.w, r0.y +mad.f32 r0.y, c3.x, r0.y, r1.y +sam (f32)(xyz)r4.y, r0.z, s#0, t#0 +(sy)(ss)sel.b32 r0.z, r4.w, r4.x, r3.x +mad.f32 r0.w, r2.x, r6.w, r1.x +sam (f32)(x)r4.w, r2.z, s#2, t#2 +(sy)cmps.f.lt r0.x, r0.x, r4.w +cov.u32f32 r1.x, r2.y +sel.b32 r1.y, r4.z, r4.x, r3.y +sel.b32 r1.z, r4.y, r4.x, r1.z +cov.u32f32 r0.x, r0.x +cmps.f.ne r1.x, r1.x, c3.w +(rpt1)nop +cmps.f.ne r0.x, r0.x, c3.w +(rpt2)nop +sel.b32 r0.x, r0.w, r0.x, r0.y +(rpt2)nop +mul.f r0.y, r0.z, r0.x +mul.f r0.z, r1.y, r0.x +mul.f r0.x, r1.z, r0.x nop -mov.f32f32 r0.x, r0.x -mov.f32f32 r0.z, r0.z +mul.f r0.w, r0.y, c7.z mov.f32f32 r0.y, r0.y -nop -mov.f32f32 r0.w, r0.x -mov.f32f32 r1.x, r0.z -mov.f32f32 r1.y, r0.y -mov.f32f32 r0.x, r0.x -mul.f r0.w, r0.w, c7.z -mul.f r1.x, r1.x, c7.y -mul.f r1.y, r1.y, c7.x -mov.f32f32 r0.x, r0.x +mul.f r1.y, r0.z, c7.y +mul.f r2.x, r0.x, c7.x mov.f32f32 r0.z, r0.z -mov.f32f32 r0.y, r0.y +sel.b32 r1.z, r0.w, r1.x, r0.y +mov.f32f32 r0.x, r0.x nop -sel.b32 r0.x, r0.w, r2.z, r0.x -mov.f32f32 r0.z, r0.z -mov.f32f32 r0.y, r0.y +sel.b32 r1.y, r1.y, r1.x, r0.z nop -mov.f32f32 r1.z, r0.x -sel.b32 r0.x, r1.x, r2.z, r0.z -sel.b32 r0.y, r1.y, r2.z, r0.y -(rpt1)nop -mov.f32f32 r1.y, r0.x -mov.f32f32 r1.x, r0.y +sel.b32 r1.x, r2.x, r1.x, r0.x end nop nop -nop ; FRAG: outputs: r1.x (1:0) ; FRAG: inputs: r0.x (5:20,cm=f,il=8,b=1) -; FRAG: 349 instructions, 0 half, 7 full +; FRAG: 205 instructions, 0 half, 8 full |