diff options
Diffstat (limited to 'reference/0ad-cycladic-archipelago/0ad-cycladic-archipelago-30.asm')
-rw-r--r-- | reference/0ad-cycladic-archipelago/0ad-cycladic-archipelago-30.asm | 285 |
1 files changed, 105 insertions, 180 deletions
diff --git a/reference/0ad-cycladic-archipelago/0ad-cycladic-archipelago-30.asm b/reference/0ad-cycladic-archipelago/0ad-cycladic-archipelago-30.asm index 1b081fa..eb8f852 100644 --- a/reference/0ad-cycladic-archipelago/0ad-cycladic-archipelago-30.asm +++ b/reference/0ad-cycladic-archipelago/0ad-cycladic-archipelago-30.asm @@ -4,210 +4,135 @@ @in(r0.w) in3 @in(r1.x) in4 @in(r1.y) in5 -@out(r4.x) out0 -@out(r4.y) out1 -@out(r4.z) out2 -@out(r4.w) out3 +@out(r2.x) out0 +@out(r2.y) out1 +@out(r2.z) out2 +@out(r2.w) out3 +@const(c8.x) 0x3f000000, 0x00000000, 0x3f800000, 0xba03126f +@const(c9.x) 0xbf000000, 0x40000000, 0x3f800000, 0x3fb8aa65 +@const(c10.x) 0x3de38866, 0x3cf5c28f, 0x00000000, 0x00000000 +@const(c11.x) 0x00000000, 0x3f800000, 0x43000000, 0x00000000 (sy)(ss)bary.f r0.x, 0, r1.x add.f r0.y, r0.w, c8.y bary.f r0.w, 1, r1.x bary.f r1.z, 4, r1.x -add.f r1.w, r0.x, c9.x -bary.f r2.x, 6, r1.x -bary.f r2.y, 2, r1.x -add.f r2.z, r0.w, c9.x -floor.f r2.w, r1.w +add.f r2.x, r0.x, c9.x +bary.f r1.w, 5, r1.x +add.f r2.y, r0.w, c9.x +bary.f r2.z, 2, r1.x +floor.f r2.w, r2.x rcp r0.y, r0.y add.f r0.z, r0.z, c8.y -mov.f32f32 r1.z, r1.z -floor.f r3.x, r2.z -add.f r1.w, r1.w, (neg)r2.w +floor.f r3.x, r2.y +add.f r3.w, r2.z, c8.w +add.f r2.x, r2.x, (neg)r2.w (ss)mul.f r0.y, r0.z, r0.y -mov.f32f32 r3.y, r1.z -add.f r0.z, r2.z, (neg)r3.x -mov.f32f32 r1.z, r1.w +absneg.f r0.z, (neg)c6.x +add.f r2.y, r2.y, (neg)r3.x +mov.f32f32 r2.z, r2.x +add.f r2.x, r2.x, c8.z +mul.f r0.z, r0.z, c6.x +sam (f32)(w)r4.x, r1.z, s#1, t#1 +(ss)mov.f32f32 r1.z, r2.y +mul.f r1.w, c8.x, r2.z +add.f r2.z, c9.y, (neg)r2.z +mul.f r0.z, r0.z, r0.y mov.f32f32 r0.y, r0.y -absneg.f r1.w, (neg)c6.x -mov.f32f32 r0.z, r0.z -mul.f r2.z, c8.x, r1.z -add.f r2.w, c9.y, (neg)r1.z -mul.f r1.w, r1.w, c6.x -add.f r3.x, c9.y, (neg)r0.z -mov.f32f32 r2.z, r2.z -mul.f r3.z, c8.x, r0.z -mul.f r1.w, r1.w, r0.y -mov.f32f32 r2.w, r2.w -add.f r0.x, r0.x, (neg)r2.z -mov.f32f32 r2.z, r3.z -mov.f32f32 r1.w, r1.w -mov.f32f32 r3.x, r3.x -mov.f32f32 r0.x, r0.x -add.f r0.w, r0.w, (neg)r2.z -mul.f r0.y, r1.w, r0.y -mul.f r1.w, r2.w, r3.x -add.f r2.z, c9.x, r0.x +add.f r0.x, r0.x, (neg)r1.w +mul.f r1.w, c8.x, r1.z +mov.f32f32 r2.w, r2.z +mul.f r0.y, r0.z, r0.y +mov.f32f32 r0.z, r0.x +add.f r0.w, r0.w, (neg)r1.w add.f r0.x, c9.z, r0.x -mov.f32f32 r0.y, r0.y -mov.f32f32 r0.w, r0.w -mov.f32f32 r2.z, r2.z -mov.f32f32 r0.x, r0.x mul.f r0.y, r0.y, c9.w -add.f r3.z, c9.z, r0.w -mul.f r2.z, r2.z, c3.z -mul.f r0.x, r0.x, c3.z -mov.f32f32 r0.y, r0.y -mov.f32f32 r3.z, r3.z -mov.f32f32 r3.w, r2.z -mov.f32f32 r4.x, r0.x -mov.f32f32 r0.x, r0.x -mov.f32f32 r2.z, r2.z -mov.f32f32 r4.y, r3.w -add.f r0.w, c9.x, r0.w -exp2 r0.y, r0.y -(ss)mov.f32f32 r0.y, r0.y -mov.f32f32 r3.w, r4.x -mov.f32f32 r5.x, r0.x -mov.f32f32 r0.x, r0.w -add.f r0.w, c11.y, (neg)r0.y -mov.f32f32 r5.w, r3.w -mul.f r3.z, r3.z, c3.w -mul.f r0.x, r0.x, c3.w -mul.f r0.w, r0.w, c6.y -mul.f r0.y, r0.y, c8.z -mov.f32f32 r3.w, r3.z -mov.f32f32 r4.x, r0.x -mov.f32f32 r0.x, r0.x -mov.f32f32 r6.z, r2.z -mov.f32f32 r2.z, r3.z -mov.f32f32 r4.z, r4.x -add.f r2.y, r2.y, c8.w -add.f r0.y, r0.y, r0.w -mov.f32f32 r0.w, r3.w -mov.f32f32 r5.y, r0.x -mov.f32f32 r0.x, r2.y -mov.f32f32 r0.y, r0.y -mov.f32f32 r6.x, r0.w -mov.f32f32 r0.w, r2.y -mov.f32f32 r4.w, r0.x -mov.f32f32 r0.x, r0.y -mov.f32f32 r0.y, r2.y -mov.f32f32 r6.w, r2.z -mov.f32f32 r6.y, r0.w -mov.f32f32 r0.w, r2.y -mov.f32f32 r5.z, r0.y -sam.s (f32)(x)r0.y, r4.y, s#2, t#2 -(sy)mov.f32f32 r0.y, r0.y +add.f r0.z, c9.x, r0.z +mov.f32f32 r1.w, r0.w +mul.f r3.y, r0.x, c3.z +add.f r0.x, c9.z, r0.w +mul.f r4.x, r0.z, c3.z +add.f r0.z, c9.x, r1.w +mov.f32f32 r5.x, r3.y +mul.f r3.z, r0.x, c3.w +mov.f32f32 r5.w, r4.x +mul.f r5.y, r0.z, c3.w +exp2 r0.x, r0.y +(ss)mov.f32f32 r0.y, r0.x +mov.f32f32 r5.z, r3.w +mov.f32f32 r4.y, r3.z +mov.f32f32 r6.x, r5.y +mov.f32f32 r6.y, r3.w +add.f r0.y, c11.y, (neg)r0.y +mov.f32f32 r4.z, r3.w +sam.s (f32)(x)r3.x, r3.y, s#2, t#2 +add.f r0.z, c9.y, (neg)r1.z +sam.s (f32)(x)r6.z, r5.x, s#2, t#2 +mul.f r0.x, r0.x, c8.z +add.f r0.w, r2.y, c8.z +mul.f r0.y, r0.y, c6.y +(ss)nop +sam.s (f32)(x)r5.x, r5.w, s#2, t#2 +mov.f32f32 r1.z, r0.z +mul.f r0.z, r2.x, r0.z +mul.f r1.w, r2.z, r0.w +add.f r0.x, r0.x, r0.y +mul.f r0.y, r2.w, r1.z +sam.s (f32)(x)r3.y, r4.x, s#2, t#2 +mul.f r0.w, r2.x, r0.w +(sy)cmps.f.lt r1.z, r4.w, c10.y +bary.f r2.x, 6, r1.x +mul.f r0.y, r0.y, r5.x max.f r0.x, r0.x, c8.y -mov.f32f32 r7.x, r0.w -mov.f32f32 r0.w, r1.w -mov.f32f32 r0.y, r0.y +mad.f32 r0.y, r0.z, r6.z, r0.y +cov.u32f32 r0.z, r1.z +mad.f32 r0.y, r1.w, r3.y, r0.y min.f r0.x, r0.x, c8.z -sam.s (f32)(x)r1.w, r5.w, s#2, t#2 -nop -(sy)mov.f32f32 r1.w, r1.w -mul.f r0.y, r0.w, r0.y -sam.s (f32)(x)r0.w, r5.x, s#2, t#2 -(sy)mov.f32f32 r0.w, r0.w -add.f r1.z, r1.z, c8.z -add.f r2.y, c11.y, (neg)r0.x -add.f r2.z, c11.y, (neg)r0.x -add.f r3.z, c11.y, (neg)r0.x -mul.f r3.x, r1.z, r3.x -mul.f r2.y, r2.y, c5.z -mul.f r2.z, r2.z, c5.y -mul.f r3.w, r3.z, c5.x -mov.f32f32 r3.x, r3.x -sam.s (f32)(x)r3.z, r6.z, s#2, t#2 -add.f r0.z, r0.z, c8.z -(sy)mov.f32f32 r3.z, r3.z -bary.f r4.x, 5, r1.x -mad.f32 r0.y, r3.x, r0.w, r0.y -mul.f r0.w, r2.w, r0.z +mad.f32 r0.y, r0.w, r3.x, r0.y +cmps.f.ne r0.z, r0.z, c8.y (rpt1)nop -mov.f32f32 r0.y, r0.y -mov.f32f32 r0.w, r0.w -mul.f r0.z, r1.z, r0.z -mov.f32f32 r1.z, r4.x -mov.f32f32 r2.x, r2.x -mad.f32 r0.y, r0.w, r3.z, r0.y -mov.f32f32 r0.z, r0.z -mov.f32f32 r3.z, r1.z -mov.f32f32 r2.w, r2.x -mov.f32f32 r0.y, r0.y -bary.f r0.w, 7, r1.x -mad.f32 r0.y, r0.z, r1.w, r0.y -mov.f32f32 r0.z, c8.z -bary.f r1.z, 10, r1.x -(ss)nop -sam (f32)(w)r4.x, r3.y, s#1, t#1 -(sy)cmps.f.lt r1.w, r4.w, c10.y -mov.f32f32 r0.y, r0.y -mov.f32f32 r2.x, r4.w -mov.f32f32 r0.w, r0.w -mov.f32f32 r4.w, r0.z mul.f r0.y, c10.x, r0.y -cov.u32f32 r0.z, r1.w -mov.f32f32 r1.w, r2.x -mov.f32f32 r3.x, r0.w -mov.f32f32 r0.y, r0.y -cmps.f.ne r0.z, r0.z, c8.y -nop -mov.f32f32 r0.w, c8.y -bary.f r2.x, 9, r1.x +bary.f r2.y, 7, r1.x +add.f r0.w, c11.y, (neg)r0.x +add.f r1.z, c11.y, (neg)r0.x +mov.f32f32 r1.w, r0.y +add.f r2.z, c11.y, (neg)r0.x +(rpt1)nop +sam (f32)(xyz)r2.w, r2.x, s#0, t#0 +(ss)bary.f r2.x, 10, r1.x +bary.f r2.y, 9, r1.x bary.f (ei)r1.x, 8, r1.x -(ss)nop -sam (f32)(xyz)r2.w, r2.w, s#0, t#0 -(sy)mul.f r1.y, r3.y, r1.z -sel.b32 r0.z, r0.w, r0.z, r1.w -mul.f r0.w, r3.x, r2.x +mul.f r0.w, r0.w, c5.z +(sy)mul.f r1.y, r3.y, r2.x +mul.f r2.x, r3.x, r2.y mul.f r1.x, r2.w, r1.x -mul.f r1.y, r1.y, r0.y -(rpt2)nop -mov.f32f32 r1.y, r1.y -mul.f r0.w, r0.w, r0.y +mul.f r1.z, r1.z, c5.y +mul.f r1.y, r1.y, r1.w +mul.f r1.w, r2.x, r1.w mad.f32 r1.y, c4.z, r3.y, r1.y +mad.f32 r1.w, c4.y, r3.x, r1.w mul.f r0.y, r1.x, r0.y -(rpt1)nop -mov.f32f32 r1.x, r1.y -mov.f32f32 r0.w, r0.w -mov.f32f32 r0.y, r0.y -mad.f32 r0.w, c4.y, r3.x, r0.w -mul.f r1.x, r0.x, r1.x +mul.f r1.x, r2.z, c5.x +mul.f r1.y, r0.x, r1.y +mul.f r1.w, r0.x, r1.w mad.f32 r0.y, c4.x, r2.w, r0.y -(rpt1)nop -add.f r1.x, r1.x, r2.y -mov.f32f32 r0.w, r0.w -mov.f32f32 r0.y, r0.y +mov.f32f32 r2.x, c8.y +add.f r0.w, r1.y, r0.w +add.f r1.y, r1.w, r1.z nop -mul.f r1.x, r1.x, r0.z -mul.f r0.w, r0.x, r0.w +sel.b32 r0.z, r2.x, r0.z, r4.w mul.f r0.x, r0.x, r0.y +mov.f32f32 r2.w, c8.z nop -mov.f32f32 r0.y, r1.x -add.f r0.w, r0.w, r2.z -add.f r0.x, r0.x, r3.w -nop -mov.f32f32 r0.y, r0.y -mul.f r0.w, r0.w, r0.z -mul.f r0.x, r0.x, r0.z -nop -mov.f32f32 r4.z, r0.y -mov.f32f32 r0.y, r0.w -mov.f32f32 r0.x, r0.x -(rpt1)nop -mov.f32f32 r0.y, r0.y -mov.f32f32 r0.x, r0.x -(rpt1)nop -mov.f32f32 r4.y, r0.y -mov.f32f32 r4.x, r0.x +mul.f r2.z, r0.w, r0.z +mul.f r2.y, r1.y, r0.z +add.f r0.x, r0.x, r1.x +(rpt2)nop +mul.f r2.x, r0.x, r0.z end nop nop nop -; FRAG: outputs: r4.x (1:0) -; FRAG: inputs: r0.x (0:0,cm=f,il=8,b=0) r1.x (5:9,cm=f,il=8,b=1) r0.x (5:10,cm=f,il=12,b=1) r3.x (5:11,cm=f,il=16,b=1) -; FRAG: 200 instructions, 0 half, 8 full -; pos (bary): r1.x -; color: r4.x -; fragcoord: r0.x +; FRAG: outputs: r2.x (1:0) +; FRAG: inputs: r0.x (0:0,cm=f,il=8,b=0) r1.x (5:9,cm=f,il=8,b=1) r1.z (5:10,cm=f,il=12,b=1) r3.x (5:11,cm=f,il=16,b=1) +; FRAG: 121 instructions, 0 half, 7 full |