summaryrefslogtreecommitdiff
path: root/reference/0ad-alpine-valley/0ad-70.asm
diff options
context:
space:
mode:
Diffstat (limited to 'reference/0ad-alpine-valley/0ad-70.asm')
-rw-r--r--reference/0ad-alpine-valley/0ad-70.asm278
1 files changed, 107 insertions, 171 deletions
diff --git a/reference/0ad-alpine-valley/0ad-70.asm b/reference/0ad-alpine-valley/0ad-70.asm
index 4377ecf..227a081 100644
--- a/reference/0ad-alpine-valley/0ad-70.asm
+++ b/reference/0ad-alpine-valley/0ad-70.asm
@@ -8,199 +8,135 @@
@out(r2.y) out1
@out(r2.z) out2
@out(r2.w) out3
+@const(c9.x) 0x3f000000, 0x00000000, 0x3f800000, 0xbb449ba6
+@const(c10.x) 0xbf000000, 0x40000000, 0x3f800000, 0x3de38866
+@const(c11.x) 0x3fb8aa65, 0x3cf5c28f, 0x00000000, 0x00000000
+@const(c12.x) 0x00000000, 0x3f800000, 0x43000000, 0x00000000
(sy)(ss)bary.f r0.x, 4, r1.x
add.f r0.y, r0.w, c9.y
bary.f r0.w, 5, r1.x
bary.f r1.z, 8, r1.x
-add.f r1.w, r0.x, c10.x
-bary.f r2.x, 10, r1.x
-bary.f r2.y, 6, r1.x
-add.f r2.z, r0.w, c10.x
-floor.f r2.w, r1.w
+add.f r2.x, r0.x, c10.x
+bary.f r1.w, 9, r1.x
+add.f r2.y, r0.w, c10.x
+bary.f r2.z, 6, r1.x
+floor.f r2.w, r2.x
rcp r0.y, r0.y
add.f r0.z, r0.z, c9.y
-mov.f32f32 r1.z, r1.z
-floor.f r3.x, r2.z
-add.f r1.w, r1.w, (neg)r2.w
+floor.f r3.x, r2.y
+add.f r3.w, r2.z, c9.w
+add.f r2.x, r2.x, (neg)r2.w
(ss)mul.f r0.y, r0.z, r0.y
-mov.f32f32 r3.y, r1.z
-add.f r0.z, r2.z, (neg)r3.x
-mov.f32f32 r1.z, r1.w
+absneg.f r0.z, (neg)c7.x
+add.f r2.y, r2.y, (neg)r3.x
+mov.f32f32 r2.z, r2.x
+add.f r2.x, r2.x, c9.z
+mul.f r0.z, r0.z, c7.x
+sam (f32)(w)r4.x, r1.z, s#1, t#1
+(ss)mov.f32f32 r1.z, r2.y
+mul.f r1.w, c9.x, r2.z
+add.f r2.z, c10.y, (neg)r2.z
+mul.f r0.z, r0.z, r0.y
mov.f32f32 r0.y, r0.y
-absneg.f r1.w, (neg)c7.x
-mov.f32f32 r0.z, r0.z
-mul.f r2.z, c9.x, r1.z
-add.f r2.w, c10.y, (neg)r1.z
-mul.f r1.w, r1.w, c7.x
-bary.f r3.x, 9, r1.x
-mov.f32f32 r2.z, r2.z
-mul.f r3.z, c9.x, r0.z
-mul.f r1.w, r1.w, r0.y
-mov.f32f32 r2.w, r2.w
-add.f r0.x, r0.x, (neg)r2.z
-mov.f32f32 r2.z, r3.z
-mov.f32f32 r1.w, r1.w
-add.f r3.z, c10.y, (neg)r0.z
-mov.f32f32 r0.x, r0.x
-add.f r0.w, r0.w, (neg)r2.z
-mul.f r0.y, r1.w, r0.y
-mov.f32f32 r1.w, r3.z
-add.f r2.z, c10.x, r0.x
+add.f r0.x, r0.x, (neg)r1.w
+mul.f r1.w, c9.x, r1.z
+mov.f32f32 r2.w, r2.z
+mul.f r0.y, r0.z, r0.y
+mov.f32f32 r0.z, r0.x
+add.f r0.w, r0.w, (neg)r1.w
add.f r0.x, c10.z, r0.x
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r0.x, r0.x
mul.f r0.y, r0.y, c11.x
-add.f r3.z, c10.z, r0.w
-mul.f r2.z, r2.z, c3.z
-mul.f r0.x, r0.x, c3.z
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r3.z, r3.z
-mov.f32f32 r3.w, r2.z
-mov.f32f32 r4.x, r0.x
-mov.f32f32 r0.x, r0.x
-mov.f32f32 r2.z, r2.z
-mov.f32f32 r4.y, r3.w
-add.f r0.w, c10.x, r0.w
-exp2 r0.y, r0.y
-(ss)mov.f32f32 r0.y, r0.y
-mov.f32f32 r3.w, r4.x
-mov.f32f32 r5.x, r0.x
-mov.f32f32 r0.x, r0.w
-add.f r0.w, c12.y, (neg)r0.y
-mov.f32f32 r5.w, r3.w
-mul.f r3.z, r3.z, c3.w
-mul.f r0.x, r0.x, c3.w
-mul.f r0.w, r0.w, c7.y
-mul.f r0.y, r0.y, c9.z
-mov.f32f32 r3.w, r3.z
-mov.f32f32 r4.x, r0.x
-mov.f32f32 r0.x, r0.x
-mov.f32f32 r6.z, r2.z
-mov.f32f32 r2.z, r3.z
-mov.f32f32 r4.z, r4.x
-add.f r2.y, r2.y, c9.w
-add.f r0.y, r0.y, r0.w
-mov.f32f32 r0.w, r3.w
-mov.f32f32 r5.y, r0.x
-mov.f32f32 r0.x, r2.y
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r6.x, r0.w
-mov.f32f32 r0.w, r2.y
-mov.f32f32 r4.w, r0.x
-mov.f32f32 r0.x, r0.y
-mov.f32f32 r0.y, r2.y
-mov.f32f32 r6.w, r2.z
-mov.f32f32 r6.y, r0.w
-mov.f32f32 r0.w, r2.y
-mov.f32f32 r5.z, r0.y
-sam.s (f32)(x)r3.z, r4.y, s#2, t#2
-(sy)mov.f32f32 r0.y, r3.z
+add.f r0.z, c10.x, r0.z
+mov.f32f32 r1.w, r0.w
+mul.f r3.y, r0.x, c3.z
+add.f r0.x, c10.z, r0.w
+mul.f r4.x, r0.z, c3.z
+add.f r0.z, c10.x, r1.w
+mov.f32f32 r5.x, r3.y
+mul.f r3.z, r0.x, c3.w
+mov.f32f32 r5.w, r4.x
+mul.f r5.y, r0.z, c3.w
+exp2 r0.x, r0.y
+(ss)mov.f32f32 r0.y, r0.x
+mov.f32f32 r5.z, r3.w
+mov.f32f32 r4.y, r3.z
+mov.f32f32 r6.x, r5.y
+mov.f32f32 r6.y, r3.w
+add.f r0.y, c12.y, (neg)r0.y
+mov.f32f32 r4.z, r3.w
+sam.s (f32)(x)r3.x, r3.y, s#2, t#2
+add.f r0.z, c10.y, (neg)r1.z
+sam.s (f32)(x)r6.z, r5.x, s#2, t#2
+mul.f r0.x, r0.x, c9.z
+add.f r0.w, r2.y, c9.z
+mul.f r0.y, r0.y, c7.y
+(ss)nop
+sam.s (f32)(x)r5.x, r5.w, s#2, t#2
+mov.f32f32 r1.z, r0.z
+mul.f r0.z, r2.x, r0.z
+mul.f r1.w, r2.z, r0.w
+add.f r0.x, r0.x, r0.y
+mul.f r0.y, r2.w, r1.z
+sam.s (f32)(x)r3.y, r4.x, s#2, t#2
+mul.f r0.w, r2.x, r0.w
+(sy)cmps.f.lt r1.z, r4.w, c11.y
+bary.f r2.x, 10, r1.x
+mul.f r0.y, r0.y, r5.x
max.f r0.x, r0.x, c9.y
-mov.f32f32 r7.x, r0.w
-mul.f r0.w, r2.w, r1.w
-mov.f32f32 r0.y, r0.y
+mad.f32 r0.y, r0.z, r6.z, r0.y
+cov.u32f32 r0.z, r1.z
+mad.f32 r0.y, r1.w, r3.y, r0.y
min.f r0.x, r0.x, c9.z
-sam.s (f32)(x)r3.z, r5.w, s#2, t#2
-nop
-(sy)mov.f32f32 r2.y, r3.z
-mul.f r0.y, r0.w, r0.y
-sam.s (f32)(x)r3.z, r5.x, s#2, t#2
-(sy)mov.f32f32 r0.w, r3.z
-add.f r1.z, r1.z, c9.z
-add.f r2.z, c12.y, (neg)r0.x
-add.f r3.z, c12.y, (neg)r0.x
-add.f r3.w, c12.y, (neg)r0.x
-mul.f r1.w, r1.z, r1.w
-mul.f r2.z, r2.z, c6.z
-mul.f r4.x, r3.z, c6.y
-mul.f r3.w, r3.w, c6.x
-mad.f32 r0.y, r1.w, r0.w, r0.y
-(ss)nop
-sam.s (f32)(x)r4.y, r6.z, s#2, t#2
-add.f r0.z, r0.z, c9.z
-(sy)mov.f32f32 r0.w, r4.y
-mov.f32f32 r1.w, r3.x
-mov.f32f32 r0.y, r0.y
-mul.f r2.w, r2.w, r0.z
-mul.f r0.z, r1.z, r0.z
-mov.f32f32 r3.z, r1.w
-mov.f32f32 r1.z, r2.x
-mad.f32 r0.y, r2.w, r0.w, r0.y
-bary.f r0.w, 11, r1.x
-mov.f32f32 r1.w, c9.z
-bary.f r2.x, 2, r1.x
-mov.f32f32 r0.y, r0.y
-sam (f32)(w)r2.w, r3.y, s#1, t#1
-(sy)cmps.f.lt r2.w, r3.z, c11.y
-mad.f32 r0.y, r0.z, r2.y, r0.y
-mov.f32f32 r0.z, r3.z
-mov.f32f32 r3.x, r1.z
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r0.y, r0.y
-cov.u32f32 r1.z, r2.w
-mov.f32f32 r0.z, r0.z
-(ss)mov.f32f32 r3.y, r0.w
+mad.f32 r0.y, r0.w, r3.x, r0.y
+cmps.f.ne r0.z, r0.z, c9.y
+(rpt1)nop
mul.f r0.y, c10.w, r0.y
-cmps.f.ne r0.w, r1.z, c9.y
+bary.f r2.y, 11, r1.x
+add.f r0.w, c12.y, (neg)r0.x
+add.f r1.z, c12.y, (neg)r0.x
+mov.f32f32 r1.w, r0.y
+add.f r2.z, c12.y, (neg)r0.x
(rpt1)nop
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r1.z, c9.y
-sam (f32)(xyz)r4.y, r3.x, s#0, t#0
-(sy)mul.f r2.x, r4.w, r2.x
+sam (f32)(xyz)r2.w, r2.x, s#0, t#0
+(ss)bary.f r2.x, 2, r1.x
bary.f r2.y, 1, r1.x
bary.f (ei)r1.x, 0, r1.x
-sel.b32 r0.z, r1.z, r0.w, r0.z
-mul.f r0.w, r2.x, r0.y
-mul.f r1.y, r4.z, r2.y
-mul.f r1.x, r4.y, r1.x
-mov.f32f32 r2.w, r1.w
-mov.f32f32 r0.w, r0.w
-mul.f r1.y, r1.y, r0.y
-mad.f32 r0.w, c5.z, r4.w, r0.w
+mul.f r0.w, r0.w, c6.z
+(sy)mul.f r1.y, r3.y, r2.x
+mul.f r2.x, r3.x, r2.y
+mul.f r1.x, r2.w, r1.x
+mul.f r1.z, r1.z, c6.y
+mul.f r1.y, r1.y, r1.w
+mul.f r1.w, r2.x, r1.w
+mad.f32 r1.y, c5.z, r3.y, r1.y
+mad.f32 r1.w, c5.y, r3.x, r1.w
mul.f r0.y, r1.x, r0.y
-(rpt1)nop
-mov.f32f32 r0.w, r0.w
-mov.f32f32 r1.x, r1.y
-mov.f32f32 r0.y, r0.y
-mad.f32 r1.x, c5.y, r4.z, r1.x
-mul.f r0.w, r0.x, r0.w
-mad.f32 r0.y, c5.x, r4.y, r0.y
-(rpt1)nop
-add.f r0.w, r0.w, r2.z
-mov.f32f32 r1.x, r1.x
-mov.f32f32 r0.y, r0.y
-nop
-mul.f r0.w, r0.w, r0.z
-mul.f r1.x, r0.x, r1.x
+mul.f r1.x, r2.z, c6.x
+mul.f r1.y, r0.x, r1.y
+mul.f r1.w, r0.x, r1.w
+mad.f32 r0.y, c5.x, r2.w, r0.y
+mov.f32f32 r2.x, c9.y
+add.f r0.w, r1.y, r0.w
+add.f r1.y, r1.w, r1.z
mul.f r0.x, r0.x, r0.y
-nop
-mul.f r0.y, r0.w, c4.z
-add.f r0.w, r1.x, r4.x
-add.f r0.x, r0.x, r3.w
-nop
-mov.f32f32 r0.y, r0.y
-mul.f r0.w, r0.w, r0.z
-mul.f r0.x, r0.x, r0.z
-nop
-mov.f32f32 r0.y, r0.y
-mul.f r0.z, r0.w, c4.y
-mul.f r0.x, r0.x, c4.x
-nop
-mov.f32f32 r2.z, r0.y
-mov.f32f32 r0.y, r0.z
-mov.f32f32 r0.x, r0.x
+sel.b32 r0.y, r2.x, r0.z, r4.w
+mov.f32f32 r2.w, c9.z
(rpt1)nop
-mov.f32f32 r0.y, r0.y
-mov.f32f32 r0.x, r0.x
+mul.f r0.z, r0.w, r0.y
+mul.f r0.w, r1.y, r0.y
(rpt1)nop
-mov.f32f32 r2.y, r0.y
-mov.f32f32 r2.x, r0.x
+mul.f r2.z, r0.z, c4.z
+mul.f r2.y, r0.w, c4.y
+add.f r0.x, r0.x, r1.x
+(rpt2)nop
+mul.f r0.x, r0.x, r0.y
+(rpt2)nop
+mul.f r2.x, r0.x, c4.x
end
nop
nop
+nop
; FRAG: outputs: r2.x (1:0)
-; FRAG: inputs: r0.x (0:0,cm=f,il=8,b=0) r1.x (5:9,cm=f,il=8,b=1) r2.x (5:10,cm=f,il=12,b=1) r0.x (5:11,cm=f,il=16,b=1)
-; FRAG: 195 instructions, 0 half, 8 full
+; FRAG: inputs: r0.x (0:0,cm=f,il=8,b=0) r1.x (5:9,cm=f,il=8,b=1) r2.x (5:10,cm=f,il=12,b=1) r1.z (5:11,cm=f,il=16,b=1)
+; FRAG: 129 instructions, 0 half, 7 full