summaryrefslogtreecommitdiff
path: root/shaders/mpeg2/vld/field_read_x1y1_uv.g4i
blob: dd8877af3c80eda67de9de272ead11e242c92221 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
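/* GRF allocation:
   g1~g30: constant buffer
           g1~g2:intra IQ matrix
           g3~g4:non intra IQ matrix
           g5~g20:IDCT table
   g31:    thread payload
   g32:    message header used by every read in this file
   g40~g44, g46~g50: raw reference bytes returned by those reads (scratch)
   g58~g81:reference data
           g74~g77:U prediction written by this file
           g78~g81:V prediction written by this file
   g82:    thread payload backup
   g83~g106:IDCT data
   g115:   message descriptor for reading reference data
           (NOTE: not referenced in this file, which sends from g32 instead) */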
// Fetch the first group of chroma reference rows.
// g32 is the message header for every send below. It is not initialised in
// this file, so the block origin is presumably prepared by the including
// shader -- TODO confirm against the caller.
// Step 1: set the block-size dword (g32.8) and read an "8*16" block of U into
// g40..g43 and of V into g46..g49 (rlen 4 each).
mov (1) g32.8<1>UD 0x7000FUD {align1}; //8*16
send (16) 0 g40.0<1>UW g32<8,8,1>UW read(surface_u, 2, 0, 2) mlen 1 rlen 4 {align1};//U
send (16) 0 g46.0<1>UW g32<8,8,1>UW read(surface_v, 2, 0, 2) mlen 1 rlen 4 {align1};//V
// Step 2: advance g32.4 by 8 (presumably the Y origin of the block -- verify
// against the media block read header layout), shrink the block-size dword to
// 0x0F, and read one more register of U into g44 and of V into g50 (rlen 1).
// The arithmetic that follows uses g44/g50 as the row below the last one
// taken from g43/g49.
// Side effect: g32.4 and g32.8 keep the values written here.
add (1) g32.4<1>UD g32.4<1,1,1>UD 8UD {align1};
mov (1) g32.8<1>UD 0x0FUD {align1}; 
send (16) 0 g44.0<1>UW g32<8,8,1>UW read(surface_u, 2, 0, 2) mlen 1 rlen 1 {align1};//U
send (16) 0 g50.0<1>UW g32<8,8,1>UW read(surface_v, 2, 0, 2) mlen 1 rlen 1 {align1};//V
// U, output rows 0-3 (g74.0, g74.16, g75.0, g75.16; 8 UW each).
// Each output word is the sum of a 2x2 neighbourhood of source bytes:
//   out[r][x] = src[r][x] + src[r][x+1] + src[r+1][x] + src[r+1][x+1]
// where src[0..4] are the bytes at offset 0 of g40, g41, g42, g43, g44.
// Only offsets .0 and .1 of each source register are consumed here.
// The division by 4 is done later, once all sums are complete.

// Pass 1: left column, upper tap + lower tap.
add (8) g74.0<1>UW  g40.0<8,8,1>UB g41.0<8,8,1>UB {align1};
add (8) g74.16<1>UW g41.0<8,8,1>UB g42.0<8,8,1>UB {align1};
add (8) g75.0<1>UW  g42.0<8,8,1>UB g43.0<8,8,1>UB {align1};
add (8) g75.16<1>UW g43.0<8,8,1>UB g44.0<8,8,1>UB {align1};

// Pass 2: add the upper-right tap.
add (8) g74.0<1>UW  g74.0<8,8,1>UW  g40.1<8,8,1>UB {align1};
add (8) g74.16<1>UW g74.16<8,8,1>UW g41.1<8,8,1>UB {align1};
add (8) g75.0<1>UW  g75.0<8,8,1>UW  g42.1<8,8,1>UB {align1};
add (8) g75.16<1>UW g75.16<8,8,1>UW g43.1<8,8,1>UB {align1};

// Pass 3: add the lower-right tap.
add (8) g74.0<1>UW  g74.0<8,8,1>UW  g41.1<8,8,1>UB {align1};
add (8) g74.16<1>UW g74.16<8,8,1>UW g42.1<8,8,1>UB {align1};
add (8) g75.0<1>UW  g75.0<8,8,1>UW  g43.1<8,8,1>UB {align1};
add (8) g75.16<1>UW g75.16<8,8,1>UW g44.1<8,8,1>UB {align1};
// V, output rows 0-3 (g78.0, g78.16, g79.0, g79.16; 8 UW each).
// Each output word is the sum of a 2x2 neighbourhood of source bytes:
//   out[r][x] = src[r][x] + src[r][x+1] + src[r+1][x] + src[r+1][x+1]
// where src[0..4] are the bytes at offset 0 of g46, g47, g48, g49, g50.
// Only offsets .0 and .1 of each source register are consumed here.
// The division by 4 is done later, once all sums are complete.

// Pass 1: left column, upper tap + lower tap.
add (8) g78.0<1>UW  g46.0<8,8,1>UB g47.0<8,8,1>UB {align1};
add (8) g78.16<1>UW g47.0<8,8,1>UB g48.0<8,8,1>UB {align1};
add (8) g79.0<1>UW  g48.0<8,8,1>UB g49.0<8,8,1>UB {align1};
add (8) g79.16<1>UW g49.0<8,8,1>UB g50.0<8,8,1>UB {align1};

// Pass 2: add the upper-right tap.
add (8) g78.0<1>UW  g78.0<8,8,1>UW  g46.1<8,8,1>UB {align1};
add (8) g78.16<1>UW g78.16<8,8,1>UW g47.1<8,8,1>UB {align1};
add (8) g79.0<1>UW  g79.0<8,8,1>UW  g48.1<8,8,1>UB {align1};
add (8) g79.16<1>UW g79.16<8,8,1>UW g49.1<8,8,1>UB {align1};

// Pass 3: add the lower-right tap.
add (8) g78.0<1>UW  g78.0<8,8,1>UW  g47.1<8,8,1>UB {align1};
add (8) g78.16<1>UW g78.16<8,8,1>UW g48.1<8,8,1>UB {align1};
add (8) g79.0<1>UW  g79.0<8,8,1>UW  g49.1<8,8,1>UB {align1};
add (8) g79.16<1>UW g79.16<8,8,1>UW g50.1<8,8,1>UB {align1};

// Fetch the second group of chroma reference rows into the same scratch
// registers (g40..g44 for U, g46..g50 for V), overwriting the first group.
// g32.4 is not reset here: it still carries the +8 applied during the first
// fetch, so this "8*16" read starts 8 further along than the first one did
// (presumably 8 lines lower -- verify against the header layout).
mov (1) g32.8<1>UD 0x7000FUD {align1}; //8*16
send (16) 0 g40.0<1>UW g32<8,8,1>UW read(surface_u, 2, 0, 2) mlen 1 rlen 4 {align1};//U
send (16) 0 g46.0<1>UW g32<8,8,1>UW read(surface_v, 2, 0, 2) mlen 1 rlen 4 {align1};//V
// Advance g32.4 by another 8 and shrink the block-size dword to 0x0F to fetch
// the single extra register (g44 for U, g50 for V) that the following sums
// use as the row below g43/g49.
// Side effect: on exit g32.4 is 16 above its value at the top of this file,
// and g32.8 is 0x0F.
add (1) g32.4<1>UD g32.4<1,1,1>UD 8UD {align1};
mov (1) g32.8<1>UD 0x0FUD {align1}; 
send (16) 0 g44.0<1>UW g32<8,8,1>UW read(surface_u, 2, 0, 2) mlen 1 rlen 1 {align1};//U
send (16) 0 g50.0<1>UW g32<8,8,1>UW read(surface_v, 2, 0, 2) mlen 1 rlen 1 {align1};//V
// U, output rows 4-7 (g76.0, g76.16, g77.0, g77.16; 8 UW each).
// Same 2x2 sum as the first U group, applied to the freshly re-read
// g40..g44:
//   out[r][x] = src[r][x] + src[r][x+1] + src[r+1][x] + src[r+1][x+1]
// The division by 4 is done later, once all sums are complete.

// Pass 1: left column, upper tap + lower tap.
add (8) g76.0<1>UW  g40.0<8,8,1>UB g41.0<8,8,1>UB {align1};
add (8) g76.16<1>UW g41.0<8,8,1>UB g42.0<8,8,1>UB {align1};
add (8) g77.0<1>UW  g42.0<8,8,1>UB g43.0<8,8,1>UB {align1};
add (8) g77.16<1>UW g43.0<8,8,1>UB g44.0<8,8,1>UB {align1};

// Pass 2: add the upper-right tap.
add (8) g76.0<1>UW  g76.0<8,8,1>UW  g40.1<8,8,1>UB {align1};
add (8) g76.16<1>UW g76.16<8,8,1>UW g41.1<8,8,1>UB {align1};
add (8) g77.0<1>UW  g77.0<8,8,1>UW  g42.1<8,8,1>UB {align1};
add (8) g77.16<1>UW g77.16<8,8,1>UW g43.1<8,8,1>UB {align1};

// Pass 3: add the lower-right tap.
add (8) g76.0<1>UW  g76.0<8,8,1>UW  g41.1<8,8,1>UB {align1};
add (8) g76.16<1>UW g76.16<8,8,1>UW g42.1<8,8,1>UB {align1};
add (8) g77.0<1>UW  g77.0<8,8,1>UW  g43.1<8,8,1>UB {align1};
add (8) g77.16<1>UW g77.16<8,8,1>UW g44.1<8,8,1>UB {align1};
// V, output rows 4-7 (g80.0, g80.16, g81.0, g81.16; 8 UW each).
// Same 2x2 sum as the first V group, applied to the freshly re-read
// g46..g50:
//   out[r][x] = src[r][x] + src[r][x+1] + src[r+1][x] + src[r+1][x+1]
// The division by 4 is done later, once all sums are complete.

// Pass 1: left column, upper tap + lower tap.
add (8) g80.0<1>UW  g46.0<8,8,1>UB g47.0<8,8,1>UB {align1};
add (8) g80.16<1>UW g47.0<8,8,1>UB g48.0<8,8,1>UB {align1};
add (8) g81.0<1>UW  g48.0<8,8,1>UB g49.0<8,8,1>UB {align1};
add (8) g81.16<1>UW g49.0<8,8,1>UB g50.0<8,8,1>UB {align1};

// Pass 2: add the upper-right tap.
add (8) g80.0<1>UW  g80.0<8,8,1>UW  g46.1<8,8,1>UB {align1};
add (8) g80.16<1>UW g80.16<8,8,1>UW g47.1<8,8,1>UB {align1};
add (8) g81.0<1>UW  g81.0<8,8,1>UW  g48.1<8,8,1>UB {align1};
add (8) g81.16<1>UW g81.16<8,8,1>UW g49.1<8,8,1>UB {align1};

// Pass 3: add the lower-right tap.
add (8) g80.0<1>UW  g80.0<8,8,1>UW  g47.1<8,8,1>UB {align1};
add (8) g80.16<1>UW g80.16<8,8,1>UW g48.1<8,8,1>UB {align1};
add (8) g81.0<1>UW  g81.0<8,8,1>UW  g49.1<8,8,1>UB {align1};
add (8) g81.16<1>UW g81.16<8,8,1>UW g50.1<8,8,1>UB {align1};

// Turn the four-tap sums in g74..g81 into averages, rounding to nearest:
//   pred = (a + b + c + d + 2) >> 2
// A bare ">> 2" truncates, biasing every predicted sample downward by up to
// 3/4 LSB relative to the MPEG-2 half-sample prediction rule; that error
// accumulates across predicted pictures. The +2 bias restores the rounding.
// Range check: each sum is four UB values, so at most 4*255 + 2 = 1022,
// which fits in UW without overflow.
// Each compressed 32-wide op covers one register pair:
//   g74/g75 = U rows 0-3, g76/g77 = U rows 4-7,
//   g78/g79 = V rows 0-3, g80/g81 = V rows 4-7.
add (32) g74.0<1>UW g74.0<16,16,1>UW 2UW {align1 compr};
add (32) g76.0<1>UW g76.0<16,16,1>UW 2UW {align1 compr};
add (32) g78.0<1>UW g78.0<16,16,1>UW 2UW {align1 compr};
add (32) g80.0<1>UW g80.0<16,16,1>UW 2UW {align1 compr};

shr (32) g74.0<1>UW g74.0<16,16,1>UW 2UW {align1 compr};
shr (32) g76.0<1>UW g76.0<16,16,1>UW 2UW {align1 compr};
shr (32) g78.0<1>UW g78.0<16,16,1>UW 2UW {align1 compr};
shr (32) g80.0<1>UW g80.0<16,16,1>UW 2UW {align1 compr};