blob: 18e657ce3c94d92f467029c0e67b3703af95a482 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
|
/*!
[config]
name: amdgcn call clobbers
clc_version_min: 10
device_regex: gfx[\d]*
[test]
name: callee saved sgpr
kernel_name: call_clobber_s40
dimensions: 1
global_size: 1 0 0
arg_out: 0 buffer int[1] 0xabcd1234
[test]
name: callee saved vgpr
kernel_name: call_clobber_v40
dimensions: 1
global_size: 1 0 0
arg_out: 0 buffer int[1] 0xabcd1234
!*/
/* Refuse to build when __AMDGCN__ is not defined: the inline assembly in
 * this file hard-codes the register names s40 and v40. */
#ifndef __AMDGCN__
#error This test is only for amdgcn
#endif
/*
 * Overwrite register s40 with 0xdead.
 *
 * Marked noinline so that callers reach this code through an actual call
 * instead of having the asm statement merged into their own body.
 * s40 is listed in the clobber list so the compiler knows this function
 * modifies it.
 */
__attribute__((noinline))
void clobber_s40()
{
__asm volatile("s_mov_b32 s40, 0xdead" : : : "s40");
}
/*
 * Kernel for the "callee saved sgpr" test case.
 *
 * Writes a sentinel into s40, calls clobber_s40() (which overwrites s40),
 * then reads s40 back and stores it through ret. The test header expects
 * the stored value to be 0xabcd1234, i.e. the value written before the call.
 *
 * ret: global buffer; element 0 receives the value read back from s40.
 */
kernel void call_clobber_s40(__global int* ret)
{
/* Seed s40 with the sentinel the test expects to read back. */
__asm volatile("s_mov_b32 s40, 0xabcd1234" : : : "s40");
/* The callee writes 0xdead into s40. */
clobber_s40();
int tmp;
/* Copy s40 into the "=v"-constrained output operand so it can be stored.
 * NOTE(review): s40 is only read here yet is listed as a clobber, and
 * nothing visible tells the compiler that s40 must stay untouched between
 * the first asm statement and this one - presumably the test relies on the
 * compiler not reusing s40 in between; confirm if this test becomes flaky. */
__asm volatile("v_mov_b32 %0, s40"
: "=v"(tmp)
:
: "s40");
*ret = tmp;
}
/*
 * Overwrite register v40 with 0xdead.
 *
 * Marked noinline so that callers reach this code through an actual call
 * instead of having the asm statement merged into their own body.
 * v40 is listed in the clobber list so the compiler knows this function
 * modifies it.
 */
__attribute__((noinline))
void clobber_v40()
{
__asm volatile("v_mov_b32 v40, 0xdead" : : : "v40");
}
/*
 * Kernel for the "callee saved vgpr" test case.
 *
 * Writes a sentinel into v40, calls clobber_v40() (which overwrites v40),
 * then reads v40 back and stores it through ret. The test header expects
 * the stored value to be 0xabcd1234, i.e. the value written before the call.
 *
 * ret: global buffer; element 0 receives the value read back from v40.
 */
kernel void call_clobber_v40(__global int* ret)
{
/* Seed v40 with the sentinel the test expects to read back. */
__asm volatile("v_mov_b32 v40, 0xabcd1234" : : : "v40");
/* The callee writes 0xdead into v40. */
clobber_v40();
int tmp;
/* Copy v40 into the "=v"-constrained output operand so it can be stored.
 * NOTE(review): v40 is only read here yet is listed as a clobber, and
 * nothing visible tells the compiler that v40 must stay untouched between
 * the first asm statement and this one - presumably the test relies on the
 * compiler not reusing v40 in between; confirm if this test becomes flaky. */
__asm volatile("v_mov_b32 %0, v40"
: "=v"(tmp)
:
: "v40");
*ret = tmp;
}
|