blob: b1432b2d1aae3e6f8f6e3123e66c858aa4c139da (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
|
#define SWAP64(A) \
((((A) & 0xff00000000000000) >> 56) | \
(((A) & 0x00ff000000000000) >> 40) | \
(((A) & 0x0000ff0000000000) >> 24) | \
(((A) & 0x000000ff00000000) >> 8) | \
(((A) & 0x00000000ff000000) << 8) | \
(((A) & 0x0000000000ff0000) << 24) | \
(((A) & 0x000000000000ff00) << 40) | \
(((A) & 0x00000000000000ff) << 56) )
kernel void compiler_bswap(global uint * src0, global uint * dst0, global ushort * src1, global ushort * dst1,
int src2, global int * dst2, short src3, global short * dst3, global ulong* src4, global ulong* dst4, long src5, global long* dst5) {
if (get_global_id(0) % 2 == 0) {
dst0[get_global_id(0)] = __builtin_bswap32(src0[get_global_id(0)]);
} else {
dst0[get_global_id(0)] = src0[get_global_id(0)];
}
dst1[get_global_id(0)] = __builtin_bswap16(src1[get_global_id(0)]);
if (get_global_id(0) % 2 == 1) {
dst1[get_global_id(0)] = __builtin_bswap16(dst1[get_global_id(0)] + 1);
}
dst2[get_global_id(0)] = __builtin_bswap32(src2);
dst3[get_global_id(0)] = __builtin_bswap16(src3);
dst4[get_global_id(0)] = SWAP64(src4[get_global_id(0)]);
dst5[get_global_id(0)] = SWAP64(src5);
}
|