summaryrefslogtreecommitdiff
path: root/opencl/box-max.cl.h
blob: 7a64f1d6b96ee7d5594ebb6073466cc055d6a380 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
/*
 * OpenCL C source for a two-pass box "max" filter, embedded as a C string.
 *
 * kernel_max_hor (in, aux, width, radius)
 *   Work-item (get_global_id(0), get_global_id(1)) is treated as (row, column).
 *   Input rows are addressed with a stride of (width + 2 * radius) and the
 *   centre sample sits at column offset `radius`, so the kernel reads the
 *   2 * radius + 1 consecutive float4 values in[in_index - radius] ..
 *   in[in_index + radius] and stores their component-wise maximum to
 *   aux[row * width + column].  Work-items with column >= width do nothing.
 *
 * kernel_max_ver (aux, out, width, radius)
 *   Starting at aux[row * width + column], reads 2 * radius + 1 float4 values
 *   spaced `width` elements apart and stores their component-wise maximum to
 *   out[row * width + column].  Work-items with column >= width do nothing.
 *   NOTE(review): this implies aux holds 2 * radius more rows than out --
 *   confirm against the host code that sizes the buffers.
 *
 * The running maximum is seeded with -FLT_MAX (the lowest finite float).
 * Seeding with FLT_MIN would be wrong: FLT_MIN is the smallest *positive*
 * normalized float, so a window containing only zero or negative samples
 * would yield FLT_MIN instead of the real maximum.
 *
 * `max < v ? v : max` on float4 operands is the OpenCL C vector ternary,
 * which selects per component.
 */
static const char* box_max_cl_source = 
"__kernel void kernel_max_hor (__global const float4     *in,                  \n"
"                              __global       float4     *aux,                 \n"
"                              int width, int radius)                          \n"
"{                                                                             \n"
"  const int in_index = get_global_id(0) * (width + 2 * radius)                \n"
"                       + (radius + get_global_id (1));                        \n"
"                                                                              \n"
"  const int aux_index = get_global_id(0) * width + get_global_id (1);         \n"
"  int i;                                                                      \n"
"  float4 max;                                                                 \n"
"  float4 in_v;                                                                \n"
"                                                                              \n"
"  max = (float4)(-FLT_MAX);                                                   \n"
"                                                                              \n"
"  if (get_global_id(1) < width)                                               \n"
"    {                                                                         \n"
"      for (i=-radius; i <= radius; i++)                                       \n"
"        {                                                                     \n"
"          in_v = in[in_index + i];                                            \n"
"          max = max < in_v ? in_v : max;                                      \n"
"        }                                                                     \n"
"        aux[aux_index] = max;                                                 \n"
"    }                                                                         \n"
"}                                                                             \n"
"                                                                              \n"
"__kernel void kernel_max_ver (__global const float4     *aux,                 \n"
"                              __global       float4     *out,                 \n"
"                              int width, int radius)                          \n"
"{                                                                             \n"
"                                                                              \n"
"  const int out_index = get_global_id(0) * width + get_global_id (1);         \n"
"  int aux_index = out_index;                                                  \n"
"  int i;                                                                      \n"
"  float4 max;                                                                 \n"
"  float4 aux_v;                                                               \n"
"                                                                              \n"
"  max = (float4)(-FLT_MAX);                                                   \n"
"                                                                              \n"
"  if(get_global_id(1) < width)                                                \n"
"    {                                                                         \n"
"      for (i=-radius; i <= radius; i++)                                       \n"
"        {                                                                     \n"
"          aux_v = aux[aux_index];                                             \n"
"          max = max < aux_v ? aux_v : max;                                    \n"
"          aux_index += width;                                                 \n"
"        }                                                                     \n"
"        out[out_index] = max;                                                 \n"
"    }                                                                         \n"
"}                                                                             \n"
;