summaryrefslogtreecommitdiff
path: root/utests/compiler_program_global.cpp
blob: caadf8b836b533ead283f7cbc96f6f8cf301c322 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
#include "utest_helper.hpp"
#include "utest_file_map.hpp"

static int init_program(const char* name, cl_context ctx, cl_program *pg )
{
  cl_int err;
  char* ker_path = cl_do_kiss_path(name, device);

  cl_file_map_t *fm = cl_file_map_new();
  err = cl_file_map_open(fm, ker_path);
  if(err != CL_FILE_MAP_SUCCESS)
    OCL_ASSERT(0);
  const char *src = cl_file_map_begin(fm);

  *pg = clCreateProgramWithSource(ctx, 1, &src, NULL, &err);
  free(ker_path);
  cl_file_map_delete(fm);
  return 0;

}

/*
 * Unit test for compiler_program_global.cl, built with -cl-std=CL2.0.
 *
 * Skipped (plain return) when cl_check_ocl20(false) reports failure.
 * Otherwise the test:
 *   1. builds the program and creates the kernels compiler_program_global0
 *      and compiler_program_global1;
 *   2. fills buf[0] with 0..n-1 and runs kernel 0 on buf[0], then kernel 1
 *      on buf[1], each with the scalar argument 1;
 *   3. checks that buf[1][i] == i for every index except 11..15, which must
 *      hold 7, 4, 2, 3 and 2 respectively.
 * The kernel source is not part of this file, so why those five entries
 * differ is not visible here.
 */
void compiler_program_global()
{
  if(!cl_check_ocl20(false))
    return;
  const int n = 16;
  cl_int err;

  // Setup kernel and buffers
  cl_program program = NULL;
  init_program("compiler_program_global.cl", ctx, &program);
  // init_program() always returns 0, so validate the handle itself.
  OCL_ASSERT(program != NULL);
  OCL_CALL (clBuildProgram, program, 1, &device, "-cl-std=CL2.0", NULL, NULL);

  // OCL_ASSERT rather than assert(): the check must survive NDEBUG builds and
  // match how every other failure in this test is reported.
  cl_kernel k0 = clCreateKernel(program, "compiler_program_global0", &err);
  OCL_ASSERT(err == CL_SUCCESS);
  cl_kernel k1 = clCreateKernel(program, "compiler_program_global1", &err);
  OCL_ASSERT(err == CL_SUCCESS);

  OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(int), NULL);
  OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(int), NULL);

  OCL_CALL (clSetKernelArg, k0, 0, sizeof(cl_mem), &buf[0]);
  OCL_CALL (clSetKernelArg, k1, 0, sizeof(cl_mem), &buf[1]);

  int dynamic = 1;
  OCL_CALL (clSetKernelArg, k0, 1, sizeof(cl_int), &dynamic);
  OCL_CALL (clSetKernelArg, k1, 1, sizeof(cl_int), &dynamic);

  // One work-group covering all n elements.
  globals[0] = n;
  locals[0] = n;

  OCL_MAP_BUFFER(0);
  for (int i = 0; i <  n; ++i)
    ((int*)buf_data[0])[i] = i;
  OCL_UNMAP_BUFFER(0);

  // Run the kernel on GPU
  OCL_CALL (clEnqueueNDRangeKernel, queue, k0, 1, NULL, globals, locals, 0, NULL, NULL);
  OCL_CALL (clEnqueueNDRangeKernel, queue, k1, 1, NULL, globals, locals, 0, NULL, NULL);

  // Compare
  OCL_MAP_BUFFER(1);
  const int *dst = (const int*)buf_data[1];
  for (int32_t i = 0; i < n; ++i) {
    int expected;
    switch(i) {
      case 11: expected = 7; break;
      case 12: expected = 4; break;
      case 13: expected = 2; break;
      case 14: expected = 3; break;
      case 15: expected = 2; break;
      default: expected = i; break;
    }
    OCL_ASSERT(dst[i] == expected);
  }
  OCL_UNMAP_BUFFER(1);
  clReleaseKernel(k0);
  clReleaseKernel(k1);
  clReleaseProgram(program);
}

// Hand compiler_program_global to the unit-test harness. The macro is defined
// outside this file; presumably it registers the function as a test case.
MAKE_UTEST_FROM_FUNCTION(compiler_program_global);