diff options
-rw-r--r-- | utests/compiler_copy_large_image.cpp | 198 |
1 files changed, 198 insertions, 0 deletions
diff --git a/utests/compiler_copy_large_image.cpp b/utests/compiler_copy_large_image.cpp index 66998a73..37fdaab5 100644 --- a/utests/compiler_copy_large_image.cpp +++ b/utests/compiler_copy_large_image.cpp @@ -119,3 +119,201 @@ static void compiler_copy_large_image_1(void) } MAKE_UTEST_FROM_FUNCTION(compiler_copy_large_image_1); + +static void compiler_copy_large_image_2(void) +{ + const size_t w = 4096; + const size_t h = 4096; + const size_t origin[3] = {0, 0, 0}; + const size_t region[3] = {w, h, 1}; + size_t image_row_pitch, image_slice_pitch; + cl_int status; + cl_image_format format; + cl_image_desc desc; + cl_sampler sampler; + uint8_t *p = NULL; + uint8_t *q = NULL; + + memset(&desc, 0x0, sizeof(cl_image_desc)); + memset(&format, 0x0, sizeof(cl_image_format)); + + // Setup kernel and images + OCL_CREATE_KERNEL("test_copy_image"); + buf_data[0] = (uint32_t*) malloc(sizeof(uint32_t) * w * h * 4); + for (uint32_t j = 0; j < h; ++j) + for (uint32_t i = 0; i < w; i++) + for (uint32_t k = 0; k < 4; k++) + ((uint32_t*)buf_data[0])[(j * w + i) * 4 + k] = k; + + format.image_channel_order = CL_RGBA; + format.image_channel_data_type = CL_UNSIGNED_INT32; + desc.image_type = CL_MEM_OBJECT_IMAGE2D; + desc.image_width = w; + desc.image_height = h; + desc.image_row_pitch = 0; + OCL_CREATE_IMAGE(buf[0], 0, &format, &desc, NULL); + OCL_CREATE_IMAGE(buf[1], 0, &format, &desc, NULL); + OCL_CREATE_SAMPLER(sampler, CL_ADDRESS_REPEAT, CL_FILTER_NEAREST); + + // Use mapping mode to fill data into src image + buf_data[1] = clEnqueueMapImage(queue, buf[0], CL_TRUE, CL_MAP_WRITE, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + + OCL_ASSERT(image_slice_pitch == 0); + memcpy(buf_data[1], buf_data[0], image_row_pitch * h); + + clEnqueueUnmapMemObject(queue, buf[0], buf_data[1], 0, NULL, NULL); + + // Check src image + buf_data[1] = clEnqueueMapImage(queue, buf[0], CL_TRUE, CL_MAP_READ, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + + OCL_ASSERT(image_slice_pitch == 0); + + for (uint32_t j = 0; j < h; ++j) { + p = ((uint8_t*)buf_data[0]) + j * image_row_pitch; + q = ((uint8_t*)buf_data[1]) + j * image_row_pitch; + for (uint32_t i = 0; i < w; i++) + for (uint32_t k = 0; k < 4; k++) + OCL_ASSERT(((uint32_t*)p)[i * 4 + k] == ((uint32_t*)q)[i * 4 + k]); + } + + clEnqueueUnmapMemObject(queue, buf[0], buf_data[1], 0, NULL, NULL); + + free(buf_data[0]); + buf_data[0] = NULL; + buf_data[1] = NULL; + + // Run the kernel + OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]); + OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]); + OCL_SET_ARG(2, sizeof(sampler), &sampler); + globals[0] = w; + globals[1] = h; + locals[0] = 16; + locals[1] = 16; + OCL_NDRANGE(2); + + // Check result + buf_data[0] = clEnqueueMapImage(queue, buf[0], CL_TRUE, CL_MAP_READ, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + buf_data[1] = clEnqueueMapImage(queue, buf[1], CL_TRUE, CL_MAP_READ, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + + for (uint32_t j = 0; j < h; ++j) { + p = ((uint8_t*)buf_data[0]) + j * image_row_pitch; + q = ((uint8_t*)buf_data[1]) + j * image_row_pitch; + for (uint32_t i = 0; i < w; i++) + for (uint32_t k = 0; k < 4; k++) + OCL_ASSERT(((uint32_t*)p)[i * 4 + k] == ((uint32_t*)q)[i * 4 + k]); + } + + clEnqueueUnmapMemObject(queue, buf[0], buf_data[0], 0, NULL, NULL); + clEnqueueUnmapMemObject(queue, buf[1], buf_data[1], 0, NULL, NULL); + + OCL_CALL(clReleaseSampler, sampler); +} + +MAKE_UTEST_FROM_FUNCTION(compiler_copy_large_image_2); + +static void compiler_copy_large_image_3(void) +{ + const size_t w = 4096; + const size_t h = 4096; + size_t origin[3] = {5, 5, 0}; + size_t region[3] = {8, 8, 1}; + size_t image_row_pitch, image_slice_pitch; + cl_int status; + cl_image_format format; + cl_image_desc desc; + cl_sampler sampler; + uint8_t *p = NULL; + uint8_t *q = NULL; + + memset(&desc, 0x0, sizeof(cl_image_desc)); + memset(&format, 0x0, sizeof(cl_image_format)); + + // Setup kernel and images + OCL_CREATE_KERNEL("test_copy_image"); + buf_data[0] = (uint32_t*) malloc(sizeof(uint32_t) * region[0] * region[1] * 4); + for (uint32_t j = 0; j < region[1]; ++j) + for (uint32_t i = 0; i < region[0]; i++) + for (uint32_t k = 0; k < 4; k++) + ((uint32_t*)buf_data[0])[(j * region[0] + i) * 4 + k] = k; + + format.image_channel_order = CL_RGBA; + format.image_channel_data_type = CL_UNSIGNED_INT32; + desc.image_type = CL_MEM_OBJECT_IMAGE2D; + desc.image_width = w; + desc.image_height = h; + desc.image_row_pitch = 0; + OCL_CREATE_IMAGE(buf[0], 0, &format, &desc, NULL); + OCL_CREATE_IMAGE(buf[1], 0, &format, &desc, NULL); + OCL_CREATE_SAMPLER(sampler, CL_ADDRESS_REPEAT, CL_FILTER_NEAREST); + + // Use mapping mode to fill data into src image + buf_data[1] = clEnqueueMapImage(queue, buf[0], CL_TRUE, CL_MAP_WRITE, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + + OCL_ASSERT(image_slice_pitch == 0); + memcpy(buf_data[1], buf_data[0], region[0] * region[1] * 4 * sizeof(uint32_t)); + + clEnqueueUnmapMemObject(queue, buf[0], buf_data[1], 0, NULL, NULL); + + // Check src image + buf_data[1] = clEnqueueMapImage(queue, buf[0], CL_TRUE, CL_MAP_READ, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + + OCL_ASSERT(image_slice_pitch == 0); + + for (uint32_t j = 0; j < region[1]; ++j) { + p = ((uint8_t*)buf_data[0]) + j * image_row_pitch; + q = ((uint8_t*)buf_data[1]) + j * image_row_pitch; + for (uint32_t i = 0; i < region[0]; i++) + for (uint32_t k = 0; k < 4; k++) + OCL_ASSERT(((uint32_t*)p)[i * 4 + k] == ((uint32_t*)q)[i * 4 + k]); + } + + clEnqueueUnmapMemObject(queue, buf[0], buf_data[1], 0, NULL, NULL); + + free(buf_data[0]); + buf_data[0] = NULL; + buf_data[1] = NULL; + + // Run the kernel + OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]); + OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]); + OCL_SET_ARG(2, sizeof(sampler), &sampler); + globals[0] = w; + globals[1] = h; + locals[0] = 16; + locals[1] = 16; + OCL_NDRANGE(2); + + // Check result + origin[0] = 0; + origin[1] = 0; + origin[2] = 0; + region[0] = w; + region[1] = h; + region[2] = 1; + buf_data[0] = clEnqueueMapImage(queue, buf[0], CL_TRUE, CL_MAP_READ, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + buf_data[1] = clEnqueueMapImage(queue, buf[1], CL_TRUE, CL_MAP_READ, origin, region, + &image_row_pitch, &image_slice_pitch, 0, NULL, NULL, &status); + + for (uint32_t j = 0; j < h; ++j) { + p = ((uint8_t*)buf_data[0]) + j * image_row_pitch; + q = ((uint8_t*)buf_data[1]) + j * image_row_pitch; + for (uint32_t i = 0; i < w; i++) + for (uint32_t k = 0; k < 4; k++) + OCL_ASSERT(((uint32_t*)p)[i * 4 + k] == ((uint32_t*)q)[i * 4 + k]); + } + + clEnqueueUnmapMemObject(queue, buf[0], buf_data[0], 0, NULL, NULL); + clEnqueueUnmapMemObject(queue, buf[1], buf_data[1], 0, NULL, NULL); + + OCL_CALL(clReleaseSampler, sampler); +} + +MAKE_UTEST_FROM_FUNCTION(compiler_copy_large_image_3); |