diff options
author | Luo Xionghu <xionghu.luo@intel.com> | 2017-03-08 23:00:38 +0800 |
---|---|---|
committer | Yang Rong <rong.r.yang@intel.com> | 2017-03-13 16:59:57 +0800 |
commit | db571247424b3189673ed6b73908971e5716a813 (patch) | |
tree | d1868eb738abf189381f74f00ef29db92df51c93 /utests/compiler_subgroup_media_block_read.cpp | |
parent | 9360073d15ec545cd40beef90f863dd28a3a14c9 (diff) |
cl_intel_media_block_io READ related unit tests.
Signed-off-by: Luo Xionghu <xionghu.luo@intel.com>
Reviewed-by: Pan Xiuli <xiuli.pan@intel.com>
Diffstat (limited to 'utests/compiler_subgroup_media_block_read.cpp')
-rw-r--r-- | utests/compiler_subgroup_media_block_read.cpp | 212 |
1 files changed, 212 insertions, 0 deletions
diff --git a/utests/compiler_subgroup_media_block_read.cpp b/utests/compiler_subgroup_media_block_read.cpp new file mode 100644 index 00000000..41289a22 --- /dev/null +++ b/utests/compiler_subgroup_media_block_read.cpp @@ -0,0 +1,212 @@ +#include <cstdint> +#include <cstring> +#include <iostream> +#include "utest_helper.hpp" + +using namespace std; + +/* set to 1 for debug, output of input-expected data */ +#define DEBUG_STDOUT 0 + +/* NDRANGE */ +#define WG_GLOBAL_SIZE_X 64 +#define WG_GLOBAL_SIZE_Y 1 +#define WG_LOCAL_SIZE_X 64 +#define WG_LOCAL_SIZE_Y 1 +/* + * Generic compute-expected function for meida block read + */ +template<class T> +static void compute_expected_media(T* input, + T* expected, + size_t VEC_SIZE) +{ + for(uint32_t w = 0; w < WG_GLOBAL_SIZE_X; ++w) { + for (uint32_t h = 0; h < VEC_SIZE * WG_GLOBAL_SIZE_Y; ++h) { + expected[h + w * VEC_SIZE * WG_GLOBAL_SIZE_Y] = w; + } + } +} + +/* + * Generic input-expected generate function for media block read + */ +template<class T> +static void generate_data_media(T* &input, + T* &expected, + size_t VEC_SIZE) +{ + /* allocate input and expected arrays */ + int* input_ui = new int[WG_GLOBAL_SIZE_X * WG_GLOBAL_SIZE_Y * VEC_SIZE]; + input = (T*)input_ui; + expected = new T[WG_GLOBAL_SIZE_X * WG_GLOBAL_SIZE_Y * VEC_SIZE]; + + /* seed for random inputs */ + srand (time(NULL)); + +#if DEBUG_STDOUT + cout << endl << "IN: " << endl; +#endif + uint32_t rpitch = sizeof(uint32_t) * WG_GLOBAL_SIZE_X / sizeof(T); + /* generate inputs and expected values */ + for (uint32_t h = 0; h < VEC_SIZE * WG_GLOBAL_SIZE_Y; ++h) { + for(uint32_t w = 0; w < WG_GLOBAL_SIZE_X; ++w) + { + /* initially 0, augment after */ + input[w + h * rpitch] = w; + +#if DEBUG_STDOUT + /* output generated input */ + cout << setw(4) << (uint32_t)input[w + h * rpitch] << ", " ; + if((w+ 1) % 8 == 0) + cout << endl; +#endif + } + } + /* expected values */ + compute_expected_media(input, expected, VEC_SIZE); + +#if DEBUG_STDOUT + /* output expected input */ + cout << endl << "EXP: " << endl; + for(uint32_t gid = 0; gid < WG_GLOBAL_SIZE_X; gid++) + { + cout << "("; + for(uint32_t vsz = 0; vsz < VEC_SIZE * WG_GLOBAL_SIZE_Y; vsz++) + cout << setw(4) << (uint32_t)expected[gid* VEC_SIZE * WG_GLOBAL_SIZE_Y + vsz] << ", " ; + cout << ")"; + if((gid + 1) % 8 == 0) + cout << endl; + cout << endl; + } +#endif +} + +/* + * Generic subgroup utest function for media block read + */ +template<class T> +static void subgroup_generic_media(T* input, + T* expected, + size_t VEC_SIZE, + const char* kernel_name) +{ + OCL_CALL(cl_kernel_init, "compiler_subgroup_image_block_read.cl", kernel_name, + SOURCE, "-DMEDIA_BLOCK_IO"); + + cl_image_format format; + cl_image_desc desc; + + memset(&desc, 0x0, sizeof(cl_image_desc)); + memset(&format, 0x0, sizeof(cl_image_format)); + + /* get simd size */ + globals[0] = WG_GLOBAL_SIZE_X; + globals[1] = WG_GLOBAL_SIZE_Y; + locals[0] = WG_LOCAL_SIZE_X; + locals[1] = WG_LOCAL_SIZE_Y; + size_t SIMD_SIZE = 0; + OCL_CALL(utestclGetKernelSubGroupInfoKHR,kernel,device,CL_KERNEL_MAX_SUB_GROUP_SIZE_FOR_NDRANGE_KHR,sizeof(size_t)*1,locals,sizeof(size_t),&SIMD_SIZE,NULL); + + if(SIMD_SIZE != 16) { + printf("skip! this case could only run under simd16 mode!\n"); + return; + } + + size_t buf_sz = VEC_SIZE * WG_GLOBAL_SIZE_X * WG_GLOBAL_SIZE_Y; + /* input and expected data */ + generate_data_media(input, expected, VEC_SIZE); + + /* prepare input for datatype */ + format.image_channel_order = CL_R; + format.image_channel_data_type = CL_UNSIGNED_INT32; + desc.image_type = CL_MEM_OBJECT_IMAGE2D; + desc.image_width = WG_GLOBAL_SIZE_X; + desc.image_height = VEC_SIZE * WG_GLOBAL_SIZE_Y; + desc.image_row_pitch = WG_GLOBAL_SIZE_X * sizeof(uint32_t); + + OCL_CREATE_IMAGE(buf[0], CL_MEM_COPY_HOST_PTR, &format, &desc, input); + OCL_CREATE_BUFFER(buf[1], 0, buf_sz * sizeof(T), NULL); + + OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]); + OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]); + + /* run the kernel on GPU */ + OCL_NDRANGE(2); + + /* check if mismatch */ + OCL_MAP_BUFFER(1); + uint32_t mismatches = 0; + + for (uint32_t i = 0; i < buf_sz; i++) + if(((T *)buf_data[1])[i] != *(expected + i)) + { + /* found mismatch, increment */ + mismatches++; + +#if DEBUG_STDOUT + /* output mismatch */ + cout << "Err at " << i << ", " << + (uint32_t)((T *)buf_data[1])[i] << " != " << (uint32_t)*(expected + i) << endl; +#endif + } + +#if DEBUG_STDOUT + /* output mismatch count */ + cout << "mismatches " << mismatches << endl; +#endif + + OCL_UNMAP_BUFFER(1); + + OCL_ASSERT(mismatches == 0); + free(input); + free(expected); +} + +#define compiler_subgroup_media_block_read_ui(name, kernel, vec_size) \ +void name(void) \ +{ \ + if(!cl_check_media_block_io()) \ + return; \ + cl_uint *input = NULL; \ + cl_uint *expected = NULL; \ + subgroup_generic_media(input, expected, vec_size, #kernel); \ +} \ +MAKE_UTEST_FROM_FUNCTION(name); +compiler_subgroup_media_block_read_ui(compiler_subgroup_media_block_read_ui1, compiler_subgroup_media_block_read_ui1, 1) +compiler_subgroup_media_block_read_ui(compiler_subgroup_media_block_read_ui2, compiler_subgroup_media_block_read_ui2, 2) +compiler_subgroup_media_block_read_ui(compiler_subgroup_media_block_read_ui4, compiler_subgroup_media_block_read_ui4, 4) +compiler_subgroup_media_block_read_ui(compiler_subgroup_media_block_read_ui8, compiler_subgroup_media_block_read_ui8, 8) + +#define compiler_subgroup_media_block_read_us(name, kernel, vec_size) \ +void name(void) \ +{ \ + if(!cl_check_media_block_io()) \ + return; \ + cl_ushort *input = NULL; \ + cl_ushort *expected = NULL; \ + subgroup_generic_media(input, expected, vec_size, #kernel); \ +} \ +MAKE_UTEST_FROM_FUNCTION(name); +compiler_subgroup_media_block_read_us(compiler_subgroup_media_block_read_us1, compiler_subgroup_media_block_read_us1, 1) +compiler_subgroup_media_block_read_us(compiler_subgroup_media_block_read_us2, compiler_subgroup_media_block_read_us2, 2) +compiler_subgroup_media_block_read_us(compiler_subgroup_media_block_read_us4, compiler_subgroup_media_block_read_us4, 4) +compiler_subgroup_media_block_read_us(compiler_subgroup_media_block_read_us8, compiler_subgroup_media_block_read_us8, 8) +//the us16 case could only run under SIMD8 mode. +//compiler_subgroup_media_block_read_us(compiler_subgroup_media_block_read_us16, compiler_subgroup_media_block_read_us16, 16) + +#define compiler_subgroup_media_block_read_uc(name, kernel, vec_size) \ +void name(void) \ +{ \ + if(!cl_check_media_block_io()) \ + return; \ + cl_uchar *input = NULL; \ + cl_uchar *expected = NULL; \ + subgroup_generic_media(input, expected, vec_size, #kernel); \ +} \ +MAKE_UTEST_FROM_FUNCTION(name); +compiler_subgroup_media_block_read_uc(compiler_subgroup_media_block_read_uc1, compiler_subgroup_media_block_read_uc1, 1) +compiler_subgroup_media_block_read_uc(compiler_subgroup_media_block_read_uc2, compiler_subgroup_media_block_read_uc2, 2) +compiler_subgroup_media_block_read_uc(compiler_subgroup_media_block_read_uc4, compiler_subgroup_media_block_read_uc4, 4) +compiler_subgroup_media_block_read_uc(compiler_subgroup_media_block_read_uc8, compiler_subgroup_media_block_read_uc8, 8) +compiler_subgroup_media_block_read_uc(compiler_subgroup_media_block_read_uc16, compiler_subgroup_media_block_read_uc16, 16) |