summaryrefslogtreecommitdiff
path: root/benchmark
diff options
context:
space:
mode:
authorMeng Mengmeng <mengmeng.meng@intel.com>2015-11-04 16:17:13 +0800
committerYang Rong <rong.r.yang@intel.com>2015-11-06 14:31:13 +0800
commit279b430ccddbf805f0ea372f9c6f47836c85a553 (patch)
tree852f3f4d96b9fe178f239f9a3d0b3e3def5ccfab /benchmark
parent0a8637910d114bce992c6a70134fb17fa9ac3ec1 (diff)
add benckmark for copy data from image to image
Set the data format as 1920 * 1080 four channels(RGBA) and type as char,short and int. Signed-off-by: Meng Mengmeng <mengmeng.meng@intel.com> Reviewed-by: Ruiling Song <ruiling.song@intel.com>
Diffstat (limited to 'benchmark')
-rw-r--r--benchmark/CMakeLists.txt3
-rw-r--r--benchmark/benchmark_copy_image.cpp70
2 files changed, 72 insertions, 1 deletions
diff --git a/benchmark/CMakeLists.txt b/benchmark/CMakeLists.txt
index 03a56f22..dd338293 100644
--- a/benchmark/CMakeLists.txt
+++ b/benchmark/CMakeLists.txt
@@ -17,7 +17,8 @@ set (benchmark_sources
benchmark_read_image.cpp
benchmark_copy_buffer_to_image.cpp
benchmark_copy_image_to_buffer.cpp
- benchmark_copy_buffer.cpp)
+ benchmark_copy_buffer.cpp
+ benchmark_copy_image.cpp)
SET(CMAKE_CXX_FLAGS "-DBUILD_BENCHMARK ${CMAKE_CXX_FLAGS}")
diff --git a/benchmark/benchmark_copy_image.cpp b/benchmark/benchmark_copy_image.cpp
new file mode 100644
index 00000000..92dffc91
--- /dev/null
+++ b/benchmark/benchmark_copy_image.cpp
@@ -0,0 +1,70 @@
+#include <string.h>
+#include "utests/utest_helper.hpp"
+#include <sys/time.h>
+
+#define BENCH_COPY_IMAGE(T, M, Q) \
+double benchmark_copy_image_ ##T(void) \
+{ \
+ struct timeval start,stop; \
+\
+ const size_t w = 1920; \
+ const size_t h = 1080; \
+ const size_t sz = 4 * w * h; \
+ cl_image_format format; \
+ cl_image_desc desc; \
+\
+ memset(&desc, 0x0, sizeof(cl_image_desc)); \
+ memset(&format, 0x0, sizeof(cl_image_format)); \
+\
+ OCL_CREATE_KERNEL("bench_copy_image"); \
+ buf_data[0] = (uint32_t*) malloc(sizeof(M) * sz); \
+ for (uint32_t i = 0; i < sz; ++i) { \
+ ((M*)buf_data[0])[i] = rand(); \
+ } \
+\
+ format.image_channel_order = CL_RGBA; \
+ format.image_channel_data_type = Q; \
+ desc.image_type = CL_MEM_OBJECT_IMAGE2D; \
+ desc.image_width = w; \
+ desc.image_height = h; \
+ desc.image_row_pitch = desc.image_width * sizeof(M) * 4; \
+ OCL_CREATE_IMAGE(buf[0], CL_MEM_COPY_HOST_PTR, &format, &desc, buf_data[0]); \
+\
+ desc.image_row_pitch = 0; \
+ OCL_CREATE_IMAGE(buf[1], 0, &format, &desc, NULL); \
+\
+ free(buf_data[0]); \
+ buf_data[0] = NULL; \
+\
+ OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]); \
+ OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]); \
+\
+ globals[0] = w; \
+ globals[1] = h; \
+ locals[0] = 16; \
+ locals[1] = 4; \
+\
+ gettimeofday(&start,0); \
+ for (size_t i=0; i<100; i++) { \
+ OCL_NDRANGE(2); \
+ } \
+ OCL_FINISH(); \
+\
+ OCL_MAP_BUFFER(1); \
+ OCL_UNMAP_BUFFER(1); \
+ gettimeofday(&stop,0); \
+\
+ clReleaseMemObject(buf[0]); \
+ free(buf_data[0]); \
+ buf_data[0] = NULL; \
+\
+ double elapsed = time_subtract(&stop, &start, 0); \
+\
+ return BANDWIDTH(sz * sizeof(M)*2 * 100, elapsed); \
+} \
+\
+MAKE_BENCHMARK_FROM_FUNCTION_KEEP_PROGRAM(benchmark_copy_image_ ##T,true);
+
+BENCH_COPY_IMAGE(uchar,unsigned char,CL_UNSIGNED_INT8)
+BENCH_COPY_IMAGE(ushort,unsigned short,CL_UNSIGNED_INT16)
+BENCH_COPY_IMAGE(uint,unsigned int,CL_UNSIGNED_INT32)