summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorJunyan He <junyan.he@intel.com>2017-06-11 13:50:09 +0800
committerYang Rong <rong.r.yang@intel.com>2017-08-02 17:16:29 +0800
commit10560132b3d6251d423588618de4d487a278a627 (patch)
treea58a887830a6350f503529c684a281a8fdddd9fa
parent16af56f366f3f673fe97adf866f926a842e15cd1 (diff)
Add cl_enqueue to handle all clEnqueueXXX API.
Every clEnqueueXXX API generates a cl_event and fills in its exec_data. Once all the events it depends on have completed, the cl_enqueue_handle function calls the corresponding function in device_api to do the actual work. Signed-off-by: Junyan He <junyan.he@intel.com>
-rw-r--r--runtime/cl_enqueue.c126
-rw-r--r--runtime/cl_enqueue.h214
2 files changed, 340 insertions, 0 deletions
diff --git a/runtime/cl_enqueue.c b/runtime/cl_enqueue.c
new file mode 100644
index 00000000..7de3414d
--- /dev/null
+++ b/runtime/cl_enqueue.c
@@ -0,0 +1,126 @@
+/*
+ * Copyright © 2012 Intel Corporation
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library. If not, see <http://www.gnu.org/licenses/>.
+ *
+ * Author: Rong Yang <rong.r.yang@intel.com>
+ */
+
+//#include "cl_image.h"
+#include "cl_enqueue.h"
+#include "cl_event.h"
+#include "cl_kernel.h"
+#include "cl_command_queue.h"
+#include "cl_utils.h"
+#include "cl_alloc.h"
+#include "cl_mem.h"
+#include "cl_device_id.h"
+#include <stdio.h>
+#include <string.h>
+#include <assert.h>
+#include <pthread.h>
+
+/*
+ * Release the buffers held by a native-kernel event.
+ *
+ * For each of exec_data.native_kernel.mem_list, .args and .mem_arg_loc:
+ * if the pointer is non-NULL it is passed to CL_FREE and then reset to
+ * NULL, so a second call on the same event frees nothing again.
+ *
+ * The event must carry an EnqueueNativeKernel command (checked by assert).
+ */
+LOCAL void
+cl_enqueue_delete_native_kernel(cl_event e)
+{
+  assert(e->exec_data.type == EnqueueNativeKernel);
+
+  if (e->exec_data.native_kernel.mem_list != NULL) {
+    CL_FREE(e->exec_data.native_kernel.mem_list);
+    e->exec_data.native_kernel.mem_list = NULL;
+  }
+
+  if (e->exec_data.native_kernel.args != NULL) {
+    CL_FREE(e->exec_data.native_kernel.args);
+    e->exec_data.native_kernel.args = NULL;
+  }
+
+  if (e->exec_data.native_kernel.mem_arg_loc != NULL) {
+    CL_FREE(e->exec_data.native_kernel.mem_arg_loc);
+    e->exec_data.native_kernel.mem_arg_loc = NULL;
+  }
+}
+
+/*
+ * Handle one status step of a native-kernel command.
+ *
+ * When status is CL_QUEUED, every entry of the command's mem_list is first
+ * passed to cl_mem_assure_allocated() for the queue's device; the first
+ * non-CL_SUCCESS result is returned immediately and the device hook is not
+ * called. Otherwise (and for every other status) the call is forwarded to
+ * the device's api.native_kernel hook and its result is returned.
+ */
+static cl_int
+cl_enqueue_handle_native_kernel(cl_event e, cl_int status)
+{
+  cl_command_queue queue = e->queue;
+
+  if (status == CL_QUEUED) {
+    cl_mem *mems = e->exec_data.native_kernel.mem_list;
+    cl_uint count = e->exec_data.native_kernel.mem_num;
+    cl_uint idx;
+
+    for (idx = 0; idx < count; idx++) {
+      cl_int ret;
+
+      assert(CL_OBJECT_IS_MEM(mems[idx]));
+      ret = cl_mem_assure_allocated(queue->device, mems[idx]);
+      if (ret != CL_SUCCESS) {
+        return ret;
+      }
+    }
+  }
+
+  return queue->device->api.native_kernel(e, status);
+}
+
+/*
+ * Handler for EnqueueMarker and EnqueueBarrier commands.
+ *
+ * There is nothing to execute here, so the handler reports success for
+ * every status. The return value is an error code like the other handlers
+ * in this file, hence CL_SUCCESS rather than the execution-status constant
+ * CL_COMPLETE (both are 0 in CL/cl.h, so callers see the same value).
+ */
+static cl_int
+cl_enqueue_handle_marker_or_barrier(cl_event e, cl_int status)
+{
+  /* Parameters are only present to match the handler signature. */
+  (void)e;
+  (void)status;
+
+  return CL_SUCCESS;
+}
+
+/*
+ * Dispatch an enqueued command to the handler for its command type.
+ *
+ * Switches on e->exec_data.type and forwards (e, status) unchanged to the
+ * matching cl_enqueue_handle_* function, returning that function's result.
+ * Command types that have no handler here return CL_SUCCESS.
+ *
+ * NOTE(review): EnqueueSVMMemMap, EnqueueSVMMemUnMap and EnqueueInvalid have
+ * no case of their own and therefore land in the default branch -- confirm
+ * that silently returning CL_SUCCESS is intended for them.
+ */
+LOCAL cl_int
+cl_enqueue_handle(cl_event e, cl_int status)
+{
+  switch (e->exec_data.type) {
+  /* Host <-> memory object transfers. */
+  case EnqueueReadBuffer:
+  case EnqueueReadBufferRect:
+  case EnqueueWriteBuffer:
+  case EnqueueWriteBufferRect:
+  case EnqueueReadImage:
+  case EnqueueWriteImage:
+    return cl_enqueue_handle_read_write_mem(e, status);
+
+  /* Memory object to memory object copies. */
+  case EnqueueCopyBuffer:
+  case EnqueueCopyBufferRect:
+  case EnqueueCopyImage:
+  case EnqueueCopyImageToBuffer:
+  case EnqueueCopyBufferToImage:
+    return cl_enqueue_handle_copy_mem(e, status);
+
+  /* Fills. */
+  case EnqueueFillBuffer:
+  case EnqueueFillImage:
+    return cl_enqueue_handle_fill_mem(e, status);
+
+  /* Map / unmap. */
+  case EnqueueMapBuffer:
+  case EnqueueMapImage:
+    return cl_enqueue_handle_map_mem(e, status);
+  case EnqueueUnmapMemObject:
+    return cl_enqueue_handle_unmap_mem(e, status);
+
+  /* Kernel execution. */
+  case EnqueueNDRangeKernel:
+    return cl_enqueue_handle_kernel_ndrange(e, status);
+  case EnqueueNativeKernel:
+    return cl_enqueue_handle_native_kernel(e, status);
+
+  /* Synchronization points. */
+  case EnqueueMarker:
+  case EnqueueBarrier:
+    return cl_enqueue_handle_marker_or_barrier(e, status);
+
+  /* SVM operations. */
+  case EnqueueSVMMemFree:
+    return cl_enqueue_handle_svm_free(e, status);
+  case EnqueueSVMMemCopy:
+    return cl_enqueue_handle_svm_copy(e, status);
+  case EnqueueSVMMemFill:
+    return cl_enqueue_handle_svm_fill(e, status);
+
+  /* Nothing to do for these (and for any type not listed above). */
+  case EnqueueReturnSuccesss:
+  case EnqueueMigrateMemObj:
+  default:
+    return CL_SUCCESS;
+  }
+}
diff --git a/runtime/cl_enqueue.h b/runtime/cl_enqueue.h
new file mode 100644
index 00000000..0ead4477
--- /dev/null
+++ b/runtime/cl_enqueue.h
@@ -0,0 +1,214 @@
+/*
+ * Copyright © 2012 Intel Corporation
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library. If not, see <http://www.gnu.org/licenses/>.
+ *
+ * Author: Rong Yang <rong.r.yang@intel.com>
+ */
+#ifndef __CL_ENQUEUE_H__
+#define __CL_ENQUEUE_H__
+
+#include "CL/cl.h"
+
+/*
+ * Command type stored in the `type` field of _cl_event_enqueue_data.
+ * cl_enqueue_handle() switches on this value to pick the handler to run.
+ */
+typedef enum {
+ /* Nothing to do for this command; cl_enqueue_handle() just returns
+  * CL_SUCCESS. The spelling (three 's') is kept because the identifier
+  * is referenced from cl_enqueue.c. */
+ EnqueueReturnSuccesss = 0, /* For some case, we have nothing to do, just return SUCCESS. */
+ EnqueueReadBuffer,
+ EnqueueReadBufferRect,
+ EnqueueWriteBuffer,
+ EnqueueWriteBufferRect,
+ EnqueueCopyBuffer,
+ EnqueueCopyBufferRect,
+ EnqueueReadImage,
+ EnqueueWriteImage,
+ EnqueueCopyImage,
+ EnqueueCopyImageToBuffer,
+ EnqueueCopyBufferToImage,
+ EnqueueMapBuffer,
+ EnqueueMapImage,
+ EnqueueUnmapMemObject,
+ EnqueueNDRangeKernel,
+ EnqueueNativeKernel,
+ EnqueueMarker,
+ EnqueueBarrier,
+ EnqueueFillBuffer,
+ EnqueueFillImage,
+ EnqueueMigrateMemObj,
+ EnqueueSVMMemFree,
+ EnqueueSVMMemMap,
+ EnqueueSVMMemUnMap,
+ EnqueueSVMMemCopy,
+ EnqueueSVMMemFill,
+ /* NOTE(review): presumably a sentinel / "no command" marker -- confirm. */
+ EnqueueInvalid
+} cl_event_enqueue_type;
+
+/*
+ * Per-command data: the command type plus the arguments of that command,
+ * kept in an anonymous union with one member struct per command family.
+ *
+ * NOTE(review): which union member is valid presumably follows `type`. Only
+ * the pairing native_kernel <-> EnqueueNativeKernel is visible in
+ * cl_enqueue.c; confirm the others against their handlers.
+ */
+typedef struct _cl_event_enqueue_data {
+ cl_event_enqueue_type type; /* Command type */
+ /* Opaque pointer; how it is used is not visible in this header. */
+ void *exec_ctx;
+
+ union {
+ /* Native kernel arguments. mem_list, args and mem_arg_loc are the
+  * pointers released by cl_enqueue_delete_native_kernel(). */
+ struct {
+ cl_mem *mem_list; /* mem_list of clEnqueueNativeKernel */
+ cl_uint mem_num;
+ void *args;
+ void **mem_arg_loc;
+ size_t cb_args;
+ void (*user_func)(void *);
+ } native_kernel;
+ /* Buffer map arguments. */
+ struct {
+ cl_mem mem_obj;
+ size_t offset; /* Mem object's offset */
+ size_t size; /* Size */
+ cl_bool unsync_map; /* Indicate the clEnqueueMapBuffer/Image is unsync map */
+ cl_bool write_map; /* Indicate if the clEnqueueMapBuffer is write enable */
+ void *ptr; /* Ptr for write and return value */
+ } map_buffer;
+ /* Image map arguments. */
+ struct {
+ cl_mem mem_obj;
+ size_t origin[3]; /* Origin */
+ size_t region[3]; /* Region */
+ size_t row_pitch; /* Row pitch */
+ size_t slice_pitch; /* Slice pitch */
+ cl_bool unsync_map; /* Indicate the clEnqueueMapBuffer/Image is unsync map */
+ cl_bool write_map; /* Indicate if the clEnqueueMapBuffer is write enable */
+ void *ptr; /* Ptr for write and return value */
+ } map_image;
+ /* Unmap arguments; carries both offset/size and origin/region fields. */
+ struct {
+ cl_mem mem_obj;
+ void *ptr;
+ size_t offset;
+ size_t size;
+ size_t origin[3]; /* Origin */
+ size_t region[3]; /* Region */
+ size_t row_pitch; /* Row pitch */
+ size_t slice_pitch; /* Slice pitch */
+ } unmap;
+ /* ND-range kernel launch arguments. */
+ struct {
+ cl_kernel kernel;
+ cl_int work_dim;
+ size_t global_wk_off[3];
+ size_t global_wk_sz[3];
+ size_t local_wk_sz[3];
+ } nd_range;
+ /* Buffer-to-buffer copy arguments. */
+ struct {
+ cl_mem src;
+ cl_mem dst;
+ size_t src_offset;
+ size_t dst_offset;
+ size_t cb;
+ } copy_buffer;
+ /* Buffer fill arguments. */
+ struct {
+ void *pattern;
+ size_t pattern_size;
+ cl_mem buffer;
+ size_t offset;
+ size_t size;
+ } fill_buffer;
+ /* Rectangular buffer-to-buffer copy arguments. */
+ struct {
+ cl_mem src_buf;
+ cl_mem dst_buf;
+ size_t src_origin[3];
+ size_t dst_origin[3];
+ size_t region[3];
+ size_t src_row_pitch;
+ size_t src_slice_pitch;
+ size_t dst_row_pitch;
+ size_t dst_slice_pitch;
+ } copy_buffer_rect;
+ /* Image fill arguments. */
+ struct {
+ void *pattern;
+ cl_mem image;
+ size_t origin[3];
+ size_t region[3];
+ } fill_image;
+ /* Image-to-image copy arguments. */
+ struct {
+ cl_mem src_image;
+ cl_mem dst_image;
+ size_t src_origin[3];
+ size_t dst_origin[3];
+ size_t region[3];
+ } copy_image;
+ /* Arguments for a copy between an image and a buffer.
+  * NOTE(review): presumably shared by both copy directions -- confirm. */
+ struct {
+ cl_mem buffer;
+ size_t offset;
+ cl_mem image;
+ size_t origin[3];
+ size_t region[3];
+ } copy_image_and_buffer;
+ /* Buffer read/write arguments. */
+ struct {
+ cl_mem buffer;
+ size_t offset;
+ size_t size;
+ void *ptr;
+ } read_write_buffer;
+ /* Rectangular buffer read/write arguments. */
+ struct {
+ cl_mem buffer;
+ void *ptr;
+ size_t origin[3];
+ size_t host_origin[3];
+ size_t region[3];
+ size_t row_pitch;
+ size_t slice_pitch;
+ size_t host_row_pitch;
+ size_t host_slice_pitch;
+ } read_write_buffer_rect;
+ /* Image read/write arguments. */
+ struct {
+ void *ptr;
+ cl_mem image;
+ size_t region[3];
+ size_t origin[3];
+ size_t row_pitch;
+ size_t slice_pitch;
+ } read_write_image;
+ /* SVM free arguments, including the optional callback and its data. */
+ struct {
+ void **ptrs;
+ cl_mem *mem_ptrs;
+ cl_uint mem_num;
+ cl_command_queue queue;
+ void (*free_func)(cl_command_queue, cl_uint, void **, void *);
+ void *user_data;
+ } svm_free;
+ /* SVM map arguments. */
+ struct {
+ void *ptr;
+ cl_mem svm;
+ size_t size;
+ cl_bool write_map;
+ cl_bool unsync_map;
+ } svm_map;
+ /* SVM unmap arguments. */
+ struct {
+ void *ptr;
+ cl_mem svm;
+ } svm_unmap;
+ /* SVM copy arguments. */
+ struct {
+ void *src_ptr;
+ void *dst_ptr;
+ cl_mem src;
+ cl_mem dst;
+ size_t size;
+ } svm_copy;
+ /* SVM fill arguments. */
+ struct {
+ void *ptr;
+ cl_mem svm;
+ void *pattern;
+ size_t pattern_size;
+ size_t size;
+ } svm_fill;
+ };
+} _cl_event_enqueue_data;
+/* Pointer alias for the structure above. */
+typedef _cl_event_enqueue_data *cl_event_enqueue_data;
+
+/*
+ * Do real enqueue commands: switch on e->exec_data.type and forward
+ * (e, status) to the handler for that command type, returning its result.
+ * Command types without a handler return CL_SUCCESS.
+ */
+extern cl_int cl_enqueue_handle(cl_event e, cl_int status);
+/*
+ * Free the native_kernel mem_list, args and mem_arg_loc buffers of e and
+ * reset those pointers to NULL. e must be an EnqueueNativeKernel event.
+ */
+extern void cl_enqueue_delete_native_kernel(cl_event e);
+
+#endif /* __CL_ENQUEUE_H__ */