/*
* Copyright © 2012 Intel Corporation
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this library. If not, see .
*
* Author: Benjamin Segovia
*/
#include "cl_kernel.h"
#include "cl_program.h"
#include "cl_device_id.h"
#include "cl_context.h"
#include "cl_alloc.h"
#include "cl_utils.h"
#include "cl_khr_icd.h"
#include "cl_gbe_loader.h"
#include "cl_cmrt.h"
#include "CL/cl.h"
#include "CL/cl_intel.h"
#include "CL/cl_ext.h"
#include
#include
#include
#include
#include
#include
#include
#include
static void
cl_program_release_sources(cl_program p)
{
if (p->source) {
cl_free(p->source);
p->source = NULL;
}
}
static void
cl_program_release_binary(cl_program p)
{
if (p->binary) {
cl_free(p->binary);
p->binary = NULL;
}
}
LOCAL void
cl_program_delete(cl_program p)
{
uint32_t ref, i;
if (p == NULL)
return;
/* We are not done with it yet */
if ((ref = CL_OBJECT_DEC_REF(p)) > 1) return;
/* Destroy the sources and binary if still allocated */
cl_program_release_sources(p);
cl_program_release_binary(p);
/* Release the build options. */
if (p->build_opts) {
cl_free(p->build_opts);
p->build_opts = NULL;
}
if (p->build_log) {
free(p->build_log);
p->build_log = NULL;
}
#ifdef HAS_CMRT
if (p->cmrt_program != NULL)
cmrt_destroy_program(p);
else
#endif
{
cl_free(p->bin); /* Free the blob */
for (i = 0; i < p->ker_n; ++i) /* Free the kernels */
cl_kernel_delete(p->ker[i]);
cl_free(p->ker);
}
if (p->global_data_ptr)
cl_buffer_unreference(p->global_data);
cl_free(p->global_data_ptr);
/* Remove it from the list */
cl_context_remove_program(p->ctx, p);
/* Free the program as allocated by the compiler */
if (p->opaque) {
if (CompilerSupported())
//For static variables release, gbeLoader may have been released, so
//compiler_program_clean_llvm_resource and interp_program_delete may be NULL.
if(compiler_program_clean_llvm_resource)
compiler_program_clean_llvm_resource(p->opaque);
if(interp_program_delete)
interp_program_delete(p->opaque);
}
CL_OBJECT_DESTROY_BASE(p);
cl_free(p);
}
#define BUILD_LOG_MAX_SIZE (1024*1024U)
LOCAL cl_program
cl_program_new(cl_context ctx)
{
cl_program p = NULL;
/* Allocate the structure */
TRY_ALLOC_NO_ERR (p, CALLOC(struct _cl_program));
CL_OBJECT_INIT_BASE(p, CL_OBJECT_PROGRAM_MAGIC);
p->build_status = CL_BUILD_NONE;
p->cmrt_program = NULL;
p->build_log = calloc(BUILD_LOG_MAX_SIZE, sizeof(char));
if (p->build_log)
p->build_log_max_sz = BUILD_LOG_MAX_SIZE;
/* The queue also belongs to its context */
cl_context_add_program(ctx, p);
exit:
return p;
error:
cl_program_delete(p);
goto exit;
}
LOCAL void
cl_program_add_ref(cl_program p)
{
assert(p);
CL_OBJECT_INC_REF(p);
}
static cl_int
cl_program_load_gen_program(cl_program p)
{
cl_int err = CL_SUCCESS;
uint32_t i;
assert(p->opaque != NULL);
p->ker_n = interp_program_get_kernel_num(p->opaque);
/* Allocate the kernel array */
TRY_ALLOC (p->ker, CALLOC_ARRAY(cl_kernel, p->ker_n));
for (i = 0; i < p->ker_n; ++i) {
const gbe_kernel opaque = interp_program_get_kernel(p->opaque, i);
assert(opaque != NULL);
TRY_ALLOC (p->ker[i], cl_kernel_new(p));
cl_kernel_setup(p->ker[i], opaque);
}
error:
return err;
}
#define BINARY_HEADER_LENGTH 5
static const unsigned char binary_type_header[BHI_MAX][BINARY_HEADER_LENGTH]= \
{{'B','C', 0xC0, 0xDE},
{1, 'B', 'C', 0xC0, 0xDE},
{2, 'B', 'C', 0xC0, 0xDE},
{1, 'G','E', 'N', 'C'},
{'C','I', 'S', 'A'},
};
LOCAL cl_bool headerCompare(const unsigned char *BufPtr, BINARY_HEADER_INDEX index)
{
bool matched = true;
int length = (index == BHI_SPIR || index == BHI_CMRT) ? BINARY_HEADER_LENGTH -1 :BINARY_HEADER_LENGTH;
int i = 0;
if(index == BHI_GEN_BINARY)
i = 1;
for (; i < length; ++i)
{
matched = matched && (BufPtr[i] == binary_type_header[index][i]);
}
if(index == BHI_GEN_BINARY && matched) {
if(BufPtr[0] != binary_type_header[index][0]) {
DEBUGP(DL_WARNING, "Beignet binary format have been changed, please generate binary again.\n");
matched = false;
}
}
return matched;
}
#define isSPIR(BufPtr) headerCompare(BufPtr, BHI_SPIR)
#define isLLVM_C_O(BufPtr) headerCompare(BufPtr, BHI_COMPIRED_OBJECT)
#define isLLVM_LIB(BufPtr) headerCompare(BufPtr, BHI_LIBRARY)
#define isGenBinary(BufPtr) headerCompare(BufPtr, BHI_GEN_BINARY)
#define isCMRT(BufPtr) headerCompare(BufPtr, BHI_CMRT)
static cl_int get_program_global_data(cl_program prog) {
//OpenCL 1.2 would never call this function, and OpenCL 2.0 alwasy HAS_BO_SET_SOFTPIN.
#ifdef HAS_BO_SET_SOFTPIN
cl_buffer_mgr bufmgr = NULL;
bufmgr = cl_context_get_bufmgr(prog->ctx);
assert(bufmgr);
size_t const_size = interp_program_get_global_constant_size(prog->opaque);
if (const_size == 0) return CL_SUCCESS;
int page_size = getpagesize();
size_t alignedSz = ALIGN(const_size, page_size);
char * p = (char*)cl_aligned_malloc(alignedSz, page_size);
prog->global_data_ptr = p;
interp_program_get_global_constant_data(prog->opaque, (char*)p);
prog->global_data = cl_buffer_alloc_userptr(bufmgr, "program global data", p, alignedSz, 0);
cl_buffer_set_softpin_offset(prog->global_data, (size_t)p);
cl_buffer_set_bo_use_full_range(prog->global_data, 1);
uint32_t reloc_count = interp_program_get_global_reloc_count(prog->opaque);
if (reloc_count > 0) {
uint32_t x;
struct RelocEntry {int refOffset; int defOffset;};
char *temp = (char*) malloc(reloc_count *sizeof(int)*2);
interp_program_get_global_reloc_table(prog->opaque, temp);
for (x = 0; x < reloc_count; x++) {
int ref_offset = ((struct RelocEntry *)temp)[x].refOffset;
*(uint64_t*)&(p[ref_offset]) = ((struct RelocEntry *)temp)[x].defOffset + (uint64_t)p;
}
free(temp);
}
#if 0
int x = 0;
for (x = 0; x < const_size; x++) {
printf("offset %d data: %x\n", x, (unsigned)p[x]);
}
#endif
#endif
return CL_SUCCESS;
}
LOCAL size_t cl_program_get_global_variable_size(cl_program prog) {
return interp_program_get_global_constant_size(prog->opaque);
}
LOCAL cl_program
cl_program_create_from_binary(cl_context ctx,
cl_uint num_devices,
const cl_device_id * devices,
const size_t * lengths,
const unsigned char ** binaries,
cl_int * binary_status,
cl_int * errcode_ret)
{
cl_program program = NULL;
cl_int err = CL_SUCCESS;
assert(ctx);
INVALID_DEVICE_IF (num_devices != 1);
INVALID_DEVICE_IF (devices == NULL);
INVALID_DEVICE_IF (devices[0] != ctx->devices[0]);
INVALID_VALUE_IF (binaries == NULL);
INVALID_VALUE_IF (lengths == NULL);
if (binaries[0] == NULL) {
err = CL_INVALID_VALUE;
if (binary_status)
binary_status[0] = CL_INVALID_VALUE;
goto error;
}
//need at least 4 bytes to check the binary type.
if (lengths[0] == 0 || lengths[0] < 4) {
err = CL_INVALID_VALUE;
if (binary_status)
binary_status[0] = CL_INVALID_VALUE;
goto error;
}
program = cl_program_new(ctx);
if (UNLIKELY(program == NULL)) {
err = CL_OUT_OF_HOST_MEMORY;
goto error;
}
TRY_ALLOC(program->binary, cl_calloc(lengths[0], sizeof(char)));
memcpy(program->binary, binaries[0], lengths[0]);
program->binary_sz = lengths[0];
program->source_type = FROM_BINARY;
if (isCMRT((unsigned char*)program->binary)) {
program->source_type = FROM_CMRT;
}else if(isSPIR((unsigned char*)program->binary)) {
char* typed_binary;
TRY_ALLOC(typed_binary, cl_calloc(lengths[0]+1, sizeof(char)));
memcpy(typed_binary+1, binaries[0], lengths[0]);
*typed_binary = 1;
program->opaque = compiler_program_new_from_llvm_binary(program->ctx->devices[0]->device_id, typed_binary, program->binary_sz+1);
cl_free(typed_binary);
if (UNLIKELY(program->opaque == NULL)) {
err = CL_INVALID_PROGRAM;
goto error;
}
program->source_type = FROM_LLVM_SPIR;
program->binary_type = CL_PROGRAM_BINARY_TYPE_INTERMEDIATE;
}else if(isLLVM_C_O((unsigned char*)program->binary) || isLLVM_LIB((unsigned char*)program->binary)) {
if(*program->binary == BHI_COMPIRED_OBJECT){
program->binary_type = CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT;
}else if(*program->binary == BHI_LIBRARY){
program->binary_type = CL_PROGRAM_BINARY_TYPE_LIBRARY;
}else{
err= CL_INVALID_BINARY;
goto error;
}
program->opaque = compiler_program_new_from_llvm_binary(program->ctx->devices[0]->device_id, program->binary, program->binary_sz);
if (UNLIKELY(program->opaque == NULL)) {
err = CL_INVALID_PROGRAM;
goto error;
}
program->source_type = FROM_LLVM;
}
else if (isGenBinary((unsigned char*)program->binary)) {
program->opaque = interp_program_new_from_binary(program->ctx->devices[0]->device_id, program->binary, program->binary_sz);
if (UNLIKELY(program->opaque == NULL)) {
DEBUGP(DL_ERROR, "Incompatible binary, please delete the binary and generate again.");
err = CL_INVALID_PROGRAM;
goto error;
}
/* Create all the kernels */
TRY (cl_program_load_gen_program, program);
program->binary_type = CL_PROGRAM_BINARY_TYPE_EXECUTABLE;
}
else {
err= CL_INVALID_BINARY;
goto error;
}
if (binary_status)
binary_status[0] = CL_SUCCESS;
exit:
if (errcode_ret)
*errcode_ret = err;
return program;
error:
cl_program_delete(program);
program = NULL;
goto exit;
return CL_SUCCESS;
}
LOCAL cl_program
cl_program_create_with_built_in_kernles(cl_context ctx,
cl_uint num_devices,
const cl_device_id * devices,
const char * kernel_names,
cl_int * errcode_ret)
{
cl_int err = CL_SUCCESS;
assert(ctx);
INVALID_DEVICE_IF (num_devices != 1);
INVALID_DEVICE_IF (devices == NULL);
INVALID_DEVICE_IF (devices[0] != ctx->devices[0]);
cl_int binary_status = CL_SUCCESS;
extern char cl_internal_built_in_kernel_str[];
extern size_t cl_internal_built_in_kernel_str_size;
char* p_built_in_kernel_str =cl_internal_built_in_kernel_str;
cl_program built_in_prgs = cl_program_create_from_binary(ctx, 1,
&ctx->devices[0],
(size_t*)&cl_internal_built_in_kernel_str_size,
(const unsigned char **)&p_built_in_kernel_str,
&binary_status, &err);
if (!built_in_prgs)
return NULL;
err = cl_program_build(built_in_prgs, NULL);
if (err != CL_SUCCESS)
return NULL;
built_in_prgs->is_built = 1;
exit:
if (errcode_ret)
*errcode_ret = err;
return built_in_prgs;
error:
goto exit;
return CL_SUCCESS;
}
LOCAL cl_program
cl_program_create_from_llvm(cl_context ctx,
cl_uint num_devices,
const cl_device_id *devices,
const char *file_name,
cl_int *errcode_ret)
{
cl_program program = NULL;
cl_int err = CL_SUCCESS;
assert(ctx);
INVALID_DEVICE_IF (num_devices != 1);
INVALID_DEVICE_IF (devices == NULL);
INVALID_DEVICE_IF (devices[0] != ctx->devices[0]);
INVALID_VALUE_IF (file_name == NULL);
program = cl_program_new(ctx);
if (UNLIKELY(program == NULL)) {
err = CL_OUT_OF_HOST_MEMORY;
goto error;
}
program->opaque = compiler_program_new_from_llvm_file(ctx->devices[0]->device_id, file_name, program->build_log_max_sz, program->build_log, &program->build_log_sz);
if (UNLIKELY(program->opaque == NULL)) {
err = CL_INVALID_PROGRAM;
goto error;
}
/* Create all the kernels */
TRY (cl_program_load_gen_program, program);
program->source_type = FROM_LLVM;
exit:
if (errcode_ret)
*errcode_ret = err;
return program;
error:
cl_program_delete(program);
program = NULL;
goto exit;
}
LOCAL cl_program
cl_program_create_from_source(cl_context ctx,
cl_uint count,
const char **strings,
const size_t *lengths,
cl_int *errcode_ret)
{
cl_program program = NULL;
cl_int err = CL_SUCCESS;
cl_uint i;
int32_t * lens = NULL;
int32_t len_total = 0;
assert(ctx);
char * p = NULL;
// the real compilation step will be done at build time since we do not have
// yet the compilation options
program = cl_program_new(ctx);
if (UNLIKELY(program == NULL)) {
err = CL_OUT_OF_HOST_MEMORY;
goto error;
}
TRY_ALLOC (lens, cl_calloc(count, sizeof(int32_t)));
for (i = 0; i < (int) count; ++i) {
size_t len;
if (lengths == NULL || lengths[i] == 0)
len = strlen(strings[i]);
else
len = lengths[i];
lens[i] = len;
len_total += len;
}
TRY_ALLOC(program->source, cl_calloc(len_total+1, sizeof(char)));
p = program->source;
for (i = 0; i < (int) count; ++i) {
memcpy(p, strings[i], lens[i]);
p += lens[i];
}
*p = '\0';
program->source_type = FROM_SOURCE;
program->binary_type = CL_PROGRAM_BINARY_TYPE_NONE;
exit:
cl_free(lens);
lens = NULL;
if (errcode_ret)
*errcode_ret = err;
return program;
error:
cl_program_delete(program);
program = NULL;
goto exit;
}
/* Before we do the real work, we need to check whether our platform
cl version can meet -cl-std= */
static int check_cl_version_option(cl_program p, const char* options) {
const char* s = NULL;
int ver1 = 0;
int ver2 = 0;
char version_str[64] = {0};
if (options && (s = strstr(options, "-cl-std="))) {
if (s + strlen("-cl-std=CLX.X") > options + strlen(options)) {
return 0;
}
if (s[8] != 'C' || s[9] != 'L' || s[10] > '9' || s[10] < '0' || s[11] != '.'
|| s[12] > '9' || s[12] < '0') {
return 0;
}
ver1 = (s[10] - '0') * 10 + (s[12] - '0');
if (cl_get_device_info(p->ctx->devices[0], CL_DEVICE_OPENCL_C_VERSION, sizeof(version_str),
version_str, NULL) != CL_SUCCESS)
return 0;
assert(strstr(version_str, "OpenCL") && version_str[0] == 'O');
ver2 = (version_str[9] - '0') * 10 + (version_str[11] - '0');
if (ver2 < ver1)
return 0;
return 1;
}
return 1;
}
LOCAL cl_int
cl_program_build(cl_program p, const char *options)
{
cl_int err = CL_SUCCESS;
int i = 0;
int copyed = 0;
if (CL_OBJECT_GET_REF(p) > 1) {
err = CL_INVALID_OPERATION;
goto error;
}
#if HAS_CMRT
if (p->source_type == FROM_CMRT) {
//only here we begins to invoke cmrt
//break spec to return other errors such as CL_DEVICE_NOT_FOUND
err = cmrt_build_program(p, options);
if (err == CL_SUCCESS) {
p->build_status = CL_BUILD_SUCCESS;
p->binary_type = CL_PROGRAM_BINARY_TYPE_EXECUTABLE;
return CL_SUCCESS;
} else
goto error;
}
#endif
if (!check_cl_version_option(p, options)) {
err = CL_BUILD_PROGRAM_FAILURE;
goto error;
}
if (options) {
if(p->build_opts == NULL || strcmp(options, p->build_opts) != 0) {
if(p->build_opts) {
cl_free(p->build_opts);
p->build_opts = NULL;
}
TRY_ALLOC (p->build_opts, cl_calloc(strlen(options) + 1, sizeof(char)));
memcpy(p->build_opts, options, strlen(options));
}
}
if (options == NULL && p->build_opts) {
cl_free(p->build_opts);
p->build_opts = NULL;
}
if (p->source_type == FROM_SOURCE) {
if (!CompilerSupported()) {
err = CL_COMPILER_NOT_AVAILABLE;
goto error;
}
p->opaque = compiler_program_new_from_source(p->ctx->devices[0]->device_id, p->source, p->build_log_max_sz, options, p->build_log, &p->build_log_sz);
if (UNLIKELY(p->opaque == NULL)) {
if (p->build_log_sz > 0 && strstr(p->build_log, "error: error reading 'options'"))
err = CL_INVALID_BUILD_OPTIONS;
else
err = CL_BUILD_PROGRAM_FAILURE;
goto error;
}
/* Create all the kernels */
TRY (cl_program_load_gen_program, p);
} else if (p->source_type == FROM_LLVM || p->source_type == FROM_LLVM_SPIR) {
if (!CompilerSupported()) {
err = CL_COMPILER_NOT_AVAILABLE;
goto error;
}
compiler_program_build_from_llvm(p->opaque, p->build_log_max_sz, p->build_log, &p->build_log_sz, options);
if (UNLIKELY(p->opaque == NULL)) {
if (p->build_log_sz > 0 && strstr(p->build_log, "error: error reading 'options'"))
err = CL_INVALID_BUILD_OPTIONS;
else
err = CL_BUILD_PROGRAM_FAILURE;
goto error;
}
/* Create all the kernels */
TRY (cl_program_load_gen_program, p);
} else if (p->source_type == FROM_BINARY && p->binary_type != CL_PROGRAM_BINARY_TYPE_EXECUTABLE) {
p->opaque = interp_program_new_from_binary(p->ctx->devices[0]->device_id, p->binary, p->binary_sz);
if (UNLIKELY(p->opaque == NULL)) {
err = CL_BUILD_PROGRAM_FAILURE;
goto error;
}
/* Create all the kernels */
TRY (cl_program_load_gen_program, p);
}
p->binary_type = CL_PROGRAM_BINARY_TYPE_EXECUTABLE;
for (i = 0; i < p->ker_n; i ++) {
const gbe_kernel opaque = interp_program_get_kernel(p->opaque, i);
p->bin_sz += interp_kernel_get_code_size(opaque);
}
TRY_ALLOC (p->bin, cl_calloc(p->bin_sz, sizeof(char)));
for (i = 0; i < p->ker_n; i ++) {
const gbe_kernel opaque = interp_program_get_kernel(p->opaque, i);
size_t sz = interp_kernel_get_code_size(opaque);
memcpy(p->bin + copyed, interp_kernel_get_code(opaque), sz);
copyed += sz;
}
uint32_t ocl_version = interp_kernel_get_ocl_version(interp_program_get_kernel(p->opaque, 0));
if (ocl_version >= 200 && (err = get_program_global_data(p)) != CL_SUCCESS)
goto error;
p->is_built = 1;
p->build_status = CL_BUILD_SUCCESS;
return CL_SUCCESS;
error:
p->build_status = CL_BUILD_ERROR;
return err;
}
cl_program
cl_program_link(cl_context context,
cl_uint num_input_programs,
const cl_program * input_programs,
const char * options,
cl_int* errcode_ret)
{
cl_program p = NULL;
cl_int err = CL_SUCCESS;
cl_int i = 0;
int copyed = 0;
cl_bool ret = 0;
int avialable_program = 0;
//Although we don't use options, but still need check options
if(!compiler_program_check_opt(options)) {
err = CL_INVALID_LINKER_OPTIONS;
goto error;
}
const char kernel_arg_option[] = "-cl-kernel-arg-info";
cl_bool option_exist = CL_TRUE;
for(i = 0; i < num_input_programs; i++) {
//num_input_programs >0 and input_programs MUST not NULL, so compare with input_programs[0] directly.
if(input_programs[i]->binary_type == CL_PROGRAM_BINARY_TYPE_LIBRARY ||
input_programs[i]->binary_type == CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT ||
input_programs[i]->binary_type == CL_PROGRAM_BINARY_TYPE_INTERMEDIATE) {
avialable_program++;
}
if(input_programs[i]->build_opts == NULL || strstr(input_programs[i]->build_opts, kernel_arg_option) == NULL ) {
option_exist = CL_FALSE;
}
}
//None of program contain a compilerd binary or library.
if(avialable_program == 0) {
goto done;
}
//Must all of program contain a compilerd binary or library.
if(avialable_program < num_input_programs) {
err = CL_INVALID_OPERATION;
goto error;
}
p = cl_program_new(context);
if (UNLIKELY(p == NULL)) {
err = CL_OUT_OF_HOST_MEMORY;
goto error;
}
if(option_exist) {
TRY_ALLOC (p->build_opts, cl_calloc(strlen(kernel_arg_option) + 1, sizeof(char)));
memcpy(p->build_opts, kernel_arg_option, strlen(kernel_arg_option));
}
if (!check_cl_version_option(p, options)) {
err = CL_BUILD_PROGRAM_FAILURE;
goto error;
}
p->opaque = compiler_program_new_gen_program(context->devices[0]->device_id, NULL, NULL, NULL);
for(i = 0; i < num_input_programs; i++) {
// if program create with llvm binary, need deserilize first to get module.
if(input_programs[i])
ret = compiler_program_link_program(p->opaque, input_programs[i]->opaque,
p->build_log_max_sz, p->build_log, &p->build_log_sz);
if (UNLIKELY(ret)) {
err = CL_LINK_PROGRAM_FAILURE;
goto error;
}
}
if(options && strstr(options, "-create-library")){
p->binary_type = CL_PROGRAM_BINARY_TYPE_LIBRARY;
goto done;
}else{
p->binary_type = CL_PROGRAM_BINARY_TYPE_EXECUTABLE;
}
compiler_program_build_from_llvm(p->opaque, p->build_log_max_sz, p->build_log, &p->build_log_sz, options);
/* Create all the kernels */
TRY (cl_program_load_gen_program, p);
for (i = 0; i < p->ker_n; i ++) {
const gbe_kernel opaque = interp_program_get_kernel(p->opaque, i);
p->bin_sz += interp_kernel_get_code_size(opaque);
}
TRY_ALLOC (p->bin, cl_calloc(p->bin_sz, sizeof(char)));
for (i = 0; i < p->ker_n; i ++) {
const gbe_kernel opaque = interp_program_get_kernel(p->opaque, i);
size_t sz = interp_kernel_get_code_size(opaque);
memcpy(p->bin + copyed, interp_kernel_get_code(opaque), sz);
copyed += sz;
}
uint32_t ocl_version = interp_kernel_get_ocl_version(interp_program_get_kernel(p->opaque, 0));
if (ocl_version >= 200 && (err = get_program_global_data(p)) != CL_SUCCESS)
goto error;
done:
if(p) p->is_built = 1;
if(p) p->build_status = CL_BUILD_SUCCESS;
if (errcode_ret)
*errcode_ret = err;
return p;
error:
if(p) p->build_status = CL_BUILD_ERROR;
if (errcode_ret)
*errcode_ret = err;
return p;
}
#define FILE_PATH_LENGTH 1024
LOCAL cl_int
cl_program_compile(cl_program p,
cl_uint num_input_headers,
const cl_program * input_headers,
const char ** header_include_names,
const char* options)
{
cl_int err = CL_SUCCESS;
int i = 0;
if (CL_OBJECT_GET_REF(p) > 1) {
err = CL_INVALID_OPERATION;
goto error;
}
if (!check_cl_version_option(p, options)) {
err = CL_BUILD_PROGRAM_FAILURE;
goto error;
}
if (options) {
if(p->build_opts == NULL || strcmp(options, p->build_opts) != 0) {
if(p->build_opts) {
cl_free(p->build_opts);
p->build_opts = NULL;
}
TRY_ALLOC (p->build_opts, cl_calloc(strlen(options) + 1, sizeof(char)));
memcpy(p->build_opts, options, strlen(options));
}
}
if (options == NULL && p->build_opts) {
cl_free(p->build_opts);
p->build_opts = NULL;
}
#if defined(__ANDROID__)
char temp_header_template[]= "/data/local/tmp/beignet.XXXXXX";
#else
char temp_header_template[]= "/tmp/beignet.XXXXXX";
#endif
char* temp_header_path = mkdtemp(temp_header_template);
if (p->source_type == FROM_SOURCE) {
if (!CompilerSupported()) {
err = CL_COMPILER_NOT_AVAILABLE;
goto error;
}
//write the headers to /tmp/beignet.XXXXXX for include.
for (i = 0; i < num_input_headers; i++) {
if(header_include_names[i] == NULL || input_headers[i] == NULL)
continue;
char temp_path[FILE_PATH_LENGTH]="";
strncat(temp_path, temp_header_path, strlen(temp_header_path));
strncat(temp_path, "/", 1);
strncat(temp_path, header_include_names[i], strlen(header_include_names[i]));
if(strlen(temp_path) >= FILE_PATH_LENGTH - 1 ) {
err = CL_COMPILE_PROGRAM_FAILURE;
goto error;
}
temp_path[strlen(temp_path)+1] = '\0';
char* dirc = strdup(temp_path);
char* dir = dirname(dirc);
mkdir(dir, 0755);
if(access(dir, R_OK|W_OK) != 0){
err = CL_COMPILE_PROGRAM_FAILURE;
goto error;
}
free(dirc);
FILE* pfile = fopen(temp_path, "wb");
if(pfile){
fwrite(input_headers[i]->source, strlen(input_headers[i]->source), 1, pfile);
fclose(pfile);
}else{
err = CL_COMPILE_PROGRAM_FAILURE;
goto error;
}
}
p->opaque = compiler_program_compile_from_source(p->ctx->devices[0]->device_id, p->source, temp_header_path,
p->build_log_max_sz, options, p->build_log, &p->build_log_sz);
char rm_path[255]="rm ";
strncat(rm_path, temp_header_path, strlen(temp_header_path));
strncat(rm_path, " -rf", 4);
int temp = system(rm_path);
if(temp){
assert(0);
}
if (UNLIKELY(p->opaque == NULL)) {
if (p->build_log_sz > 0 && strstr(p->build_log, "error: error reading 'options'"))
err = CL_INVALID_COMPILER_OPTIONS;
else
err = CL_COMPILE_PROGRAM_FAILURE;
goto error;
}
/* Create all the kernels */
p->binary_type = CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT;
}else if(p->source_type == FROM_BINARY){
err = CL_INVALID_OPERATION;
return err;
}
p->is_built = 1;
p->build_status = CL_BUILD_SUCCESS;
return CL_SUCCESS;
error:
p->build_status = CL_BUILD_ERROR;
return err;
}
LOCAL cl_kernel
cl_program_create_kernel(cl_program p, const char *name, cl_int *errcode_ret)
{
cl_kernel from = NULL, to = NULL;
cl_int err = CL_SUCCESS;
uint32_t i = 0;
#ifdef HAS_CMRT
if (p->cmrt_program != NULL) {
void* cmrt_kernel = cmrt_create_kernel(p, name);
if (cmrt_kernel != NULL) {
to = cl_kernel_new(p);
to->cmrt_kernel = cmrt_kernel;
goto exit;
} else {
err = CL_INVALID_KERNEL_NAME;
goto error;
}
}
#endif
/* Find the program first */
for (i = 0; i < p->ker_n; ++i) {
assert(p->ker[i]);
const char *ker_name = cl_kernel_get_name(p->ker[i]);
if (ker_name != NULL && strcmp(ker_name, name) == 0) {
from = p->ker[i];
break;
}
}
/* We were not able to find this named kernel */
if (UNLIKELY(from == NULL)) {
err = CL_INVALID_KERNEL_NAME;
goto error;
}
TRY_ALLOC(to, cl_kernel_dup(from));
exit:
if (errcode_ret)
*errcode_ret = err;
return to;
error:
cl_kernel_delete(to);
to = NULL;
goto exit;
}
LOCAL cl_int
cl_program_create_kernels_in_program(cl_program p, cl_kernel* ker)
{
int i = 0;
if(ker == NULL)
return CL_SUCCESS;
for (i = 0; i < p->ker_n; ++i) {
TRY_ALLOC_NO_ERR(ker[i], cl_kernel_dup(p->ker[i]));
}
return CL_SUCCESS;
error:
do {
cl_kernel_delete(ker[i]);
ker[i--] = NULL;
} while(i > 0);
return CL_OUT_OF_HOST_MEMORY;
}
LOCAL void
cl_program_get_kernel_names(cl_program p, size_t size, char *names, size_t *size_ret)
{
int i = 0;
const char *ker_name = NULL;
size_t len = 0;
if(size_ret) *size_ret = 0;
if(p->ker == NULL) {
return;
}
ker_name = cl_kernel_get_name(p->ker[0]);
if (ker_name != NULL)
len = strlen(ker_name);
else
len = 0;
if(names && ker_name) {
strncpy(names, ker_name, size - 1);
names[size - 1] = '\0';
if(size < len - 1) {
if(size_ret) *size_ret = size;
return;
}
size = size - len - 1; //sub \0
}
if(size_ret) *size_ret = len + 1; //add NULL
for (i = 1; i < p->ker_n; ++i) {
ker_name = cl_kernel_get_name(p->ker[i]);
if (ker_name != NULL)
len = strlen(ker_name);
else
len = 0;
if(names && ker_name) {
strncat(names, ";", size);
if(size >= 1)
strncat(names, ker_name, size - 1);
if(size < len + 1) {
if(size_ret) *size_ret = size;
break;
}
size = size - len - 1;
}
if(size_ret) *size_ret += len + 1; //add ';'
}
}