compute-runtime/runtime/api/api.cpp

3850 lines
137 KiB
C++

/*
* Copyright (c) 2017 - 2018, Intel Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included
* in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE.
*/
#include "config.h"
#include "api.h"
#include "CL/cl.h"
#include "runtime/accelerators/intel_motion_estimation.h"
#include "runtime/built_ins/built_ins.h"
#include "runtime/command_queue/command_queue.h"
#include "runtime/command_stream/command_stream_receiver.h"
#include "runtime/context/context.h"
#include "runtime/context/driver_diagnostics.h"
#include "runtime/device/device.h"
#include "runtime/device_queue/device_queue.h"
#include "runtime/gtpin/gtpin_notify.h"
#include "runtime/helpers/aligned_memory.h"
#include "runtime/helpers/get_info.h"
#include "runtime/helpers/hw_info.h"
#include "runtime/helpers/options.h"
#include "runtime/helpers/queue_helpers.h"
#include "runtime/helpers/validators.h"
#include "runtime/kernel/kernel.h"
#include "runtime/mem_obj/buffer.h"
#include "runtime/mem_obj/image.h"
#include "runtime/mem_obj/pipe.h"
#include "runtime/memory_manager/svm_memory_manager.h"
#include "runtime/os_interface/debug_settings_manager.h"
#include "runtime/platform/platform.h"
#include "runtime/program/program.h"
#include "runtime/sampler/sampler.h"
#include "runtime/sharings/sharing_factory.h"
#include "runtime/utilities/api_intercept.h"
#include "runtime/utilities/stackvec.h"
#include <cstring>
using namespace OCLRT;
cl_int CL_API_CALL clGetPlatformIDs(cl_uint numEntries,
cl_platform_id *platforms,
cl_uint *numPlatforms) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
do {
// if platforms is nullptr, we must return the number of valid platforms we
// support in the num_platforms variable (if it is non-nullptr)
if ((platforms == nullptr) && (numPlatforms == nullptr)) {
retVal = CL_INVALID_VALUE;
break;
}
// platform != nullptr and num_entries == 0 is defined by spec as invalid
if (numEntries == 0 && platforms != nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
while (platforms != nullptr) {
auto pPlatform = constructPlatform();
bool ret = pPlatform->initialize();
DEBUG_BREAK_IF(ret != true);
if (!ret) {
retVal = CL_INVALID_VALUE;
break;
}
// we only have one platform so we can program that directly
platforms[0] = pPlatform;
break;
}
// we only have a single platform at this time, so return 1 if num_platforms
// is non-nullptr
if (numPlatforms && retVal == CL_SUCCESS) {
*numPlatforms = 1;
}
} while (false);
return retVal;
}
CL_API_ENTRY cl_int CL_API_CALL clIcdGetPlatformIDsKHR(cl_uint numEntries,
cl_platform_id *platforms,
cl_uint *numPlatforms) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
retVal = clGetPlatformIDs(numEntries, platforms, numPlatforms);
return retVal;
}
cl_int CL_API_CALL clGetPlatformInfo(cl_platform_id platform,
cl_platform_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_INVALID_PLATFORM;
API_ENTER(&retVal);
auto pPlatform = castToObject<Platform>(platform);
if (pPlatform) {
retVal = pPlatform->getInfo(paramName, paramValueSize,
paramValue, paramValueSizeRet);
}
return retVal;
}
cl_int CL_API_CALL clGetDeviceIDs(cl_platform_id platform,
cl_device_type deviceType,
cl_uint numEntries,
cl_device_id *devices,
cl_uint *numDevices) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
const cl_device_type validType = CL_DEVICE_TYPE_GPU | CL_DEVICE_TYPE_CPU |
CL_DEVICE_TYPE_ACCELERATOR | CL_DEVICE_TYPE_DEFAULT |
CL_DEVICE_TYPE_CUSTOM;
Platform *pPlatform = nullptr;
do {
/* Check parameter consistency */
if (devices == nullptr && numDevices == nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
if (devices && numEntries == 0) {
retVal = CL_INVALID_VALUE;
break;
}
if ((deviceType & validType) == 0) {
retVal = CL_INVALID_DEVICE_TYPE;
break;
}
if (platform != nullptr) {
pPlatform = castToObject<Platform>(platform);
if (pPlatform == nullptr) {
retVal = CL_INVALID_PLATFORM;
break;
}
} else {
pPlatform = constructPlatform();
bool ret = pPlatform->initialize();
DEBUG_BREAK_IF(ret != true);
((void)(ret));
}
DEBUG_BREAK_IF(pPlatform->isInitialized() != true);
cl_uint numDev = static_cast<cl_uint>(pPlatform->getNumDevices());
if (numDev == 0) {
retVal = CL_DEVICE_NOT_FOUND;
break;
}
Device **allDevs = pPlatform->getDevices();
DEBUG_BREAK_IF(allDevs == nullptr);
if (deviceType == CL_DEVICE_TYPE_ALL) {
/* According to Spec, set it to all except TYPE_CUSTOM. */
deviceType = CL_DEVICE_TYPE_GPU | CL_DEVICE_TYPE_CPU |
CL_DEVICE_TYPE_ACCELERATOR | CL_DEVICE_TYPE_DEFAULT;
} else if (deviceType == CL_DEVICE_TYPE_DEFAULT) {
/* We just set it to GPU now. */
deviceType = CL_DEVICE_TYPE_GPU;
}
cl_uint retNum = 0;
for (cl_uint i = 0; i < numDev; i++) {
if (deviceType & allDevs[i]->getDeviceInfo().deviceType) {
if (devices) {
devices[retNum] = allDevs[i];
}
retNum++;
if (numEntries > 0 && retNum >= numEntries) {
/* find enough, get out. */
break;
}
}
}
if (numDevices) {
*numDevices = retNum;
}
/* If no suitable device, set a error. */
if (retNum == 0)
retVal = CL_DEVICE_NOT_FOUND;
} while (false);
return retVal;
}
cl_int CL_API_CALL clGetDeviceInfo(cl_device_id device,
cl_device_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_INVALID_DEVICE;
API_ENTER(&retVal);
DBG_LOG_INPUTS("clDevice", device, "paramName", paramName, "paramValueSize", paramValueSize, "paramValue", DebugManager.deviceInfoPointerToString(paramValue, paramValueSize), "paramValueSizeRet", paramValueSizeRet);
Device *pDevice = castToObject<Device>(device);
if (pDevice != nullptr) {
retVal = pDevice->getDeviceInfo(paramName, paramValueSize,
paramValue, paramValueSizeRet);
}
return retVal;
}
cl_int CL_API_CALL clCreateSubDevices(cl_device_id inDevice,
const cl_device_partition_property *properties,
cl_uint numDevices,
cl_device_id *outDevices,
cl_uint *numDevicesRet) {
return CL_INVALID_DEVICE;
}
cl_int CL_API_CALL clRetainDevice(cl_device_id device) {
cl_int retVal = CL_INVALID_DEVICE;
API_ENTER(&retVal);
auto pDevice = castToObject<Device>(device);
if (pDevice) {
pDevice->retain();
retVal = CL_SUCCESS;
}
return retVal;
}
cl_int CL_API_CALL clReleaseDevice(cl_device_id device) {
cl_int retVal = CL_INVALID_DEVICE;
API_ENTER(&retVal);
auto pDevice = castToObject<Device>(device);
if (pDevice) {
pDevice->release();
retVal = CL_SUCCESS;
}
return retVal;
}
cl_context CL_API_CALL clCreateContext(const cl_context_properties *properties,
cl_uint numDevices,
const cl_device_id *devices,
void(CL_CALLBACK *funcNotify)(const char *, const void *,
size_t, void *),
void *userData,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
cl_context context = nullptr;
API_ENTER(&retVal);
DBG_LOG_INPUTS("properties", properties, "numDevices", numDevices, "cl_device_id", devices, "funcNotify", funcNotify, "userData", userData);
do {
if (devices == nullptr) {
/* Must have device. */
retVal = CL_INVALID_VALUE;
break;
}
/* validateObjects make sure numDevices != 0. */
retVal = validateObjects(DeviceList(numDevices, devices));
if (retVal != CL_SUCCESS)
break;
if (funcNotify == nullptr && userData != nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
DeviceVector allDevs(devices, numDevices);
context = Context::create<Context>(properties, allDevs, funcNotify, userData, retVal);
if (context != nullptr) {
gtpinNotifyContextCreate(context);
}
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
return context;
}
cl_context CL_API_CALL clCreateContextFromType(const cl_context_properties *properties,
cl_device_type deviceType,
void(CL_CALLBACK *funcNotify)(const char *, const void *,
size_t, void *),
void *userData,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
Context *pContext = nullptr;
do {
if (funcNotify == nullptr && userData != nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
cl_uint numDevices = 0;
/* Query the number of device first. */
retVal = clGetDeviceIDs(nullptr, deviceType, 0, nullptr, &numDevices);
if (retVal != CL_SUCCESS) {
break;
}
DEBUG_BREAK_IF(numDevices <= 0);
StackVec<cl_device_id, 2> supportedDevs;
supportedDevs.resize(numDevices);
retVal = clGetDeviceIDs(nullptr, deviceType, numDevices, supportedDevs.begin(), nullptr);
DEBUG_BREAK_IF(retVal != CL_SUCCESS);
DeviceVector allDevs(supportedDevs.begin(), numDevices);
pContext = Context::create<Context>(properties, allDevs, funcNotify, userData, retVal);
if (pContext != nullptr) {
gtpinNotifyContextCreate((cl_context)pContext);
}
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
return pContext;
}
cl_int CL_API_CALL clRetainContext(cl_context context) {
API_ENTER(0);
Context *pContext = castToObject<Context>(context);
if (pContext) {
pContext->retain();
return CL_SUCCESS;
}
return CL_INVALID_CONTEXT;
}
cl_int CL_API_CALL clReleaseContext(cl_context context) {
API_ENTER(0);
Context *pContext = castToObject<Context>(context);
if (pContext) {
pContext->release();
return CL_SUCCESS;
}
return CL_INVALID_CONTEXT;
}
cl_int CL_API_CALL clGetContextInfo(cl_context context,
cl_context_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
auto retVal = CL_INVALID_CONTEXT;
API_ENTER(&retVal);
auto pContext = castToObject<Context>(context);
if (pContext) {
retVal = pContext->getInfo(paramName, paramValueSize,
paramValue, paramValueSizeRet);
}
return retVal;
}
cl_command_queue CL_API_CALL clCreateCommandQueue(cl_context context,
cl_device_id device,
const cl_command_queue_properties properties,
cl_int *errcodeRet) {
cl_command_queue commandQueue = nullptr;
ErrorCodeHelper err(errcodeRet, CL_SUCCESS);
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
do {
if (properties &
~(CL_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE | CL_QUEUE_PROFILING_ENABLE)) {
retVal = CL_INVALID_VALUE;
break;
}
Context *pContext = nullptr;
Device *pDevice = nullptr;
retVal = validateObjects(
WithCastToInternal(context, &pContext),
WithCastToInternal(device, &pDevice));
if (retVal != CL_SUCCESS) {
break;
}
cl_queue_properties props[] = {
CL_QUEUE_PROPERTIES, properties,
0};
commandQueue = CommandQueue::create(pContext,
pDevice,
props,
retVal);
if (pContext->isProvidingPerformanceHints()) {
pContext->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_NEUTRAL_INTEL, DRIVER_CALLS_INTERNAL_CL_FLUSH);
if (castToObjectOrAbort<CommandQueue>(commandQueue)->isProfilingEnabled()) {
pContext->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_NEUTRAL_INTEL, PROFILING_ENABLED);
if (pDevice->getDeviceInfo().preemptionSupported && pDevice->getHardwareInfo().pPlatform->eProductFamily < IGFX_SKYLAKE) {
pContext->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_NEUTRAL_INTEL, PROFILING_ENABLED_WITH_DISABLED_PREEMPTION);
}
}
}
} while (false);
err.set(retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue);
return commandQueue;
}
cl_int CL_API_CALL clRetainCommandQueue(cl_command_queue commandQueue) {
cl_int retVal = CL_INVALID_COMMAND_QUEUE;
API_ENTER(&retVal);
retainQueue<CommandQueue>(commandQueue, retVal);
if (retVal == CL_SUCCESS) {
return retVal;
}
// if host queue not found - try to query device queue
retainQueue<DeviceQueue>(commandQueue, retVal);
return retVal;
}
cl_int CL_API_CALL clReleaseCommandQueue(cl_command_queue commandQueue) {
cl_int retVal = CL_INVALID_COMMAND_QUEUE;
API_ENTER(&retVal);
releaseQueue<CommandQueue>(commandQueue, retVal);
if (retVal == CL_SUCCESS) {
return retVal;
}
// if host queue not found - try to query device queue
releaseQueue<DeviceQueue>(commandQueue, retVal);
return retVal;
}
cl_int CL_API_CALL clGetCommandQueueInfo(cl_command_queue commandQueue,
cl_command_queue_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_INVALID_COMMAND_QUEUE;
API_ENTER(&retVal);
getQueueInfo<CommandQueue>(commandQueue, paramName, paramValueSize, paramValue, paramValueSizeRet, retVal);
// if host queue not found - try to query device queue
if (retVal == CL_SUCCESS) {
return retVal;
}
getQueueInfo<DeviceQueue>(commandQueue, paramName, paramValueSize, paramValue, paramValueSizeRet, retVal);
return retVal;
}
// deprecated OpenCL 1.0
cl_int CL_API_CALL clSetCommandQueueProperty(cl_command_queue commandQueue,
cl_command_queue_properties properties,
cl_bool enable,
cl_command_queue_properties *oldProperties) {
return CL_INVALID_VALUE;
}
cl_mem CL_API_CALL clCreateBuffer(cl_context context,
cl_mem_flags flags,
size_t size,
void *hostPtr,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("cl_context", context,
"cl_mem_flags", flags,
"size", size,
"hostPtr", hostPtr);
cl_mem buffer = nullptr;
const cl_mem_flags allValidFlags =
CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY |
CL_MEM_ALLOC_HOST_PTR | CL_MEM_COPY_HOST_PTR | CL_MEM_USE_HOST_PTR |
CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY | CL_MEM_HOST_NO_ACCESS;
do {
if (size == 0) {
retVal = CL_INVALID_BUFFER_SIZE;
break;
}
/* Are there some invalid flag bits? */
if ((flags & (~allValidFlags)) != 0) {
retVal = CL_INVALID_VALUE;
break;
}
/* Check all the invalid flags combination. */
if (((flags & CL_MEM_READ_WRITE) && (flags & (CL_MEM_READ_ONLY | CL_MEM_WRITE_ONLY))) ||
((flags & CL_MEM_READ_ONLY) && (flags & (CL_MEM_WRITE_ONLY))) ||
((flags & CL_MEM_ALLOC_HOST_PTR) && (flags & CL_MEM_USE_HOST_PTR)) ||
((flags & CL_MEM_COPY_HOST_PTR) && (flags & CL_MEM_USE_HOST_PTR)) ||
((flags & CL_MEM_HOST_READ_ONLY) && (flags & CL_MEM_HOST_NO_ACCESS)) ||
((flags & CL_MEM_HOST_READ_ONLY) && (flags & CL_MEM_HOST_WRITE_ONLY)) ||
((flags & CL_MEM_HOST_WRITE_ONLY) && (flags & CL_MEM_HOST_NO_ACCESS))) {
retVal = CL_INVALID_VALUE;
break;
}
/* Check the host ptr and data */
if ((((flags & CL_MEM_COPY_HOST_PTR) || (flags & CL_MEM_USE_HOST_PTR)) && hostPtr == nullptr) ||
(!(flags & (CL_MEM_COPY_HOST_PTR | CL_MEM_USE_HOST_PTR)) && (hostPtr != nullptr))) {
retVal = CL_INVALID_HOST_PTR;
break;
}
Context *pContext = nullptr;
retVal = validateObjects(WithCastToInternal(context, &pContext));
if (retVal != CL_SUCCESS) {
break;
}
// create the buffer
buffer = Buffer::create(pContext, flags, size, hostPtr, retVal);
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
DBG_LOG_INPUTS("buffer", buffer);
return buffer;
}
cl_mem CL_API_CALL clCreateSubBuffer(cl_mem buffer,
cl_mem_flags flags,
cl_buffer_create_type bufferCreateType,
const void *bufferCreateInfo,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_mem subBuffer = nullptr;
Buffer *parentBuffer = castToObject<Buffer>(buffer);
const cl_mem_flags allValidFlags =
CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY |
CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY | CL_MEM_HOST_NO_ACCESS;
do {
if (parentBuffer == nullptr) {
retVal = CL_INVALID_MEM_OBJECT;
break;
}
/* Are there some invalid flag bits? */
if ((flags & (~allValidFlags)) != 0) {
retVal = CL_INVALID_VALUE;
break;
}
cl_mem_flags parentFlags = parentBuffer->getFlags();
if (parentBuffer->isSubBuffer() == true) {
retVal = CL_INVALID_MEM_OBJECT;
break;
}
/* Check whether flag is valid. */
if (((flags & CL_MEM_HOST_READ_ONLY) && (flags & CL_MEM_HOST_NO_ACCESS)) ||
((flags & CL_MEM_HOST_READ_ONLY) && (flags & CL_MEM_HOST_WRITE_ONLY)) ||
((flags & CL_MEM_HOST_WRITE_ONLY) && (flags & CL_MEM_HOST_NO_ACCESS))) {
retVal = CL_INVALID_VALUE;
break;
}
/* Check whether flag is valid and compatible with parent. */
if (flags &&
(((parentFlags & CL_MEM_WRITE_ONLY) && (flags & (CL_MEM_READ_WRITE | CL_MEM_READ_ONLY))) ||
((parentFlags & CL_MEM_READ_ONLY) && (flags & (CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY))) ||
((parentFlags & CL_MEM_HOST_WRITE_ONLY) && (flags & CL_MEM_HOST_READ_ONLY)) ||
((parentFlags & CL_MEM_HOST_READ_ONLY) && (flags & CL_MEM_HOST_WRITE_ONLY)) ||
((parentFlags & CL_MEM_HOST_NO_ACCESS) &&
(flags & (CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY))))) {
retVal = CL_INVALID_VALUE;
break;
}
/* Inherit some flags if we do not set. */
if ((flags & (CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY | CL_MEM_READ_WRITE)) == 0) {
flags |= parentFlags & (CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY | CL_MEM_READ_WRITE);
}
if ((flags & (CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY | CL_MEM_HOST_NO_ACCESS)) == 0) {
flags |= parentFlags & (CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY |
CL_MEM_HOST_NO_ACCESS);
}
flags |= parentFlags & (CL_MEM_USE_HOST_PTR | CL_MEM_ALLOC_HOST_PTR | CL_MEM_COPY_HOST_PTR);
if (bufferCreateType != CL_BUFFER_CREATE_TYPE_REGION) {
retVal = CL_INVALID_VALUE;
break;
}
if (bufferCreateInfo == nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
/* Must have non-zero size. */
const cl_buffer_region *region = reinterpret_cast<const cl_buffer_region *>(bufferCreateInfo);
if (region->size == 0) {
retVal = CL_INVALID_BUFFER_SIZE;
break;
}
/* Out of range. */
if (region->origin > parentBuffer->getSize() ||
region->origin + region->size > parentBuffer->getSize()) {
retVal = CL_INVALID_VALUE;
break;
}
if (!parentBuffer->isValidSubBufferOffset(region->origin)) {
retVal = CL_MISALIGNED_SUB_BUFFER_OFFSET;
break;
}
subBuffer = parentBuffer->createSubBuffer(flags, region, retVal);
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
return subBuffer;
}
cl_mem CL_API_CALL clCreateImage(cl_context context,
cl_mem_flags flags,
const cl_image_format *imageFormat,
const cl_image_desc *imageDesc,
void *hostPtr,
cl_int *errcodeRet) {
Context *pContext = nullptr;
auto retVal = validateObjects(WithCastToInternal(context, &pContext));
API_ENTER(&retVal);
DBG_LOG_INPUTS("cl_context", context,
"cl_mem_flags", flags,
"cl_image_format.channel_data_type", imageFormat->image_channel_data_type,
"cl_image_format.channel_order", imageFormat->image_channel_order,
"cl_image_desc.width", imageDesc->image_width,
"cl_image_desc.heigth", imageDesc->image_height,
"cl_image_desc.depth", imageDesc->image_depth,
"cl_image_desc.type", imageDesc->image_type,
"cl_image_desc.array_size", imageDesc->image_array_size,
"hostPtr", hostPtr);
cl_mem image = nullptr;
cl_mem_flags allValidFlags =
CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY |
CL_MEM_ALLOC_HOST_PTR | CL_MEM_COPY_HOST_PTR | CL_MEM_USE_HOST_PTR |
CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY | CL_MEM_HOST_NO_ACCESS |
CL_MEM_NO_ACCESS_INTEL | CL_MEM_ACCESS_FLAGS_UNRESTRICTED_INTEL;
do {
/* Are there some invalid flag bits? */
if ((flags & (~allValidFlags)) != 0) {
retVal = CL_INVALID_VALUE;
break;
}
/* Check all the invalid flags combination. */
if (((((CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY) | flags) == flags) ||
(((CL_MEM_READ_WRITE | CL_MEM_READ_ONLY) | flags) == flags) ||
(((CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY) | flags) == flags) ||
(((CL_MEM_ALLOC_HOST_PTR | CL_MEM_USE_HOST_PTR) | flags) == flags) ||
(((CL_MEM_COPY_HOST_PTR | CL_MEM_USE_HOST_PTR) | flags) == flags) ||
(((CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY) | flags) == flags) ||
(((CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_NO_ACCESS) | flags) == flags) ||
(((CL_MEM_HOST_READ_ONLY | CL_MEM_HOST_NO_ACCESS) | flags) == flags) ||
(((CL_MEM_NO_ACCESS_INTEL | CL_MEM_READ_WRITE) | flags) == flags) ||
(((CL_MEM_NO_ACCESS_INTEL | CL_MEM_WRITE_ONLY) | flags) == flags) ||
(((CL_MEM_NO_ACCESS_INTEL | CL_MEM_READ_ONLY) | flags) == flags)) &&
(!(flags & CL_MEM_ACCESS_FLAGS_UNRESTRICTED_INTEL))) {
retVal = CL_INVALID_VALUE;
break;
}
MemObj *parentMemObj = castToObject<MemObj>(imageDesc->mem_object);
if (parentMemObj != nullptr) {
cl_mem_flags allValidFlags =
CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY |
CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY | CL_MEM_HOST_NO_ACCESS |
CL_MEM_NO_ACCESS_INTEL | CL_MEM_ACCESS_FLAGS_UNRESTRICTED_INTEL;
/* Are there some invalid flag bits? */
if ((flags & (~allValidFlags)) != 0) {
retVal = CL_INVALID_VALUE;
break;
}
cl_mem_flags parentFlags = parentMemObj->getFlags();
/* Check whether flag is valid and compatible with parent. */
if (((!(flags & CL_MEM_ACCESS_FLAGS_UNRESTRICTED_INTEL)) && (!(parentFlags & CL_MEM_ACCESS_FLAGS_UNRESTRICTED_INTEL))) &&
(flags &&
(((parentFlags & CL_MEM_WRITE_ONLY) && (flags & (CL_MEM_READ_WRITE | CL_MEM_READ_ONLY))) ||
((parentFlags & CL_MEM_READ_ONLY) && (flags & (CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY))) ||
((parentFlags & CL_MEM_NO_ACCESS_INTEL) && (flags & (CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY))) ||
((parentFlags & CL_MEM_HOST_NO_ACCESS) && (flags & (CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY)))))) {
retVal = CL_INVALID_VALUE;
break;
}
}
if ((flags & (CL_MEM_COPY_HOST_PTR | CL_MEM_USE_HOST_PTR)) && !hostPtr) {
retVal = CL_INVALID_HOST_PTR;
break;
}
image = Image::validateAndCreateImage(pContext, flags, imageFormat, imageDesc, hostPtr, retVal);
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
DBG_LOG_INPUTS("image", image);
return image;
}
// deprecated OpenCL 1.1
cl_mem CL_API_CALL clCreateImage2D(cl_context context,
cl_mem_flags flags,
const cl_image_format *imageFormat,
size_t imageWidth,
size_t imageHeight,
size_t imageRowPitch,
void *hostPtr,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
Context *pContext = nullptr;
retVal = validateObjects(WithCastToInternal(context, &pContext));
cl_mem image2D = nullptr;
cl_image_desc imageDesc;
memset(&imageDesc, 0, sizeof(cl_image_desc));
imageDesc.image_height = imageHeight;
imageDesc.image_width = imageWidth;
imageDesc.image_row_pitch = imageRowPitch;
imageDesc.image_type = CL_MEM_OBJECT_IMAGE2D;
image2D = Image::validateAndCreateImage(pContext, flags, imageFormat, &imageDesc, hostPtr, retVal);
if (errcodeRet) {
*errcodeRet = retVal;
}
return image2D;
}
// deprecated OpenCL 1.1
cl_mem CL_API_CALL clCreateImage3D(cl_context context,
cl_mem_flags flags,
const cl_image_format *imageFormat,
size_t imageWidth,
size_t imageHeight,
size_t imageDepth,
size_t imageRowPitch,
size_t imageSlicePitch,
void *hostPtr,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
Context *pContext = nullptr;
retVal = validateObjects(WithCastToInternal(context, &pContext));
cl_mem image3D = nullptr;
cl_image_desc imageDesc;
memset(&imageDesc, 0, sizeof(cl_image_desc));
imageDesc.image_depth = imageDepth;
imageDesc.image_height = imageHeight;
imageDesc.image_width = imageWidth;
imageDesc.image_row_pitch = imageRowPitch;
imageDesc.image_slice_pitch = imageSlicePitch;
imageDesc.image_type = CL_MEM_OBJECT_IMAGE3D;
image3D = Image::validateAndCreateImage(pContext, flags, imageFormat, &imageDesc, hostPtr, retVal);
if (errcodeRet) {
*errcodeRet = retVal;
}
return image3D;
}
cl_int CL_API_CALL clRetainMemObject(cl_mem memobj) {
cl_int retVal = CL_INVALID_MEM_OBJECT;
API_ENTER(&retVal);
DBG_LOG_INPUTS("memobj", memobj);
auto pMemObj = castToObject<MemObj>(memobj);
if (pMemObj) {
pMemObj->retain();
retVal = CL_SUCCESS;
return retVal;
}
return retVal;
}
cl_int CL_API_CALL clReleaseMemObject(cl_mem memobj) {
cl_int retVal = CL_INVALID_MEM_OBJECT;
API_ENTER(&retVal);
DBG_LOG_INPUTS("memobj", memobj);
auto pMemObj = castToObject<MemObj>(memobj);
if (pMemObj) {
pMemObj->release();
retVal = CL_SUCCESS;
return retVal;
}
return retVal;
}
cl_int CL_API_CALL clGetSupportedImageFormats(cl_context context,
cl_mem_flags flags,
cl_mem_object_type imageType,
cl_uint numEntries,
cl_image_format *imageFormats,
cl_uint *numImageFormats) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
auto pContext = castToObject<Context>(context);
auto pPlatform = platform();
auto pDevice = pPlatform->getDevice(0);
retVal = pContext->getSupportedImageFormats(pDevice, flags, imageType, numEntries,
imageFormats, numImageFormats);
return retVal;
}
cl_int CL_API_CALL clGetMemObjectInfo(cl_mem memobj,
cl_mem_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
MemObj *pMemObj = nullptr;
retVal = validateObjects(WithCastToInternal(memobj, &pMemObj));
if (CL_SUCCESS != retVal) {
return retVal;
}
retVal = pMemObj->getMemObjectInfo(paramName, paramValueSize,
paramValue, paramValueSizeRet);
return retVal;
}
cl_int CL_API_CALL clGetImageInfo(cl_mem image,
cl_image_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
retVal = validateObjects(image);
if (CL_SUCCESS != retVal) {
return retVal;
}
auto pImgObj = castToObject<Image>(image);
if (pImgObj == nullptr) {
return CL_INVALID_MEM_OBJECT;
}
retVal = pImgObj->getImageInfo(paramName, paramValueSize, paramValue, paramValueSizeRet);
return retVal;
}
cl_int CL_API_CALL clGetImageParamsINTEL(cl_context context,
const cl_image_format *imageFormat,
const cl_image_desc *imageDesc,
size_t *imageRowPitch,
size_t *imageSlicePitch) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
SurfaceFormatInfo *surfaceFormat = nullptr;
cl_mem_flags memFlags = CL_MEM_READ_ONLY;
retVal = validateObjects(context);
auto pContext = castToObject<Context>(context);
if (CL_SUCCESS == retVal) {
if ((imageFormat == nullptr) || (imageDesc == nullptr) || (imageRowPitch == nullptr) || (imageSlicePitch == nullptr)) {
retVal = CL_INVALID_VALUE;
}
}
if (CL_SUCCESS == retVal) {
retVal = Image::validateImageFormat(imageFormat);
}
if (CL_SUCCESS == retVal) {
surfaceFormat = (SurfaceFormatInfo *)Image::getSurfaceFormatFromTable(memFlags, imageFormat);
retVal = Image::validate(pContext, memFlags, surfaceFormat, imageDesc, nullptr);
}
if (CL_SUCCESS == retVal) {
retVal = Image::getImageParams(pContext, memFlags, surfaceFormat, imageDesc, imageRowPitch, imageSlicePitch);
}
return retVal;
}
cl_int CL_API_CALL clSetMemObjectDestructorCallback(cl_mem memobj,
void(CL_CALLBACK *funcNotify)(cl_mem, void *),
void *userData) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
retVal = validateObjects(memobj, (void *)funcNotify);
if (CL_SUCCESS != retVal) {
return retVal;
}
auto pMemObj = castToObject<MemObj>(memobj);
retVal = pMemObj->setDestructorCallback(funcNotify, userData);
return retVal;
}
cl_sampler CL_API_CALL clCreateSampler(cl_context context,
cl_bool normalizedCoords,
cl_addressing_mode addressingMode,
cl_filter_mode filterMode,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
retVal = validateObjects(context);
cl_sampler sampler = nullptr;
if (retVal == CL_SUCCESS) {
auto pContext = castToObject<Context>(context);
sampler = Sampler::create(
pContext,
normalizedCoords,
addressingMode,
filterMode,
CL_FILTER_NEAREST,
0.0f,
std::numeric_limits<float>::max(),
retVal);
}
if (errcodeRet) {
*errcodeRet = retVal;
}
return sampler;
}
cl_int CL_API_CALL clRetainSampler(cl_sampler sampler) {
API_ENTER(0);
auto pSampler = castToObject<Sampler>(sampler);
if (pSampler) {
pSampler->retain();
return CL_SUCCESS;
}
return CL_INVALID_SAMPLER;
}
cl_int CL_API_CALL clReleaseSampler(cl_sampler sampler) {
API_ENTER(0);
auto pSampler = castToObject<Sampler>(sampler);
if (pSampler) {
pSampler->release();
return CL_SUCCESS;
}
return CL_INVALID_SAMPLER;
}
cl_int CL_API_CALL clGetSamplerInfo(cl_sampler sampler,
cl_sampler_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_INVALID_SAMPLER;
API_ENTER(&retVal);
auto pSampler = castToObject<Sampler>(sampler);
if (pSampler) {
retVal = pSampler->getInfo(paramName, paramValueSize,
paramValue, paramValueSizeRet);
}
return retVal;
}
cl_program CL_API_CALL clCreateProgramWithSource(cl_context context,
cl_uint count,
const char **strings,
const size_t *lengths,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
retVal = validateObjects(context, count, strings);
cl_program program = nullptr;
if (CL_SUCCESS == retVal) {
program = Program::create(
context,
count,
strings,
lengths,
retVal);
}
if (errcodeRet) {
*errcodeRet = retVal;
}
return program;
}
cl_program CL_API_CALL clCreateProgramWithBinary(cl_context context,
cl_uint numDevices,
const cl_device_id *deviceList,
const size_t *lengths,
const unsigned char **binaries,
cl_int *binaryStatus,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
retVal = validateObjects(context, deviceList, *deviceList, binaries, *binaries, lengths, *lengths);
cl_program program = nullptr;
DebugManager.dumpBinaryProgram(numDevices, lengths, binaries);
if (CL_SUCCESS == retVal) {
program = Program::create(
context,
numDevices,
deviceList,
lengths,
binaries,
binaryStatus,
retVal);
}
if (errcodeRet) {
*errcodeRet = retVal;
}
return program;
}
cl_program CL_API_CALL clCreateProgramWithIL(cl_context context,
const void *il,
size_t length,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_program program = nullptr;
retVal = validateObjects(context, il);
if (retVal == CL_SUCCESS) {
program = Program::createFromIL(
castToObjectOrAbort<Context>(context),
il,
length,
retVal);
}
if (errcodeRet != nullptr) {
*errcodeRet = retVal;
}
return program;
}
cl_program CL_API_CALL clCreateProgramWithBuiltInKernels(cl_context context,
cl_uint numDevices,
const cl_device_id *deviceList,
const char *kernelNames,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_program program = nullptr;
retVal = validateObjects(
context, deviceList, kernelNames, errcodeRet);
if (numDevices == 0) {
retVal = CL_INVALID_VALUE;
}
if (retVal == CL_SUCCESS) {
for (cl_uint i = 0; i < numDevices; i++) {
auto pContext = castToObject<Context>(context);
validateObject(pContext);
auto pDev = castToObject<Device>(*deviceList);
validateObject(pDev);
program = BuiltIns::getInstance().createBuiltInProgram(
*pContext,
*pDev,
kernelNames,
retVal);
if (program && retVal == CL_SUCCESS) {
break;
}
}
}
if (errcodeRet) {
*errcodeRet = retVal;
}
return program;
}
cl_int CL_API_CALL clRetainProgram(cl_program program) {
API_ENTER(0);
auto pProgram = castToObject<Program>(program);
if (pProgram) {
pProgram->retain();
return CL_SUCCESS;
}
return CL_INVALID_PROGRAM;
}
cl_int CL_API_CALL clReleaseProgram(cl_program program) {
API_ENTER(0);
auto pProgram = castToObject<Program>(program);
if (pProgram) {
pProgram->release();
return CL_SUCCESS;
}
return CL_INVALID_PROGRAM;
}
cl_int CL_API_CALL clBuildProgram(cl_program program,
cl_uint numDevices,
const cl_device_id *deviceList,
const char *options,
void(CL_CALLBACK *funcNotify)(cl_program program, void *userData),
void *userData) {
cl_int retVal = CL_INVALID_PROGRAM;
API_ENTER(&retVal);
DBG_LOG_INPUTS("clProgram", program, "numDevices", numDevices, "cl_device_id", deviceList, "options", (options != nullptr) ? options : "", "funcNotify", funcNotify, "userData", userData);
auto pProgram = castToObject<Program>(program);
if (pProgram) {
retVal = pProgram->build(numDevices, deviceList, options, funcNotify, userData, clCacheEnabled);
}
return retVal;
}
cl_int CL_API_CALL clCompileProgram(cl_program program,
cl_uint numDevices,
const cl_device_id *deviceList,
const char *options,
cl_uint numInputHeaders,
const cl_program *inputHeaders,
const char **headerIncludeNames,
void(CL_CALLBACK *funcNotify)(cl_program program, void *userData),
void *userData) {
cl_int retVal = CL_INVALID_PROGRAM;
API_ENTER(&retVal);
DBG_LOG_INPUTS("clProgram", program, "numDevices", numDevices, "cl_device_id", deviceList, "options", (options != nullptr) ? options : "", "numInputHeaders", numInputHeaders);
auto pProgram = castToObject<Program>(program);
if (pProgram != nullptr) {
retVal = pProgram->compile(numDevices, deviceList, options,
numInputHeaders, inputHeaders, headerIncludeNames,
funcNotify, userData);
}
return retVal;
}
cl_program CL_API_CALL clLinkProgram(cl_context context,
cl_uint numDevices,
const cl_device_id *deviceList,
const char *options,
cl_uint numInputPrograms,
const cl_program *inputPrograms,
void(CL_CALLBACK *funcNotify)(cl_program program, void *userData),
void *userData,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("cl_context", context, "numDevices", numDevices, "cl_device_id", deviceList, "options", (options != nullptr) ? options : "", "numInputPrograms", numInputPrograms);
ErrorCodeHelper err(errcodeRet, CL_SUCCESS);
Context *pContext = nullptr;
cl_program program = nullptr;
retVal = validateObject(context);
if (CL_SUCCESS == retVal) {
pContext = castToObject<Context>(context);
}
if (pContext != nullptr) {
program = new Program(pContext, false);
Program *pProgram = castToObject<Program>(program);
retVal = pProgram->link(numDevices, deviceList, options,
numInputPrograms, inputPrograms,
funcNotify, userData);
}
err.set(retVal);
return program;
}
cl_int CL_API_CALL clUnloadPlatformCompiler(cl_platform_id platform) {
return CL_OUT_OF_HOST_MEMORY;
}
cl_int CL_API_CALL clGetProgramInfo(cl_program program,
cl_program_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("clProgram", program, "paramName", paramName, "paramValueSize", paramValueSize, "paramValue", paramValue, "paramValueSizeRet", paramValueSizeRet);
retVal = validateObjects(program);
if (CL_SUCCESS == retVal) {
Program *pProgram = (Program *)(program);
retVal = pProgram->getInfo(
paramName,
paramValueSize,
paramValue,
paramValueSizeRet);
}
return retVal;
}
cl_int CL_API_CALL clGetProgramBuildInfo(cl_program program,
cl_device_id device,
cl_program_build_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("clProgram", program, "cl_device_id", device, "paramName", paramName, "paramValueSize", paramValueSize, "paramValue", paramValue, "paramValueSizeRet", paramValueSizeRet);
retVal = validateObjects(program);
if (CL_SUCCESS == retVal) {
Program *pProgram = (Program *)(program);
retVal = pProgram->getBuildInfo(
device,
paramName,
paramValueSize,
paramValue,
paramValueSizeRet);
}
return retVal;
}
cl_kernel CL_API_CALL clCreateKernel(cl_program clProgram,
const char *kernelName,
cl_int *errcodeRet) {
API_ENTER(errcodeRet);
Program *pProgram = nullptr;
cl_kernel kernel = nullptr;
cl_int retVal = CL_SUCCESS;
DBG_LOG_INPUTS("clProgram", clProgram, "kernelName", kernelName);
do {
if (!isValidObject(clProgram) ||
!(pProgram = castToObject<Program>(clProgram))) {
retVal = CL_INVALID_PROGRAM;
break;
}
const KernelInfo *pKernelInfo = pProgram->getKernelInfo(kernelName);
if (!pKernelInfo) {
retVal = CL_INVALID_KERNEL_NAME;
break;
}
if (pKernelInfo->isValid == false) {
retVal = CL_INVALID_KERNEL;
break;
}
kernel = Kernel::create(
pProgram,
*pKernelInfo,
&retVal);
DBG_LOG_INPUTS("kernel", kernel);
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
if (kernel != nullptr) {
gtpinNotifyKernelCreate(kernel);
}
return kernel;
}
cl_int CL_API_CALL clCreateKernelsInProgram(cl_program clProgram,
cl_uint numKernels,
cl_kernel *kernels,
cl_uint *numKernelsRet) {
API_ENTER(0);
auto program = castToObject<Program>(clProgram);
if (program) {
auto numKernels = program->getNumKernels();
for (unsigned int ordinal = 0; ordinal < numKernels; ++ordinal) {
const auto kernelInfo = program->getKernelInfo(ordinal);
DEBUG_BREAK_IF(kernelInfo == nullptr);
DEBUG_BREAK_IF(!kernelInfo->isValid);
if (kernels) {
kernels[ordinal] = Kernel::create(
program,
*kernelInfo,
nullptr);
if (kernels[ordinal] != nullptr) {
gtpinNotifyKernelCreate(kernels[ordinal]);
}
}
}
if (numKernelsRet) {
*numKernelsRet = static_cast<cl_uint>(numKernels);
}
return CL_SUCCESS;
}
return CL_INVALID_PROGRAM;
}
cl_int CL_API_CALL clRetainKernel(cl_kernel kernel) {
API_ENTER(0);
auto pKernel = castToObject<Kernel>(kernel);
if (pKernel) {
pKernel->retain();
return CL_SUCCESS;
}
return CL_INVALID_KERNEL;
}
cl_int CL_API_CALL clReleaseKernel(cl_kernel kernel) {
API_ENTER(0);
auto pKernel = castToObject<Kernel>(kernel);
if (pKernel) {
pKernel->release();
return CL_SUCCESS;
}
return CL_INVALID_KERNEL;
}
cl_int CL_API_CALL clSetKernelArg(cl_kernel kernel,
cl_uint argIndex,
size_t argSize,
const void *argValue) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
auto pKernel = castToObject<Kernel>(kernel);
DBG_LOG_INPUTS("kernel", kernel, "argIndex", argIndex, "argSize", argSize, "argValue", argValue);
do {
if (!pKernel) {
retVal = CL_INVALID_KERNEL;
break;
}
if (pKernel->getKernelInfo().kernelArgInfo.size() <= argIndex) {
retVal = CL_INVALID_ARG_INDEX;
break;
}
retVal = pKernel->checkCorrectImageAccessQualifier(argIndex, argSize, argValue);
if (retVal != CL_SUCCESS) {
pKernel->unsetArg(argIndex);
break;
}
retVal = pKernel->setArg(
argIndex,
argSize,
argValue);
break;
} while (false);
return retVal;
}
cl_int CL_API_CALL clGetKernelInfo(cl_kernel kernel,
cl_kernel_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("kernel", kernel, "paramName", paramName, "paramValueSize", paramValueSize, "paramValue", paramValue, "paramValueSizeRet", paramValueSizeRet);
auto pKernel = castToObject<Kernel>(kernel);
retVal = pKernel
? pKernel->getInfo(
paramName,
paramValueSize,
paramValue,
paramValueSizeRet)
: CL_INVALID_KERNEL;
return retVal;
}
cl_int CL_API_CALL clGetKernelArgInfo(cl_kernel kernel,
cl_uint argIndx,
cl_kernel_arg_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
auto pKernel = castToObject<Kernel>(kernel);
retVal = pKernel
? pKernel->getArgInfo(
argIndx,
paramName,
paramValueSize,
paramValue,
paramValueSizeRet)
: CL_INVALID_KERNEL;
return retVal;
}
cl_int CL_API_CALL clGetKernelWorkGroupInfo(cl_kernel kernel,
cl_device_id device,
cl_kernel_work_group_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
auto pKernel = castToObject<Kernel>(kernel);
retVal = pKernel
? pKernel->getWorkGroupInfo(
device,
paramName,
paramValueSize,
paramValue,
paramValueSizeRet)
: CL_INVALID_KERNEL;
return retVal;
}
cl_int CL_API_CALL clWaitForEvents(cl_uint numEvents,
const cl_event *eventList) {
auto retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("eventList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventList), numEvents));
for (unsigned int i = 0; i < numEvents && retVal == CL_SUCCESS; i++)
retVal = validateObjects(eventList[i]);
if (retVal != CL_SUCCESS)
return retVal;
retVal = Event::waitForEvents(numEvents, eventList);
return retVal;
}
cl_int CL_API_CALL clGetEventInfo(cl_event event,
cl_event_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
API_ENTER(0);
Event *neoEvent = castToObject<Event>(event);
if (neoEvent == nullptr) {
return CL_INVALID_EVENT;
}
GetInfoHelper info(paramValue, paramValueSize, paramValueSizeRet);
switch (paramName) {
default:
return CL_INVALID_VALUE;
// From OCL spec :
// "Return the command-queue associated with event. For user event objects,"
// a nullptr value is returned."
case CL_EVENT_COMMAND_QUEUE: {
if (neoEvent->isUserEvent()) {
return info.set<cl_command_queue>(nullptr);
}
return info.set<cl_command_queue>(neoEvent->getCommandQueue());
}
case CL_EVENT_CONTEXT:
return info.set<cl_context>(neoEvent->getContext());
case CL_EVENT_COMMAND_TYPE:
return info.set<cl_command_type>(neoEvent->getCommandType());
case CL_EVENT_COMMAND_EXECUTION_STATUS:
neoEvent->tryFlushEvent();
if (neoEvent->isUserEvent()) {
auto executionStatus = neoEvent->peekExecutionStatus();
//Spec requires initial state to be queued
//our current design relies heavily on SUBMITTED status which directly corresponds
//to command being able to be submitted, to overcome this we set initial status to queued
//and we override the value stored with the value required by the spec.
if (executionStatus == CL_QUEUED) {
executionStatus = CL_SUBMITTED;
}
return info.set<cl_int>(executionStatus);
}
return info.set<cl_int>(neoEvent->updateEventAndReturnCurrentStatus());
case CL_EVENT_REFERENCE_COUNT:
return info.set<cl_uint>(neoEvent->getReference());
}
}
cl_event CL_API_CALL clCreateUserEvent(cl_context context,
cl_int *errcodeRet) {
API_ENTER(0);
ErrorCodeHelper err(errcodeRet, CL_SUCCESS);
Context *ctx = castToObject<Context>(context);
if (ctx == nullptr) {
err.set(CL_INVALID_CONTEXT);
return nullptr;
}
Event *userEvent = new UserEvent(ctx);
cl_event userClEvent = userEvent;
DebugManager.logInputs("cl_event", userClEvent, "UserEvent", userEvent);
return userClEvent;
}
cl_int CL_API_CALL clRetainEvent(cl_event event) {
API_ENTER(0);
auto pEvent = castToObject<Event>(event);
DebugManager.logInputs("cl_event", event, "Event", pEvent);
if (pEvent) {
pEvent->retain();
return CL_SUCCESS;
}
return CL_INVALID_EVENT;
}
cl_int CL_API_CALL clReleaseEvent(cl_event event) {
API_ENTER(0);
DBG_LOG_INPUTS("cl_event", event);
auto pEvent = castToObject<Event>(event);
DebugManager.logInputs("cl_event", event, "Event", pEvent);
if (pEvent) {
pEvent->release();
return CL_SUCCESS;
}
return CL_INVALID_EVENT;
}
cl_int CL_API_CALL clSetUserEventStatus(cl_event event,
cl_int executionStatus) {
API_ENTER(0);
auto userEvent = castToObject<UserEvent>(event);
DBG_LOG_INPUTS("cl_event", event, "executionStatus", executionStatus, "UserEvent", userEvent);
if (userEvent == nullptr)
return CL_INVALID_EVENT;
if (executionStatus > CL_COMPLETE) {
return CL_INVALID_VALUE;
}
if (!userEvent->isInitialEventStatus()) {
return CL_INVALID_OPERATION;
}
TakeOwnershipWrapper<Device> deviceOwnership(*userEvent->getContext()->getDevice(0));
userEvent->setStatus(executionStatus);
return CL_SUCCESS;
}
cl_int CL_API_CALL clSetEventCallback(cl_event event,
cl_int commandExecCallbackType,
void(CL_CALLBACK *funcNotify)(cl_event, cl_int, void *),
void *userData) {
API_ENTER(0);
auto eventObject = castToObject<Event>(event);
DBG_LOG_INPUTS("cl_event", event, "commandExecCallbackType", commandExecCallbackType, "Event", eventObject);
if (eventObject == nullptr)
return CL_INVALID_EVENT;
switch (commandExecCallbackType) {
case CL_COMPLETE:
case CL_SUBMITTED:
case CL_RUNNING:
break;
default:
return CL_INVALID_VALUE;
}
if (funcNotify == nullptr)
return CL_INVALID_VALUE;
eventObject->tryFlushEvent();
eventObject->addCallback(funcNotify, commandExecCallbackType, userData);
return CL_SUCCESS;
}
cl_int CL_API_CALL clGetEventProfilingInfo(cl_event event,
cl_profiling_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
API_ENTER(0);
auto eventObject = castToObject<Event>(event);
if (eventObject == nullptr)
return CL_INVALID_EVENT;
return eventObject->getEventProfilingInfo(paramName,
paramValueSize,
paramValue,
paramValueSizeRet);
}
cl_int CL_API_CALL clFlush(cl_command_queue commandQueue) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue);
auto pCommandQueue = castToObject<CommandQueue>(commandQueue);
retVal = pCommandQueue
? pCommandQueue->flush()
: CL_INVALID_COMMAND_QUEUE;
return retVal;
}
cl_int CL_API_CALL clFinish(cl_command_queue commandQueue) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue);
auto pCommandQueue = castToObject<CommandQueue>(commandQueue);
retVal = pCommandQueue
? pCommandQueue->finish(false)
: CL_INVALID_COMMAND_QUEUE;
return retVal;
}
cl_int CL_API_CALL clEnqueueReadBuffer(cl_command_queue commandQueue,
cl_mem buffer,
cl_bool blockingRead,
size_t offset,
size_t cb,
void *ptr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
Buffer *pBuffer = nullptr;
auto retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(buffer, &pBuffer),
ptr);
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "buffer", buffer, "blockingRead", blockingRead,
"offset", offset, "cb", cb, "ptr", ptr,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
if (CL_SUCCESS == retVal) {
if (pBuffer->readMemObjFlagsInvalid()) {
retVal = CL_INVALID_OPERATION;
return retVal;
}
retVal = pCommandQueue->enqueueReadBuffer(
pBuffer,
blockingRead,
offset,
cb,
ptr,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueReadBufferRect(cl_command_queue commandQueue,
cl_mem buffer,
cl_bool blockingRead,
const size_t *bufferOrigin,
const size_t *hostOrigin,
const size_t *region,
size_t bufferRowPitch,
size_t bufferSlicePitch,
size_t hostRowPitch,
size_t hostSlicePitch,
void *ptr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
CommandQueue *pCommandQueue = nullptr;
Buffer *pBuffer = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(buffer, &pBuffer),
ptr);
if (CL_SUCCESS != retVal) {
return retVal;
}
if (pBuffer->readMemObjFlagsInvalid()) {
retVal = CL_INVALID_OPERATION;
return retVal;
}
if (pBuffer->bufferRectPitchSet(bufferOrigin,
region,
bufferRowPitch,
bufferSlicePitch,
hostRowPitch,
hostSlicePitch) == false) {
retVal = CL_INVALID_VALUE;
return retVal;
}
retVal = pCommandQueue->enqueueReadBufferRect(
pBuffer,
blockingRead,
bufferOrigin,
hostOrigin,
region,
bufferRowPitch,
bufferSlicePitch,
hostRowPitch,
hostSlicePitch,
ptr,
numEventsInWaitList,
eventWaitList,
event);
return retVal;
}
cl_int CL_API_CALL clEnqueueWriteBuffer(cl_command_queue commandQueue,
cl_mem buffer,
cl_bool blockingWrite,
size_t offset,
size_t cb,
const void *ptr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "buffer", buffer, "blockingWrite", blockingWrite,
"offset", offset, "cb", cb, "ptr", ptr,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
Buffer *pBuffer = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(buffer, &pBuffer),
ptr);
if (CL_SUCCESS == retVal) {
if (pBuffer->writeMemObjFlagsInvalid()) {
retVal = CL_INVALID_OPERATION;
return retVal;
}
retVal = pCommandQueue->enqueueWriteBuffer(
pBuffer,
blockingWrite,
offset,
cb,
ptr,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueWriteBufferRect(cl_command_queue commandQueue,
cl_mem buffer,
cl_bool blockingWrite,
const size_t *bufferOrigin,
const size_t *hostOrigin,
const size_t *region,
size_t bufferRowPitch,
size_t bufferSlicePitch,
size_t hostRowPitch,
size_t hostSlicePitch,
const void *ptr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
CommandQueue *pCommandQueue = nullptr;
Buffer *pBuffer = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(buffer, &pBuffer),
ptr);
if (CL_SUCCESS != retVal) {
return retVal;
}
if (pBuffer->writeMemObjFlagsInvalid()) {
retVal = CL_INVALID_OPERATION;
return retVal;
}
if (pBuffer->bufferRectPitchSet(bufferOrigin,
region,
bufferRowPitch,
bufferSlicePitch,
hostRowPitch,
hostSlicePitch) == false) {
retVal = CL_INVALID_VALUE;
return retVal;
}
retVal = pCommandQueue->enqueueWriteBufferRect(
pBuffer,
blockingWrite,
bufferOrigin,
hostOrigin,
region,
bufferRowPitch,
bufferSlicePitch,
hostRowPitch,
hostSlicePitch,
ptr,
numEventsInWaitList,
eventWaitList,
event);
return retVal;
}
cl_int CL_API_CALL clEnqueueFillBuffer(cl_command_queue commandQueue,
cl_mem buffer,
const void *pattern,
size_t patternSize,
size_t offset,
size_t size,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
CommandQueue *pCommandQueue = nullptr;
Buffer *pBuffer = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(buffer, &pBuffer),
pattern,
(PatternSize)patternSize,
EventWaitList(numEventsInWaitList, eventWaitList));
if (CL_SUCCESS == retVal) {
retVal = pCommandQueue->enqueueFillBuffer(
pBuffer,
pattern,
patternSize,
offset,
size,
numEventsInWaitList,
eventWaitList,
event);
}
return retVal;
}
cl_int CL_API_CALL clEnqueueCopyBuffer(cl_command_queue commandQueue,
cl_mem srcBuffer,
cl_mem dstBuffer,
size_t srcOffset,
size_t dstOffset,
size_t cb,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "srcBuffer", srcBuffer, "dstBuffer", dstBuffer,
"srcOffset", srcOffset, "dstOffset", dstOffset, "cb", cb,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
Buffer *pSrcBuffer = nullptr;
Buffer *pDstBuffer = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(srcBuffer, &pSrcBuffer),
WithCastToInternal(dstBuffer, &pDstBuffer));
if (CL_SUCCESS == retVal) {
size_t srcSize = pSrcBuffer->getSize();
size_t dstSize = pDstBuffer->getSize();
if (srcOffset + cb > srcSize || dstOffset + cb > dstSize) {
retVal = CL_INVALID_VALUE;
return retVal;
}
retVal = pCommandQueue->enqueueCopyBuffer(
pSrcBuffer,
pDstBuffer,
srcOffset,
dstOffset,
cb,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueCopyBufferRect(cl_command_queue commandQueue,
cl_mem srcBuffer,
cl_mem dstBuffer,
const size_t *srcOrigin,
const size_t *dstOrigin,
const size_t *region,
size_t srcRowPitch,
size_t srcSlicePitch,
size_t dstRowPitch,
size_t dstSlicePitch,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "srcBuffer", srcBuffer, "dstBuffer", dstBuffer,
"srcOrigin[0]", DebugManager.getInput(srcOrigin, 0), "srcOrigin[1]", DebugManager.getInput(srcOrigin, 1), "srcOrigin[2]", DebugManager.getInput(srcOrigin, 2),
"dstOrigin[0]", DebugManager.getInput(dstOrigin, 0), "dstOrigin[1]", DebugManager.getInput(dstOrigin, 1), "dstOrigin[2]", DebugManager.getInput(dstOrigin, 2),
"region[0]", DebugManager.getInput(region, 0), "region[1]", DebugManager.getInput(region, 1), "region[2]", DebugManager.getInput(region, 2),
"srcRowPitch", srcRowPitch, "srcSlicePitch", srcSlicePitch,
"dstRowPitch", dstRowPitch, "dstSlicePitch", dstSlicePitch,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
Buffer *pSrcBuffer = nullptr;
Buffer *pDstBuffer = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(srcBuffer, &pSrcBuffer),
WithCastToInternal(dstBuffer, &pDstBuffer));
if (CL_SUCCESS == retVal) {
retVal = pCommandQueue->enqueueCopyBufferRect(
pSrcBuffer,
pDstBuffer,
srcOrigin,
dstOrigin,
region,
srcRowPitch,
srcSlicePitch,
dstRowPitch,
dstSlicePitch,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueReadImage(cl_command_queue commandQueue,
cl_mem image,
cl_bool blockingRead,
const size_t *origin,
const size_t *region,
size_t rowPitch,
size_t slicePitch,
void *ptr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
Image *pImage = nullptr;
auto retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(image, &pImage));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "image", image, "blockingRead", blockingRead,
"origin[0]", DebugManager.getInput(origin, 0), "origin[1]", DebugManager.getInput(origin, 1), "origin[2]", DebugManager.getInput(origin, 2),
"region[0]", DebugManager.getInput(region, 0), "region[1]", DebugManager.getInput(region, 1), "region[2]", DebugManager.getInput(region, 2),
"rowPitch", rowPitch, "slicePitch", slicePitch, "ptr", ptr,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
if (CL_SUCCESS == retVal) {
if (pImage->readMemObjFlagsInvalid()) {
retVal = CL_INVALID_OPERATION;
return retVal;
}
if (IsPackedYuvImage(&pImage->getImageFormat())) {
retVal = validateYuvOperation(origin, region);
if (retVal != CL_SUCCESS)
return retVal;
}
if (!Image::validateRegionAndOrigin(origin, region, pImage->getImageDesc())) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueReadImage(
pImage,
blockingRead,
origin,
region,
rowPitch,
slicePitch,
ptr,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueWriteImage(cl_command_queue commandQueue,
cl_mem image,
cl_bool blockingWrite,
const size_t *origin,
const size_t *region,
size_t inputRowPitch,
size_t inputSlicePitch,
const void *ptr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
Image *pImage = nullptr;
auto retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(image, &pImage));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "image", image, "blockingWrite", blockingWrite,
"origin[0]", DebugManager.getInput(origin, 0), "origin[1]", DebugManager.getInput(origin, 1), "origin[2]", DebugManager.getInput(origin, 2),
"region[0]", DebugManager.getInput(region, 0), "region[1]", DebugManager.getInput(region, 1), "region[2]", DebugManager.getInput(region, 2),
"inputRowPitch", inputRowPitch, "inputSlicePitch", inputSlicePitch, "ptr", ptr,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
if (CL_SUCCESS == retVal) {
if (pImage->writeMemObjFlagsInvalid()) {
retVal = CL_INVALID_OPERATION;
return retVal;
}
if (IsPackedYuvImage(&pImage->getImageFormat())) {
retVal = validateYuvOperation(origin, region);
if (retVal != CL_SUCCESS)
return retVal;
}
if (!Image::validateRegionAndOrigin(origin, region, pImage->getImageDesc())) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueWriteImage(
pImage,
blockingWrite,
origin,
region,
inputRowPitch,
inputSlicePitch,
ptr,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueFillImage(cl_command_queue commandQueue,
cl_mem image,
const void *fillColor,
const size_t *origin,
const size_t *region,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
Image *dstImage = nullptr;
auto retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(image, &dstImage),
fillColor,
EventWaitList(numEventsInWaitList, eventWaitList));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "image", image, "fillColor", fillColor,
"origin[0]", origin[0], "origin[1]", origin[1], "origin[2]", origin[2],
"region[0]", region[0], "region[1]", region[1], "region[2]", region[2],
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
if (CL_SUCCESS == retVal) {
if (!Image::validateRegionAndOrigin(origin, region, dstImage->getImageDesc())) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueFillImage(
dstImage,
fillColor,
origin,
region,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueCopyImage(cl_command_queue commandQueue,
cl_mem srcImage,
cl_mem dstImage,
const size_t *srcOrigin,
const size_t *dstOrigin,
const size_t *region,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
Image *pSrcImage = nullptr;
Image *pDstImage = nullptr;
auto retVal = validateObjects(WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(srcImage, &pSrcImage),
WithCastToInternal(dstImage, &pDstImage));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "srcImage", srcImage, "dstImage", dstImage,
"origin[0]", DebugManager.getInput(srcOrigin, 0), "origin[1]", DebugManager.getInput(srcOrigin, 1), "origin[2]", DebugManager.getInput(srcOrigin, 2),
"region[0]", DebugManager.getInput(dstOrigin, 0), "region[1]", DebugManager.getInput(dstOrigin, 1), "region[2]", DebugManager.getInput(dstOrigin, 2),
"region[0]", region ? region[0] : 0, "region[1]", region ? region[1] : 0, "region[2]", region ? region[2] : 0,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
if (CL_SUCCESS == retVal) {
if (memcmp(&pSrcImage->getImageFormat(), &pDstImage->getImageFormat(), sizeof(cl_image_format))) {
return CL_IMAGE_FORMAT_MISMATCH;
}
if (IsPackedYuvImage(&pSrcImage->getImageFormat())) {
retVal = validateYuvOperation(srcOrigin, region);
if (retVal != CL_SUCCESS)
return retVal;
}
if (IsPackedYuvImage(&pDstImage->getImageFormat())) {
retVal = validateYuvOperation(dstOrigin, region);
if (retVal != CL_SUCCESS)
return retVal;
if (pDstImage->getImageDesc().image_type == CL_MEM_OBJECT_IMAGE2D && dstOrigin[2] != 0)
return CL_INVALID_VALUE;
}
if (!Image::validateRegionAndOrigin(srcOrigin, region, pSrcImage->getImageDesc())) {
return CL_INVALID_VALUE;
}
if (!Image::validateRegionAndOrigin(dstOrigin, region, pDstImage->getImageDesc())) {
return CL_INVALID_VALUE;
}
pCommandQueue->enqueueCopyImage(
pSrcImage,
pDstImage,
srcOrigin,
dstOrigin,
region,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueCopyImageToBuffer(cl_command_queue commandQueue,
cl_mem srcImage,
cl_mem dstBuffer,
const size_t *srcOrigin,
const size_t *region,
const size_t dstOffset,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "srcImage", srcImage, "dstBuffer", dstBuffer,
"srcOrigin[0]", srcOrigin[0], "srcOrigin[1]", srcOrigin[1], "srcOrigin[2]", srcOrigin[2],
"region[0]", region[0], "region[1]", region[1], "region[2]", region[2],
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
Image *pSrcImage = nullptr;
Buffer *pDstBuffer = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(srcImage, &pSrcImage),
WithCastToInternal(dstBuffer, &pDstBuffer));
if (CL_SUCCESS == retVal) {
if (IsPackedYuvImage(&pSrcImage->getImageFormat())) {
retVal = validateYuvOperation(srcOrigin, region);
if (retVal != CL_SUCCESS)
return retVal;
}
if (!Image::validateRegionAndOrigin(srcOrigin, region, pSrcImage->getImageDesc())) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueCopyImageToBuffer(
pSrcImage,
pDstBuffer,
srcOrigin,
region,
dstOffset,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueCopyBufferToImage(cl_command_queue commandQueue,
cl_mem srcBuffer,
cl_mem dstImage,
size_t srcOffset,
const size_t *dstOrigin,
const size_t *region,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "srcBuffer", srcBuffer, "dstImage", dstImage, "srcOffset", srcOffset,
"dstOrigin[0]", dstOrigin[0], "dstOrigin[1]", dstOrigin[1], "dstOrigin[2]", dstOrigin[2],
"region[0]", region[0], "region[1]", region[1], "region[2]", region[2],
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
Buffer *pSrcBuffer = nullptr;
Image *pDstImage = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(srcBuffer, &pSrcBuffer),
WithCastToInternal(dstImage, &pDstImage));
if (CL_SUCCESS == retVal) {
if (IsPackedYuvImage(&pDstImage->getImageFormat())) {
retVal = validateYuvOperation(dstOrigin, region);
if (retVal != CL_SUCCESS)
return retVal;
}
if (!Image::validateRegionAndOrigin(dstOrigin, region, pDstImage->getImageDesc())) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueCopyBufferToImage(
pSrcBuffer,
pDstImage,
srcOffset,
dstOrigin,
region,
numEventsInWaitList,
eventWaitList,
event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
void *CL_API_CALL clEnqueueMapBuffer(cl_command_queue commandQueue,
cl_mem buffer,
cl_bool blockingMap,
cl_map_flags mapFlags,
size_t offset,
size_t cb,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event,
cl_int *errcodeRet) {
void *retPtr = nullptr;
ErrorCodeHelper err(errcodeRet, CL_SUCCESS);
cl_int retVal;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "buffer", buffer, "blockingMap", blockingMap,
"mapFlags", mapFlags, "offset", offset, "cb", cb,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
do {
auto pCommandQueue = castToObject<CommandQueue>(commandQueue);
if (!pCommandQueue) {
retVal = CL_INVALID_COMMAND_QUEUE;
break;
}
auto pBuffer = castToObject<Buffer>(buffer);
if (!pBuffer) {
retVal = CL_INVALID_MEM_OBJECT;
break;
}
if (pBuffer->mapMemObjFlagsInvalid(mapFlags)) {
retVal = CL_INVALID_OPERATION;
break;
}
retPtr = pCommandQueue->enqueueMapBuffer(
pBuffer,
blockingMap,
mapFlags,
offset,
cb,
numEventsInWaitList,
eventWaitList,
event,
retVal);
} while (false);
err.set(retVal);
DBG_LOG_INPUTS("retPtr", retPtr, "event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retPtr;
}
void *CL_API_CALL clEnqueueMapImage(cl_command_queue commandQueue,
cl_mem image,
cl_bool blockingMap,
cl_map_flags mapFlags,
const size_t *origin,
const size_t *region,
size_t *imageRowPitch,
size_t *imageSlicePitch,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event,
cl_int *errcodeRet) {
void *retPtr = nullptr;
ErrorCodeHelper err(errcodeRet, CL_SUCCESS);
cl_int retVal;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"image", image,
"blockingMap", blockingMap,
"mapFlags", mapFlags,
"origin[0]", origin[0],
"origin[1]", origin[1],
"origin[2]", origin[2],
"region[0]", region[0],
"region[1]", region[1],
"region[2]", region[2],
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
do {
Image *pImage = nullptr;
CommandQueue *pCommandQueue = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(image, &pImage));
if (retVal != CL_SUCCESS) {
break;
}
if (pImage->mapMemObjFlagsInvalid(mapFlags)) {
retVal = CL_INVALID_OPERATION;
break;
}
if (IsPackedYuvImage(&pImage->getImageFormat())) {
retVal = validateYuvOperation(origin, region);
if (retVal != CL_SUCCESS) {
break;
}
}
if (!Image::validateRegionAndOrigin(origin, region, pImage->getImageDesc())) {
retVal = CL_INVALID_VALUE;
break;
}
retPtr = pCommandQueue->enqueueMapImage(
pImage,
blockingMap,
mapFlags,
origin,
region,
imageRowPitch,
imageSlicePitch,
numEventsInWaitList,
eventWaitList,
event,
retVal);
} while (false);
err.set(retVal);
DBG_LOG_INPUTS("retPtr", retPtr, "event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retPtr;
}
cl_int CL_API_CALL clEnqueueUnmapMemObject(cl_command_queue commandQueue,
cl_mem memObj,
void *mappedPtr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
MemObj *pMemObj = nullptr;
cl_int retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
WithCastToInternal(memObj, &pMemObj));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"memObj", memObj,
"mappedPtr", mappedPtr,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
if (retVal == CL_SUCCESS) {
if (pMemObj->peekClMemObjType() == CL_MEM_OBJECT_PIPE) {
return CL_INVALID_MEM_OBJECT;
}
retVal = pCommandQueue->enqueueUnmapMemObject(pMemObj, mappedPtr, numEventsInWaitList, eventWaitList, event);
}
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueMigrateMemObjects(cl_command_queue commandQueue,
cl_uint numMemObjects,
const cl_mem *memObjects,
cl_mem_migration_flags flags,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"numMemObjects", numMemObjects,
"memObjects", memObjects,
"flags", flags,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", event);
CommandQueue *pCommandQueue = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
if (CL_SUCCESS != retVal) {
return retVal;
}
if (numMemObjects == 0 || memObjects == nullptr)
return CL_INVALID_VALUE;
const cl_mem_migration_flags allValidFlags = CL_MIGRATE_MEM_OBJECT_CONTENT_UNDEFINED | CL_MIGRATE_MEM_OBJECT_HOST;
if ((flags & (~allValidFlags)) != 0) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueMigrateMemObjects(numMemObjects,
memObjects,
flags,
numEventsInWaitList,
eventWaitList,
event);
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueNDRangeKernel(cl_command_queue commandQueue,
cl_kernel kernel,
cl_uint workDim,
const size_t *globalWorkOffset,
const size_t *globalWorkSize,
const size_t *localWorkSize,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue, "cl_kernel", kernel, "globalWorkOffset", globalWorkOffset,
DebugManager.getSizes(globalWorkSize, workDim, false), DebugManager.getSizes(localWorkSize, workDim, true),
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
kernel,
EventWaitList(numEventsInWaitList, eventWaitList));
if (CL_SUCCESS != retVal) {
return retVal;
}
auto pKernel = castToObjectOrAbort<Kernel>(kernel);
TakeOwnershipWrapper<Kernel> kernelOwnership(*pKernel, gtpinIsGTPinInitialized());
if (gtpinIsGTPinInitialized()) {
gtpinNotifyKernelSubmit(kernel, pCommandQueue);
}
retVal = pCommandQueue->enqueueKernel(
kernel,
workDim,
globalWorkOffset,
globalWorkSize,
localWorkSize,
numEventsInWaitList,
eventWaitList,
event);
DBG_LOG_INPUTS("event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1u));
return retVal;
}
cl_int CL_API_CALL clEnqueueTask(cl_command_queue commandQueue,
cl_kernel kernel,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_uint workDim = 3;
size_t *globalWorkOffset = nullptr;
size_t globalWorkSize[3] = {1, 1, 1};
size_t localWorkSize[3] = {1, 1, 1};
retVal = (clEnqueueNDRangeKernel(
commandQueue,
kernel,
workDim,
globalWorkOffset,
globalWorkSize,
localWorkSize,
numEventsInWaitList,
eventWaitList,
event));
return retVal;
}
cl_int CL_API_CALL clEnqueueNativeKernel(cl_command_queue commandQueue,
void(CL_CALLBACK *userFunc)(void *),
void *args,
size_t cbArgs,
cl_uint numMemObjects,
const cl_mem *memList,
const void **argsMemLoc,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
return CL_OUT_OF_HOST_MEMORY;
}
// deprecated OpenCL 1.1
cl_int CL_API_CALL clEnqueueMarker(cl_command_queue commandQueue,
cl_event *event) {
API_ENTER(0);
DBG_LOG_INPUTS("commandQueue", commandQueue, "cl_event", event);
auto pCommandQueue = castToObject<CommandQueue>(commandQueue);
if (pCommandQueue) {
return pCommandQueue->enqueueMarkerWithWaitList(
0,
nullptr,
event);
}
return CL_INVALID_COMMAND_QUEUE;
}
// deprecated OpenCL 1.1
cl_int CL_API_CALL clEnqueueWaitForEvents(cl_command_queue commandQueue,
cl_uint numEvents,
const cl_event *eventList) {
return CL_OUT_OF_HOST_MEMORY;
}
// deprecated OpenCL 1.1
cl_int CL_API_CALL clEnqueueBarrier(cl_command_queue commandQueue) {
API_ENTER(0);
auto pCommandQueue = castToObject<CommandQueue>(commandQueue);
if (pCommandQueue) {
return pCommandQueue->enqueueBarrierWithWaitList(
0,
nullptr,
nullptr);
}
return CL_INVALID_COMMAND_QUEUE;
}
cl_int CL_API_CALL clEnqueueMarkerWithWaitList(cl_command_queue commandQueue,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DebugManager.logInputs("cl_command_queue", commandQueue,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
if (CL_SUCCESS != retVal) {
return retVal;
}
return pCommandQueue->enqueueMarkerWithWaitList(
numEventsInWaitList,
eventWaitList,
event);
}
cl_int CL_API_CALL clEnqueueBarrierWithWaitList(cl_command_queue commandQueue,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("cl_command_queue", commandQueue,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(eventWaitList), numEventsInWaitList),
"event", DebugManager.getEvents(reinterpret_cast<const uintptr_t *>(event), 1));
CommandQueue *pCommandQueue = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
if (CL_SUCCESS != retVal) {
return retVal;
}
return pCommandQueue->enqueueBarrierWithWaitList(
numEventsInWaitList,
eventWaitList,
event);
}
CL_API_ENTRY cl_command_queue CL_API_CALL
clCreatePerfCountersCommandQueueINTEL(
cl_context context,
cl_device_id device,
cl_command_queue_properties properties,
cl_uint configuration,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_command_queue commandQueue = nullptr;
ErrorCodeHelper err(errcodeRet, CL_SUCCESS);
Device *pDevice = nullptr;
WithCastToInternal(device, &pDevice);
if (pDevice == nullptr) {
err.set(CL_INVALID_DEVICE);
return commandQueue;
}
if (!pDevice->getHardwareInfo().capabilityTable.instrumentationEnabled) {
err.set(CL_INVALID_DEVICE);
return commandQueue;
}
if ((properties & CL_QUEUE_PROFILING_ENABLE) == 0) {
err.set(CL_INVALID_QUEUE_PROPERTIES);
return commandQueue;
}
if ((properties & CL_QUEUE_ON_DEVICE) != 0) {
err.set(CL_INVALID_QUEUE_PROPERTIES);
return commandQueue;
}
if ((properties & CL_QUEUE_ON_DEVICE_DEFAULT) != 0) {
err.set(CL_INVALID_QUEUE_PROPERTIES);
return commandQueue;
}
commandQueue = clCreateCommandQueue(context, device, properties, errcodeRet);
if (commandQueue != nullptr) {
auto commandQueueObject = castToObjectOrAbort<CommandQueue>(commandQueue);
bool ret = commandQueueObject->setPerfCountersEnabled(true, configuration);
if (!ret) {
clReleaseCommandQueue(commandQueue);
commandQueue = nullptr;
err.set(CL_OUT_OF_RESOURCES);
}
}
return commandQueue;
}
CL_API_ENTRY cl_int CL_API_CALL
clSetPerformanceConfigurationINTEL(
cl_device_id device,
cl_uint count,
cl_uint *offsets,
cl_uint *values) {
API_ENTER(0);
Device *pDevice = nullptr;
auto retVal = validateObjects(WithCastToInternal(device, &pDevice));
if (CL_SUCCESS != retVal) {
return retVal;
}
if (!pDevice->getHardwareInfo().capabilityTable.instrumentationEnabled) {
return CL_PROFILING_INFO_NOT_AVAILABLE;
}
auto perfCounters = pDevice->getPerformanceCounters();
return perfCounters->sendPerfConfiguration(count, offsets, values);
}
cl_command_queue CL_API_CALL clCreateCommandQueueWithPropertiesKHR(cl_context context,
cl_device_id device,
const cl_queue_properties_khr *properties,
cl_int *errcodeRet) {
return clCreateCommandQueueWithProperties(context, device, properties, errcodeRet);
}
cl_accelerator_intel CL_API_CALL clCreateAcceleratorINTEL(
cl_context context,
cl_accelerator_type_intel acceleratorType,
size_t descriptorSize,
const void *descriptor,
cl_int *errcodeRet) {
API_ENTER(0);
cl_int retVal = CL_SUCCESS;
cl_accelerator_intel accelerator = nullptr;
do {
retVal = validateObjects(context);
if (retVal != CL_SUCCESS) {
retVal = CL_INVALID_CONTEXT;
break;
}
Context *pContext = castToObject<Context>(context);
DEBUG_BREAK_IF(!pContext);
switch (acceleratorType) {
case CL_ACCELERATOR_TYPE_MOTION_ESTIMATION_INTEL:
accelerator = VmeAccelerator::create(
pContext,
acceleratorType,
descriptorSize,
descriptor,
retVal);
break;
default:
retVal = CL_INVALID_ACCELERATOR_TYPE_INTEL;
}
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
return accelerator;
}
cl_int CL_API_CALL clRetainAcceleratorINTEL(
cl_accelerator_intel accelerator) {
API_ENTER(0);
cl_int retVal = CL_SUCCESS;
IntelAccelerator *pAccelerator = nullptr;
do {
pAccelerator = castToObject<IntelAccelerator>(accelerator);
if (!pAccelerator) {
retVal = CL_INVALID_ACCELERATOR_INTEL;
break;
}
pAccelerator->retain();
} while (false);
return retVal;
}
cl_int CL_API_CALL clGetAcceleratorInfoINTEL(
cl_accelerator_intel accelerator,
cl_accelerator_info_intel paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
API_ENTER(0);
cl_int retVal = CL_SUCCESS;
IntelAccelerator *pAccelerator = nullptr;
do {
pAccelerator = castToObject<IntelAccelerator>(accelerator);
if (!pAccelerator) {
retVal = CL_INVALID_ACCELERATOR_INTEL;
break;
}
retVal = pAccelerator->getInfo(
paramName, paramValueSize, paramValue, paramValueSizeRet);
} while (false);
return retVal;
}
cl_int CL_API_CALL clReleaseAcceleratorINTEL(
cl_accelerator_intel accelerator) {
API_ENTER(0);
cl_int retVal = CL_SUCCESS;
IntelAccelerator *pAccelerator = nullptr;
do {
pAccelerator = castToObject<IntelAccelerator>(accelerator);
if (!pAccelerator) {
retVal = CL_INVALID_ACCELERATOR_INTEL;
break;
}
pAccelerator->release();
} while (false);
return retVal;
}
cl_program CL_API_CALL clCreateProgramWithILKHR(cl_context context,
const void *il,
size_t length,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_program program = nullptr;
retVal = validateObjects(context, il);
if (retVal == CL_SUCCESS) {
program = Program::createFromIL(
castToObjectOrAbort<Context>(context),
il,
length,
retVal);
}
if (errcodeRet != nullptr) {
*errcodeRet = retVal;
}
return program;
}
#define RETURN_FUNC_PTR_IF_EXIST(name) \
{ \
if (!strcmp(func_name, #name)) { \
return ((void *)(name)); \
} \
}
void *CL_API_CALL clGetExtensionFunctionAddress(const char *func_name) {
// Support an internal call by the ICD
RETURN_FUNC_PTR_IF_EXIST(clIcdGetPlatformIDsKHR);
//perf counters
RETURN_FUNC_PTR_IF_EXIST(clCreatePerfCountersCommandQueueINTEL);
RETURN_FUNC_PTR_IF_EXIST(clSetPerformanceConfigurationINTEL);
// Support device extensions
RETURN_FUNC_PTR_IF_EXIST(clCreateAcceleratorINTEL);
RETURN_FUNC_PTR_IF_EXIST(clGetAcceleratorInfoINTEL);
RETURN_FUNC_PTR_IF_EXIST(clRetainAcceleratorINTEL);
RETURN_FUNC_PTR_IF_EXIST(clReleaseAcceleratorINTEL);
void *ret = sharingFactory.getExtensionFunctionAddress(func_name);
if (ret != nullptr)
return ret;
// SPIR-V support through the cl_khr_il_program extension
RETURN_FUNC_PTR_IF_EXIST(clCreateProgramWithILKHR);
RETURN_FUNC_PTR_IF_EXIST(clCreateCommandQueueWithPropertiesKHR);
return nullptr;
}
// OpenCL 1.2
void *CL_API_CALL clGetExtensionFunctionAddressForPlatform(cl_platform_id platform,
const char *funcName) {
auto pPlatform = castToObject<Platform>(platform);
if (pPlatform == nullptr) {
return nullptr;
}
return clGetExtensionFunctionAddress(funcName);
}
void *CL_API_CALL clSVMAlloc(cl_context context,
cl_svm_mem_flags flags,
size_t size,
cl_uint alignment) {
void *pAlloc = nullptr;
auto pPlatform = platform();
auto pDevice = pPlatform->getDevice(0);
Context *pContext = nullptr;
if (validateObjects(WithCastToInternal(context, &pContext), pDevice) != CL_SUCCESS) {
return pAlloc;
}
if (flags == 0) {
flags = CL_MEM_READ_WRITE;
}
if (!((flags == CL_MEM_READ_WRITE) ||
(flags == CL_MEM_WRITE_ONLY) ||
(flags == CL_MEM_READ_ONLY) ||
(flags == CL_MEM_SVM_FINE_GRAIN_BUFFER) ||
(flags == (CL_MEM_SVM_FINE_GRAIN_BUFFER | CL_MEM_SVM_ATOMICS)) ||
(flags == (CL_MEM_READ_WRITE | CL_MEM_SVM_FINE_GRAIN_BUFFER)) ||
(flags == (CL_MEM_READ_WRITE | CL_MEM_SVM_FINE_GRAIN_BUFFER | CL_MEM_SVM_ATOMICS)) ||
(flags == (CL_MEM_WRITE_ONLY | CL_MEM_SVM_FINE_GRAIN_BUFFER)) ||
(flags == (CL_MEM_WRITE_ONLY | CL_MEM_SVM_FINE_GRAIN_BUFFER | CL_MEM_SVM_ATOMICS)) ||
(flags == (CL_MEM_READ_ONLY | CL_MEM_SVM_FINE_GRAIN_BUFFER)) ||
(flags == (CL_MEM_READ_ONLY | CL_MEM_SVM_FINE_GRAIN_BUFFER | CL_MEM_SVM_ATOMICS)))) {
return pAlloc;
}
if ((size == 0) || (size > pDevice->getDeviceInfo().maxMemAllocSize)) {
return pAlloc;
}
if ((alignment && (alignment & (alignment - 1))) || (alignment > sizeof(cl_ulong16))) {
return pAlloc;
}
const HardwareInfo &hwInfo = pDevice->getHardwareInfo();
if (!hwInfo.capabilityTable.ftrSvm) {
return pAlloc;
}
if (!hwInfo.capabilityTable.ftrSupportsCoherency &&
(flags & (CL_MEM_SVM_FINE_GRAIN_BUFFER | CL_MEM_SVM_ATOMICS))) {
return pAlloc;
}
pAlloc = pContext->getSVMAllocsManager()->createSVMAlloc(size, !!(flags & CL_MEM_SVM_FINE_GRAIN_BUFFER));
if (pContext->isProvidingPerformanceHints()) {
pContext->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_GOOD_INTEL, CL_SVM_ALLOC_MEETS_ALIGNMENT_RESTRICTIONS, pAlloc, size);
}
return pAlloc;
}
void CL_API_CALL clSVMFree(cl_context context,
void *svmPointer) {
Context *pContext = nullptr;
if (validateObject(WithCastToInternal(context, &pContext)) == CL_SUCCESS) {
pContext->getSVMAllocsManager()->freeSVMAlloc(svmPointer);
}
}
cl_int CL_API_CALL clEnqueueSVMFree(cl_command_queue commandQueue,
cl_uint numSvmPointers,
void *svmPointers[],
void(CL_CALLBACK *pfnFreeFunc)(cl_command_queue queue,
cl_uint numSvmPointers,
void *svmPointers[],
void *userData),
void *userData,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
cl_int retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"numSvmPointers", numSvmPointers,
"svmPointers", svmPointers,
"pfnFreeFunc", pfnFreeFunc,
"userData", userData,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", eventWaitList,
"event", event);
if (retVal != CL_SUCCESS) {
return retVal;
}
if (((svmPointers != nullptr) && (numSvmPointers == 0)) ||
((svmPointers == nullptr) && (numSvmPointers != 0))) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueSVMFree(
numSvmPointers,
svmPointers,
pfnFreeFunc,
userData,
numEventsInWaitList,
eventWaitList,
event);
return retVal;
}
cl_int CL_API_CALL clEnqueueSVMMemcpy(cl_command_queue commandQueue,
cl_bool blockingCopy,
void *dstPtr,
const void *srcPtr,
size_t size,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
cl_int retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"blockingCopy", blockingCopy,
"dstPtr", dstPtr,
"srcPtr", srcPtr,
"size", size,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", eventWaitList,
"event", event);
if (retVal != CL_SUCCESS) {
return retVal;
}
if ((dstPtr == nullptr) || (srcPtr == nullptr)) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueSVMMemcpy(
blockingCopy,
dstPtr,
srcPtr,
size,
numEventsInWaitList,
eventWaitList,
event);
return retVal;
}
cl_int CL_API_CALL clEnqueueSVMMemFill(cl_command_queue commandQueue,
void *svmPtr,
const void *pattern,
size_t patternSize,
size_t size,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
cl_int retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"svmPtr", svmPtr,
"pattern", pattern,
"patternSize", patternSize,
"size", size,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", eventWaitList,
"event", event);
if (retVal != CL_SUCCESS) {
return retVal;
}
if ((svmPtr == nullptr) || (size == 0)) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueSVMMemFill(
svmPtr,
pattern,
patternSize,
size,
numEventsInWaitList,
eventWaitList,
event);
return retVal;
}
cl_int CL_API_CALL clEnqueueSVMMap(cl_command_queue commandQueue,
cl_bool blockingMap,
cl_map_flags mapFlags,
void *svmPtr,
size_t size,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
cl_int retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"blockingMap", blockingMap,
"mapFlags", mapFlags,
"svmPtr", svmPtr,
"size", size,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", eventWaitList,
"event", event);
if (CL_SUCCESS != retVal) {
return retVal;
}
if ((svmPtr == nullptr) || (size == 0)) {
return CL_INVALID_VALUE;
}
retVal = pCommandQueue->enqueueSVMMap(
blockingMap,
mapFlags,
svmPtr,
size,
numEventsInWaitList,
eventWaitList,
event);
return retVal;
}
cl_int CL_API_CALL clEnqueueSVMUnmap(cl_command_queue commandQueue,
void *svmPtr,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
CommandQueue *pCommandQueue = nullptr;
cl_int retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList),
svmPtr);
API_ENTER(&retVal);
DBG_LOG_INPUTS("commandQueue", commandQueue,
"svmPtr", svmPtr,
"numEventsInWaitList", numEventsInWaitList,
"eventWaitList", eventWaitList,
"event", event);
if (retVal != CL_SUCCESS) {
return retVal;
}
retVal = pCommandQueue->enqueueSVMUnmap(
svmPtr,
numEventsInWaitList,
eventWaitList,
event);
return retVal;
}
cl_int CL_API_CALL clSetKernelArgSVMPointer(cl_kernel kernel,
cl_uint argIndex,
const void *argValue) {
Kernel *pKernel = nullptr;
auto retVal = validateObjects(WithCastToInternal(kernel, &pKernel));
API_ENTER(&retVal);
DBG_LOG_INPUTS("kernel", kernel, "argIndex", argIndex, "argValue", argValue);
if (CL_SUCCESS != retVal) {
return retVal;
}
if (argIndex >= pKernel->getKernelArgsNumber()) {
return CL_INVALID_ARG_INDEX;
}
cl_int kernelArgAddressQualifier = pKernel->getKernelArgAddressQualifier(argIndex);
if ((kernelArgAddressQualifier != CL_KERNEL_ARG_ADDRESS_GLOBAL) &&
(kernelArgAddressQualifier != CL_KERNEL_ARG_ADDRESS_CONSTANT)) {
return CL_INVALID_ARG_VALUE;
}
GraphicsAllocation *pSvmAlloc = nullptr;
if (argValue != nullptr) {
pSvmAlloc = pKernel->getContext().getSVMAllocsManager()->getSVMAlloc(argValue);
if (pSvmAlloc == nullptr) {
return CL_INVALID_ARG_VALUE;
}
}
return pKernel->setArgSvmAlloc(argIndex, const_cast<void *>(argValue), pSvmAlloc);
}
cl_int CL_API_CALL clSetKernelExecInfo(cl_kernel kernel,
cl_kernel_exec_info paramName,
size_t paramValueSize,
const void *paramValue) {
Kernel *pKernel = nullptr;
auto retVal = validateObjects(WithCastToInternal(kernel, &pKernel));
API_ENTER(&retVal);
DBG_LOG_INPUTS("kernel", kernel, "paramName", paramName,
"paramValueSize", paramValueSize, "paramValue", paramValue);
if (CL_SUCCESS != retVal) {
return retVal;
}
switch (paramName) {
case CL_KERNEL_EXEC_INFO_SVM_PTRS: {
if ((paramValueSize == 0) ||
(paramValueSize % sizeof(void *)) ||
(paramValue == nullptr)) {
return CL_INVALID_VALUE;
}
size_t numPointers = paramValueSize / sizeof(void *);
size_t *pSvmPtrList = (size_t *)paramValue;
pKernel->clearKernelExecInfo();
for (uint32_t i = 0; i < numPointers; i++) {
OCLRT::GraphicsAllocation *pSvmAlloc =
pKernel->getContext().getSVMAllocsManager()->getSVMAlloc((const void *)pSvmPtrList[i]);
if (pSvmAlloc == nullptr) {
return CL_INVALID_VALUE;
}
pKernel->setKernelExecInfo(pSvmAlloc);
}
break;
}
case CL_KERNEL_EXEC_INFO_SVM_FINE_GRAIN_SYSTEM:
return CL_INVALID_OPERATION;
default:
return CL_INVALID_VALUE;
}
return retVal;
};
cl_mem CL_API_CALL clCreatePipe(cl_context context,
cl_mem_flags flags,
cl_uint pipePacketSize,
cl_uint pipeMaxPackets,
const cl_pipe_properties *properties,
cl_int *errcodeRet) {
cl_mem pipe = nullptr;
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("cl_context", context,
"cl_mem_flags", flags,
"cl_uint", pipePacketSize,
"cl_uint", pipeMaxPackets,
"const cl_pipe_properties", properties,
"cl_int", errcodeRet);
auto pPlatform = platform();
auto pDevice = pPlatform->getDevice(0);
Context *pContext = nullptr;
const cl_mem_flags allValidFlags =
CL_MEM_READ_WRITE | CL_MEM_HOST_NO_ACCESS;
do {
if ((pipePacketSize == 0) || (pipeMaxPackets == 0)) {
retVal = CL_INVALID_PIPE_SIZE;
break;
}
/* Are there some invalid flag bits? */
if ((flags & (~allValidFlags)) != 0) {
retVal = CL_INVALID_VALUE;
break;
}
if (properties != nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
retVal = validateObjects(WithCastToInternal(context, &pContext));
if (retVal != CL_SUCCESS) {
break;
}
if (pipePacketSize > pDevice->getDeviceInfo().pipeMaxPacketSize) {
retVal = CL_INVALID_PIPE_SIZE;
break;
}
// create the pipe
pipe = Pipe::create(pContext, flags, pipePacketSize, pipeMaxPackets, properties, retVal);
} while (false);
if (errcodeRet) {
*errcodeRet = retVal;
}
DBG_LOG_INPUTS("pipe", pipe);
return pipe;
}
cl_int CL_API_CALL clGetPipeInfo(cl_mem pipe,
cl_pipe_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
DBG_LOG_INPUTS("cl_mem", pipe,
"cl_pipe_info", paramName,
"size_t", paramValueSize,
"void *", paramValue,
"size_t*", paramValueSizeRet);
retVal = validateObjects(pipe);
if (CL_SUCCESS != retVal) {
return retVal;
}
auto pPipeObj = castToObject<Pipe>(pipe);
if (pPipeObj == nullptr) {
return CL_INVALID_MEM_OBJECT;
}
retVal = pPipeObj->getPipeInfo(paramName, paramValueSize, paramValue, paramValueSizeRet);
return retVal;
}
cl_command_queue CL_API_CALL clCreateCommandQueueWithProperties(cl_context context,
cl_device_id device,
const cl_queue_properties *properties,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_command_queue commandQueue = nullptr;
ErrorCodeHelper err(errcodeRet, CL_SUCCESS);
Context *pContext = nullptr;
Device *pDevice = nullptr;
retVal = validateObjects(
WithCastToInternal(context, &pContext),
WithCastToInternal(device, &pDevice));
if (CL_SUCCESS != retVal) {
err.set(retVal);
return commandQueue;
}
auto minimumCreateDeviceQueueFlags = static_cast<cl_command_queue_properties>(CL_QUEUE_ON_DEVICE |
CL_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE);
auto tokenValue = properties ? *properties : 0;
auto propertiesAddress = properties;
while (tokenValue != 0) {
if (tokenValue != CL_QUEUE_PROPERTIES &&
tokenValue != CL_QUEUE_SIZE &&
tokenValue != CL_QUEUE_PRIORITY_KHR &&
tokenValue != CL_QUEUE_THROTTLE_KHR) {
err.set(CL_INVALID_VALUE);
return commandQueue;
}
propertiesAddress += 2;
tokenValue = *propertiesAddress;
}
auto commandQueueProperties = getCmdQueueProperties<cl_command_queue_properties>(properties);
uint32_t maxOnDeviceQueueSize = pDevice->getDeviceInfo().queueOnDeviceMaxSize;
uint32_t maxOnDeviceQueues = pDevice->getDeviceInfo().maxOnDeviceQueues;
if (commandQueueProperties & static_cast<cl_command_queue_properties>(CL_QUEUE_ON_DEVICE)) {
if (!(commandQueueProperties & static_cast<cl_command_queue_properties>(CL_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE))) {
err.set(CL_INVALID_VALUE);
return commandQueue;
}
}
if (commandQueueProperties & static_cast<cl_command_queue_properties>(CL_QUEUE_ON_DEVICE_DEFAULT)) {
if (!(commandQueueProperties & static_cast<cl_command_queue_properties>(CL_QUEUE_ON_DEVICE))) {
err.set(CL_INVALID_VALUE);
return commandQueue;
}
} else if (commandQueueProperties & static_cast<cl_command_queue_properties>(CL_QUEUE_ON_DEVICE)) {
if ((maxOnDeviceQueues == 0) || ((maxOnDeviceQueues == 1) && pContext->getDefaultDeviceQueue())) {
err.set(CL_OUT_OF_RESOURCES);
return commandQueue;
}
}
if (getCmdQueueProperties<cl_command_queue_properties>(properties, CL_QUEUE_SIZE) > maxOnDeviceQueueSize) {
err.set(CL_INVALID_QUEUE_PROPERTIES);
return commandQueue;
}
if (commandQueueProperties & static_cast<cl_command_queue_properties>(CL_QUEUE_ON_DEVICE)) {
if (getCmdQueueProperties<cl_queue_priority_khr>(properties, CL_QUEUE_PRIORITY_KHR)) {
err.set(CL_INVALID_QUEUE_PROPERTIES);
return commandQueue;
}
}
if (commandQueueProperties & static_cast<cl_command_queue_properties>(CL_QUEUE_ON_DEVICE)) {
if (getCmdQueueProperties<cl_queue_throttle_khr>(properties, CL_QUEUE_THROTTLE_KHR)) {
err.set(CL_INVALID_QUEUE_PROPERTIES);
return commandQueue;
}
}
auto maskedFlags = commandQueueProperties & minimumCreateDeviceQueueFlags;
if (maskedFlags == minimumCreateDeviceQueueFlags) {
commandQueue = DeviceQueue::create(
pContext,
pDevice,
*properties,
retVal);
} else {
commandQueue = CommandQueue::create(
pContext,
pDevice,
properties,
retVal);
if (pContext->isProvidingPerformanceHints()) {
pContext->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_NEUTRAL_INTEL, DRIVER_CALLS_INTERNAL_CL_FLUSH);
if (castToObjectOrAbort<CommandQueue>(commandQueue)->isProfilingEnabled()) {
pContext->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_NEUTRAL_INTEL, PROFILING_ENABLED);
if (pDevice->getDeviceInfo().preemptionSupported && pDevice->getHardwareInfo().pPlatform->eProductFamily < IGFX_SKYLAKE) {
pContext->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_NEUTRAL_INTEL, PROFILING_ENABLED_WITH_DISABLED_PREEMPTION);
}
}
}
}
if (!commandQueue)
retVal = CL_OUT_OF_HOST_MEMORY;
DBG_LOG_INPUTS("commandQueue", commandQueue, "properties", static_cast<int>(getCmdQueueProperties<cl_command_queue_properties>(properties)));
err.set(retVal);
return commandQueue;
}
cl_sampler CL_API_CALL clCreateSamplerWithProperties(cl_context context,
const cl_sampler_properties *samplerProperties,
cl_int *errcodeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
cl_sampler sampler = nullptr;
retVal = validateObjects(context);
if (CL_SUCCESS == retVal) {
sampler = Sampler::create(
castToObject<Context>(context),
samplerProperties,
retVal);
}
if (errcodeRet) {
*errcodeRet = retVal;
}
return sampler;
}
cl_int CL_API_CALL clUnloadCompiler() {
return CL_OUT_OF_HOST_MEMORY;
}
cl_int CL_API_CALL clGetKernelSubGroupInfoKHR(cl_kernel kernel,
cl_device_id device,
cl_kernel_sub_group_info paramName,
size_t inputValueSize,
const void *inputValue,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
Kernel *pKernel = nullptr;
retVal = validateObjects(device,
WithCastToInternal(kernel, &pKernel));
if (CL_SUCCESS != retVal) {
return retVal;
}
switch (paramName) {
case CL_KERNEL_MAX_SUB_GROUP_SIZE_FOR_NDRANGE:
case CL_KERNEL_SUB_GROUP_COUNT_FOR_NDRANGE:
case CL_KERNEL_COMPILE_SUB_GROUP_SIZE_INTEL:
return pKernel->getSubGroupInfo(paramName,
inputValueSize, inputValue,
paramValueSize, paramValue,
paramValueSizeRet);
default:
return CL_INVALID_VALUE;
}
}
cl_int CL_API_CALL clGetDeviceAndHostTimer(cl_device_id device,
cl_ulong *deviceTimestamp,
cl_ulong *hostTimestamp) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
do {
Device *pDevice = castToObject<Device>(device);
if (pDevice == nullptr) {
retVal = CL_INVALID_DEVICE;
break;
}
if (deviceTimestamp == nullptr || hostTimestamp == nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
if (!pDevice->getDeviceAndHostTimer(static_cast<uint64_t *>(deviceTimestamp), static_cast<uint64_t *>(hostTimestamp))) {
retVal = CL_OUT_OF_RESOURCES;
break;
}
} while (false);
return retVal;
}
cl_int CL_API_CALL clGetHostTimer(cl_device_id device,
cl_ulong *hostTimestamp) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
do {
Device *pDevice = castToObject<Device>(device);
if (pDevice == nullptr) {
retVal = CL_INVALID_DEVICE;
break;
}
if (hostTimestamp == nullptr) {
retVal = CL_INVALID_VALUE;
break;
}
if (!pDevice->getHostTimer(static_cast<uint64_t *>(hostTimestamp))) {
retVal = CL_OUT_OF_RESOURCES;
break;
}
} while (false);
return retVal;
}
cl_int CL_API_CALL clGetKernelSubGroupInfo(cl_kernel kernel,
cl_device_id device,
cl_kernel_sub_group_info paramName,
size_t inputValueSize,
const void *inputValue,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
Kernel *pKernel = nullptr;
retVal = validateObjects(device,
WithCastToInternal(kernel, &pKernel));
if (CL_SUCCESS != retVal) {
return retVal;
}
return pKernel->getSubGroupInfo(paramName,
inputValueSize, inputValue,
paramValueSize, paramValue,
paramValueSizeRet);
}
cl_int CL_API_CALL clSetDefaultDeviceCommandQueue(cl_context context,
cl_device_id device,
cl_command_queue commandQueue) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
Context *pContext = nullptr;
retVal = validateObjects(WithCastToInternal(context, &pContext), device);
if (CL_SUCCESS != retVal) {
return retVal;
}
auto pDeviceQueue = castToObject<DeviceQueue>(static_cast<_device_queue *>(commandQueue));
if (!pDeviceQueue) {
return CL_INVALID_COMMAND_QUEUE;
}
if (&pDeviceQueue->getContext() != pContext) {
return CL_INVALID_COMMAND_QUEUE;
}
pContext->setDefaultDeviceQueue(pDeviceQueue);
return CL_SUCCESS;
}
cl_int CL_API_CALL clEnqueueSVMMigrateMem(cl_command_queue commandQueue,
cl_uint numSvmPointers,
const void **svmPointers,
const size_t *sizes,
const cl_mem_migration_flags flags,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
cl_int retVal = CL_SUCCESS;
API_ENTER(&retVal);
CommandQueue *pCommandQueue = nullptr;
retVal = validateObjects(
WithCastToInternal(commandQueue, &pCommandQueue),
EventWaitList(numEventsInWaitList, eventWaitList));
if (CL_SUCCESS != retVal) {
return retVal;
}
if (numSvmPointers == 0 || svmPointers == nullptr)
return CL_INVALID_VALUE;
const cl_mem_migration_flags allValidFlags =
CL_MIGRATE_MEM_OBJECT_HOST | CL_MIGRATE_MEM_OBJECT_CONTENT_UNDEFINED;
if ((flags & (~allValidFlags)) != 0) {
return CL_INVALID_VALUE;
}
for (uint32_t i = 0; i < numSvmPointers; i++) {
SVMAllocsManager *pSvmAllocMgr = pCommandQueue->getContext().getSVMAllocsManager();
GraphicsAllocation *pSvmAlloc = pSvmAllocMgr->getSVMAlloc(svmPointers[i]);
if (pSvmAlloc == nullptr) {
return CL_INVALID_VALUE;
}
if (sizes != nullptr && sizes[i] != 0) {
pSvmAlloc = pSvmAllocMgr->getSVMAlloc(reinterpret_cast<void *>((size_t)svmPointers[i] + sizes[i] - 1));
if (pSvmAlloc == nullptr) {
return CL_INVALID_VALUE;
}
}
}
for (uint32_t i = 0; i < numEventsInWaitList; i++) {
auto pEvent = castToObject<Event>(eventWaitList[i]);
if (pEvent->getContext() != &pCommandQueue->getContext()) {
return CL_INVALID_CONTEXT;
}
}
return pCommandQueue->enqueueSVMMigrateMem(numSvmPointers,
svmPointers,
sizes,
flags,
numEventsInWaitList,
eventWaitList,
event);
}
cl_kernel CL_API_CALL clCloneKernel(cl_kernel sourceKernel,
cl_int *errcodeRet) {
Kernel *pSourceKernel = nullptr;
Kernel *pClonedKernel = nullptr;
auto retVal = validateObjects(WithCastToInternal(sourceKernel, &pSourceKernel));
API_ENTER(&retVal);
if (CL_SUCCESS == retVal) {
pClonedKernel = Kernel::create(pSourceKernel->getProgram(),
pSourceKernel->getKernelInfo(),
&retVal);
UNRECOVERABLE_IF((pClonedKernel == nullptr) || (retVal != CL_SUCCESS));
retVal = pClonedKernel->cloneKernel(pSourceKernel);
}
if (errcodeRet) {
*errcodeRet = retVal;
}
if (pClonedKernel != nullptr) {
gtpinNotifyKernelCreate(pClonedKernel);
}
return pClonedKernel;
}