compute-runtime/opencl/source/command_queue/enqueue_read_buffer.h


/*
 * Copyright (C) 2018-2021 Intel Corporation
 *
 * SPDX-License-Identifier: MIT
 *
*/
#pragma once
#include "shared/source/built_ins/built_ins.h"
#include "shared/source/command_stream/command_stream_receiver.h"
#include "shared/source/helpers/cache_policy.h"
#include "shared/source/helpers/engine_node_helper.h"
#include "shared/source/memory_manager/unified_memory_manager.h"
#include "shared/source/os_interface/os_context.h"
#include "opencl/source/command_queue/command_queue_hw.h"
#include "opencl/source/command_queue/enqueue_common.h"
#include "opencl/source/helpers/hardware_commands_helper.h"
#include "opencl/source/mem_obj/buffer.h"
#include "opencl/source/memory_manager/mem_obj_surface.h"
#include <new>
namespace NEO {
template <typename GfxFamily>
cl_int CommandQueueHw<GfxFamily>::enqueueReadBuffer(
    Buffer *buffer,
    cl_bool blockingRead,
    size_t offset,
    size_t size,
    void *ptr,
    GraphicsAllocation *mapAllocation,
    cl_uint numEventsInWaitList,
    const cl_event *eventWaitList,
    cl_event *event) {
    const cl_command_type cmdType = CL_COMMAND_READ_BUFFER;
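    // select the command stream receiver (copy engine or GPGPU) that will service this transfer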
    CsrSelectionArgs csrSelectionArgs{cmdType, buffer, {}, device->getRootDeviceIndex(), &size};
    CommandStreamReceiver &csr = selectCsrForBuiltinOperation(csrSelectionArgs);

    if (nullptr == mapAllocation) {
        notifyEnqueueReadBuffer(buffer, !!blockingRead, EngineHelpers::isBcs(csr.getOsContext().getEngineType()));
    }

    auto rootDeviceIndex = getDevice().getRootDeviceIndex();
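    // decide whether any copy is needed at all (zero-copy buffers may already share storage with ptr)
    // and whether the read can be serviced by a plain CPU copy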
    bool isMemTransferNeeded = buffer->isMemObjZeroCopy() ? buffer->checkIfMemoryTransferIsRequired(offset, 0, ptr, cmdType) : true;
    bool isCpuCopyAllowed = bufferCpuCopyAllowed(buffer, cmdType, blockingRead, size, ptr,
                                                 numEventsInWaitList, eventWaitList);

    InternalMemoryType memoryType = InternalMemoryType::NOT_SPECIFIED;
    // check if we are dealing with an SVM pointer for which we already have an allocation
    if (!mapAllocation && this->getContext().getSVMAllocsManager()) {
        auto svmEntry = this->getContext().getSVMAllocsManager()->getSVMAlloc(ptr);
        if (svmEntry) {
            memoryType = svmEntry->memoryType;
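            // reject reads whose destination range extends past the end of the SVM allocation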
            if ((svmEntry->gpuAllocations.getGraphicsAllocation(rootDeviceIndex)->getGpuAddress() + svmEntry->size) < (castToUint64(ptr) + size)) {
                return CL_INVALID_OPERATION;
            }
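            // reuse the SVM allocation for the transfer, preferring its CPU-side allocation when one exists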
            mapAllocation = svmEntry->cpuAllocation ? svmEntry->cpuAllocation : svmEntry->gpuAllocations.getGraphicsAllocation(rootDeviceIndex);
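            // a CPU copy cannot access device-only USM, so force the GPU path in that case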
            if (isCpuCopyAllowed) {
                if (svmEntry->memoryType == DEVICE_UNIFIED_MEMORY) {
                    isCpuCopyAllowed = false;
                }
            }
        }
    }
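    // fast paths: service the read with a CPU copy, or emit only a marker when no transfer is needed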
    if (isCpuCopyAllowed) {
        if (isMemTransferNeeded) {
            return enqueueReadWriteBufferOnCpuWithMemoryTransfer(cmdType, buffer, offset, size, ptr,
                                                                 numEventsInWaitList, eventWaitList, event);
        } else {
            return enqueueReadWriteBufferOnCpuWithoutMemoryTransfer(cmdType, buffer, offset, size, ptr,
                                                                    numEventsInWaitList, eventWaitList, event);
        }
    } else if (!isMemTransferNeeded) {
        return enqueueMarkerForReadWriteOperation(buffer, ptr, cmdType, blockingRead,
                                                  numEventsInWaitList, eventWaitList, event);
    }
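    // buffers larger than the stateful addressing limit need the stateless variant of the copy built-in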
    auto eBuiltInOps = EBuiltInOps::CopyBufferToBuffer;
    if (forceStateless(buffer->getSize())) {
        eBuiltInOps = EBuiltInOps::CopyBufferToBufferStateless;
    }

    void *dstPtr = ptr;
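    // surfaces that must be resident for the copy: the source buffer plus either the map allocation or the host pointer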
    MemObjSurface bufferSurf(buffer);
    HostPtrSurface hostPtrSurf(dstPtr, size);
    GeneralSurface mapSurface;
    Surface *surfaces[] = {&bufferSurf, nullptr};

    if (mapAllocation) {
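        // destination is already backed by a graphics allocation (map allocation or SVM/USM);
        // unless it is device or shared USM (where ptr is already a GPU address), translate the
        // host pointer into that allocation's GPU address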
        surfaces[1] = &mapSurface;
        mapSurface.setGraphicsAllocation(mapAllocation);
        // get offset between the base CPU ptr of the map allocation and dstPtr
        if ((memoryType != DEVICE_UNIFIED_MEMORY) && (memoryType != SHARED_UNIFIED_MEMORY)) {
            size_t dstOffset = ptrDiff(dstPtr, mapAllocation->getUnderlyingBuffer());
            dstPtr = reinterpret_cast<void *>(mapAllocation->getGpuAddress() + dstOffset);
        }
    } else {
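        // plain host pointer: make it GPU-accessible via a host-pointer allocation and target its GPU address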
        surfaces[1] = &hostPtrSurf;
        if (size != 0) {
            bool status = csr.createAllocationForHostSurface(hostPtrSurf, true);
            if (!status) {
                return CL_OUT_OF_RESOURCES;
            }
            dstPtr = reinterpret_cast<void *>(hostPtrSurf.getAllocation()->getGpuAddress());
        }
    }
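    // align the destination down to 4 bytes for the copy built-in and carry the remainder in dstOffset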
    void *alignedDstPtr = alignDown(dstPtr, 4);
    size_t dstPtrOffset = ptrDiff(dstPtr, alignedDstPtr);

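    // describe the copy for the built-in kernel: source buffer at the given offset into the (aligned) destination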
    BuiltinOpParams dc;
    dc.dstPtr = alignedDstPtr;
    dc.dstOffset = {dstPtrOffset, 0, 0};
    dc.srcMemObj = buffer;
    dc.srcOffset = {offset, 0, 0};
    dc.size = {size, 0, 0};
    dc.transferAllocation = mapAllocation ? mapAllocation : hostPtrSurf.getAllocation();

    MultiDispatchInfo dispatchInfo(dc);
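    // emit driver diagnostics hints about this transfer, e.g. when the host pointer does not meet L3 caching alignment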
    if (context->isProvidingPerformanceHints()) {
        context->providePerformanceHintForMemoryTransfer(CL_COMMAND_READ_BUFFER, true, static_cast<cl_mem>(buffer), ptr);
        if (!isL3Capable(ptr, size)) {
            context->providePerformanceHint(CL_CONTEXT_DIAGNOSTICS_LEVEL_BAD_INTEL, CL_ENQUEUE_READ_BUFFER_DOESNT_MEET_ALIGNMENT_RESTRICTIONS, ptr, size, MemoryConstants::pageSize, MemoryConstants::pageSize);
        }
    }
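    // submit the copy through the selected engine (blitter or GPGPU)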
    dispatchBcsOrGpgpuEnqueue<CL_COMMAND_READ_BUFFER>(dispatchInfo, surfaces, eBuiltInOps, numEventsInWaitList, eventWaitList, event, blockingRead, csr);

    return CL_SUCCESS;
}
} // namespace NEO