240 lines
8.7 KiB
C++
240 lines
8.7 KiB
C++
/*
|
|
* Copyright (c) 2017, Intel Corporation
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included
|
|
* in all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
|
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
|
* OTHER DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
#include "unit_tests/command_queue/enqueue_fixture.h"
|
|
#include "unit_tests/fixtures/hello_world_fixture.h"
|
|
#include "unit_tests/fixtures/image_fixture.h"
|
|
#include "unit_tests/mocks/mock_buffer.h"
|
|
|
|
using namespace OCLRT;
|
|
|
|
typedef HelloWorldTest<HelloWorldFixtureFactory> IOQTaskTestsMt;
|
|
|
|
TEST_F(IOQTaskTestsMt, enqueueReadBuffer_blockingAndBlockedOnUserEvent) {
|
|
auto buffer = std::unique_ptr<Buffer>(BufferHelper<>::create());
|
|
|
|
auto alignedReadPtr = alignedMalloc(BufferDefaults::sizeInBytes, MemoryConstants::cacheLineSize);
|
|
ASSERT_NE(nullptr, alignedReadPtr);
|
|
|
|
auto userEvent = clCreateUserEvent(pContext, &retVal);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
auto previousTaskLevel = pCmdQ->taskLevel;
|
|
auto previousTaskCount = pCmdQ->taskCount;
|
|
|
|
std::thread t([=]() {
|
|
Event *ev = castToObject<Event>(userEvent);
|
|
while (ev->peekHasChildEvents() == false) {
|
|
// active wait for VirtualEvent (which is added after queue is blocked)
|
|
}
|
|
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
|
|
ASSERT_EQ(CL_SUCCESS, ret);
|
|
});
|
|
|
|
buffer->forceDisallowCPUCopy = true; // no task level incrasing when cpu copy
|
|
retVal = EnqueueReadBufferHelper<>::enqueueReadBuffer(pCmdQ,
|
|
buffer.get(),
|
|
CL_TRUE,
|
|
0,
|
|
BufferDefaults::sizeInBytes,
|
|
alignedReadPtr,
|
|
1,
|
|
&userEvent,
|
|
nullptr);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
EXPECT_LT(previousTaskCount, pCmdQ->taskCount);
|
|
EXPECT_LT(previousTaskLevel, pCmdQ->taskLevel);
|
|
|
|
t.join();
|
|
|
|
retVal = clReleaseEvent(userEvent);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
alignedFree(alignedReadPtr);
|
|
}
|
|
|
|
TEST_F(IOQTaskTestsMt, enqueueMarker_blockedOnUserEvent) {
|
|
|
|
auto userEvent = clCreateUserEvent(pContext, &retVal);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
std::thread t([=]() {
|
|
Event *ev = castToObject<Event>(userEvent);
|
|
while (ev->peekHasChildEvents() == false) {
|
|
// active wait for VirtualEvent (which is added after queue is blocked)
|
|
}
|
|
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
|
|
ASSERT_EQ(CL_SUCCESS, ret);
|
|
});
|
|
|
|
retVal = pCmdQ->enqueueMarkerWithWaitList(
|
|
1,
|
|
&userEvent,
|
|
nullptr);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
t.join();
|
|
|
|
retVal = clReleaseEvent(userEvent);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
}
|
|
|
|
TEST_F(IOQTaskTestsMt, enqueueMapBuffer) {
|
|
AlignedBuffer alignedBuffer;
|
|
|
|
auto userEvent = clCreateUserEvent(pContext, &retVal);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
cl_event outputEvent = nullptr;
|
|
void *mappedPtr = pCmdQ->enqueueMapBuffer(&alignedBuffer, false, CL_MAP_READ, 0, alignedBuffer.getSize(), 1, &userEvent, &outputEvent, retVal);
|
|
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
const int32_t numThreads = 20;
|
|
|
|
std::thread threads[numThreads];
|
|
std::thread threadUnblocking;
|
|
|
|
cl_event ouputEventsFromThreads[numThreads];
|
|
void *mappedPtrs[numThreads];
|
|
|
|
for (int32_t i = 0; i < numThreads; i++) {
|
|
threads[i] = std::thread([&](int32_t index) {
|
|
cl_int errCode = CL_SUCCESS;
|
|
cl_int success = CL_SUCCESS;
|
|
mappedPtrs[index] = pCmdQ->enqueueMapBuffer(&alignedBuffer, false, CL_MAP_READ, 0, alignedBuffer.getSize(), 0, nullptr, &ouputEventsFromThreads[index], errCode);
|
|
EXPECT_EQ(success, errCode);
|
|
},
|
|
i);
|
|
|
|
if (i == numThreads / 2) {
|
|
threadUnblocking = std::thread([=]() {
|
|
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
|
|
EXPECT_EQ(CL_SUCCESS, ret);
|
|
});
|
|
}
|
|
}
|
|
|
|
cl_int errCode = clWaitForEvents(1, &outputEvent);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
|
|
cl_int eventStatus = 0;
|
|
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
EXPECT_EQ(CL_COMPLETE, eventStatus);
|
|
|
|
for (int32_t i = 0; i < numThreads; i++) {
|
|
threads[i].join();
|
|
cl_int errCode = clWaitForEvents(1, &ouputEventsFromThreads[i]);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
EXPECT_EQ(CL_COMPLETE, eventStatus);
|
|
}
|
|
|
|
threadUnblocking.join();
|
|
retVal = clReleaseEvent(userEvent);
|
|
|
|
for (int32_t i = 0; i < numThreads; i++) {
|
|
pCmdQ->enqueueUnmapMemObject(&alignedBuffer, mappedPtrs[i], 0, nullptr, nullptr);
|
|
retVal = clReleaseEvent(ouputEventsFromThreads[i]);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
}
|
|
|
|
pCmdQ->enqueueUnmapMemObject(&alignedBuffer, mappedPtr, 0, nullptr, nullptr);
|
|
|
|
retVal = clReleaseEvent(outputEvent);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
}
|
|
|
|
TEST_F(IOQTaskTestsMt, enqueueMapImage) {
|
|
auto image = std::unique_ptr<Image>(ImageHelper<Image1dDefaults>::create(context));
|
|
|
|
auto userEvent = clCreateUserEvent(pContext, &retVal);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
cl_event outputEvent = nullptr;
|
|
const size_t origin[] = {0, 0, 0};
|
|
const size_t region[] = {1, 1, 1};
|
|
|
|
void *mappedPtr = pCmdQ->enqueueMapImage(image.get(), false, CL_MAP_READ, origin, region, nullptr, nullptr, 1, &userEvent, &outputEvent, retVal);
|
|
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
|
|
const int32_t numThreads = 20;
|
|
|
|
std::thread threads[numThreads];
|
|
std::thread threadUnblocking;
|
|
|
|
cl_event ouputEventsFromThreads[numThreads];
|
|
void *mappedPtrs[numThreads];
|
|
|
|
for (int32_t i = 0; i < numThreads; i++) {
|
|
threads[i] = std::thread([&](int32_t index) {
|
|
cl_int errCode = CL_SUCCESS;
|
|
cl_int success = CL_SUCCESS;
|
|
mappedPtrs[index] = pCmdQ->enqueueMapImage(image.get(), false, CL_MAP_READ, origin, region, nullptr, nullptr, 0, nullptr, &ouputEventsFromThreads[index], errCode);
|
|
EXPECT_EQ(success, errCode);
|
|
},
|
|
i);
|
|
|
|
if (i == numThreads / 2) {
|
|
threadUnblocking = std::thread([=]() {
|
|
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
|
|
EXPECT_EQ(CL_SUCCESS, ret);
|
|
});
|
|
}
|
|
}
|
|
|
|
cl_int errCode = clWaitForEvents(1, &outputEvent);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
|
|
cl_int eventStatus = 0;
|
|
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
EXPECT_EQ(CL_COMPLETE, eventStatus);
|
|
|
|
for (int32_t i = 0; i < numThreads; i++) {
|
|
threads[i].join();
|
|
cl_int errCode = clWaitForEvents(1, &ouputEventsFromThreads[i]);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
|
|
EXPECT_EQ(CL_SUCCESS, errCode);
|
|
EXPECT_EQ(CL_COMPLETE, eventStatus);
|
|
}
|
|
|
|
threadUnblocking.join();
|
|
retVal = clReleaseEvent(userEvent);
|
|
|
|
for (int32_t i = 0; i < numThreads; i++) {
|
|
pCmdQ->enqueueUnmapMemObject(image.get(), mappedPtrs[i], 0, nullptr, nullptr);
|
|
retVal = clReleaseEvent(ouputEventsFromThreads[i]);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
}
|
|
|
|
pCmdQ->enqueueUnmapMemObject(image.get(), mappedPtr, 0, nullptr, nullptr);
|
|
|
|
retVal = clReleaseEvent(outputEvent);
|
|
EXPECT_EQ(CL_SUCCESS, retVal);
|
|
}
|