compute-runtime/unit_tests/command_queue/ioq_task_tests_mt.cpp

240 lines
8.7 KiB
C++

/*
* Copyright (c) 2017, Intel Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included
* in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE.
*/
#include "unit_tests/command_queue/enqueue_fixture.h"
#include "unit_tests/fixtures/hello_world_fixture.h"
#include "unit_tests/fixtures/image_fixture.h"
#include "unit_tests/mocks/mock_buffer.h"
using namespace OCLRT;
typedef HelloWorldTest<HelloWorldFixtureFactory> IOQTaskTestsMt;
TEST_F(IOQTaskTestsMt, enqueueReadBuffer_blockingAndBlockedOnUserEvent) {
auto buffer = std::unique_ptr<Buffer>(BufferHelper<>::create());
auto alignedReadPtr = alignedMalloc(BufferDefaults::sizeInBytes, MemoryConstants::cacheLineSize);
ASSERT_NE(nullptr, alignedReadPtr);
auto userEvent = clCreateUserEvent(pContext, &retVal);
EXPECT_EQ(CL_SUCCESS, retVal);
auto previousTaskLevel = pCmdQ->taskLevel;
auto previousTaskCount = pCmdQ->taskCount;
std::thread t([=]() {
Event *ev = castToObject<Event>(userEvent);
while (ev->peekHasChildEvents() == false) {
// active wait for VirtualEvent (which is added after queue is blocked)
}
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
ASSERT_EQ(CL_SUCCESS, ret);
});
buffer->forceDisallowCPUCopy = true; // no task level incrasing when cpu copy
retVal = EnqueueReadBufferHelper<>::enqueueReadBuffer(pCmdQ,
buffer.get(),
CL_TRUE,
0,
BufferDefaults::sizeInBytes,
alignedReadPtr,
1,
&userEvent,
nullptr);
EXPECT_EQ(CL_SUCCESS, retVal);
EXPECT_LT(previousTaskCount, pCmdQ->taskCount);
EXPECT_LT(previousTaskLevel, pCmdQ->taskLevel);
t.join();
retVal = clReleaseEvent(userEvent);
EXPECT_EQ(CL_SUCCESS, retVal);
alignedFree(alignedReadPtr);
}
TEST_F(IOQTaskTestsMt, enqueueMarker_blockedOnUserEvent) {
auto userEvent = clCreateUserEvent(pContext, &retVal);
EXPECT_EQ(CL_SUCCESS, retVal);
std::thread t([=]() {
Event *ev = castToObject<Event>(userEvent);
while (ev->peekHasChildEvents() == false) {
// active wait for VirtualEvent (which is added after queue is blocked)
}
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
ASSERT_EQ(CL_SUCCESS, ret);
});
retVal = pCmdQ->enqueueMarkerWithWaitList(
1,
&userEvent,
nullptr);
EXPECT_EQ(CL_SUCCESS, retVal);
t.join();
retVal = clReleaseEvent(userEvent);
EXPECT_EQ(CL_SUCCESS, retVal);
}
TEST_F(IOQTaskTestsMt, enqueueMapBuffer) {
AlignedBuffer alignedBuffer;
auto userEvent = clCreateUserEvent(pContext, &retVal);
EXPECT_EQ(CL_SUCCESS, retVal);
cl_event outputEvent = nullptr;
void *mappedPtr = pCmdQ->enqueueMapBuffer(&alignedBuffer, false, CL_MAP_READ, 0, alignedBuffer.getSize(), 1, &userEvent, &outputEvent, retVal);
EXPECT_EQ(CL_SUCCESS, retVal);
const int32_t numThreads = 20;
std::thread threads[numThreads];
std::thread threadUnblocking;
cl_event ouputEventsFromThreads[numThreads];
void *mappedPtrs[numThreads];
for (int32_t i = 0; i < numThreads; i++) {
threads[i] = std::thread([&](int32_t index) {
cl_int errCode = CL_SUCCESS;
cl_int success = CL_SUCCESS;
mappedPtrs[index] = pCmdQ->enqueueMapBuffer(&alignedBuffer, false, CL_MAP_READ, 0, alignedBuffer.getSize(), 0, nullptr, &ouputEventsFromThreads[index], errCode);
EXPECT_EQ(success, errCode);
},
i);
if (i == numThreads / 2) {
threadUnblocking = std::thread([=]() {
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
EXPECT_EQ(CL_SUCCESS, ret);
});
}
}
cl_int errCode = clWaitForEvents(1, &outputEvent);
EXPECT_EQ(CL_SUCCESS, errCode);
cl_int eventStatus = 0;
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
EXPECT_EQ(CL_SUCCESS, errCode);
EXPECT_EQ(CL_COMPLETE, eventStatus);
for (int32_t i = 0; i < numThreads; i++) {
threads[i].join();
cl_int errCode = clWaitForEvents(1, &ouputEventsFromThreads[i]);
EXPECT_EQ(CL_SUCCESS, errCode);
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
EXPECT_EQ(CL_SUCCESS, errCode);
EXPECT_EQ(CL_COMPLETE, eventStatus);
}
threadUnblocking.join();
retVal = clReleaseEvent(userEvent);
for (int32_t i = 0; i < numThreads; i++) {
pCmdQ->enqueueUnmapMemObject(&alignedBuffer, mappedPtrs[i], 0, nullptr, nullptr);
retVal = clReleaseEvent(ouputEventsFromThreads[i]);
EXPECT_EQ(CL_SUCCESS, retVal);
}
pCmdQ->enqueueUnmapMemObject(&alignedBuffer, mappedPtr, 0, nullptr, nullptr);
retVal = clReleaseEvent(outputEvent);
EXPECT_EQ(CL_SUCCESS, retVal);
}
TEST_F(IOQTaskTestsMt, enqueueMapImage) {
auto image = std::unique_ptr<Image>(ImageHelper<Image1dDefaults>::create(context));
auto userEvent = clCreateUserEvent(pContext, &retVal);
EXPECT_EQ(CL_SUCCESS, retVal);
cl_event outputEvent = nullptr;
const size_t origin[] = {0, 0, 0};
const size_t region[] = {1, 1, 1};
void *mappedPtr = pCmdQ->enqueueMapImage(image.get(), false, CL_MAP_READ, origin, region, nullptr, nullptr, 1, &userEvent, &outputEvent, retVal);
EXPECT_EQ(CL_SUCCESS, retVal);
const int32_t numThreads = 20;
std::thread threads[numThreads];
std::thread threadUnblocking;
cl_event ouputEventsFromThreads[numThreads];
void *mappedPtrs[numThreads];
for (int32_t i = 0; i < numThreads; i++) {
threads[i] = std::thread([&](int32_t index) {
cl_int errCode = CL_SUCCESS;
cl_int success = CL_SUCCESS;
mappedPtrs[index] = pCmdQ->enqueueMapImage(image.get(), false, CL_MAP_READ, origin, region, nullptr, nullptr, 0, nullptr, &ouputEventsFromThreads[index], errCode);
EXPECT_EQ(success, errCode);
},
i);
if (i == numThreads / 2) {
threadUnblocking = std::thread([=]() {
auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE);
EXPECT_EQ(CL_SUCCESS, ret);
});
}
}
cl_int errCode = clWaitForEvents(1, &outputEvent);
EXPECT_EQ(CL_SUCCESS, errCode);
cl_int eventStatus = 0;
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
EXPECT_EQ(CL_SUCCESS, errCode);
EXPECT_EQ(CL_COMPLETE, eventStatus);
for (int32_t i = 0; i < numThreads; i++) {
threads[i].join();
cl_int errCode = clWaitForEvents(1, &ouputEventsFromThreads[i]);
EXPECT_EQ(CL_SUCCESS, errCode);
errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr);
EXPECT_EQ(CL_SUCCESS, errCode);
EXPECT_EQ(CL_COMPLETE, eventStatus);
}
threadUnblocking.join();
retVal = clReleaseEvent(userEvent);
for (int32_t i = 0; i < numThreads; i++) {
pCmdQ->enqueueUnmapMemObject(image.get(), mappedPtrs[i], 0, nullptr, nullptr);
retVal = clReleaseEvent(ouputEventsFromThreads[i]);
EXPECT_EQ(CL_SUCCESS, retVal);
}
pCmdQ->enqueueUnmapMemObject(image.get(), mappedPtr, 0, nullptr, nullptr);
retVal = clReleaseEvent(outputEvent);
EXPECT_EQ(CL_SUCCESS, retVal);
}