/* * Copyright (c) 2017, Intel Corporation * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included * in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR * OTHER DEALINGS IN THE SOFTWARE. */ #include "unit_tests/command_queue/enqueue_fixture.h" #include "unit_tests/fixtures/hello_world_fixture.h" #include "unit_tests/fixtures/image_fixture.h" #include "unit_tests/mocks/mock_buffer.h" using namespace OCLRT; typedef HelloWorldTest IOQTaskTestsMt; TEST_F(IOQTaskTestsMt, enqueueReadBuffer_blockingAndBlockedOnUserEvent) { auto buffer = std::unique_ptr(BufferHelper<>::create()); auto alignedReadPtr = alignedMalloc(BufferDefaults::sizeInBytes, MemoryConstants::cacheLineSize); ASSERT_NE(nullptr, alignedReadPtr); auto userEvent = clCreateUserEvent(pContext, &retVal); EXPECT_EQ(CL_SUCCESS, retVal); auto previousTaskLevel = pCmdQ->taskLevel; auto previousTaskCount = pCmdQ->taskCount; std::thread t([=]() { Event *ev = castToObject(userEvent); while (ev->peekHasChildEvents() == false) { // active wait for VirtualEvent (which is added after queue is blocked) } auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE); ASSERT_EQ(CL_SUCCESS, ret); }); buffer->forceDisallowCPUCopy = true; // no task level incrasing when cpu copy retVal = EnqueueReadBufferHelper<>::enqueueReadBuffer(pCmdQ, buffer.get(), CL_TRUE, 0, BufferDefaults::sizeInBytes, alignedReadPtr, 1, &userEvent, nullptr); EXPECT_EQ(CL_SUCCESS, retVal); EXPECT_LT(previousTaskCount, pCmdQ->taskCount); EXPECT_LT(previousTaskLevel, pCmdQ->taskLevel); t.join(); retVal = clReleaseEvent(userEvent); EXPECT_EQ(CL_SUCCESS, retVal); alignedFree(alignedReadPtr); } TEST_F(IOQTaskTestsMt, enqueueMarker_blockedOnUserEvent) { auto userEvent = clCreateUserEvent(pContext, &retVal); EXPECT_EQ(CL_SUCCESS, retVal); std::thread t([=]() { Event *ev = castToObject(userEvent); while (ev->peekHasChildEvents() == false) { // active wait for VirtualEvent (which is added after queue is blocked) } auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE); ASSERT_EQ(CL_SUCCESS, ret); }); retVal = pCmdQ->enqueueMarkerWithWaitList( 1, &userEvent, nullptr); EXPECT_EQ(CL_SUCCESS, retVal); t.join(); retVal = clReleaseEvent(userEvent); EXPECT_EQ(CL_SUCCESS, retVal); } TEST_F(IOQTaskTestsMt, enqueueMapBuffer) { AlignedBuffer alignedBuffer; auto userEvent = clCreateUserEvent(pContext, &retVal); EXPECT_EQ(CL_SUCCESS, retVal); cl_event outputEvent = nullptr; void *mappedPtr = pCmdQ->enqueueMapBuffer(&alignedBuffer, false, CL_MAP_READ, 0, alignedBuffer.getSize(), 1, &userEvent, &outputEvent, retVal); EXPECT_EQ(CL_SUCCESS, retVal); const int32_t numThreads = 20; std::thread threads[numThreads]; std::thread threadUnblocking; cl_event ouputEventsFromThreads[numThreads]; void *mappedPtrs[numThreads]; for (int32_t i = 0; i < numThreads; i++) { threads[i] = std::thread([&](int32_t index) { cl_int errCode = CL_SUCCESS; cl_int success = CL_SUCCESS; mappedPtrs[index] = pCmdQ->enqueueMapBuffer(&alignedBuffer, false, CL_MAP_READ, 0, alignedBuffer.getSize(), 0, nullptr, &ouputEventsFromThreads[index], errCode); EXPECT_EQ(success, errCode); }, i); if (i == numThreads / 2) { threadUnblocking = std::thread([=]() { auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE); EXPECT_EQ(CL_SUCCESS, ret); }); } } cl_int errCode = clWaitForEvents(1, &outputEvent); EXPECT_EQ(CL_SUCCESS, errCode); cl_int eventStatus = 0; errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr); EXPECT_EQ(CL_SUCCESS, errCode); EXPECT_EQ(CL_COMPLETE, eventStatus); for (int32_t i = 0; i < numThreads; i++) { threads[i].join(); cl_int errCode = clWaitForEvents(1, &ouputEventsFromThreads[i]); EXPECT_EQ(CL_SUCCESS, errCode); errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr); EXPECT_EQ(CL_SUCCESS, errCode); EXPECT_EQ(CL_COMPLETE, eventStatus); } threadUnblocking.join(); retVal = clReleaseEvent(userEvent); for (int32_t i = 0; i < numThreads; i++) { pCmdQ->enqueueUnmapMemObject(&alignedBuffer, mappedPtrs[i], 0, nullptr, nullptr); retVal = clReleaseEvent(ouputEventsFromThreads[i]); EXPECT_EQ(CL_SUCCESS, retVal); } pCmdQ->enqueueUnmapMemObject(&alignedBuffer, mappedPtr, 0, nullptr, nullptr); retVal = clReleaseEvent(outputEvent); EXPECT_EQ(CL_SUCCESS, retVal); } TEST_F(IOQTaskTestsMt, enqueueMapImage) { auto image = std::unique_ptr(ImageHelper::create(context)); auto userEvent = clCreateUserEvent(pContext, &retVal); EXPECT_EQ(CL_SUCCESS, retVal); cl_event outputEvent = nullptr; const size_t origin[] = {0, 0, 0}; const size_t region[] = {1, 1, 1}; void *mappedPtr = pCmdQ->enqueueMapImage(image.get(), false, CL_MAP_READ, origin, region, nullptr, nullptr, 1, &userEvent, &outputEvent, retVal); EXPECT_EQ(CL_SUCCESS, retVal); const int32_t numThreads = 20; std::thread threads[numThreads]; std::thread threadUnblocking; cl_event ouputEventsFromThreads[numThreads]; void *mappedPtrs[numThreads]; for (int32_t i = 0; i < numThreads; i++) { threads[i] = std::thread([&](int32_t index) { cl_int errCode = CL_SUCCESS; cl_int success = CL_SUCCESS; mappedPtrs[index] = pCmdQ->enqueueMapImage(image.get(), false, CL_MAP_READ, origin, region, nullptr, nullptr, 0, nullptr, &ouputEventsFromThreads[index], errCode); EXPECT_EQ(success, errCode); }, i); if (i == numThreads / 2) { threadUnblocking = std::thread([=]() { auto ret = clSetUserEventStatus(userEvent, CL_COMPLETE); EXPECT_EQ(CL_SUCCESS, ret); }); } } cl_int errCode = clWaitForEvents(1, &outputEvent); EXPECT_EQ(CL_SUCCESS, errCode); cl_int eventStatus = 0; errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr); EXPECT_EQ(CL_SUCCESS, errCode); EXPECT_EQ(CL_COMPLETE, eventStatus); for (int32_t i = 0; i < numThreads; i++) { threads[i].join(); cl_int errCode = clWaitForEvents(1, &ouputEventsFromThreads[i]); EXPECT_EQ(CL_SUCCESS, errCode); errCode = clGetEventInfo(outputEvent, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, nullptr); EXPECT_EQ(CL_SUCCESS, errCode); EXPECT_EQ(CL_COMPLETE, eventStatus); } threadUnblocking.join(); retVal = clReleaseEvent(userEvent); for (int32_t i = 0; i < numThreads; i++) { pCmdQ->enqueueUnmapMemObject(image.get(), mappedPtrs[i], 0, nullptr, nullptr); retVal = clReleaseEvent(ouputEventsFromThreads[i]); EXPECT_EQ(CL_SUCCESS, retVal); } pCmdQ->enqueueUnmapMemObject(image.get(), mappedPtr, 0, nullptr, nullptr); retVal = clReleaseEvent(outputEvent); EXPECT_EQ(CL_SUCCESS, retVal); }