2018-08-24 14:48:59 +08:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2018, Intel Corporation
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
|
|
* to deal in the Software without restriction, including without limitation
|
|
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice shall be included
|
|
|
|
* in all copies or substantial portions of the Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
|
|
|
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
|
|
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
|
|
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
|
|
|
* OTHER DEALINGS IN THE SOFTWARE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "runtime/command_queue/gpgpu_walker.h"
|
|
|
|
#include "runtime/helpers/options.h"
|
|
|
|
#include "runtime/helpers/timestamp_packet.h"
|
2018-08-28 20:11:25 +08:00
|
|
|
#include "runtime/utilities/tag_allocator.h"
|
2018-08-24 14:48:59 +08:00
|
|
|
#include "unit_tests/helpers/hw_parse.h"
|
|
|
|
#include "unit_tests/mocks/mock_context.h"
|
|
|
|
#include "unit_tests/mocks/mock_device.h"
|
|
|
|
#include "unit_tests/mocks/mock_command_queue.h"
|
|
|
|
#include "unit_tests/mocks/mock_kernel.h"
|
|
|
|
#include "unit_tests/mocks/mock_mdi.h"
|
2018-08-28 20:11:25 +08:00
|
|
|
#include "unit_tests/mocks/mock_memory_manager.h"
|
2018-08-24 14:48:59 +08:00
|
|
|
|
|
|
|
#include "test.h"
|
|
|
|
|
|
|
|
using namespace OCLRT;
|
|
|
|
|
2018-08-28 20:11:25 +08:00
|
|
|
struct TimestampPacketTests : public ::testing::Test {
|
|
|
|
class MockTimestampPacket : public TimestampPacket {
|
|
|
|
public:
|
|
|
|
using TimestampPacket::data;
|
|
|
|
};
|
|
|
|
|
2018-08-30 19:37:39 +08:00
|
|
|
template <typename TagType = TimestampPacket>
|
|
|
|
class MockTagAllocator : public TagAllocator<TagType> {
|
2018-08-28 20:11:25 +08:00
|
|
|
public:
|
2018-08-30 19:37:39 +08:00
|
|
|
using BaseClass = TagAllocator<TagType>;
|
2018-09-10 20:24:11 +08:00
|
|
|
using BaseClass::freeTags;
|
2018-08-30 19:37:39 +08:00
|
|
|
using BaseClass::usedTags;
|
|
|
|
using NodeType = typename BaseClass::NodeType;
|
|
|
|
|
|
|
|
MockTagAllocator(MemoryManager *memoryManager, size_t tagCount = 10) : BaseClass(memoryManager, tagCount, 10) {}
|
2018-08-24 14:48:59 +08:00
|
|
|
|
2018-08-28 20:11:25 +08:00
|
|
|
void returnTag(NodeType *node) override {
|
|
|
|
releaseReferenceNodes.push_back(node);
|
2018-08-30 19:37:39 +08:00
|
|
|
BaseClass::returnTag(node);
|
2018-08-28 20:11:25 +08:00
|
|
|
}
|
|
|
|
|
2018-09-04 15:05:55 +08:00
|
|
|
void returnTagToFreePool(NodeType *node) override {
|
|
|
|
returnedToFreePoolNodes.push_back(node);
|
|
|
|
BaseClass::returnTagToFreePool(node);
|
2018-08-28 20:11:25 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<NodeType *> releaseReferenceNodes;
|
2018-09-04 15:05:55 +08:00
|
|
|
std::vector<NodeType *> returnedToFreePoolNodes;
|
2018-08-28 20:11:25 +08:00
|
|
|
};
|
|
|
|
};
|
2018-08-24 14:48:59 +08:00
|
|
|
|
2018-09-04 15:05:55 +08:00
|
|
|
TEST_F(TimestampPacketTests, whenEndTagIsNotOneThenCanBeReleased) {
|
|
|
|
MockTimestampPacket timestampPacket;
|
|
|
|
auto contextEndIndex = static_cast<uint32_t>(TimestampPacket::DataIndex::ContextEnd);
|
|
|
|
auto globalEndIndex = static_cast<uint32_t>(TimestampPacket::DataIndex::GlobalEnd);
|
|
|
|
|
|
|
|
timestampPacket.data[contextEndIndex] = 1;
|
|
|
|
timestampPacket.data[globalEndIndex] = 1;
|
|
|
|
EXPECT_FALSE(timestampPacket.canBeReleased());
|
|
|
|
|
|
|
|
timestampPacket.data[contextEndIndex] = 1;
|
|
|
|
timestampPacket.data[globalEndIndex] = 0;
|
|
|
|
EXPECT_FALSE(timestampPacket.canBeReleased());
|
|
|
|
|
|
|
|
timestampPacket.data[contextEndIndex] = 0;
|
|
|
|
timestampPacket.data[globalEndIndex] = 1;
|
|
|
|
EXPECT_FALSE(timestampPacket.canBeReleased());
|
|
|
|
|
|
|
|
timestampPacket.data[contextEndIndex] = 0;
|
|
|
|
timestampPacket.data[globalEndIndex] = 0;
|
|
|
|
EXPECT_TRUE(timestampPacket.canBeReleased());
|
|
|
|
}
|
|
|
|
|
2018-08-30 19:37:39 +08:00
|
|
|
TEST_F(TimestampPacketTests, whenNewTagIsTakenThenReinitialize) {
|
|
|
|
MockMemoryManager memoryManager;
|
|
|
|
MockTagAllocator<MockTimestampPacket> allocator(&memoryManager, 1);
|
|
|
|
|
|
|
|
auto firstNode = allocator.getTag();
|
2018-09-03 15:34:57 +08:00
|
|
|
firstNode->tag->data = {{5, 6, 7, 8, 9}};
|
2018-08-30 19:37:39 +08:00
|
|
|
|
|
|
|
allocator.returnTag(firstNode);
|
|
|
|
|
|
|
|
auto secondNode = allocator.getTag();
|
|
|
|
EXPECT_EQ(secondNode, firstNode);
|
|
|
|
|
|
|
|
for (uint32_t i = 0; i < static_cast<uint32_t>(TimestampPacket::DataIndex::Max); i++) {
|
|
|
|
EXPECT_EQ(1u, secondNode->tag->data[i]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-08-24 14:48:59 +08:00
|
|
|
TEST_F(TimestampPacketTests, whenObjectIsCreatedThenInitializeAllStamps) {
|
|
|
|
MockTimestampPacket timestampPacket;
|
|
|
|
auto maxElements = static_cast<uint32_t>(TimestampPacket::DataIndex::Max);
|
2018-09-03 15:34:57 +08:00
|
|
|
EXPECT_EQ(5u, maxElements);
|
2018-08-24 14:48:59 +08:00
|
|
|
|
|
|
|
EXPECT_EQ(maxElements, timestampPacket.data.size());
|
|
|
|
|
|
|
|
for (uint32_t i = 0; i < maxElements; i++) {
|
|
|
|
EXPECT_EQ(1u, timestampPacket.data[i]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_F(TimestampPacketTests, whenAskedForStampAddressThenReturnWithValidOffset) {
|
|
|
|
MockTimestampPacket timestampPacket;
|
|
|
|
|
2018-09-03 15:34:57 +08:00
|
|
|
for (size_t i = 0; i < static_cast<uint32_t>(TimestampPacket::DataIndex::Max); i++) {
|
|
|
|
auto address = timestampPacket.pickAddressForDataWrite(static_cast<TimestampPacket::DataIndex>(i));
|
|
|
|
EXPECT_EQ(address, reinterpret_cast<uint64_t>(×tampPacket.data[i]));
|
|
|
|
}
|
2018-08-24 14:48:59 +08:00
|
|
|
}
|
|
|
|
|
2018-09-06 16:01:51 +08:00
|
|
|
HWCMDTEST_F(IGFX_GEN8_CORE, TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEstimatingStreamSizeThenAddTwoPipeControls) {
|
2018-08-24 14:48:59 +08:00
|
|
|
auto device = std::unique_ptr<MockDevice>(MockDevice::createWithNewExecutionEnvironment<MockDevice>(platformDevices[0]));
|
|
|
|
MockCommandQueue cmdQ(nullptr, device.get(), nullptr);
|
|
|
|
MockKernelWithInternals kernel1(*device);
|
|
|
|
MockKernelWithInternals kernel2(*device);
|
|
|
|
MockMultiDispatchInfo multiDispatchInfo(std::vector<Kernel *>({kernel1.mockKernel, kernel2.mockKernel}));
|
|
|
|
|
2018-09-06 15:03:07 +08:00
|
|
|
device->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = false;
|
2018-09-07 15:09:24 +08:00
|
|
|
getCommandStream<FamilyType, CL_COMMAND_NDRANGE_KERNEL>(cmdQ, 0, false, false, multiDispatchInfo);
|
2018-08-24 14:48:59 +08:00
|
|
|
auto sizeWithDisabled = cmdQ.requestedCmdStreamSize;
|
|
|
|
|
2018-09-06 15:03:07 +08:00
|
|
|
device->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = true;
|
2018-09-07 15:09:24 +08:00
|
|
|
getCommandStream<FamilyType, CL_COMMAND_NDRANGE_KERNEL>(cmdQ, 0, false, false, multiDispatchInfo);
|
2018-08-24 14:48:59 +08:00
|
|
|
auto sizeWithEnabled = cmdQ.requestedCmdStreamSize;
|
|
|
|
|
2018-09-03 15:34:57 +08:00
|
|
|
EXPECT_EQ(sizeWithEnabled, sizeWithDisabled + (2 * sizeof(typename FamilyType::PIPE_CONTROL)));
|
2018-08-24 14:48:59 +08:00
|
|
|
}
|
|
|
|
|
2018-09-07 15:09:24 +08:00
|
|
|
HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEstimatingStreamSizeWithWaitlistThenAddSizeForSemaphores) {
|
|
|
|
auto device = std::unique_ptr<MockDevice>(MockDevice::createWithNewExecutionEnvironment<MockDevice>(platformDevices[0]));
|
|
|
|
MockCommandQueue cmdQ(nullptr, device.get(), nullptr);
|
|
|
|
MockKernelWithInternals kernel1(*device);
|
|
|
|
MockKernelWithInternals kernel2(*device);
|
|
|
|
MockMultiDispatchInfo multiDispatchInfo(std::vector<Kernel *>({kernel1.mockKernel, kernel2.mockKernel}));
|
|
|
|
|
|
|
|
cl_uint numEventsOnWaitlist = 5;
|
|
|
|
|
|
|
|
device->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = false;
|
|
|
|
getCommandStream<FamilyType, CL_COMMAND_NDRANGE_KERNEL>(cmdQ, numEventsOnWaitlist, false, false, multiDispatchInfo);
|
|
|
|
auto sizeWithDisabled = cmdQ.requestedCmdStreamSize;
|
|
|
|
|
|
|
|
device->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = true;
|
|
|
|
getCommandStream<FamilyType, CL_COMMAND_NDRANGE_KERNEL>(cmdQ, numEventsOnWaitlist, false, false, multiDispatchInfo);
|
|
|
|
auto sizeWithEnabled = cmdQ.requestedCmdStreamSize;
|
|
|
|
|
2018-09-10 15:54:04 +08:00
|
|
|
size_t extendedSize = sizeWithDisabled + EnqueueOperation<FamilyType>::getSizeRequiredForTimestampPacketWrite() +
|
2018-09-07 15:09:24 +08:00
|
|
|
(numEventsOnWaitlist * sizeof(typename FamilyType::MI_SEMAPHORE_WAIT));
|
|
|
|
|
|
|
|
EXPECT_EQ(sizeWithEnabled, extendedSize);
|
|
|
|
}
|
|
|
|
|
2018-08-28 20:11:25 +08:00
|
|
|
HWCMDTEST_F(IGFX_GEN8_CORE, TimestampPacketTests, givenTimestampPacketWhenDispatchingGpuWalkerThenAddTwoPcForLastWalker) {
|
2018-08-24 14:48:59 +08:00
|
|
|
using GPGPU_WALKER = typename FamilyType::GPGPU_WALKER;
|
|
|
|
using PIPE_CONTROL = typename FamilyType::PIPE_CONTROL;
|
|
|
|
MockTimestampPacket timestampPacket;
|
|
|
|
|
|
|
|
auto device = std::unique_ptr<MockDevice>(MockDevice::createWithNewExecutionEnvironment<MockDevice>(platformDevices[0]));
|
|
|
|
MockKernelWithInternals kernel1(*device);
|
|
|
|
MockKernelWithInternals kernel2(*device);
|
|
|
|
|
|
|
|
MockMultiDispatchInfo multiDispatchInfo(std::vector<Kernel *>({kernel1.mockKernel, kernel2.mockKernel}));
|
|
|
|
|
|
|
|
MockCommandQueue cmdQ(nullptr, device.get(), nullptr);
|
|
|
|
auto &cmdStream = cmdQ.getCS(0);
|
|
|
|
|
|
|
|
GpgpuWalkerHelper<FamilyType>::dispatchWalker(
|
|
|
|
cmdQ,
|
|
|
|
multiDispatchInfo,
|
|
|
|
0,
|
|
|
|
nullptr,
|
|
|
|
nullptr,
|
|
|
|
nullptr,
|
|
|
|
nullptr,
|
|
|
|
×tampPacket,
|
|
|
|
device->getPreemptionMode(),
|
|
|
|
false);
|
|
|
|
|
|
|
|
HardwareParse hwParser;
|
|
|
|
hwParser.parseCommands<FamilyType>(cmdStream, 0);
|
|
|
|
|
|
|
|
auto verifyPipeControl = [](PIPE_CONTROL *pipeControl, uint64_t expectedAddress) {
|
|
|
|
EXPECT_EQ(1u, pipeControl->getCommandStreamerStallEnable());
|
|
|
|
EXPECT_EQ(PIPE_CONTROL::POST_SYNC_OPERATION_WRITE_IMMEDIATE_DATA, pipeControl->getPostSyncOperation());
|
|
|
|
EXPECT_EQ(0u, pipeControl->getImmediateData());
|
|
|
|
EXPECT_EQ(static_cast<uint32_t>(expectedAddress & 0x0000FFFFFFFFULL), pipeControl->getAddress());
|
|
|
|
EXPECT_EQ(static_cast<uint32_t>(expectedAddress >> 32), pipeControl->getAddressHigh());
|
|
|
|
};
|
|
|
|
|
|
|
|
uint32_t walkersFound = 0;
|
|
|
|
for (auto it = hwParser.cmdList.begin(); it != hwParser.cmdList.end(); it++) {
|
|
|
|
if (genCmdCast<GPGPU_WALKER *>(*it)) {
|
|
|
|
walkersFound++;
|
|
|
|
if (walkersFound == 1) {
|
|
|
|
EXPECT_EQ(nullptr, genCmdCast<PIPE_CONTROL *>(*--it));
|
|
|
|
it++;
|
|
|
|
EXPECT_EQ(nullptr, genCmdCast<PIPE_CONTROL *>(*++it));
|
|
|
|
it--;
|
|
|
|
} else if (walkersFound == 2) {
|
|
|
|
auto pipeControl = genCmdCast<PIPE_CONTROL *>(*--it);
|
|
|
|
EXPECT_NE(nullptr, pipeControl);
|
2018-09-03 15:34:57 +08:00
|
|
|
verifyPipeControl(pipeControl, timestampPacket.pickAddressForDataWrite(TimestampPacket::DataIndex::Submit));
|
2018-08-24 14:48:59 +08:00
|
|
|
it++;
|
|
|
|
pipeControl = genCmdCast<PIPE_CONTROL *>(*++it);
|
|
|
|
EXPECT_NE(nullptr, pipeControl);
|
2018-09-03 15:34:57 +08:00
|
|
|
verifyPipeControl(pipeControl, timestampPacket.pickAddressForDataWrite(TimestampPacket::DataIndex::ContextEnd));
|
2018-08-24 14:48:59 +08:00
|
|
|
it--;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
EXPECT_EQ(2u, walkersFound);
|
|
|
|
}
|
2018-08-28 20:11:25 +08:00
|
|
|
|
2018-09-06 15:03:07 +08:00
|
|
|
HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEnqueueingThenObtainNewStampAndPassToEvent) {
|
2018-08-28 20:11:25 +08:00
|
|
|
|
|
|
|
auto device = std::unique_ptr<MockDevice>(MockDevice::createWithNewExecutionEnvironment<MockDevice>(platformDevices[0]));
|
|
|
|
auto mockMemoryManager = new MockMemoryManager();
|
|
|
|
device->injectMemoryManager(mockMemoryManager);
|
2018-08-30 19:37:39 +08:00
|
|
|
auto mockTagAllocator = new MockTagAllocator<>(mockMemoryManager);
|
2018-08-28 20:11:25 +08:00
|
|
|
mockMemoryManager->timestampPacketAllocator.reset(mockTagAllocator);
|
|
|
|
MockContext context(device.get());
|
|
|
|
auto cmdQ = std::make_unique<MockCommandQueueHw<FamilyType>>(&context, device.get(), nullptr);
|
|
|
|
MockKernelWithInternals kernel(*device, &context);
|
|
|
|
|
2018-09-06 15:03:07 +08:00
|
|
|
device->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = false;
|
|
|
|
|
2018-08-28 20:11:25 +08:00
|
|
|
size_t gws[] = {1, 1, 1};
|
|
|
|
|
|
|
|
cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr);
|
|
|
|
EXPECT_EQ(nullptr, cmdQ->timestampPacketNode);
|
|
|
|
EXPECT_EQ(nullptr, mockTagAllocator->usedTags.peekHead());
|
|
|
|
|
2018-09-06 15:03:07 +08:00
|
|
|
device->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = true;
|
2018-08-28 20:11:25 +08:00
|
|
|
cl_event event1, event2;
|
|
|
|
|
|
|
|
// obtain first node for cmdQ and event1
|
|
|
|
cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, &event1);
|
|
|
|
auto node1 = cmdQ->timestampPacketNode;
|
|
|
|
EXPECT_NE(nullptr, node1);
|
|
|
|
EXPECT_EQ(node1, cmdQ->timestampPacketNode);
|
|
|
|
|
|
|
|
// obtain new node for cmdQ and event2
|
|
|
|
cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, &event2);
|
|
|
|
auto node2 = cmdQ->timestampPacketNode;
|
|
|
|
EXPECT_NE(nullptr, node2);
|
|
|
|
EXPECT_EQ(node2, cmdQ->timestampPacketNode);
|
2018-09-04 15:05:55 +08:00
|
|
|
EXPECT_EQ(0u, mockTagAllocator->returnedToFreePoolNodes.size()); // nothing returned. event1 owns previous node
|
|
|
|
EXPECT_EQ(1u, mockTagAllocator->releaseReferenceNodes.size()); // cmdQ released first node
|
2018-08-28 20:11:25 +08:00
|
|
|
EXPECT_EQ(node1, mockTagAllocator->releaseReferenceNodes.at(0));
|
|
|
|
|
|
|
|
EXPECT_NE(node1, node2);
|
2018-09-04 15:05:55 +08:00
|
|
|
size_t dataSize = sizeof(uint32_t) * static_cast<size_t>(TimestampPacket::DataIndex::Max);
|
|
|
|
// mark nodes as ready
|
2018-09-03 15:34:57 +08:00
|
|
|
memset(reinterpret_cast<void *>(node1->tag->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextStart)), 0, dataSize);
|
|
|
|
memset(reinterpret_cast<void *>(node2->tag->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextStart)), 0, dataSize);
|
2018-08-28 20:11:25 +08:00
|
|
|
|
|
|
|
clReleaseEvent(event2);
|
2018-09-04 15:05:55 +08:00
|
|
|
EXPECT_EQ(0u, mockTagAllocator->returnedToFreePoolNodes.size()); // nothing returned. cmdQ owns node2
|
|
|
|
EXPECT_EQ(2u, mockTagAllocator->releaseReferenceNodes.size()); // event2 released node2
|
2018-08-28 20:11:25 +08:00
|
|
|
EXPECT_EQ(node2, mockTagAllocator->releaseReferenceNodes.at(1));
|
|
|
|
|
|
|
|
clReleaseEvent(event1);
|
2018-09-04 15:05:55 +08:00
|
|
|
EXPECT_EQ(1u, mockTagAllocator->returnedToFreePoolNodes.size()); // removed last reference on node1
|
|
|
|
EXPECT_EQ(node1, mockTagAllocator->returnedToFreePoolNodes.at(0));
|
2018-08-28 20:11:25 +08:00
|
|
|
EXPECT_EQ(3u, mockTagAllocator->releaseReferenceNodes.size()); // event1 released node1
|
|
|
|
EXPECT_EQ(node1, mockTagAllocator->releaseReferenceNodes.at(2));
|
|
|
|
|
|
|
|
cmdQ.reset(nullptr);
|
2018-09-04 15:05:55 +08:00
|
|
|
EXPECT_EQ(2u, mockTagAllocator->returnedToFreePoolNodes.size()); // removed last reference on node2
|
|
|
|
EXPECT_EQ(node2, mockTagAllocator->returnedToFreePoolNodes.at(1));
|
2018-08-28 20:11:25 +08:00
|
|
|
EXPECT_EQ(4u, mockTagAllocator->releaseReferenceNodes.size()); // cmdQ released node2
|
|
|
|
EXPECT_EQ(node2, mockTagAllocator->releaseReferenceNodes.at(3));
|
|
|
|
}
|
2018-08-31 18:22:57 +08:00
|
|
|
|
2018-09-06 15:03:07 +08:00
|
|
|
HWCMDTEST_F(IGFX_GEN8_CORE, TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEnqueueingThenWriteWalkerStamp) {
|
2018-08-31 18:22:57 +08:00
|
|
|
using GPGPU_WALKER = typename FamilyType::GPGPU_WALKER;
|
|
|
|
using PIPE_CONTROL = typename FamilyType::PIPE_CONTROL;
|
|
|
|
|
|
|
|
auto device = std::unique_ptr<MockDevice>(MockDevice::createWithNewExecutionEnvironment<MockDevice>(platformDevices[0]));
|
|
|
|
MockContext context(device.get());
|
|
|
|
auto cmdQ = std::make_unique<MockCommandQueueHw<FamilyType>>(&context, device.get(), nullptr);
|
|
|
|
MockKernelWithInternals kernel(*device, &context);
|
|
|
|
|
2018-09-06 15:03:07 +08:00
|
|
|
device->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = true;
|
|
|
|
|
2018-08-31 18:22:57 +08:00
|
|
|
size_t gws[] = {1, 1, 1};
|
|
|
|
cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr);
|
|
|
|
EXPECT_NE(nullptr, cmdQ->timestampPacketNode);
|
|
|
|
|
|
|
|
HardwareParse hwParser;
|
|
|
|
hwParser.parseCommands<FamilyType>(cmdQ->getCS(0), 0);
|
|
|
|
|
|
|
|
bool walkerFound = false;
|
|
|
|
for (auto it = hwParser.cmdList.begin(); it != hwParser.cmdList.end(); it++) {
|
|
|
|
if (genCmdCast<GPGPU_WALKER *>(*it)) {
|
|
|
|
walkerFound = true;
|
|
|
|
auto pipeControl = genCmdCast<PIPE_CONTROL *>(*++it);
|
|
|
|
ASSERT_NE(nullptr, pipeControl);
|
|
|
|
EXPECT_EQ(PIPE_CONTROL::POST_SYNC_OPERATION_WRITE_IMMEDIATE_DATA, pipeControl->getPostSyncOperation());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
EXPECT_TRUE(walkerFound);
|
|
|
|
}
|
2018-09-07 15:09:24 +08:00
|
|
|
|
2018-09-07 20:31:37 +08:00
|
|
|
HWTEST_F(TimestampPacketTests, givenEventsRequestWhenEstimatingStreamSizeForCsrThenAddSizeForSemaphores) {
|
|
|
|
auto device = std::unique_ptr<MockDevice>(MockDevice::createWithNewExecutionEnvironment<MockDevice>(platformDevices[0]));
|
|
|
|
|
|
|
|
cl_uint numEventsOnWaitlist = 5;
|
|
|
|
EventsRequest eventsRequest(numEventsOnWaitlist, nullptr, nullptr);
|
|
|
|
DispatchFlags flags;
|
|
|
|
|
|
|
|
auto sizeWithoutEvents = device->getUltCommandStreamReceiver<FamilyType>().getRequiredCmdStreamSize(flags, *device.get());
|
|
|
|
|
|
|
|
flags.outOfDeviceDependencies = &eventsRequest;
|
|
|
|
auto sizeWithEvents = device->getUltCommandStreamReceiver<FamilyType>().getRequiredCmdStreamSize(flags, *device.get());
|
|
|
|
|
|
|
|
size_t extendedSize = sizeWithoutEvents + (numEventsOnWaitlist * sizeof(typename FamilyType::MI_SEMAPHORE_WAIT));
|
|
|
|
|
|
|
|
EXPECT_EQ(sizeWithEvents, extendedSize);
|
|
|
|
}
|
|
|
|
|
|
|
|
HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEnqueueingThenProgramSemaphoresOnCsrStream) {
|
|
|
|
using MI_SEMAPHORE_WAIT = typename FamilyType::MI_SEMAPHORE_WAIT;
|
|
|
|
|
|
|
|
ExecutionEnvironment executionEnvironment;
|
|
|
|
executionEnvironment.incRefInternal();
|
2018-09-11 17:28:19 +08:00
|
|
|
auto device1 = std::unique_ptr<MockDevice>(Device::create<MockDevice>(nullptr, &executionEnvironment, 0u));
|
|
|
|
auto device2 = std::unique_ptr<MockDevice>(Device::create<MockDevice>(nullptr, &executionEnvironment, 1u));
|
2018-09-07 20:31:37 +08:00
|
|
|
|
|
|
|
device1->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = true;
|
|
|
|
MockContext context1(device1.get());
|
|
|
|
MockContext context2(device2.get());
|
|
|
|
|
|
|
|
MockKernelWithInternals kernel(*device1, &context1);
|
|
|
|
|
|
|
|
auto cmdQ1 = std::make_unique<MockCommandQueueHw<FamilyType>>(&context1, device1.get(), nullptr);
|
|
|
|
auto cmdQ2 = std::make_unique<MockCommandQueueHw<FamilyType>>(&context2, device2.get(), nullptr);
|
|
|
|
|
|
|
|
const cl_uint eventsOnWaitlist = 6;
|
|
|
|
TagNode<TimestampPacket> *tagNodes[eventsOnWaitlist];
|
|
|
|
for (size_t i = 0; i < eventsOnWaitlist; i++) {
|
|
|
|
tagNodes[i] = executionEnvironment.memoryManager->getTimestampPacketAllocator()->getTag();
|
|
|
|
}
|
|
|
|
|
|
|
|
UserEvent event1;
|
|
|
|
event1.setStatus(CL_COMPLETE);
|
|
|
|
UserEvent event2;
|
|
|
|
event2.setStatus(CL_COMPLETE);
|
|
|
|
Event event3(cmdQ1.get(), 0, 0, 0);
|
|
|
|
event3.setTimestampPacketNode(tagNodes[2]);
|
|
|
|
Event event4(cmdQ2.get(), 0, 0, 0);
|
|
|
|
event4.setTimestampPacketNode(tagNodes[3]);
|
|
|
|
Event event5(cmdQ1.get(), 0, 0, 0);
|
|
|
|
event5.setTimestampPacketNode(tagNodes[4]);
|
|
|
|
Event event6(cmdQ2.get(), 0, 0, 0);
|
|
|
|
event6.setTimestampPacketNode(tagNodes[5]);
|
|
|
|
|
|
|
|
cl_event waitlist[] = {&event1, &event2, &event3, &event4, &event5, &event6};
|
|
|
|
|
|
|
|
size_t gws[] = {1, 1, 1};
|
|
|
|
cmdQ1->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, eventsOnWaitlist, waitlist, nullptr);
|
|
|
|
auto &cmdStream = device1->getUltCommandStreamReceiver<FamilyType>().commandStream;
|
|
|
|
|
|
|
|
HardwareParse hwParser;
|
|
|
|
hwParser.parseCommands<FamilyType>(cmdStream, 0);
|
|
|
|
|
|
|
|
auto verifySemaphore = [](MI_SEMAPHORE_WAIT *semaphoreCmd, Event *compareEvent) {
|
|
|
|
EXPECT_NE(nullptr, semaphoreCmd);
|
|
|
|
EXPECT_EQ(semaphoreCmd->getCompareOperation(), MI_SEMAPHORE_WAIT::COMPARE_OPERATION::COMPARE_OPERATION_SAD_NOT_EQUAL_SDD);
|
|
|
|
EXPECT_EQ(1u, semaphoreCmd->getSemaphoreDataDword());
|
|
|
|
EXPECT_EQ(compareEvent->getTimestampPacket()->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextEnd),
|
|
|
|
semaphoreCmd->getSemaphoreGraphicsAddress());
|
|
|
|
};
|
|
|
|
|
|
|
|
auto it = hwParser.cmdList.begin();
|
|
|
|
verifySemaphore(genCmdCast<MI_SEMAPHORE_WAIT *>(*it++), &event4);
|
|
|
|
verifySemaphore(genCmdCast<MI_SEMAPHORE_WAIT *>(*it++), &event6);
|
|
|
|
|
|
|
|
while (it != hwParser.cmdList.end()) {
|
|
|
|
EXPECT_EQ(nullptr, genCmdCast<MI_SEMAPHORE_WAIT *>(*it));
|
|
|
|
it++;
|
|
|
|
}
|
|
|
|
}
|
2018-09-07 15:09:24 +08:00
|
|
|
HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenDispatchingThenProgramSemaphoresForWaitlist) {
|
|
|
|
using MI_SEMAPHORE_WAIT = typename FamilyType::MI_SEMAPHORE_WAIT;
|
|
|
|
using WALKER = WALKER_TYPE<FamilyType>;
|
|
|
|
ExecutionEnvironment executionEnvironment;
|
|
|
|
executionEnvironment.incRefInternal();
|
2018-09-11 17:28:19 +08:00
|
|
|
auto device1 = std::unique_ptr<MockDevice>(Device::create<MockDevice>(nullptr, &executionEnvironment, 0u));
|
|
|
|
auto device2 = std::unique_ptr<MockDevice>(Device::create<MockDevice>(nullptr, &executionEnvironment, 1u));
|
2018-09-07 15:09:24 +08:00
|
|
|
MockKernelWithInternals kernel1(*device1);
|
|
|
|
device1->getUltCommandStreamReceiver<FamilyType>().timestampPacketWriteEnabled = true;
|
|
|
|
MockContext context1(device1.get());
|
|
|
|
MockContext context2(device2.get());
|
|
|
|
|
|
|
|
MockMultiDispatchInfo
|
|
|
|
multiDispatchInfo(std::vector<Kernel *>({kernel1.mockKernel}));
|
|
|
|
|
|
|
|
MockCommandQueue cmdQ1(&context1, device1.get(), nullptr);
|
|
|
|
MockCommandQueue cmdQ2(&context2, device2.get(), nullptr);
|
|
|
|
auto &cmdStream = cmdQ1.getCS(0);
|
|
|
|
|
|
|
|
const cl_uint eventsOnWaitlist = 6;
|
|
|
|
TagNode<TimestampPacket> *tagNodes[eventsOnWaitlist];
|
|
|
|
for (size_t i = 0; i < eventsOnWaitlist; i++) {
|
|
|
|
tagNodes[i] = executionEnvironment.memoryManager->getTimestampPacketAllocator()->getTag();
|
|
|
|
}
|
|
|
|
|
|
|
|
UserEvent event1;
|
|
|
|
UserEvent event2;
|
|
|
|
Event event3(&cmdQ1, 0, 0, 0);
|
|
|
|
event3.setTimestampPacketNode(tagNodes[2]);
|
|
|
|
Event event4(&cmdQ2, 0, 0, 0);
|
|
|
|
event4.setTimestampPacketNode(tagNodes[3]);
|
|
|
|
Event event5(&cmdQ1, 0, 0, 0);
|
|
|
|
event5.setTimestampPacketNode(tagNodes[4]);
|
|
|
|
Event event6(&cmdQ2, 0, 0, 0);
|
|
|
|
event6.setTimestampPacketNode(tagNodes[5]);
|
|
|
|
|
|
|
|
cl_event waitlist[] = {&event1, &event2, &event3, &event4, &event5, &event6};
|
|
|
|
|
|
|
|
GpgpuWalkerHelper<FamilyType>::dispatchWalker(
|
|
|
|
cmdQ1,
|
|
|
|
multiDispatchInfo,
|
|
|
|
eventsOnWaitlist,
|
|
|
|
waitlist,
|
|
|
|
nullptr,
|
|
|
|
nullptr,
|
|
|
|
nullptr,
|
|
|
|
nullptr,
|
|
|
|
device1->getPreemptionMode(),
|
|
|
|
false);
|
|
|
|
|
|
|
|
HardwareParse hwParser;
|
|
|
|
hwParser.parseCommands<FamilyType>(cmdStream, 0);
|
|
|
|
|
|
|
|
auto verifySemaphore = [](MI_SEMAPHORE_WAIT *semaphoreCmd, Event *compareEvent) {
|
|
|
|
EXPECT_EQ(semaphoreCmd->getCompareOperation(), MI_SEMAPHORE_WAIT::COMPARE_OPERATION::COMPARE_OPERATION_SAD_NOT_EQUAL_SDD);
|
|
|
|
EXPECT_EQ(1u, semaphoreCmd->getSemaphoreDataDword());
|
|
|
|
EXPECT_EQ(compareEvent->getTimestampPacket()->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextEnd),
|
|
|
|
semaphoreCmd->getSemaphoreGraphicsAddress());
|
|
|
|
};
|
|
|
|
|
|
|
|
uint32_t semaphoresFound = 0;
|
|
|
|
uint32_t walkersFound = 0;
|
|
|
|
|
|
|
|
for (auto it = hwParser.cmdList.begin(); it != hwParser.cmdList.end(); it++) {
|
|
|
|
auto semaphoreCmd = genCmdCast<MI_SEMAPHORE_WAIT *>(*it);
|
|
|
|
if (semaphoreCmd) {
|
|
|
|
semaphoresFound++;
|
|
|
|
if (semaphoresFound == 1) {
|
|
|
|
verifySemaphore(semaphoreCmd, &event3);
|
|
|
|
} else if (semaphoresFound == 2) {
|
|
|
|
verifySemaphore(semaphoreCmd, &event5);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (genCmdCast<WALKER *>(*it)) {
|
|
|
|
walkersFound++;
|
|
|
|
EXPECT_EQ(2u, semaphoresFound); // semaphores from events programmed before walker
|
|
|
|
}
|
|
|
|
}
|
|
|
|
EXPECT_EQ(1u, walkersFound);
|
|
|
|
EXPECT_EQ(2u, semaphoresFound); // total number of semaphores found in cmdList
|
|
|
|
}
|
2018-09-10 20:24:11 +08:00
|
|
|
|
|
|
|
TEST_F(TimestampPacketTests, givenAlreadyAssignedNodeWhenObtainingThenGetNewBeforeReleasing) {
|
|
|
|
auto device = std::unique_ptr<MockDevice>(MockDevice::createWithNewExecutionEnvironment<MockDevice>(platformDevices[0]));
|
|
|
|
auto mockMemoryManager = new MockMemoryManager();
|
|
|
|
device->injectMemoryManager(mockMemoryManager);
|
|
|
|
auto mockTagAllocator = new MockTagAllocator<>(mockMemoryManager, 1);
|
|
|
|
mockMemoryManager->timestampPacketAllocator.reset(mockTagAllocator);
|
|
|
|
|
|
|
|
MockCommandQueue cmdQ(nullptr, device.get(), nullptr);
|
|
|
|
cmdQ.obtainNewTimestampPacketNode();
|
|
|
|
auto firstNode = cmdQ.timestampPacketNode;
|
|
|
|
EXPECT_TRUE(mockTagAllocator->freeTags.peekIsEmpty());
|
|
|
|
|
|
|
|
// mark as ready to release
|
|
|
|
size_t dataSize = sizeof(uint32_t) * static_cast<size_t>(TimestampPacket::DataIndex::Max);
|
|
|
|
memset(reinterpret_cast<void *>(firstNode->tag->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextStart)), 0, dataSize);
|
|
|
|
|
|
|
|
cmdQ.obtainNewTimestampPacketNode();
|
|
|
|
auto secondNode = cmdQ.timestampPacketNode;
|
|
|
|
EXPECT_FALSE(mockTagAllocator->freeTags.peekIsEmpty()); // new pool allocated for secondNode
|
|
|
|
EXPECT_NE(firstNode, secondNode);
|
|
|
|
}
|