/* * Copyright (c) 2018, Intel Corporation * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included * in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR * OTHER DEALINGS IN THE SOFTWARE. */ #include "runtime/command_queue/gpgpu_walker.h" #include "runtime/helpers/options.h" #include "runtime/helpers/timestamp_packet.h" #include "runtime/utilities/tag_allocator.h" #include "unit_tests/helpers/hw_parse.h" #include "unit_tests/mocks/mock_context.h" #include "unit_tests/mocks/mock_device.h" #include "unit_tests/mocks/mock_command_queue.h" #include "unit_tests/mocks/mock_kernel.h" #include "unit_tests/mocks/mock_mdi.h" #include "unit_tests/mocks/mock_memory_manager.h" #include "test.h" using namespace OCLRT; struct TimestampPacketTests : public ::testing::Test { class MockTimestampPacket : public TimestampPacket { public: using TimestampPacket::data; }; template class MockTagAllocator : public TagAllocator { public: using BaseClass = TagAllocator; using BaseClass::freeTags; using BaseClass::usedTags; using NodeType = typename BaseClass::NodeType; MockTagAllocator(MemoryManager *memoryManager, size_t tagCount = 10) : BaseClass(memoryManager, tagCount, 10) {} void returnTag(NodeType *node) override { releaseReferenceNodes.push_back(node); BaseClass::returnTag(node); } void returnTagToFreePool(NodeType *node) override { returnedToFreePoolNodes.push_back(node); BaseClass::returnTagToFreePool(node); } std::vector releaseReferenceNodes; std::vector returnedToFreePoolNodes; }; void setTagToReadyState(TimestampPacket *tag) { memset(reinterpret_cast(tag->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextStart)), 0, timestampDataSize); } const size_t timestampDataSize = sizeof(uint32_t) * static_cast(TimestampPacket::DataIndex::Max); }; TEST_F(TimestampPacketTests, whenEndTagIsNotOneThenCanBeReleased) { MockTimestampPacket timestampPacket; auto contextEndIndex = static_cast(TimestampPacket::DataIndex::ContextEnd); auto globalEndIndex = static_cast(TimestampPacket::DataIndex::GlobalEnd); timestampPacket.data[contextEndIndex] = 1; timestampPacket.data[globalEndIndex] = 1; EXPECT_FALSE(timestampPacket.canBeReleased()); timestampPacket.data[contextEndIndex] = 1; timestampPacket.data[globalEndIndex] = 0; EXPECT_FALSE(timestampPacket.canBeReleased()); timestampPacket.data[contextEndIndex] = 0; timestampPacket.data[globalEndIndex] = 1; EXPECT_FALSE(timestampPacket.canBeReleased()); timestampPacket.data[contextEndIndex] = 0; timestampPacket.data[globalEndIndex] = 0; EXPECT_TRUE(timestampPacket.canBeReleased()); } TEST_F(TimestampPacketTests, whenNewTagIsTakenThenReinitialize) { MockMemoryManager memoryManager; MockTagAllocator allocator(&memoryManager, 1); auto firstNode = allocator.getTag(); firstNode->tag->data = {{5, 6, 7, 8, 9}}; allocator.returnTag(firstNode); auto secondNode = allocator.getTag(); EXPECT_EQ(secondNode, firstNode); for (uint32_t i = 0; i < static_cast(TimestampPacket::DataIndex::Max); i++) { EXPECT_EQ(1u, secondNode->tag->data[i]); } } TEST_F(TimestampPacketTests, whenObjectIsCreatedThenInitializeAllStamps) { MockTimestampPacket timestampPacket; auto maxElements = static_cast(TimestampPacket::DataIndex::Max); EXPECT_EQ(5u, maxElements); EXPECT_EQ(maxElements, timestampPacket.data.size()); for (uint32_t i = 0; i < maxElements; i++) { EXPECT_EQ(1u, timestampPacket.data[i]); } } TEST_F(TimestampPacketTests, whenAskedForStampAddressThenReturnWithValidOffset) { MockTimestampPacket timestampPacket; for (size_t i = 0; i < static_cast(TimestampPacket::DataIndex::Max); i++) { auto address = timestampPacket.pickAddressForDataWrite(static_cast(i)); EXPECT_EQ(address, reinterpret_cast(×tampPacket.data[i])); } } HWCMDTEST_F(IGFX_GEN8_CORE, TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEstimatingStreamSizeThenAddTwoPipeControls) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); MockCommandQueue cmdQ(nullptr, device.get(), nullptr); MockKernelWithInternals kernel1(*device); MockKernelWithInternals kernel2(*device); MockMultiDispatchInfo multiDispatchInfo(std::vector({kernel1.mockKernel, kernel2.mockKernel})); device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = false; getCommandStream(cmdQ, 0, false, false, multiDispatchInfo); auto sizeWithDisabled = cmdQ.requestedCmdStreamSize; device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; getCommandStream(cmdQ, 0, false, false, multiDispatchInfo); auto sizeWithEnabled = cmdQ.requestedCmdStreamSize; auto extendedSize = sizeWithDisabled + (2 * sizeof(typename FamilyType::PIPE_CONTROL)) + sizeof(typename FamilyType::MI_SEMAPHORE_WAIT); EXPECT_EQ(sizeWithEnabled, extendedSize); } HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEstimatingStreamSizeWithWaitlistThenAddSizeForSemaphores) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); MockCommandQueue cmdQ(nullptr, device.get(), nullptr); MockKernelWithInternals kernel1(*device); MockKernelWithInternals kernel2(*device); MockMultiDispatchInfo multiDispatchInfo(std::vector({kernel1.mockKernel, kernel2.mockKernel})); cl_uint numEventsOnWaitlist = 5; device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = false; getCommandStream(cmdQ, numEventsOnWaitlist, false, false, multiDispatchInfo); auto sizeWithDisabled = cmdQ.requestedCmdStreamSize; device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; getCommandStream(cmdQ, numEventsOnWaitlist, false, false, multiDispatchInfo); auto sizeWithEnabled = cmdQ.requestedCmdStreamSize; size_t extendedSize = sizeWithDisabled + EnqueueOperation::getSizeRequiredForTimestampPacketWrite() + ((numEventsOnWaitlist + 1) * sizeof(typename FamilyType::MI_SEMAPHORE_WAIT)); EXPECT_EQ(sizeWithEnabled, extendedSize); } HWCMDTEST_F(IGFX_GEN8_CORE, TimestampPacketTests, givenTimestampPacketWhenDispatchingGpuWalkerThenAddTwoPcForLastWalker) { using GPGPU_WALKER = typename FamilyType::GPGPU_WALKER; using PIPE_CONTROL = typename FamilyType::PIPE_CONTROL; MockTimestampPacket timestampPacket; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); MockKernelWithInternals kernel1(*device); MockKernelWithInternals kernel2(*device); MockMultiDispatchInfo multiDispatchInfo(std::vector({kernel1.mockKernel, kernel2.mockKernel})); MockCommandQueue cmdQ(nullptr, device.get(), nullptr); auto &cmdStream = cmdQ.getCS(0); GpgpuWalkerHelper::dispatchWalker( cmdQ, multiDispatchInfo, 0, nullptr, nullptr, nullptr, nullptr, nullptr, ×tampPacket, device->getPreemptionMode(), false); HardwareParse hwParser; hwParser.parseCommands(cmdStream, 0); auto verifyPipeControl = [](PIPE_CONTROL *pipeControl, uint64_t expectedAddress) { EXPECT_EQ(1u, pipeControl->getCommandStreamerStallEnable()); EXPECT_EQ(PIPE_CONTROL::POST_SYNC_OPERATION_WRITE_IMMEDIATE_DATA, pipeControl->getPostSyncOperation()); EXPECT_EQ(0u, pipeControl->getImmediateData()); EXPECT_EQ(static_cast(expectedAddress & 0x0000FFFFFFFFULL), pipeControl->getAddress()); EXPECT_EQ(static_cast(expectedAddress >> 32), pipeControl->getAddressHigh()); }; uint32_t walkersFound = 0; for (auto it = hwParser.cmdList.begin(); it != hwParser.cmdList.end(); it++) { if (genCmdCast(*it)) { walkersFound++; if (walkersFound == 1) { EXPECT_EQ(nullptr, genCmdCast(*--it)); it++; EXPECT_EQ(nullptr, genCmdCast(*++it)); it--; } else if (walkersFound == 2) { auto pipeControl = genCmdCast(*--it); EXPECT_NE(nullptr, pipeControl); verifyPipeControl(pipeControl, timestampPacket.pickAddressForDataWrite(TimestampPacket::DataIndex::Submit)); it++; pipeControl = genCmdCast(*++it); EXPECT_NE(nullptr, pipeControl); verifyPipeControl(pipeControl, timestampPacket.pickAddressForDataWrite(TimestampPacket::DataIndex::ContextEnd)); it--; } } } EXPECT_EQ(2u, walkersFound); } HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEnqueueingThenObtainNewStampAndPassToEvent) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); auto mockMemoryManager = new MockMemoryManager(); device->injectMemoryManager(mockMemoryManager); auto mockTagAllocator = new MockTagAllocator<>(mockMemoryManager); mockMemoryManager->timestampPacketAllocator.reset(mockTagAllocator); MockContext context(device.get()); auto cmdQ = std::make_unique>(&context, device.get(), nullptr); MockKernelWithInternals kernel(*device, &context); device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = false; size_t gws[] = {1, 1, 1}; cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr); EXPECT_EQ(nullptr, cmdQ->timestampPacketNode); EXPECT_EQ(nullptr, mockTagAllocator->usedTags.peekHead()); device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; cl_event event1, event2; // obtain first node for cmdQ and event1 cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, &event1); auto node1 = cmdQ->timestampPacketNode; EXPECT_NE(nullptr, node1); EXPECT_EQ(node1, cmdQ->timestampPacketNode); // obtain new node for cmdQ and event2 cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, &event2); auto node2 = cmdQ->timestampPacketNode; EXPECT_NE(nullptr, node2); EXPECT_EQ(node2, cmdQ->timestampPacketNode); EXPECT_EQ(0u, mockTagAllocator->returnedToFreePoolNodes.size()); // nothing returned. event1 owns previous node EXPECT_EQ(1u, mockTagAllocator->releaseReferenceNodes.size()); // cmdQ released first node EXPECT_EQ(node1, mockTagAllocator->releaseReferenceNodes.at(0)); EXPECT_NE(node1, node2); setTagToReadyState(node1->tag); setTagToReadyState(node2->tag); clReleaseEvent(event2); EXPECT_EQ(0u, mockTagAllocator->returnedToFreePoolNodes.size()); // nothing returned. cmdQ owns node2 EXPECT_EQ(2u, mockTagAllocator->releaseReferenceNodes.size()); // event2 released node2 EXPECT_EQ(node2, mockTagAllocator->releaseReferenceNodes.at(1)); clReleaseEvent(event1); EXPECT_EQ(1u, mockTagAllocator->returnedToFreePoolNodes.size()); // removed last reference on node1 EXPECT_EQ(node1, mockTagAllocator->returnedToFreePoolNodes.at(0)); EXPECT_EQ(3u, mockTagAllocator->releaseReferenceNodes.size()); // event1 released node1 EXPECT_EQ(node1, mockTagAllocator->releaseReferenceNodes.at(2)); cmdQ.reset(nullptr); EXPECT_EQ(2u, mockTagAllocator->returnedToFreePoolNodes.size()); // removed last reference on node2 EXPECT_EQ(node2, mockTagAllocator->returnedToFreePoolNodes.at(1)); EXPECT_EQ(4u, mockTagAllocator->releaseReferenceNodes.size()); // cmdQ released node2 EXPECT_EQ(node2, mockTagAllocator->releaseReferenceNodes.at(3)); } HWCMDTEST_F(IGFX_GEN8_CORE, TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEnqueueingThenWriteWalkerStamp) { using GPGPU_WALKER = typename FamilyType::GPGPU_WALKER; using PIPE_CONTROL = typename FamilyType::PIPE_CONTROL; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); MockContext context(device.get()); auto cmdQ = std::make_unique>(&context, device.get(), nullptr); MockKernelWithInternals kernel(*device, &context); device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; size_t gws[] = {1, 1, 1}; cmdQ->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr); EXPECT_NE(nullptr, cmdQ->timestampPacketNode); HardwareParse hwParser; hwParser.parseCommands(cmdQ->getCS(0), 0); bool walkerFound = false; for (auto it = hwParser.cmdList.begin(); it != hwParser.cmdList.end(); it++) { if (genCmdCast(*it)) { walkerFound = true; auto pipeControl = genCmdCast(*++it); ASSERT_NE(nullptr, pipeControl); EXPECT_EQ(PIPE_CONTROL::POST_SYNC_OPERATION_WRITE_IMMEDIATE_DATA, pipeControl->getPostSyncOperation()); } } EXPECT_TRUE(walkerFound); } HWTEST_F(TimestampPacketTests, givenEventsRequestWhenEstimatingStreamSizeForCsrThenAddSizeForSemaphores) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); cl_uint numEventsOnWaitlist = 5; EventsRequest eventsRequest(numEventsOnWaitlist, nullptr, nullptr); DispatchFlags flags; auto sizeWithoutEvents = device->getUltCommandStreamReceiver().getRequiredCmdStreamSize(flags, *device.get()); flags.outOfDeviceDependencies = &eventsRequest; auto sizeWithEvents = device->getUltCommandStreamReceiver().getRequiredCmdStreamSize(flags, *device.get()); size_t extendedSize = sizeWithoutEvents + (numEventsOnWaitlist * sizeof(typename FamilyType::MI_SEMAPHORE_WAIT)); EXPECT_EQ(sizeWithEvents, extendedSize); } HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenEnqueueingThenProgramSemaphoresOnCsrStream) { using MI_SEMAPHORE_WAIT = typename FamilyType::MI_SEMAPHORE_WAIT; ExecutionEnvironment executionEnvironment; executionEnvironment.incRefInternal(); auto device1 = std::unique_ptr(Device::create(nullptr, &executionEnvironment, 0u)); auto device2 = std::unique_ptr(Device::create(nullptr, &executionEnvironment, 1u)); device1->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; MockContext context1(device1.get()); MockContext context2(device2.get()); MockKernelWithInternals kernel(*device1, &context1); auto cmdQ1 = std::make_unique>(&context1, device1.get(), nullptr); auto cmdQ2 = std::make_unique>(&context2, device2.get(), nullptr); const cl_uint eventsOnWaitlist = 6; TagNode *tagNodes[eventsOnWaitlist]; for (size_t i = 0; i < eventsOnWaitlist; i++) { tagNodes[i] = executionEnvironment.memoryManager->getTimestampPacketAllocator()->getTag(); } UserEvent event1; event1.setStatus(CL_COMPLETE); UserEvent event2; event2.setStatus(CL_COMPLETE); Event event3(cmdQ1.get(), 0, 0, 0); event3.setTimestampPacketNode(tagNodes[2]); Event event4(cmdQ2.get(), 0, 0, 0); event4.setTimestampPacketNode(tagNodes[3]); Event event5(cmdQ1.get(), 0, 0, 0); event5.setTimestampPacketNode(tagNodes[4]); Event event6(cmdQ2.get(), 0, 0, 0); event6.setTimestampPacketNode(tagNodes[5]); cl_event waitlist[] = {&event1, &event2, &event3, &event4, &event5, &event6}; size_t gws[] = {1, 1, 1}; cmdQ1->enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, eventsOnWaitlist, waitlist, nullptr); auto &cmdStream = device1->getUltCommandStreamReceiver().commandStream; HardwareParse hwParser; hwParser.parseCommands(cmdStream, 0); auto verifySemaphore = [](MI_SEMAPHORE_WAIT *semaphoreCmd, Event *compareEvent) { EXPECT_NE(nullptr, semaphoreCmd); EXPECT_EQ(semaphoreCmd->getCompareOperation(), MI_SEMAPHORE_WAIT::COMPARE_OPERATION::COMPARE_OPERATION_SAD_NOT_EQUAL_SDD); EXPECT_EQ(1u, semaphoreCmd->getSemaphoreDataDword()); EXPECT_EQ(compareEvent->getTimestampPacket()->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextEnd), semaphoreCmd->getSemaphoreGraphicsAddress()); }; auto it = hwParser.cmdList.begin(); verifySemaphore(genCmdCast(*it++), &event4); verifySemaphore(genCmdCast(*it++), &event6); while (it != hwParser.cmdList.end()) { EXPECT_EQ(nullptr, genCmdCast(*it)); it++; } } HWTEST_F(TimestampPacketTests, givenTimestampPacketWriteEnabledWhenDispatchingThenProgramSemaphoresForWaitlist) { using MI_SEMAPHORE_WAIT = typename FamilyType::MI_SEMAPHORE_WAIT; using WALKER = WALKER_TYPE; ExecutionEnvironment executionEnvironment; executionEnvironment.incRefInternal(); auto device1 = std::unique_ptr(Device::create(nullptr, &executionEnvironment, 0u)); auto device2 = std::unique_ptr(Device::create(nullptr, &executionEnvironment, 1u)); MockKernelWithInternals kernel1(*device1); device1->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; MockContext context1(device1.get()); MockContext context2(device2.get()); MockMultiDispatchInfo multiDispatchInfo(std::vector({kernel1.mockKernel})); MockCommandQueue cmdQ1(&context1, device1.get(), nullptr); MockCommandQueue cmdQ2(&context2, device2.get(), nullptr); auto &cmdStream = cmdQ1.getCS(0); const cl_uint eventsOnWaitlist = 6; TagNode *tagNodes[eventsOnWaitlist]; for (size_t i = 0; i < eventsOnWaitlist; i++) { tagNodes[i] = executionEnvironment.memoryManager->getTimestampPacketAllocator()->getTag(); } UserEvent event1; UserEvent event2; Event event3(&cmdQ1, 0, 0, 0); event3.setTimestampPacketNode(tagNodes[2]); Event event4(&cmdQ2, 0, 0, 0); event4.setTimestampPacketNode(tagNodes[3]); Event event5(&cmdQ1, 0, 0, 0); event5.setTimestampPacketNode(tagNodes[4]); Event event6(&cmdQ2, 0, 0, 0); event6.setTimestampPacketNode(tagNodes[5]); cl_event waitlist[] = {&event1, &event2, &event3, &event4, &event5, &event6}; GpgpuWalkerHelper::dispatchWalker( cmdQ1, multiDispatchInfo, eventsOnWaitlist, waitlist, nullptr, nullptr, nullptr, nullptr, nullptr, device1->getPreemptionMode(), false); HardwareParse hwParser; hwParser.parseCommands(cmdStream, 0); auto verifySemaphore = [](MI_SEMAPHORE_WAIT *semaphoreCmd, Event *compareEvent) { EXPECT_EQ(semaphoreCmd->getCompareOperation(), MI_SEMAPHORE_WAIT::COMPARE_OPERATION::COMPARE_OPERATION_SAD_NOT_EQUAL_SDD); EXPECT_EQ(1u, semaphoreCmd->getSemaphoreDataDword()); EXPECT_EQ(compareEvent->getTimestampPacket()->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextEnd), semaphoreCmd->getSemaphoreGraphicsAddress()); }; uint32_t semaphoresFound = 0; uint32_t walkersFound = 0; for (auto it = hwParser.cmdList.begin(); it != hwParser.cmdList.end(); it++) { auto semaphoreCmd = genCmdCast(*it); if (semaphoreCmd) { semaphoresFound++; if (semaphoresFound == 1) { verifySemaphore(semaphoreCmd, &event3); } else if (semaphoresFound == 2) { verifySemaphore(semaphoreCmd, &event5); } } if (genCmdCast(*it)) { walkersFound++; EXPECT_EQ(2u, semaphoresFound); // semaphores from events programmed before walker } } EXPECT_EQ(1u, walkersFound); EXPECT_EQ(2u, semaphoresFound); // total number of semaphores found in cmdList } TEST_F(TimestampPacketTests, givenAlreadyAssignedNodeWhenObtainingThenGetNewBeforeReleasing) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); auto mockMemoryManager = new MockMemoryManager(); device->injectMemoryManager(mockMemoryManager); auto mockTagAllocator = new MockTagAllocator<>(mockMemoryManager, 1); mockMemoryManager->timestampPacketAllocator.reset(mockTagAllocator); MockCommandQueue cmdQ(nullptr, device.get(), nullptr); cmdQ.obtainNewTimestampPacketNode(); auto firstNode = cmdQ.timestampPacketNode; EXPECT_TRUE(mockTagAllocator->freeTags.peekIsEmpty()); setTagToReadyState(firstNode->tag); cmdQ.obtainNewTimestampPacketNode(); auto secondNode = cmdQ.timestampPacketNode; EXPECT_FALSE(mockTagAllocator->freeTags.peekIsEmpty()); // new pool allocated for secondNode EXPECT_NE(firstNode, secondNode); } HWTEST_F(TimestampPacketTests, givenAlreadyAssignedNodeWhenEnqueueingThenDontKeepDependencyOnPreviousNodeIfItsReady) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; MockContext context(device.get()); MockKernelWithInternals kernel(*device); MockCommandQueueHw cmdQ(&context, device.get(), nullptr); cmdQ.obtainNewTimestampPacketNode(); auto firstNode = cmdQ.timestampPacketNode; setTagToReadyState(firstNode->tag); size_t gws[] = {1, 1, 1}; cmdQ.enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr); HardwareParse hwParser; hwParser.parseCommands(*cmdQ.commandStream, 0); uint32_t semaphoresFound = 0; for (auto it = hwParser.cmdList.begin(); it != hwParser.cmdList.end(); it++) { if (genCmdCast(*it)) { semaphoresFound++; } } EXPECT_EQ(0u, semaphoresFound); } HWTEST_F(TimestampPacketTests, givenAlreadyAssignedNodeWhenEnqueueingThenKeepDependencyOnPreviousNodeIfItsNotReady) { using MI_SEMAPHORE_WAIT = typename FamilyType::MI_SEMAPHORE_WAIT; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(platformDevices[0])); device->getUltCommandStreamReceiver().timestampPacketWriteEnabled = true; MockContext context(device.get()); MockKernelWithInternals kernel(*device); MockCommandQueueHw cmdQ(&context, device.get(), nullptr); cmdQ.obtainNewTimestampPacketNode(); auto firstNode = cmdQ.timestampPacketNode; size_t gws[] = {1, 1, 1}; cmdQ.enqueueKernel(kernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr); HardwareParse hwParser; hwParser.parseCommands(*cmdQ.commandStream, 0); auto semaphoreCmd = genCmdCast(*hwParser.cmdList.begin()); EXPECT_NE(nullptr, semaphoreCmd); EXPECT_EQ(firstNode->tag->pickAddressForDataWrite(TimestampPacket::DataIndex::ContextEnd), semaphoreCmd->getSemaphoreGraphicsAddress()); EXPECT_EQ(1u, semaphoreCmd->getSemaphoreDataDword()); EXPECT_EQ(MI_SEMAPHORE_WAIT::COMPARE_OPERATION::COMPARE_OPERATION_SAD_NOT_EQUAL_SDD, semaphoreCmd->getCompareOperation()); uint32_t semaphoresFound = 0; auto it = hwParser.cmdList.begin(); for (++it; it != hwParser.cmdList.end(); it++) { if (genCmdCast(*it)) { semaphoresFound++; } } EXPECT_EQ(0u, semaphoresFound); }