/* * Copyright (C) 2021-2024 Intel Corporation * * SPDX-License-Identifier: MIT * */ #include "shared/source/device/device.h" #include "shared/source/gmm_helper/gmm.h" #include "shared/source/helpers/api_specific_config.h" #include "shared/source/helpers/array_count.h" #include "shared/source/helpers/gfx_core_helper.h" #include "shared/source/helpers/ray_tracing_helper.h" #include "shared/source/memory_manager/allocations_list.h" #include "shared/source/memory_manager/gfx_partition.h" #include "shared/source/memory_manager/unified_memory_pooling.h" #include "shared/source/os_interface/device_factory.h" #include "shared/source/os_interface/driver_info.h" #include "shared/source/os_interface/os_context.h" #include "shared/source/os_interface/os_interface.h" #include "shared/source/release_helper/release_helper.h" #include "shared/test/common/fixtures/device_fixture.h" #include "shared/test/common/helpers/debug_manager_state_restore.h" #include "shared/test/common/helpers/default_hw_info.h" #include "shared/test/common/helpers/raii_product_helper.h" #include "shared/test/common/helpers/ult_hw_config.h" #include "shared/test/common/helpers/variable_backup.h" #include "shared/test/common/mocks/mock_allocation_properties.h" #include "shared/test/common/mocks/mock_builtins.h" #include "shared/test/common/mocks/mock_compiler_interface.h" #include "shared/test/common/mocks/mock_compilers.h" #include "shared/test/common/mocks/mock_device.h" #include "shared/test/common/mocks/mock_driver_model.h" #include "shared/test/common/mocks/mock_io_functions.h" #include "shared/test/common/mocks/mock_memory_manager.h" #include "shared/test/common/mocks/mock_product_helper.h" #include "shared/test/common/mocks/ult_device_factory.h" #include "shared/test/common/test_macros/hw_test.h" #include "shared/test/common/test_macros/test.h" using namespace NEO; extern ApiSpecificConfig::ApiType apiTypeForUlts; namespace NEO { extern bool isDeviceUsmPoolingEnabledForUlts; } TEST(DeviceBlitterTest, whenBlitterOperationsSupportIsDisabledThenNoInternalCopyEngineIsReturned) { VariableBackup backupHwInfo(defaultHwInfo.get()); defaultHwInfo->capabilityTable.blitterOperationsSupported = false; UltDeviceFactory factory{1, 0}; EXPECT_EQ(nullptr, factory.rootDevices[0]->getInternalCopyEngine()); } TEST(DeviceBlitterTest, givenForceBCSForInternalCopyEngineToIndexZeroWhenGetInternalCopyEngineIsCalledThenInternalMainCopyEngineIsReturned) { DebugManagerStateRestore dbgRestorer; debugManager.flags.ForceBCSForInternalCopyEngine.set(0); VariableBackup backupHwInfo(defaultHwInfo.get()); defaultHwInfo->capabilityTable.blitterOperationsSupported = true; UltDeviceFactory factory{1, 0}; factory.rootDevices[0]->createEngine({aub_stream::EngineType::ENGINE_BCS, EngineUsage::internal}); auto engine = factory.rootDevices[0]->getInternalCopyEngine(); EXPECT_NE(nullptr, engine); EXPECT_EQ(aub_stream::EngineType::ENGINE_BCS, engine->getEngineType()); EXPECT_EQ(EngineUsage::internal, engine->getEngineUsage()); } TEST(DeviceBlitterTest, givenForceBCSForInternalCopyEngineToIndexOneWhenGetInternalLinkCopyEngineIsCalledThenInternalLinkCopyEngineOneIsReturned) { DebugManagerStateRestore dbgRestorer; debugManager.flags.ForceBCSForInternalCopyEngine.set(1); VariableBackup backupHwInfo(defaultHwInfo.get()); defaultHwInfo->capabilityTable.blitterOperationsSupported = true; UltDeviceFactory factory{1, 0}; factory.rootDevices[0]->createEngine({aub_stream::EngineType::ENGINE_BCS1, EngineUsage::internal}); auto engine = factory.rootDevices[0]->getInternalCopyEngine(); EXPECT_NE(nullptr, engine); EXPECT_EQ(aub_stream::EngineType::ENGINE_BCS1, engine->getEngineType()); EXPECT_EQ(EngineUsage::internal, engine->getEngineUsage()); } TEST(DeviceBlitterTest, givenBlitterOperationsDisabledWhenCreatingBlitterEngineThenAbort) { VariableBackup backupHwInfo(defaultHwInfo.get()); defaultHwInfo->capabilityTable.blitterOperationsSupported = false; UltDeviceFactory factory{1, 0}; EXPECT_THROW(factory.rootDevices[0]->createEngine({aub_stream::EngineType::ENGINE_BCS, EngineUsage::regular}), std::runtime_error); EXPECT_THROW(factory.rootDevices[0]->createEngine({aub_stream::EngineType::ENGINE_BCS, EngineUsage::cooperative}), std::runtime_error); EXPECT_THROW(factory.rootDevices[0]->createEngine({aub_stream::EngineType::ENGINE_BCS, EngineUsage::internal}), std::runtime_error); EXPECT_THROW(factory.rootDevices[0]->createEngine({aub_stream::EngineType::ENGINE_BCS, EngineUsage::lowPriority}), std::runtime_error); } TEST(Device, givenNoDebuggerWhenGettingDebuggerThenNullptrIsReturned) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); EXPECT_EQ(nullptr, device->getDebugger()); EXPECT_EQ(nullptr, device->getL0Debugger()); } struct DeviceWithDisabledL0DebuggerTests : public DeviceFixture, public ::testing::Test { void SetUp() override { debugManager.flags.DisableSupportForL0Debugger.set(true); DeviceFixture::setUp(); } void TearDown() override { DeviceFixture::tearDown(); } DebugManagerStateRestore dbgRestorer; }; TEST_F(DeviceWithDisabledL0DebuggerTests, givenSetFlagDisableSupportForL0DebuggerWhenCreateDeviceThenCapabilityL0DebuggerSupportedIsDisabled) { EXPECT_FALSE(pDevice->getHardwareInfo().capabilityTable.l0DebuggerSupported); } TEST(Device, givenDeviceWithBrandingStringNameWhenGettingDeviceNameThenBrandingStringIsReturned) { auto hwInfo = *defaultHwInfo; hwInfo.capabilityTable.deviceName = "Custom Device"; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); EXPECT_STREQ("Custom Device", device->getDeviceName().c_str()); } TEST(Device, givenDeviceWithoutBrandingStringNameWhenGettingDeviceNameThenGenericNameWithHexadecimalDeviceIdIsReturned) { auto hwInfo = *defaultHwInfo; hwInfo.capabilityTable.deviceName = ""; hwInfo.platform.usDeviceID = 0x1AB; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); EXPECT_STREQ("Intel(R) Graphics [0x01ab]", device->getDeviceName().c_str()); } TEST(Device, WhenCreatingDeviceThenCapsInitilizedBeforeEnginesAreCreated) { class CapsInitMockDevice : public RootDevice { public: using Device::createDeviceImpl; using RootDevice::RootDevice; void initializeCaps() override { capsInitialized = true; return Device::initializeCaps(); } bool createEngines() override { capsInitializedWhenCreatingEngines = capsInitialized; return RootDevice::createEngines(); } bool capsInitialized = false; bool capsInitializedWhenCreatingEngines = false; }; auto hwInfo = *defaultHwInfo; hwInfo.capabilityTable.deviceName = ""; hwInfo.platform.usDeviceID = 0x1AB; auto executionEnvironment = new ExecutionEnvironment(); executionEnvironment->prepareRootDeviceEnvironments(1); for (auto i = 0u; i < executionEnvironment->rootDeviceEnvironments.size(); i++) { executionEnvironment->rootDeviceEnvironments[i]->setHwInfoAndInitHelpers(&hwInfo); executionEnvironment->rootDeviceEnvironments[i]->initGmm(); } executionEnvironment->setDeviceHierarchy(executionEnvironment->rootDeviceEnvironments[0]->getHelper()); executionEnvironment->calculateMaxOsContextCount(); executionEnvironment->initializeMemoryManager(); auto device = std::make_unique(executionEnvironment, 0); device->createDeviceImpl(); EXPECT_TRUE(device->capsInitializedWhenCreatingEngines); } using DeviceTest = Test; TEST_F(DeviceTest, whenInitializeRayTracingIsCalledAndRtBackedBufferIsNullptrThenMemoryBackedBufferIsCreated) { EXPECT_EQ(nullptr, pDevice->getRTMemoryBackedBuffer()); EXPECT_EQ(false, pDevice->rayTracingIsInitialized()); pDevice->initializeRayTracing(0); EXPECT_NE(nullptr, pDevice->getRTMemoryBackedBuffer()); EXPECT_EQ(true, pDevice->rayTracingIsInitialized()); pDevice->initializeRayTracing(0); EXPECT_NE(nullptr, pDevice->getRTMemoryBackedBuffer()); EXPECT_EQ(true, pDevice->rayTracingIsInitialized()); } TEST_F(DeviceTest, whenGetRTDispatchGlobalsIsCalledWithUnsupportedBVHLevelsThenNullptrIsReturned) { pDevice->initializeRayTracing(5); EXPECT_EQ(nullptr, pDevice->getRTDispatchGlobals(100)); } TEST_F(DeviceTest, whenInitializeRayTracingIsCalledWithMockAllocatorThenDispatchGlobalsArrayAllocationIsLockable) { DebugManagerStateRestore restorer; debugManager.flags.ForceLocalMemoryAccessMode.set(0); auto maxBvhLevel = 3; pDevice->initializeRayTracing(maxBvhLevel); for (auto i = 0; i < maxBvhLevel; i++) { auto rtDispatchGlobals = pDevice->getRTDispatchGlobals(i); EXPECT_NE(nullptr, rtDispatchGlobals); auto dispatchGlobalsArray = rtDispatchGlobals->rtDispatchGlobalsArray; EXPECT_NE(nullptr, dispatchGlobalsArray); EXPECT_FALSE(dispatchGlobalsArray->getDefaultGmm()->resourceParams.Flags.Info.NotLockable); } } TEST_F(DeviceTest, whenInitializeRayTracingIsCalledWithMockAllocatorThenRTDispatchGlobalsIsAllocated) { pDevice->initializeRayTracing(5); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(3)); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(3)); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(5)); } TEST_F(DeviceTest, whenInitializeRayTracingIsCalledMultipleTimesWithMockAllocatorThenInitializeRayTracingIsIdempotent) { pDevice->initializeRayTracing(5); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(5)); pDevice->initializeRayTracing(5); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(5)); } TEST_F(DeviceTest, whenGetRTDispatchGlobalsIsCalledBeforeInitializationThenNullPtrIsReturned) { EXPECT_EQ(nullptr, pDevice->getRTDispatchGlobals(1)); } TEST_F(DeviceTest, whenGetRTDispatchGlobalsIsCalledWithZeroSizeAndMockAllocatorThenDispatchGlobalsIsReturned) { EXPECT_EQ(nullptr, pDevice->getRTDispatchGlobals(0)); pDevice->initializeRayTracing(5); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(0)); } TEST_F(DeviceTest, whenAllocateRTDispatchGlobalsIsCalledThenRTDispatchGlobalsIsAllocated) { pDevice->initializeRayTracing(5); pDevice->allocateRTDispatchGlobals(3); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(3)); } TEST_F(DeviceTest, whenAllocateRTDispatchGlobalsIsCalledThenStackSizePerRayIsSetCorrectly) { pDevice->initializeRayTracing(5); pDevice->allocateRTDispatchGlobals(3); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(3)); struct RTDispatchGlobals dispatchGlobals = *reinterpret_cast(pDevice->getRTDispatchGlobals(3)->rtDispatchGlobalsArray->getUnderlyingBuffer()); auto releaseHelper = getReleaseHelper(); if (releaseHelper) { EXPECT_EQ(dispatchGlobals.stackSizePerRay, releaseHelper->getStackSizePerRay()); } else { EXPECT_EQ(dispatchGlobals.stackSizePerRay, 0u); } } TEST_F(DeviceTest, givenNot48bResourceForRtWhenAllocateRTDispatchGlobalsIsCalledThenRTDispatchGlobalsIsAllocatedWithout48bResourceFlag) { auto mockProductHelper = std::make_unique(); mockProductHelper->is48bResourceNeededForRayTracingResult = false; std::unique_ptr productHelper = std::move(mockProductHelper); auto &rootDeviceEnvironment = pDevice->getRootDeviceEnvironmentRef(); auto memoryManager = static_cast(pDevice->getMemoryManager()); memoryManager->validateAllocateProperties = [](const AllocationProperties &properties) -> void { EXPECT_FALSE(properties.flags.resource48Bit); }; std::swap(rootDeviceEnvironment.productHelper, productHelper); pDevice->initializeRayTracing(5); pDevice->allocateRTDispatchGlobals(3); EXPECT_NE(nullptr, pDevice->getRTDispatchGlobals(3)); std::swap(rootDeviceEnvironment.productHelper, productHelper); } HWTEST2_F(DeviceTest, whenAllocateRTDispatchGlobalsIsCalledAndRTStackAllocationFailsRTDispatchGlobalsIsNotAllocated, IsPVC) { DebugManagerStateRestore restorer; debugManager.flags.CreateMultipleSubDevices.set(2); VariableBackup mockDeviceFlagBackup(&MockDevice::createSingleDevice, false); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); std::unique_ptr otherMemoryManager; otherMemoryManager = std::make_unique(*device->executionEnvironment); static_cast(*otherMemoryManager).capacity = MemoryConstants::pageSize; device->executionEnvironment->memoryManager.swap(otherMemoryManager); device->initializeRayTracing(5); EXPECT_EQ(nullptr, device->getRTDispatchGlobals(3)); device->executionEnvironment->memoryManager.swap(otherMemoryManager); } TEST_F(DeviceTest, givenDispatchGlobalsAllocationFailsThenRTDispatchGlobalsInfoIsNull) { std::unique_ptr otherMemoryManager; otherMemoryManager = std::make_unique(1, *pDevice->getExecutionEnvironment()); pDevice->getExecutionEnvironment()->memoryManager.swap(otherMemoryManager); pDevice->initializeRayTracing(5); auto rtDispatchGlobalsInfo = pDevice->getRTDispatchGlobals(5); EXPECT_EQ(nullptr, rtDispatchGlobalsInfo); pDevice->getExecutionEnvironment()->memoryManager.swap(otherMemoryManager); } TEST_F(DeviceTest, GivenDeviceWhenGenerateUuidThenValidValuesAreSet) { std::array uuid, expectedUuid; pDevice->generateUuid(uuid); uint32_t rootDeviceIndex = pDevice->getRootDeviceIndex(); expectedUuid.fill(0); uint16_t vendorId = 0x8086; // Intel uint16_t deviceId = static_cast(pDevice->getHardwareInfo().platform.usDeviceID); uint16_t revisionId = static_cast(pDevice->getHardwareInfo().platform.usRevId); memcpy_s(&expectedUuid[0], sizeof(uint16_t), &vendorId, sizeof(uint16_t)); memcpy_s(&expectedUuid[2], sizeof(uint16_t), &deviceId, sizeof(uint16_t)); memcpy_s(&expectedUuid[4], sizeof(uint16_t), &revisionId, sizeof(uint16_t)); memcpy_s(&expectedUuid[6], sizeof(uint32_t), &rootDeviceIndex, sizeof(rootDeviceIndex)); EXPECT_EQ(memcmp(&uuid, &expectedUuid, ProductHelper::uuidSize), 0); } TEST_F(DeviceTest, GivenDeviceWhenGenerateUuidFromPciBusInfoThenValidValuesAreSet) { std::array uuid, expectedUuid; PhysicalDevicePciBusInfo pciBusInfo = {1, 1, 1, 1}; pDevice->generateUuidFromPciBusInfo(pciBusInfo, uuid); expectedUuid.fill(0); uint16_t vendorId = 0x8086; // Intel uint16_t deviceId = static_cast(pDevice->getHardwareInfo().platform.usDeviceID); uint16_t revisionId = static_cast(pDevice->getHardwareInfo().platform.usRevId); uint16_t pciDomain = static_cast(pciBusInfo.pciDomain); uint8_t pciBus = static_cast(pciBusInfo.pciBus); uint8_t pciDevice = static_cast(pciBusInfo.pciDevice); uint8_t pciFunction = static_cast(pciBusInfo.pciFunction); memcpy_s(&expectedUuid[0], sizeof(uint16_t), &vendorId, sizeof(uint16_t)); memcpy_s(&expectedUuid[2], sizeof(uint16_t), &deviceId, sizeof(uint16_t)); memcpy_s(&expectedUuid[4], sizeof(uint16_t), &revisionId, sizeof(uint16_t)); memcpy_s(&expectedUuid[6], sizeof(uint16_t), &pciDomain, sizeof(uint16_t)); memcpy_s(&expectedUuid[8], sizeof(uint8_t), &pciBus, sizeof(uint8_t)); memcpy_s(&expectedUuid[9], sizeof(uint8_t), &pciDevice, sizeof(uint8_t)); memcpy_s(&expectedUuid[10], sizeof(uint8_t), &pciFunction, sizeof(uint8_t)); EXPECT_EQ(memcmp(&uuid, &expectedUuid, ProductHelper::uuidSize), 0); } using DeviceGetCapsTest = Test; TEST_F(DeviceGetCapsTest, givenMockCompilerInterfaceWhenInitializeCapsIsCalledThenMaxParameterSizeIsSetCorrectly) { auto pCompilerInterface = new MockCompilerInterface; pDevice->getExecutionEnvironment()->rootDeviceEnvironments[pDevice->getRootDeviceIndex()]->compilerInterface.reset(pCompilerInterface); pDevice->maxParameterSizeFromIGC = 2u; pDevice->callBaseGetMaxParameterSizeFromIGC = true; MockIgcFeaturesAndWorkarounds mockIgcFtrWa; pCompilerInterface->igcFeaturesAndWorkaroundsTagOCL = &mockIgcFtrWa; mockIgcFtrWa.maxOCLParamSize = 0u; pDevice->initializeCaps(); EXPECT_EQ(2048u, pDevice->getDeviceInfo().maxParameterSize); mockIgcFtrWa.maxOCLParamSize = 1u; pDevice->initializeCaps(); EXPECT_EQ(1u, pDevice->getDeviceInfo().maxParameterSize); } TEST_F(DeviceGetCapsTest, givenImplicitScalingWhenInitializeCapsIsCalledThenMaxMemAllocSizeIsSetCorrectly) { DebugManagerStateRestore dbgRestorer; debugManager.flags.CreateMultipleSubDevices.set(4); pDevice->deviceBitfield = 15; debugManager.flags.EnableWalkerPartition.set(1); pDevice->initializeCaps(); EXPECT_EQ(pDevice->getDeviceInfo().maxMemAllocSize, pDevice->getDeviceInfo().globalMemSize); debugManager.flags.EnableWalkerPartition.set(0); pDevice->initializeCaps(); EXPECT_LE(pDevice->getDeviceInfo().maxMemAllocSize, pDevice->getDeviceInfo().globalMemSize); } TEST_F(DeviceGetCapsTest, givenImplicitScalingTrueWhenInitializeCapsIsCalledThenMaxMemAllocSizeIsSetCorrectly) { DebugManagerStateRestore dbgRestorer; debugManager.flags.CreateMultipleSubDevices.set(4); pDevice->deviceBitfield = 15; debugManager.flags.EnableImplicitScaling.set(1); debugManager.flags.EnableWalkerPartition.set(1); pDevice->initializeCaps(); EXPECT_EQ(pDevice->getDeviceInfo().maxMemAllocSize, pDevice->getDeviceInfo().globalMemSize); } TEST_F(DeviceGetCapsTest, givenImplicitScalingFalseWhenInitializeCapsIsCalledThenMaxMemAllocSizeIsSetCorrectly) { DebugManagerStateRestore dbgRestorer; debugManager.flags.CreateMultipleSubDevices.set(4); pDevice->deviceBitfield = 15; debugManager.flags.EnableImplicitScaling.set(0); debugManager.flags.EnableWalkerPartition.set(1); pDevice->initializeCaps(); EXPECT_LE(pDevice->getDeviceInfo().maxMemAllocSize, pDevice->getDeviceInfo().globalMemSize); } TEST_F(DeviceGetCapsTest, givenDontForcePreemptionModeDebugVariableWhenCreateDeviceThenSetDefaultHwPreemptionMode) { DebugManagerStateRestore dbgRestorer; { debugManager.flags.ForcePreemptionMode.set(-1); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); EXPECT_TRUE(device->getHardwareInfo().capabilityTable.defaultPreemptionMode == device->getPreemptionMode()); } } TEST_F(DeviceGetCapsTest, givenDebugFlagSetWhenCreatingDeviceInfoThenOverrideProfilingTimerResolution) { DebugManagerStateRestore dbgRestorer; debugManager.flags.OverrideProfilingTimerResolution.set(123); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); EXPECT_EQ(double(123), device->getDeviceInfo().profilingTimerResolution); EXPECT_EQ(123u, device->getDeviceInfo().outProfilingTimerResolution); } TEST_F(DeviceGetCapsTest, givenForcePreemptionModeDebugVariableWhenCreateDeviceThenSetForcedMode) { DebugManagerStateRestore dbgRestorer; { PreemptionMode forceMode = PreemptionMode::MidThread; if (defaultHwInfo->capabilityTable.defaultPreemptionMode == forceMode) { // force non-default mode forceMode = PreemptionMode::ThreadGroup; } debugManager.flags.ForcePreemptionMode.set((int32_t)forceMode); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); EXPECT_TRUE(forceMode == device->getPreemptionMode()); } } TEST_F(DeviceGetCapsTest, givenDeviceWithMidThreadPreemptionWhenDeviceIsCreatedThenSipKernelIsNotCreated) { VariableBackup mockSipBackup(&MockSipData::useMockSip, false); DebugManagerStateRestore dbgRestorer; { auto builtIns = new MockBuiltins(); MockSipData::called = false; debugManager.flags.ForcePreemptionMode.set((int32_t)PreemptionMode::MidThread); auto executionEnvironment = new ExecutionEnvironment(); executionEnvironment->prepareRootDeviceEnvironments(1); MockRootDeviceEnvironment::resetBuiltins(executionEnvironment->rootDeviceEnvironments[0u].get(), builtIns); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(defaultHwInfo.get(), executionEnvironment, 0u)); ASSERT_EQ(builtIns, device->getBuiltIns()); EXPECT_FALSE(MockSipData::called); } } TEST_F(DeviceGetCapsTest, whenDriverModelHasLimitationForMaxMemoryAllocationSizeThenTakeItIntoAccount) { DebugManagerStateRestore dbgRestorer; size_t maxAllocSizeTestValue = 512; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); device->executionEnvironment->rootDeviceEnvironments[0]->osInterface.reset(new NEO::OSInterface()); auto driverModel = std::make_unique(); driverModel->maxAllocSize = maxAllocSizeTestValue; device->executionEnvironment->rootDeviceEnvironments[0]->osInterface->setDriverModel(std::move(driverModel)); device->initializeCaps(); const auto &caps = device->getDeviceInfo(); EXPECT_EQ(maxAllocSizeTestValue, caps.maxMemAllocSize); } TEST_F(DeviceGetCapsTest, WhenDeviceIsCreatedThenVmeIsEnabled) { DebugSettingsManager freshDebugSettingsManager(""); EXPECT_TRUE(freshDebugSettingsManager.flags.EnableIntelVme.get()); } TEST(DeviceGetCapsSimpleTest, givenVariousOclVersionsWhenCapsAreCreatedThenDeviceReportsSpirvAsSupportedIl) { DebugManagerStateRestore dbgRestorer; int32_t oclVersionsToTest[] = {12, 21, 30}; for (auto oclVersion : oclVersionsToTest) { debugManager.flags.ForceOCLVersion.set(oclVersion); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); const auto &caps = device->getDeviceInfo(); EXPECT_STREQ("SPIR-V_1.3 SPIR-V_1.2 SPIR-V_1.1 SPIR-V_1.0 ", caps.ilVersion); } } TEST(DeviceGetCapsSimpleTest, givenDebugFlagToSetWorkgroupSizeWhenDeviceIsCreatedThenItUsesThatWorkgroupSize) { DebugManagerStateRestore dbgRestorer; debugManager.flags.OverrideMaxWorkgroupSize.set(16u); HardwareInfo myHwInfo = *defaultHwInfo; GT_SYSTEM_INFO &mySysInfo = myHwInfo.gtSystemInfo; mySysInfo.EUCount = 24; mySysInfo.SubSliceCount = 3; mySysInfo.ThreadCount = 24 * 7; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&myHwInfo)); EXPECT_EQ(16u, device->getDeviceInfo().maxWorkGroupSize); } TEST_F(DeviceGetCapsTest, givenFlagEnabled64kbPagesWhenCallConstructorMemoryManagerThenReturnCorrectValue) { DebugManagerStateRestore dbgRestore; VariableBackup osEnabled64kbPagesBackup(&OSInterface::osEnabled64kbPages); class MockMemoryManager : public MemoryManager { public: MockMemoryManager(ExecutionEnvironment &executionEnvironment) : MemoryManager(executionEnvironment) {} void addAllocationToHostPtrManager(GraphicsAllocation *memory) override{}; void removeAllocationFromHostPtrManager(GraphicsAllocation *memory) override{}; GraphicsAllocation *createGraphicsAllocationFromMultipleSharedHandles(const std::vector &handles, AllocationProperties &properties, bool requireSpecificBitness, bool isHostIpcAllocation, bool reuseSharedAllocation, void *mapPointer) override { return nullptr; } GraphicsAllocation *createGraphicsAllocationFromSharedHandle(const OsHandleData &osHandleData, const AllocationProperties &properties, bool requireSpecificBitness, bool isHostIpcAllocation, bool reuseSharedAllocation, void *mapPointer) override { return nullptr; }; AllocationStatus populateOsHandles(OsHandleStorage &handleStorage, uint32_t rootDeviceIndex) override { return AllocationStatus::Success; }; void cleanOsHandles(OsHandleStorage &handleStorage, uint32_t rootDeviceIndex) override{}; void freeGraphicsMemoryImpl(GraphicsAllocation *gfxAllocation) override{}; void freeGraphicsMemoryImpl(GraphicsAllocation *gfxAllocation, bool isImportedAllocation) override{}; uint64_t getSystemSharedMemory(uint32_t rootDeviceIndex) override { return 0; }; uint64_t getLocalMemorySize(uint32_t rootDeviceIndex, uint32_t deviceBitfield) override { return 0; }; double getPercentOfGlobalMemoryAvailable(uint32_t rootDeviceIndex) override { return 0; } AddressRange reserveGpuAddress(const uint64_t requiredStartAddress, size_t size, RootDeviceIndicesContainer rootDeviceIndices, uint32_t *reservedOnRootDeviceIndex) override { return {}; } AddressRange reserveGpuAddressOnHeap(const uint64_t requiredStartAddress, size_t size, RootDeviceIndicesContainer rootDeviceIndices, uint32_t *reservedOnRootDeviceIndex, HeapIndex heap, size_t alignment) override { return {}; } size_t selectAlignmentAndHeap(size_t size, HeapIndex *heap) override { *heap = HeapIndex::heapStandard; return MemoryConstants::pageSize64k; } void freeGpuAddress(AddressRange addressRange, uint32_t rootDeviceIndex) override{}; AddressRange reserveCpuAddress(const uint64_t requiredStartAddress, size_t size) override { return {}; } void freeCpuAddress(AddressRange addressRange) override{}; GraphicsAllocation *createGraphicsAllocation(OsHandleStorage &handleStorage, const AllocationData &allocationData) override { return nullptr; }; GraphicsAllocation *allocateGraphicsMemoryForNonSvmHostPtr(const AllocationData &allocationData) override { return nullptr; }; GraphicsAllocation *allocateGraphicsMemoryWithAlignment(const AllocationData &allocationData) override { return nullptr; }; GraphicsAllocation *allocateUSMHostGraphicsMemory(const AllocationData &allocationData) override { return nullptr; }; GraphicsAllocation *allocateGraphicsMemory64kb(const AllocationData &allocationData) override { return nullptr; }; GraphicsAllocation *allocate32BitGraphicsMemoryImpl(const AllocationData &allocationData) override { return nullptr; }; GraphicsAllocation *allocateGraphicsMemoryInDevicePool(const AllocationData &allocationData, AllocationStatus &status) override { return nullptr; }; GraphicsAllocation *allocateGraphicsMemoryWithGpuVa(const AllocationData &allocationData) override { return nullptr; }; GraphicsAllocation *allocatePhysicalDeviceMemory(const AllocationData &allocationData, AllocationStatus &status) override { return nullptr; }; GraphicsAllocation *allocatePhysicalLocalDeviceMemory(const AllocationData &allocationData, AllocationStatus &status) override { return nullptr; }; void unMapPhysicalToVirtualMemory(GraphicsAllocation *physicalAllocation, uint64_t gpuRange, size_t bufferSize, OsContext *osContext, uint32_t rootDeviceIndex) override { return; }; bool mapPhysicalToVirtualMemory(GraphicsAllocation *physicalAllocation, uint64_t gpuRange, size_t bufferSize) override { return false; }; GraphicsAllocation *allocateGraphicsMemoryForImageImpl(const AllocationData &allocationData, std::unique_ptr gmm) override { return nullptr; }; GraphicsAllocation *allocateMemoryByKMD(const AllocationData &allocationData) override { return nullptr; }; void *lockResourceImpl(GraphicsAllocation &graphicsAllocation) override { return nullptr; }; void unlockResourceImpl(GraphicsAllocation &graphicsAllocation) override{}; }; MockExecutionEnvironment executionEnvironment; executionEnvironment.prepareRootDeviceEnvironments(1); auto &capabilityTable = executionEnvironment.rootDeviceEnvironments[0]->getMutableHardwareInfo()->capabilityTable; std::unique_ptr memoryManager; debugManager.flags.Enable64kbpages.set(-1); capabilityTable.ftr64KBpages = false; OSInterface::osEnabled64kbPages = false; memoryManager.reset(new MockMemoryManager(executionEnvironment)); EXPECT_FALSE(memoryManager->peek64kbPagesEnabled(0u)); capabilityTable.ftr64KBpages = false; OSInterface::osEnabled64kbPages = true; memoryManager.reset(new MockMemoryManager(executionEnvironment)); EXPECT_FALSE(memoryManager->peek64kbPagesEnabled(0u)); capabilityTable.ftr64KBpages = true; OSInterface::osEnabled64kbPages = false; memoryManager.reset(new MockMemoryManager(executionEnvironment)); EXPECT_FALSE(memoryManager->peek64kbPagesEnabled(0u)); capabilityTable.ftr64KBpages = true; OSInterface::osEnabled64kbPages = true; memoryManager.reset(new MockMemoryManager(executionEnvironment)); EXPECT_TRUE(memoryManager->peek64kbPagesEnabled(0u)); debugManager.flags.Enable64kbpages.set(0); // force false memoryManager.reset(new MockMemoryManager(executionEnvironment)); EXPECT_FALSE(memoryManager->peek64kbPagesEnabled(0u)); debugManager.flags.Enable64kbpages.set(1); // force true memoryManager.reset(new MockMemoryManager(executionEnvironment)); EXPECT_TRUE(memoryManager->peek64kbPagesEnabled(0u)); } using DeviceTests = ::testing::Test; TEST_F(DeviceTests, givenDispatchGlobalsAllocationFailsOnSecondSubDeviceThenRtDispatchGlobalsInfoIsNull) { class FailMockMemoryManager : public MockMemoryManager { public: FailMockMemoryManager(NEO::ExecutionEnvironment &executionEnvironment) : MockMemoryManager(false, false, executionEnvironment) {} GraphicsAllocation *allocateGraphicsMemoryWithProperties(const AllocationProperties &properties) override { allocateGraphicsMemoryWithPropertiesCount++; if (allocateGraphicsMemoryWithPropertiesCount > 2) { return nullptr; } else { return MockMemoryManager::allocateGraphicsMemoryWithProperties(properties); } } }; DebugManagerStateRestore restorer; debugManager.flags.EnableWalkerPartition.set(-1); debugManager.flags.CreateMultipleSubDevices.set(2u); UltDeviceFactory deviceFactory{1, 2}; ExecutionEnvironment &executionEnvironment = *deviceFactory.rootDevices[0]->executionEnvironment; executionEnvironment.memoryManager = std::make_unique(executionEnvironment); deviceFactory.rootDevices[0]->initializeRayTracing(5); auto rtDispatchGlobalsInfo = deviceFactory.rootDevices[0]->getRTDispatchGlobals(5); EXPECT_EQ(nullptr, rtDispatchGlobalsInfo); } TEST_F(DeviceTests, givenMtPreemptionEnabledWhenCreatingRootCsrThenCreatePreemptionAllocation) { DebugManagerStateRestore restorer; debugManager.flags.CreateMultipleSubDevices.set(2); debugManager.flags.ForcePreemptionMode.set(4); UltDeviceFactory deviceFactory{1, 2}; EXPECT_TRUE(deviceFactory.rootDevices[0]->getDefaultEngine().osContext->isRootDevice()); EXPECT_NE(nullptr, deviceFactory.rootDevices[0]->getDefaultEngine().commandStreamReceiver->getPreemptionAllocation()); } TEST_F(DeviceTests, givenPreemptionModeWhenOverridePreemptionModeThenProperlySet) { auto newPreemptionMode = PreemptionMode::ThreadGroup; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); device->overridePreemptionMode(newPreemptionMode); EXPECT_EQ(newPreemptionMode, device->getPreemptionMode()); newPreemptionMode = PreemptionMode::Disabled; device->overridePreemptionMode(newPreemptionMode); EXPECT_EQ(newPreemptionMode, device->getPreemptionMode()); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZexNumberOfCssEnvVariableDefinedWhenDeviceIsCreatedThenCreateDevicesWithProperCcsCount) { VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; debugManager.flags.ZEX_NUMBER_OF_CCS.set("0:4,1:1,2:2,3:1"); debugManager.flags.SetCommandStreamReceiver.set(1); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo, false, 4); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{4, 0, executionEnvironment}; { auto device = deviceFactory.rootDevices[0]; auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; auto expectedNumberOfCcs = std::min(4u, defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled); EXPECT_EQ(expectedNumberOfCcs, computeEngineGroup.engines.size()); } { auto device = deviceFactory.rootDevices[1]; auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; EXPECT_EQ(1u, computeEngineGroup.engines.size()); } { auto device = deviceFactory.rootDevices[2]; auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; auto expectedNumberOfCcs = std::min(2u, defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled); EXPECT_EQ(expectedNumberOfCcs, computeEngineGroup.engines.size()); } { auto device = deviceFactory.rootDevices[3]; auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; EXPECT_EQ(1u, computeEngineGroup.engines.size()); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenDeviceIsCreatedWithZexNumberOfCssEnvVariableDefinedAndHwInfoCcsCountIsSetToDefaultWhenAdjustCcsCountForSpecificRootDeviceIsInvokedThenVerifyHwInfoCcsCountIsRestored) { VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; debugManager.flags.ZEX_NUMBER_OF_CCS.set("0:1,1:2"); debugManager.flags.SetCommandStreamReceiver.set(1); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo, false, 2); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{1, 0, executionEnvironment}; { auto hardwareInfo = executionEnvironment.rootDeviceEnvironments[0]->getMutableHardwareInfo(); hardwareInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled = defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled; executionEnvironment.adjustCcsCount(0); EXPECT_EQ(1u, hardwareInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled); } { auto hardwareInfo = executionEnvironment.rootDeviceEnvironments[1]->getMutableHardwareInfo(); hardwareInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled = defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled; executionEnvironment.adjustCcsCount(1); EXPECT_EQ(std::min(2u, defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled), hardwareInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled); } } HWTEST2_F(DeviceTests, givenDeviceIsCreatedWithAmbiguousZexNumberOfCssEnvVariableAndHwInfoCcsCountIsModifiedWhenAdjustCcsCountForSpecificDeviceIsInvokedThenVerifyCcsCountIsAdjustedToOne, IsPVC) { VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; debugManager.flags.SetCommandStreamReceiver.set(1); for (const auto &numberOfCcsString : {"default", "", "0"}) { debugManager.flags.ZEX_NUMBER_OF_CCS.set(numberOfCcsString); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{1, 0, executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; EXPECT_EQ(1u, computeEngineGroup.engines.size()); auto hardwareInfo = executionEnvironment.rootDeviceEnvironments[0]->getMutableHardwareInfo(); hardwareInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled = defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled; executionEnvironment.adjustCcsCount(0); EXPECT_EQ(1u, hardwareInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZexNumberOfCssAndZeAffinityMaskSetWhenDeviceIsCreatedThenProperNumberOfCcsIsExposed) { VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; debugManager.flags.CreateMultipleRootDevices.set(2); debugManager.flags.ZE_AFFINITY_MASK.set("1"); debugManager.flags.ZEX_NUMBER_OF_CCS.set("0:1,1:2"); debugManager.flags.SetCommandStreamReceiver.set(1); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo, false, 2); executionEnvironment.incRefInternal(); auto devices = DeviceFactory::createDevices(executionEnvironment); { auto device = devices[0].get(); EXPECT_EQ(0u, device->getRootDeviceIndex()); auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; EXPECT_EQ(1u, computeEngineGroup.engines.size()); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZeAffinityMaskSetAndTilesAsDevicesModelThenProperSubDeviceHierarchyMapisSet) { std::unordered_map mockableEnvs = {{"ZE_FLAT_DEVICE_HIERARCHY", "FLAT"}}; VariableBackup *> mockableEnvValuesBackup(&IoFunctions::mockableEnvValues, &mockableEnvs); VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; uint32_t numRootDevices = 4; uint32_t numSubDevices = 4; debugManager.flags.CreateMultipleRootDevices.set(numRootDevices); debugManager.flags.CreateMultipleSubDevices.set(numSubDevices); uint32_t expectedRootDevices = 4; debugManager.flags.ZE_AFFINITY_MASK.set("0,3,4,1.1,9,15,25"); debugManager.flags.SetCommandStreamReceiver.set(1); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo, false, numRootDevices); executionEnvironment.incRefInternal(); auto devices = DeviceFactory::createDevices(executionEnvironment); EXPECT_EQ(devices.size(), expectedRootDevices); std::vector expectedRootDeviceIndices = {0, 0, 1, 2}; std::vector expectedSubDeviceIndices = {0, 3, 0, 1}; for (uint32_t i = 0u; i < devices.size(); i++) { std::tuple subDeviceMap; EXPECT_TRUE(executionEnvironment.getSubDeviceHierarchy(i, &subDeviceMap)); auto hwRootDeviceIndex = std::get<0>(subDeviceMap); auto hwSubDeviceIndex = std::get<1>(subDeviceMap); auto hwSubDevicesCount = std::get<2>(subDeviceMap); EXPECT_EQ(hwRootDeviceIndex, expectedRootDeviceIndices[i]); EXPECT_EQ(hwSubDeviceIndex, expectedSubDeviceIndices[i]); EXPECT_EQ(hwSubDevicesCount, numSubDevices); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZeAffinityMaskSetThenProperSubDeviceHierarchyMapIsSet) { std::unordered_map mockableEnvs = {{"ZE_FLAT_DEVICE_HIERARCHY", "COMPOSITE"}}; VariableBackup *> mockableEnvValuesBackup(&IoFunctions::mockableEnvValues, &mockableEnvs); VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; uint32_t numRootDevices = 4; uint32_t numSubDevices = 4; debugManager.flags.CreateMultipleRootDevices.set(numRootDevices); debugManager.flags.CreateMultipleSubDevices.set(numSubDevices); uint32_t expectedRootDevices = 4; debugManager.flags.ZE_AFFINITY_MASK.set("0.2,1.2,2.3,3.3,15,25"); debugManager.flags.SetCommandStreamReceiver.set(1); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo, false, numRootDevices); executionEnvironment.incRefInternal(); auto devices = DeviceFactory::createDevices(executionEnvironment); EXPECT_EQ(devices.size(), expectedRootDevices); std::vector expectedRootDeviceIndices = {0, 1, 2, 3}; std::vector expectedSubDeviceIndices = {2, 2, 3, 3}; for (uint32_t i = 0u; i < devices.size(); i++) { std::tuple subDeviceMap; EXPECT_TRUE(executionEnvironment.getSubDeviceHierarchy(i, &subDeviceMap)); auto hwRootDeviceIndex = std::get<0>(subDeviceMap); auto hwSubDeviceIndex = std::get<1>(subDeviceMap); auto hwSubDevicesCount = std::get<2>(subDeviceMap); EXPECT_EQ(hwRootDeviceIndex, expectedRootDeviceIndices[i]); EXPECT_EQ(hwSubDeviceIndex, expectedSubDeviceIndices[i]); EXPECT_EQ(hwSubDevicesCount, numSubDevices); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZeAffinityMaskSetWithoutTilesThenProperSubDeviceHierarchyMapisUnset) { std::unordered_map mockableEnvs = {{"ZE_FLAT_DEVICE_HIERARCHY", "COMPOSITE"}}; VariableBackup *> mockableEnvValuesBackup(&IoFunctions::mockableEnvValues, &mockableEnvs); VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; uint32_t numRootDevices = 4; uint32_t numSubDevices = 4; debugManager.flags.CreateMultipleRootDevices.set(numRootDevices); debugManager.flags.CreateMultipleSubDevices.set(numSubDevices); uint32_t expectedRootDevices = 4; debugManager.flags.ZE_AFFINITY_MASK.set("0,1,2,3,15,25"); debugManager.flags.SetCommandStreamReceiver.set(1); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo, false, numRootDevices); executionEnvironment.incRefInternal(); auto devices = DeviceFactory::createDevices(executionEnvironment); EXPECT_EQ(devices.size(), expectedRootDevices); for (uint32_t i = 0u; i < devices.size(); i++) { std::tuple subDeviceMap; EXPECT_FALSE(executionEnvironment.getSubDeviceHierarchy(i, &subDeviceMap)); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZeAffinityMaskSetWhenAllocateRTDispatchGlobalsIsCalledThenRTDispatchGlobalsIsAllocated) { std::unordered_map mockableEnvs = {{"ZE_FLAT_DEVICE_HIERARCHY", "COMPOSITE"}}; VariableBackup *> mockableEnvValuesBackup(&IoFunctions::mockableEnvValues, &mockableEnvs); VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; uint32_t numRootDevices = 4; uint32_t numSubDevices = 4; debugManager.flags.CreateMultipleRootDevices.set(numRootDevices); debugManager.flags.CreateMultipleSubDevices.set(numSubDevices); uint32_t expectedRootDevices = 4; debugManager.flags.ZE_AFFINITY_MASK.set("0.2,1.2,2.3,3.3"); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo, false, numRootDevices); executionEnvironment.incRefInternal(); auto devices = DeviceFactory::createDevices(executionEnvironment); EXPECT_EQ(devices.size(), expectedRootDevices); for (uint32_t i = 0u; i < devices.size(); i++) { devices[0]->initializeRayTracing(5); EXPECT_NE(nullptr, devices[0]->getRTDispatchGlobals(3)); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZexNumberOfCssEnvVariableIsLargerThanNumberOfAvailableCcsCountWhenDeviceIsCreatedThenCreateDevicesWithAvailableCcsCount) { VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; debugManager.flags.ZEX_NUMBER_OF_CCS.set("0:13"); debugManager.flags.SetCommandStreamReceiver.set(1); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{1, 0, executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; EXPECT_EQ(defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled, computeEngineGroup.engines.size()); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenZexNumberOfCssEnvVariableSetAmbigouslyWhenDeviceIsCreatedThenDontApplyAnyLimitations) { VariableBackup backup(&ultHwConfig); ultHwConfig.useMockedPrepareDeviceEnvironmentsFunc = false; DebugManagerStateRestore restorer; debugManager.flags.SetCommandStreamReceiver.set(1); for (const auto &numberOfCcsString : {"default", "", "0"}) { debugManager.flags.ZEX_NUMBER_OF_CCS.set(numberOfCcsString); auto hwInfo = *defaultHwInfo; MockExecutionEnvironment executionEnvironment(&hwInfo); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{1, 0, executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto computeEngineGroupIndex = device->getEngineGroupIndexFromEngineGroupType(EngineGroupType::compute); auto computeEngineGroup = device->getRegularEngineGroups()[computeEngineGroupIndex]; EXPECT_EQ(defaultHwInfo->gtSystemInfo.CCSInfo.NumberOfCCSEnabled, computeEngineGroup.engines.size()); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenDebuggableOsContextWhenDeviceCreatesEnginesThenDeviceIsInitializedWithFirstSubmission) { VariableBackup backup(&ultHwConfig); ultHwConfig.useFirstSubmissionInitDevice = true; auto hwInfo = *defaultHwInfo; auto releaseHelper = ReleaseHelper::create(hwInfo.ipVersion); hardwareInfoSetup[hwInfo.platform.eProductFamily](&hwInfo, true, 0, releaseHelper.get()); MockExecutionEnvironment executionEnvironment(&hwInfo); executionEnvironment.memoryManager.reset(new MockMemoryManagerWithDebuggableOsContext(executionEnvironment)); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{1, 0, executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto csr = device->allEngines[device->defaultEngineIndex].commandStreamReceiver; EXPECT_EQ(1u, csr->peekLatestSentTaskCount()); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, whenDeviceCreatesEnginesThenDeviceIsInitializedWithFirstSubmission) { VariableBackup backup(&ultHwConfig); ultHwConfig.useFirstSubmissionInitDevice = true; auto hwInfo = *defaultHwInfo; auto releaseHelper = ReleaseHelper::create(hwInfo.ipVersion); hardwareInfoSetup[hwInfo.platform.eProductFamily](&hwInfo, true, 0, releaseHelper.get()); MockExecutionEnvironment executionEnvironment(&hwInfo); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{1, 0, executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto csr = device->allEngines[device->defaultEngineIndex].commandStreamReceiver; if (device->isInitDeviceWithFirstSubmissionSupported(csr->getType())) { EXPECT_EQ(1u, csr->peekLatestSentTaskCount()); } } TEST(FailDeviceTest, GivenFailedDeviceWhenCreatingDeviceThenNullIsReturned) { auto hwInfo = defaultHwInfo.get(); DebugManagerStateRestore dbgRestore; debugManager.flags.ForcePreemptionMode.set(static_cast(NEO::PreemptionMode::Disabled)); auto pDevice = MockDevice::createWithNewExecutionEnvironment(hwInfo); EXPECT_EQ(nullptr, pDevice); } TEST(FailDeviceTest, GivenMidThreadPreemptionAndFailedDeviceWhenCreatingDeviceThenNullIsReturned) { VariableBackup backupSipInitType(&MockSipData::useMockSip, true); VariableBackup mockSipCalled(&NEO::MockSipData::called, false); DebugManagerStateRestore dbgRestore; debugManager.flags.ForcePreemptionMode.set(static_cast(PreemptionMode::MidThread)); auto pDevice = MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get()); EXPECT_EQ(nullptr, pDevice); } TEST_F(DeviceTests, givenDeviceMidThreadPreemptionWhenDebuggerDisabledThenStateSipRequired) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); device->setPreemptionMode(NEO::PreemptionMode::MidThread); EXPECT_TRUE(device->isStateSipRequired()); } TEST_F(DeviceTests, givenDeviceThreadGroupPreemptionWhenDebuggerEnabledThenStateSipRequired) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); device->setPreemptionMode(NEO::PreemptionMode::ThreadGroup); device->getExecutionEnvironment()->rootDeviceEnvironments[0]->initDebuggerL0(device.get()); EXPECT_TRUE(device->isStateSipRequired()); } TEST_F(DeviceTests, givenDeviceThreadGroupPreemptionWhenDebuggerDisabledThenStateSipNotRequired) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); device->setPreemptionMode(NEO::PreemptionMode::ThreadGroup); EXPECT_FALSE(device->isStateSipRequired()); } TEST_F(DeviceTests, WhenIsStateSipRequiredIsCalledThenCorrectValueIsReturned) { struct MockRootDeviceEnvironment : RootDeviceEnvironment { using RootDeviceEnvironment::RootDeviceEnvironment; CompilerInterface *getCompilerInterface() override { return compilerInterfaceReturnValue; } CompilerInterface *compilerInterfaceReturnValue = nullptr; }; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); auto mockRootDeviceEnvironment = new MockRootDeviceEnvironment{*device->executionEnvironment}; auto backupenv = device->executionEnvironment->rootDeviceEnvironments[0].release(); device->executionEnvironment->rootDeviceEnvironments[0].reset(mockRootDeviceEnvironment); device->executionEnvironment->rootDeviceEnvironments[0]->compilerInterface.release(); device->executionEnvironment->rootDeviceEnvironments[0]->debugger.release(); std::array, 8> testParameters = { {{PreemptionMode::Disabled, nullptr, nullptr, false}, {PreemptionMode::MidThread, nullptr, nullptr, false}, {PreemptionMode::Disabled, (Debugger *)0x1234, nullptr, false}, {PreemptionMode::MidThread, (Debugger *)0x1234, nullptr, false}, {PreemptionMode::Disabled, nullptr, (CompilerInterface *)0x1234, false}, {PreemptionMode::MidThread, nullptr, (CompilerInterface *)0x1234, true}, {PreemptionMode::Disabled, (Debugger *)0x1234, (CompilerInterface *)0x1234, true}, {PreemptionMode::MidThread, (Debugger *)0x1234, (CompilerInterface *)0x1234, true}}}; for (const auto &[preemptionMode, debugger, compilerInterface, expectedResult] : testParameters) { device->setPreemptionMode(preemptionMode); device->executionEnvironment->rootDeviceEnvironments[0]->debugger.release(); device->executionEnvironment->rootDeviceEnvironments[0]->debugger.reset(debugger); mockRootDeviceEnvironment->compilerInterfaceReturnValue = compilerInterface; EXPECT_EQ(expectedResult, device->isStateSipRequired()); } device->executionEnvironment->rootDeviceEnvironments[0]->debugger.release(); mockRootDeviceEnvironment->compilerInterfaceReturnValue = nullptr; delete device->executionEnvironment->rootDeviceEnvironments[0].release(); device->executionEnvironment->rootDeviceEnvironments[0].reset(backupenv); } HWTEST2_F(DeviceTests, GivenXeHpAndLaterThenDefaultPreemptionModeIsThreadGroup, IsWithinXeGfxFamily) { EXPECT_EQ(PreemptionMode::ThreadGroup, defaultHwInfo->capabilityTable.defaultPreemptionMode); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTest, GivenXeHpAndLaterThenProfilingTimerResolutionIs83) { const auto &caps = pDevice->getDeviceInfo(); EXPECT_EQ(83u, caps.outProfilingTimerResolution); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, GivenXeHpAndLaterThenKmdNotifyIsDisabled) { EXPECT_FALSE(defaultHwInfo->capabilityTable.kmdNotifyProperties.enableKmdNotify); EXPECT_EQ(0, defaultHwInfo->capabilityTable.kmdNotifyProperties.delayKmdNotifyMicroseconds); EXPECT_FALSE(defaultHwInfo->capabilityTable.kmdNotifyProperties.enableQuickKmdSleep); EXPECT_EQ(0, defaultHwInfo->capabilityTable.kmdNotifyProperties.delayQuickKmdSleepMicroseconds); EXPECT_FALSE(defaultHwInfo->capabilityTable.kmdNotifyProperties.enableQuickKmdSleepForSporadicWaits); EXPECT_EQ(0, defaultHwInfo->capabilityTable.kmdNotifyProperties.delayQuickKmdSleepForSporadicWaitsMicroseconds); EXPECT_FALSE(defaultHwInfo->capabilityTable.kmdNotifyProperties.enableQuickKmdSleepForDirectSubmission); EXPECT_EQ(0, defaultHwInfo->capabilityTable.kmdNotifyProperties.delayQuickKmdSleepForDirectSubmissionMicroseconds); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, GivenXeHpAndLaterThenCompressionFeatureFlagIsFalse) { EXPECT_FALSE(defaultHwInfo->capabilityTable.ftrRenderCompressedBuffers); EXPECT_FALSE(defaultHwInfo->capabilityTable.ftrRenderCompressedImages); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTest, givenHwInfoWhenRequestedComputeUnitsUsedForScratchThenReturnValidValue) { const auto &hwInfo = pDevice->getHardwareInfo(); auto &gfxCoreHelper = pDevice->getRootDeviceEnvironment().getHelper(); auto &productHelper = pDevice->getProductHelper(); const uint32_t multiplyFactor = productHelper.getThreadEuRatioForScratch(hwInfo) / 8u; const uint32_t numThreadsPerEu = (hwInfo.gtSystemInfo.ThreadCount / hwInfo.gtSystemInfo.EUCount) * multiplyFactor; uint32_t expectedValue = productHelper.computeMaxNeededSubSliceSpace(hwInfo) * hwInfo.gtSystemInfo.MaxEuPerSubSlice * numThreadsPerEu; EXPECT_EQ(expectedValue, gfxCoreHelper.getComputeUnitsUsedForScratch(pDevice->getRootDeviceEnvironment())); EXPECT_EQ(expectedValue, pDevice->getDeviceInfo().computeUnitsUsedForScratch); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenDebugFlagSetWhenAskingForComputeUnitsForScratchThenReturnNewValue) { DebugManagerStateRestore restore; uint32_t expectedValue = defaultHwInfo->gtSystemInfo.ThreadCount + 11; debugManager.flags.OverrideNumComputeUnitsForScratch.set(static_cast(expectedValue)); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); auto &gfxCoreHelper = device->getRootDeviceEnvironment().getHelper(); EXPECT_EQ(expectedValue, gfxCoreHelper.getComputeUnitsUsedForScratch(device->getRootDeviceEnvironment())); EXPECT_EQ(expectedValue, device->getDeviceInfo().computeUnitsUsedForScratch); } HWTEST2_F(DeviceTests, givenHwInfoWhenSlmSizeIsRequiredThenReturnCorrectValue, IsXeHpgCore) { EXPECT_EQ(64u, defaultHwInfo->capabilityTable.slmSize); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenXeHPAndLaterProductWhenCheckingDeviceEnqueueSupportThenFalseIsReturned) { EXPECT_FALSE(defaultHwInfo->capabilityTable.supportsDeviceEnqueue); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenXeHPAndLaterProductWhenCheckingPipesSupportThenFalseIsReturned) { EXPECT_FALSE(defaultHwInfo->capabilityTable.supportsPipes); } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenXeHPAndLaterProductWhenRequestedVmeFlagsThenReturnFalse) { EXPECT_FALSE(defaultHwInfo->capabilityTable.supportsVme); EXPECT_FALSE(defaultHwInfo->capabilityTable.ftrSupportsVmeAvcTextureSampler); EXPECT_FALSE(defaultHwInfo->capabilityTable.ftrSupportsVmeAvcPreemption); } TEST_F(DeviceTests, whenCheckingPreferredPlatformNameThenNullIsReturned) { EXPECT_EQ(nullptr, defaultHwInfo->capabilityTable.preferredPlatformName); } TEST(Device, givenDifferentEngineTypesWhenIsSecondaryContextEngineTypeCalledThenTrueReturnedForCcsOrBcs) { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); for (uint32_t i = 0; i < static_cast(aub_stream::EngineType::NUM_ENGINES); i++) { auto type = static_cast(i); if (EngineHelpers::isBcs(type) || EngineHelpers::isCcs(type)) { EXPECT_TRUE(device->isSecondaryContextEngineType(type)); } else { EXPECT_FALSE(device->isSecondaryContextEngineType(type)); } } } TEST(Device, whenAllocateDebugSurfaceIsCalledThenEachSubDeviceContainsCorrectDebugSurface) { DebugManagerStateRestore dbgRestorer; debugManager.flags.CreateMultipleSubDevices.set(4); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(defaultHwInfo.get())); size_t size = 8u; device->allocateDebugSurface(size); auto *debugSurface = device->getDebugSurface(); for (auto *subDevice : device->getSubDevices()) { EXPECT_EQ(debugSurface, subDevice->getDebugSurface()); } } HWCMDTEST_F(IGFX_XE_HP_CORE, DeviceTests, givenCCSEngineAndContextGroupSizeEnabledWhenCreatingEngineThenItsContextHasContextGroupFlagSet) { DebugManagerStateRestore dbgRestorer; const uint32_t contextGroupSize = 8; debugManager.flags.ContextGroupSize.set(contextGroupSize); HardwareInfo hwInfo = *defaultHwInfo; hwInfo.featureTable.flags.ftrRcsNode = false; hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.featureTable.ftrBcsInfo = 0; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; MockExecutionEnvironment executionEnvironment(&hwInfo, false, 1); executionEnvironment.incRefInternal(); UltDeviceFactory deviceFactory{1, 0, executionEnvironment}; auto defaultEngine = deviceFactory.rootDevices[0]->getDefaultEngine(); EXPECT_NE(nullptr, &defaultEngine); EXPECT_EQ(aub_stream::EngineType::ENGINE_CCS, defaultEngine.getEngineType()); EXPECT_EQ(EngineUsage::regular, defaultEngine.getEngineUsage()); EXPECT_TRUE(defaultEngine.osContext->isPartOfContextGroup()); } HWTEST_F(DeviceTests, givenCCSEnginesAndContextGroupSizeEnabledWhenDeviceIsCreatedThenSecondaryEnginesAreCreated) { DebugManagerStateRestore dbgRestorer; const uint32_t contextGroupSize = 8; debugManager.flags.ContextGroupSize.set(contextGroupSize); HardwareInfo hwInfo = *defaultHwInfo; hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.featureTable.ftrBcsInfo = 0; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; uint32_t numOfCCS[] = {1, 2, 4}; for (size_t i = 0; i < arrayCount(numOfCCS); i++) { hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = numOfCCS[i]; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); auto &engineGroups = device->getRegularEngineGroups(); auto engineGroupType = EngineGroupType::compute; size_t computeEnginesCount = 0; for (const auto &engine : engineGroups) { if (engine.engineGroupType == engineGroupType) { computeEnginesCount = engine.engines.size(); } } if (computeEnginesCount == 0) { GTEST_SKIP(); } ASSERT_EQ(computeEnginesCount, device->secondaryEngines.size()); ASSERT_EQ(contextGroupSize / numOfCCS[i], device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size()); auto defaultEngine = device->getDefaultEngine(); EXPECT_EQ(defaultEngine.commandStreamReceiver, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines[0].commandStreamReceiver); const uint32_t regularContextCount = std::min(contextGroupSize / 2, 4u) / numOfCCS[i]; for (uint32_t ccsIndex = 0; ccsIndex < computeEnginesCount; ccsIndex++) { auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(ccsIndex)]; EXPECT_TRUE(secondaryEngines.engines[0].osContext->isPartOfContextGroup()); EXPECT_EQ(nullptr, secondaryEngines.engines[0].osContext->getPrimaryContext()); for (size_t i = 1; i < device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size(); i++) { EXPECT_EQ(secondaryEngines.engines[0].osContext, secondaryEngines.engines[i].osContext->getPrimaryContext()); EXPECT_TRUE(secondaryEngines.engines[i].osContext->isPartOfContextGroup()); } EXPECT_EQ(0u, secondaryEngines.regularCounter.load()); EXPECT_EQ(0u, secondaryEngines.highPriorityCounter.load()); EXPECT_EQ(regularContextCount, secondaryEngines.regularEnginesTotal); EXPECT_EQ(contextGroupSize / numOfCCS[i] - regularContextCount, secondaryEngines.highPriorityEnginesTotal); for (size_t contextId = 0; contextId < regularContextCount + 1; contextId++) { auto engine = device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::regular}, false); ASSERT_NE(nullptr, engine); EXPECT_EQ(contextId + 1, secondaryEngines.regularCounter.load()); if (contextId == regularContextCount) { EXPECT_EQ(&secondaryEngines.engines[0], engine); } } auto hpCount = contextGroupSize / numOfCCS[i] - regularContextCount; for (size_t contextId = 0; contextId < hpCount + 1; contextId++) { auto engine = device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::highPriority}, false); ASSERT_NE(nullptr, engine); EXPECT_EQ(contextId + 1, secondaryEngines.highPriorityCounter.load()); if (contextId == hpCount) { EXPECT_EQ(&secondaryEngines.engines[regularContextCount], engine); } } } auto internalEngine = device->getInternalEngine(); EXPECT_NE(internalEngine.commandStreamReceiver, device->getSecondaryEngineCsr({aub_stream::EngineType::ENGINE_CCS, EngineUsage::internal}, false)->commandStreamReceiver); } } HWTEST_F(DeviceTests, givenRootDeviceWithCCSEngineAndContextGroupSizeEnabledWhenDeviceIsCreatedThenSecondaryEnginesAreCreated) { if (defaultHwInfo->capabilityTable.defaultEngineType != aub_stream::EngineType::ENGINE_CCS) { GTEST_SKIP(); } DebugManagerStateRestore dbgRestorer; const uint32_t contextGroupSize = 8; debugManager.flags.ContextGroupSize.set(contextGroupSize); debugManager.flags.CreateMultipleSubDevices.set(2); HardwareInfo hwInfo = *defaultHwInfo; hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.featureTable.ftrBcsInfo = 0; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); auto &engineGroups = device->getRegularEngineGroups(); auto engineGroupType = EngineGroupType::compute; size_t computeEnginesCount = 0; for (const auto &engine : engineGroups) { if (engine.engineGroupType == engineGroupType) { computeEnginesCount = engine.engines.size(); } } if (computeEnginesCount == 0) { GTEST_SKIP(); } ASSERT_EQ(computeEnginesCount, device->secondaryEngines.size()); ASSERT_EQ(contextGroupSize, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size()); auto defaultEngine = device->getDefaultEngine(); EXPECT_EQ(defaultEngine.commandStreamReceiver, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines[0].commandStreamReceiver); const uint32_t regularContextCount = std::min(contextGroupSize / 2, 4u); for (uint32_t ccsIndex = 0; ccsIndex < computeEnginesCount; ccsIndex++) { auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(ccsIndex)]; EXPECT_TRUE(secondaryEngines.engines[0].osContext->isPartOfContextGroup()); EXPECT_EQ(nullptr, secondaryEngines.engines[0].osContext->getPrimaryContext()); for (size_t i = 1; i < device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size(); i++) { EXPECT_EQ(secondaryEngines.engines[0].osContext, secondaryEngines.engines[i].osContext->getPrimaryContext()); EXPECT_TRUE(secondaryEngines.engines[i].osContext->isPartOfContextGroup()); } EXPECT_EQ(0u, secondaryEngines.regularCounter.load()); EXPECT_EQ(0u, secondaryEngines.highPriorityCounter.load()); EXPECT_EQ(regularContextCount, secondaryEngines.regularEnginesTotal); EXPECT_EQ(contextGroupSize - regularContextCount, secondaryEngines.highPriorityEnginesTotal); for (size_t contextId = 0; contextId < regularContextCount + 1; contextId++) { auto engine = device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::regular}, false); ASSERT_NE(nullptr, engine); EXPECT_EQ(contextId + 1, secondaryEngines.regularCounter.load()); if (contextId == regularContextCount) { EXPECT_EQ(&secondaryEngines.engines[0], engine); } } for (size_t contextId = 0; contextId < contextGroupSize - regularContextCount + 1; contextId++) { auto engine = device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::highPriority}, false); ASSERT_NE(nullptr, engine); EXPECT_EQ(contextId + 1, secondaryEngines.highPriorityCounter.load()); if (contextId == contextGroupSize - regularContextCount) { EXPECT_EQ(&secondaryEngines.engines[regularContextCount], engine); } } } } HWTEST_F(DeviceTests, givenContextGroupSizeEnabledWhenMoreHpEnginesCreatedThenFreeEnginesAreAssignedUpToHalfOfContextGroup) { DebugManagerStateRestore dbgRestorer; const uint32_t contextGroupSize = 14; debugManager.flags.ContextGroupSize.set(contextGroupSize); HardwareInfo hwInfo = *defaultHwInfo; hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.featureTable.ftrBcsInfo = 0; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); auto &engineGroups = device->getRegularEngineGroups(); auto engineGroupType = EngineGroupType::compute; size_t computeEnginesCount = 0; for (const auto &engine : engineGroups) { if (engine.engineGroupType == engineGroupType) { computeEnginesCount = engine.engines.size(); } } if (computeEnginesCount == 0) { GTEST_SKIP(); } ASSERT_EQ(computeEnginesCount, device->secondaryEngines.size()); ASSERT_EQ(contextGroupSize, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size()); auto defaultEngine = device->getDefaultEngine(); EXPECT_EQ(defaultEngine.commandStreamReceiver, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines[0].commandStreamReceiver); const uint32_t maxHpContextCount = contextGroupSize / 2; for (uint32_t ccsIndex = 0; ccsIndex < computeEnginesCount; ccsIndex++) { auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(ccsIndex)]; EXPECT_TRUE(secondaryEngines.engines[0].osContext->isPartOfContextGroup()); EXPECT_EQ(nullptr, secondaryEngines.engines[0].osContext->getPrimaryContext()); for (size_t i = 1; i < device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size(); i++) { EXPECT_EQ(secondaryEngines.engines[0].osContext, secondaryEngines.engines[i].osContext->getPrimaryContext()); EXPECT_TRUE(secondaryEngines.engines[i].osContext->isPartOfContextGroup()); } EXPECT_EQ(0u, secondaryEngines.regularCounter.load()); EXPECT_EQ(0u, secondaryEngines.highPriorityCounter.load()); auto regularContextCount = secondaryEngines.regularEnginesTotal; EXPECT_EQ(contextGroupSize - regularContextCount, secondaryEngines.highPriorityEnginesTotal); uint32_t npCounter = 0; uint32_t hpCounter = 0; std::vector hpEngines; for (size_t contextId = 0; contextId < maxHpContextCount + 2; contextId++) { if (contextId == 2) { auto engine = device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::regular}, false); ASSERT_NE(nullptr, engine); EXPECT_EQ(1, secondaryEngines.regularCounter.load()); EXPECT_EQ(&secondaryEngines.engines[npCounter], engine); EXPECT_FALSE(secondaryEngines.engines[npCounter].osContext->isHighPriority()); npCounter++; } if (contextId == 6) { auto engine = device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::regular}, false); ASSERT_NE(nullptr, engine); EXPECT_EQ(2, secondaryEngines.regularCounter.load()); EXPECT_EQ(&secondaryEngines.engines[npCounter], engine); EXPECT_FALSE(secondaryEngines.engines[npCounter].osContext->isHighPriority()); npCounter++; } auto engine = device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::highPriority}, false); ASSERT_NE(nullptr, engine); hpEngines.push_back(engine); hpCounter++; if (contextId < secondaryEngines.highPriorityEnginesTotal) { EXPECT_EQ(&secondaryEngines.engines[regularContextCount + hpCounter - 1], engine); EXPECT_TRUE(secondaryEngines.engines[regularContextCount + hpCounter - 1].osContext->isHighPriority()); } else if (contextId >= secondaryEngines.highPriorityEnginesTotal) { if (hpCounter <= maxHpContextCount) { EXPECT_EQ(&secondaryEngines.engines[npCounter], engine); EXPECT_TRUE(secondaryEngines.engines[npCounter].osContext->isHighPriority()); npCounter++; } else { EXPECT_EQ(hpEngines[hpCounter - 1 % maxHpContextCount], engine); EXPECT_TRUE(hpEngines[hpCounter - 1 % maxHpContextCount]->osContext->isHighPriority()); } } } } } HWTEST_F(DeviceTests, givenDebugFlagSetWhenCreatingSecondaryEnginesThenCreateCorrectNumberOfHighPriorityContexts) { DebugManagerStateRestore dbgRestorer; constexpr uint32_t contextGroupSize = 16; constexpr uint32_t numHighPriorityContexts = 6; debugManager.flags.ContextGroupSize.set(contextGroupSize); debugManager.flags.OverrideNumHighPriorityContexts.set(numHighPriorityContexts); HardwareInfo hwInfo = *defaultHwInfo; hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.featureTable.ftrBcsInfo = 0; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; { auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); auto &engineGroups = device->getRegularEngineGroups(); auto engineGroupType = EngineGroupType::compute; size_t computeEnginesCount = 0; for (const auto &engine : engineGroups) { if (engine.engineGroupType == engineGroupType) { computeEnginesCount = engine.engines.size(); } } if (computeEnginesCount == 0) { GTEST_SKIP(); } ASSERT_EQ(computeEnginesCount, device->secondaryEngines.size()); ASSERT_EQ(contextGroupSize, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size()); constexpr uint32_t regularContextCount = contextGroupSize - numHighPriorityContexts; auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(0)]; EXPECT_EQ(regularContextCount, secondaryEngines.regularEnginesTotal); EXPECT_EQ(contextGroupSize - regularContextCount, secondaryEngines.highPriorityEnginesTotal); } { debugManager.flags.OverrideNumHighPriorityContexts.set(0); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); ASSERT_EQ(contextGroupSize, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size()); auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(0)]; EXPECT_EQ(nullptr, secondaryEngines.getEngine(EngineUsage::highPriority)); } { debugManager.flags.OverrideNumHighPriorityContexts.set(contextGroupSize); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); ASSERT_EQ(contextGroupSize, device->secondaryEngines[aub_stream::EngineType::ENGINE_CCS].engines.size()); auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(0)]; EXPECT_EQ(nullptr, secondaryEngines.getEngine(EngineUsage::regular)); } } HWTEST_F(DeviceTests, givenContextGroupEnabledWhenGettingSecondaryEngineThenResourcesAndContextAreInitialized) { HardwareInfo hwInfo = *defaultHwInfo; if (hwInfo.capabilityTable.defaultEngineType != aub_stream::EngineType::ENGINE_CCS) { GTEST_SKIP(); } DebugManagerStateRestore dbgRestorer; debugManager.flags.ContextGroupSize.set(5); hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; hwInfo.capabilityTable.defaultPreemptionMode = PreemptionMode::MidThread; auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); const auto &gfxCoreHelper = device->getRootDeviceEnvironment().getHelper(); const auto ccsIndex = 0; auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(ccsIndex)]; auto secondaryEnginesCount = secondaryEngines.engines.size(); ASSERT_EQ(5u, secondaryEnginesCount); EXPECT_TRUE(secondaryEngines.engines[0].commandStreamReceiver->isInitialized()); EXPECT_EQ(1u, secondaryEngines.engines[0].commandStreamReceiver->peekLatestSentTaskCount()); auto primaryCsr = secondaryEngines.engines[0].commandStreamReceiver; for (uint32_t secondaryIndex = 1; secondaryIndex < secondaryEnginesCount; secondaryIndex++) { EXPECT_FALSE(secondaryEngines.engines[secondaryIndex].osContext->isInitialized()); EXPECT_FALSE(secondaryEngines.engines[secondaryIndex].commandStreamReceiver->isInitialized()); EXPECT_EQ(nullptr, secondaryEngines.engines[secondaryIndex].commandStreamReceiver->getTagAllocation()); EXPECT_EQ(primaryCsr->getGlobalFenceAllocation(), secondaryEngines.engines[secondaryIndex].commandStreamReceiver->getGlobalFenceAllocation()); if (device->getPreemptionMode() == PreemptionMode::MidThread) { EXPECT_EQ(primaryCsr->getPreemptionAllocation(), secondaryEngines.engines[secondaryIndex].commandStreamReceiver->getPreemptionAllocation()); } device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::regular}, false); } for (uint32_t i = 0; i < secondaryEngines.highPriorityEnginesTotal; i++) { device->getSecondaryEngineCsr({EngineHelpers::mapCcsIndexToEngineType(ccsIndex), EngineUsage::highPriority}, false); } for (uint32_t secondaryIndex = 0; secondaryIndex < secondaryEnginesCount; secondaryIndex++) { EXPECT_TRUE(secondaryEngines.engines[secondaryIndex].osContext->isInitialized()); EXPECT_TRUE(secondaryEngines.engines[secondaryIndex].commandStreamReceiver->isInitialized()); EXPECT_NE(nullptr, secondaryEngines.engines[secondaryIndex].commandStreamReceiver->getTagAllocation()); if (gfxCoreHelper.isFenceAllocationRequired(hwInfo)) { EXPECT_NE(nullptr, secondaryEngines.engines[secondaryIndex].commandStreamReceiver->getGlobalFenceAllocation()); } if (device->getPreemptionMode() == PreemptionMode::MidThread) { EXPECT_NE(nullptr, secondaryEngines.engines[secondaryIndex].commandStreamReceiver->getPreemptionAllocation()); } } } HWTEST_F(DeviceTests, givenContextGroupEnabledWhenDeviceIsDestroyedThenSecondaryContextsAreReleased) { HardwareInfo hwInfo = *defaultHwInfo; if (hwInfo.capabilityTable.defaultEngineType != aub_stream::EngineType::ENGINE_CCS) { GTEST_SKIP(); } DebugManagerStateRestore dbgRestorer; debugManager.flags.ContextGroupSize.set(5); hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; auto executionEnvironment = NEO::MockDevice::prepareExecutionEnvironment(&hwInfo, 0u); executionEnvironment->incRefInternal(); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(&hwInfo, executionEnvironment, 0)); auto memoryManager = static_cast(executionEnvironment->memoryManager.get()); const auto ccsIndex = 0; auto &secondaryEngines = device->secondaryEngines[EngineHelpers::mapCcsIndexToEngineType(ccsIndex)]; auto secondaryEnginesCount = secondaryEngines.engines.size(); ASSERT_EQ(5u, secondaryEnginesCount); ASSERT_LE(1u, memoryManager->secondaryEngines.size()); EXPECT_EQ(secondaryEnginesCount - 1, memoryManager->secondaryEngines[0].size()); device.reset(nullptr); EXPECT_EQ(0u, memoryManager->secondaryEngines[0].size()); executionEnvironment->decRefInternal(); } HWTEST_F(DeviceTests, givenContextGroupEnabledAndAllocationUsedBySeconadryContextWhenDeviceIsDestroyedThenNotCompletedAllocationsAreWaitedOn) { HardwareInfo hwInfo = *defaultHwInfo; if (hwInfo.capabilityTable.defaultEngineType != aub_stream::EngineType::ENGINE_CCS) { GTEST_SKIP(); } DebugManagerStateRestore dbgRestorer; debugManager.flags.ContextGroupSize.set(5); hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; auto executionEnvironment = NEO::MockDevice::prepareExecutionEnvironment(&hwInfo, 0u); executionEnvironment->incRefInternal(); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(&hwInfo, executionEnvironment, 0)); auto memoryManager = static_cast(executionEnvironment->memoryManager.get()); EXPECT_NE(device->secondaryEngines.end(), device->secondaryEngines.find(aub_stream::ENGINE_CCS)); auto &secondaryEngines = device->secondaryEngines[aub_stream::ENGINE_CCS]; auto secondaryEnginesCount = secondaryEngines.engines.size(); ASSERT_EQ(5u, secondaryEnginesCount); auto engine = device->getSecondaryEngineCsr({aub_stream::ENGINE_CCS, EngineUsage::regular}, false); ASSERT_NE(nullptr, engine); auto csr = engine->commandStreamReceiver; auto engine2 = device->getSecondaryEngineCsr({aub_stream::ENGINE_CCS, EngineUsage::regular}, false); ASSERT_NE(nullptr, engine2); auto csr2 = engine2->commandStreamReceiver; ASSERT_NE(csr, csr2); auto tagAddress = csr->getTagAddress(); auto tagAddress2 = csr2->getTagAddress(); EXPECT_NE(csr->getOsContext().getContextId(), csr2->getOsContext().getContextId()); EXPECT_NE(tagAddress, tagAddress2); auto usedAllocationAndNotGpuCompleted = memoryManager->allocateGraphicsMemoryWithProperties(MockAllocationProperties{csr->getRootDeviceIndex(), MemoryConstants::pageSize}); usedAllocationAndNotGpuCompleted->updateTaskCount(*tagAddress + 1, csr->getOsContext().getContextId()); auto usedAllocationAndNotGpuCompleted2 = memoryManager->allocateGraphicsMemoryWithProperties(MockAllocationProperties{csr->getRootDeviceIndex(), MemoryConstants::pageSize}); usedAllocationAndNotGpuCompleted2->updateTaskCount(*tagAddress2 + 1, csr2->getOsContext().getContextId()); memoryManager->checkGpuUsageAndDestroyGraphicsAllocations(usedAllocationAndNotGpuCompleted); memoryManager->checkGpuUsageAndDestroyGraphicsAllocations(usedAllocationAndNotGpuCompleted2); EXPECT_TRUE(csr->getTemporaryAllocations().peekIsEmpty()); EXPECT_FALSE(csr->getDeferredAllocations().peekIsEmpty()); EXPECT_EQ(csr->getDeferredAllocations().peekHead(), usedAllocationAndNotGpuCompleted); usedAllocationAndNotGpuCompleted->updateTaskCount(csr->peekLatestFlushedTaskCount(), csr->getOsContext().getContextId()); usedAllocationAndNotGpuCompleted2->updateTaskCount(csr2->peekLatestFlushedTaskCount(), csr2->getOsContext().getContextId()); device.reset(nullptr); EXPECT_EQ(0u, memoryManager->secondaryEngines[0].size()); EXPECT_EQ(0u, memoryManager->allRegisteredEngines[0].size()); executionEnvironment->decRefInternal(); } HWTEST_F(DeviceTests, givenCopyEnginesWhenCreatingSecondaryContextsThenUseCopyTypes) { HardwareInfo hwInfo = *defaultHwInfo; DebugManagerStateRestore dbgRestorer; debugManager.flags.ContextGroupSize.set(5); hwInfo.capabilityTable.blitterOperationsSupported = true; hwInfo.featureTable.ftrBcsInfo = 0b1111; auto executionEnvironment = NEO::MockDevice::prepareExecutionEnvironment(&hwInfo, 0u); executionEnvironment->incRefInternal(); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(&hwInfo, executionEnvironment, 0)); auto &gfxCoreHelper = device->getRootDeviceEnvironment().getHelper(); auto memoryManager = static_cast(executionEnvironment->memoryManager.get()); auto &enabledEngines = gfxCoreHelper.getGpgpuEngineInstances(device->getRootDeviceEnvironment()); for (auto engineType : {aub_stream::EngineType::ENGINE_BCS, aub_stream::EngineType::ENGINE_BCS1, aub_stream::EngineType::ENGINE_BCS2, aub_stream::EngineType::ENGINE_BCS3}) { auto supportedRegular = std::find_if(enabledEngines.begin(), enabledEngines.end(), [&engineType](const auto &engine) { return (engine.first == engineType) && (engine.second == EngineUsage::regular); }) != enabledEngines.end(); auto supportedHp = std::find_if(enabledEngines.begin(), enabledEngines.end(), [&engineType](const auto &engine) { return (engine.first == engineType) && (engine.second == EngineUsage::highPriority); }) != enabledEngines.end(); if (supportedRegular || supportedHp) { auto usage = supportedRegular ? EngineUsage::regular : EngineUsage::highPriority; EXPECT_NE(device->secondaryEngines.end(), device->secondaryEngines.find(engineType)); auto expectedEngineCount = 5u; if (supportedRegular) { gfxCoreHelper.adjustCopyEngineRegularContextCount(device->secondaryEngines[engineType].engines.size(), expectedEngineCount); } EXPECT_EQ(expectedEngineCount, device->secondaryEngines[engineType].engines.size()); auto engine = device->getSecondaryEngineCsr({engineType, usage}, false); ASSERT_NE(nullptr, engine); auto csr = engine->commandStreamReceiver; auto engine2 = device->getSecondaryEngineCsr({engineType, usage}, false); ASSERT_NE(nullptr, engine2); auto csr2 = engine2->commandStreamReceiver; ASSERT_NE(csr, csr2); auto tagAddress = csr->getTagAddress(); auto tagAddress2 = csr2->getTagAddress(); EXPECT_NE(csr->getOsContext().getContextId(), csr2->getOsContext().getContextId()); EXPECT_NE(tagAddress, tagAddress2); } else { EXPECT_EQ(device->secondaryEngines.end(), device->secondaryEngines.find(engineType)); } } device.reset(nullptr); EXPECT_EQ(0u, memoryManager->secondaryEngines[0].size()); EXPECT_EQ(0u, memoryManager->allRegisteredEngines[0].size()); EXPECT_GT(memoryManager->maxOsContextCount, memoryManager->latestContextId); executionEnvironment->decRefInternal(); } HWTEST_F(DeviceTests, givenDebugFlagSetWhenCreatingSecondaryEnginesThenSkipSelectedEngineTypes) { HardwareInfo hwInfo = *defaultHwInfo; if (hwInfo.capabilityTable.defaultEngineType != aub_stream::EngineType::ENGINE_CCS) { GTEST_SKIP(); } uint32_t computeEngineBit = 1 << static_cast(aub_stream::EngineType::ENGINE_CCS); DebugManagerStateRestore dbgRestorer; debugManager.flags.ContextGroupSize.set(5); debugManager.flags.SecondaryContextEngineTypeMask.set(~computeEngineBit); hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; auto executionEnvironment = NEO::MockDevice::prepareExecutionEnvironment(&hwInfo, 0u); executionEnvironment->incRefInternal(); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(&hwInfo, executionEnvironment, 0)); EXPECT_EQ(device->secondaryEngines.end(), device->secondaryEngines.find(aub_stream::ENGINE_CCS)); executionEnvironment->decRefInternal(); } HWTEST_F(DeviceTests, givenHpCopyEngineAndDebugFlagSetWhenCreatingSecondaryEnginesThenSkipSelectedEngineTypes) { HardwareInfo hwInfo = *defaultHwInfo; DebugManagerStateRestore dbgRestorer; debugManager.flags.ContextGroupSize.set(5); hwInfo.featureTable.flags.ftrCCSNode = true; hwInfo.capabilityTable.defaultEngineType = aub_stream::ENGINE_CCS; hwInfo.gtSystemInfo.CCSInfo.NumberOfCCSEnabled = 1; hwInfo.capabilityTable.blitterOperationsSupported = true; hwInfo.featureTable.ftrBcsInfo = 0b111; auto executionEnvironment = std::unique_ptr(NEO::MockDevice::prepareExecutionEnvironment(&hwInfo, 0u)); const auto &gfxCoreHelper = executionEnvironment->rootDeviceEnvironments[0]->getHelper(); auto hpEngine = gfxCoreHelper.getDefaultHpCopyEngine(hwInfo); if (hpEngine == aub_stream::EngineType::NUM_ENGINES) { GTEST_SKIP(); } uint32_t computeEngineBit = 1 << static_cast(hpEngine); debugManager.flags.SecondaryContextEngineTypeMask.set(~computeEngineBit); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(&hwInfo, executionEnvironment.release(), 0)); EXPECT_NE(nullptr, device->getHpCopyEngine()); EXPECT_EQ(device->secondaryEngines.end(), device->secondaryEngines.find(hpEngine)); } TEST_F(DeviceTests, GivenDebuggingEnabledWhenDeviceIsInitializedThenL0DebuggerIsCreated) { auto executionEnvironment = MockDevice::prepareExecutionEnvironment(defaultHwInfo.get(), 0u); executionEnvironment->setDebuggingMode(NEO::DebuggingMode::online); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(defaultHwInfo.get(), executionEnvironment, 0u)); EXPECT_NE(nullptr, device->getL0Debugger()); } TEST_F(DeviceTests, givenDebuggerRequestedByUserAndNotAvailableWhenDeviceIsInitializedThenErrorIsPrintedButNotReturned) { extern bool forceCreateNullptrDebugger; VariableBackup backupForceCreateNullptrDebugger{&forceCreateNullptrDebugger, true}; DebugManagerStateRestore restorer; auto executionEnvironment = MockDevice::prepareExecutionEnvironment(defaultHwInfo.get(), 0u); executionEnvironment->setDebuggingMode(NEO::DebuggingMode::online); NEO::debugManager.flags.PrintDebugMessages.set(1); ::testing::internal::CaptureStderr(); auto device = std::unique_ptr(MockDevice::createWithExecutionEnvironment(defaultHwInfo.get(), executionEnvironment, 0u)); auto output = testing::internal::GetCapturedStderr(); EXPECT_EQ(std::string("Debug mode is not enabled in the system.\n"), output); EXPECT_EQ(nullptr, device->getL0Debugger()); } TEST_F(DeviceTests, givenDebuggerRequestedByUserWhenDeviceWithSubDevicesCreatedThenInitializeDebuggerOncePerRootDevice) { extern size_t createDebuggerCallCount; DebugManagerStateRestore dbgRestorer; debugManager.flags.DeferStateInitSubmissionToFirstRegularUsage.set(1); createDebuggerCallCount = 0; auto executionEnvironment = MockDevice::prepareExecutionEnvironment(defaultHwInfo.get(), 0u); executionEnvironment->setDebuggingMode(DebuggingMode::online); UltDeviceFactory deviceFactory{1, 4, *executionEnvironment}; EXPECT_EQ(1u, createDebuggerCallCount); EXPECT_NE(nullptr, deviceFactory.rootDevices[0]->getL0Debugger()); } TEST_F(DeviceTests, givenNewUsmPoolingEnabledWhenDeviceInitializedThenUsmMemAllocPoolsManagerIsCreatedButNotInitialized) { VariableBackup backupIsDeviceUsmPoolingEnabledForUlts(&isDeviceUsmPoolingEnabledForUlts); isDeviceUsmPoolingEnabledForUlts = true; { DebugManagerStateRestore restorer; debugManager.flags.ExperimentalUSMAllocationReuseVersion.set(2); auto executionEnvironment = MockDevice::prepareExecutionEnvironment(defaultHwInfo.get(), 0u); auto mockProductHelper = new MockProductHelper; executionEnvironment->rootDeviceEnvironments[0]->productHelper.reset(mockProductHelper); mockProductHelper->isUsmPoolAllocatorSupportedResult = true; UltDeviceFactory deviceFactory{1, 1, *executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto usmMemAllocPoolsManager = device->getUsmMemAllocPoolsManager(); ASSERT_NE(nullptr, usmMemAllocPoolsManager); EXPECT_FALSE(usmMemAllocPoolsManager->isInitialized()); } { DebugManagerStateRestore restorer; debugManager.flags.ExperimentalUSMAllocationReuseVersion.set(-1); auto executionEnvironment = MockDevice::prepareExecutionEnvironment(defaultHwInfo.get(), 0u); auto mockProductHelper = new MockProductHelper; executionEnvironment->rootDeviceEnvironments[0]->productHelper.reset(mockProductHelper); mockProductHelper->isUsmPoolAllocatorSupportedResult = true; UltDeviceFactory deviceFactory{1, 1, *executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto usmMemAllocPoolsManager = device->getUsmMemAllocPoolsManager(); EXPECT_EQ(nullptr, usmMemAllocPoolsManager); } { DebugManagerStateRestore restorer; debugManager.flags.ExperimentalUSMAllocationReuseVersion.set(2); auto executionEnvironment = MockDevice::prepareExecutionEnvironment(defaultHwInfo.get(), 0u); auto mockProductHelper = new MockProductHelper; executionEnvironment->rootDeviceEnvironments[0]->productHelper.reset(mockProductHelper); mockProductHelper->isUsmPoolAllocatorSupportedResult = false; UltDeviceFactory deviceFactory{1, 1, *executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto usmMemAllocPoolsManager = device->getUsmMemAllocPoolsManager(); EXPECT_EQ(nullptr, usmMemAllocPoolsManager); } isDeviceUsmPoolingEnabledForUlts = false; { DebugManagerStateRestore restorer; debugManager.flags.ExperimentalUSMAllocationReuseVersion.set(2); auto executionEnvironment = MockDevice::prepareExecutionEnvironment(defaultHwInfo.get(), 0u); auto mockProductHelper = new MockProductHelper; executionEnvironment->rootDeviceEnvironments[0]->productHelper.reset(mockProductHelper); mockProductHelper->isUsmPoolAllocatorSupportedResult = true; UltDeviceFactory deviceFactory{1, 1, *executionEnvironment}; auto device = deviceFactory.rootDevices[0]; auto usmMemAllocPoolsManager = device->getUsmMemAllocPoolsManager(); EXPECT_EQ(nullptr, usmMemAllocPoolsManager); } } TEST(DeviceWithoutAILTest, givenNoAILWhenCreateDeviceThenDeviceIsCreated) { DebugManagerStateRestore dbgRestorer; debugManager.flags.EnableAIL.set(false); auto hwInfo = *defaultHwInfo; setupDefaultFeatureTableAndWorkaroundTable(&hwInfo); auto device = std::unique_ptr(MockDevice::createWithNewExecutionEnvironment(&hwInfo)); EXPECT_NE(nullptr, device.get()); }