/* * Copyright (C) 2018-2024 Intel Corporation * * SPDX-License-Identifier: MIT * */ #include "shared/source/helpers/hw_info.h" #include "shared/source/command_stream/linear_stream.h" #include "shared/source/debug_settings/debug_settings_manager.h" #include "shared/source/helpers/basic_math.h" #include "shared/source/helpers/gfx_core_helper.h" #include "shared/source/release_helper/release_helper.h" #include namespace NEO { HardwareInfo::HardwareInfo(const PLATFORM *platform, const FeatureTable *featureTable, const WorkaroundTable *workaroundTable, const GT_SYSTEM_INFO *gtSystemInfo, const RuntimeCapabilityTable &capabilityTable) : platform(*platform), featureTable(*featureTable), workaroundTable(*workaroundTable), gtSystemInfo(*gtSystemInfo), capabilityTable(capabilityTable) { } // Global table of hardware prefixes const char *hardwarePrefix[IGFX_MAX_PRODUCT] = { nullptr, }; // Global table of family names bool familyEnabled[IGFX_MAX_CORE] = { false, }; const HardwareInfo *hardwareInfoTable[IGFX_MAX_PRODUCT] = {}; void (*hardwareInfoSetup[IGFX_MAX_PRODUCT])(HardwareInfo *, bool, uint64_t, const ReleaseHelper *) = { 0x0, }; void (*hardwareInfoBaseSetup[IGFX_MAX_PRODUCT])(HardwareInfo *, bool, const ReleaseHelper *) = { 0x0, }; bool getHwInfoForPlatformString(std::string &platform, const HardwareInfo *&hwInfoIn) { std::transform(platform.begin(), platform.end(), platform.begin(), ::tolower); bool ret = false; for (int j = 0; j < IGFX_MAX_PRODUCT; j++) { if (hardwarePrefix[j] == nullptr) continue; if (hardwarePrefix[j] == platform) { hwInfoIn = hardwareInfoTable[j]; ret = true; break; } } return ret; } void setHwInfoValuesFromConfig(const uint64_t hwInfoConfig, HardwareInfo &hwInfoIn) { uint32_t sliceCount = static_cast(hwInfoConfig >> 32); uint32_t subSlicePerSliceCount = static_cast(hwInfoConfig >> 16); uint32_t euPerSubSliceCount = static_cast(hwInfoConfig); hwInfoIn.gtSystemInfo.SliceCount = sliceCount; hwInfoIn.gtSystemInfo.SubSliceCount = subSlicePerSliceCount * sliceCount; hwInfoIn.gtSystemInfo.DualSubSliceCount = subSlicePerSliceCount * sliceCount; hwInfoIn.gtSystemInfo.EUCount = euPerSubSliceCount * subSlicePerSliceCount * sliceCount; hwInfoIn.gtSystemInfo.IsDynamicallyPopulated = true; for (uint32_t slice = 0; slice < hwInfoIn.gtSystemInfo.SliceCount; slice++) { hwInfoIn.gtSystemInfo.SliceInfo[slice].Enabled = true; } if (hwInfoIn.gtSystemInfo.MaxSlicesSupported == 0) { hwInfoIn.gtSystemInfo.MaxSlicesSupported = sliceCount; } if (hwInfoIn.gtSystemInfo.MaxSubSlicesSupported == 0) { hwInfoIn.gtSystemInfo.MaxSubSlicesSupported = hwInfoIn.gtSystemInfo.SubSliceCount; } if (hwInfoIn.gtSystemInfo.MaxDualSubSlicesSupported == 0) { hwInfoIn.gtSystemInfo.MaxDualSubSlicesSupported = hwInfoIn.gtSystemInfo.SubSliceCount; } if (hwInfoIn.gtSystemInfo.MaxEuPerSubSlice == 0) { hwInfoIn.gtSystemInfo.MaxEuPerSubSlice = euPerSubSliceCount; } } bool parseHwInfoConfigString(const std::string &hwInfoConfigStr, uint64_t &hwInfoConfig) { hwInfoConfig = 0u; size_t currPos = hwInfoConfigStr.find('x', 0); if (currPos == std::string::npos) { return false; } uint32_t sliceCount = static_cast(std::stoul(hwInfoConfigStr.substr(0, currPos))); if (sliceCount > std::numeric_limits::max()) { return false; } size_t prevPos = currPos + 1; currPos = hwInfoConfigStr.find('x', prevPos); if (currPos == std::string::npos) { return false; } uint32_t subSlicePerSliceCount = static_cast(std::stoul(hwInfoConfigStr.substr(prevPos, currPos))); if (subSlicePerSliceCount > std::numeric_limits::max()) { return false; } uint32_t subSliceCount = subSlicePerSliceCount * sliceCount; if (subSliceCount > std::numeric_limits::max()) { return false; } prevPos = currPos + 1; uint32_t euPerSubSliceCount = static_cast(std::stoul(hwInfoConfigStr.substr(prevPos, std::string::npos))); if (euPerSubSliceCount > std::numeric_limits::max()) { return false; } uint32_t euCount = euPerSubSliceCount * subSliceCount; if (euCount > std::numeric_limits::max()) { return false; } hwInfoConfig = static_cast(sliceCount & 0xffff) << 32 | static_cast(subSlicePerSliceCount & 0xffff) << 16 | static_cast(euPerSubSliceCount & 0xffff); return true; } aub_stream::EngineType getChosenEngineType(const HardwareInfo &hwInfo) { return debugManager.flags.NodeOrdinal.get() == -1 ? hwInfo.capabilityTable.defaultEngineType : static_cast(debugManager.flags.NodeOrdinal.get()); } void setupDefaultGtSysInfo(HardwareInfo *hwInfo, const ReleaseHelper *releaseHelper) { GT_SYSTEM_INFO *gtSysInfo = &hwInfo->gtSystemInfo; gtSysInfo->L3CacheSizeInKb = 1; gtSysInfo->CCSInfo.IsValid = 1; gtSysInfo->CCSInfo.NumberOfCCSEnabled = 1; gtSysInfo->CCSInfo.Instances.CCSEnableMask = 0b1; // non-zero values for unit tests if (gtSysInfo->SliceCount == 0) { gtSysInfo->SliceCount = 2; gtSysInfo->SubSliceCount = 8; gtSysInfo->DualSubSliceCount = gtSysInfo->SubSliceCount; gtSysInfo->EUCount = 64; gtSysInfo->MaxEuPerSubSlice = gtSysInfo->EUCount / gtSysInfo->SubSliceCount; gtSysInfo->MaxSlicesSupported = gtSysInfo->SliceCount; gtSysInfo->MaxSubSlicesSupported = gtSysInfo->SubSliceCount; gtSysInfo->MaxDualSubSlicesSupported = gtSysInfo->DualSubSliceCount; } gtSysInfo->ThreadCount = gtSysInfo->EUCount * releaseHelper->getNumThreadsPerEu(); } void setupDefaultFeatureTableAndWorkaroundTable(HardwareInfo *hwInfo, const ReleaseHelper &releaseHelper) { FeatureTable *featureTable = &hwInfo->featureTable; featureTable->flags.ftrAstcHdr2D = true; featureTable->flags.ftrAstcLdr2D = true; featureTable->flags.ftrCCSNode = true; featureTable->flags.ftrCCSRing = true; featureTable->flags.ftrFbc = true; featureTable->flags.ftrGpGpuMidBatchPreempt = true; featureTable->flags.ftrGpGpuThreadGroupLevelPreempt = true; featureTable->flags.ftrIA32eGfxPTEs = true; featureTable->flags.ftrL3IACoherency = true; featureTable->flags.ftrLinearCCS = true; featureTable->flags.ftrPPGTT = true; featureTable->flags.ftrSVM = true; featureTable->flags.ftrStandardMipTailFormat = true; featureTable->flags.ftrTileMappedResource = true; featureTable->flags.ftrTranslationTable = true; featureTable->flags.ftrUserModeTranslationTable = true; featureTable->flags.ftrXe2Compression = releaseHelper.getFtrXe2Compression(); WorkaroundTable *workaroundTable = &hwInfo->workaroundTable; workaroundTable->flags.wa4kAlignUVOffsetNV12LinearSurface = true; } uint32_t getNumSubSlicesPerSlice(const HardwareInfo &hwInfo) { return static_cast(Math::divideAndRoundUp(hwInfo.gtSystemInfo.SubSliceCount, hwInfo.gtSystemInfo.SliceCount)); } } // namespace NEO