mirror of
https://github.com/intel/compute-runtime.git
synced 2025-09-15 13:01:45 +08:00
Reorganization directory structure [1/n]
Change-Id: Id1a94577437a4826a32411869f516fec20314ec0
This commit is contained in:
298
opencl/source/gen9/hw_info_kbl.inl
Normal file
298
opencl/source/gen9/hw_info_kbl.inl
Normal file
@ -0,0 +1,298 @@
|
||||
/*
|
||||
* Copyright (C) 2017-2020 Intel Corporation
|
||||
*
|
||||
* SPDX-License-Identifier: MIT
|
||||
*
|
||||
*/
|
||||
|
||||
#include "core/gen9/hw_cmds.h"
|
||||
#include "core/memory_manager/memory_constants.h"
|
||||
|
||||
#include "aub_mem_dump/aub_services.h"
|
||||
#include "engine_node.h"
|
||||
|
||||
namespace NEO {
|
||||
|
||||
// Short textual name ("kbl") that HwMapper associates with the IGFX_KABYLAKE product family.
const char *HwMapper<IGFX_KABYLAKE>::abbreviation = "kbl";
|
||||
|
||||
// Simulation predicate for KBL; its address is stored in KBL::capabilityTable
// as the isSimulation entry.
//
// deviceId: device ID to classify. It is intentionally ignored: this
//           implementation reports every device ID as non-simulation.
// Returns:  always false.
bool isSimulationKBL(unsigned short deviceId) {
    static_cast<void>(deviceId); // parameter is part of the callback signature but unused here
    return false;
}
|
||||
|
||||
// Base PLATFORM description for KBL. Every KBL_* hwInfo definition in this
// file takes the address of this object. Device and revision IDs are left at
// 0 here.
const PLATFORM KBL::platform = {
    IGFX_KABYLAKE, PCH_UNKNOWN, IGFX_GEN9_CORE, IGFX_GEN9_CORE,
    PLATFORM_NONE,    // default init
    0,                // usDeviceID
    0,                // usRevId. 0 sets the stepping to A0
    0,                // usDeviceID_PCH
    0,                // usRevId_PCH
    GTTYPE_UNDEFINED};
|
||||
|
||||
// Runtime capability table for KBL. Entries are positional; the trailing
// comment on each line names the RuntimeCapabilityTable field it initializes.
// Every KBL_* hwInfo definition in this file is built from this table.
const RuntimeCapabilityTable KBL::capabilityTable{
    // Engines, submission and address space
    EngineDirectSubmissionInitVec{
        {aub_stream::ENGINE_RCS, {true, true}}},   // directSubmissionEngines
    {0, 0, 0, false, false, false},                // kmdNotifyProperties
    MemoryConstants::max48BitAddress,              // gpuAddressSpace
    83.333,                                        // defaultProfilingTimerResolution
    MemoryConstants::pageSize,                     // requiredPreemptionSurfaceSize
    &isSimulationKBL,                              // isSimulation
    PreemptionMode::MidThread,                     // defaultPreemptionMode
    aub_stream::ENGINE_RCS,                        // defaultEngineType
    0,                                             // maxRenderFrequency
    21,                                            // clVersionSupport
    CmdServicesMemTraceVersion::DeviceValues::Kbl, // aubDeviceId
    0,                                             // extraQuantityThreadsPerEU
    64,                                            // slmSize
    sizeof(KBL::GRF),                              // grfSize
    false,                                         // blitterOperationsSupported

    // ftr* flags
    true,  // ftrSupportsInteger64BitAtomics
    true,  // ftrSupportsFP64
    true,  // ftrSupports64BitMath
    true,  // ftrSvm
    true,  // ftrSupportsCoherency
    true,  // ftrSupportsVmeAvcTextureSampler
    false, // ftrSupportsVmeAvcPreemption
    false, // ftrRenderCompressedBuffers
    false, // ftrRenderCompressedImages
    true,  // ftr64KBpages

    // Remaining runtime switches
    true,   // instrumentationEnabled
    true,   // forceStatelessCompilationFor32Bit
    "core", // platformType
    true,   // sourceLevelDebuggerSupported
    true,   // supportsVme
    false,  // supportCacheFlushAfterWalker
    true,   // supportsImages
    true,   // supportsDeviceEnqueue
    true    // hostPtrTrackingEnabled
};
|
||||
|
||||
// KBL-wide workaround table, value-initialized here; the KBL_* hwInfo definitions in this file take its address.
WorkaroundTable KBL::workaroundTable = {};
|
||||
// KBL-wide feature table, value-initialized here; the KBL_* hwInfo definitions in this file take its address.
FeatureTable KBL::featureTable = {};
|
||||
|
||||
// Enables the KBL feature flags and workarounds in the tables owned by
// *hwInfo.
//
// hwInfo: hardware description to update; its featureTable and
//         workaroundTable are written, and platform.usRevId is read to decide
//         which revision-dependent workarounds apply.
//
// All flags below are set unconditionally except for the revision-gated
// workarounds at the end. Nothing is ever cleared by this function.
void KBL::setupFeatureAndWorkaroundTable(HardwareInfo *hwInfo) {
    // Distinct local names keep these from shadowing the static KBL members.
    FeatureTable &features = hwInfo->featureTable;
    WorkaroundTable &workarounds = hwInfo->workaroundTable;
    const auto revisionId = hwInfo->platform.usRevId;

    // Preemption-related features.
    features.ftrGpGpuMidBatchPreempt = true;
    features.ftrGpGpuThreadGroupLevelPreempt = true;
    features.ftrGpGpuMidThreadLevelPreempt = true;
    features.ftr3dMidBatchPreempt = true;
    features.ftr3dObjectLevelPreempt = true;
    features.ftrPerCtxtPreemptionGranularityControl = true;

    // Remaining features.
    features.ftrL3IACoherency = true;
    features.ftrVEBOX = true;
    features.ftrPPGTT = true;
    features.ftrSVM = true;
    features.ftrIA32eGfxPTEs = true;
    features.ftrDisplayYTiling = true;
    features.ftrTranslationTable = true;
    features.ftrUserModeTranslationTable = true;
    features.ftrEnableGuC = true;
    features.ftrFbc = true;
    features.ftrFbc2AddressTranslation = true;
    features.ftrFbcBlitterTracking = true;
    features.ftrFbcCpuTracking = true;
    features.ftrTileY = true;

    // Workarounds applied on every revision.
    workarounds.waEnablePreemptionGranularityControlByUMD = true;
    workarounds.waSendMIFLUSHBeforeVFE = true;
    workarounds.waReportPerfCountUseGlobalContextID = true;
    workarounds.waMsaa8xTileYDepthPitchAlignment = true;
    workarounds.waLosslessCompressionSurfaceStride = true;
    workarounds.waFbcLinearSurfaceStride = true;
    workarounds.wa4kAlignUVOffsetNV12LinearSurface = true;
    workarounds.waSamplerCacheFlushBetweenRedescribedSurfaceReads = true;

    // Workarounds limited to revision IDs up to and including 0x6.
    if (revisionId <= 0x6) {
        workarounds.waDisableLSQCROPERFforOCL = true;
        workarounds.waEncryptedEdramOnlyPartials = true;
    }

    // Workaround limited to revision IDs up to and including 0x8.
    if (revisionId <= 0x8) {
        workarounds.waForcePcBbFullCfgRestore = true;
    }
}
|
||||
|
||||
// HardwareInfo for the KBL 1x2x6 configuration: the shared KBL platform,
// feature and workaround tables, this configuration's own gtSystemInfo, and
// the shared KBL capability table.
const HardwareInfo KBL_1x2x6::hwInfo = {&KBL::platform,
                                        &KBL::featureTable,
                                        &KBL::workaroundTable,
                                        &KBL_1x2x6::gtSystemInfo,
                                        KBL::capabilityTable};
|
||||
// GT system info object whose address is passed to KBL_1x2x6::hwInfo; initialized with {0}.
GT_SYSTEM_INFO KBL_1x2x6::gtSystemInfo = {0};
|
||||
// Fills hwInfo->gtSystemInfo with the values of the KBL 1x2x6 configuration.
//
// hwInfo: hardware description to update. gtSystemInfo.EUCount is read, not
//         written: ThreadCount is derived from whatever EUCount already holds.
// setupFeatureTableAndWorkaroundTable: when true, the feature and workaround
//         tables of hwInfo are populated too, via
//         setupFeatureAndWorkaroundTable.
void KBL_1x2x6::setupHardwareInfo(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable) {
    GT_SYSTEM_INFO &gt = hwInfo->gtSystemInfo;

    // Values specific to this configuration.
    gt.SliceCount = 1;
    gt.L3CacheSizeInKb = 384;
    gt.L3BankCount = 2;
    gt.MaxFillRate = 8;

    // Values that follow from the existing EU count and the KBL-wide limits.
    gt.ThreadCount = gt.EUCount * KBL::threadsPerEu;
    gt.MaxEuPerSubSlice = KBL::maxEuPerSubslice;
    gt.MaxSlicesSupported = KBL::maxSlicesSupported;
    gt.MaxSubSlicesSupported = KBL::maxSubslicesSupported;

    // Fixed thread budgets and sizes.
    gt.TotalVsThreads = 336;
    gt.TotalHsThreads = 336;
    gt.TotalDsThreads = 336;
    gt.TotalGsThreads = 336;
    gt.TotalPsThreadsWindowerRange = 64;
    gt.CsrSizeInMb = 8;

    gt.IsL3HashModeEnabled = false;
    gt.IsDynamicallyPopulated = false;

    if (setupFeatureTableAndWorkaroundTable) {
        setupFeatureAndWorkaroundTable(hwInfo);
    }
}
|
||||
|
||||
// HardwareInfo for the KBL 1x3x6 configuration: the shared KBL platform,
// feature and workaround tables, this configuration's own gtSystemInfo, and
// the shared KBL capability table.
const HardwareInfo KBL_1x3x6::hwInfo = {&KBL::platform,
                                        &KBL::featureTable,
                                        &KBL::workaroundTable,
                                        &KBL_1x3x6::gtSystemInfo,
                                        KBL::capabilityTable};
|
||||
|
||||
// GT system info object whose address is passed to KBL_1x3x6::hwInfo; initialized with {0}.
GT_SYSTEM_INFO KBL_1x3x6::gtSystemInfo = {0};
|
||||
// Fills hwInfo->gtSystemInfo with the values of the KBL 1x3x6 configuration.
//
// hwInfo: hardware description to update. gtSystemInfo.EUCount is read, not
//         written: ThreadCount is derived from whatever EUCount already holds.
// setupFeatureTableAndWorkaroundTable: when true, the feature and workaround
//         tables of hwInfo are populated too, via
//         setupFeatureAndWorkaroundTable.
void KBL_1x3x6::setupHardwareInfo(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable) {
    GT_SYSTEM_INFO &gt = hwInfo->gtSystemInfo;

    // Values specific to this configuration.
    gt.SliceCount = 1;
    gt.L3CacheSizeInKb = 768;
    gt.L3BankCount = 4;
    gt.MaxFillRate = 8;

    // Values that follow from the existing EU count and the KBL-wide limits.
    gt.ThreadCount = gt.EUCount * KBL::threadsPerEu;
    gt.MaxEuPerSubSlice = KBL::maxEuPerSubslice;
    gt.MaxSlicesSupported = KBL::maxSlicesSupported;
    gt.MaxSubSlicesSupported = KBL::maxSubslicesSupported;

    // Fixed thread budgets and sizes.
    gt.TotalVsThreads = 336;
    gt.TotalHsThreads = 336;
    gt.TotalDsThreads = 336;
    gt.TotalGsThreads = 336;
    gt.TotalPsThreadsWindowerRange = 64;
    gt.CsrSizeInMb = 8;

    gt.IsL3HashModeEnabled = false;
    gt.IsDynamicallyPopulated = false;

    if (setupFeatureTableAndWorkaroundTable) {
        setupFeatureAndWorkaroundTable(hwInfo);
    }
}
|
||||
|
||||
// HardwareInfo for the KBL 1x3x8 configuration: the shared KBL platform,
// feature and workaround tables, this configuration's own gtSystemInfo, and
// the shared KBL capability table.
const HardwareInfo KBL_1x3x8::hwInfo = {&KBL::platform,
                                        &KBL::featureTable,
                                        &KBL::workaroundTable,
                                        &KBL_1x3x8::gtSystemInfo,
                                        KBL::capabilityTable};
|
||||
// GT system info object whose address is passed to KBL_1x3x8::hwInfo; initialized with {0}.
GT_SYSTEM_INFO KBL_1x3x8::gtSystemInfo = {0};
|
||||
// Fills hwInfo->gtSystemInfo with the values of the KBL 1x3x8 configuration.
//
// hwInfo: hardware description to update. gtSystemInfo.EUCount is read, not
//         written: ThreadCount is derived from whatever EUCount already holds.
// setupFeatureTableAndWorkaroundTable: when true, the feature and workaround
//         tables of hwInfo are populated too, via
//         setupFeatureAndWorkaroundTable.
void KBL_1x3x8::setupHardwareInfo(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable) {
    GT_SYSTEM_INFO &gt = hwInfo->gtSystemInfo;

    // Values specific to this configuration.
    gt.SliceCount = 1;
    gt.L3CacheSizeInKb = 768;
    gt.L3BankCount = 4;
    gt.MaxFillRate = 8;

    // Values that follow from the existing EU count and the KBL-wide limits.
    gt.ThreadCount = gt.EUCount * KBL::threadsPerEu;
    gt.MaxEuPerSubSlice = KBL::maxEuPerSubslice;
    gt.MaxSlicesSupported = KBL::maxSlicesSupported;
    gt.MaxSubSlicesSupported = KBL::maxSubslicesSupported;

    // Fixed thread budgets and sizes.
    gt.TotalVsThreads = 336;
    gt.TotalHsThreads = 336;
    gt.TotalDsThreads = 336;
    gt.TotalGsThreads = 336;
    gt.TotalPsThreadsWindowerRange = 64;
    gt.CsrSizeInMb = 8;

    gt.IsL3HashModeEnabled = false;
    gt.IsDynamicallyPopulated = false;

    if (setupFeatureTableAndWorkaroundTable) {
        setupFeatureAndWorkaroundTable(hwInfo);
    }
}
|
||||
|
||||
// HardwareInfo for the KBL 2x3x8 configuration: the shared KBL platform,
// feature and workaround tables, this configuration's own gtSystemInfo, and
// the shared KBL capability table.
const HardwareInfo KBL_2x3x8::hwInfo = {&KBL::platform,
                                        &KBL::featureTable,
                                        &KBL::workaroundTable,
                                        &KBL_2x3x8::gtSystemInfo,
                                        KBL::capabilityTable};
|
||||
// GT system info object whose address is passed to KBL_2x3x8::hwInfo; initialized with {0}.
GT_SYSTEM_INFO KBL_2x3x8::gtSystemInfo = {0};
|
||||
// Fills hwInfo->gtSystemInfo with the values of the KBL 2x3x8 configuration.
//
// hwInfo: hardware description to update. gtSystemInfo.EUCount is read, not
//         written: ThreadCount is derived from whatever EUCount already holds.
// setupFeatureTableAndWorkaroundTable: when true, the feature and workaround
//         tables of hwInfo are populated too, via
//         setupFeatureAndWorkaroundTable.
void KBL_2x3x8::setupHardwareInfo(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable) {
    GT_SYSTEM_INFO &gt = hwInfo->gtSystemInfo;

    // Values specific to this configuration.
    gt.SliceCount = 2;
    gt.L3CacheSizeInKb = 1536;
    gt.L3BankCount = 8;
    gt.MaxFillRate = 16;

    // Values that follow from the existing EU count and the KBL-wide limits.
    gt.ThreadCount = gt.EUCount * KBL::threadsPerEu;
    gt.MaxEuPerSubSlice = KBL::maxEuPerSubslice;
    gt.MaxSlicesSupported = KBL::maxSlicesSupported;
    gt.MaxSubSlicesSupported = KBL::maxSubslicesSupported;

    // Fixed thread budgets and sizes.
    gt.TotalVsThreads = 336;
    gt.TotalHsThreads = 336;
    gt.TotalDsThreads = 336;
    gt.TotalGsThreads = 336;
    gt.TotalPsThreadsWindowerRange = 64;
    gt.CsrSizeInMb = 8;

    gt.IsL3HashModeEnabled = false;
    gt.IsDynamicallyPopulated = false;

    if (setupFeatureTableAndWorkaroundTable) {
        setupFeatureAndWorkaroundTable(hwInfo);
    }
}
|
||||
|
||||
// HardwareInfo for the KBL 3x3x8 configuration: the shared KBL platform,
// feature and workaround tables, this configuration's own gtSystemInfo, and
// the shared KBL capability table.
const HardwareInfo KBL_3x3x8::hwInfo = {&KBL::platform,
                                        &KBL::featureTable,
                                        &KBL::workaroundTable,
                                        &KBL_3x3x8::gtSystemInfo,
                                        KBL::capabilityTable};
|
||||
// GT system info object whose address is passed to KBL_3x3x8::hwInfo; initialized with {0}.
GT_SYSTEM_INFO KBL_3x3x8::gtSystemInfo = {0};
|
||||
// Fills hwInfo->gtSystemInfo with the values of the KBL 3x3x8 configuration.
//
// hwInfo: hardware description to update. gtSystemInfo.EUCount is read, not
//         written: ThreadCount is derived from whatever EUCount already holds.
// setupFeatureTableAndWorkaroundTable: when true, the feature and workaround
//         tables of hwInfo are populated too, via
//         setupFeatureAndWorkaroundTable.
void KBL_3x3x8::setupHardwareInfo(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable) {
    GT_SYSTEM_INFO &gt = hwInfo->gtSystemInfo;

    // Values specific to this configuration.
    gt.SliceCount = 3;
    gt.L3CacheSizeInKb = 2304;
    gt.L3BankCount = 12;
    gt.MaxFillRate = 23;

    // Values that follow from the existing EU count and the KBL-wide limits.
    gt.ThreadCount = gt.EUCount * KBL::threadsPerEu;
    gt.MaxEuPerSubSlice = KBL::maxEuPerSubslice;
    gt.MaxSlicesSupported = KBL::maxSlicesSupported;
    gt.MaxSubSlicesSupported = KBL::maxSubslicesSupported;

    // Fixed thread budgets and sizes.
    gt.TotalVsThreads = 336;
    gt.TotalHsThreads = 336;
    gt.TotalDsThreads = 336;
    gt.TotalGsThreads = 336;
    gt.TotalPsThreadsWindowerRange = 64;
    gt.CsrSizeInMb = 8;

    gt.IsL3HashModeEnabled = false;
    gt.IsDynamicallyPopulated = false;

    if (setupFeatureTableAndWorkaroundTable) {
        setupFeatureAndWorkaroundTable(hwInfo);
    }
}
|
||||
|
||||
// Default KBL hardware info: copy-initialized from the 1x3x6 configuration's hwInfo.
const HardwareInfo KBL::hwInfo = KBL_1x3x6::hwInfo;
|
||||
// Default hardware info config value; setupKBLHardwareInfoImpl maps 0x100030006 to KBL_1x3x6.
const uint64_t KBL::defaultHardwareInfoConfig = 0x100030006;
|
||||
|
||||
// Dispatches to the setupHardwareInfo routine of the KBL configuration
// selected by hwInfoConfig.
//
// hwInfo: hardware description forwarded to the selected routine.
// setupFeatureTableAndWorkaroundTable: forwarded unchanged.
// hwInfoConfig: configuration selector. Recognized values are 0x100020006,
//         0x100030006, 0x100030008, 0x200030008 and 0x300030008; 0x0 selects
//         the default (1x3x6). Any other value hits UNRECOVERABLE_IF(true).
void setupKBLHardwareInfoImpl(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable, uint64_t hwInfoConfig) {
    switch (hwInfoConfig) {
    case 0x100030008:
        KBL_1x3x8::setupHardwareInfo(hwInfo, setupFeatureTableAndWorkaroundTable);
        break;
    case 0x200030008:
        KBL_2x3x8::setupHardwareInfo(hwInfo, setupFeatureTableAndWorkaroundTable);
        break;
    case 0x300030008:
        KBL_3x3x8::setupHardwareInfo(hwInfo, setupFeatureTableAndWorkaroundTable);
        break;
    case 0x100020006:
        KBL_1x2x6::setupHardwareInfo(hwInfo, setupFeatureTableAndWorkaroundTable);
        break;
    case 0x0: // Default config
    case 0x100030006:
        KBL_1x3x6::setupHardwareInfo(hwInfo, setupFeatureTableAndWorkaroundTable);
        break;
    default:
        UNRECOVERABLE_IF(true);
        break;
    }
}
|
||||
|
||||
// KBL::setupHardwareInfo function pointer, bound to setupKBLHardwareInfoImpl (dispatch by hwInfoConfig).
void (*KBL::setupHardwareInfo)(HardwareInfo *, bool, uint64_t) = setupKBLHardwareInfoImpl;
|
||||
} // namespace NEO
|
Reference in New Issue
Block a user