mirror of
https://github.com/intel/compute-runtime.git
synced 2026-01-04 07:14:10 +08:00
ftrL3IACoherency, ftrGpGpuMidBatchPreempt, ftrGpGpuThreadGroupLevelPreempt from configureHardwareCustom to setupFeatureAndWorkaroundTable Related-To: NEO-2755 Change-Id: I508ad321c60bfd88eef3654b3f418343fc5b6b31 Signed-off-by: Katarzyna Cencelewska <katarzyna.cencelewska@intel.com>
188 lines
7.6 KiB
C++
188 lines
7.6 KiB
C++
/*
|
|
* Copyright (C) 2017-2019 Intel Corporation
|
|
*
|
|
* SPDX-License-Identifier: MIT
|
|
*
|
|
*/
|
|
|
|
#include "runtime/aub_mem_dump/aub_services.h"
|
|
#include "runtime/memory_manager/memory_constants.h"
|
|
|
|
#include "engine_node.h"
|
|
#include "hw_cmds.h"
|
|
#include "hw_info_glk.h"
|
|
|
|
namespace NEO {
|
|
|
|
// Short textual abbreviation stored on the IGFX_GEMINILAKE specialization of HwMapper.
const char *HwMapper<IGFX_GEMINILAKE>::abbreviation{"glk"};
|
|
|
|
// Simulation predicate for GLK: the device id is ignored and the answer is always false.
bool isSimulationGLK(unsigned short /*deviceId*/) {
    return false;
}
|
|
|
|
// Static platform descriptor for GLK. Fields are positional; device and revision ids
// (including the PCH ones) are all left at zero in this table.
const PLATFORM GLK::platform = {
    IGFX_GEMINILAKE,
    PCH_UNKNOWN,
    IGFX_GEN9_CORE,
    IGFX_GEN9_CORE,
    PLATFORM_MOBILE, // default init
    0,               // usDeviceID
    0,               // usRevId. 0 sets the stepping to A0
    0,               // usDeviceID_PCH
    0,               // usRevId_PCH
    GTTYPE_UNDEFINED,
};
|
|
|
|
// Runtime capability table for GLK. The initializer is positional, so the order of the
// entries below must not change; each entry is labelled with the field it initializes.
const RuntimeCapabilityTable GLK::capabilityTable{
    /* kmdNotifyProperties */ {30000, 0, 0, true, false, false},
    /* whitelistedRegisters */ {true, false},
    /* gpuAddressSpace */ MemoryConstants::max48BitAddress,
    /* defaultProfilingTimerResolution */ 52.083,
    /* requiredPreemptionSurfaceSize */ MemoryConstants::pageSize,
    /* isSimulation */ &isSimulationGLK,
    /* defaultPreemptionMode */ PreemptionMode::MidThread,
    /* defaultEngineType */ aub_stream::ENGINE_RCS,
    /* maxRenderFrequency */ 0,
    /* clVersionSupport */ 12,
    /* aubDeviceId */ CmdServicesMemTraceVersion::DeviceValues::Glk,
    /* extraQuantityThreadsPerEU */ 0,
    /* slmSize */ 64,
    /* blitterOperationsSupported */ false,
    /* ftrSupportsFP64 */ true,
    /* ftrSupports64BitMath */ true,
    /* ftrSvm */ false,
    /* ftrSupportsCoherency */ true,
    /* ftrSupportsVmeAvcTextureSampler */ true,
    /* ftrSupportsVmeAvcPreemption */ false,
    /* ftrRenderCompressedBuffers */ false,
    /* ftrRenderCompressedImages */ false,
    /* ftr64KBpages */ false,
    /* instrumentationEnabled */ true,
    /* forceStatelessCompilationFor32Bit */ false,
    /* isCore */ false,
    /* sourceLevelDebuggerSupported */ true,
    /* supportsVme */ true,
    /* supportCacheFlushAfterWalker */ false};
|
|
|
|
WorkaroundTable GLK::workaroundTable = {};
|
|
FeatureTable GLK::featureTable = {};
|
|
|
|
// Writes the GLK feature flags and workaround flags into the tables that hwInfo points at
// (hwInfo->pSkuTable and hwInfo->pWaTable). const_cast is applied to both pointers so the
// tables can be written through them.
void GLK::setupFeatureAndWorkaroundTable(HardwareInfo *hwInfo) {
    auto &features = *const_cast<FeatureTable *>(hwInfo->pSkuTable);
    auto &workarounds = *const_cast<WorkaroundTable *>(hwInfo->pWaTable);

    // GPGPU preemption levels and L3/IA coherency; mid-thread preemption is explicitly off.
    features.ftrGpGpuMidBatchPreempt = true;
    features.ftrGpGpuThreadGroupLevelPreempt = true;
    features.ftrL3IACoherency = true;
    features.ftrGpGpuMidThreadLevelPreempt = false;

    // 3D preemption and per-context granularity control.
    features.ftr3dMidBatchPreempt = true;
    features.ftr3dObjectLevelPreempt = true;
    features.ftrPerCtxtPreemptionGranularityControl = true;

    // Remaining feature flags, all enabled.
    features.ftrLCIA = true;
    features.ftrPPGTT = true;
    features.ftrIA32eGfxPTEs = true;
    features.ftrTranslationTable = true;
    features.ftrUserModeTranslationTable = true;
    features.ftrEnableGuC = true;
    features.ftrTileMappedResource = true;
    features.ftrULT = true;
    features.ftrAstcHdr2D = true;
    features.ftrAstcLdr2D = true;
    features.ftrTileY = true;

    // Workarounds enabled for GLK.
    workarounds.waLLCCachingUnsupported = true;
    workarounds.waMsaa8xTileYDepthPitchAlignment = true;
    workarounds.waFbcLinearSurfaceStride = true;
    workarounds.wa4kAlignUVOffsetNV12LinearSurface = true;
    workarounds.waEnablePreemptionGranularityControlByUMD = true;
    workarounds.waSendMIFLUSHBeforeVFE = true;
    workarounds.waForcePcBbFullCfgRestore = true;
    workarounds.waReportPerfCountUseGlobalContextID = true;
    workarounds.waSamplerCacheFlushBetweenRedescribedSurfaceReads = true;
}
|
|
|
|
const HardwareInfo GLK_1x3x6::hwInfo = {
|
|
&GLK::platform,
|
|
&GLK::featureTable,
|
|
&GLK::workaroundTable,
|
|
&GLK_1x3x6::gtSystemInfo,
|
|
GLK::capabilityTable,
|
|
};
|
|
|
|
GT_SYSTEM_INFO GLK_1x3x6::gtSystemInfo = {0};
|
|
// Fills the GT system info that hwInfo->pSysInfo points at with the 1x3x6 values
// (1 slice, 3 subslices, 18 EUs). When setupFeatureTableAndWorkaroundTable is true the
// feature and workaround tables are set up as well.
void GLK_1x3x6::setupHardwareInfo(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable) {
    auto &sysInfo = *const_cast<GT_SYSTEM_INFO *>(hwInfo->pSysInfo);

    // Execution resources.
    sysInfo.EUCount = 18;
    sysInfo.ThreadCount = 18 * GLK::threadsPerEu;
    sysInfo.SliceCount = 1;
    sysInfo.SubSliceCount = 3;

    // L3 cache and fill rate.
    sysInfo.L3CacheSizeInKb = 384;
    sysInfo.L3BankCount = 2;
    sysInfo.MaxFillRate = 8;

    // Per-stage thread totals.
    sysInfo.TotalVsThreads = 112;
    sysInfo.TotalHsThreads = 112;
    sysInfo.TotalDsThreads = 112;
    sysInfo.TotalGsThreads = 112;
    sysInfo.TotalPsThreadsWindowerRange = 64;

    sysInfo.CsrSizeInMb = 8;

    // Limits taken from the GLK family constants.
    sysInfo.MaxEuPerSubSlice = GLK::maxEuPerSubslice;
    sysInfo.MaxSlicesSupported = GLK::maxSlicesSupported;
    sysInfo.MaxSubSlicesSupported = GLK::maxSubslicesSupported;

    sysInfo.IsL3HashModeEnabled = false;
    sysInfo.IsDynamicallyPopulated = false;

    if (setupFeatureTableAndWorkaroundTable) {
        setupFeatureAndWorkaroundTable(hwInfo);
    }
}
|
|
|
|
const HardwareInfo GLK_1x2x6::hwInfo = {
|
|
&GLK::platform,
|
|
&GLK::featureTable,
|
|
&GLK::workaroundTable,
|
|
&GLK_1x2x6::gtSystemInfo,
|
|
GLK::capabilityTable,
|
|
};
|
|
GT_SYSTEM_INFO GLK_1x2x6::gtSystemInfo = {0};
|
|
// Fills the GT system info that hwInfo->pSysInfo points at with the 1x2x6 values
// (1 slice, 2 subslices, 12 EUs). When setupFeatureTableAndWorkaroundTable is true the
// feature and workaround tables are set up as well.
void GLK_1x2x6::setupHardwareInfo(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable) {
    auto &sysInfo = *const_cast<GT_SYSTEM_INFO *>(hwInfo->pSysInfo);

    // Execution resources.
    sysInfo.EUCount = 12;
    sysInfo.ThreadCount = 12 * GLK::threadsPerEu;
    sysInfo.SliceCount = 1;
    sysInfo.SubSliceCount = 2;

    // L3 cache and fill rate.
    sysInfo.L3CacheSizeInKb = 384;
    sysInfo.L3BankCount = 2;
    sysInfo.MaxFillRate = 8;

    // Per-stage thread totals.
    sysInfo.TotalVsThreads = 112;
    sysInfo.TotalHsThreads = 112;
    sysInfo.TotalDsThreads = 112;
    sysInfo.TotalGsThreads = 112;
    sysInfo.TotalPsThreadsWindowerRange = 64;

    sysInfo.CsrSizeInMb = 8;

    // Limits taken from the GLK family constants.
    sysInfo.MaxEuPerSubSlice = GLK::maxEuPerSubslice;
    sysInfo.MaxSlicesSupported = GLK::maxSlicesSupported;
    sysInfo.MaxSubSlicesSupported = GLK::maxSubslicesSupported;

    sysInfo.IsL3HashModeEnabled = false;
    sysInfo.IsDynamicallyPopulated = false;

    if (setupFeatureTableAndWorkaroundTable) {
        setupFeatureAndWorkaroundTable(hwInfo);
    }
}
|
|
|
|
// The family-level GLK hardware info is a copy of the 1x3x6 configuration.
const HardwareInfo GLK::hwInfo(GLK_1x3x6::hwInfo);
|
|
|
|
// Dispatches to the setupHardwareInfo of the GLK configuration named by hwInfoConfig.
// Accepted names are "1x2x6", "1x3x6" and "default" (which selects 1x3x6); any other
// name reaches UNRECOVERABLE_IF(true).
void setupGLKHardwareInfoImpl(HardwareInfo *hwInfo, bool setupFeatureTableAndWorkaroundTable, const std::string &hwInfoConfig) {
    if (hwInfoConfig == "1x2x6") {
        GLK_1x2x6::setupHardwareInfo(hwInfo, setupFeatureTableAndWorkaroundTable);
        return;
    }

    // "default" is an alias for the 1x3x6 configuration.
    if (hwInfoConfig == "1x3x6" || hwInfoConfig == "default") {
        GLK_1x3x6::setupHardwareInfo(hwInfo, setupFeatureTableAndWorkaroundTable);
        return;
    }

    UNRECOVERABLE_IF(true);
}
|
|
|
|
// Family-level entry point: a function pointer bound to the config-name dispatcher.
void (*GLK::setupHardwareInfo)(HardwareInfo *, bool, const std::string &) = &setupGLKHardwareInfoImpl;
|
|
} // namespace NEO
|