mirror of
https://github.com/intel/compute-runtime.git
synced 2026-01-03 14:55:24 +08:00
refactor: rename global debug manager to debugManager
Signed-off-by: Mateusz Jablonski <mateusz.jablonski@intel.com>
This commit is contained in:
committed by
Compute-Runtime-Automation
parent
f2ede40d2e
commit
c9664e6bad
@@ -18,8 +18,8 @@ bool failBuildProgramWithStatefulAccess(const RootDeviceEnvironment &rootDeviceE
|
||||
const auto &compilerProductHelper = rootDeviceEnvironment.getHelper<CompilerProductHelper>();
|
||||
|
||||
auto failBuildProgram = compilerProductHelper.failBuildProgramWithStatefulAccessPreference();
|
||||
if (NEO::DebugManager.flags.FailBuildProgramWithStatefulAccess.get() != -1) {
|
||||
failBuildProgram = static_cast<bool>(NEO::DebugManager.flags.FailBuildProgramWithStatefulAccess.get());
|
||||
if (NEO::debugManager.flags.FailBuildProgramWithStatefulAccess.get() != -1) {
|
||||
failBuildProgram = static_cast<bool>(NEO::debugManager.flags.FailBuildProgramWithStatefulAccess.get());
|
||||
}
|
||||
|
||||
auto forceToStatelessRequired = compilerProductHelper.isForceToStatelessRequired();
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
/*
|
||||
* Copyright (C) 2019-2021 Intel Corporation
|
||||
* Copyright (C) 2019-2023 Intel Corporation
|
||||
*
|
||||
* SPDX-License-Identifier: MIT
|
||||
*
|
||||
@@ -10,6 +10,6 @@
|
||||
|
||||
namespace NEO {
|
||||
bool isDeferredDeleterEnabled() {
|
||||
return DebugManager.flags.EnableDeferredDeleter.get();
|
||||
return debugManager.flags.EnableDeferredDeleter.get();
|
||||
}
|
||||
} // namespace NEO
|
||||
|
||||
@@ -14,7 +14,7 @@
|
||||
namespace NEO {
|
||||
|
||||
void AppResourceHelper::copyResourceTagStr(char *dst, AllocationType type, size_t size) {
|
||||
if (DebugManager.flags.EnableResourceTags.get()) {
|
||||
if (debugManager.flags.EnableResourceTags.get()) {
|
||||
auto tag = getResourceTagStr(type);
|
||||
strcpy_s(dst, size, tag);
|
||||
}
|
||||
|
||||
@@ -18,8 +18,8 @@ namespace NEO {
|
||||
|
||||
template <typename GfxFamily>
|
||||
uint64_t BlitCommandsHelper<GfxFamily>::getMaxBlitWidth(const RootDeviceEnvironment &rootDeviceEnvironment) {
|
||||
if (DebugManager.flags.LimitBlitterMaxWidth.get() != -1) {
|
||||
return static_cast<uint64_t>(DebugManager.flags.LimitBlitterMaxWidth.get());
|
||||
if (debugManager.flags.LimitBlitterMaxWidth.get() != -1) {
|
||||
return static_cast<uint64_t>(debugManager.flags.LimitBlitterMaxWidth.get());
|
||||
}
|
||||
auto maxBlitWidthOverride = getMaxBlitWidthOverride(rootDeviceEnvironment);
|
||||
if (maxBlitWidthOverride > 0) {
|
||||
@@ -30,8 +30,8 @@ uint64_t BlitCommandsHelper<GfxFamily>::getMaxBlitWidth(const RootDeviceEnvironm
|
||||
|
||||
template <typename GfxFamily>
|
||||
uint64_t BlitCommandsHelper<GfxFamily>::getMaxBlitHeight(const RootDeviceEnvironment &rootDeviceEnvironment, bool isSystemMemoryPoolUsed) {
|
||||
if (DebugManager.flags.LimitBlitterMaxHeight.get() != -1) {
|
||||
return static_cast<uint64_t>(DebugManager.flags.LimitBlitterMaxHeight.get());
|
||||
if (debugManager.flags.LimitBlitterMaxHeight.get() != -1) {
|
||||
return static_cast<uint64_t>(debugManager.flags.LimitBlitterMaxHeight.get());
|
||||
}
|
||||
auto maxBlitHeightOverride = getMaxBlitHeightOverride(rootDeviceEnvironment, isSystemMemoryPoolUsed);
|
||||
if (maxBlitHeightOverride > 0) {
|
||||
@@ -63,8 +63,8 @@ size_t BlitCommandsHelper<GfxFamily>::estimatePreBlitCommandSize(const RootDevic
|
||||
template <typename GfxFamily>
|
||||
void BlitCommandsHelper<GfxFamily>::dispatchPostBlitCommand(LinearStream &linearStream, EncodeDummyBlitWaArgs &waArgs) {
|
||||
MiFlushArgs args{waArgs};
|
||||
if (DebugManager.flags.PostBlitCommand.get() != BlitterConstants::PostBlitMode::Default) {
|
||||
switch (DebugManager.flags.PostBlitCommand.get()) {
|
||||
if (debugManager.flags.PostBlitCommand.get() != BlitterConstants::PostBlitMode::Default) {
|
||||
switch (debugManager.flags.PostBlitCommand.get()) {
|
||||
case BlitterConstants::PostBlitMode::MiArbCheck:
|
||||
EncodeMiArbCheck<GfxFamily>::programWithWa(linearStream, std::nullopt, waArgs);
|
||||
return;
|
||||
@@ -88,8 +88,8 @@ template <typename GfxFamily>
|
||||
size_t BlitCommandsHelper<GfxFamily>::estimatePostBlitCommandSize(const RootDeviceEnvironment &rootDeviceEnvironment) {
|
||||
EncodeDummyBlitWaArgs waArgs{true, const_cast<RootDeviceEnvironment *>(&rootDeviceEnvironment)};
|
||||
|
||||
if (DebugManager.flags.PostBlitCommand.get() != BlitterConstants::PostBlitMode::Default) {
|
||||
switch (DebugManager.flags.PostBlitCommand.get()) {
|
||||
if (debugManager.flags.PostBlitCommand.get() != BlitterConstants::PostBlitMode::Default) {
|
||||
switch (debugManager.flags.PostBlitCommand.get()) {
|
||||
case BlitterConstants::PostBlitMode::MiArbCheck:
|
||||
return EncodeMiArbCheck<GfxFamily>::getCommandSizeWithWa(waArgs);
|
||||
case BlitterConstants::PostBlitMode::MiFlush:
|
||||
@@ -195,7 +195,7 @@ void BlitCommandsHelper<GfxFamily>::dispatchBlitCommandsForBufferPerRow(const Bl
|
||||
uint64_t width = 1;
|
||||
uint64_t height = 1;
|
||||
|
||||
PRINT_DEBUG_STRING(DebugManager.flags.PrintBlitDispatchDetails.get(), stdout,
|
||||
PRINT_DEBUG_STRING(debugManager.flags.PrintBlitDispatchDetails.get(), stdout,
|
||||
"\nBlit dispatch with AuxTranslationDirection %u ", static_cast<uint32_t>(blitProperties.auxTranslationDirection));
|
||||
|
||||
dispatchPreBlitCommand(linearStream, *waArgs.rootDeviceEnvironment);
|
||||
@@ -228,7 +228,7 @@ void BlitCommandsHelper<GfxFamily>::dispatchBlitCommandsForBufferPerRow(const Bl
|
||||
auto dstAddr = calculateBlitCommandDestinationBaseAddress(blitProperties, offset, row, slice);
|
||||
auto srcAddr = calculateBlitCommandSourceBaseAddress(blitProperties, offset, row, slice);
|
||||
|
||||
PRINT_DEBUG_STRING(DebugManager.flags.PrintBlitDispatchDetails.get(), stdout,
|
||||
PRINT_DEBUG_STRING(debugManager.flags.PrintBlitDispatchDetails.get(), stdout,
|
||||
"\nBlit command. width: %u, height: %u, srcAddr: %#llx, dstAddr: %#llx ", width, height, srcAddr, dstAddr);
|
||||
|
||||
bltCmd.setDestinationBaseAddress(dstAddr);
|
||||
@@ -322,7 +322,7 @@ void BlitCommandsHelper<GfxFamily>::dispatchBlitCommandsForImageRegion(const Bli
|
||||
for (uint32_t i = 0; i < blitProperties.copySize.z; i++) {
|
||||
appendSliceOffsets(blitProperties, bltCmd, i, *(waArgs.rootDeviceEnvironment), srcSlicePitch, dstSlicePitch);
|
||||
|
||||
if (DebugManager.flags.PrintImageBlitBlockCopyCmdDetails.get()) {
|
||||
if (debugManager.flags.PrintImageBlitBlockCopyCmdDetails.get()) {
|
||||
printImageBlitBlockCopyCommand(bltCmd, i);
|
||||
}
|
||||
|
||||
|
||||
@@ -46,8 +46,8 @@ void BlitCommandsHelper<GfxFamily>::appendBlitCommandsForFillBuffer(NEO::Graphic
|
||||
using XY_COLOR_BLT = typename GfxFamily::XY_COLOR_BLT;
|
||||
|
||||
uint32_t compressionFormat = rootDeviceEnvironment.getGmmClientContext()->getSurfaceStateCompressionFormat(GMM_RESOURCE_FORMAT::GMM_FORMAT_GENERIC_8BIT);
|
||||
if (DebugManager.flags.ForceBufferCompressionFormat.get() != -1) {
|
||||
compressionFormat = DebugManager.flags.ForceBufferCompressionFormat.get();
|
||||
if (debugManager.flags.ForceBufferCompressionFormat.get() != -1) {
|
||||
compressionFormat = debugManager.flags.ForceBufferCompressionFormat.get();
|
||||
}
|
||||
|
||||
if (dstAlloc->isCompressionEnabled()) {
|
||||
@@ -60,16 +60,16 @@ void BlitCommandsHelper<GfxFamily>::appendBlitCommandsForFillBuffer(NEO::Graphic
|
||||
appendExtraMemoryProperties(blitCmd, rootDeviceEnvironment);
|
||||
|
||||
auto mocs = rootDeviceEnvironment.getGmmHelper()->getMOCS(GMM_RESOURCE_USAGE_OCL_BUFFER_CACHELINE_MISALIGNED);
|
||||
if (DebugManager.flags.OverrideBlitterMocs.get() == 1) {
|
||||
if (debugManager.flags.OverrideBlitterMocs.get() == 1) {
|
||||
mocs = rootDeviceEnvironment.getGmmHelper()->getMOCS(GMM_RESOURCE_USAGE_OCL_BUFFER);
|
||||
}
|
||||
|
||||
blitCmd.setDestinationMOCS(mocs);
|
||||
|
||||
if (DebugManager.flags.OverrideBlitterTargetMemory.get() != -1) {
|
||||
if (DebugManager.flags.OverrideBlitterTargetMemory.get() == 0u) {
|
||||
if (debugManager.flags.OverrideBlitterTargetMemory.get() != -1) {
|
||||
if (debugManager.flags.OverrideBlitterTargetMemory.get() == 0u) {
|
||||
blitCmd.setDestinationTargetMemory(XY_COLOR_BLT::DESTINATION_TARGET_MEMORY::DESTINATION_TARGET_MEMORY_SYSTEM_MEM);
|
||||
} else if (DebugManager.flags.OverrideBlitterTargetMemory.get() == 1u) {
|
||||
} else if (debugManager.flags.OverrideBlitterTargetMemory.get() == 1u) {
|
||||
blitCmd.setDestinationTargetMemory(XY_COLOR_BLT::DESTINATION_TARGET_MEMORY::DESTINATION_TARGET_MEMORY_LOCAL_MEM);
|
||||
}
|
||||
}
|
||||
@@ -285,7 +285,7 @@ void BlitCommandsHelper<GfxFamily>::appendTilingEnable(typename GfxFamily::XY_CO
|
||||
|
||||
template <typename GfxFamily>
|
||||
void BlitCommandsHelper<GfxFamily>::programGlobalSequencerFlush(LinearStream &commandStream) {
|
||||
if (DebugManager.flags.GlobalSequencerFlushOnCopyEngine.get() != 0) {
|
||||
if (debugManager.flags.GlobalSequencerFlushOnCopyEngine.get() != 0) {
|
||||
using COMPARE_OPERATION = typename GfxFamily::MI_SEMAPHORE_WAIT::COMPARE_OPERATION;
|
||||
constexpr uint32_t globalInvalidationRegister = 0xB404u;
|
||||
LriHelper<GfxFamily>::program(&commandStream, globalInvalidationRegister, 1u, false);
|
||||
@@ -299,7 +299,7 @@ void BlitCommandsHelper<GfxFamily>::programGlobalSequencerFlush(LinearStream &co
|
||||
|
||||
template <typename GfxFamily>
|
||||
size_t BlitCommandsHelper<GfxFamily>::getSizeForGlobalSequencerFlush() {
|
||||
if (DebugManager.flags.GlobalSequencerFlushOnCopyEngine.get() != 0) {
|
||||
if (debugManager.flags.GlobalSequencerFlushOnCopyEngine.get() != 0) {
|
||||
return sizeof(typename GfxFamily::MI_LOAD_REGISTER_IMM) + NEO::EncodeSemaphore<GfxFamily>::getSizeMiSemaphoreWait();
|
||||
}
|
||||
return 0u;
|
||||
@@ -360,8 +360,8 @@ template <typename GfxFamily>
|
||||
bool BlitCommandsHelper<GfxFamily>::isDummyBlitWaNeeded(const EncodeDummyBlitWaArgs &waArgs) {
|
||||
if (waArgs.isWaRequired) {
|
||||
UNRECOVERABLE_IF(!waArgs.rootDeviceEnvironment);
|
||||
if (DebugManager.flags.ForceDummyBlitWa.get() != -1) {
|
||||
return DebugManager.flags.ForceDummyBlitWa.get();
|
||||
if (debugManager.flags.ForceDummyBlitWa.get() != -1) {
|
||||
return debugManager.flags.ForceDummyBlitWa.get();
|
||||
}
|
||||
auto &productHelper = waArgs.rootDeviceEnvironment->getProductHelper();
|
||||
return productHelper.isDummyBlitWaRequired();
|
||||
|
||||
@@ -14,11 +14,11 @@ namespace NEO {
|
||||
|
||||
template <PRODUCT_FAMILY gfxProduct>
|
||||
uint32_t L1CachePolicyHelper<gfxProduct>::getL1CachePolicy(bool isDebuggerActive) {
|
||||
if (DebugManager.flags.ForceAllResourcesUncached.get()) {
|
||||
if (debugManager.flags.ForceAllResourcesUncached.get()) {
|
||||
return L1CachePolicyHelper<gfxProduct>::getUncachedL1CachePolicy();
|
||||
}
|
||||
if (DebugManager.flags.OverrideL1CachePolicyInSurfaceStateAndStateless.get() != -1) {
|
||||
return DebugManager.flags.OverrideL1CachePolicyInSurfaceStateAndStateless.get();
|
||||
if (debugManager.flags.OverrideL1CachePolicyInSurfaceStateAndStateless.get() != -1) {
|
||||
return debugManager.flags.OverrideL1CachePolicyInSurfaceStateAndStateless.get();
|
||||
}
|
||||
return L1CachePolicyHelper<gfxProduct>::getDefaultL1CachePolicy(isDebuggerActive);
|
||||
}
|
||||
|
||||
@@ -14,8 +14,8 @@ namespace NEO {
|
||||
CompilerProductHelperCreateFunctionType compilerProductHelperFactory[IGFX_MAX_PRODUCT] = {};
|
||||
|
||||
uint32_t CompilerProductHelper::getHwIpVersion(const HardwareInfo &hwInfo) const {
|
||||
if (DebugManager.flags.OverrideHwIpVersion.get() != -1) {
|
||||
return DebugManager.flags.OverrideHwIpVersion.get();
|
||||
if (debugManager.flags.OverrideHwIpVersion.get() != -1) {
|
||||
return debugManager.flags.OverrideHwIpVersion.get();
|
||||
}
|
||||
return getProductConfigFromHwInfo(hwInfo);
|
||||
}
|
||||
|
||||
@@ -81,8 +81,8 @@ std::string CompilerProductHelperHw<gfxProduct>::getDeviceExtensions(const Hardw
|
||||
"cl_intel_split_work_group_barrier ";
|
||||
|
||||
auto supportsFp64 = hwInfo.capabilityTable.ftrSupportsFP64;
|
||||
if (DebugManager.flags.OverrideDefaultFP64Settings.get() != -1) {
|
||||
supportsFp64 = DebugManager.flags.OverrideDefaultFP64Settings.get();
|
||||
if (debugManager.flags.OverrideDefaultFP64Settings.get() != -1) {
|
||||
supportsFp64 = debugManager.flags.OverrideDefaultFP64Settings.get();
|
||||
}
|
||||
if (supportsFp64) {
|
||||
extensions += "cl_khr_fp64 ";
|
||||
@@ -94,12 +94,12 @@ std::string CompilerProductHelperHw<gfxProduct>::getDeviceExtensions(const Hardw
|
||||
|
||||
auto enabledClVersion = hwInfo.capabilityTable.clVersionSupport;
|
||||
auto ocl21FeaturesEnabled = hwInfo.capabilityTable.supportsOcl21Features;
|
||||
if (DebugManager.flags.ForceOCLVersion.get() != 0) {
|
||||
enabledClVersion = DebugManager.flags.ForceOCLVersion.get();
|
||||
if (debugManager.flags.ForceOCLVersion.get() != 0) {
|
||||
enabledClVersion = debugManager.flags.ForceOCLVersion.get();
|
||||
ocl21FeaturesEnabled = (enabledClVersion == 21);
|
||||
}
|
||||
if (DebugManager.flags.ForceOCL21FeaturesSupport.get() != -1) {
|
||||
ocl21FeaturesEnabled = DebugManager.flags.ForceOCL21FeaturesSupport.get();
|
||||
if (debugManager.flags.ForceOCL21FeaturesSupport.get() != -1) {
|
||||
ocl21FeaturesEnabled = debugManager.flags.ForceOCL21FeaturesSupport.get();
|
||||
}
|
||||
if (ocl21FeaturesEnabled) {
|
||||
|
||||
@@ -120,20 +120,20 @@ std::string CompilerProductHelperHw<gfxProduct>::getDeviceExtensions(const Hardw
|
||||
extensions += "cl_ext_float_atomics ";
|
||||
}
|
||||
|
||||
if (enabledClVersion >= 30 && DebugManager.flags.ClKhrExternalMemoryExtension.get()) {
|
||||
if (enabledClVersion >= 30 && debugManager.flags.ClKhrExternalMemoryExtension.get()) {
|
||||
extensions += "cl_khr_external_memory ";
|
||||
}
|
||||
|
||||
if (DebugManager.flags.EnableNV12.get() && hwInfo.capabilityTable.supportsImages) {
|
||||
if (debugManager.flags.EnableNV12.get() && hwInfo.capabilityTable.supportsImages) {
|
||||
extensions += "cl_intel_planar_yuv ";
|
||||
}
|
||||
if (DebugManager.flags.EnablePackedYuv.get() && hwInfo.capabilityTable.supportsImages) {
|
||||
if (debugManager.flags.EnablePackedYuv.get() && hwInfo.capabilityTable.supportsImages) {
|
||||
extensions += "cl_intel_packed_yuv ";
|
||||
}
|
||||
|
||||
auto supportsVme = hwInfo.capabilityTable.supportsVme;
|
||||
if (DebugManager.flags.EnableIntelVme.get() != -1) {
|
||||
supportsVme = !!DebugManager.flags.EnableIntelVme.get();
|
||||
if (debugManager.flags.EnableIntelVme.get() != -1) {
|
||||
supportsVme = !!debugManager.flags.EnableIntelVme.get();
|
||||
}
|
||||
|
||||
if (supportsVme) {
|
||||
@@ -144,8 +144,8 @@ std::string CompilerProductHelperHw<gfxProduct>::getDeviceExtensions(const Hardw
|
||||
}
|
||||
|
||||
auto supportsAdvancedVme = hwInfo.capabilityTable.supportsVme;
|
||||
if (DebugManager.flags.EnableIntelAdvancedVme.get() != -1) {
|
||||
supportsAdvancedVme = !!DebugManager.flags.EnableIntelAdvancedVme.get();
|
||||
if (debugManager.flags.EnableIntelAdvancedVme.get() != -1) {
|
||||
supportsAdvancedVme = !!debugManager.flags.EnableIntelAdvancedVme.get();
|
||||
}
|
||||
if (supportsAdvancedVme) {
|
||||
extensions += "cl_intel_advanced_motion_estimation ";
|
||||
|
||||
@@ -14,7 +14,7 @@ namespace NEO {
|
||||
|
||||
template <PRODUCT_FAMILY gfxProduct>
|
||||
bool CompilerProductHelperHw<gfxProduct>::isForceToStatelessRequired() const {
|
||||
if (DebugManager.flags.DisableForceToStateless.get()) {
|
||||
if (debugManager.flags.DisableForceToStateless.get()) {
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
/*
|
||||
* Copyright (C) 2018-2022 Intel Corporation
|
||||
* Copyright (C) 2018-2023 Intel Corporation
|
||||
*
|
||||
* SPDX-License-Identifier: MIT
|
||||
*
|
||||
@@ -15,7 +15,7 @@
|
||||
|
||||
namespace NEO {
|
||||
void debugBreak(int line, const char *file) {
|
||||
if (DebugManager.flags.EnableDebugBreak.get()) {
|
||||
if (debugManager.flags.EnableDebugBreak.get()) {
|
||||
printf("Assert was called at %d line in file:\n%s\n", line, file);
|
||||
fflush(stdout);
|
||||
assert(false);
|
||||
|
||||
@@ -87,8 +87,8 @@ bool isBcsVirtualEngineEnabled(aub_stream::EngineType engineType) {
|
||||
bool useVirtualEnginesForBcs = engineType == aub_stream::EngineType::ENGINE_BCS ||
|
||||
engineType == aub_stream::EngineType::ENGINE_BCS1;
|
||||
|
||||
if (DebugManager.flags.UseDrmVirtualEnginesForBcs.get() != -1) {
|
||||
useVirtualEnginesForBcs = !!DebugManager.flags.UseDrmVirtualEnginesForBcs.get();
|
||||
if (debugManager.flags.UseDrmVirtualEnginesForBcs.get() != -1) {
|
||||
useVirtualEnginesForBcs = !!debugManager.flags.UseDrmVirtualEnginesForBcs.get();
|
||||
}
|
||||
|
||||
return useVirtualEnginesForBcs;
|
||||
@@ -97,8 +97,8 @@ bool isBcsVirtualEngineEnabled(aub_stream::EngineType engineType) {
|
||||
aub_stream::EngineType getBcsEngineType(const RootDeviceEnvironment &rootDeviceEnvironment, const DeviceBitfield &deviceBitfield, SelectorCopyEngine &selectorCopyEngine, bool internalUsage) {
|
||||
auto &hwInfo = *rootDeviceEnvironment.getHardwareInfo();
|
||||
auto &productHelper = rootDeviceEnvironment.getHelper<ProductHelper>();
|
||||
if (DebugManager.flags.ForceBcsEngineIndex.get() != -1) {
|
||||
auto index = DebugManager.flags.ForceBcsEngineIndex.get();
|
||||
if (debugManager.flags.ForceBcsEngineIndex.get() != -1) {
|
||||
auto index = debugManager.flags.ForceBcsEngineIndex.get();
|
||||
UNRECOVERABLE_IF(index > 8);
|
||||
|
||||
return (index == 0) ? aub_stream::EngineType::ENGINE_BCS
|
||||
@@ -110,17 +110,17 @@ aub_stream::EngineType getBcsEngineType(const RootDeviceEnvironment &rootDeviceE
|
||||
}
|
||||
|
||||
if (internalUsage) {
|
||||
if (DebugManager.flags.ForceBCSForInternalCopyEngine.get() != -1) {
|
||||
return DebugManager.flags.ForceBCSForInternalCopyEngine.get() == 0 ? aub_stream::EngineType::ENGINE_BCS
|
||||
: static_cast<aub_stream::EngineType>(aub_stream::EngineType::ENGINE_BCS1 + DebugManager.flags.ForceBCSForInternalCopyEngine.get() - 1);
|
||||
if (debugManager.flags.ForceBCSForInternalCopyEngine.get() != -1) {
|
||||
return debugManager.flags.ForceBCSForInternalCopyEngine.get() == 0 ? aub_stream::EngineType::ENGINE_BCS
|
||||
: static_cast<aub_stream::EngineType>(aub_stream::EngineType::ENGINE_BCS1 + debugManager.flags.ForceBCSForInternalCopyEngine.get() - 1);
|
||||
}
|
||||
return aub_stream::ENGINE_BCS3;
|
||||
}
|
||||
|
||||
auto enableSelector = productHelper.isCopyEngineSelectorEnabled(hwInfo);
|
||||
|
||||
if (DebugManager.flags.EnableCopyEngineSelector.get() != -1) {
|
||||
enableSelector = DebugManager.flags.EnableCopyEngineSelector.get();
|
||||
if (debugManager.flags.EnableCopyEngineSelector.get() != -1) {
|
||||
enableSelector = debugManager.flags.EnableCopyEngineSelector.get();
|
||||
}
|
||||
|
||||
if (enableSelector) {
|
||||
@@ -192,8 +192,8 @@ aub_stream::EngineType selectLinkCopyEngine(const RootDeviceEnvironment &rootDev
|
||||
auto &hwInfo = *rootDeviceEnvironment.getHardwareInfo();
|
||||
auto enableCmdQRoundRobindBcsEngineAssign = false;
|
||||
|
||||
if (DebugManager.flags.EnableCmdQRoundRobindBcsEngineAssign.get() != -1) {
|
||||
enableCmdQRoundRobindBcsEngineAssign = DebugManager.flags.EnableCmdQRoundRobindBcsEngineAssign.get();
|
||||
if (debugManager.flags.EnableCmdQRoundRobindBcsEngineAssign.get() != -1) {
|
||||
enableCmdQRoundRobindBcsEngineAssign = debugManager.flags.EnableCmdQRoundRobindBcsEngineAssign.get();
|
||||
}
|
||||
|
||||
if (enableCmdQRoundRobindBcsEngineAssign) {
|
||||
@@ -203,8 +203,8 @@ aub_stream::EngineType selectLinkCopyEngine(const RootDeviceEnvironment &rootDev
|
||||
auto engineOffset = 0u;
|
||||
auto mainCE = false;
|
||||
|
||||
if (DebugManager.flags.EnableCmdQRoundRobindBcsEngineAssignStartingValue.get() != -1) {
|
||||
engineOffset = DebugManager.flags.EnableCmdQRoundRobindBcsEngineAssignStartingValue.get();
|
||||
if (debugManager.flags.EnableCmdQRoundRobindBcsEngineAssignStartingValue.get() != -1) {
|
||||
engineOffset = debugManager.flags.EnableCmdQRoundRobindBcsEngineAssignStartingValue.get();
|
||||
mainCE = engineOffset == 0;
|
||||
}
|
||||
|
||||
@@ -212,8 +212,8 @@ aub_stream::EngineType selectLinkCopyEngine(const RootDeviceEnvironment &rootDev
|
||||
bcsRoundRobinLimit++;
|
||||
}
|
||||
|
||||
if (DebugManager.flags.EnableCmdQRoundRobindBcsEngineAssignLimit.get() != -1) {
|
||||
bcsRoundRobinLimit = DebugManager.flags.EnableCmdQRoundRobindBcsEngineAssignLimit.get();
|
||||
if (debugManager.flags.EnableCmdQRoundRobindBcsEngineAssignLimit.get() != -1) {
|
||||
bcsRoundRobinLimit = debugManager.flags.EnableCmdQRoundRobindBcsEngineAssignLimit.get();
|
||||
}
|
||||
|
||||
do {
|
||||
|
||||
@@ -33,21 +33,21 @@ std::unique_ptr<GfxCoreHelper> GfxCoreHelper::create(const GFXCORE_FAMILY gfxCor
|
||||
}
|
||||
|
||||
bool GfxCoreHelper::compressedBuffersSupported(const HardwareInfo &hwInfo) {
|
||||
if (DebugManager.flags.RenderCompressedBuffersEnabled.get() != -1) {
|
||||
return !!DebugManager.flags.RenderCompressedBuffersEnabled.get();
|
||||
if (debugManager.flags.RenderCompressedBuffersEnabled.get() != -1) {
|
||||
return !!debugManager.flags.RenderCompressedBuffersEnabled.get();
|
||||
}
|
||||
return hwInfo.capabilityTable.ftrRenderCompressedBuffers;
|
||||
}
|
||||
|
||||
bool GfxCoreHelper::compressedImagesSupported(const HardwareInfo &hwInfo) {
|
||||
if (DebugManager.flags.RenderCompressedImagesEnabled.get() != -1) {
|
||||
return !!DebugManager.flags.RenderCompressedImagesEnabled.get();
|
||||
if (debugManager.flags.RenderCompressedImagesEnabled.get() != -1) {
|
||||
return !!debugManager.flags.RenderCompressedImagesEnabled.get();
|
||||
}
|
||||
return hwInfo.capabilityTable.ftrRenderCompressedImages;
|
||||
}
|
||||
|
||||
bool GfxCoreHelper::cacheFlushAfterWalkerSupported(const HardwareInfo &hwInfo) {
|
||||
int32_t dbgFlag = DebugManager.flags.EnableCacheFlushAfterWalker.get();
|
||||
int32_t dbgFlag = debugManager.flags.EnableCacheFlushAfterWalker.get();
|
||||
if (dbgFlag == 1) {
|
||||
return true;
|
||||
} else if (dbgFlag == 0) {
|
||||
@@ -60,18 +60,18 @@ uint32_t GfxCoreHelper::getMaxThreadsForVfe(const HardwareInfo &hwInfo) {
|
||||
uint32_t threadsPerEU = (hwInfo.gtSystemInfo.ThreadCount / hwInfo.gtSystemInfo.EUCount) + hwInfo.capabilityTable.extraQuantityThreadsPerEU;
|
||||
auto maxHwThreadsCapable = hwInfo.gtSystemInfo.EUCount * threadsPerEU;
|
||||
auto maxHwThreadsReturned = maxHwThreadsCapable;
|
||||
if (DebugManager.flags.MaxHwThreadsPercent.get() != 0) {
|
||||
maxHwThreadsReturned = int(maxHwThreadsCapable * (DebugManager.flags.MaxHwThreadsPercent.get() / 100.0f));
|
||||
if (debugManager.flags.MaxHwThreadsPercent.get() != 0) {
|
||||
maxHwThreadsReturned = int(maxHwThreadsCapable * (debugManager.flags.MaxHwThreadsPercent.get() / 100.0f));
|
||||
}
|
||||
if (DebugManager.flags.MinHwThreadsUnoccupied.get() != 0) {
|
||||
maxHwThreadsReturned = std::min(maxHwThreadsReturned, maxHwThreadsCapable - DebugManager.flags.MinHwThreadsUnoccupied.get());
|
||||
if (debugManager.flags.MinHwThreadsUnoccupied.get() != 0) {
|
||||
maxHwThreadsReturned = std::min(maxHwThreadsReturned, maxHwThreadsCapable - debugManager.flags.MinHwThreadsUnoccupied.get());
|
||||
}
|
||||
return maxHwThreadsReturned;
|
||||
}
|
||||
|
||||
uint32_t GfxCoreHelper::getSubDevicesCount(const HardwareInfo *pHwInfo) {
|
||||
if (DebugManager.flags.CreateMultipleSubDevices.get() > 0) {
|
||||
return DebugManager.flags.CreateMultipleSubDevices.get();
|
||||
if (debugManager.flags.CreateMultipleSubDevices.get() > 0) {
|
||||
return debugManager.flags.CreateMultipleSubDevices.get();
|
||||
} else if (pHwInfo->gtSystemInfo.MultiTileArchInfo.IsValid && pHwInfo->gtSystemInfo.MultiTileArchInfo.TileCount > 0u) {
|
||||
return pHwInfo->gtSystemInfo.MultiTileArchInfo.TileCount;
|
||||
} else {
|
||||
|
||||
@@ -34,8 +34,8 @@ const AuxTranslationMode GfxCoreHelperHw<Family>::defaultAuxTranslationMode = Au
|
||||
|
||||
template <typename Family>
|
||||
bool GfxCoreHelperHw<Family>::isBufferSizeSuitableForCompression(const size_t size) const {
|
||||
if (DebugManager.flags.OverrideBufferSuitableForRenderCompression.get() != -1) {
|
||||
return !!DebugManager.flags.OverrideBufferSuitableForRenderCompression.get();
|
||||
if (debugManager.flags.OverrideBufferSuitableForRenderCompression.get() != -1) {
|
||||
return !!debugManager.flags.OverrideBufferSuitableForRenderCompression.get();
|
||||
}
|
||||
return size > KB;
|
||||
}
|
||||
@@ -62,7 +62,7 @@ SipKernelType GfxCoreHelperHw<Family>::getSipKernelType(bool debuggingActive) co
|
||||
if (!debuggingActive) {
|
||||
return SipKernelType::Csr;
|
||||
}
|
||||
return DebugManager.flags.UseBindlessDebugSip.get() ? SipKernelType::DbgBindless : SipKernelType::DbgCsr;
|
||||
return debugManager.flags.UseBindlessDebugSip.get() ? SipKernelType::DbgBindless : SipKernelType::DbgCsr;
|
||||
}
|
||||
|
||||
template <typename Family>
|
||||
@@ -137,8 +137,8 @@ void GfxCoreHelperHw<Family>::setRenderSurfaceStateForScratchResource(const Root
|
||||
} else {
|
||||
state.setMemoryObjectControlState(gmmHelper->getMOCS(GMM_RESOURCE_USAGE_OCL_BUFFER_CACHELINE_MISALIGNED));
|
||||
}
|
||||
if (DebugManager.flags.OverrideMocsIndexForScratchSpace.get() != -1) {
|
||||
auto mocsIndex = static_cast<uint32_t>(DebugManager.flags.OverrideMocsIndexForScratchSpace.get()) << 1;
|
||||
if (debugManager.flags.OverrideMocsIndexForScratchSpace.get() != -1) {
|
||||
auto mocsIndex = static_cast<uint32_t>(debugManager.flags.OverrideMocsIndexForScratchSpace.get()) << 1;
|
||||
state.setMemoryObjectControlState(mocsIndex);
|
||||
}
|
||||
|
||||
@@ -163,9 +163,9 @@ void NEO::GfxCoreHelperHw<GfxFamily>::setL1CachePolicy(bool useL1Cache, typename
|
||||
|
||||
template <typename Family>
|
||||
bool GfxCoreHelperHw<Family>::getEnableLocalMemory(const HardwareInfo &hwInfo) const {
|
||||
if (DebugManager.flags.EnableLocalMemory.get() != -1) {
|
||||
return DebugManager.flags.EnableLocalMemory.get();
|
||||
} else if (DebugManager.flags.AUBDumpForceAllToLocalMemory.get()) {
|
||||
if (debugManager.flags.EnableLocalMemory.get() != -1) {
|
||||
return debugManager.flags.EnableLocalMemory.get();
|
||||
} else if (debugManager.flags.AUBDumpForceAllToLocalMemory.get()) {
|
||||
return true;
|
||||
}
|
||||
|
||||
@@ -180,8 +180,8 @@ bool GfxCoreHelperHw<Family>::is1MbAlignmentSupported(const HardwareInfo &hwInfo
|
||||
template <typename Family>
|
||||
AuxTranslationMode GfxCoreHelperHw<Family>::getAuxTranslationMode(const HardwareInfo &hwInfo) {
|
||||
auto mode = GfxCoreHelperHw<Family>::defaultAuxTranslationMode;
|
||||
if (DebugManager.flags.ForceAuxTranslationMode.get() != -1) {
|
||||
mode = static_cast<AuxTranslationMode>(DebugManager.flags.ForceAuxTranslationMode.get());
|
||||
if (debugManager.flags.ForceAuxTranslationMode.get() != -1) {
|
||||
mode = static_cast<AuxTranslationMode>(debugManager.flags.ForceAuxTranslationMode.get());
|
||||
}
|
||||
|
||||
if (mode == AuxTranslationMode::Blit && !hwInfo.capabilityTable.blitterOperationsSupported) {
|
||||
@@ -270,7 +270,7 @@ void MemorySynchronizationCommands<GfxFamily>::setSingleBarrier(void *commandsBu
|
||||
pipeControl.setGenericMediaStateClear(args.genericMediaStateClear);
|
||||
}
|
||||
|
||||
if (DebugManager.flags.FlushAllCaches.get()) {
|
||||
if (debugManager.flags.FlushAllCaches.get()) {
|
||||
pipeControl.setDcFlushEnable(true);
|
||||
pipeControl.setRenderTargetCacheFlushEnable(true);
|
||||
pipeControl.setInstructionCacheInvalidateEnable(true);
|
||||
@@ -281,7 +281,7 @@ void MemorySynchronizationCommands<GfxFamily>::setSingleBarrier(void *commandsBu
|
||||
pipeControl.setStateCacheInvalidationEnable(true);
|
||||
pipeControl.setTlbInvalidate(true);
|
||||
}
|
||||
if (DebugManager.flags.DoNotFlushCaches.get()) {
|
||||
if (debugManager.flags.DoNotFlushCaches.get()) {
|
||||
pipeControl.setDcFlushEnable(false);
|
||||
pipeControl.setRenderTargetCacheFlushEnable(false);
|
||||
pipeControl.setInstructionCacheInvalidateEnable(false);
|
||||
@@ -447,15 +447,15 @@ template <typename GfxFamily>
|
||||
std::unique_ptr<TagAllocatorBase> GfxCoreHelperHw<GfxFamily>::createTimestampPacketAllocator(const RootDeviceIndicesContainer &rootDeviceIndices, MemoryManager *memoryManager,
|
||||
size_t initialTagCount, CommandStreamReceiverType csrType, DeviceBitfield deviceBitfield) const {
|
||||
bool doNotReleaseNodes = (csrType > CommandStreamReceiverType::CSR_HW) ||
|
||||
DebugManager.flags.DisableTimestampPacketOptimizations.get();
|
||||
debugManager.flags.DisableTimestampPacketOptimizations.get();
|
||||
|
||||
auto tagAlignment = getTimestampPacketAllocatorAlignment();
|
||||
|
||||
if (DebugManager.flags.OverrideTimestampPacketSize.get() != -1) {
|
||||
if (DebugManager.flags.OverrideTimestampPacketSize.get() == 4) {
|
||||
if (debugManager.flags.OverrideTimestampPacketSize.get() != -1) {
|
||||
if (debugManager.flags.OverrideTimestampPacketSize.get() == 4) {
|
||||
using TimestampPackets32T = TimestampPackets<uint32_t, GfxFamily::timestampPacketCount>;
|
||||
return std::make_unique<TagAllocator<TimestampPackets32T>>(rootDeviceIndices, memoryManager, initialTagCount, tagAlignment, sizeof(TimestampPackets32T), doNotReleaseNodes, deviceBitfield);
|
||||
} else if (DebugManager.flags.OverrideTimestampPacketSize.get() == 8) {
|
||||
} else if (debugManager.flags.OverrideTimestampPacketSize.get() == 8) {
|
||||
using TimestampPackets64T = TimestampPackets<uint64_t, GfxFamily::timestampPacketCount>;
|
||||
return std::make_unique<TagAllocator<TimestampPackets64T>>(rootDeviceIndices, memoryManager, initialTagCount, tagAlignment, sizeof(TimestampPackets64T), doNotReleaseNodes, deviceBitfield);
|
||||
} else {
|
||||
@@ -481,10 +481,10 @@ size_t GfxCoreHelperHw<GfxFamily>::getSingleTimestampPacketSize() const {
|
||||
|
||||
template <typename GfxFamily>
|
||||
size_t GfxCoreHelperHw<GfxFamily>::getSingleTimestampPacketSizeHw() {
|
||||
if (DebugManager.flags.OverrideTimestampPacketSize.get() != -1) {
|
||||
if (DebugManager.flags.OverrideTimestampPacketSize.get() == 4) {
|
||||
if (debugManager.flags.OverrideTimestampPacketSize.get() != -1) {
|
||||
if (debugManager.flags.OverrideTimestampPacketSize.get() == 4) {
|
||||
return TimestampPackets<uint32_t, GfxFamily::timestampPacketCount>::getSinglePacketSize();
|
||||
} else if (DebugManager.flags.OverrideTimestampPacketSize.get() == 8) {
|
||||
} else if (debugManager.flags.OverrideTimestampPacketSize.get() == 8) {
|
||||
return TimestampPackets<uint64_t, GfxFamily::timestampPacketCount>::getSinglePacketSize();
|
||||
} else {
|
||||
UNRECOVERABLE_IF(true);
|
||||
@@ -651,16 +651,16 @@ uint64_t GfxCoreHelperHw<GfxFamily>::getPatIndex(CacheRegion cacheRegion, CacheP
|
||||
|
||||
template <typename gfxProduct>
|
||||
bool GfxCoreHelperHw<gfxProduct>::copyThroughLockedPtrEnabled(const HardwareInfo &hwInfo, const ProductHelper &productHelper) const {
|
||||
if (DebugManager.flags.ExperimentalCopyThroughLock.get() != -1) {
|
||||
return DebugManager.flags.ExperimentalCopyThroughLock.get() == 1;
|
||||
if (debugManager.flags.ExperimentalCopyThroughLock.get() != -1) {
|
||||
return debugManager.flags.ExperimentalCopyThroughLock.get() == 1;
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
template <typename gfxProduct>
|
||||
uint32_t GfxCoreHelperHw<gfxProduct>::getAmountOfAllocationsToFill() const {
|
||||
if (DebugManager.flags.SetAmountOfReusableAllocations.get() != -1) {
|
||||
return DebugManager.flags.SetAmountOfReusableAllocations.get();
|
||||
if (debugManager.flags.SetAmountOfReusableAllocations.get() != -1) {
|
||||
return debugManager.flags.SetAmountOfReusableAllocations.get();
|
||||
}
|
||||
return 0u;
|
||||
}
|
||||
|
||||
@@ -41,8 +41,8 @@ bool GfxCoreHelperHw<GfxFamily>::isEngineTypeRemappingToHwSpecificRequired() con
|
||||
|
||||
template <typename Family>
|
||||
size_t GfxCoreHelperHw<Family>::getPaddingForISAAllocation() const {
|
||||
if (DebugManager.flags.ForceExtendedKernelIsaSize.get() >= 1) {
|
||||
return 512 + (MemoryConstants::pageSize * DebugManager.flags.ForceExtendedKernelIsaSize.get());
|
||||
if (debugManager.flags.ForceExtendedKernelIsaSize.get() >= 1) {
|
||||
return 512 + (MemoryConstants::pageSize * debugManager.flags.ForceExtendedKernelIsaSize.get());
|
||||
}
|
||||
return 512;
|
||||
}
|
||||
|
||||
@@ -21,12 +21,12 @@ inline void MemorySynchronizationCommands<GfxFamily>::setBarrierExtraProperties(
|
||||
pipeControl.setWorkloadPartitionIdOffsetEnable(args.workloadPartitionOffset);
|
||||
pipeControl.setAmfsFlushEnable(args.amfsFlushEnable);
|
||||
|
||||
if (DebugManager.flags.FlushAllCaches.get()) {
|
||||
if (debugManager.flags.FlushAllCaches.get()) {
|
||||
pipeControl.setHdcPipelineFlush(true);
|
||||
pipeControl.setUnTypedDataPortCacheFlush(true);
|
||||
pipeControl.setCompressionControlSurfaceCcsFlush(true);
|
||||
}
|
||||
if (DebugManager.flags.DoNotFlushCaches.get()) {
|
||||
if (debugManager.flags.DoNotFlushCaches.get()) {
|
||||
pipeControl.setHdcPipelineFlush(false);
|
||||
pipeControl.setUnTypedDataPortCacheFlush(false);
|
||||
pipeControl.setCompressionControlSurfaceCcsFlush(false);
|
||||
|
||||
@@ -12,9 +12,9 @@ namespace NEO {
|
||||
|
||||
template <typename Family>
|
||||
bool GfxCoreHelperHw<Family>::isFenceAllocationRequired(const HardwareInfo &hwInfo) const {
|
||||
if ((DebugManager.flags.ProgramGlobalFenceAsMiMemFenceCommandInCommandStream.get() == 0) &&
|
||||
(DebugManager.flags.ProgramGlobalFenceAsPostSyncOperationInComputeWalker.get() == 0) &&
|
||||
(DebugManager.flags.ProgramGlobalFenceAsKernelInstructionInEUKernel.get() == 0)) {
|
||||
if ((debugManager.flags.ProgramGlobalFenceAsMiMemFenceCommandInCommandStream.get() == 0) &&
|
||||
(debugManager.flags.ProgramGlobalFenceAsPostSyncOperationInComputeWalker.get() == 0) &&
|
||||
(debugManager.flags.ProgramGlobalFenceAsKernelInstructionInEUKernel.get() == 0)) {
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
@@ -51,8 +51,8 @@ bool GfxCoreHelperHw<Family>::isCooperativeDispatchSupported(const EngineGroupTy
|
||||
template <typename Family>
|
||||
uint32_t GfxCoreHelperHw<Family>::adjustMaxWorkGroupCount(uint32_t maxWorkGroupCount, const EngineGroupType engineGroupType,
|
||||
const RootDeviceEnvironment &rootDeviceEnvironment, bool isEngineInstanced) const {
|
||||
if ((DebugManager.flags.ForceTheoreticalMaxWorkGroupCount.get()) ||
|
||||
(DebugManager.flags.OverrideMaxWorkGroupCount.get() != -1)) {
|
||||
if ((debugManager.flags.ForceTheoreticalMaxWorkGroupCount.get()) ||
|
||||
(debugManager.flags.OverrideMaxWorkGroupCount.get() != -1)) {
|
||||
return maxWorkGroupCount;
|
||||
}
|
||||
if (!isCooperativeDispatchSupported(engineGroupType, rootDeviceEnvironment)) {
|
||||
@@ -80,8 +80,8 @@ bool GfxCoreHelperHw<Family>::isEngineTypeRemappingToHwSpecificRequired() const
|
||||
|
||||
template <typename Family>
|
||||
size_t GfxCoreHelperHw<Family>::getPaddingForISAAllocation() const {
|
||||
if (DebugManager.flags.ForceExtendedKernelIsaSize.get() >= 1) {
|
||||
return 0xE00 + (MemoryConstants::pageSize * DebugManager.flags.ForceExtendedKernelIsaSize.get());
|
||||
if (debugManager.flags.ForceExtendedKernelIsaSize.get() >= 1) {
|
||||
return 0xE00 + (MemoryConstants::pageSize * debugManager.flags.ForceExtendedKernelIsaSize.get());
|
||||
}
|
||||
return 0xE00;
|
||||
}
|
||||
|
||||
@@ -15,8 +15,8 @@ inline bool GfxCoreHelperHw<GfxFamily>::isFusedEuDispatchEnabled(const HardwareI
|
||||
auto fusedEuDispatchEnabled = !hwInfo.workaroundTable.flags.waDisableFusedThreadScheduling;
|
||||
fusedEuDispatchEnabled &= hwInfo.capabilityTable.fusedEuEnabled;
|
||||
|
||||
if (DebugManager.flags.CFEFusedEUDispatch.get() != -1) {
|
||||
fusedEuDispatchEnabled = (DebugManager.flags.CFEFusedEUDispatch.get() == 0);
|
||||
if (debugManager.flags.CFEFusedEUDispatch.get() != -1) {
|
||||
fusedEuDispatchEnabled = (debugManager.flags.CFEFusedEUDispatch.get() == 0);
|
||||
}
|
||||
return fusedEuDispatchEnabled;
|
||||
}
|
||||
|
||||
@@ -21,8 +21,8 @@ namespace NEO {
|
||||
|
||||
template <typename GfxFamily>
|
||||
uint32_t GfxCoreHelperHw<GfxFamily>::getComputeUnitsUsedForScratch(const RootDeviceEnvironment &rootDeviceEnvironment) const {
|
||||
if (DebugManager.flags.OverrideNumComputeUnitsForScratch.get() != -1) {
|
||||
return static_cast<uint32_t>(DebugManager.flags.OverrideNumComputeUnitsForScratch.get());
|
||||
if (debugManager.flags.OverrideNumComputeUnitsForScratch.get() != -1) {
|
||||
return static_cast<uint32_t>(debugManager.flags.OverrideNumComputeUnitsForScratch.get());
|
||||
}
|
||||
|
||||
auto &productHelper = rootDeviceEnvironment.getHelper<ProductHelper>();
|
||||
@@ -70,7 +70,7 @@ const EngineInstancesContainer GfxCoreHelperHw<GfxFamily>::getGpgpuEngineInstanc
|
||||
}
|
||||
}
|
||||
|
||||
if ((DebugManager.flags.NodeOrdinal.get() == static_cast<int32_t>(aub_stream::EngineType::ENGINE_RCS)) ||
|
||||
if ((debugManager.flags.NodeOrdinal.get() == static_cast<int32_t>(aub_stream::EngineType::ENGINE_RCS)) ||
|
||||
hwInfo.featureTable.flags.ftrRcsNode) {
|
||||
engines.push_back({aub_stream::ENGINE_RCS, EngineUsage::Regular});
|
||||
}
|
||||
@@ -103,7 +103,7 @@ EngineGroupType GfxCoreHelperHw<GfxFamily>::getEngineGroupType(aub_stream::Engin
|
||||
template <typename GfxFamily>
|
||||
uint32_t GfxCoreHelperHw<GfxFamily>::getMocsIndex(const GmmHelper &gmmHelper, bool l3enabled, bool l1enabled) const {
|
||||
if (l3enabled) {
|
||||
if (DebugManager.flags.ForceL1Caching.get() == 0) {
|
||||
if (debugManager.flags.ForceL1Caching.get() == 0) {
|
||||
if (l1enabled) {
|
||||
return gmmHelper.getMOCS(GMM_RESOURCE_USAGE_OCL_BUFFER_CONST) >> 1;
|
||||
}
|
||||
@@ -135,8 +135,8 @@ template <typename GfxFamily>
|
||||
aub_stream::MMIOList GfxCoreHelperHw<GfxFamily>::getExtraMmioList(const HardwareInfo &hwInfo, const GmmHelper &gmmHelper) const {
|
||||
aub_stream::MMIOList mmioList;
|
||||
|
||||
if (DebugManager.flags.EnableStatelessCompressionWithUnifiedMemory.get()) {
|
||||
auto format = static_cast<uint32_t>(DebugManager.flags.FormatForStatelessCompressionWithUnifiedMemory.get());
|
||||
if (debugManager.flags.EnableStatelessCompressionWithUnifiedMemory.get()) {
|
||||
auto format = static_cast<uint32_t>(debugManager.flags.FormatForStatelessCompressionWithUnifiedMemory.get());
|
||||
|
||||
UNRECOVERABLE_IF(format > 0x1F);
|
||||
|
||||
@@ -154,7 +154,7 @@ aub_stream::MMIOList GfxCoreHelperHw<GfxFamily>::getExtraMmioList(const Hardware
|
||||
template <typename GfxFamily>
|
||||
bool MemorySynchronizationCommands<GfxFamily>::isBarrierWaRequired(const RootDeviceEnvironment &rootDeviceEnvironment) {
|
||||
auto &hwInfo = *rootDeviceEnvironment.getHardwareInfo();
|
||||
if (DebugManager.flags.DisablePipeControlPrecedingPostSyncCommand.get() == 1) {
|
||||
if (debugManager.flags.DisablePipeControlPrecedingPostSyncCommand.get() == 1) {
|
||||
return hwInfo.featureTable.flags.ftrLocalMemory;
|
||||
}
|
||||
return false;
|
||||
@@ -177,8 +177,8 @@ inline bool GfxCoreHelperHw<GfxFamily>::platformSupportsImplicitScaling(const NE
|
||||
template <typename GfxFamily>
|
||||
inline bool GfxCoreHelperHw<GfxFamily>::preferInternalBcsEngine() const {
|
||||
auto preferInternalBcsEngine = true;
|
||||
if (DebugManager.flags.PreferInternalBcsEngine.get() != -1) {
|
||||
preferInternalBcsEngine = static_cast<bool>(DebugManager.flags.PreferInternalBcsEngine.get());
|
||||
if (debugManager.flags.PreferInternalBcsEngine.get() != -1) {
|
||||
preferInternalBcsEngine = static_cast<bool>(debugManager.flags.PreferInternalBcsEngine.get());
|
||||
}
|
||||
|
||||
return preferInternalBcsEngine;
|
||||
|
||||
@@ -124,8 +124,8 @@ bool parseHwInfoConfigString(const std::string &hwInfoConfigStr, uint64_t &hwInf
|
||||
}
|
||||
|
||||
aub_stream::EngineType getChosenEngineType(const HardwareInfo &hwInfo) {
|
||||
return DebugManager.flags.NodeOrdinal.get() == -1
|
||||
return debugManager.flags.NodeOrdinal.get() == -1
|
||||
? hwInfo.capabilityTable.defaultEngineType
|
||||
: static_cast<aub_stream::EngineType>(DebugManager.flags.NodeOrdinal.get());
|
||||
: static_cast<aub_stream::EngineType>(debugManager.flags.NodeOrdinal.get());
|
||||
}
|
||||
} // namespace NEO
|
||||
|
||||
@@ -21,8 +21,8 @@ namespace NEO {
|
||||
uint32_t KernelHelper::getMaxWorkGroupCount(uint32_t simd, uint32_t availableThreadCount, uint32_t dssCount, uint32_t availableSlmSize,
|
||||
uint32_t usedSlmSize, uint32_t maxBarrierCount, uint32_t numberOfBarriers, uint32_t workDim,
|
||||
const size_t *localWorkSize) {
|
||||
if (DebugManager.flags.OverrideMaxWorkGroupCount.get() != -1) {
|
||||
return static_cast<uint32_t>(DebugManager.flags.OverrideMaxWorkGroupCount.get());
|
||||
if (debugManager.flags.OverrideMaxWorkGroupCount.get() != -1) {
|
||||
return static_cast<uint32_t>(debugManager.flags.OverrideMaxWorkGroupCount.get());
|
||||
}
|
||||
|
||||
UNRECOVERABLE_IF((workDim == 0) || (workDim > 3));
|
||||
@@ -61,18 +61,18 @@ KernelHelper::ErrorCode KernelHelper::checkIfThereIsSpaceForScratchOrPrivate(Ker
|
||||
auto totalScratchSize = KernelHelper::getScratchSize(attributes.perThreadScratchSize[0], computeUnitsForScratch);
|
||||
auto totalPrivateScratchSize = KernelHelper::getPrivateScratchSize(attributes.perThreadScratchSize[1], computeUnitsForScratch);
|
||||
|
||||
PRINT_DEBUG_STRING(DebugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
PRINT_DEBUG_STRING(debugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
"computeUnits for each thread: %u\n", computeUnitsForScratch);
|
||||
|
||||
PRINT_DEBUG_STRING(DebugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
PRINT_DEBUG_STRING(debugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
"perHwThreadPrivateMemorySize: %u\t totalPrivateMemorySize: %lu\n",
|
||||
attributes.perHwThreadPrivateMemorySize, totalPrivateMemorySize);
|
||||
|
||||
PRINT_DEBUG_STRING(DebugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
PRINT_DEBUG_STRING(debugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
"perHwThreadScratchSize: %u\t totalScratchSize: %lu\n",
|
||||
attributes.perThreadScratchSize[0], totalScratchSize);
|
||||
|
||||
PRINT_DEBUG_STRING(DebugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
PRINT_DEBUG_STRING(debugManager.flags.PrintDebugMessages.get(), stderr,
|
||||
"perHwThreadPrivateScratchSize: %u\t totalPrivateScratchSize: %lu\n",
|
||||
attributes.perThreadScratchSize[1], totalPrivateScratchSize);
|
||||
|
||||
|
||||
@@ -35,7 +35,7 @@ WaitParams KmdNotifyHelper::obtainTimeoutParams(bool quickKmdSleepRequest,
|
||||
return WaitParams{};
|
||||
}
|
||||
|
||||
if (DebugManager.flags.PowerSavingMode.get() || throttle == QueueThrottle::LOW) {
|
||||
if (debugManager.flags.PowerSavingMode.get() || throttle == QueueThrottle::LOW) {
|
||||
return WaitParams{false, true, 1};
|
||||
}
|
||||
|
||||
|
||||
@@ -363,7 +363,7 @@ void computeWorkgroupSizeND(WorkSizeInfo &wsInfo, size_t workGroupSize[3], const
|
||||
|
||||
// Find biggest power of two which devide each dimension size
|
||||
if (wsInfo.slmTotalSize == 0 && !wsInfo.hasBarriers) {
|
||||
if (DebugManager.flags.EnableComputeWorkSizeSquared.get() && workDim == 2 && !wsInfo.imgUsed) {
|
||||
if (debugManager.flags.EnableComputeWorkSizeSquared.get() && workDim == 2 && !wsInfo.imgUsed) {
|
||||
return computeWorkgroupSizeSquared(wsInfo.maxWorkGroupSize, workGroupSize, workItems, wsInfo.simdSize, workDim);
|
||||
}
|
||||
|
||||
|
||||
@@ -54,7 +54,7 @@ GraphicsAllocation::UsmInitialPlacement MemoryPropertiesHelper::getUSMInitialPla
|
||||
if (memoryProperties.allocFlags.usmInitialPlacementCpu) {
|
||||
initialPlacement = GraphicsAllocation::UsmInitialPlacement::CPU;
|
||||
}
|
||||
if (const int32_t debugFlag = DebugManager.flags.UsmInitialPlacement.get(); debugFlag != -1) {
|
||||
if (const int32_t debugFlag = debugManager.flags.UsmInitialPlacement.get(); debugFlag != -1) {
|
||||
initialPlacement = debugFlag != 1 ? GraphicsAllocation::UsmInitialPlacement::CPU : GraphicsAllocation::UsmInitialPlacement::GPU;
|
||||
}
|
||||
return initialPlacement;
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
/*
|
||||
* Copyright (C) 2020-2022 Intel Corporation
|
||||
* Copyright (C) 2020-2023 Intel Corporation
|
||||
*
|
||||
* SPDX-License-Identifier: MIT
|
||||
*
|
||||
@@ -35,7 +35,7 @@ inline bool pauseModeAllowed(int32_t debugFlagValue, TaskCountType taskCount, Pa
|
||||
return false;
|
||||
}
|
||||
|
||||
if ((DebugManager.flags.PauseOnGpuMode.get() != PauseMode::BeforeAndAfterWorkload) && (DebugManager.flags.PauseOnGpuMode.get() != pauseMode)) {
|
||||
if ((debugManager.flags.PauseOnGpuMode.get() != PauseMode::BeforeAndAfterWorkload) && (debugManager.flags.PauseOnGpuMode.get() != pauseMode)) {
|
||||
// mode not allowed
|
||||
return false;
|
||||
}
|
||||
|
||||
@@ -31,8 +31,8 @@ void PreambleHelper<GfxFamily>::programGenSpecificPreambleWorkArounds(LinearStre
|
||||
|
||||
template <typename GfxFamily>
|
||||
void PreambleHelper<GfxFamily>::programSemaphoreDelay(LinearStream *pCommandStream) {
|
||||
if (DebugManager.flags.ForceSemaphoreDelayBetweenWaits.get() > -1) {
|
||||
uint32_t valueOfNewSemaphoreDelay = DebugManager.flags.ForceSemaphoreDelayBetweenWaits.get();
|
||||
if (debugManager.flags.ForceSemaphoreDelayBetweenWaits.get() > -1) {
|
||||
uint32_t valueOfNewSemaphoreDelay = debugManager.flags.ForceSemaphoreDelayBetweenWaits.get();
|
||||
LriHelper<GfxFamily>::program(pCommandStream,
|
||||
SEMA_WAIT_POLL,
|
||||
valueOfNewSemaphoreDelay,
|
||||
|
||||
@@ -32,7 +32,7 @@ void PreambleHelper<Family>::programPipelineSelect(LinearStream *pCommandStream,
|
||||
MemorySynchronizationCommands<Family>::addSingleBarrier(*pCommandStream, args);
|
||||
}
|
||||
|
||||
if (DebugManager.flags.CleanStateInPreamble.get()) {
|
||||
if (debugManager.flags.CleanStateInPreamble.get()) {
|
||||
auto cmdBuffer = pCommandStream->getSpaceForCmd<PIPELINE_SELECT>();
|
||||
cmd.setPipelineSelection(PIPELINE_SELECT::PIPELINE_SELECTION_3D);
|
||||
*cmdBuffer = cmd;
|
||||
@@ -54,7 +54,7 @@ void PreambleHelper<Family>::programPipelineSelect(LinearStream *pCommandStream,
|
||||
|
||||
bool systolicSupport = pipelineSelectArgs.systolicPipelineSelectSupport;
|
||||
bool systolicValue = pipelineSelectArgs.systolicPipelineSelectMode;
|
||||
int32_t overrideSystolic = DebugManager.flags.OverrideSystolicPipelineSelect.get();
|
||||
int32_t overrideSystolic = debugManager.flags.OverrideSystolicPipelineSelect.get();
|
||||
|
||||
if (overrideSystolic != -1) {
|
||||
systolicSupport = true;
|
||||
@@ -70,7 +70,7 @@ void PreambleHelper<Family>::programPipelineSelect(LinearStream *pCommandStream,
|
||||
|
||||
*cmdBuffer = cmd;
|
||||
|
||||
if (DebugManager.flags.CleanStateInPreamble.get()) {
|
||||
if (debugManager.flags.CleanStateInPreamble.get()) {
|
||||
PipeControlArgs args = {};
|
||||
args.stateCacheInvalidationEnable = true;
|
||||
MemorySynchronizationCommands<Family>::addSingleBarrier(*pCommandStream, args);
|
||||
@@ -85,7 +85,7 @@ size_t PreambleHelper<Family>::getCmdSizeForPipelineSelect(const RootDeviceEnvir
|
||||
if (MemorySynchronizationCommands<Family>::isBarrierPriorToPipelineSelectWaRequired(rootDeviceEnvironment)) {
|
||||
size += MemorySynchronizationCommands<Family>::getSizeForSingleBarrier(false);
|
||||
}
|
||||
if (DebugManager.flags.CleanStateInPreamble.get()) {
|
||||
if (debugManager.flags.CleanStateInPreamble.get()) {
|
||||
size += sizeof(PIPELINE_SELECT);
|
||||
size += 2 * MemorySynchronizationCommands<Family>::getSizeForSingleBarrier(false);
|
||||
}
|
||||
|
||||
@@ -55,14 +55,14 @@ void PreambleHelper<GfxFamily>::programVfeState(void *pVfeState,
|
||||
cmd.setMaximumNumberOfThreads(maxFrontEndThreads);
|
||||
appendProgramVFEState(rootDeviceEnvironment, streamProperties, &cmd);
|
||||
|
||||
if (DebugManager.flags.CFEMaximumNumberOfThreads.get() != -1) {
|
||||
cmd.setMaximumNumberOfThreads(DebugManager.flags.CFEMaximumNumberOfThreads.get());
|
||||
if (debugManager.flags.CFEMaximumNumberOfThreads.get() != -1) {
|
||||
cmd.setMaximumNumberOfThreads(debugManager.flags.CFEMaximumNumberOfThreads.get());
|
||||
}
|
||||
if (DebugManager.flags.CFEOverDispatchControl.get() != -1) {
|
||||
cmd.setOverDispatchControl(static_cast<typename CFE_STATE::OVER_DISPATCH_CONTROL>(DebugManager.flags.CFEOverDispatchControl.get()));
|
||||
if (debugManager.flags.CFEOverDispatchControl.get() != -1) {
|
||||
cmd.setOverDispatchControl(static_cast<typename CFE_STATE::OVER_DISPATCH_CONTROL>(debugManager.flags.CFEOverDispatchControl.get()));
|
||||
}
|
||||
if (DebugManager.flags.CFELargeGRFThreadAdjustDisable.get() != -1) {
|
||||
cmd.setLargeGRFThreadAdjustDisable(DebugManager.flags.CFELargeGRFThreadAdjustDisable.get());
|
||||
if (debugManager.flags.CFELargeGRFThreadAdjustDisable.get() != -1) {
|
||||
cmd.setLargeGRFThreadAdjustDisable(debugManager.flags.CFELargeGRFThreadAdjustDisable.get());
|
||||
}
|
||||
|
||||
*cfeState = cmd;
|
||||
|
||||
@@ -101,7 +101,7 @@ void StateBaseAddressHelper<GfxFamily>::programStateBaseAddress(
|
||||
args.stateBaseAddressCmd->setInstructionBufferSize(MemoryConstants::sizeOf4GBinPageEntities);
|
||||
|
||||
auto &productHelper = args.gmmHelper->getRootDeviceEnvironment().template getHelper<ProductHelper>();
|
||||
auto resourceUsage = CacheSettingsHelper::getGmmUsageType(AllocationType::INTERNAL_HEAP, DebugManager.flags.DisableCachingForHeaps.get(), productHelper);
|
||||
auto resourceUsage = CacheSettingsHelper::getGmmUsageType(AllocationType::INTERNAL_HEAP, debugManager.flags.DisableCachingForHeaps.get(), productHelper);
|
||||
|
||||
args.stateBaseAddressCmd->setInstructionMemoryObjectControlState(args.gmmHelper->getMOCS(resourceUsage));
|
||||
}
|
||||
@@ -119,8 +119,8 @@ void StateBaseAddressHelper<GfxFamily>::programStateBaseAddress(
|
||||
args.stateBaseAddressCmd->setSurfaceStateBaseAddress(args.surfaceStateBaseAddress);
|
||||
}
|
||||
|
||||
if (DebugManager.flags.OverrideStatelessMocsIndex.get() != -1) {
|
||||
args.statelessMocsIndex = DebugManager.flags.OverrideStatelessMocsIndex.get();
|
||||
if (debugManager.flags.OverrideStatelessMocsIndex.get() != -1) {
|
||||
args.statelessMocsIndex = debugManager.flags.OverrideStatelessMocsIndex.get();
|
||||
}
|
||||
|
||||
args.statelessMocsIndex = args.statelessMocsIndex << 1;
|
||||
|
||||
@@ -65,7 +65,7 @@ void StateBaseAddressHelper<GfxFamily>::appendStateBaseAddressParameters(
|
||||
|
||||
auto &productHelper = args.gmmHelper->getRootDeviceEnvironment().template getHelper<ProductHelper>();
|
||||
|
||||
auto heapResourceUsage = CacheSettingsHelper::getGmmUsageType(AllocationType::INTERNAL_HEAP, DebugManager.flags.DisableCachingForHeaps.get(), productHelper);
|
||||
auto heapResourceUsage = CacheSettingsHelper::getGmmUsageType(AllocationType::INTERNAL_HEAP, debugManager.flags.DisableCachingForHeaps.get(), productHelper);
|
||||
auto heapMocsValue = args.gmmHelper->getMOCS(heapResourceUsage);
|
||||
|
||||
args.stateBaseAddressCmd->setSurfaceStateMemoryObjectControlState(heapMocsValue);
|
||||
@@ -75,19 +75,19 @@ void StateBaseAddressHelper<GfxFamily>::appendStateBaseAddressParameters(
|
||||
args.stateBaseAddressCmd->setBindlessSamplerStateMemoryObjectControlState(heapMocsValue);
|
||||
|
||||
bool enableMultiGpuAtomics = args.isMultiOsContextCapable;
|
||||
if (DebugManager.flags.EnableMultiGpuAtomicsOptimization.get()) {
|
||||
if (debugManager.flags.EnableMultiGpuAtomicsOptimization.get()) {
|
||||
enableMultiGpuAtomics = args.useGlobalAtomics && (args.isMultiOsContextCapable || args.areMultipleSubDevicesInContext);
|
||||
}
|
||||
args.stateBaseAddressCmd->setDisableSupportForMultiGpuAtomicsForStatelessAccesses(!enableMultiGpuAtomics);
|
||||
|
||||
args.stateBaseAddressCmd->setDisableSupportForMultiGpuPartialWritesForStatelessMessages(!args.isMultiOsContextCapable);
|
||||
|
||||
if (DebugManager.flags.ForceMultiGpuAtomics.get() != -1) {
|
||||
args.stateBaseAddressCmd->setDisableSupportForMultiGpuAtomicsForStatelessAccesses(!!DebugManager.flags.ForceMultiGpuAtomics.get());
|
||||
if (debugManager.flags.ForceMultiGpuAtomics.get() != -1) {
|
||||
args.stateBaseAddressCmd->setDisableSupportForMultiGpuAtomicsForStatelessAccesses(!!debugManager.flags.ForceMultiGpuAtomics.get());
|
||||
}
|
||||
|
||||
if (DebugManager.flags.ForceMultiGpuPartialWrites.get() != -1) {
|
||||
args.stateBaseAddressCmd->setDisableSupportForMultiGpuPartialWritesForStatelessMessages(!!DebugManager.flags.ForceMultiGpuPartialWrites.get());
|
||||
if (debugManager.flags.ForceMultiGpuPartialWrites.get() != -1) {
|
||||
args.stateBaseAddressCmd->setDisableSupportForMultiGpuPartialWritesForStatelessMessages(!!debugManager.flags.ForceMultiGpuPartialWrites.get());
|
||||
}
|
||||
|
||||
if (args.memoryCompressionState != MemoryCompressionState::NotApplicable) {
|
||||
@@ -95,7 +95,7 @@ void StateBaseAddressHelper<GfxFamily>::appendStateBaseAddressParameters(
|
||||
}
|
||||
|
||||
bool l3MocsEnabled = (args.stateBaseAddressCmd->getStatelessDataPortAccessMemoryObjectControlState() >> 1) == (args.gmmHelper->getMOCS(GMM_RESOURCE_USAGE_OCL_BUFFER) >> 1);
|
||||
bool constMocsAllowed = (l3MocsEnabled && (DebugManager.flags.ForceL1Caching.get() != 0));
|
||||
bool constMocsAllowed = (l3MocsEnabled && (debugManager.flags.ForceL1Caching.get() != 0));
|
||||
|
||||
if (constMocsAllowed) {
|
||||
auto constMocsIndex = args.gmmHelper->getMOCS(GMM_RESOURCE_USAGE_OCL_BUFFER_CONST);
|
||||
@@ -116,7 +116,7 @@ void StateBaseAddressHelper<GfxFamily>::programBindingTableBaseAddress(LinearStr
|
||||
cmd.setBindingTablePoolBaseAddress(baseAddress);
|
||||
cmd.setBindingTablePoolBufferSize(sizeInPages);
|
||||
cmd.setSurfaceObjectControlStateIndexToMocsTables(gmmHelper->getMOCS(GMM_RESOURCE_USAGE_OCL_STATE_HEAP_BUFFER));
|
||||
if (DebugManager.flags.DisableCachingForHeaps.get()) {
|
||||
if (debugManager.flags.DisableCachingForHeaps.get()) {
|
||||
cmd.setSurfaceObjectControlStateIndexToMocsTables(gmmHelper->getMOCS(GMM_RESOURCE_USAGE_OCL_SYSTEM_MEMORY_BUFFER_CACHELINE_MISALIGNED));
|
||||
}
|
||||
|
||||
@@ -133,9 +133,9 @@ void StateBaseAddressHelper<GfxFamily>::appendExtraCacheSettings(StateBaseAddres
|
||||
auto cachePolicy = args.isDebuggerActive ? args.l1CachePolicyDebuggerActive : args.l1CachePolicy;
|
||||
args.stateBaseAddressCmd->setL1CachePolicyL1CacheControl(static_cast<typename STATE_BASE_ADDRESS::L1_CACHE_POLICY>(cachePolicy));
|
||||
|
||||
if (DebugManager.flags.ForceStatelessL1CachingPolicy.get() != -1 &&
|
||||
DebugManager.flags.ForceAllResourcesUncached.get() == false) {
|
||||
args.stateBaseAddressCmd->setL1CachePolicyL1CacheControl(static_cast<typename STATE_BASE_ADDRESS::L1_CACHE_POLICY>(DebugManager.flags.ForceStatelessL1CachingPolicy.get()));
|
||||
if (debugManager.flags.ForceStatelessL1CachingPolicy.get() != -1 &&
|
||||
debugManager.flags.ForceAllResourcesUncached.get() == false) {
|
||||
args.stateBaseAddressCmd->setL1CachePolicyL1CacheControl(static_cast<typename STATE_BASE_ADDRESS::L1_CACHE_POLICY>(debugManager.flags.ForceStatelessL1CachingPolicy.get()));
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
@@ -96,7 +96,7 @@ struct TimestampPacketHelper {
|
||||
static void programSemaphore(LinearStream &cmdStream, TagNodeBase &timestampPacketNode) {
|
||||
using COMPARE_OPERATION = typename GfxFamily::MI_SEMAPHORE_WAIT::COMPARE_OPERATION;
|
||||
|
||||
if (DebugManager.flags.PrintTimestampPacketUsage.get() == 1) {
|
||||
if (debugManager.flags.PrintTimestampPacketUsage.get() == 1) {
|
||||
printf("\nPID: %u, TSP used for Semaphore: 0x%" PRIX64 ", cmdBuffer pos: 0x%" PRIX64, SysCalls::getProcessId(), timestampPacketNode.getGpuAddress(), cmdStream.getCurrentGpuAddressPosition());
|
||||
}
|
||||
|
||||
|
||||
@@ -18,7 +18,7 @@ template <typename GfxFamily>
|
||||
long __stdcall DeviceCallbacks<GfxFamily>::notifyAubCapture(void *csrHandle, uint64_t gfxAddress, size_t gfxSize, bool allocate) {
|
||||
auto csr = reinterpret_cast<CommandStreamReceiverHw<GfxFamily> *>(csrHandle);
|
||||
|
||||
if (DebugManager.flags.SetCommandStreamReceiver.get() == CSR_HW_WITH_AUB) {
|
||||
if (debugManager.flags.SetCommandStreamReceiver.get() == CSR_HW_WITH_AUB) {
|
||||
auto csrWithAub = static_cast<CommandStreamReceiverWithAUBDump<WddmCommandStreamReceiver<GfxFamily>> *>(csr);
|
||||
auto aubCsr = static_cast<AUBCommandStreamReceiverHw<GfxFamily> *>(csrWithAub->aubCSR.get());
|
||||
if (allocate) {
|
||||
|
||||
Reference in New Issue
Block a user