mirror of
https://github.com/intel/compute-runtime.git
synced 2025-12-24 21:18:24 +08:00
feature(internal): logging kernel dispatch params
Use the debug flag PrintKernelDispatchParameters to print the parameters used by the thread group dispatch size heuristic when encoding a kernel dispatch.
Related-To: NEO-6989
Signed-off-by: Dominik Dabek <dominik.dabek@intel.com>
This commit is contained in:
committed by
Compute-Runtime-Automation
parent
ef6ea0b30c
commit
75c4844987
@@ -328,6 +328,20 @@ void EncodeDispatchKernel<Family>::encode(CommandContainer &container, EncodeDis
|
||||
|
||||
auto threadGroupCount = walkerCmd.getThreadGroupIdXDimension() * walkerCmd.getThreadGroupIdYDimension() * walkerCmd.getThreadGroupIdZDimension();
|
||||
EncodeDispatchKernel<Family>::adjustInterfaceDescriptorData(idd, *args.device, hwInfo, threadGroupCount, kernelDescriptor.kernelAttributes.numGrfRequired, walkerCmd);
|
||||
if (DebugManager.flags.PrintKernelDispatchParameters.get()) {
|
||||
fprintf(stdout, "kernel, %s, numGrf, %d, simdSize, %d, tilesCount, %d, implicitScaling, %s, threadGroupCount, %d, numberOfThreadsInGpgpuThreadGroup, %d, threadGroupDimensions, %d, %d, %d, threadGroupDispatchSize enum, %d\n",
|
||||
kernelDescriptor.kernelMetadata.kernelName.c_str(),
|
||||
kernelDescriptor.kernelAttributes.numGrfRequired,
|
||||
kernelDescriptor.kernelAttributes.simdSize,
|
||||
args.device->getNumSubDevices(),
|
||||
ImplicitScalingHelper::isImplicitScalingEnabled(args.device->getDeviceBitfield(), true) ? "Yes" : "no",
|
||||
threadGroupCount,
|
||||
idd.getNumberOfThreadsInGpgpuThreadGroup(),
|
||||
walkerCmd.getThreadGroupIdXDimension(),
|
||||
walkerCmd.getThreadGroupIdYDimension(),
|
||||
walkerCmd.getThreadGroupIdZDimension(),
|
||||
idd.getThreadGroupDispatchSize());
|
||||
}
|
||||
|
||||
EncodeDispatchKernel<Family>::appendAdditionalIDDFields(&idd, rootDeviceEnvironment, threadsPerThreadGroup,
|
||||
args.dispatchInterface->getSlmTotalSize(),
|
||||
|
||||
Reference in New Issue
Block a user