mirror of
https://github.com/intel/compute-runtime.git
synced 2025-12-21 09:14:47 +08:00
fix: always use GRF count in calculateNumThreadsPerThreadGroup
GRF size != GRF count.
Related-To: GSD-8437
Signed-off-by: Katarzyna Cencelewska <katarzyna.cencelewska@intel.com>
This commit is contained in:
committed by
Compute-Runtime-Automation
parent
df54d67f40
commit
da7b03dd15
@@ -21,6 +21,7 @@ struct PerThreadDataHelper {
|
||||
static inline size_t getPerThreadDataSizeTotal(
|
||||
uint32_t simd,
|
||||
uint32_t grfSize,
|
||||
+ uint32_t grfCount,
|
||||
uint32_t numChannels,
|
||||
size_t localWorkSize,
|
||||
bool isHwLocalIdGeneration,
|
||||
@@ -30,7 +31,7 @@ struct PerThreadDataHelper {
|
||||
return perThreadSizeLocalIDs * localWorkSize;
|
||||
}
|
||||
auto &gfxCoreHelper = rootDeviceEnvironment.getHelper<NEO::GfxCoreHelper>();
|
||||
- return perThreadSizeLocalIDs * gfxCoreHelper.calculateNumThreadsPerThreadGroup(simd, static_cast<uint32_t>(localWorkSize), grfSize, isHwLocalIdGeneration, rootDeviceEnvironment);
|
||||
+ return perThreadSizeLocalIDs * gfxCoreHelper.calculateNumThreadsPerThreadGroup(simd, static_cast<uint32_t>(localWorkSize), grfCount, isHwLocalIdGeneration, rootDeviceEnvironment);
|
||||
}
|
||||
}; // namespace PerThreadDataHelper
|
||||
} // namespace NEO
|
||||
|
||||
Reference in New Issue
Block a user