fix: Align thread group count to dss on all platforms

Related-To: NEO-13263, GSD-10327
Signed-off-by: Maciej Plewka <maciej.plewka@intel.com>
This commit is contained in:
Maciej Plewka
2024-11-18 15:57:22 +00:00
committed by Compute-Runtime-Automation
parent 9b4bb0c9ea
commit 62d8e3e4b0
2 changed files with 26 additions and 2 deletions

View File

@@ -802,6 +802,8 @@ uint32_t GfxCoreHelperHw<GfxFamily>::calculateAvailableThreadCount(const Hardwar
// Clamps threadCount in place so that it does not exceed
// (threadsPerDss / threadGroupSize) * dssCount.
//
// threadCount     - in/out value; lowered to the computed limit when it is larger,
//                   otherwise left untouched.
// dssCount        - multiplier applied to the per-DSS quotient.
// threadsPerDss   - dividend of the per-DSS quotient.
// threadGroupSize - divisor of the per-DSS quotient; must be non-zero, as it is
//                   used directly in an integer division.
template <typename GfxFamily>
void GfxCoreHelperHw<GfxFamily>::alignThreadGroupCountToDssSize(uint32_t &threadCount, uint32_t dssCount, uint32_t threadsPerDss, uint32_t threadGroupSize) const {
    // Integer division: any remainder of threadsPerDss is discarded.
    const uint32_t perDssQuotient = threadsPerDss / threadGroupSize;
    const uint32_t upperLimit = perDssQuotient * dssCount;

    if (upperLimit < threadCount) {
        threadCount = upperLimit;
    }
}
template <typename GfxFamily>