75 lines
2.9 KiB
C++
75 lines
2.9 KiB
C++
/*
 * Copyright (C) 2018-2024 Intel Corporation
 *
 * SPDX-License-Identifier: MIT
 *
 */
|
|
|
|
#pragma once
|
|
|
|
#include "shared/source/device/device.h"
#include "shared/source/helpers/aligned_memory.h"
#include "shared/source/helpers/basic_math.h"
#include "shared/source/helpers/gfx_core_helper.h"
#include "shared/source/helpers/hw_info.h"
#include "shared/source/helpers/non_copyable_or_moveable.h"
#include "shared/source/release_helper/release_helper.h"

#include "ocl_igc_shared/raytracing/ocl_raytracing_structures.h"

#include <algorithm>
#include <cstddef>
#include <cstdint>
|
|
|
|
namespace NEO {
|
|
class RayTracingHelper : public NonCopyableOrMovableClass {
|
|
public:
|
|
static constexpr uint32_t hitInfoSize = 64;
|
|
static constexpr uint32_t bvhStackSize = 96;
|
|
static constexpr uint32_t memoryBackedFifoSizePerDss = 8 * MemoryConstants::kiloByte;
|
|
static constexpr uint32_t maxBvhLevels = 8;
|
|
|
|
static constexpr uint32_t maxSizeOfRtStacksPerDss = 4096;
|
|
static constexpr uint32_t fixedSizeOfRtStacksPerDss = 2048;
|
|
|
|
static size_t getDispatchGlobalSize() {
|
|
return static_cast<size_t>(alignUp(sizeof(RTDispatchGlobals), MemoryConstants::cacheLineSize));
|
|
}
|
|
|
|
static size_t getRTStackSizePerTile(const Device &device, uint32_t tiles, uint32_t maxBvhLevel, uint32_t extraBytesLocal, uint32_t extraBytesGlobal) {
|
|
return static_cast<size_t>(alignUp(getStackSizePerRay(maxBvhLevel, extraBytesLocal) * (getNumRtStacks(device)) + extraBytesGlobal, MemoryConstants::cacheLineSize));
|
|
}
|
|
|
|
static size_t getTotalMemoryBackedFifoSize(const Device &device) {
|
|
return static_cast<size_t>(NEO::GfxCoreHelper::getHighestEnabledDualSubSlice(device.getHardwareInfo())) * memoryBackedFifoSizePerDss;
|
|
}
|
|
|
|
static size_t getMemoryBackedFifoSizeToPatch() {
|
|
return static_cast<size_t>(Math::log2(memoryBackedFifoSizePerDss / MemoryConstants::kiloByte) - 1);
|
|
}
|
|
|
|
static uint32_t getNumRtStacks(const Device &device) {
|
|
return NEO::GfxCoreHelper::getHighestEnabledDualSubSlice(device.getHardwareInfo()) * getNumRtStacksPerDss(device);
|
|
}
|
|
|
|
static uint32_t getNumRtStacksPerDss(const Device &device) {
|
|
auto releaseHelper = device.getReleaseHelper();
|
|
|
|
if (releaseHelper == nullptr || releaseHelper->isNumRtStacksPerDssFixedValue()) {
|
|
return fixedSizeOfRtStacksPerDss;
|
|
}
|
|
|
|
const auto &hwInfo = device.getHardwareInfo();
|
|
UNRECOVERABLE_IF(hwInfo.gtSystemInfo.EUCount == 0)
|
|
|
|
uint32_t maxNumEUsPerDSS = hwInfo.gtSystemInfo.MaxEuPerSubSlice;
|
|
uint32_t maxNumThreadsPerEU = hwInfo.gtSystemInfo.ThreadCount / hwInfo.gtSystemInfo.EUCount;
|
|
uint32_t maxSIMTThreadsPerThread = CommonConstants::maximalSimdSize;
|
|
|
|
return std::min(maxSizeOfRtStacksPerDss, maxNumEUsPerDSS * maxNumThreadsPerEU * maxSIMTThreadsPerThread);
|
|
}
|
|
|
|
static uint32_t getStackSizePerRay(uint32_t maxBvhLevel, uint32_t extraBytesLocal) {
|
|
return hitInfoSize + bvhStackSize * maxBvhLevel + extraBytesLocal;
|
|
}
|
|
};
|
|
} // namespace NEO
|