mirror of
https://github.com/intel/compute-runtime.git
synced 2025-09-15 13:01:45 +08:00

Previously we used an array-of-pointers approach, but using an array-of-structures is in some ways simpler. We also split out the RTStack as a separate allocation. Related-To: LOCI-2966 Signed-off-by: Jim Snow <jim.m.snow@intel.com>
60 lines
2.1 KiB
C++
60 lines
2.1 KiB
C++
/*
|
|
* Copyright (C) 2018-2022 Intel Corporation
|
|
*
|
|
* SPDX-License-Identifier: MIT
|
|
*
|
|
*/
|
|
|
|
#pragma once
|
|
|
|
#include "shared/source/device/device.h"
|
|
#include "shared/source/helpers/aligned_memory.h"
|
|
#include "shared/source/helpers/basic_math.h"
|
|
#include "shared/source/helpers/non_copyable_or_moveable.h"
|
|
|
|
#include "ocl_igc_shared/raytracing/ocl_raytracing_structures.h"
|
|
|
|
#include <cstdint>
|
|
namespace NEO {
|
|
class RayTracingHelper : public NonCopyableOrMovableClass {
|
|
public:
|
|
static constexpr uint32_t stackDssMultiplier = 2048;
|
|
static constexpr uint32_t hitInfoSize = 64;
|
|
static constexpr uint32_t bvhStackSize = 96;
|
|
static constexpr uint32_t memoryBackedFifoSizePerDss = 8 * KB;
|
|
static constexpr uint32_t maxBvhLevels = 8;
|
|
|
|
static size_t getDispatchGlobalSize() {
|
|
return static_cast<size_t>(alignUp(sizeof(RTDispatchGlobals), MemoryConstants::cacheLineSize));
|
|
}
|
|
|
|
static size_t getRTStackSizePerTile(const Device &device, uint32_t tiles, uint32_t maxBvhLevel, uint32_t extraBytesLocal, uint32_t extraBytesGlobal) {
|
|
return static_cast<size_t>(getStackSizePerRay(maxBvhLevel, extraBytesLocal) * (getNumRtStacks(device) / tiles) + extraBytesGlobal);
|
|
}
|
|
|
|
static size_t getTotalMemoryBackedFifoSize(const Device &device) {
|
|
return static_cast<size_t>(getNumDss(device)) * memoryBackedFifoSizePerDss;
|
|
}
|
|
|
|
static size_t getMemoryBackedFifoSizeToPatch() {
|
|
return static_cast<size_t>(Math::log2(memoryBackedFifoSizePerDss / KB) - 1);
|
|
}
|
|
|
|
static uint32_t getNumRtStacks(const Device &device) {
|
|
return device.getHardwareInfo().gtSystemInfo.MaxDualSubSlicesSupported * stackDssMultiplier;
|
|
}
|
|
|
|
static uint32_t getNumRtStacksPerDss(const Device &device) {
|
|
return stackDssMultiplier;
|
|
}
|
|
|
|
static uint32_t getNumDss(const Device &device) {
|
|
return device.getHardwareInfo().gtSystemInfo.MaxDualSubSlicesSupported;
|
|
}
|
|
|
|
static uint32_t getStackSizePerRay(uint32_t maxBvhLevel, uint32_t extraBytesLocal) {
|
|
return hitInfoSize + bvhStackSize * maxBvhLevel + extraBytesLocal;
|
|
}
|
|
};
|
|
} // namespace NEO
|