Files
compute-runtime/level_zero/core/source/device/device.cpp
Mateusz Jablonski 7660b29bbb fix: reduce types for tagSize and tagCount within TagAllocator
Related-To: NEO-16444

Signed-off-by: Mateusz Jablonski <mateusz.jablonski@intel.com>
2025-11-17 10:47:51 +01:00

127 lines
5.3 KiB
C++

/*
* Copyright (C) 2023-2025 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
*/
#include "level_zero/core/source/device/device.h"
#include "shared/source/device/device.h"
#include "shared/source/helpers/aligned_memory.h"
#include "shared/source/helpers/fill_pattern_tag_node.h"
#include "shared/source/helpers/gfx_core_helper.h"
#include "shared/source/helpers/in_order_cmd_helpers.h"
#include "level_zero/core/source/gfx_core_helpers/l0_gfx_core_helper.h"
namespace L0 {
uint32_t Device::getRootDeviceIndex() const {
return neoDevice->getRootDeviceIndex();
}
NEO::DebuggerL0 *Device::getL0Debugger() {
return getNEODevice()->getL0Debugger();
}
template <typename NodeT>
NEO::TagAllocatorBase *getInOrderCounterAllocator(std::unique_ptr<NEO::TagAllocatorBase> &allocator, std::mutex &inOrderAllocatorMutex, NEO::Device &neoDevice, uint32_t immediateWritePostSyncOffset) {
if (!allocator.get()) {
std::unique_lock<std::mutex> lock(inOrderAllocatorMutex);
if (!allocator.get()) {
RootDeviceIndicesContainer rootDeviceIndices = {neoDevice.getRootDeviceIndex()};
const size_t maxPartitionCount = neoDevice.getDeviceBitfield().count();
const size_t nodeSize = immediateWritePostSyncOffset * maxPartitionCount * 2; // Multiplied by 2 to handle 32b overflow
DEBUG_BREAK_IF(alignUp(nodeSize, MemoryConstants::cacheLineSize) * NodeT::defaultAllocatorTagCount > MemoryConstants::pageSize64k);
allocator = std::make_unique<NEO::TagAllocator<NodeT>>(rootDeviceIndices, neoDevice.getMemoryManager(), NodeT::defaultAllocatorTagCount,
MemoryConstants::cacheLineSize, nodeSize, 0, false, false, neoDevice.getDeviceBitfield());
}
}
return allocator.get();
}
NEO::TagAllocatorBase *Device::getDeviceInOrderCounterAllocator() {
return getInOrderCounterAllocator<NEO::DeviceAllocNodeType<true>>(deviceInOrderCounterAllocator, inOrderAllocatorMutex, *getNEODevice(), getL0GfxCoreHelper().getImmediateWritePostSyncOffset());
}
NEO::TagAllocatorBase *Device::getHostInOrderCounterAllocator() {
return getInOrderCounterAllocator<NEO::DeviceAllocNodeType<false>>(hostInOrderCounterAllocator, inOrderAllocatorMutex, *getNEODevice(), getL0GfxCoreHelper().getImmediateWritePostSyncOffset());
}
NEO::TagAllocatorBase *Device::getInOrderTimestampAllocator() {
if (!inOrderTimestampAllocator.get()) {
std::unique_lock<std::mutex> lock(inOrderAllocatorMutex);
if (!inOrderTimestampAllocator.get()) {
RootDeviceIndicesContainer rootDeviceIndices = {getNEODevice()->getRootDeviceIndex()};
size_t packetsCountPerElement = getEventMaxPacketCount();
size_t alignment = getGfxCoreHelper().getTimestampPacketAllocatorAlignment();
inOrderTimestampAllocator = getL0GfxCoreHelper().getInOrderTimestampAllocator(rootDeviceIndices, getNEODevice()->getMemoryManager(), 64, packetsCountPerElement, alignment, getNEODevice()->getDeviceBitfield());
}
}
return inOrderTimestampAllocator.get();
}
NEO::TagAllocatorBase *Device::getFillPatternAllocator() {
if (!this->fillPatternAllocator.get()) {
static std::mutex mtx;
std::unique_lock<std::mutex> lock(mtx);
if (!this->fillPatternAllocator.get()) {
RootDeviceIndicesContainer rootDeviceIndices = {getNEODevice()->getRootDeviceIndex()};
fillPatternAllocator = std::make_unique<NEO::TagAllocator<NEO::FillPaternNodeType>>(rootDeviceIndices, getNEODevice()->getMemoryManager(), static_cast<uint32_t>(MemoryConstants::pageSize2M / MemoryConstants::cacheLineSize),
MemoryConstants::cacheLineSize, MemoryConstants::cacheLineSize, 0, false, false, getNEODevice()->getDeviceBitfield());
}
}
return this->fillPatternAllocator.get();
}
uint32_t Device::getNextSyncDispatchQueueId() {
auto newValue = syncDispatchQueueIdAllocator.fetch_add(1);
UNRECOVERABLE_IF(newValue == (std::numeric_limits<uint32_t>::max() - 1));
ensureSyncDispatchTokenAllocation();
return newValue;
}
void Device::ensureSyncDispatchTokenAllocation() {
if (!syncDispatchTokenAllocation) {
std::unique_lock<std::mutex> lock(syncDispatchTokenMutex);
if (!syncDispatchTokenAllocation) {
const NEO::AllocationProperties allocationProperties(getRootDeviceIndex(), true, MemoryConstants::pageSize,
NEO::AllocationType::syncDispatchToken,
true, false, getNEODevice()->getDeviceBitfield());
syncDispatchTokenAllocation = getNEODevice()->getMemoryManager()->allocateGraphicsMemoryWithProperties(allocationProperties);
UNRECOVERABLE_IF(syncDispatchTokenAllocation == nullptr);
memset(syncDispatchTokenAllocation->getUnderlyingBuffer(), 0, syncDispatchTokenAllocation->getUnderlyingBufferSize());
}
}
}
ze_result_t Device::getPriorityLevels(int32_t *lowestPriority, int32_t *highestPriority) {
*highestPriority = queuePriorityHigh;
*lowestPriority = queuePriorityLow;
return ZE_RESULT_SUCCESS;
}
} // namespace L0