Files
compute-runtime/level_zero/api/driver_experimental/public/zex_event.cpp
Bartosz Dunajski 3717187cbc feature: zexDeviceGetAggregatedCopyOffloadIncrementValue implementation
Related-To: NEO-14557

Signed-off-by: Bartosz Dunajski <bartosz.dunajski@intel.com>
2025-09-25 11:46:02 +02:00

278 lines
11 KiB
C++

/*
* Copyright (C) 2023-2025 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
*/
#include "level_zero/driver_experimental/zex_event.h"
#include "shared/source/helpers/in_order_cmd_helpers.h"
#include "shared/source/memory_manager/graphics_allocation.h"
#include "shared/source/memory_manager/unified_memory_manager.h"
#include "level_zero/core/source/context/context_imp.h"
#include "level_zero/core/source/device/bcs_split.h"
#include "level_zero/core/source/device/device_imp.h"
#include "level_zero/core/source/driver/driver_handle.h"
#include "level_zero/core/source/event/event.h"
#include "level_zero/core/source/gfx_core_helpers/l0_gfx_core_helper.h"
#include "level_zero/core/source/helpers/default_descriptors.h"
#include <numeric>
namespace L0 {
ze_result_t ZE_APICALL
zexEventGetDeviceAddress(ze_event_handle_t event, uint64_t *completionValue, uint64_t *address) {
auto eventObj = Event::fromHandle(toInternalType(event));
if (!eventObj || !completionValue || !address) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
if (eventObj->isCounterBased()) {
if (!eventObj->getInOrderExecInfo()) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
*completionValue = eventObj->getInOrderExecSignalValueWithSubmissionCounter();
*address = eventObj->getInOrderExecInfo()->getBaseDeviceAddress() + eventObj->getInOrderAllocationOffset();
} else if (eventObj->isEventTimestampFlagSet()) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
} else {
*completionValue = Event::State::STATE_SIGNALED;
*address = eventObj->getCompletionFieldGpuAddress(eventObj->peekEventPool()->getDevice());
}
return ZE_RESULT_SUCCESS;
}
ze_result_t ZE_APICALL
zexCounterBasedEventCreate2(ze_context_handle_t hContext, ze_device_handle_t hDevice, const zex_counter_based_event_desc_t *desc, ze_event_handle_t *phEvent) {
constexpr uint32_t supportedBasedFlags = (ZEX_COUNTER_BASED_EVENT_FLAG_IMMEDIATE | ZEX_COUNTER_BASED_EVENT_FLAG_NON_IMMEDIATE);
auto device = Device::fromHandle(toInternalType(hDevice));
auto counterBasedEventDesc = desc ? desc : &defaultIntelCounterBasedEventDesc;
if (!hDevice || !phEvent) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
const bool ipcFlag = !!(counterBasedEventDesc->flags & ZEX_COUNTER_BASED_EVENT_FLAG_IPC);
const bool timestampFlag = !!(counterBasedEventDesc->flags & ZEX_COUNTER_BASED_EVENT_FLAG_KERNEL_TIMESTAMP);
const bool mappedTimestampFlag = !!(counterBasedEventDesc->flags & ZEX_COUNTER_BASED_EVENT_FLAG_KERNEL_MAPPED_TIMESTAMP);
const bool graphExternalEvent = !!(counterBasedEventDesc->flags & ZEX_COUNTER_BASED_EVENT_FLAG_GRAPH_EXTERNAL_EVENT);
uint32_t inputCbFlags = counterBasedEventDesc->flags & supportedBasedFlags;
if (inputCbFlags == 0) {
inputCbFlags = ZEX_COUNTER_BASED_EVENT_FLAG_IMMEDIATE;
}
if (ipcFlag && (timestampFlag || mappedTimestampFlag)) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
auto signalScope = counterBasedEventDesc->signalScope;
if (NEO::debugManager.flags.MitigateHostVisibleSignal.get()) {
signalScope &= ~ZE_EVENT_SCOPE_FLAG_HOST;
}
EventDescriptor eventDescriptor = {
.eventPoolAllocation = nullptr,
.extensions = counterBasedEventDesc->pNext,
.totalEventSize = 0,
.maxKernelCount = EventPacketsCount::maxKernelSplit,
.maxPacketsCount = 1,
.counterBasedFlags = inputCbFlags,
.index = 0,
.signalScope = signalScope,
.waitScope = counterBasedEventDesc->waitScope,
.timestampPool = timestampFlag,
.kernelMappedTsPoolFlag = mappedTimestampFlag,
.importedIpcPool = false,
.ipcPool = ipcFlag,
.graphExternalEvent = graphExternalEvent,
};
ze_result_t result = ZE_RESULT_SUCCESS;
auto l0Event = device->getL0GfxCoreHelper().createStandaloneEvent(eventDescriptor, device, result);
if (signalScope ^ counterBasedEventDesc->signalScope) {
l0Event->setMitigateHostVisibleSignal();
}
*phEvent = l0Event;
return result;
}
ze_result_t ZE_APICALL
zexCounterBasedEventCreate(ze_context_handle_t hContext, ze_device_handle_t hDevice, uint64_t *deviceAddress, uint64_t *hostAddress, uint64_t completionValue, const ze_event_desc_t *desc, ze_event_handle_t *phEvent) {
constexpr uint32_t counterBasedFlags = ZEX_COUNTER_BASED_EVENT_FLAG_IMMEDIATE | ZEX_COUNTER_BASED_EVENT_FLAG_NON_IMMEDIATE;
if (!desc) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
zex_counter_based_event_external_sync_alloc_properties_t externalSyncAllocProperties = {ZEX_STRUCTURE_COUNTER_BASED_EVENT_EXTERNAL_SYNC_ALLOC_PROPERTIES};
externalSyncAllocProperties.completionValue = completionValue;
externalSyncAllocProperties.deviceAddress = deviceAddress;
externalSyncAllocProperties.hostAddress = hostAddress;
zex_counter_based_event_desc_t counterBasedDesc = {ZEX_STRUCTURE_COUNTER_BASED_EVENT_DESC};
counterBasedDesc.flags = counterBasedFlags;
counterBasedDesc.signalScope = desc->signal;
counterBasedDesc.waitScope = desc->wait;
counterBasedDesc.pNext = desc->pNext;
if (deviceAddress && hostAddress) {
externalSyncAllocProperties.pNext = desc->pNext;
counterBasedDesc.pNext = &externalSyncAllocProperties;
}
return L0::zexCounterBasedEventCreate2(hContext, hDevice, &counterBasedDesc, phEvent);
}
ze_result_t ZE_APICALL zexIntelAllocateNetworkInterrupt(ze_context_handle_t hContext, uint32_t &networkInterruptId) {
auto context = static_cast<ContextImp *>(L0::Context::fromHandle(toInternalType(hContext)));
if (!context) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
if (!context->getDriverHandle()->getMemoryManager()->allocateInterrupt(networkInterruptId, context->rootDeviceIndices[0])) {
return ZE_RESULT_ERROR_NOT_AVAILABLE;
}
return ZE_RESULT_SUCCESS;
}
ze_result_t ZE_APICALL zexIntelReleaseNetworkInterrupt(ze_context_handle_t hContext, uint32_t networkInterruptId) {
auto context = static_cast<ContextImp *>(L0::Context::fromHandle(toInternalType(hContext)));
if (!context || !context->getDriverHandle()->getMemoryManager()->releaseInterrupt(networkInterruptId, context->rootDeviceIndices[0])) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
return ZE_RESULT_SUCCESS;
}
ze_result_t ZE_APICALL zexCounterBasedEventGetIpcHandle(ze_event_handle_t hEvent, zex_ipc_counter_based_event_handle_t *phIpc) {
auto event = Event::fromHandle(hEvent);
if (!event || !phIpc || !event->isCounterBasedExplicitlyEnabled()) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
auto ipcData = reinterpret_cast<IpcCounterBasedEventData *>(phIpc->data);
return event->getCounterBasedIpcHandle(*ipcData);
}
ze_result_t ZE_APICALL zexCounterBasedEventOpenIpcHandle(ze_context_handle_t hContext, zex_ipc_counter_based_event_handle_t hIpc, ze_event_handle_t *phEvent) {
auto context = static_cast<ContextImp *>(L0::Context::fromHandle(hContext));
if (!context || !phEvent) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
auto ipcData = reinterpret_cast<IpcCounterBasedEventData *>(hIpc.data);
return context->openCounterBasedIpcHandle(*ipcData, phEvent);
}
ze_result_t ZE_APICALL zexCounterBasedEventCloseIpcHandle(ze_event_handle_t hEvent) {
return Event::fromHandle(hEvent)->destroy();
}
ze_result_t ZE_APICALL zexDeviceGetAggregatedCopyOffloadIncrementValue(ze_device_handle_t hDevice, uint32_t *incrementValue) {
auto device = static_cast<DeviceImp *>(Device::fromHandle(hDevice));
if (!device || !incrementValue) {
return ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
if (device->getAggregatedCopyOffloadIncrementValue() == 0) {
uint32_t numTiles = std::max(device->getNEODevice()->getNumSubDevices(), 1u);
auto bcsSplit = device->bcsSplit.get();
uint32_t bcsSplitEngines = 1;
uint64_t lcmResult = 1;
if (device->getNEODevice()->isBcsSplitSupported()) {
if (bcsSplit->cmdLists.empty()) {
auto csr = device->getNEODevice()->tryGetRegularEngineGroup(NEO::EngineGroupType::copy)->engines[0].commandStreamReceiver;
UNRECOVERABLE_IF(!csr);
bcsSplit->setupDevice(csr, false);
UNRECOVERABLE_IF(bcsSplit->cmdLists.empty());
}
bcsSplitEngines = static_cast<uint32_t>(bcsSplit->cmdLists.size());
}
for (uint32_t i = 2; i <= bcsSplitEngines; i++) {
lcmResult = std::lcm(lcmResult, i);
}
UNRECOVERABLE_IF(lcmResult * numTiles > std::numeric_limits<uint32_t>::max());
device->setAggregatedCopyOffloadIncrementValue(static_cast<uint32_t>(lcmResult * numTiles));
}
*incrementValue = device->getAggregatedCopyOffloadIncrementValue();
return ZE_RESULT_SUCCESS;
}
} // namespace L0
extern "C" {
ZE_APIEXPORT ze_result_t ZE_APICALL
zexEventGetDeviceAddress(
ze_event_handle_t event,
uint64_t *completionValue,
uint64_t *address) {
return L0::zexEventGetDeviceAddress(event, completionValue, address);
}
// deprecated
ZE_APIEXPORT ze_result_t ZE_APICALL
zexCounterBasedEventCreate(
ze_context_handle_t hContext,
ze_device_handle_t hDevice,
uint64_t *deviceAddress,
uint64_t *hostAddress,
uint64_t completionValue,
const ze_event_desc_t *desc,
ze_event_handle_t *phEvent) {
return L0::zexCounterBasedEventCreate(hContext, hDevice, deviceAddress, hostAddress, completionValue, desc, phEvent);
}
ZE_APIEXPORT ze_result_t ZE_APICALL zexIntelAllocateNetworkInterrupt(ze_context_handle_t hContext, uint32_t &networkInterruptId) {
return L0::zexIntelAllocateNetworkInterrupt(hContext, networkInterruptId);
}
ZE_APIEXPORT ze_result_t ZE_APICALL zexIntelReleaseNetworkInterrupt(ze_context_handle_t hContext, uint32_t networkInterruptId) {
return L0::zexIntelReleaseNetworkInterrupt(hContext, networkInterruptId);
}
ZE_APIEXPORT ze_result_t ZE_APICALL zexCounterBasedEventCreate2(ze_context_handle_t hContext, ze_device_handle_t hDevice, const zex_counter_based_event_desc_t *desc, ze_event_handle_t *phEvent) {
return L0::zexCounterBasedEventCreate2(hContext, hDevice, desc, phEvent);
}
ZE_APIEXPORT ze_result_t ZE_APICALL zexCounterBasedEventGetIpcHandle(ze_event_handle_t hEvent, zex_ipc_counter_based_event_handle_t *phIpc) {
return L0::zexCounterBasedEventGetIpcHandle(hEvent, phIpc);
}
ZE_APIEXPORT ze_result_t ZE_APICALL zexCounterBasedEventOpenIpcHandle(ze_context_handle_t hContext, zex_ipc_counter_based_event_handle_t hIpc, ze_event_handle_t *phEvent) {
return L0::zexCounterBasedEventOpenIpcHandle(hContext, hIpc, phEvent);
}
ZE_APIEXPORT ze_result_t ZE_APICALL zexCounterBasedEventCloseIpcHandle(ze_event_handle_t hEvent) {
return L0::zexCounterBasedEventCloseIpcHandle(hEvent);
}
ZE_APIEXPORT ze_result_t ZE_APICALL zexDeviceGetAggregatedCopyOffloadIncrementValue(ze_device_handle_t hDevice, uint32_t *incrementValue) {
return L0::zexDeviceGetAggregatedCopyOffloadIncrementValue(hDevice, incrementValue);
}
} // extern "C"