Files
compute-runtime/opencl/source/platform/platform.cpp
Compute-Runtime-Validation a0d1a88f96 Revert "performance: move host/device memUsmAllocPool init to platform/contex...
This reverts commit f0f869ed42.

Signed-off-by: Compute-Runtime-Validation <compute-runtime-validation@intel.com>
2025-09-20 07:34:13 +02:00

358 lines
12 KiB
C++

/*
* Copyright (C) 2018-2025 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
*/
#include "platform.h"
#include "shared/source/built_ins/sip.h"
#include "shared/source/command_stream/command_stream_receiver.h"
#include "shared/source/compiler_interface/oclc_extensions.h"
#include "shared/source/debug_settings/debug_settings_manager.h"
#include "shared/source/device/root_device.h"
#include "shared/source/execution_environment/execution_environment.h"
#include "shared/source/execution_environment/root_device_environment.h"
#include "shared/source/helpers/api_specific_config.h"
#include "shared/source/helpers/debug_helpers.h"
#include "shared/source/helpers/get_info.h"
#include "shared/source/helpers/hw_info.h"
#include "shared/source/memory_manager/usm_pool_params.h"
#include "shared/source/os_interface/debug_env_reader.h"
#include "shared/source/os_interface/device_factory.h"
#include "shared/source/pin/pin.h"
#include "opencl/source/api/api.h"
#include "opencl/source/cl_device/cl_device.h"
#include "opencl/source/gtpin/gtpin_notify.h"
#include "opencl/source/helpers/get_info_status_mapper.h"
#include "opencl/source/platform/platform_info.h"
#include "opencl/source/sharings/sharing_factory.h"
#include "CL/cl_ext.h"
#include <algorithm>
#include <map>
namespace NEO {
std::vector<std::unique_ptr<Platform>> *platformsImpl = nullptr;
Platform::Platform(ExecutionEnvironment &executionEnvironmentIn) : executionEnvironment(executionEnvironmentIn) {
clDevices.reserve(4);
executionEnvironment.incRefInternal();
}
Platform::~Platform() {
executionEnvironment.prepareForCleanup();
usmHostMemAllocPool.cleanup();
if (isInitialized()) {
delete stagingBufferManager;
svmAllocsManager->cleanupUSMAllocCaches();
delete svmAllocsManager;
}
devicesCleanup(false);
gtpinNotifyPlatformShutdown();
executionEnvironment.decRefInternal();
}
cl_int Platform::getInfo(cl_platform_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet) {
auto retVal = CL_INVALID_VALUE;
const std::string *param = nullptr;
size_t paramSize = GetInfo::invalidSourceSize;
auto getInfoStatus = GetInfoStatus::invalidValue;
switch (paramName) {
case CL_PLATFORM_HOST_TIMER_RESOLUTION: {
auto pVal = static_cast<uint64_t>(this->clDevices[0]->getPlatformHostTimerResolution());
paramSize = sizeof(uint64_t);
getInfoStatus = GetInfo::getInfo(paramValue, paramValueSize, &pVal, paramSize);
break;
}
case CL_PLATFORM_NUMERIC_VERSION: {
auto pVal = platformInfo->numericVersion;
paramSize = sizeof(pVal);
getInfoStatus = GetInfo::getInfo(paramValue, paramValueSize, &pVal, paramSize);
break;
}
case CL_PLATFORM_EXTENSIONS_WITH_VERSION: {
std::call_once(initializeExtensionsWithVersionOnce, [this]() {
this->clDevices[0]->getDeviceInfo(CL_DEVICE_EXTENSIONS_WITH_VERSION, 0, nullptr, nullptr);
this->platformInfo->extensionsWithVersion = this->clDevices[0]->getDeviceInfo().extensionsWithVersion;
});
auto pVal = platformInfo->extensionsWithVersion.data();
paramSize = platformInfo->extensionsWithVersion.size() * sizeof(cl_name_version);
getInfoStatus = GetInfo::getInfo(paramValue, paramValueSize, pVal, paramSize);
break;
}
case CL_PLATFORM_PROFILE:
param = &platformInfo->profile;
break;
case CL_PLATFORM_VERSION:
param = &platformInfo->version;
break;
case CL_PLATFORM_NAME:
param = &platformInfo->name;
break;
case CL_PLATFORM_VENDOR:
param = &platformInfo->vendor;
break;
case CL_PLATFORM_EXTENSIONS:
param = &platformInfo->extensions;
break;
case CL_PLATFORM_ICD_SUFFIX_KHR:
param = &platformInfo->icdSuffixKhr;
break;
case CL_PLATFORM_EXTERNAL_MEMORY_IMPORT_HANDLE_TYPES_KHR: {
paramSize = sizeof(this->clDevices[0]->getDeviceInfo().externalMemorySharing);
getInfoStatus = GetInfo::getInfo(paramValue, paramValueSize, &this->clDevices[0]->getDeviceInfo().externalMemorySharing, paramSize);
break;
}
default:
break;
}
// Case for string parameters
if (param) {
paramSize = param->length() + 1;
getInfoStatus = GetInfo::getInfo(paramValue, paramValueSize, param->c_str(), paramSize);
}
retVal = changeGetInfoStatusToCLResultType(getInfoStatus);
GetInfo::setParamValueReturnSize(paramValueSizeRet, paramSize, getInfoStatus);
return retVal;
}
bool Platform::initialize(std::vector<std::unique_ptr<Device>> devices) {
TakeOwnershipWrapper<Platform> platformOwnership(*this);
if (devices.empty()) {
return false;
}
if (state == StateInited) {
return true;
}
state = StateIniting;
RootDeviceIndicesContainer rootDeviceIndices;
std::map<uint32_t, DeviceBitfield> deviceBitfields;
for (auto &inputDevice : devices) {
ClDevice *pClDevice = nullptr;
auto pDevice = inputDevice.release();
UNRECOVERABLE_IF(!pDevice);
pClDevice = new ClDevice{*pDevice, this};
this->clDevices.push_back(pClDevice);
rootDeviceIndices.pushUnique(pClDevice->getRootDeviceIndex());
}
for (auto &rootDeviceIndex : rootDeviceIndices) {
DeviceBitfield deviceBitfield{};
for (const auto &pDevice : this->clDevices) {
if (pDevice->getRootDeviceIndex() == rootDeviceIndex) {
deviceBitfield |= pDevice->getDeviceBitfield();
}
}
deviceBitfields.insert({rootDeviceIndex, deviceBitfield});
}
this->svmAllocsManager = new SVMAllocsManager(this->clDevices[0]->getMemoryManager());
this->svmAllocsManager->initUsmAllocationsCaches(this->clDevices[0]->getDevice());
bool requiresWritableStaging = this->clDevices[0]->getDefaultEngine().commandStreamReceiver->getType() != CommandStreamReceiverType::hardware;
this->stagingBufferManager = new StagingBufferManager(this->svmAllocsManager, rootDeviceIndices, deviceBitfields, requiresWritableStaging);
DEBUG_BREAK_IF(this->platformInfo);
this->platformInfo.reset(new PlatformInfo);
this->platformInfo->extensions = this->clDevices[0]->getDeviceInfo().deviceExtensions;
auto preferredPlatformName = this->clDevices[0]->getHardwareInfo().capabilityTable.preferredPlatformName;
if (preferredPlatformName != nullptr) {
this->platformInfo->name = preferredPlatformName;
}
if (debugManager.flags.OverridePlatformName.get() != "unk") {
this->platformInfo->name.assign(debugManager.flags.OverridePlatformName.get().c_str());
}
switch (this->clDevices[0]->getEnabledClVersion()) {
case 30:
this->platformInfo->version = "OpenCL 3.0 ";
this->platformInfo->numericVersion = CL_MAKE_VERSION(3, 0, 0);
break;
case 21:
this->platformInfo->version = "OpenCL 2.1 ";
this->platformInfo->numericVersion = CL_MAKE_VERSION(2, 1, 0);
break;
default:
this->platformInfo->version = "OpenCL 1.2 ";
this->platformInfo->numericVersion = CL_MAKE_VERSION(1, 2, 0);
break;
}
this->fillGlobalDispatchTable();
DEBUG_BREAK_IF(debugManager.flags.CreateMultipleSubDevices.get() > 1 && !this->clDevices[0]->getDefaultEngine().commandStreamReceiver->peekTimestampPacketWriteEnabled());
state = StateInited;
return true;
}
void Platform::tryNotifyGtpinInit() {
auto notifyGTPin = []() {
EnvironmentVariableReader envReader;
if (envReader.getSetting("ZET_ENABLE_PROGRAM_INSTRUMENTATION", false)) {
const std::string gtpinFuncName{"OpenGTPinOCL"};
PinContext::init(gtpinFuncName);
}
};
std::call_once(this->oclInitGTPinOnce, notifyGTPin);
}
void Platform::fillGlobalDispatchTable() {
sharingFactory.fillGlobalDispatchTable();
}
bool Platform::isInitialized() {
TakeOwnershipWrapper<Platform> platformOwnership(*this);
bool ret = (this->state == StateInited);
return ret;
}
ClDevice *Platform::getClDevice(size_t deviceOrdinal) {
TakeOwnershipWrapper<Platform> platformOwnership(*this);
if (this->state != StateInited || deviceOrdinal >= clDevices.size()) {
return nullptr;
}
auto pClDevice = clDevices[deviceOrdinal];
DEBUG_BREAK_IF(pClDevice == nullptr);
return pClDevice;
}
size_t Platform::getNumDevices() const {
TakeOwnershipWrapper<const Platform> platformOwnership(*this);
if (this->state != StateInited) {
return 0;
}
return clDevices.size();
}
ClDevice **Platform::getClDevices() {
TakeOwnershipWrapper<Platform> platformOwnership(*this);
if (this->state != StateInited) {
return nullptr;
}
return clDevices.data();
}
void Platform::devicesCleanup(bool processTermination) {
for (auto clDevice : this->clDevices) {
clDevice->getDevice().stopDirectSubmissionAndWaitForCompletion();
clDevice->getDevice().pollForCompletion();
if (processTermination) {
continue;
}
clDevice->getDevice().getRootDeviceEnvironmentRef().debugger.reset(nullptr);
clDevice->decRefInternal();
}
if (!processTermination) {
this->clDevices.clear();
}
}
const PlatformInfo &Platform::getPlatformInfo() const {
DEBUG_BREAK_IF(!platformInfo);
return *platformInfo;
}
std::unique_ptr<Platform> (*Platform::createFunc)(ExecutionEnvironment &) = [](ExecutionEnvironment &executionEnvironment) -> std::unique_ptr<Platform> {
return std::make_unique<Platform>(executionEnvironment);
};
SVMAllocsManager *Platform::getSVMAllocsManager() const {
return this->svmAllocsManager;
}
StagingBufferManager *Platform::getStagingBufferManager() const {
return this->stagingBufferManager;
}
UsmMemAllocPool &Platform::getHostMemAllocPool() {
return this->usmHostMemAllocPool;
}
void Platform::incActiveContextCount() {
TakeOwnershipWrapper<Platform> platformOwnership(*this);
this->activeContextCount++;
}
void Platform::decActiveContextCount() {
TakeOwnershipWrapper<Platform> platformOwnership(*this);
this->activeContextCount--;
DEBUG_BREAK_IF(this->activeContextCount < 0);
if (this->activeContextCount == 0) {
this->stagingBufferManager->freeAllocations();
}
}
void Platform::initializeHostUsmAllocationPool() {
if (this->usmPoolInitialized) {
return;
}
auto svmMemoryManager = this->getSVMAllocsManager();
TakeOwnershipWrapper<Platform> platformOwnership(*this);
if (this->usmPoolInitialized) {
return;
}
auto usmHostAllocPoolingEnabled = ApiSpecificConfig::isHostUsmPoolingEnabled();
for (auto &device : this->clDevices) {
usmHostAllocPoolingEnabled &= device->getProductHelper().isHostUsmPoolAllocatorSupported() && DeviceFactory::isHwModeSelected();
}
auto usmHostPoolParams = UsmPoolParams::getUsmPoolParams();
if (debugManager.flags.EnableHostUsmAllocationPool.get() != -1) {
usmHostAllocPoolingEnabled = debugManager.flags.EnableHostUsmAllocationPool.get() > 0;
usmHostPoolParams.poolSize = debugManager.flags.EnableHostUsmAllocationPool.get() * MemoryConstants::megaByte;
}
if (usmHostAllocPoolingEnabled) {
RootDeviceIndicesContainer rootDeviceIndices;
std::map<uint32_t, DeviceBitfield> deviceBitfields;
for (auto &device : this->clDevices) {
rootDeviceIndices.pushUnique(device->getRootDeviceIndex());
}
for (auto &rootDeviceIndex : rootDeviceIndices) {
DeviceBitfield deviceBitfield{};
for (const auto &pDevice : this->clDevices) {
if (pDevice->getRootDeviceIndex() == rootDeviceIndex) {
deviceBitfield |= pDevice->getDeviceBitfield();
}
}
deviceBitfields.insert({rootDeviceIndex, deviceBitfield});
}
SVMAllocsManager::UnifiedMemoryProperties memoryProperties(InternalMemoryType::hostUnifiedMemory, MemoryConstants::pageSize2M,
rootDeviceIndices, deviceBitfields);
this->usmHostMemAllocPool.initialize(svmMemoryManager, memoryProperties, usmHostPoolParams.poolSize, usmHostPoolParams.minServicedSize, usmHostPoolParams.maxServicedSize);
}
this->usmPoolInitialized = true;
}
} // namespace NEO