150 lines
6.4 KiB
C++
150 lines
6.4 KiB
C++
/*
 * Copyright (C) 2019-2022 Intel Corporation
 *
 * SPDX-License-Identifier: MIT
 *
 */
|
|
|
|
#include "shared/source/page_fault_manager/cpu_page_fault_manager.h"
|
|
|
|
#include "shared/source/debug_settings/debug_settings_manager.h"
|
|
#include "shared/source/helpers/memory_properties_helpers.h"
|
|
#include "shared/source/memory_manager/unified_memory_manager.h"
|
|
#include "shared/source/utilities/spinlock.h"
|
|
|
|
#include <algorithm>
|
|
|
|
namespace NEO {
|
|
void PageFaultManager::insertAllocation(void *ptr, size_t size, SVMAllocsManager *unifiedMemoryManager, void *cmdQ, const MemoryProperties &memoryProperties) {
|
|
auto initialPlacement = MemoryPropertiesHelper::getUSMInitialPlacement(memoryProperties);
|
|
const auto domain = (initialPlacement == GraphicsAllocation::UsmInitialPlacement::CPU) ? AllocationDomain::Cpu : AllocationDomain::None;
|
|
|
|
std::unique_lock<SpinLock> lock{mtx};
|
|
this->memoryData.insert(std::make_pair(ptr, PageFaultData{size, unifiedMemoryManager, cmdQ, domain}));
|
|
if (initialPlacement != GraphicsAllocation::UsmInitialPlacement::CPU) {
|
|
this->protectCPUMemoryAccess(ptr, size);
|
|
}
|
|
unifiedMemoryManager->nonGpuDomainAllocs.push_back(ptr);
|
|
}
|
|
|
|
void PageFaultManager::removeAllocation(void *ptr) {
|
|
std::unique_lock<SpinLock> lock{mtx};
|
|
auto alloc = memoryData.find(ptr);
|
|
if (alloc != memoryData.end()) {
|
|
auto &pageFaultData = alloc->second;
|
|
if (pageFaultData.domain == AllocationDomain::Gpu) {
|
|
allowCPUMemoryAccess(ptr, pageFaultData.size);
|
|
} else {
|
|
auto &cpuAllocs = pageFaultData.unifiedMemoryManager->nonGpuDomainAllocs;
|
|
if (auto it = std::find(cpuAllocs.begin(), cpuAllocs.end(), ptr); it != cpuAllocs.end()) {
|
|
cpuAllocs.erase(it);
|
|
}
|
|
}
|
|
this->memoryData.erase(ptr);
|
|
}
|
|
}
|
|
|
|
void PageFaultManager::moveAllocationToGpuDomain(void *ptr) {
|
|
std::unique_lock<SpinLock> lock{mtx};
|
|
auto alloc = memoryData.find(ptr);
|
|
if (alloc != memoryData.end()) {
|
|
auto &pageFaultData = alloc->second;
|
|
if (pageFaultData.domain != AllocationDomain::Gpu) {
|
|
this->migrateStorageToGpuDomain(ptr, pageFaultData);
|
|
|
|
auto &cpuAllocs = pageFaultData.unifiedMemoryManager->nonGpuDomainAllocs;
|
|
if (auto it = std::find(cpuAllocs.begin(), cpuAllocs.end(), ptr); it != cpuAllocs.end()) {
|
|
cpuAllocs.erase(it);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// Migrates every allocation listed in the manager's nonGpuDomainAllocs to the
// Gpu domain, then clears that list.
//
// Records are looked up with find() rather than operator[]: operator[] would
// default-insert a PageFaultData for any listed pointer that has no record in
// memoryData (e.g. a stale or duplicated list entry) and then mark that
// placeholder as Gpu-domain. Such pointers are skipped instead.
void PageFaultManager::moveAllocationsWithinUMAllocsManagerToGpuDomain(SVMAllocsManager *unifiedMemoryManager) {
    std::unique_lock<SpinLock> lock{mtx};
    for (auto allocPtr : unifiedMemoryManager->nonGpuDomainAllocs) {
        auto alloc = this->memoryData.find(allocPtr);
        if (alloc == this->memoryData.end()) {
            continue; // no record for this pointer; nothing to migrate
        }
        this->migrateStorageToGpuDomain(allocPtr, alloc->second);
    }
    unifiedMemoryManager->nonGpuDomainAllocs.clear();
}
|
|
|
|
inline void PageFaultManager::migrateStorageToGpuDomain(void *ptr, PageFaultData &pageFaultData) {
|
|
if (pageFaultData.domain == AllocationDomain::Cpu) {
|
|
std::chrono::steady_clock::time_point start;
|
|
std::chrono::steady_clock::time_point end;
|
|
|
|
start = std::chrono::steady_clock::now();
|
|
this->transferToGpu(ptr, pageFaultData.cmdQ);
|
|
end = std::chrono::steady_clock::now();
|
|
long long elapsedTime = std::chrono::duration_cast<std::chrono::nanoseconds>(end - start).count();
|
|
|
|
if (DebugManager.flags.PrintUmdSharedMigration.get()) {
|
|
printf("UMD transferred shared allocation %llx (%zu B) from CPU to GPU (%f us)\n", reinterpret_cast<unsigned long long int>(ptr), pageFaultData.size, elapsedTime / 1e3);
|
|
}
|
|
|
|
this->protectCPUMemoryAccess(ptr, pageFaultData.size);
|
|
}
|
|
pageFaultData.domain = AllocationDomain::Gpu;
|
|
}
|
|
|
|
bool PageFaultManager::verifyPageFault(void *ptr) {
|
|
std::unique_lock<SpinLock> lock{mtx};
|
|
for (auto &alloc : this->memoryData) {
|
|
auto allocPtr = alloc.first;
|
|
auto &pageFaultData = alloc.second;
|
|
if (ptr >= allocPtr && ptr < ptrOffset(allocPtr, pageFaultData.size)) {
|
|
this->setAubWritable(true, allocPtr, pageFaultData.unifiedMemoryManager);
|
|
gpuDomainHandler(this, allocPtr, pageFaultData);
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
// Replaces the handler that verifyPageFault invokes for a matching allocation.
void PageFaultManager::setGpuDomainHandler(gpuDomainHandlerFunc gpuHandlerFuncPtr) {
    gpuDomainHandler = gpuHandlerFuncPtr;
}
|
|
|
|
// Handler variant: migrate the allocation to the Cpu domain first, then call
// allowCPUMemoryAccess on its range. The order is the only difference from
// unprotectAndTransferMemory.
void PageFaultManager::transferAndUnprotectMemory(PageFaultManager *pageFaultHandler, void *allocPtr, PageFaultData &pageFaultData) {
    auto &manager = *pageFaultHandler;
    manager.migrateStorageToCpuDomain(allocPtr, pageFaultData);
    manager.allowCPUMemoryAccess(allocPtr, pageFaultData.size);
}
|
|
|
|
// Handler variant: call allowCPUMemoryAccess on the range first, then migrate
// the allocation to the Cpu domain. The order is the only difference from
// transferAndUnprotectMemory.
void PageFaultManager::unprotectAndTransferMemory(PageFaultManager *pageFaultHandler, void *allocPtr, PageFaultData &pageFaultData) {
    auto &manager = *pageFaultHandler;
    manager.allowCPUMemoryAccess(allocPtr, pageFaultData.size);
    manager.migrateStorageToCpuDomain(allocPtr, pageFaultData);
}
|
|
|
|
inline void PageFaultManager::migrateStorageToCpuDomain(void *ptr, PageFaultData &pageFaultData) {
|
|
if (pageFaultData.domain == AllocationDomain::Gpu) {
|
|
std::chrono::steady_clock::time_point start;
|
|
std::chrono::steady_clock::time_point end;
|
|
|
|
start = std::chrono::steady_clock::now();
|
|
this->transferToCpu(ptr, pageFaultData.size, pageFaultData.cmdQ);
|
|
end = std::chrono::steady_clock::now();
|
|
long long elapsedTime = std::chrono::duration_cast<std::chrono::nanoseconds>(end - start).count();
|
|
|
|
if (DebugManager.flags.PrintUmdSharedMigration.get()) {
|
|
printf("UMD transferred shared allocation %llx (%zu B) from GPU to CPU (%f us)\n", reinterpret_cast<unsigned long long int>(ptr), pageFaultData.size, elapsedTime / 1e3);
|
|
}
|
|
pageFaultData.unifiedMemoryManager->nonGpuDomainAllocs.push_back(ptr);
|
|
}
|
|
pageFaultData.domain = AllocationDomain::Cpu;
|
|
}
|
|
|
|
void PageFaultManager::selectGpuDomainHandler() {
|
|
if (DebugManager.flags.SetCommandStreamReceiver.get() > CommandStreamReceiverType::CSR_HW || DebugManager.flags.NEO_CAL_ENABLED.get()) {
|
|
this->gpuDomainHandler = &PageFaultManager::unprotectAndTransferMemory;
|
|
}
|
|
}
|
|
|
|
void PageFaultManager::setAubWritable(bool writable, void *ptr, SVMAllocsManager *unifiedMemoryManager) {
|
|
UNRECOVERABLE_IF(ptr == nullptr);
|
|
auto gpuAlloc = unifiedMemoryManager->getSVMAlloc(ptr)->gpuAllocations.getDefaultGraphicsAllocation();
|
|
gpuAlloc->setAubWritable(writable, GraphicsAllocation::allBanks);
|
|
}
|
|
|
|
} // namespace NEO
|