/* * Copyright (C) 2018 Intel Corporation * * SPDX-License-Identifier: MIT * */ #include "runtime/helpers/aligned_memory.h" #include "runtime/helpers/options.h" #include "runtime/os_interface/windows/gdi_interface.h" #include "runtime/os_interface/windows/kmdaf_listener.h" #include "runtime/gmm_helper/gmm.h" #include "runtime/gmm_helper/gmm_helper.h" #include "runtime/gmm_helper/resource_info.h" #include "runtime/gmm_helper/page_table_mngr.h" #include "runtime/os_interface/windows/wddm/wddm.h" #include "runtime/os_interface/hw_info_config.h" #include "runtime/os_interface/windows/gdi_interface.h" #include "runtime/os_interface/windows/os_context_win.h" #include "runtime/os_interface/windows/wddm_allocation.h" #include "runtime/os_interface/windows/registry_reader.h" #include "runtime/helpers/debug_helpers.h" #include "runtime/helpers/hw_info.h" #include "runtime/helpers/wddm_helper.h" #include "runtime/command_stream/linear_stream.h" #include "runtime/sku_info/operations/sku_info_receiver.h" #include "runtime/utilities/stackvec.h" #include #include "CL/cl.h" namespace OCLRT { extern Wddm::CreateDXGIFactoryFcn getCreateDxgiFactory(); extern Wddm::GetSystemInfoFcn getGetSystemInfo(); extern Wddm::VirtualAllocFcn getVirtualAlloc(); extern Wddm::VirtualFreeFcn getVirtualFree(); class WddmMemoryManager; Wddm::CreateDXGIFactoryFcn Wddm::createDxgiFactory = getCreateDxgiFactory(); Wddm::GetSystemInfoFcn Wddm::getSystemInfo = getGetSystemInfo(); Wddm::VirtualAllocFcn Wddm::virtualAllocFnc = getVirtualAlloc(); Wddm::VirtualFreeFcn Wddm::virtualFreeFnc = getVirtualFree(); Wddm::Wddm() { featureTable.reset(new FeatureTable()); waTable.reset(new WorkaroundTable()); gtSystemInfo.reset(new GT_SYSTEM_INFO); gfxPlatform.reset(new PLATFORM); memset(gtSystemInfo.get(), 0, sizeof(*gtSystemInfo)); memset(gfxPlatform.get(), 0, sizeof(*gfxPlatform)); registryReader.reset(new RegistryReader("System\\CurrentControlSet\\Control\\GraphicsDrivers\\Scheduler")); adapterLuid.HighPart = 0; adapterLuid.LowPart = 0; kmDafListener = std::unique_ptr(new KmDafListener); gdi = std::unique_ptr(new Gdi()); } Wddm::~Wddm() { resetPageTableManager(nullptr); destroyPagingQueue(); destroyDevice(); closeAdapter(); } bool Wddm::enumAdapters(HardwareInfo &outHardwareInfo) { if (!gdi->isInitialized()) { return false; } if (!openAdapter()) { return false; } if (!queryAdapterInfo()) { return false; } auto productFamily = gfxPlatform->eProductFamily; if (!hardwareInfoTable[productFamily]) { return false; } outHardwareInfo.pPlatform = new PLATFORM(*gfxPlatform); outHardwareInfo.pSkuTable = new FeatureTable(*featureTable); outHardwareInfo.pWaTable = new WorkaroundTable(*waTable); outHardwareInfo.pSysInfo = new GT_SYSTEM_INFO(*gtSystemInfo); outHardwareInfo.capabilityTable = hardwareInfoTable[productFamily]->capabilityTable; outHardwareInfo.capabilityTable.maxRenderFrequency = maxRenderFrequency; outHardwareInfo.capabilityTable.instrumentationEnabled &= instrumentationEnabled; HwInfoConfig *hwConfig = HwInfoConfig::get(productFamily); hwConfig->adjustPlatformForProductFamily(&outHardwareInfo); return true; } bool Wddm::queryAdapterInfo() { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_QUERYADAPTERINFO QueryAdapterInfo = {0}; ADAPTER_INFO adapterInfo = {0}; QueryAdapterInfo.hAdapter = adapter; QueryAdapterInfo.Type = KMTQAITYPE_UMDRIVERPRIVATE; QueryAdapterInfo.pPrivateDriverData = &adapterInfo; QueryAdapterInfo.PrivateDriverDataSize = sizeof(ADAPTER_INFO); status = gdi->queryAdapterInfo(&QueryAdapterInfo); DEBUG_BREAK_IF(status != STATUS_SUCCESS); // translate if (status == STATUS_SUCCESS) { memcpy_s(gtSystemInfo.get(), sizeof(GT_SYSTEM_INFO), &adapterInfo.SystemInfo, sizeof(GT_SYSTEM_INFO)); memcpy_s(gfxPlatform.get(), sizeof(PLATFORM), &adapterInfo.GfxPlatform, sizeof(PLATFORM)); SkuInfoReceiver::receiveFtrTableFromAdapterInfo(featureTable.get(), &adapterInfo); SkuInfoReceiver::receiveWaTableFromAdapterInfo(waTable.get(), &adapterInfo); memcpy_s(&gfxPartition, sizeof(gfxPartition), &adapterInfo.GfxPartition, sizeof(GMM_GFX_PARTITIONING)); deviceRegistryPath = adapterInfo.DeviceRegistryPath; systemSharedMemory = adapterInfo.SystemSharedMemory; maxRenderFrequency = adapterInfo.MaxRenderFreq; instrumentationEnabled = adapterInfo.Caps.InstrumentationIsEnabled != 0; } return status == STATUS_SUCCESS; } bool Wddm::createPagingQueue() { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_CREATEPAGINGQUEUE CreatePagingQueue = {0}; CreatePagingQueue.hDevice = device; CreatePagingQueue.Priority = D3DDDI_PAGINGQUEUE_PRIORITY_NORMAL; status = gdi->createPagingQueue(&CreatePagingQueue); if (status == STATUS_SUCCESS) { pagingQueue = CreatePagingQueue.hPagingQueue; pagingQueueSyncObject = CreatePagingQueue.hSyncObject; pagingFenceAddress = reinterpret_cast(CreatePagingQueue.FenceValueCPUVirtualAddress); } return status == STATUS_SUCCESS; } bool Wddm::destroyPagingQueue() { D3DDDI_DESTROYPAGINGQUEUE DestroyPagingQueue = {0}; if (pagingQueue) { DestroyPagingQueue.hPagingQueue = pagingQueue; NTSTATUS status = gdi->destroyPagingQueue(&DestroyPagingQueue); DEBUG_BREAK_IF(status != STATUS_SUCCESS); pagingQueue = 0; } return true; } bool Wddm::createDevice() { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_CREATEDEVICE CreateDevice = {{0}}; if (adapter) { CreateDevice.hAdapter = adapter; CreateDevice.Flags.LegacyMode = FALSE; if (preemptionMode >= PreemptionMode::MidBatch) { CreateDevice.Flags.DisableGpuTimeout = readEnablePreemptionRegKey(); } status = gdi->createDevice(&CreateDevice); if (status == STATUS_SUCCESS) { device = CreateDevice.hDevice; } } return status == STATUS_SUCCESS; } bool Wddm::destroyDevice() { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_DESTROYDEVICE DestroyDevice = {0}; if (device) { DestroyDevice.hDevice = device; status = gdi->destroyDevice(&DestroyDevice); DEBUG_BREAK_IF(status != STATUS_SUCCESS); device = 0; } return true; } bool Wddm::closeAdapter() { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_CLOSEADAPTER CloseAdapter = {0}; CloseAdapter.hAdapter = adapter; status = gdi->closeAdapter(&CloseAdapter); DEBUG_BREAK_IF(status != STATUS_SUCCESS); adapter = 0; return true; } bool Wddm::openAdapter() { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_OPENADAPTERFROMLUID OpenAdapterData = {{0}}; DXGI_ADAPTER_DESC1 OpenAdapterDesc = {{0}}; IDXGIFactory1 *pFactory = nullptr; IDXGIAdapter1 *pAdapter = nullptr; DWORD iDevNum = 0; HRESULT hr = Wddm::createDxgiFactory(__uuidof(IDXGIFactory), (void **)(&pFactory)); if ((hr != S_OK) || (pFactory == nullptr)) { return false; } while (pFactory->EnumAdapters1(iDevNum++, &pAdapter) != DXGI_ERROR_NOT_FOUND) { hr = pAdapter->GetDesc1(&OpenAdapterDesc); if (hr == S_OK) { // Check for adapters that include either "Intel" or "Citrix" (which may // be virtualizing one of our adapters) in the description if ((wcsstr(OpenAdapterDesc.Description, L"Intel") != 0) || (wcsstr(OpenAdapterDesc.Description, L"Citrix") != 0)) { break; } } // Release all the non-Intel adapters pAdapter->Release(); pAdapter = nullptr; } OpenAdapterData.AdapterLuid = OpenAdapterDesc.AdapterLuid; status = gdi->openAdapterFromLuid(&OpenAdapterData); if (pAdapter != nullptr) { // If an Intel adapter was found, release it here pAdapter->Release(); pAdapter = nullptr; } if (pFactory != nullptr) { pFactory->Release(); pFactory = nullptr; } if (status == STATUS_SUCCESS) { adapter = OpenAdapterData.hAdapter; adapterLuid = OpenAdapterDesc.AdapterLuid; } return status == STATUS_SUCCESS; } bool Wddm::evict(D3DKMT_HANDLE *handleList, uint32_t numOfHandles, uint64_t &sizeToTrim) { NTSTATUS status = STATUS_SUCCESS; D3DKMT_EVICT Evict = {0}; Evict.AllocationList = handleList; Evict.hDevice = device; Evict.NumAllocations = numOfHandles; Evict.NumBytesToTrim = 0; status = gdi->evict(&Evict); sizeToTrim = Evict.NumBytesToTrim; kmDafListener->notifyEvict(featureTable->ftrKmdDaf, adapter, device, handleList, numOfHandles, gdi->escape); return status == STATUS_SUCCESS; } bool Wddm::makeResident(D3DKMT_HANDLE *handles, uint32_t count, bool cantTrimFurther, uint64_t *numberOfBytesToTrim) { NTSTATUS status = STATUS_SUCCESS; D3DDDI_MAKERESIDENT makeResident = {0}; UINT priority = 0; bool success = false; makeResident.AllocationList = handles; makeResident.hPagingQueue = pagingQueue; makeResident.NumAllocations = count; makeResident.PriorityList = &priority; makeResident.Flags.CantTrimFurther = cantTrimFurther ? 1 : 0; makeResident.Flags.MustSucceed = cantTrimFurther ? 1 : 0; status = gdi->makeResident(&makeResident); if (status == STATUS_PENDING) { interlockedMax(currentPagingFenceValue, makeResident.PagingFenceValue); success = true; } else if (status == STATUS_SUCCESS) { success = true; } else { DEBUG_BREAK_IF(true); if (numberOfBytesToTrim != nullptr) *numberOfBytesToTrim = makeResident.NumBytesToTrim; UNRECOVERABLE_IF(cantTrimFurther); } kmDafListener->notifyMakeResident(featureTable->ftrKmdDaf, adapter, device, handles, count, gdi->escape); return success; } bool Wddm::mapGpuVirtualAddress(WddmAllocation *allocation, void *cpuPtr, bool allocation32bit, bool use64kbPages, bool useHeap1) { void *mapPtr = allocation->getReservedAddress() != nullptr ? allocation->getReservedAddress() : cpuPtr; return mapGpuVirtualAddressImpl(allocation->gmm, allocation->handle, mapPtr, allocation->gpuPtr, allocation32bit, use64kbPages, useHeap1); } bool Wddm::mapGpuVirtualAddress(AllocationStorageData *allocationStorageData, bool allocation32bit, bool use64kbPages) { return mapGpuVirtualAddressImpl(allocationStorageData->osHandleStorage->gmm, allocationStorageData->osHandleStorage->handle, const_cast(allocationStorageData->cpuPtr), allocationStorageData->osHandleStorage->gpuPtr, allocation32bit, use64kbPages, false); } bool Wddm::mapGpuVirtualAddressImpl(Gmm *gmm, D3DKMT_HANDLE handle, void *cpuPtr, D3DGPU_VIRTUAL_ADDRESS &gpuPtr, bool allocation32bit, bool use64kbPages, bool useHeap1) { NTSTATUS status = STATUS_SUCCESS; D3DDDI_MAPGPUVIRTUALADDRESS MapGPUVA = {0}; D3DDDIGPUVIRTUALADDRESS_PROTECTION_TYPE protectionType = {{{0}}}; protectionType.Write = TRUE; uint64_t size = static_cast(gmm->gmmResourceInfo->getSizeAllocation()); MapGPUVA.hPagingQueue = pagingQueue; MapGPUVA.hAllocation = handle; MapGPUVA.Protection = protectionType; MapGPUVA.SizeInPages = size / MemoryConstants::pageSize; MapGPUVA.OffsetInPages = 0; auto productFamily = gfxPlatform->eProductFamily; UNRECOVERABLE_IF(!hardwareInfoTable[productFamily]); if (useHeap1) { MapGPUVA.MinimumAddress = gfxPartition.Heap32[1].Base; MapGPUVA.MaximumAddress = gfxPartition.Heap32[1].Limit; MapGPUVA.BaseAddress = 0; } else if (use64kbPages) { MapGPUVA.MinimumAddress = gfxPartition.Standard64KB.Base; MapGPUVA.MaximumAddress = gfxPartition.Standard64KB.Limit; } else { if (hardwareInfoTable[productFamily]->capabilityTable.gpuAddressSpace == MemoryConstants::max48BitAddress) { MapGPUVA.BaseAddress = reinterpret_cast(cpuPtr); MapGPUVA.MinimumAddress = static_cast(0x0); MapGPUVA.MaximumAddress = static_cast((sizeof(size_t) == 8) ? 0x7fffffffffff : (D3DGPU_VIRTUAL_ADDRESS)0xffffffff); if (!cpuPtr) { MapGPUVA.MinimumAddress = gfxPartition.Standard.Base; MapGPUVA.MaximumAddress = gfxPartition.Standard.Limit; } } else { MapGPUVA.BaseAddress = 0; MapGPUVA.MinimumAddress = 0x0; MapGPUVA.MaximumAddress = hardwareInfoTable[productFamily]->capabilityTable.gpuAddressSpace; } if (allocation32bit) { MapGPUVA.MinimumAddress = gfxPartition.Heap32[0].Base; MapGPUVA.MaximumAddress = gfxPartition.Heap32[0].Limit; MapGPUVA.BaseAddress = 0; } } status = gdi->mapGpuVirtualAddress(&MapGPUVA); gpuPtr = GmmHelper::canonize(MapGPUVA.VirtualAddress); if (status == STATUS_PENDING) { interlockedMax(currentPagingFenceValue, MapGPUVA.PagingFenceValue); status = STATUS_SUCCESS; } if (status != STATUS_SUCCESS) { DEBUG_BREAK_IF(true); return false; } kmDafListener->notifyMapGpuVA(featureTable->ftrKmdDaf, adapter, device, handle, MapGPUVA.VirtualAddress, gdi->escape); if (gmm->isRenderCompressed && pageTableManager.get()) { return updateAuxTable(gpuPtr, gmm, true); } return true; } bool Wddm::freeGpuVirtualAddres(D3DGPU_VIRTUAL_ADDRESS &gpuPtr, uint64_t size) { NTSTATUS status = STATUS_SUCCESS; D3DKMT_FREEGPUVIRTUALADDRESS FreeGPUVA = {0}; FreeGPUVA.hAdapter = adapter; FreeGPUVA.BaseAddress = GmmHelper::decanonize(gpuPtr); FreeGPUVA.Size = size; status = gdi->freeGpuVirtualAddress(&FreeGPUVA); gpuPtr = static_cast(0); kmDafListener->notifyUnmapGpuVA(featureTable->ftrKmdDaf, adapter, device, FreeGPUVA.BaseAddress, gdi->escape); return status == STATUS_SUCCESS; } NTSTATUS Wddm::createAllocation(WddmAllocation *alloc) { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DDDI_ALLOCATIONINFO AllocationInfo = {0}; D3DKMT_CREATEALLOCATION CreateAllocation = {0}; size_t size; if (alloc == nullptr) return false; size = alloc->getAlignedSize(); if (size == 0) return false; AllocationInfo.pSystemMem = alloc->getAlignedCpuPtr(); AllocationInfo.pPrivateDriverData = alloc->gmm->gmmResourceInfo->peekHandle(); AllocationInfo.PrivateDriverDataSize = static_cast(sizeof(GMM_RESOURCE_INFO)); AllocationInfo.Flags.Primary = 0; CreateAllocation.hGlobalShare = 0; CreateAllocation.PrivateRuntimeDataSize = 0; CreateAllocation.PrivateDriverDataSize = 0; CreateAllocation.Flags.Reserved = 0; CreateAllocation.NumAllocations = 1; CreateAllocation.pPrivateRuntimeData = NULL; CreateAllocation.pPrivateDriverData = NULL; CreateAllocation.Flags.NonSecure = FALSE; CreateAllocation.Flags.CreateShared = FALSE; CreateAllocation.Flags.RestrictSharedAccess = FALSE; CreateAllocation.Flags.CreateResource = alloc->getAlignedCpuPtr() == 0 ? TRUE : FALSE; CreateAllocation.pAllocationInfo = &AllocationInfo; CreateAllocation.hDevice = device; status = gdi->createAllocation(&CreateAllocation); if (status != STATUS_SUCCESS) { DEBUG_BREAK_IF(true); return status; } alloc->handle = AllocationInfo.hAllocation; kmDafListener->notifyWriteTarget(featureTable->ftrKmdDaf, adapter, device, alloc->handle, gdi->escape); return status; } bool Wddm::createAllocation64k(WddmAllocation *alloc) { NTSTATUS status = STATUS_SUCCESS; D3DDDI_ALLOCATIONINFO AllocationInfo = {0}; D3DKMT_CREATEALLOCATION CreateAllocation = {0}; AllocationInfo.pSystemMem = 0; AllocationInfo.pPrivateDriverData = alloc->gmm->gmmResourceInfo->peekHandle(); AllocationInfo.PrivateDriverDataSize = static_cast(sizeof(GMM_RESOURCE_INFO)); AllocationInfo.Flags.Primary = 0; CreateAllocation.NumAllocations = 1; CreateAllocation.pPrivateRuntimeData = NULL; CreateAllocation.pPrivateDriverData = NULL; CreateAllocation.Flags.CreateResource = TRUE; CreateAllocation.pAllocationInfo = &AllocationInfo; CreateAllocation.hDevice = device; status = gdi->createAllocation(&CreateAllocation); if (status != STATUS_SUCCESS) { DEBUG_BREAK_IF(true); return false; } alloc->handle = AllocationInfo.hAllocation; kmDafListener->notifyWriteTarget(featureTable->ftrKmdDaf, adapter, device, alloc->handle, gdi->escape); return true; } NTSTATUS Wddm::createAllocationsAndMapGpuVa(OsHandleStorage &osHandles) { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DDDI_ALLOCATIONINFO AllocationInfo[maxFragmentsCount] = {{0}}; D3DKMT_CREATEALLOCATION CreateAllocation = {0}; auto allocationCount = 0; for (unsigned int i = 0; i < maxFragmentsCount; i++) { if (!osHandles.fragmentStorageData[i].osHandleStorage) { break; } if (osHandles.fragmentStorageData[i].osHandleStorage->handle == (D3DKMT_HANDLE) nullptr && osHandles.fragmentStorageData[i].fragmentSize) { AllocationInfo[allocationCount].pPrivateDriverData = osHandles.fragmentStorageData[i].osHandleStorage->gmm->gmmResourceInfo->peekHandle(); auto pSysMem = osHandles.fragmentStorageData[i].cpuPtr; auto PSysMemFromGmm = osHandles.fragmentStorageData[i].osHandleStorage->gmm->gmmResourceInfo->getSystemMemPointer(CL_TRUE); DEBUG_BREAK_IF(PSysMemFromGmm != pSysMem); AllocationInfo[allocationCount].pSystemMem = osHandles.fragmentStorageData[i].cpuPtr; AllocationInfo[allocationCount].PrivateDriverDataSize = static_cast(sizeof(GMM_RESOURCE_INFO)); allocationCount++; } } if (allocationCount == 0) { return STATUS_SUCCESS; } CreateAllocation.hGlobalShare = 0; CreateAllocation.PrivateRuntimeDataSize = 0; CreateAllocation.PrivateDriverDataSize = 0; CreateAllocation.Flags.Reserved = 0; CreateAllocation.NumAllocations = allocationCount; CreateAllocation.pPrivateRuntimeData = NULL; CreateAllocation.pPrivateDriverData = NULL; CreateAllocation.Flags.NonSecure = FALSE; CreateAllocation.Flags.CreateShared = FALSE; CreateAllocation.Flags.RestrictSharedAccess = FALSE; CreateAllocation.Flags.CreateResource = FALSE; CreateAllocation.pAllocationInfo = AllocationInfo; CreateAllocation.hDevice = device; while (status == STATUS_UNSUCCESSFUL) { status = gdi->createAllocation(&CreateAllocation); if (status != STATUS_SUCCESS) { DBG_LOG(PrintDebugMessages, __FUNCTION__, "status: ", status); DEBUG_BREAK_IF(true); break; } auto allocationIndex = 0; for (int i = 0; i < allocationCount; i++) { while (osHandles.fragmentStorageData[allocationIndex].osHandleStorage->handle) { allocationIndex++; } osHandles.fragmentStorageData[allocationIndex].osHandleStorage->handle = AllocationInfo[i].hAllocation; bool success = mapGpuVirtualAddress(&osHandles.fragmentStorageData[allocationIndex], false, false); allocationIndex++; if (!success) { DBG_LOG(PrintDebugMessages, __FUNCTION__, "mapGpuVirtualAddress: ", success); DEBUG_BREAK_IF(true); break; } kmDafListener->notifyWriteTarget(featureTable->ftrKmdDaf, adapter, device, AllocationInfo[i].hAllocation, gdi->escape); } status = STATUS_SUCCESS; } return status; } bool Wddm::destroyAllocations(D3DKMT_HANDLE *handles, uint32_t allocationCount, D3DKMT_HANDLE resourceHandle) { NTSTATUS status = STATUS_SUCCESS; D3DKMT_DESTROYALLOCATION2 DestroyAllocation = {0}; DEBUG_BREAK_IF(!(allocationCount <= 1 || resourceHandle == 0)); DestroyAllocation.hDevice = device; DestroyAllocation.hResource = resourceHandle; DestroyAllocation.phAllocationList = handles; DestroyAllocation.AllocationCount = allocationCount; DestroyAllocation.Flags.AssumeNotInUse = 1; status = gdi->destroyAllocation2(&DestroyAllocation); return status == STATUS_SUCCESS; } bool Wddm::openSharedHandle(D3DKMT_HANDLE handle, WddmAllocation *alloc) { D3DKMT_QUERYRESOURCEINFO QueryResourceInfo = {0}; QueryResourceInfo.hDevice = device; QueryResourceInfo.hGlobalShare = handle; auto status = gdi->queryResourceInfo(&QueryResourceInfo); DEBUG_BREAK_IF(status != STATUS_SUCCESS); if (QueryResourceInfo.NumAllocations == 0) { return false; } std::unique_ptr allocPrivateData(new char[QueryResourceInfo.TotalPrivateDriverDataSize]); std::unique_ptr resPrivateData(new char[QueryResourceInfo.ResourcePrivateDriverDataSize]); std::unique_ptr resPrivateRuntimeData(new char[QueryResourceInfo.PrivateRuntimeDataSize]); std::unique_ptr allocationInfo(new D3DDDI_OPENALLOCATIONINFO[QueryResourceInfo.NumAllocations]); D3DKMT_OPENRESOURCE OpenResource = {0}; OpenResource.hDevice = device; OpenResource.hGlobalShare = handle; OpenResource.NumAllocations = QueryResourceInfo.NumAllocations; OpenResource.pOpenAllocationInfo = allocationInfo.get(); OpenResource.pTotalPrivateDriverDataBuffer = allocPrivateData.get(); OpenResource.TotalPrivateDriverDataBufferSize = QueryResourceInfo.TotalPrivateDriverDataSize; OpenResource.pResourcePrivateDriverData = resPrivateData.get(); OpenResource.ResourcePrivateDriverDataSize = QueryResourceInfo.ResourcePrivateDriverDataSize; OpenResource.pPrivateRuntimeData = resPrivateRuntimeData.get(); OpenResource.PrivateRuntimeDataSize = QueryResourceInfo.PrivateRuntimeDataSize; status = gdi->openResource(&OpenResource); DEBUG_BREAK_IF(status != STATUS_SUCCESS); alloc->handle = allocationInfo[0].hAllocation; alloc->resourceHandle = OpenResource.hResource; auto resourceInfo = const_cast(allocationInfo[0].pPrivateDriverData); alloc->gmm = new Gmm(static_cast(resourceInfo)); return true; } bool Wddm::openNTHandle(HANDLE handle, WddmAllocation *alloc) { D3DKMT_QUERYRESOURCEINFOFROMNTHANDLE queryResourceInfoFromNtHandle = {}; queryResourceInfoFromNtHandle.hDevice = device; queryResourceInfoFromNtHandle.hNtHandle = handle; auto status = gdi->queryResourceInfoFromNtHandle(&queryResourceInfoFromNtHandle); DEBUG_BREAK_IF(status != STATUS_SUCCESS); std::unique_ptr allocPrivateData(new char[queryResourceInfoFromNtHandle.TotalPrivateDriverDataSize]); std::unique_ptr resPrivateData(new char[queryResourceInfoFromNtHandle.ResourcePrivateDriverDataSize]); std::unique_ptr resPrivateRuntimeData(new char[queryResourceInfoFromNtHandle.PrivateRuntimeDataSize]); std::unique_ptr allocationInfo2(new D3DDDI_OPENALLOCATIONINFO2[queryResourceInfoFromNtHandle.NumAllocations]); D3DKMT_OPENRESOURCEFROMNTHANDLE openResourceFromNtHandle = {}; openResourceFromNtHandle.hDevice = device; openResourceFromNtHandle.hNtHandle = handle; openResourceFromNtHandle.NumAllocations = queryResourceInfoFromNtHandle.NumAllocations; openResourceFromNtHandle.pOpenAllocationInfo2 = allocationInfo2.get(); openResourceFromNtHandle.pTotalPrivateDriverDataBuffer = allocPrivateData.get(); openResourceFromNtHandle.TotalPrivateDriverDataBufferSize = queryResourceInfoFromNtHandle.TotalPrivateDriverDataSize; openResourceFromNtHandle.pResourcePrivateDriverData = resPrivateData.get(); openResourceFromNtHandle.ResourcePrivateDriverDataSize = queryResourceInfoFromNtHandle.ResourcePrivateDriverDataSize; openResourceFromNtHandle.pPrivateRuntimeData = resPrivateRuntimeData.get(); openResourceFromNtHandle.PrivateRuntimeDataSize = queryResourceInfoFromNtHandle.PrivateRuntimeDataSize; status = gdi->openResourceFromNtHandle(&openResourceFromNtHandle); DEBUG_BREAK_IF(status != STATUS_SUCCESS); alloc->handle = allocationInfo2[0].hAllocation; alloc->resourceHandle = openResourceFromNtHandle.hResource; auto resourceInfo = const_cast(allocationInfo2[0].pPrivateDriverData); alloc->gmm = new Gmm(static_cast(resourceInfo)); return true; } void *Wddm::lockResource(WddmAllocation *wddmAllocation) { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_LOCK2 lock2 = {}; lock2.hAllocation = wddmAllocation->handle; lock2.hDevice = this->device; status = gdi->lock2(&lock2); DEBUG_BREAK_IF(status != STATUS_SUCCESS); kmDafListener->notifyLock(featureTable->ftrKmdDaf, adapter, device, wddmAllocation->handle, 0, gdi->escape); return lock2.pData; } void Wddm::unlockResource(WddmAllocation *wddmAllocation) { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_UNLOCK2 unlock2 = {}; unlock2.hAllocation = wddmAllocation->handle; unlock2.hDevice = this->device; status = gdi->unlock2(&unlock2); DEBUG_BREAK_IF(status != STATUS_SUCCESS); kmDafListener->notifyUnlock(featureTable->ftrKmdDaf, adapter, device, &wddmAllocation->handle, 1, gdi->escape); } void Wddm::kmDafLock(WddmAllocation *wddmAllocation) { kmDafListener->notifyLock(featureTable->ftrKmdDaf, adapter, device, wddmAllocation->handle, 0, gdi->escape); } bool Wddm::createContext(D3DKMT_HANDLE &context) { NTSTATUS status = STATUS_UNSUCCESSFUL; D3DKMT_CREATECONTEXTVIRTUAL CreateContext = {0}; CREATECONTEXT_PVTDATA PrivateData = {{0}}; PrivateData.IsProtectedProcess = FALSE; PrivateData.IsDwm = FALSE; PrivateData.ProcessID = GetCurrentProcessId(); PrivateData.GpuVAContext = TRUE; PrivateData.pHwContextId = &hwContextId; PrivateData.IsMediaUsage = false; PrivateData.NoRingFlushes = DebugManager.flags.UseNoRingFlushesKmdMode.get(); applyAdditionalContextFlags(PrivateData); CreateContext.EngineAffinity = 0; CreateContext.Flags.NullRendering = static_cast(DebugManager.flags.EnableNullHardware.get()); CreateContext.Flags.HwQueueSupported = wddmInterface->hwQueuesSupported(); if (preemptionMode >= PreemptionMode::MidBatch) { CreateContext.Flags.DisableGpuTimeout = readEnablePreemptionRegKey(); } CreateContext.PrivateDriverDataSize = sizeof(PrivateData); CreateContext.NodeOrdinal = node; CreateContext.pPrivateDriverData = &PrivateData; CreateContext.ClientHint = D3DKMT_CLIENTHINT_OPENGL; CreateContext.hDevice = device; status = gdi->createContext(&CreateContext); context = CreateContext.hContext; return status == STATUS_SUCCESS; } bool Wddm::destroyContext(D3DKMT_HANDLE context) { D3DKMT_DESTROYCONTEXT DestroyContext = {0}; NTSTATUS status = STATUS_UNSUCCESSFUL; if (context != static_cast(0)) { DestroyContext.hContext = context; status = gdi->destroyContext(&DestroyContext); } return status == STATUS_SUCCESS; } bool Wddm::submit(uint64_t commandBuffer, size_t size, void *commandHeader, OsContextWin &osContext) { bool status = false; if (currentPagingFenceValue > *pagingFenceAddress && !waitOnGPU(osContext.getContext())) { return false; } DBG_LOG(ResidencyDebugEnable, "Residency:", __FUNCTION__, "currentFenceValue =", osContext.getMonitoredFence().currentFenceValue); status = wddmInterface->submit(commandBuffer, size, commandHeader, osContext); if (status) { osContext.getMonitoredFence().lastSubmittedFence = osContext.getMonitoredFence().currentFenceValue; osContext.getMonitoredFence().currentFenceValue++; } getDeviceState(); UNRECOVERABLE_IF(!status); return status; } void Wddm::getDeviceState() { #ifdef _DEBUG D3DKMT_GETDEVICESTATE GetDevState; memset(&GetDevState, 0, sizeof(GetDevState)); NTSTATUS status = STATUS_SUCCESS; GetDevState.hDevice = device; GetDevState.StateType = D3DKMT_DEVICESTATE_EXECUTION; status = gdi->getDeviceState(&GetDevState); DEBUG_BREAK_IF(status != STATUS_SUCCESS); if (status == STATUS_SUCCESS) { DEBUG_BREAK_IF(GetDevState.ExecutionState != D3DKMT_DEVICEEXECUTION_ACTIVE); } #endif } void Wddm::handleCompletion(OsContextWin &osContext) { if (osContext.getMonitoredFence().cpuAddress) { auto *currentTag = osContext.getMonitoredFence().cpuAddress; while (*currentTag < osContext.getMonitoredFence().currentFenceValue - 1) ; } } unsigned int Wddm::readEnablePreemptionRegKey() { return static_cast(registryReader->getSetting("EnablePreemption", 1)); } bool Wddm::waitOnGPU(D3DKMT_HANDLE context) { D3DKMT_WAITFORSYNCHRONIZATIONOBJECTFROMGPU WaitOnGPU = {0}; WaitOnGPU.hContext = context; WaitOnGPU.ObjectCount = 1; WaitOnGPU.ObjectHandleArray = &pagingQueueSyncObject; uint64_t localPagingFenceValue = currentPagingFenceValue; WaitOnGPU.MonitoredFenceValueArray = &localPagingFenceValue; NTSTATUS status = gdi->waitForSynchronizationObjectFromGpu(&WaitOnGPU); return status == STATUS_SUCCESS; } bool Wddm::waitFromCpu(uint64_t lastFenceValue, OsContextWin &osContext) { NTSTATUS status = STATUS_SUCCESS; if (lastFenceValue > *osContext.getMonitoredFence().cpuAddress) { D3DKMT_WAITFORSYNCHRONIZATIONOBJECTFROMCPU waitFromCpu = {0}; waitFromCpu.ObjectCount = 1; waitFromCpu.ObjectHandleArray = &osContext.getMonitoredFence().fenceHandle; waitFromCpu.FenceValueArray = &lastFenceValue; waitFromCpu.hDevice = device; waitFromCpu.hAsyncEvent = NULL; status = gdi->waitForSynchronizationObjectFromCpu(&waitFromCpu); DEBUG_BREAK_IF(status != STATUS_SUCCESS); } return status == STATUS_SUCCESS; } uint64_t Wddm::getSystemSharedMemory() const { return systemSharedMemory; } uint64_t Wddm::getMaxApplicationAddress() const { return maximumApplicationAddress; } NTSTATUS Wddm::escape(D3DKMT_ESCAPE &escapeCommand) { escapeCommand.hAdapter = adapter; return gdi->escape(&escapeCommand); }; PFND3DKMT_ESCAPE Wddm::getEscapeHandle() const { return gdi->escape; } uint64_t Wddm::getHeap32Base() { return alignUp(gfxPartition.Heap32[0].Base, MemoryConstants::pageSize); } uint64_t Wddm::getHeap32Size() { return alignDown(gfxPartition.Heap32[0].Limit, MemoryConstants::pageSize); } void Wddm::registerTrimCallback(PFND3DKMT_TRIMNOTIFICATIONCALLBACK callback, WddmMemoryManager *memoryManager) { if (DebugManager.flags.DoNotRegisterTrimCallback.get()) { return; } D3DKMT_REGISTERTRIMNOTIFICATION registerTrimNotification; registerTrimNotification.Callback = callback; registerTrimNotification.AdapterLuid = this->adapterLuid; registerTrimNotification.Context = memoryManager; registerTrimNotification.hDevice = this->device; NTSTATUS status = gdi->registerTrimNotification(®isterTrimNotification); if (status == STATUS_SUCCESS) { trimCallbackHandle = registerTrimNotification.Handle; } } void Wddm::unregisterTrimCallback(PFND3DKMT_TRIMNOTIFICATIONCALLBACK callback) { if (callback == nullptr) { return; } D3DKMT_UNREGISTERTRIMNOTIFICATION unregisterTrimNotification; unregisterTrimNotification.Callback = callback; unregisterTrimNotification.Handle = this->trimCallbackHandle; NTSTATUS status = gdi->unregisterTrimNotification(&unregisterTrimNotification); DEBUG_BREAK_IF(status != STATUS_SUCCESS); } void Wddm::releaseReservedAddress(void *reservedAddress) { if (reservedAddress) { auto status = virtualFree(reservedAddress, 0, MEM_RELEASE); DEBUG_BREAK_IF(!status); } } bool Wddm::updateAuxTable(D3DGPU_VIRTUAL_ADDRESS gpuVa, Gmm *gmm, bool map) { GMM_DDI_UPDATEAUXTABLE ddiUpdateAuxTable = {}; ddiUpdateAuxTable.BaseGpuVA = gpuVa; ddiUpdateAuxTable.BaseResInfo = gmm->gmmResourceInfo->peekHandle(); ddiUpdateAuxTable.DoNotWait = true; ddiUpdateAuxTable.Map = map ? 1u : 0u; return pageTableManager->updateAuxTable(&ddiUpdateAuxTable) == GMM_STATUS::GMM_SUCCESS; } void Wddm::resetPageTableManager(GmmPageTableMngr *newPageTableManager) { pageTableManager.reset(newPageTableManager); } bool Wddm::reserveValidAddressRange(size_t size, void *&reservedMem) { reservedMem = virtualAlloc(nullptr, size, MEM_RESERVE, PAGE_READWRITE); if (reservedMem == nullptr) { return false; } else if (minAddress > reinterpret_cast(reservedMem)) { StackVec invalidAddrVector; invalidAddrVector.push_back(reservedMem); do { reservedMem = virtualAlloc(nullptr, size, MEM_RESERVE | MEM_TOP_DOWN, PAGE_READWRITE); if (minAddress > reinterpret_cast(reservedMem) && reservedMem != nullptr) { invalidAddrVector.push_back(reservedMem); } else { break; } } while (1); for (auto &it : invalidAddrVector) { auto status = virtualFree(it, 0, MEM_RELEASE); DEBUG_BREAK_IF(!status); } if (reservedMem == nullptr) { return false; } } return true; } void *Wddm::virtualAlloc(void *inPtr, size_t size, unsigned long flags, unsigned long type) { return virtualAllocFnc(inPtr, size, flags, type); } int Wddm::virtualFree(void *ptr, size_t size, unsigned long flags) { return virtualFreeFnc(ptr, size, flags); } bool Wddm::configureDeviceAddressSpace() { SYSTEM_INFO sysInfo; Wddm::getSystemInfo(&sysInfo); maximumApplicationAddress = reinterpret_cast(sysInfo.lpMaximumApplicationAddress); auto productFamily = gfxPlatform->eProductFamily; if (!hardwareInfoTable[productFamily]) { return false; } auto svmSize = hardwareInfoTable[productFamily]->capabilityTable.gpuAddressSpace == MemoryConstants::max48BitAddress ? maximumApplicationAddress + 1u : 0u; return gmmMemory->configureDevice(adapter, device, gdi->escape, svmSize, featureTable->ftrL3IACoherency, gfxPartition, minAddress); } bool Wddm::init() { if (gdi != nullptr && gdi->isInitialized() && !initialized) { if (!openAdapter()) { return false; } if (!queryAdapterInfo()) { return false; } if (!wddmInterface) { if (featureTable->ftrWddmHwQueues) { wddmInterface = std::make_unique(*this); } else { wddmInterface = std::make_unique(*this); } } if (!createDevice()) { return false; } if (!createPagingQueue()) { return false; } if (!gmmMemory) { gmmMemory.reset(GmmMemory::create()); } initialized = configureDeviceAddressSpace(); } return initialized; } } // namespace OCLRT