mirror of
https://github.com/intel/compute-runtime.git
synced 2025-12-22 01:48:50 +08:00
When the upstream ioctl helper is created, it tries to create a small allocation with the I915_GEM_CREATE_EXT_SET_PAT extension added. If that succeeds, then for every resource with a valid pat index value it explicitly programs the pat index value through the gem create ext call. The PrintBOCreateDestroyResult value can be used to: - print whether the set pat extension is supported by the kernel when the ioctl helper is created - print whether the set pat extension was added for a given gem create ext call and which pat index value was programmed. Resolves: NEO-7896 Signed-off-by: Filip Hazubski <filip.hazubski@intel.com>
304 lines
17 KiB
C++
304 lines
17 KiB
C++
/*
 * Copyright (C) 2021-2023 Intel Corporation
 *
 * SPDX-License-Identifier: MIT
 *
 */
|
|
|
|
#pragma once
|
|
#include "shared/source/command_stream/task_count_helper.h"
#include "shared/source/helpers/topology_map.h"
#include "shared/source/os_interface/linux/drm_wrappers.h"
#include "shared/source/utilities/stackvec.h"

#include "igfxfmid.h"

#include <array>
#include <cstddef>
#include <cstdint>
#include <iosfwd>
#include <memory>
#include <optional>
#include <string>
#include <vector>
|
|
|
|
namespace NEO {
|
|
// Forward declarations: the declarations below only use these types by
// reference, pointer, or as opaque enums, so the full definitions are not
// needed here.
class Drm;
class OsContextLinux;
class IoctlHelper;
enum class CacheRegion : uint16_t;
enum class PreferredLocation : int16_t;
struct HardwareInfo;
struct HardwareIpVersion;
struct EngineInfo;
struct DrmQueryTopologyData;

class MemoryInfo;
|
|
|
|
struct MemoryRegion {
|
|
MemoryClassInstance region;
|
|
uint64_t probedSize;
|
|
uint64_t unallocatedSize;
|
|
};
|
|
|
|
struct EngineCapabilities {
|
|
EngineClassInstance engine;
|
|
uint64_t capabilities;
|
|
};
|
|
|
|
struct DistanceInfo {
|
|
MemoryClassInstance region;
|
|
EngineClassInstance engine;
|
|
int32_t distance;
|
|
};
|
|
|
|
// Argument bundle passed to IoctlHelper::vmBind / IoctlHelper::vmUnbind.
// Plain aggregate: callers are expected to initialize every field
// (e.g. `VmBindParams params{};`).
struct VmBindParams {
    uint32_t vmId;
    uint32_t handle;
    uint64_t start;
    uint64_t offset;
    uint64_t length;
    uint64_t flags;
    uint64_t extensions;
};
|
|
|
|
// Value returned by IoctlHelper::registerUuid and
// IoctlHelper::registerStringClassUuid.
struct UuidRegisterResult {
    int32_t retVal;  // presumably the ioctl return code - verify against the implementation
    uint32_t handle; // handle of the registered UUID; accepted by unregisterUuid()
};
|
|
|
|
// Small-buffer vector of memory class/instance pairs (inline capacity 5),
// used as the region list argument of createGemExt().
using MemRegionsVec = StackVec<MemoryClassInstance, 5>;
// Raw byte buffers written by fillVmBindExtSetPat() / fillVmBindExtUserFence().
// NOTE(review): sizes presumably match the corresponding kernel extension
// structs - confirm against the uAPI headers.
using VmBindExtSetPatT = uint8_t[40];
using VmBindExtUserFenceT = uint8_t[56];
|
|
|
|
class IoctlHelper {
|
|
public:
|
|
IoctlHelper(Drm &drmArg) : drm(drmArg){};
|
|
virtual ~IoctlHelper() {}
|
|
static std::unique_ptr<IoctlHelper> getI915Helper(const PRODUCT_FAMILY productFamily, const std::string &prelimVersion, Drm &drm);
|
|
virtual int ioctl(DrmIoctl request, void *arg);
|
|
|
|
virtual bool initialize() = 0;
|
|
virtual bool isSetPairAvailable() = 0;
|
|
virtual bool isChunkingAvailable() = 0;
|
|
virtual bool isVmBindAvailable() = 0;
|
|
virtual int createGemExt(const MemRegionsVec &memClassInstances, size_t allocSize, uint32_t &handle, uint64_t patIndex, std::optional<uint32_t> vmId, int32_t pairHandle, bool isChunked, uint32_t numOfChunks) = 0;
|
|
virtual CacheRegion closAlloc() = 0;
|
|
virtual uint16_t closAllocWays(CacheRegion closIndex, uint16_t cacheLevel, uint16_t numWays) = 0;
|
|
virtual CacheRegion closFree(CacheRegion closIndex) = 0;
|
|
virtual int waitUserFence(uint32_t ctxId, uint64_t address,
|
|
uint64_t value, uint32_t dataWidth, int64_t timeout, uint16_t flags) = 0;
|
|
virtual uint32_t getAtomicAdvise(bool isNonAtomic) = 0;
|
|
virtual uint32_t getPreferredLocationAdvise() = 0;
|
|
virtual std::optional<MemoryClassInstance> getPreferredLocationRegion(PreferredLocation memoryLocation, uint32_t memoryInstance) = 0;
|
|
virtual bool setVmBoAdvise(int32_t handle, uint32_t attribute, void *region) = 0;
|
|
virtual bool setVmBoAdviseForChunking(int32_t handle, uint64_t start, uint64_t length, uint32_t attribute, void *region) = 0;
|
|
virtual bool setVmPrefetch(uint64_t start, uint64_t length, uint32_t region, uint32_t vmId) = 0;
|
|
virtual uint32_t getDirectSubmissionFlag() = 0;
|
|
virtual std::unique_ptr<uint8_t[]> prepareVmBindExt(const StackVec<uint32_t, 2> &bindExtHandles) = 0;
|
|
virtual uint64_t getFlagsForVmBind(bool bindCapture, bool bindImmediate, bool bindMakeResident) = 0;
|
|
virtual int queryDistances(std::vector<QueryItem> &queryItems, std::vector<DistanceInfo> &distanceInfos) = 0;
|
|
virtual uint16_t getWaitUserFenceSoftFlag() = 0;
|
|
virtual int execBuffer(ExecBuffer *execBuffer, uint64_t completionGpuAddress, TaskCountType counterValue) = 0;
|
|
virtual bool completionFenceExtensionSupported(const bool isVmBindAvailable) = 0;
|
|
virtual std::optional<DrmParam> getHasPageFaultParamId() = 0;
|
|
virtual std::unique_ptr<uint8_t[]> createVmControlExtRegion(const std::optional<MemoryClassInstance> ®ionInstanceClass) = 0;
|
|
virtual uint32_t getFlagsForVmCreate(bool disableScratch, bool enablePageFault, bool useVmBind) = 0;
|
|
virtual uint32_t createContextWithAccessCounters(GemContextCreateExt &gcc) = 0;
|
|
virtual uint32_t createCooperativeContext(GemContextCreateExt &gcc) = 0;
|
|
virtual void fillVmBindExtSetPat(VmBindExtSetPatT &vmBindExtSetPat, uint64_t patIndex, uint64_t nextExtension) = 0;
|
|
virtual void fillVmBindExtUserFence(VmBindExtUserFenceT &vmBindExtUserFence, uint64_t fenceAddress, uint64_t fenceValue, uint64_t nextExtension) = 0;
|
|
virtual std::optional<uint64_t> getCopyClassSaturatePCIECapability() = 0;
|
|
virtual std::optional<uint64_t> getCopyClassSaturateLinkCapability() = 0;
|
|
virtual uint32_t getVmAdviseAtomicAttribute() = 0;
|
|
virtual int vmBind(const VmBindParams &vmBindParams) = 0;
|
|
virtual int vmUnbind(const VmBindParams &vmBindParams) = 0;
|
|
virtual bool getEuStallProperties(std::array<uint64_t, 12u> &properties, uint64_t dssBufferSize,
|
|
uint64_t samplingRate, uint64_t pollPeriod, uint64_t engineInstance, uint64_t notifyNReports) = 0;
|
|
virtual uint32_t getEuStallFdParameter() = 0;
|
|
virtual UuidRegisterResult registerUuid(const std::string &uuid, uint32_t uuidClass, uint64_t ptr, uint64_t size) = 0;
|
|
virtual UuidRegisterResult registerStringClassUuid(const std::string &uuid, uint64_t ptr, uint64_t size) = 0;
|
|
virtual int unregisterUuid(uint32_t handle) = 0;
|
|
virtual bool isContextDebugSupported() = 0;
|
|
virtual int setContextDebugFlag(uint32_t drmContextId) = 0;
|
|
virtual bool isDebugAttachAvailable() = 0;
|
|
virtual unsigned int getIoctlRequestValue(DrmIoctl ioctlRequest) const = 0;
|
|
virtual int getDrmParamValue(DrmParam drmParam) const = 0;
|
|
virtual std::string getDrmParamString(DrmParam param) const = 0;
|
|
virtual std::string getIoctlString(DrmIoctl ioctlRequest) const = 0;
|
|
|
|
virtual bool checkIfIoctlReinvokeRequired(int error, DrmIoctl ioctlRequest) const;
|
|
virtual std::vector<MemoryRegion> translateToMemoryRegions(const std::vector<uint8_t> ®ionInfo);
|
|
|
|
virtual int createDrmContext(Drm &drm, OsContextLinux &osContext, uint32_t drmVmId, uint32_t deviceIndex);
|
|
std::vector<EngineCapabilities> translateToEngineCaps(const std::vector<uint8_t> &data);
|
|
|
|
void fillExecObject(ExecObject &execObject, uint32_t handle, uint64_t gpuAddress, uint32_t drmContextId, bool bindInfo, bool isMarkedForCapture);
|
|
void logExecObject(const ExecObject &execObject, std::stringstream &logger, size_t size);
|
|
|
|
void fillExecBuffer(ExecBuffer &execBuffer, uintptr_t buffersPtr, uint32_t bufferCount, uint32_t startOffset, uint32_t size, uint64_t flags, uint32_t drmContextId);
|
|
void logExecBuffer(const ExecBuffer &execBuffer, std::stringstream &logger);
|
|
virtual int getDrmParamValueBase(DrmParam drmParam) const;
|
|
unsigned int getIoctlRequestValueBase(DrmIoctl ioctlRequest) const;
|
|
bool setDomainCpu(uint32_t handle, bool writeEnable);
|
|
|
|
std::string getDrmParamStringBase(DrmParam param) const;
|
|
std::string getIoctlStringBase(DrmIoctl ioctlRequest) const;
|
|
virtual std::string getFileForMaxGpuFrequency() const;
|
|
virtual std::string getFileForMaxGpuFrequencyOfSubDevice(int subDeviceId) const;
|
|
virtual std::string getFileForMaxMemoryFrequencyOfSubDevice(int subDeviceId) const;
|
|
virtual std::string getFileForMemoryAddrRange(int subdeviceId) const;
|
|
virtual bool getFabricLatency(uint32_t fabricId, uint32_t &latency, uint32_t &bandwidth) = 0;
|
|
virtual bool isWaitBeforeBindRequired(bool bind) const = 0;
|
|
virtual void *pciBarrierMmap() { return nullptr; };
|
|
virtual void setupIpVersion();
|
|
|
|
uint32_t getFlagsForPrimeHandleToFd() const;
|
|
virtual std::unique_ptr<MemoryInfo> createMemoryInfo();
|
|
virtual std::unique_ptr<EngineInfo> createEngineInfo(bool isSysmanEnabled);
|
|
virtual bool getTopologyDataAndMap(const HardwareInfo &hwInfo, DrmQueryTopologyData &topologyData, TopologyMap &topologyMap);
|
|
bool translateTopologyInfo(const QueryTopologyInfo *queryTopologyInfo, DrmQueryTopologyData &topologyData, TopologyMapping &mapping);
|
|
|
|
protected:
|
|
Drm &drm;
|
|
};
|
|
|
|
class IoctlHelperUpstream : public IoctlHelper {
|
|
public:
|
|
using IoctlHelper::IoctlHelper;
|
|
|
|
bool initialize() override;
|
|
bool isSetPairAvailable() override;
|
|
bool isChunkingAvailable() override;
|
|
bool isVmBindAvailable() override;
|
|
int createGemExt(const MemRegionsVec &memClassInstances, size_t allocSize, uint32_t &handle, uint64_t patIndex, std::optional<uint32_t> vmId, int32_t pairHandle, bool isChunked, uint32_t numOfChunks) override;
|
|
CacheRegion closAlloc() override;
|
|
uint16_t closAllocWays(CacheRegion closIndex, uint16_t cacheLevel, uint16_t numWays) override;
|
|
CacheRegion closFree(CacheRegion closIndex) override;
|
|
int waitUserFence(uint32_t ctxId, uint64_t address,
|
|
uint64_t value, uint32_t dataWidth, int64_t timeout, uint16_t flags) override;
|
|
uint32_t getAtomicAdvise(bool isNonAtomic) override;
|
|
uint32_t getPreferredLocationAdvise() override;
|
|
std::optional<MemoryClassInstance> getPreferredLocationRegion(PreferredLocation memoryLocation, uint32_t memoryInstance) override;
|
|
bool setVmBoAdvise(int32_t handle, uint32_t attribute, void *region) override;
|
|
bool setVmBoAdviseForChunking(int32_t handle, uint64_t start, uint64_t length, uint32_t attribute, void *region) override;
|
|
bool setVmPrefetch(uint64_t start, uint64_t length, uint32_t region, uint32_t vmId) override;
|
|
uint32_t getDirectSubmissionFlag() override;
|
|
std::unique_ptr<uint8_t[]> prepareVmBindExt(const StackVec<uint32_t, 2> &bindExtHandles) override;
|
|
uint64_t getFlagsForVmBind(bool bindCapture, bool bindImmediate, bool bindMakeResident) override;
|
|
int queryDistances(std::vector<QueryItem> &queryItems, std::vector<DistanceInfo> &distanceInfos) override;
|
|
uint16_t getWaitUserFenceSoftFlag() override;
|
|
int execBuffer(ExecBuffer *execBuffer, uint64_t completionGpuAddress, TaskCountType counterValue) override;
|
|
bool completionFenceExtensionSupported(const bool isVmBindAvailable) override;
|
|
std::optional<DrmParam> getHasPageFaultParamId() override;
|
|
std::unique_ptr<uint8_t[]> createVmControlExtRegion(const std::optional<MemoryClassInstance> ®ionInstanceClass) override;
|
|
uint32_t getFlagsForVmCreate(bool disableScratch, bool enablePageFault, bool useVmBind) override;
|
|
uint32_t createContextWithAccessCounters(GemContextCreateExt &gcc) override;
|
|
uint32_t createCooperativeContext(GemContextCreateExt &gcc) override;
|
|
void fillVmBindExtSetPat(VmBindExtSetPatT &vmBindExtSetPat, uint64_t patIndex, uint64_t nextExtension) override;
|
|
void fillVmBindExtUserFence(VmBindExtUserFenceT &vmBindExtUserFence, uint64_t fenceAddress, uint64_t fenceValue, uint64_t nextExtension) override;
|
|
std::optional<uint64_t> getCopyClassSaturatePCIECapability() override;
|
|
std::optional<uint64_t> getCopyClassSaturateLinkCapability() override;
|
|
uint32_t getVmAdviseAtomicAttribute() override;
|
|
int vmBind(const VmBindParams &vmBindParams) override;
|
|
int vmUnbind(const VmBindParams &vmBindParams) override;
|
|
bool getEuStallProperties(std::array<uint64_t, 12u> &properties, uint64_t dssBufferSize, uint64_t samplingRate,
|
|
uint64_t pollPeriod, uint64_t engineInstance, uint64_t notifyNReports) override;
|
|
uint32_t getEuStallFdParameter() override;
|
|
UuidRegisterResult registerUuid(const std::string &uuid, uint32_t uuidClass, uint64_t ptr, uint64_t size) override;
|
|
UuidRegisterResult registerStringClassUuid(const std::string &uuid, uint64_t ptr, uint64_t size) override;
|
|
int unregisterUuid(uint32_t handle) override;
|
|
bool isContextDebugSupported() override;
|
|
int setContextDebugFlag(uint32_t drmContextId) override;
|
|
bool isDebugAttachAvailable() override;
|
|
unsigned int getIoctlRequestValue(DrmIoctl ioctlRequest) const override;
|
|
int getDrmParamValue(DrmParam drmParam) const override;
|
|
std::string getDrmParamString(DrmParam param) const override;
|
|
std::string getIoctlString(DrmIoctl ioctlRequest) const override;
|
|
bool getFabricLatency(uint32_t fabricId, uint32_t &latency, uint32_t &bandwidth) override;
|
|
bool isWaitBeforeBindRequired(bool bind) const override;
|
|
|
|
protected:
|
|
MOCKABLE_VIRTUAL void detectExtSetPatSupport();
|
|
bool isSetPatSupported = false;
|
|
};
|
|
|
|
template <PRODUCT_FAMILY gfxProduct>
|
|
class IoctlHelperImpl : public IoctlHelperUpstream {
|
|
public:
|
|
using IoctlHelperUpstream::IoctlHelperUpstream;
|
|
static std::unique_ptr<IoctlHelper> get(Drm &drm) {
|
|
return std::make_unique<IoctlHelperImpl<gfxProduct>>(drm);
|
|
}
|
|
|
|
int createGemExt(const MemRegionsVec &memClassInstances, size_t allocSize, uint32_t &handle, uint64_t patIndex, std::optional<uint32_t> vmId, int32_t pairHandle, bool isChunked, uint32_t numOfChunks) override;
|
|
std::vector<MemoryRegion> translateToMemoryRegions(const std::vector<uint8_t> ®ionInfo) override;
|
|
unsigned int getIoctlRequestValue(DrmIoctl ioctlRequest) const override;
|
|
std::string getIoctlString(DrmIoctl ioctlRequest) const override;
|
|
};
|
|
|
|
class IoctlHelperPrelim20 : public IoctlHelper {
|
|
public:
|
|
IoctlHelperPrelim20(Drm &drmArg);
|
|
|
|
bool initialize() override;
|
|
bool isSetPairAvailable() override;
|
|
bool isChunkingAvailable() override;
|
|
bool isVmBindAvailable() override;
|
|
int createGemExt(const MemRegionsVec &memClassInstances, size_t allocSize, uint32_t &handle, uint64_t patIndex, std::optional<uint32_t> vmId, int32_t pairHandle, bool isChunked, uint32_t numOfChunks) override;
|
|
CacheRegion closAlloc() override;
|
|
uint16_t closAllocWays(CacheRegion closIndex, uint16_t cacheLevel, uint16_t numWays) override;
|
|
CacheRegion closFree(CacheRegion closIndex) override;
|
|
int waitUserFence(uint32_t ctxId, uint64_t address,
|
|
uint64_t value, uint32_t dataWidth, int64_t timeout, uint16_t flags) override;
|
|
uint32_t getAtomicAdvise(bool isNonAtomic) override;
|
|
uint32_t getPreferredLocationAdvise() override;
|
|
std::optional<MemoryClassInstance> getPreferredLocationRegion(PreferredLocation memoryLocation, uint32_t memoryInstance) override;
|
|
bool setVmBoAdvise(int32_t handle, uint32_t attribute, void *region) override;
|
|
bool setVmBoAdviseForChunking(int32_t handle, uint64_t start, uint64_t length, uint32_t attribute, void *region) override;
|
|
bool setVmPrefetch(uint64_t start, uint64_t length, uint32_t region, uint32_t vmId) override;
|
|
uint32_t getDirectSubmissionFlag() override;
|
|
std::unique_ptr<uint8_t[]> prepareVmBindExt(const StackVec<uint32_t, 2> &bindExtHandles) override;
|
|
uint64_t getFlagsForVmBind(bool bindCapture, bool bindImmediate, bool bindMakeResident) override;
|
|
int queryDistances(std::vector<QueryItem> &queryItems, std::vector<DistanceInfo> &distanceInfos) override;
|
|
uint16_t getWaitUserFenceSoftFlag() override;
|
|
int execBuffer(ExecBuffer *execBuffer, uint64_t completionGpuAddress, TaskCountType counterValue) override;
|
|
bool completionFenceExtensionSupported(const bool isVmBindAvailable) override;
|
|
std::optional<DrmParam> getHasPageFaultParamId() override;
|
|
std::unique_ptr<uint8_t[]> createVmControlExtRegion(const std::optional<MemoryClassInstance> ®ionInstanceClass) override;
|
|
uint32_t getFlagsForVmCreate(bool disableScratch, bool enablePageFault, bool useVmBind) override;
|
|
uint32_t createContextWithAccessCounters(GemContextCreateExt &gcc) override;
|
|
uint32_t createCooperativeContext(GemContextCreateExt &gcc) override;
|
|
void fillVmBindExtSetPat(VmBindExtSetPatT &vmBindExtSetPat, uint64_t patIndex, uint64_t nextExtension) override;
|
|
void fillVmBindExtUserFence(VmBindExtUserFenceT &vmBindExtUserFence, uint64_t fenceAddress, uint64_t fenceValue, uint64_t nextExtension) override;
|
|
std::optional<uint64_t> getCopyClassSaturatePCIECapability() override;
|
|
std::optional<uint64_t> getCopyClassSaturateLinkCapability() override;
|
|
uint32_t getVmAdviseAtomicAttribute() override;
|
|
int vmBind(const VmBindParams &vmBindParams) override;
|
|
int vmUnbind(const VmBindParams &vmBindParams) override;
|
|
bool getEuStallProperties(std::array<uint64_t, 12u> &properties, uint64_t dssBufferSize, uint64_t samplingRate,
|
|
uint64_t pollPeriod, uint64_t engineInstance, uint64_t notifyNReports) override;
|
|
uint32_t getEuStallFdParameter() override;
|
|
UuidRegisterResult registerUuid(const std::string &uuid, uint32_t uuidClass, uint64_t ptr, uint64_t size) override;
|
|
UuidRegisterResult registerStringClassUuid(const std::string &uuid, uint64_t ptr, uint64_t size) override;
|
|
int unregisterUuid(uint32_t handle) override;
|
|
bool isContextDebugSupported() override;
|
|
int setContextDebugFlag(uint32_t drmContextId) override;
|
|
bool isDebugAttachAvailable() override;
|
|
unsigned int getIoctlRequestValue(DrmIoctl ioctlRequest) const override;
|
|
int getDrmParamValue(DrmParam drmParam) const override;
|
|
std::string getDrmParamString(DrmParam param) const override;
|
|
std::string getIoctlString(DrmIoctl ioctlRequest) const override;
|
|
bool checkIfIoctlReinvokeRequired(int error, DrmIoctl ioctlRequest) const override;
|
|
bool getFabricLatency(uint32_t fabricId, uint32_t &latency, uint32_t &bandwidth) override;
|
|
bool isWaitBeforeBindRequired(bool bind) const override;
|
|
void *pciBarrierMmap() override;
|
|
void setupIpVersion() override;
|
|
bool getTopologyDataAndMap(const HardwareInfo &hwInfo, DrmQueryTopologyData &topologyData, TopologyMap &topologyMap) override;
|
|
|
|
protected:
|
|
bool queryHwIpVersion(EngineClassInstance &engineInfo, HardwareIpVersion &ipVersion, int &ret);
|
|
|
|
bool handleExecBufferInNonBlockMode = false;
|
|
};
|
|
|
|
} // namespace NEO
|