208 lines
8.6 KiB
C++
208 lines
8.6 KiB
C++
/*
|
|
* Copyright (C) 2017-2019 Intel Corporation
|
|
*
|
|
* SPDX-License-Identifier: MIT
|
|
*
|
|
*/
|
|
|
|
#pragma once
|
|
#include "runtime/built_ins/sip.h"
|
|
#include "runtime/command_stream/linear_stream.h"
|
|
#include "runtime/gen_common/aub_mapper.h"
|
|
#include "runtime/gen_common/hw_cmds.h"
|
|
|
|
#include "CL/cl.h"
|
|
|
|
#include <cstdint>
|
|
#include <type_traits>
|
|
|
|
namespace OCLRT {
|
|
class ExecutionEnvironment;
|
|
class GraphicsAllocation;
|
|
struct HardwareCapabilities;
|
|
|
|
class HwHelper {
|
|
public:
|
|
static HwHelper &get(GFXCORE_FAMILY gfxCore);
|
|
virtual uint32_t getBindingTableStateSurfaceStatePointer(void *pBindingTable, uint32_t index) = 0;
|
|
virtual size_t getBindingTableStateSize() const = 0;
|
|
virtual uint32_t getBindingTableStateAlignement() const = 0;
|
|
virtual size_t getInterfaceDescriptorDataSize() const = 0;
|
|
virtual size_t getMaxBarrierRegisterPerSlice() const = 0;
|
|
virtual uint32_t getComputeUnitsUsedForScratch(const HardwareInfo *pHwInfo) const = 0;
|
|
virtual void setCapabilityCoherencyFlag(const HardwareInfo *pHwInfo, bool &coherencyFlag) = 0;
|
|
virtual bool setupPreemptionRegisters(HardwareInfo *pHwInfo, bool enable) = 0;
|
|
virtual void adjustDefaultEngineType(HardwareInfo *pHwInfo) = 0;
|
|
virtual void setupHardwareCapabilities(HardwareCapabilities *caps, const HardwareInfo &hwInfo) = 0;
|
|
virtual SipKernelType getSipKernelType(bool debuggingActive) = 0;
|
|
virtual uint32_t getConfigureAddressSpaceMode() = 0;
|
|
virtual bool isLocalMemoryEnabled(const HardwareInfo &hwInfo) const = 0;
|
|
virtual bool isPageTableManagerSupported(const HardwareInfo &hwInfo) const = 0;
|
|
virtual const AubMemDump::LrcaHelper &getCsTraits(EngineInstanceT engineInstance) const = 0;
|
|
virtual bool supportsYTiling() const = 0;
|
|
virtual bool obtainRenderBufferCompressionPreference(const HardwareInfo &hwInfo) const = 0;
|
|
static bool renderCompressedBuffersSupported(const HardwareInfo &hwInfo);
|
|
static bool renderCompressedImagesSupported(const HardwareInfo &hwInfo);
|
|
static bool cacheFlushAfterWalkerSupported(const HardwareInfo &hwInfo);
|
|
virtual bool timestampPacketWriteSupported() const = 0;
|
|
virtual size_t getRenderSurfaceStateSize() const = 0;
|
|
virtual void setRenderSurfaceStateForBuffer(ExecutionEnvironment &executionEnvironment,
|
|
void *surfaceStateBuffer,
|
|
size_t bufferSize,
|
|
uint64_t gpuVa,
|
|
size_t offset,
|
|
uint32_t pitch,
|
|
GraphicsAllocation *gfxAlloc,
|
|
cl_mem_flags flags,
|
|
uint32_t surfaceType,
|
|
bool forceNonAuxMode) = 0;
|
|
virtual size_t getScratchSpaceOffsetFor64bit() = 0;
|
|
virtual const std::vector<EngineInstanceT> getGpgpuEngineInstances() const = 0;
|
|
virtual bool getEnableLocalMemory(const HardwareInfo &hwInfo) const = 0;
|
|
|
|
protected:
|
|
HwHelper() = default;
|
|
};
|
|
|
|
template <typename GfxFamily>
|
|
class HwHelperHw : public HwHelper {
|
|
public:
|
|
static HwHelper &get() {
|
|
static HwHelperHw<GfxFamily> hwHelper;
|
|
return hwHelper;
|
|
}
|
|
|
|
uint32_t getBindingTableStateSurfaceStatePointer(void *pBindingTable, uint32_t index) override {
|
|
using BINDING_TABLE_STATE = typename GfxFamily::BINDING_TABLE_STATE;
|
|
|
|
BINDING_TABLE_STATE *bindingTableState = static_cast<BINDING_TABLE_STATE *>(pBindingTable);
|
|
return bindingTableState[index].getRawData(0);
|
|
}
|
|
|
|
size_t getBindingTableStateSize() const override {
|
|
using BINDING_TABLE_STATE = typename GfxFamily::BINDING_TABLE_STATE;
|
|
return sizeof(BINDING_TABLE_STATE);
|
|
}
|
|
|
|
uint32_t getBindingTableStateAlignement() const override {
|
|
using BINDING_TABLE_STATE = typename GfxFamily::BINDING_TABLE_STATE;
|
|
return BINDING_TABLE_STATE::SURFACESTATEPOINTER_ALIGN_SIZE;
|
|
}
|
|
|
|
size_t getInterfaceDescriptorDataSize() const override {
|
|
using INTERFACE_DESCRIPTOR_DATA = typename GfxFamily::INTERFACE_DESCRIPTOR_DATA;
|
|
return sizeof(INTERFACE_DESCRIPTOR_DATA);
|
|
}
|
|
|
|
size_t getRenderSurfaceStateSize() const override {
|
|
using RENDER_SURFACE_STATE = typename GfxFamily::RENDER_SURFACE_STATE;
|
|
return sizeof(RENDER_SURFACE_STATE);
|
|
}
|
|
|
|
const AubMemDump::LrcaHelper &getCsTraits(EngineInstanceT engineInstance) const override;
|
|
|
|
size_t getMaxBarrierRegisterPerSlice() const override;
|
|
|
|
uint32_t getComputeUnitsUsedForScratch(const HardwareInfo *pHwInfo) const override;
|
|
|
|
void setCapabilityCoherencyFlag(const HardwareInfo *pHwInfo, bool &coherencyFlag) override;
|
|
|
|
bool setupPreemptionRegisters(HardwareInfo *pHwInfo, bool enable) override;
|
|
|
|
void adjustDefaultEngineType(HardwareInfo *pHwInfo) override;
|
|
|
|
void setupHardwareCapabilities(HardwareCapabilities *caps, const HardwareInfo &hwInfo) override;
|
|
|
|
SipKernelType getSipKernelType(bool debuggingActive) override;
|
|
|
|
uint32_t getConfigureAddressSpaceMode() override;
|
|
|
|
bool isLocalMemoryEnabled(const HardwareInfo &hwInfo) const override;
|
|
|
|
bool supportsYTiling() const override;
|
|
|
|
bool obtainRenderBufferCompressionPreference(const HardwareInfo &hwInfo) const override;
|
|
|
|
bool timestampPacketWriteSupported() const override;
|
|
|
|
bool isPageTableManagerSupported(const HardwareInfo &hwInfo) const override;
|
|
|
|
void setRenderSurfaceStateForBuffer(ExecutionEnvironment &executionEnvironment,
|
|
void *surfaceStateBuffer,
|
|
size_t bufferSize,
|
|
uint64_t gpuVa,
|
|
size_t offset,
|
|
uint32_t pitch,
|
|
GraphicsAllocation *gfxAlloc,
|
|
cl_mem_flags flags,
|
|
uint32_t surfaceType,
|
|
bool forceNonAuxMode) override;
|
|
|
|
size_t getScratchSpaceOffsetFor64bit() override;
|
|
|
|
const std::vector<EngineInstanceT> getGpgpuEngineInstances() const override;
|
|
|
|
bool getEnableLocalMemory(const HardwareInfo &hwInfo) const override;
|
|
|
|
protected:
|
|
HwHelperHw() = default;
|
|
};
|
|
|
|
struct DwordBuilder {
|
|
static uint32_t build(uint32_t bitNumberToSet, bool masked, bool set = true, uint32_t initValue = 0) {
|
|
uint32_t dword = initValue;
|
|
if (set) {
|
|
dword |= (1 << bitNumberToSet);
|
|
}
|
|
if (masked) {
|
|
dword |= (1 << (bitNumberToSet + 16));
|
|
}
|
|
return dword;
|
|
};
|
|
};
|
|
|
|
template <typename GfxFamily>
|
|
struct LriHelper {
|
|
using MI_LOAD_REGISTER_IMM = typename GfxFamily::MI_LOAD_REGISTER_IMM;
|
|
|
|
static MI_LOAD_REGISTER_IMM *program(LinearStream *cmdStream, uint32_t address, uint32_t value) {
|
|
auto lri = (MI_LOAD_REGISTER_IMM *)cmdStream->getSpace(sizeof(MI_LOAD_REGISTER_IMM));
|
|
*lri = GfxFamily::cmdInitLoadRegisterImm;
|
|
lri->setRegisterOffset(address);
|
|
lri->setDataDword(value);
|
|
return lri;
|
|
}
|
|
};
|
|
|
|
template <typename GfxFamily>
|
|
struct PipeControlHelper {
|
|
using PIPE_CONTROL = typename GfxFamily::PIPE_CONTROL;
|
|
using POST_SYNC_OPERATION = typename GfxFamily::PIPE_CONTROL::POST_SYNC_OPERATION;
|
|
static PIPE_CONTROL *obtainPipeControlAndProgramPostSyncOperation(LinearStream *commandStream,
|
|
POST_SYNC_OPERATION operation,
|
|
uint64_t gpuAddress,
|
|
uint64_t immediateData) {
|
|
auto pipeControl = reinterpret_cast<PIPE_CONTROL *>(commandStream->getSpace(sizeof(PIPE_CONTROL)));
|
|
*pipeControl = GfxFamily::cmdInitPipeControl;
|
|
pipeControl->setCommandStreamerStallEnable(true);
|
|
pipeControl->setPostSyncOperation(operation);
|
|
pipeControl->setAddress(static_cast<uint32_t>(gpuAddress & 0x0000FFFFFFFFULL));
|
|
pipeControl->setAddressHigh(static_cast<uint32_t>(gpuAddress >> 32));
|
|
if (operation == POST_SYNC_OPERATION::POST_SYNC_OPERATION_WRITE_IMMEDIATE_DATA) {
|
|
pipeControl->setImmediateData(immediateData);
|
|
}
|
|
return pipeControl;
|
|
}
|
|
};
|
|
|
|
union SURFACE_STATE_BUFFER_LENGTH {
|
|
uint32_t Length;
|
|
struct SurfaceState {
|
|
uint32_t Width : BITFIELD_RANGE(0, 6);
|
|
uint32_t Height : BITFIELD_RANGE(7, 20);
|
|
uint32_t Depth : BITFIELD_RANGE(21, 31);
|
|
} SurfaceState;
|
|
};
|
|
|
|
} // namespace OCLRT
|