Files
intel-graphics-compiler/IGC/LLVM3DBuilder/BuiltinsFrontend.hpp
mkarigan 44fe17526d Add support for DG2 256
Add support for DG2 256
2022-03-30 06:46:42 +02:00

865 lines
29 KiB
C++

/*========================== begin_copyright_notice ============================
Copyright (C) 2017-2021 Intel Corporation
SPDX-License-Identifier: MIT
============================= end_copyright_notice ===========================*/
#ifndef _BUILTINSFRONTEND_H_
#define _BUILTINSFRONTEND_H_
#include "common/LLVMWarningsPush.hpp"
#include <llvm/IR/Module.h>
#include <llvm/IR/LLVMContext.h>
#include <llvm/IR/Constants.h>
#include <llvm/IR/Intrinsics.h>
#include <llvm/Support/MemoryBuffer.h>
#include <llvm/Support/SourceMgr.h>
#include <llvm/AsmParser/Parser.h>
#include "common/LLVMWarningsPop.hpp"
#include "Compiler/CodeGenPublicEnums.h"
#include "inc/common/Compiler/API/SurfaceFormats.h"
#include "inc/common/igfxfmid.h"
#include "common/IGCIRBuilder.h"
#include "../common/EmUtils.h"
#include "../../../skuwa/iacm_g10_rev_id.h"
#include "../../../skuwa/iacm_g11_rev_id.h"
#include "../../../skuwa/iacm_g12_rev_id.h"
struct genplatform
{
private:
const PLATFORM* m_platformInfo;
public:
genplatform(const PLATFORM* platform) { m_platformInfo = platform; }
genplatform() {}
GFXCORE_FAMILY GetPlatformFamily() const { return m_platformInfo->eRenderCoreFamily; }
bool hasHDCSupportForTypedReads() const { return m_platformInfo->eRenderCoreFamily >= IGFX_GEN10_CORE; }
bool hasHDCSupportForTypedReadsUnormSnormToFloatConversion() const;
bool hasSupportForAllOCLImageFormats() const;
};
inline bool genplatform::hasHDCSupportForTypedReadsUnormSnormToFloatConversion() const
{
return m_platformInfo->eRenderCoreFamily >= IGFX_GEN10_CORE;
}
inline bool genplatform::hasSupportForAllOCLImageFormats() const
{
bool isDG2B0Plus = SI_WA_FROM(m_platformInfo->usRevId, ACM_G10_GT_REV_ID_B0);
bool isDG2C0Plus = SI_WA_FROM(m_platformInfo->usRevId, ACM_G10_GT_REV_ID_C0);
bool isDG2G11EUConfig = GFX_IS_DG2_G11_CONFIG(m_platformInfo->usDeviceID);
bool isDG2G12EUConfig = GFX_IS_DG2_G12_CONFIG(m_platformInfo->usDeviceID);
if ((m_platformInfo->eProductFamily == IGFX_DG2 && isDG2C0Plus) ||
(m_platformInfo->eProductFamily == IGFX_DG2 && isDG2G11EUConfig && isDG2B0Plus))
{
return true;
}
return m_platformInfo->eRenderCoreFamily >= IGFX_XE_HPC_CORE;
}
class SampleParamsFromCube
{
public:
llvm::Value* float_xcube;
llvm::Value* float_ycube;
llvm::Value* float_aicube;
llvm::Value* float_address_3;
llvm::Value* int32_textureIdx;
llvm::Value* int32_sampler;
llvm::Value* offsetU;
llvm::Value* offsetV;
llvm::Value* offsetR;
llvm::Value* get_float_xcube() { return float_xcube; }
llvm::Value* get_float_ycube() { return float_ycube; }
llvm::Value* get_float_aicube() { return float_aicube; }
llvm::Value* get_float_address_3() { return float_address_3; }
llvm::Value* get_int32_textureIdx() { return int32_textureIdx; }
llvm::Value* get_int32_sampler() { return int32_sampler; }
llvm::Value* get_offsetU() { return offsetU; }
llvm::Value* get_offsetV() { return offsetV; }
llvm::Value* get_offsetR() { return offsetR; }
void operator=(const SampleParamsFromCube &CUBE_params)
{
float_xcube = CUBE_params.float_xcube;
float_ycube = CUBE_params.float_ycube;
float_aicube = CUBE_params.float_aicube;
float_address_3 = CUBE_params.float_address_3;
int32_textureIdx = CUBE_params.int32_textureIdx;
int32_sampler = CUBE_params.int32_sampler;
offsetU = CUBE_params.offsetU;
offsetV = CUBE_params.offsetV;
offsetR = CUBE_params.offsetR;
}
};
class SampleD_DC_FromCubeParams
{
public:
llvm::Value* float_src_u;
llvm::Value* dxu;
llvm::Value* dyu;
llvm::Value* float_src_v;
llvm::Value* dxv;
llvm::Value* dyv;
llvm::Value* float_src_r;
llvm::Value* dxr;
llvm::Value* dyr;
llvm::Value* float_src_ai;
llvm::Value* int32_textureIdx;
llvm::Value* int32_sampler;
llvm::Value* int32_offsetU;
llvm::Value* int32_offsetV;
llvm::Value* int32_offsetW;
llvm::Value* get_float_src_u() { return float_src_u; }
llvm::Value* get_dxu() { return dxu; }
llvm::Value* get_dyu() { return dyu; }
llvm::Value* get_float_src_v() { return float_src_v; }
llvm::Value* get_dxv() { return dxv; }
llvm::Value* get_dyv() { return dyv; }
llvm::Value* get_float_src_r() { return float_src_r; }
llvm::Value* get_dxr() { return dxr; }
llvm::Value* get_dyr() { return dyr; }
llvm::Value* get_float_src_ai() { return float_src_ai; }
llvm::Value* get_int32_textureIdx() { return int32_textureIdx; }
llvm::Value* get_int32_sampler() { return int32_sampler; }
llvm::Value* get_int32_offsetU() { return int32_offsetU; }
llvm::Value* get_int32_offsetV() { return int32_offsetV; }
llvm::Value* get_int32_offsetW() { return int32_offsetW; }
void operator=(const SampleD_DC_FromCubeParams &D_DC_CUBE_params)
{
float_src_u = D_DC_CUBE_params.float_src_u;
dxu = D_DC_CUBE_params.dxu;
dyu = D_DC_CUBE_params.dyu;
float_src_v = D_DC_CUBE_params.float_src_v;
dxv = D_DC_CUBE_params.dxv;
dyv = D_DC_CUBE_params.dyv;
float_src_r = D_DC_CUBE_params.float_src_r;
dxr = D_DC_CUBE_params.dxr;
dyr = D_DC_CUBE_params.dyr;
float_src_ai = D_DC_CUBE_params.float_src_ai;
int32_textureIdx = D_DC_CUBE_params.int32_textureIdx;
int32_sampler = D_DC_CUBE_params.int32_sampler;
int32_offsetU = D_DC_CUBE_params.int32_offsetU;
int32_offsetV = D_DC_CUBE_params.int32_offsetV;
int32_offsetW = D_DC_CUBE_params.int32_offsetW;
}
};
template<bool preserveNames = true, typename T = llvm::ConstantFolder,
typename InserterTyDef() = llvm::IRBuilderDefaultInserter>
class LLVM3DBuilder : public llvm::IGCIRBuilder<T, InserterTyDef()>
{
public:
LLVM3DBuilder(llvm::LLVMContext &pCtx, const PLATFORM &pPlatform)
: llvm::IGCIRBuilder<T, InserterTyDef()>(pCtx),
m_Platform(new genplatform(&pPlatform))
{
Init();
}
~LLVM3DBuilder()
{
if (m_Platform)
{
delete m_Platform;
m_Platform = NULL;
}
}
static unsigned EncodeASForGFXResource(
const llvm::Value& bufIdx,
IGC::BufferType bufType,
unsigned uniqueIndAS);
llvm::Value* CreateFAbs(llvm::Value* V);
llvm::Value* CreateFSat(llvm::Value* V);
llvm::Value* CreateSqrt(llvm::Value* V);
llvm::Value* CreateDiscard(llvm::Value* V);
llvm::Value* CreateFLog(llvm::Value* V);
llvm::Value* CreateFExp(llvm::Value* V);
llvm::Value* CreateFloor(llvm::Value* V);
llvm::Value* CreateCeil(llvm::Value* V);
llvm::Value* CreateRoundZ(llvm::Value* V);
llvm::Value* CreateRoundNE(llvm::Value* V);
llvm::Value* CreateFPow(llvm::Value *LHS, llvm::Value *RHS);
llvm::Value* CreateFMax(llvm::Value *LHS, llvm::Value *RHS);
llvm::Value* CreateFMin(llvm::Value *LHS, llvm::Value *RHS);
llvm::Value* CreateIMulH(llvm::Value* LHS, llvm::Value* RHS);
llvm::Value* CreateUMulH(llvm::Value* LHS, llvm::Value* RHS);
llvm::Value* CreateDeriveRTX(llvm::Value* V);
llvm::Value* CreateDeriveRTX_Fine(llvm::Value* V);
llvm::Value* CreateDeriveRTY(llvm::Value* V);
llvm::Value* CreateDeriveRTY_Fine(llvm::Value* V);
llvm::Value* CreateSin(llvm::Value* V);
llvm::Value* CreateCos(llvm::Value* V);
llvm::Value* CreateIsNan(llvm::Value *V);
llvm::Value* CreateCtpop(llvm::Value* V);
llvm::Value* CreateFrc(llvm::Value* V);
llvm::Value* CreateCPSRqstCoarseSize(
llvm::Value* pSrcVal);
llvm::Value* CreateCPSActualCoarseSize(
llvm::Value* pSrcVal);
llvm::Value* getHalf(float f);
llvm::Value* getFloat(float f);
llvm::Value* getDouble(double d);
llvm::Value* CreatePow(llvm::Value* src0, llvm::Value* src1);
llvm::Value* Create_MAD_Scalar(
llvm::Value* float_src0,
llvm::Value* float_src1,
llvm::Value* float_src2);
llvm::Value* Create_resinfo(
llvm::Value* int32_src_s_mip,
llvm::Value* int32_textureIdx);
llvm::Value* Create_resinfoptr_msaa(
llvm::Value* srcBuffer,
llvm::Value* float_src_s_mip);
llvm::Value* CreateReadSurfaceInfo(llvm::Value* resource, llvm::Value* mimap);
llvm::Value* Create_typedwrite(
llvm::Value* dstBuffer,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* srcAddressW,
llvm::Value* lod,
llvm::Value* float_X,
llvm::Value* float_Y,
llvm::Value* float_Z,
llvm::Value* float_W);
llvm::Value* Create_typedread(
llvm::Value* dstBuffer,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* srcAddressW,
llvm::Value* lod);
llvm::Value* Create_typedread_msaa2D(
llvm::Value* srcBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* lod);
llvm::Value* Create_typedread_msaa2DArray(
llvm::Value* srcBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* srcAddressR,
llvm::Value* lod);
llvm::Value* Create_typedwrite_msaa2D(
llvm::Value* dstBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* float_X,
llvm::Value* float_Y,
llvm::Value* float_Z,
llvm::Value* float_W);
llvm::Value* Create_typedwrite_msaa2DArray(
llvm::Value* dstBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* srcAddressR,
llvm::Value* float_X,
llvm::Value* float_Y,
llvm::Value* float_Z,
llvm::Value* float_W);
llvm::Value* Create_dwordatomictypedMsaa2D(
llvm::Value* dstBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* src,
llvm::Value* instType);
llvm::Value* Create_dwordatomictypedMsaa2DArray(
llvm::Value* dstBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* srcAddressR,
llvm::Value* src,
llvm::Value* instType);
llvm::Value* Create_cmpxchgatomictypedMsaa2D(
llvm::Value* dstBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* src0,
llvm::Value* src1);
llvm::Value* Create_cmpxchgatomictypedMsaa2DArray(
llvm::Value* dstBuffer,
llvm::Value* sampleIdx,
llvm::Value* srcAddressU,
llvm::Value* srcAddressV,
llvm::Value* srcAddressR,
llvm::Value* src0,
llvm::Value* src1);
llvm::Value* Create_StatelessAtomic(
llvm::Value* ptr,
llvm::Value* data,
IGC::AtomicOp opcode);
llvm::Value* Create_InidrectAtomic(
llvm::Value* resource,
llvm::Value* offset,
llvm::Value* data,
IGC::AtomicOp opcode);
llvm::Value* Create_StatelessAtomicCmpXChg(
llvm::Value* ptr,
llvm::Value* data0,
llvm::Value* data1);
llvm::Value* Create_InidrectAtomicCmpXChg(
llvm::Value* resource,
llvm::Value* offset,
llvm::Value* data0,
llvm::Value* data1);
llvm::Value* Create_TypedAtomic(
llvm::Value* resource,
llvm::Value* addressU,
llvm::Value* addressV,
llvm::Value* addressR,
llvm::Value* data,
IGC::AtomicOp opcode);
llvm::Value* Create_TypedAtomicCmpXChg(
llvm::Value* resource,
llvm::Value* addressU,
llvm::Value* addressV,
llvm::Value* addressR,
llvm::Value* data0,
llvm::Value* data1);
llvm::CallInst* Create_SampleInfo(
llvm::Value* int32_resourceIdx);
llvm::Value* Create_SamplePos(
llvm::Value* int32_resourceIdx,
llvm::Value* int32_samplerIdx);
llvm::Value* Create_SyncThreadGroup();
llvm::Value* Create_FlushSampler();
llvm::Value* Create_LscFence(
llvm::Value* SFID,
llvm::Value* FenceOp,
llvm::Value* Scope);
llvm::Value* Create_MemoryFence(
bool commit,
bool flushRWDataCache,
bool flushConstantCache,
bool flushTextureCache,
bool flushInstructionCache,
bool globalFence);
llvm::Value* Create_GlobalSync();
llvm::CallInst* Create_SAMPLE(
llvm::Value* coordinate_u,
llvm::Value* coordinate_v,
llvm::Value* coordinate_r,
llvm::Value* coordinate_ai,
llvm::Value* ptr_textureIdx,
llvm::Value* ptr_sampler,
llvm::Value* offsetU,
llvm::Value* offsetV,
llvm::Value* offsetW,
llvm::Value* minlod,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
SampleParamsFromCube Prepare_SAMPLE_Cube_ParamsFromUnormalizedCoords(
llvm::Value* int32_lod,
llvm::Value* int32_textureIdx,
llvm::Value* int32_u,
llvm::Value* int32_v,
llvm::Value* int32_faceid,
llvm::Value* int32_cube_array_index,
llvm::Value *float_array_6_3,
llvm::Value *int32_sampler);
SampleParamsFromCube Prepare_SAMPLE_Cube_Params(
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler);
llvm::CallInst* Create_SAMPLED(
SampleD_DC_FromCubeParams& sampleParams,
llvm::Value* minlod = nullptr,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_SAMPLED(
llvm::Value* float_src1_s_chan0,
llvm::Value* float_src1_s_chan1,
llvm::Value* float_src1_s_chan2,
llvm::Value* float_src2_s_chan0,
llvm::Value* float_src2_s_chan1,
llvm::Value* float_src2_s_chan2,
llvm::Value* float_src3_s_chan0,
llvm::Value* float_src3_s_chan1,
llvm::Value* float_src3_s_chan2,
llvm::Value* float_src1_s_chan3,
llvm::Value* int32_textureIdx_356,
llvm::Value* int32_sampler_357,
llvm::Value* int32_offsetU_358,
llvm::Value* int32_offsetV_359,
llvm::Value* int32_offsetW_359,
llvm::Value* minlod,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_SAMPLEDC(
llvm::Value* float_ref,
llvm::Value* float_src_u,
llvm::Value* dxu,
llvm::Value* dyu,
llvm::Value* float_src_v,
llvm::Value* dxv,
llvm::Value* dyv,
llvm::Value* float_src_r,
llvm::Value* dxr,
llvm::Value* dyr,
llvm::Value* float_src_ai,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetW,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
SampleD_DC_FromCubeParams Prepare_SAMPLE_D_DC_Cube_Params(SampleD_DC_FromCubeParams& params);
SampleD_DC_FromCubeParams Prepare_SAMPLE_D_DC_Cube_Params(
llvm::Value* float_src_x,
llvm::Value* float_src_y,
llvm::Value* float_src_z,
llvm::Value* float_src_ai,
llvm::Value* dxu,
llvm::Value* dyu,
llvm::Value* dzu,
llvm::Value* dxv,
llvm::Value* dyv,
llvm::Value* dzv,
llvm::Value* int32_textureIdx_356,
llvm::Value* int32_sampler_357,
llvm::Value* int32_offsetU_358,
llvm::Value* int32_offsetV_359,
llvm::Value* int32_offsetW_359);
llvm::CallInst* Create_SAMPLEB(
llvm::Value* float_bias_0,
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetW,
llvm::Value* minlod,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_SAMPLEL(
llvm::Value* float_lod_0,
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetW,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_SAMPLEC(
llvm::Value* float_reference_0,
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetR,
llvm::Value* minlod,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_SAMPLELC(
llvm::Value* float_reference_0,
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* float_lod,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetW,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_SAMPLEC_LZ(
llvm::Value* float_reference_0,
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetW,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_lod(
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx_356,
llvm::Value* int32_sampler_357,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_gather4(
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx_356,
llvm::Value* int32_sampler_357,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetW,
llvm::Value* int32_srcChannel,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_load(
llvm::Value* int32_sampleIdxU,
llvm::Value* int32_sampleIdxV,
llvm::Value* int32_sampleIdxR,
llvm::Value* int32_lod,
llvm::Value* ptr_textureIdx,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetR,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_ldms(
llvm::Value* int32_srcIdxU,
llvm::Value* int32_srcIdxV,
llvm::Value* int32_srcIdxR,
llvm::Value* int32_sampleIdx,
llvm::Value* int32_textureIdx,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetR,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_gather4C(
llvm::Value* float_reference_0,
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_address_3,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_srcChannel,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_gather4PO(
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* float_src_offset_0,
llvm::Value* float_src_offset_1,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_srcChannel,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::CallInst* Create_gather4POC(
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::Value* int_src_offset_0,
llvm::Value* int_src_offset_1,
llvm::Value* float_src_reference_0,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_srcChannel,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::Value* Create_gather4PositionOffsets(
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::ArrayRef<llvm::Value *> int_src_offsets,
llvm::Value* int32_textureIdx_356,
llvm::Value* int32_sampler_357,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_srcChannel,
bool feedback_enabled = false);
llvm::Value* Create_gather4PositionOffsetsC(
llvm::Value* float_reference_0,
llvm::Value* float_address_0,
llvm::Value* float_address_1,
llvm::Value* float_address_2,
llvm::ArrayRef<llvm::Value *> int_src_offsets,
llvm::Value* int32_textureIdx_356,
llvm::Value* int32_sampler_357,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_srcChannel,
bool feedback_enabled = false);
llvm::CallInst* Create_SAMPLEBC(
llvm::Value* float_ref_value,
llvm::Value* bias_value,
llvm::Value* address_u,
llvm::Value* address_v,
llvm::Value* address_r,
llvm::Value* address_ai,
llvm::Value* int32_textureIdx,
llvm::Value* int32_sampler,
llvm::Value* int32_offsetU,
llvm::Value* int32_offsetV,
llvm::Value* int32_offsetW,
bool feedback_enabled = false,
llvm::Type* returnType = nullptr);
llvm::Value* create_indirectLoad(
llvm::Value* srcBuffer,
llvm::Value* offset,
llvm::Value* alignment,
llvm::Type* returnType,
bool isVolatile = false);
llvm::Value* create_indirectStore(
llvm::Value* srcBuffer,
llvm::Value* offset,
llvm::Value* data,
bool isVolatile = false);
llvm::Value* create_atomicCounterIncrement(llvm::Value* srcBuffer);
llvm::Value* create_atomicCounterDecrement(llvm::Value* srcBuffer);
llvm::Value* createThreadLocalId(unsigned int dim);
llvm::Value* createGroupId(unsigned int dim);
llvm::Value* CreateF16TOF32(
llvm::Value* f16_src);
IGC::SURFACE_FORMAT GetSubstituteImageFormat(
const IGC::SURFACE_FORMAT format) const;
llvm::Value* CreateImageDataConversion(
IGC::SURFACE_FORMAT format,
llvm::Value* data);
llvm::Value* Create_UBFE(
llvm::Value* int32_width,
llvm::Value* int32_offset,
llvm::Value* int32_source);
llvm::Value* Create_IBFE(
llvm::Value* int32_width,
llvm::Value* int32_offset,
llvm::Value* int32_source);
llvm::Value* Create_BFI(
llvm::Value* int32_width,
llvm::Value* int32_offset,
llvm::Value* int32_source,
llvm::Value* int32_replace);
llvm::Value* Create_BFREV(
llvm::Value* int32_source);
llvm::Value* Create_FirstBitHi(
llvm::Value* int32_source);
llvm::Value* Create_FirstBitLo(
llvm::Value* int32_source);
llvm::Value* Create_FirstBitShi(
llvm::Value* int32_source);
llvm::Value* CreateEvalSampleIndex(
llvm::Value* inputIndex,
llvm::Value* sampleIndex,
llvm::Value* perspective);
llvm::Value* CreateEvalSnapped(
llvm::Value* inputIndex,
llvm::Value* xOffset,
llvm::Value* yOffset,
llvm::Value* perspective);
llvm::Value* CreateSetStream(llvm::Value* StreamId, llvm::Value* emitCount);
llvm::Value* CreateEndPrimitive(llvm::Value* emitCount);
llvm::Value* CreateControlPointId();
llvm::Value* CreatePrimitiveID();
llvm::Value* CreateInstanceID();
llvm::Value* CreateCoverage();
llvm::Value* CreateSampleIndex();
llvm::Value* CreateDomainPointInput(unsigned int dimension);
llvm::Value* create_inputVecF32(llvm::Value* inputIndex, llvm::Value* interpolationMode);
llvm::Value* create_uavSerializeAll();
llvm::Value* create_discard(llvm::Value* condition);
llvm::Value* create_runtime(llvm::Value* offset);
llvm::CallInst* create_countbits(llvm::Value* src);
llvm::Value* create_waveBallot(llvm::Value* src);
llvm::Value* create_waveInverseBallot(llvm::Value* src);
llvm::Value* create_waveshuffleIndex(llvm::Value* src, llvm::Value* index, llvm::Value* helperLaneMode = nullptr);
llvm::Value* create_waveAll(llvm::Value* src, llvm::Value* type);
llvm::Value* create_wavePrefix(
llvm::Value* src, llvm::Value* type, bool inclusive,
llvm::Value *Mask = nullptr);
llvm::Value* create_wavePrefixBitCount(
llvm::Value* src, llvm::Value *Mask = nullptr);
llvm::Value* create_waveMatch(llvm::Instruction *inst, llvm::Value *src);
llvm::Value* create_waveMultiPrefix(
llvm::Instruction *I,
llvm::Value *Val,
llvm::Value *Mask,
IGC::WaveOps OpKind);
llvm::Value* create_waveMultiPrefixBitCount(
llvm::Instruction *I,
llvm::Value *Val,
llvm::Value *Mask);
llvm::Value* create_quadPrefix(llvm::Value* src, llvm::Value* type, bool inclusive = false);
llvm::Value* get32BitLaneID();
llvm::Value* getSimdSize();
llvm::Value* getFirstLaneID();
llvm::Value* readFirstLane(llvm::Value* src);
void VectorToScalars(
llvm::Value* vector,
llvm::Value** outScalars,
unsigned maxSize,
llvm::Value* initializer = nullptr);
llvm::Value* ScalarsToVector(
llvm::Value* (&scalars)[4],
unsigned vectorElementCnt);
private:
/// @brief helper structure for keeping image format properties used by image read emulation
struct ImageFormatInfo
{
IGC::SURFACE_FORMAT m_Format; ///< original image format
unsigned m_NumComponents; ///< number of components in the original format, only valid when m_RequiresConversion is true
unsigned m_BPE; ///< number of bits per component in the original format, valid only if all components have the same, only valid when m_RequiresConversion is true
bool m_RequiresConversion; ///< true if conversion is required
IGC::SURFACE_FORMAT m_SubstituteFormat; ///< image format programmed in the additional surface state, only valid when m_RequiresConversion is true
bool m_Is128b; ///< true for 128 bit formats, only valid when m_RequiresConversion is true
};
llvm::Constant* GetSnormFactor(unsigned bits);
llvm::Constant* GetUnormFactor(unsigned bits);
bool NeedConversionFor128FormatRead(
IGC::SURFACE_FORMAT format) const;
// these functions are taken from OCL builtins
llvm::Value* CreateDFloor(llvm::Value* val);
llvm::Value* CreateDTrunc(llvm::Value* val);
llvm::Value* CreateDCeil(llvm::Value* val);
llvm::Value* CreateDRoundNE(llvm::Value* val);
genplatform* m_Platform;
llvm::Function* llvm_GenISA_ubfe() const;
llvm::Function* llvm_GenISA_ibfe() const;
llvm::Function* llvm_GenISA_bfi() const;
llvm::Function* llvm_GenISA_bfrev() const;
llvm::Function* llvm_GenISA_firstbitHi() const;
llvm::Function* llvm_GenISA_firstbitLo() const;
llvm::Function* llvm_GenISA_firstbitShi() const;
llvm::Function* llvm_GenISA_ld() const;
llvm::Function* llvm_GenISA_ldms() const;
llvm::Function* llvm_GenISA_ldmcs() const;
llvm::Function* llvm_GenISA_sampleBC_v4f32_f32() const;
llvm::ConstantInt* m_int0; // 0
llvm::ConstantInt* m_int1; // 1
llvm::ConstantInt* m_int2; // 2
llvm::ConstantInt* m_int3; // 3
llvm::ConstantFP* m_float0; // 0.0f
llvm::ConstantFP* m_float1; // 1.0f
void Init();
};
#include "BuiltinsFrontendDefinitions.hpp"
#endif