performance: Bidirectional BCS split implementation for OCL

Related-To: NEO-7877

Signed-off-by: Lukasz Jobczyk <lukasz.jobczyk@intel.com>
This commit is contained in:
Lukasz Jobczyk
2023-05-12 10:36:06 +00:00
committed by Compute-Runtime-Automation
parent 7f24a4ba25
commit 9f755b54ad
19 changed files with 287 additions and 12 deletions

View File

@@ -56,11 +56,9 @@ struct BcsSplit {
std::vector<CommandQueue *> h2dCmdQs;
std::vector<CommandQueue *> d2hCmdQs;
-inline static constexpr size_t h2dEngineMask = 0b000001010;
-inline static constexpr size_t d2hEngineMask = 0b010100000;
 NEO::BcsInfoMask engines = NEO::EngineHelpers::oddLinkedCopyEnginesMask;
-NEO::BcsInfoMask h2dEngines = h2dEngineMask;
-NEO::BcsInfoMask d2hEngines = d2hEngineMask;
+NEO::BcsInfoMask h2dEngines = NEO::EngineHelpers::h2dCopyEngineMask;
+NEO::BcsInfoMask d2hEngines = NEO::EngineHelpers::d2hCopyEngineMask;
template <GFXCORE_FAMILY gfxCoreFamily, typename T, typename K>
ze_result_t appendSplitCall(CommandListCoreFamilyImmediate<gfxCoreFamily> *cmdList,