Introduce MultiDeviceKernel class

Related-To: NEO-5001
Signed-off-by: Mateusz Jablonski <mateusz.jablonski@intel.com>
This commit is contained in:
Mateusz Jablonski
2021-03-09 10:30:21 +00:00
committed by Compute-Runtime-Automation
parent 71940061b8
commit 04eca48ee0
62 changed files with 778 additions and 596 deletions

View File

@ -1,5 +1,5 @@
/*
* Copyright (C) 2018-2020 Intel Corporation
* Copyright (C) 2018-2021 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
@ -9,7 +9,7 @@
#include "shared/source/built_ins/built_ins.h"
#include "shared/source/helpers/vec.h"
#include "opencl/source/kernel/kernel.h"
#include "opencl/source/kernel/multi_device_kernel.h"
#include "CL/cl.h"
#include "built_in_ops.h"
@ -60,7 +60,7 @@ class BuiltinDispatchInfoBuilder {
virtual ~BuiltinDispatchInfoBuilder() = default;
template <typename... KernelsDescArgsT>
void populate(EBuiltInOps::Type operation, ConstStringRef options, KernelsDescArgsT &&... desc);
void populate(EBuiltInOps::Type operation, ConstStringRef options, KernelsDescArgsT &&...desc);
virtual bool buildDispatchInfos(MultiDispatchInfo &multiDispatchInfo) const {
return false;
@ -81,13 +81,13 @@ class BuiltinDispatchInfoBuilder {
return true;
}
std::vector<std::unique_ptr<Kernel>> &peekUsedKernels() { return usedKernels; }
std::vector<std::unique_ptr<MultiDeviceKernel>> &peekUsedKernels() { return usedKernels; }
static std::unique_ptr<Program> createProgramFromCode(const BuiltinCode &bc, const ClDeviceVector &device);
protected:
template <typename KernelNameT, typename... KernelsDescArgsT>
void grabKernels(KernelNameT &&kernelName, Kernel *&kernelDst, KernelsDescArgsT &&... kernelsDesc) {
void grabKernels(KernelNameT &&kernelName, MultiDeviceKernel *&kernelDst, KernelsDescArgsT &&...kernelsDesc) {
auto rootDeviceIndex = clDevice.getRootDeviceIndex();
const KernelInfo *kernelInfo = prog->getKernelInfo(kernelName, rootDeviceIndex);
UNRECOVERABLE_IF(nullptr == kernelInfo);
@ -95,16 +95,16 @@ class BuiltinDispatchInfoBuilder {
KernelInfoContainer kernelInfos;
kernelInfos.resize(rootDeviceIndex + 1);
kernelInfos[rootDeviceIndex] = kernelInfo;
kernelDst = Kernel::create(prog.get(), kernelInfos, &err);
kernelDst->isBuiltIn = true;
usedKernels.push_back(std::unique_ptr<Kernel>(kernelDst));
kernelDst = MultiDeviceKernel::create(prog.get(), kernelInfos, &err);
kernelDst->getKernel(rootDeviceIndex)->isBuiltIn = true;
usedKernels.push_back(std::unique_ptr<MultiDeviceKernel>(kernelDst));
grabKernels(std::forward<KernelsDescArgsT>(kernelsDesc)...);
}
cl_int grabKernels() { return CL_SUCCESS; }
std::unique_ptr<Program> prog;
std::vector<std::unique_ptr<Kernel>> usedKernels;
std::vector<std::unique_ptr<MultiDeviceKernel>> usedKernels;
BuiltIns &kernelsLib;
ClDevice &clDevice;
};