compute-runtime/unit_tests/helpers/dispatch_info_builder_tests...

1010 lines
46 KiB
C++

/*
* Copyright (C) 2017-2018 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
*/
#include "runtime/helpers/dispatch_info_builder.h"
#include "unit_tests/fixtures/context_fixture.h"
#include "unit_tests/mocks/mock_kernel.h"
#include "unit_tests/mocks/mock_buffer.h"
#include "unit_tests/fixtures/device_fixture.h"
#include "test.h"
namespace OCLRT {
using namespace SplitDispatch;
class DispatchInfoBuilderFixture : public ContextFixture, public DeviceFixture {
using ContextFixture::SetUp;
public:
DispatchInfoBuilderFixture() {}
void clearCrossThreadData() {
memset(pCrossThreadData, 0, sizeof(pCrossThreadData));
}
protected:
void SetUp() {
DeviceFixture::SetUp();
cl_device_id device = pDevice;
ContextFixture::SetUp(1, &device);
pKernelInfo = std::make_unique<KernelInfo>();
pMediaVFEstate = new SPatchMediaVFEState();
pMediaVFEstate->PerThreadScratchSpace = 1024;
pMediaVFEstate->ScratchSpaceOffset = 0;
pExecutionEnvironment = new SPatchExecutionEnvironment();
pExecutionEnvironment->CompiledSIMD32 = 1;
pExecutionEnvironment->LargestCompiledSIMDSize = 32;
pExecutionEnvironment->NumGRFRequired = GrfConfig::DefaultGrfNumber;
pPrintfSurface = new SPatchAllocateStatelessPrintfSurface();
pKernelInfo->patchInfo.mediavfestate = pMediaVFEstate;
pKernelInfo->patchInfo.executionEnvironment = pExecutionEnvironment;
pKernelInfo->patchInfo.pAllocateStatelessPrintfSurface = pPrintfSurface;
KernelArgPatchInfo kernelArg1PatchInfo;
KernelArgPatchInfo kernelArg2PatchInfo;
KernelArgPatchInfo kernelArg3PatchInfo;
pKernelInfo->kernelArgInfo.resize(3);
pKernelInfo->kernelArgInfo[0].kernelArgPatchInfoVector.push_back(kernelArg1PatchInfo);
pKernelInfo->kernelArgInfo[0].kernelArgPatchInfoVector[0].crossthreadOffset = 0x10;
pKernelInfo->kernelArgInfo[0].kernelArgPatchInfoVector[0].size = (uint32_t)sizeof(void *);
pKernelInfo->kernelArgInfo[1].kernelArgPatchInfoVector.push_back(kernelArg2PatchInfo);
pKernelInfo->kernelArgInfo[1].kernelArgPatchInfoVector[0].crossthreadOffset = 0x30;
pKernelInfo->kernelArgInfo[1].kernelArgPatchInfoVector[0].size = (uint32_t)sizeof(void *);
pKernelInfo->kernelArgInfo[2].kernelArgPatchInfoVector.push_back(kernelArg3PatchInfo);
pKernelInfo->kernelArgInfo[2].kernelArgPatchInfoVector[0].crossthreadOffset = 0x50;
pKernelInfo->kernelArgInfo[2].kernelArgPatchInfoVector[0].size = (uint32_t)sizeof(void *);
pProgram = new MockProgram(*pDevice->getExecutionEnvironment(), pContext, false);
pKernel = new MockKernel(pProgram, *pKernelInfo, *pDevice);
ASSERT_EQ(CL_SUCCESS, pKernel->initialize());
pKernel->setCrossThreadData(pCrossThreadData, sizeof(pCrossThreadData));
pKernel->setKernelArgHandler(0, &Kernel::setArgBuffer);
pKernel->slmTotalSize = 128;
pKernel->isBuiltIn = true;
}
void TearDown() override {
delete pKernel;
delete pPrintfSurface;
delete pExecutionEnvironment;
delete pMediaVFEstate;
delete pProgram;
ContextFixture::TearDown();
DeviceFixture::TearDown();
}
std::unique_ptr<KernelInfo> pKernelInfo;
SPatchMediaVFEState *pMediaVFEstate = nullptr;
SPatchExecutionEnvironment *pExecutionEnvironment;
SPatchAllocateStatelessPrintfSurface *pPrintfSurface = nullptr;
MockProgram *pProgram = nullptr;
MockKernel *pKernel = nullptr;
char pCrossThreadData[128];
};
typedef Test<DispatchInfoBuilderFixture> DispatchInfoBuilderTest;
template <SplitDispatch::Dim Dim, SplitDispatch::SplitMode Mode>
class DispatchInfoBuilderMock : DispatchInfoBuilder<Dim, Mode> {
public:
void pushSplit(const DispatchInfo &dispatchInfo, MultiDispatchInfo &outMdi) {
DispatchInfoBuilder<Dim, Mode>::pushSplit(dispatchInfo, outMdi);
}
};
TEST_F(DispatchInfoBuilderTest, setDispatchInfoNoDim) {
MultiDispatchInfo multiDispatchInfo;
DispatchInfoBuilderMock<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilderMock<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
DispatchInfo dispatchInfo;
diBuilder->pushSplit(dispatchInfo, multiDispatchInfo);
EXPECT_TRUE(multiDispatchInfo.empty());
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, setDispatchInfoDim) {
MultiDispatchInfo mdi1D, mdi2D, mdi3D;
DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::NoSplit> *diBuilder1D = new DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder1D);
DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::NoSplit> *diBuilder2D = new DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder2D);
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder3D = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder3D);
diBuilder1D->setDispatchGeometry(Vec3<size_t>(1, 0, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder1D->bake(mdi1D);
for (auto &dispatchInfo : mdi1D) {
EXPECT_EQ(1u, dispatchInfo.getDim());
}
diBuilder2D->setDispatchGeometry(Vec3<size_t>(1, 2, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder2D->bake(mdi2D);
for (auto &dispatchInfo : mdi2D) {
EXPECT_EQ(2u, dispatchInfo.getDim());
}
diBuilder3D->setDispatchGeometry(Vec3<size_t>(1, 2, 3), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder3D->bake(mdi3D);
for (auto &dispatchInfo : mdi3D) {
EXPECT_EQ(3u, dispatchInfo.getDim());
}
delete diBuilder3D;
delete diBuilder2D;
delete diBuilder1D;
}
TEST_F(DispatchInfoBuilderTest, setDispatchInfoGWS) {
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
MultiDispatchInfo mdi0, mdi1, mdi2, mdi3;
diBuilder->setDispatchGeometry(Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi0);
EXPECT_TRUE(mdi0.empty());
diBuilder->setDispatchGeometry(Vec3<size_t>(1, 0, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi1);
for (auto &dispatchInfo : mdi1) {
EXPECT_EQ(1u, dispatchInfo.getGWS().x);
EXPECT_EQ(1u, dispatchInfo.getGWS().y);
EXPECT_EQ(1u, dispatchInfo.getGWS().z);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
}
diBuilder->setDispatchGeometry(Vec3<size_t>(1, 2, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi2);
for (auto &dispatchInfo : mdi2) {
EXPECT_EQ(1u, dispatchInfo.getGWS().x);
EXPECT_EQ(2u, dispatchInfo.getGWS().y);
EXPECT_EQ(1u, dispatchInfo.getGWS().z);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(2u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
}
diBuilder->setDispatchGeometry(Vec3<size_t>(1, 2, 3), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi3);
for (auto &dispatchInfo : mdi3) {
EXPECT_EQ(1u, dispatchInfo.getGWS().x);
EXPECT_EQ(2u, dispatchInfo.getGWS().y);
EXPECT_EQ(3u, dispatchInfo.getGWS().z);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(2u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(3u, dispatchInfo.getActualWorkgroupSize().z);
}
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, setDispatchInfoELWS) {
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
MultiDispatchInfo mdi0, mdi1, mdi2, mdi3;
diBuilder->setDispatchGeometry(Vec3<size_t>(0, 0, 0), Vec3<size_t>(1, 1, 1), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi0);
EXPECT_TRUE(mdi0.empty());
diBuilder->setDispatchGeometry(Vec3<size_t>(1, 0, 0), Vec3<size_t>(1, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi1);
for (auto &dispatchInfo : mdi1) {
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
}
diBuilder->setDispatchGeometry(Vec3<size_t>(1, 1, 0), Vec3<size_t>(1, 2, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi2);
for (auto &dispatchInfo : mdi2) {
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().x);
EXPECT_EQ(2u, dispatchInfo.getEnqueuedWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(2u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
}
diBuilder->setDispatchGeometry(Vec3<size_t>(1, 1, 1), Vec3<size_t>(1, 2, 3), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi3);
for (auto &dispatchInfo : mdi3) {
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().x);
EXPECT_EQ(2u, dispatchInfo.getEnqueuedWorkgroupSize().y);
EXPECT_EQ(3u, dispatchInfo.getEnqueuedWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(2u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(3u, dispatchInfo.getLocalWorkgroupSize().z);
}
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, setDispatchInfoLWS) {
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
MultiDispatchInfo mdi0, mdi1, mdi2, mdi3;
diBuilder->setKernel(pKernel);
diBuilder->setDispatchGeometry(Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi0);
EXPECT_TRUE(mdi0.empty());
diBuilder->setKernel(pKernel);
diBuilder->setDispatchGeometry(Vec3<size_t>(16, 0, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi1);
for (auto &dispatchInfo : mdi1) {
EXPECT_EQ(16u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
}
diBuilder->setKernel(pKernel);
diBuilder->setDispatchGeometry(Vec3<size_t>(16, 16, 0), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi2);
for (auto &dispatchInfo : mdi2) {
EXPECT_EQ(16u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(16u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
}
diBuilder->setKernel(pKernel);
diBuilder->setDispatchGeometry(Vec3<size_t>(16, 16, 16), Vec3<size_t>(0, 0, 0), Vec3<size_t>(0, 0, 0));
diBuilder->bake(mdi3);
for (auto &dispatchInfo : mdi3) {
EXPECT_EQ(16u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(16u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
}
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, setKernelNoSplit) {
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
diBuilder->setKernel(pKernel);
diBuilder->setDispatchGeometry(Vec3<size_t>(256, 256, 256), Vec3<size_t>(16, 16, 16), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo multiDispatchInfo;
diBuilder->bake(multiDispatchInfo);
for (auto &dispatchInfo : multiDispatchInfo) {
ASSERT_EQ(pKernel, dispatchInfo.getKernel());
EXPECT_TRUE(dispatchInfo.getKernel()->isBuiltIn);
}
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, setKernelSplit) {
DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::KernelSplit> *diBuilder1D = new DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::KernelSplit>();
ASSERT_NE(nullptr, diBuilder1D);
DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::KernelSplit> *diBuilder2D = new DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::KernelSplit>();
ASSERT_NE(nullptr, diBuilder2D);
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::KernelSplit> *diBuilder3D = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::KernelSplit>();
ASSERT_NE(nullptr, diBuilder3D);
// 1D
diBuilder1D->setKernel(RegionCoordX::Left, pKernel);
diBuilder1D->setDispatchGeometry(RegionCoordX::Left, Vec3<size_t>(256, 0, 0), Vec3<size_t>(16, 0, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi1D;
diBuilder1D->bake(mdi1D);
for (auto &dispatchInfo : mdi1D) {
EXPECT_EQ(pKernel, dispatchInfo.getKernel());
EXPECT_TRUE(dispatchInfo.getKernel()->isBuiltIn);
}
//2D
diBuilder2D->setKernel(RegionCoordX::Left, RegionCoordY::Bottom, pKernel);
diBuilder2D->setDispatchGeometry(RegionCoordX::Left, RegionCoordY::Bottom, Vec3<size_t>(256, 256, 0), Vec3<size_t>(16, 16, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi2D;
diBuilder2D->bake(mdi2D);
for (auto &dispatchInfo : mdi2D) {
EXPECT_EQ(pKernel, dispatchInfo.getKernel());
EXPECT_TRUE(dispatchInfo.getKernel()->isBuiltIn);
}
//3D
diBuilder3D->setKernel(RegionCoordX::Right, RegionCoordY::Bottom, RegionCoordZ::Back, pKernel);
diBuilder3D->setDispatchGeometry(RegionCoordX::Right, RegionCoordY::Bottom, RegionCoordZ::Back, Vec3<size_t>(256, 256, 256), Vec3<size_t>(16, 16, 16), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi3D;
diBuilder3D->bake(mdi3D);
for (auto &dispatchInfo : mdi3D) {
EXPECT_EQ(pKernel, dispatchInfo.getKernel());
EXPECT_TRUE(dispatchInfo.getKernel()->isBuiltIn);
}
delete diBuilder3D;
delete diBuilder2D;
delete diBuilder1D;
}
TEST_F(DispatchInfoBuilderTest, setWalkerNoSplit) {
DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder1D = new DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder1D);
DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder2D = new DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder2D);
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder3D = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder3D);
// 1D
diBuilder1D->setKernel(pKernel);
diBuilder1D->setDispatchGeometry(Vec3<size_t>(256, 0, 0), Vec3<size_t>(16, 0, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi1D;
diBuilder1D->bake(mdi1D);
EXPECT_EQ(1u, mdi1D.size());
const DispatchInfo *di1D = mdi1D.begin();
EXPECT_EQ(pKernel, di1D->getKernel());
EXPECT_EQ(256u, di1D->getGWS().x);
EXPECT_EQ(1u, di1D->getGWS().y);
EXPECT_EQ(1u, di1D->getGWS().z);
EXPECT_EQ(16u, di1D->getEnqueuedWorkgroupSize().x);
EXPECT_EQ(1u, di1D->getEnqueuedWorkgroupSize().y);
EXPECT_EQ(1u, di1D->getEnqueuedWorkgroupSize().z);
EXPECT_EQ(0u, di1D->getOffset().x);
EXPECT_EQ(0u, di1D->getOffset().y);
EXPECT_EQ(0u, di1D->getOffset().z);
EXPECT_EQ(16u, di1D->getLocalWorkgroupSize().x);
EXPECT_EQ(1u, di1D->getLocalWorkgroupSize().y);
EXPECT_EQ(1u, di1D->getLocalWorkgroupSize().z);
EXPECT_EQ(256u, di1D->getActualWorkgroupSize().x);
EXPECT_EQ(1u, di1D->getActualWorkgroupSize().y);
EXPECT_EQ(1u, di1D->getActualWorkgroupSize().z);
EXPECT_EQ(16u, di1D->getTotalNumberOfWorkgroups().x);
EXPECT_EQ(1u, di1D->getTotalNumberOfWorkgroups().y);
EXPECT_EQ(1u, di1D->getTotalNumberOfWorkgroups().z);
EXPECT_EQ(16u, di1D->getNumberOfWorkgroups().x);
EXPECT_EQ(1u, di1D->getNumberOfWorkgroups().y);
EXPECT_EQ(1u, di1D->getNumberOfWorkgroups().z);
EXPECT_EQ(0u, di1D->getStartOfWorkgroups().x);
EXPECT_EQ(0u, di1D->getStartOfWorkgroups().y);
EXPECT_EQ(0u, di1D->getStartOfWorkgroups().z);
// 2D
diBuilder2D->setKernel(pKernel);
diBuilder2D->setDispatchGeometry(Vec3<size_t>(256, 256, 0), Vec3<size_t>(16, 16, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi2D;
diBuilder2D->bake(mdi2D);
EXPECT_EQ(1u, mdi2D.size());
const DispatchInfo *di2D = mdi2D.begin();
EXPECT_EQ(pKernel, di2D->getKernel());
EXPECT_EQ(256u, di2D->getGWS().x);
EXPECT_EQ(256u, di2D->getGWS().y);
EXPECT_EQ(1u, di2D->getGWS().z);
EXPECT_EQ(16u, di2D->getEnqueuedWorkgroupSize().x);
EXPECT_EQ(16u, di2D->getEnqueuedWorkgroupSize().y);
EXPECT_EQ(1u, di2D->getEnqueuedWorkgroupSize().z);
EXPECT_EQ(0u, di2D->getOffset().x);
EXPECT_EQ(0u, di2D->getOffset().y);
EXPECT_EQ(0u, di2D->getOffset().z);
EXPECT_EQ(16u, di2D->getLocalWorkgroupSize().x);
EXPECT_EQ(16u, di2D->getLocalWorkgroupSize().y);
EXPECT_EQ(1u, di2D->getLocalWorkgroupSize().z);
EXPECT_EQ(16u, di2D->getTotalNumberOfWorkgroups().x);
EXPECT_EQ(16u, di2D->getTotalNumberOfWorkgroups().y);
EXPECT_EQ(1u, di2D->getTotalNumberOfWorkgroups().z);
EXPECT_EQ(16u, di2D->getNumberOfWorkgroups().x);
EXPECT_EQ(16u, di2D->getNumberOfWorkgroups().y);
EXPECT_EQ(1u, di2D->getNumberOfWorkgroups().z);
EXPECT_EQ(0u, di2D->getStartOfWorkgroups().x);
EXPECT_EQ(0u, di2D->getStartOfWorkgroups().y);
EXPECT_EQ(0u, di2D->getStartOfWorkgroups().z);
// 3D
diBuilder3D->setKernel(pKernel);
diBuilder3D->setDispatchGeometry(Vec3<size_t>(256, 256, 256), Vec3<size_t>(16, 16, 16), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi3D;
diBuilder3D->bake(mdi3D);
EXPECT_EQ(1u, mdi3D.size());
const DispatchInfo *di3D = mdi3D.begin();
EXPECT_EQ(pKernel, di3D->getKernel());
EXPECT_EQ(256u, di3D->getGWS().x);
EXPECT_EQ(256u, di3D->getGWS().y);
EXPECT_EQ(256u, di3D->getGWS().z);
EXPECT_EQ(16u, di3D->getEnqueuedWorkgroupSize().x);
EXPECT_EQ(16u, di3D->getEnqueuedWorkgroupSize().y);
EXPECT_EQ(16u, di3D->getEnqueuedWorkgroupSize().z);
EXPECT_EQ(0u, di3D->getOffset().x);
EXPECT_EQ(0u, di3D->getOffset().y);
EXPECT_EQ(0u, di3D->getOffset().z);
EXPECT_EQ(16u, di3D->getLocalWorkgroupSize().x);
EXPECT_EQ(16u, di3D->getLocalWorkgroupSize().y);
EXPECT_EQ(16u, di3D->getLocalWorkgroupSize().z);
EXPECT_EQ(16u, di3D->getTotalNumberOfWorkgroups().x);
EXPECT_EQ(16u, di3D->getTotalNumberOfWorkgroups().y);
EXPECT_EQ(16u, di3D->getTotalNumberOfWorkgroups().z);
EXPECT_EQ(16u, di3D->getNumberOfWorkgroups().x);
EXPECT_EQ(16u, di3D->getNumberOfWorkgroups().y);
EXPECT_EQ(16u, di3D->getNumberOfWorkgroups().z);
EXPECT_EQ(0u, di3D->getStartOfWorkgroups().x);
EXPECT_EQ(0u, di3D->getStartOfWorkgroups().y);
EXPECT_EQ(0u, di3D->getStartOfWorkgroups().z);
delete diBuilder3D;
delete diBuilder2D;
delete diBuilder1D;
}
TEST_F(DispatchInfoBuilderTest, setWalkerSplit) {
DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder1D = new DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder1D);
DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder2D = new DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder2D);
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder3D = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder3D);
// 1D
diBuilder1D->setKernel(pKernel);
diBuilder1D->setDispatchGeometry(Vec3<size_t>(256, 0, 0), Vec3<size_t>(15, 0, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi1D;
diBuilder1D->bake(mdi1D);
EXPECT_EQ(2u, mdi1D.size());
auto dispatchId = 0;
for (auto &dispatchInfo : mdi1D) {
EXPECT_EQ(pKernel, dispatchInfo.getKernel());
EXPECT_EQ(256u, dispatchInfo.getGWS().x);
EXPECT_EQ(1u, dispatchInfo.getGWS().y);
EXPECT_EQ(1u, dispatchInfo.getGWS().z);
EXPECT_EQ(15u, dispatchInfo.getEnqueuedWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().z);
EXPECT_EQ(0u, dispatchInfo.getOffset().x);
EXPECT_EQ(0u, dispatchInfo.getOffset().y);
EXPECT_EQ(0u, dispatchInfo.getOffset().z);
EXPECT_EQ(18u, dispatchInfo.getTotalNumberOfWorkgroups().x);
EXPECT_EQ(1u, dispatchInfo.getTotalNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getTotalNumberOfWorkgroups().z);
switch (dispatchId) {
case 0:
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 1:
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
}
dispatchId++;
}
//2D
diBuilder2D->setKernel(pKernel);
diBuilder2D->setDispatchGeometry(Vec3<size_t>(256, 256, 0), Vec3<size_t>(15, 15, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi2D;
diBuilder2D->bake(mdi2D);
EXPECT_EQ(4u, mdi2D.size());
dispatchId = 0;
for (auto &dispatchInfo : mdi2D) {
EXPECT_EQ(pKernel, dispatchInfo.getKernel());
EXPECT_EQ(256u, dispatchInfo.getGWS().x);
EXPECT_EQ(256u, dispatchInfo.getGWS().y);
EXPECT_EQ(1u, dispatchInfo.getGWS().z);
EXPECT_EQ(15u, dispatchInfo.getEnqueuedWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getEnqueuedWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getEnqueuedWorkgroupSize().z);
EXPECT_EQ(0u, dispatchInfo.getOffset().x);
EXPECT_EQ(0u, dispatchInfo.getOffset().y);
EXPECT_EQ(0u, dispatchInfo.getOffset().z);
EXPECT_EQ(18u, dispatchInfo.getTotalNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getTotalNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getTotalNumberOfWorkgroups().z);
switch (dispatchId) {
case 0:
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 1:
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 2:
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 3:
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(1u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
}
dispatchId++;
}
//3D
diBuilder3D->setKernel(pKernel);
diBuilder3D->setDispatchGeometry(Vec3<size_t>(256, 256, 256), Vec3<size_t>(15, 15, 15), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdi3D;
diBuilder3D->bake(mdi3D);
EXPECT_EQ(8u, mdi3D.size());
dispatchId = 0;
for (auto &dispatchInfo : mdi3D) {
EXPECT_EQ(pKernel, dispatchInfo.getKernel());
EXPECT_EQ(256u, dispatchInfo.getGWS().x);
EXPECT_EQ(256u, dispatchInfo.getGWS().y);
EXPECT_EQ(256u, dispatchInfo.getGWS().z);
EXPECT_EQ(15u, dispatchInfo.getEnqueuedWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getEnqueuedWorkgroupSize().y);
EXPECT_EQ(15u, dispatchInfo.getEnqueuedWorkgroupSize().z);
EXPECT_EQ(0u, dispatchInfo.getOffset().x);
EXPECT_EQ(0u, dispatchInfo.getOffset().y);
EXPECT_EQ(0u, dispatchInfo.getOffset().z);
EXPECT_EQ(18u, dispatchInfo.getTotalNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getTotalNumberOfWorkgroups().y);
EXPECT_EQ(18u, dispatchInfo.getTotalNumberOfWorkgroups().z);
switch (dispatchId) {
case 0:
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 1:
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 2:
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 3:
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 4:
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 5:
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 6:
EXPECT_EQ(255u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(15u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(17u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(0u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().z);
break;
case 7:
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getActualWorkgroupSize().z);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().x);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().y);
EXPECT_EQ(1u, dispatchInfo.getLocalWorkgroupSize().z);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().x);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().y);
EXPECT_EQ(18u, dispatchInfo.getNumberOfWorkgroups().z);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().x);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().y);
EXPECT_EQ(17u, dispatchInfo.getStartOfWorkgroups().z);
break;
}
dispatchId++;
}
delete diBuilder3D;
delete diBuilder2D;
delete diBuilder1D;
}
TEST_F(DispatchInfoBuilderTest, mdiSizesForWalkerSplit1D) {
DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder);
diBuilder->setDispatchGeometry(Vec3<size_t>(0, 0, 0), Vec3<size_t>(2, 0, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize0;
diBuilder->bake(mdiSize0);
EXPECT_EQ(0u, mdiSize0.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(2, 0, 0), Vec3<size_t>(2, 0, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize1;
diBuilder->bake(mdiSize1);
EXPECT_EQ(1u, mdiSize1.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(3, 0, 0), Vec3<size_t>(2, 0, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize2;
diBuilder->bake(mdiSize2);
EXPECT_EQ(2u, mdiSize2.size());
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, mdiSizesForWalkerSplit2D) {
DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder);
diBuilder->setDispatchGeometry(Vec3<size_t>(0, 0, 0), Vec3<size_t>(2, 2, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize00;
diBuilder->bake(mdiSize00);
EXPECT_EQ(0u, mdiSize00.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(2, 2, 0), Vec3<size_t>(2, 2, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize11;
diBuilder->bake(mdiSize11);
EXPECT_EQ(1u, mdiSize11.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(3, 2, 0), Vec3<size_t>(2, 2, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize21;
diBuilder->bake(mdiSize21);
EXPECT_EQ(2u, mdiSize21.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(2, 3, 0), Vec3<size_t>(2, 2, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize12;
diBuilder->bake(mdiSize12);
EXPECT_EQ(2u, mdiSize12.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(3, 3, 0), Vec3<size_t>(2, 2, 0), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize22;
diBuilder->bake(mdiSize22);
EXPECT_EQ(4u, mdiSize22.size());
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, mdiSizesForWalkerSplit3D) {
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::WalkerSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::WalkerSplit>();
ASSERT_NE(nullptr, diBuilder);
diBuilder->setDispatchGeometry(Vec3<size_t>(0, 0, 0), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize000;
diBuilder->bake(mdiSize000);
EXPECT_EQ(0u, mdiSize000.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(2, 2, 2), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize111;
diBuilder->bake(mdiSize111);
EXPECT_EQ(1u, mdiSize111.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(3, 2, 2), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize211;
diBuilder->bake(mdiSize211);
EXPECT_EQ(2u, mdiSize211.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(2, 3, 2), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize121;
diBuilder->bake(mdiSize121);
EXPECT_EQ(2u, mdiSize121.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(2, 2, 3), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize112;
diBuilder->bake(mdiSize112);
EXPECT_EQ(2u, mdiSize112.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(3, 3, 2), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize221;
diBuilder->bake(mdiSize221);
EXPECT_EQ(4u, mdiSize221.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(3, 2, 3), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize212;
diBuilder->bake(mdiSize212);
EXPECT_EQ(4u, mdiSize212.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(2, 3, 3), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize122;
diBuilder->bake(mdiSize122);
EXPECT_EQ(4u, mdiSize122.size());
diBuilder->setDispatchGeometry(Vec3<size_t>(3, 3, 3), Vec3<size_t>(2, 2, 2), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo mdiSize222;
diBuilder->bake(mdiSize222);
EXPECT_EQ(8u, mdiSize222.size());
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, setKernelArg) {
Buffer *buffer = new MockBuffer();
auto val = (cl_mem)buffer;
auto pVal = &val;
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
diBuilder->setKernel(pKernel);
diBuilder->setDispatchGeometry(Vec3<size_t>(256, 256, 256), Vec3<size_t>(16, 16, 16), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo multiDispatchInfo;
diBuilder->bake(multiDispatchInfo);
clearCrossThreadData();
EXPECT_EQ(CL_SUCCESS, diBuilder->setArg(0, sizeof(cl_mem *), pVal));
char data[128];
void *svmPtr = &data;
EXPECT_EQ(CL_SUCCESS, diBuilder->setArgSvm(1, sizeof(svmPtr), svmPtr));
MockGraphicsAllocation svmAlloc(svmPtr, 128);
EXPECT_EQ(CL_SUCCESS, diBuilder->setArgSvmAlloc(2, svmPtr, &svmAlloc));
for (auto &dispatchInfo : multiDispatchInfo) {
auto crossthreadOffset0 = pKernelInfo->kernelArgInfo[0].kernelArgPatchInfoVector[0].crossthreadOffset;
EXPECT_EQ(buffer->getCpuAddress(), *reinterpret_cast<void **>((dispatchInfo.getKernel()->getCrossThreadData() + crossthreadOffset0)));
auto crossthreadOffset1 = pKernelInfo->kernelArgInfo[1].kernelArgPatchInfoVector[0].crossthreadOffset;
EXPECT_EQ(svmPtr, *(reinterpret_cast<void **>(dispatchInfo.getKernel()->getCrossThreadData() + crossthreadOffset1)));
auto crossthreadOffset2 = pKernelInfo->kernelArgInfo[2].kernelArgPatchInfoVector[0].crossthreadOffset;
EXPECT_EQ(svmPtr, *(reinterpret_cast<void **>(dispatchInfo.getKernel()->getCrossThreadData() + crossthreadOffset2)));
}
delete buffer;
delete diBuilder;
}
TEST_F(DispatchInfoBuilderTest, SetArgSplit) {
DispatchInfoBuilder<SplitDispatch::Dim::d1D, SplitDispatch::SplitMode::KernelSplit> builder1D;
DispatchInfoBuilder<SplitDispatch::Dim::d2D, SplitDispatch::SplitMode::KernelSplit> builder2D;
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::KernelSplit> builder3D;
Buffer *buffer = new MockBuffer();
auto val = (cl_mem)buffer;
auto pVal = &val;
char data[128];
void *svmPtr = &data;
builder1D.setKernel(pKernel);
builder2D.setKernel(pKernel);
builder3D.setKernel(pKernel);
Vec3<size_t> GWS(256, 256, 256);
Vec3<size_t> ELWS(16, 16, 16);
Vec3<size_t> offset(0, 0, 0);
builder1D.setDispatchGeometry(SplitDispatch::RegionCoordX::Left, GWS, ELWS, offset);
builder2D.setDispatchGeometry(SplitDispatch::RegionCoordX::Left, SplitDispatch::RegionCoordY::Top, GWS, ELWS, offset);
builder3D.setDispatchGeometry(SplitDispatch::RegionCoordX::Left, SplitDispatch::RegionCoordY::Top, SplitDispatch::RegionCoordZ::Front, GWS, ELWS, offset);
MultiDispatchInfo mdi1D;
MultiDispatchInfo mdi2D;
MultiDispatchInfo mdi3D;
builder1D.bake(mdi1D);
builder1D.bake(mdi2D);
builder1D.bake(mdi3D);
//Set arg
clearCrossThreadData();
builder1D.setArg(SplitDispatch::RegionCoordX::Left, static_cast<uint32_t>(0), sizeof(cl_mem *), pVal);
for (auto &dispatchInfo : mdi1D) {
EXPECT_EQ(buffer->getCpuAddress(), *reinterpret_cast<void **>((dispatchInfo.getKernel()->getCrossThreadData() + 0x10)));
}
clearCrossThreadData();
builder2D.setArg(SplitDispatch::RegionCoordX::Left, SplitDispatch::RegionCoordY::Top, static_cast<uint32_t>(0), sizeof(cl_mem *), pVal);
for (auto &dispatchInfo : mdi2D) {
EXPECT_EQ(buffer->getCpuAddress(), *reinterpret_cast<void **>((dispatchInfo.getKernel()->getCrossThreadData() + 0x10)));
}
clearCrossThreadData();
builder3D.setArg(SplitDispatch::RegionCoordX::Left, SplitDispatch::RegionCoordY::Top, SplitDispatch::RegionCoordZ::Front, static_cast<uint32_t>(0), sizeof(cl_mem *), pVal);
for (auto &dispatchInfo : mdi3D) {
EXPECT_EQ(buffer->getCpuAddress(), *reinterpret_cast<void **>((dispatchInfo.getKernel()->getCrossThreadData() + 0x10)));
}
//Set arg SVM
clearCrossThreadData();
builder1D.setArgSvm(SplitDispatch::RegionCoordX::Left, 1, sizeof(svmPtr), svmPtr);
for (auto &dispatchInfo : mdi1D) {
EXPECT_EQ(svmPtr, *(reinterpret_cast<void **>(dispatchInfo.getKernel()->getCrossThreadData() + 0x30)));
}
clearCrossThreadData();
builder2D.setArgSvm(SplitDispatch::RegionCoordX::Left, SplitDispatch::RegionCoordY::Top, 1, sizeof(svmPtr), svmPtr);
for (auto &dispatchInfo : mdi2D) {
EXPECT_EQ(svmPtr, *(reinterpret_cast<void **>(dispatchInfo.getKernel()->getCrossThreadData() + 0x30)));
}
clearCrossThreadData();
builder3D.setArgSvm(SplitDispatch::RegionCoordX::Left, SplitDispatch::RegionCoordY::Top, SplitDispatch::RegionCoordZ::Front, 1, sizeof(svmPtr), svmPtr);
for (auto &dispatchInfo : mdi3D) {
EXPECT_EQ(svmPtr, *(reinterpret_cast<void **>(dispatchInfo.getKernel()->getCrossThreadData() + 0x30)));
}
delete buffer;
}
TEST_F(DispatchInfoBuilderTest, setKernelArgNegative) {
char *buffer = new char[sizeof(Buffer)];
auto val = (cl_mem)buffer;
auto pVal = &val;
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
diBuilder->setKernel(pKernel);
diBuilder->setDispatchGeometry(Vec3<size_t>(256, 256, 256), Vec3<size_t>(16, 16, 16), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo multiDispatchInfo;
diBuilder->bake(multiDispatchInfo);
EXPECT_NE(CL_SUCCESS, diBuilder->setArg(0, sizeof(cl_mem *), pVal));
EXPECT_EQ(CL_SUCCESS, diBuilder->setArgSvm(1, sizeof(void *), nullptr));
delete diBuilder;
delete[] buffer;
}
TEST_F(DispatchInfoBuilderTest, setKernelArgNullKernel) {
Buffer *buffer = new MockBuffer();
auto val = (cl_mem)buffer;
auto pVal = &val;
char data[128];
void *svmPtr = &data;
MockGraphicsAllocation svmAlloc(svmPtr, 128);
DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit> *diBuilder = new DispatchInfoBuilder<SplitDispatch::Dim::d3D, SplitDispatch::SplitMode::NoSplit>();
ASSERT_NE(nullptr, diBuilder);
diBuilder->setDispatchGeometry(Vec3<size_t>(256, 256, 256), Vec3<size_t>(16, 16, 16), Vec3<size_t>(0, 0, 0));
MultiDispatchInfo multiDispatchInfo;
diBuilder->bake(multiDispatchInfo);
EXPECT_EQ(CL_SUCCESS, diBuilder->setArg(0, sizeof(cl_mem *), pVal));
EXPECT_EQ(CL_SUCCESS, diBuilder->setArgSvm(1, sizeof(svmPtr), svmPtr));
EXPECT_EQ(CL_SUCCESS, diBuilder->setArgSvmAlloc(2, svmPtr, &svmAlloc));
delete diBuilder;
delete buffer;
}
} // namespace OCLRT