/*
 * Copyright (c) 2018, Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included
 * in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
|
|
|
|
|
2018-01-08 11:07:46 +08:00
|
|
|
#include "runtime/command_stream/preemption.h"
|
2017-12-21 07:45:38 +08:00
|
|
|
#include "unit_tests/command_queue/enqueue_fixture.h"
|
2018-01-08 11:07:46 +08:00
|
|
|
#include "unit_tests/fixtures/preemption_fixture.h"
|
2017-12-21 07:45:38 +08:00
|
|
|
#include "unit_tests/helpers/hw_parse.h"
|
2018-01-08 11:07:46 +08:00
|
|
|
#include "unit_tests/mocks/mock_command_queue.h"
|
2017-12-21 07:45:38 +08:00
|
|
|
#include "unit_tests/mocks/mock_csr.h"
|
|
|
|
#include "unit_tests/mocks/mock_buffer.h"
|
|
|
|
#include "unit_tests/mocks/mock_submissions_aggregator.h"
|
|
|
|
|
|
|
|
namespace OCLRT {
|
|
|
|
|
|
|
|
template <>
|
|
|
|
void HardwareParse::findCsrBaseAddress<SKLFamily>() {
|
|
|
|
typedef typename GEN9::GPGPU_CSR_BASE_ADDRESS GPGPU_CSR_BASE_ADDRESS;
|
|
|
|
itorGpgpuCsrBaseAddress = find<GPGPU_CSR_BASE_ADDRESS *>(cmdList.begin(), itorWalker);
|
|
|
|
if (itorGpgpuCsrBaseAddress != itorWalker) {
|
|
|
|
cmdGpgpuCsrBaseAddress = *itorGpgpuCsrBaseAddress;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} // namespace OCLRT
|
|
|
|
|
|
|
|
using namespace OCLRT;
|
|
|
|
|
|
|
|
typedef DevicePreemptionTests Gen9PreemptionTests;
|
|
|
|
typedef PreemptionEnqueueKernelTest Gen9PreemptionEnqueueKernelTest;
|
|
|
|
typedef MidThreadPreemptionEnqueueKernelTest Gen9MidThreadPreemptionEnqueueKernelTest;
|
|
|
|
typedef ThreadGroupPreemptionEnqueueKernelTest Gen9ThreadGroupPreemptionEnqueueKernelTest;
|
|
|
|
|
|
|
|
// Programs ThreadGroup preemption into a command stream and checks that exactly
// one MI_LOAD_REGISTER_IMM targeting register 0x2580 is emitted with the
// expected data dword.
GEN9TEST_F(Gen9PreemptionTests, programThreadGroupPreemptionLri) {
    using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM;

    preemptionMode = PreemptionMode::ThreadGroup;

    // The helper must request room for a single LRI command.
    const size_t csrSize = PreemptionHelper::getRequiredCsrSize<FamilyType>(preemptionMode);
    const size_t lriSize = sizeof(MI_LOAD_REGISTER_IMM);
    EXPECT_EQ(lriSize, csrSize);

    auto &stream = cmdQ->getCS(csrSize);

    EXPECT_TRUE(PreemptionHelper::allowThreadGroupPreemption(kernel.get(), waTable));
    PreemptionHelper::programPreemptionMode<FamilyType>(&stream, preemptionMode, nullptr, nullptr);
    EXPECT_EQ(csrSize, stream.getUsed());

    // The LRI is expected at the very start of the stream.
    auto lriCmd = reinterpret_cast<MI_LOAD_REGISTER_IMM *>(stream.getBase());
    EXPECT_EQ(0x2580u, lriCmd->getRegisterOffset());

    const uint32_t expectedDword = DwordBuilder::build(1, true) | DwordBuilder::build(2, true, false);
    EXPECT_EQ(expectedDword, lriCmd->getDataDword());
}
|
|
|
|
|
|
|
|
// Programs MidBatch preemption into a command stream and checks that exactly
// one MI_LOAD_REGISTER_IMM targeting register 0x2580 is emitted with the
// expected data dword.
GEN9TEST_F(Gen9PreemptionTests, programMidBatchPreemptionLri) {
    using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM;

    preemptionMode = PreemptionMode::MidBatch;

    // The helper must request room for a single LRI command.
    const size_t csrSize = PreemptionHelper::getRequiredCsrSize<FamilyType>(preemptionMode);
    const size_t lriSize = sizeof(MI_LOAD_REGISTER_IMM);
    EXPECT_EQ(lriSize, csrSize);

    auto &stream = cmdQ->getCS(csrSize);
    EXPECT_TRUE(PreemptionHelper::allowThreadGroupPreemption(kernel.get(), waTable));

    PreemptionHelper::programPreemptionMode<FamilyType>(&stream, preemptionMode, nullptr, nullptr);
    EXPECT_EQ(csrSize, stream.getUsed());

    // The LRI is expected at the very start of the stream.
    auto lriCmd = reinterpret_cast<MI_LOAD_REGISTER_IMM *>(stream.getBase());
    EXPECT_EQ(0x2580u, lriCmd->getRegisterOffset());

    const uint32_t expectedDword = DwordBuilder::build(2, true) | DwordBuilder::build(1, true, false);
    EXPECT_EQ(expectedDword, lriCmd->getDataDword());
}
|
|
|
|
|
|
|
|
// Programs MidThread preemption with a mock CSR surface and checks that the
// stream holds an MI_LOAD_REGISTER_IMM to register 0x2580 immediately followed
// by a GPGPU_CSR_BASE_ADDRESS command carrying the surface address.
GEN9TEST_F(Gen9PreemptionTests, programMidThreadPreemptionLri) {
    using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM;
    using GPGPU_CSR_BASE_ADDRESS = typename FamilyType::GPGPU_CSR_BASE_ADDRESS;

    preemptionMode = PreemptionMode::MidThread;

    // The helper must request room for one LRI plus one CSR base address command.
    const size_t csrSize = PreemptionHelper::getRequiredCsrSize<FamilyType>(preemptionMode);
    const size_t bothCmdsSize = sizeof(MI_LOAD_REGISTER_IMM) + sizeof(GPGPU_CSR_BASE_ADDRESS);
    EXPECT_EQ(bothCmdsSize, csrSize);

    auto &stream = cmdQ->getCS(csrSize);

    // Mock surface: its pointer value is the number that must later show up in
    // the programmed CSR base address.
    const size_t surfaceSize = device->getHardwareInfo().pSysInfo->CsrSizeInMb * MemoryConstants::megaByte;
    const uint64_t surfaceAddress = 2 * 256 * MemoryConstants::kiloByte;
    MockGraphicsAllocation csrSurface(reinterpret_cast<void *>(surfaceAddress), surfaceSize);
    executionEnvironment->DisableMidThreadPreemption = 0;

    device->setPreemptionMode(preemptionMode);
    EXPECT_TRUE(PreemptionHelper::allowMidThreadPreemption(kernel.get(), *device));

    PreemptionHelper::programPreemptionMode<FamilyType>(&stream, preemptionMode, &csrSurface, nullptr);
    EXPECT_EQ(csrSize, stream.getUsed());

    auto lriCmd = reinterpret_cast<MI_LOAD_REGISTER_IMM *>(stream.getBase());
    EXPECT_EQ(0x2580u, lriCmd->getRegisterOffset());

    const uint32_t expectedDword = DwordBuilder::build(2, true, false) | DwordBuilder::build(1, true, false);
    EXPECT_EQ(expectedDword, lriCmd->getDataDword());

    // The CSR base address command sits directly behind the LRI.
    auto csrBaseCmd = reinterpret_cast<GPGPU_CSR_BASE_ADDRESS *>(lriCmd + 1);
    EXPECT_EQ(surfaceAddress, csrBaseCmd->getGpgpuCsrBaseAddress());
}
|
|
|
|
|
2018-01-02 19:10:34 +08:00
|
|
|
// Enqueues the same kernel twice with ThreadGroup preemption while the
// waModifyVFEStateAfterGPGPUPreemption workaround is disabled.
// Expectations:
//  - first enqueue: exactly one LRI to 0x2580 in the CSR stream and no LRI to
//    0x2600 in the command queue stream;
//  - second enqueue: no LRI to 0x2580 in the newly added CSR commands and no
//    LRI to 0x2600 in the newly added command queue commands.
GEN9TEST_F(Gen9ThreadGroupPreemptionEnqueueKernelTest, givenSecondEnqueueWithTheSamePreemptionRequestThenDontReprogramThreadGroupNoWa) {
    pDevice->setPreemptionMode(PreemptionMode::ThreadGroup);
    WhitelistedRegisters regs = {};
    regs.csChicken1_0x2580 = true;
    pDevice->setForceWhitelistedRegs(true, &regs);
    const_cast<WorkaroundTable *>(pDevice->getWaTable())->waModifyVFEStateAfterGPGPUPreemption = false;
    auto &csr = pDevice->getUltCommandStreamReceiver<FamilyType>();
    csr.getMemoryManager()->setForce32BitAllocations(false);
    csr.overrideMediaVFEStateDirty(false);
    auto csrSurface = csr.getPreemptionCsrAllocation();
    EXPECT_EQ(nullptr, csrSurface);
    HardwareParse hwCsrParser;
    HardwareParse hwCmdQParser;
    size_t off[3] = {0, 0, 0};
    size_t gws[3] = {1, 1, 1};

    MockKernelWithInternals mockKernel(*pDevice);

    // First enqueue: parse both streams from their beginning.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream);
    hwCsrParser.findHardwareCommands<FamilyType>();
    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS());
    hwCmdQParser.findHardwareCommands<FamilyType>();
    // Remember where the first submission ends so the second parse only sees new commands.
    auto offsetCsr = csr.commandStream.getUsed();
    auto offsetCmdQ = pCmdQ->getCS().getUsed();

    bool foundOne = false;
    for (auto it : hwCsrParser.lriList) {
        auto cmd = genCmdCast<typename FamilyType::MI_LOAD_REGISTER_IMM *>(it);
        if (cmd->getRegisterOffset() == 0x2580u) {
            // A second hit would mean the register was programmed more than once.
            EXPECT_FALSE(foundOne);
            foundOne = true;
        }
    }
    EXPECT_TRUE(foundOne);
    hwCsrParser.cmdList.clear();
    hwCsrParser.lriList.clear();

    bool foundWaLri = false;
    for (auto it : hwCmdQParser.lriList) {
        auto cmd = genCmdCast<typename FamilyType::MI_LOAD_REGISTER_IMM *>(it);
        if (cmd->getRegisterOffset() == 0x2600u) {
            foundWaLri = true;
        }
    }
    EXPECT_FALSE(foundWaLri);
    hwCmdQParser.cmdList.clear();
    hwCmdQParser.lriList.clear();

    // Second enqueue: parse only what was appended after the first one.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream, offsetCsr);
    hwCsrParser.findHardwareCommands<FamilyType>();
    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS(), offsetCmdQ);
    hwCmdQParser.findHardwareCommands<FamilyType>();

    for (auto it : hwCsrParser.lriList) {
        auto cmd = genCmdCast<typename FamilyType::MI_LOAD_REGISTER_IMM *>(it);
        EXPECT_FALSE(cmd->getRegisterOffset() == 0x2580u);
    }
    for (auto it : hwCmdQParser.lriList) {
        auto cmd = genCmdCast<typename FamilyType::MI_LOAD_REGISTER_IMM *>(it);
        EXPECT_FALSE(cmd->getRegisterOffset() == 0x2600u);
    }
}
|
|
|
|
|
|
|
|
// Enqueues the same kernel twice with ThreadGroup preemption while the
// waModifyVFEStateAfterGPGPUPreemption workaround is enabled.
// Expectations:
//  - first enqueue: exactly one LRI to 0x2580 in the CSR stream;
//  - second enqueue: no LRI to 0x2580 in the newly added CSR commands;
//  - each enqueue adds exactly two LRIs to 0x2600 in the command queue stream,
//    one with data 0xFFFFFFFF and one with data 0x0.
GEN9TEST_F(Gen9ThreadGroupPreemptionEnqueueKernelTest, givenSecondEnqueueWithTheSamePreemptionRequestThenDontReprogramThreadGroupWa) {
    using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM;

    pDevice->setPreemptionMode(PreemptionMode::ThreadGroup);
    WhitelistedRegisters regs = {};
    regs.csChicken1_0x2580 = true;
    pDevice->setForceWhitelistedRegs(true, &regs);
    const_cast<WorkaroundTable *>(pDevice->getWaTable())->waModifyVFEStateAfterGPGPUPreemption = true;
    auto &csr = pDevice->getUltCommandStreamReceiver<FamilyType>();
    csr.getMemoryManager()->setForce32BitAllocations(false);
    csr.overrideMediaVFEStateDirty(false);
    auto csrSurface = csr.getPreemptionCsrAllocation();
    EXPECT_EQ(nullptr, csrSurface);
    HardwareParse hwCsrParser;
    HardwareParse hwCmdQParser;
    size_t off[3] = {0, 0, 0};
    size_t gws[3] = {1, 1, 1};

    int foundWaLri = 0;
    int foundWaLriBegin = 0;
    int foundWaLriEnd = 0;
    // Recounts the LRIs to 0x2600 currently held by the command queue parser,
    // split by data dword (0xFFFFFFFF vs 0x0).
    auto countWaLris = [&]() {
        foundWaLri = 0;
        foundWaLriBegin = 0;
        foundWaLriEnd = 0;
        for (auto it : hwCmdQParser.lriList) {
            auto cmd = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
            if (cmd->getRegisterOffset() == 0x2600u) {
                foundWaLri++;
                if (cmd->getDataDword() == 0xFFFFFFFF) {
                    foundWaLriBegin++;
                }
                if (cmd->getDataDword() == 0x0) {
                    foundWaLriEnd++;
                }
            }
        }
    };

    MockKernelWithInternals mockKernel(*pDevice);

    // First enqueue: parse both streams from their beginning.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream);
    hwCsrParser.findHardwareCommands<FamilyType>();
    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS());
    hwCmdQParser.findHardwareCommands<FamilyType>();
    // Remember where the first submission ends so the second parse only sees new commands.
    auto offsetCsr = csr.commandStream.getUsed();
    auto offsetCmdQ = pCmdQ->getCS().getUsed();

    bool foundOne = false;
    for (auto it : hwCsrParser.lriList) {
        auto cmd = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        if (cmd->getRegisterOffset() == 0x2580u) {
            // A second hit would mean the register was programmed more than once.
            EXPECT_FALSE(foundOne);
            foundOne = true;
        }
    }
    EXPECT_TRUE(foundOne);
    hwCsrParser.cmdList.clear();
    hwCsrParser.lriList.clear();

    countWaLris();
    EXPECT_EQ(2, foundWaLri);
    EXPECT_EQ(1, foundWaLriBegin);
    EXPECT_EQ(1, foundWaLriEnd);
    hwCmdQParser.cmdList.clear();
    hwCmdQParser.lriList.clear();

    // Second enqueue: parse only what was appended after the first one.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream, offsetCsr);
    hwCsrParser.findHardwareCommands<FamilyType>();

    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS(), offsetCmdQ);
    hwCmdQParser.findHardwareCommands<FamilyType>();

    for (auto it : hwCsrParser.lriList) {
        auto cmd = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        EXPECT_FALSE(cmd->getRegisterOffset() == 0x2580u);
    }

    countWaLris();
    EXPECT_EQ(2, foundWaLri);
    EXPECT_EQ(1, foundWaLriBegin);
    EXPECT_EQ(1, foundWaLriEnd);
}
|
|
|
|
|
|
|
|
// With the device set to ThreadGroup preemption, enqueues a kernel and flushes
// the queue, then checks that the mock CSR was flushed once and that the
// dispatch flags it received carry PreemptionMode::ThreadGroup.
GEN9TEST_F(Gen9PreemptionEnqueueKernelTest, givenValidKernelForPreemptionWhenEnqueueKernelCalledThenPassDevicePreemptionModeThreadGroup) {
    pDevice->setPreemptionMode(PreemptionMode::ThreadGroup);
    WhitelistedRegisters regs = {};
    regs.csChicken1_0x2580 = true;
    pDevice->setForceWhitelistedRegs(true, &regs);
    // The mock CSR is handed over to the device via resetCommandStreamReceiver.
    auto mockCsr = new MockCsrHw2<FamilyType>(pDevice->getHardwareInfo());
    pDevice->resetCommandStreamReceiver(mockCsr);

    MockKernelWithInternals mockKernel(*pDevice);
    EXPECT_EQ(PreemptionMode::ThreadGroup, PreemptionHelper::taskPreemptionMode(*pDevice, mockKernel.mockKernel));

    // One-dimensional dispatch: only gws[0] is relevant.
    size_t gws[3] = {1, 0, 0};
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr);
    pCmdQ->flush();

    EXPECT_EQ(1, mockCsr->flushCalledCount);
    EXPECT_EQ(PreemptionMode::ThreadGroup, mockCsr->passedDispatchFlags.preemptionMode);
}
|
|
|
|
|
|
|
|
// Same as the unblocked ThreadGroup variant, but the enqueue waits on a user
// event. The mock CSR must not be flushed while the event is pending; after the
// event is set to CL_COMPLETE, one flush is expected and the dispatch flags
// must carry PreemptionMode::ThreadGroup.
GEN9TEST_F(Gen9PreemptionEnqueueKernelTest, givenValidKernelForPreemptionWhenEnqueueKernelCalledAndBlockedThenPassDevicePreemptionModeThreadGroup) {
    pDevice->setPreemptionMode(PreemptionMode::ThreadGroup);
    WhitelistedRegisters regs = {};
    regs.csChicken1_0x2580 = true;
    pDevice->setForceWhitelistedRegs(true, &regs);
    // The mock CSR is handed over to the device via resetCommandStreamReceiver.
    auto mockCsr = new MockCsrHw2<FamilyType>(pDevice->getHardwareInfo());
    pDevice->resetCommandStreamReceiver(mockCsr);

    MockKernelWithInternals mockKernel(*pDevice);
    EXPECT_EQ(PreemptionMode::ThreadGroup, PreemptionHelper::taskPreemptionMode(*pDevice, mockKernel.mockKernel));

    UserEvent userEventObj;
    cl_event userEvent = &userEventObj;
    // One-dimensional dispatch: only gws[0] is relevant.
    size_t gws[3] = {1, 0, 0};
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, nullptr, gws, nullptr, 1, &userEvent, nullptr);
    pCmdQ->flush();
    // Still waiting on the user event: nothing may reach the CSR yet.
    EXPECT_EQ(0, mockCsr->flushCalledCount);

    userEventObj.setStatus(CL_COMPLETE);
    pCmdQ->flush();
    EXPECT_EQ(1, mockCsr->flushCalledCount);
    EXPECT_EQ(PreemptionMode::ThreadGroup, mockCsr->passedDispatchFlags.preemptionMode);
}
|
|
|
|
|
2018-01-02 19:10:34 +08:00
|
|
|
// Enqueues the same kernel twice using the mid-thread preemption fixture while
// the waModifyVFEStateAfterGPGPUPreemption workaround is disabled. The device
// preemption mode is not set here; it is presumably configured by the fixture.
// Expectations:
//  - first enqueue: exactly one LRI to 0x2580 and a GPGPU_CSR_BASE_ADDRESS
//    pointing at the preemption CSR allocation in the CSR stream, and no LRI
//    to 0x2600 in the command queue stream;
//  - second enqueue: no LRI to 0x2580 and no GPGPU_CSR_BASE_ADDRESS in the
//    newly added CSR commands, and no LRI to 0x2600 in the newly added command
//    queue commands.
GEN9TEST_F(Gen9MidThreadPreemptionEnqueueKernelTest, givenSecondEnqueueWithTheSamePreemptionRequestThenDontReprogramMidThreadNoWa) {
    typedef typename FamilyType::MI_LOAD_REGISTER_IMM MI_LOAD_REGISTER_IMM;
    typedef typename FamilyType::GPGPU_CSR_BASE_ADDRESS GPGPU_CSR_BASE_ADDRESS;

    WhitelistedRegisters regs = {};
    regs.csChicken1_0x2580 = true;
    pDevice->setForceWhitelistedRegs(true, &regs);
    const_cast<WorkaroundTable *>(pDevice->getWaTable())->waModifyVFEStateAfterGPGPUPreemption = false;

    auto &csr = pDevice->getUltCommandStreamReceiver<FamilyType>();
    csr.getMemoryManager()->setForce32BitAllocations(false);
    csr.overrideMediaVFEStateDirty(false);
    auto csrSurface = csr.getPreemptionCsrAllocation();
    ASSERT_NE(nullptr, csrSurface);
    HardwareParse hwCsrParser;
    HardwareParse hwCmdQParser;
    size_t off[3] = {0, 0, 0};
    size_t gws[3] = {1, 1, 1};

    MockKernelWithInternals mockKernel(*pDevice);

    // First enqueue: parse both streams from their beginning.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream);
    hwCsrParser.findHardwareCommands<FamilyType>();
    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS());
    hwCmdQParser.findHardwareCommands<FamilyType>();
    // Remember where the first submission ends so the second parse only sees new commands.
    auto offsetCsr = csr.commandStream.getUsed();
    auto offsetCmdQ = pCmdQ->getCS().getUsed();

    bool foundOneLri = false;
    for (auto it : hwCsrParser.lriList) {
        auto cmdLri = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        if (cmdLri->getRegisterOffset() == 0x2580u) {
            // A second hit would mean the register was programmed more than once.
            EXPECT_FALSE(foundOneLri);
            foundOneLri = true;
        }
    }
    EXPECT_TRUE(foundOneLri);

    bool foundWaLri = false;
    for (auto it : hwCmdQParser.lriList) {
        auto cmdLri = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        if (cmdLri->getRegisterOffset() == 0x2600u) {
            foundWaLri = true;
        }
    }
    EXPECT_FALSE(foundWaLri);

    hwCsrParser.findCsrBaseAddress<FamilyType>();
    ASSERT_NE(nullptr, hwCsrParser.cmdGpgpuCsrBaseAddress);
    auto cmdCsr = genCmdCast<GPGPU_CSR_BASE_ADDRESS *>(hwCsrParser.cmdGpgpuCsrBaseAddress);
    ASSERT_NE(nullptr, cmdCsr);
    EXPECT_EQ(csrSurface->getGpuAddressToPatch(), cmdCsr->getGpgpuCsrBaseAddress());

    // Reset parser state; findCsrBaseAddress only writes the pointer on a hit,
    // so it has to be cleared by hand before the second lookup.
    hwCsrParser.cmdList.clear();
    hwCsrParser.lriList.clear();
    hwCsrParser.cmdGpgpuCsrBaseAddress = nullptr;
    hwCmdQParser.cmdList.clear();
    hwCmdQParser.lriList.clear();

    // Second enqueue: parse only what was appended after the first one.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream, offsetCsr);
    hwCsrParser.findHardwareCommands<FamilyType>();
    // offsetCmdQ was taken from the command queue stream, so it must be applied
    // to that stream (not to the CSR stream) for the 0x2600 check to be meaningful.
    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS(), offsetCmdQ);
    hwCmdQParser.findHardwareCommands<FamilyType>();

    for (auto it : hwCsrParser.lriList) {
        auto cmd = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        EXPECT_FALSE(cmd->getRegisterOffset() == 0x2580u);
    }

    hwCsrParser.findCsrBaseAddress<FamilyType>();
    EXPECT_EQ(nullptr, hwCsrParser.cmdGpgpuCsrBaseAddress);

    for (auto it : hwCmdQParser.lriList) {
        auto cmd = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        EXPECT_FALSE(cmd->getRegisterOffset() == 0x2600u);
    }
}
|
|
|
|
|
|
|
|
// Enqueues the same kernel twice using the mid-thread preemption fixture while
// the waModifyVFEStateAfterGPGPUPreemption workaround is enabled. The device
// preemption mode is not set here; it is presumably configured by the fixture.
// Expectations:
//  - first enqueue: exactly one LRI to 0x2580 and a GPGPU_CSR_BASE_ADDRESS
//    pointing at the preemption CSR allocation in the CSR stream;
//  - second enqueue: no LRI to 0x2580 and no GPGPU_CSR_BASE_ADDRESS in the
//    newly added CSR commands;
//  - each enqueue adds exactly two LRIs to 0x2600 in the command queue stream,
//    one with data 0xFFFFFFFF and one with data 0x0.
GEN9TEST_F(Gen9MidThreadPreemptionEnqueueKernelTest, givenSecondEnqueueWithTheSamePreemptionRequestThenDontReprogramMidThreadWa) {
    typedef typename FamilyType::MI_LOAD_REGISTER_IMM MI_LOAD_REGISTER_IMM;
    typedef typename FamilyType::GPGPU_CSR_BASE_ADDRESS GPGPU_CSR_BASE_ADDRESS;

    WhitelistedRegisters regs = {};
    regs.csChicken1_0x2580 = true;
    pDevice->setForceWhitelistedRegs(true, &regs);
    const_cast<WorkaroundTable *>(pDevice->getWaTable())->waModifyVFEStateAfterGPGPUPreemption = true;

    auto &csr = pDevice->getUltCommandStreamReceiver<FamilyType>();
    csr.getMemoryManager()->setForce32BitAllocations(false);
    csr.overrideMediaVFEStateDirty(false);
    auto csrSurface = csr.getPreemptionCsrAllocation();
    ASSERT_NE(nullptr, csrSurface);
    HardwareParse hwCsrParser;
    HardwareParse hwCmdQParser;
    size_t off[3] = {0, 0, 0};
    size_t gws[3] = {1, 1, 1};

    int foundWaLri = 0;
    int foundWaLriBegin = 0;
    int foundWaLriEnd = 0;
    // Recounts the LRIs to 0x2600 currently held by the command queue parser,
    // split by data dword (0xFFFFFFFF vs 0x0).
    auto countWaLris = [&]() {
        foundWaLri = 0;
        foundWaLriBegin = 0;
        foundWaLriEnd = 0;
        for (auto it : hwCmdQParser.lriList) {
            auto cmdLri = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
            if (cmdLri->getRegisterOffset() == 0x2600u) {
                foundWaLri++;
                if (cmdLri->getDataDword() == 0xFFFFFFFF) {
                    foundWaLriBegin++;
                }
                if (cmdLri->getDataDword() == 0x0) {
                    foundWaLriEnd++;
                }
            }
        }
    };

    MockKernelWithInternals mockKernel(*pDevice);

    // First enqueue: parse both streams from their beginning.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream);
    hwCsrParser.findHardwareCommands<FamilyType>();
    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS());
    hwCmdQParser.findHardwareCommands<FamilyType>();
    // Remember where the first submission ends so the second parse only sees new commands.
    auto offsetCsr = csr.commandStream.getUsed();
    auto offsetCmdQ = pCmdQ->getCS().getUsed();

    bool foundOneLri = false;
    for (auto it : hwCsrParser.lriList) {
        auto cmdLri = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        if (cmdLri->getRegisterOffset() == 0x2580u) {
            // A second hit would mean the register was programmed more than once.
            EXPECT_FALSE(foundOneLri);
            foundOneLri = true;
        }
    }
    EXPECT_TRUE(foundOneLri);

    countWaLris();
    EXPECT_EQ(2, foundWaLri);
    EXPECT_EQ(1, foundWaLriBegin);
    EXPECT_EQ(1, foundWaLriEnd);

    hwCsrParser.findCsrBaseAddress<FamilyType>();
    ASSERT_NE(nullptr, hwCsrParser.cmdGpgpuCsrBaseAddress);
    auto cmdCsr = genCmdCast<GPGPU_CSR_BASE_ADDRESS *>(hwCsrParser.cmdGpgpuCsrBaseAddress);
    ASSERT_NE(nullptr, cmdCsr);
    EXPECT_EQ(csrSurface->getGpuAddressToPatch(), cmdCsr->getGpgpuCsrBaseAddress());

    // Reset parser state; findCsrBaseAddress only writes the pointer on a hit,
    // so it has to be cleared by hand before the second lookup.
    hwCsrParser.cmdList.clear();
    hwCsrParser.lriList.clear();
    hwCsrParser.cmdGpgpuCsrBaseAddress = nullptr;
    hwCmdQParser.cmdList.clear();
    hwCmdQParser.lriList.clear();

    // Second enqueue: parse only what was appended after the first one.
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, off, gws, nullptr, 0, nullptr, nullptr);
    hwCsrParser.parseCommands<FamilyType>(csr.commandStream, offsetCsr);
    hwCsrParser.findHardwareCommands<FamilyType>();
    hwCmdQParser.parseCommands<FamilyType>(pCmdQ->getCS(), offsetCmdQ);
    hwCmdQParser.findHardwareCommands<FamilyType>();

    for (auto it : hwCsrParser.lriList) {
        auto cmd = genCmdCast<MI_LOAD_REGISTER_IMM *>(it);
        EXPECT_FALSE(cmd->getRegisterOffset() == 0x2580u);
    }

    hwCsrParser.findCsrBaseAddress<FamilyType>();
    EXPECT_EQ(nullptr, hwCsrParser.cmdGpgpuCsrBaseAddress);

    countWaLris();
    EXPECT_EQ(2, foundWaLri);
    EXPECT_EQ(1, foundWaLriBegin);
    EXPECT_EQ(1, foundWaLriEnd);
}
|
|
|
|
|
|
|
|
// With device preemption disabled and no whitelisted registers forced on,
// enqueues a kernel and flushes the queue, then checks that the mock CSR was
// flushed once and that the dispatch flags carry PreemptionMode::Disabled.
GEN9TEST_F(Gen9PreemptionEnqueueKernelTest, givenDisabledPreemptionWhenEnqueueKernelCalledThenPassDisabledPreemptionMode) {
    pDevice->setPreemptionMode(PreemptionMode::Disabled);
    // All fields stay zero-initialized: no register is marked as whitelisted.
    WhitelistedRegisters regs = {};
    pDevice->setForceWhitelistedRegs(true, &regs);
    // The mock CSR is handed over to the device via resetCommandStreamReceiver.
    auto mockCsr = new MockCsrHw2<FamilyType>(pDevice->getHardwareInfo());
    pDevice->resetCommandStreamReceiver(mockCsr);

    MockKernelWithInternals mockKernel(*pDevice);
    EXPECT_EQ(PreemptionMode::Disabled, PreemptionHelper::taskPreemptionMode(*pDevice, mockKernel.mockKernel));

    // One-dimensional dispatch: only gws[0] is relevant.
    size_t gws[3] = {1, 0, 0};
    pCmdQ->enqueueKernel(mockKernel.mockKernel, 1, nullptr, gws, nullptr, 0, nullptr, nullptr);
    pCmdQ->flush();

    EXPECT_EQ(1, mockCsr->flushCalledCount);
    EXPECT_EQ(PreemptionMode::Disabled, mockCsr->passedDispatchFlags.preemptionMode);
}
|
2018-01-02 19:10:34 +08:00
|
|
|
|
|
|
|
// In MidBatch mode the preemption workaround must not reserve any command
// stream space.
GEN9TEST_F(Gen9PreemptionTests, getPreemptionWaCsSizeMidBatch) {
    device->setPreemptionMode(PreemptionMode::MidBatch);

    const size_t noSpace = 0;
    const size_t waCsSize = PreemptionHelper::getPreemptionWaCsSize<FamilyType>(*device);
    EXPECT_EQ(noSpace, waCsSize);
}
|
|
|
|
|
|
|
|
// In ThreadGroup mode with waModifyVFEStateAfterGPGPUPreemption turned off, the
// preemption workaround must not reserve any command stream space.
GEN9TEST_F(Gen9PreemptionTests, getPreemptionWaCsSizeThreadGroupNoWa) {
    device->setPreemptionMode(PreemptionMode::ThreadGroup);
    auto waTableRw = const_cast<WorkaroundTable *>(device->getWaTable());
    waTableRw->waModifyVFEStateAfterGPGPUPreemption = false;

    const size_t noSpace = 0;
    const size_t waCsSize = PreemptionHelper::getPreemptionWaCsSize<FamilyType>(*device);
    EXPECT_EQ(noSpace, waCsSize);
}
|
|
|
|
|
|
|
|
// In ThreadGroup mode with waModifyVFEStateAfterGPGPUPreemption turned on, the
// preemption workaround must reserve room for two MI_LOAD_REGISTER_IMM commands.
GEN9TEST_F(Gen9PreemptionTests, getPreemptionWaCsSizeThreadGroupWa) {
    using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM;

    device->setPreemptionMode(PreemptionMode::ThreadGroup);
    auto waTableRw = const_cast<WorkaroundTable *>(device->getWaTable());
    waTableRw->waModifyVFEStateAfterGPGPUPreemption = true;

    const size_t twoLris = 2 * sizeof(MI_LOAD_REGISTER_IMM);
    const size_t waCsSize = PreemptionHelper::getPreemptionWaCsSize<FamilyType>(*device);
    EXPECT_EQ(twoLris, waCsSize);
}
|
|
|
|
|
|
|
|
// In MidThread mode with waModifyVFEStateAfterGPGPUPreemption turned off, the
// preemption workaround must not reserve any command stream space.
GEN9TEST_F(Gen9PreemptionTests, getPreemptionWaCsSizeMidThreadNoWa) {
    device->setPreemptionMode(PreemptionMode::MidThread);
    auto waTableRw = const_cast<WorkaroundTable *>(device->getWaTable());
    waTableRw->waModifyVFEStateAfterGPGPUPreemption = false;

    const size_t noSpace = 0;
    const size_t waCsSize = PreemptionHelper::getPreemptionWaCsSize<FamilyType>(*device);
    EXPECT_EQ(noSpace, waCsSize);
}
|
|
|
|
|
|
|
|
// In MidThread mode with waModifyVFEStateAfterGPGPUPreemption turned on, the
// preemption workaround must reserve room for two MI_LOAD_REGISTER_IMM commands.
GEN9TEST_F(Gen9PreemptionTests, getPreemptionWaCsSizeMidThreadWa) {
    using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM;

    device->setPreemptionMode(PreemptionMode::MidThread);
    auto waTableRw = const_cast<WorkaroundTable *>(device->getWaTable());
    waTableRw->waModifyVFEStateAfterGPGPUPreemption = true;

    const size_t twoLris = 2 * sizeof(MI_LOAD_REGISTER_IMM);
    const size_t waCsSize = PreemptionHelper::getPreemptionWaCsSize<FamilyType>(*device);
    EXPECT_EQ(twoLris, waCsSize);
}
|