/* * Copyright (C) 2020-2023 Intel Corporation * * SPDX-License-Identifier: MIT * */ #include "shared/source/command_container/command_encoder.h" #include "shared/source/helpers/register_offsets.h" #include "shared/source/indirect_heap/heap_size.h" #include "shared/test/common/cmd_parse/gen_cmd_parse.h" #include "shared/test/common/fixtures/device_fixture.h" #include "shared/test/common/mocks/mock_device.h" #include "shared/test/common/test_macros/hw_test.h" using namespace NEO; using EncodeMathMMIOTest = testing::Test; HWTEST_F(EncodeMathMMIOTest, WhenEncodingAluThenCorrectOpcodesOperandsAdded) { using MI_MATH_ALU_INST_INLINE = typename FamilyType::MI_MATH_ALU_INST_INLINE; MI_MATH_ALU_INST_INLINE aluParam[5]; AluRegisters regA = AluRegisters::R_0; AluRegisters regB = AluRegisters::R_1; AluRegisters finalResultRegister = AluRegisters::R_2; memset(aluParam, 0, sizeof(MI_MATH_ALU_INST_INLINE) * 5); EncodeMathMMIO::encodeAluAdd(aluParam, regA, regB, finalResultRegister); EXPECT_EQ(aluParam[0].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_LOAD)); EXPECT_EQ(aluParam[0].DW0.BitField.Operand1, static_cast(AluRegisters::R_SRCA)); EXPECT_EQ(aluParam[0].DW0.BitField.Operand2, static_cast(regA)); EXPECT_EQ(aluParam[1].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_LOAD)); EXPECT_EQ(aluParam[1].DW0.BitField.Operand1, static_cast(AluRegisters::R_SRCB)); EXPECT_EQ(aluParam[1].DW0.BitField.Operand2, static_cast(regB)); EXPECT_EQ(aluParam[2].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_ADD)); EXPECT_EQ(aluParam[2].DW0.BitField.Operand1, 0u); EXPECT_EQ(aluParam[2].DW0.BitField.Operand2, 0u); EXPECT_EQ(aluParam[3].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_STORE)); EXPECT_EQ(aluParam[3].DW0.BitField.Operand1, static_cast(AluRegisters::R_2)); EXPECT_EQ(aluParam[3].DW0.BitField.Operand2, static_cast(AluRegisters::R_ACCU)); EXPECT_EQ(aluParam[4].DW0.Value, 0u); } HWTEST_F(EncodeMathMMIOTest, WhenEncodingAluSubStoreCarryThenCorrectOpcodesOperandsAdded) { using MI_MATH_ALU_INST_INLINE = typename FamilyType::MI_MATH_ALU_INST_INLINE; MI_MATH_ALU_INST_INLINE aluParam[5]; AluRegisters regA = AluRegisters::R_0; AluRegisters regB = AluRegisters::R_1; AluRegisters finalResultRegister = AluRegisters::R_2; memset(aluParam, 0, sizeof(MI_MATH_ALU_INST_INLINE) * 5); EncodeMathMMIO::encodeAluSubStoreCarry(aluParam, regA, regB, finalResultRegister); EXPECT_EQ(aluParam[0].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_LOAD)); EXPECT_EQ(aluParam[0].DW0.BitField.Operand1, static_cast(AluRegisters::R_SRCA)); EXPECT_EQ(aluParam[0].DW0.BitField.Operand2, static_cast(regA)); EXPECT_EQ(aluParam[1].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_LOAD)); EXPECT_EQ(aluParam[1].DW0.BitField.Operand1, static_cast(AluRegisters::R_SRCB)); EXPECT_EQ(aluParam[1].DW0.BitField.Operand2, static_cast(regB)); EXPECT_EQ(aluParam[2].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_SUB)); EXPECT_EQ(aluParam[2].DW0.BitField.Operand1, 0u); EXPECT_EQ(aluParam[2].DW0.BitField.Operand2, 0u); EXPECT_EQ(aluParam[3].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_STORE)); EXPECT_EQ(aluParam[3].DW0.BitField.Operand1, static_cast(AluRegisters::R_2)); EXPECT_EQ(aluParam[3].DW0.BitField.Operand2, static_cast(AluRegisters::R_CF)); EXPECT_EQ(aluParam[4].DW0.Value, 0u); } HWTEST_F(EncodeMathMMIOTest, givenAluRegistersWhenEncodeAluAndIsCalledThenAluParamHasCorrectOpcodesAndOperands) { using MI_MATH_ALU_INST_INLINE = typename FamilyType::MI_MATH_ALU_INST_INLINE; MI_MATH_ALU_INST_INLINE aluParam[5]; AluRegisters regA = AluRegisters::R_0; AluRegisters regB = AluRegisters::R_1; AluRegisters finalResultRegister = AluRegisters::R_2; memset(aluParam, 0, sizeof(MI_MATH_ALU_INST_INLINE) * 5); EncodeMathMMIO::encodeAluAnd(aluParam, regA, regB, finalResultRegister); EXPECT_EQ(aluParam[0].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_LOAD)); EXPECT_EQ(aluParam[0].DW0.BitField.Operand1, static_cast(AluRegisters::R_SRCA)); EXPECT_EQ(aluParam[0].DW0.BitField.Operand2, static_cast(regA)); EXPECT_EQ(aluParam[1].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_LOAD)); EXPECT_EQ(aluParam[1].DW0.BitField.Operand1, static_cast(AluRegisters::R_SRCB)); EXPECT_EQ(aluParam[1].DW0.BitField.Operand2, static_cast(regB)); EXPECT_EQ(aluParam[2].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_AND)); EXPECT_EQ(aluParam[2].DW0.BitField.Operand1, 0u); EXPECT_EQ(aluParam[2].DW0.BitField.Operand2, 0u); EXPECT_EQ(aluParam[3].DW0.BitField.ALUOpcode, static_cast(AluRegisters::OPCODE_STORE)); EXPECT_EQ(aluParam[3].DW0.BitField.Operand1, static_cast(AluRegisters::R_2)); EXPECT_EQ(aluParam[3].DW0.BitField.Operand2, static_cast(AluRegisters::R_ACCU)); EXPECT_EQ(aluParam[4].DW0.Value, 0u); } using CommandEncoderMathTest = Test; HWTEST_F(CommandEncoderMathTest, WhenReservingCommandThenBitfieldSetCorrectly) { using MI_MATH = typename FamilyType::MI_MATH; GenCmdList commands; CommandContainer cmdContainer; cmdContainer.initialize(pDevice, nullptr, HeapSize::defaultHeapSize, true, false); EncodeMath::commandReserve(cmdContainer); CmdParse::parseCommandBuffer(commands, ptrOffset(cmdContainer.getCommandStream()->getCpuBase(), 0), cmdContainer.getCommandStream()->getUsed()); auto itor = commands.begin(); itor = find(itor, commands.end()); ASSERT_NE(itor, commands.end()); auto cmdMATH = genCmdCast(*itor); EXPECT_EQ(cmdMATH->DW0.BitField.InstructionType, static_cast(MI_MATH::COMMAND_TYPE_MI_COMMAND)); EXPECT_EQ(cmdMATH->DW0.BitField.InstructionOpcode, static_cast(MI_MATH::MI_COMMAND_OPCODE_MI_MATH)); EXPECT_EQ(cmdMATH->DW0.BitField.DwordLength, static_cast(NUM_ALU_INST_FOR_READ_MODIFY_WRITE - 1)); } HWTEST_F(CommandEncoderMathTest, givenOffsetAndValueWhenEncodeBitwiseAndValIsCalledThenContainerHasCorrectMathCommands) { using MI_LOAD_REGISTER_REG = typename FamilyType::MI_LOAD_REGISTER_REG; using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM; using MI_MATH = typename FamilyType::MI_MATH; using MI_STORE_REGISTER_MEM = typename FamilyType::MI_STORE_REGISTER_MEM; GenCmdList commands; CommandContainer cmdContainer; cmdContainer.initialize(pDevice, nullptr, HeapSize::defaultHeapSize, true, false); constexpr uint32_t regOffset = 0x2000u; constexpr uint32_t immVal = 0xbaau; constexpr uint64_t dstAddress = 0xDEADCAF0u; EncodeMathMMIO::encodeBitwiseAndVal(cmdContainer, regOffset, immVal, dstAddress, false); CmdParse::parseCommandBuffer(commands, ptrOffset(cmdContainer.getCommandStream()->getCpuBase(), 0), cmdContainer.getCommandStream()->getUsed()); auto itor = find(commands.begin(), commands.end()); // load regOffset to R13 EXPECT_NE(commands.end(), itor); auto cmdLoadReg = genCmdCast(*itor); EXPECT_EQ(cmdLoadReg->getSourceRegisterAddress(), regOffset); EXPECT_EQ(cmdLoadReg->getDestinationRegisterAddress(), CS_GPR_R13); // load immVal to R14 itor++; EXPECT_NE(commands.end(), itor); auto cmdLoadImm = genCmdCast(*itor); EXPECT_EQ(cmdLoadImm->getRegisterOffset(), CS_GPR_R14); EXPECT_EQ(cmdLoadImm->getDataDword(), immVal); // encodeAluAnd should have its own unit tests, so we only check // that the MI_MATH exists and length is set to 3u itor++; EXPECT_NE(commands.end(), itor); auto cmdMath = genCmdCast(*itor); EXPECT_EQ(cmdMath->DW0.BitField.DwordLength, 3u); // store R15 to address itor++; EXPECT_NE(commands.end(), itor); auto cmdMem = genCmdCast(*itor); EXPECT_EQ(cmdMem->getRegisterAddress(), CS_GPR_R15); EXPECT_EQ(cmdMem->getMemoryAddress(), dstAddress); } HWTEST_F(CommandEncoderMathTest, WhenSettingGroupSizeIndirectThenCommandsAreCorrect) { using MI_MATH = typename FamilyType::MI_MATH; using MI_MATH_ALU_INST_INLINE = typename FamilyType::MI_MATH_ALU_INST_INLINE; using MI_STORE_REGISTER_MEM = typename FamilyType::MI_STORE_REGISTER_MEM; CommandContainer cmdContainer; cmdContainer.initialize(pDevice, nullptr, HeapSize::defaultHeapSize, true, false); CrossThreadDataOffset offsets[3] = {0, sizeof(uint32_t), 2 * sizeof(uint32_t)}; uint32_t crossThreadAddress[3] = {}; uint32_t lws[3] = {2, 1, 1}; EncodeIndirectParams::setGlobalWorkSizeIndirect(cmdContainer, offsets, reinterpret_cast(crossThreadAddress), lws); GenCmdList commands; CmdParse::parseCommandBuffer(commands, ptrOffset(cmdContainer.getCommandStream()->getCpuBase(), 0), cmdContainer.getCommandStream()->getUsed()); auto itor = commands.begin(); itor = find(itor, commands.end()); ASSERT_NE(itor, commands.end()); itor = find(itor, commands.end()); ASSERT_NE(itor, commands.end()); } HWTEST_F(CommandEncoderMathTest, WhenSettingGroupCountIndirectThenCommandsAreCorrect) { using MI_MATH = typename FamilyType::MI_MATH; using MI_MATH_ALU_INST_INLINE = typename FamilyType::MI_MATH_ALU_INST_INLINE; using MI_STORE_REGISTER_MEM = typename FamilyType::MI_STORE_REGISTER_MEM; CommandContainer cmdContainer; cmdContainer.initialize(pDevice, nullptr, HeapSize::defaultHeapSize, true, false); CrossThreadDataOffset offsets[3] = {0, sizeof(uint32_t), 2 * sizeof(uint32_t)}; uint32_t crossThreadAddress[3] = {}; EncodeIndirectParams::setGroupCountIndirect(cmdContainer, offsets, reinterpret_cast(crossThreadAddress)); GenCmdList commands; CmdParse::parseCommandBuffer(commands, ptrOffset(cmdContainer.getCommandStream()->getCpuBase(), 0), cmdContainer.getCommandStream()->getUsed()); auto itor = commands.begin(); itor = find(itor, commands.end()); ASSERT_NE(itor, commands.end()); itor = find(++itor, commands.end()); ASSERT_NE(itor, commands.end()); itor = find(++itor, commands.end()); ASSERT_NE(itor, commands.end()); itor = find(++itor, commands.end()); ASSERT_EQ(itor, commands.end()); } using CommandEncodeAluTests = ::testing::Test; HWTEST_F(CommandEncodeAluTests, whenAskingForIncrementOrDecrementCmdsSizeThenReturnCorrectValue) { constexpr size_t expectedSize = (2 * sizeof(typename FamilyType::MI_LOAD_REGISTER_IMM)) + sizeof(typename FamilyType::MI_MATH) + (4 * sizeof(typename FamilyType::MI_MATH_ALU_INST_INLINE)); EXPECT_EQ(EncodeMathMMIO::getCmdSizeForIncrementOrDecrement(), expectedSize); } HWTEST_F(CommandEncodeAluTests, whenProgrammingIncrementOperationThenUseCorrectAluCommands) { using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM; using MI_MATH_ALU_INST_INLINE = typename FamilyType::MI_MATH_ALU_INST_INLINE; using MI_MATH = typename FamilyType::MI_MATH; constexpr size_t bufferSize = EncodeMathMMIO::getCmdSizeForIncrementOrDecrement(); constexpr AluRegisters incRegister = AluRegisters::R_1; uint8_t buffer[bufferSize] = {}; LinearStream cmdStream(buffer, bufferSize); EncodeMathMMIO::encodeIncrement(cmdStream, incRegister); EXPECT_EQ(bufferSize, cmdStream.getUsed()); auto lriCmd = reinterpret_cast(buffer); EXPECT_EQ(lriCmd->getRegisterOffset(), CS_GPR_R7); EXPECT_EQ(lriCmd->getDataDword(), 1u); lriCmd++; EXPECT_EQ(CS_GPR_R7 + 4, lriCmd->getRegisterOffset()); EXPECT_EQ(0u, lriCmd->getDataDword()); auto miMathCmd = reinterpret_cast(++lriCmd); EXPECT_EQ(3u, miMathCmd->DW0.BitField.DwordLength); auto miAluCmd = reinterpret_cast(++miMathCmd); EXPECT_EQ(static_cast(AluRegisters::OPCODE_LOAD), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(static_cast(AluRegisters::R_SRCA), miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(static_cast(incRegister), miAluCmd->DW0.BitField.Operand2); miAluCmd++; EXPECT_EQ(static_cast(AluRegisters::OPCODE_LOAD), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(static_cast(AluRegisters::R_SRCB), miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(static_cast(AluRegisters::R_7), miAluCmd->DW0.BitField.Operand2); miAluCmd++; EXPECT_EQ(static_cast(AluRegisters::OPCODE_ADD), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(0u, miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(0u, miAluCmd->DW0.BitField.Operand2); miAluCmd++; EXPECT_EQ(static_cast(AluRegisters::OPCODE_STORE), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(static_cast(incRegister), miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(static_cast(AluRegisters::R_ACCU), miAluCmd->DW0.BitField.Operand2); } HWTEST_F(CommandEncodeAluTests, whenProgrammingDecrementOperationThenUseCorrectAluCommands) { using MI_LOAD_REGISTER_IMM = typename FamilyType::MI_LOAD_REGISTER_IMM; using MI_MATH_ALU_INST_INLINE = typename FamilyType::MI_MATH_ALU_INST_INLINE; using MI_MATH = typename FamilyType::MI_MATH; constexpr size_t bufferSize = EncodeMathMMIO::getCmdSizeForIncrementOrDecrement(); constexpr AluRegisters decRegister = AluRegisters::R_1; uint8_t buffer[bufferSize] = {}; LinearStream cmdStream(buffer, bufferSize); EncodeMathMMIO::encodeDecrement(cmdStream, decRegister); EXPECT_EQ(bufferSize, cmdStream.getUsed()); auto lriCmd = reinterpret_cast(buffer); EXPECT_EQ(lriCmd->getRegisterOffset(), CS_GPR_R7); EXPECT_EQ(lriCmd->getDataDword(), 1u); lriCmd++; EXPECT_EQ(CS_GPR_R7 + 4, lriCmd->getRegisterOffset()); EXPECT_EQ(0u, lriCmd->getDataDword()); auto miMathCmd = reinterpret_cast(++lriCmd); EXPECT_EQ(3u, miMathCmd->DW0.BitField.DwordLength); auto miAluCmd = reinterpret_cast(++miMathCmd); EXPECT_EQ(static_cast(AluRegisters::OPCODE_LOAD), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(static_cast(AluRegisters::R_SRCA), miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(static_cast(decRegister), miAluCmd->DW0.BitField.Operand2); miAluCmd++; EXPECT_EQ(static_cast(AluRegisters::OPCODE_LOAD), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(static_cast(AluRegisters::R_SRCB), miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(static_cast(AluRegisters::R_7), miAluCmd->DW0.BitField.Operand2); miAluCmd++; EXPECT_EQ(static_cast(AluRegisters::OPCODE_SUB), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(0u, miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(0u, miAluCmd->DW0.BitField.Operand2); miAluCmd++; EXPECT_EQ(static_cast(AluRegisters::OPCODE_STORE), miAluCmd->DW0.BitField.ALUOpcode); EXPECT_EQ(static_cast(decRegister), miAluCmd->DW0.BitField.Operand1); EXPECT_EQ(static_cast(AluRegisters::R_ACCU), miAluCmd->DW0.BitField.Operand2); }