Remove deprecated code

Signed-off-by: Bartosz Dunajski <bartosz.dunajski@intel.com>
This commit is contained in:
Bartosz Dunajski
2021-12-14 09:15:22 +00:00
committed by Compute-Runtime-Automation
parent 4ae2f6e111
commit fe8cb190bc
21 changed files with 2 additions and 111 deletions

View File

@@ -36,7 +36,6 @@ class Kernel;
class MemObj; class MemObj;
class PerformanceCounters; class PerformanceCounters;
struct CompletionStamp; struct CompletionStamp;
struct DispatchGlobalsArgs;
struct MultiDispatchInfo; struct MultiDispatchInfo;
enum class QueuePriority { enum class QueuePriority {
@@ -188,8 +187,6 @@ class CommandQueue : public BaseObject<_cl_command_queue> {
const cl_event *eventWaitList, cl_event *event) = 0; const cl_event *eventWaitList, cl_event *event) = 0;
virtual cl_int finish() = 0; virtual cl_int finish() = 0;
// Pure-virtual (= 0): each concrete CommandQueue must provide its own implementation.
// Takes a DispatchGlobalsArgs pointer plus an event wait list and an output event; returns a cl_int status.
virtual cl_int enqueueInitDispatchGlobals(DispatchGlobalsArgs *dispatchGlobalsArgs, cl_uint numEventsInWaitList,
const cl_event *eventWaitList, cl_event *event) = 0;
virtual cl_int flush() = 0; virtual cl_int flush() = 0;

View File

@@ -341,10 +341,6 @@ class CommandQueueHw : public CommandQueue {
cl_event *event) override; cl_event *event) override;
cl_int finish() override; cl_int finish() override;
// Override declaration of the base-class enqueueInitDispatchGlobals; the body is defined outside the class.
cl_int enqueueInitDispatchGlobals(DispatchGlobalsArgs *dispatchGlobalsArgs,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) override;
cl_int flush() override; cl_int flush() override;
template <uint32_t enqueueType> template <uint32_t enqueueType>

View File

@@ -1,23 +0,0 @@
/*
* Copyright (C) 2020-2021 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
*/
#pragma once
#include "opencl/source/command_queue/command_queue_hw.h"
namespace NEO {
// Argument type accepted by enqueueInitDispatchGlobals. It declares no members here,
// so it carries no data and serves only as a placeholder type.
struct DispatchGlobalsArgs {
};
// Stub implementation shared by every GfxFamily instantiation that includes this header.
// None of the parameters are read; the call always fails.
// Returns: CL_INVALID_VALUE unconditionally.
template <typename GfxFamily>
cl_int CommandQueueHw<GfxFamily>::enqueueInitDispatchGlobals(DispatchGlobalsArgs *dispatchGlobalsArgs,
cl_uint numEventsInWaitList,
const cl_event *eventWaitList,
cl_event *event) {
return CL_INVALID_VALUE;
}
} // namespace NEO

View File

@@ -794,7 +794,6 @@ CompletionStamp CommandQueueHw<GfxFamily>::enqueueNonBlocked(
uint32_t numGrfRequired = GrfConfig::DefaultGrfNumber; uint32_t numGrfRequired = GrfConfig::DefaultGrfNumber;
auto specialPipelineSelectMode = false; auto specialPipelineSelectMode = false;
Kernel *kernel = nullptr; Kernel *kernel = nullptr;
bool usePerDssBackedBuffer = false;
bool auxTranslationRequired = false; bool auxTranslationRequired = false;
bool useGlobalAtomics = false; bool useGlobalAtomics = false;
@@ -815,10 +814,6 @@ CompletionStamp CommandQueueHw<GfxFamily>::enqueueNonBlocked(
anyUncacheableArgs = true; anyUncacheableArgs = true;
} }
if (kernel->requiresPerDssBackedBuffer()) {
usePerDssBackedBuffer = true;
}
if (kernel->getKernelInfo().kernelDescriptor.kernelAttributes.flags.useGlobalAtomics) { if (kernel->getKernelInfo().kernelDescriptor.kernelAttributes.flags.useGlobalAtomics) {
useGlobalAtomics = true; useGlobalAtomics = true;
} }
@@ -889,7 +884,7 @@ CompletionStamp CommandQueueHw<GfxFamily>::enqueueNonBlocked(
implicitFlush, //implicitFlush implicitFlush, //implicitFlush
!eventBuilder.getEvent() || getGpgpuCommandStreamReceiver().isNTo1SubmissionModelEnabled(), //outOfOrderExecutionAllowed !eventBuilder.getEvent() || getGpgpuCommandStreamReceiver().isNTo1SubmissionModelEnabled(), //outOfOrderExecutionAllowed
false, //epilogueRequired false, //epilogueRequired
usePerDssBackedBuffer, //usePerDssBackedBuffer false, //usePerDssBackedBuffer
kernel->isSingleSubdevicePreferred(), //useSingleSubdevice kernel->isSingleSubdevicePreferred(), //useSingleSubdevice
useGlobalAtomics, //useGlobalAtomics useGlobalAtomics, //useGlobalAtomics
kernel->areMultipleSubDevicesInContext(), //areMultipleSubDevicesInContext kernel->areMultipleSubDevicesInContext(), //areMultipleSubDevicesInContext

View File

@@ -13,8 +13,6 @@
#include "opencl/source/command_queue/command_queue_hw_enabled_device_enqueue.inl" #include "opencl/source/command_queue/command_queue_hw_enabled_device_enqueue.inl"
#include "opencl/source/command_queue/enqueue_resource_barrier.h" #include "opencl/source/command_queue/enqueue_resource_barrier.h"
#include "enqueue_init_dispatch_globals.h"
namespace NEO { namespace NEO {
typedef ICLFamily Family; typedef ICLFamily Family;

View File

@@ -12,7 +12,6 @@
#include "opencl/source/command_queue/command_queue_hw_disabled_device_enqueue.inl" #include "opencl/source/command_queue/command_queue_hw_disabled_device_enqueue.inl"
#include "command_queue_helpers_gen12lp.inl" #include "command_queue_helpers_gen12lp.inl"
#include "enqueue_init_dispatch_globals.h"
namespace NEO { namespace NEO {

View File

@@ -13,8 +13,6 @@
#include "opencl/source/command_queue/command_queue_hw_disabled_device_enqueue.inl" #include "opencl/source/command_queue/command_queue_hw_disabled_device_enqueue.inl"
#include "opencl/source/command_queue/enqueue_resource_barrier.h" #include "opencl/source/command_queue/enqueue_resource_barrier.h"
#include "enqueue_init_dispatch_globals.h"
namespace NEO { namespace NEO {
typedef BDWFamily Family; typedef BDWFamily Family;

View File

@@ -13,8 +13,6 @@
#include "opencl/source/command_queue/command_queue_hw_enabled_device_enqueue.inl" #include "opencl/source/command_queue/command_queue_hw_enabled_device_enqueue.inl"
#include "opencl/source/command_queue/enqueue_resource_barrier.h" #include "opencl/source/command_queue/enqueue_resource_barrier.h"
#include "enqueue_init_dispatch_globals.h"
namespace NEO { namespace NEO {
typedef SKLFamily Family; typedef SKLFamily Family;

View File

@@ -247,7 +247,7 @@ CompletionStamp &CommandComputeKernel::submit(uint32_t taskLevel, bool terminate
false, //implicitFlush false, //implicitFlush
commandQueue.getGpgpuCommandStreamReceiver().isNTo1SubmissionModelEnabled(), //outOfOrderExecutionAllowed commandQueue.getGpgpuCommandStreamReceiver().isNTo1SubmissionModelEnabled(), //outOfOrderExecutionAllowed
false, //epilogueRequired false, //epilogueRequired
kernel->requiresPerDssBackedBuffer(), //usePerDssBackedBuffer false, //usePerDssBackedBuffer
kernel->isSingleSubdevicePreferred(), //useSingleSubdevice kernel->isSingleSubdevicePreferred(), //useSingleSubdevice
kernel->getKernelInfo().kernelDescriptor.kernelAttributes.flags.useGlobalAtomics, //useGlobalAtomics kernel->getKernelInfo().kernelDescriptor.kernelAttributes.flags.useGlobalAtomics, //useGlobalAtomics
kernel->areMultipleSubDevicesInContext(), //areMultipleSubDevicesInContext kernel->areMultipleSubDevicesInContext(), //areMultipleSubDevicesInContext

View File

@@ -384,7 +384,6 @@ class Kernel : public ReferenceTrackedObject<Kernel> {
const bool kernelUsesLocalIds, const bool kernelUsesLocalIds,
const bool isCssUsed) const; const bool isCssUsed) const;
bool requiresPerDssBackedBuffer() const;
bool requiresLimitedWorkgroupSize() const; bool requiresLimitedWorkgroupSize() const;
bool isKernelDebugEnabled() const { return debugEnabled; } bool isKernelDebugEnabled() const { return debugEnabled; }
int32_t setAdditionalKernelExecInfoWithParam(uint32_t paramName, size_t paramValueSize, const void *paramValue); int32_t setAdditionalKernelExecInfoWithParam(uint32_t paramName, size_t paramValueSize, const void *paramValue);

View File

@@ -12,10 +12,6 @@
namespace NEO { namespace NEO {
// Reports the current value of the ForcePerDssBackedBufferProgramming debug flag.
// No kernel state is consulted: the result depends on the debug flag alone.
bool Kernel::requiresPerDssBackedBuffer() const {
return DebugManager.flags.ForcePerDssBackedBufferProgramming.get();
}
int32_t Kernel::setAdditionalKernelExecInfoWithParam(uint32_t paramName, size_t paramValueSize, const void *paramValue) { int32_t Kernel::setAdditionalKernelExecInfoWithParam(uint32_t paramName, size_t paramValueSize, const void *paramValue) {
return CL_INVALID_VALUE; return CL_INVALID_VALUE;
} }

View File

@@ -11,8 +11,6 @@
#include "opencl/source/command_queue/command_queue_hw.h" #include "opencl/source/command_queue/command_queue_hw.h"
#include "opencl/source/command_queue/enqueue_resource_barrier.h" #include "opencl/source/command_queue/enqueue_resource_barrier.h"
#include "enqueue_init_dispatch_globals.h"
namespace NEO { namespace NEO {
using Family = XeHpFamily; using Family = XeHpFamily;

View File

@@ -11,8 +11,6 @@
#include "opencl/source/command_queue/command_queue_hw.h" #include "opencl/source/command_queue/command_queue_hw.h"
#include "opencl/source/command_queue/enqueue_resource_barrier.h" #include "opencl/source/command_queue/enqueue_resource_barrier.h"
#include "enqueue_init_dispatch_globals.h"
namespace NEO { namespace NEO {
using Family = XE_HPC_COREFamily; using Family = XE_HPC_COREFamily;

View File

@@ -11,8 +11,6 @@
#include "opencl/source/command_queue/command_queue_hw.h" #include "opencl/source/command_queue/command_queue_hw.h"
#include "opencl/source/command_queue/enqueue_resource_barrier.h" #include "opencl/source/command_queue/enqueue_resource_barrier.h"
#include "enqueue_init_dispatch_globals.h"
namespace NEO { namespace NEO {
using Family = XE_HPG_COREFamily; using Family = XE_HPG_COREFamily;

View File

@@ -1486,27 +1486,6 @@ HWTEST_F(CommandQueueHwTest, givenFinishWhenFlushBatchedSubmissionsFailsThenErro
EXPECT_EQ(CL_OUT_OF_RESOURCES, errorCode); EXPECT_EQ(CL_OUT_OF_RESOURCES, errorCode);
} }
// Calls enqueueInitDispatchGlobals on the fixture queue with a null args pointer, zero wait events
// and no output event, and expects CL_INVALID_VALUE.
HWTEST_F(CommandQueueHwTest, givenEmptyDispatchGlobalsArgsWhenEnqueueInitDispatchGlobalsCalledThenErrorIsReturned) {
EXPECT_EQ(CL_INVALID_VALUE, pCmdQ->enqueueInitDispatchGlobals(nullptr, 0, nullptr, nullptr));
}
// Sets the ForcePerDssBackedBufferProgramming debug flag, enqueues a mock kernel, and checks that
// the dispatch flags recorded by the command stream receiver have usePerDssBackedBuffer set.
HWTEST_F(CommandQueueHwTest, WhenForcePerDssBackedBufferProgrammingSetThenDispatchFlagsAreSetAccordingly) {
// NOTE(review): presumably restores debug flags when it leaves scope - confirm against DebugManagerStateRestore.
DebugManagerStateRestore restore;
DebugManager.flags.ForcePerDssBackedBufferProgramming = true;
MockKernelWithInternals mockKernelWithInternals(*pClDevice);
auto mockKernel = mockKernelWithInternals.mockKernel;
auto &csr = pDevice->getUltCommandStreamReceiver<FamilyType>();
// NOTE(review): gws/lws look like global/local work sizes for a 1-dimensional enqueue - confirm against enqueueKernel.
size_t offset = 0;
size_t gws = 64;
size_t lws = 16;
cl_int status = pCmdQ->enqueueKernel(mockKernel, 1, &offset, &gws, &lws, 0, nullptr, nullptr);
// The enqueue itself must succeed before the recorded flags are inspected.
EXPECT_EQ(CL_SUCCESS, status);
EXPECT_TRUE(csr.recordedDispatchFlags.usePerDssBackedBuffer);
}
template <bool ooq> template <bool ooq>
struct CommandQueueHwBlitTest : ClDeviceFixture, ContextFixture, CommandQueueHwFixture, ::testing::Test { struct CommandQueueHwBlitTest : ClDeviceFixture, ContextFixture, CommandQueueHwFixture, ::testing::Test {
using ContextFixture::SetUp; using ContextFixture::SetUp;

View File

@@ -1251,18 +1251,6 @@ TEST(CommandQueue, GivenCommandQueueWhenCheckingIfIsCacheFlushCommandCalledThenF
EXPECT_FALSE(isCommandCacheFlush); EXPECT_FALSE(isCommandCacheFlush);
} }
// Calls enqueueInitDispatchGlobals on a MockCommandQueue with null/zero arguments and
// expects CL_SUCCESS.
TEST(CommandQueue, GivenCommandQueueWhenEnqueueInitDispatchGlobalsCalledThenSuccessReturned) {
MockContext context;
MockCommandQueue cmdQ(&context, nullptr, 0, false);
cl_int result = cmdQ.enqueueInitDispatchGlobals(
nullptr,
0,
nullptr,
nullptr);
EXPECT_EQ(CL_SUCCESS, result);
}
TEST(CommandQueue, givenBlitterOperationsSupportedWhenCreatingQueueThenTimestampPacketIsCreated) { TEST(CommandQueue, givenBlitterOperationsSupportedWhenCreatingQueueThenTimestampPacketIsCreated) {
DebugManagerStateRestore restore; DebugManagerStateRestore restore;
DebugManager.flags.EnableTimestampPacket.set(0); DebugManager.flags.EnableTimestampPacket.set(0);

View File

@@ -6,7 +6,6 @@
*/ */
#include "shared/source/helpers/l3_range.h" #include "shared/source/helpers/l3_range.h"
#include "shared/source/helpers/ray_tracing_helper.h"
#include "shared/test/common/cmd_parse/hw_parse.h" #include "shared/test/common/cmd_parse/hw_parse.h"
#include "shared/test/common/helpers/debug_manager_state_restore.h" #include "shared/test/common/helpers/debug_manager_state_restore.h"
#include "shared/test/common/mocks/mock_csr.h" #include "shared/test/common/mocks/mock_csr.h"

View File

@@ -3027,23 +3027,6 @@ TEST(KernelTest, givenKernelLocalIdGenerationByRuntimeFalseAndLocalIdsNotUsedWhe
device->getMemoryManager()->freeGraphicsMemory(mockKernel.kernelInfo.getGraphicsAllocation()); device->getMemoryManager()->freeGraphicsMemory(mockKernel.kernelInfo.getGraphicsAllocation());
} }
// With ForcePerDssBackedBufferProgramming set to true, a mock kernel is expected to report
// requiresPerDssBackedBuffer() == true.
TEST(KernelTest, givenKernelWhenForcePerDssBackedBufferProgrammingIsSetThenKernelRequiresPerDssBackedBuffer) {
// NOTE(review): presumably restores debug flags when it leaves scope - confirm against DebugManagerStateRestore.
DebugManagerStateRestore restore;
DebugManager.flags.ForcePerDssBackedBufferProgramming.set(true);
auto device = clUniquePtr(new MockClDevice(MockDevice::createWithNewExecutionEnvironment<MockDevice>(defaultHwInfo.get())));
MockKernelWithInternals kernel(*device);
EXPECT_TRUE(kernel.mockKernel->requiresPerDssBackedBuffer());
}
// Without touching the debug flag, a mock kernel is expected to report
// requiresPerDssBackedBuffer() == false.
TEST(KernelTest, givenKernelWhenForcePerDssBackedBufferProgrammingIsNotSetThenKernelDoesntRequirePerDssBackedBuffer) {
auto device = clUniquePtr(new MockClDevice(MockDevice::createWithNewExecutionEnvironment<MockDevice>(defaultHwInfo.get())));
MockKernelWithInternals kernel(*device);
EXPECT_FALSE(kernel.mockKernel->requiresPerDssBackedBuffer());
}
TEST(KernelTest, whenKernelIsInitializedThenThreadArbitrationPolicyIsSetToDefaultValue) { TEST(KernelTest, whenKernelIsInitializedThenThreadArbitrationPolicyIsSetToDefaultValue) {
UltClDeviceFactory deviceFactory{1, 0}; UltClDeviceFactory deviceFactory{1, 0};

View File

@@ -198,9 +198,6 @@ class MockCommandQueue : public CommandQueue {
cl_int finish() override { return CL_SUCCESS; } cl_int finish() override { return CL_SUCCESS; }
// Mock override: ignores all arguments and always reports CL_SUCCESS.
cl_int enqueueInitDispatchGlobals(DispatchGlobalsArgs *dispatchGlobalsArgs, cl_uint numEventsInWaitList,
const cl_event *eventWaitList, cl_event *event) override { return CL_SUCCESS; }
cl_int flush() override { return CL_SUCCESS; } cl_int flush() override { return CL_SUCCESS; }
bool obtainTimestampPacketForCacheFlush(bool isCacheFlushRequired) const override { return isCacheFlushRequired; } bool obtainTimestampPacketForCacheFlush(bool isCacheFlushRequired) const override { return isCacheFlushRequired; }

View File

@@ -182,7 +182,6 @@ AllocateSharedAllocationsWithCpuAndGpuStorage = -1
UseMaxSimdSizeToDeduceMaxWorkgroupSize = 0 UseMaxSimdSizeToDeduceMaxWorkgroupSize = 0
ReturnRawGpuTimestamps = 0 ReturnRawGpuTimestamps = 0
EnableDeviceBasedTimestamps = 0 EnableDeviceBasedTimestamps = 0
ForcePerDssBackedBufferProgramming = 0
MaxHwThreadsPercent = 0 MaxHwThreadsPercent = 0
MinHwThreadsUnoccupied = 0 MinHwThreadsUnoccupied = 0
LimitBlitterMaxWidth = -1 LimitBlitterMaxWidth = -1

View File

@@ -374,7 +374,6 @@ DECLARE_DEBUG_VARIABLE(int32_t, ForceHostPointerImport, -1, "-1: default, 0: dis
DECLARE_DEBUG_VARIABLE(bool, UseMaxSimdSizeToDeduceMaxWorkgroupSize, false, "With this flag on, max workgroup size is deduced using SIMD32 instead of SIMD8, this causes the max wkg size to be 4 times bigger") DECLARE_DEBUG_VARIABLE(bool, UseMaxSimdSizeToDeduceMaxWorkgroupSize, false, "With this flag on, max workgroup size is deduced using SIMD32 instead of SIMD8, this causes the max wkg size to be 4 times bigger")
DECLARE_DEBUG_VARIABLE(bool, ReturnRawGpuTimestamps, false, "Driver returns raw GPU tiemstamps instead of calculated ones.") DECLARE_DEBUG_VARIABLE(bool, ReturnRawGpuTimestamps, false, "Driver returns raw GPU tiemstamps instead of calculated ones.")
DECLARE_DEBUG_VARIABLE(bool, EnableDeviceBasedTimestamps, false, "Driver returns timestamps in nanoseconds based on device timer.") DECLARE_DEBUG_VARIABLE(bool, EnableDeviceBasedTimestamps, false, "Driver returns timestamps in nanoseconds based on device timer.")
DECLARE_DEBUG_VARIABLE(bool, ForcePerDssBackedBufferProgramming, false, "Always program per-DSS memory backed buffer in preamble")
DECLARE_DEBUG_VARIABLE(bool, UseCommandBufferHeaderSizeForWddmQueueSubmission, true, "0: Page size (4096), 1: sizeof(COMMAND_BUFFER_HEADER)") DECLARE_DEBUG_VARIABLE(bool, UseCommandBufferHeaderSizeForWddmQueueSubmission, true, "0: Page size (4096), 1: sizeof(COMMAND_BUFFER_HEADER)")
DECLARE_DEBUG_VARIABLE(bool, DisableDeepBind, false, "Disable passing RTLD_DEEPBIND flag to all dlopen calls.") DECLARE_DEBUG_VARIABLE(bool, DisableDeepBind, false, "Disable passing RTLD_DEEPBIND flag to all dlopen calls.")
DECLARE_DEBUG_VARIABLE(bool, UseUmKmDataTranslator, false, "Use helper library for UMD<->KMD (WDDM) struct layout compatibility") DECLARE_DEBUG_VARIABLE(bool, UseUmKmDataTranslator, false, "Use helper library for UMD<->KMD (WDDM) struct layout compatibility")