compute-runtime/opencl/source/device_queue/device_queue.h

140 lines
5.2 KiB
C++

/*
* Copyright (C) 2018-2021 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
*/
#pragma once
#include "shared/source/helpers/hw_info.h"
#include "shared/source/indirect_heap/indirect_heap.h"
#include "shared/source/memory_manager/graphics_allocation.h"
#include "opencl/source/api/cl_types.h"
#include "opencl/source/execution_model/device_enqueue.h"
#include "opencl/source/helpers/base_object.h"
namespace NEO {
class ClDevice;
class CommandQueue;
class Context;
class Device;
class Kernel;
class Event;
struct MultiDispatchInfo;
class SchedulerKernel;
class HwTimeStamps;
class TagNodeBase;
template <>
struct OpenCLObjectMapper<_device_queue> {
typedef class DeviceQueue DerivedType;
};
class DeviceQueue : public BaseObject<_device_queue> {
public:
static const cl_ulong objectMagic = 0x1734547890087154LL;
DeviceQueue() {
for (uint32_t i = 0; i < IndirectHeap::NUM_TYPES; i++) {
heaps[i] = nullptr;
}
offsetDsh = 0;
}
DeviceQueue(Context *context, ClDevice *device, cl_queue_properties &properties);
~DeviceQueue() override;
Device &getDevice();
ClDevice *getClDevice() const;
Context &getContext() { return *context; }
cl_uint getQueueSize() { return queueSize; }
cl_command_queue_properties getCommandQueueProperties() const { return commandQueueProperties; }
const std::vector<uint64_t> &getPropertiesVector() const { return propertiesVector; }
GraphicsAllocation *getQueueBuffer() { return queueBuffer; }
GraphicsAllocation *getEventPoolBuffer() { return eventPoolBuffer; }
GraphicsAllocation *getSlbBuffer() { return slbBuffer; }
GraphicsAllocation *getStackBuffer() { return stackBuffer; }
GraphicsAllocation *getQueueStorageBuffer() { return queueStorageBuffer; }
GraphicsAllocation *getDshBuffer() { return dshBuffer; }
GraphicsAllocation *getDebugQueue() { return debugQueue; }
bool isProfilingEnabled() {
return !!(commandQueueProperties & CL_QUEUE_PROFILING_ENABLE);
}
static DeviceQueue *create(Context *context,
ClDevice *device,
const cl_queue_properties &properties,
cl_int &errcodeRet);
cl_int getCommandQueueInfo(cl_command_queue_info paramName,
size_t paramValueSize, void *paramValue,
size_t *paramValueSizeRet);
void setupExecutionModelDispatch(IndirectHeap &surfaceStateHeap, IndirectHeap &dynamicStateHeap, Kernel *parentKernel, uint32_t parentCount, uint64_t tagAddress, uint32_t taskCount, TagNodeBase *hwTimeStamp, bool isCcsUsed);
virtual void setupIndirectState(IndirectHeap &surfaceStateHeap, IndirectHeap &dynamicStateHeap, Kernel *parentKernel, uint32_t parentIDCount, bool isCcsUsed);
virtual void addExecutionModelCleanUpSection(Kernel *parentKernel, TagNodeBase *hwTimeStamp, uint64_t tagAddress, uint32_t taskCount);
MOCKABLE_VIRTUAL bool isEMCriticalSectionFree() {
auto igilCmdQueue = reinterpret_cast<IGIL_CommandQueue *>(queueBuffer->getUnderlyingBuffer());
auto igilCriticalSection = const_cast<volatile uint *>(&igilCmdQueue->m_controls.m_CriticalSection);
return *igilCriticalSection == ExecutionModelCriticalSection::Free;
}
virtual void resetDeviceQueue();
virtual void dispatchScheduler(LinearStream &commandStream, SchedulerKernel &scheduler, PreemptionMode preemptionMode, IndirectHeap *ssh, IndirectHeap *dsh, bool isCcsUsed);
virtual IndirectHeap *getIndirectHeap(IndirectHeap::Type type);
void acquireEMCriticalSection() {
if (DebugManager.flags.EnableNullHardware.get()) {
return;
}
auto igilCmdQueue = reinterpret_cast<IGIL_CommandQueue *>(queueBuffer->getUnderlyingBuffer());
igilCmdQueue->m_controls.m_CriticalSection = ExecutionModelCriticalSection::Taken;
}
uint32_t getDshOffset() const {
return offsetDsh;
}
enum ExecutionModelCriticalSection {
Free = 0,
Taken = 1
};
static const uint32_t numberOfIDTables = 2;
static const uint32_t interfaceDescriptorEntries = 64;
static const uint32_t colorCalcStateSize = 192;
static const uint32_t schedulerIDIndex = 62;
static const uint32_t numberOfDeviceEnqueues;
protected:
void storeProperties(const cl_queue_properties *properties);
void allocateResources();
void initDeviceQueue();
Context *context = nullptr;
ClDevice *device = nullptr;
cl_command_queue_properties commandQueueProperties = 0;
std::vector<uint64_t> propertiesVector;
cl_uint queueSize = 0;
GraphicsAllocation *queueBuffer = nullptr;
GraphicsAllocation *eventPoolBuffer = nullptr;
GraphicsAllocation *slbBuffer = nullptr;
GraphicsAllocation *stackBuffer = nullptr;
GraphicsAllocation *queueStorageBuffer = nullptr;
GraphicsAllocation *dshBuffer = nullptr;
GraphicsAllocation *debugQueue = nullptr;
DebugDataBuffer *debugData = nullptr;
IndirectHeap *heaps[IndirectHeap::NUM_TYPES];
uint32_t offsetDsh;
};
typedef DeviceQueue *(*DeviceQueueCreateFunc)(
Context *context, ClDevice *device, cl_queue_properties &properties);
} // namespace NEO