179 lines
7.7 KiB
C++
179 lines
7.7 KiB
C++
/*
|
|
* Copyright (C) 2017-2021 Intel Corporation
|
|
*
|
|
* SPDX-License-Identifier: MIT
|
|
*
|
|
*/
|
|
|
|
#include "shared/source/command_stream/linear_stream.h"
|
|
#include "shared/source/direct_submission/linux/drm_direct_submission.h"
|
|
#include "shared/source/execution_environment/execution_environment.h"
|
|
#include "shared/source/gmm_helper/gmm_helper.h"
|
|
#include "shared/source/gmm_helper/page_table_mngr.h"
|
|
#include "shared/source/helpers/aligned_memory.h"
|
|
#include "shared/source/helpers/flush_stamp.h"
|
|
#include "shared/source/helpers/hw_helper.h"
|
|
#include "shared/source/helpers/preamble.h"
|
|
#include "shared/source/memory_manager/residency.h"
|
|
#include "shared/source/os_interface/linux/drm_allocation.h"
|
|
#include "shared/source/os_interface/linux/drm_buffer_object.h"
|
|
#include "shared/source/os_interface/linux/drm_engine_mapper.h"
|
|
#include "shared/source/os_interface/linux/drm_memory_manager.h"
|
|
#include "shared/source/os_interface/linux/drm_memory_operations_handler.h"
|
|
#include "shared/source/os_interface/linux/drm_neo.h"
|
|
#include "shared/source/os_interface/linux/os_context_linux.h"
|
|
#include "shared/source/os_interface/linux/os_interface.h"
|
|
|
|
#include "opencl/source/os_interface/linux/drm_command_stream.h"
|
|
|
|
#include <cstdlib>
|
|
#include <cstring>
|
|
|
|
namespace NEO {
|
|
|
|
template <typename GfxFamily>
|
|
DrmCommandStreamReceiver<GfxFamily>::DrmCommandStreamReceiver(ExecutionEnvironment &executionEnvironment,
|
|
uint32_t rootDeviceIndex,
|
|
const DeviceBitfield deviceBitfield,
|
|
gemCloseWorkerMode mode)
|
|
: BaseClass(executionEnvironment, rootDeviceIndex, deviceBitfield), gemCloseWorkerOperationMode(mode) {
|
|
|
|
auto rootDeviceEnvironment = executionEnvironment.rootDeviceEnvironments[rootDeviceIndex].get();
|
|
|
|
this->drm = rootDeviceEnvironment->osInterface->get()->getDrm();
|
|
residency.reserve(512);
|
|
execObjectsStorage.reserve(512);
|
|
|
|
auto hwInfo = rootDeviceEnvironment->getHardwareInfo();
|
|
auto localMemoryEnabled = HwHelper::get(hwInfo->platform.eRenderCoreFamily).getEnableLocalMemory(*hwInfo);
|
|
|
|
this->dispatchMode = localMemoryEnabled ? DispatchMode::BatchedDispatch : DispatchMode::ImmediateDispatch;
|
|
|
|
if (DebugManager.flags.CsrDispatchMode.get()) {
|
|
this->dispatchMode = static_cast<DispatchMode>(DebugManager.flags.CsrDispatchMode.get());
|
|
}
|
|
}
|
|
|
|
template <typename GfxFamily>
|
|
bool DrmCommandStreamReceiver<GfxFamily>::flush(BatchBuffer &batchBuffer, ResidencyContainer &allocationsForResidency) {
|
|
this->printDeviceIndex();
|
|
DrmAllocation *alloc = static_cast<DrmAllocation *>(batchBuffer.commandBufferAllocation);
|
|
DEBUG_BREAK_IF(!alloc);
|
|
|
|
BufferObject *bb = alloc->getBO();
|
|
if (bb == nullptr) {
|
|
return false;
|
|
}
|
|
|
|
if (this->lastSentSliceCount != batchBuffer.sliceCount) {
|
|
if (drm->setQueueSliceCount(batchBuffer.sliceCount)) {
|
|
this->lastSentSliceCount = batchBuffer.sliceCount;
|
|
}
|
|
}
|
|
|
|
auto memoryOperationsInterface = static_cast<DrmMemoryOperationsHandler *>(this->executionEnvironment.rootDeviceEnvironments[this->rootDeviceIndex]->memoryOperationsInterface.get());
|
|
|
|
std::unique_lock<std::mutex> lock;
|
|
if (!this->directSubmission.get() && !this->blitterDirectSubmission.get()) {
|
|
lock = memoryOperationsInterface->lockHandlerIfUsed();
|
|
}
|
|
|
|
memoryOperationsInterface->mergeWithResidencyContainer(this->osContext, allocationsForResidency);
|
|
|
|
if (this->directSubmission.get()) {
|
|
memoryOperationsInterface->makeResidentWithinOsContext(this->osContext, ArrayRef<GraphicsAllocation *>(&batchBuffer.commandBufferAllocation, 1), true);
|
|
return this->directSubmission->dispatchCommandBuffer(batchBuffer, *this->flushStamp.get());
|
|
}
|
|
if (this->blitterDirectSubmission.get()) {
|
|
memoryOperationsInterface->makeResidentWithinOsContext(this->osContext, ArrayRef<GraphicsAllocation *>(&batchBuffer.commandBufferAllocation, 1), true);
|
|
return this->blitterDirectSubmission->dispatchCommandBuffer(batchBuffer, *this->flushStamp.get());
|
|
}
|
|
|
|
this->flushStamp->setStamp(bb->peekHandle());
|
|
this->flushInternal(batchBuffer, allocationsForResidency);
|
|
|
|
if (this->gemCloseWorkerOperationMode == gemCloseWorkerMode::gemCloseWorkerActive) {
|
|
bb->reference();
|
|
this->getMemoryManager()->peekGemCloseWorker()->push(bb);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
template <typename GfxFamily>
|
|
void DrmCommandStreamReceiver<GfxFamily>::exec(const BatchBuffer &batchBuffer, uint32_t vmHandleId, uint32_t drmContextId) {
|
|
DrmAllocation *alloc = static_cast<DrmAllocation *>(batchBuffer.commandBufferAllocation);
|
|
DEBUG_BREAK_IF(!alloc);
|
|
BufferObject *bb = alloc->getBO();
|
|
DEBUG_BREAK_IF(!bb);
|
|
|
|
auto execFlags = static_cast<OsContextLinux *>(osContext)->getEngineFlag() | I915_EXEC_NO_RELOC;
|
|
|
|
// Residency hold all allocation except command buffer, hence + 1
|
|
auto requiredSize = this->residency.size() + 1;
|
|
if (requiredSize > this->execObjectsStorage.size()) {
|
|
this->execObjectsStorage.resize(requiredSize);
|
|
}
|
|
|
|
int err = bb->exec(static_cast<uint32_t>(alignUp(batchBuffer.usedSize - batchBuffer.startOffset, 8)),
|
|
batchBuffer.startOffset, execFlags,
|
|
batchBuffer.requiresCoherency,
|
|
this->osContext,
|
|
vmHandleId,
|
|
drmContextId,
|
|
this->residency.data(), this->residency.size(),
|
|
this->execObjectsStorage.data());
|
|
UNRECOVERABLE_IF(err != 0);
|
|
|
|
this->residency.clear();
|
|
}
|
|
|
|
template <typename GfxFamily>
|
|
void DrmCommandStreamReceiver<GfxFamily>::processResidency(const ResidencyContainer &inputAllocationsForResidency, uint32_t handleId) {
|
|
for (auto &alloc : inputAllocationsForResidency) {
|
|
auto drmAlloc = static_cast<DrmAllocation *>(alloc);
|
|
drmAlloc->makeBOsResident(osContext, handleId, &this->residency, false);
|
|
}
|
|
}
|
|
|
|
template <typename GfxFamily>
|
|
void DrmCommandStreamReceiver<GfxFamily>::makeNonResident(GraphicsAllocation &gfxAllocation) {
|
|
// Vector is moved to command buffer inside flush.
|
|
// If flush wasn't called we need to make all objects non-resident.
|
|
// If makeNonResident is called before flush, vector will be cleared.
|
|
if (gfxAllocation.isResident(this->osContext->getContextId())) {
|
|
if (this->residency.size() != 0) {
|
|
this->residency.clear();
|
|
}
|
|
for (auto fragmentId = 0u; fragmentId < gfxAllocation.fragmentsStorage.fragmentCount; fragmentId++) {
|
|
gfxAllocation.fragmentsStorage.fragmentStorageData[fragmentId].residency->resident[osContext->getContextId()] = false;
|
|
}
|
|
}
|
|
gfxAllocation.releaseResidencyInOsContext(this->osContext->getContextId());
|
|
}
|
|
|
|
template <typename GfxFamily>
|
|
DrmMemoryManager *DrmCommandStreamReceiver<GfxFamily>::getMemoryManager() const {
|
|
return static_cast<DrmMemoryManager *>(CommandStreamReceiver::getMemoryManager());
|
|
}
|
|
|
|
template <typename GfxFamily>
|
|
GmmPageTableMngr *DrmCommandStreamReceiver<GfxFamily>::createPageTableManager() {
|
|
GmmPageTableMngr *gmmPageTableMngr = GmmPageTableMngr::create(this->executionEnvironment.rootDeviceEnvironments[this->rootDeviceIndex]->getGmmClientContext(), TT_TYPE::AUXTT, nullptr);
|
|
gmmPageTableMngr->setCsrHandle(this);
|
|
this->executionEnvironment.rootDeviceEnvironments[this->rootDeviceIndex]->pageTableManager.reset(gmmPageTableMngr);
|
|
return gmmPageTableMngr;
|
|
}
|
|
|
|
template <typename GfxFamily>
|
|
bool DrmCommandStreamReceiver<GfxFamily>::waitForFlushStamp(FlushStamp &flushStamp) {
|
|
drm_i915_gem_wait wait = {};
|
|
wait.bo_handle = static_cast<uint32_t>(flushStamp);
|
|
wait.timeout_ns = -1;
|
|
|
|
drm->ioctl(DRM_IOCTL_I915_GEM_WAIT, &wait);
|
|
return true;
|
|
}
|
|
|
|
} // namespace NEO
|