mirror of
https://github.com/intel/compute-runtime.git
synced 2025-12-24 12:23:05 +08:00
51 lines
1.2 KiB
C++
51 lines
1.2 KiB
C++
/*
|
|
* Copyright (C) 2018-2025 Intel Corporation
|
|
*
|
|
* SPDX-License-Identifier: MIT
|
|
*
|
|
*/
|
|
|
|
#pragma once
|
|
#include "shared/source/command_stream/command_stream_receiver.h"
|
|
#include "shared/source/command_stream/wait_status.h"
|
|
|
|
#include "opencl/source/command_queue/command_queue_hw.h"
|
|
|
|
namespace NEO {
|
|
|
|
template <typename GfxFamily>
|
|
cl_int CommandQueueHw<GfxFamily>::finish() {
|
|
|
|
auto &csr = getGpgpuCommandStreamReceiver();
|
|
|
|
auto result = csr.flushBatchedSubmissions();
|
|
if (!result) {
|
|
return CL_OUT_OF_RESOURCES;
|
|
}
|
|
|
|
bool waitForTaskCountRequired = false;
|
|
|
|
if (!l3FlushedAfterCpuRead && l3FlushAfterPostSyncEnabled) {
|
|
csr.flushTagUpdate();
|
|
|
|
CompletionStamp completionStamp = {
|
|
csr.peekTaskCount(),
|
|
csr.peekTaskLevel(),
|
|
csr.obtainCurrentFlushStamp()};
|
|
|
|
this->updateFromCompletionStamp(completionStamp, nullptr);
|
|
|
|
this->l3FlushedAfterCpuRead = true;
|
|
waitForTaskCountRequired = true;
|
|
}
|
|
|
|
// Stall until HW reaches taskCount on all its engines
|
|
const auto waitStatus = waitForAllEngines(true, nullptr, waitForTaskCountRequired);
|
|
if (waitStatus == WaitStatus::gpuHang) {
|
|
return CL_OUT_OF_RESOURCES;
|
|
}
|
|
|
|
return CL_SUCCESS;
|
|
}
|
|
} // namespace NEO
|