2020-03-06 18:09:57 +08:00
|
|
|
/*
|
2021-03-31 02:11:00 +08:00
|
|
|
* Copyright (C) 2019-2021 Intel Corporation
|
2020-03-06 18:09:57 +08:00
|
|
|
*
|
|
|
|
* SPDX-License-Identifier: MIT
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
2020-03-19 13:21:57 +08:00
|
|
|
#include "level_zero/core/source/fence/fence.h"
|
2020-03-06 18:09:57 +08:00
|
|
|
|
|
|
|
#include "shared/source/command_stream/command_stream_receiver.h"
|
2020-04-02 17:28:38 +08:00
|
|
|
#include "shared/source/helpers/constants.h"
|
2021-03-24 04:12:41 +08:00
|
|
|
#include "shared/source/helpers/string.h"
|
2020-03-06 18:09:57 +08:00
|
|
|
#include "shared/source/memory_manager/memory_manager.h"
|
2021-03-31 02:11:00 +08:00
|
|
|
#include "shared/source/utilities/wait_util.h"
|
2020-03-06 18:09:57 +08:00
|
|
|
|
2020-03-07 07:52:16 +08:00
|
|
|
#include "hw_helpers.h"
|
|
|
|
|
2020-03-06 18:09:57 +08:00
|
|
|
namespace L0 {
|
|
|
|
|
|
|
|
// Factory for fence objects: constructs a FenceImp bound to cmdQueue, runs its
// initialize() step and returns the new object.
// The desc argument is accepted but not read by this function.
Fence *Fence::create(CommandQueueImp *cmdQueue, const ze_fence_desc_t *desc) {
    auto fenceImp = new FenceImp(cmdQueue);
    UNRECOVERABLE_IF(nullptr == fenceImp);

    fenceImp->initialize();
    return fenceImp;
}
|
|
|
|
|
2020-05-13 17:25:29 +08:00
|
|
|
// Hands the fence's backing allocation to freeGraphicsMemory() on the memory
// manager reached through the command queue's device and driver handle, then
// clears the member pointer.
FenceImp::~FenceImp() {
    auto memoryManager = cmdQueue->getDevice()->getDriverHandle()->getMemoryManager();
    memoryManager->freeGraphicsMemory(allocation);
    allocation = nullptr;
}
|
|
|
|
|
|
|
|
// Non-blocking check of the fence state.
// If the command queue exposes a command stream receiver, downloadAllocations()
// is invoked on it first. The first 32 bits of the fence allocation's underlying
// buffer are then copied out and compared against Fence::STATE_CLEARED.
// Returns ZE_RESULT_NOT_READY while the value still equals STATE_CLEARED,
// ZE_RESULT_SUCCESS otherwise.
ze_result_t FenceImp::queryStatus() {
    if (auto csr = cmdQueue->getCsr()) {
        csr->downloadAllocations();
    }

    auto fenceMemory = static_cast<uint64_t *>(allocation->getUnderlyingBuffer());

    // Only a 32-bit value is read, even though the pointer is typed as 64-bit.
    uint32_t fenceState = Fence::STATE_CLEARED;
    memcpy_s(static_cast<void *>(&fenceState), sizeof(uint32_t), static_cast<void *>(fenceMemory), sizeof(uint32_t));

    if (fenceState == Fence::STATE_CLEARED) {
        return ZE_RESULT_NOT_READY;
    }
    return ZE_RESULT_SUCCESS;
}
|
|
|
|
|
2020-09-18 20:18:23 +08:00
|
|
|
void FenceImp::initialize() {
|
2020-03-06 18:09:57 +08:00
|
|
|
NEO::AllocationProperties properties(
|
2020-07-08 18:09:05 +08:00
|
|
|
cmdQueue->getDevice()->getRootDeviceIndex(), MemoryConstants::cacheLineSize, NEO::GraphicsAllocation::AllocationType::BUFFER_HOST_MEMORY, cmdQueue->getDevice()->getNEODevice()->getDeviceBitfield());
|
2020-02-26 22:20:19 +08:00
|
|
|
properties.alignment = MemoryConstants::cacheLineSize;
|
2020-03-06 18:09:57 +08:00
|
|
|
allocation = cmdQueue->getDevice()->getDriverHandle()->getMemoryManager()->allocateGraphicsMemoryWithProperties(properties);
|
|
|
|
UNRECOVERABLE_IF(allocation == nullptr);
|
|
|
|
|
|
|
|
reset();
|
|
|
|
}
|
|
|
|
|
|
|
|
// Writes Fence::STATE_CLEARED into the start of the fence allocation (as a
// 64-bit store) and issues a cache-line flush on that address.
// Always returns ZE_RESULT_SUCCESS.
ze_result_t FenceImp::reset() {
    auto fenceWord = static_cast<uint64_t *>(allocation->getUnderlyingBuffer());
    *fenceWord = Fence::STATE_CLEARED;

    NEO::CpuIntrinsics::clFlush(fenceWord);

    return ZE_RESULT_SUCCESS;
}
|
|
|
|
|
2020-07-29 17:45:54 +08:00
|
|
|
// Waits on the host until the fence is signaled or the timeout expires.
//
// timeout is compared against elapsed nanoseconds:
//   - 0 performs a single queryStatus() and returns its result;
//   - std::numeric_limits<uint64_t>::max() waits without a deadline;
//   - any other value polls until that many nanoseconds have elapsed.
//
// Returns ZE_RESULT_SUCCESS as soon as queryStatus() reports success, or
// immediately when the command stream receiver is of type CSR_AUB. Otherwise
// the result of the last queryStatus() call is returned once the timeout has
// elapsed.
ze_result_t FenceImp::hostSynchronize(uint64_t timeout) {
    // queryStatus() treats a missing CSR as valid, so guard the dereference
    // here the same way instead of crashing on a null pointer.
    auto csr = cmdQueue->getCsr();
    if (csr && csr->getType() == NEO::CommandStreamReceiverType::CSR_AUB) {
        return ZE_RESULT_SUCCESS;
    }

    if (timeout == 0) {
        return queryStatus();
    }

    const bool waitForever = (timeout == std::numeric_limits<uint64_t>::max());

    // steady_clock is monotonic. high_resolution_clock may alias the system
    // clock, and a backwards adjustment would yield a negative duration that
    // wraps to a huge unsigned value and ends the wait prematurely.
    const auto waitStart = std::chrono::steady_clock::now();

    ze_result_t ret = ZE_RESULT_NOT_READY;
    uint64_t elapsedNs = 0;

    while (elapsedNs < timeout) {
        ret = queryStatus();
        if (ret == ZE_RESULT_SUCCESS) {
            return ZE_RESULT_SUCCESS;
        }

        NEO::WaitUtils::waitFunction(nullptr, 0u);

        // No deadline to track: skip the clock read and poll again.
        if (waitForever) {
            continue;
        }

        const auto now = std::chrono::steady_clock::now();
        elapsedNs = static_cast<uint64_t>(std::chrono::duration_cast<std::chrono::nanoseconds>(now - waitStart).count());
    }

    return ret;
}
|
|
|
|
|
|
|
|
} // namespace L0
|