204 lines
6.5 KiB
C++
204 lines
6.5 KiB
C++
/*
|
|
* Copyright (c) 2017 - 2018, Intel Corporation
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included
|
|
* in all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
|
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
|
* OTHER DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
#include "runtime/helpers/aligned_memory.h"
|
|
#include "runtime/helpers/debug_helpers.h"
|
|
#include "runtime/os_interface/linux/drm_buffer_object.h"
|
|
#include "runtime/os_interface/linux/drm_memory_manager.h"
|
|
#include "runtime/os_interface/linux/drm_neo.h"
|
|
#include "runtime/os_interface/linux/os_time_linux.h"
|
|
#include "runtime/utilities/stackvec.h"
|
|
|
|
#include <sys/syscall.h>
|
|
#include <sys/mman.h>
|
|
#include <sys/ioctl.h>
|
|
#include <sys/types.h>
|
|
#include <errno.h>
|
|
#include <fcntl.h>
|
|
#include <string.h>
|
|
#include <unistd.h>
|
|
#include <stdarg.h>
|
|
|
|
#include "drm/i915_drm.h"
|
|
|
|
#include <map>
|
|
|
|
namespace OCLRT {
|
|
|
|
BufferObject::BufferObject(Drm *drm, int handle, bool isAllocated) : isResident(false), drm(drm), refCount(1), handle(handle), isReused(false), isAllocated(isAllocated) {
|
|
this->isSoftpin = false;
|
|
|
|
this->tiling_mode = I915_TILING_NONE;
|
|
this->stride = 0;
|
|
|
|
execObjectsStorage = nullptr;
|
|
|
|
this->size = 0;
|
|
this->address = nullptr;
|
|
this->lockedAddress = nullptr;
|
|
this->offset64 = 0;
|
|
}
|
|
|
|
uint32_t BufferObject::getRefCount() const {
|
|
return this->refCount.load();
|
|
}
|
|
|
|
bool BufferObject::softPin(uint64_t offset) {
|
|
this->isSoftpin = true;
|
|
this->offset64 = offset;
|
|
|
|
return true;
|
|
};
|
|
|
|
bool BufferObject::close() {
|
|
drm_gem_close close = {};
|
|
close.handle = this->handle;
|
|
|
|
int ret = this->drm->ioctl(DRM_IOCTL_GEM_CLOSE, &close);
|
|
if (ret != 0) {
|
|
int err = errno;
|
|
printDebugString(DebugManager.flags.PrintDebugMessages.get(), stderr, "ioctl(GEM_CLOSE) failed with %d. errno=%d(%s)\n", ret, err, strerror(err));
|
|
DEBUG_BREAK_IF(true);
|
|
return false;
|
|
}
|
|
|
|
this->handle = -1;
|
|
|
|
return true;
|
|
}
|
|
|
|
int BufferObject::wait(int64_t timeoutNs) {
|
|
drm_i915_gem_wait wait = {};
|
|
wait.bo_handle = this->handle;
|
|
wait.timeout_ns = -1;
|
|
|
|
int ret = this->drm->ioctl(DRM_IOCTL_I915_GEM_WAIT, &wait);
|
|
if (ret != 0) {
|
|
int err = errno;
|
|
printDebugString(DebugManager.flags.PrintDebugMessages.get(), stderr, "ioctl(I915_GEM_WAIT) failed with %d. errno=%d(%s)\n", ret, err, strerror(err));
|
|
}
|
|
UNRECOVERABLE_IF(ret != 0);
|
|
|
|
return ret;
|
|
}
|
|
|
|
bool BufferObject::setTiling(uint32_t mode, uint32_t stride) {
|
|
if (this->tiling_mode == mode) {
|
|
return true;
|
|
}
|
|
|
|
drm_i915_gem_set_tiling set_tiling = {};
|
|
set_tiling.handle = this->handle;
|
|
set_tiling.tiling_mode = mode;
|
|
set_tiling.stride = stride;
|
|
|
|
if (this->drm->ioctl(DRM_IOCTL_I915_GEM_SET_TILING, &set_tiling) != 0) {
|
|
return false;
|
|
}
|
|
|
|
this->tiling_mode = set_tiling.tiling_mode;
|
|
this->stride = set_tiling.stride;
|
|
|
|
return set_tiling.tiling_mode == mode;
|
|
}
|
|
|
|
void BufferObject::fillExecObject(drm_i915_gem_exec_object2 &execObject) {
|
|
execObject.handle = this->handle;
|
|
execObject.relocation_count = 0; //No relocations, we are SoftPinning
|
|
execObject.relocs_ptr = 0ul;
|
|
execObject.alignment = 0;
|
|
execObject.offset = this->isSoftpin ? this->offset64 : 0;
|
|
execObject.flags = this->isSoftpin ? EXEC_OBJECT_PINNED : 0;
|
|
#ifdef __x86_64__
|
|
execObject.flags |= reinterpret_cast<uint64_t>(this->address) & MemoryConstants::zoneHigh ? EXEC_OBJECT_SUPPORTS_48B_ADDRESS : 0;
|
|
#endif
|
|
execObject.rsvd1 = this->drm->lowPriorityContextId;
|
|
execObject.rsvd2 = 0;
|
|
}
|
|
|
|
void BufferObject::processRelocs(int &idx) {
|
|
for (size_t i = 0; i < this->residency.size(); i++) {
|
|
residency[i]->fillExecObject(execObjectsStorage[idx]);
|
|
idx++;
|
|
}
|
|
}
|
|
|
|
int BufferObject::exec(uint32_t used, size_t startOffset, unsigned int flags, bool requiresCoherency, bool lowPriority) {
|
|
drm_i915_gem_execbuffer2 execbuf = {};
|
|
|
|
int idx = 0;
|
|
processRelocs(idx);
|
|
this->fillExecObject(execObjectsStorage[idx]);
|
|
idx++;
|
|
|
|
execbuf.buffers_ptr = reinterpret_cast<uintptr_t>(execObjectsStorage);
|
|
execbuf.buffer_count = idx;
|
|
execbuf.batch_start_offset = static_cast<uint32_t>(startOffset);
|
|
execbuf.batch_len = alignUp(used, 8);
|
|
execbuf.flags = flags;
|
|
|
|
if (lowPriority) {
|
|
execbuf.rsvd1 = this->drm->lowPriorityContextId & I915_EXEC_CONTEXT_ID_MASK;
|
|
}
|
|
|
|
int ret = this->drm->ioctl(DRM_IOCTL_I915_GEM_EXECBUFFER2, &execbuf);
|
|
if (ret != 0) {
|
|
int err = errno;
|
|
printDebugString(DebugManager.flags.PrintDebugMessages.get(), stderr, "ioctl(I915_GEM_EXECBUFFER2) failed with %d. errno=%d(%s)\n", ret, err, strerror(err));
|
|
UNRECOVERABLE_IF(true);
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
int BufferObject::pin(BufferObject *boToPin[], size_t numberOfBos) {
|
|
drm_i915_gem_execbuffer2 execbuf = {};
|
|
StackVec<drm_i915_gem_exec_object2, max_fragments_count + 1> execObject;
|
|
|
|
reinterpret_cast<uint32_t *>(this->address)[0] = 0x05000000;
|
|
reinterpret_cast<uint32_t *>(this->address)[1] = 0x00000000;
|
|
|
|
execObject.resize(numberOfBos + 1);
|
|
|
|
uint32_t boIndex = 0;
|
|
for (boIndex = 0; boIndex < (uint32_t)numberOfBos; boIndex++) {
|
|
boToPin[boIndex]->fillExecObject(execObject[boIndex]);
|
|
}
|
|
|
|
this->fillExecObject(execObject[boIndex]);
|
|
|
|
execbuf.buffers_ptr = reinterpret_cast<uintptr_t>(&execObject[0]);
|
|
execbuf.buffer_count = boIndex + 1;
|
|
execbuf.batch_len = alignUp(static_cast<uint32_t>(sizeof(uint32_t)), 8);
|
|
|
|
int err = 0;
|
|
int ret = this->drm->ioctl(DRM_IOCTL_I915_GEM_EXECBUFFER2, &execbuf);
|
|
if (ret != 0) {
|
|
err = this->drm->getErrno();
|
|
printDebugString(DebugManager.flags.PrintDebugMessages.get(), stderr, "ioctl(I915_GEM_EXECBUFFER2) failed with %d. errno=%d(%s)\n", ret, err, strerror(err));
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
} // namespace OCLRT
|