mirror of
https://github.com/intel/llvm.git
synced 2026-01-28 10:38:23 +08:00
CUDA unified variables were set to use the same allocator as managed variables. This patch adds a specific allocator for unified variables. Currently it calls the managed allocator underneath, but we want to have the flexibility to change that in the future.
73 lines
2.1 KiB
C++
73 lines
2.1 KiB
C++
//===-- runtime/CUDA/allocator.cpp ----------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "flang/Runtime/CUDA/allocator.h"
|
|
#include "../derived.h"
|
|
#include "../stat.h"
|
|
#include "../terminator.h"
|
|
#include "../type-info.h"
|
|
#include "flang/Common/Fortran.h"
|
|
#include "flang/ISO_Fortran_binding_wrapper.h"
|
|
#include "flang/Runtime/allocator-registry.h"
|
|
|
|
#include "cuda.h"
|
|
|
|
namespace Fortran::runtime::cuda {
|
|
|
|
// Registers the CUDA Fortran allocate/free function pairs defined in this
// file with the runtime allocator registry, one pair per allocator position
// (pinned, device, managed, unified).
void CUFRegisterAllocator() {
  // Pinned allocator pair.
  allocatorRegistry.Register(
      kPinnedAllocatorPos, {&CUFAllocPinned, &CUFFreePinned});
  // Device allocator pair.
  allocatorRegistry.Register(
      kDeviceAllocatorPos, {&CUFAllocDevice, &CUFFreeDevice});
  // Managed allocator pair.
  allocatorRegistry.Register(
      kManagedAllocatorPos, {&CUFAllocManaged, &CUFFreeManaged});
  // Unified allocator pair; it has its own registry position even though the
  // unified functions currently forward to the managed ones.
  allocatorRegistry.Register(
      kUnifiedAllocatorPos, {&CUFAllocUnified, &CUFFreeUnified});
}
|
|
|
|
// Allocates sizeInBytes bytes of host memory through cuMemAllocHost and
// returns the resulting pointer. The driver status code is handed to
// CUDA_REPORT_IF_ERROR.
void *CUFAllocPinned(std::size_t sizeInBytes) {
  // Start from a null pointer, in the same way the device and managed
  // allocators start from 0, so that an indeterminate value can never be
  // returned if the driver call fails without writing to p.
  void *p = nullptr;
  CUDA_REPORT_IF_ERROR(cuMemAllocHost(&p, sizeInBytes));
  return p;
}
|
|
|
|
// Releases host memory previously obtained from CUFAllocPinned by calling
// cuMemFreeHost; the driver status code is handed to CUDA_REPORT_IF_ERROR.
void CUFFreePinned(void *p) {
  CUDA_REPORT_IF_ERROR(
      cuMemFreeHost(p));
}
|
|
|
|
// Allocates sizeInBytes bytes with cuMemAlloc and returns the resulting
// CUdeviceptr converted to a void pointer. The driver status code is handed
// to CUDA_REPORT_IF_ERROR.
void *CUFAllocDevice(std::size_t sizeInBytes) {
  CUdeviceptr p{0};
  CUDA_REPORT_IF_ERROR(
      cuMemAlloc(&p, sizeInBytes));
  // The registry works with void pointers, so hand the device address back in
  // that form.
  void *asVoid{reinterpret_cast<void *>(p)};
  return asVoid;
}
|
|
|
|
// Releases memory previously obtained from CUFAllocDevice. The void pointer
// is converted back to a CUdeviceptr and passed to cuMemFree; the driver
// status code is handed to CUDA_REPORT_IF_ERROR.
void CUFFreeDevice(void *p) {
  CUDA_REPORT_IF_ERROR(
      cuMemFree(
          reinterpret_cast<CUdeviceptr>(p)));
}
|
|
|
|
// Allocates sizeInBytes bytes with cuMemAllocManaged, using the
// CU_MEM_ATTACH_GLOBAL flag, and returns the resulting CUdeviceptr converted
// to a void pointer. The driver status code is handed to
// CUDA_REPORT_IF_ERROR.
void *CUFAllocManaged(std::size_t sizeInBytes) {
  CUdeviceptr p{0};
  CUDA_REPORT_IF_ERROR(cuMemAllocManaged(&p, sizeInBytes, CU_MEM_ATTACH_GLOBAL));
  // Hand the address back as a void pointer, the form used by the registry.
  void *asVoid{reinterpret_cast<void *>(p)};
  return asVoid;
}
|
|
|
|
// Releases memory previously obtained from CUFAllocManaged. The void pointer
// is converted back to a CUdeviceptr and passed to cuMemFree; the driver
// status code is handed to CUDA_REPORT_IF_ERROR.
void CUFFreeManaged(void *p) {
  CUDA_REPORT_IF_ERROR(
      cuMemFree(
          reinterpret_cast<CUdeviceptr>(p)));
}
|
|
|
|
void *CUFAllocUnified(std::size_t sizeInBytes) {
|
|
// Call alloc managed for the time being.
|
|
return CUFAllocManaged(sizeInBytes);
|
|
}
|
|
|
|
// Deallocation entry point for unified variables. For now it simply forwards
// to the managed free function, mirroring CUFAllocUnified.
void CUFFreeUnified(void *p) {
  return CUFFreeManaged(p);
}
|
|
|
|
} // namespace Fortran::runtime::cuda
|