blob: 640d6f52dcfb8aaae37687d273d8a4d02f7006f9 [file] [log] [blame]
// Copyright 2021 The IREE Authors
//
// Licensed under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#ifndef IREE_HAL_DRIVERS_CUDA_BUFFER_H_
#define IREE_HAL_DRIVERS_CUDA_BUFFER_H_
#include "iree/base/api.h"
#include "iree/hal/api.h"
#include "iree/hal/drivers/cuda/cuda_headers.h"
#ifdef __cplusplus
extern "C" {
#endif // __cplusplus
typedef enum iree_hal_cuda_buffer_type_e {
// cuMemAlloc/cuMemAllocManaged + cuMemFree
IREE_HAL_CUDA_BUFFER_TYPE_DEVICE = 0,
// cuMemHostAlloc + cuMemFreeHost
IREE_HAL_CUDA_BUFFER_TYPE_HOST,
// cuMemHostRegister + cuMemHostUnregister
IREE_HAL_CUDA_BUFFER_TYPE_HOST_REGISTERED,
// cuMemAllocFromPoolAsync + cuMemFree/cuMemFreeAsync
IREE_HAL_CUDA_BUFFER_TYPE_ASYNC,
} iree_hal_cuda_buffer_type_t;
// Wraps a CUDA allocation in an iree_hal_buffer_t.
iree_status_t iree_hal_cuda_buffer_wrap(
iree_hal_allocator_t* allocator, iree_hal_memory_type_t memory_type,
iree_hal_memory_access_t allowed_access,
iree_hal_buffer_usage_t allowed_usage, iree_device_size_t allocation_size,
iree_device_size_t byte_offset, iree_device_size_t byte_length,
iree_hal_cuda_buffer_type_t buffer_type, CUdeviceptr device_ptr,
void* host_ptr, iree_hal_buffer_release_callback_t release_callback,
iree_allocator_t host_allocator, iree_hal_buffer_t** out_buffer);
// Returns the underlying CUDA buffer type.
iree_hal_cuda_buffer_type_t iree_hal_cuda_buffer_type(
const iree_hal_buffer_t* buffer);
// Returns the CUDA base pointer for the given |buffer|.
// This is the entire allocated_buffer and must be offset by the buffer
// byte_offset and byte_length when used.
CUdeviceptr iree_hal_cuda_buffer_device_pointer(
const iree_hal_buffer_t* buffer);
// Returns the CUDA host pointer for the given |buffer|, if available.
void* iree_hal_cuda_buffer_host_pointer(const iree_hal_buffer_t* buffer);
// Drops the release callback so that when the buffer is destroyed no callback
// will be made. This is not thread safe but all callers are expected to be
// holding an allocation and the earliest the buffer could be destroyed is after
// this call returns and the caller has released its reference.
void iree_hal_cuda_buffer_drop_release_callback(iree_hal_buffer_t* buffer);
#ifdef __cplusplus
} // extern "C"
#endif // __cplusplus
#endif // IREE_HAL_DRIVERS_CUDA_BUFFER_H_