blob: dfeed297a5a9af76fe45bf4b4386e165cabc7124 [file] [log] [blame]
// Copyright 2023 The IREE Authors
//
// Licensed under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#ifndef EXPERIMENTAL_CUDA2_CUDA_BUFFER_H_
#define EXPERIMENTAL_CUDA2_CUDA_BUFFER_H_
#include "experimental/cuda2/cuda_headers.h"
#include "iree/base/api.h"
#include "iree/hal/api.h"
#ifdef __cplusplus
extern "C" {
#endif // __cplusplus
typedef enum iree_hal_cuda2_buffer_type_e {
// Device local buffer; allocated with cuMemAlloc/cuMemAllocManaged, freed
// with cuMemFree.
IREE_HAL_CUDA_BUFFER_TYPE_DEVICE = 0,
// Host local buffer; allocated with cuMemHostAlloc, freed with cuMemFreeHost.
IREE_HAL_CUDA_BUFFER_TYPE_HOST,
// Host local buffer; registered with cuMemHostRegister, freed with
// cuMemHostUnregister.
IREE_HAL_CUDA_BUFFER_TYPE_HOST_REGISTERED,
// Device local buffer, allocated with cuMemAllocFromPoolAsync, freed with
// cuMemFree/cuMemFreeAsync.
IREE_HAL_CUDA_BUFFER_TYPE_ASYNC,
// Externally registered buffer whose providence is unknown.
// Must be freed by the user.
IREE_HAL_CUDA_BUFFER_TYPE_EXTERNAL,
} iree_hal_cuda2_buffer_type_t;
// Wraps a CUDA allocation in an iree_hal_buffer_t.
iree_status_t iree_hal_cuda2_buffer_wrap(
iree_hal_allocator_t* allocator, iree_hal_memory_type_t memory_type,
iree_hal_memory_access_t allowed_access,
iree_hal_buffer_usage_t allowed_usage, iree_device_size_t allocation_size,
iree_device_size_t byte_offset, iree_device_size_t byte_length,
iree_hal_cuda2_buffer_type_t buffer_type, CUdeviceptr device_ptr,
void* host_ptr, iree_hal_buffer_release_callback_t release_callback,
iree_allocator_t host_allocator, iree_hal_buffer_t** out_buffer);
// Returns the underlying CUDA buffer type of the given |buffer|.
iree_hal_cuda2_buffer_type_t iree_hal_cuda2_buffer_type(
const iree_hal_buffer_t* buffer);
// Returns the CUDA base device pointer for the given |buffer|.
//
// Note that this is the entire allocated_buffer and must be offset by the
// buffer byte_offset and byte_length when used.
CUdeviceptr iree_hal_cuda2_buffer_device_pointer(
const iree_hal_buffer_t* buffer);
// Returns the CUDA host pointer for the given |buffer|, if available.
void* iree_hal_cuda2_buffer_host_pointer(const iree_hal_buffer_t* buffer);
// Drops the release callback so that when the buffer is destroyed no callback
// will be made. This is not thread safe but all callers are expected to be
// holding an allocation and the earliest the buffer could be destroyed is after
// this call returns and the caller has released its reference.
void iree_hal_cuda2_buffer_drop_release_callback(iree_hal_buffer_t* buffer);
#ifdef __cplusplus
} // extern "C"
#endif // __cplusplus
#endif // EXPERIMENTAL_CUDA2_CUDA_BUFFER_H_