blob: 50f96242afa2d88d0963294c1b2a959207dd2908 [file] [log] [blame]
// Copyright 2023 The IREE Authors
//
// Licensed under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#ifndef EXPERIMENTAL_CUDA2_EVENT_POOL_H_
#define EXPERIMENTAL_CUDA2_EVENT_POOL_H_
#include "experimental/cuda2/cuda_dynamic_symbols.h"
#include "iree/base/api.h"
#ifdef __cplusplus
extern "C" {
#endif // __cplusplus
//===----------------------------------------------------------------------===//
// iree_hal_cuda2_event_t
//===----------------------------------------------------------------------===//
// An struct that wraps a CUevent object with a reference count for lifetime
// management.
//
// iree_hal_cuda2_event_t objects cannot be directly created; they should be
// acquired from the event pool and released back to the pool once done.
//
// Thread-safe; multiple threads may retain and release the same event.
typedef struct iree_hal_cuda2_event_t iree_hal_cuda2_event_t;
// Returns the underlying CUevent handle behind |event|.
CUevent iree_hal_cuda2_event_handle(const iree_hal_cuda2_event_t* event);
// Retains the given |event| by increasing its reference count.
void iree_hal_cuda2_event_retain(iree_hal_cuda2_event_t* event);
// Releases the given |event| by decreasing its reference count.
//
// |event| will be returned to its owning pool when the reference count is 0.
void iree_hal_cuda2_event_release(iree_hal_cuda2_event_t* event);
//===----------------------------------------------------------------------===//
// iree_hal_cuda2_event_pool_t
//===----------------------------------------------------------------------===//
// A simple pool of iree_hal_event_t objects to recycle.
//
// Thread-safe; multiple threads may acquire and release events from the pool.
typedef struct iree_hal_cuda2_event_pool_t iree_hal_cuda2_event_pool_t;
// Allocates a new event pool with up to |available_capacity| events.
//
// Extra events requested beyond the capability are directly created and
// destroyed without pooling.
iree_status_t iree_hal_cuda2_event_pool_allocate(
const iree_hal_cuda2_dynamic_symbols_t* symbols,
iree_host_size_t available_capacity, iree_allocator_t host_allocator,
iree_hal_cuda2_event_pool_t** out_event_pool);
// Deallocates an event pool and destroys all events.
//
// All events that were acquired from the pool must have already been released
// back to it prior to deallocation.
void iree_hal_cuda2_event_pool_free(iree_hal_cuda2_event_pool_t* event_pool);
// Acquires one or more events from the event pool.
//
// Each returned event have an initial reference count of 1. The returned
// CUevent objects may retain captured states of some queues from previous
// uses; callers should record again to overwrite.
iree_status_t iree_hal_cuda2_event_pool_acquire(
iree_hal_cuda2_event_pool_t* event_pool, iree_host_size_t event_count,
iree_hal_cuda2_event_t** out_events);
#ifdef __cplusplus
} // extern "C"
#endif // __cplusplus
#endif // EXPERIMENTAL_CUDA2_EVENT_POOL_H_