blob: d05ba3e680b82fe7559542f0f1f25fe61d116349 [file] [log] [blame]
// Copyright 2023 The IREE Authors
//
// Licensed under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#include "experimental/cuda2/pipeline_layout.h"
#include <stddef.h>
#include "iree/base/api.h"
#include "iree/base/tracing.h"
//===----------------------------------------------------------------------===//
// iree_hal_cuda2_descriptor_set_layout_t
//===----------------------------------------------------------------------===//
typedef struct iree_hal_cuda2_descriptor_set_layout_t {
// Abstract resource used for injecting reference counting and vtable;
// must be at offset 0.
iree_hal_resource_t resource;
// The host allocator used for creating this descriptor set layout struct.
iree_allocator_t host_allocator;
// The total number of bindings in this descriptor set.
iree_host_size_t binding_count;
} iree_hal_cuda2_descriptor_set_layout_t;
static const iree_hal_descriptor_set_layout_vtable_t
iree_hal_cuda2_descriptor_set_layout_vtable;
static iree_hal_cuda2_descriptor_set_layout_t*
iree_hal_cuda2_descriptor_set_layout_cast(
iree_hal_descriptor_set_layout_t* base_value) {
IREE_HAL_ASSERT_TYPE(base_value,
&iree_hal_cuda2_descriptor_set_layout_vtable);
return (iree_hal_cuda2_descriptor_set_layout_t*)base_value;
}
iree_status_t iree_hal_cuda2_descriptor_set_layout_create(
iree_hal_descriptor_set_layout_flags_t flags,
iree_host_size_t binding_count,
const iree_hal_descriptor_set_layout_binding_t* bindings,
iree_allocator_t host_allocator,
iree_hal_descriptor_set_layout_t** out_descriptor_set_layout) {
IREE_ASSERT_ARGUMENT(!binding_count || bindings);
IREE_ASSERT_ARGUMENT(out_descriptor_set_layout);
IREE_TRACE_ZONE_BEGIN(z0);
*out_descriptor_set_layout = NULL;
iree_hal_cuda2_descriptor_set_layout_t* descriptor_set_layout = NULL;
iree_status_t status =
iree_allocator_malloc(host_allocator, sizeof(*descriptor_set_layout),
(void**)&descriptor_set_layout);
if (iree_status_is_ok(status)) {
iree_hal_resource_initialize(&iree_hal_cuda2_descriptor_set_layout_vtable,
&descriptor_set_layout->resource);
descriptor_set_layout->host_allocator = host_allocator;
descriptor_set_layout->binding_count = binding_count;
*out_descriptor_set_layout =
(iree_hal_descriptor_set_layout_t*)descriptor_set_layout;
}
IREE_TRACE_ZONE_END(z0);
return status;
}
iree_host_size_t iree_hal_cuda2_descriptor_set_layout_binding_count(
iree_hal_descriptor_set_layout_t* base_descriptor_set_layout) {
iree_hal_cuda2_descriptor_set_layout_t* descriptor_set_layout =
iree_hal_cuda2_descriptor_set_layout_cast(base_descriptor_set_layout);
return descriptor_set_layout->binding_count;
}
static void iree_hal_cuda2_descriptor_set_layout_destroy(
iree_hal_descriptor_set_layout_t* base_descriptor_set_layout) {
iree_hal_cuda2_descriptor_set_layout_t* descriptor_set_layout =
iree_hal_cuda2_descriptor_set_layout_cast(base_descriptor_set_layout);
IREE_TRACE_ZONE_BEGIN(z0);
iree_allocator_t host_allocator = descriptor_set_layout->host_allocator;
iree_allocator_free(host_allocator, descriptor_set_layout);
IREE_TRACE_ZONE_END(z0);
}
static const iree_hal_descriptor_set_layout_vtable_t
iree_hal_cuda2_descriptor_set_layout_vtable = {
.destroy = iree_hal_cuda2_descriptor_set_layout_destroy,
};
//===----------------------------------------------------------------------===//
// iree_hal_cuda2_pipeline_layout_t
//===----------------------------------------------------------------------===//
typedef struct iree_hal_cuda2_pipeline_layout_t {
// Abstract resource used for injecting reference counting and vtable;
// must be at offset 0.
iree_hal_resource_t resource;
// The host allocator used for creating this pipeline layout struct.
iree_allocator_t host_allocator;
// The kernel argument index for push constants.
// Note that push constants are placed after all normal descriptors.
iree_host_size_t push_constant_base_index;
iree_host_size_t push_constant_count;
iree_host_size_t set_layout_count;
// The list of descriptor set layout pointers, pointing to trailing inline
// allocation after the end of this struct.
struct {
iree_hal_descriptor_set_layout_t* set_layout;
// Base kernel argument index for this descriptor set.
iree_host_size_t base_index;
} set_layouts[];
} iree_hal_cuda2_pipeline_layout_t;
// + Additional inline allocation for holding all descriptor sets.
static const iree_hal_pipeline_layout_vtable_t
iree_hal_cuda2_pipeline_layout_vtable;
static iree_hal_cuda2_pipeline_layout_t* iree_hal_cuda2_pipeline_layout_cast(
iree_hal_pipeline_layout_t* base_value) {
IREE_HAL_ASSERT_TYPE(base_value, &iree_hal_cuda2_pipeline_layout_vtable);
return (iree_hal_cuda2_pipeline_layout_t*)base_value;
}
iree_status_t iree_hal_cuda2_pipeline_layout_create(
iree_host_size_t set_layout_count,
iree_hal_descriptor_set_layout_t* const* set_layouts,
iree_host_size_t push_constant_count, iree_allocator_t host_allocator,
iree_hal_pipeline_layout_t** out_pipeline_layout) {
IREE_ASSERT_ARGUMENT(!set_layout_count || set_layouts);
IREE_ASSERT_ARGUMENT(out_pipeline_layout);
IREE_TRACE_ZONE_BEGIN(z0);
*out_pipeline_layout = NULL;
if (push_constant_count > IREE_HAL_CUDA_MAX_PUSH_CONSTANT_COUNT) {
IREE_TRACE_ZONE_END(z0);
return iree_make_status(
IREE_STATUS_INVALID_ARGUMENT,
"push constant count %" PRIhsz " over the limit of %d",
push_constant_count, IREE_HAL_CUDA_MAX_PUSH_CONSTANT_COUNT);
}
// Currently the pipeline layout doesn't do anything.
// TODO: Handle creating the argument layout at that time hadling both push
// constant and buffers.
iree_hal_cuda2_pipeline_layout_t* pipeline_layout = NULL;
iree_host_size_t total_size =
sizeof(*pipeline_layout) +
set_layout_count * sizeof(*pipeline_layout->set_layouts);
iree_status_t status = iree_allocator_malloc(host_allocator, total_size,
(void**)&pipeline_layout);
if (iree_status_is_ok(status)) {
iree_hal_resource_initialize(&iree_hal_cuda2_pipeline_layout_vtable,
&pipeline_layout->resource);
pipeline_layout->host_allocator = host_allocator;
pipeline_layout->set_layout_count = set_layout_count;
iree_host_size_t base_index = 0;
for (iree_host_size_t i = 0; i < set_layout_count; ++i) {
pipeline_layout->set_layouts[i].set_layout = set_layouts[i];
// Copy and retain all descriptor sets so we don't lose them.
iree_hal_descriptor_set_layout_retain(set_layouts[i]);
pipeline_layout->set_layouts[i].base_index = base_index;
base_index +=
iree_hal_cuda2_descriptor_set_layout_binding_count(set_layouts[i]);
}
pipeline_layout->push_constant_base_index = base_index;
pipeline_layout->push_constant_count = push_constant_count;
*out_pipeline_layout = (iree_hal_pipeline_layout_t*)pipeline_layout;
}
IREE_TRACE_ZONE_END(z0);
return status;
}
static void iree_hal_cuda2_pipeline_layout_destroy(
iree_hal_pipeline_layout_t* base_pipeline_layout) {
iree_hal_cuda2_pipeline_layout_t* pipeline_layout =
iree_hal_cuda2_pipeline_layout_cast(base_pipeline_layout);
IREE_TRACE_ZONE_BEGIN(z0);
iree_allocator_t host_allocator = pipeline_layout->host_allocator;
for (iree_host_size_t i = 0; i < pipeline_layout->set_layout_count; ++i) {
iree_hal_descriptor_set_layout_release(
pipeline_layout->set_layouts[i].set_layout);
}
iree_allocator_free(host_allocator, pipeline_layout);
IREE_TRACE_ZONE_END(z0);
}
iree_host_size_t iree_hal_cuda2_pipeline_layout_base_binding_index(
iree_hal_pipeline_layout_t* base_pipeline_layout, uint32_t set) {
iree_hal_cuda2_pipeline_layout_t* pipeline_layout =
iree_hal_cuda2_pipeline_layout_cast(base_pipeline_layout);
return pipeline_layout->set_layouts[set].base_index;
}
iree_host_size_t iree_hal_cuda2_pipeline_layout_push_constant_index(
iree_hal_pipeline_layout_t* base_pipeline_layout) {
iree_hal_cuda2_pipeline_layout_t* pipeline_layout =
iree_hal_cuda2_pipeline_layout_cast(base_pipeline_layout);
return pipeline_layout->push_constant_base_index;
}
iree_host_size_t iree_hal_cuda2_pipeline_layout_push_constant_count(
iree_hal_pipeline_layout_t* base_pipeline_layout) {
iree_hal_cuda2_pipeline_layout_t* pipeline_layout =
iree_hal_cuda2_pipeline_layout_cast(base_pipeline_layout);
return pipeline_layout->push_constant_count;
}
static const iree_hal_pipeline_layout_vtable_t
iree_hal_cuda2_pipeline_layout_vtable = {
.destroy = iree_hal_cuda2_pipeline_layout_destroy,
};