blob: b41f900b0c31ba7d9930ffca91c95e76e39aadee [file] [log] [blame]
// Copyright 2023 The IREE Authors
//
// Licensed under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#include <stdio.h>
#include "iree/base/api.h"
#include "iree/base/internal/file_io.h"
#include "iree/base/internal/path.h"
#include "iree/hal/local/elf/fatelf.h"
// NOTE: we don't verify ELF information in here and just pass it along. Don't
// run this on untrusted ELFs.
// NOTE: errors are handled in here just enough to get error messages - we don't
// care about leaks on failure as the process is going to die right away.
// TODO(benvanik): make this based on the archs used? It needs to be the common
// page size across all targets used within the file.
#define IREE_FATELF_PAGE_SIZE 4096
#if defined(IREE_PLATFORM_WINDOWS)
#include <fcntl.h>
#include <io.h>
#define IREE_SET_BINARY_MODE(handle) _setmode(_fileno(handle), O_BINARY)
#else
#define IREE_SET_BINARY_MODE(handle) ((void)0)
#endif // IREE_PLATFORM_WINDOWS
static int print_usage() {
fprintf(stderr, "Syntax: iree-fatelf [join|split|select|dump] files...\n");
fprintf(stderr, "\n");
fprintf(stderr, "Join multiple ELFs into a FatELF:\n");
fprintf(stderr, " iree-fatelf join elf_a.so elf_b.so > fatelf.sos\n");
fprintf(stderr, "\n");
fprintf(stderr, "Split a FatELF into multiple ELF files (to dir):\n");
fprintf(stderr, " iree-fatelf split fatelf.sos\n");
fprintf(stderr, "\n");
fprintf(stderr, "Select a FatELF matching the current arch:\n");
fprintf(stderr, " iree-fatelf select fatelf.sos > elf.so\n");
fprintf(stderr, "\n");
fprintf(stderr, "Dump header records:\n");
fprintf(stderr, " iree-fatelf dump fatelf.sos\n");
fprintf(stderr, "\n");
return 1;
}
// NOTE: this is somewhat redundant with fatelf.c but that's ok - this is a
// developer tool and I'd rather have the implementation linked into every
// runtime be kept as simple as possible than not repeating 100 lines of code.
// The runtime version is also designed to gracefully accept ELF files where
// here we only want FatELF files.
static iree_status_t fatelf_parse(iree_const_byte_span_t file_data,
iree_fatelf_header_t** out_header) {
*out_header = NULL;
if (file_data.data_length <
sizeof(iree_fatelf_header_t) + sizeof(iree_fatelf_record_t)) {
return iree_make_status(
IREE_STATUS_INVALID_ARGUMENT,
"file does not have enough data to even hold a FatELF header");
}
const iree_fatelf_header_t* raw_header =
(const iree_fatelf_header_t*)file_data.data;
iree_fatelf_header_t host_header = {
.magic = iree_unaligned_load_le_u32(&raw_header->magic),
.version = iree_unaligned_load_le_u16(&raw_header->version),
.record_count = iree_unaligned_load_le_u8(&raw_header->record_count),
.reserved = iree_unaligned_load_le_u8(&raw_header->reserved),
};
if (host_header.magic != IREE_FATELF_MAGIC) {
return iree_make_status(
IREE_STATUS_INVALID_ARGUMENT,
"file magic %08X does not match expected FatELF magic %08X",
host_header.magic, IREE_FATELF_MAGIC);
}
if (host_header.version != IREE_FATELF_FORMAT_VERSION) {
return iree_make_status(
IREE_STATUS_UNIMPLEMENTED,
"FatELF has version %d but runtime only supports version %d",
host_header.version, IREE_FATELF_FORMAT_VERSION);
}
iree_host_size_t required_bytes =
sizeof(iree_fatelf_header_t) +
host_header.record_count * sizeof(iree_fatelf_record_t);
if (file_data.data_length < required_bytes) {
return iree_make_status(IREE_STATUS_INVALID_ARGUMENT,
"FatELF file truncated, requires at least %" PRIhsz
"B for headers but only have %" PRIhsz
"B available",
required_bytes, file_data.data_length);
}
// Allocate storage for the parsed header and records.
iree_fatelf_header_t* header = NULL;
IREE_RETURN_IF_ERROR(iree_allocator_malloc(
iree_allocator_system(),
sizeof(iree_fatelf_header_t) +
host_header.record_count * sizeof(iree_fatelf_record_t),
(void**)&header));
memcpy(header, &host_header, sizeof(*header));
for (iree_elf64_byte_t i = 0; i < host_header.record_count; ++i) {
const iree_fatelf_record_t* raw_record = &raw_header->records[i];
const iree_fatelf_record_t host_record = {
.machine = iree_unaligned_load_le_u16(&raw_record->machine),
.osabi = iree_unaligned_load_le_u8(&raw_record->osabi),
.osabi_version = iree_unaligned_load_le_u8(&raw_record->osabi_version),
.word_size = iree_unaligned_load_le_u8(&raw_record->word_size),
.byte_order = iree_unaligned_load_le_u8(&raw_record->byte_order),
.reserved0 = iree_unaligned_load_le_u8(&raw_record->reserved0),
.reserved1 = iree_unaligned_load_le_u8(&raw_record->reserved1),
.offset = iree_unaligned_load_le_u64(&raw_record->offset),
.size = iree_unaligned_load_le_u64(&raw_record->size),
};
memcpy(&header->records[i], &host_record, sizeof(host_record));
}
*out_header = header;
return iree_ok_status();
}
// Tries to parse basic ELF metadata from |elf_data|.
// Very little verification done. Note that this must support both 32 and 64-bit
// ELF files regardless of the tool host configuration.
// The returned fields match the ELF spec and may differ from FatELF.
static iree_status_t fatelf_parse_elf_metadata(
iree_const_byte_span_t elf_data, iree_elf64_half_t* out_machine,
iree_elf64_byte_t* out_osabi, iree_elf64_byte_t* out_osabi_version,
iree_elf64_byte_t* out_elf_class, iree_elf64_byte_t* out_elf_data) {
*out_machine = 0;
*out_osabi = 0;
*out_osabi_version = 0;
*out_elf_data = 0;
*out_elf_class = 0;
if (elf_data.data_length < sizeof(iree_elf32_ehdr_t)) {
return iree_make_status(IREE_STATUS_FAILED_PRECONDITION,
"ELF data provided (%" PRIhsz
") is smaller than ehdr (%zu)",
elf_data.data_length, sizeof(iree_elf32_ehdr_t));
}
// The fields we're checking are the same in both 32 and 64 classes so we just
// use 32 for consistency.
const iree_elf32_ehdr_t* ehdr = (const iree_elf32_ehdr_t*)elf_data.data;
static const iree_elf_byte_t elf_magic[4] = {0x7F, 'E', 'L', 'F'};
if (memcmp(ehdr->e_ident, elf_magic, sizeof(elf_magic)) != 0) {
return iree_make_status(
IREE_STATUS_FAILED_PRECONDITION,
"data provided does not contain the ELF identifier");
}
*out_osabi = ehdr->e_ident[IREE_ELF_EI_OSABI];
*out_osabi_version = ehdr->e_ident[IREE_ELF_EI_ABIVERSION];
*out_elf_class = ehdr->e_ident[IREE_ELF_EI_CLASS];
*out_elf_data = ehdr->e_ident[IREE_ELF_EI_DATA];
// Note machine is multibyte and respects the declared endianness.
if (ehdr->e_ident[IREE_ELF_EI_DATA] == IREE_ELF_ELFDATA2LSB) {
*out_machine = iree_unaligned_load_le_u16(&ehdr->e_machine);
} else {
#if IREE_ENDIANNESS_BIG
// TODO(benvanik): helpers for big<->little endian
// *out_machine = iree_unaligned_load_be_u16(&ehdr->e_machine);
#error "ELF parsing support only available on little-endian systems today"
#endif // IREE_ENDIANNESS_BIG
}
return iree_ok_status();
}
typedef struct {
uint64_t offset;
iree_file_contents_t* contents;
iree_const_byte_span_t elf_data;
} fatelf_entry_t;
// Joins one or more ELF files together and writes the output to stdout.
static iree_status_t fatelf_join(int argc, char** argv) {
IREE_SET_BINARY_MODE(stdout); // ensure binary output mode
#if IREE_ENDIANNESS_BIG
#error "FatELF writing support only available on little-endian systems today"
#endif // IREE_ENDIANNESS_BIG
// Load all source files.
iree_elf64_byte_t entry_count = argc;
fatelf_entry_t* entries =
(fatelf_entry_t*)iree_alloca(entry_count * sizeof(fatelf_entry_t));
memset(entries, 0, entry_count * sizeof(*entries));
for (iree_elf64_byte_t i = 0; i < entry_count; ++i) {
IREE_RETURN_IF_ERROR(
iree_file_read_contents(argv[i], IREE_FILE_READ_FLAG_DEFAULT,
iree_allocator_system(), &entries[i].contents));
entries[i].elf_data = entries[i].contents->const_buffer;
}
// Compute offsets of all files based on their size and padding.
uint64_t file_offset = iree_host_align(
sizeof(iree_fatelf_header_t) + entry_count * sizeof(iree_fatelf_record_t),
IREE_FATELF_PAGE_SIZE);
for (iree_elf64_byte_t i = 0; i < entry_count; ++i) {
entries[i].offset = file_offset;
file_offset += iree_host_align(
entries[i].contents->const_buffer.data_length, IREE_FATELF_PAGE_SIZE);
}
// Write header without records.
iree_fatelf_header_t host_header = {
.magic = IREE_FATELF_MAGIC,
.version = IREE_FATELF_FORMAT_VERSION,
.record_count = entry_count,
.reserved = 0,
};
fwrite(&host_header, 1, sizeof(host_header), stdout);
// Write all records.
for (iree_elf64_byte_t i = 0; i < entry_count; ++i) {
iree_elf64_half_t machine = 0;
iree_elf64_byte_t osabi = 0;
iree_elf64_byte_t osabi_version = 0;
iree_elf64_byte_t elf_class = 0;
iree_elf64_byte_t elf_data = 0;
IREE_RETURN_IF_ERROR(
fatelf_parse_elf_metadata(entries[i].elf_data, &machine, &osabi,
&osabi_version, &elf_class, &elf_data));
iree_fatelf_record_t host_record = {
.machine = machine,
.osabi = osabi,
.osabi_version = osabi_version,
.word_size = elf_class == IREE_ELF_ELFCLASS32
? IREE_FATELF_WORD_SIZE_32
: IREE_FATELF_WORD_SIZE_64,
.byte_order = elf_data == IREE_ELF_ELFDATA2LSB
? IREE_FATELF_BYTE_ORDER_LSB
: IREE_FATELF_BYTE_ORDER_MSB,
.reserved0 = 0,
.reserved1 = 0,
.offset = (iree_elf64_off_t)entries[i].offset,
.size = (iree_elf64_xword_t)entries[i].elf_data.data_length,
};
fwrite(&host_record, 1, sizeof(host_record), stdout);
}
// Write all files, padding with zeros in-between as needed.
uint64_t write_offset =
sizeof(iree_fatelf_header_t) + entry_count * sizeof(iree_fatelf_record_t);
for (iree_elf64_byte_t i = 0; i < entry_count; ++i) {
uint64_t padding = entries[i].offset - write_offset;
for (uint64_t i = 0; i < padding; ++i) fputc(0, stdout);
write_offset += padding;
if (write_offset != entries[i].offset) {
return iree_make_status(IREE_STATUS_INTERNAL,
"actual offset does not match expected");
}
fwrite(entries[i].elf_data.data, 1, entries[i].elf_data.data_length,
stdout);
write_offset += entries[i].elf_data.data_length;
}
fflush(stdout);
for (iree_elf64_byte_t i = 0; i < entry_count; ++i) {
iree_file_contents_free(entries[i].contents);
}
return iree_ok_status();
}
static const char* fatelf_machine_id_str(iree_elf64_half_t value) {
// TODO(benvanik): include a full table from the spec?
// http://formats.kaitai.io/elf/ has a good source of canonical short names.
// For now we just support what we have in our ELF loader.
switch (value) {
case 0x03: // EM_386 / 3
return "x86";
case 0x28: // EM_ARM / 40
return "arm";
case 0xB7: // EM_AARCH64 / 183
return "aarch64";
case 0xF3: // EM_RISCV / 243
return "risvc";
case 0x3E: // EM_X86_64 / 62
return "x86_64";
default:
return "unknown";
}
}
static const char* fatelf_osabi_id_str(iree_elf64_byte_t value) {
switch (value) {
case IREE_ELF_ELFOSABI_NONE:
return "none";
case IREE_ELF_ELFOSABI_LINUX:
return "linux";
case IREE_ELF_ELFOSABI_STANDALONE:
return "standalone";
default:
return "unknown";
}
}
static const char* fatelf_word_size_id_str(iree_elf64_byte_t value) {
switch (value) {
case IREE_FATELF_WORD_SIZE_32:
return "lp32";
case IREE_FATELF_WORD_SIZE_64:
return "lp64";
default:
return "lpUNK";
}
}
static const char* fatelf_byte_order_id_str(iree_elf64_byte_t value) {
switch (value) {
case IREE_FATELF_BYTE_ORDER_MSB:
return "be";
case IREE_FATELF_BYTE_ORDER_LSB:
return "le";
default:
return "xx";
}
}
// Splits a FatELF into multiple files, writing each beside the input file.
static iree_status_t fatelf_split(int argc, char** argv) {
iree_file_contents_t* fatelf_contents = NULL;
IREE_RETURN_IF_ERROR(
iree_file_read_contents(argv[0], IREE_FILE_READ_FLAG_DEFAULT,
iree_allocator_system(), &fatelf_contents));
iree_fatelf_header_t* header = NULL;
IREE_RETURN_IF_ERROR(fatelf_parse(fatelf_contents->const_buffer, &header));
iree_string_view_t dirname, basename;
iree_file_path_split(iree_make_cstring_view(argv[0]), &dirname, &basename);
iree_string_view_t stem, extension;
iree_file_path_split_basename(basename, &stem, &extension);
for (iree_elf64_byte_t i = 0; i < header->record_count; ++i) {
const iree_fatelf_record_t* record = &header->records[i];
const char* machine_str = fatelf_machine_id_str(record->machine);
const char* osabi_str = fatelf_osabi_id_str(record->osabi);
const char* word_size_str = fatelf_word_size_id_str(record->word_size);
const char* byte_order_str = fatelf_byte_order_id_str(record->byte_order);
char record_path[2048];
iree_host_size_t record_path_length =
snprintf(record_path, IREE_ARRAYSIZE(record_path),
"%.*s%s%.*s.%s_%s_%s%s.so", (int)dirname.size, dirname.data,
dirname.size ? "/" : "", (int)stem.size, stem.data,
machine_str, osabi_str, word_size_str, byte_order_str);
record_path_length =
iree_file_path_canonicalize(record_path, record_path_length);
fprintf(stdout, "Writing record[%d] to '%.*s'...\n", i,
(int)record_path_length, record_path);
iree_const_byte_span_t record_data = iree_make_const_byte_span(
fatelf_contents->const_buffer.data + record->offset, record->size);
IREE_RETURN_IF_ERROR(iree_file_write_contents(record_path, record_data));
}
fprintf(stdout, "Wrote %d records to %.*s!\n", header->record_count,
(int)dirname.size, dirname.data);
iree_allocator_free(iree_allocator_system(), header);
iree_file_contents_free(fatelf_contents);
return iree_ok_status();
}
// Selects the ELF matching the current host config from a FatELF and writes
// it to stdout.
static iree_status_t fatelf_select(int argc, char** argv) {
IREE_SET_BINARY_MODE(stdout); // ensure binary output mode
iree_file_contents_t* fatelf_contents = NULL;
IREE_RETURN_IF_ERROR(
iree_file_read_contents(argv[0], IREE_FILE_READ_FLAG_DEFAULT,
iree_allocator_system(), &fatelf_contents));
iree_const_byte_span_t elf_data = iree_const_byte_span_empty();
IREE_RETURN_IF_ERROR(
iree_fatelf_select(fatelf_contents->const_buffer, &elf_data));
fwrite(elf_data.data, 1, elf_data.data_length, stdout);
iree_file_contents_free(fatelf_contents);
return iree_ok_status();
}
static const char* fatelf_word_size_enum_str(iree_elf64_byte_t value) {
switch (value) {
case IREE_FATELF_WORD_SIZE_32:
return "ELFCLASS32";
case IREE_FATELF_WORD_SIZE_64:
return "ELFCLASS64";
default:
return "<unknown>";
}
}
static const char* fatelf_byte_order_enum_str(iree_elf64_byte_t value) {
switch (value) {
case IREE_FATELF_BYTE_ORDER_MSB:
return "ELFDATA2MSB (big-endian)";
case IREE_FATELF_BYTE_ORDER_LSB:
return "ELFDATA2LSB (little-endian)";
default:
return "<unknown>";
}
}
// Dumps the FatELF file records.
static iree_status_t fatelf_dump(int argc, char** argv) {
iree_file_contents_t* fatelf_contents = NULL;
IREE_RETURN_IF_ERROR(
iree_file_read_contents(argv[0], IREE_FILE_READ_FLAG_DEFAULT,
iree_allocator_system(), &fatelf_contents));
iree_fatelf_header_t* header = NULL;
IREE_RETURN_IF_ERROR(fatelf_parse(fatelf_contents->const_buffer, &header));
fprintf(stdout, "iree_fatelf_header_t:\n");
fprintf(stdout, " magic: %" PRIX32 "\n", header->magic);
fprintf(stdout, " version: %d\n", header->version);
fprintf(stdout, " records: %d\n", header->record_count);
fprintf(stdout, " reserved: %" PRIX8 "\n", header->reserved);
fprintf(stdout, "\n");
for (iree_elf64_byte_t i = 0; i < header->record_count; ++i) {
const iree_fatelf_record_t* record = &header->records[i];
fprintf(stdout, "iree_fatelf_record_t[%d]:\n", i);
fprintf(stdout, " machine: %d / %04X = %s\n", record->machine,
record->machine, fatelf_machine_id_str(record->machine));
fprintf(stdout, " osabi: %d / %02X = %s\n", record->osabi,
record->osabi, fatelf_osabi_id_str(record->osabi));
fprintf(stdout, " version: %d / %02X\n", record->osabi_version,
record->osabi_version);
fprintf(stdout, " word_size: %d / %02X = %s\n", record->word_size,
record->word_size, fatelf_word_size_enum_str(record->word_size));
fprintf(stdout, " byte_order: %d / %02X = %s\n", record->byte_order,
record->byte_order, fatelf_byte_order_enum_str(record->byte_order));
fprintf(stdout, " reserved0: %d / %02X\n", record->reserved0,
record->reserved0);
fprintf(stdout, " reserved1: %d / %02X\n", record->reserved1,
record->reserved1);
fprintf(stdout, " offset: %" PRIu64 " / %016" PRIX64 "\n",
record->offset, record->offset);
fprintf(stdout, " size: %" PRIu64 " / %016" PRIX64 "\n", record->size,
record->size);
fprintf(stdout, "\n");
}
iree_allocator_free(iree_allocator_system(), header);
iree_file_contents_free(fatelf_contents);
return iree_ok_status();
}
int main(int argc, char** argv) {
if (argc < 2) {
return print_usage();
}
char* command = argv[1];
int command_argc = argc - 2;
char** command_argv = argv + 2;
iree_status_t status = iree_ok_status();
if (strcmp(command, "join") == 0) {
if (command_argc < 1) return print_usage();
status = fatelf_join(command_argc, command_argv);
} else if (strcmp(command, "split") == 0) {
if (command_argc != 1) return print_usage();
status = fatelf_split(command_argc, command_argv);
} else if (strcmp(command, "select") == 0) {
if (command_argc != 1) return print_usage();
status = fatelf_select(command_argc, command_argv);
} else if (strcmp(command, "dump") == 0) {
if (command_argc != 1) return print_usage();
status = fatelf_dump(command_argc, command_argv);
} else {
return print_usage();
}
if (!iree_status_is_ok(status)) {
fprintf(stderr, "iree-fatelf encountered error:\n");
iree_status_fprint(stderr, status);
iree_status_free(status);
return 1;
}
return 0;
}