| // Copyright 2023 The IREE Authors |
| // |
| // Licensed under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| |
| #include <stdio.h> |
| |
| #include "iree/base/api.h" |
| #include "iree/base/internal/file_io.h" |
| #include "iree/base/internal/path.h" |
| #include "iree/hal/local/elf/fatelf.h" |
| |
| // NOTE: we don't verify ELF information in here and just pass it along. Don't |
| // run this on untrusted ELFs. |
| |
| // NOTE: errors are handled in here just enough to get error messages - we don't |
| // care about leaks on failure as the process is going to die right away. |
| |
| // TODO(benvanik): make this based on the archs used? It needs to be the common |
| // page size across all targets used within the file. |
| #define IREE_FATELF_PAGE_SIZE 4096 |
| |
| #if defined(IREE_PLATFORM_WINDOWS) |
| #include <fcntl.h> |
| #include <io.h> |
| #define IREE_SET_BINARY_MODE(handle) _setmode(_fileno(handle), O_BINARY) |
| #else |
| #define IREE_SET_BINARY_MODE(handle) ((void)0) |
| #endif // IREE_PLATFORM_WINDOWS |
| |
| static int print_usage() { |
| fprintf(stderr, "Syntax: iree-fatelf [join|split|select|dump] files...\n"); |
| fprintf(stderr, "\n"); |
| fprintf(stderr, "Join multiple ELFs into a FatELF:\n"); |
| fprintf(stderr, " iree-fatelf join elf_a.so elf_b.so > fatelf.sos\n"); |
| fprintf(stderr, "\n"); |
| fprintf(stderr, "Split a FatELF into multiple ELF files (to dir):\n"); |
| fprintf(stderr, " iree-fatelf split fatelf.sos\n"); |
| fprintf(stderr, "\n"); |
| fprintf(stderr, "Select a FatELF matching the current arch:\n"); |
| fprintf(stderr, " iree-fatelf select fatelf.sos > elf.so\n"); |
| fprintf(stderr, "\n"); |
| fprintf(stderr, "Dump header records:\n"); |
| fprintf(stderr, " iree-fatelf dump fatelf.sos\n"); |
| fprintf(stderr, "\n"); |
| return 1; |
| } |
| |
| // NOTE: this is somewhat redundant with fatelf.c but that's ok - this is a |
| // developer tool and I'd rather have the implementation linked into every |
| // runtime be kept as simple as possible than not repeating 100 lines of code. |
| // The runtime version is also designed to gracefully accept ELF files where |
| // here we only want FatELF files. |
| static iree_status_t fatelf_parse(iree_const_byte_span_t file_data, |
| iree_fatelf_header_t** out_header) { |
| *out_header = NULL; |
| |
| if (file_data.data_length < |
| sizeof(iree_fatelf_header_t) + sizeof(iree_fatelf_record_t)) { |
| return iree_make_status( |
| IREE_STATUS_INVALID_ARGUMENT, |
| "file does not have enough data to even hold a FatELF header"); |
| } |
| |
| const iree_fatelf_header_t* raw_header = |
| (const iree_fatelf_header_t*)file_data.data; |
| iree_fatelf_header_t host_header = { |
| .magic = iree_unaligned_load_le_u32(&raw_header->magic), |
| .version = iree_unaligned_load_le_u16(&raw_header->version), |
| .record_count = iree_unaligned_load_le_u8(&raw_header->record_count), |
| .reserved = iree_unaligned_load_le_u8(&raw_header->reserved), |
| }; |
| |
| if (host_header.magic != IREE_FATELF_MAGIC) { |
| return iree_make_status( |
| IREE_STATUS_INVALID_ARGUMENT, |
| "file magic %08X does not match expected FatELF magic %08X", |
| host_header.magic, IREE_FATELF_MAGIC); |
| } |
| if (host_header.version != IREE_FATELF_FORMAT_VERSION) { |
| return iree_make_status( |
| IREE_STATUS_UNIMPLEMENTED, |
| "FatELF has version %d but runtime only supports version %d", |
| host_header.version, IREE_FATELF_FORMAT_VERSION); |
| } |
| |
| iree_host_size_t required_bytes = |
| sizeof(iree_fatelf_header_t) + |
| host_header.record_count * sizeof(iree_fatelf_record_t); |
| if (file_data.data_length < required_bytes) { |
| return iree_make_status(IREE_STATUS_INVALID_ARGUMENT, |
| "FatELF file truncated, requires at least %" PRIhsz |
| "B for headers but only have %" PRIhsz |
| "B available", |
| required_bytes, file_data.data_length); |
| } |
| |
| // Allocate storage for the parsed header and records. |
| iree_fatelf_header_t* header = NULL; |
| IREE_RETURN_IF_ERROR(iree_allocator_malloc( |
| iree_allocator_system(), |
| sizeof(iree_fatelf_header_t) + |
| host_header.record_count * sizeof(iree_fatelf_record_t), |
| (void**)&header)); |
| memcpy(header, &host_header, sizeof(*header)); |
| for (iree_elf64_byte_t i = 0; i < host_header.record_count; ++i) { |
| const iree_fatelf_record_t* raw_record = &raw_header->records[i]; |
| const iree_fatelf_record_t host_record = { |
| .machine = iree_unaligned_load_le_u16(&raw_record->machine), |
| .osabi = iree_unaligned_load_le_u8(&raw_record->osabi), |
| .osabi_version = iree_unaligned_load_le_u8(&raw_record->osabi_version), |
| .word_size = iree_unaligned_load_le_u8(&raw_record->word_size), |
| .byte_order = iree_unaligned_load_le_u8(&raw_record->byte_order), |
| .reserved0 = iree_unaligned_load_le_u8(&raw_record->reserved0), |
| .reserved1 = iree_unaligned_load_le_u8(&raw_record->reserved1), |
| .offset = iree_unaligned_load_le_u64(&raw_record->offset), |
| .size = iree_unaligned_load_le_u64(&raw_record->size), |
| }; |
| memcpy(&header->records[i], &host_record, sizeof(host_record)); |
| } |
| |
| *out_header = header; |
| return iree_ok_status(); |
| } |
| |
| // Tries to parse basic ELF metadata from |elf_data|. |
| // Very little verification done. Note that this must support both 32 and 64-bit |
| // ELF files regardless of the tool host configuration. |
| // The returned fields match the ELF spec and may differ from FatELF. |
| static iree_status_t fatelf_parse_elf_metadata( |
| iree_const_byte_span_t elf_data, iree_elf64_half_t* out_machine, |
| iree_elf64_byte_t* out_osabi, iree_elf64_byte_t* out_osabi_version, |
| iree_elf64_byte_t* out_elf_class, iree_elf64_byte_t* out_elf_data) { |
| *out_machine = 0; |
| *out_osabi = 0; |
| *out_osabi_version = 0; |
| *out_elf_data = 0; |
| *out_elf_class = 0; |
| |
| if (elf_data.data_length < sizeof(iree_elf32_ehdr_t)) { |
| return iree_make_status(IREE_STATUS_FAILED_PRECONDITION, |
| "ELF data provided (%" PRIhsz |
| ") is smaller than ehdr (%zu)", |
| elf_data.data_length, sizeof(iree_elf32_ehdr_t)); |
| } |
| |
| // The fields we're checking are the same in both 32 and 64 classes so we just |
| // use 32 for consistency. |
| const iree_elf32_ehdr_t* ehdr = (const iree_elf32_ehdr_t*)elf_data.data; |
| static const iree_elf_byte_t elf_magic[4] = {0x7F, 'E', 'L', 'F'}; |
| if (memcmp(ehdr->e_ident, elf_magic, sizeof(elf_magic)) != 0) { |
| return iree_make_status( |
| IREE_STATUS_FAILED_PRECONDITION, |
| "data provided does not contain the ELF identifier"); |
| } |
| |
| *out_osabi = ehdr->e_ident[IREE_ELF_EI_OSABI]; |
| *out_osabi_version = ehdr->e_ident[IREE_ELF_EI_ABIVERSION]; |
| *out_elf_class = ehdr->e_ident[IREE_ELF_EI_CLASS]; |
| *out_elf_data = ehdr->e_ident[IREE_ELF_EI_DATA]; |
| |
| // Note machine is multibyte and respects the declared endianness. |
| if (ehdr->e_ident[IREE_ELF_EI_DATA] == IREE_ELF_ELFDATA2LSB) { |
| *out_machine = iree_unaligned_load_le_u16(&ehdr->e_machine); |
| } else { |
| #if IREE_ENDIANNESS_BIG |
| // TODO(benvanik): helpers for big<->little endian |
| // *out_machine = iree_unaligned_load_be_u16(&ehdr->e_machine); |
| #error "ELF parsing support only available on little-endian systems today" |
| #endif // IREE_ENDIANNESS_BIG |
| } |
| |
| return iree_ok_status(); |
| } |
| |
| typedef struct { |
| uint64_t offset; |
| iree_file_contents_t* contents; |
| iree_const_byte_span_t elf_data; |
| } fatelf_entry_t; |
| |
| // Joins one or more ELF files together and writes the output to stdout. |
| static iree_status_t fatelf_join(int argc, char** argv) { |
| IREE_SET_BINARY_MODE(stdout); // ensure binary output mode |
| |
| #if IREE_ENDIANNESS_BIG |
| #error "FatELF writing support only available on little-endian systems today" |
| #endif // IREE_ENDIANNESS_BIG |
| |
| // Load all source files. |
| iree_elf64_byte_t entry_count = argc; |
| fatelf_entry_t* entries = |
| (fatelf_entry_t*)iree_alloca(entry_count * sizeof(fatelf_entry_t)); |
| memset(entries, 0, entry_count * sizeof(*entries)); |
| for (iree_elf64_byte_t i = 0; i < entry_count; ++i) { |
| IREE_RETURN_IF_ERROR( |
| iree_file_read_contents(argv[i], IREE_FILE_READ_FLAG_DEFAULT, |
| iree_allocator_system(), &entries[i].contents)); |
| entries[i].elf_data = entries[i].contents->const_buffer; |
| } |
| |
| // Compute offsets of all files based on their size and padding. |
| uint64_t file_offset = iree_host_align( |
| sizeof(iree_fatelf_header_t) + entry_count * sizeof(iree_fatelf_record_t), |
| IREE_FATELF_PAGE_SIZE); |
| for (iree_elf64_byte_t i = 0; i < entry_count; ++i) { |
| entries[i].offset = file_offset; |
| file_offset += iree_host_align( |
| entries[i].contents->const_buffer.data_length, IREE_FATELF_PAGE_SIZE); |
| } |
| |
| // Write header without records. |
| iree_fatelf_header_t host_header = { |
| .magic = IREE_FATELF_MAGIC, |
| .version = IREE_FATELF_FORMAT_VERSION, |
| .record_count = entry_count, |
| .reserved = 0, |
| }; |
| fwrite(&host_header, 1, sizeof(host_header), stdout); |
| |
| // Write all records. |
| for (iree_elf64_byte_t i = 0; i < entry_count; ++i) { |
| iree_elf64_half_t machine = 0; |
| iree_elf64_byte_t osabi = 0; |
| iree_elf64_byte_t osabi_version = 0; |
| iree_elf64_byte_t elf_class = 0; |
| iree_elf64_byte_t elf_data = 0; |
| IREE_RETURN_IF_ERROR( |
| fatelf_parse_elf_metadata(entries[i].elf_data, &machine, &osabi, |
| &osabi_version, &elf_class, &elf_data)); |
| iree_fatelf_record_t host_record = { |
| .machine = machine, |
| .osabi = osabi, |
| .osabi_version = osabi_version, |
| .word_size = elf_class == IREE_ELF_ELFCLASS32 |
| ? IREE_FATELF_WORD_SIZE_32 |
| : IREE_FATELF_WORD_SIZE_64, |
| .byte_order = elf_data == IREE_ELF_ELFDATA2LSB |
| ? IREE_FATELF_BYTE_ORDER_LSB |
| : IREE_FATELF_BYTE_ORDER_MSB, |
| .reserved0 = 0, |
| .reserved1 = 0, |
| .offset = (iree_elf64_off_t)entries[i].offset, |
| .size = (iree_elf64_xword_t)entries[i].elf_data.data_length, |
| }; |
| fwrite(&host_record, 1, sizeof(host_record), stdout); |
| } |
| |
| // Write all files, padding with zeros in-between as needed. |
| uint64_t write_offset = |
| sizeof(iree_fatelf_header_t) + entry_count * sizeof(iree_fatelf_record_t); |
| for (iree_elf64_byte_t i = 0; i < entry_count; ++i) { |
| uint64_t padding = entries[i].offset - write_offset; |
| for (uint64_t i = 0; i < padding; ++i) fputc(0, stdout); |
| write_offset += padding; |
| if (write_offset != entries[i].offset) { |
| return iree_make_status(IREE_STATUS_INTERNAL, |
| "actual offset does not match expected"); |
| } |
| fwrite(entries[i].elf_data.data, 1, entries[i].elf_data.data_length, |
| stdout); |
| write_offset += entries[i].elf_data.data_length; |
| } |
| fflush(stdout); |
| |
| for (iree_elf64_byte_t i = 0; i < entry_count; ++i) { |
| iree_file_contents_free(entries[i].contents); |
| } |
| return iree_ok_status(); |
| } |
| |
| static const char* fatelf_machine_id_str(iree_elf64_half_t value) { |
| // TODO(benvanik): include a full table from the spec? |
| // http://formats.kaitai.io/elf/ has a good source of canonical short names. |
| // For now we just support what we have in our ELF loader. |
| switch (value) { |
| case 0x03: // EM_386 / 3 |
| return "x86"; |
| case 0x28: // EM_ARM / 40 |
| return "arm"; |
| case 0xB7: // EM_AARCH64 / 183 |
| return "aarch64"; |
| case 0xF3: // EM_RISCV / 243 |
| return "risvc"; |
| case 0x3E: // EM_X86_64 / 62 |
| return "x86_64"; |
| default: |
| return "unknown"; |
| } |
| } |
| |
| static const char* fatelf_osabi_id_str(iree_elf64_byte_t value) { |
| switch (value) { |
| case IREE_ELF_ELFOSABI_NONE: |
| return "none"; |
| case IREE_ELF_ELFOSABI_LINUX: |
| return "linux"; |
| case IREE_ELF_ELFOSABI_STANDALONE: |
| return "standalone"; |
| default: |
| return "unknown"; |
| } |
| } |
| |
| static const char* fatelf_word_size_id_str(iree_elf64_byte_t value) { |
| switch (value) { |
| case IREE_FATELF_WORD_SIZE_32: |
| return "lp32"; |
| case IREE_FATELF_WORD_SIZE_64: |
| return "lp64"; |
| default: |
| return "lpUNK"; |
| } |
| } |
| |
| static const char* fatelf_byte_order_id_str(iree_elf64_byte_t value) { |
| switch (value) { |
| case IREE_FATELF_BYTE_ORDER_MSB: |
| return "be"; |
| case IREE_FATELF_BYTE_ORDER_LSB: |
| return "le"; |
| default: |
| return "xx"; |
| } |
| } |
| |
| // Splits a FatELF into multiple files, writing each beside the input file. |
| static iree_status_t fatelf_split(int argc, char** argv) { |
| iree_file_contents_t* fatelf_contents = NULL; |
| IREE_RETURN_IF_ERROR( |
| iree_file_read_contents(argv[0], IREE_FILE_READ_FLAG_DEFAULT, |
| iree_allocator_system(), &fatelf_contents)); |
| iree_fatelf_header_t* header = NULL; |
| IREE_RETURN_IF_ERROR(fatelf_parse(fatelf_contents->const_buffer, &header)); |
| |
| iree_string_view_t dirname, basename; |
| iree_file_path_split(iree_make_cstring_view(argv[0]), &dirname, &basename); |
| iree_string_view_t stem, extension; |
| iree_file_path_split_basename(basename, &stem, &extension); |
| |
| for (iree_elf64_byte_t i = 0; i < header->record_count; ++i) { |
| const iree_fatelf_record_t* record = &header->records[i]; |
| |
| const char* machine_str = fatelf_machine_id_str(record->machine); |
| const char* osabi_str = fatelf_osabi_id_str(record->osabi); |
| const char* word_size_str = fatelf_word_size_id_str(record->word_size); |
| const char* byte_order_str = fatelf_byte_order_id_str(record->byte_order); |
| |
| char record_path[2048]; |
| iree_host_size_t record_path_length = |
| snprintf(record_path, IREE_ARRAYSIZE(record_path), |
| "%.*s%s%.*s.%s_%s_%s%s.so", (int)dirname.size, dirname.data, |
| dirname.size ? "/" : "", (int)stem.size, stem.data, |
| machine_str, osabi_str, word_size_str, byte_order_str); |
| record_path_length = |
| iree_file_path_canonicalize(record_path, record_path_length); |
| |
| fprintf(stdout, "Writing record[%d] to '%.*s'...\n", i, |
| (int)record_path_length, record_path); |
| |
| iree_const_byte_span_t record_data = iree_make_const_byte_span( |
| fatelf_contents->const_buffer.data + record->offset, record->size); |
| IREE_RETURN_IF_ERROR(iree_file_write_contents(record_path, record_data)); |
| } |
| |
| fprintf(stdout, "Wrote %d records to %.*s!\n", header->record_count, |
| (int)dirname.size, dirname.data); |
| iree_allocator_free(iree_allocator_system(), header); |
| iree_file_contents_free(fatelf_contents); |
| return iree_ok_status(); |
| } |
| |
| // Selects the ELF matching the current host config from a FatELF and writes |
| // it to stdout. |
| static iree_status_t fatelf_select(int argc, char** argv) { |
| IREE_SET_BINARY_MODE(stdout); // ensure binary output mode |
| iree_file_contents_t* fatelf_contents = NULL; |
| IREE_RETURN_IF_ERROR( |
| iree_file_read_contents(argv[0], IREE_FILE_READ_FLAG_DEFAULT, |
| iree_allocator_system(), &fatelf_contents)); |
| iree_const_byte_span_t elf_data = iree_const_byte_span_empty(); |
| IREE_RETURN_IF_ERROR( |
| iree_fatelf_select(fatelf_contents->const_buffer, &elf_data)); |
| fwrite(elf_data.data, 1, elf_data.data_length, stdout); |
| iree_file_contents_free(fatelf_contents); |
| return iree_ok_status(); |
| } |
| |
| static const char* fatelf_word_size_enum_str(iree_elf64_byte_t value) { |
| switch (value) { |
| case IREE_FATELF_WORD_SIZE_32: |
| return "ELFCLASS32"; |
| case IREE_FATELF_WORD_SIZE_64: |
| return "ELFCLASS64"; |
| default: |
| return "<unknown>"; |
| } |
| } |
| |
| static const char* fatelf_byte_order_enum_str(iree_elf64_byte_t value) { |
| switch (value) { |
| case IREE_FATELF_BYTE_ORDER_MSB: |
| return "ELFDATA2MSB (big-endian)"; |
| case IREE_FATELF_BYTE_ORDER_LSB: |
| return "ELFDATA2LSB (little-endian)"; |
| default: |
| return "<unknown>"; |
| } |
| } |
| |
| // Dumps the FatELF file records. |
| static iree_status_t fatelf_dump(int argc, char** argv) { |
| iree_file_contents_t* fatelf_contents = NULL; |
| IREE_RETURN_IF_ERROR( |
| iree_file_read_contents(argv[0], IREE_FILE_READ_FLAG_DEFAULT, |
| iree_allocator_system(), &fatelf_contents)); |
| iree_fatelf_header_t* header = NULL; |
| IREE_RETURN_IF_ERROR(fatelf_parse(fatelf_contents->const_buffer, &header)); |
| |
| fprintf(stdout, "iree_fatelf_header_t:\n"); |
| fprintf(stdout, " magic: %" PRIX32 "\n", header->magic); |
| fprintf(stdout, " version: %d\n", header->version); |
| fprintf(stdout, " records: %d\n", header->record_count); |
| fprintf(stdout, " reserved: %" PRIX8 "\n", header->reserved); |
| fprintf(stdout, "\n"); |
| |
| for (iree_elf64_byte_t i = 0; i < header->record_count; ++i) { |
| const iree_fatelf_record_t* record = &header->records[i]; |
| fprintf(stdout, "iree_fatelf_record_t[%d]:\n", i); |
| fprintf(stdout, " machine: %d / %04X = %s\n", record->machine, |
| record->machine, fatelf_machine_id_str(record->machine)); |
| fprintf(stdout, " osabi: %d / %02X = %s\n", record->osabi, |
| record->osabi, fatelf_osabi_id_str(record->osabi)); |
| fprintf(stdout, " version: %d / %02X\n", record->osabi_version, |
| record->osabi_version); |
| fprintf(stdout, " word_size: %d / %02X = %s\n", record->word_size, |
| record->word_size, fatelf_word_size_enum_str(record->word_size)); |
| fprintf(stdout, " byte_order: %d / %02X = %s\n", record->byte_order, |
| record->byte_order, fatelf_byte_order_enum_str(record->byte_order)); |
| fprintf(stdout, " reserved0: %d / %02X\n", record->reserved0, |
| record->reserved0); |
| fprintf(stdout, " reserved1: %d / %02X\n", record->reserved1, |
| record->reserved1); |
| fprintf(stdout, " offset: %" PRIu64 " / %016" PRIX64 "\n", |
| record->offset, record->offset); |
| fprintf(stdout, " size: %" PRIu64 " / %016" PRIX64 "\n", record->size, |
| record->size); |
| fprintf(stdout, "\n"); |
| } |
| |
| iree_allocator_free(iree_allocator_system(), header); |
| iree_file_contents_free(fatelf_contents); |
| return iree_ok_status(); |
| } |
| |
| int main(int argc, char** argv) { |
| if (argc < 2) { |
| return print_usage(); |
| } |
| |
| char* command = argv[1]; |
| int command_argc = argc - 2; |
| char** command_argv = argv + 2; |
| |
| iree_status_t status = iree_ok_status(); |
| if (strcmp(command, "join") == 0) { |
| if (command_argc < 1) return print_usage(); |
| status = fatelf_join(command_argc, command_argv); |
| } else if (strcmp(command, "split") == 0) { |
| if (command_argc != 1) return print_usage(); |
| status = fatelf_split(command_argc, command_argv); |
| } else if (strcmp(command, "select") == 0) { |
| if (command_argc != 1) return print_usage(); |
| status = fatelf_select(command_argc, command_argv); |
| } else if (strcmp(command, "dump") == 0) { |
| if (command_argc != 1) return print_usage(); |
| status = fatelf_dump(command_argc, command_argv); |
| } else { |
| return print_usage(); |
| } |
| |
| if (!iree_status_is_ok(status)) { |
| fprintf(stderr, "iree-fatelf encountered error:\n"); |
| iree_status_fprint(stderr, status); |
| iree_status_free(status); |
| return 1; |
| } |
| return 0; |
| } |