[otbn,sw] Change how we expose OTBN symbols to Ibex Before this commit, we made this work by linking against the OTBN ELF file, after dropping the sections that couldn't be seen (.scratchpad) and fiddling around with names and section flags. Once that was done, Ibex code could get initialised OTBN data by looking at the special symbol. What's more, we could convert one of these symbols into an OTBN address by subtracting the base of DMEM. (There are some other wrinkles to do with .bss sections, but that's the basic idea). This commit simplifies what Ibex does by putting a bit more of the "symbol relocation" logic into the build system. We still link against a mangled OTBN ELF file, but this now exposes symbols in two different ways: - Any code or initialised data (.text or .data) gets copied across as before. Symbols pointing into these sections get a prefix that looks like "_otbn_local_app_APPNAME_". (Here, local because the value of the symbol is an Ibex address). - Zero-initialised data (.bss) now gets dropped and doesn't appear in the Ibex image at all. In particular, this means that Ibex won't allocate an unused chunk of zeros in its own .bss section. - All visible symbols get added a second time, but this time with the "_otbn_remote_app_APPNAME_" prefix. These have been turned into ABS symbols, which means that they will keep their (OTBN) addresses and won't get relocated when linking. The Ibex driver code can get pointers to the OTBN .text/.data sections (which are .rodata as far as Ibex is concerned) with a similar set of macros as before. However, application code probably won't need to do this and we've actually got rid of the otbn_ptr_t type that was being used there and added some warning messages. Most Ibex code that's interacting with OTBN *really* just wants to copy stuff from the OTBN address space. 
So we've now got a new type (otbn_addr_t, which is just a uint32_t) and a couple of new macros (OTBN_DECLARE_SYMBOL_ADDR, OTBN_ADDR_T_INIT) to initialise it. This works with the second sort of symbol described above and is just an integer holding an OTBN address. The otbn_copy_data_to_otbn and otbn_copy_data_from_otbn functions have been switched to use otbn_addr_t instead of otbn_ptr_t, which makes a bit more sense since they fundamentally want an OTBN address. Finally, otbn_data_ptr_to_dmem_addr can now be removed! If code actually wants to know how to map between the addresses of two symbols, it should just use both of the macro types above and everything will get resolved at link time, with no computation needed at runtime. Signed-off-by: Rupert Swarbrick <rswarbrick@lowrisc.org>

commit: 48b9a95dc6883fbe8a2b48f668ee1de5eba2f600 [log] [tgz]
author: Rupert Swarbrick <rswarbrick@lowrisc.org> Fri Jan 14 16:20:16 2022 +0000
committer: Rupert Swarbrick <rswarbrick@gmail.com> Tue Jan 18 15:31:06 2022 +0000
tree: 01d1b91f38c9e9974d952ada83b5537ea29f61bf
parent: 51abd9f8d94d9a362c49b2de851ff17d6bee5d46 [diff] [blame]
diff --git a/util/otbn_build.py b/util/otbn_build.py
index 68957bb..11e3be9 100755
--- a/util/otbn_build.py
+++ b/util/otbn_build.py

@@ -43,7 +43,10 @@
 import sys
 import tempfile
 from pathlib import Path
-from typing import List, Optional
+from typing import List, Optional, Tuple
+
+from elftools.elf.elffile import ELFFile, SymbolTableSection  # type: ignore
+
 
 REPO_TOP = Path(__file__).parent.parent.resolve()
 
@@ -127,6 +130,43 @@
     run_cmd([rv32_tool_ar] + args)
 
 
+def get_otbn_syms(elf_path: str) -> List[Tuple[str, int]]:
+    '''Get externally-visible symbols from an ELF
+
+    Symbols are returned as a list of pairs: (name, address). This
+    discards locals and also anything in .scratchpad, since those addresses
+    aren't bus-accessible.
+    '''
+    with tempfile.TemporaryDirectory() as tmpdir:
+        # First, run objcopy to discard local symbols and the .scratchpad
+        # section. We also use --extract-symbol since we don't care about
+        # anything but the symbol data anyway.
+        syms_path = os.path.join(tmpdir, 'syms.elf')
+        call_rv32_objcopy(['-O', 'elf32-littleriscv',
+                           '--remove-section=.scratchpad',
+                           '--extract-symbol'] +
+                          [elf_path, syms_path])
+
+        # Load the file and use elftools to grab any symbol table
+        with open(syms_path, 'rb') as syms_fd:
+            syms_file = ELFFile(syms_fd)
+            symtab = syms_file.get_section_by_name('.symtab')
+            if symtab is None or not isinstance(symtab, SymbolTableSection):
+                # No symbol table found or we did find a section called
+                # .symtab, but it isn't actually a symbol table (huh?!). Give
+                # up.
+                return []
+
+            ret = []
+            for sym in symtab.iter_symbols():
+                if sym['st_info']['bind'] != 'STB_GLOBAL':
+                    continue
+                addr = sym['st_value']
+                assert isinstance(addr, int)
+                ret.append((sym.name, addr))
+            return ret
+
+
 def main() -> int:
     parser = argparse.ArgumentParser(description=__doc__,
                                      formatter_class=argparse.RawDescriptionHelpFormatter)
@@ -184,34 +224,42 @@
         out_elf = out_dir / (app_name + '.elf')
         call_otbn_ld(obj_files, out_elf, linker_script = args.linker_script)
 
-        # Use objcopy to create an ELF that can be linked into a RISC-V binary
-        # (to run on Ibex). This should set flags for all sections to look like
-        # rodata (since they're not executable on Ibex, nor does it make sense
-        # for Ibex code to manipulate OTBN data sections "in place"). We name
-        # them with a .otbn prefix, so end up with e.g. .rodata.otbn.text and
-        # .rodata.otbn.data.
+        # out_elf is a fully-linked OTBN binary, but we want to be able to use
+        # it from Ibex, the host processor. To make this work, we generate an
+        # ELF file that can be linked into the Ibex image.
         #
-        # Symbols that are exposed by the binary (including those giving the
-        # start and end of imem and dmem) will be relocated as part of the
-        # link, so they'll give addresses in the Ibex address space. So that
-        # the RISC-V binary can link multiple OTBN applications, we give them
-        # an application-specific prefix. (Note: This prefix is used in
-        # sw/device/lib/runtime/otbn.h: so needs to be kept in sync with that).
-        sym_pfx = '_otbn_app_{}_'.format(app_name)
+        # This ELF contains all initialised data (the .text and .data
+        # sections). We change the flags to treat them like rodata (since
+        # they're not executable on Ibex, nor does it make sense for Ibex code
+        # to manipulate OTBN data sections "in place") and add a .rodata.otbn
+        # prefix to the section names.
+        #
+        # The symbols exposed by the binary will be relocated as part of the
+        # link, so they'll point into the Ibex address space. To allow linking
+        # against multiple OTBN applications, we give the symbols an
+        # application-specific prefix. (Note: This prefix is used in driver
+        # code: so needs to be kept in sync with that).
+        #
+        # As well as the initialised data and relocated symbols, we also want
+        # to add (absolute) symbols that have the OTBN addresses of the symbols
+        # in question. Unfortunately, objcopy doesn't seem to have a "make all
+        # symbols absolute" command, so we have to do it by hand. This also
+        # means constructing an enormous objcopy command line :-/ If we run out
+        # of space, we might have to use elftools to inject the addresses after
+        # the objcopy.
+        host_side_pfx = '_otbn_local_app_{}_'.format(app_name)
+        otbn_side_pfx = '_otbn_remote_app_{}_'.format(app_name)
         out_embedded_obj = out_dir / (app_name + '.rv32embed.o')
-        args = (['-O', 'elf32-littleriscv',
-                 '--set-section-flags=*=alloc,load,readonly',
-                 '--set-section-flags=.bss=alloc,readonly',
-                 '--rename-section=.text=.rodata.otbn.text',
-                 '--rename-section=.start=.rodata.otbn.start',
-                 '--rename-section=.data=.rodata.otbn.data',
-                 '--rename-section=.bss=.bss.otbn.bss',
-                 '--remove-section=.scratchpad',
-                 '--prefix-symbols', sym_pfx] +
-                [out_elf,
-                 out_embedded_obj])
+        args = ['-O', 'elf32-littleriscv',
+                '--set-section-flags=*=alloc,load,readonly',
+                '--remove-section=.scratchpad',
+                '--remove-section=.bss',
+                '--prefix-sections=.rodata.otbn',
+                '--prefix-symbols', host_side_pfx]
+        for name, addr in get_otbn_syms(out_elf):
+            args += ['--add-symbol', f'{otbn_side_pfx}{name}=0x{addr:x}']
 
-        call_rv32_objcopy(args)
+        call_rv32_objcopy(args + [out_elf, out_embedded_obj])
 
         # After objcopy has finished, we have to do a little surgery to
         # overwrite the ELF e_type field (a 16-bit little-endian number at file
commit	48b9a95dc6883fbe8a2b48f668ee1de5eba2f600	[log] [tgz]
author	Rupert Swarbrick <rswarbrick@lowrisc.org>	Fri Jan 14 16:20:16 2022 +0000
committer	Rupert Swarbrick <rswarbrick@gmail.com>	Tue Jan 18 15:31:06 2022 +0000
tree	01d1b91f38c9e9974d952ada83b5537ea29f61bf
parent	51abd9f8d94d9a362c49b2de851ff17d6bee5d46 [diff] [blame]