Remove dependency on TargetIsa from Wasmtime crates (#3178)

This commit started off by deleting the `cranelift_codegen::settings`
reexport in the `wasmtime-environ` crate and then basically played
whack-a-mole until everything compiled again. The main result of this is
that the `wasmtime-*` family of crates now has generally less of a
dependency on the `TargetIsa` trait and type from Cranelift. While the
dependency isn't entirely severed yet, this is at least a significant
start.

This commit is intended to be largely refactorings; no functional
changes are intended here. The refactorings are:

* A `CompilerBuilder` trait has been added to `wasmtime_environ` which
  serves as an abstraction used to create compilers and configure them
  in a uniform fashion (a sketch follows this list). The
  `wasmtime::Config` type now uses this instead of cranelift-specific
  settings. The `wasmtime-jit` crate exports the ability to create a
  compiler builder from a `CompilationStrategy`, which only works for
  Cranelift right now. In a cranelift-less build of Wasmtime this is
  expected to return a trait object that fails all requests to compile.

* The `Compiler` trait in the `wasmtime_environ` crate has been souped
  up with a number of methods that Wasmtime and other crates needed.

* The `wasmtime-debug` crate is now moved entirely behind the
  `wasmtime-cranelift` crate.

* The `wasmtime-cranelift` crate is now only depended on by the
  `wasmtime-jit` crate.

* Wasm types in `cranelift-wasm` no longer contain their IR type;
  instead they only contain the `WasmType` (see the before/after sketch
  after this list). This is required to get everything to align
  correctly, but will also be required in a future refactoring where
  the types used by `cranelift-wasm` will be extracted to a separate
  crate.

* I moved around a fair bit of code in `wasmtime-cranelift`.

* Some gdb/JIT-specific code has moved from `wasmtime-debug` to
  `wasmtime-jit` (the new `crates/jit/src/debug.rs` shown below).
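
As a concrete illustration of the first bullet, here is a minimal
sketch of what such a builder abstraction can look like. The
placeholder `Compiler` trait and the method names/signatures below are
illustrative assumptions, not the exact items added by this commit:

    // Stand-in for the real `wasmtime_environ::Compiler` trait so that
    // this sketch is self-contained.
    pub trait Compiler {
        fn name(&self) -> &str;
    }

    // Backend-agnostic configuration: a `Config`-like type can drive
    // this without knowing whether Cranelift (or any compiler) is
    // present.
    pub trait CompilerBuilder: Send + Sync {
        /// Select the target to generate code for, e.g. a target triple.
        fn target(&mut self, target: &str) -> Result<(), String>;
        /// Set a named, string-valued compiler option.
        fn set(&mut self, name: &str, value: &str) -> Result<(), String>;
        /// Consume the configuration and produce a compiler; a build of
        /// Wasmtime without a compiler backend would return an error (or
        /// a compiler that fails all compilation requests).
        fn build(&self) -> Result<Box<dyn Compiler>, String>;
    }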
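
For the `cranelift-wasm` type change, a hedged before/after sketch; the
type and field names here are made up for illustration and are not the
actual `cranelift-wasm` definitions:

    // `WasmType` is a trimmed stand-in for the cranelift-wasm enum and
    // `IrType` stands in for Cranelift's `ir::Type`; both are
    // assumptions made so this sketch compiles on its own.
    #[derive(Clone, Copy)]
    enum WasmType { I32, I64, F32, F64 }
    #[derive(Clone, Copy)]
    struct IrType(u16);

    // Before: a wasm entity type carried both the wasm-level type and
    // the Cranelift IR type it lowers to.
    struct GlobalTypeBefore { wasm_ty: WasmType, ir_ty: IrType }

    // After: only the wasm-level type is stored; the IR type is derived
    // inside the compiler where it is actually needed.
    struct GlobalTypeAfter { wasm_ty: WasmType }
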
Alex Crichton, 2021-08-16 09:55:39 -05:00 (committed via GitHub)
commit 0313e30d76, parent 7c0948fe0b
47 changed files with 1529 additions and 1384 deletions

crates/jit/src/debug.rs (new file, 212 lines)

@@ -0,0 +1,212 @@
use anyhow::{bail, ensure, Error};
use object::endian::{BigEndian, Endian, Endianness, LittleEndian};
use object::{RelocationEncoding, RelocationKind};
use std::collections::HashMap;

/// Patches the DWARF-bearing object in `bytes` so it can be handed to the
/// GDB JIT interface: function relocations are resolved against the actual
/// addresses in `funcs`, and a loadable segment covering `code_region` is
/// appended.
pub fn create_gdbjit_image(
    mut bytes: Vec<u8>,
    code_region: (*const u8, usize),
    defined_funcs_offset: usize,
    funcs: &[*const u8],
) -> Result<Vec<u8>, Error> {
    let e = ensure_supported_elf_format(&bytes)?;

    // patch relocs
    relocate_dwarf_sections(&bytes, defined_funcs_offset, funcs)?;

    // elf is still missing details...
    match e {
        Endianness::Little => {
            convert_object_elf_to_loadable_file::<LittleEndian>(&mut bytes, code_region)
        }
        Endianness::Big => {
            convert_object_elf_to_loadable_file::<BigEndian>(&mut bytes, code_region)
        }
    }

    // let mut file = ::std::fs::File::create(::std::path::Path::new("test.o")).expect("file");
    // ::std::io::Write::write_all(&mut file, &bytes).expect("write");

    Ok(bytes)
}
/// Rewrites absolute 64-bit relocations that target `_wasm_function_*`
/// symbols so they point at the actual function addresses in `funcs`.
fn relocate_dwarf_sections(
    bytes: &[u8],
    defined_funcs_offset: usize,
    funcs: &[*const u8],
) -> Result<(), Error> {
    use object::read::{File, Object, ObjectSection, ObjectSymbol, RelocationTarget};

    let obj = File::parse(bytes)?;

    // Map each `_wasm_function_N` symbol to the address of defined function
    // `N - defined_funcs_offset`.
    let mut func_symbols = HashMap::new();
    for sym in obj.symbols() {
        match (sym.name(), sym.section_index()) {
            (Ok(name), Some(_section_index)) if name.starts_with("_wasm_function_") => {
                let index = name["_wasm_function_".len()..].parse::<usize>()?;
                let data = funcs[index - defined_funcs_offset];
                func_symbols.insert(sym.index(), data);
            }
            _ => (),
        }
    }

    for section in obj.sections() {
        for (off, r) in section.relocations() {
            // Only absolute, generic, 64-bit relocations are patched here.
            if r.kind() != RelocationKind::Absolute
                || r.encoding() != RelocationEncoding::Generic
                || r.size() != 64
            {
                continue;
            }
            let data = match r.target() {
                RelocationTarget::Symbol(ref index) => func_symbols.get(index),
                _ => None,
            };
            let data: *const u8 = match data {
                Some(data) => *data,
                None => {
                    continue;
                }
            };
            let target = (data as u64).wrapping_add(r.addend() as u64);
            let entry_ptr = section.data_range(off, 8).unwrap().unwrap().as_ptr();
            unsafe {
                std::ptr::write(entry_ptr as *mut u64, target);
            }
        }
    }
    Ok(())
}
/// Checks that `bytes` is a 64-bit ELF object for a supported machine with no
/// program header table yet, and returns its endianness.
fn ensure_supported_elf_format(bytes: &[u8]) -> Result<Endianness, Error> {
    use object::elf::*;
    use object::read::elf::*;
    use std::mem::size_of;

    let kind = match object::FileKind::parse(bytes) {
        Ok(file) => file,
        Err(err) => {
            bail!("Failed to parse file: {}", err);
        }
    };
    let header = match kind {
        object::FileKind::Elf64 => match object::elf::FileHeader64::<Endianness>::parse(bytes) {
            Ok(header) => header,
            Err(err) => {
                bail!("Unsupported ELF file: {}", err);
            }
        },
        _ => {
            bail!("only 64-bit ELF files currently supported")
        }
    };
    let e = header.endian().unwrap();
    match header.e_machine.get(e) {
        EM_AARCH64 => (),
        EM_X86_64 => (),
        EM_S390 => (),
        machine => {
            bail!("Unsupported ELF target machine: {:x}", machine);
        }
    }
    ensure!(
        header.e_phoff.get(e) == 0 && header.e_phnum.get(e) == 0,
        "program header table is empty"
    );
    let e_shentsize = header.e_shentsize.get(e);
    let req_shentsize = match e {
        Endianness::Little => size_of::<SectionHeader64<LittleEndian>>(),
        Endianness::Big => size_of::<SectionHeader64<BigEndian>>(),
    };
    ensure!(e_shentsize as usize == req_shentsize, "size of sh");
    Ok(e)
}
/// Turns the relocatable ELF in `bytes` into a minimally loadable file: the
/// `.text` section's virtual address is pointed at `code_region` and a single
/// `PT_LOAD` program header covering it is appended.
fn convert_object_elf_to_loadable_file<E: Endian>(
    bytes: &mut Vec<u8>,
    code_region: (*const u8, usize),
) {
    use object::elf::*;
    use std::ffi::CStr;
    use std::mem::size_of;
    use std::os::raw::c_char;

    let e = E::default();
    let header: &FileHeader64<E> = unsafe { &*(bytes.as_mut_ptr() as *const FileHeader64<_>) };
    let e_shentsize = header.e_shentsize.get(e);
    let e_shoff = header.e_shoff.get(e);
    let e_shnum = header.e_shnum.get(e);

    // Find the section name string table so section names can be looked up.
    let mut shstrtab_off = 0;
    for i in 0..e_shnum {
        let off = e_shoff as isize + i as isize * e_shentsize as isize;
        let section: &SectionHeader64<E> =
            unsafe { &*(bytes.as_ptr().offset(off) as *const SectionHeader64<_>) };
        if section.sh_type.get(e) != SHT_STRTAB {
            continue;
        }
        shstrtab_off = section.sh_offset.get(e);
    }

    let mut segment: Option<_> = None;
    for i in 0..e_shnum {
        let off = e_shoff as isize + i as isize * e_shentsize as isize;
        let section: &mut SectionHeader64<E> =
            unsafe { &mut *(bytes.as_mut_ptr().offset(off) as *mut SectionHeader64<_>) };
        if section.sh_type.get(e) != SHT_PROGBITS {
            continue;
        }
        // It is a SHT_PROGBITS section, but check sh_name to ensure it is
        // our `.text` section.
        let sh_name_off = section.sh_name.get(e);
        let sh_name = unsafe {
            CStr::from_ptr(
                bytes
                    .as_ptr()
                    .offset((shstrtab_off + sh_name_off as u64) as isize)
                    as *const c_char,
            )
            .to_str()
            .expect("name")
        };
        if sh_name != ".text" {
            continue;
        }
        assert!(segment.is_none());
        // Patch the virtual address, and save the file location and its size.
        section.sh_addr.set(e, code_region.0 as u64);
        let sh_offset = section.sh_offset.get(e);
        let sh_size = section.sh_size.get(e);
        segment = Some((sh_offset, sh_size));
    }

    // LLDB wants a segment with the virtual address set; place it at the end
    // of the ELF image.
    let ph_off = bytes.len();
    let e_phentsize = size_of::<ProgramHeader64<E>>();
    let e_phnum = 1;
    bytes.resize(ph_off + e_phentsize * e_phnum, 0);
    if let Some((sh_offset, sh_size)) = segment {
        let (v_offset, size) = code_region;
        let program: &mut ProgramHeader64<E> =
            unsafe { &mut *(bytes.as_ptr().add(ph_off) as *mut ProgramHeader64<_>) };
        program.p_type.set(e, PT_LOAD);
        program.p_offset.set(e, sh_offset);
        program.p_vaddr.set(e, v_offset as u64);
        program.p_paddr.set(e, v_offset as u64);
        program.p_filesz.set(e, sh_size);
        program.p_memsz.set(e, size as u64);
    } else {
        unreachable!();
    }

    // The buffer is now a somewhat loadable ELF file; update the file header
    // to point at the new program header table.
    let header: &mut FileHeader64<E> =
        unsafe { &mut *(bytes.as_mut_ptr() as *mut FileHeader64<_>) };
    header.e_type.set(e, ET_DYN);
    header.e_phoff.set(e, ph_off as u64);
    header.e_phentsize.set(e, e_phentsize as u16);
    header.e_phnum.set(e, e_phnum as u16);
}
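
For orientation, a hypothetical call-site sketch for
`create_gdbjit_image`; every variable name below is an illustrative
assumption rather than code from this commit, and `defined_funcs_offset`
is presumed to be the index of the first defined function (i.e. the
number of imported functions), judging from how it is used above:

    // Hypothetical caller inside the JIT, not code from this commit.
    let image = create_gdbjit_image(
        dwarf_obj_bytes,        // object file bytes carrying the DWARF
        (code_ptr, code_len),   // base and length of the mapped code
        num_imported_funcs,     // offset of the first defined function
        &defined_func_addrs,    // address of each defined function body
    )?;
    // `image` would then be handed to the in-process GDB JIT
    // registration so debuggers can locate the generated code.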