This enables the object backend for s390x, in particular the processing of all required relocations. This uncovered a bug: we need to use PLT relocations for the target of calls, which we currently do not. Fixed by adding a new S390xPLTRel32Dbl reloc type and using it where needed.
106 lines
4.2 KiB
Rust
106 lines
4.2 KiB
Rust
//! Binary machine code emission.
|
|
//!
|
|
//! The `binemit` module contains code for translating Cranelift's intermediate representation into
|
|
//! binary machine code.
|
|
|
|
mod stack_map;
|
|
|
|
pub use self::stack_map::StackMap;
|
|
use core::fmt;
|
|
#[cfg(feature = "enable-serde")]
|
|
use serde::{Deserialize, Serialize};
|
|
|
|
/// Offset in bytes from the beginning of the function.
|
|
///
|
|
/// Cranelift can be used as a cross compiler, so we don't want to use a type like `usize` which
|
|
/// depends on the *host* platform, not the *target* platform.
|
|
pub type CodeOffset = u32;
|
|
|
|
/// Addend to add to the symbol value.
|
|
pub type Addend = i64;
|
|
|
|
/// Relocation kinds for every ISA
|
|
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
|
|
#[cfg_attr(feature = "enable-serde", derive(Serialize, Deserialize))]
|
|
pub enum Reloc {
|
|
/// absolute 4-byte
|
|
Abs4,
|
|
/// absolute 8-byte
|
|
Abs8,
|
|
/// x86 PC-relative 4-byte
|
|
X86PCRel4,
|
|
/// x86 call to PC-relative 4-byte
|
|
X86CallPCRel4,
|
|
/// x86 call to PLT-relative 4-byte
|
|
X86CallPLTRel4,
|
|
/// x86 GOT PC-relative 4-byte
|
|
X86GOTPCRel4,
|
|
/// Arm32 call target
|
|
Arm32Call,
|
|
/// Arm64 call target. Encoded as bottom 26 bits of instruction. This
|
|
/// value is sign-extended, multiplied by 4, and added to the PC of
|
|
/// the call instruction to form the destination address.
|
|
Arm64Call,
|
|
/// s390x PC-relative 4-byte offset
|
|
S390xPCRel32Dbl,
|
|
/// s390x PC-relative 4-byte offset to PLT
|
|
S390xPLTRel32Dbl,
|
|
|
|
/// Elf x86_64 32 bit signed PC relative offset to two GOT entries for GD symbol.
|
|
ElfX86_64TlsGd,
|
|
|
|
/// Mach-O x86_64 32 bit signed PC relative offset to a `__thread_vars` entry.
|
|
MachOX86_64Tlv,
|
|
|
|
/// AArch64 TLS GD
|
|
/// Set an ADRP immediate field to the top 21 bits of the final address. Checks for overflow.
|
|
/// This is equivalent to `R_AARCH64_TLSGD_ADR_PAGE21` in the [aaelf64](https://github.com/ARM-software/abi-aa/blob/2bcab1e3b22d55170c563c3c7940134089176746/aaelf64/aaelf64.rst#relocations-for-thread-local-storage)
|
|
Aarch64TlsGdAdrPage21,
|
|
|
|
/// AArch64 TLS GD
|
|
/// Set the add immediate field to the low 12 bits of the final address. Does not check for overflow.
|
|
/// This is equivalent to `R_AARCH64_TLSGD_ADD_LO12_NC` in the [aaelf64](https://github.com/ARM-software/abi-aa/blob/2bcab1e3b22d55170c563c3c7940134089176746/aaelf64/aaelf64.rst#relocations-for-thread-local-storage)
|
|
Aarch64TlsGdAddLo12Nc,
|
|
|
|
/// s390x TLS GD64 - 64-bit offset of tls_index for GD symbol in GOT
|
|
S390xTlsGd64,
|
|
/// s390x TLS GDCall - marker to enable optimization of TLS calls
|
|
S390xTlsGdCall,
|
|
}
|
|
|
|
impl fmt::Display for Reloc {
|
|
/// Display trait implementation drops the arch, since its used in contexts where the arch is
|
|
/// already unambiguous, e.g. clif syntax with isa specified. In other contexts, use Debug.
|
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
|
match *self {
|
|
Self::Abs4 => write!(f, "Abs4"),
|
|
Self::Abs8 => write!(f, "Abs8"),
|
|
Self::S390xPCRel32Dbl => write!(f, "PCRel32Dbl"),
|
|
Self::S390xPLTRel32Dbl => write!(f, "PLTRel32Dbl"),
|
|
Self::X86PCRel4 => write!(f, "PCRel4"),
|
|
Self::X86CallPCRel4 => write!(f, "CallPCRel4"),
|
|
Self::X86CallPLTRel4 => write!(f, "CallPLTRel4"),
|
|
Self::X86GOTPCRel4 => write!(f, "GOTPCRel4"),
|
|
Self::Arm32Call | Self::Arm64Call => write!(f, "Call"),
|
|
|
|
Self::ElfX86_64TlsGd => write!(f, "ElfX86_64TlsGd"),
|
|
Self::MachOX86_64Tlv => write!(f, "MachOX86_64Tlv"),
|
|
Self::Aarch64TlsGdAdrPage21 => write!(f, "Aarch64TlsGdAdrPage21"),
|
|
Self::Aarch64TlsGdAddLo12Nc => write!(f, "Aarch64TlsGdAddLo12Nc"),
|
|
Self::S390xTlsGd64 => write!(f, "TlsGd64"),
|
|
Self::S390xTlsGdCall => write!(f, "TlsGdCall"),
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Container for information about a vector of compiled code and its supporting read-only data.
|
|
///
|
|
/// The code starts at offset 0 and is followed optionally by relocatable jump tables and copyable
|
|
/// (raw binary) read-only data. Any padding between sections is always part of the section that
|
|
/// precedes the boundary between the sections.
|
|
#[derive(PartialEq)]
|
|
pub struct CodeInfo {
|
|
/// Number of bytes in total.
|
|
pub total_size: CodeOffset,
|
|
}
|