* Rework the blockorder module to reuse the dom tree's cfg postorder * Update domtree tests * Treat br_table with an empty jump table as multiple block exits * Bless tests * Change branch_idx to succ_idx and fix the comment
510 lines
19 KiB
Rust
510 lines
19 KiB
Rust
//! X86_64-bit Instruction Set Architecture.
|
|
|
|
pub use self::inst::{args, EmitInfo, EmitState, Inst};
|
|
|
|
use super::{OwnedTargetIsa, TargetIsa};
|
|
use crate::dominator_tree::DominatorTree;
|
|
use crate::ir::{condcodes::IntCC, Function, Type};
|
|
#[cfg(feature = "unwind")]
|
|
use crate::isa::unwind::systemv;
|
|
use crate::isa::x64::{inst::regs::create_reg_env_systemv, settings as x64_settings};
|
|
use crate::isa::Builder as IsaBuilder;
|
|
use crate::machinst::{
|
|
compile, CompiledCode, CompiledCodeStencil, MachTextSectionBuilder, Reg, SigSet,
|
|
TextSectionBuilder, VCode,
|
|
};
|
|
use crate::result::{CodegenError, CodegenResult};
|
|
use crate::settings::{self as shared_settings, Flags};
|
|
use alloc::{boxed::Box, vec::Vec};
|
|
use core::fmt;
|
|
use regalloc2::MachineEnv;
|
|
use target_lexicon::Triple;
|
|
|
|
mod abi;
|
|
pub mod encoding;
|
|
mod inst;
|
|
mod lower;
|
|
pub mod settings;
|
|
|
|
/// An X64 backend.
|
|
pub(crate) struct X64Backend {
|
|
triple: Triple,
|
|
flags: Flags,
|
|
x64_flags: x64_settings::Flags,
|
|
reg_env: MachineEnv,
|
|
}
|
|
|
|
impl X64Backend {
|
|
/// Create a new X64 backend with the given (shared) flags.
|
|
fn new_with_flags(triple: Triple, flags: Flags, x64_flags: x64_settings::Flags) -> Self {
|
|
let reg_env = create_reg_env_systemv(&flags);
|
|
Self {
|
|
triple,
|
|
flags,
|
|
x64_flags,
|
|
reg_env,
|
|
}
|
|
}
|
|
|
|
fn compile_vcode(
|
|
&self,
|
|
func: &Function,
|
|
domtree: &DominatorTree,
|
|
) -> CodegenResult<(VCode<inst::Inst>, regalloc2::Output)> {
|
|
// This performs lowering to VCode, register-allocates the code, computes
|
|
// block layout and finalizes branches. The result is ready for binary emission.
|
|
let emit_info = EmitInfo::new(self.flags.clone(), self.x64_flags.clone());
|
|
let sigs = SigSet::new::<abi::X64ABIMachineSpec>(func, &self.flags)?;
|
|
let abi = abi::X64Callee::new(func, self, &self.x64_flags, &sigs)?;
|
|
compile::compile::<Self>(func, domtree, self, abi, emit_info, sigs)
|
|
}
|
|
}
|
|
|
|
impl TargetIsa for X64Backend {
|
|
fn compile_function(
|
|
&self,
|
|
func: &Function,
|
|
domtree: &DominatorTree,
|
|
want_disasm: bool,
|
|
) -> CodegenResult<CompiledCodeStencil> {
|
|
let (vcode, regalloc_result) = self.compile_vcode(func, domtree)?;
|
|
|
|
let emit_result = vcode.emit(
|
|
®alloc_result,
|
|
want_disasm,
|
|
self.flags.machine_code_cfg_info(),
|
|
);
|
|
let frame_size = emit_result.frame_size;
|
|
let value_labels_ranges = emit_result.value_labels_ranges;
|
|
let buffer = emit_result.buffer.finish();
|
|
let sized_stackslot_offsets = emit_result.sized_stackslot_offsets;
|
|
let dynamic_stackslot_offsets = emit_result.dynamic_stackslot_offsets;
|
|
|
|
if let Some(disasm) = emit_result.disasm.as_ref() {
|
|
log::trace!("disassembly:\n{}", disasm);
|
|
}
|
|
|
|
Ok(CompiledCodeStencil {
|
|
buffer,
|
|
frame_size,
|
|
vcode: emit_result.disasm,
|
|
value_labels_ranges,
|
|
sized_stackslot_offsets,
|
|
dynamic_stackslot_offsets,
|
|
bb_starts: emit_result.bb_offsets,
|
|
bb_edges: emit_result.bb_edges,
|
|
alignment: emit_result.alignment,
|
|
})
|
|
}
|
|
|
|
fn flags(&self) -> &Flags {
|
|
&self.flags
|
|
}
|
|
|
|
fn machine_env(&self) -> &MachineEnv {
|
|
&self.reg_env
|
|
}
|
|
|
|
fn isa_flags(&self) -> Vec<shared_settings::Value> {
|
|
self.x64_flags.iter().collect()
|
|
}
|
|
|
|
fn dynamic_vector_bytes(&self, _dyn_ty: Type) -> u32 {
|
|
16
|
|
}
|
|
|
|
fn name(&self) -> &'static str {
|
|
"x64"
|
|
}
|
|
|
|
fn triple(&self) -> &Triple {
|
|
&self.triple
|
|
}
|
|
|
|
fn unsigned_add_overflow_condition(&self) -> IntCC {
|
|
// Unsigned `<`; this corresponds to the carry flag set on x86, which
|
|
// indicates an add has overflowed.
|
|
IntCC::UnsignedLessThan
|
|
}
|
|
|
|
#[cfg(feature = "unwind")]
|
|
fn emit_unwind_info(
|
|
&self,
|
|
result: &CompiledCode,
|
|
kind: crate::machinst::UnwindInfoKind,
|
|
) -> CodegenResult<Option<crate::isa::unwind::UnwindInfo>> {
|
|
use crate::isa::unwind::UnwindInfo;
|
|
use crate::machinst::UnwindInfoKind;
|
|
Ok(match kind {
|
|
UnwindInfoKind::SystemV => {
|
|
let mapper = self::inst::unwind::systemv::RegisterMapper;
|
|
Some(UnwindInfo::SystemV(
|
|
crate::isa::unwind::systemv::create_unwind_info_from_insts(
|
|
&result.buffer.unwind_info[..],
|
|
result.buffer.data().len(),
|
|
&mapper,
|
|
)?,
|
|
))
|
|
}
|
|
UnwindInfoKind::Windows => Some(UnwindInfo::WindowsX64(
|
|
crate::isa::unwind::winx64::create_unwind_info_from_insts::<
|
|
self::inst::unwind::winx64::RegisterMapper,
|
|
>(&result.buffer.unwind_info[..])?,
|
|
)),
|
|
_ => None,
|
|
})
|
|
}
|
|
|
|
#[cfg(feature = "unwind")]
|
|
fn create_systemv_cie(&self) -> Option<gimli::write::CommonInformationEntry> {
|
|
Some(inst::unwind::systemv::create_cie())
|
|
}
|
|
|
|
#[cfg(feature = "unwind")]
|
|
fn map_regalloc_reg_to_dwarf(&self, reg: Reg) -> Result<u16, systemv::RegisterMappingError> {
|
|
inst::unwind::systemv::map_reg(reg).map(|reg| reg.0)
|
|
}
|
|
|
|
fn text_section_builder(&self, num_funcs: usize) -> Box<dyn TextSectionBuilder> {
|
|
Box::new(MachTextSectionBuilder::<inst::Inst>::new(num_funcs))
|
|
}
|
|
|
|
/// Align functions on x86 to 16 bytes, ensuring that rip-relative loads to SSE registers are
|
|
/// always from aligned memory.
|
|
fn function_alignment(&self) -> u32 {
|
|
16
|
|
}
|
|
|
|
#[cfg(feature = "disas")]
|
|
fn to_capstone(&self) -> Result<capstone::Capstone, capstone::Error> {
|
|
use capstone::prelude::*;
|
|
Capstone::new()
|
|
.x86()
|
|
.mode(arch::x86::ArchMode::Mode64)
|
|
.syntax(arch::x86::ArchSyntax::Att)
|
|
.build()
|
|
}
|
|
}
|
|
|
|
impl fmt::Display for X64Backend {
|
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
|
f.debug_struct("MachBackend")
|
|
.field("name", &self.name())
|
|
.field("triple", &self.triple())
|
|
.field("flags", &format!("{}", self.flags()))
|
|
.finish()
|
|
}
|
|
}
|
|
|
|
/// Create a new `isa::Builder`.
|
|
pub(crate) fn isa_builder(triple: Triple) -> IsaBuilder {
|
|
IsaBuilder {
|
|
triple,
|
|
setup: x64_settings::builder(),
|
|
constructor: isa_constructor,
|
|
}
|
|
}
|
|
|
|
fn isa_constructor(
|
|
triple: Triple,
|
|
shared_flags: Flags,
|
|
builder: shared_settings::Builder,
|
|
) -> CodegenResult<OwnedTargetIsa> {
|
|
let isa_flags = x64_settings::Flags::new(&shared_flags, builder);
|
|
|
|
// Check for compatibility between flags and ISA level
|
|
// requested. In particular, SIMD support requires SSE4.2.
|
|
if shared_flags.enable_simd() {
|
|
if !isa_flags.has_sse3()
|
|
|| !isa_flags.has_ssse3()
|
|
|| !isa_flags.has_sse41()
|
|
|| !isa_flags.has_sse42()
|
|
{
|
|
return Err(CodegenError::Unsupported(
|
|
"SIMD support requires SSE3, SSSE3, SSE4.1, and SSE4.2 on x86_64.".into(),
|
|
));
|
|
}
|
|
}
|
|
|
|
let backend = X64Backend::new_with_flags(triple, shared_flags, isa_flags);
|
|
Ok(backend.wrapped())
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod test {
|
|
use super::*;
|
|
use crate::cursor::{Cursor, FuncCursor};
|
|
use crate::dominator_tree::DominatorTree;
|
|
use crate::flowgraph::ControlFlowGraph;
|
|
use crate::ir::{types::*, RelSourceLoc, SourceLoc, UserFuncName, ValueLabel, ValueLabelStart};
|
|
use crate::ir::{AbiParam, Function, InstBuilder, JumpTableData, Signature};
|
|
use crate::isa::CallConv;
|
|
use crate::settings;
|
|
use crate::settings::Configurable;
|
|
use core::str::FromStr;
|
|
use cranelift_entity::EntityRef;
|
|
use target_lexicon::Triple;
|
|
|
|
/// We have to test cold blocks by observing final machine code,
|
|
/// rather than VCode, because the VCode orders blocks in lowering
|
|
/// order, not emission order. (The exact difference between the
|
|
/// two is that cold blocks are sunk in the latter.) We might as
|
|
/// well do the test here, where we have a backend to use.
|
|
#[test]
|
|
fn test_cold_blocks() {
|
|
let name = UserFuncName::testcase("test0");
|
|
let mut sig = Signature::new(CallConv::SystemV);
|
|
sig.params.push(AbiParam::new(I32));
|
|
sig.returns.push(AbiParam::new(I32));
|
|
let mut func = Function::with_name_signature(name, sig);
|
|
// Add debug info: this tests the debug machinery wrt cold
|
|
// blocks as well.
|
|
func.dfg.collect_debug_info();
|
|
|
|
let bb0 = func.dfg.make_block();
|
|
let arg0 = func.dfg.append_block_param(bb0, I32);
|
|
let bb1 = func.dfg.make_block();
|
|
let bb2 = func.dfg.make_block();
|
|
let bb3 = func.dfg.make_block();
|
|
let bb1_param = func.dfg.append_block_param(bb1, I32);
|
|
let bb3_param = func.dfg.append_block_param(bb3, I32);
|
|
|
|
let mut pos = FuncCursor::new(&mut func);
|
|
|
|
pos.insert_block(bb0);
|
|
pos.set_srcloc(SourceLoc::new(1));
|
|
let v0 = pos.ins().iconst(I32, 0x1234);
|
|
pos.set_srcloc(SourceLoc::new(2));
|
|
let v1 = pos.ins().iadd(arg0, v0);
|
|
pos.ins().brif(v1, bb1, &[v1], bb2, &[]);
|
|
|
|
pos.insert_block(bb1);
|
|
pos.set_srcloc(SourceLoc::new(3));
|
|
let v2 = pos.ins().isub(v1, v0);
|
|
pos.set_srcloc(SourceLoc::new(4));
|
|
let v3 = pos.ins().iadd(v2, bb1_param);
|
|
pos.ins().brif(v1, bb2, &[], bb3, &[v3]);
|
|
|
|
pos.func.layout.set_cold(bb2);
|
|
pos.insert_block(bb2);
|
|
pos.set_srcloc(SourceLoc::new(5));
|
|
let v4 = pos.ins().iadd(v1, v0);
|
|
pos.ins().brif(v4, bb2, &[], bb1, &[v4]);
|
|
|
|
pos.insert_block(bb3);
|
|
pos.set_srcloc(SourceLoc::new(6));
|
|
pos.ins().return_(&[bb3_param]);
|
|
|
|
// Create some debug info. Make one label that follows all the
|
|
// values around. Note that this is usually done via an API on
|
|
// the FunctionBuilder, but that's in cranelift_frontend
|
|
// (i.e., a higher level of the crate DAG) so we have to build
|
|
// it manually here.
|
|
pos.func.dfg.values_labels.as_mut().unwrap().insert(
|
|
v0,
|
|
crate::ir::ValueLabelAssignments::Starts(vec![ValueLabelStart {
|
|
from: RelSourceLoc::new(1),
|
|
label: ValueLabel::new(1),
|
|
}]),
|
|
);
|
|
pos.func.dfg.values_labels.as_mut().unwrap().insert(
|
|
v1,
|
|
crate::ir::ValueLabelAssignments::Starts(vec![ValueLabelStart {
|
|
from: RelSourceLoc::new(2),
|
|
label: ValueLabel::new(1),
|
|
}]),
|
|
);
|
|
pos.func.dfg.values_labels.as_mut().unwrap().insert(
|
|
v2,
|
|
crate::ir::ValueLabelAssignments::Starts(vec![ValueLabelStart {
|
|
from: RelSourceLoc::new(3),
|
|
label: ValueLabel::new(1),
|
|
}]),
|
|
);
|
|
pos.func.dfg.values_labels.as_mut().unwrap().insert(
|
|
v3,
|
|
crate::ir::ValueLabelAssignments::Starts(vec![ValueLabelStart {
|
|
from: RelSourceLoc::new(4),
|
|
label: ValueLabel::new(1),
|
|
}]),
|
|
);
|
|
pos.func.dfg.values_labels.as_mut().unwrap().insert(
|
|
v4,
|
|
crate::ir::ValueLabelAssignments::Starts(vec![ValueLabelStart {
|
|
from: RelSourceLoc::new(5),
|
|
label: ValueLabel::new(1),
|
|
}]),
|
|
);
|
|
|
|
let mut shared_flags_builder = settings::builder();
|
|
shared_flags_builder.set("opt_level", "none").unwrap();
|
|
shared_flags_builder.set("enable_verifier", "true").unwrap();
|
|
let shared_flags = settings::Flags::new(shared_flags_builder);
|
|
let isa_flags = x64_settings::Flags::new(&shared_flags, x64_settings::builder());
|
|
let backend = X64Backend::new_with_flags(
|
|
Triple::from_str("x86_64").unwrap(),
|
|
shared_flags,
|
|
isa_flags,
|
|
);
|
|
let cfg = ControlFlowGraph::with_function(&func);
|
|
let domtree = DominatorTree::with_function(&func, &cfg);
|
|
let result = backend
|
|
.compile_function(&mut func, &domtree, /* want_disasm = */ false)
|
|
.unwrap();
|
|
let code = result.buffer.data();
|
|
|
|
// To update this comment, write the golden bytes to a file, and run the following
|
|
// command on it:
|
|
// > objdump -b binary -D <file> -m i386:x86-64 -M intel
|
|
//
|
|
// 0: 55 push rbp
|
|
// 1: 48 89 e5 mov rbp,rsp
|
|
// 4: 48 89 fe mov rsi,rdi
|
|
// 7: 81 c6 34 12 00 00 add esi,0x1234
|
|
// d: 85 f6 test esi,esi
|
|
// f: 0f 84 21 00 00 00 je 0x36
|
|
// 15: 49 89 f0 mov r8,rsi
|
|
// 18: 48 89 f0 mov rax,rsi
|
|
// 1b: 81 e8 34 12 00 00 sub eax,0x1234
|
|
// 21: 44 01 c0 add eax,r8d
|
|
// 24: 85 f6 test esi,esi
|
|
// 26: 0f 85 0a 00 00 00 jne 0x36
|
|
// 2c: 48 89 ec mov rsp,rbp
|
|
// 2f: 5d pop rbp
|
|
// 30: c3 ret
|
|
// 31: e9 e2 ff ff ff jmp 0x18
|
|
// 36: 49 89 f0 mov r8,rsi
|
|
// 39: 41 81 c0 34 12 00 00 add r8d,0x1234
|
|
// 40: 45 85 c0 test r8d,r8d
|
|
// 43: 0f 84 cf ff ff ff je 0x18
|
|
// 49: e9 e8 ff ff ff jmp 0x36
|
|
|
|
let golden = vec![
|
|
85, 72, 137, 229, 72, 137, 254, 129, 198, 52, 18, 0, 0, 133, 246, 15, 132, 33, 0, 0, 0,
|
|
73, 137, 240, 72, 137, 240, 129, 232, 52, 18, 0, 0, 68, 1, 192, 133, 246, 15, 133, 10,
|
|
0, 0, 0, 72, 137, 236, 93, 195, 233, 226, 255, 255, 255, 73, 137, 240, 65, 129, 192,
|
|
52, 18, 0, 0, 69, 133, 192, 15, 132, 207, 255, 255, 255, 233, 232, 255, 255, 255,
|
|
];
|
|
|
|
assert_eq!(code, &golden[..]);
|
|
}
|
|
|
|
// Check that feature tests for SIMD work correctly.
|
|
#[test]
|
|
fn simd_required_features() {
|
|
let mut shared_flags_builder = settings::builder();
|
|
shared_flags_builder.set("enable_simd", "true").unwrap();
|
|
let shared_flags = settings::Flags::new(shared_flags_builder);
|
|
let mut isa_builder = crate::isa::lookup_by_name("x86_64").unwrap();
|
|
isa_builder.set("has_sse3", "false").unwrap();
|
|
isa_builder.set("has_ssse3", "false").unwrap();
|
|
isa_builder.set("has_sse41", "false").unwrap();
|
|
isa_builder.set("has_sse42", "false").unwrap();
|
|
assert!(matches!(
|
|
isa_builder.finish(shared_flags),
|
|
Err(CodegenError::Unsupported(_)),
|
|
));
|
|
}
|
|
|
|
// Check that br_table lowers properly. We can't test this with an
|
|
// ordinary compile-test because the br_table pseudoinstruction
|
|
// expands during emission.
|
|
#[test]
|
|
fn br_table() {
|
|
let name = UserFuncName::testcase("test0");
|
|
let mut sig = Signature::new(CallConv::SystemV);
|
|
sig.params.push(AbiParam::new(I32));
|
|
sig.returns.push(AbiParam::new(I32));
|
|
let mut func = Function::with_name_signature(name, sig);
|
|
|
|
let bb0 = func.dfg.make_block();
|
|
let arg0 = func.dfg.append_block_param(bb0, I32);
|
|
let bb1 = func.dfg.make_block();
|
|
let bb2 = func.dfg.make_block();
|
|
let bb3 = func.dfg.make_block();
|
|
|
|
let mut pos = FuncCursor::new(&mut func);
|
|
|
|
pos.insert_block(bb0);
|
|
let jt_data = JumpTableData::new(
|
|
pos.func.dfg.block_call(bb3, &[]),
|
|
&[
|
|
pos.func.dfg.block_call(bb1, &[]),
|
|
pos.func.dfg.block_call(bb2, &[]),
|
|
],
|
|
);
|
|
let jt = pos.func.create_jump_table(jt_data);
|
|
pos.ins().br_table(arg0, jt);
|
|
|
|
pos.insert_block(bb1);
|
|
let v1 = pos.ins().iconst(I32, 1);
|
|
pos.ins().return_(&[v1]);
|
|
|
|
pos.insert_block(bb2);
|
|
let v2 = pos.ins().iconst(I32, 2);
|
|
pos.ins().return_(&[v2]);
|
|
|
|
pos.insert_block(bb3);
|
|
let v3 = pos.ins().iconst(I32, 3);
|
|
pos.ins().return_(&[v3]);
|
|
|
|
let mut shared_flags_builder = settings::builder();
|
|
shared_flags_builder.set("opt_level", "none").unwrap();
|
|
shared_flags_builder.set("enable_verifier", "true").unwrap();
|
|
let shared_flags = settings::Flags::new(shared_flags_builder);
|
|
let isa_flags = x64_settings::Flags::new(&shared_flags, x64_settings::builder());
|
|
let backend = X64Backend::new_with_flags(
|
|
Triple::from_str("x86_64").unwrap(),
|
|
shared_flags,
|
|
isa_flags,
|
|
);
|
|
let cfg = ControlFlowGraph::with_function(&func);
|
|
let domtree = DominatorTree::with_function(&func, &cfg);
|
|
let result = backend
|
|
.compile_function(&mut func, &domtree, /* want_disasm = */ false)
|
|
.unwrap();
|
|
let code = result.buffer.data();
|
|
|
|
// To update this comment, write the golden bytes to a file, and run the following
|
|
// command on it:
|
|
// > objdump -b binary -D <file> -m i386:x86-64 -M intel
|
|
//
|
|
// 0: 55 push rbp
|
|
// 1: 48 89 e5 mov rbp,rsp
|
|
// 4: 83 ff 02 cmp edi,0x2
|
|
// 7: 0f 83 3b 00 00 00 jae 0x48
|
|
// d: 44 8b d7 mov r10d,edi
|
|
// 10: 41 b9 00 00 00 00 mov r9d,0x0
|
|
// 16: 4d 0f 43 d1 cmovae r10,r9
|
|
// 1a: 4c 8d 0d 0b 00 00 00 lea r9,[rip+0xb] # 0x2c
|
|
// 21: 4f 63 54 91 00 movsxd r10,DWORD PTR [r9+r10*4+0x0]
|
|
// 26: 4d 01 d1 add r9,r10
|
|
// 29: 41 ff e1 jmp r9
|
|
// 2c: 12 00 adc al,BYTE PTR [rax]
|
|
// 2e: 00 00 add BYTE PTR [rax],al
|
|
// 30: 08 00 or BYTE PTR [rax],al
|
|
// 32: 00 00 add BYTE PTR [rax],al
|
|
// 34: b8 02 00 00 00 mov eax,0x2
|
|
// 39: 48 89 ec mov rsp,rbp
|
|
// 3c: 5d pop rbp
|
|
// 3d: c3 ret
|
|
// 3e: b8 01 00 00 00 mov eax,0x1
|
|
// 43: 48 89 ec mov rsp,rbp
|
|
// 46: 5d pop rbp
|
|
// 47: c3 ret
|
|
// 48: b8 03 00 00 00 mov eax,0x3
|
|
// 4d: 48 89 ec mov rsp,rbp
|
|
// 50: 5d pop rbp
|
|
// 51: c3 ret
|
|
|
|
let golden = vec![
|
|
85, 72, 137, 229, 131, 255, 2, 15, 131, 59, 0, 0, 0, 68, 139, 215, 65, 185, 0, 0, 0, 0,
|
|
77, 15, 67, 209, 76, 141, 13, 11, 0, 0, 0, 79, 99, 84, 145, 0, 77, 1, 209, 65, 255,
|
|
225, 18, 0, 0, 0, 8, 0, 0, 0, 184, 2, 0, 0, 0, 72, 137, 236, 93, 195, 184, 1, 0, 0, 0,
|
|
72, 137, 236, 93, 195, 184, 3, 0, 0, 0, 72, 137, 236, 93, 195,
|
|
];
|
|
|
|
assert_eq!(code, &golden[..]);
|
|
}
|
|
}
|