//! Cranelift compilation context and main entry point. //! //! When compiling many small functions, it is important to avoid repeatedly allocating and //! deallocating the data structures needed for compilation. The `Context` struct is used to hold //! on to memory allocations between function compilations. //! //! The context does not hold a `TargetIsa` instance which has to be provided as an argument //! instead. This is because an ISA instance is immutable and can be used by multiple compilation //! contexts concurrently. Typically, you would have one context per compilation thread and only a //! single ISA instance. use crate::binemit::{CodeInfo, MemoryCodeSink, RelocSink, StackMapSink, TrapSink}; use crate::dce::do_dce; use crate::dominator_tree::DominatorTree; use crate::flowgraph::ControlFlowGraph; use crate::ir::Function; use crate::isa::TargetIsa; use crate::legalizer::simple_legalize; use crate::licm::do_licm; use crate::loop_analysis::LoopAnalysis; use crate::machinst::{MachCompileResult, MachStackMap}; use crate::nan_canonicalization::do_nan_canonicalization; use crate::remove_constant_phis::do_remove_constant_phis; use crate::result::CodegenResult; use crate::settings::{FlagsOrIsa, OptLevel}; use crate::simple_gvn::do_simple_gvn; use crate::simple_preopt::do_preopt; use crate::timing; use crate::unreachable_code::eliminate_unreachable_code; use crate::verifier::{verify_context, VerifierErrors, VerifierResult}; #[cfg(feature = "souper-harvest")] use alloc::string::String; use alloc::vec::Vec; #[cfg(feature = "souper-harvest")] use crate::souper_harvest::do_souper_harvest; /// Persistent data structures and compilation pipeline. pub struct Context { /// The function we're compiling. pub func: Function, /// The control flow graph of `func`. pub cfg: ControlFlowGraph, /// Dominator tree for `func`. pub domtree: DominatorTree, /// Loop analysis of `func`. pub loop_analysis: LoopAnalysis, /// Result of MachBackend compilation, if computed. pub mach_compile_result: Option, /// Flag: do we want a disassembly with the MachCompileResult? pub want_disasm: bool, } impl Context { /// Allocate a new compilation context. /// /// The returned instance should be reused for compiling multiple functions in order to avoid /// needless allocator thrashing. pub fn new() -> Self { Self::for_function(Function::new()) } /// Allocate a new compilation context with an existing Function. /// /// The returned instance should be reused for compiling multiple functions in order to avoid /// needless allocator thrashing. pub fn for_function(func: Function) -> Self { Self { func, cfg: ControlFlowGraph::new(), domtree: DominatorTree::new(), loop_analysis: LoopAnalysis::new(), mach_compile_result: None, want_disasm: false, } } /// Clear all data structures in this context. pub fn clear(&mut self) { self.func.clear(); self.cfg.clear(); self.domtree.clear(); self.loop_analysis.clear(); self.mach_compile_result = None; self.want_disasm = false; } /// Set the flag to request a disassembly when compiling with a /// `MachBackend` backend. pub fn set_disasm(&mut self, val: bool) { self.want_disasm = val; } /// Compile the function, and emit machine code into a `Vec`. /// /// Run the function through all the passes necessary to generate code for the target ISA /// represented by `isa`, as well as the final step of emitting machine code into a /// `Vec`. The machine code is not relocated. Instead, any relocations are emitted /// into `relocs`. /// /// This function calls `compile` and `emit_to_memory`, taking care to resize `mem` as /// needed, so it provides a safe interface. /// /// Returns information about the function's code and read-only data. pub fn compile_and_emit( &mut self, isa: &dyn TargetIsa, mem: &mut Vec, relocs: &mut dyn RelocSink, traps: &mut dyn TrapSink, stack_maps: &mut dyn StackMapSink, ) -> CodegenResult<()> { let info = self.compile(isa)?; let old_len = mem.len(); mem.resize(old_len + info.total_size as usize, 0); let new_info = unsafe { self.emit_to_memory(mem.as_mut_ptr().add(old_len), relocs, traps, stack_maps) }; debug_assert!(new_info == info); Ok(()) } /// Compile the function. /// /// Run the function through all the passes necessary to generate code for the target ISA /// represented by `isa`. This does not include the final step of emitting machine code into a /// code sink. /// /// Returns information about the function's code and read-only data. pub fn compile(&mut self, isa: &dyn TargetIsa) -> CodegenResult { let _tt = timing::compile(); self.verify_if(isa)?; let opt_level = isa.flags().opt_level(); log::debug!( "Compiling (opt level {:?}):\n{}", opt_level, self.func.display() ); self.compute_cfg(); if opt_level != OptLevel::None { self.preopt(isa)?; } if isa.flags().enable_nan_canonicalization() { self.canonicalize_nans(isa)?; } self.legalize(isa)?; if opt_level != OptLevel::None { self.compute_domtree(); self.compute_loop_analysis(); self.licm(isa)?; self.simple_gvn(isa)?; } self.compute_domtree(); self.eliminate_unreachable_code(isa)?; if opt_level != OptLevel::None { self.dce(isa)?; } self.remove_constant_phis(isa)?; let backend = isa.get_mach_backend(); let result = backend.compile_function(&self.func, self.want_disasm)?; let info = result.code_info(); self.mach_compile_result = Some(result); Ok(info) } /// Emit machine code directly into raw memory. /// /// Write all of the function's machine code to the memory at `mem`. The size of the machine /// code is returned by `compile` above. /// /// The machine code is not relocated. Instead, any relocations are emitted into `relocs`. /// /// # Safety /// /// This function is unsafe since it does not perform bounds checking on the memory buffer, /// and it can't guarantee that the `mem` pointer is valid. /// /// Returns information about the emitted code and data. pub unsafe fn emit_to_memory( &self, mem: *mut u8, relocs: &mut dyn RelocSink, traps: &mut dyn TrapSink, stack_maps: &mut dyn StackMapSink, ) -> CodeInfo { let _tt = timing::binemit(); let mut sink = MemoryCodeSink::new(mem, relocs, traps); let result = self .mach_compile_result .as_ref() .expect("only using mach backend now"); result.buffer.emit(&mut sink); let info = sink.info; // New backends do not emit StackMaps through the `CodeSink` because its interface // requires `Value`s; instead, the `StackMap` objects are directly accessible via // `result.buffer.stack_maps()`. for &MachStackMap { offset_end, ref stack_map, .. } in result.buffer.stack_maps() { stack_maps.add_stack_map(offset_end, stack_map.clone()); } info } /// If available, return information about the code layout in the /// final machine code: the offsets (in bytes) of each basic-block /// start, and all basic-block edges. pub fn get_code_bb_layout(&self) -> Option<(Vec, Vec<(usize, usize)>)> { if let Some(result) = self.mach_compile_result.as_ref() { Some(( result.bb_starts.iter().map(|&off| off as usize).collect(), result .bb_edges .iter() .map(|&(from, to)| (from as usize, to as usize)) .collect(), )) } else { None } } /// Creates unwind information for the function. /// /// Returns `None` if the function has no unwind information. #[cfg(feature = "unwind")] pub fn create_unwind_info( &self, isa: &dyn TargetIsa, ) -> CodegenResult> { let backend = isa.get_mach_backend(); let unwind_info_kind = isa.unwind_info_kind(); let result = self.mach_compile_result.as_ref().unwrap(); backend.emit_unwind_info(result, unwind_info_kind) } /// Run the verifier on the function. /// /// Also check that the dominator tree and control flow graph are consistent with the function. pub fn verify<'a, FOI: Into>>(&self, fisa: FOI) -> VerifierResult<()> { let mut errors = VerifierErrors::default(); let _ = verify_context(&self.func, &self.cfg, &self.domtree, fisa, &mut errors); if errors.is_empty() { Ok(()) } else { Err(errors) } } /// Run the verifier only if the `enable_verifier` setting is true. pub fn verify_if<'a, FOI: Into>>(&self, fisa: FOI) -> CodegenResult<()> { let fisa = fisa.into(); if fisa.flags.enable_verifier() { self.verify(fisa)?; } Ok(()) } /// Perform dead-code elimination on the function. pub fn dce<'a, FOI: Into>>(&mut self, fisa: FOI) -> CodegenResult<()> { do_dce(&mut self.func, &mut self.domtree); self.verify_if(fisa)?; Ok(()) } /// Perform constant-phi removal on the function. pub fn remove_constant_phis<'a, FOI: Into>>( &mut self, fisa: FOI, ) -> CodegenResult<()> { do_remove_constant_phis(&mut self.func, &mut self.domtree); self.verify_if(fisa)?; Ok(()) } /// Perform pre-legalization rewrites on the function. pub fn preopt(&mut self, isa: &dyn TargetIsa) -> CodegenResult<()> { do_preopt(&mut self.func, &mut self.cfg, isa); self.verify_if(isa)?; Ok(()) } /// Perform NaN canonicalizing rewrites on the function. pub fn canonicalize_nans(&mut self, isa: &dyn TargetIsa) -> CodegenResult<()> { do_nan_canonicalization(&mut self.func); self.verify_if(isa) } /// Run the legalizer for `isa` on the function. pub fn legalize(&mut self, isa: &dyn TargetIsa) -> CodegenResult<()> { // Legalization invalidates the domtree and loop_analysis by mutating the CFG. // TODO: Avoid doing this when legalization doesn't actually mutate the CFG. self.domtree.clear(); self.loop_analysis.clear(); // Run some specific legalizations only. simple_legalize(&mut self.func, &mut self.cfg, isa); self.verify_if(isa) } /// Compute the control flow graph. pub fn compute_cfg(&mut self) { self.cfg.compute(&self.func) } /// Compute dominator tree. pub fn compute_domtree(&mut self) { self.domtree.compute(&self.func, &self.cfg) } /// Compute the loop analysis. pub fn compute_loop_analysis(&mut self) { self.loop_analysis .compute(&self.func, &self.cfg, &self.domtree) } /// Compute the control flow graph and dominator tree. pub fn flowgraph(&mut self) { self.compute_cfg(); self.compute_domtree() } /// Perform simple GVN on the function. pub fn simple_gvn<'a, FOI: Into>>(&mut self, fisa: FOI) -> CodegenResult<()> { do_simple_gvn(&mut self.func, &mut self.domtree); self.verify_if(fisa) } /// Perform LICM on the function. pub fn licm(&mut self, isa: &dyn TargetIsa) -> CodegenResult<()> { do_licm( &mut self.func, &mut self.cfg, &mut self.domtree, &mut self.loop_analysis, ); self.verify_if(isa) } /// Perform unreachable code elimination. pub fn eliminate_unreachable_code<'a, FOI>(&mut self, fisa: FOI) -> CodegenResult<()> where FOI: Into>, { eliminate_unreachable_code(&mut self.func, &mut self.cfg, &self.domtree); self.verify_if(fisa) } /// Harvest candidate left-hand sides for superoptimization with Souper. #[cfg(feature = "souper-harvest")] pub fn souper_harvest( &mut self, out: &mut std::sync::mpsc::Sender, ) -> CodegenResult<()> { do_souper_harvest(&self.func, out); Ok(()) } }