LICM pass (#87)
* LICM pass * Uses loop analysis to detect loop tree * For each loop (starting with the inner ones), create a pre-header and move there loop-invariant instructions * An instruction is loop invariant if it does not use as argument a value defined earlier in the loop * File tests to check LICM's correctness * Optimized pre-header creation If the loop already has a natural pre-header, we use it instead of creating a new one. The natural pre-header of a loop is the only predecessor of the header it doesn't dominate.
This commit is contained in:
committed by
Jakob Stoklund Olesen
parent
402cb8e1f6
commit
e47f4a49fb
31
cranelift/filetests/licm/basic.cton
Normal file
31
cranelift/filetests/licm/basic.cton
Normal file
@@ -0,0 +1,31 @@
|
||||
test licm
|
||||
|
||||
function simple_loop(i32) -> i32 {
|
||||
|
||||
ebb1(v0: i32):
|
||||
v1 = iconst.i32 1
|
||||
v2 = iconst.i32 2
|
||||
v3 = iadd v1, v2
|
||||
brz v0, ebb2(v0)
|
||||
v4 = isub v0, v1
|
||||
jump ebb1(v4)
|
||||
|
||||
ebb2(v5: i32):
|
||||
return v5
|
||||
|
||||
}
|
||||
; sameln: function simple_loop(i32) -> i32 {
|
||||
; nextln: ebb2(v6: i32):
|
||||
; nextln: v1 = iconst.i32 1
|
||||
; nextln: v2 = iconst.i32 2
|
||||
; nextln: v3 = iadd v1, v2
|
||||
; nextln: jump ebb0(v6)
|
||||
; nextln:
|
||||
; nextln: ebb0(v0: i32):
|
||||
; nextln: brz v0, ebb1(v0)
|
||||
; nextln: v4 = isub v0, v1
|
||||
; nextln: jump ebb0(v4)
|
||||
; nextln:
|
||||
; nextln: ebb1(v5: i32):
|
||||
; nextln: return v5
|
||||
; nextln: }
|
||||
81
cranelift/filetests/licm/complex.cton
Normal file
81
cranelift/filetests/licm/complex.cton
Normal file
@@ -0,0 +1,81 @@
|
||||
test licm
|
||||
|
||||
function complex(i32) -> i32 {
|
||||
|
||||
ebb0(v0: i32):
|
||||
v1 = iconst.i32 1
|
||||
v19 = iconst.i32 4
|
||||
v2 = iadd v1, v0
|
||||
brz v0, ebb1(v1)
|
||||
jump ebb3(v2)
|
||||
|
||||
ebb1(v3: i32):
|
||||
v4 = iconst.i32 2
|
||||
v5 = iadd v3, v2
|
||||
v6 = iadd v4, v0
|
||||
jump ebb2(v6)
|
||||
|
||||
ebb2(v7: i32):
|
||||
v8 = iadd v7, v3
|
||||
v9 = iadd v0, v2
|
||||
brz v0, ebb1(v7)
|
||||
jump ebb5(v8)
|
||||
|
||||
ebb3(v10: i32):
|
||||
v11 = iconst.i32 3
|
||||
v12 = iadd v10, v11
|
||||
v13 = iadd v2, v11
|
||||
jump ebb4(v11)
|
||||
|
||||
ebb4(v14: i32):
|
||||
v15 = iadd v12, v2
|
||||
brz v0, ebb3(v14)
|
||||
jump ebb5(v14)
|
||||
|
||||
ebb5(v16: i32):
|
||||
v17 = iadd v16, v1
|
||||
v18 = iadd v1, v19
|
||||
brz v0, ebb0(v18)
|
||||
return v17
|
||||
}
|
||||
|
||||
; sameln: function complex(i32) -> i32 {
|
||||
; nextln: ebb6(v20: i32):
|
||||
; nextln: v1 = iconst.i32 1
|
||||
; nextln: v2 = iconst.i32 4
|
||||
; nextln: v5 = iconst.i32 2
|
||||
; nextln: v12 = iconst.i32 3
|
||||
; nextln: v19 = iadd v1, v2
|
||||
; nextln: jump ebb0(v20)
|
||||
; nextln:
|
||||
; nextln: ebb0(v0: i32):
|
||||
; nextln: v3 = iadd.i32 v1, v0
|
||||
; nextln: v7 = iadd.i32 v5, v0
|
||||
; nextln: v10 = iadd v0, v3
|
||||
; nextln: brz v0, ebb1(v1)
|
||||
; nextln: v14 = iadd v3, v12
|
||||
; nextln: jump ebb3(v3)
|
||||
; nextln:
|
||||
; nextln: ebb1(v4: i32):
|
||||
; nextln: v6 = iadd v4, v3
|
||||
; nextln: jump ebb2(v7)
|
||||
; nextln:
|
||||
; nextln: ebb2(v8: i32):
|
||||
; nextln: v9 = iadd v8, v4
|
||||
; nextln: brz.i32 v0, ebb1(v8)
|
||||
; nextln: jump ebb5(v9)
|
||||
; nextln:
|
||||
; nextln: ebb3(v11: i32):
|
||||
; nextln: v13 = iadd v11, v12
|
||||
; nextln: jump ebb4(v12)
|
||||
; nextln:
|
||||
; nextln: ebb4(v15: i32):
|
||||
; nextln: v16 = iadd.i32 v13, v3
|
||||
; nextln: brz.i32 v0, ebb3(v15)
|
||||
; nextln: jump ebb5(v15)
|
||||
; nextln:
|
||||
; nextln: ebb5(v17: i32):
|
||||
; nextln: v18 = iadd v17, v1
|
||||
; nextln: brz.i32 v0, ebb0(v19)
|
||||
; nextln: return v18
|
||||
; nextln: }
|
||||
46
cranelift/filetests/licm/multiple-blocks.cton
Normal file
46
cranelift/filetests/licm/multiple-blocks.cton
Normal file
@@ -0,0 +1,46 @@
|
||||
test licm
|
||||
|
||||
function multiple_blocks(i32) -> i32 {
|
||||
|
||||
ebb0(v0: i32):
|
||||
jump ebb1(v0)
|
||||
|
||||
ebb1(v10: i32):
|
||||
v11 = iconst.i32 1
|
||||
v12 = iconst.i32 2
|
||||
v13 = iadd v11, v12
|
||||
brz v10, ebb2(v10)
|
||||
v15 = isub v10, v11
|
||||
brz v15, ebb3(v15)
|
||||
v14 = isub v10, v11
|
||||
jump ebb1(v14)
|
||||
|
||||
ebb2(v20: i32):
|
||||
return v20
|
||||
|
||||
ebb3(v30: i32):
|
||||
v31 = iadd v11, v13
|
||||
jump ebb1(v30)
|
||||
|
||||
}
|
||||
; sameln:function multiple_blocks(i32) -> i32 {
|
||||
; nextln: ebb0(v0: i32):
|
||||
; nextln: v2 = iconst.i32 1
|
||||
; nextln: v3 = iconst.i32 2
|
||||
; nextln: v4 = iadd v2, v3
|
||||
; nextln: v9 = iadd v2, v4
|
||||
; nextln: jump ebb1(v0)
|
||||
; nextln:
|
||||
; nextln: ebb1(v1: i32):
|
||||
; nextln: brz v1, ebb2(v1)
|
||||
; nextln: v5 = isub v1, v2
|
||||
; nextln: brz v5, ebb3(v5)
|
||||
; nextln: v6 = isub v1, v2
|
||||
; nextln: jump ebb1(v6)
|
||||
; nextln:
|
||||
; nextln: ebb2(v7: i32):
|
||||
; nextln: return v7
|
||||
; nextln:
|
||||
; nextln: ebb3(v8: i32):
|
||||
; nextln: jump ebb1(v8)
|
||||
; nextln: }
|
||||
52
cranelift/filetests/licm/nested_loops.cton
Normal file
52
cranelift/filetests/licm/nested_loops.cton
Normal file
@@ -0,0 +1,52 @@
|
||||
test licm
|
||||
|
||||
function nested_loops(i32) -> i32 {
|
||||
|
||||
ebb0(v0: i32):
|
||||
v1 = iconst.i32 1
|
||||
v2 = iconst.i32 2
|
||||
v3 = iadd v1, v2
|
||||
v4 = isub v0, v1
|
||||
jump ebb1(v4,v4)
|
||||
|
||||
ebb1(v10: i32,v11: i32):
|
||||
brz v11, ebb2(v10)
|
||||
v12 = iconst.i32 1
|
||||
v15 = iadd v12, v4
|
||||
v13 = isub v11, v12
|
||||
jump ebb1(v10,v13)
|
||||
|
||||
ebb2(v20: i32):
|
||||
brz v20, ebb3(v20)
|
||||
jump ebb0(v20)
|
||||
|
||||
ebb3(v30: i32):
|
||||
return v30
|
||||
|
||||
}
|
||||
|
||||
; sameln:function nested_loops(i32) -> i32 {
|
||||
; nextln: ebb4(v12: i32):
|
||||
; nextln: v1 = iconst.i32 1
|
||||
; nextln: v2 = iconst.i32 2
|
||||
; nextln: v3 = iadd v1, v2
|
||||
; nextln: v7 = iconst.i32 1
|
||||
; nextln: jump ebb0(v12)
|
||||
; nextln:
|
||||
; nextln: ebb0(v0: i32):
|
||||
; nextln: v4 = isub v0, v1
|
||||
; nextln: v8 = iadd.i32 v7, v4
|
||||
; nextln: jump ebb1(v4, v4)
|
||||
; nextln:
|
||||
; nextln: ebb1(v5: i32, v6: i32):
|
||||
; nextln: brz v6, ebb2(v5)
|
||||
; nextln: v9 = isub v6, v7
|
||||
; nextln: jump ebb1(v5, v9)
|
||||
; nextln:
|
||||
; nextln: ebb2(v10: i32):
|
||||
; nextln: brz v10, ebb3(v10)
|
||||
; nextln: jump ebb0(v10)
|
||||
; nextln:
|
||||
; nextln: ebb3(v11: i32):
|
||||
; nextln: return v11
|
||||
; nextln: }
|
||||
51
cranelift/src/filetest/licm.rs
Normal file
51
cranelift/src/filetest/licm.rs
Normal file
@@ -0,0 +1,51 @@
|
||||
//! Test command for testing the LICM pass.
|
||||
//!
|
||||
//! The `licm` test command runs each function through the LICM pass after ensuring
|
||||
//! that all instructions are legal for the target.
|
||||
//!
|
||||
//! The resulting function is sent to `filecheck`.
|
||||
|
||||
use cretonne::ir::Function;
|
||||
use cretonne;
|
||||
use cton_reader::TestCommand;
|
||||
use filetest::subtest::{SubTest, Context, Result, run_filecheck};
|
||||
use std::borrow::Cow;
|
||||
use std::fmt::Write;
|
||||
use utils::pretty_error;
|
||||
|
||||
struct TestLICM;
|
||||
|
||||
pub fn subtest(parsed: &TestCommand) -> Result<Box<SubTest>> {
|
||||
assert_eq!(parsed.command, "licm");
|
||||
if !parsed.options.is_empty() {
|
||||
Err(format!("No options allowed on {}", parsed))
|
||||
} else {
|
||||
Ok(Box::new(TestLICM))
|
||||
}
|
||||
}
|
||||
|
||||
impl SubTest for TestLICM {
|
||||
fn name(&self) -> Cow<str> {
|
||||
Cow::from("licm")
|
||||
}
|
||||
|
||||
fn is_mutating(&self) -> bool {
|
||||
true
|
||||
}
|
||||
|
||||
fn run(&self, func: Cow<Function>, context: &Context) -> Result<()> {
|
||||
// Create a compilation context, and drop in the function.
|
||||
let mut comp_ctx = cretonne::Context::new();
|
||||
comp_ctx.func = func.into_owned();
|
||||
|
||||
comp_ctx.flowgraph();
|
||||
comp_ctx
|
||||
.licm()
|
||||
.map_err(|e| pretty_error(&comp_ctx.func, e))?;
|
||||
|
||||
let mut text = String::new();
|
||||
write!(&mut text, "{}", &comp_ctx.func)
|
||||
.map_err(|e| e.to_string())?;
|
||||
run_filecheck(&text, context)
|
||||
}
|
||||
}
|
||||
@@ -17,6 +17,7 @@ mod binemit;
|
||||
mod concurrent;
|
||||
mod domtree;
|
||||
mod legalizer;
|
||||
mod licm;
|
||||
mod regalloc;
|
||||
mod runner;
|
||||
mod runone;
|
||||
@@ -61,6 +62,7 @@ fn new_subtest(parsed: &TestCommand) -> subtest::Result<Box<subtest::SubTest>> {
|
||||
"domtree" => domtree::subtest(parsed),
|
||||
"verifier" => verifier::subtest(parsed),
|
||||
"legalizer" => legalizer::subtest(parsed),
|
||||
"licm" => licm::subtest(parsed),
|
||||
"regalloc" => regalloc::subtest(parsed),
|
||||
"binemit" => binemit::subtest(parsed),
|
||||
"simple-gvn" => simple_gvn::subtest(parsed),
|
||||
|
||||
Reference in New Issue
Block a user