Add FunctionBuilder::emit_small_memory_compare
This takes an IntCC for the comparison to do, though panics for Signed* since memcmp is an unsigned comparison. Currently it's most useful for (Not)Equal, but once big-endian loads are implemented it'll be able to support the other Unsigned* comparisons nicely on more than just bytes.
This commit is contained in:
@@ -4,6 +4,7 @@ use crate::variable::Variable;
|
|||||||
use cranelift_codegen::cursor::{Cursor, FuncCursor};
|
use cranelift_codegen::cursor::{Cursor, FuncCursor};
|
||||||
use cranelift_codegen::entity::{EntitySet, SecondaryMap};
|
use cranelift_codegen::entity::{EntitySet, SecondaryMap};
|
||||||
use cranelift_codegen::ir;
|
use cranelift_codegen::ir;
|
||||||
|
use cranelift_codegen::ir::condcodes::IntCC;
|
||||||
use cranelift_codegen::ir::{
|
use cranelift_codegen::ir::{
|
||||||
types, AbiParam, Block, DataFlowGraph, ExtFuncData, ExternalName, FuncRef, Function,
|
types, AbiParam, Block, DataFlowGraph, ExtFuncData, ExternalName, FuncRef, Function,
|
||||||
GlobalValue, GlobalValueData, Heap, HeapData, Inst, InstBuilder, InstBuilderBase,
|
GlobalValue, GlobalValueData, Heap, HeapData, Inst, InstBuilder, InstBuilderBase,
|
||||||
@@ -840,6 +841,94 @@ impl<'a> FunctionBuilder<'a> {
|
|||||||
let call = self.ins().call(libc_memcmp, &[left, right, size]);
|
let call = self.ins().call(libc_memcmp, &[left, right, size]);
|
||||||
self.func.dfg.first_result(call)
|
self.func.dfg.first_result(call)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Optimised [`Self::call_memcmp`] for small copies.
|
||||||
|
///
|
||||||
|
/// This implements the byte slice comparison `int_cc(left[..size], right[..size])`.
|
||||||
|
///
|
||||||
|
/// `left_align` and `right_align` are the statically-known alignments of the
|
||||||
|
/// `left` and `right` pointers respectively. These are used to know whether
|
||||||
|
/// to mark `load`s as aligned. It's always fine to pass `1` for these, but
|
||||||
|
/// passing something higher than the true alignment may trap or otherwise
|
||||||
|
/// misbehave as described in [`MemFlags::aligned`].
|
||||||
|
///
|
||||||
|
/// Note that `memcmp` is a *big-endian* and *unsigned* comparison.
|
||||||
|
/// As such, this panics when called with `IntCC::Signed*` or `IntCC::*Overflow`.
|
||||||
|
pub fn emit_small_memory_compare(
|
||||||
|
&mut self,
|
||||||
|
config: TargetFrontendConfig,
|
||||||
|
int_cc: IntCC,
|
||||||
|
left: Value,
|
||||||
|
right: Value,
|
||||||
|
size: u64,
|
||||||
|
left_align: std::num::NonZeroU8,
|
||||||
|
right_align: std::num::NonZeroU8,
|
||||||
|
flags: MemFlags,
|
||||||
|
) -> Value {
|
||||||
|
use IntCC::*;
|
||||||
|
let (zero_cc, empty_imm) = match int_cc {
|
||||||
|
//
|
||||||
|
Equal => (Equal, true),
|
||||||
|
NotEqual => (NotEqual, false),
|
||||||
|
|
||||||
|
UnsignedLessThan => (SignedLessThan, false),
|
||||||
|
UnsignedGreaterThanOrEqual => (SignedGreaterThanOrEqual, true),
|
||||||
|
UnsignedGreaterThan => (SignedGreaterThan, false),
|
||||||
|
UnsignedLessThanOrEqual => (SignedLessThanOrEqual, true),
|
||||||
|
|
||||||
|
SignedLessThan
|
||||||
|
| SignedGreaterThanOrEqual
|
||||||
|
| SignedGreaterThan
|
||||||
|
| SignedLessThanOrEqual => {
|
||||||
|
panic!("Signed comparison {} not supported by memcmp", int_cc)
|
||||||
|
}
|
||||||
|
Overflow | NotOverflow => {
|
||||||
|
panic!("Overflow comparison {} not supported by memcmp", int_cc)
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
if size == 0 {
|
||||||
|
return self.ins().bconst(types::B1, empty_imm);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Future work could consider expanding this to handle more-complex scenarios.
|
||||||
|
fn type_from_byte_size(size: u64) -> Option<Type> {
|
||||||
|
if size > 16 {
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
Type::int(size as u16 * 8)
|
||||||
|
}
|
||||||
|
if let Some(small_type) = type_from_byte_size(size) {
|
||||||
|
if let Equal | NotEqual = zero_cc {
|
||||||
|
let mut left_flags = flags;
|
||||||
|
if size == left_align.get().into() {
|
||||||
|
left_flags.set_aligned();
|
||||||
|
}
|
||||||
|
let mut right_flags = flags;
|
||||||
|
if size == right_align.get().into() {
|
||||||
|
right_flags.set_aligned();
|
||||||
|
}
|
||||||
|
let left_val = self.ins().load(small_type, left_flags, left, 0);
|
||||||
|
let right_val = self.ins().load(small_type, right_flags, right, 0);
|
||||||
|
return self.ins().icmp(int_cc, left_val, right_val);
|
||||||
|
} else if small_type == types::I8 {
|
||||||
|
// Once the big-endian loads from wasmtime#2492 are implemented in
|
||||||
|
// the backends, we could easily handle comparisons for more sizes here.
|
||||||
|
// But for now, just handle single bytes where we don't need to worry.
|
||||||
|
|
||||||
|
let mut aligned_flags = flags;
|
||||||
|
aligned_flags.set_aligned();
|
||||||
|
let left_val = self.ins().load(small_type, aligned_flags, left, 0);
|
||||||
|
let right_val = self.ins().load(small_type, aligned_flags, right, 0);
|
||||||
|
return self.ins().icmp(int_cc, left_val, right_val);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
let pointer_type = config.pointer_type();
|
||||||
|
let size = self.ins().iconst(pointer_type, size as i64);
|
||||||
|
let cmp = self.call_memcmp(config, left, right, size);
|
||||||
|
self.ins().icmp_imm(zero_cc, cmp, 0)
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn greatest_divisible_power_of_two(size: u64) -> u64 {
|
fn greatest_divisible_power_of_two(size: u64) -> u64 {
|
||||||
@@ -876,11 +965,12 @@ mod tests {
|
|||||||
use crate::Variable;
|
use crate::Variable;
|
||||||
use alloc::string::ToString;
|
use alloc::string::ToString;
|
||||||
use cranelift_codegen::entity::EntityRef;
|
use cranelift_codegen::entity::EntityRef;
|
||||||
|
use cranelift_codegen::ir::condcodes::IntCC;
|
||||||
use cranelift_codegen::ir::types::*;
|
use cranelift_codegen::ir::types::*;
|
||||||
use cranelift_codegen::ir::{
|
use cranelift_codegen::ir::{
|
||||||
AbiParam, ExternalName, Function, InstBuilder, MemFlags, Signature,
|
AbiParam, ExternalName, Function, InstBuilder, MemFlags, Signature, Value,
|
||||||
};
|
};
|
||||||
use cranelift_codegen::isa::{CallConv, TargetFrontendConfig};
|
use cranelift_codegen::isa::{CallConv, TargetFrontendConfig, TargetIsa};
|
||||||
use cranelift_codegen::settings;
|
use cranelift_codegen::settings;
|
||||||
use cranelift_codegen::verifier::verify_function;
|
use cranelift_codegen::verifier::verify_function;
|
||||||
use target_lexicon::PointerWidth;
|
use target_lexicon::PointerWidth;
|
||||||
@@ -1251,7 +1341,7 @@ block0:
|
|||||||
#[test]
|
#[test]
|
||||||
fn memcmp() {
|
fn memcmp() {
|
||||||
use core::str::FromStr;
|
use core::str::FromStr;
|
||||||
use cranelift_codegen::{isa, settings};
|
use cranelift_codegen::isa;
|
||||||
|
|
||||||
let shared_builder = settings::builder();
|
let shared_builder = settings::builder();
|
||||||
let shared_flags = settings::Flags::new(shared_builder);
|
let shared_flags = settings::Flags::new(shared_builder);
|
||||||
@@ -1293,7 +1383,7 @@ block0:
|
|||||||
}
|
}
|
||||||
|
|
||||||
assert_eq!(
|
assert_eq!(
|
||||||
func.display(None).to_string(),
|
func.display().to_string(),
|
||||||
"function %sample() -> i32 system_v {
|
"function %sample() -> i32 system_v {
|
||||||
sig0 = (i64, i64, i64) -> i32 system_v
|
sig0 = (i64, i64, i64) -> i32 system_v
|
||||||
fn0 = %Memcmp sig0
|
fn0 = %Memcmp sig0
|
||||||
@@ -1312,6 +1402,205 @@ block0:
|
|||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn small_memcmp_zero_size() {
|
||||||
|
let align_eight = std::num::NonZeroU8::new(8).unwrap();
|
||||||
|
small_memcmp_helper(
|
||||||
|
"
|
||||||
|
block0:
|
||||||
|
v4 = iconst.i64 0
|
||||||
|
v1 -> v4
|
||||||
|
v3 = iconst.i64 0
|
||||||
|
v0 -> v3
|
||||||
|
v2 = bconst.b1 true
|
||||||
|
return v2",
|
||||||
|
|builder, target, x, y| {
|
||||||
|
builder.emit_small_memory_compare(
|
||||||
|
target.frontend_config(),
|
||||||
|
IntCC::UnsignedGreaterThanOrEqual,
|
||||||
|
x,
|
||||||
|
y,
|
||||||
|
0,
|
||||||
|
align_eight,
|
||||||
|
align_eight,
|
||||||
|
MemFlags::new(),
|
||||||
|
)
|
||||||
|
},
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn small_memcmp_byte_ugt() {
|
||||||
|
let align_one = std::num::NonZeroU8::new(1).unwrap();
|
||||||
|
small_memcmp_helper(
|
||||||
|
"
|
||||||
|
block0:
|
||||||
|
v6 = iconst.i64 0
|
||||||
|
v1 -> v6
|
||||||
|
v5 = iconst.i64 0
|
||||||
|
v0 -> v5
|
||||||
|
v2 = load.i8 aligned v0
|
||||||
|
v3 = load.i8 aligned v1
|
||||||
|
v4 = icmp ugt v2, v3
|
||||||
|
return v4",
|
||||||
|
|builder, target, x, y| {
|
||||||
|
builder.emit_small_memory_compare(
|
||||||
|
target.frontend_config(),
|
||||||
|
IntCC::UnsignedGreaterThan,
|
||||||
|
x,
|
||||||
|
y,
|
||||||
|
1,
|
||||||
|
align_one,
|
||||||
|
align_one,
|
||||||
|
MemFlags::new(),
|
||||||
|
)
|
||||||
|
},
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn small_memcmp_aligned_eq() {
|
||||||
|
let align_four = std::num::NonZeroU8::new(4).unwrap();
|
||||||
|
small_memcmp_helper(
|
||||||
|
"
|
||||||
|
block0:
|
||||||
|
v6 = iconst.i64 0
|
||||||
|
v1 -> v6
|
||||||
|
v5 = iconst.i64 0
|
||||||
|
v0 -> v5
|
||||||
|
v2 = load.i32 aligned v0
|
||||||
|
v3 = load.i32 aligned v1
|
||||||
|
v4 = icmp eq v2, v3
|
||||||
|
return v4",
|
||||||
|
|builder, target, x, y| {
|
||||||
|
builder.emit_small_memory_compare(
|
||||||
|
target.frontend_config(),
|
||||||
|
IntCC::Equal,
|
||||||
|
x,
|
||||||
|
y,
|
||||||
|
4,
|
||||||
|
align_four,
|
||||||
|
align_four,
|
||||||
|
MemFlags::new(),
|
||||||
|
)
|
||||||
|
},
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn small_memcmp_ipv6_ne() {
|
||||||
|
let align_two = std::num::NonZeroU8::new(2).unwrap();
|
||||||
|
small_memcmp_helper(
|
||||||
|
"
|
||||||
|
block0:
|
||||||
|
v6 = iconst.i64 0
|
||||||
|
v1 -> v6
|
||||||
|
v5 = iconst.i64 0
|
||||||
|
v0 -> v5
|
||||||
|
v2 = load.i128 v0
|
||||||
|
v3 = load.i128 v1
|
||||||
|
v4 = icmp ne v2, v3
|
||||||
|
return v4",
|
||||||
|
|builder, target, x, y| {
|
||||||
|
builder.emit_small_memory_compare(
|
||||||
|
target.frontend_config(),
|
||||||
|
IntCC::NotEqual,
|
||||||
|
x,
|
||||||
|
y,
|
||||||
|
16,
|
||||||
|
align_two,
|
||||||
|
align_two,
|
||||||
|
MemFlags::new(),
|
||||||
|
)
|
||||||
|
},
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn small_memcmp_odd_size_uge() {
|
||||||
|
let one = std::num::NonZeroU8::new(1).unwrap();
|
||||||
|
small_memcmp_helper(
|
||||||
|
"
|
||||||
|
sig0 = (i64, i64, i64) -> i32 system_v
|
||||||
|
fn0 = %Memcmp sig0
|
||||||
|
|
||||||
|
block0:
|
||||||
|
v6 = iconst.i64 0
|
||||||
|
v1 -> v6
|
||||||
|
v5 = iconst.i64 0
|
||||||
|
v0 -> v5
|
||||||
|
v2 = iconst.i64 3
|
||||||
|
v3 = call fn0(v0, v1, v2)
|
||||||
|
v4 = icmp_imm sge v3, 0
|
||||||
|
return v4",
|
||||||
|
|builder, target, x, y| {
|
||||||
|
builder.emit_small_memory_compare(
|
||||||
|
target.frontend_config(),
|
||||||
|
IntCC::UnsignedGreaterThanOrEqual,
|
||||||
|
x,
|
||||||
|
y,
|
||||||
|
3,
|
||||||
|
one,
|
||||||
|
one,
|
||||||
|
MemFlags::new(),
|
||||||
|
)
|
||||||
|
},
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
fn small_memcmp_helper(
|
||||||
|
expected: &str,
|
||||||
|
f: impl FnOnce(&mut FunctionBuilder, &dyn TargetIsa, Value, Value) -> Value,
|
||||||
|
) {
|
||||||
|
use core::str::FromStr;
|
||||||
|
use cranelift_codegen::isa;
|
||||||
|
|
||||||
|
let shared_builder = settings::builder();
|
||||||
|
let shared_flags = settings::Flags::new(shared_builder);
|
||||||
|
|
||||||
|
let triple =
|
||||||
|
::target_lexicon::Triple::from_str("x86_64").expect("Couldn't create x86_64 triple");
|
||||||
|
|
||||||
|
let target = isa::lookup(triple)
|
||||||
|
.ok()
|
||||||
|
.map(|b| b.finish(shared_flags))
|
||||||
|
.expect("This test requires x86_64 support.");
|
||||||
|
|
||||||
|
let mut sig = Signature::new(target.default_call_conv());
|
||||||
|
sig.returns.push(AbiParam::new(B1));
|
||||||
|
|
||||||
|
let mut fn_ctx = FunctionBuilderContext::new();
|
||||||
|
let mut func = Function::with_name_signature(ExternalName::testcase("sample"), sig);
|
||||||
|
{
|
||||||
|
let mut builder = FunctionBuilder::new(&mut func, &mut fn_ctx);
|
||||||
|
|
||||||
|
let block0 = builder.create_block();
|
||||||
|
let x = Variable::new(0);
|
||||||
|
let y = Variable::new(1);
|
||||||
|
builder.declare_var(x, target.pointer_type());
|
||||||
|
builder.declare_var(y, target.pointer_type());
|
||||||
|
builder.append_block_params_for_function_params(block0);
|
||||||
|
builder.switch_to_block(block0);
|
||||||
|
|
||||||
|
let left = builder.use_var(x);
|
||||||
|
let right = builder.use_var(y);
|
||||||
|
let ret = f(&mut builder, &*target, left, right);
|
||||||
|
builder.ins().return_(&[ret]);
|
||||||
|
|
||||||
|
builder.seal_all_blocks();
|
||||||
|
builder.finalize();
|
||||||
|
}
|
||||||
|
|
||||||
|
let actual_ir = func.display().to_string();
|
||||||
|
let expected_ir = format!("function %sample() -> b1 system_v {{{}\n}}\n", expected);
|
||||||
|
assert!(
|
||||||
|
expected_ir == actual_ir,
|
||||||
|
"Expected\n{}, but got\n{}",
|
||||||
|
expected_ir,
|
||||||
|
actual_ir
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn undef_vector_vars() {
|
fn undef_vector_vars() {
|
||||||
let mut sig = Signature::new(CallConv::SystemV);
|
let mut sig = Signature::new(CallConv::SystemV);
|
||||||
|
|||||||
Reference in New Issue
Block a user