x64: Peephole optimization for x < 0 (#4625)

https://github.com/bytecodealliance/wasmtime/pull/4625

Fixes #4607
This commit is contained in:
Trevor Elliott
2022-08-09 09:45:53 -07:00
committed by GitHub
parent a36a52a017
commit ed7dfd3925
3 changed files with 224 additions and 0 deletions

View File

@@ -73,3 +73,135 @@ block2:
; popq %rbp
; ret
function %test_x_slt_0_i64(i64) -> b1 {
block0(v0: i64):
v1 = iconst.i64 0
v2 = icmp slt v0, v1
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; shrq $63, %rdi, %rdi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret
function %test_x_slt_0_i32f4(i32) -> b1 {
block0(v0: i32):
v1 = iconst.i32 0
v2 = icmp slt v0, v1
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; shrl $31, %edi, %edi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret
function %test_0_sgt_x_i64(i64) -> b1 {
block0(v0: i64):
v1 = iconst.i64 0
v2 = icmp sgt v1, v0
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; shrq $63, %rdi, %rdi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret
function %test_0_sgt_x_i32f4(i32) -> b1 {
block0(v0: i32):
v1 = iconst.i32 0
v2 = icmp sgt v1, v0
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; shrl $31, %edi, %edi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret
function %test_0_sle_x_i64(i64) -> b1 {
block0(v0: i64):
v1 = iconst.i64 0
v2 = icmp sle v1, v0
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; notq %rdi, %rdi
; shrq $63, %rdi, %rdi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret
function %test_0_sle_x_i32f4(i32) -> b1 {
block0(v0: i32):
v1 = iconst.i32 0
v2 = icmp sle v1, v0
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; notq %rdi, %rdi
; shrl $31, %edi, %edi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret
function %test_x_sge_x_i64(i64) -> b1 {
block0(v0: i64):
v1 = iconst.i64 0
v2 = icmp sge v0, v1
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; notq %rdi, %rdi
; shrq $63, %rdi, %rdi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret
function %test_x_sge_x_i32f4(i32) -> b1 {
block0(v0: i32):
v1 = iconst.i32 0
v2 = icmp sge v0, v1
return v2
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; notq %rdi, %rdi
; shrl $31, %edi, %edi
; movq %rdi, %rax
; movq %rbp, %rsp
; popq %rbp
; ret

View File

@@ -223,3 +223,63 @@ block2:
; popq %rbp
; ret
function %f6(i64) -> b1 {
block0(v0: i64):
v1 = iconst.i64 0
v2 = icmp slt v0, v1
brnz v2, block1
jump block2
block1:
v3 = bconst.b1 true
return v3
block2:
v4 = bconst.b1 false
return v4
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; cmpq $0, %rdi
; jl label1; j label2
; block1:
; movl $1, %eax
; movq %rbp, %rsp
; popq %rbp
; ret
; block2:
; xorl %eax, %eax, %eax
; movq %rbp, %rsp
; popq %rbp
; ret
function %f7(i32) -> b1 {
block0(v0: i32):
v1 = iconst.i32 0
v2 = icmp slt v0, v1
brnz v2, block1
jump block2
block1:
v3 = bconst.b1 true
return v3
block2:
v4 = bconst.b1 false
return v4
}
; pushq %rbp
; movq %rsp, %rbp
; block0:
; cmpl $0, %edi
; jl label1; j label2
; block1:
; movl $1, %eax
; movq %rbp, %rsp
; popq %rbp
; ret
; block2:
; xorl %eax, %eax, %eax
; movq %rbp, %rsp
; popq %rbp
; ret