This PR switches Cranelift over to the new register allocator, regalloc2. See [this document](https://gist.github.com/cfallin/08553421a91f150254fe878f67301801) for a summary of the design changes. This switchover has implications for the core VCode/MachInst types and for the lowering pass.

Overall, this change improves both compile time and the speed of the generated code (runtime), as reported in #3942:

```
Benchmark                Compilation (wallclock)   Execution (wallclock)
blake3-scalar            25% faster                28% faster
blake3-simd              no diff                   no diff
meshoptimizer            19% faster                17% faster
pulldown-cmark           17% faster                no diff
bz2                      15% faster                no diff
SpiderMonkey, fib(30)    21% faster                2% faster
clang.wasm               42% faster                N/A
```
82 lines
1021 B
Plaintext
82 lines
1021 B
Plaintext
test compile precise-output
target s390x

;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; TRAP/RESUMABLE_TRAP
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; Each function below is followed by single-`;` comment lines that hold the
;; expected compiled output for the s390x target.

;; Unconditional `trap user0` as the only instruction of the entry block.
function %trap() {
block0:
    trap user0
}

; block0:
; trap

;; NOTE(review): despite its name, this function uses plain `trap user0`, so its
;; body and expected output are identical to %trap. Confirm whether a resumable
;; trap was intended before changing it; the expected output below would need
;; to be regenerated.
function %resumable_trap() {
block0:
    trap user0
}

; block0:
; trap

;; `trapz` on the result of comparing the argument with the constant 42.
;; The expected output compares with `clgfi`, then branches with `jge` to
;; label1 (the return in block1) and otherwise with `jg` to label2 (the trap
;; in block2).
function %trapz(i64) {
block0(v0: i64):
    v1 = iconst.i64 42
    v2 = icmp eq v0, v1
    trapz v2, user0
    return
}

; block0:
; clgfi %r2, 42
; jge label1 ; jg label2
; block1:
; br %r14
; block2:
; trap

;; `trapnz` on the result of comparing the argument with the constant 42.
;; The expected output has the same shape as for %trapz, except that the
;; first branch is `jgne` instead of `jge`.
function %trapnz(i64) {
block0(v0: i64):
    v1 = iconst.i64 42
    v2 = icmp eq v0, v1
    trapnz v2, user0
    return
}

; block0:
; clgfi %r2, 42
; jgne label1 ; jg label2
; block1:
; br %r14
; block2:
; trap

;; NOTE(review): despite its name, this function uses plain `trapnz`, so its
;; body and expected output are identical to %trapnz. Confirm whether a
;; resumable variant was intended before changing it; the expected output
;; below would need to be regenerated.
function %resumable_trapnz(i64) {
block0(v0: i64):
    v1 = iconst.i64 42
    v2 = icmp eq v0, v1
    trapnz v2, user0
    return
}

; block0:
; clgfi %r2, 42
; jgne label1 ; jg label2
; block1:
; br %r14
; block2:
; trap

;; `debugtrap` followed by a normal return; the expected output keeps both
;; instructions in block0.
function %h() {
block0:
    debugtrap
    return
}

; block0:
; debugtrap
; br %r14
