cranelift: Add inline stack probing for x64 (#4747)

* cranelift: Add inline stack probe for x64

* cranelift: Cleanups comments

Thanks @jameysharp!
This commit is contained in:
Afonso Bordado
2022-09-01 23:32:54 +01:00
committed by GitHub
parent 84ac24c23d
commit 08e7a7f1a0
16 changed files with 394 additions and 17 deletions

View File

@@ -0,0 +1,67 @@
test compile precise-output
set enable_probestack=true
; Test with the larger size of 64k
set probestack_size_log2=16
set probestack_strategy=inline
target x86_64
; If the stack size is just one page, we can avoid the stack probe entirely
function %single_page() -> i64 system_v {
ss0 = explicit_slot 8192
block0:
v1 = stack_addr.i64 ss0
return v1
}
; pushq %rbp
; movq %rsp, %rbp
; subq %rsp, $8192, %rsp
; block0:
; lea rsp(0 + virtual offset), %rax
; addq %rsp, $8192, %rsp
; movq %rbp, %rsp
; popq %rbp
; ret
function %unrolled() -> i64 system_v {
ss0 = explicit_slot 196608
block0:
v1 = stack_addr.i64 ss0
return v1
}
; pushq %rbp
; movq %rsp, %rbp
; movl %esp, -65536(%rsp)
; movl %esp, -131072(%rsp)
; movl %esp, -196608(%rsp)
; subq %rsp, $196608, %rsp
; block0:
; lea rsp(0 + virtual offset), %rax
; addq %rsp, $196608, %rsp
; movq %rbp, %rsp
; popq %rbp
; ret
function %large() -> i64 system_v {
ss0 = explicit_slot 2097152
block0:
v1 = stack_addr.i64 ss0
return v1
}
; pushq %rbp
; movq %rsp, %rbp
; stack_probe_loop %r11, frame_size=2097152, guard_size=65536
; subq %rsp, $2097152, %rsp
; block0:
; lea rsp(0 + virtual offset), %rax
; addq %rsp, $2097152, %rsp
; movq %rbp, %rsp
; popq %rbp
; ret

View File

@@ -0,0 +1,66 @@
test compile precise-output
set enable_probestack=true
set probestack_strategy=inline
; This is the default and is equivalent to a page size of 4096
set probestack_size_log2=12
target x86_64
; If the stack size is just one page, we can avoid the stack probe entirely
function %single_page() -> i64 system_v {
ss0 = explicit_slot 2048
block0:
v1 = stack_addr.i64 ss0
return v1
}
; pushq %rbp
; movq %rsp, %rbp
; subq %rsp, $2048, %rsp
; block0:
; lea rsp(0 + virtual offset), %rax
; addq %rsp, $2048, %rsp
; movq %rbp, %rsp
; popq %rbp
; ret
function %unrolled() -> i64 system_v {
ss0 = explicit_slot 12288
block0:
v1 = stack_addr.i64 ss0
return v1
}
; pushq %rbp
; movq %rsp, %rbp
; movl %esp, -4096(%rsp)
; movl %esp, -8192(%rsp)
; movl %esp, -12288(%rsp)
; subq %rsp, $12288, %rsp
; block0:
; lea rsp(0 + virtual offset), %rax
; addq %rsp, $12288, %rsp
; movq %rbp, %rsp
; popq %rbp
; ret
function %large() -> i64 system_v {
ss0 = explicit_slot 100000
block0:
v1 = stack_addr.i64 ss0
return v1
}
; pushq %rbp
; movq %rsp, %rbp
; stack_probe_loop %r11, frame_size=100000, guard_size=4096
; subq %rsp, $100000, %rsp
; block0:
; lea rsp(0 + virtual offset), %rax
; addq %rsp, $100000, %rsp
; movq %rbp, %rsp
; popq %rbp
; ret