Avoid introducing a move for struct return (#6245)
* Move sret_reg handling to Lower:new, from gen_arg_setup * Update exp files * Review feedback * Review feedback
This commit is contained in:
@@ -377,12 +377,27 @@ impl<'func, I: VCodeInst> Lower<'func, I> {
|
||||
}
|
||||
}
|
||||
|
||||
// Make a sret register, if one is needed.
|
||||
// Find the sret register, if it's used.
|
||||
let mut sret_reg = None;
|
||||
for ret in &vcode.abi().signature().returns.clone() {
|
||||
for ret in vcode.abi().signature().returns.iter() {
|
||||
if ret.purpose == ArgumentPurpose::StructReturn {
|
||||
assert!(sret_reg.is_none());
|
||||
sret_reg = Some(vregs.alloc(ret.value_type)?);
|
||||
let entry_bb = f.stencil.layout.entry_block().unwrap();
|
||||
for (¶m, sig_param) in f
|
||||
.dfg
|
||||
.block_params(entry_bb)
|
||||
.iter()
|
||||
.zip(vcode.abi().signature().params.iter())
|
||||
{
|
||||
if sig_param.purpose == ArgumentPurpose::StructReturn {
|
||||
let regs = value_regs[param];
|
||||
assert!(regs.len() == 1);
|
||||
|
||||
assert!(sret_reg.is_none());
|
||||
sret_reg = Some(regs);
|
||||
}
|
||||
}
|
||||
|
||||
assert!(sret_reg.is_some());
|
||||
}
|
||||
}
|
||||
|
||||
@@ -576,24 +591,6 @@ impl<'func, I: VCodeInst> Lower<'func, I> {
|
||||
{
|
||||
self.emit(insn);
|
||||
}
|
||||
if self.abi().signature().params[i].purpose == ArgumentPurpose::StructReturn {
|
||||
assert!(regs.len() == 1);
|
||||
let ty = self.abi().signature().params[i].value_type;
|
||||
// The ABI implementation must have ensured that a StructReturn
|
||||
// arg is present in the return values.
|
||||
assert!(self
|
||||
.abi()
|
||||
.signature()
|
||||
.returns
|
||||
.iter()
|
||||
.position(|ret| ret.purpose == ArgumentPurpose::StructReturn)
|
||||
.is_some());
|
||||
self.emit(I::gen_move(
|
||||
Writable::from_reg(self.sret_reg.unwrap().regs()[0]),
|
||||
regs.regs()[0].to_reg(),
|
||||
ty,
|
||||
));
|
||||
}
|
||||
}
|
||||
if let Some(insn) = self
|
||||
.vcode
|
||||
|
||||
@@ -850,16 +850,14 @@ block0(v0: i64):
|
||||
|
||||
; VCode:
|
||||
; block0:
|
||||
; mov x5, x8
|
||||
; movz x4, #42
|
||||
; str x4, [x8]
|
||||
; movz x2, #42
|
||||
; str x2, [x8]
|
||||
; ret
|
||||
;
|
||||
; Disassembled:
|
||||
; block0: ; offset 0x0
|
||||
; mov x5, x8
|
||||
; mov x4, #0x2a
|
||||
; str x4, [x8]
|
||||
; mov x2, #0x2a
|
||||
; str x2, [x8]
|
||||
; ret
|
||||
|
||||
function %f18(i64) -> i64 {
|
||||
@@ -905,13 +903,14 @@ block0(v0: i64):
|
||||
; VCode:
|
||||
; stp fp, lr, [sp, #-16]!
|
||||
; mov fp, sp
|
||||
; str x24, [sp, #-16]!
|
||||
; str x23, [sp, #-16]!
|
||||
; block0:
|
||||
; mov x24, x8
|
||||
; load_ext_name x4, TestCase(%g)+0
|
||||
; blr x4
|
||||
; mov x8, x24
|
||||
; ldr x24, [sp], #16
|
||||
; mov x23, x8
|
||||
; load_ext_name x2, TestCase(%g)+0
|
||||
; mov x8, x23
|
||||
; blr x2
|
||||
; mov x8, x23
|
||||
; ldr x23, [sp], #16
|
||||
; ldp fp, lr, [sp], #16
|
||||
; ret
|
||||
;
|
||||
@@ -919,16 +918,17 @@ block0(v0: i64):
|
||||
; block0: ; offset 0x0
|
||||
; stp x29, x30, [sp, #-0x10]!
|
||||
; mov x29, sp
|
||||
; str x24, [sp, #-0x10]!
|
||||
; str x23, [sp, #-0x10]!
|
||||
; block1: ; offset 0xc
|
||||
; mov x24, x8
|
||||
; ldr x4, #0x18
|
||||
; mov x23, x8
|
||||
; ldr x2, #0x18
|
||||
; b #0x20
|
||||
; .byte 0x00, 0x00, 0x00, 0x00 ; reloc_external Abs8 %g 0
|
||||
; .byte 0x00, 0x00, 0x00, 0x00
|
||||
; blr x4
|
||||
; mov x8, x24
|
||||
; ldr x24, [sp], #0x10
|
||||
; mov x8, x23
|
||||
; blr x2
|
||||
; mov x8, x23
|
||||
; ldr x23, [sp], #0x10
|
||||
; ldp x29, x30, [sp], #0x10
|
||||
; ret
|
||||
|
||||
|
||||
@@ -12,9 +12,9 @@ block0(v0: i64):
|
||||
; pushq %rbp
|
||||
; movq %rsp, %rbp
|
||||
; block0:
|
||||
; movl $42, %eax
|
||||
; movq %rax, 0(%rdi)
|
||||
; movq %rdi, %rax
|
||||
; movl $42, %edx
|
||||
; movq %rdx, 0(%rdi)
|
||||
; movq %rbp, %rsp
|
||||
; popq %rbp
|
||||
; ret
|
||||
@@ -24,9 +24,9 @@ block0(v0: i64):
|
||||
; pushq %rbp
|
||||
; movq %rsp, %rbp
|
||||
; block1: ; offset 0x4
|
||||
; movl $0x2a, %eax
|
||||
; movq %rax, (%rdi) ; trap: heap_oob
|
||||
; movq %rdi, %rax
|
||||
; movl $0x2a, %edx
|
||||
; movq %rdx, (%rdi) ; trap: heap_oob
|
||||
; movq %rbp, %rsp
|
||||
; popq %rbp
|
||||
; retq
|
||||
@@ -79,8 +79,9 @@ block0(v0: i64):
|
||||
; movq %r15, 0(%rsp)
|
||||
; block0:
|
||||
; movq %rdi, %r15
|
||||
; load_ext_name %f4+0, %rdx
|
||||
; call *%rdx
|
||||
; load_ext_name %f4+0, %rax
|
||||
; movq %r15, %rdi
|
||||
; call *%rax
|
||||
; movq %r15, %rax
|
||||
; movq 0(%rsp), %r15
|
||||
; addq %rsp, $16, %rsp
|
||||
@@ -96,8 +97,9 @@ block0(v0: i64):
|
||||
; movq %r15, (%rsp)
|
||||
; block1: ; offset 0xc
|
||||
; movq %rdi, %r15
|
||||
; movabsq $0, %rdx ; reloc_external Abs8 %f4 0
|
||||
; callq *%rdx
|
||||
; movabsq $0, %rax ; reloc_external Abs8 %f4 0
|
||||
; movq %r15, %rdi
|
||||
; callq *%rax
|
||||
; movq %r15, %rax
|
||||
; movq (%rsp), %r15
|
||||
; addq $0x10, %rsp
|
||||
|
||||
Reference in New Issue
Block a user