Merge pull request #2181 from jgouly/madd-opt
arm64: Combine mul + add into madd
This commit is contained in:
@@ -74,9 +74,35 @@ pub(crate) fn lower_insn_to_regs<C: LowerCtx<I = Inst>>(
|
|||||||
}
|
}
|
||||||
Opcode::Iadd => {
|
Opcode::Iadd => {
|
||||||
let rd = get_output_reg(ctx, outputs[0]);
|
let rd = get_output_reg(ctx, outputs[0]);
|
||||||
let rn = put_input_in_reg(ctx, inputs[0], NarrowValueMode::None);
|
|
||||||
let ty = ty.unwrap();
|
let ty = ty.unwrap();
|
||||||
if !ty.is_vector() {
|
if !ty.is_vector() {
|
||||||
|
let mul_insn =
|
||||||
|
if let Some(mul_insn) = maybe_input_insn(ctx, inputs[1], Opcode::Imul) {
|
||||||
|
Some((mul_insn, 0))
|
||||||
|
} else if let Some(mul_insn) = maybe_input_insn(ctx, inputs[0], Opcode::Imul) {
|
||||||
|
Some((mul_insn, 1))
|
||||||
|
} else {
|
||||||
|
None
|
||||||
|
};
|
||||||
|
// If possible combine mul + add into madd.
|
||||||
|
if let Some((insn, addend_idx)) = mul_insn {
|
||||||
|
let alu_op = choose_32_64(ty, ALUOp3::MAdd32, ALUOp3::MAdd64);
|
||||||
|
let rn_input = InsnInput { insn, input: 0 };
|
||||||
|
let rm_input = InsnInput { insn, input: 1 };
|
||||||
|
|
||||||
|
let rn = put_input_in_reg(ctx, rn_input, NarrowValueMode::None);
|
||||||
|
let rm = put_input_in_reg(ctx, rm_input, NarrowValueMode::None);
|
||||||
|
let ra = put_input_in_reg(ctx, inputs[addend_idx], NarrowValueMode::None);
|
||||||
|
|
||||||
|
ctx.emit(Inst::AluRRRR {
|
||||||
|
alu_op,
|
||||||
|
rd,
|
||||||
|
rn,
|
||||||
|
rm,
|
||||||
|
ra,
|
||||||
|
});
|
||||||
|
} else {
|
||||||
|
let rn = put_input_in_reg(ctx, inputs[0], NarrowValueMode::None);
|
||||||
let (rm, negated) = put_input_in_rse_imm12_maybe_negated(
|
let (rm, negated) = put_input_in_rse_imm12_maybe_negated(
|
||||||
ctx,
|
ctx,
|
||||||
inputs[1],
|
inputs[1],
|
||||||
@@ -89,8 +115,10 @@ pub(crate) fn lower_insn_to_regs<C: LowerCtx<I = Inst>>(
|
|||||||
choose_32_64(ty, ALUOp::Sub32, ALUOp::Sub64)
|
choose_32_64(ty, ALUOp::Sub32, ALUOp::Sub64)
|
||||||
};
|
};
|
||||||
ctx.emit(alu_inst_imm12(alu_op, rd, rn, rm));
|
ctx.emit(alu_inst_imm12(alu_op, rd, rn, rm));
|
||||||
|
}
|
||||||
} else {
|
} else {
|
||||||
let rm = put_input_in_reg(ctx, inputs[1], NarrowValueMode::None);
|
let rm = put_input_in_reg(ctx, inputs[1], NarrowValueMode::None);
|
||||||
|
let rn = put_input_in_reg(ctx, inputs[0], NarrowValueMode::None);
|
||||||
ctx.emit(Inst::VecRRR {
|
ctx.emit(Inst::VecRRR {
|
||||||
rd,
|
rd,
|
||||||
rn,
|
rn,
|
||||||
|
|||||||
Reference in New Issue
Block a user