[AArch64] Merge 32- and 64-bit ALUOps (#3802)

Combine the two opcodes into one and pass and add an OperandSize field to these instructions, as well as an ISLE helper to perform the conversion from Type. This saves us from having having to write ISLE helpers to select the correct opcode, based on type, and reduces the amount of code needed for emission. Copyright (c) 2022, Arm Limited.
2022-02-17 18:03:54 +00:00
parent b62fe21914
commit e572198f85
10 changed files with 1786 additions and 1987 deletions
--- a/cranelift/codegen/src/isa/aarch64/inst/emit.rs
+++ b/cranelift/codegen/src/isa/aarch64/inst/emit.rs
@@ -67,7 +67,8 @@ pub fn mem_finalize(
                // is a valid base (for SPOffset) which we must handle here.
                // Also, SP needs to be the first arg, not second.
                let add_inst = Inst::AluRRRExtend {
-                    alu_op: ALUOp::Add64,
+                    alu_op: ALUOp::Add,
+                    size: OperandSize::Size64,
                    rd: tmp,
                    rn: basereg,
                    rm: tmp.to_reg(),
@@ -682,52 +683,48 @@ impl MachInstEmit for Inst {
        let mut start_off = sink.cur_offset();

        match self {
-            &Inst::AluRRR { alu_op, rd, rn, rm } => {
+            &Inst::AluRRR {
+                alu_op,
+                size,
+                rd,
+                rn,
+                rm,
+            } => {
+                debug_assert!(match alu_op {
+                    ALUOp::SDiv | ALUOp::UDiv | ALUOp::SMulH | ALUOp::UMulH =>
+                        size == OperandSize::Size64,
+                    _ => true,
+                });
                let top11 = match alu_op {
-                    ALUOp::Add32 => 0b00001011_000,
-                    ALUOp::Add64 => 0b10001011_000,
-                    ALUOp::Adc32 => 0b00011010_000,
-                    ALUOp::Adc64 => 0b10011010_000,
-                    ALUOp::AdcS32 => 0b00111010_000,
-                    ALUOp::AdcS64 => 0b10111010_000,
-                    ALUOp::Sub32 => 0b01001011_000,
-                    ALUOp::Sub64 => 0b11001011_000,
-                    ALUOp::Sbc32 => 0b01011010_000,
-                    ALUOp::Sbc64 => 0b11011010_000,
-                    ALUOp::SbcS32 => 0b01111010_000,
-                    ALUOp::SbcS64 => 0b11111010_000,
-                    ALUOp::Orr32 => 0b00101010_000,
-                    ALUOp::Orr64 => 0b10101010_000,
-                    ALUOp::And32 => 0b00001010_000,
-                    ALUOp::And64 => 0b10001010_000,
-                    ALUOp::AndS32 => 0b01101010_000,
-                    ALUOp::AndS64 => 0b11101010_000,
-                    ALUOp::Eor32 => 0b01001010_000,
-                    ALUOp::Eor64 => 0b11001010_000,
-                    ALUOp::OrrNot32 => 0b00101010_001,
-                    ALUOp::OrrNot64 => 0b10101010_001,
-                    ALUOp::AndNot32 => 0b00001010_001,
-                    ALUOp::AndNot64 => 0b10001010_001,
-                    ALUOp::EorNot32 => 0b01001010_001,
-                    ALUOp::EorNot64 => 0b11001010_001,
-                    ALUOp::AddS32 => 0b00101011_000,
-                    ALUOp::AddS64 => 0b10101011_000,
-                    ALUOp::SubS32 => 0b01101011_000,
-                    ALUOp::SubS64 => 0b11101011_000,
-                    ALUOp::SDiv64 => 0b10011010_110,
-                    ALUOp::UDiv64 => 0b10011010_110,
-                    ALUOp::RotR32 | ALUOp::Lsr32 | ALUOp::Asr32 | ALUOp::Lsl32 => 0b00011010_110,
-                    ALUOp::RotR64 | ALUOp::Lsr64 | ALUOp::Asr64 | ALUOp::Lsl64 => 0b10011010_110,
+                    ALUOp::Add => 0b00001011_000,
+                    ALUOp::Adc => 0b00011010_000,
+                    ALUOp::AdcS => 0b00111010_000,
+                    ALUOp::Sub => 0b01001011_000,
+                    ALUOp::Sbc => 0b01011010_000,
+                    ALUOp::SbcS => 0b01111010_000,
+                    ALUOp::Orr => 0b00101010_000,
+                    ALUOp::And => 0b00001010_000,
+                    ALUOp::AndS => 0b01101010_000,
+                    ALUOp::Eor => 0b01001010_000,
+                    ALUOp::OrrNot => 0b00101010_001,
+                    ALUOp::AndNot => 0b00001010_001,
+                    ALUOp::EorNot => 0b01001010_001,
+                    ALUOp::AddS => 0b00101011_000,
+                    ALUOp::SubS => 0b01101011_000,
+                    ALUOp::SDiv => 0b10011010_110,
+                    ALUOp::UDiv => 0b10011010_110,
+                    ALUOp::RotR | ALUOp::Lsr | ALUOp::Asr | ALUOp::Lsl => 0b00011010_110,
                    ALUOp::SMulH => 0b10011011_010,
                    ALUOp::UMulH => 0b10011011_110,
                };
+                let top11 = top11 | size.sf_bit() << 10;
                let bit15_10 = match alu_op {
-                    ALUOp::SDiv64 => 0b000011,
-                    ALUOp::UDiv64 => 0b000010,
-                    ALUOp::RotR32 | ALUOp::RotR64 => 0b001011,
-                    ALUOp::Lsr32 | ALUOp::Lsr64 => 0b001001,
-                    ALUOp::Asr32 | ALUOp::Asr64 => 0b001010,
-                    ALUOp::Lsl32 | ALUOp::Lsl64 => 0b001000,
+                    ALUOp::SDiv => 0b000011,
+                    ALUOp::UDiv => 0b000010,
+                    ALUOp::RotR => 0b001011,
+                    ALUOp::Lsr => 0b001001,
+                    ALUOp::Asr => 0b001010,
+                    ALUOp::Lsl => 0b001000,
                    ALUOp::SMulH | ALUOp::UMulH => 0b011111,
                    _ => 0b000000,
                };
@@ -755,21 +752,19 @@ impl MachInstEmit for Inst {
            }
            &Inst::AluRRImm12 {
                alu_op,
+                size,
                rd,
                rn,
                ref imm12,
            } => {
                let top8 = match alu_op {
-                    ALUOp::Add32 => 0b000_10001,
-                    ALUOp::Add64 => 0b100_10001,
-                    ALUOp::Sub32 => 0b010_10001,
-                    ALUOp::Sub64 => 0b110_10001,
-                    ALUOp::AddS32 => 0b001_10001,
-                    ALUOp::AddS64 => 0b101_10001,
-                    ALUOp::SubS32 => 0b011_10001,
-                    ALUOp::SubS64 => 0b111_10001,
+                    ALUOp::Add => 0b000_10001,
+                    ALUOp::Sub => 0b010_10001,
+                    ALUOp::AddS => 0b001_10001,
+                    ALUOp::SubS => 0b011_10001,
                    _ => unimplemented!("{:?}", alu_op),
                };
+                let top8 = top8 | size.sf_bit() << 7;
                sink.put4(enc_arith_rr_imm12(
                    top8,
                    imm12.shift_bits(),
@@ -780,57 +775,53 @@ impl MachInstEmit for Inst {
            }
            &Inst::AluRRImmLogic {
                alu_op,
+                size,
                rd,
                rn,
                ref imml,
            } => {
                let (top9, inv) = match alu_op {
-                    ALUOp::Orr32 => (0b001_100100, false),
-                    ALUOp::Orr64 => (0b101_100100, false),
-                    ALUOp::And32 => (0b000_100100, false),
-                    ALUOp::And64 => (0b100_100100, false),
-                    ALUOp::AndS32 => (0b011_100100, false),
-                    ALUOp::AndS64 => (0b111_100100, false),
-                    ALUOp::Eor32 => (0b010_100100, false),
-                    ALUOp::Eor64 => (0b110_100100, false),
-                    ALUOp::OrrNot32 => (0b001_100100, true),
-                    ALUOp::OrrNot64 => (0b101_100100, true),
-                    ALUOp::AndNot32 => (0b000_100100, true),
-                    ALUOp::AndNot64 => (0b100_100100, true),
-                    ALUOp::EorNot32 => (0b010_100100, true),
-                    ALUOp::EorNot64 => (0b110_100100, true),
+                    ALUOp::Orr => (0b001_100100, false),
+                    ALUOp::And => (0b000_100100, false),
+                    ALUOp::AndS => (0b011_100100, false),
+                    ALUOp::Eor => (0b010_100100, false),
+                    ALUOp::OrrNot => (0b001_100100, true),
+                    ALUOp::AndNot => (0b000_100100, true),
+                    ALUOp::EorNot => (0b010_100100, true),
                    _ => unimplemented!("{:?}", alu_op),
                };
+                let top9 = top9 | size.sf_bit() << 8;
                let imml = if inv { imml.invert() } else { imml.clone() };
                sink.put4(enc_arith_rr_imml(top9, imml.enc_bits(), rn, rd));
            }

            &Inst::AluRRImmShift {
                alu_op,
+                size,
                rd,
                rn,
                ref immshift,
            } => {
                let amt = immshift.value();
                let (top10, immr, imms) = match alu_op {
-                    ALUOp::RotR32 => (0b0001001110, machreg_to_gpr(rn), u32::from(amt)),
-                    ALUOp::RotR64 => (0b1001001111, machreg_to_gpr(rn), u32::from(amt)),
-                    ALUOp::Lsr32 => (0b0101001100, u32::from(amt), 0b011111),
-                    ALUOp::Lsr64 => (0b1101001101, u32::from(amt), 0b111111),
-                    ALUOp::Asr32 => (0b0001001100, u32::from(amt), 0b011111),
-                    ALUOp::Asr64 => (0b1001001101, u32::from(amt), 0b111111),
-                    ALUOp::Lsl32 => (
-                        0b0101001100,
-                        u32::from((32 - amt) % 32),
-                        u32::from(31 - amt),
-                    ),
-                    ALUOp::Lsl64 => (
-                        0b1101001101,
-                        u32::from((64 - amt) % 64),
-                        u32::from(63 - amt),
-                    ),
+                    ALUOp::RotR => (0b0001001110, machreg_to_gpr(rn), u32::from(amt)),
+                    ALUOp::Lsr => (0b0101001100, u32::from(amt), 0b011111),
+                    ALUOp::Asr => (0b0001001100, u32::from(amt), 0b011111),
+                    ALUOp::Lsl => {
+                        let bits = if size.is64() { 64 } else { 32 };
+                        (
+                            0b0101001100,
+                            u32::from((bits - amt) % bits),
+                            u32::from(bits - 1 - amt),
+                        )
+                    }
                    _ => unimplemented!("{:?}", alu_op),
                };
+                let top10 = top10 | size.sf_bit() << 9 | size.sf_bit();
+                let imms = match alu_op {
+                    ALUOp::Lsr | ALUOp::Asr => imms | size.sf_bit() << 5,
+                    _ => imms,
+                };
                sink.put4(
                    (top10 << 22)
                        | (immr << 16)
@@ -842,36 +833,27 @@ impl MachInstEmit for Inst {

            &Inst::AluRRRShift {
                alu_op,
+                size,
                rd,
                rn,
                rm,
                ref shiftop,
            } => {
                let top11: u32 = match alu_op {
-                    ALUOp::Add32 => 0b000_01011000,
-                    ALUOp::Add64 => 0b100_01011000,
-                    ALUOp::AddS32 => 0b001_01011000,
-                    ALUOp::AddS64 => 0b101_01011000,
-                    ALUOp::Sub32 => 0b010_01011000,
-                    ALUOp::Sub64 => 0b110_01011000,
-                    ALUOp::SubS32 => 0b011_01011000,
-                    ALUOp::SubS64 => 0b111_01011000,
-                    ALUOp::Orr32 => 0b001_01010000,
-                    ALUOp::Orr64 => 0b101_01010000,
-                    ALUOp::And32 => 0b000_01010000,
-                    ALUOp::And64 => 0b100_01010000,
-                    ALUOp::AndS32 => 0b011_01010000,
-                    ALUOp::AndS64 => 0b111_01010000,
-                    ALUOp::Eor32 => 0b010_01010000,
-                    ALUOp::Eor64 => 0b110_01010000,
-                    ALUOp::OrrNot32 => 0b001_01010001,
-                    ALUOp::OrrNot64 => 0b101_01010001,
-                    ALUOp::EorNot32 => 0b010_01010001,
-                    ALUOp::EorNot64 => 0b110_01010001,
-                    ALUOp::AndNot32 => 0b000_01010001,
-                    ALUOp::AndNot64 => 0b100_01010001,
+                    ALUOp::Add => 0b000_01011000,
+                    ALUOp::AddS => 0b001_01011000,
+                    ALUOp::Sub => 0b010_01011000,
+                    ALUOp::SubS => 0b011_01011000,
+                    ALUOp::Orr => 0b001_01010000,
+                    ALUOp::And => 0b000_01010000,
+                    ALUOp::AndS => 0b011_01010000,
+                    ALUOp::Eor => 0b010_01010000,
+                    ALUOp::OrrNot => 0b001_01010001,
+                    ALUOp::EorNot => 0b010_01010001,
+                    ALUOp::AndNot => 0b000_01010001,
                    _ => unimplemented!("{:?}", alu_op),
                };
+                let top11 = top11 | size.sf_bit() << 10;
                let top11 = top11 | (u32::from(shiftop.op().bits()) << 1);
                let bits_15_10 = u32::from(shiftop.amt().value());
                sink.put4(enc_arith_rrr(top11, bits_15_10, rd, rn, rm));
@@ -879,22 +861,20 @@ impl MachInstEmit for Inst {

            &Inst::AluRRRExtend {
                alu_op,
+                size,
                rd,
                rn,
                rm,
                extendop,
            } => {
                let top11: u32 = match alu_op {
-                    ALUOp::Add32 => 0b00001011001,
-                    ALUOp::Add64 => 0b10001011001,
-                    ALUOp::Sub32 => 0b01001011001,
-                    ALUOp::Sub64 => 0b11001011001,
-                    ALUOp::AddS32 => 0b00101011001,
-                    ALUOp::AddS64 => 0b10101011001,
-                    ALUOp::SubS32 => 0b01101011001,
-                    ALUOp::SubS64 => 0b11101011001,
+                    ALUOp::Add => 0b00001011001,
+                    ALUOp::Sub => 0b01001011001,
+                    ALUOp::AddS => 0b00101011001,
+                    ALUOp::SubS => 0b01101011001,
                    _ => unimplemented!("{:?}", alu_op),
                };
+                let top11 = top11 | size.sf_bit() << 10;
                let bits_15_10 = u32::from(extendop.bits()) << 3;
                sink.put4(enc_arith_rrr(top11, bits_15_10, rd, rn, rm));
            }
@@ -1394,7 +1374,8 @@ impl MachInstEmit for Inst {
                        // mvn x28, x28

                        Inst::AluRRR {
-                            alu_op: ALUOp::And64,
+                            alu_op: ALUOp::And,
+                            size: OperandSize::Size64,
                            rd: x28wr,
                            rn: x27,
                            rm: x26,
@@ -1402,7 +1383,8 @@ impl MachInstEmit for Inst {
                        .emit(sink, emit_info, state);

                        Inst::AluRRR {
-                            alu_op: ALUOp::OrrNot64,
+                            alu_op: ALUOp::OrrNot,
+                            size: OperandSize::Size64,
                            rd: x28wr,
                            rn: xzr,
                            rm: x28,
@@ -1425,11 +1407,8 @@ impl MachInstEmit for Inst {
                        };

                        Inst::AluRRR {
-                            alu_op: if ty == I64 {
-                                ALUOp::SubS64
-                            } else {
-                                ALUOp::SubS32
-                            },
+                            alu_op: ALUOp::SubS,
+                            size: OperandSize::from_ty(ty),
                            rd: writable_zero_reg(),
                            rn: x27,
                            rm: x26,
@@ -1447,11 +1426,11 @@ impl MachInstEmit for Inst {
                    _ => {
                        // add/sub/and/orr/eor x28, x27, x26
                        let alu_op = match op {
-                            AtomicRmwOp::Add => ALUOp::Add64,
-                            AtomicRmwOp::Sub => ALUOp::Sub64,
-                            AtomicRmwOp::And => ALUOp::And64,
-                            AtomicRmwOp::Or => ALUOp::Orr64,
-                            AtomicRmwOp::Xor => ALUOp::Eor64,
+                            AtomicRmwOp::Add => ALUOp::Add,
+                            AtomicRmwOp::Sub => ALUOp::Sub,
+                            AtomicRmwOp::And => ALUOp::And,
+                            AtomicRmwOp::Or => ALUOp::Orr,
+                            AtomicRmwOp::Xor => ALUOp::Eor,
                            AtomicRmwOp::Nand
                            | AtomicRmwOp::Umin
                            | AtomicRmwOp::Umax
@@ -1462,6 +1441,7 @@ impl MachInstEmit for Inst {

                        Inst::AluRRR {
                            alu_op,
+                            size: OperandSize::Size64,
                            rd: x28wr,
                            rn: x27,
                            rm: x26,
@@ -2478,7 +2458,8 @@ impl MachInstEmit for Inst {
                // than AND on smaller cores.
                let imml = ImmLogic::maybe_from_u64(1, I32).unwrap();
                Inst::AluRRImmLogic {
-                    alu_op: ALUOp::And32,
+                    alu_op: ALUOp::And,
+                    size: OperandSize::Size32,
                    rd,
                    rn,
                    imml,
@@ -2655,7 +2636,8 @@ impl MachInstEmit for Inst {
                inst.emit(sink, emit_info, state);
                // Add base of jump table to jump-table-sourced block offset
                let inst = Inst::AluRRR {
-                    alu_op: ALUOp::Add64,
+                    alu_op: ALUOp::Add,
+                    size: OperandSize::Size64,
                    rd: rtmp1,
                    rn: rtmp1.to_reg(),
                    rm: rtmp2.to_reg(),
@@ -2731,15 +2713,12 @@ impl MachInstEmit for Inst {
                } else {
                    offset as u64
                };
-                let alu_op = if offset < 0 {
-                    ALUOp::Sub64
-                } else {
-                    ALUOp::Add64
-                };
+                let alu_op = if offset < 0 { ALUOp::Sub } else { ALUOp::Add };

                if let Some((idx, extendop)) = index_reg {
                    let add = Inst::AluRRRExtend {
-                        alu_op: ALUOp::Add64,
+                        alu_op: ALUOp::Add,
+                        size: OperandSize::Size64,
                        rd,
                        rn: reg,
                        rm: idx,
@@ -2756,6 +2735,7 @@ impl MachInstEmit for Inst {
                } else if let Some(imm12) = Imm12::maybe_from_u64(abs_offset) {
                    let add = Inst::AluRRImm12 {
                        alu_op,
+                        size: OperandSize::Size64,
                        rd,
                        rn: reg,
                        imm12,
@@ -2775,6 +2755,7 @@ impl MachInstEmit for Inst {
                    }
                    let add = Inst::AluRRR {
                        alu_op,
+                        size: OperandSize::Size64,
                        rd,
                        rn: reg,
                        rm: tmp.to_reg(),