* [AArch64] Port SIMD narrowing to ISLE Fvdemote, snarrow, unarrow and uunarrow. Also refactor the aarch64 instructions descriptions to parameterize on ScalarSize instead of using different opcodes. The zero_value pure constructor has been introduced and used by the integer narrow operations and it replaces, and extends, the compare zero patterns. Copright (c) 2022, Arm Limited. * use short 'if' patterns
101 lines
4.8 KiB
Common Lisp
101 lines
4.8 KiB
Common Lisp
|
|
;;;; Rules for `iadd` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (iadd x y)))
|
|
(value_reg (add_vec (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `isub` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (isub x y)))
|
|
(value_reg (sub_vec (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `imul` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type (lane_fits_in_32 ty @ (dynamic_lane _ _)) (imul x y)))
|
|
(value_reg (vec_rrr (VecALUOp.Mul) (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `fadd` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fadd x y)))
|
|
(value_reg (vec_rrr (VecALUOp.Fadd) (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `fsub` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fsub x y)))
|
|
(value_reg (vec_rrr (VecALUOp.Fsub) (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `fmul` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fmul x y)))
|
|
(value_reg (vec_rrr (VecALUOp.Fmul) (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `fdiv` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fdiv x y)))
|
|
(value_reg (vec_rrr (VecALUOp.Fdiv) (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `fmin` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fmin x y)))
|
|
(value_reg (vec_rrr (VecALUOp.Fmin) (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `fmax` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fmax x y)))
|
|
(value_reg (vec_rrr (VecALUOp.Fmax) (put_in_reg x) (put_in_reg y) (vector_size ty))))
|
|
|
|
;;;; Rules for `fmin_pseudo` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fmin_pseudo x y)))
|
|
(value_reg (bsl ty
|
|
(vec_rrr (VecALUOp.Fcmgt) (put_in_reg x) (put_in_reg y)
|
|
(vector_size ty)) (put_in_reg y) (put_in_reg x))))
|
|
|
|
;;;; Rules for `fmax_pseudo` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type ty @ (dynamic_lane _ _) (fmax_pseudo x y)))
|
|
(value_reg (bsl ty
|
|
(vec_rrr (VecALUOp.Fcmgt) (put_in_reg y) (put_in_reg x)
|
|
(vector_size ty)) (put_in_reg y) (put_in_reg x))))
|
|
|
|
;;;; Rules for `snarrow` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type (ty_dyn128_int ty) (snarrow x y)))
|
|
(if-let _ (zero_value y))
|
|
(sqxtn x (lane_size ty)))
|
|
|
|
(rule (lower (has_type (ty_dyn64_int ty) (snarrow x y)))
|
|
(let ((dst Reg (mov_vec_elem x y 1 0 (VectorSize.Size64x2))))
|
|
(sqxtn dst (lane_size ty))))
|
|
|
|
(rule (lower (has_type (ty_dyn128_int ty) (snarrow x y)))
|
|
(let ((low_half Reg (sqxtn x (lane_size ty)))
|
|
(result Reg (sqxtn2 low_half y (lane_size ty))))
|
|
result))
|
|
|
|
;;;; Rules for `unarrow` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type (ty_dyn128_int ty) (unarrow x y)))
|
|
(if-let _ (zero_value y))
|
|
(sqxtun x (lane_size ty)))
|
|
|
|
(rule (lower (has_type (ty_dyn64_int ty) (unarrow x y)))
|
|
(let ((dst Reg (mov_vec_elem x y 1 0 (VectorSize.Size64x2))))
|
|
(sqxtun dst (lane_size ty))))
|
|
|
|
(rule (lower (has_type (ty_dyn128_int ty) (unarrow x y)))
|
|
(let ((low_half Reg (sqxtun x (lane_size ty)))
|
|
(result Reg (sqxtun2 low_half y (lane_size ty))))
|
|
result))
|
|
|
|
;;;; Rules for `uunarrow` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (has_type (ty_dyn128_int ty) (uunarrow x y)))
|
|
(if-let _ (zero_value y))
|
|
(uqxtn x (lane_size ty)))
|
|
|
|
(rule (lower (has_type (ty_dyn64_int ty) (uunarrow x y)))
|
|
(let ((dst Reg (mov_vec_elem x y 1 0 (VectorSize.Size64x2))))
|
|
(uqxtn dst (lane_size ty))))
|
|
|
|
(rule (lower (has_type (ty_dyn128_int ty) (uunarrow x y)))
|
|
(let ((low_half Reg (uqxtn x (lane_size ty)))
|
|
(result Reg (uqxtn2 low_half y (lane_size ty))))
|
|
result))
|
|
|
|
;;; Rules for `dynamic_stack_addr` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (dynamic_stack_addr stack_slot))
|
|
(let ((dst WritableReg (temp_writable_reg $I64))
|
|
(_ Unit (emit (abi_dynamic_stackslot_addr dst stack_slot))))
|
|
(value_reg dst)))
|
|
|
|
;;; Rules for `extract_vector` ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
(rule (lower (extract_vector x 0))
|
|
(value_reg (fpu_move_128 (put_in_reg x))))
|