Add x86-specific instruction for i64x2 multiplication
Without this special instruction, legalizing to the AVX512 instruction AND the SSE instruction sequence is impossible. This extra instruction would be rendered unnecessary by the x64 backend.
This commit is contained in:
@@ -69,3 +69,10 @@ block0:
|
||||
; nextln: v1 = band v0, v4
|
||||
return
|
||||
}
|
||||
|
||||
function %imul(i64x2, i64x2) {
|
||||
block0(v0:i64x2, v1:i64x2):
|
||||
v2 = imul v0, v1
|
||||
; check: v2 = x86_pmullq v0, v1
|
||||
return
|
||||
}
|
||||
|
||||
@@ -6,7 +6,7 @@ function %imul_i64x2() {
|
||||
block0:
|
||||
[-, %xmm1] v0 = vconst.i64x2 [1 2]
|
||||
[-, %xmm2] v1 = vconst.i64x2 [2 2]
|
||||
[-, %xmm14] v2 = imul v0, v1 ; bin: 62 72 f5 08 40 f2
|
||||
[-, %xmm14] v2 = x86_pmullq v0, v1 ; bin: 62 72 f5 08 40 f2
|
||||
; 62, mandatory EVEX prefix
|
||||
; 72 = 0111 0010, R is set (MSB in %xmm14) while X, B, and R' are unset (note these are all inverted); mm is set to 0F38
|
||||
; f5 = 1111 0101, W is set (64-bit op), vvvv set to 1 (inverted), bit 2 always set, pp set to 01
|
||||
|
||||
Reference in New Issue
Block a user