wasmtime/filetests/isa/intel/binary32-float.cton

; Binary emission of 32-bit floating point code.
test binemit
isa intel has_sse2

; The binary encodings can be verified with the command:
;
;   sed -ne 's/^ *; asm: *//p' filetests/isa/intel/binary32-float.cton | llvm-mc -show-encoding -triple=i386
;

function %F32() {
ebb0:
    [-,%rcx]            v0 = iconst.i32 1
    [-,%rsi]            v1 = iconst.i32 2

    ; asm: cvtsi2ss %ecx, %xmm5
    [-,%xmm5]           v10 = fcvt_from_sint.f32 v0             ; bin: f3 0f 2a e9
    ; asm: cvtsi2ss %esi, %xmm2
    [-,%xmm2]           v11 = fcvt_from_sint.f32 v1             ; bin: f3 0f 2a d6

    ; asm: cvtss2sd %xmm2, %xmm5
    [-,%xmm5]           v12 = fpromote.f64 v11                  ; bin: f3 0f 5a ea
    ; asm: cvtss2sd %xmm5, %xmm2
    [-,%xmm2]           v13 = fpromote.f64 v10                  ; bin: f3 0f 5a d5

    ; asm: movd %ecx, %xmm5
    [-,%xmm5]           v14 = bitcast.f32 v0                    ; bin: 66 0f 6e e9
    ; asm: movd %esi, %xmm2
    [-,%xmm2]           v15 = bitcast.f32 v1                    ; bin: 66 0f 6e d6

    ; asm: movd %xmm5, %ecx
    [-,%rcx]            v16 = bitcast.i32 v10                   ; bin: 66 0f 7e e9
    ; asm: movd %xmm2, %esi
    [-,%rsi]            v17 = bitcast.i32 v11                   ; bin: 66 0f 7e d6

    ; Binary arithmetic.

    ; asm: addss %xmm2, %xmm5
    [-,%xmm5]           v20 = fadd v10, v11                     ; bin: f3 0f 58 ea
    ; asm: addss %xmm5, %xmm2
    [-,%xmm2]           v21 = fadd v11, v10                     ; bin: f3 0f 58 d5

    ; asm: subss %xmm2, %xmm5
    [-,%xmm5]           v22 = fsub v10, v11                     ; bin: f3 0f 5c ea
    ; asm: subss %xmm5, %xmm2
    [-,%xmm2]           v23 = fsub v11, v10                     ; bin: f3 0f 5c d5

    ; asm: mulss %xmm2, %xmm5
    [-,%xmm5]           v24 = fmul v10, v11                     ; bin: f3 0f 59 ea
    ; asm: mulss %xmm5, %xmm2
    [-,%xmm2]           v25 = fmul v11, v10                     ; bin: f3 0f 59 d5

    ; asm: divss %xmm2, %xmm5
    [-,%xmm5]           v26 = fdiv v10, v11                     ; bin: f3 0f 5e ea
    ; asm: divss %xmm5, %xmm2
    [-,%xmm2]           v27 = fdiv v11, v10                     ; bin: f3 0f 5e d5

    ; Bitwise ops.
    ; We use the *ps SSE instructions for everything because they are smaller.

    ; asm: andps %xmm2, %xmm5
    [-,%xmm5]           v30 = band v10, v11                     ; bin: 0f 54 ea
    ; asm: andps %xmm5, %xmm2
    [-,%xmm2]           v31 = band v11, v10                     ; bin: 0f 54 d5

    ; asm: andnps %xmm2, %xmm5
    [-,%xmm5]           v32 = band_not v10, v11                 ; bin: 0f 55 ea
    ; asm: andnps %xmm5, %xmm2
    [-,%xmm2]           v33 = band_not v11, v10                 ; bin: 0f 55 d5

    ; asm: orps %xmm2, %xmm5
    [-,%xmm5]           v34 = bor v10, v11                      ; bin: 0f 56 ea
    ; asm: orps %xmm5, %xmm2
    [-,%xmm2]           v35 = bor v11, v10                      ; bin: 0f 56 d5

    ; asm: xorps %xmm2, %xmm5
    [-,%xmm5]           v36 = bxor v10, v11                     ; bin: 0f 57 ea
    ; asm: xorps %xmm5, %xmm2
    [-,%xmm2]           v37 = bxor v11, v10                     ; bin: 0f 57 d5

    return
}

function %F64() {
ebb0:
    [-,%rcx]            v0 = iconst.i32 1
    [-,%rsi]            v1 = iconst.i32 2

    ; asm: cvtsi2sd %ecx, %xmm5
    [-,%xmm5]           v10 = fcvt_from_sint.f64 v0             ; bin: f2 0f 2a e9
    ; asm: cvtsi2sd %esi, %xmm2
    [-,%xmm2]           v11 = fcvt_from_sint.f64 v1             ; bin: f2 0f 2a d6

    ; asm: cvtsd2ss %xmm2, %xmm5
    [-,%xmm5]           v12 = fdemote.f32 v11                   ; bin: f2 0f 5a ea
    ; asm: cvtsd2ss %xmm5, %xmm2
    [-,%xmm2]           v13 = fdemote.f32 v10                   ; bin: f2 0f 5a d5

    ; No i64 <-> f64 bitcasts in 32-bit mode.

    ; Binary arithmetic.

    ; asm: addsd %xmm2, %xmm5
    [-,%xmm5]           v20 = fadd v10, v11                     ; bin: f2 0f 58 ea
    ; asm: addsd %xmm5, %xmm2
    [-,%xmm2]           v21 = fadd v11, v10                     ; bin: f2 0f 58 d5

    ; asm: subsd %xmm2, %xmm5
    [-,%xmm5]           v22 = fsub v10, v11                     ; bin: f2 0f 5c ea
    ; asm: subsd %xmm5, %xmm2
    [-,%xmm2]           v23 = fsub v11, v10                     ; bin: f2 0f 5c d5

    ; asm: mulsd %xmm2, %xmm5
    [-,%xmm5]           v24 = fmul v10, v11                     ; bin: f2 0f 59 ea
    ; asm: mulsd %xmm5, %xmm2
    [-,%xmm2]           v25 = fmul v11, v10                     ; bin: f2 0f 59 d5

    ; asm: divsd %xmm2, %xmm5
    [-,%xmm5]           v26 = fdiv v10, v11                     ; bin: f2 0f 5e ea
    ; asm: divsd %xmm5, %xmm2
    [-,%xmm2]           v27 = fdiv v11, v10                     ; bin: f2 0f 5e d5

    ; Bitwise ops.
    ; We use the *ps SSE instructions for everything because they are smaller.

    ; asm: andps %xmm2, %xmm5
    [-,%xmm5]           v30 = band v10, v11                     ; bin: 0f 54 ea
    ; asm: andps %xmm5, %xmm2
    [-,%xmm2]           v31 = band v11, v10                     ; bin: 0f 54 d5

    ; asm: andnps %xmm2, %xmm5
    [-,%xmm5]           v32 = band_not v10, v11                 ; bin: 0f 55 ea
    ; asm: andnps %xmm5, %xmm2
    [-,%xmm2]           v33 = band_not v11, v10                 ; bin: 0f 55 d5

    ; asm: orps %xmm2, %xmm5
    [-,%xmm5]           v34 = bor v10, v11                      ; bin: 0f 56 ea
    ; asm: orps %xmm5, %xmm2
    [-,%xmm2]           v35 = bor v11, v10                      ; bin: 0f 56 d5

    ; asm: xorps %xmm2, %xmm5
    [-,%xmm5]           v36 = bxor v10, v11                     ; bin: 0f 57 ea
    ; asm: xorps %xmm5, %xmm2
    [-,%xmm2]           v37 = bxor v11, v10                     ; bin: 0f 57 d5

    return
}