nuudlman/llvm: llvm/test/CodeGen/X86/cvt16-2.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=-avx512fp16 | FileCheck %s -check-prefix=LIBCALL
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+avx512fp16 | FileCheck %s -check-prefix=FP16

; test1: convert the float argument %src to half precision with
; llvm.convert.to.fp16.f32 and store the resulting i16 through %dest.
; In the -avx512fp16 run the conversion is expected to be a call to
; __truncsfhf2 followed by a 16-bit store; in the +avx512fp16 run it is
; expected to be a vcvtss2sh followed by a vmovsh store.
define void @test1(float %src, ptr %dest) {
; LIBCALL-LABEL: test1:
; LIBCALL:       # %bb.0:
; LIBCALL-NEXT:    pushq %rbx
; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
; LIBCALL-NEXT:    .cfi_offset %rbx, -16
; LIBCALL-NEXT:    movq %rdi, %rbx
; LIBCALL-NEXT:    callq __truncsfhf2@PLT
; LIBCALL-NEXT:    pextrw $0, %xmm0, %eax
; LIBCALL-NEXT:    movw %ax, (%rbx)
; LIBCALL-NEXT:    popq %rbx
; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
; LIBCALL-NEXT:    retq
;
; FP16-LABEL: test1:
; FP16:       # %bb.0:
; FP16-NEXT:    vcvtss2sh %xmm0, %xmm0, %xmm0
; FP16-NEXT:    vmovsh %xmm0, (%rdi)
; FP16-NEXT:    retq
  %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
  store i16 %1, ptr %dest, align 2
  ret void
}

; test2: load an i16 holding a half-precision value from %src and widen it to
; float with llvm.convert.from.fp16.f32.
; In the -avx512fp16 run the value is loaded with pinsrw and the function
; tail-jumps to __extendhfsf2; in the +avx512fp16 run it is loaded with vmovsh
; and converted with vcvtsh2ss.
define float @test2(ptr nocapture %src) {
; LIBCALL-LABEL: test2:
; LIBCALL:       # %bb.0:
; LIBCALL-NEXT:    pinsrw $0, (%rdi), %xmm0
; LIBCALL-NEXT:    jmp __extendhfsf2@PLT # TAILCALL
;
; FP16-LABEL: test2:
; FP16:       # %bb.0:
; FP16-NEXT:    vmovsh (%rdi), %xmm0
; FP16-NEXT:    vcvtsh2ss %xmm0, %xmm0, %xmm0
; FP16-NEXT:    retq
  %1 = load i16, ptr %src, align 2
  %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
  ret float %2
}

; test3: round-trip a float through half precision by chaining
; llvm.convert.to.fp16.f32 and llvm.convert.from.fp16.f32.
; In the -avx512fp16 run this is expected to be a call to __truncsfhf2
; followed by a tail-jump to __extendhfsf2; in the +avx512fp16 run it is
; expected to be a vcvtss2sh / vcvtsh2ss instruction pair.
define float @test3(float %src) nounwind uwtable readnone {
; LIBCALL-LABEL: test3:
; LIBCALL:       # %bb.0:
; LIBCALL-NEXT:    pushq %rax
; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
; LIBCALL-NEXT:    callq __truncsfhf2@PLT
; LIBCALL-NEXT:    popq %rax
; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
; LIBCALL-NEXT:    jmp __extendhfsf2@PLT # TAILCALL
;
; FP16-LABEL: test3:
; FP16:       # %bb.0:
; FP16-NEXT:    vcvtss2sh %xmm0, %xmm0, %xmm0
; FP16-NEXT:    vcvtsh2ss %xmm0, %xmm0, %xmm0
; FP16-NEXT:    retq
  %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
  %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
  ret float %2
}

; test4: load an i16 holding a half-precision value from %src and widen it to
; double with llvm.convert.from.fp16.f64.
; In the +avx512fp16 run this is expected to be a vmovsh load followed by a
; single vcvtsh2sd.
; FIXME: Should it be __extendhfdf2? In the -avx512fp16 run the checks below
; show the extension going through __extendhfsf2 (half -> float) followed by
; cvtss2sd (float -> double) rather than one half -> double libcall.
define double @test4(ptr nocapture %src) {
; LIBCALL-LABEL: test4:
; LIBCALL:       # %bb.0:
; LIBCALL-NEXT:    pushq %rax
; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
; LIBCALL-NEXT:    pinsrw $0, (%rdi), %xmm0
; LIBCALL-NEXT:    callq __extendhfsf2@PLT
; LIBCALL-NEXT:    cvtss2sd %xmm0, %xmm0
; LIBCALL-NEXT:    popq %rax
; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
; LIBCALL-NEXT:    retq
;
; FP16-LABEL: test4:
; FP16:       # %bb.0:
; FP16-NEXT:    vmovsh (%rdi), %xmm0
; FP16-NEXT:    vcvtsh2sd %xmm0, %xmm0, %xmm0
; FP16-NEXT:    retq
  %1 = load i16, ptr %src, align 2
  %2 = tail call double @llvm.convert.from.fp16.f64(i16 %1)
  ret double %2
}

; test5: narrow the double argument %src to half precision with
; llvm.convert.to.fp16.f64 and return the bits as an i16.
; In the -avx512fp16 run this is expected to be a call to __truncdfhf2 with
; the result extracted by pextrw; in the +avx512fp16 run it is expected to be
; a vcvtsd2sh with the result moved out by vmovw.
define i16 @test5(double %src) {
; LIBCALL-LABEL: test5:
; LIBCALL:       # %bb.0:
; LIBCALL-NEXT:    pushq %rax
; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
; LIBCALL-NEXT:    callq __truncdfhf2@PLT
; LIBCALL-NEXT:    pextrw $0, %xmm0, %eax
; LIBCALL-NEXT:    # kill: def $ax killed $ax killed $eax
; LIBCALL-NEXT:    popq %rcx
; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
; LIBCALL-NEXT:    retq
;
; FP16-LABEL: test5:
; FP16:       # %bb.0:
; FP16-NEXT:    vcvtsd2sh %xmm0, %xmm0, %xmm0
; FP16-NEXT:    vmovw %xmm0, %eax
; FP16-NEXT:    # kill: def $ax killed $ax killed $eax
; FP16-NEXT:    retq
  %val = tail call i16 @llvm.convert.to.fp16.f64(double %src)
  ret i16 %val
}

; test6: load an i16 holding a half-precision value from %src and widen it to
; x86_fp80 with llvm.convert.from.fp16.f80.
; Both runs are expected to call __extendhfxf2; they differ only in how the
; half value is loaded (pinsrw in the -avx512fp16 run, vmovsh in the
; +avx512fp16 run).
; FIXME: Should it be __extendhfxf2?
; NOTE(review): the checks below already show __extendhfxf2 being called in
; both runs, so this FIXME may be stale -- confirm before removing it.
define x86_fp80 @test6(ptr nocapture %src) {
; LIBCALL-LABEL: test6:
; LIBCALL:       # %bb.0:
; LIBCALL-NEXT:    pushq %rax
; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
; LIBCALL-NEXT:    pinsrw $0, (%rdi), %xmm0
; LIBCALL-NEXT:    callq __extendhfxf2@PLT
; LIBCALL-NEXT:    popq %rax
; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
; LIBCALL-NEXT:    retq
;
; FP16-LABEL: test6:
; FP16:       # %bb.0:
; FP16-NEXT:    pushq %rax
; FP16-NEXT:    .cfi_def_cfa_offset 16
; FP16-NEXT:    vmovsh (%rdi), %xmm0
; FP16-NEXT:    callq __extendhfxf2@PLT
; FP16-NEXT:    popq %rax
; FP16-NEXT:    .cfi_def_cfa_offset 8
; FP16-NEXT:    retq
  %1 = load i16, ptr %src, align 2
  %2 = tail call x86_fp80 @llvm.convert.from.fp16.f80(i16 %1)
  ret x86_fp80 %2
}

; test7: narrow the x86_fp80 argument %src to half precision with
; llvm.convert.to.fp16.f80 and return the bits as an i16.
; Both runs are expected to copy the argument to the outgoing stack slot with
; fldt/fstpt and call __truncxfhf2; they differ only in how the result is
; moved to %eax (pextrw in the -avx512fp16 run, vmovw in the +avx512fp16 run).
define i16 @test7(x86_fp80 %src) {
; LIBCALL-LABEL: test7:
; LIBCALL:       # %bb.0:
; LIBCALL-NEXT:    subq $24, %rsp
; LIBCALL-NEXT:    .cfi_def_cfa_offset 32
; LIBCALL-NEXT:    fldt {{[0-9]+}}(%rsp)
; LIBCALL-NEXT:    fstpt (%rsp)
; LIBCALL-NEXT:    callq __truncxfhf2@PLT
; LIBCALL-NEXT:    pextrw $0, %xmm0, %eax
; LIBCALL-NEXT:    # kill: def $ax killed $ax killed $eax
; LIBCALL-NEXT:    addq $24, %rsp
; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
; LIBCALL-NEXT:    retq
;
; FP16-LABEL: test7:
; FP16:       # %bb.0:
; FP16-NEXT:    subq $24, %rsp
; FP16-NEXT:    .cfi_def_cfa_offset 32
; FP16-NEXT:    fldt {{[0-9]+}}(%rsp)
; FP16-NEXT:    fstpt (%rsp)
; FP16-NEXT:    callq __truncxfhf2@PLT
; FP16-NEXT:    vmovw %xmm0, %eax
; FP16-NEXT:    # kill: def $ax killed $ax killed $eax
; FP16-NEXT:    addq $24, %rsp
; FP16-NEXT:    .cfi_def_cfa_offset 8
; FP16-NEXT:    retq
  %val = tail call i16 @llvm.convert.to.fp16.f80(x86_fp80 %src)
  ret i16 %val
}

; Declarations of the half-precision conversion intrinsics exercised by the
; tests in this file: one from.fp16 / to.fp16 pair each for float (f32),
; double (f64) and x86_fp80 (f80). The half value is passed and returned as
; an i16.
declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
declare double @llvm.convert.from.fp16.f64(i16) nounwind readnone
declare i16 @llvm.convert.to.fp16.f64(double) nounwind readnone
declare x86_fp80 @llvm.convert.from.fp16.f80(i16) nounwind readnone
declare i16 @llvm.convert.to.fp16.f80(x86_fp80) nounwind readnone