llvm/test/CodeGen/X86/cvt16-2.ll - llvm-project - Git at Google

 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
 ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=-avx512fp16 | FileCheck %s -check-prefix=LIBCALL
 ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+avx512fp16 | FileCheck %s -check-prefix=FP16

 ; Narrows a float to half precision with @llvm.convert.to.fp16.f32 and stores
 ; the resulting i16 through %dest.
 ; The LIBCALL checks expect a call to __gnu_f2h_ieee, with %dest held in %rbx
 ; across the call, followed by a 16-bit store of %ax. The FP16 checks expect
 ; vcvtss2sh followed by a vmovsh store straight to (%rdi).
 define void @test1(float %src, i16* %dest) {
 ; LIBCALL-LABEL: test1:
 ; LIBCALL:       # %bb.0:
 ; LIBCALL-NEXT:    pushq %rbx
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
 ; LIBCALL-NEXT:    .cfi_offset %rbx, -16
 ; LIBCALL-NEXT:    movq %rdi, %rbx
 ; LIBCALL-NEXT:    callq __gnu_f2h_ieee@PLT
 ; LIBCALL-NEXT:    movw %ax, (%rbx)
 ; LIBCALL-NEXT:    popq %rbx
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
 ; LIBCALL-NEXT:    retq
 ;
 ; FP16-LABEL: test1:
 ; FP16:       # %bb.0:
 ; FP16-NEXT:    vcvtss2sh %xmm0, %xmm0, %xmm0
 ; FP16-NEXT:    vmovsh %xmm0, (%rdi)
 ; FP16-NEXT:    retq
   ; The intrinsic hands back the converted value as an i16.
   %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
   store i16 %1, i16* %dest, align 2
   ret void
 }

 ; Loads an i16 from %src and widens it to float with
 ; @llvm.convert.from.fp16.f32.
 ; The LIBCALL checks expect a zero-extending 16-bit load into %edi and a tail
 ; jump to __gnu_h2f_ieee. The FP16 checks expect a vmovsh load followed by
 ; vcvtsh2ss.
 define float @test2(i16* nocapture %src) {
 ; LIBCALL-LABEL: test2:
 ; LIBCALL:       # %bb.0:
 ; LIBCALL-NEXT:    movzwl (%rdi), %edi
 ; LIBCALL-NEXT:    jmp __gnu_h2f_ieee@PLT # TAILCALL
 ;
 ; FP16-LABEL: test2:
 ; FP16:       # %bb.0:
 ; FP16-NEXT:    vmovsh (%rdi), %xmm0
 ; FP16-NEXT:    vcvtsh2ss %xmm0, %xmm0, %xmm0
 ; FP16-NEXT:    retq
   ; The loaded i16 is passed to the intrinsic unchanged.
   %1 = load i16, i16* %src, align 2
   %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
   ret float %2
 }

 ; Round-trips a float through half precision: @llvm.convert.to.fp16.f32
 ; followed directly by @llvm.convert.from.fp16.f32.
 ; The LIBCALL checks expect a call to __gnu_f2h_ieee, a zero-extension of %ax
 ; into %edi, and then a tail jump to __gnu_h2f_ieee. The FP16 checks expect
 ; vcvtss2sh immediately followed by vcvtsh2ss, with no libcall.
 define float @test3(float %src) nounwind uwtable readnone {
 ; LIBCALL-LABEL: test3:
 ; LIBCALL:       # %bb.0:
 ; LIBCALL-NEXT:    pushq %rax
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
 ; LIBCALL-NEXT:    callq __gnu_f2h_ieee@PLT
 ; LIBCALL-NEXT:    movzwl %ax, %edi
 ; LIBCALL-NEXT:    popq %rax
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
 ; LIBCALL-NEXT:    jmp __gnu_h2f_ieee@PLT # TAILCALL
 ;
 ; FP16-LABEL: test3:
 ; FP16:       # %bb.0:
 ; FP16-NEXT:    vcvtss2sh %xmm0, %xmm0, %xmm0
 ; FP16-NEXT:    vcvtsh2ss %xmm0, %xmm0, %xmm0
 ; FP16-NEXT:    retq
   ; The i16 produced by the first intrinsic feeds the second one directly.
   %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
   %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
   ret float %2
 }

 ; FIXME: Should it be __extendhfdf2?
 ; Loads an i16 from %src and widens it to double with
 ; @llvm.convert.from.fp16.f64.
 ; The LIBCALL checks expect the extension to go through float: a call to
 ; __gnu_h2f_ieee followed by cvtss2sd. The FP16 checks expect a vmovsh load
 ; followed by a single vcvtsh2sd.
 define double @test4(i16* nocapture %src) {
 ; LIBCALL-LABEL: test4:
 ; LIBCALL:       # %bb.0:
 ; LIBCALL-NEXT:    pushq %rax
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
 ; LIBCALL-NEXT:    movzwl (%rdi), %edi
 ; LIBCALL-NEXT:    callq __gnu_h2f_ieee@PLT
 ; LIBCALL-NEXT:    cvtss2sd %xmm0, %xmm0
 ; LIBCALL-NEXT:    popq %rax
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
 ; LIBCALL-NEXT:    retq
 ;
 ; FP16-LABEL: test4:
 ; FP16:       # %bb.0:
 ; FP16-NEXT:    vmovsh (%rdi), %xmm0
 ; FP16-NEXT:    vcvtsh2sd %xmm0, %xmm0, %xmm0
 ; FP16-NEXT:    retq
   ; The loaded i16 is passed to the f64 variant of the intrinsic.
   %1 = load i16, i16* %src, align 2
   %2 = tail call double @llvm.convert.from.fp16.f64(i16 %1)
   ret double %2
 }

 ; Narrows a double to half precision with @llvm.convert.to.fp16.f64 and
 ; returns the i16 result.
 ; The LIBCALL checks expect the whole function to be a tail jump to
 ; __truncdfhf2. The FP16 checks expect vcvtsd2sh followed by a vmovw of the
 ; result into %eax.
 define i16 @test5(double %src) {
 ; LIBCALL-LABEL: test5:
 ; LIBCALL:       # %bb.0:
 ; LIBCALL-NEXT:    jmp __truncdfhf2@PLT # TAILCALL
 ;
 ; FP16-LABEL: test5:
 ; FP16:       # %bb.0:
 ; FP16-NEXT:    vcvtsd2sh %xmm0, %xmm0, %xmm0
 ; FP16-NEXT:    vmovw %xmm0, %eax
 ; FP16-NEXT:    # kill: def $ax killed $ax killed $eax
 ; FP16-NEXT:    retq
   ; The intrinsic result is returned as-is.
   %val = tail call i16 @llvm.convert.to.fp16.f64(double %src)
   ret i16 %val
 }

 ; FIXME: Should it be __extendhfxf2?
 ; Loads an i16 from %src and widens it to x86_fp80 with
 ; @llvm.convert.from.fp16.f80.
 ; The LIBCALL checks expect a call to __gnu_h2f_ieee, after which the float
 ; result is spilled to the stack and reloaded with flds. The FP16 checks
 ; expect a vmovsh load followed by a call to __extendhfxf2.
 define x86_fp80 @test6(i16* nocapture %src) {
 ; LIBCALL-LABEL: test6:
 ; LIBCALL:       # %bb.0:
 ; LIBCALL-NEXT:    pushq %rax
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 16
 ; LIBCALL-NEXT:    movzwl (%rdi), %edi
 ; LIBCALL-NEXT:    callq __gnu_h2f_ieee@PLT
 ; LIBCALL-NEXT:    movss %xmm0, {{[0-9]+}}(%rsp)
 ; LIBCALL-NEXT:    flds {{[0-9]+}}(%rsp)
 ; LIBCALL-NEXT:    popq %rax
 ; LIBCALL-NEXT:    .cfi_def_cfa_offset 8
 ; LIBCALL-NEXT:    retq
 ;
 ; FP16-LABEL: test6:
 ; FP16:       # %bb.0:
 ; FP16-NEXT:    pushq %rax
 ; FP16-NEXT:    .cfi_def_cfa_offset 16
 ; FP16-NEXT:    vmovsh (%rdi), %xmm0
 ; FP16-NEXT:    callq __extendhfxf2@PLT
 ; FP16-NEXT:    popq %rax
 ; FP16-NEXT:    .cfi_def_cfa_offset 8
 ; FP16-NEXT:    retq
   ; The loaded i16 is passed to the f80 variant of the intrinsic.
   %1 = load i16, i16* %src, align 2
   %2 = tail call x86_fp80 @llvm.convert.from.fp16.f80(i16 %1)
   ret x86_fp80 %2
 }

 ; Narrows an x86_fp80 to half precision with @llvm.convert.to.fp16.f80 and
 ; returns the i16 result.
 ; The LIBCALL checks expect the whole function to be a tail jump to
 ; __truncxfhf2. The FP16 checks expect the x87 argument to be reloaded and
 ; stored at (%rsp) with fldt/fstpt, then a call to __truncxfhf2, then a vmovw
 ; of the result into %eax.
 define i16 @test7(x86_fp80 %src) {
 ; LIBCALL-LABEL: test7:
 ; LIBCALL:       # %bb.0:
 ; LIBCALL-NEXT:    jmp __truncxfhf2@PLT # TAILCALL
 ;
 ; FP16-LABEL: test7:
 ; FP16:       # %bb.0:
 ; FP16-NEXT:    subq $24, %rsp
 ; FP16-NEXT:    .cfi_def_cfa_offset 32
 ; FP16-NEXT:    fldt {{[0-9]+}}(%rsp)
 ; FP16-NEXT:    fstpt (%rsp)
 ; FP16-NEXT:    callq __truncxfhf2@PLT
 ; FP16-NEXT:    vmovw %xmm0, %eax
 ; FP16-NEXT:    # kill: def $ax killed $ax killed $eax
 ; FP16-NEXT:    addq $24, %rsp
 ; FP16-NEXT:    .cfi_def_cfa_offset 8
 ; FP16-NEXT:    retq
   ; The intrinsic result is returned as-is.
   %val = tail call i16 @llvm.convert.to.fp16.f80(x86_fp80 %src)
   ret i16 %val
 }

 ; Declarations of the half-conversion intrinsics called by the tests in this
 ; file. There is one from.fp16 / to.fp16 pair for each of float, double and
 ; x86_fp80; the half side of every pair is typed i16.
 declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
 declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
 declare double @llvm.convert.from.fp16.f64(i16) nounwind readnone
 declare i16 @llvm.convert.to.fp16.f64(double) nounwind readnone
 declare x86_fp80 @llvm.convert.from.fp16.f80(i16) nounwind readnone
 declare i16 @llvm.convert.to.fp16.f80(x86_fp80) nounwind readnone
	; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
	; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=-avx512fp16 | FileCheck %s -check-prefix=LIBCALL
	; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+avx512fp16 | FileCheck %s -check-prefix=FP16

	; Narrows a float to half precision with @llvm.convert.to.fp16.f32 and stores
	; the resulting i16 through %dest.
	; The LIBCALL checks expect a call to __gnu_f2h_ieee, with %dest held in %rbx
	; across the call, followed by a 16-bit store of %ax. The FP16 checks expect
	; vcvtss2sh followed by a vmovsh store straight to (%rdi).
	define void @test1(float %src, i16* %dest) {
	; LIBCALL-LABEL: test1:
	; LIBCALL: # %bb.0:
	; LIBCALL-NEXT: pushq %rbx
	; LIBCALL-NEXT: .cfi_def_cfa_offset 16
	; LIBCALL-NEXT: .cfi_offset %rbx, -16
	; LIBCALL-NEXT: movq %rdi, %rbx
	; LIBCALL-NEXT: callq __gnu_f2h_ieee@PLT
	; LIBCALL-NEXT: movw %ax, (%rbx)
	; LIBCALL-NEXT: popq %rbx
	; LIBCALL-NEXT: .cfi_def_cfa_offset 8
	; LIBCALL-NEXT: retq
	;
	; FP16-LABEL: test1:
	; FP16: # %bb.0:
	; FP16-NEXT: vcvtss2sh %xmm0, %xmm0, %xmm0
	; FP16-NEXT: vmovsh %xmm0, (%rdi)
	; FP16-NEXT: retq
	; The intrinsic hands back the converted value as an i16.
	%1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
	store i16 %1, i16* %dest, align 2
	ret void
	}

	; Loads an i16 from %src and widens it to float with
	; @llvm.convert.from.fp16.f32.
	; The LIBCALL checks expect a zero-extending 16-bit load into %edi and a tail
	; jump to __gnu_h2f_ieee. The FP16 checks expect a vmovsh load followed by
	; vcvtsh2ss.
	define float @test2(i16* nocapture %src) {
	; LIBCALL-LABEL: test2:
	; LIBCALL: # %bb.0:
	; LIBCALL-NEXT: movzwl (%rdi), %edi
	; LIBCALL-NEXT: jmp __gnu_h2f_ieee@PLT # TAILCALL
	;
	; FP16-LABEL: test2:
	; FP16: # %bb.0:
	; FP16-NEXT: vmovsh (%rdi), %xmm0
	; FP16-NEXT: vcvtsh2ss %xmm0, %xmm0, %xmm0
	; FP16-NEXT: retq
	; The loaded i16 is passed to the intrinsic unchanged.
	%1 = load i16, i16* %src, align 2
	%2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
	ret float %2
	}

	; Round-trips a float through half precision: @llvm.convert.to.fp16.f32
	; followed directly by @llvm.convert.from.fp16.f32.
	; The LIBCALL checks expect a call to __gnu_f2h_ieee, a zero-extension of %ax
	; into %edi, and then a tail jump to __gnu_h2f_ieee. The FP16 checks expect
	; vcvtss2sh immediately followed by vcvtsh2ss, with no libcall.
	define float @test3(float %src) nounwind uwtable readnone {
	; LIBCALL-LABEL: test3:
	; LIBCALL: # %bb.0:
	; LIBCALL-NEXT: pushq %rax
	; LIBCALL-NEXT: .cfi_def_cfa_offset 16
	; LIBCALL-NEXT: callq __gnu_f2h_ieee@PLT
	; LIBCALL-NEXT: movzwl %ax, %edi
	; LIBCALL-NEXT: popq %rax
	; LIBCALL-NEXT: .cfi_def_cfa_offset 8
	; LIBCALL-NEXT: jmp __gnu_h2f_ieee@PLT # TAILCALL
	;
	; FP16-LABEL: test3:
	; FP16: # %bb.0:
	; FP16-NEXT: vcvtss2sh %xmm0, %xmm0, %xmm0
	; FP16-NEXT: vcvtsh2ss %xmm0, %xmm0, %xmm0
	; FP16-NEXT: retq
	; The i16 produced by the first intrinsic feeds the second one directly.
	%1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
	%2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
	ret float %2
	}

	; FIXME: Should it be __extendhfdf2?
	; Loads an i16 from %src and widens it to double with
	; @llvm.convert.from.fp16.f64.
	; The LIBCALL checks expect the extension to go through float: a call to
	; __gnu_h2f_ieee followed by cvtss2sd. The FP16 checks expect a vmovsh load
	; followed by a single vcvtsh2sd.
	define double @test4(i16* nocapture %src) {
	; LIBCALL-LABEL: test4:
	; LIBCALL: # %bb.0:
	; LIBCALL-NEXT: pushq %rax
	; LIBCALL-NEXT: .cfi_def_cfa_offset 16
	; LIBCALL-NEXT: movzwl (%rdi), %edi
	; LIBCALL-NEXT: callq __gnu_h2f_ieee@PLT
	; LIBCALL-NEXT: cvtss2sd %xmm0, %xmm0
	; LIBCALL-NEXT: popq %rax
	; LIBCALL-NEXT: .cfi_def_cfa_offset 8
	; LIBCALL-NEXT: retq
	;
	; FP16-LABEL: test4:
	; FP16: # %bb.0:
	; FP16-NEXT: vmovsh (%rdi), %xmm0
	; FP16-NEXT: vcvtsh2sd %xmm0, %xmm0, %xmm0
	; FP16-NEXT: retq
	; The loaded i16 is passed to the f64 variant of the intrinsic.
	%1 = load i16, i16* %src, align 2
	%2 = tail call double @llvm.convert.from.fp16.f64(i16 %1)
	ret double %2
	}

	; Narrows a double to half precision with @llvm.convert.to.fp16.f64 and
	; returns the i16 result.
	; The LIBCALL checks expect the whole function to be a tail jump to
	; __truncdfhf2. The FP16 checks expect vcvtsd2sh followed by a vmovw of the
	; result into %eax.
	define i16 @test5(double %src) {
	; LIBCALL-LABEL: test5:
	; LIBCALL: # %bb.0:
	; LIBCALL-NEXT: jmp __truncdfhf2@PLT # TAILCALL
	;
	; FP16-LABEL: test5:
	; FP16: # %bb.0:
	; FP16-NEXT: vcvtsd2sh %xmm0, %xmm0, %xmm0
	; FP16-NEXT: vmovw %xmm0, %eax
	; FP16-NEXT: # kill: def $ax killed $ax killed $eax
	; FP16-NEXT: retq
	; The intrinsic result is returned as-is.
	%val = tail call i16 @llvm.convert.to.fp16.f64(double %src)
	ret i16 %val
	}

	; FIXME: Should it be __extendhfxf2?
	; Loads an i16 from %src and widens it to x86_fp80 with
	; @llvm.convert.from.fp16.f80.
	; The LIBCALL checks expect a call to __gnu_h2f_ieee, after which the float
	; result is spilled to the stack and reloaded with flds. The FP16 checks
	; expect a vmovsh load followed by a call to __extendhfxf2.
	define x86_fp80 @test6(i16* nocapture %src) {
	; LIBCALL-LABEL: test6:
	; LIBCALL: # %bb.0:
	; LIBCALL-NEXT: pushq %rax
	; LIBCALL-NEXT: .cfi_def_cfa_offset 16
	; LIBCALL-NEXT: movzwl (%rdi), %edi
	; LIBCALL-NEXT: callq __gnu_h2f_ieee@PLT
	; LIBCALL-NEXT: movss %xmm0, {{[0-9]+}}(%rsp)
	; LIBCALL-NEXT: flds {{[0-9]+}}(%rsp)
	; LIBCALL-NEXT: popq %rax
	; LIBCALL-NEXT: .cfi_def_cfa_offset 8
	; LIBCALL-NEXT: retq
	;
	; FP16-LABEL: test6:
	; FP16: # %bb.0:
	; FP16-NEXT: pushq %rax
	; FP16-NEXT: .cfi_def_cfa_offset 16
	; FP16-NEXT: vmovsh (%rdi), %xmm0
	; FP16-NEXT: callq __extendhfxf2@PLT
	; FP16-NEXT: popq %rax
	; FP16-NEXT: .cfi_def_cfa_offset 8
	; FP16-NEXT: retq
	; The loaded i16 is passed to the f80 variant of the intrinsic.
	%1 = load i16, i16* %src, align 2
	%2 = tail call x86_fp80 @llvm.convert.from.fp16.f80(i16 %1)
	ret x86_fp80 %2
	}

	; Narrows an x86_fp80 to half precision with @llvm.convert.to.fp16.f80 and
	; returns the i16 result.
	; The LIBCALL checks expect the whole function to be a tail jump to
	; __truncxfhf2. The FP16 checks expect the x87 argument to be reloaded and
	; stored at (%rsp) with fldt/fstpt, then a call to __truncxfhf2, then a vmovw
	; of the result into %eax.
	define i16 @test7(x86_fp80 %src) {
	; LIBCALL-LABEL: test7:
	; LIBCALL: # %bb.0:
	; LIBCALL-NEXT: jmp __truncxfhf2@PLT # TAILCALL
	;
	; FP16-LABEL: test7:
	; FP16: # %bb.0:
	; FP16-NEXT: subq $24, %rsp
	; FP16-NEXT: .cfi_def_cfa_offset 32
	; FP16-NEXT: fldt {{[0-9]+}}(%rsp)
	; FP16-NEXT: fstpt (%rsp)
	; FP16-NEXT: callq __truncxfhf2@PLT
	; FP16-NEXT: vmovw %xmm0, %eax
	; FP16-NEXT: # kill: def $ax killed $ax killed $eax
	; FP16-NEXT: addq $24, %rsp
	; FP16-NEXT: .cfi_def_cfa_offset 8
	; FP16-NEXT: retq
	; The intrinsic result is returned as-is.
	%val = tail call i16 @llvm.convert.to.fp16.f80(x86_fp80 %src)
	ret i16 %val
	}

	; Declarations of the half-conversion intrinsics called by the tests in this
	; file. There is one from.fp16 / to.fp16 pair for each of float, double and
	; x86_fp80; the half side of every pair is typed i16.
	declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
	declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
	declare double @llvm.convert.from.fp16.f64(i16) nounwind readnone
	declare i16 @llvm.convert.to.fp16.f64(double) nounwind readnone
	declare x86_fp80 @llvm.convert.from.fp16.f80(i16) nounwind readnone
	declare i16 @llvm.convert.to.fp16.f80(x86_fp80) nounwind readnone