; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -mattr=-f16c | FileCheck %s -check-prefix=LIBCALL
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -mattr=+f16c | FileCheck %s -check-prefix=F16C
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -mattr=-f16c,+soft-float | FileCheck %s -check-prefix=SOFTFLOAT
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -mattr=+f16c,+soft-float | FileCheck %s -check-prefix=SOFTFLOAT

; This is a test for float to half float conversions on x86-64.
;
; If the soft-float attribute is set (-mattr=+soft-float), or if there is no
; F16C support, then:
;  1) half float to float conversions are
;     translated into calls to __gnu_h2f_ieee defined
;     by the compiler runtime library;
;  2) float to half float conversions are translated into calls
;     to __gnu_f2h_ieee, which is expected to be defined by the
;     compiler runtime library.
;
; Otherwise (we have F16C support):
;  1) half float to float conversions are translated using
;     vcvtph2ps instructions;
;  2) float to half float conversions are translated using
;     vcvtps2ph instructions.

; test1: float -> half conversion whose 16-bit result is stored through %dest.
; Without F16C, and under soft-float, the expected code calls __gnu_f2h_ieee
; and keeps the destination pointer in %rbx across the call (the pointer
; arrives in %rdi for hard-float and in %rsi for soft-float). With F16C the
; expected code is a vcvtps2ph followed by a vpextrw store.
define void @test1(float %src, i16* %dest) {
; LIBCALL-LABEL: test1:
; LIBCALL: # %bb.0:
; LIBCALL-NEXT: pushq %rbx
; LIBCALL-NEXT: .cfi_def_cfa_offset 16
; LIBCALL-NEXT: .cfi_offset %rbx, -16
; LIBCALL-NEXT: movq %rdi, %rbx
; LIBCALL-NEXT: callq __gnu_f2h_ieee
; LIBCALL-NEXT: movw %ax, (%rbx)
; LIBCALL-NEXT: popq %rbx
; LIBCALL-NEXT: .cfi_def_cfa_offset 8
; LIBCALL-NEXT: retq
;
; F16C-LABEL: test1:
; F16C: # %bb.0:
; F16C-NEXT: vcvtps2ph $4, %xmm0, %xmm0
; F16C-NEXT: vpextrw $0, %xmm0, (%rdi)
; F16C-NEXT: retq
;
; SOFTFLOAT-LABEL: test1:
; SOFTFLOAT: # %bb.0:
; SOFTFLOAT-NEXT: pushq %rbx
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 16
; SOFTFLOAT-NEXT: .cfi_offset %rbx, -16
; SOFTFLOAT-NEXT: movq %rsi, %rbx
; SOFTFLOAT-NEXT: callq __gnu_f2h_ieee
; SOFTFLOAT-NEXT: movw %ax, (%rbx)
; SOFTFLOAT-NEXT: popq %rbx
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 8
; SOFTFLOAT-NEXT: retq
  %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
  store i16 %1, i16* %dest, align 2
  ret void
}

; test2: loads a 16-bit half value from %src and converts it to float.
; Without F16C the expected code zero-extends the loaded value into %edi and
; tail-calls __gnu_h2f_ieee. With F16C it moves the value into %xmm0 and uses
; vcvtph2ps. Under soft-float the expected code is a regular call to
; __gnu_h2f_ieee followed by a return.
define float @test2(i16* nocapture %src) {
; LIBCALL-LABEL: test2:
; LIBCALL: # %bb.0:
; LIBCALL-NEXT: movzwl (%rdi), %edi
; LIBCALL-NEXT: jmp __gnu_h2f_ieee@PLT # TAILCALL
;
; F16C-LABEL: test2:
; F16C: # %bb.0:
; F16C-NEXT: movzwl (%rdi), %eax
; F16C-NEXT: vmovd %eax, %xmm0
; F16C-NEXT: vcvtph2ps %xmm0, %xmm0
; F16C-NEXT: retq
;
; SOFTFLOAT-LABEL: test2:
; SOFTFLOAT: # %bb.0:
; SOFTFLOAT-NEXT: pushq %rax
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 16
; SOFTFLOAT-NEXT: movzwl (%rdi), %edi
; SOFTFLOAT-NEXT: callq __gnu_h2f_ieee
; SOFTFLOAT-NEXT: popq %rcx
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 8
; SOFTFLOAT-NEXT: retq
  %1 = load i16, i16* %src, align 2
  %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
  ret float %2
}

; test3: round trip float -> half -> float on a value passed in a register.
; Without F16C the expected code calls __gnu_f2h_ieee, zero-extends %ax into
; %edi and tail-calls __gnu_h2f_ieee. With F16C it is a vcvtps2ph immediately
; followed by a vcvtph2ps. Under soft-float both conversions are regular
; calls.
define float @test3(float %src) nounwind uwtable readnone {
; LIBCALL-LABEL: test3:
; LIBCALL: # %bb.0:
; LIBCALL-NEXT: pushq %rax
; LIBCALL-NEXT: .cfi_def_cfa_offset 16
; LIBCALL-NEXT: callq __gnu_f2h_ieee
; LIBCALL-NEXT: movzwl %ax, %edi
; LIBCALL-NEXT: popq %rax
; LIBCALL-NEXT: .cfi_def_cfa_offset 8
; LIBCALL-NEXT: jmp __gnu_h2f_ieee@PLT # TAILCALL
;
; F16C-LABEL: test3:
; F16C: # %bb.0:
; F16C-NEXT: vcvtps2ph $4, %xmm0, %xmm0
; F16C-NEXT: vcvtph2ps %xmm0, %xmm0
; F16C-NEXT: retq
;
; SOFTFLOAT-LABEL: test3:
; SOFTFLOAT: # %bb.0:
; SOFTFLOAT-NEXT: pushq %rax
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 16
; SOFTFLOAT-NEXT: callq __gnu_f2h_ieee
; SOFTFLOAT-NEXT: movzwl %ax, %edi
; SOFTFLOAT-NEXT: callq __gnu_h2f_ieee
; SOFTFLOAT-NEXT: popq %rcx
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 8
; SOFTFLOAT-NEXT: retq
  %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
  %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
  ret float %2
}

; test4: loads a 16-bit half value from %src and converts it to double.
; In every configuration the expected code first produces a float and then
; widens it: __gnu_h2f_ieee + cvtss2sd without F16C, vcvtph2ps + vcvtss2sd
; with F16C, and __gnu_h2f_ieee + __extendsfdf2 under soft-float.
define double @test4(i16* nocapture %src) {
; LIBCALL-LABEL: test4:
; LIBCALL: # %bb.0:
; LIBCALL-NEXT: pushq %rax
; LIBCALL-NEXT: .cfi_def_cfa_offset 16
; LIBCALL-NEXT: movzwl (%rdi), %edi
; LIBCALL-NEXT: callq __gnu_h2f_ieee
; LIBCALL-NEXT: cvtss2sd %xmm0, %xmm0
; LIBCALL-NEXT: popq %rax
; LIBCALL-NEXT: .cfi_def_cfa_offset 8
; LIBCALL-NEXT: retq
;
; F16C-LABEL: test4:
; F16C: # %bb.0:
; F16C-NEXT: movzwl (%rdi), %eax
; F16C-NEXT: vmovd %eax, %xmm0
; F16C-NEXT: vcvtph2ps %xmm0, %xmm0
; F16C-NEXT: vcvtss2sd %xmm0, %xmm0, %xmm0
; F16C-NEXT: retq
;
; SOFTFLOAT-LABEL: test4:
; SOFTFLOAT: # %bb.0:
; SOFTFLOAT-NEXT: pushq %rax
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 16
; SOFTFLOAT-NEXT: movzwl (%rdi), %edi
; SOFTFLOAT-NEXT: callq __gnu_h2f_ieee
; SOFTFLOAT-NEXT: movl %eax, %edi
; SOFTFLOAT-NEXT: callq __extendsfdf2
; SOFTFLOAT-NEXT: popq %rcx
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 8
; SOFTFLOAT-NEXT: retq
  %1 = load i16, i16* %src, align 2
  %2 = tail call double @llvm.convert.from.fp16.f64(i16 %1)
  ret double %2
}

; test5: double -> half conversion returned as an i16.
; All three configurations are expected to use the __truncdfhf2 library
; routine: as a tail call both with and without F16C, and as a regular call
; under soft-float. The expected F16C output contains no vcvtps2ph here.
define i16 @test5(double %src) {
; LIBCALL-LABEL: test5:
; LIBCALL: # %bb.0:
; LIBCALL-NEXT: jmp __truncdfhf2@PLT # TAILCALL
;
; F16C-LABEL: test5:
; F16C: # %bb.0:
; F16C-NEXT: jmp __truncdfhf2@PLT # TAILCALL
;
; SOFTFLOAT-LABEL: test5:
; SOFTFLOAT: # %bb.0:
; SOFTFLOAT-NEXT: pushq %rax
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 16
; SOFTFLOAT-NEXT: callq __truncdfhf2
; SOFTFLOAT-NEXT: popq %rcx
; SOFTFLOAT-NEXT: .cfi_def_cfa_offset 8
; SOFTFLOAT-NEXT: retq
  %val = tail call i16 @llvm.convert.to.fp16.f64(double %src)
  ret i16 %val
}

; Half-precision conversion intrinsics called by test1 through test5; the
; i16 operand/result carries the half value.
declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
declare double @llvm.convert.from.fp16.f64(i16) nounwind readnone
declare i16 @llvm.convert.to.fp16.f64(double) nounwind readnone