; llvm-for-llvmta/test/CodeGen/ARM/misched-fp-basic.ll

; 70 lines
; 2.1 KiB
; LLVM

; REQUIRES: asserts
; RUN: llc < %s -mtriple=arm-eabi -mcpu=cortex-a9 -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > \
; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_A9
; RUN: llc < %s -mtriple=arm-eabi -mcpu=swift -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > \
; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_SWIFT
; RUN: llc < %s -mtriple=arm-eabi -mcpu=cortex-r52 -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > \
; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_R52
;
; Check the instruction latencies that the machine scheduler reports in its
; debug output for processors that have scheduling models.
;
; Function Attrs: norecurse nounwind readnone
define i32 @foo(float %a, float %b, float %c, i32 %d) local_unnamed_addr #0 {
; Single-block function forming one dependency chain of floating-point
; operations: single-precision add, multiply and divide, a widening to double,
; double-precision add, multiply and divide, and a final conversion to i32.
; The patterns below look for each expected machine instruction in the
; scheduler's debug output and pin the latency reported after it on each CPU.
;
; Every llc invocation in this file enables the common prefix plus exactly one
; per-CPU prefix, so only the relative order of lines sharing an active prefix
; matters; the per-CPU lines inside one group are not ordered against each
; other.
;
; %c and %d are never read by the body.
; NOTE(review): attribute group #0 is not defined in the part of the file
; visible here - confirm it exists, or drop the reference.
entry:
;
; Scheduler banner, then the single-precision add (presumably from %add).
; Swift is expected to select a different opcode than A9 and R52 here.
; CHECK: ********** MI Scheduling **********
; CHECK_A9: VADDS
; CHECK_SWIFT: VADDfd
; CHECK_R52: VADDS
; CHECK_A9: Latency : 5
; CHECK_SWIFT: Latency : 4
; CHECK_R52: Latency : 6
;
; Single-precision multiply (presumably from %mul); again a Swift-specific
; opcode is expected.
; CHECK_A9: VMULS
; CHECK_SWIFT: VMULfd
; CHECK_R52: VMULS
; CHECK_SWIFT: Latency : 4
; CHECK_A9: Latency : 6
; CHECK_R52: Latency : 6
;
; Single-precision divide (presumably from %div); same opcode on all three CPUs.
; CHECK: VDIVS
; CHECK_SWIFT: Latency : 17
; CHECK_A9: Latency : 16
; CHECK_R52: Latency : 7
;
; Float-to-double conversion (presumably from %conv1).
; CHECK: VCVTDS
; CHECK_SWIFT: Latency : 4
; CHECK_A9: Latency : 5
; CHECK_R52: Latency : 6
;
; Double-precision add (presumably from %add3).
; CHECK: VADDD
; CHECK_SWIFT: Latency : 6
; CHECK_A9: Latency : 5
; CHECK_R52: Latency : 6
;
; Double-precision multiply (presumably from %mul4).
; CHECK: VMULD
; CHECK_SWIFT: Latency : 6
; CHECK_A9: Latency : 7
; CHECK_R52: Latency : 6
;
; Double-precision divide (presumably from %div5).
; CHECK: VDIVD
; CHECK_SWIFT: Latency : 32
; CHECK_A9: Latency : 26
; CHECK_R52: Latency : 17
;
; Double-to-signed-integer conversion (presumably from %conv6).
; CHECK: VTOSIZD
; CHECK_SWIFT: Latency : 4
; CHECK_A9: Latency : 5
; CHECK_R52: Latency : 6
;
; Single-precision stage: each result is an operand of the next instruction.
%add = fadd float %a, %b
%mul = fmul float %add, %add
%div = fdiv float %mul, %b
; Widen the single-precision quotient; %conv1 is reused below as the divisor.
%conv1 = fpext float %div to double
; Double-precision stage, mirroring the add / multiply / divide sequence above.
%add3 = fadd double %conv1, %conv1
%mul4 = fmul double %add3, %add3
%div5 = fdiv double %mul4, %conv1
; Convert the double-precision quotient to a signed 32-bit integer and return it.
%conv6 = fptosi double %div5 to i32
ret i32 %conv6
}