1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2024-10-23 04:52:54 +02:00
llvm-mirror/test/CodeGen/ARM/misched-fp-basic.ll
Javed Absar 97ef1a63f1 [ARM] Classification Improvements to ARM Sched-Models. NFCI.
This is a series of patches to enable adding of machine sched
models for ARM processors easier and compact. They define new
sched-readwrites for groups of ARM instructions. This has been
missing so far, and as a consequence, machine scheduler models
for individual sub-targets have tended to be larger than they
needed to be. 

The current patch focuses on floating-point instructions.

Reviewers: Diana Picus (rovka), Renato Golin (rengolin)

Differential Revision: https://reviews.llvm.org/D28194

llvm-svn: 292825
2017-01-23 20:20:39 +00:00

70 lines
2.1 KiB
LLVM

; REQUIRES: asserts
; RUN: llc < %s -mtriple=arm-eabi -mcpu=cortex-a9 -enable-misched -verify-misched -debug-only=misched -o - 2>&1 > \
; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_A9
; RUN: llc < %s -mtriple=arm-eabi -mcpu=swift -enable-misched -verify-misched -debug-only=misched -o - 2>&1 > \
; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_SWIFT
; RUN: llc < %s -mtriple=arm-eabi -mcpu=cortex-r52 -enable-misched -verify-misched -debug-only=misched -o - 2>&1 > \
; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_R52
;
; Check the latency of instructions for processors with sched-models
;
; Function Attrs: norecurse nounwind readnone
define i32 @foo(float %a, float %b, float %c, i32 %d) local_unnamed_addr #0 {
entry:
;
; CHECK: ********** MI Scheduling **********
; CHECK_A9: VADDS
; CHECK_SWIFT: VADDfd
; CHECK_R52: VADDS
; CHECK_A9: Latency : 5
; CHECK_SWIFT: Latency : 4
; CHECK_R52: Latency : 6
;
; CHECK_A9: VMULS
; CHECK_SWIFT: VMULfd
; CHECK_R52: VMULS
; CHECK_SWIFT: Latency : 4
; CHECK_A9: Latency : 6
; CHECK_R52: Latency : 6
;
; CHECK: VDIVS
; CHECK_SWIFT: Latency : 17
; CHECK_A9: Latency : 16
; CHECK_R52: Latency : 7
;
; CHECK: VCVTDS
; CHECK_SWIFT: Latency : 4
; CHECK_A9: Latency : 5
; CHECK_R52: Latency : 6
;
; CHECK: VADDD
; CHECK_SWIFT: Latency : 6
; CHECK_A9: Latency : 5
; CHECK_R52: Latency : 6
;
; CHECK: VMULD
; CHECK_SWIFT: Latency : 6
; CHECK_A9: Latency : 7
; CHECK_R52: Latency : 6
;
; CHECK: VDIVD
; CHECK_SWIFT: Latency : 32
; CHECK_A9: Latency : 26
; CHECK_R52: Latency : 17
;
; CHECK: VTOSIZD
; CHECK_SWIFT: Latency : 4
; CHECK_A9: Latency : 5
; CHECK_R52: Latency : 6
;
%add = fadd float %a, %b
%mul = fmul float %add, %add
%div = fdiv float %mul, %b
%conv1 = fpext float %div to double
%add3 = fadd double %conv1, %conv1
%mul4 = fmul double %add3, %add3
%div5 = fdiv double %mul4, %conv1
%conv6 = fptosi double %div5 to i32
ret i32 %conv6
}