summaryrefslogtreecommitdiffstats
path: root/llvm/test/CodeGen
diff options
context:
space:
mode:
author Javed Absar <javed.absar@arm.com> 2017-01-23 20:20:39 +0000
committer Javed Absar <javed.absar@arm.com> 2017-01-23 20:20:39 +0000
commit 00cce417524d3ebd19c68fbb338b8042dc76bf73 (patch)
tree a70781d38ef7c9824a323e695addd68982570e5c /llvm/test/CodeGen
parent 5b54a42c0f1178dbb367866f92cd4efe88710bd6 (diff)
download bcm5719-llvm-00cce417524d3ebd19c68fbb338b8042dc76bf73.tar.gz
bcm5719-llvm-00cce417524d3ebd19c68fbb338b8042dc76bf73.zip
[ARM] Classification Improvements to ARM Sched-Models. NFCI.
This is part of a series of patches that make adding machine sched models for ARM processors easier and more compact. The patches define new sched-readwrites for groups of ARM instructions. Such groupings have been missing so far, and as a consequence, machine scheduler models for individual sub-targets have tended to be larger than they needed to be. The current patch focuses on floating-point instructions. Reviewers: Diana Picus (rovka), Renato Golin (rengolin) Differential Revision: https://reviews.llvm.org/D28194 llvm-svn: 292825
Diffstat (limited to 'llvm/test/CodeGen')
-rw-r--r-- llvm/test/CodeGen/ARM/misched-fp-basic.ll 69
1 files changed, 69 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/ARM/misched-fp-basic.ll b/llvm/test/CodeGen/ARM/misched-fp-basic.ll
new file mode 100644
index 00000000000..27ad2cec34f
--- /dev/null
+++ b/llvm/test/CodeGen/ARM/misched-fp-basic.ll
@@ -0,0 +1,69 @@
+; REQUIRES: asserts
+; RUN: llc < %s -mtriple=arm-eabi -mcpu=cortex-a9 -enable-misched -verify-misched -debug-only=misched -o - 2>&1 > \
+; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_A9
+; RUN: llc < %s -mtriple=arm-eabi -mcpu=swift -enable-misched -verify-misched -debug-only=misched -o - 2>&1 > \
+; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_SWIFT
+; RUN: llc < %s -mtriple=arm-eabi -mcpu=cortex-r52 -enable-misched -verify-misched -debug-only=misched -o - 2>&1 > \
+; RUN: /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK_R52
+;
+; Check the latency of instructions for processors with sched-models
+;
+; Function Attrs: norecurse nounwind readnone
+define i32 @foo(float %a, float %b, float %c, i32 %d) local_unnamed_addr #0 {
+entry:
+; Each group matches an opcode name in the misched debug output, then a per-CPU latency; the first group is for %add (fadd float).
+; CHECK: ********** MI Scheduling **********
+; CHECK_A9: VADDS
+; CHECK_SWIFT: VADDfd
+; CHECK_R52: VADDS
+; CHECK_A9: Latency : 5
+; CHECK_SWIFT: Latency : 4
+; CHECK_R52: Latency : 6
+; Expectations for %mul (fmul float); the opcode name differs per CPU as listed.
+; CHECK_A9: VMULS
+; CHECK_SWIFT: VMULfd
+; CHECK_R52: VMULS
+; CHECK_SWIFT: Latency : 4
+; CHECK_A9: Latency : 6
+; CHECK_R52: Latency : 6
+; Expectations for %div (fdiv float); the same opcode name is expected on all three CPUs.
+; CHECK: VDIVS
+; CHECK_SWIFT: Latency : 17
+; CHECK_A9: Latency : 16
+; CHECK_R52: Latency : 7
+; Expectations for %conv1 (fpext float to double).
+; CHECK: VCVTDS
+; CHECK_SWIFT: Latency : 4
+; CHECK_A9: Latency : 5
+; CHECK_R52: Latency : 6
+; Expectations for %add3 (fadd double).
+; CHECK: VADDD
+; CHECK_SWIFT: Latency : 6
+; CHECK_A9: Latency : 5
+; CHECK_R52: Latency : 6
+; Expectations for %mul4 (fmul double).
+; CHECK: VMULD
+; CHECK_SWIFT: Latency : 6
+; CHECK_A9: Latency : 7
+; CHECK_R52: Latency : 6
+; Expectations for %div5 (fdiv double).
+; CHECK: VDIVD
+; CHECK_SWIFT: Latency : 32
+; CHECK_A9: Latency : 26
+; CHECK_R52: Latency : 17
+; Expectations for %conv6 (fptosi double to i32).
+; CHECK: VTOSIZD
+; CHECK_SWIFT: Latency : 4
+; CHECK_A9: Latency : 5
+; CHECK_R52: Latency : 6
+; IR under test: a dependent chain of float ops, an extension to double, the same ops on double, then a conversion to i32. %c and %d are unused.
+ %add = fadd float %a, %b
+ %mul = fmul float %add, %add
+ %div = fdiv float %mul, %b
+ %conv1 = fpext float %div to double
+ %add3 = fadd double %conv1, %conv1
+ %mul4 = fmul double %add3, %add3
+ %div5 = fdiv double %mul4, %conv1
+ %conv6 = fptosi double %div5 to i32
+ ret i32 %conv6
+}
OpenPOWER on IntegriCloud