summaryrefslogtreecommitdiffstats
path: root/llvm/test/CodeGen/SystemZ/fp-sub-02.ll
diff options
context:
space:
mode:
author Richard Sandiford <rsandifo@linux.vnet.ibm.com> 2013-07-03 10:10:02 +0000
committer Richard Sandiford <rsandifo@linux.vnet.ibm.com> 2013-07-03 10:10:02 +0000
commit ed1fab6b5bfb54d63102319a761011e985081cb4 (patch)
tree 6f875f92916f0dc214d1f28035000331faccbac7 /llvm/test/CodeGen/SystemZ/fp-sub-02.ll
parent d36cbaa4231e51a42d761d298ff20aaa6e88d014 (diff)
download bcm5719-llvm-ed1fab6b5bfb54d63102319a761011e985081cb4.tar.gz
bcm5719-llvm-ed1fab6b5bfb54d63102319a761011e985081cb4.zip
[SystemZ] Fold more spills
Add a mapping from register-based <INSN>R instructions to the corresponding memory-based <INSN>. Use it to cut down on the number of spill loads.

Some instructions extend their operands from smaller fields, so this required a new TSFlags field to say how big the unextended operand is.

This optimisation doesn't trigger for C(G)R and CL(G)R because in practice we always combine those instructions with a branch. Adding a test for every other case probably seems excessive, but it did catch a missed optimisation for DSGF (fixed in r185435).

llvm-svn: 185529
Diffstat (limited to 'llvm/test/CodeGen/SystemZ/fp-sub-02.ll')
-rw-r--r-- llvm/test/CodeGen/SystemZ/fp-sub-02.ll 48
1 files changed, 48 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/SystemZ/fp-sub-02.ll b/llvm/test/CodeGen/SystemZ/fp-sub-02.ll
index bf9848c2fd5..b6409fcd6ee 100644
--- a/llvm/test/CodeGen/SystemZ/fp-sub-02.ll
+++ b/llvm/test/CodeGen/SystemZ/fp-sub-02.ll
@@ -2,6 +2,8 @@
;
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
+declare double @foo()
+
; Check register subtraction.
define double @f1(double %f1, double %f2) {
; CHECK: f1:
@@ -69,3 +71,49 @@ define double @f6(double %f1, double *%base, i64 %index) {
%res = fsub double %f1, %f2
ret double %res
}
+
+; Check that subtractions of spilled values can use SDB rather than SDBR.
+define double @f7(double *%ptr0) {
+; CHECK: f7:
+; CHECK: brasl %r14, foo@PLT
+; CHECK: sdb %f0, 16{{[04]}}(%r15)
+; CHECK: br %r14
+ %ptr1 = getelementptr double *%ptr0, i64 2
+ %ptr2 = getelementptr double *%ptr0, i64 4
+ %ptr3 = getelementptr double *%ptr0, i64 6
+ %ptr4 = getelementptr double *%ptr0, i64 8
+ %ptr5 = getelementptr double *%ptr0, i64 10
+ %ptr6 = getelementptr double *%ptr0, i64 12
+ %ptr7 = getelementptr double *%ptr0, i64 14
+ %ptr8 = getelementptr double *%ptr0, i64 16
+ %ptr9 = getelementptr double *%ptr0, i64 18
+ %ptr10 = getelementptr double *%ptr0, i64 20
+; Load eleven doubles: %ptr0 itself plus the even element offsets 2..20 computed above.
+ %val0 = load double *%ptr0
+ %val1 = load double *%ptr1
+ %val2 = load double *%ptr2
+ %val3 = load double *%ptr3
+ %val4 = load double *%ptr4
+ %val5 = load double *%ptr5
+ %val6 = load double *%ptr6
+ %val7 = load double *%ptr7
+ %val8 = load double *%ptr8
+ %val9 = load double *%ptr9
+ %val10 = load double *%ptr10
+; Every loaded value is first used after this call, so all eleven are live across it (presumably more than fit in call-saved FPRs, hence the spill -- TODO confirm against the SystemZ ABI).
+ %ret = call double @foo()
+; Subtract the loaded values one at a time from @foo's result; each fsub feeds the next. The expected sdb takes its operand from displacement 160 or 164 off %r15.
+ %sub0 = fsub double %ret, %val0
+ %sub1 = fsub double %sub0, %val1
+ %sub2 = fsub double %sub1, %val2
+ %sub3 = fsub double %sub2, %val3
+ %sub4 = fsub double %sub3, %val4
+ %sub5 = fsub double %sub4, %val5
+ %sub6 = fsub double %sub5, %val6
+ %sub7 = fsub double %sub6, %val7
+ %sub8 = fsub double %sub7, %val8
+ %sub9 = fsub double %sub8, %val9
+ %sub10 = fsub double %sub9, %val10
+
+ ret double %sub10
+}
OpenPOWER on IntegriCloud