diff options
author | Richard Sandiford <rsandifo@linux.vnet.ibm.com> | 2013-07-03 10:10:02 +0000 |
---|---|---|
committer | Richard Sandiford <rsandifo@linux.vnet.ibm.com> | 2013-07-03 10:10:02 +0000 |
commit | ed1fab6b5bfb54d63102319a761011e985081cb4 (patch) | |
tree | 6f875f92916f0dc214d1f28035000331faccbac7 /llvm/test/CodeGen/SystemZ/fp-sub-02.ll | |
parent | d36cbaa4231e51a42d761d298ff20aaa6e88d014 (diff) | |
download | bcm5719-llvm-ed1fab6b5bfb54d63102319a761011e985081cb4.tar.gz bcm5719-llvm-ed1fab6b5bfb54d63102319a761011e985081cb4.zip |
[SystemZ] Fold more spills
Add a mapping from register-based <INSN>R instructions to the corresponding
memory-based <INSN>. Use it to cut down on the number of spill loads.
Some instructions extend their operands from smaller fields, so this
required a new TSFlags field to say how big the unextended operand is.
This optimisation doesn't trigger for C(G)R and CL(G)R because in practice
we always combine those instructions with a branch. Adding a test for every
other case probably seems excessive, but it did catch a missed optimisation
for DSGF (fixed in r185435).
llvm-svn: 185529
Diffstat (limited to 'llvm/test/CodeGen/SystemZ/fp-sub-02.ll')
-rw-r--r-- | llvm/test/CodeGen/SystemZ/fp-sub-02.ll | 48 |
1 file changed, 48 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/SystemZ/fp-sub-02.ll b/llvm/test/CodeGen/SystemZ/fp-sub-02.ll index bf9848c2fd5..b6409fcd6ee 100644 --- a/llvm/test/CodeGen/SystemZ/fp-sub-02.ll +++ b/llvm/test/CodeGen/SystemZ/fp-sub-02.ll @@ -2,6 +2,8 @@ ; ; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s +declare double @foo() + ; Check register subtraction. define double @f1(double %f1, double %f2) { ; CHECK: f1: @@ -69,3 +71,49 @@ define double @f6(double %f1, double *%base, i64 %index) { %res = fsub double %f1, %f2 ret double %res } + +; Check that subtractions of spilled values can use SDB rather than SDBR. +define double @f7(double *%ptr0) { +; CHECK: f7: +; CHECK: brasl %r14, foo@PLT +; CHECK: sdb %f0, 16{{[04]}}(%r15) +; CHECK: br %r14 + %ptr1 = getelementptr double *%ptr0, i64 2 + %ptr2 = getelementptr double *%ptr0, i64 4 + %ptr3 = getelementptr double *%ptr0, i64 6 + %ptr4 = getelementptr double *%ptr0, i64 8 + %ptr5 = getelementptr double *%ptr0, i64 10 + %ptr6 = getelementptr double *%ptr0, i64 12 + %ptr7 = getelementptr double *%ptr0, i64 14 + %ptr8 = getelementptr double *%ptr0, i64 16 + %ptr9 = getelementptr double *%ptr0, i64 18 + %ptr10 = getelementptr double *%ptr0, i64 20 + + %val0 = load double *%ptr0 + %val1 = load double *%ptr1 + %val2 = load double *%ptr2 + %val3 = load double *%ptr3 + %val4 = load double *%ptr4 + %val5 = load double *%ptr5 + %val6 = load double *%ptr6 + %val7 = load double *%ptr7 + %val8 = load double *%ptr8 + %val9 = load double *%ptr9 + %val10 = load double *%ptr10 + + %ret = call double @foo() + + %sub0 = fsub double %ret, %val0 + %sub1 = fsub double %sub0, %val1 + %sub2 = fsub double %sub1, %val2 + %sub3 = fsub double %sub2, %val3 + %sub4 = fsub double %sub3, %val4 + %sub5 = fsub double %sub4, %val5 + %sub6 = fsub double %sub5, %val6 + %sub7 = fsub double %sub6, %val7 + %sub8 = fsub double %sub7, %val8 + %sub9 = fsub double %sub8, %val9 + %sub10 = fsub double %sub9, %val10 + + ret double %sub10 +} |