diff options
| author | Nemanja Ivanovic <nemanjai@ca.ibm.com> | 2019-11-07 19:31:00 -0600 |
|---|---|---|
| committer | Nemanja Ivanovic <nemanjai@ca.ibm.com> | 2019-11-07 19:33:15 -0600 |
| commit | 9af28400d6ff59614dad2584f5de03be2e294151 (patch) | |
| tree | aa28115c4e70103f6b86302b2dacaea9983d0056 | |
| parent | 7215b7ef530bff896a1da70c6b062e9259f5fde7 (diff) | |
| download | bcm5719-llvm-9af28400d6ff59614dad2584f5de03be2e294151.tar.gz bcm5719-llvm-9af28400d6ff59614dad2584f5de03be2e294151.zip | |
[PowerPC] Option for enabling absolute jumptables with command line
This option allows the user to request absolute jump tables instead of
relative ones, which are the default on most PPC subtargets.
Patch by Kamauu Bridgeman
Differential revision: https://reviews.llvm.org/D69108
| -rw-r--r-- | llvm/lib/Target/PowerPC/PPCISelLowering.cpp | 5 | ||||
| -rw-r--r-- | llvm/test/CodeGen/PowerPC/absol-jump-table-enabled.ll | 100 |
2 files changed, 105 insertions, 0 deletions
diff --git a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp index 87ba74cf860..a2ffe9e3540 100644 --- a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp +++ b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp @@ -119,6 +119,9 @@ cl::desc("don't always align innermost loop to 32 bytes on ppc"), cl::Hidden); static cl::opt<bool> EnableQuadPrecision("enable-ppc-quad-precision", cl::desc("enable quad precision float support on ppc"), cl::Hidden); +static cl::opt<bool> UseAbsoluteJumpTables("ppc-use-absolute-jumptables", +cl::desc("use absolute jump tables on ppc"), cl::Hidden); + STATISTIC(NumTailCalls, "Number of tail calls"); STATISTIC(NumSiblingCalls, "Number of sibling calls"); @@ -2744,6 +2747,8 @@ unsigned PPCTargetLowering::getJumpTableEncoding() const { } bool PPCTargetLowering::isJumpTableRelative() const { + if (UseAbsoluteJumpTables) + return false; if (Subtarget.isPPC64()) return true; return TargetLowering::isJumpTableRelative(); diff --git a/llvm/test/CodeGen/PowerPC/absol-jump-table-enabled.ll b/llvm/test/CodeGen/PowerPC/absol-jump-table-enabled.ll new file mode 100644 index 00000000000..4a9492d8e10 --- /dev/null +++ b/llvm/test/CodeGen/PowerPC/absol-jump-table-enabled.ll @@ -0,0 +1,100 @@ +; NOTE: This test case generates a jump table on PowerPC big and little endian +; NOTE: then verifies that the command line option to enable absolute jump +; NOTE: table works correctly. 
+; RUN: llc -mtriple=powerpc64le-unknown-linux-gnu -o - \ +; RUN: -ppc-use-absolute-jumptables -ppc-asm-full-reg-names \ +; RUN: -verify-machineinstrs %s | FileCheck %s -check-prefix=CHECK-LE +; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -o - \ +; RUN: -ppc-use-absolute-jumptables -ppc-asm-full-reg-names \ +; RUN: -verify-machineinstrs %s | FileCheck %s -check-prefix=CHECK-BE + +%struct.node = type { i8, %struct.node* } + +; Function Attrs: norecurse nounwind readonly +define zeroext i32 @jumpTableTest(%struct.node* readonly %list) { +; CHECK-LE-LABEL: jumpTableTest: +; CHECK-LE: # %bb.0: # %entry +; CHECK-LE: rldic r[[REG:[0-9]+]], r[[REG]], 3, 29 +; CHECK-LE: ldx r[[REG]], r[[REG]], r[[REG1:[0-9]+]] +; CHECK-LE: mtctr r[[REG]] +; CHECK-LE: bctr +; CHECK-LE: blr +; +; CHECK-BE-LABEL: jumpTableTest: +; CHECK-BE: # %bb.0: # %entry +; CHECK-BE: rldic r[[REG:[0-9]+]], r[[REG]], 2, 30 +; CHECK-BE: lwax r[[REG]], r[[REG]], r[[REG1:[0-9]+]] +; CHECK-BE: mtctr r[[REG]] +; CHECK-BE: bctr +; CHECK-BE: blr +entry: + %cmp36 = icmp eq %struct.node* %list, null + br i1 %cmp36, label %while.end, label %while.body + +while.body: ; preds = %entry, %sw.epilog + %result.038 = phi i32 [ %result.1, %sw.epilog ], [ 0, %entry ] + %current.037 = phi %struct.node* [ %spec.store.select, %sw.epilog ], [ %list, %entry ] + %next1 = getelementptr inbounds %struct.node, %struct.node* %current.037, i64 0, i32 1 + %0 = load %struct.node*, %struct.node** %next1, align 8 + %cmp2 = icmp eq %struct.node* %0, %current.037 + %spec.store.select = select i1 %cmp2, %struct.node* null, %struct.node* %0 + %type = getelementptr inbounds %struct.node, %struct.node* %current.037, i64 0, i32 0 + %1 = load i8, i8* %type, align 8 + switch i8 %1, label %sw.epilog [ + i8 1, label %sw.bb + i8 2, label %sw.bb3 + i8 3, label %sw.bb5 + i8 4, label %sw.bb7 + i8 5, label %sw.bb9 + i8 6, label %sw.bb11 + i8 7, label %sw.bb13 + i8 8, label %sw.bb15 + i8 9, label %sw.bb17 + ] + +sw.bb: ; preds = %while.body + %add = add 
nsw i32 %result.038, 13 + br label %sw.epilog + +sw.bb3: ; preds = %while.body + %add4 = add nsw i32 %result.038, 5 + br label %sw.epilog + +sw.bb5: ; preds = %while.body + %add6 = add nsw i32 %result.038, 2 + br label %sw.epilog + +sw.bb7: ; preds = %while.body + %add8 = add nsw i32 %result.038, 7 + br label %sw.epilog + +sw.bb9: ; preds = %while.body + %add10 = add nsw i32 %result.038, 11 + br label %sw.epilog + +sw.bb11: ; preds = %while.body + %add12 = add nsw i32 %result.038, 17 + br label %sw.epilog + +sw.bb13: ; preds = %while.body + %add14 = add nsw i32 %result.038, 16 + br label %sw.epilog + +sw.bb15: ; preds = %while.body + %add16 = add nsw i32 %result.038, 81 + br label %sw.epilog + +sw.bb17: ; preds = %while.body + %add18 = add nsw i32 %result.038, 72 + br label %sw.epilog + +sw.epilog: ; preds = %while.body, %sw.bb17, %sw.bb15, %sw.bb13, %sw.bb11, %sw.bb9, %sw.bb7, %sw.bb5, %sw.bb3, %sw.bb + %result.1 = phi i32 [ %result.038, %while.body ], [ %add18, %sw.bb17 ], [ %add16, %sw.bb15 ], [ %add14, %sw.bb13 ], [ %add12, %sw.bb11 ], [ %add10, %sw.bb9 ], [ %add8, %sw.bb7 ], [ %add6, %sw.bb5 ], [ %add4, %sw.bb3 ], [ %add, %sw.bb ] + %cmp = icmp eq %struct.node* %spec.store.select, null + br i1 %cmp, label %while.end, label %while.body + +while.end: ; preds = %sw.epilog, %entry + %result.0.lcssa = phi i32 [ 0, %entry ], [ %result.1, %sw.epilog ] + ret i32 %result.0.lcssa +} + |

