diff options
author | Nirav Dave <niravd@google.com> | 2018-01-31 15:23:17 +0000 |
---|---|---|
committer | Nirav Dave <niravd@google.com> | 2018-01-31 15:23:17 +0000 |
commit | c3a1e16db1fed06ba707a3f6173ffbd805db36c6 (patch) | |
tree | 68cd8f7d76c77ef4c65702c9b1bce36e879c194b /llvm | |
parent | 98f0021dd37d88bd6ff5b87caf3b01f0ebfb46a7 (diff) | |
download | bcm5719-llvm-c3a1e16db1fed06ba707a3f6173ffbd805db36c6.tar.gz bcm5719-llvm-c3a1e16db1fed06ba707a3f6173ffbd805db36c6.zip |
[DAG] Prevent NodeId pruning of TokenFactors in Instruction Selection.
Summary:
Instruction Selection preserves relative orders of all nodes save
TokenFactors which we treat specially. As a result Node Ids for
TokenFactors may violate the topological ordering and should not be
considered as valid pruning candidates in predecessor search.
Fixes PR35316.
Reviewers: RKSimon, hfinkel
Subscribers: hiraditya, llvm-commits
Differential Revision: https://reviews.llvm.org/D42701
llvm-svn: 323880
Diffstat (limited to 'llvm')
-rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp | 4 | ||||
-rw-r--r-- | llvm/test/CodeGen/X86/pr35316.ll | 76 |
2 files changed, 79 insertions, 1 deletions
diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp index e90ec20bcdb..b3a316b93b4 100644 --- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp @@ -2157,7 +2157,9 @@ static bool findNonImmUse(SDNode *Use, SDNode* Def, SDNode *ImmedUse, while (!WorkList.empty()) { Use = WorkList.back(); WorkList.pop_back(); - if (Use->getNodeId() < Def->getNodeId() && Use->getNodeId() != -1) + // NodeId topological order of TokenFactors is not guaranteed. Do not skip. + if (Use->getOpcode() != ISD::TokenFactor && + Use->getNodeId() < Def->getNodeId() && Use->getNodeId() != -1) continue; // Don't revisit nodes if we already scanned it and didn't fail, we know we diff --git a/llvm/test/CodeGen/X86/pr35316.ll b/llvm/test/CodeGen/X86/pr35316.ll new file mode 100644 index 00000000000..1c1523b3547 --- /dev/null +++ b/llvm/test/CodeGen/X86/pr35316.ll @@ -0,0 +1,76 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc < %s -mtriple=x86_64-linux | FileCheck %s --check-prefix=CHECK + +; This tests for a cyclic dependencies in the generated DAG. + +@c = external local_unnamed_addr global i32, align 4 +@a = external local_unnamed_addr global i32, align 4 +@b = external local_unnamed_addr global i32, align 4 + +define void @main() { +; CHECK-LABEL: main: +; CHECK: # %bb.0: # %entry +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: movl $0, {{.*}}(%rip) +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %r8d +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %edi +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %esi +; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax +; CHECK-NEXT: cltd +; CHECK-NEXT: idivl {{.*}}(%rip) +; CHECK-NEXT: movl %eax, %ecx +; CHECK-NEXT: movl {{.*}}(%rip), %eax +; CHECK-NEXT: cltd +; CHECK-NEXT: idivl %esi +; CHECK-NEXT: andl %edi, %eax +; CHECK-NEXT: addl %ecx, %eax +; CHECK-NEXT: andl %r8d, %eax +; CHECK-NEXT: movl %eax, (%rax) +; CHECK-NEXT: retq +entry: + %e = alloca i32, align 4 + %e.0.e.0.24 = load volatile i32, i32* %e, align 4 + %e.0.e.0.25 = load volatile i32, i32* %e, align 4 + %e.0.e.0.26 = load volatile i32, i32* %e, align 4 + %e.0.e.0.27 = load volatile i32, i32* %e, align 4 + %e.0.e.0.28 = load volatile i32, i32* %e, align 4 + %e.0.e.0.29 = load volatile i32, i32* %e, align 4 + %e.0.e.0.30 = load volatile i32, i32* %e, align 4 + %e.0.e.0.31 = load volatile i32, i32* %e, align 4 + %e.0.e.0.32 = load volatile i32, i32* %e, align 4 + %e.0.e.0.33 = load volatile i32, i32* %e, align 4 + %e.0.e.0.34 = load volatile i32, i32* %e, align 4 + %e.0.e.0.35 = load volatile i32, i32* %e, align 4 + %e.0.e.0.36 = load volatile i32, i32* %e, align 4 + %e.0.e.0.37 = load volatile i32, i32* %e, align 4 + %e.0.e.0.39 = load volatile i32, i32* %e, align 4 + %tmp = load i32, i32* @a, align 4 + store i32 0, i32* @b, align 4 + %e.0.e.0.41 = load volatile i32, i32* %e, align 4 + %add17 = add nsw i32 %e.0.e.0.41, 0 + %e.0.e.0.42 = load volatile i32, i32* %e, align 4 + %tmp1 = load i32, i32* @c, align 4 + %e.0.e.0.43 = load volatile i32, i32* %e, align 4 + %div = sdiv i32 %tmp1, %e.0.e.0.43 + %and18 = and i32 %div, %e.0.e.0.42 + %e.0.e.0.44 = load volatile i32, i32* %e, align 4 + %div19 = sdiv i32 %e.0.e.0.44, %tmp + %add20 = add nsw i32 %div19, %and18 + %and21 = and i32 %add20, %add17 + store volatile i32 %and21, i32* undef, align 4 + ret void +} |