diff options
| author | Evandro Menezes <e.menezes@samsung.com> | 2019-09-25 16:10:20 +0000 |
|---|---|---|
| committer | Evandro Menezes <e.menezes@samsung.com> | 2019-09-25 16:10:20 +0000 |
| commit | 3bd8ba156b5241571ecc932ca332c5e869981901 (patch) | |
| tree | 4efeb30246a06802f82229c7a369346afff3b6ba /llvm/lib | |
| parent | 6b3749f6968f0c22be821115462d551a0a780fc6 (diff) | |
| download | bcm5719-llvm-3bd8ba156b5241571ecc932ca332c5e869981901.tar.gz bcm5719-llvm-3bd8ba156b5241571ecc932ca332c5e869981901.zip | |
[CodeGen] Replace -max-jump-table-size with -max-jump-table-targets
Modern processors predict the targets of an indirect branch regardless of
the size of any jump table used to glean its target address. Moreover,
branch predictors typically use resources limited by the number of actual
targets that occur at run time.
This patch changes the semantics of the option `-max-jump-table-size` to limit
the number of different targets instead of the number of entries in a jump
table. Thus, it is now renamed to `-max-jump-table-targets`.
Before, when `-max-jump-table-size` was specified, a jump table built from a
range of clusters could use the same target repeatedly, yet each occurrence was
counted, which typically resulted in tables with the same number of entries.
With this patch, when specifying `-max-jump-table-targets`, tables may have
different lengths, since only the number of unique targets is counted towards
the limit. The number of unique targets is the same in every table, except for
the last one, which contains the balance of the targets.
Differential revision: https://reviews.llvm.org/D60295
llvm-svn: 372893
Diffstat (limited to 'llvm/lib')
| -rw-r--r-- | llvm/lib/CodeGen/SwitchLoweringUtils.cpp | 94 | ||||
| -rw-r--r-- | llvm/lib/CodeGen/TargetLoweringBase.cpp | 18 | ||||
| -rw-r--r-- | llvm/lib/Target/AArch64/AArch64ISelLowering.cpp | 7 | ||||
| -rw-r--r-- | llvm/lib/Target/AArch64/AArch64Subtarget.cpp | 4 | ||||
| -rw-r--r-- | llvm/lib/Target/AArch64/AArch64Subtarget.h | 4 |
5 files changed, 66 insertions, 61 deletions
diff --git a/llvm/lib/CodeGen/SwitchLoweringUtils.cpp b/llvm/lib/CodeGen/SwitchLoweringUtils.cpp index 83acf7f8071..2b9999d0b41 100644 --- a/llvm/lib/CodeGen/SwitchLoweringUtils.cpp +++ b/llvm/lib/CodeGen/SwitchLoweringUtils.cpp @@ -11,33 +11,47 @@ // //===----------------------------------------------------------------------===// +#include "llvm/ADT/SmallSet.h" #include "llvm/CodeGen/MachineJumpTableInfo.h" #include "llvm/CodeGen/SwitchLoweringUtils.h" using namespace llvm; using namespace SwitchCG; -uint64_t SwitchCG::getJumpTableRange(const CaseClusterVector &Clusters, - unsigned First, unsigned Last) { - assert(Last >= First); - const APInt &LowCase = Clusters[First].Low->getValue(); - const APInt &HighCase = Clusters[Last].High->getValue(); - assert(LowCase.getBitWidth() == HighCase.getBitWidth()); - - // FIXME: A range of consecutive cases has 100% density, but only requires one - // comparison to lower. We should discriminate against such consecutive ranges - // in jump tables. - return (HighCase - LowCase).getLimitedValue((UINT64_MAX - 1) / 100) + 1; -} +// Collection of partition stats, made up of, for a given cluster, +// the range of the cases, their number and the number of unique targets. 
+struct PartitionStats { + uint64_t Range, Cases, Targets; +}; + +static PartitionStats getJumpTableStats(const CaseClusterVector &Clusters, + unsigned First, unsigned Last, + bool HasReachableDefault) { + assert(Last >= First && "Invalid order of clusters"); + + SmallSet<const MachineBasicBlock *, 8> Targets; + PartitionStats Stats; + + Stats.Cases = 0; + for (unsigned i = First; i <= Last; ++i) { + const APInt &Hi = Clusters[i].High->getValue(), + &Lo = Clusters[i].Low->getValue(); + Stats.Cases += (Hi - Lo).getLimitedValue() + 1; + + Targets.insert(Clusters[i].MBB); + } + assert(Stats.Cases < UINT64_MAX / 100 && "Too many cases"); + + const APInt &Hi = Clusters[Last].High->getValue(), + &Lo = Clusters[First].Low->getValue(); + assert(Hi.getBitWidth() == Lo.getBitWidth()); + Stats.Range = (Hi - Lo).getLimitedValue((UINT64_MAX - 1) / 100) + 1; + assert(Stats.Range >= Stats.Cases && "Invalid range or number of cases"); + + Stats.Targets = + Targets.size() + (HasReachableDefault && Stats.Range > Stats.Cases); -uint64_t -SwitchCG::getJumpTableNumCases(const SmallVectorImpl<unsigned> &TotalCases, - unsigned First, unsigned Last) { - assert(Last >= First); - assert(TotalCases[Last] >= TotalCases[First]); - uint64_t NumCases = - TotalCases[Last] - (First == 0 ? 0 : TotalCases[First - 1]); - return NumCases; + return Stats; } void SwitchCG::SwitchLowering::findJumpTables(CaseClusterVector &Clusters, @@ -64,23 +78,13 @@ void SwitchCG::SwitchLowering::findJumpTables(CaseClusterVector &Clusters, if (N < 2 || N < MinJumpTableEntries) return; - // Accumulated number of cases in each cluster and those prior to it. 
- SmallVector<unsigned, 8> TotalCases(N); - for (unsigned i = 0; i < N; ++i) { - const APInt &Hi = Clusters[i].High->getValue(); - const APInt &Lo = Clusters[i].Low->getValue(); - TotalCases[i] = (Hi - Lo).getLimitedValue() + 1; - if (i != 0) - TotalCases[i] += TotalCases[i - 1]; - } - - uint64_t Range = getJumpTableRange(Clusters,0, N - 1); - uint64_t NumCases = getJumpTableNumCases(TotalCases, 0, N - 1); - assert(NumCases < UINT64_MAX / 100); - assert(Range >= NumCases); + const bool HasReachableDefault = + !isa<UnreachableInst>(DefaultMBB->getBasicBlock()->getFirstNonPHIOrDbg()); + PartitionStats Stats = + getJumpTableStats(Clusters, 0, N - 1, HasReachableDefault); // Cheap case: the whole range may be suitable for jump table. - if (TLI->isSuitableForJumpTable(SI, NumCases, Range)) { + if (TLI->isSuitableForJumpTable(SI, Stats.Cases, Stats.Targets, Stats.Range)) { CaseCluster JTCluster; if (buildJumpTable(Clusters, 0, N - 1, SI, DefaultMBB, JTCluster)) { Clusters[0] = JTCluster; @@ -104,9 +108,6 @@ void SwitchCG::SwitchLowering::findJumpTables(CaseClusterVector &Clusters, SmallVector<unsigned, 8> MinPartitions(N); // LastElement[i] is the last element of the partition starting at i. SmallVector<unsigned, 8> LastElement(N); - // PartitionsScore[i] is used to break ties when choosing between two - // partitionings resulting in the same number of partitions. - SmallVector<unsigned, 8> PartitionsScore(N); // For PartitionsScore, a small number of comparisons is considered as good as // a jump table and a single comparison is considered better than a jump // table. @@ -116,6 +117,11 @@ void SwitchCG::SwitchLowering::findJumpTables(CaseClusterVector &Clusters, FewCases = 1, SingleCase = 2 }; + // PartitionsScore[i] is used to break ties when choosing between two + // partitionings resulting in the same number of partitions. + SmallVector<unsigned, 8> PartitionsScore(N); + // PartitionsStats[j] is the stats for the partition Clusters[i..j]. 
+ SmallVector<PartitionStats, 8> PartitionsStats(N); // Base case: There is only one way to partition Clusters[N-1]. MinPartitions[N - 1] = 1; @@ -129,16 +135,16 @@ void SwitchCG::SwitchLowering::findJumpTables(CaseClusterVector &Clusters, MinPartitions[i] = MinPartitions[i + 1] + 1; LastElement[i] = i; PartitionsScore[i] = PartitionsScore[i + 1] + PartitionScores::SingleCase; + for (int64_t j = i + 1; j < N; j++) + PartitionsStats[j] = + getJumpTableStats(Clusters, i, j, HasReachableDefault); // Search for a solution that results in fewer partitions. for (int64_t j = N - 1; j > i; j--) { // Try building a partition from Clusters[i..j]. - Range = getJumpTableRange(Clusters, i, j); - NumCases = getJumpTableNumCases(TotalCases, i, j); - assert(NumCases < UINT64_MAX / 100); - assert(Range >= NumCases); - - if (TLI->isSuitableForJumpTable(SI, NumCases, Range)) { + if (TLI->isSuitableForJumpTable(SI, PartitionsStats[j].Cases, + PartitionsStats[j].Targets, + PartitionsStats[j].Range)) { unsigned NumPartitions = 1 + (j == N - 1 ? 0 : MinPartitions[j + 1]); unsigned Score = j == N - 1 ? 0 : PartitionsScore[j + 1]; int64_t NumEntries = j - i + 1; diff --git a/llvm/lib/CodeGen/TargetLoweringBase.cpp b/llvm/lib/CodeGen/TargetLoweringBase.cpp index 0eb10a11042..557df03784d 100644 --- a/llvm/lib/CodeGen/TargetLoweringBase.cpp +++ b/llvm/lib/CodeGen/TargetLoweringBase.cpp @@ -72,9 +72,9 @@ static cl::opt<unsigned> MinimumJumpTableEntries ("min-jump-table-entries", cl::init(4), cl::Hidden, cl::desc("Set minimum number of entries to use a jump table.")); -static cl::opt<unsigned> MaximumJumpTableSize - ("max-jump-table-size", cl::init(UINT_MAX), cl::Hidden, - cl::desc("Set maximum size of jump tables.")); +static cl::opt<unsigned> MaximumJumpTableTargets + ("max-jump-table-targets", cl::init(UINT_MAX), cl::Hidden, + cl::desc("Set maximum number of targets to use in a jump table.")); /// Minimum jump table density for normal functions. 
static cl::opt<unsigned> @@ -1778,16 +1778,16 @@ void TargetLoweringBase::setMinimumJumpTableEntries(unsigned Val) { MinimumJumpTableEntries = Val; } -unsigned TargetLoweringBase::getMinimumJumpTableDensity(bool OptForSize) const { - return OptForSize ? OptsizeJumpTableDensity : JumpTableDensity; +unsigned TargetLoweringBase::getMaximumJumpTableTargets() const { + return MaximumJumpTableTargets; } -unsigned TargetLoweringBase::getMaximumJumpTableSize() const { - return MaximumJumpTableSize; +void TargetLoweringBase::setMaximumJumpTableTargets(unsigned Val) { + MaximumJumpTableTargets = Val; } -void TargetLoweringBase::setMaximumJumpTableSize(unsigned Val) { - MaximumJumpTableSize = Val; +unsigned TargetLoweringBase::getMinimumJumpTableDensity(bool OptForSize) const { + return OptForSize ? OptsizeJumpTableDensity : JumpTableDensity; } //===----------------------------------------------------------------------===// diff --git a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp index ae09714395a..9628000b477 100644 --- a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp +++ b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp @@ -647,11 +647,10 @@ AArch64TargetLowering::AArch64TargetLowering(const TargetMachine &TM, setPrefFunctionAlignment( llvm::Align(1ULL << STI.getPrefFunctionLogAlignment())); - // Only change the limit for entries in a jump table if specified by + // Only change the limit for targets in a jump table if specified by // the sub target, but not at the command line. 
- unsigned MaxJT = STI.getMaximumJumpTableSize(); - if (MaxJT && getMaximumJumpTableSize() == UINT_MAX) - setMaximumJumpTableSize(MaxJT); + if (getMaximumJumpTableTargets() == UINT_MAX) + setMaximumJumpTableTargets(STI.getMaximumJumpTableTargets()); setHasExtractBitsInsn(true); diff --git a/llvm/lib/Target/AArch64/AArch64Subtarget.cpp b/llvm/lib/Target/AArch64/AArch64Subtarget.cpp index 558bea368ef..085a2ec5fe0 100644 --- a/llvm/lib/Target/AArch64/AArch64Subtarget.cpp +++ b/llvm/lib/Target/AArch64/AArch64Subtarget.cpp @@ -96,13 +96,13 @@ void AArch64Subtarget::initializeProperties() { break; case ExynosM1: MaxInterleaveFactor = 4; - MaxJumpTableSize = 8; + MaxJumpTableTargets = 8; PrefFunctionLogAlignment = 4; PrefLoopLogAlignment = 3; break; case ExynosM3: MaxInterleaveFactor = 4; - MaxJumpTableSize = 20; + MaxJumpTableTargets = 20; PrefFunctionLogAlignment = 5; PrefLoopLogAlignment = 4; break; diff --git a/llvm/lib/Target/AArch64/AArch64Subtarget.h b/llvm/lib/Target/AArch64/AArch64Subtarget.h index 757a4699986..fa6e35e7c3d 100644 --- a/llvm/lib/Target/AArch64/AArch64Subtarget.h +++ b/llvm/lib/Target/AArch64/AArch64Subtarget.h @@ -200,7 +200,7 @@ protected: unsigned MaxPrefetchIterationsAhead = UINT_MAX; unsigned PrefFunctionLogAlignment = 0; unsigned PrefLoopLogAlignment = 0; - unsigned MaxJumpTableSize = 0; + unsigned MaxJumpTableTargets = UINT_MAX; unsigned WideningBaseCost = 0; // ReserveXRegister[i] - X#i is not available as a general purpose register. @@ -364,7 +364,7 @@ public: } unsigned getPrefLoopLogAlignment() const { return PrefLoopLogAlignment; } - unsigned getMaximumJumpTableSize() const { return MaxJumpTableSize; } + unsigned getMaximumJumpTableTargets() const { return MaxJumpTableTargets; } unsigned getWideningBaseCost() const { return WideningBaseCost; } |

