Revert r300932 and r300930.

It seems that r300930 was creating an infinite loop in dag-combine when compling the following file: MultiSource/Benchmarks/MiBench/consumer-typeset/z21.c llvm-svn: 300940
author: Akira Hatanaka <ahatanaka@apple.com> 2017-04-21 01:31:50 +0000
committer: Akira Hatanaka <ahatanaka@apple.com> 2017-04-21 01:31:50 +0000
commit: 78ccba6a204eeb5bf0a72ba599451e73ba3649ea (patch)
tree: 90c64e9cffe3f11ced9b5b9c61e992d5217160ab /llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
parent: a232323ff7c17665ca4a354a82bb13baa6a64770 (diff)
download: bcm5719-llvm-78ccba6a204eeb5bf0a72ba599451e73ba3649ea.tar.gz
bcm5719-llvm-78ccba6a204eeb5bf0a72ba599451e73ba3649ea.zip
1 files changed, 0 insertions, 139 deletions
diff --git a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
index 593c4187137..4ddc95199d4 100644
--- a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
+++ b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
@@ -91,7 +91,6 @@ using namespace llvm;
 
 STATISTIC(NumTailCalls, "Number of tail calls");
 STATISTIC(NumShiftInserts, "Number of vector shift inserts");
-STATISTIC(NumOptimizedImms, "Number of times immediates were optimized");
 
 static cl::opt<bool>
 EnableAArch64SlrGeneration("aarch64-shift-insert-generation", cl::Hidden,
@@ -106,12 +105,6 @@ cl::opt<bool> EnableAArch64ELFLocalDynamicTLSGeneration(
     cl::desc("Allow AArch64 Local Dynamic TLS code generation"),
     cl::init(false));
 
-static cl::opt<bool>
-EnableOptimizeLogicalImm("aarch64-enable-logical-imm", cl::Hidden,
-                         cl::desc("Enable AArch64 logical imm instruction "
-                                  "optimization"),
-                         cl::init(true));
-
 /// Value type used for condition codes.
 static const MVT MVT_CC = MVT::i32;
 
@@ -794,138 +787,6 @@ EVT AArch64TargetLowering::getSetCCResultType(const DataLayout &, LLVMContext &,
   return VT.changeVectorElementTypeToInteger();
 }
 
-static bool optimizeLogicalImm(SDValue Op, unsigned Size, uint64_t Imm,
-                               const APInt &Demanded,
-                               TargetLowering::TargetLoweringOpt &TLO,
-                               unsigned NewOpc) {
-  uint64_t OldImm = Imm, NewImm, Enc;
-  uint64_t Mask = ((uint64_t)(-1LL) >> (64 - Size));
-
-  // Return if the immediate is already a bimm32 or bimm64.
-  if (AArch64_AM::isLogicalImmediate(Imm & Mask, Size))
-    return false;
-
-  unsigned EltSize = Size;
-  uint64_t DemandedBits = Demanded.getZExtValue();
-
-  // Clear bits that are not demanded.
-  Imm &= DemandedBits;
-
-  while (true) {
-    // The goal here is to set the non-demanded bits in a way that minimizes
-    // the number of switching between 0 and 1. In order to achieve this goal,
-    // we set the non-demanded bits to the value of the preceding demanded bits.
-    // For example, if we have an immediate 0bx10xx0x1 ('x' indicates a
-    // non-demanded bit), we copy bit0 (1) to the least significant 'x',
-    // bit2 (0) to 'xx', and bit6 (1) to the most significant 'x'.
-    // The final result is 0b11000011.
-    uint64_t NonDemandedBits = ~DemandedBits;
-    uint64_t InvertedImm = ~Imm & DemandedBits;
-    uint64_t RotatedImm =
-        ((InvertedImm << 1) | (InvertedImm >> (EltSize - 1) & 1)) &
-        NonDemandedBits;
-    uint64_t Sum = RotatedImm + NonDemandedBits;
-    bool Carry = NonDemandedBits & ~Sum & (1ULL << (EltSize - 1));
-    uint64_t Ones = (Sum + Carry) & NonDemandedBits;
-    NewImm = (Imm | Ones) & Mask;
-
-    // If NewImm or its bitwise NOT is a shifted mask, it is a bitmask immediate
-    // or all-ones or all-zeros, in which case we can stop searching. Otherwise,
-    // we halve the element size and continue the search.
-    if (isShiftedMask_64(NewImm) || isShiftedMask_64(~(NewImm | ~Mask)))
-      break;
-
-    // We cannot shrink the element size any further if it is 2-bits.
-    if (EltSize == 2)
-      return false;
-
-    EltSize /= 2;
-    Mask >>= EltSize;
-    uint64_t Hi = Imm >> EltSize, DemandedBitsHi = DemandedBits >> EltSize;
-
-    // Return if there is mismatch in any of the demanded bits of Imm and Hi.
-    if (((Imm ^ Hi) & (DemandedBits & DemandedBitsHi) & Mask) != 0)
-      return false;
-
-    // Merge the upper and lower halves of Imm and DemandedBits.
-    Imm |= Hi;
-    DemandedBits |= DemandedBitsHi;
-  }
-
-  ++NumOptimizedImms;
-
-  // Replicate the element across the register width.
-  while (EltSize < Size) {
-    NewImm |= NewImm << EltSize;
-    EltSize *= 2;
-  }
-
-  (void)OldImm;
-  assert(((OldImm ^ NewImm) & Demanded.getZExtValue()) == 0 &&
-         "demanded bits should never be altered");
-
-  // Create the new constant immediate node.
-  EVT VT = Op.getValueType();
-  unsigned Population = countPopulation(NewImm);
-  SDLoc DL(Op);
-
-  // If the new constant immediate is all-zeros or all-ones, let the target
-  // independent DAG combine optimize this node.
-  if (Population == 0 || Population == Size)
-    return TLO.CombineTo(Op.getOperand(1), TLO.DAG.getConstant(NewImm, DL, VT));
-
-  // Otherwise, create a machine node so that target independent DAG combine
-  // doesn't undo this optimization.
-  Enc = AArch64_AM::encodeLogicalImmediate(NewImm, Size);
-  SDValue EncConst = TLO.DAG.getTargetConstant(Enc, DL, VT);
-  SDValue New(
-      TLO.DAG.getMachineNode(NewOpc, DL, VT, Op.getOperand(0), EncConst), 0);
-
-  return TLO.CombineTo(Op, New);
-}
-
-bool AArch64TargetLowering::targetShrinkDemandedConstant(
-    SDValue Op, const APInt &Demanded, TargetLoweringOpt &TLO) const {
-  // Delay this optimization to as late as possible.
-  if (!TLO.LegalOps)
-    return false;
-
-  if (!EnableOptimizeLogicalImm)
-    return false;
-
-  EVT VT = Op.getValueType();
-  if (VT.isVector())
-    return false;
-
-  unsigned Size = VT.getSizeInBits();
-  assert((Size == 32 || Size == 64) &&
-         "i32 or i64 is expected after legalization.");
-
-  // Exit early if we demand all bits.
-  if (Demanded.countPopulation() == Size)
-    return false;
-
-  unsigned NewOpc;
-  switch (Op.getOpcode()) {
-  default:
-    return false;
-  case ISD::AND:
-    NewOpc = Size == 32 ? AArch64::ANDWri : AArch64::ANDXri;
-    break;
-  case ISD::OR:
-    NewOpc = Size == 32 ? AArch64::ORRWri : AArch64::ORRXri;
-    break;
-  case ISD::XOR:
-    NewOpc = Size == 32 ? AArch64::EORWri : AArch64::EORXri;
-    break;
-  }
-  ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1));
-  if (!C)
-    return false;
-  uint64_t Imm = C->getZExtValue();
-  return optimizeLogicalImm(Op, Size, Imm, Demanded, TLO, NewOpc);
-}
-
 /// computeKnownBitsForTargetNode - Determine which of the bits specified in
 /// Mask are known to be either zero or one and return them in the
 /// KnownZero/KnownOne bitsets.
author	Akira Hatanaka <ahatanaka@apple.com>	2017-04-21 01:31:50 +0000
committer	Akira Hatanaka <ahatanaka@apple.com>	2017-04-21 01:31:50 +0000
commit	78ccba6a204eeb5bf0a72ba599451e73ba3649ea (patch)
tree	90c64e9cffe3f11ced9b5b9c61e992d5217160ab /llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
parent	a232323ff7c17665ca4a354a82bb13baa6a64770 (diff)
download	bcm5719-llvm-78ccba6a204eeb5bf0a72ba599451e73ba3649ea.tar.gz bcm5719-llvm-78ccba6a204eeb5bf0a72ba599451e73ba3649ea.zip