Allow vectorization of division by uniform power of 2.

This patch adds support to recognize division by uniform power of 2 and modifies the cost table to vectorize division by uniform power of 2 whenever possible. Updates Cost model for Loop and SLP Vectorizer.The cost table is currently only updated for X86 backend. Thanks to Hal, Andrea, Sanjay for the review. (http://reviews.llvm.org/D4971) llvm-svn: 216371
author: Karthik Bhat <kv.bhat@samsung.com> 2014-08-25 04:56:54 +0000
committer: Karthik Bhat <kv.bhat@samsung.com> 2014-08-25 04:56:54 +0000
commit: 7f33ff7deaea1454422a99d3a497fa0d11955e2a (patch)
tree: 87a2d6dddf2342728ee8a1d9c75dfe0bc5ed05d2 /llvm/lib/Target/X86/X86TargetTransformInfo.cpp
parent: c6914d068f317f3c8bc9734b6bbeb090975b50b1 (diff)
download: bcm5719-llvm-7f33ff7deaea1454422a99d3a497fa0d11955e2a.tar.gz
bcm5719-llvm-7f33ff7deaea1454422a99d3a497fa0d11955e2a.zip
1 files changed, 27 insertions, 4 deletions
diff --git a/llvm/lib/Target/X86/X86TargetTransformInfo.cpp b/llvm/lib/Target/X86/X86TargetTransformInfo.cpp
index 173bb4e6ec8..cd0336fa92f 100644
--- a/llvm/lib/Target/X86/X86TargetTransformInfo.cpp
+++ b/llvm/lib/Target/X86/X86TargetTransformInfo.cpp
@@ -84,7 +84,8 @@ public:
   unsigned getRegisterBitWidth(bool Vector) const override;
   unsigned getMaximumUnrollFactor() const override;
   unsigned getArithmeticInstrCost(unsigned Opcode, Type *Ty, OperandValueKind,
-                                  OperandValueKind) const override;
+                                  OperandValueKind, OperandValueProperties,
+                                  OperandValueProperties) const override;
   unsigned getShuffleCost(ShuffleKind Kind, Type *Tp,
                           int Index, Type *SubTp) const override;
   unsigned getCastInstrCost(unsigned Opcode, Type *Dst,
@@ -178,15 +179,37 @@ unsigned X86TTI::getMaximumUnrollFactor() const {
   return 2;
 }
 
-unsigned X86TTI::getArithmeticInstrCost(unsigned Opcode, Type *Ty,
-                                        OperandValueKind Op1Info,
-                                        OperandValueKind Op2Info) const {
+unsigned X86TTI::getArithmeticInstrCost(
+    unsigned Opcode, Type *Ty, OperandValueKind Op1Info,
+    OperandValueKind Op2Info, OperandValueProperties Opd1PropInfo,
+    OperandValueProperties Opd2PropInfo) const {
   // Legalize the type.
   std::pair<unsigned, MVT> LT = TLI->getTypeLegalizationCost(Ty);
 
   int ISD = TLI->InstructionOpcodeToISD(Opcode);
   assert(ISD && "Invalid opcode");
 
+  if (ISD == ISD::SDIV &&
+      Op2Info == TargetTransformInfo::OK_UniformConstantValue &&
+      Opd2PropInfo == TargetTransformInfo::OP_PowerOf2) {
+    // On X86, vector signed division by constants power-of-two are
+    // normally expanded to the sequence SRA + SRL + ADD + SRA.
+    // The OperandValue properties many not be same as that of previous
+    // operation;conservatively assume OP_None.
+    unsigned Cost =
+        2 * getArithmeticInstrCost(Instruction::AShr, Ty, Op1Info, Op2Info,
+                                   TargetTransformInfo::OP_None,
+                                   TargetTransformInfo::OP_None);
+    Cost += getArithmeticInstrCost(Instruction::LShr, Ty, Op1Info, Op2Info,
+                                   TargetTransformInfo::OP_None,
+                                   TargetTransformInfo::OP_None);
+    Cost += getArithmeticInstrCost(Instruction::Add, Ty, Op1Info, Op2Info,
+                                   TargetTransformInfo::OP_None,
+                                   TargetTransformInfo::OP_None);
+
+    return Cost;
+  }
+
   static const CostTblEntry<MVT::SimpleValueType>
   AVX2UniformConstCostTable[] = {
     { ISD::SDIV, MVT::v16i16,  6 }, // vpmulhw sequence
author	Karthik Bhat <kv.bhat@samsung.com>	2014-08-25 04:56:54 +0000
committer	Karthik Bhat <kv.bhat@samsung.com>	2014-08-25 04:56:54 +0000
commit	7f33ff7deaea1454422a99d3a497fa0d11955e2a (patch)
tree	87a2d6dddf2342728ee8a1d9c75dfe0bc5ed05d2 /llvm/lib/Target/X86/X86TargetTransformInfo.cpp
parent	c6914d068f317f3c8bc9734b6bbeb090975b50b1 (diff)
download	bcm5719-llvm-7f33ff7deaea1454422a99d3a497fa0d11955e2a.tar.gz bcm5719-llvm-7f33ff7deaea1454422a99d3a497fa0d11955e2a.zip