[SystemZ] Modelling of costs of divisions with a constant power of 2.

Such divisions will eventually be implemented with shifts which should be reflected in the cost function. Review: Ulrich Weigand llvm-svn: 303254
author: Jonas Paulsson <paulsson@linux.vnet.ibm.com> 2017-05-17 12:46:26 +0000
committer: Jonas Paulsson <paulsson@linux.vnet.ibm.com> 2017-05-17 12:46:26 +0000
commit: 8722ade770bdbb249026271436341adc28fac39c (patch)
tree: ade0e45dacda49e316e8ff3b21076a407f52c7fc /llvm/lib/Target/SystemZ/SystemZTargetTransformInfo.cpp
parent: ed205a090db1e6aca740e29a9bb54c589df81f0e (diff)
download: bcm5719-llvm-8722ade770bdbb249026271436341adc28fac39c.tar.gz
bcm5719-llvm-8722ade770bdbb249026271436341adc28fac39c.zip
1 files changed, 33 insertions, 1 deletions
diff --git a/llvm/lib/Target/SystemZ/SystemZTargetTransformInfo.cpp b/llvm/lib/Target/SystemZ/SystemZTargetTransformInfo.cpp
index f56b238f91e..6a3dc6799c4 100644
--- a/llvm/lib/Target/SystemZ/SystemZTargetTransformInfo.cpp
+++ b/llvm/lib/Target/SystemZ/SystemZTargetTransformInfo.cpp
@@ -325,6 +325,30 @@ int SystemZTTIImpl::getArithmeticInstrCost(
 
   unsigned ScalarBits = Ty->getScalarSizeInBits();
 
+  // Div with a constant which is a power of 2 will be converted by
+  // DAGCombiner to use shifts. With vector shift-element instructions, a
+  // vector sdiv costs about as much as a scalar one.
+  const unsigned SDivCostEstimate = 4;
+  bool SDivPow2 = false;
+  bool UDivPow2 = false;
+  if ((Opcode == Instruction::SDiv || Opcode == Instruction::UDiv) &&
+      Args.size() == 2) {
+    const ConstantInt *CI = nullptr;
+    if (const Constant *C = dyn_cast<Constant>(Args[1])) {
+      if (C->getType()->isVectorTy())
+        CI = dyn_cast_or_null<const ConstantInt>(C->getSplatValue());
+      else
+        CI = dyn_cast<const ConstantInt>(C);
+    }
+    if (CI != nullptr &&
+        (CI->getValue().isPowerOf2() || (-CI->getValue()).isPowerOf2())) {
+      if (Opcode == Instruction::SDiv)
+        SDivPow2 = true;
+      else
+        UDivPow2 = true;
+    }
+  }
+
   if (Ty->isVectorTy()) {
     assert (ST->hasVector() && "getArithmeticInstrCost() called with vector type.");
     unsigned VF = Ty->getVectorNumElements();
@@ -333,10 +357,13 @@ int SystemZTTIImpl::getArithmeticInstrCost(
     // These vector operations are custom handled, but are still supported
     // with one instruction per vector, regardless of element size.
     if (Opcode == Instruction::Shl || Opcode == Instruction::LShr ||
-        Opcode == Instruction::AShr) {
+        Opcode == Instruction::AShr || UDivPow2) {
       return NumVectors;
     }
 
+    if (SDivPow2)
+      return (NumVectors * SDivCostEstimate);
+
     // These FP operations are supported with a single vector instruction for
     // double (base implementation assumes float generally costs 2). For
     // FP128, the scalar cost is 1, and there is no overhead since the values
@@ -395,6 +422,11 @@ int SystemZTTIImpl::getArithmeticInstrCost(
       // 2 * ipm sequences ; xor ; shift ; compare
       return 7;
 
+    if (UDivPow2)
+      return 1;
+    if (SDivPow2)
+      return SDivCostEstimate;
+
     // An extra extension for narrow types is needed.
     if ((Opcode == Instruction::SDiv || Opcode == Instruction::SRem))
       // sext of op(s) for narrow types
author	Jonas Paulsson <paulsson@linux.vnet.ibm.com>	2017-05-17 12:46:26 +0000
committer	Jonas Paulsson <paulsson@linux.vnet.ibm.com>	2017-05-17 12:46:26 +0000
commit	8722ade770bdbb249026271436341adc28fac39c (patch)
tree	ade0e45dacda49e316e8ff3b21076a407f52c7fc /llvm/lib/Target/SystemZ/SystemZTargetTransformInfo.cpp
parent	ed205a090db1e6aca740e29a9bb54c589df81f0e (diff)
download	bcm5719-llvm-8722ade770bdbb249026271436341adc28fac39c.tar.gz bcm5719-llvm-8722ade770bdbb249026271436341adc28fac39c.zip