ARM cost model: Address computation in vector mem ops not free

Adds a function to target transform info to query for the cost of address computation. The cost model analysis pass now also queries this interface. The code in LoopVectorize adds the cost of address computation as part of the memory instruction cost calculation. Only there, we know whether the instruction will be scalarized or not. Increase the penality for inserting in to D registers on swift. This becomes necessary because we now always assume that address computation has a cost and three is a closer value to the architecture. radar://13097204 llvm-svn: 174713
author: Arnold Schwaighofer <aschwaighofer@apple.com> 2013-02-08 14:50:48 +0000
committer: Arnold Schwaighofer <aschwaighofer@apple.com> 2013-02-08 14:50:48 +0000
commit: 594fa2dc2ba2f5748f294c25fe309b03d7eaf700 (patch)
tree: 6fe16384da8197bf293ad2d55f0a81bd6a1c7fe9 /llvm/lib/Target/ARM
parent: 897f2cf408c9522187b3a375e201bdf6938f404f (diff)
download: bcm5719-llvm-594fa2dc2ba2f5748f294c25fe309b03d7eaf700.tar.gz
bcm5719-llvm-594fa2dc2ba2f5748f294c25fe309b03d7eaf700.zip
1 files changed, 11 insertions, 2 deletions
diff --git a/llvm/lib/Target/ARM/ARMTargetTransformInfo.cpp b/llvm/lib/Target/ARM/ARMTargetTransformInfo.cpp
index 1f91e0ee362..f6fa3199709 100644
--- a/llvm/lib/Target/ARM/ARMTargetTransformInfo.cpp
+++ b/llvm/lib/Target/ARM/ARMTargetTransformInfo.cpp
@@ -120,6 +120,8 @@ public:
   unsigned getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy) const;
 
   unsigned getVectorInstrCost(unsigned Opcode, Type *Val, unsigned Index) const;
+
+  unsigned getAddressComputationCost(Type *Val) const;
   /// @}
 };
 
@@ -304,12 +306,13 @@ unsigned ARMTTI::getCastInstrCost(unsigned Opcode, Type *Dst,
 
 unsigned ARMTTI::getVectorInstrCost(unsigned Opcode, Type *ValTy,
                                     unsigned Index) const {
-  // Penalize inserting into an D-subregister.
+  // Penalize inserting into an D-subregister. We end up with a three times
+  // lower estimated throughput on swift.
   if (ST->isSwift() &&
       Opcode == Instruction::InsertElement &&
       ValTy->isVectorTy() &&
       ValTy->getScalarSizeInBits() <= 32)
-    return 2;
+    return 3;
 
   return TargetTransformInfo::getVectorInstrCost(Opcode, ValTy, Index);
 }
@@ -326,3 +329,9 @@ unsigned ARMTTI::getCmpSelInstrCost(unsigned Opcode, Type *ValTy,
 
   return TargetTransformInfo::getCmpSelInstrCost(Opcode, ValTy, CondTy);
 }
+
+unsigned ARMTTI::getAddressComputationCost(Type *Ty) const {
+  // In many cases the address computation is not merged into the instruction
+  // addressing mode.
+  return 1;
+}
author	Arnold Schwaighofer <aschwaighofer@apple.com>	2013-02-08 14:50:48 +0000
committer	Arnold Schwaighofer <aschwaighofer@apple.com>	2013-02-08 14:50:48 +0000
commit	594fa2dc2ba2f5748f294c25fe309b03d7eaf700 (patch)
tree	6fe16384da8197bf293ad2d55f0a81bd6a1c7fe9 /llvm/lib/Target/ARM
parent	897f2cf408c9522187b3a375e201bdf6938f404f (diff)
download	bcm5719-llvm-594fa2dc2ba2f5748f294c25fe309b03d7eaf700.tar.gz bcm5719-llvm-594fa2dc2ba2f5748f294c25fe309b03d7eaf700.zip