Fix PR 17368: disable vector mul distribution for square of add/sub for ARM

Generally, it is desirable to distribute (a + b) * c to a*c + b*c for ARM with VMLx forwarding, where a, b and c are vectors. However, for (a + b)*(a + b), distribution will result in one extra instruction. With distribution: x = a + b (add) y = a * x (mul) z = y + b * y (mla) Without distribution: x = a + b (add) z = x * x (mul) This patch checks if a mul is a square of add/sub. If yes, skip distribution. llvm-svn: 191410
author: Weiming Zhao <weimingz@codeaurora.org> 2013-09-25 23:12:06 +0000
committer: Weiming Zhao <weimingz@codeaurora.org> 2013-09-25 23:12:06 +0000
commit: 2052f4843bb50400c0ab158213e546f3dd9be8ac (patch)
tree: 36fa496a1e49b1aea1071efec63b1704b3c529e3 /llvm/lib/Target/ARM
parent: a9e303e7462f1748febd9622259db6915f97cc1b (diff)
download: bcm5719-llvm-2052f4843bb50400c0ab158213e546f3dd9be8ac.tar.gz
bcm5719-llvm-2052f4843bb50400c0ab158213e546f3dd9be8ac.zip
1 files changed, 10 insertions, 0 deletions
diff --git a/llvm/lib/Target/ARM/ARMISelLowering.cpp b/llvm/lib/Target/ARM/ARMISelLowering.cpp
index c83f7b194ae..773b710ab05 100644
--- a/llvm/lib/Target/ARM/ARMISelLowering.cpp
+++ b/llvm/lib/Target/ARM/ARMISelLowering.cpp
@@ -8342,6 +8342,13 @@ static SDValue PerformSUBCombine(SDNode *N,
 /// is faster than
 ///   vadd d3, d0, d1
 ///   vmul d3, d3, d2
+//  However, for (A + B) * (A + B),
+//    vadd d2, d0, d1
+//    vmul d3, d0, d2
+//    vmla d3, d1, d2
+//  is slower than
+//    vadd d2, d0, d1
+//    vmul d3, d2, d2
 static SDValue PerformVMULCombine(SDNode *N,
                                   TargetLowering::DAGCombinerInfo &DCI,
                                   const ARMSubtarget *Subtarget) {
@@ -8361,6 +8368,9 @@ static SDValue PerformVMULCombine(SDNode *N,
     std::swap(N0, N1);
   }
 
+  if (N0 == N1)
+    return SDValue();
+
   EVT VT = N->getValueType(0);
   SDLoc DL(N);
   SDValue N00 = N0->getOperand(0);
author	Weiming Zhao <weimingz@codeaurora.org>	2013-09-25 23:12:06 +0000
committer	Weiming Zhao <weimingz@codeaurora.org>	2013-09-25 23:12:06 +0000
commit	2052f4843bb50400c0ab158213e546f3dd9be8ac (patch)
tree	36fa496a1e49b1aea1071efec63b1704b3c529e3 /llvm/lib/Target/ARM
parent	a9e303e7462f1748febd9622259db6915f97cc1b (diff)
download	bcm5719-llvm-2052f4843bb50400c0ab158213e546f3dd9be8ac.tar.gz bcm5719-llvm-2052f4843bb50400c0ab158213e546f3dd9be8ac.zip