[PowerPC] Do not round values prior to converting to integer

Adding the FP_ROUND nodes when combining FP_TO_[SU]INT of elements feeding a BUILD_VECTOR into an FP_TO_[SU]INT of the built vector loses precision. This patch removes the code that adds these nodes to true f64 operands. It also adds patterns required to ensure the code is still vectorized rather than converting individual elements and inserting into a vector. Fixes https://bugs.llvm.org/show_bug.cgi?id=38342 Differential Revision: https://reviews.llvm.org/D50121 llvm-svn: 338658
author: Nemanja Ivanovic <nemanja.i.ibm@gmail.com> 2018-08-02 00:03:22 +0000
committer: Nemanja Ivanovic <nemanja.i.ibm@gmail.com> 2018-08-02 00:03:22 +0000
commit: e1a525ed06e1c53f9707d29d7d53c580a738900a (patch)
tree: d02ed4afd2c815417564fd8a1bbf0dc10f0b59d6 /llvm/lib/Target/PowerPC/PPCISelLowering.cpp
parent: 8fa58b1d178b34a03acf692ec410b0d8a2b3c825 (diff)
download: bcm5719-llvm-e1a525ed06e1c53f9707d29d7d53c580a738900a.tar.gz
bcm5719-llvm-e1a525ed06e1c53f9707d29d7d53c580a738900a.zip
1 files changed, 19 insertions, 3 deletions
diff --git a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
index 51ff8a5cf77..f6e13aee968 100644
--- a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
+++ b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
@@ -11761,6 +11761,14 @@ SDValue PPCTargetLowering::DAGCombineExtBoolTrunc(SDNode *N,
       ShiftCst);
 }
 
+// Is this an extending load from an f32 to an f64?
+static bool isFPExtLoad(SDValue Op) {
+  if (LoadSDNode *LD = dyn_cast<LoadSDNode>(Op.getNode()))
+    return LD->getExtensionType() == ISD::EXTLOAD &&
+      Op.getValueType() == MVT::f64;
+  return false;
+}
+
 /// Reduces the number of fp-to-int conversion when building a vector.
 ///
 /// If this vector is built out of floating to integer conversions,
@@ -11795,11 +11803,18 @@ combineElementTruncationToVectorTruncation(SDNode *N,
     SmallVector<SDValue, 4> Ops;
     EVT TargetVT = N->getValueType(0);
     for (int i = 0, e = N->getNumOperands(); i < e; ++i) {
-      if (N->getOperand(i).getOpcode() != PPCISD::MFVSR)
+      SDValue NextOp = N->getOperand(i);
+      if (NextOp.getOpcode() != PPCISD::MFVSR)
         return SDValue();
-      unsigned NextConversion = N->getOperand(i).getOperand(0).getOpcode();
+      unsigned NextConversion = NextOp.getOperand(0).getOpcode();
       if (NextConversion != FirstConversion)
         return SDValue();
+      // If we are converting to 32-bit integers, we need to add an FP_ROUND.
+      // This is not valid if the input was originally double precision. It is
+      // also not profitable to do unless this is an extending load in which
+      // case doing this combine will allow us to combine consecutive loads.
+      if (Is32Bit && !isFPExtLoad(NextOp.getOperand(0).getOperand(0)))
+        return SDValue();
       if (N->getOperand(i) != FirstInput)
         IsSplat = false;
     }
@@ -11813,8 +11828,9 @@ combineElementTruncationToVectorTruncation(SDNode *N,
     // Now that we know we have the right type of node, get its operands
     for (int i = 0, e = N->getNumOperands(); i < e; ++i) {
       SDValue In = N->getOperand(i).getOperand(0);
-      // For 32-bit values, we need to add an FP_ROUND node.
       if (Is32Bit) {
+        // For 32-bit values, we need to add an FP_ROUND node (if we made it
+        // here, we know that all inputs are extending loads so this is safe).
         if (In.isUndef())
           Ops.push_back(DAG.getUNDEF(SrcVT));
         else {
author	Nemanja Ivanovic <nemanja.i.ibm@gmail.com>	2018-08-02 00:03:22 +0000
committer	Nemanja Ivanovic <nemanja.i.ibm@gmail.com>	2018-08-02 00:03:22 +0000
commit	e1a525ed06e1c53f9707d29d7d53c580a738900a (patch)
tree	d02ed4afd2c815417564fd8a1bbf0dc10f0b59d6 /llvm/lib/Target/PowerPC/PPCISelLowering.cpp
parent	8fa58b1d178b34a03acf692ec410b0d8a2b3c825 (diff)
download	bcm5719-llvm-e1a525ed06e1c53f9707d29d7d53c580a738900a.tar.gz bcm5719-llvm-e1a525ed06e1c53f9707d29d7d53c580a738900a.zip