[x86] Fix PR21139, one of the last remaining regressions found in the

new vector shuffle lowering. This is loosely based on a patch by Marius Wachtler to the PR (thanks!). I refactored it a bi to use std::count_if and a mutable array ref but the core idea was exactly right. I also added some direct testing of this case. I believe PR21137 is now the only remaining regression. llvm-svn: 219081
author: Chandler Carruth <chandlerc@gmail.com> 2014-10-05 12:07:34 +0000
committer: Chandler Carruth <chandlerc@gmail.com> 2014-10-05 12:07:34 +0000
commit: acecdc02119459d8ca13e6ca8fa2f16d655ae2f7 (patch)
tree: d7d1f0654fa99218721118c0edc03952289598c3 /llvm/lib
parent: ae81abfa3807885d0ecc221f747100607cd4be3e (diff)
download: bcm5719-llvm-acecdc02119459d8ca13e6ca8fa2f16d655ae2f7.tar.gz
bcm5719-llvm-acecdc02119459d8ca13e6ca8fa2f16d655ae2f7.zip
1 files changed, 17 insertions, 9 deletions
diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp
index 1bfacfe65a2..64e0db1e70f 100644
--- a/llvm/lib/Target/X86/X86ISelLowering.cpp
+++ b/llvm/lib/Target/X86/X86ISelLowering.cpp
@@ -9278,21 +9278,29 @@ static SDValue lowerV16I8VectorShuffle(SDValue Op, SDValue V1, SDValue V2,
   //
   // FIXME: We need to handle other interleaving widths (i16, i32, ...).
   if (shouldLowerAsInterleaving(Mask)) {
-    // FIXME: Figure out whether we should pack these into the low or high
-    // halves.
-
-    int EMask[16], OMask[16];
+    int NumLoHalf = std::count_if(Mask.begin(), Mask.end(), [](int M) {
+      return (M >= 0 && M < 8) || (M >= 16 && M < 24);
+    });
+    int NumHiHalf = std::count_if(Mask.begin(), Mask.end(), [](int M) {
+      return (M >= 8 && M < 16) || M >= 24;
+    });
+    int EMask[16] = {-1, -1, -1, -1, -1, -1, -1, -1,
+                     -1, -1, -1, -1, -1, -1, -1, -1};
+    int OMask[16] = {-1, -1, -1, -1, -1, -1, -1, -1,
+                     -1, -1, -1, -1, -1, -1, -1, -1};
+    bool UnpackLo = NumLoHalf >= NumHiHalf;
+    MutableArrayRef<int> TargetEMask(UnpackLo ? EMask : EMask + 8, 8);
+    MutableArrayRef<int> TargetOMask(UnpackLo ? OMask : OMask + 8, 8);
     for (int i = 0; i < 8; ++i) {
-      EMask[i] = Mask[2*i];
-      OMask[i] = Mask[2*i + 1];
-      EMask[i + 8] = -1;
-      OMask[i + 8] = -1;
+      TargetEMask[i] = Mask[2 * i];
+      TargetOMask[i] = Mask[2 * i + 1];
     }
 
     SDValue Evens = DAG.getVectorShuffle(MVT::v16i8, DL, V1, V2, EMask);
     SDValue Odds = DAG.getVectorShuffle(MVT::v16i8, DL, V1, V2, OMask);
 
-    return DAG.getNode(X86ISD::UNPCKL, DL, MVT::v16i8, Evens, Odds);
+    return DAG.getNode(UnpackLo ? X86ISD::UNPCKL : X86ISD::UNPCKH, DL,
+                       MVT::v16i8, Evens, Odds);
   }
 
   // Check for SSSE3 which lets us lower all v16i8 shuffles much more directly
author	Chandler Carruth <chandlerc@gmail.com>	2014-10-05 12:07:34 +0000
committer	Chandler Carruth <chandlerc@gmail.com>	2014-10-05 12:07:34 +0000
commit	acecdc02119459d8ca13e6ca8fa2f16d655ae2f7 (patch)
tree	d7d1f0654fa99218721118c0edc03952289598c3 /llvm/lib
parent	ae81abfa3807885d0ecc221f747100607cd4be3e (diff)
download	bcm5719-llvm-acecdc02119459d8ca13e6ca8fa2f16d655ae2f7.tar.gz bcm5719-llvm-acecdc02119459d8ca13e6ca8fa2f16d655ae2f7.zip