summaryrefslogtreecommitdiffstats
path: root/llvm/lib
diff options
context:
space:
mode:
authorCraig Topper <craig.topper@intel.com>2017-12-16 19:31:36 +0000
committerCraig Topper <craig.topper@intel.com>2017-12-16 19:31:36 +0000
commit1260a4e826ecff1ba6a9076336fb735cc90dcd76 (patch)
tree5bf3626d9e3f991fd45d00079f09b428ea1d1e0b /llvm/lib
parent5029d676f82782c36b2217a542286eb1773756d5 (diff)
downloadbcm5719-llvm-1260a4e826ecff1ba6a9076336fb735cc90dcd76.tar.gz
bcm5719-llvm-1260a4e826ecff1ba6a9076336fb735cc90dcd76.zip
[X86] When using vpopcntdq for ctpop of v8i16 vectors, only promote to v8i32.
Previously we promoted to v8i64, but we don't need to go all the way to 512-bits. If we have VLX we can use the 256-bit instruction. And even if we don't have VLX we can widen v8i32 to v16i32 and drop the upper half. llvm-svn: 320926
Diffstat (limited to 'llvm/lib')
-rw-r--r--llvm/lib/Target/X86/X86ISelLowering.cpp15
1 files changed, 7 insertions, 8 deletions
diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp
index de6e721c76c..ffbcd4537ec 100644
--- a/llvm/lib/Target/X86/X86ISelLowering.cpp
+++ b/llvm/lib/Target/X86/X86ISelLowering.cpp
@@ -23765,14 +23765,13 @@ static SDValue LowerVectorCTPOP(SDValue Op, const X86Subtarget &Subtarget,
// TRUNC(CTPOP(ZEXT(X))) to make use of vXi32/vXi64 VPOPCNT instructions.
if (Subtarget.hasVPOPCNTDQ()) {
- if (VT == MVT::v8i16) {
- Op = DAG.getNode(ISD::ZERO_EXTEND, DL, MVT::v8i64, Op0);
- Op = DAG.getNode(ISD::CTPOP, DL, MVT::v8i64, Op);
- return DAG.getNode(ISD::TRUNCATE, DL, VT, Op);
- }
- if (VT == MVT::v16i8 || VT == MVT::v16i16) {
- Op = DAG.getNode(ISD::ZERO_EXTEND, DL, MVT::v16i32, Op0);
- Op = DAG.getNode(ISD::CTPOP, DL, MVT::v16i32, Op);
+ unsigned NumElems = VT.getVectorNumElements();
+ assert((VT.getVectorElementType() == MVT::i8 ||
+ VT.getVectorElementType() == MVT::i16) && "Unexpected type");
+ if (NumElems <= 16) {
+ MVT NewVT = MVT::getVectorVT(MVT::i32, NumElems);
+ Op = DAG.getNode(ISD::ZERO_EXTEND, DL, NewVT, Op0);
+ Op = DAG.getNode(ISD::CTPOP, DL, NewVT, Op);
return DAG.getNode(ISD::TRUNCATE, DL, VT, Op);
}
}
OpenPOWER on IntegriCloud