diff options
author | David Majnemer <david.majnemer@gmail.com> | 2015-08-16 04:52:11 +0000 |
---|---|---|
committer | David Majnemer <david.majnemer@gmail.com> | 2015-08-16 04:52:11 +0000 |
commit | 1a59e49f3caeacf5d8525351ac361abb56bc8fb1 (patch) | |
tree | 491e779ed739c8bda8b6c067dbc102a3e02137fc /llvm/lib | |
parent | 5196275eeab605a62060ed07c66bb6d49a767a62 (diff) | |
download | bcm5719-llvm-1a59e49f3caeacf5d8525351ac361abb56bc8fb1.tar.gz bcm5719-llvm-1a59e49f3caeacf5d8525351ac361abb56bc8fb1.zip |
[X86] Widen the 'AND' mask if doing so shrinks the encoding size
We can set additional bits in a mask given that we know the other
operand of an AND already has some bits set to zero. This can be more
efficient if doing so allows us to use an instruction which implicitly
sign-extends the immediate.
This fixes PR24085.
Differential Revision: http://reviews.llvm.org/D11289
llvm-svn: 245169
Diffstat (limited to 'llvm/lib')
-rw-r--r-- | llvm/lib/Target/X86/X86ISelDAGToDAG.cpp | 63 |
1 file changed, 61 insertions, 2 deletions
diff --git a/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp b/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp index d37db7f788b..3453bf625cd 100644 --- a/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp +++ b/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp @@ -198,6 +198,7 @@ namespace { SDNode *Select(SDNode *N) override; SDNode *SelectGather(SDNode *N, unsigned Opc); SDNode *SelectAtomicLoadArith(SDNode *Node, MVT NVT); + SDNode *SelectAndWithSExtImmediate(SDNode *Node, MVT NVT); bool FoldOffsetIntoAddress(uint64_t Offset, X86ISelAddressMode &AM); bool MatchLoadInAddress(LoadSDNode *N, X86ISelAddressMode &AM); @@ -2208,6 +2209,57 @@ SDNode *X86DAGToDAGISel::SelectGather(SDNode *Node, unsigned Opc) { return ResNode; } +// Try to shrink the encoding of an AND by setting additional bits in the mask. +// It is only correct to do so if we know a priori that the other operand of the +// AND already has those bits set to zero. +SDNode *X86DAGToDAGISel::SelectAndWithSExtImmediate(SDNode *Node, MVT NVT) { + SDValue N0 = Node->getOperand(0); + SDValue N1 = Node->getOperand(1); + + if (NVT != MVT::i32 && NVT != MVT::i64) + return nullptr; + + auto *Cst = dyn_cast<ConstantSDNode>(N1); + if (!Cst) + return nullptr; + + // As a heuristic, skip over negative constants. It turns out not to be + // productive to widen the mask. + int64_t Val = Cst->getSExtValue(); + if (Val <= 0) + return nullptr; + + // Limit ourselves to constants which already have sign bits to save on + // compile time. + if ((int8_t)Val >= 0) + return nullptr; + + unsigned Opc; + switch (NVT.SimpleTy) { + default: + llvm_unreachable("Unsupported VT!"); + case MVT::i32: + Opc = X86::AND32ri8; + break; + case MVT::i64: + Opc = X86::AND64ri8; + break; + } + + APInt Op0Zero, Op0One; + CurDAG->computeKnownBits(N0, Op0Zero, Op0One); + // Grow the mask using the known zero bits. + Op0Zero |= Val; + // See if the mask can be efficiently encoded using at most NumBits. 
+ if (!Op0Zero.isSignedIntN(8)) + return nullptr; + + SDLoc DL(Node); + SDValue NewCst = + CurDAG->getTargetConstant(Op0Zero.getSExtValue(), DL, MVT::i8); + return CurDAG->getMachineNode(Opc, DL, NVT, N0, NewCst); +} + SDNode *X86DAGToDAGISel::Select(SDNode *Node) { MVT NVT = Node->getSimpleValueType(0); unsigned Opc, MOpc; @@ -2223,7 +2275,8 @@ SDNode *X86DAGToDAGISel::Select(SDNode *Node) { } switch (Opcode) { - default: break; + default: + break; case ISD::INTRINSIC_W_CHAIN: { unsigned IntNo = cast<ConstantSDNode>(Node->getOperand(1))->getZExtValue(); switch (IntNo) { @@ -2298,7 +2351,13 @@ SDNode *X86DAGToDAGISel::Select(SDNode *Node) { return RetVal; break; } - case ISD::AND: + case ISD::AND: { + if (SDNode *NewNode = SelectAndWithSExtImmediate(Node, NVT)) { + ReplaceUses(SDValue(Node, 0), SDValue(NewNode, 0)); + return nullptr; + } + // FALLTHROUGH + } case ISD::OR: case ISD::XOR: { // For operations of the form (x << C1) op C2, check if we can use a smaller |