diff options
| author | Nadav Rotem <nadav.rotem@intel.com> | 2011-10-21 11:42:07 +0000 | 
|---|---|---|
| committer | Nadav Rotem <nadav.rotem@intel.com> | 2011-10-21 11:42:07 +0000 | 
| commit | d315157f12c57118be2a458c2bc5fae27bc59dd2 (patch) | |
| tree | 550ff1b4d3772035b9392983bef94437b6390ead | |
| parent | 12a16dbcb0bcab32dbeb757a81bf9dbe67f2eade (diff) | |
| download | bcm5719-llvm-d315157f12c57118be2a458c2bc5fae27bc59dd2.tar.gz bcm5719-llvm-d315157f12c57118be2a458c2bc5fae27bc59dd2.zip  | |
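1. Fix the widening of SETCC in WidenVecOp_SETCC: create the widened compare with the target's SETCC result type (TLI.getSetCCResultType) for the widened operands, then extract the needed elements and convert them to the original result type.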
2. Fix a typo in PromoteIntRes_CONCAT_VECTORS (Op0 was read from operand 1 instead of operand 0), which exposed the bug in #1.
llvm-svn: 142648
4 files changed, 47 insertions, 14 deletions
diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp index a5c4c2ded4c..455307197c5 100644 --- a/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp @@ -2926,7 +2926,7 @@ SDValue DAGTypeLegalizer::PromoteIntRes_SCALAR_TO_VECTOR(SDNode *N) {  SDValue DAGTypeLegalizer::PromoteIntRes_CONCAT_VECTORS(SDNode *N) {    DebugLoc dl = N->getDebugLoc(); -  SDValue Op0 = N->getOperand(1); +  SDValue Op0 = N->getOperand(0);    SDValue Op1 = N->getOperand(1);    assert(Op0.getValueType() == Op1.getValueType() &&           "Invalid input vector types"); diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeTypes.h b/llvm/lib/CodeGen/SelectionDAG/LegalizeTypes.h index 0a8db0897b5..69c21000015 100644 --- a/llvm/lib/CodeGen/SelectionDAG/LegalizeTypes.h +++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeTypes.h @@ -633,7 +633,7 @@ private:    SDValue WidenVecOp_EXTRACT_VECTOR_ELT(SDNode *N);    SDValue WidenVecOp_EXTRACT_SUBVECTOR(SDNode *N);    SDValue WidenVecOp_STORE(SDNode* N); -  SDValue WidenVecOp_SETCC(SDNode* N, unsigned ResNo); +  SDValue WidenVecOp_SETCC(SDNode* N);    SDValue WidenVecOp_Convert(SDNode *N); diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp index 7fc7525a5b9..e950e072bc7 100644 --- a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp @@ -2033,7 +2033,7 @@ bool DAGTypeLegalizer::WidenVectorOperand(SDNode *N, unsigned ResNo) {    case ISD::EXTRACT_SUBVECTOR:  Res = WidenVecOp_EXTRACT_SUBVECTOR(N); break;    case ISD::EXTRACT_VECTOR_ELT: Res = WidenVecOp_EXTRACT_VECTOR_ELT(N); break;    case ISD::STORE:              Res = WidenVecOp_STORE(N); break; -  case ISD::SETCC:              Res = WidenVecOp_SETCC(N, ResNo); break; +  case ISD::SETCC:              Res = WidenVecOp_SETCC(N); break;    case 
ISD::FP_EXTEND:    case ISD::FP_TO_SINT: @@ -2167,27 +2167,30 @@ SDValue DAGTypeLegalizer::WidenVecOp_STORE(SDNode *N) {                         MVT::Other,&StChain[0],StChain.size());  } -SDValue DAGTypeLegalizer::WidenVecOp_SETCC(SDNode *N, unsigned ResNo) { -  assert(ResNo < 2 && "Invalid res num to widen"); +SDValue DAGTypeLegalizer::WidenVecOp_SETCC(SDNode *N) {    SDValue InOp0 = GetWidenedVector(N->getOperand(0));    SDValue InOp1 = GetWidenedVector(N->getOperand(1)); -  EVT VT = InOp0.getValueType();    DebugLoc dl = N->getDebugLoc();    // WARNING: In this code we widen the compare instruction with garbage.    // This garbage may contain denormal floats which may be slow. Is this a real    // concern ? Should we zero the unused lanes if this is a float compare ? -  SDValue Zero = DAG.getIntPtrConstant(0); -  EVT ResVT = EVT::getVectorVT(*DAG.getContext(), -                               N->getValueType(0).getVectorElementType(), -                               VT.getVectorNumElements()); - +  // Get a new SETCC node to compare the newly widened operands. +  // Only some of the compared elements are legal. +  EVT SVT = TLI.getSetCCResultType(InOp0.getValueType());    SDValue WideSETCC = DAG.getNode(ISD::SETCC, N->getDebugLoc(), -                     ResVT, InOp0, InOp1, N->getOperand(2)); +                     SVT, InOp0, InOp1, N->getOperand(2)); + +  // Extract the needed results from the result vector. +  EVT ResVT = EVT::getVectorVT(*DAG.getContext(), +                               SVT.getVectorElementType(), +                               N->getValueType(0).getVectorNumElements()); +  SDValue CC = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, +                           ResVT, WideSETCC, DAG.getIntPtrConstant(0)); -  return DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, N->getValueType(0), -                     WideSETCC, Zero); +  // Convert the result mask to the correct kind. 
+  return DAG.getAnyExtOrTrunc(CC, dl, N->getValueType(0));  } diff --git a/llvm/test/CodeGen/X86/2011-10-21-widen-cmp.ll b/llvm/test/CodeGen/X86/2011-10-21-widen-cmp.ll new file mode 100644 index 00000000000..aa1a60026f4 --- /dev/null +++ b/llvm/test/CodeGen/X86/2011-10-21-widen-cmp.ll @@ -0,0 +1,30 @@ +; RUN: llc < %s -march=x86-64 -mcpu=corei7 | FileCheck %s + +target triple = "x86_64-unknown-linux-gnu" + +; Check that a <4 x float> compare is generated and that we are +; not stuck in an endless loop. + +; CHECK: cmp_2_floats +; CHECK: cmpordps +; CHECK: ret + +define void @cmp_2_floats() { +entry: +  %0 = fcmp oeq <2 x float> undef, undef +  %1 = select <2 x i1> %0, <2 x float> undef, <2 x float> undef +  store <2 x float> %1, <2 x float>* undef +  ret void +} + +; CHECK: cmp_2_doubles +; CHECK: cmpordpd +; CHECK: blendvpd +; CHECK: ret +define void @cmp_2_doubles() { +entry: +  %0 = fcmp oeq <2 x double> undef, undef +  %1 = select <2 x i1> %0, <2 x double> undef, <2 x double> undef +  store <2 x double> %1, <2 x double>* undef +  ret void +}  | 

