diff options
| author | Ahmed Bougacha <ahmed.bougacha@gmail.com> | 2014-10-30 23:46:50 +0000 | 
|---|---|---|
| committer | Ahmed Bougacha <ahmed.bougacha@gmail.com> | 2014-10-30 23:46:50 +0000 | 
| commit | 9f336c4ec5adb124c8d7b75be8bc5d2f02db119c (patch) | |
| tree | c7f9184ce965abc299920caface9fe3842bbc1f5 | |
| parent | 6cda0d7269188f9b21c6dfe19a6f32f8432918da (diff) | |
| download | bcm5719-llvm-9f336c4ec5adb124c8d7b75be8bc5d2f02db119c.tar.gz bcm5719-llvm-9f336c4ec5adb124c8d7b75be8bc5d2f02db119c.zip | |
[SelectionDAG] When scalarizing trunc, don't assert for legal operands.
r212242 introduced a legalizer hook, originally to let AArch64 widen
v1i{32,16,8} rather than scalarize, because the legalizer expected, when
scalarizing the result of a conversion operation, to already have
scalarized the operands.  On AArch64, v1i64 is legal, so that commit
ensured operations such as v1i32 = trunc v1i64 wouldn't assert.
It did that by choosing to widen v1 types whenever possible.  However,
v1i1 types, for which there's no legal widened type, would still trigger
the assert.
This commit fixes that, by only scalarizing a trunc's result when the
operand has already been scalarized, and introducing an extract_elt
otherwise.  
This is similar to r205625.
Fixes PR20777.
llvm-svn: 220937
| -rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp | 18 | ||||
| -rw-r--r-- | llvm/test/CodeGen/AArch64/trunc-v1i64.ll | 21 | 
2 files changed, 37 insertions, 2 deletions
| diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp index 68187dd0b8c..27f63d27823 100644 --- a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp @@ -237,7 +237,23 @@ SDValue DAGTypeLegalizer::ScalarizeVecRes_LOAD(LoadSDNode *N) {  SDValue DAGTypeLegalizer::ScalarizeVecRes_UnaryOp(SDNode *N) {    // Get the dest type - it doesn't always match the input type, e.g. int_to_fp.    EVT DestVT = N->getValueType(0).getVectorElementType(); -  SDValue Op = GetScalarizedVector(N->getOperand(0)); +  SDValue Op = N->getOperand(0); +  EVT OpVT = Op.getValueType(); +  SDLoc DL(N); +  // The result needs scalarizing, but it's not a given that the source does. +  // This is a workaround for targets where it's impossible to scalarize the +  // result of a conversion, because the source type is legal. +  // For instance, this happens on AArch64: v1i1 is illegal but v1i{8,16,32} +  // are widened to v8i8, v4i16, and v2i32, which is legal, because v1i64 is +  // legal and was not scalarized. +  // See the similar logic in ScalarizeVecRes_VSETCC +  if (getTypeAction(OpVT) == TargetLowering::TypeScalarizeVector) { +    Op = GetScalarizedVector(Op); +  } else { +    EVT VT = OpVT.getVectorElementType(); +    Op = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, VT, Op, +                      DAG.getConstant(0, TLI.getVectorIdxTy())); +  }    return DAG.getNode(N->getOpcode(), SDLoc(N), DestVT, Op);  } diff --git a/llvm/test/CodeGen/AArch64/trunc-v1i64.ll b/llvm/test/CodeGen/AArch64/trunc-v1i64.ll index 159b8e0cff3..19efd2fafd5 100644 --- a/llvm/test/CodeGen/AArch64/trunc-v1i64.ll +++ b/llvm/test/CodeGen/AArch64/trunc-v1i64.ll @@ -60,4 +60,23 @@ define <8 x i8> @test_v1i8_1(<1 x i64> %in0) {    %1 = shufflevector <1 x i64> %in0, <1 x i64> undef, <8 x i32> <i32 undef, i32 undef, i32 0, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>    %2 = trunc <8 x i64> %1 to <8 x i8>    ret <8 x i8> %2 -}
\ No newline at end of file +} + +; PR20777: v1i1 is also problematic, but we can't widen it, so we extract_elt +; the i64 out of the v1i64 operand, and truncate that scalar instead. + +define <1 x i1> @test_v1i1_0(<1 x i64> %in0) { +; CHECK-LABEL: test_v1i1_0: +; CHECK: fmov w0, s0 +  %1 = trunc <1 x i64> %in0 to <1 x i1> +  ret <1 x i1> %1 +} + +define i1 @test_v1i1_1(<1 x i64> %in0) { +; CHECK-LABEL: test_v1i1_1: +; CHECK: fmov [[REG:w[0-9]+]], s0 +  %1 = trunc <1 x i64> %in0 to <1 x i1> +; CHECK: and w0, [[REG]], #0x1 +  %2 = extractelement <1 x i1> %1, i32 0 +  ret i1 %2 +} | 

