diff options
| -rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp | 2 |
| -rw-r--r-- | llvm/test/CodeGen/X86/avx512-load-trunc-store-i1.ll | 49 |
2 files changed, 12 insertions, 39 deletions
diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp index 8fb5c5e7ed7..5e7279c058c 100644 --- a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp @@ -525,7 +525,7 @@ SDValue DAGTypeLegalizer::ScalarizeVecOp_UnaryOp(SDNode *N) { N->getValueType(0).getScalarType(), Elt); // Revectorize the result so the types line up with what the uses of this // expression expect. - return DAG.getBuildVector(N->getValueType(0), SDLoc(N), Op); + return DAG.getNode(ISD::SCALAR_TO_VECTOR, SDLoc(N), N->getValueType(0), Op); } /// The vectors to concatenate have length one - use a BUILD_VECTOR instead. diff --git a/llvm/test/CodeGen/X86/avx512-load-trunc-store-i1.ll b/llvm/test/CodeGen/X86/avx512-load-trunc-store-i1.ll index bfcac893512..02cf3734f96 100644 --- a/llvm/test/CodeGen/X86/avx512-load-trunc-store-i1.ll +++ b/llvm/test/CodeGen/X86/avx512-load-trunc-store-i1.ll @@ -5,18 +5,13 @@ define void @load_v1i2_trunc_v1i1_store(<1 x i2>* %a0,<1 x i1>* %a1) { ; AVX512-ALL-LABEL: load_v1i2_trunc_v1i1_store: ; AVX512-ALL: # %bb.0: -; AVX512-ALL-NEXT: movb (%rdi), %al -; AVX512-ALL-NEXT: testb %al, %al -; AVX512-ALL-NEXT: setne %al -; AVX512-ALL-NEXT: kmovd %eax, %k0 +; AVX512-ALL-NEXT: kmovb (%rdi), %k0 ; AVX512-ALL-NEXT: kmovb %k0, (%rsi) ; AVX512-ALL-NEXT: retq ; ; AVX512-ONLY-LABEL: load_v1i2_trunc_v1i1_store: ; AVX512-ONLY: # %bb.0: ; AVX512-ONLY-NEXT: movb (%rdi), %al -; AVX512-ONLY-NEXT: testb %al, %al -; AVX512-ONLY-NEXT: setne %al ; AVX512-ONLY-NEXT: movb %al, (%rsi) ; AVX512-ONLY-NEXT: retq %d0 = load <1 x i2>, <1 x i2>* %a0 @@ -27,18 +22,13 @@ define void @load_v1i2_trunc_v1i1_store(<1 x i2>* %a0,<1 x i1>* %a1) { define void @load_v1i3_trunc_v1i1_store(<1 x i3>* %a0,<1 x i1>* %a1) { ; AVX512-ALL-LABEL: load_v1i3_trunc_v1i1_store: ; AVX512-ALL: # %bb.0: -; AVX512-ALL-NEXT: movb (%rdi), %al -; AVX512-ALL-NEXT: testb %al, %al -; AVX512-ALL-NEXT: setne 
%al -; AVX512-ALL-NEXT: kmovd %eax, %k0 +; AVX512-ALL-NEXT: kmovb (%rdi), %k0 ; AVX512-ALL-NEXT: kmovb %k0, (%rsi) ; AVX512-ALL-NEXT: retq ; ; AVX512-ONLY-LABEL: load_v1i3_trunc_v1i1_store: ; AVX512-ONLY: # %bb.0: ; AVX512-ONLY-NEXT: movb (%rdi), %al -; AVX512-ONLY-NEXT: testb %al, %al -; AVX512-ONLY-NEXT: setne %al ; AVX512-ONLY-NEXT: movb %al, (%rsi) ; AVX512-ONLY-NEXT: retq %d0 = load <1 x i3>, <1 x i3>* %a0 @@ -49,18 +39,13 @@ define void @load_v1i3_trunc_v1i1_store(<1 x i3>* %a0,<1 x i1>* %a1) { define void @load_v1i4_trunc_v1i1_store(<1 x i4>* %a0,<1 x i1>* %a1) { ; AVX512-ALL-LABEL: load_v1i4_trunc_v1i1_store: ; AVX512-ALL: # %bb.0: -; AVX512-ALL-NEXT: movb (%rdi), %al -; AVX512-ALL-NEXT: testb %al, %al -; AVX512-ALL-NEXT: setne %al -; AVX512-ALL-NEXT: kmovd %eax, %k0 +; AVX512-ALL-NEXT: kmovb (%rdi), %k0 ; AVX512-ALL-NEXT: kmovb %k0, (%rsi) ; AVX512-ALL-NEXT: retq ; ; AVX512-ONLY-LABEL: load_v1i4_trunc_v1i1_store: ; AVX512-ONLY: # %bb.0: ; AVX512-ONLY-NEXT: movb (%rdi), %al -; AVX512-ONLY-NEXT: testb %al, %al -; AVX512-ONLY-NEXT: setne %al ; AVX512-ONLY-NEXT: movb %al, (%rsi) ; AVX512-ONLY-NEXT: retq %d0 = load <1 x i4>, <1 x i4>* %a0 @@ -71,16 +56,13 @@ define void @load_v1i4_trunc_v1i1_store(<1 x i4>* %a0,<1 x i1>* %a1) { define void @load_v1i8_trunc_v1i1_store(<1 x i8>* %a0,<1 x i1>* %a1) { ; AVX512-ALL-LABEL: load_v1i8_trunc_v1i1_store: ; AVX512-ALL: # %bb.0: -; AVX512-ALL-NEXT: cmpb $0, (%rdi) -; AVX512-ALL-NEXT: setne %al -; AVX512-ALL-NEXT: kmovd %eax, %k0 +; AVX512-ALL-NEXT: kmovb (%rdi), %k0 ; AVX512-ALL-NEXT: kmovb %k0, (%rsi) ; AVX512-ALL-NEXT: retq ; ; AVX512-ONLY-LABEL: load_v1i8_trunc_v1i1_store: ; AVX512-ONLY: # %bb.0: -; AVX512-ONLY-NEXT: cmpb $0, (%rdi) -; AVX512-ONLY-NEXT: setne %al +; AVX512-ONLY-NEXT: movb (%rdi), %al ; AVX512-ONLY-NEXT: movb %al, (%rsi) ; AVX512-ONLY-NEXT: retq %d0 = load <1 x i8>, <1 x i8>* %a0 @@ -91,16 +73,13 @@ define void @load_v1i8_trunc_v1i1_store(<1 x i8>* %a0,<1 x i1>* %a1) { define void 
@load_v1i16_trunc_v1i1_store(<1 x i16>* %a0,<1 x i1>* %a1) { ; AVX512-ALL-LABEL: load_v1i16_trunc_v1i1_store: ; AVX512-ALL: # %bb.0: -; AVX512-ALL-NEXT: cmpb $0, (%rdi) -; AVX512-ALL-NEXT: setne %al -; AVX512-ALL-NEXT: kmovd %eax, %k0 +; AVX512-ALL-NEXT: kmovb (%rdi), %k0 ; AVX512-ALL-NEXT: kmovb %k0, (%rsi) ; AVX512-ALL-NEXT: retq ; ; AVX512-ONLY-LABEL: load_v1i16_trunc_v1i1_store: ; AVX512-ONLY: # %bb.0: -; AVX512-ONLY-NEXT: cmpb $0, (%rdi) -; AVX512-ONLY-NEXT: setne %al +; AVX512-ONLY-NEXT: movb (%rdi), %al ; AVX512-ONLY-NEXT: movb %al, (%rsi) ; AVX512-ONLY-NEXT: retq %d0 = load <1 x i16>, <1 x i16>* %a0 @@ -111,16 +90,13 @@ define void @load_v1i16_trunc_v1i1_store(<1 x i16>* %a0,<1 x i1>* %a1) { define void @load_v1i32_trunc_v1i1_store(<1 x i32>* %a0,<1 x i1>* %a1) { ; AVX512-ALL-LABEL: load_v1i32_trunc_v1i1_store: ; AVX512-ALL: # %bb.0: -; AVX512-ALL-NEXT: cmpb $0, (%rdi) -; AVX512-ALL-NEXT: setne %al -; AVX512-ALL-NEXT: kmovd %eax, %k0 +; AVX512-ALL-NEXT: kmovb (%rdi), %k0 ; AVX512-ALL-NEXT: kmovb %k0, (%rsi) ; AVX512-ALL-NEXT: retq ; ; AVX512-ONLY-LABEL: load_v1i32_trunc_v1i1_store: ; AVX512-ONLY: # %bb.0: -; AVX512-ONLY-NEXT: cmpb $0, (%rdi) -; AVX512-ONLY-NEXT: setne %al +; AVX512-ONLY-NEXT: movb (%rdi), %al ; AVX512-ONLY-NEXT: movb %al, (%rsi) ; AVX512-ONLY-NEXT: retq %d0 = load <1 x i32>, <1 x i32>* %a0 @@ -131,16 +107,13 @@ define void @load_v1i32_trunc_v1i1_store(<1 x i32>* %a0,<1 x i1>* %a1) { define void @load_v1i64_trunc_v1i1_store(<1 x i64>* %a0,<1 x i1>* %a1) { ; AVX512-ALL-LABEL: load_v1i64_trunc_v1i1_store: ; AVX512-ALL: # %bb.0: -; AVX512-ALL-NEXT: cmpb $0, (%rdi) -; AVX512-ALL-NEXT: setne %al -; AVX512-ALL-NEXT: kmovd %eax, %k0 +; AVX512-ALL-NEXT: kmovb (%rdi), %k0 ; AVX512-ALL-NEXT: kmovb %k0, (%rsi) ; AVX512-ALL-NEXT: retq ; ; AVX512-ONLY-LABEL: load_v1i64_trunc_v1i1_store: ; AVX512-ONLY: # %bb.0: -; AVX512-ONLY-NEXT: cmpb $0, (%rdi) -; AVX512-ONLY-NEXT: setne %al +; AVX512-ONLY-NEXT: movb (%rdi), %al ; AVX512-ONLY-NEXT: movb %al, (%rsi) ; 
AVX512-ONLY-NEXT: retq %d0 = load <1 x i64>, <1 x i64>* %a0 |

