diff options
| author | Adam Nemet <anemet@apple.com> | 2014-08-07 23:18:18 +0000 |
|---|---|---|
| committer | Adam Nemet <anemet@apple.com> | 2014-08-07 23:18:18 +0000 |
| commit | fa1f7201fca0c3ab4bdfe31b89e5b18e04c78320 (patch) | |
| tree | eb45202459f479ef803dff180c4a3663d3c41486 | |
| parent | 5acc58fcfb403d1638856133088727c4e1a22fce (diff) | |
| download | bcm5719-llvm-fa1f7201fca0c3ab4bdfe31b89e5b18e04c78320.tar.gz bcm5719-llvm-fa1f7201fca0c3ab4bdfe31b89e5b18e04c78320.zip | |
[AVX512] Add codegen test for the masking variant of valign
The AddedComplexity is needed just like in avx512_perm_3src. There may be a
bug in the complexity computation...
llvm-svn: 215168
| -rw-r--r-- | llvm/lib/Target/X86/X86InstrAVX512.td | 5 | ||||
| -rw-r--r-- | llvm/test/CodeGen/X86/avx512-shuffle.ll | 9 |
2 files changed, 12 insertions, 2 deletions
diff --git a/llvm/lib/Target/X86/X86InstrAVX512.td b/llvm/lib/Target/X86/X86InstrAVX512.td index 2dcf368add1..a62e926629e 100644 --- a/llvm/lib/Target/X86/X86InstrAVX512.td +++ b/llvm/lib/Target/X86/X86InstrAVX512.td @@ -8,8 +8,9 @@ multiclass AVX512_masking<bits<8> O, Format F, dag Outs, dag Ins, "$dst, "#IntelSrcAsm#"}", [(set RC:$dst, RHS)]>; - let Constraints = "$src0 = $dst" in - def NAME#k: AVX512<O, F, Outs, + // Prefer over VMOV*rrk Pat<> + let Constraints = "$src0 = $dst", AddedComplexity = 20 in + def NAME#k: AVX512<O, F, Outs, !con((ins RC:$src0, KRC:$mask), Ins), OpcodeStr#" \t{"#AttSrcAsm#", $dst {${mask}}|"# "$dst {${mask}}, "#IntelSrcAsm#"}", diff --git a/llvm/test/CodeGen/X86/avx512-shuffle.ll b/llvm/test/CodeGen/X86/avx512-shuffle.ll index b99e89a9a54..a4aa87a2ea9 100644 --- a/llvm/test/CodeGen/X86/avx512-shuffle.ll +++ b/llvm/test/CodeGen/X86/avx512-shuffle.ll @@ -207,6 +207,15 @@ define <8 x double> @test16(<8 x double> %a, <8 x double> %b) nounwind { ret <8 x double> %c } +; CHECK-LABEL: test16k +; CHECK: valignq $2, %zmm0, %zmm1, %zmm2 {%k1} # +define <8 x i64> @test16k(<8 x i64> %a, <8 x i64> %b, <8 x i64> %src, i8 %mask) nounwind { + %c = shufflevector <8 x i64> %a, <8 x i64> %b, <8 x i32> <i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9> + %m = bitcast i8 %mask to <8 x i1> + %res = select <8 x i1> %m, <8 x i64> %c, <8 x i64> %src + ret <8 x i64> %res +} + ; CHECK-LABEL: test17 ; CHECK: vshufpd $19, %zmm1, %zmm0 ; CHECK: ret |

