diff options
Diffstat (limited to 'llvm/test/CodeGen/X86/avx512-extract-subvector-load-store.ll')
-rw-r--r-- | llvm/test/CodeGen/X86/avx512-extract-subvector-load-store.ll | 212 |
1 files changed, 106 insertions, 106 deletions
diff --git a/llvm/test/CodeGen/X86/avx512-extract-subvector-load-store.ll b/llvm/test/CodeGen/X86/avx512-extract-subvector-load-store.ll index f556cb977ae..34ea468aebe 100644 --- a/llvm/test/CodeGen/X86/avx512-extract-subvector-load-store.ll +++ b/llvm/test/CodeGen/X86/avx512-extract-subvector-load-store.ll @@ -4,7 +4,7 @@ define void @load_v8i1_broadcast_4_v2i1(<8 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v8i1_broadcast_4_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $4, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -15,7 +15,7 @@ define void @load_v8i1_broadcast_4_v2i1(<8 x i1>* %a0,<2 x double> %a1,<2 x doub ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v8i1_broadcast_4_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $4, %k0, %k1 @@ -35,7 +35,7 @@ define void @load_v8i1_broadcast_4_v2i1(<8 x i1>* %a0,<2 x double> %a1,<2 x doub } define void @load_v8i1_broadcast_7_v2i1(<8 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v8i1_broadcast_7_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $6, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -46,7 +46,7 @@ define void @load_v8i1_broadcast_7_v2i1(<8 x i1>* %a0,<2 x double> %a1,<2 x doub ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v8i1_broadcast_7_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $6, %k0, %k1 @@ -66,7 +66,7 @@ define void @load_v8i1_broadcast_7_v2i1(<8 x i1>* %a0,<2 x double> %a1,<2 x doub } define void @load_v16i1_broadcast_8_v2i1(<16 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v16i1_broadcast_8_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $8, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -77,7 +77,7 @@ define void @load_v16i1_broadcast_8_v2i1(<16 x i1>* %a0,<2 x double> %a1,<2 x do ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_8_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $8, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -96,7 +96,7 @@ define void @load_v16i1_broadcast_8_v2i1(<16 x i1>* %a0,<2 x double> %a1,<2 x do } define void @load_v16i1_broadcast_8_v4i1(<16 x i1>* %a0,<4 x float> %a1,<4 x float> %a2,<4 x float>* %a3) { ; AVX512-LABEL: load_v16i1_broadcast_8_v4i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $8, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm2 @@ -107,7 +107,7 @@ define void @load_v16i1_broadcast_8_v4i1(<16 x i1>* %a0,<4 x float> %a1,<4 x flo ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_8_v4i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $8, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -126,7 +126,7 @@ define void @load_v16i1_broadcast_8_v4i1(<16 x i1>* %a0,<4 x float> %a1,<4 x flo } define void @load_v16i1_broadcast_15_v2i1(<16 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v16i1_broadcast_15_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $14, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -137,7 +137,7 @@ define void @load_v16i1_broadcast_15_v2i1(<16 x i1>* %a0,<2 x double> %a1,<2 x d ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_15_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $14, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -156,7 +156,7 @@ define void @load_v16i1_broadcast_15_v2i1(<16 x i1>* %a0,<2 x double> %a1,<2 x d } define void @load_v16i1_broadcast_15_v4i1(<16 x i1>* %a0,<4 x float> %a1,<4 x float> %a2,<4 x float>* %a3) { ; AVX512-LABEL: load_v16i1_broadcast_15_v4i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $12, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm2 @@ -167,7 +167,7 @@ define void @load_v16i1_broadcast_15_v4i1(<16 x i1>* %a0,<4 x float> %a1,<4 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_15_v4i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $12, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -186,7 +186,7 @@ define void @load_v16i1_broadcast_15_v4i1(<16 x i1>* %a0,<4 x float> %a1,<4 x fl } define void @load_v32i1_broadcast_16_v2i1(<32 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v32i1_broadcast_16_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $16, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -197,7 +197,7 @@ define void @load_v32i1_broadcast_16_v2i1(<32 x i1>* %a0,<2 x double> %a1,<2 x d ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_16_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $16, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -216,7 +216,7 @@ define void @load_v32i1_broadcast_16_v2i1(<32 x i1>* %a0,<2 x double> %a1,<2 x d } define void @load_v32i1_broadcast_16_v4i1(<32 x i1>* %a0,<4 x float> %a1,<4 x float> %a2,<4 x float>* %a3) { ; AVX512-LABEL: load_v32i1_broadcast_16_v4i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $16, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm2 @@ -227,7 +227,7 @@ define void @load_v32i1_broadcast_16_v4i1(<32 x i1>* %a0,<4 x float> %a1,<4 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_16_v4i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $16, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -246,7 +246,7 @@ define void @load_v32i1_broadcast_16_v4i1(<32 x i1>* %a0,<4 x float> %a1,<4 x fl } define void @load_v32i1_broadcast_16_v8i1(<32 x i1>* %a0,<8 x float> %a1,<8 x float> %a2,<8 x float>* %a3) { ; AVX512-LABEL: load_v32i1_broadcast_16_v8i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $16, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm2 @@ -258,7 +258,7 @@ define void @load_v32i1_broadcast_16_v8i1(<32 x i1>* %a0,<8 x float> %a1,<8 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_16_v8i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $16, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm2, %zmm2, %zmm2 {%k1} {z} @@ -277,7 +277,7 @@ define void @load_v32i1_broadcast_16_v8i1(<32 x i1>* %a0,<8 x float> %a1,<8 x fl } define void @load_v32i1_broadcast_31_v2i1(<32 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v32i1_broadcast_31_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $30, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -288,7 +288,7 @@ define void @load_v32i1_broadcast_31_v2i1(<32 x i1>* %a0,<2 x double> %a1,<2 x d ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_31_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $30, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -307,7 +307,7 @@ define void @load_v32i1_broadcast_31_v2i1(<32 x i1>* %a0,<2 x double> %a1,<2 x d } define void @load_v32i1_broadcast_31_v4i1(<32 x i1>* %a0,<4 x float> %a1,<4 x float> %a2,<4 x float>* %a3) { ; AVX512-LABEL: load_v32i1_broadcast_31_v4i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $28, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm2 @@ -318,7 +318,7 @@ define void @load_v32i1_broadcast_31_v4i1(<32 x i1>* %a0,<4 x float> %a1,<4 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_31_v4i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $28, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -337,7 +337,7 @@ define void @load_v32i1_broadcast_31_v4i1(<32 x i1>* %a0,<4 x float> %a1,<4 x fl } define void @load_v32i1_broadcast_31_v8i1(<32 x i1>* %a0,<8 x float> %a1,<8 x float> %a2,<8 x float>* %a3) { ; AVX512-LABEL: load_v32i1_broadcast_31_v8i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $24, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm2 @@ -350,7 +350,7 @@ define void @load_v32i1_broadcast_31_v8i1(<32 x i1>* %a0,<8 x float> %a1,<8 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_31_v8i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $24, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm2, %zmm2, %zmm2 {%k1} {z} @@ -370,7 +370,7 @@ define void @load_v32i1_broadcast_31_v8i1(<32 x i1>* %a0,<8 x float> %a1,<8 x fl } define void @load_v64i1_broadcast_32_v2i1(<64 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_32_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -381,7 +381,7 @@ define void @load_v64i1_broadcast_32_v2i1(<64 x i1>* %a0,<2 x double> %a1,<2 x d ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -400,7 +400,7 @@ define void @load_v64i1_broadcast_32_v2i1(<64 x i1>* %a0,<2 x double> %a1,<2 x d } define void @load_v64i1_broadcast_32_v4i1(<64 x i1>* %a0,<4 x float> %a1,<4 x float> %a2,<4 x float>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_32_v4i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm2 @@ -411,7 +411,7 @@ define void @load_v64i1_broadcast_32_v4i1(<64 x i1>* %a0,<4 x float> %a1,<4 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v4i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -430,7 +430,7 @@ define void @load_v64i1_broadcast_32_v4i1(<64 x i1>* %a0,<4 x float> %a1,<4 x fl } define void @load_v64i1_broadcast_32_v8i1(<64 x i1>* %a0,<8 x float> %a1,<8 x float> %a2,<8 x float>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_32_v8i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm2 @@ -442,7 +442,7 @@ define void @load_v64i1_broadcast_32_v8i1(<64 x i1>* %a0,<8 x float> %a1,<8 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v8i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm2, %zmm2, %zmm2 {%k1} {z} @@ -461,7 +461,7 @@ define void @load_v64i1_broadcast_32_v8i1(<64 x i1>* %a0,<8 x float> %a1,<8 x fl } define void @load_v64i1_broadcast_32_v16i1(<64 x i1>* %a0,<16 x float> %a1,<16 x float> %a2,<16 x float>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_32_v16i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %zmm2 @@ -473,7 +473,7 @@ define void @load_v64i1_broadcast_32_v16i1(<64 x i1>* %a0,<16 x float> %a1,<16 x ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v16i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogd $255, %zmm2, %zmm2, %zmm2 {%k1} {z} @@ -492,7 +492,7 @@ define void @load_v64i1_broadcast_32_v16i1(<64 x i1>* %a0,<16 x float> %a1,<16 x } define void @load_v64i1_broadcast_63_v2i1(<64 x i1>* %a0,<2 x double> %a1,<2 x double> %a2,<2 x double>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_63_v2i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $62, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm2 @@ -503,7 +503,7 @@ define void @load_v64i1_broadcast_63_v2i1(<64 x i1>* %a0,<2 x double> %a1,<2 x d ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v2i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $62, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -522,7 +522,7 @@ define void @load_v64i1_broadcast_63_v2i1(<64 x i1>* %a0,<2 x double> %a1,<2 x d } define void @load_v64i1_broadcast_63_v4i1(<64 x i1>* %a0,<4 x float> %a1,<4 x float> %a2,<4 x float>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_63_v4i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $60, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm2 @@ -533,7 +533,7 @@ define void @load_v64i1_broadcast_63_v4i1(<64 x i1>* %a0,<4 x float> %a1,<4 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v4i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $60, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2 @@ -552,7 +552,7 @@ define void @load_v64i1_broadcast_63_v4i1(<64 x i1>* %a0,<4 x float> %a1,<4 x fl } define void @load_v64i1_broadcast_63_v8i1(<64 x i1>* %a0,<8 x float> %a1,<8 x float> %a2,<8 x float>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_63_v8i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $56, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm2 @@ -565,7 +565,7 @@ define void @load_v64i1_broadcast_63_v8i1(<64 x i1>* %a0,<8 x float> %a1,<8 x fl ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v8i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $56, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm2, %zmm2, %zmm2 {%k1} {z} @@ -585,7 +585,7 @@ define void @load_v64i1_broadcast_63_v8i1(<64 x i1>* %a0,<8 x float> %a1,<8 x fl } define void @load_v64i1_broadcast_63_v16i1(<64 x i1>* %a0,<16 x float> %a1,<16 x float> %a2,<16 x float>* %a3) { ; AVX512-LABEL: load_v64i1_broadcast_63_v16i1: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $48, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %zmm2 @@ -598,7 +598,7 @@ define void @load_v64i1_broadcast_63_v16i1(<64 x i1>* %a0,<16 x float> %a1,<16 x ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v16i1: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $48, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogd $255, %zmm2, %zmm2, %zmm2 {%k1} {z} @@ -618,14 +618,14 @@ define void @load_v64i1_broadcast_63_v16i1(<64 x i1>* %a0,<16 x float> %a1,<16 x } define void @load_v2i1_broadcast_1_v1i1_store(<2 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v2i1_broadcast_1_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $1, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v2i1_broadcast_1_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $1, %k0, %k0 @@ -639,14 +639,14 @@ define void @load_v2i1_broadcast_1_v1i1_store(<2 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v3i1_broadcast_1_v1i1_store(<3 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v3i1_broadcast_1_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $1, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v3i1_broadcast_1_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $1, %k0, %k0 @@ -660,14 +660,14 @@ define void @load_v3i1_broadcast_1_v1i1_store(<3 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v3i1_broadcast_2_v1i1_store(<3 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v3i1_broadcast_2_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $2, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v3i1_broadcast_2_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $2, %k0, %k0 @@ -681,14 +681,14 @@ define void @load_v3i1_broadcast_2_v1i1_store(<3 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v4i1_broadcast_2_v1i1_store(<4 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v4i1_broadcast_2_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $2, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v4i1_broadcast_2_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $2, %k0, %k0 @@ -702,14 +702,14 @@ define void @load_v4i1_broadcast_2_v1i1_store(<4 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v4i1_broadcast_3_v1i1_store(<4 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v4i1_broadcast_3_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $3, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v4i1_broadcast_3_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $3, %k0, %k0 @@ -723,14 +723,14 @@ define void @load_v4i1_broadcast_3_v1i1_store(<4 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v8i1_broadcast_4_v1i1_store(<8 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v8i1_broadcast_4_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $4, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v8i1_broadcast_4_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $4, %k0, %k0 @@ -744,7 +744,7 @@ define void @load_v8i1_broadcast_4_v1i1_store(<8 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v8i1_broadcast_4_v2i1_store(<8 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v8i1_broadcast_4_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $4, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -754,7 +754,7 @@ define void @load_v8i1_broadcast_4_v2i1_store(<8 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v8i1_broadcast_4_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $4, %k0, %k1 @@ -773,14 +773,14 @@ define void @load_v8i1_broadcast_4_v2i1_store(<8 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v8i1_broadcast_7_v1i1_store(<8 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v8i1_broadcast_7_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $7, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v8i1_broadcast_7_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $7, %k0, %k0 @@ -794,7 +794,7 @@ define void @load_v8i1_broadcast_7_v1i1_store(<8 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v8i1_broadcast_7_v2i1_store(<8 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v8i1_broadcast_7_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovb (%rdi), %k0 ; AVX512-NEXT: kshiftrw $6, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -804,7 +804,7 @@ define void @load_v8i1_broadcast_7_v2i1_store(<8 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v8i1_broadcast_7_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: movzbl (%rdi), %eax ; AVX512NOTDQ-NEXT: kmovd %eax, %k0 ; AVX512NOTDQ-NEXT: kshiftrw $6, %k0, %k1 @@ -823,14 +823,14 @@ define void @load_v8i1_broadcast_7_v2i1_store(<8 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v16i1_broadcast_8_v1i1_store(<16 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v16i1_broadcast_8_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $8, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_8_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $8, %k0, %k0 ; AVX512NOTDQ-NEXT: kmovd %k0, %eax @@ -843,7 +843,7 @@ define void @load_v16i1_broadcast_8_v1i1_store(<16 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v16i1_broadcast_8_v2i1_store(<16 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v16i1_broadcast_8_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $8, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -853,7 +853,7 @@ define void @load_v16i1_broadcast_8_v2i1_store(<16 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_8_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $8, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -871,7 +871,7 @@ define void @load_v16i1_broadcast_8_v2i1_store(<16 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v16i1_broadcast_8_v4i1_store(<16 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-LABEL: load_v16i1_broadcast_8_v4i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $8, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm0 @@ -881,7 +881,7 @@ define void @load_v16i1_broadcast_8_v4i1_store(<16 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_8_v4i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $8, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -899,14 +899,14 @@ define void @load_v16i1_broadcast_8_v4i1_store(<16 x i1>* %a0,<4 x i1>* %a1) { } define void @load_v16i1_broadcast_15_v1i1_store(<16 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v16i1_broadcast_15_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $15, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_15_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $15, %k0, %k0 ; AVX512NOTDQ-NEXT: kmovd %k0, %eax @@ -919,7 +919,7 @@ define void @load_v16i1_broadcast_15_v1i1_store(<16 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v16i1_broadcast_15_v2i1_store(<16 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v16i1_broadcast_15_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $14, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -929,7 +929,7 @@ define void @load_v16i1_broadcast_15_v2i1_store(<16 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_15_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $14, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -947,7 +947,7 @@ define void @load_v16i1_broadcast_15_v2i1_store(<16 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v16i1_broadcast_15_v4i1_store(<16 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-LABEL: load_v16i1_broadcast_15_v4i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovw (%rdi), %k0 ; AVX512-NEXT: kshiftrw $12, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm0 @@ -957,7 +957,7 @@ define void @load_v16i1_broadcast_15_v4i1_store(<16 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v16i1_broadcast_15_v4i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovw (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrw $12, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -975,14 +975,14 @@ define void @load_v16i1_broadcast_15_v4i1_store(<16 x i1>* %a0,<4 x i1>* %a1) { } define void @load_v32i1_broadcast_16_v1i1_store(<32 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_16_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $16, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_16_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $16, %k0, %k0 ; AVX512NOTDQ-NEXT: kmovd %k0, %eax @@ -995,7 +995,7 @@ define void @load_v32i1_broadcast_16_v1i1_store(<32 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v32i1_broadcast_16_v2i1_store(<32 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_16_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $16, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -1005,7 +1005,7 @@ define void @load_v32i1_broadcast_16_v2i1_store(<32 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_16_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $16, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1023,7 +1023,7 @@ define void @load_v32i1_broadcast_16_v2i1_store(<32 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v32i1_broadcast_16_v4i1_store(<32 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_16_v4i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $16, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm0 @@ -1033,7 +1033,7 @@ define void @load_v32i1_broadcast_16_v4i1_store(<32 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_16_v4i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $16, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1051,7 +1051,7 @@ define void @load_v32i1_broadcast_16_v4i1_store(<32 x i1>* %a0,<4 x i1>* %a1) { } define void @load_v32i1_broadcast_16_v8i1_store(<32 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_16_v8i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $16, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm0 @@ -1062,7 +1062,7 @@ define void @load_v32i1_broadcast_16_v8i1_store(<32 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_16_v8i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $16, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm0, %zmm0, %zmm0 {%k1} {z} @@ -1080,14 +1080,14 @@ define void @load_v32i1_broadcast_16_v8i1_store(<32 x i1>* %a0,<8 x i1>* %a1) { } define void @load_v32i1_broadcast_31_v1i1_store(<32 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_31_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $31, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_31_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $31, %k0, %k0 ; AVX512NOTDQ-NEXT: kmovd %k0, %eax @@ -1100,7 +1100,7 @@ define void @load_v32i1_broadcast_31_v1i1_store(<32 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v32i1_broadcast_31_v2i1_store(<32 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_31_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $30, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -1110,7 +1110,7 @@ define void @load_v32i1_broadcast_31_v2i1_store(<32 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_31_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $30, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1128,7 +1128,7 @@ define void @load_v32i1_broadcast_31_v2i1_store(<32 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v32i1_broadcast_31_v4i1_store(<32 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_31_v4i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $28, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm0 @@ -1138,7 +1138,7 @@ define void @load_v32i1_broadcast_31_v4i1_store(<32 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_31_v4i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $28, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1156,7 +1156,7 @@ define void @load_v32i1_broadcast_31_v4i1_store(<32 x i1>* %a0,<4 x i1>* %a1) { } define void @load_v32i1_broadcast_31_v8i1_store(<32 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-LABEL: load_v32i1_broadcast_31_v8i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovd (%rdi), %k0 ; AVX512-NEXT: kshiftrd $24, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm0 @@ -1168,7 +1168,7 @@ define void @load_v32i1_broadcast_31_v8i1_store(<32 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v32i1_broadcast_31_v8i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovd (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrd $24, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm0, %zmm0, %zmm0 {%k1} {z} @@ -1187,14 +1187,14 @@ define void @load_v32i1_broadcast_31_v8i1_store(<32 x i1>* %a0,<8 x i1>* %a1) { } define void @load_v64i1_broadcast_32_v1i1_store(<64 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_32_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k0 ; AVX512NOTDQ-NEXT: kmovd %k0, %eax @@ -1207,7 +1207,7 @@ define void @load_v64i1_broadcast_32_v1i1_store(<64 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v64i1_broadcast_32_v2i1_store(<64 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_32_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -1217,7 +1217,7 @@ define void @load_v64i1_broadcast_32_v2i1_store(<64 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1235,7 +1235,7 @@ define void @load_v64i1_broadcast_32_v2i1_store(<64 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v64i1_broadcast_32_v4i1_store(<64 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_32_v4i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm0 @@ -1245,7 +1245,7 @@ define void @load_v64i1_broadcast_32_v4i1_store(<64 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v4i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1263,7 +1263,7 @@ define void @load_v64i1_broadcast_32_v4i1_store(<64 x i1>* %a0,<4 x i1>* %a1) { } define void @load_v64i1_broadcast_32_v8i1_store(<64 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_32_v8i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm0 @@ -1274,7 +1274,7 @@ define void @load_v64i1_broadcast_32_v8i1_store(<64 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v8i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm0, %zmm0, %zmm0 {%k1} {z} @@ -1292,7 +1292,7 @@ define void @load_v64i1_broadcast_32_v8i1_store(<64 x i1>* %a0,<8 x i1>* %a1) { } define void @load_v64i1_broadcast_32_v16i1_store(<64 x i1>* %a0,<16 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_32_v16i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $32, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %zmm0 @@ -1303,7 +1303,7 @@ define void @load_v64i1_broadcast_32_v16i1_store(<64 x i1>* %a0,<16 x i1>* %a1) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_32_v16i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $32, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 {%k1} {z} @@ -1320,14 +1320,14 @@ define void @load_v64i1_broadcast_32_v16i1_store(<64 x i1>* %a0,<16 x i1>* %a1) } define void @load_v64i1_broadcast_63_v1i1_store(<64 x i1>* %a0,<1 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_63_v1i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $63, %k0, %k0 ; AVX512-NEXT: kmovb %k0, (%rsi) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v1i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $63, %k0, %k0 ; AVX512NOTDQ-NEXT: kmovd %k0, %eax @@ -1340,7 +1340,7 @@ define void @load_v64i1_broadcast_63_v1i1_store(<64 x i1>* %a0,<1 x i1>* %a1) { } define void @load_v64i1_broadcast_63_v2i1_store(<64 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_63_v2i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $62, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %xmm0 @@ -1350,7 +1350,7 @@ define void @load_v64i1_broadcast_63_v2i1_store(<64 x i1>* %a0,<2 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v2i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $62, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1368,7 +1368,7 @@ define void @load_v64i1_broadcast_63_v2i1_store(<64 x i1>* %a0,<2 x i1>* %a1) { } define void @load_v64i1_broadcast_63_v4i1_store(<64 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_63_v4i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $60, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %xmm0 @@ -1378,7 +1378,7 @@ define void @load_v64i1_broadcast_63_v4i1_store(<64 x i1>* %a0,<4 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v4i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $60, %k0, %k1 ; AVX512NOTDQ-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 @@ -1396,7 +1396,7 @@ define void @load_v64i1_broadcast_63_v4i1_store(<64 x i1>* %a0,<4 x i1>* %a1) { } define void @load_v64i1_broadcast_63_v8i1_store(<64 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_63_v8i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $56, %k0, %k0 ; AVX512-NEXT: vpmovm2q %k0, %zmm0 @@ -1408,7 +1408,7 @@ define void @load_v64i1_broadcast_63_v8i1_store(<64 x i1>* %a0,<8 x i1>* %a1) { ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v8i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $56, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogq $255, %zmm0, %zmm0, %zmm0 {%k1} {z} @@ -1427,7 +1427,7 @@ define void @load_v64i1_broadcast_63_v8i1_store(<64 x i1>* %a0,<8 x i1>* %a1) { } define void @load_v64i1_broadcast_63_v16i1_store(<64 x i1>* %a0,<16 x i1>* %a1) { ; AVX512-LABEL: load_v64i1_broadcast_63_v16i1_store: -; AVX512: # BB#0: +; AVX512: # %bb.0: ; AVX512-NEXT: kmovq (%rdi), %k0 ; AVX512-NEXT: kshiftrq $48, %k0, %k0 ; AVX512-NEXT: vpmovm2d %k0, %zmm0 @@ -1439,7 +1439,7 @@ define void @load_v64i1_broadcast_63_v16i1_store(<64 x i1>* %a0,<16 x i1>* %a1) ; AVX512-NEXT: retq ; ; AVX512NOTDQ-LABEL: load_v64i1_broadcast_63_v16i1_store: -; AVX512NOTDQ: # BB#0: +; AVX512NOTDQ: # %bb.0: ; AVX512NOTDQ-NEXT: kmovq (%rdi), %k0 ; AVX512NOTDQ-NEXT: kshiftrq $48, %k0, %k1 ; AVX512NOTDQ-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 {%k1} {z} |