diff options
Diffstat (limited to 'llvm/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll')
| -rw-r--r-- | llvm/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll | 32 |
1 files changed, 16 insertions, 16 deletions
diff --git a/llvm/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll b/llvm/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll index e550653518d..b68f609fc65 100644 --- a/llvm/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll +++ b/llvm/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll @@ -51,7 +51,7 @@ define <8 x double> @combine_permvar_8f64_identity_mask(<8 x double> %x0, <8 x d ; ; X64-LABEL: combine_permvar_8f64_identity_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovapd {{.*#+}} zmm2 = [7,6,5,4,3,2,1,0] ; X64-NEXT: vpermpd %zmm0, %zmm2, %zmm1 {%k1} ; X64-NEXT: vmovapd {{.*#+}} zmm0 = [7,14,5,12,3,10,1,8] @@ -89,7 +89,7 @@ define <8 x i64> @combine_permvar_8i64_identity_mask(<8 x i64> %x0, <8 x i64> %x ; ; X64-LABEL: combine_permvar_8i64_identity_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovdqa64 {{.*#+}} zmm2 = [7,6,5,4,3,2,1,0] ; X64-NEXT: vpermq %zmm0, %zmm2, %zmm1 {%k1} ; X64-NEXT: vmovdqa64 {{.*#+}} zmm0 = [7,14,5,12,3,10,1,8] @@ -126,7 +126,7 @@ define <8 x double> @combine_vpermt2var_8f64_identity_mask(<8 x double> %x0, <8 ; ; X64-LABEL: combine_vpermt2var_8f64_identity_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovapd {{.*#+}} zmm2 = [7,6,5,4,3,2,1,0] ; X64-NEXT: vpermi2pd %zmm1, %zmm0, %zmm2 {%k1} {z} ; X64-NEXT: vmovapd {{.*#+}} zmm0 = [7,14,5,12,3,10,1,8] @@ -175,7 +175,7 @@ define <8 x double> @combine_vpermt2var_8f64_movddup_mask(<8 x double> %x0, <8 x ; ; X64-LABEL: combine_vpermt2var_8f64_movddup_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovddup {{.*#+}} zmm0 {%k1} {z} = zmm0[0,0,2,2,4,4,6,6] ; X64-NEXT: retq %res0 = call <8 x double> @llvm.x86.avx512.maskz.vpermt2var.pd.512(<8 x i64> <i64 0, i64 0, i64 2, i64 2, i64 4, i64 4, i64 6, i64 6>, <8 x double> %x0, <8 x double> %x1, i8 %m) @@ -207,7 +207,7 @@ define <8 x i64> @combine_vpermt2var_8i64_identity_mask(<8 x i64> %x0, <8 x i64> ; ; X64-LABEL: combine_vpermt2var_8i64_identity_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovdqa64 {{.*#+}} zmm2 = [7,6,5,4,3,2,1,0] ; X64-NEXT: vpermi2q %zmm1, %zmm0, %zmm2 {%k1} {z} ; X64-NEXT: vmovdqa64 {{.*#+}} zmm0 = [7,14,5,12,3,10,1,8] @@ -242,7 +242,7 @@ define <16 x float> @combine_vpermt2var_16f32_identity_mask(<16 x float> %x0, <1 ; ; X64-LABEL: combine_vpermt2var_16f32_identity_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovaps {{.*#+}} zmm2 = [15,14,13,12,11,10,9,8,7,6,5,4,3,2,1,0] ; X64-NEXT: vpermi2ps %zmm1, %zmm0, %zmm2 {%k1} {z} ; X64-NEXT: vmovaps {{.*#+}} zmm0 = [15,30,13,28,11,26,9,24,7,22,5,20,3,18,1,16] @@ -299,7 +299,7 @@ define <16 x float> @combine_vpermt2var_16f32_vmovddup_mask(<16 x float> %x0, <1 ; ; X64-LABEL: combine_vpermt2var_16f32_vmovddup_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovaps {{.*#+}} zmm2 = [0,1,0,1,4,5,4,5,8,9,8,9,12,13,12,13] ; X64-NEXT: vpermt2ps %zmm1, %zmm2, %zmm0 {%k1} {z} ; X64-NEXT: retq @@ -319,7 +319,7 @@ define <16 x float> @combine_vpermt2var_16f32_vmovddup_mask_load(<16 x float> *% ; ; X64-LABEL: combine_vpermt2var_16f32_vmovddup_mask_load: ; X64: # BB#0: -; X64-NEXT: kmovw %esi, %k1 +; X64-NEXT: kmovd %esi, %k1 ; X64-NEXT: vmovaps (%rdi), %zmm2 ; X64-NEXT: vmovaps {{.*#+}} zmm1 = [0,1,0,1,4,5,4,5,8,9,8,9,12,13,12,13] ; X64-NEXT: vpermi2ps %zmm0, %zmm2, %zmm1 {%k1} {z} @@ -367,7 +367,7 @@ define <16 x float> @combine_vpermt2var_16f32_vmovshdup_mask(<16 x float> %x0, < ; ; X64-LABEL: combine_vpermt2var_16f32_vmovshdup_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovshdup {{.*#+}} zmm0 {%k1} {z} = zmm0[1,1,3,3,5,5,7,7,9,9,11,11,13,13,15,15] ; X64-NEXT: retq %res0 = call <16 x float> @llvm.x86.avx512.maskz.vpermt2var.ps.512(<16 x i32> <i32 1, i32 1, i32 3, i32 3, i32 5, i32 5, i32 7, i32 7, i32 9, i32 9, i32 11, i32 11, i32 13, i32 13, i32 15, i32 15>, <16 x float> %x0, <16 x float> %x1, i16 %m) @@ -411,7 +411,7 @@ define <16 x float> @combine_vpermt2var_16f32_vmovsldup_mask(<16 x float> %x0, < ; ; X64-LABEL: combine_vpermt2var_16f32_vmovsldup_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovsldup {{.*#+}} zmm0 {%k1} {z} = zmm0[0,0,2,2,4,4,6,6,8,8,10,10,12,12,14,14] ; X64-NEXT: retq %res0 = call <16 x float> @llvm.x86.avx512.maskz.vpermt2var.ps.512(<16 x i32> <i32 undef, i32 0, i32 undef, i32 2, i32 4, i32 4, i32 6, i32 6, i32 8, i32 8, i32 10, i32 10, i32 12, i32 12, i32 14, i32 14>, <16 x float> %x0, <16 x float> %x1, i16 %m) @@ -427,7 +427,7 @@ define <16 x float> @combine_vpermt2var_16f32_vmovsldup_mask_load(<16 x float> * ; ; X64-LABEL: combine_vpermt2var_16f32_vmovsldup_mask_load: ; X64: # BB#0: -; X64-NEXT: kmovw %esi, %k1 +; X64-NEXT: kmovd %esi, %k1 ; X64-NEXT: vmovsldup {{.*#+}} zmm0 {%k1} {z} = mem[0,0,2,2,4,4,6,6,8,8,10,10,12,12,14,14] ; X64-NEXT: retq %x0 = load <16 x float>, <16 x float> *%p0 @@ -472,7 +472,7 @@ define <16 x float> @combine_vpermt2var_16f32_vpermilps_mask(<16 x float> %x0, < ; ; X64-LABEL: combine_vpermt2var_16f32_vpermilps_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vpermilps {{.*#+}} zmm0 {%k1} {z} = zmm0[3,2,1,0,7,6,5,4,11,10,9,8,15,14,13,12] ; X64-NEXT: retq %res0 = call <16 x float> @llvm.x86.avx512.maskz.vpermt2var.ps.512(<16 x i32> <i32 3, i32 2, i32 1, i32 0, i32 7, i32 6, i32 5, i32 4, i32 11, i32 10, i32 9, i32 8, i32 15, i32 14, i32 13, i32 12>, <16 x float> %x0, <16 x float> %x1, i16 %m) @@ -488,7 +488,7 @@ define <16 x float> @combine_vpermt2var_16f32_vpermilps_mask_load(<16 x float> * ; ; X64-LABEL: combine_vpermt2var_16f32_vpermilps_mask_load: ; X64: # BB#0: -; X64-NEXT: kmovw %esi, %k1 +; X64-NEXT: kmovd %esi, %k1 ; X64-NEXT: vpermilps {{.*#+}} zmm0 {%k1} {z} = mem[3,2,1,0,7,6,5,4,11,10,9,8,15,14,13,12] ; X64-NEXT: retq %x0 = load <16 x float>, <16 x float> *%p0 @@ -520,7 +520,7 @@ define <16 x i32> @combine_vpermt2var_16i32_identity_mask(<16 x i32> %x0, <16 x ; ; X64-LABEL: combine_vpermt2var_16i32_identity_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vmovdqa32 {{.*#+}} zmm2 = [15,14,13,12,11,10,9,8,7,6,5,4,3,2,1,0] ; X64-NEXT: vpermi2d %zmm1, %zmm0, %zmm2 {%k1} {z} ; X64-NEXT: vmovdqa32 {{.*#+}} zmm0 = [15,30,13,28,11,26,9,24,7,22,5,20,3,18,1,16] @@ -675,7 +675,7 @@ define <8 x i64> @combine_permvar_8i64_as_permq_mask(<8 x i64> %x0, <8 x i64> %x ; ; X64-LABEL: combine_permvar_8i64_as_permq_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vpermq {{.*#+}} zmm1 {%k1} = zmm0[3,2,1,0,7,6,5,4] ; X64-NEXT: vmovdqa64 %zmm1, %zmm0 ; X64-NEXT: retq @@ -707,7 +707,7 @@ define <8 x double> @combine_permvar_8f64_as_permpd_mask(<8 x double> %x0, <8 x ; ; X64-LABEL: combine_permvar_8f64_as_permpd_mask: ; X64: # BB#0: -; X64-NEXT: kmovw %edi, %k1 +; X64-NEXT: kmovd %edi, %k1 ; X64-NEXT: vpermpd {{.*#+}} zmm1 {%k1} = zmm0[3,2,1,0,7,6,5,4] ; X64-NEXT: vmovapd %zmm1, %zmm0 ; X64-NEXT: retq |

