diff options
| author | Michael Zuckerman <Michael.zuckerman@intel.com> | 2016-02-28 07:39:34 +0000 |
|---|---|---|
| committer | Michael Zuckerman <Michael.zuckerman@intel.com> | 2016-02-28 07:39:34 +0000 |
| commit | 431b0e18b4c1e2a4cfcffd797b4f8b9581164da4 (patch) | |
| tree | 0e73d17c18b7172d7de9383f257fcd5dd1e86958 | |
| parent | 96836fc81c1580e50f920c7d97396e428846d0b9 (diff) | |
| download | bcm5719-llvm-431b0e18b4c1e2a4cfcffd797b4f8b9581164da4.tar.gz bcm5719-llvm-431b0e18b4c1e2a4cfcffd797b4f8b9581164da4.zip | |
[CLANG] [AVX512] [BUILTIN] Adding PSLL{V|W|Wi}{128|256|512} builtin
Differential Revision: http://reviews.llvm.org/D17685
llvm-svn: 262177
| -rw-r--r-- | clang/include/clang/Basic/BuiltinsX86.def | 14 | ||||
| -rw-r--r-- | clang/lib/Headers/avx512bwintrin.h | 80 | ||||
| -rw-r--r-- | clang/lib/Headers/avx512vlbwintrin.h | 126 | ||||
| -rw-r--r-- | clang/lib/Headers/avx512vlintrin.h | 87 | ||||
| -rw-r--r-- | clang/test/CodeGen/avx512bw-builtins.c | 54 | ||||
| -rw-r--r-- | clang/test/CodeGen/avx512vl-builtins.c | 49 | ||||
| -rw-r--r-- | clang/test/CodeGen/avx512vlbw-builtins.c | 87 |
7 files changed, 496 insertions, 1 deletions
diff --git a/clang/include/clang/Basic/BuiltinsX86.def b/clang/include/clang/Basic/BuiltinsX86.def index 31688581459..4951e3df207 100644 --- a/clang/include/clang/Basic/BuiltinsX86.def +++ b/clang/include/clang/Basic/BuiltinsX86.def @@ -1638,6 +1638,20 @@ TARGET_BUILTIN(__builtin_ia32_pshufhw128_mask, "V8sV8sIiV8sUc","","avx512bw,avx5 TARGET_BUILTIN(__builtin_ia32_pshufhw256_mask, "V16sV16sIiV16sUs","","avx512bw,avx512vl") TARGET_BUILTIN(__builtin_ia32_pshuflw128_mask, "V8sV8sIiV8sUc","","avx512bw,avx512vl") TARGET_BUILTIN(__builtin_ia32_pshuflw256_mask, "V16sV16sIiV16sUs","","avx512bw,avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllv32hi_mask, "V32sV32sV32sV32sUi","","avx512bw") +TARGET_BUILTIN(__builtin_ia32_psllw512_mask, "V32sV32sV8sV32sUi","","avx512bw") +TARGET_BUILTIN(__builtin_ia32_psllwi512_mask, "V32sV32sIiV32sUi","","avx512bw") +TARGET_BUILTIN(__builtin_ia32_psllv16hi_mask, "V16sV16sV16sV16sUs","","avx512bw,avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllv8hi_mask, "V8sV8sV8sV8sUc","","avx512bw,avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllw128_mask, "V8sV8sV8sV8sUc","","avx512bw,avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllw256_mask, "V16sV16sV8sV16sUs","","avx512bw,avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllwi128_mask, "V8sV8siV8sUc","","avx512bw,avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllwi256_mask, "V16sV16siV16sUs","","avx512bw,avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllv2di_mask, "V2LLiV2LLiV2LLiV2LLiUc","","avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllv4di_mask, "V4LLiV4LLiV4LLiV4LLiUc","","avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllv4si_mask, "V4iV4iV4iV4iUc","","avx512vl") +TARGET_BUILTIN(__builtin_ia32_psllv8si_mask, "V8iV8iV8iV8iUc","","avx512vl") + #undef BUILTIN #undef TARGET_BUILTIN diff --git a/clang/lib/Headers/avx512bwintrin.h b/clang/lib/Headers/avx512bwintrin.h index af4cdecf7d8..1eda6384528 100644 --- a/clang/lib/Headers/avx512bwintrin.h +++ b/clang/lib/Headers/avx512bwintrin.h @@ -1638,6 +1638,86 @@ __builtin_ia32_pshuflw512_mask ((__v32hi) (__A),\ (__mmask32)( __U));\ }) +static __inline__ __m512i __DEFAULT_FN_ATTRS +_mm512_sllv_epi16 (__m512i __A, __m512i __B) +{ + return (__m512i) __builtin_ia32_psllv32hi_mask ((__v32hi) __A, + (__v32hi) __B, + (__v32hi) + _mm512_setzero_hi (), + (__mmask32) -1); +} + +static __inline__ __m512i __DEFAULT_FN_ATTRS +_mm512_mask_sllv_epi16 (__m512i __W, __mmask32 __U, __m512i __A, + __m512i __B) +{ + return (__m512i) __builtin_ia32_psllv32hi_mask ((__v32hi) __A, + (__v32hi) __B, + (__v32hi) __W, + (__mmask32) __U); +} + +static __inline__ __m512i __DEFAULT_FN_ATTRS +_mm512_maskz_sllv_epi16 (__mmask32 __U, __m512i __A, __m512i __B) +{ + return (__m512i) __builtin_ia32_psllv32hi_mask ((__v32hi) __A, + (__v32hi) __B, + (__v32hi) + _mm512_setzero_hi (), + (__mmask32) __U); +} + +static __inline__ __m512i __DEFAULT_FN_ATTRS +_mm512_sll_epi16 (__m512i __A, __m128i __B) +{ + return (__m512i) __builtin_ia32_psllw512_mask ((__v32hi) __A, + (__v8hi) __B, + (__v32hi) + _mm512_setzero_hi (), + (__mmask32) -1); +} + +static __inline__ __m512i __DEFAULT_FN_ATTRS +_mm512_mask_sll_epi16 (__m512i __W, __mmask32 __U, __m512i __A, + __m128i __B) +{ + return (__m512i) __builtin_ia32_psllw512_mask ((__v32hi) __A, + (__v8hi) __B, + (__v32hi) __W, + (__mmask32) __U); +} + +static __inline__ __m512i __DEFAULT_FN_ATTRS +_mm512_maskz_sll_epi16 (__mmask32 __U, __m512i __A, __m128i __B) +{ + return (__m512i) __builtin_ia32_psllw512_mask ((__v32hi) __A, + (__v8hi) __B, + (__v32hi) + _mm512_setzero_hi (), + (__mmask32) __U); +} + +#define _mm512_slli_epi16( __A, __B) __extension__ ({ \ +__builtin_ia32_psllwi512_mask ((__v32hi)( __A),( __B),\ + (__v32hi)\ + _mm512_setzero_hi (),\ + (__mmask32) -1);\ +}) + +#define _mm512_mask_slli_epi16( __W, __U, __A, __B) __extension__ ({ \ +__builtin_ia32_psllwi512_mask ((__v32hi)( __A),( __B),\ + (__v32hi)( __W),\ + (__mmask32)( __U));\ +}) + +#define _mm512_maskz_slli_epi16( __U, __A, __B) __extension__ ({ \ +__builtin_ia32_psllwi512_mask ((__v32hi)( __A),( __B),\ + (__v32hi)\ + _mm512_setzero_hi (),\ + (__mmask32)( __U));\ +}) + #undef __DEFAULT_FN_ATTRS #endif diff --git a/clang/lib/Headers/avx512vlbwintrin.h b/clang/lib/Headers/avx512vlbwintrin.h index fe4b1d67444..831ca8a6d3a 100644 --- a/clang/lib/Headers/avx512vlbwintrin.h +++ b/clang/lib/Headers/avx512vlbwintrin.h @@ -2467,6 +2467,132 @@ __builtin_ia32_pshuflw256_mask ((__v16hi) (__A),\ (__mmask16)( __U));\ }) +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_sllv_epi16 (__m256i __A, __m256i __B) +{ + return (__m256i) __builtin_ia32_psllv16hi_mask ((__v16hi) __A, + (__v16hi) __B, + (__v16hi) + _mm256_setzero_si256 (), + (__mmask16) -1); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_mask_sllv_epi16 (__m256i __W, __mmask16 __U, __m256i __A, + __m256i __B) +{ + return (__m256i) __builtin_ia32_psllv16hi_mask ((__v16hi) __A, + (__v16hi) __B, + (__v16hi) __W, + (__mmask16) __U); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_maskz_sllv_epi16 (__mmask16 __U, __m256i __A, __m256i __B) +{ + return (__m256i) __builtin_ia32_psllv16hi_mask ((__v16hi) __A, + (__v16hi) __B, + (__v16hi) + _mm256_setzero_si256 (), + (__mmask16) __U); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_sllv_epi16 (__m128i __A, __m128i __B) +{ + return (__m128i) __builtin_ia32_psllv8hi_mask ((__v8hi) __A, + (__v8hi) __B, + (__v8hi) + _mm_setzero_hi (), + (__mmask8) -1); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_mask_sllv_epi16 (__m128i __W, __mmask8 __U, __m128i __A, + __m128i __B) +{ + return (__m128i) __builtin_ia32_psllv8hi_mask ((__v8hi) __A, + (__v8hi) __B, + (__v8hi) __W, + (__mmask8) __U); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_maskz_sllv_epi16 (__mmask8 __U, __m128i __A, __m128i __B) +{ + return (__m128i) __builtin_ia32_psllv8hi_mask ((__v8hi) __A, + (__v8hi) __B, + (__v8hi) + _mm_setzero_si128 (), + (__mmask8) __U); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_mask_sll_epi16 (__m128i __W, __mmask8 __U, __m128i __A, + __m128i __B) +{ + return (__m128i) __builtin_ia32_psllw128_mask ((__v8hi) __A, + (__v8hi) __B, + (__v8hi) __W, + (__mmask8) __U); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_maskz_sll_epi16 (__mmask8 __U, __m128i __A, __m128i __B) +{ + return (__m128i) __builtin_ia32_psllw128_mask ((__v8hi) __A, + (__v8hi) __B, + (__v8hi) + _mm_setzero_si128 (), + (__mmask8) __U); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_mask_sll_epi16 (__m256i __W, __mmask16 __U, __m256i __A, + __m128i __B) +{ + return (__m256i) __builtin_ia32_psllw256_mask ((__v16hi) __A, + (__v8hi) __B, + (__v16hi) __W, + (__mmask16) __U); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_maskz_sll_epi16 (__mmask16 __U, __m256i __A, __m128i __B) +{ + return (__m256i) __builtin_ia32_psllw256_mask ((__v16hi) __A, + (__v8hi) __B, + (__v16hi) + _mm256_setzero_si256 (), + (__mmask16) __U); +} + +#define _mm_mask_slli_epi16( __W, __U, __A, __B) __extension__ ({ \ +__builtin_ia32_psllwi128_mask ((__v8hi)( __A),( __B),\ + (__v8hi)( __W),\ + (__mmask8)( __U));\ +}) + +#define _mm_maskz_slli_epi16( __U, __A, __B) __extension__ ({ \ +__builtin_ia32_psllwi128_mask ((__v8hi)( __A),( __B),\ + (__v8hi)\ + _mm_setzero_si128 (),\ + (__mmask8)( __U));\ +}) + +#define _mm256_mask_slli_epi16( __W, __U, __A, __B) __extension__ ({ \ +__builtin_ia32_psllwi256_mask ((__v16hi)( __A),( __B),\ + (__v16hi)( __W),\ + (__mmask16)( __U));\ +}) + +#define _mm256_maskz_slli_epi16( __U, __A, __B) __extension__ ({ \ +__builtin_ia32_psllwi256_mask ((__v16hi)( __A),( __B),\ + (__v16hi)\ + _mm256_setzero_si256 (),\ + (__mmask16)( __U));\ +}) + #undef __DEFAULT_FN_ATTRS #endif /* __AVX512VLBWINTRIN_H */ diff --git a/clang/lib/Headers/avx512vlintrin.h b/clang/lib/Headers/avx512vlintrin.h index 6f938c4b434..dda0f2854b0 100644 --- a/clang/lib/Headers/avx512vlintrin.h +++ b/clang/lib/Headers/avx512vlintrin.h @@ -5336,6 +5336,93 @@ _mm256_maskz_rorv_epi64 (__mmask8 __U, __m256i __A, __m256i __B) (__mmask8) __U); } +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_mask_sllv_epi64 (__m128i __W, __mmask8 __U, __m128i __X, + __m128i __Y) +{ + return (__m128i) __builtin_ia32_psllv2di_mask ((__v2di) __X, + (__v2di) __Y, + (__v2di) __W, + (__mmask8) __U); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_maskz_sllv_epi64 (__mmask8 __U, __m128i __X, __m128i __Y) +{ + return (__m128i) __builtin_ia32_psllv2di_mask ((__v2di) __X, + (__v2di) __Y, + (__v2di) + _mm_setzero_di (), + (__mmask8) __U); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_mask_sllv_epi64 (__m256i __W, __mmask8 __U, __m256i __X, + __m256i __Y) +{ + return (__m256i) __builtin_ia32_psllv4di_mask ((__v4di) __X, + (__v4di) __Y, + (__v4di) __W, + (__mmask8) __U); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_maskz_sllv_epi64 (__mmask8 __U, __m256i __X, __m256i __Y) +{ + return (__m256i) __builtin_ia32_psllv4di_mask ((__v4di) __X, + (__v4di) __Y, + (__v4di) + _mm256_setzero_si256 (), + (__mmask8) __U); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_mask_sllv_epi32 (__m128i __W, __mmask8 __U, __m128i __X, + __m128i __Y) +{ + return (__m128i) __builtin_ia32_psllv4si_mask ((__v4si) __X, + (__v4si) __Y, + (__v4si) __W, + (__mmask8) __U); +} + +static __inline__ __m128i __DEFAULT_FN_ATTRS +_mm_maskz_sllv_epi32 (__mmask8 __U, __m128i __X, __m128i __Y) +{ + return (__m128i) __builtin_ia32_psllv4si_mask ((__v4si) __X, + (__v4si) __Y, + (__v4si) + _mm_setzero_si128 (), + (__mmask8) __U); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_mask_sllv_epi32 (__m256i __W, __mmask8 __U, __m256i __X, + __m256i __Y) +{ + return (__m256i) __builtin_ia32_psllv8si_mask ((__v8si) __X, + (__v8si) __Y, + (__v8si) __W, + (__mmask8) __U); +} + +static __inline__ __m256i __DEFAULT_FN_ATTRS +_mm256_maskz_sllv_epi32 (__mmask8 __U, __m256i __X, __m256i __Y) +{ + return (__m256i) __builtin_ia32_psllv8si_mask ((__v8si) __X, + (__v8si) __Y, + (__v8si) + _mm256_setzero_si256 (), + (__mmask8) __U); +} + +#define _mm256_maskz_sllv_epi32( __U, __X, __Y) __extension__ ({ \ +__builtin_ia32_psllv8si_mask ((__v8si)( __X),\ + (__v8si)( __Y),\ + (__v8si)\ + _mm256_setzero_si256 (),\ + (__mmask8)( __U));\ +}) #undef __DEFAULT_FN_ATTRS #undef __DEFAULT_FN_ATTRS_BOTH diff --git a/clang/test/CodeGen/avx512bw-builtins.c b/clang/test/CodeGen/avx512bw-builtins.c index 21984c2b988..8520f969e05 100644 --- a/clang/test/CodeGen/avx512bw-builtins.c +++ b/clang/test/CodeGen/avx512bw-builtins.c @@ -1113,4 +1113,58 @@ __m512i test_mm512_maskz_shufflelo_epi16(__mmask32 __U, __m512i __A) { return _mm512_maskz_shufflelo_epi16(__U, __A, 5); } +__m512i test_mm512_sllv_epi16(__m512i __A, __m512i __B) { + // CHECK-LABEL: @test_mm512_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm512_sllv_epi16(__A, __B); +} + +__m512i test_mm512_mask_sllv_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B) { + // CHECK-LABEL: @test_mm512_mask_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm512_mask_sllv_epi16(__W, __U, __A, __B); +} + +__m512i test_mm512_maskz_sllv_epi16(__mmask32 __U, __m512i __A, __m512i __B) { + // CHECK-LABEL: @test_mm512_maskz_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm512_maskz_sllv_epi16(__U, __A, __B); +} + +__m512i test_mm512_sll_epi16(__m512i __A, __m128i __B) { + // CHECK-LABEL: @test_mm512_sll_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.w.512 + return _mm512_sll_epi16(__A, __B); +} + +__m512i test_mm512_mask_sll_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B) { + // CHECK-LABEL: @test_mm512_mask_sll_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.w.512 + return _mm512_mask_sll_epi16(__W, __U, __A, __B); +} + +__m512i test_mm512_maskz_sll_epi16(__mmask32 __U, __m512i __A, __m128i __B) { + // CHECK-LABEL: @test_mm512_maskz_sll_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.w.512 + return _mm512_maskz_sll_epi16(__U, __A, __B); +} + +__m512i test_mm512_slli_epi16(__m512i __A) { + // CHECK-LABEL: @test_mm512_slli_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.wi.512 + return _mm512_slli_epi16(__A, 5); +} + +__m512i test_mm512_mask_slli_epi16(__m512i __W, __mmask32 __U, __m512i __A) { + // CHECK-LABEL: @test_mm512_mask_slli_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.wi.512 + return _mm512_mask_slli_epi16(__W, __U, __A, 5); +} + +__m512i test_mm512_maskz_slli_epi16(__mmask32 __U, __m512i __A) { + // CHECK-LABEL: @test_mm512_maskz_slli_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.wi.512 + return _mm512_maskz_slli_epi16(__U, __A, 5); +} + diff --git a/clang/test/CodeGen/avx512vl-builtins.c b/clang/test/CodeGen/avx512vl-builtins.c index c8c48f35b07..f417aff23eb 100644 --- a/clang/test/CodeGen/avx512vl-builtins.c +++ b/clang/test/CodeGen/avx512vl-builtins.c @@ -3683,3 +3683,52 @@ __m256i test_mm256_maskz_rorv_epi64(__mmask8 __U, __m256i __A, __m256i __B) { // CHECK: @llvm.x86.avx512.mask.prorv.q.256 return _mm256_maskz_rorv_epi64(__U, __A, __B); } + +__m128i test_mm_mask_sllv_epi64(__m128i __W, __mmask8 __U, __m128i __X, __m128i __Y) { + // CHECK-LABEL: @test_mm_mask_sllv_epi64 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm_mask_sllv_epi64(__W, __U, __X, __Y); +} + +__m128i test_mm_maskz_sllv_epi64(__mmask8 __U, __m128i __X, __m128i __Y) { + // CHECK-LABEL: @test_mm_maskz_sllv_epi64 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm_maskz_sllv_epi64(__U, __X, __Y); +} + +__m256i test_mm256_mask_sllv_epi64(__m256i __W, __mmask8 __U, __m256i __X, __m256i __Y) { + // CHECK-LABEL: @test_mm256_mask_sllv_epi64 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm256_mask_sllv_epi64(__W, __U, __X, __Y); +} + +__m256i test_mm256_maskz_sllv_epi64(__mmask8 __U, __m256i __X, __m256i __Y) { + // CHECK-LABEL: @test_mm256_maskz_sllv_epi64 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm256_maskz_sllv_epi64(__U, __X, __Y); +} + +__m128i test_mm_mask_sllv_epi32(__m128i __W, __mmask8 __U, __m128i __X, __m128i __Y) { + // CHECK-LABEL: @test_mm_mask_sllv_epi32 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm_mask_sllv_epi32(__W, __U, __X, __Y); +} + +__m128i test_mm_maskz_sllv_epi32(__mmask8 __U, __m128i __X, __m128i __Y) { + // CHECK-LABEL: @test_mm_maskz_sllv_epi32 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm_maskz_sllv_epi32(__U, __X, __Y); +} + +__m256i test_mm256_mask_sllv_epi32(__m256i __W, __mmask8 __U, __m256i __X, __m256i __Y) { + // CHECK-LABEL: @test_mm256_mask_sllv_epi32 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm256_mask_sllv_epi32(__W, __U, __X, __Y); +} + +__m256i test_mm256_maskz_sllv_epi32(__mmask8 __U, __m256i __X, __m256i __Y) { + // CHECK-LABEL: @test_mm256_maskz_sllv_epi32 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm256_maskz_sllv_epi32(__U, __X, __Y); +} + diff --git a/clang/test/CodeGen/avx512vlbw-builtins.c b/clang/test/CodeGen/avx512vlbw-builtins.c index bdc486ff5ba..4a002447621 100644 --- a/clang/test/CodeGen/avx512vlbw-builtins.c +++ b/clang/test/CodeGen/avx512vlbw-builtins.c @@ -1871,4 +1871,89 @@ __m256i test_mm256_maskz_cvtepu8_epi16(__mmask16 __U, __m128i __A) { // CHECK-LABEL: @test_mm256_maskz_cvtepu8_epi16 // CHECK: @llvm.x86.avx512.mask.pmovzxb.w.256 return _mm256_maskz_cvtepu8_epi16(__U, __A); -}
\ No newline at end of file +} + +__m256i test_mm256_sllv_epi16(__m256i __A, __m256i __B) { + // CHECK-LABEL: @test_mm256_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm256_sllv_epi16(__A, __B); +} + +__m256i test_mm256_mask_sllv_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) { + // CHECK-LABEL: @test_mm256_mask_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm256_mask_sllv_epi16(__W, __U, __A, __B); +} + +__m256i test_mm256_maskz_sllv_epi16(__mmask16 __U, __m256i __A, __m256i __B) { + // CHECK-LABEL: @test_mm256_maskz_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm256_maskz_sllv_epi16(__U, __A, __B); +} + +__m128i test_mm_sllv_epi16(__m128i __A, __m128i __B) { + // CHECK-LABEL: @test_mm_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm_sllv_epi16(__A, __B); +} + +__m128i test_mm_mask_sllv_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) { + // CHECK-LABEL: @test_mm_mask_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm_mask_sllv_epi16(__W, __U, __A, __B); +} + +__m128i test_mm_maskz_sllv_epi16(__mmask8 __U, __m128i __A, __m128i __B) { + // CHECK-LABEL: @test_mm_maskz_sllv_epi16 + // CHECK: @llvm.x86.avx512.mask.psllv + return _mm_maskz_sllv_epi16(__U, __A, __B); +} + +__m128i test_mm_mask_sll_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) { + // CHECK-LABEL: @test_mm_mask_sll_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.w.128 + return _mm_mask_sll_epi16(__W, __U, __A, __B); +} + +__m128i test_mm_maskz_sll_epi16(__mmask8 __U, __m128i __A, __m128i __B) { + // CHECK-LABEL: @test_mm_maskz_sll_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.w.128 + return _mm_maskz_sll_epi16(__U, __A, __B); +} + +__m256i test_mm256_mask_sll_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m128i __B) { + // CHECK-LABEL: @test_mm256_mask_sll_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.w.256 + return _mm256_mask_sll_epi16(__W, __U, __A, __B); +} + +__m256i test_mm256_maskz_sll_epi16(__mmask16 __U, __m256i __A, __m128i __B) { + // CHECK-LABEL: @test_mm256_maskz_sll_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.w.256 + return _mm256_maskz_sll_epi16(__U, __A, __B); +} + +__m128i test_mm_mask_slli_epi16(__m128i __W, __mmask8 __U, __m128i __A) { + // CHECK-LABEL: @test_mm_mask_slli_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.wi.128 + return _mm_mask_slli_epi16(__W, __U, __A, 5); +} + +__m128i test_mm_maskz_slli_epi16(__mmask8 __U, __m128i __A) { + // CHECK-LABEL: @test_mm_maskz_slli_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.wi.128 + return _mm_maskz_slli_epi16(__U, __A, 5); +} + +__m256i test_mm256_mask_slli_epi16(__m256i __W, __mmask16 __U, __m256i __A) { + // CHECK-LABEL: @test_mm256_mask_slli_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.wi.256 + return _mm256_mask_slli_epi16(__W, __U, __A, 5); +} + +__m256i test_mm256_maskz_slli_epi16(__mmask16 __U, __m256i __A) { + // CHECK-LABEL: @test_mm256_maskz_slli_epi16 + // CHECK: @llvm.x86.avx512.mask.psll.wi.256 + return _mm256_maskz_slli_epi16(__U, __A, 5); +} + |

