diff options
author | Craig Topper <craig.topper@gmail.com> | 2012-06-12 06:03:35 +0000 |
---|---|---|
committer | Craig Topper <craig.topper@gmail.com> | 2012-06-12 06:03:35 +0000 |
commit | db0fbf0a50dbe0fc2708f10bf5dd7dbe34bc1a7d (patch) | |
tree | 7c7c0bc9610428c6f0c19d63ca9bbec36a7b3429 | |
parent | 060f5d2c4c9399af3942529c5455da2950178f91 (diff) | |
download | bcm5719-llvm-db0fbf0a50dbe0fc2708f10bf5dd7dbe34bc1a7d.tar.gz bcm5719-llvm-db0fbf0a50dbe0fc2708f10bf5dd7dbe34bc1a7d.zip |
Add XOP permute intrinsics.
llvm-svn: 158351
-rw-r--r-- | clang/include/clang/Basic/BuiltinsX86.def | 4 | ||||
-rw-r--r-- | clang/lib/Headers/xopintrin.h | 28 | ||||
-rw-r--r-- | clang/test/CodeGen/xop-builtins.c | 20 |
3 files changed, 52 insertions, 0 deletions
diff --git a/clang/include/clang/Basic/BuiltinsX86.def b/clang/include/clang/Basic/BuiltinsX86.def index 285548582c1..936ebfae9a7 100644 --- a/clang/include/clang/Basic/BuiltinsX86.def +++ b/clang/include/clang/Basic/BuiltinsX86.def @@ -697,5 +697,9 @@ BUILTIN(__builtin_ia32_vpcomb, "V16cV16cV16cIc", "") BUILTIN(__builtin_ia32_vpcomw, "V8sV8sV8sIc", "") BUILTIN(__builtin_ia32_vpcomd, "V4iV4iV4iIc", "") BUILTIN(__builtin_ia32_vpcomq, "V2LLiV2LLiV2LLiIc", "") +BUILTIN(__builtin_ia32_vpermil2pd, "V2dV2dV2dV2LLiIc", "") +BUILTIN(__builtin_ia32_vpermil2pd256, "V4dV4dV4dV4LLiIc", "") +BUILTIN(__builtin_ia32_vpermil2ps, "V4fV4fV4fV4iIc", "") +BUILTIN(__builtin_ia32_vpermil2ps256, "V8fV8fV8fV8iIc", "") #undef BUILTIN diff --git a/clang/lib/Headers/xopintrin.h b/clang/lib/Headers/xopintrin.h index d9689cc57fb..a58a3ed3824 100644 --- a/clang/lib/Headers/xopintrin.h +++ b/clang/lib/Headers/xopintrin.h @@ -342,6 +342,34 @@ _mm_sha_epi64(__m128i __A, __m128i __B) __m128i __B = (B); \ (__m128i)__builtin_ia32_vpcomq((__v2di)__A, (__v2di)__B, (N)); }) +#define _mm_permute2_pd(X, Y, C, I) __extension__ ({ \ + __m128d __X = (X); \ + __m128d __Y = (Y); \ + __m128i __C = (C); \ + (__m128d)__builtin_ia32_vpermil2pd((__v2df)__X, (__v2df)__Y, \ + (__v2di)__C, (I)); }) + +#define _mm256_permute2_pd(X, Y, C, I) __extension__ ({ \ + __m256d __X = (X); \ + __m256d __Y = (Y); \ + __m256i __C = (C); \ + (__m256d)__builtin_ia32_vpermil2pd256((__v4df)__X, (__v4df)__Y, \ + (__v4di)__C, (I)); }) + +#define _mm_permute2_ps(X, Y, C, I) __extension__ ({ \ + __m128 __X = (X); \ + __m128 __Y = (Y); \ + __m128i __C = (C); \ + (__m128)__builtin_ia32_vpermil2ps((__v4sf)__X, (__v4sf)__Y, \ + (__v4si)__C, (I)); }) + +#define _mm256_permute2_ps(X, Y, C, I) __extension__ ({ \ + __m256 __X = (X); \ + __m256 __Y = (Y); \ + __m256i __C = (C); \ + (__m256)__builtin_ia32_vpermil2ps256((__v8sf)__X, (__v8sf)__Y, \ + (__v8si)__C, (I)); }) + #endif /* __XOP__ */ #endif /* __XOPINTRIN_H */ diff --git a/clang/test/CodeGen/xop-builtins.c b/clang/test/CodeGen/xop-builtins.c index 44042bd285c..083d371c84a 100644 --- a/clang/test/CodeGen/xop-builtins.c +++ b/clang/test/CodeGen/xop-builtins.c @@ -274,3 +274,23 @@ __m128i test_mm_com_epi64(__m128i a, __m128i b) { // CHECK: @llvm.x86.xop.vpcomq return _mm_com_epi64(a, b, 0); } + +__m128d test_mm_permute2_pd(__m128d a, __m128d b, __m128i c) { + // CHECK: @llvm.x86.xop.vpermil2pd + return _mm_permute2_pd(a, b, c, 0); +} + +__m256d test_mm256_permute2_pd(__m256d a, __m256d b, __m256i c) { + // CHECK: @llvm.x86.xop.vpermil2pd.256 + return _mm256_permute2_pd(a, b, c, 0); +} + +__m128 test_mm_permute2_ps(__m128 a, __m128 b, __m128i c) { + // CHECK: @llvm.x86.xop.vpermil2ps + return _mm_permute2_ps(a, b, c, 0); +} + +__m256 test_mm256_permute2_ps(__m256 a, __m256 b, __m256i c) { + // CHECK: @llvm.x86.xop.vpermil2ps.256 + return _mm256_permute2_ps(a, b, c, 0); +} |