diff options
| author | Bruno Cardoso Lopes <bruno.cardoso@gmail.com> | 2010-08-10 02:23:54 +0000 |
|---|---|---|
| committer | Bruno Cardoso Lopes <bruno.cardoso@gmail.com> | 2010-08-10 02:23:54 +0000 |
| commit | 3d3fc1d075ce824a9b924835c5274bcb4e1961e5 (patch) | |
| tree | 5eea503f32c89beb65105489aaa076bb49700eb9 | |
| parent | 85da72a88fdd3ddcdf20a0d8c0850fa6c91690cc (diff) | |
| download | bcm5719-llvm-3d3fc1d075ce824a9b924835c5274bcb4e1961e5.tar.gz bcm5719-llvm-3d3fc1d075ce824a9b924835c5274bcb4e1961e5.zip | |
Make the replicate intrinsics use shufflevector instead of the dup builtins, and remove the now-unused dup builtins.
llvm-svn: 110646
| -rw-r--r-- | clang/include/clang/Basic/BuiltinsX86.def | 3 | ||||
| -rw-r--r-- | clang/lib/Headers/avxintrin.h | 6 | ||||
| -rw-r--r-- | clang/test/CodeGen/builtins-x86.c | 3 |
3 files changed, 3 insertions, 9 deletions
```diff
diff --git a/clang/include/clang/Basic/BuiltinsX86.def b/clang/include/clang/Basic/BuiltinsX86.def
index db8968f484f..26f4ce4884a 100644
--- a/clang/include/clang/Basic/BuiltinsX86.def
+++ b/clang/include/clang/Basic/BuiltinsX86.def
@@ -371,9 +371,6 @@ BUILTIN(__builtin_ia32_vpermilps256, "V8fV8fc", "")
 BUILTIN(__builtin_ia32_vinsertf128_pd256, "V4dV4dV2dc", "")
 BUILTIN(__builtin_ia32_vinsertf128_ps256, "V8fV8fV4fc", "")
 BUILTIN(__builtin_ia32_vinsertf128_si256, "V8iV8iV4ic", "")
-BUILTIN(__builtin_ia32_movshdup256, "V8fV8f", "")
-BUILTIN(__builtin_ia32_movsldup256, "V8fV8f", "")
-BUILTIN(__builtin_ia32_movddup256, "V4dV4d", "")
 BUILTIN(__builtin_ia32_sqrtpd256, "V4dV4d", "")
 BUILTIN(__builtin_ia32_sqrtps256, "V8fV8f", "")
 BUILTIN(__builtin_ia32_sqrtps_nr256, "V8fV8f", "")
diff --git a/clang/lib/Headers/avxintrin.h b/clang/lib/Headers/avxintrin.h
index 95deed4b91c..719ca8f9125 100644
--- a/clang/lib/Headers/avxintrin.h
+++ b/clang/lib/Headers/avxintrin.h
@@ -577,19 +577,19 @@ _mm256_cvttps_epi32(__m256 a)
 static __inline __m256 __attribute__((__always_inline__, __nodebug__))
 _mm256_movehdup_ps(__m256 a)
 {
-  return (__m256)__builtin_ia32_movshdup256((__v8sf)a);
+  return __builtin_shufflevector(a, a, 1, 1, 3, 3, 5, 5, 7, 7);
 }
 
 static __inline __m256 __attribute__((__always_inline__, __nodebug__))
 _mm256_moveldup_ps(__m256 a)
 {
-  return (__m256)__builtin_ia32_movsldup256((__v8sf)a);
+  return __builtin_shufflevector(a, a, 0, 0, 2, 2, 4, 4, 6, 6);
 }
 
 static __inline __m256d __attribute__((__always_inline__, __nodebug__))
 _mm256_movedup_pd(__m256d a)
 {
-  return (__m256d)__builtin_ia32_movddup256((__v4df)a);
+  return __builtin_shufflevector(a, a, 0, 0, 2, 2);
 }
 
 /* Unpack and Interleave */
diff --git a/clang/test/CodeGen/builtins-x86.c b/clang/test/CodeGen/builtins-x86.c
index 287de997fab..3be7a39ecdd 100644
--- a/clang/test/CodeGen/builtins-x86.c
+++ b/clang/test/CodeGen/builtins-x86.c
@@ -434,9 +434,6 @@ void f0() {
   tmp_V4d = __builtin_ia32_vinsertf128_pd256(tmp_V4d, tmp_V2d, 0x7);
   tmp_V8f = __builtin_ia32_vinsertf128_ps256(tmp_V8f, tmp_V4f, 0x7);
   tmp_V8i = __builtin_ia32_vinsertf128_si256(tmp_V8i, tmp_V4i, 0x7);
-  tmp_V8f = __builtin_ia32_movshdup256(tmp_V8f);
-  tmp_V8f = __builtin_ia32_movsldup256(tmp_V8f);
-  tmp_V4d = __builtin_ia32_movddup256(tmp_V4d);
   tmp_V4d = __builtin_ia32_sqrtpd256(tmp_V4d);
   tmp_V8f = __builtin_ia32_sqrtps256(tmp_V8f);
   tmp_V8f = __builtin_ia32_sqrtps_nr256(tmp_V8f);
```

