summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Michael Zuckerman <Michael.zuckerman@intel.com> 2016-06-14 13:45:17 +0000
committer Michael Zuckerman <Michael.zuckerman@intel.com> 2016-06-14 13:45:17 +0000
commit c49f6ce3e163132ac28e1b3ec90bf4701d8ea65b (patch)
tree f3df8dcc26211a3a1921cefdbf9d4eec22fc8750
parent 878c0b1b76aa5ce8526a50109bd382457eb68ec7 (diff)
download bcm5719-llvm-c49f6ce3e163132ac28e1b3ec90bf4701d8ea65b.tar.gz
bcm5719-llvm-c49f6ce3e163132ac28e1b3ec90bf4701d8ea65b.zip
[Clang][avx512][Intrinsics] adding prefetch gather intrinsics
Differential Revision: http://reviews.llvm.org/D21322
llvm-svn: 272667
-rw-r--r-- clang/lib/Headers/avx512pfintrin.h 19
-rw-r--r-- clang/test/CodeGen/avx512pf-builtins.c 24
2 files changed, 43 insertions, 0 deletions
diff --git a/clang/lib/Headers/avx512pfintrin.h b/clang/lib/Headers/avx512pfintrin.h
index 66c64f46152..c7fa3cf313e 100644
--- a/clang/lib/Headers/avx512pfintrin.h
+++ b/clang/lib/Headers/avx512pfintrin.h
@@ -35,21 +35,40 @@
__builtin_ia32_gatherpfdpd((__mmask8)(mask), (__v8si)(__m256i)(index), \
(long long const *)(addr), (int)(scale), \
(int)(hint)); })
+
+#define _mm512_prefetch_i32gather_pd(index, addr, scale, hint) __extension__ ({\
+ __builtin_ia32_gatherpfdpd((__mmask8) -1, (__v8si)(__m256i)(index), \
+ (long long const *)(addr), (int)(scale), \
+ (int)(hint)); })
#define _mm512_mask_prefetch_i32gather_ps(index, mask, addr, scale, hint) ({\
__builtin_ia32_gatherpfdps((__mmask16)(mask), \
(__v16si)(__m512i)(index), (int const *)(addr), \
(int)(scale), (int)(hint)); })
+#define _mm512_prefetch_i32gather_ps(index, addr, scale, hint) __extension__ ({\
+ __builtin_ia32_gatherpfdps((__mmask16) -1, \
+ (__v16si)(__m512i)(index), (int const *)(addr), \
+ (int)(scale), (int)(hint)); })
+
#define _mm512_mask_prefetch_i64gather_pd(index, mask, addr, scale, hint) __extension__ ({\
__builtin_ia32_gatherpfqpd((__mmask8)(mask), (__v8di)(__m512i)(index), \
(long long const *)(addr), (int)(scale), \
(int)(hint)); })
+#define _mm512_prefetch_i64gather_pd(index, addr, scale, hint) __extension__ ({\
+ __builtin_ia32_gatherpfqpd((__mmask8) -1, (__v8di)(__m512i)(index), \
+ (long long const *)(addr), (int)(scale), \
+ (int)(hint)); })
+
#define _mm512_mask_prefetch_i64gather_ps(index, mask, addr, scale, hint) ({\
__builtin_ia32_gatherpfqps((__mmask8)(mask), (__v8di)(__m512i)(index), \
(int const *)(addr), (int)(scale), (int)(hint)); })
+#define _mm512_prefetch_i64gather_ps(index, addr, scale, hint) __extension__ ({\
+ __builtin_ia32_gatherpfqps((__mmask8) -1, (__v8di)(__m512i)(index), \
+ (int const *)(addr), (int)(scale), (int)(hint)); })
+
#define _mm512_prefetch_i32scatter_pd(addr, index, scale, hint) __extension__ ({\
__builtin_ia32_scatterpfdpd((__mmask8)-1, (__v8si)(__m256i)(index), \
(long long *)(addr), (int)(scale), \
diff --git a/clang/test/CodeGen/avx512pf-builtins.c b/clang/test/CodeGen/avx512pf-builtins.c
index 91140f14946..16b27e91513 100644
--- a/clang/test/CodeGen/avx512pf-builtins.c
+++ b/clang/test/CodeGen/avx512pf-builtins.c
@@ -11,24 +11,48 @@ void test_mm512_mask_prefetch_i32gather_pd(__m256i index, __mmask8 mask, void co
return _mm512_mask_prefetch_i32gather_pd(index, mask, addr, 2, 1);
}
+void test_mm512_prefetch_i32gather_pd(__m256i index, void const *addr, int hint) {
+ // CHECK-LABEL: @test_mm512_prefetch_i32gather_pd
+ // CHECK: @llvm.x86.avx512.gatherpf.dpd
+ _mm512_prefetch_i32gather_pd(index, addr, 2, 1);
+}
+
void test_mm512_mask_prefetch_i32gather_ps(__m512i index, __mmask16 mask, void const *addr, int hint) {
// CHECK-LABEL: @test_mm512_mask_prefetch_i32gather_ps
// CHECK: @llvm.x86.avx512.gatherpf.dps
return _mm512_mask_prefetch_i32gather_ps(index, mask, addr, 2, 1);
}
+void test_mm512_prefetch_i32gather_ps(__m512i index, void const *addr, int hint) {
+ // CHECK-LABEL: @test_mm512_prefetch_i32gather_ps
+ // CHECK: @llvm.x86.avx512.gatherpf.dps
+ _mm512_prefetch_i32gather_ps(index, addr, 2, 1);
+}
+
void test_mm512_mask_prefetch_i64gather_pd(__m512i index, __mmask8 mask, void const *addr, int hint) {
// CHECK-LABEL: @test_mm512_mask_prefetch_i64gather_pd
// CHECK: @llvm.x86.avx512.gatherpf.qpd
return _mm512_mask_prefetch_i64gather_pd(index, mask, addr, 2, 1);
}
+void test_mm512_prefetch_i64gather_pd(__m512i index, void const *addr, int hint) {
+ // CHECK-LABEL: @test_mm512_prefetch_i64gather_pd
+ // CHECK: @llvm.x86.avx512.gatherpf.qpd
+ _mm512_prefetch_i64gather_pd(index, addr, 2, 1);
+}
+
void test_mm512_mask_prefetch_i64gather_ps(__m512i index, __mmask8 mask, void const *addr, int hint) {
// CHECK-LABEL: @test_mm512_mask_prefetch_i64gather_ps
// CHECK: @llvm.x86.avx512.gatherpf.qps
return _mm512_mask_prefetch_i64gather_ps(index, mask, addr, 2, 1);
}
+void test_mm512_prefetch_i64gather_ps(__m512i index, void const *addr, int hint) {
+ // CHECK-LABEL: @test_mm512_prefetch_i64gather_ps
+ // CHECK: @llvm.x86.avx512.gatherpf.qps
+ _mm512_prefetch_i64gather_ps(index, addr, 2, 1);
+}
+
void test_mm512_prefetch_i32scatter_pd(void *addr, __m256i index) {
// CHECK-LABEL: @test_mm512_prefetch_i32scatter_pd
// CHECK: @llvm.x86.avx512.scatterpf.dpd.512
OpenPOWER on IntegriCloud