summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorJan Vesely <jan.vesely@rutgers.edu>2018-03-08 23:00:58 +0000
committerJan Vesely <jan.vesely@rutgers.edu>2018-03-08 23:00:58 +0000
commite724e346ab17ac82050ec667050dc7a44c653fac (patch)
tree6435ce45cbed935894bb22578d9f1ac7f86477b7
parent9f103a1a27aba3610fbe4647e5aaa8e5d21a2b75 (diff)
downloadbcm5719-llvm-e724e346ab17ac82050ec667050dc7a44c653fac.tar.gz
bcm5719-llvm-e724e346ab17ac82050ec667050dc7a44c653fac.zip
amdgcn/fmin: fcanonicalize operands
v_min instruction needs canonicalized operands. Passes CTS on carrizo Reviewer: Aaron Watry <awatry@gmail.com> Signed-off-by: Jan Vesely <jan.vesely@rutgers.edu> llvm-svn: 327075
-rw-r--r--libclc/amdgcn/lib/SOURCES1
-rw-r--r--libclc/amdgcn/lib/math/fmin.cl31
2 files changed, 32 insertions, 0 deletions
diff --git a/libclc/amdgcn/lib/SOURCES b/libclc/amdgcn/lib/SOURCES
index 6a5ce00dfb4..9cdc7b895ec 100644
--- a/libclc/amdgcn/lib/SOURCES
+++ b/libclc/amdgcn/lib/SOURCES
@@ -1,5 +1,6 @@
cl_khr_int64_extended_atomics/minmax_helpers.ll
integer/popcount.cl
+math/fmin.cl
math/ldexp.cl
mem_fence/fence.cl
synchronization/barrier.cl
diff --git a/libclc/amdgcn/lib/math/fmin.cl b/libclc/amdgcn/lib/math/fmin.cl
new file mode 100644
index 00000000000..6a11785e3d4
--- /dev/null
+++ b/libclc/amdgcn/lib/math/fmin.cl
@@ -0,0 +1,31 @@
+#include <clc/clc.h>
+
+#include "../../../generic/lib/clcmacro.h"
+
+_CLC_DEF _CLC_OVERLOAD float fmin(float x, float y)
+{
+ /* fcanonicalize removes sNaNs and flushes denormals if not enabled.
+ * Otherwise fmin instruction flushes the values for comparison,
+ * but outputs original denormal */
+ x = __builtin_canonicalizef(x);
+ y = __builtin_canonicalizef(y);
+ return __builtin_fminf(x, y);
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, fmin, float, float)
+
+#ifdef cl_khr_fp64
+
+#pragma OPENCL EXTENSION cl_khr_fp64 : enable
+
+_CLC_DEF _CLC_OVERLOAD double fmin(double x, double y)
+{
+ x = __builtin_canonicalizef(x);
+ y = __builtin_canonicalizef(y);
+ return __builtin_fminf(x, y);
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, fmin, double, double)
+
+#endif
+
+#define __CLC_BODY <../../../generic/lib/math/fmin.inc>
+#include <clc/math/gentype.inc>
OpenPOWER on IntegriCloud