diff options
author | Jan Vesely <jan.vesely@rutgers.edu> | 2018-03-08 23:00:58 +0000 |
---|---|---|
committer | Jan Vesely <jan.vesely@rutgers.edu> | 2018-03-08 23:00:58 +0000 |
commit | e724e346ab17ac82050ec667050dc7a44c653fac (patch) | |
tree | 6435ce45cbed935894bb22578d9f1ac7f86477b7 | |
parent | 9f103a1a27aba3610fbe4647e5aaa8e5d21a2b75 (diff) | |
download | bcm5719-llvm-e724e346ab17ac82050ec667050dc7a44c653fac.tar.gz bcm5719-llvm-e724e346ab17ac82050ec667050dc7a44c653fac.zip |
amdgcn/fmin: fcanonicalize operands
v_min instruction needs canonicalized operands.
Passes CTS on carrizo
Reviewer: Aaron Watry <awatry@gmail.com>
Signed-off-by: Jan Vesely <jan.vesely@rutgers.edu>
llvm-svn: 327075
-rw-r--r-- | libclc/amdgcn/lib/SOURCES | 1 | ||||
-rw-r--r-- | libclc/amdgcn/lib/math/fmin.cl | 31 |
2 files changed, 32 insertions, 0 deletions
diff --git a/libclc/amdgcn/lib/SOURCES b/libclc/amdgcn/lib/SOURCES index 6a5ce00dfb4..9cdc7b895ec 100644 --- a/libclc/amdgcn/lib/SOURCES +++ b/libclc/amdgcn/lib/SOURCES @@ -1,5 +1,6 @@ cl_khr_int64_extended_atomics/minmax_helpers.ll integer/popcount.cl +math/fmin.cl math/ldexp.cl mem_fence/fence.cl synchronization/barrier.cl diff --git a/libclc/amdgcn/lib/math/fmin.cl b/libclc/amdgcn/lib/math/fmin.cl new file mode 100644 index 00000000000..6a11785e3d4 --- /dev/null +++ b/libclc/amdgcn/lib/math/fmin.cl @@ -0,0 +1,31 @@ +#include <clc/clc.h> + +#include "../../../generic/lib/clcmacro.h" + +_CLC_DEF _CLC_OVERLOAD float fmin(float x, float y) +{ + /* fcanonicalize removes sNaNs and flushes denormals if not enabled. + * Otherwise fmin instruction flushes the values for comparison, + * but outputs original denormal */ + x = __builtin_canonicalizef(x); + y = __builtin_canonicalizef(y); + return __builtin_fminf(x, y); +} +_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, fmin, float, float) + +#ifdef cl_khr_fp64 + +#pragma OPENCL EXTENSION cl_khr_fp64 : enable + +_CLC_DEF _CLC_OVERLOAD double fmin(double x, double y) +{ + x = __builtin_canonicalizef(x); + y = __builtin_canonicalizef(y); + return __builtin_fminf(x, y); +} +_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, fmin, double, double) + +#endif + +#define __CLC_BODY <../../../generic/lib/math/fmin.inc> +#include <clc/math/gentype.inc> |