diff options
-rw-r--r-- | libclc/r600/lib/SOURCES | 1 | ||||
-rw-r--r-- | libclc/r600/lib/math/fmax.cl | 29 |
2 files changed, 30 insertions, 0 deletions
diff --git a/libclc/r600/lib/SOURCES b/libclc/r600/lib/SOURCES index 284052c694b..132b1519104 100644 --- a/libclc/r600/lib/SOURCES +++ b/libclc/r600/lib/SOURCES @@ -1,3 +1,4 @@ +math/fmax.cl synchronization/barrier_impl.ll workitem/get_global_offset.cl workitem/get_group_id.cl diff --git a/libclc/r600/lib/math/fmax.cl b/libclc/r600/lib/math/fmax.cl new file mode 100644 index 00000000000..e4b9e4c821f --- /dev/null +++ b/libclc/r600/lib/math/fmax.cl @@ -0,0 +1,29 @@ +#include <clc/clc.h> + +#include "../../../generic/lib/clcmacro.h" +#include "../../../generic/lib/math/math.h" + +_CLC_DEF _CLC_OVERLOAD float fmax(float x, float y) +{ + /* Flush denormals if not enabled. Otherwise fmax instruction flushes + * the values for comparison, but outputs original denormal */ + x = __clc_flush_denormal_if_not_supported(x); + y = __clc_flush_denormal_if_not_supported(y); + return __builtin_fmaxf(x, y); +} +_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, fmax, float, float) + +#ifdef cl_khr_fp64 + +#pragma OPENCL EXTENSION cl_khr_fp64 : enable + +_CLC_DEF _CLC_OVERLOAD double fmax(double x, double y) +{ + return __builtin_fmax(x, y); +} +_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, fmax, double, double) + +#endif + +#define __CLC_BODY <../../../generic/lib/math/fmax.inc> +#include <clc/math/gentype.inc> |