diff options
-rw-r--r-- | libclc/generic/include/clc/clc.h | 1 | ||||
-rw-r--r-- | libclc/generic/include/clc/math/tgamma.h | 3 | ||||
-rw-r--r-- | libclc/generic/include/clc/math/tgamma.inc | 1 | ||||
-rw-r--r-- | libclc/generic/lib/SOURCES | 1 | ||||
-rw-r--r-- | libclc/generic/lib/math/tgamma.cl | 71 |
5 files changed, 77 insertions, 0 deletions
diff --git a/libclc/generic/include/clc/clc.h b/libclc/generic/include/clc/clc.h index fecbd590779..5bdb09f8ffd 100644 --- a/libclc/generic/include/clc/clc.h +++ b/libclc/generic/include/clc/clc.h @@ -88,6 +88,7 @@ #include <clc/math/sqrt.h> #include <clc/math/tan.h> #include <clc/math/tanh.h> +#include <clc/math/tgamma.h> #include <clc/math/trunc.h> #include <clc/math/native_cos.h> #include <clc/math/native_divide.h> diff --git a/libclc/generic/include/clc/math/tgamma.h b/libclc/generic/include/clc/math/tgamma.h new file mode 100644 index 00000000000..a041d3219ac --- /dev/null +++ b/libclc/generic/include/clc/math/tgamma.h @@ -0,0 +1,3 @@ +#define __CLC_BODY <clc/math/tgamma.inc> +#include <clc/math/gentype.inc> +#undef __CLC_BODY diff --git a/libclc/generic/include/clc/math/tgamma.inc b/libclc/generic/include/clc/math/tgamma.inc new file mode 100644 index 00000000000..9f67fe457fb --- /dev/null +++ b/libclc/generic/include/clc/math/tgamma.inc @@ -0,0 +1 @@ +_CLC_OVERLOAD _CLC_DECL __CLC_GENTYPE tgamma(__CLC_GENTYPE a); diff --git a/libclc/generic/lib/SOURCES b/libclc/generic/lib/SOURCES index bcd09916e8a..423a50b4e95 100644 --- a/libclc/generic/lib/SOURCES +++ b/libclc/generic/lib/SOURCES @@ -119,6 +119,7 @@ math/clc_sqrt.cl math/sqrt.cl math/tan.cl math/tanh.cl +math/tgamma.cl relational/all.cl relational/any.cl relational/bitselect.cl diff --git a/libclc/generic/lib/math/tgamma.cl b/libclc/generic/lib/math/tgamma.cl new file mode 100644 index 00000000000..29c069fc925 --- /dev/null +++ b/libclc/generic/lib/math/tgamma.cl @@ -0,0 +1,71 @@ +/* + * Copyright (c) 2016 Aaron Watry + * Copyright (c) 2014 Advanced Micro Devices, Inc. 
+ * + * Permission is hereby granted, free of charge, to any person obtaining a copy + * of this software and associated documentation files (the "Software"), to deal + * in the Software without restriction, including without limitation the rights + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the Software is + * furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN + * THE SOFTWARE. + */ + +#include <clc/clc.h> + +#include "math.h" +#include "../clcmacro.h" + /* Scalar float tgamma(x). Computes g = exp(lgamma(fabs(x))) and returns it unchanged when the test x < 0.0f is false; when x < 0.0f, g is recomputed in the branch below from that value, fabs(x) and sinpi(x). */+_CLC_OVERLOAD _CLC_DEF float tgamma(float x) { + const float pi = 3.1415926535897932384626433832795f; + float ax = fabs(x); + float lg = lgamma(ax); + float g = exp(lg); + + if (x < 0.0f) { /* Negative x: g becomes pi / (exp(lgamma(ax)) * ax * sinpi(x)), which matches the reflection identity for the gamma function. A quotient equal to zero is then replaced by the PINFBITPATT_SP32 bit pattern, and afterwards z == 0 selects the QNANBITPATT_SP32 bit pattern, so the z == 0 case takes precedence. Both constants are defined outside this diff; presumably +infinity and a quiet NaN - confirm. NOTE(review): pi / g is zero only when the denominator is infinite or so large that the quotient rounds or flushes to zero, which looks like an underflow case rather than an overflow; confirm that returning the PINF pattern there is intended. */+ float z = sinpi(x); + g = g * ax * z; + g = pi / g; + g = g == 0 ? as_float(PINFBITPATT_SP32) : g; + g = z == 0 ? as_float(QNANBITPATT_SP32) : g; + } + + return g; +} + /* Vector float overloads: _CLC_UNARY_VECTORIZE is not defined in this diff (presumably it comes from ../clcmacro.h and builds the vector versions from the scalar function above) - confirm against the macro definition. */+_CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, tgamma, float); + /* Everything up to the matching #endif is compiled only when cl_khr_fp64 is defined. */+#ifdef cl_khr_fp64 + +#pragma OPENCL EXTENSION cl_khr_fp64 : enable + /* Scalar double tgamma(x). Same sequence of operations as the float overload, carried out in double and using the DP64 bit-pattern constants. */+_CLC_OVERLOAD _CLC_DEF double tgamma(double x) { + const double pi = 3.1415926535897932384626433832795; + double ax = fabs(x); + double lg = lgamma(ax); + double g = exp(lg); + + if (x < 0.0) { /* Negative x: g becomes pi / (exp(lgamma(ax)) * ax * sinpi(x)); a zero quotient is replaced by the PINFBITPATT_DP64 bit pattern and z == 0 then selects the QNANBITPATT_DP64 bit pattern (constants defined outside this diff; presumably +infinity and a quiet NaN - confirm). NOTE(review): the zero-quotient case arises when the denominator is infinite or extremely large; confirm the PINF result is intended there. */+ double z = sinpi(x); + g = g * ax * z; + g = pi / g; + g = g == 0 ? as_double(PINFBITPATT_DP64) : g; + g = z == 0 ? 
as_double(QNANBITPATT_DP64) : g; + } + + return g; +} + /* Vector double overloads: presumably generated by _CLC_UNARY_VECTORIZE from the scalar double function above; the macro is not defined in this diff - confirm. */+_CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, tgamma, double); + +#endif |