[Beignet] [PATCH] Libocl: change prototype of math built-in for OCL2.0 spec
Song, Ruiling
ruiling.song at intel.com
Tue Mar 29 03:48:33 UTC 2016
LGTM
Thanks!
Ruiling
> -----Original Message-----
> From: Beignet [mailto:beignet-bounces at lists.freedesktop.org] On Behalf Of
> Xiuli Pan
> Sent: Tuesday, March 22, 2016 12:38 PM
> To: beignet at lists.freedesktop.org
> Cc: Pan, Xiuli <xiuli.pan at intel.com>
> Subject: [Beignet] [PATCH] Libocl: change prototype of math built-in for OCL2.0
> spec
>
> From: Pan Xiuli <xiuli.pan at intel.com>
>
> Math built-in nolonger need address space, so remove them.
>
> Signed-off-by: Pan Xiuli <xiuli.pan at intel.com>
> ---
> backend/src/libocl/tmpl/ocl_math.tmpl.cl | 122 ++++---------------------------
> backend/src/libocl/tmpl/ocl_math.tmpl.h | 48 +++---------
> 2 files changed, 25 insertions(+), 145 deletions(-)
>
> diff --git a/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> b/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> index 782bfd2..d8fa4ae 100644
> --- a/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> +++ b/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> @@ -127,15 +127,7 @@ OVERLOADABLE float
> __gen_ocl_internal_fastpath_rootn(float x, int n) {
> OVERLOADABLE float __gen_ocl_internal_fastpath_sin (float x) {
> return native_sin(x);
> }
> -OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x, __global
> float *cosval) {
> - *cosval = native_cos(x);
> - return native_sin(x);
> -}
> -OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x, __local
> float *cosval) {
> - *cosval = native_cos(x);
> - return native_sin(x);
> -}
> -OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x, __private
> float *cosval) {
> +OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x, float
> *cosval) {
> *cosval = native_cos(x);
> return native_sin(x);
> }
> @@ -1182,9 +1174,7 @@ OVERLOADABLE float lgamma(float x) {
> if (hx < 0) \
> r = nadj - r; \
> return r;
> -OVERLOADABLE float lgamma_r(float x, global int *signgamp) { BODY; }
> -OVERLOADABLE float lgamma_r(float x, local int *signgamp) { BODY; }
> -OVERLOADABLE float lgamma_r(float x, private int *signgamp) { BODY; }
> +OVERLOADABLE float lgamma_r(float x, int *signgamp) { BODY; }
> #undef BODY
>
> OVERLOADABLE float log1p(float x) {
> @@ -1406,17 +1396,7 @@ OVERLOADABLE float __gen_ocl_internal_cbrt(float
> x) {
> *cosval = cos(x); \
> return sin(x);
>
> -OVERLOADABLE float sincos(float x, global float *cosval) {
> - if (__ocl_math_fastpath_flag)
> - return __gen_ocl_internal_fastpath_sincos(x, cosval);
> - BODY;
> -}
> -OVERLOADABLE float sincos(float x, local float *cosval) {
> - if (__ocl_math_fastpath_flag)
> - return __gen_ocl_internal_fastpath_sincos(x, cosval);
> - BODY;
> -}
> -OVERLOADABLE float sincos(float x, private float *cosval) {
> +OVERLOADABLE float sincos(float x, float *cosval) {
> if (__ocl_math_fastpath_flag)
> return __gen_ocl_internal_fastpath_sincos(x, cosval);
> BODY;
> @@ -2641,9 +2621,7 @@ OVERLOADABLE float mad(float a, float b, float c) {
> a <<= 1; \
> *exp = e; \
> return as_float((a & (0x807FFFFFu)) | (u & 0x80000000u) | 0x3F000000);
> -OVERLOADABLE float frexp(float x, global int *exp) { BODY; }
> -OVERLOADABLE float frexp(float x, local int *exp) { BODY; }
> -OVERLOADABLE float frexp(float x, private int *exp) { BODY; }
> +OVERLOADABLE float frexp(float x, int *exp) { BODY; }
> #undef BODY
>
> OVERLOADABLE float nextafter(float x, float y) {
> @@ -2690,9 +2668,7 @@ OVERLOADABLE float nextafter(float x, float y) {
> } \
> *i = __gen_ocl_rndz(x); \
> return x - *i;
> -OVERLOADABLE float modf(float x, global float *i) { BODY; }
> -OVERLOADABLE float modf(float x, local float *i) { BODY; }
> -OVERLOADABLE float modf(float x, private float *i) { BODY; }
> +OVERLOADABLE float modf(float x, float *i) { BODY; }
> #undef BODY
>
> OVERLOADABLE float __gen_ocl_internal_fmax(float a, float b) { return
> max(a,b); }
> @@ -3287,9 +3263,7 @@ OVERLOADABLE float hypot(float x, float y) {
> return x > 0 ? +0. : -0.; \
> } \
> return __gen_ocl_internal_fmin(x - *p, 0x1.FFFFFep-1F);
> -OVERLOADABLE float fract(float x, global float *p) { BODY; }
> -OVERLOADABLE float fract(float x, local float *p) { BODY; }
> -OVERLOADABLE float fract(float x, private float *p) { BODY; }
> +OVERLOADABLE float fract(float x, float *p) { BODY; }
> #undef BODY
>
> #define BODY \
> @@ -3371,11 +3345,9 @@ fixup: \
> *quo = (sign ? -q : q); \
> return x;
>
> -OVERLOADABLE float remquo(float x, float y, global int *quo) {
> +OVERLOADABLE float remquo(float x, float y, int *quo) {
> BODY;
> }
> -OVERLOADABLE float remquo(float x, float y, local int *quo) { BODY; }
> -OVERLOADABLE float remquo(float x, float y, private int *quo) { BODY; }
> #undef BODY
>
> OVERLOADABLE float powr(float x, float y) {
> @@ -3855,15 +3827,7 @@ OVERLOADABLE half lgamma(half x) {
> float _x = (float)x;
> return (half)lgamma(_x);
> }
> -OVERLOADABLE half lgamma_r(half x, global int *signgamp) {
> - float _x = (float)x;
> - return (half)lgamma_r(_x, signgamp);
> -}
> -OVERLOADABLE half lgamma_r(half x, local int *signgamp) {
> - float _x = (float)x;
> - return (half)lgamma_r(_x, signgamp);
> -}
> -OVERLOADABLE half lgamma_r(half x, private int *signgamp) {
> +OVERLOADABLE half lgamma_r(half x, int *signgamp) {
> float _x = (float)x;
> return (half)lgamma_r(_x, signgamp);
> }
> @@ -3883,21 +3847,7 @@ OVERLOADABLE half nan(ushort code) {
> return (half)NAN;
> }
>
> -OVERLOADABLE half sincos(half x, global half *cosval) {
> - float _x = (float)x;
> - float _cosval;
> - half ret = (half)sincos(_x, &_cosval);
> - *cosval = (half)_cosval;
> - return ret;
> -}
> -OVERLOADABLE half sincos(half x, local half *cosval) {
> - float _x = (float)x;
> - float _cosval;
> - half ret = (half)sincos(_x, &_cosval);
> - *cosval = (half)_cosval;
> - return ret;
> -}
> -OVERLOADABLE half sincos(half x, private half *cosval) {
> +OVERLOADABLE half sincos(half x, half *cosval) {
> float _x = (float)x;
> float _cosval;
> half ret = (half)sincos(_x, &_cosval);
> @@ -3913,15 +3863,7 @@ OVERLOADABLE half rsqrt(half x) {
> float _x = (float)x;
> return (half)rsqrt(_x);
> }
> -OVERLOADABLE half frexp(half x, global int *exp) {
> - float _x = (float)x;
> - return (half)frexp(_x, exp);
> -}
> -OVERLOADABLE half frexp(half x, local int *exp) {
> - float _x = (float)x;
> - return (half)frexp(_x, exp);
> -}
> -OVERLOADABLE half frexp(half x, private int *exp) {
> +OVERLOADABLE half frexp(half x, int *exp) {
> float _x = (float)x;
> return (half)frexp(_x, exp);
> }
> @@ -3931,21 +3873,7 @@ OVERLOADABLE half nextafter(half x, half y) {
> return (half)nextafter(_x, _y);
> }
>
> -OVERLOADABLE half modf(half x, global half *i) {
> - float _x = (float)x;
> - float _i;
> - half ret = (half)modf(_x, &_i);
> - *i = (half)_i;
> - return ret;
> -}
> -OVERLOADABLE half modf(half x, local half *i) {
> - float _x = (float)x;
> - float _i;
> - half ret = (half)modf(_x, &_i);
> - *i = (half)_i;
> - return ret;
> -}
> -OVERLOADABLE half modf(half x, private half *i) {
> +OVERLOADABLE half modf(half x, half *i) {
> float _x = (float)x;
> float _i;
> half ret = (half)modf(_x, &_i);
> @@ -3959,21 +3887,7 @@ OVERLOADABLE half hypot(half x, half y) {
> return (half)hypot(_x, _y);
> }
>
> -OVERLOADABLE half fract(half x, global half *p) {
> - float _x = (float)x;
> - float _p;
> - half ret = (half)fract(_x, &_p);
> - *p = (half)_p;
> - return ret;
> -}
> -OVERLOADABLE half fract(half x, local half *p) {
> - float _x = (float)x;
> - float _p;
> - half ret = (half)fract(_x, &_p);
> - *p = (half)_p;
> - return ret;
> -}
> -OVERLOADABLE half fract(half x, private half *p) {
> +OVERLOADABLE half fract(half x, half *p) {
> float _x = (float)x;
> float _p;
> half ret = (half)fract(_x, &_p);
> @@ -3981,17 +3895,7 @@ OVERLOADABLE half fract(half x, private half *p) {
> return ret;
> }
>
> -OVERLOADABLE half remquo(half x, half y, global int *quo) {
> - float _x = (float)x;
> - float _y = (float)y;
> - return (half)remquo(_x, _y, quo);
> -}
> -OVERLOADABLE half remquo(half x, half y, local int *quo) {
> - float _x = (float)x;
> - float _y = (float)y;
> - return (half)remquo(_x, _y, quo);
> -}
> -OVERLOADABLE half remquo(half x, half y, private int *quo) {
> +OVERLOADABLE half remquo(half x, half y, int *quo) {
> float _x = (float)x;
> float _y = (float)y;
> return (half)remquo(_x, _y, quo);
> diff --git a/backend/src/libocl/tmpl/ocl_math.tmpl.h
> b/backend/src/libocl/tmpl/ocl_math.tmpl.h
> index 0de3642..ca8c02a 100644
> --- a/backend/src/libocl/tmpl/ocl_math.tmpl.h
> +++ b/backend/src/libocl/tmpl/ocl_math.tmpl.h
> @@ -72,32 +72,20 @@ OVERLOADABLE float cos(float x);
> OVERLOADABLE float tan(float x);
> OVERLOADABLE float tgamma(float x);
> OVERLOADABLE float lgamma(float x);
> -OVERLOADABLE float lgamma_r(float x, global int *signgamp);
> -OVERLOADABLE float lgamma_r(float x, local int *signgamp);
> -OVERLOADABLE float lgamma_r(float x, private int *signgamp);
> +OVERLOADABLE float lgamma_r(float x, int *signgamp);
> OVERLOADABLE float log1p(float x);
> OVERLOADABLE float logb(float x);
> OVERLOADABLE int ilogb(float x);
> OVERLOADABLE float nan(uint code);
> -OVERLOADABLE float sincos(float x, global float *cosval);
> -OVERLOADABLE float sincos(float x, local float *cosval);
> -OVERLOADABLE float sincos(float x, private float *cosval);
> +OVERLOADABLE float sincos(float x, float *cosval);
> OVERLOADABLE float sqrt(float x);
> OVERLOADABLE float rsqrt(float x);
> -OVERLOADABLE float frexp(float x, global int *exp);
> -OVERLOADABLE float frexp(float x, local int *exp);
> -OVERLOADABLE float frexp(float x, private int *exp);
> +OVERLOADABLE float frexp(float x, int *exp);
> OVERLOADABLE float nextafter(float x, float y);
> -OVERLOADABLE float modf(float x, global float *i);
> -OVERLOADABLE float modf(float x, local float *i);
> -OVERLOADABLE float modf(float x, private float *i);
> +OVERLOADABLE float modf(float x, float *i);
> OVERLOADABLE float hypot(float x, float y);
> -OVERLOADABLE float fract(float x, global float *p);
> -OVERLOADABLE float fract(float x, local float *p);
> -OVERLOADABLE float fract(float x, private float *p);
> -OVERLOADABLE float remquo(float x, float y, global int *quo);
> -OVERLOADABLE float remquo(float x, float y, local int *quo);
> -OVERLOADABLE float remquo(float x, float y, private int *quo);
> +OVERLOADABLE float fract(float x, float *p);
> +OVERLOADABLE float remquo(float x, float y, int *quo);
> OVERLOADABLE float pown(float x, int n);
> OVERLOADABLE float rootn(float x, int n);
>
> @@ -171,32 +159,20 @@ OVERLOADABLE half cos(half x);
> OVERLOADABLE half tan(half x);
> OVERLOADABLE half tgamma(half x);
> OVERLOADABLE half lgamma(half x);
> -OVERLOADABLE half lgamma_r(half x, global int *signgamp);
> -OVERLOADABLE half lgamma_r(half x, local int *signgamp);
> -OVERLOADABLE half lgamma_r(half x, private int *signgamp);
> +OVERLOADABLE half lgamma_r(half x, int *signgamp);
> OVERLOADABLE half log1p(half x);
> OVERLOADABLE half logb(half x);
> OVERLOADABLE int ilogb(half x);
> OVERLOADABLE half nan(ushort code);
> -OVERLOADABLE half sincos(half x, global half *cosval);
> -OVERLOADABLE half sincos(half x, local half *cosval);
> -OVERLOADABLE half sincos(half x, private half *cosval);
> +OVERLOADABLE half sincos(half x, half *cosval);
> OVERLOADABLE half sqrt(half x);
> OVERLOADABLE half rsqrt(half x);
> -OVERLOADABLE half frexp(half x, global int *exp);
> -OVERLOADABLE half frexp(half x, local int *exp);
> -OVERLOADABLE half frexp(half x, private int *exp);
> +OVERLOADABLE half frexp(half x, int *exp);
> OVERLOADABLE half nextafter(half x, half y);
> -OVERLOADABLE half modf(half x, global half *i);
> -OVERLOADABLE half modf(half x, local half *i);
> -OVERLOADABLE half modf(half x, private half *i);
> +OVERLOADABLE half modf(half x, half *i);
> OVERLOADABLE half hypot(half x, half y);
> -OVERLOADABLE half fract(half x, global half *p);
> -OVERLOADABLE half fract(half x, local half *p);
> -OVERLOADABLE half fract(half x, private half *p);
> -OVERLOADABLE half remquo(half x, half y, global int *quo);
> -OVERLOADABLE half remquo(half x, half y, local int *quo);
> -OVERLOADABLE half remquo(half x, half y, private int *quo);
> +OVERLOADABLE half fract(half x, half *p);
> +OVERLOADABLE half remquo(half x, half y, int *quo);
> OVERLOADABLE half pown(half x, int n);
> OVERLOADABLE half rootn(half x, int n);
>
> --
> 2.5.0
>
> _______________________________________________
> Beignet mailing list
> Beignet at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/beignet
More information about the Beignet
mailing list