[Beignet] [PATCH] Libocl: change prototype of math built-in for OCL2.0 spec

Tue Apr 5 10:26:10 UTC 2016

Pushed, thanks.

> -----Original Message-----
> From: Beignet [mailto:beignet-bounces at lists.freedesktop.org] On Behalf Of
> Xiuli Pan
> Sent: Tuesday, March 22, 2016 12:38
> To: beignet at lists.freedesktop.org
> Cc: Pan, Xiuli <xiuli.pan at intel.com>
> Subject: [Beignet] [PATCH] Libocl: change prototype of math built-in for
> OCL2.0 spec
> 
> From: Pan Xiuli <xiuli.pan at intel.com>
> 
> Math built-ins no longer need address space qualifiers, so remove them.
> 
> Signed-off-by: Pan Xiuli <xiuli.pan at intel.com>
> ---
>  backend/src/libocl/tmpl/ocl_math.tmpl.cl | 122 ++++---------------------------
> backend/src/libocl/tmpl/ocl_math.tmpl.h  |  48 +++---------
>  2 files changed, 25 insertions(+), 145 deletions(-)
> 
> diff --git a/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> b/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> index 782bfd2..d8fa4ae 100644
> --- a/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> +++ b/backend/src/libocl/tmpl/ocl_math.tmpl.cl
> @@ -127,15 +127,7 @@ OVERLOADABLE float
> __gen_ocl_internal_fastpath_rootn(float x, int n) {  OVERLOADABLE float
> __gen_ocl_internal_fastpath_sin (float x) {
>      return native_sin(x);
>  }
> -OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x, __global
> float *cosval) {
> -    *cosval = native_cos(x);
> -    return native_sin(x);
> -}
> -OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x, __local
> float *cosval) {
> -    *cosval = native_cos(x);
> -    return native_sin(x);
> -}
> -OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x,
> __private float *cosval) {
> +OVERLOADABLE float __gen_ocl_internal_fastpath_sincos (float x, float
> +*cosval) {
>      *cosval = native_cos(x);
>      return native_sin(x);
>  }
> @@ -1182,9 +1174,7 @@ OVERLOADABLE float lgamma(float x) {
>  	if (hx < 0)  \
>  		r = nadj - r;  \
>  	return r;
> -OVERLOADABLE float lgamma_r(float x, global int *signgamp) { BODY; }
> -OVERLOADABLE float lgamma_r(float x, local int *signgamp) { BODY; }
> -OVERLOADABLE float lgamma_r(float x, private int *signgamp) { BODY; }
> +OVERLOADABLE float lgamma_r(float x, int *signgamp) { BODY; }
>  #undef BODY
> 
>  OVERLOADABLE float log1p(float x) {
> @@ -1406,17 +1396,7 @@ OVERLOADABLE float
> __gen_ocl_internal_cbrt(float x) {
>    *cosval = cos(x); \
>    return sin(x);
> 
> -OVERLOADABLE float sincos(float x, global float *cosval) {
> -  if (__ocl_math_fastpath_flag)
> -    return __gen_ocl_internal_fastpath_sincos(x, cosval);
> -  BODY;
> -}
> -OVERLOADABLE float sincos(float x, local float *cosval) {
> -  if (__ocl_math_fastpath_flag)
> -    return __gen_ocl_internal_fastpath_sincos(x, cosval);
> -  BODY;
> -}
> -OVERLOADABLE float sincos(float x, private float *cosval) {
> +OVERLOADABLE float sincos(float x, float *cosval) {
>    if (__ocl_math_fastpath_flag)
>      return __gen_ocl_internal_fastpath_sincos(x, cosval);
>    BODY;
> @@ -2641,9 +2621,7 @@ OVERLOADABLE float mad(float a, float b, float c) {
>    a <<= 1; \
>    *exp = e; \
>    return as_float((a & (0x807FFFFFu)) | (u & 0x80000000u) | 0x3F000000);
> -OVERLOADABLE float frexp(float x, global int *exp) { BODY; }
> -OVERLOADABLE float frexp(float x, local int *exp) { BODY; }
> -OVERLOADABLE float frexp(float x, private int *exp) { BODY; }
> +OVERLOADABLE float frexp(float x, int *exp) { BODY; }
>  #undef BODY
> 
>  OVERLOADABLE float nextafter(float x, float y) { @@ -2690,9 +2668,7 @@
> OVERLOADABLE float nextafter(float x, float y) {
>    } \
>    *i = __gen_ocl_rndz(x); \
>    return x - *i;
> -OVERLOADABLE float modf(float x, global float *i) { BODY; }
> -OVERLOADABLE float modf(float x, local float *i) { BODY; }
> -OVERLOADABLE float modf(float x, private float *i) { BODY; }
> +OVERLOADABLE float modf(float x, float *i) { BODY; }
>  #undef BODY
> 
>  OVERLOADABLE float __gen_ocl_internal_fmax(float a, float b) { return
> max(a,b); } @@ -3287,9 +3263,7 @@ OVERLOADABLE float hypot(float x,
> float y) {
>      return x > 0 ? +0. : -0.; \
>    } \
>    return __gen_ocl_internal_fmin(x - *p, 0x1.FFFFFep-1F);
> -OVERLOADABLE float fract(float x, global float *p) { BODY; }
> -OVERLOADABLE float fract(float x, local float *p) { BODY; }
> -OVERLOADABLE float fract(float x, private float *p) { BODY; }
> +OVERLOADABLE float fract(float x, float *p) { BODY; }
>  #undef BODY
> 
>  #define BODY \
> @@ -3371,11 +3345,9 @@ fixup: \
>    *quo = (sign ? -q : q); \
>    return x;
> 
> -OVERLOADABLE float remquo(float x, float y, global int *quo) {
> +OVERLOADABLE float remquo(float x, float y, int *quo) {
>  	BODY;
>  }
> -OVERLOADABLE float remquo(float x, float y, local int *quo) { BODY; }
> -OVERLOADABLE float remquo(float x, float y, private int *quo) { BODY; }
>  #undef BODY
> 
>  OVERLOADABLE float powr(float x, float y) { @@ -3855,15 +3827,7 @@
> OVERLOADABLE half lgamma(half x) {
>    float _x = (float)x;
>    return (half)lgamma(_x);
>  }
> -OVERLOADABLE half lgamma_r(half x, global int *signgamp) {
> -  float _x = (float)x;
> -  return (half)lgamma_r(_x, signgamp);
> -}
> -OVERLOADABLE half lgamma_r(half x, local int *signgamp) {
> -  float _x = (float)x;
> -  return (half)lgamma_r(_x, signgamp);
> -}
> -OVERLOADABLE half lgamma_r(half x, private int *signgamp) {
> +OVERLOADABLE half lgamma_r(half x, int *signgamp) {
>    float _x = (float)x;
>    return (half)lgamma_r(_x, signgamp);
>  }
> @@ -3883,21 +3847,7 @@ OVERLOADABLE half nan(ushort code) {
>    return (half)NAN;
>  }
> 
> -OVERLOADABLE half sincos(half x, global half *cosval) {
> -  float _x = (float)x;
> -  float _cosval;
> -  half ret = (half)sincos(_x, &_cosval);
> -  *cosval = (half)_cosval;
> -  return ret;
> -}
> -OVERLOADABLE half sincos(half x, local half *cosval) {
> -  float _x = (float)x;
> -  float _cosval;
> -  half ret = (half)sincos(_x, &_cosval);
> -  *cosval = (half)_cosval;
> -  return ret;
> -}
> -OVERLOADABLE half sincos(half x, private half *cosval) {
> +OVERLOADABLE half sincos(half x, half *cosval) {
>    float _x = (float)x;
>    float _cosval;
>    half ret = (half)sincos(_x, &_cosval); @@ -3913,15 +3863,7 @@
> OVERLOADABLE half rsqrt(half x) {
>    float _x = (float)x;
>    return (half)rsqrt(_x);
>  }
> -OVERLOADABLE half frexp(half x, global int *exp) {
> -  float _x = (float)x;
> -  return (half)frexp(_x, exp);
> -}
> -OVERLOADABLE half frexp(half x, local int *exp) {
> -  float _x = (float)x;
> -  return (half)frexp(_x, exp);
> -}
> -OVERLOADABLE half frexp(half x, private int *exp) {
> +OVERLOADABLE half frexp(half x, int *exp) {
>    float _x = (float)x;
>    return (half)frexp(_x, exp);
>  }
> @@ -3931,21 +3873,7 @@ OVERLOADABLE half nextafter(half x, half y) {
>    return (half)nextafter(_x, _y);
>  }
> 
> -OVERLOADABLE half modf(half x, global half *i) {
> -  float _x = (float)x;
> -  float _i;
> -  half ret = (half)modf(_x, &_i);
> -  *i = (half)_i;
> -  return ret;
> -}
> -OVERLOADABLE half modf(half x, local half *i) {
> -  float _x = (float)x;
> -  float _i;
> -  half ret = (half)modf(_x, &_i);
> -  *i = (half)_i;
> -  return ret;
> -}
> -OVERLOADABLE half modf(half x, private half *i) {
> +OVERLOADABLE half modf(half x, half *i) {
>    float _x = (float)x;
>    float _i;
>    half ret = (half)modf(_x, &_i);
> @@ -3959,21 +3887,7 @@ OVERLOADABLE half hypot(half x, half y) {
>    return (half)hypot(_x, _y);
>  }
> 
> -OVERLOADABLE half fract(half x, global half *p) {
> -  float _x = (float)x;
> -  float _p;
> -  half ret = (half)fract(_x, &_p);
> -  *p = (half)_p;
> -  return ret;
> -}
> -OVERLOADABLE half fract(half x, local half *p) {
> -  float _x = (float)x;
> -  float _p;
> -  half ret = (half)fract(_x, &_p);
> -  *p = (half)_p;
> -  return ret;
> -}
> -OVERLOADABLE half fract(half x, private half *p) {
> +OVERLOADABLE half fract(half x, half *p) {
>    float _x = (float)x;
>    float _p;
>    half ret = (half)fract(_x, &_p);
> @@ -3981,17 +3895,7 @@ OVERLOADABLE half fract(half x, private half *p) {
>    return ret;
>  }
> 
> -OVERLOADABLE half remquo(half x, half y, global int *quo) {
> -  float _x = (float)x;
> -  float _y = (float)y;
> -  return (half)remquo(_x, _y, quo);
> -}
> -OVERLOADABLE half remquo(half x, half y, local int *quo) {
> -  float _x = (float)x;
> -  float _y = (float)y;
> -  return (half)remquo(_x, _y, quo);
> -}
> -OVERLOADABLE half remquo(half x, half y, private int *quo) {
> +OVERLOADABLE half remquo(half x, half y, int *quo) {
>    float _x = (float)x;
>    float _y = (float)y;
>    return (half)remquo(_x, _y, quo);
> diff --git a/backend/src/libocl/tmpl/ocl_math.tmpl.h
> b/backend/src/libocl/tmpl/ocl_math.tmpl.h
> index 0de3642..ca8c02a 100644
> --- a/backend/src/libocl/tmpl/ocl_math.tmpl.h
> +++ b/backend/src/libocl/tmpl/ocl_math.tmpl.h
> @@ -72,32 +72,20 @@ OVERLOADABLE float cos(float x);  OVERLOADABLE
> float tan(float x);  OVERLOADABLE float tgamma(float x);  OVERLOADABLE
> float lgamma(float x); -OVERLOADABLE float lgamma_r(float x, global int
> *signgamp); -OVERLOADABLE float lgamma_r(float x, local int *signgamp); -
> OVERLOADABLE float lgamma_r(float x, private int *signgamp);
> +OVERLOADABLE float lgamma_r(float x, int *signgamp);
>  OVERLOADABLE float log1p(float x);
>  OVERLOADABLE float logb(float x);
>  OVERLOADABLE int ilogb(float x);
>  OVERLOADABLE float nan(uint code);
> -OVERLOADABLE float sincos(float x, global float *cosval); -OVERLOADABLE
> float sincos(float x, local float *cosval); -OVERLOADABLE float sincos(float x,
> private float *cosval);
> +OVERLOADABLE float sincos(float x, float *cosval);
>  OVERLOADABLE float sqrt(float x);
>  OVERLOADABLE float rsqrt(float x);
> -OVERLOADABLE float frexp(float x, global int *exp); -OVERLOADABLE float
> frexp(float x, local int *exp); -OVERLOADABLE float frexp(float x, private int
> *exp);
> +OVERLOADABLE float frexp(float x, int *exp);
>  OVERLOADABLE float nextafter(float x, float y); -OVERLOADABLE float
> modf(float x, global float *i); -OVERLOADABLE float modf(float x, local float
> *i); -OVERLOADABLE float modf(float x, private float *i);
> +OVERLOADABLE float modf(float x, float *i);
>  OVERLOADABLE float hypot(float x, float y); -OVERLOADABLE float fract(float
> x, global float *p); -OVERLOADABLE float fract(float x, local float *p); -
> OVERLOADABLE float fract(float x, private float *p); -OVERLOADABLE float
> remquo(float x, float y, global int *quo); -OVERLOADABLE float remquo(float
> x, float y, local int *quo); -OVERLOADABLE float remquo(float x, float y,
> private int *quo);
> +OVERLOADABLE float fract(float x, float *p); OVERLOADABLE float
> +remquo(float x, float y, int *quo);
>  OVERLOADABLE float pown(float x, int n);  OVERLOADABLE float rootn(float
> x, int n);
> 
> @@ -171,32 +159,20 @@ OVERLOADABLE half cos(half x);  OVERLOADABLE
> half tan(half x);  OVERLOADABLE half tgamma(half x);  OVERLOADABLE half
> lgamma(half x); -OVERLOADABLE half lgamma_r(half x, global int *signgamp);
> -OVERLOADABLE half lgamma_r(half x, local int *signgamp); -OVERLOADABLE
> half lgamma_r(half x, private int *signgamp);
> +OVERLOADABLE half lgamma_r(half x, int *signgamp);
>  OVERLOADABLE half log1p(half x);
>  OVERLOADABLE half logb(half x);
>  OVERLOADABLE int ilogb(half x);
>  OVERLOADABLE half nan(ushort code);
> -OVERLOADABLE half sincos(half x, global half *cosval); -OVERLOADABLE half
> sincos(half x, local half *cosval); -OVERLOADABLE half sincos(half x, private
> half *cosval);
> +OVERLOADABLE half sincos(half x, half *cosval);
>  OVERLOADABLE half sqrt(half x);
>  OVERLOADABLE half rsqrt(half x);
> -OVERLOADABLE half frexp(half x, global int *exp); -OVERLOADABLE half
> frexp(half x, local int *exp); -OVERLOADABLE half frexp(half x, private int
> *exp);
> +OVERLOADABLE half frexp(half x, int *exp);
>  OVERLOADABLE half nextafter(half x, half y); -OVERLOADABLE half
> modf(half x, global half *i); -OVERLOADABLE half modf(half x, local half *i); -
> OVERLOADABLE half modf(half x, private half *i);
> +OVERLOADABLE half modf(half x, half *i);
>  OVERLOADABLE half hypot(half x, half y); -OVERLOADABLE half fract(half x,
> global half *p); -OVERLOADABLE half fract(half x, local half *p); -
> OVERLOADABLE half fract(half x, private half *p); -OVERLOADABLE half
> remquo(half x, half y, global int *quo); -OVERLOADABLE half remquo(half x,
> half y, local int *quo); -OVERLOADABLE half remquo(half x, half y, private int
> *quo);
> +OVERLOADABLE half fract(half x, half *p); OVERLOADABLE half remquo(half
> +x, half y, int *quo);
>  OVERLOADABLE half pown(half x, int n);
>  OVERLOADABLE half rootn(half x, int n);
> 
> --
> 2.5.0
> 
> _______________________________________________
> Beignet mailing list
> Beignet at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/beignet