[Beignet] [PATCH] add empty 64bit-integer version built-in functions
Homer Hsing
homer.xing at intel.com
Wed Aug 14 23:53:27 PDT 2013
Also change the vector built-in generator to auto-generate
64-bit integer versions of the built-in functions.
The function bodies are empty placeholders for now; the details will be added in the future.
Signed-off-by: Homer Hsing <homer.xing at intel.com>
---
backend/src/gen_builtin_vector.py | 4 +--
backend/src/ocl_stdlib.tmpl.h | 59 +++++++++++++++++++++++++++++++++++++++
2 files changed, 60 insertions(+), 3 deletions(-)
diff --git a/backend/src/gen_builtin_vector.py b/backend/src/gen_builtin_vector.py
index b073682..35e3a2a 100755
--- a/backend/src/gen_builtin_vector.py
+++ b/backend/src/gen_builtin_vector.py
@@ -260,9 +260,7 @@ class builtinProto():
# XXX FIXME now skip all double vector, as we don't
# defined those scalar version's prototype.
if ptype[0].find('double') != -1 or \
- vtype[0].find('double') != -1 or \
- ptype[0].find('long') != -1 or \
- vtype[0].find('long') != -1 :
+ vtype[0].find('double') != -1:
return
if (n == 0):
diff --git a/backend/src/ocl_stdlib.tmpl.h b/backend/src/ocl_stdlib.tmpl.h
index 2b5e470..00d6fda 100644
--- a/backend/src/ocl_stdlib.tmpl.h
+++ b/backend/src/ocl_stdlib.tmpl.h
@@ -311,6 +311,14 @@ INLINE_OVERLOADABLE uint clz(uint x) {
return __gen_ocl_fbh(x);
}
+INLINE_OVERLOADABLE long clz(long x) {
+ return 0;
+}
+
+INLINE_OVERLOADABLE ulong clz(ulong x) {
+ return 0;
+}
+
OVERLOADABLE int __gen_ocl_mul_hi(int x, int y);
OVERLOADABLE uint __gen_ocl_mul_hi(uint x, uint y);
INLINE_OVERLOADABLE char mul_hi(char x, char y) { return (x * y) >> 8; }
@@ -319,6 +327,12 @@ INLINE_OVERLOADABLE short mul_hi(short x, short y) { return (x * y) >> 16; }
INLINE_OVERLOADABLE ushort mul_hi(ushort x, ushort y) { return (x * y) >> 16; }
INLINE_OVERLOADABLE int mul_hi(int x, int y) { return __gen_ocl_mul_hi(x, y); }
INLINE_OVERLOADABLE uint mul_hi(uint x, uint y) { return __gen_ocl_mul_hi(x, y); }
+INLINE_OVERLOADABLE long mul_hi(long x, long y) {
+ return 0;
+}
+INLINE_OVERLOADABLE ulong mul_hi(ulong x, ulong y) {
+ return 0;
+}
#define DEF(type) INLINE_OVERLOADABLE type mad_hi(type a, type b, type c) { return mul_hi(a, b) + c; }
DEF(char)
@@ -327,6 +341,8 @@ DEF(short)
DEF(ushort)
DEF(int)
DEF(uint)
+DEF(long)
+DEF(ulong)
#undef DEF
INLINE_OVERLOADABLE int mul24(int a, int b) { return ((a << 8) >> 8) * ((b << 8) >> 8); }
@@ -383,6 +399,14 @@ INLINE_OVERLOADABLE uint mad_sat(uint a, uint b, uint c) {
return (uint)x;
}
+INLINE_OVERLOADABLE long mad_sat(long a, long b, long c) {
+ return 0;
+}
+
+INLINE_OVERLOADABLE ulong mad_sat(ulong a, ulong b, ulong c) {
+ return 0;
+}
+
INLINE_OVERLOADABLE uchar __rotate_left(uchar x, uchar y) { return (x << y) | (x >> (8 - y)); }
INLINE_OVERLOADABLE char __rotate_left(char x, char y) { return __rotate_left((uchar)x, (uchar)y); }
INLINE_OVERLOADABLE ushort __rotate_left(ushort x, ushort y) { return (x << y) | (x >> (16 - y)); }
@@ -397,6 +421,12 @@ DEF(ushort, 15)
DEF(int, 31)
DEF(uint, 31)
#undef DEF
+INLINE_OVERLOADABLE long rotate(long x, long y) {
+ return 0;
+}
+INLINE_OVERLOADABLE ulong rotate(ulong x, ulong y) {
+ return 0;
+}
OVERLOADABLE short __gen_ocl_upsample(short hi, short lo);
OVERLOADABLE int __gen_ocl_upsample(int hi, int lo);
@@ -404,6 +434,12 @@ INLINE_OVERLOADABLE short upsample(char hi, uchar lo) { return __gen_ocl_upsampl
INLINE_OVERLOADABLE ushort upsample(uchar hi, uchar lo) { return __gen_ocl_upsample((short)hi, (short)lo); }
INLINE_OVERLOADABLE int upsample(short hi, ushort lo) { return __gen_ocl_upsample((int)hi, (int)lo); }
INLINE_OVERLOADABLE uint upsample(ushort hi, ushort lo) { return __gen_ocl_upsample((int)hi, (int)lo); }
+INLINE_OVERLOADABLE long upsample(int hi, uint lo) {
+ return 0;
+}
+INLINE_OVERLOADABLE ulong upsample(uint hi, uint lo) {
+ return 0;
+}
PURE CONST uint __gen_ocl_hadd(uint x, uint y);
PURE CONST uint __gen_ocl_rhadd(uint x, uint y);
@@ -419,6 +455,18 @@ INLINE_OVERLOADABLE int hadd(int x, int y) { return (x < 0 && y > 0) || (x > 0 &
INLINE_OVERLOADABLE uint hadd(uint x, uint y) { return __gen_ocl_hadd(x, y); }
INLINE_OVERLOADABLE int rhadd(int x, int y) { return (x < 0 && y > 0) || (x > 0 && y < 0) ? ((x + y + 1) >> 1) : __gen_ocl_rhadd(x, y); }
INLINE_OVERLOADABLE uint rhadd(uint x, uint y) { return __gen_ocl_rhadd(x, y); }
+INLINE_OVERLOADABLE long hadd(long x, long y) {
+ return 0;
+}
+INLINE_OVERLOADABLE ulong hadd(ulong x, ulong y) {
+ return 0;
+}
+INLINE_OVERLOADABLE long rhadd(long x, long y) {
+ return 0;
+}
+INLINE_OVERLOADABLE ulong rhadd(ulong x, ulong y) {
+ return 0;
+}
int __gen_ocl_abs(int x);
#define DEC(TYPE) INLINE_OVERLOADABLE u##TYPE abs(TYPE x) { return (u##TYPE) __gen_ocl_abs(x); }
@@ -426,11 +474,13 @@ DEC(int)
DEC(short)
DEC(char)
#undef DEC
+INLINE_OVERLOADABLE ulong abs(long x) { return x < 0 ? -x : x; }
/* For unsigned types, do nothing. */
#define DEC(TYPE) INLINE_OVERLOADABLE TYPE abs(TYPE x) { return x; }
DEC(uint)
DEC(ushort)
DEC(uchar)
+DEC(ulong)
#undef DEC
/* Char and short type abs diff */
@@ -456,6 +506,13 @@ INLINE_OVERLOADABLE uint abs_diff (int x, int y) {
return (abs(x) + abs(y));
}
+INLINE_OVERLOADABLE ulong abs_diff (long x, long y) {
+ return 0;
+}
+INLINE_OVERLOADABLE ulong abs_diff (ulong x, ulong y) {
+ return 0;
+}
+
/////////////////////////////////////////////////////////////////////////////
// Work Items functions (see 6.11.1 of OCL 1.1 spec)
/////////////////////////////////////////////////////////////////////////////
@@ -770,6 +827,8 @@ DECL_MIN_MAX_CLAMP(char)
DECL_MIN_MAX_CLAMP(uint)
DECL_MIN_MAX_CLAMP(unsigned short)
DECL_MIN_MAX_CLAMP(unsigned char)
+DECL_MIN_MAX_CLAMP(long)
+DECL_MIN_MAX_CLAMP(ulong)
#undef DECL_MIN_MAX_CLAMP
#define BODY \
--
1.8.1.2
More information about the Beignet
mailing list