[Beignet] [PATCH 3/3] Backend: Workgroup scan cmp on QW, workaround for width 16
grigore.lupescu at intel.com
grigore.lupescu at intel.com
Fri Apr 1 12:49:25 UTC 2016
From: Grigore Lupescu <grigore.lupescu at intel.com>
Signed-off-by: Grigore Lupescu <grigore.lupescu at intel.com>
---
backend/src/backend/gen_context.cpp | 28 ++++++++++++++++++++++++----
1 file changed, 24 insertions(+), 4 deletions(-)
diff --git a/backend/src/backend/gen_context.cpp b/backend/src/backend/gen_context.cpp
index 764c1cb..bf66295 100644
--- a/backend/src/backend/gen_context.cpp
+++ b/backend/src/backend/gen_context.cpp
@@ -2763,12 +2763,32 @@ namespace gbe
if(wg_op == ir::WORKGROUP_OP_INCLUSIVE_ADD
|| wg_op == ir::WORKGROUP_OP_EXCLUSIVE_ADD)
p->ADD(dst, dst, partialData);
- else if(wg_op == ir::WORKGROUP_OP_INCLUSIVE_MIN
- || wg_op == ir::WORKGROUP_OP_EXCLUSIVE_MIN)
+ else if(wg_op == ir::WORKGROUP_OP_INCLUSIVE_MIN || wg_op == ir::WORKGROUP_OP_EXCLUSIVE_MIN)
+ {
p->SEL_CMP(GEN_CONDITIONAL_LE, dst, dst, partialData);
- else if(wg_op == ir::WORKGROUP_OP_INCLUSIVE_MAX
- || wg_op == ir::WORKGROUP_OP_EXCLUSIVE_MAX)
+ /* workaround QW datatype on CMP */
+ if(dst.type == GEN_TYPE_UL || dst.type == GEN_TYPE_L){
+ p->SEL_CMP(GEN_CONDITIONAL_LE, dst.offset(dst, 1, 0),
+ dst.offset(dst, 1, 0), partialData);
+ p->SEL_CMP(GEN_CONDITIONAL_LE, dst.offset(dst, 2, 0),
+ dst.offset(dst, 2, 0), partialData);
+ p->SEL_CMP(GEN_CONDITIONAL_LE, dst.offset(dst, 3, 0),
+ dst.offset(dst, 3, 0), partialData);
+ }
+ }
+ else if(wg_op == ir::WORKGROUP_OP_INCLUSIVE_MAX || wg_op == ir::WORKGROUP_OP_EXCLUSIVE_MAX)
+ {
p->SEL_CMP(GEN_CONDITIONAL_GE, dst, dst, partialData);
+ /* workaround QW datatype on CMP */
+ if(dst.type == GEN_TYPE_UL || dst.type == GEN_TYPE_L){
+ p->SEL_CMP(GEN_CONDITIONAL_GE, dst.offset(dst, 1, 0),
+ dst.offset(dst, 1, 0), partialData);
+ p->SEL_CMP(GEN_CONDITIONAL_GE, dst.offset(dst, 2, 0),
+ dst.offset(dst, 2, 0), partialData);
+ p->SEL_CMP(GEN_CONDITIONAL_GE, dst.offset(dst, 3, 0),
+ dst.offset(dst, 3, 0), partialData);
+ }
+ }
}
/* corner cases for threads 0 */
--
2.5.0
More information about the Beignet
mailing list