[Beignet] [PATCH 2/3] support 64bit-integer AND(&), OR(|), XOR(^) arithmetic
Homer Hsing
homer.xing at intel.com
Tue Aug 6 01:01:30 PDT 2013
Signed-off-by: Homer Hsing <homer.xing at intel.com>
---
backend/src/backend/gen_context.cpp | 102 +++++++++++++++++++++++++++++
backend/src/backend/gen_insn_selection.cpp | 24 ++++++-
backend/src/backend/gen_insn_selection.hxx | 3 +
backend/src/ir/instruction.cpp | 1 +
4 files changed, 127 insertions(+), 3 deletions(-)
diff --git a/backend/src/backend/gen_context.cpp b/backend/src/backend/gen_context.cpp
index 69dab85..bbe16d0 100644
--- a/backend/src/backend/gen_context.cpp
+++ b/backend/src/backend/gen_context.cpp
@@ -162,6 +162,108 @@ namespace gbe
case SEL_OP_AND: p->AND(dst, src0, src1); break;
case SEL_OP_OR: p->OR (dst, src0, src1); break;
case SEL_OP_XOR: p->XOR(dst, src0, src1); break;
+ case SEL_OP_I64AND:
+ {
+ GenRegister xdst = GenRegister::retype(dst, GEN_TYPE_UL),
+ xsrc0 = GenRegister::retype(src0, GEN_TYPE_UL),
+ xsrc1 = GenRegister::retype(src1, GEN_TYPE_UL);
+ int execWidth = p->curr.execWidth;
+ p->push();
+ p->curr.execWidth = 8;
+ p->AND(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->AND(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ p->curr.nibControl = 1;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->AND(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->AND(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ if (execWidth == 16) {
+ p->curr.quarterControl = 1;
+ p->curr.nibControl = 0;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->AND(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->AND(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ p->curr.nibControl = 1;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->AND(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->AND(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ }
+ p->pop();
+ }
+ break;
+ case SEL_OP_I64OR:
+ {
+ GenRegister xdst = GenRegister::retype(dst, GEN_TYPE_UL),
+ xsrc0 = GenRegister::retype(src0, GEN_TYPE_UL),
+ xsrc1 = GenRegister::retype(src1, GEN_TYPE_UL);
+ int execWidth = p->curr.execWidth;
+ p->push();
+ p->curr.execWidth = 8;
+ p->OR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->OR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ p->curr.nibControl = 1;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->OR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->OR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ if (execWidth == 16) {
+ p->curr.quarterControl = 1;
+ p->curr.nibControl = 0;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->OR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->OR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ p->curr.nibControl = 1;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->OR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->OR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ }
+ p->pop();
+ }
+ break;
+ case SEL_OP_I64XOR:
+ {
+ GenRegister xdst = GenRegister::retype(dst, GEN_TYPE_UL),
+ xsrc0 = GenRegister::retype(src0, GEN_TYPE_UL),
+ xsrc1 = GenRegister::retype(src1, GEN_TYPE_UL);
+ int execWidth = p->curr.execWidth;
+ p->push();
+ p->curr.execWidth = 8;
+ p->XOR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->XOR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ p->curr.nibControl = 1;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->XOR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->XOR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ if (execWidth == 16) {
+ p->curr.quarterControl = 1;
+ p->curr.nibControl = 0;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->XOR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->XOR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ p->curr.nibControl = 1;
+ xdst = GenRegister::suboffset(xdst, 4),
+ xsrc0 = GenRegister::suboffset(xsrc0, 4),
+ xsrc1 = GenRegister::suboffset(xsrc1, 4);
+ p->XOR(xdst.bottom_half(), xsrc0.bottom_half(), xsrc1.bottom_half());
+ p->XOR(xdst.top_half(), xsrc0.top_half(), xsrc1.top_half());
+ }
+ p->pop();
+ }
+ break;
case SEL_OP_SHR: p->SHR(dst, src0, src1); break;
case SEL_OP_SHL: p->SHL(dst, src0, src1); break;
case SEL_OP_RSR: p->RSR(dst, src0, src1); break;
diff --git a/backend/src/backend/gen_insn_selection.cpp b/backend/src/backend/gen_insn_selection.cpp
index 66cfa31..7e9402d 100644
--- a/backend/src/backend/gen_insn_selection.cpp
+++ b/backend/src/backend/gen_insn_selection.cpp
@@ -423,6 +423,9 @@ namespace gbe
ALU2(AND)
ALU2(OR)
ALU2(XOR)
+ ALU2(I64AND)
+ ALU2(I64OR)
+ ALU2(I64XOR)
ALU2(SHR)
ALU2(SHL)
ALU2(RSR)
@@ -1434,9 +1437,24 @@ namespace gbe
sel.ADD(dst, src0, src1);
sel.pop();
break;
- case OP_XOR: sel.XOR(dst, src0, src1); break;
- case OP_OR: sel.OR(dst, src0, src1); break;
- case OP_AND: sel.AND(dst, src0, src1); break;
+ case OP_XOR:
+ if (type == Type::TYPE_U64 || type == Type::TYPE_S64)
+ sel.I64XOR(dst, src0, src1);
+ else
+ sel.XOR(dst, src0, src1);
+ break;
+ case OP_OR:
+ if (type == Type::TYPE_U64 || type == Type::TYPE_S64)
+ sel.I64OR(dst, src0, src1);
+ else
+ sel.OR(dst, src0, src1);
+ break;
+ case OP_AND:
+ if (type == Type::TYPE_U64 || type == Type::TYPE_S64)
+ sel.I64AND(dst, src0, src1);
+ else
+ sel.AND(dst, src0, src1);
+ break;
case OP_SUB:
if (type == Type::TYPE_U64 || type == Type::TYPE_S64) {
GenRegister t = sel.selReg(sel.reg(RegisterFamily::FAMILY_QWORD), Type::TYPE_S64);
diff --git a/backend/src/backend/gen_insn_selection.hxx b/backend/src/backend/gen_insn_selection.hxx
index 8eeb19f..7664c8f 100644
--- a/backend/src/backend/gen_insn_selection.hxx
+++ b/backend/src/backend/gen_insn_selection.hxx
@@ -14,6 +14,9 @@ DECL_SELECTION_IR(SEL, BinaryInstruction)
DECL_SELECTION_IR(AND, BinaryInstruction)
DECL_SELECTION_IR(OR, BinaryInstruction)
DECL_SELECTION_IR(XOR, BinaryInstruction)
+DECL_SELECTION_IR(I64AND, BinaryInstruction)
+DECL_SELECTION_IR(I64OR, BinaryInstruction)
+DECL_SELECTION_IR(I64XOR, BinaryInstruction)
DECL_SELECTION_IR(SHR, BinaryInstruction)
DECL_SELECTION_IR(SHL, BinaryInstruction)
DECL_SELECTION_IR(RSR, BinaryInstruction)
diff --git a/backend/src/ir/instruction.cpp b/backend/src/ir/instruction.cpp
index 2589848..f58757b 100644
--- a/backend/src/ir/instruction.cpp
+++ b/backend/src/ir/instruction.cpp
@@ -672,6 +672,7 @@ namespace ir {
static const Type logicalType[] = {TYPE_S8, TYPE_U8,
TYPE_S16, TYPE_U16,
TYPE_S32, TYPE_U32,
+ TYPE_S64, TYPE_U64,
TYPE_BOOL};
static const uint32_t logicalTypeNum = ARRAY_ELEM_NUM(logicalType);
--
1.8.1.2
More information about the Beignet
mailing list