[Mesa-dev] [PATCH 08/23] glsl: Optimize certain if-statements to just casts from the condition
Ian Romanick
idr at freedesktop.org
Fri Mar 20 13:58:08 PDT 2015
From: Ian Romanick <ian.d.romanick at intel.com>
Some shaders end up with code that looks something like:
if (condition)
result = 1.0;
else
result = 0.0;
This pass converts those if-statements to
result = float(condition);
Of the shaders hurt, 12 of them are vertex shaders "hurt" by virtue of
having a loop unrolled.
Shader-db results:
GM45 (0x2A42):
total instructions in shared programs: 3550788 -> 3548093 (-0.08%)
instructions in affected programs: 231205 -> 228510 (-1.17%)
helped: 712
HURT: 43
Iron Lake (0x0046):
total instructions in shared programs: 4980593 -> 4977700 (-0.06%)
instructions in affected programs: 267985 -> 265092 (-1.08%)
helped: 852
HURT: 56
GAINED: 3
LOST: 24
Sandy Bridge (0x0116):
total instructions in shared programs: 6817050 -> 6806224 (-0.16%)
instructions in affected programs: 696386 -> 685560 (-1.55%)
helped: 2510
HURT: 34
GAINED: 1
LOST: 11
Sandy Bridge (0x0116) NIR:
total instructions in shared programs: 6823377 -> 6813527 (-0.14%)
instructions in affected programs: 703053 -> 693203 (-1.40%)
helped: 2555
HURT: 52
LOST: 23
Ivy Bridge (0x0166):
total instructions in shared programs: 6289987 -> 6282273 (-0.12%)
instructions in affected programs: 542999 -> 535285 (-1.42%)
helped: 1751
HURT: 603
GAINED: 1
LOST: 3
Ivy Bridge (0x0166) NIR:
total instructions in shared programs: 6310434 -> 6303918 (-0.10%)
instructions in affected programs: 592493 -> 585977 (-1.10%)
helped: 1874
HURT: 665
GAINED: 21
Haswell (0x0426):
total instructions in shared programs: 5777713 -> 5766346 (-0.20%)
instructions in affected programs: 545464 -> 534097 (-2.08%)
helped: 2314
HURT: 32
GAINED: 1
LOST: 3
Haswell (0x0426) NIR:
total instructions in shared programs: 5791071 -> 5780761 (-0.18%)
instructions in affected programs: 565597 -> 555287 (-1.82%)
helped: 2399
HURT: 52
GAINED: 21
Broadwell (0x162E):
total instructions in shared programs: 6821371 -> 6813617 (-0.11%)
instructions in affected programs: 572656 -> 564902 (-1.35%)
helped: 2316
HURT: 28
GAINED: 2
LOST: 3
Broadwell (0x162E) NIR:
total instructions in shared programs: 7013739 -> 7006622 (-0.10%)
instructions in affected programs: 594449 -> 587332 (-1.20%)
helped: 2396
HURT: 46
Signed-off-by: Ian Romanick <ian.d.romanick at intel.com>
---
src/glsl/Makefile.sources | 1 +
src/glsl/glsl_parser_extras.cpp | 1 +
src/glsl/ir_optimization.h | 1 +
src/glsl/opt_if_to_bool_cast.cpp | 184 +++++++++++++++++++++++++++++++++++++++
4 files changed, 187 insertions(+)
create mode 100644 src/glsl/opt_if_to_bool_cast.cpp
diff --git a/src/glsl/Makefile.sources b/src/glsl/Makefile.sources
index b876642..f49fc86 100644
--- a/src/glsl/Makefile.sources
+++ b/src/glsl/Makefile.sources
@@ -173,6 +173,7 @@ LIBGLSL_FILES = \
opt_flip_matrices.cpp \
opt_function_inlining.cpp \
opt_if_simplification.cpp \
+ opt_if_to_bool_cast.cpp \
opt_minmax.cpp \
opt_noop_swizzle.cpp \
opt_rebalance_tree.cpp \
diff --git a/src/glsl/glsl_parser_extras.cpp b/src/glsl/glsl_parser_extras.cpp
index 79624bc..cb7ec2b 100644
--- a/src/glsl/glsl_parser_extras.cpp
+++ b/src/glsl/glsl_parser_extras.cpp
@@ -1626,6 +1626,7 @@ do_common_optimization(exec_list *ir, bool linked,
progress = do_structure_splitting(ir) || progress;
}
progress = do_if_simplification(ir) || progress;
+ progress = optimize_if_to_bool_cast(ir) || progress;
progress = opt_flatten_nested_if_blocks(ir) || progress;
progress = opt_conditional_discard(ir) || progress;
progress = do_copy_propagation(ir) || progress;
diff --git a/src/glsl/ir_optimization.h b/src/glsl/ir_optimization.h
index e6939f3..4892a1d3 100644
--- a/src/glsl/ir_optimization.h
+++ b/src/glsl/ir_optimization.h
@@ -134,6 +134,7 @@ void optimize_dead_builtin_variables(exec_list *instructions,
enum ir_variable_mode other);
bool lower_vertex_id(gl_shader *shader);
+bool optimize_if_to_bool_cast(exec_list *instructions);
ir_rvalue *
compare_index_block(exec_list *instructions, ir_variable *index,
diff --git a/src/glsl/opt_if_to_bool_cast.cpp b/src/glsl/opt_if_to_bool_cast.cpp
new file mode 100644
index 0000000..20a27e3
--- /dev/null
+++ b/src/glsl/opt_if_to_bool_cast.cpp
@@ -0,0 +1,184 @@
+/*
+ * Copyright © 2014 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+
+/**
+ * \file opt_if_to_bool_cast.cpp
+ * Optimize certain if-statements to just casts from the condition
+ *
+ * Some shaders end up with code that looks something like:
+ *
+ * if (some_condition)
+ * result = 1.0;
+ * else
+ * result = 0.0;
+ *
+ * This pass converts those if-statements to
+ *
+ * result = float(some_condition);
+ */
+
+#include "main/imports.h"
+#include "ir.h"
+#include "ir_builder.h"
+#include "program/prog_instruction.h"
+
+using namespace ir_builder;
+
+namespace {
+
+class ir_if_to_bool_cast_visitor : public ir_hierarchical_visitor {
+public:
+ ir_if_to_bool_cast_visitor()
+ : progress(false)
+ {
+ /* empty */
+ }
+
+ ir_visitor_status visit_leave(ir_if *);
+
+ bool progress;
+};
+
+} /* unnamed namespace */
+
+bool
+optimize_if_to_bool_cast(exec_list *instructions)
+{
+ ir_if_to_bool_cast_visitor v;
+
+ v.run(instructions);
+ return v.progress;
+}
+
+static ir_assignment *
+emit_0_or_1_assigment(ir_dereference *lhs, unsigned write_mask,
+ ir_rvalue *condition,
+ ir_rvalue *then_rhs, ir_rvalue *else_rhs)
+{
+ /* Generate the RHS of the new assignment. Note that if the old code
+ * looked like
+ *
+ * x = (cond) ? 0.0 : 1.0;
+ *
+ * we have to generate
+ *
+ * x = float(!cond);
+ */
+ if (then_rhs->is_zero())
+ condition = logic_not(condition);
+
+ ir_rvalue *rhs = NULL;
+
+ switch (then_rhs->type->base_type) {
+ case GLSL_TYPE_UINT:
+ rhs = i2u(b2i(condition));
+ break;
+ case GLSL_TYPE_INT:
+ rhs = b2i(condition);
+ break;
+ case GLSL_TYPE_FLOAT:
+ rhs = b2f(condition);
+ break;
+ case GLSL_TYPE_BOOL:
+ rhs = condition;
+ break;
+ default:
+ unreachable("invalid base type");
+ }
+
+ /* If the non-zero value was -1, negate the result of the b2[uif]
+ * operation.
+ */
+ if (then_rhs->is_negative_one() || else_rhs->is_negative_one())
+ rhs = neg(rhs);
+
+ const unsigned size = _mesa_bitcount(write_mask);
+
+ assert(size >= 1 && size <= 4);
+
+ return assign(lhs, swizzle(rhs, SWIZZLE_XXXX, size), write_mask);
+}
+
+ir_visitor_status
+ir_if_to_bool_cast_visitor::visit_leave(ir_if *ir)
+{
+ /* Both the then-block and the else-block must contain a single instruction
+ * that is an assignment.
+ */
+ ir_instruction *const then_inst =
+ (ir_instruction *) ir->then_instructions.get_head();
+ if (then_inst == NULL
+ || !then_inst->next->is_tail_sentinel()
+ || then_inst->ir_type != ir_type_assignment)
+ return visit_continue;
+
+ ir_instruction *const else_inst =
+ (ir_instruction *) ir->else_instructions.get_head();
+ if (else_inst == NULL
+ || !else_inst->next->is_tail_sentinel()
+ || else_inst->ir_type != ir_type_assignment)
+ return visit_continue;
+
+ /* That assignment must have the same write-mask and have the same LHS.
+ */
+ ir_assignment *const then_assign = then_inst->as_assignment();
+ ir_assignment *const else_assign = else_inst->as_assignment();
+
+ assert(then_assign != NULL);
+ assert(else_assign != NULL);
+
+ if (then_assign->write_mask != else_assign->write_mask
+ || then_assign->condition != NULL
+ || else_assign->condition != NULL)
+ return visit_continue;
+
+ if (!then_assign->lhs->equals(else_assign->lhs))
+ return visit_continue;
+
+ /* The RHS of the then-assignment must be 1, and the RHS of the
+ * else-assignment must be 0. Or vice-versa.
+ */
+ ir_constant *const then_rhs = then_assign->rhs->as_constant();
+ ir_constant *const else_rhs = else_assign->rhs->as_constant();
+
+ if (then_rhs == NULL || else_rhs == NULL)
+ return visit_continue;
+
+ ir_assignment *a = NULL;
+ if ((then_rhs->is_zero()
+ && (else_rhs->is_one() || else_rhs->is_negative_one()))
+ || (else_rhs->is_zero()
+ && (then_rhs->is_one() || then_rhs->is_negative_one()))) {
+ a = emit_0_or_1_assigment(then_assign->lhs, then_assign->write_mask,
+ ir->condition,
+ then_rhs, else_rhs);
+ }
+
+ if (a != NULL) {
+ ir->insert_before(a);
+ ir->remove();
+ progress = true;
+ }
+
+ return visit_continue;
+ }
--
2.1.0
More information about the mesa-dev
mailing list