[Mesa-dev] [PATCH] glsl: Add an optimization pass to flatten simple nested if blocks.
Eric Anholt
eric at anholt.net
Thu Apr 4 15:50:52 PDT 2013
Eric Anholt <eric at anholt.net> writes:
> Kenneth Graunke <kenneth at whitecape.org> writes:
>
>> On 04/04/2013 09:08 AM, Eric Anholt wrote:
>>> Kenneth Graunke <kenneth at whitecape.org> writes:
>>>> diff --git a/src/glsl/Makefile.sources b/src/glsl/Makefile.sources
>>>> index c294aa4..b5282a6 100644
>>>> --- a/src/glsl/Makefile.sources
>>>> +++ b/src/glsl/Makefile.sources
>>>> @@ -80,6 +80,7 @@ LIBGLSL_FILES = \
>>>> $(GLSL_SRCDIR)/opt_dead_code.cpp \
>>>> $(GLSL_SRCDIR)/opt_dead_code_local.cpp \
>>>> $(GLSL_SRCDIR)/opt_dead_functions.cpp \
>>>> + $(GLSL_SRCDIR)/opt_flatten_nested_if_blocks.cpp \
>>>> $(GLSL_SRCDIR)/opt_function_inlining.cpp \
>>>> $(GLSL_SRCDIR)/opt_if_simplification.cpp \
>>>> $(GLSL_SRCDIR)/opt_noop_swizzle.cpp \
>>>> diff --git a/src/glsl/glsl_parser_extras.cpp b/src/glsl/glsl_parser_extras.cpp
>>>> index 9740903..0992294 100644
>>>> --- a/src/glsl/glsl_parser_extras.cpp
>>>> +++ b/src/glsl/glsl_parser_extras.cpp
>>>> @@ -1218,6 +1218,7 @@ do_common_optimization(exec_list *ir, bool linked,
>>>> progress = do_structure_splitting(ir) || progress;
>>>> }
>>>> progress = do_if_simplification(ir) || progress;
>>>> + progress = opt_flatten_nested_if_blocks(ir) || progress;
>>>> progress = do_copy_propagation(ir) || progress;
>>>> progress = do_copy_propagation_elements(ir) || progress;
>>>> if (linked)
>>>> diff --git a/src/glsl/ir_optimization.h b/src/glsl/ir_optimization.h
>>>> index 2454bbe..a8885d7 100644
>>>> --- a/src/glsl/ir_optimization.h
>>>> +++ b/src/glsl/ir_optimization.h
>>>> @@ -82,6 +82,7 @@ bool do_function_inlining(exec_list *instructions);
>>>> bool do_lower_jumps(exec_list *instructions, bool pull_out_jumps = true, bool lower_sub_return = true, bool lower_main_return = false, bool lower_continue = false, bool lower_break = false);
>>>> bool do_lower_texture_projection(exec_list *instructions);
>>>> bool do_if_simplification(exec_list *instructions);
>>>> +bool opt_flatten_nested_if_blocks(exec_list *instructions);
>>>> bool do_discard_simplification(exec_list *instructions);
>>>> bool lower_if_to_cond_assign(exec_list *instructions, unsigned max_depth = 0);
>>>> bool do_mat_op_to_vec(exec_list *instructions);
>>>> diff --git a/src/glsl/opt_flatten_nested_if_blocks.cpp b/src/glsl/opt_flatten_nested_if_blocks.cpp
>>>> new file mode 100644
>>>> index 0000000..c702102
>>>> --- /dev/null
>>>> +++ b/src/glsl/opt_flatten_nested_if_blocks.cpp
>>>> @@ -0,0 +1,103 @@
>>>> +/*
>>>> + * Copyright © 2013 Intel Corporation
>>>> + *
>>>> + * Permission is hereby granted, free of charge, to any person obtaining a
>>>> + * copy of this software and associated documentation files (the "Software"),
>>>> + * to deal in the Software without restriction, including without limitation
>>>> + * the rights to use, copy, modify, merge, publish, distribute, sublicense,
>>>> + * and/or sell copies of the Software, and to permit persons to whom the
>>>> + * Software is furnished to do so, subject to the following conditions:
>>>> + *
>>>> + * The above copyright notice and this permission notice (including the next
>>>> + * paragraph) shall be included in all copies or substantial portions of the
>>>> + * Software.
>>>> + *
>>>> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
>>>> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
>>>> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
>>>> + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
>>>> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
>>>> + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
>>>> + * DEALINGS IN THE SOFTWARE.
>>>> + */
>>>> +
>>>> +/**
>>>> + * \file opt_flatten_nested_if_blocks.cpp
>>>> + *
>>>> + * Flattens nested if blocks such as:
>>>> + *
>>>> + * if (x) {
>>>> + * if (y) {
>>>> + * ...
>>>> + * }
>>>> + * }
>>>> + *
>>>> + * into a single if block with a combined condition:
>>>> + *
>>>> + * if (x && y) {
>>>> + * ...
>>>> + * }
>>>> + */
>>>> +
>>>> +#include "ir.h"
>>>> +#include "ir_builder.h"
>>>> +
>>>> +using namespace ir_builder;
>>>> +
>>>> +namespace {
>>>> +
>>>> +class nested_if_flattener : public ir_hierarchical_visitor {
>>>> +public:
>>>> + nested_if_flattener()
>>>> + {
>>>> + progress = false;
>>>> + }
>>>> +
>>>> + ir_visitor_status visit_leave(ir_if *);
>>>> + ir_visitor_status visit_enter(ir_assignment *);
>>>> +
>>>> + bool progress;
>>>> +};
>>>> +
>>>> +} /* unnamed namespace */
>>>> +
>>>> +/* We only care about the top level "if" instructions, so don't
>>>> + * descend into expressions.
>>>> + */
>>>> +ir_visitor_status
>>>> +nested_if_flattener::visit_enter(ir_assignment *ir)
>>>> +{
>>>> + (void) ir;
>>>> + return visit_continue_with_parent;
>>>> +}
>>>> +
>>>> +bool
>>>> +opt_flatten_nested_if_blocks(exec_list *instructions)
>>>> +{
>>>> + nested_if_flattener v;
>>>> +
>>>> + v.run(instructions);
>>>> + return v.progress;
>>>> +}
>>>> +
>>>> +
>>>> +ir_visitor_status
>>>> +nested_if_flattener::visit_leave(ir_if *ir)
>>>> +{
>>>> + /* Only handle a single ir_if within the then clause of an ir_if. No extra
>>>> + * instructions, no else clauses, nothing.
>>>> + */
>>>> + if (ir->then_instructions.is_empty() || !ir->else_instructions.is_empty())
>>>> + return visit_continue;
>>>> +
>>>> + ir_if *inner = ((ir_instruction *) ir->then_instructions.head)->as_if();
>>>> + if (!inner || !inner->next->is_tail_sentinel() ||
>>>> + !inner->else_instructions.is_empty())
>>>> + return visit_continue;
>>>> +
>>>> + ir->condition = logic_and(ir->condition, inner->condition);
>>>> + inner->then_instructions.move_nodes_to(&ir->then_instructions);
>>>> +
>>>
>>> Also inner->remove() right now instead of leaving it up to the
>>> empty-if-statement-remover? Equivalent functionality, but may take one
>>> less turn through the giant loop.
>>
>> It's not actually necessary. move_nodes_to throws away all nodes in the
>> target list, effectively doing the remove for us.
>
> that makes inner->then_instructions empty, but it still leaves inner in
> the outer's instruction list.
Ken corrected me, the move_nodes_to interface was unbelievable to me but
it really is that way.
-------------- next part --------------
A non-text attachment was scrubbed...
Name: not available
Type: application/pgp-signature
Size: 197 bytes
Desc: not available
URL: <http://lists.freedesktop.org/archives/mesa-dev/attachments/20130404/f3706985/attachment.pgp>
More information about the mesa-dev
mailing list