[Mesa-dev] [PATCH 05/11] glsl: Replace the linear search in get_intrinsic_opcode with a radix trie

Ian Romanick idr at freedesktop.org
Wed Jul 6 00:46:13 UTC 2016


From: Ian Romanick <ian.d.romanick at intel.com>

If there is a way to do this cleanly in mako, I'm very interested to
hear about it.

   text	   data	    bss	    dec	    hex	filename
7529003	 273096	  28584	7830683	 777c9b /tmp/i965_dri-64bit-before.so
7528883	 273096	  28584	7830563	 777c23	/tmp/i965_dri-64bit-after.so

Signed-off-by: Ian Romanick <ian.d.romanick at intel.com>
---
 src/compiler/glsl/nir_intrinsic_map.py | 131 ++++++++++++++++++++++++++++++---
 1 file changed, 119 insertions(+), 12 deletions(-)

diff --git a/src/compiler/glsl/nir_intrinsic_map.py b/src/compiler/glsl/nir_intrinsic_map.py
index 7f13c6c..5962d4b 100644
--- a/src/compiler/glsl/nir_intrinsic_map.py
+++ b/src/compiler/glsl/nir_intrinsic_map.py
@@ -66,6 +66,123 @@ intrinsics = [("__intrinsic_atomic_read", ("nir_intrinsic_atomic_counter_read_va
               ("__intrinsic_atomic_exchange_shared", ("nir_intrinsic_shared_atomic_exchange", None)),
               ("__intrinsic_atomic_comp_swap_shared", ("nir_intrinsic_shared_atomic_comp_swap", None))]
 
+def remove_prefix(table, prefix_length):
+    """Strip prefix_length characters off the name of each entry in table."""
+
+    return [(s[prefix_length:], d) for (s, d) in table]
+
+
+def generate_trie(table):
+    """table is a list of (string, data) tuples.  It is assumed to be sorted by
+    string.
+
+    A radix trie (or compact prefix trie) is recursively generated from the
+    list of names.  Names are paritioned into groups that have at least
+    prefix_thresh (tunable parameter) common prefix characters.  Each of these
+    groups becomes the branches at the current level of the tree.  The
+    matching prefix characters from each group is removed, and the group is
+    recursively operated on in the same fashion.
+
+    The recursion terminates when no groups can be formed with at least
+    prefix_thresh matching characters.
+
+    Each node in the trie is a 3-element tuple:
+
+        (prefix_string, [child_nodes], client_data)
+
+    One of [child_nodes] or client_data will be None.
+
+    See https://en.wikipedia.org/wiki/Radix_tree for more background details
+    on the data structure.
+
+    """
+
+    # Threshold for considering two strings to have the same prefix.
+    prefix_thresh = 1
+
+    if len(table) == 1 and table[0][0] == "":
+        return [("", None, table[0][1])]
+
+    trie_level = []
+
+    (s, d) = table[0]
+    candidates = [(s, d)]
+    base = s
+    prefix_length = len(s)
+
+    for (s, d) in table[1:]:
+        if s[:prefix_thresh] == base[:prefix_thresh]:
+            candidates.append((s, d))
+
+            l = len(s[:([x[0]==x[1] for x in zip(s, base)]+[0]).index(0)])
+            if l < prefix_length:
+                prefix_length = l
+        else:
+            trie_level.append((base[:prefix_length], generate_trie(remove_prefix(candidates, prefix_length)), None))
+
+            candidates = [(s, d)]
+            base = s
+            prefix_length = len(s)
+
+    trie_level.append((base[:prefix_length], generate_trie(remove_prefix(candidates, prefix_length)), None))
+
+    return trie_level
+
+
+def emit_trie_leaf(indent, d):
+    if d[1] is None:
+        return "{}return {};\n".format(indent, d[0])
+    else:
+        c_code = "{}int_op = {};\n".format(indent, d[0])
+        c_code += "{}uint_op = {};\n".format(indent, d[1])
+        return c_code
+
+
+def trie_as_C_code(trie, indent="   ", prefix_string="__intrinsic_"):
+    conditional = "if"
+
+    c_code = ""
+    for (s, t, d) in trie:
+        if d is not None:
+            c_code +=  "{}{} (name[0] == '\\0') {{\n".format(indent, conditional)
+            c_code += "{}   /* {} */\n".format(indent, prefix_string)
+            c_code += emit_trie_leaf(indent + "   ", d);
+
+        else:
+            # Before emitting the string comparison, check to see of the
+            # subtree has a single element with an empty string.  In that
+            # case, use strcmp() instead of strncmp() and don't advance the
+            # name pointer.
+
+            if len(t) == 1 and t[0][2] is not None:
+                if s == "":
+                    c_code += "{}{} (name[0] == '\\0') {{\n".format(indent, conditional, s)
+                else:
+                    c_code += "{}{} (strcmp(name, \"{}\") == 0) {{\n".format(indent, conditional, s)
+
+                c_code += "{}   /* {} */\n".format(indent, prefix_string + s)
+                c_code += emit_trie_leaf(indent + "   ", t[0][2]);
+            else:
+                c_code += "{}{} (strncmp(name, \"{}\", {}) == 0) {{\n".format(indent, conditional, s, len(s))
+                c_code += "{}   name += {};\n\n".format(indent, len(s))
+
+                c_code += trie_as_C_code(t, indent + "   ", prefix_string + s)
+
+        conditional = "} else if"
+
+    c_code += "{}}} else\n".format(indent)
+    c_code += "{}   unreachable(\"Invalid intrinsic name\");\n\n".format(indent)
+    return c_code
+
+
+intrinsics.sort(key=lambda tup: tup[0])
+
+trimmed_name_intrinsics = []
+for (s, d) in intrinsics:
+    trimmed_name_intrinsics.append((s[12:], d))
+
+trie_search = trie_as_C_code(generate_trie(trimmed_name_intrinsics))
+
 template = """
 namespace _glsl_to_nir {
 
@@ -80,17 +197,7 @@ get_intrinsic_opcode(const char *name, const ir_dereference *return_deref)
    nir_intrinsic_op int_op;
    nir_intrinsic_op uint_op;
 
-    % for (name, ops) in intrinsics:
-   if (strcmp(name, "${name[12:]}") == 0) {
-        % if ops[1] is None:
-      return ${ops[0]};
-        % else:
-      int_op = ${ops[0]};
-      uint_op = ${ops[1]};
-        % endif
-   } else
-    % endfor
-      unreachable("Unknown intrinsic name");
+${trie_search}
 
    assert(return_deref);
    if (return_deref->type == glsl_type::int_type)
@@ -103,4 +210,4 @@ get_intrinsic_opcode(const char *name, const ir_dereference *return_deref)
 }
 """
 
-print(Template(template).render(intrinsics=intrinsics))
+print(Template(template).render(trie_search=trie_search))
-- 
2.5.5



More information about the mesa-dev mailing list