# Copyright (C) 2014 Intel Corporation
#
# Permission is hereby granted, free of charge, to any person obtaining a
# copy of this software and associated documentation files (the "Software"),
# to deal in the Software without restriction, including without limitation
# the rights to use, copy, modify, merge, publish, distribute, sublicense,
# and/or sell copies of the Software, and to permit persons to whom the
# Software is furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice (including the next
# paragraph) shall be included in all copies or substantial portions of the
# Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
# IN THE SOFTWARE.
#
#    Jason Ekstrand (jason@jlekstrand.net)
27 from __future__
import print_function
35 # Represents a set of variables, each with a unique id
39 self
.ids
= itertools
.count()
40 self
.immutable
= False;
def __getitem__(self, name):
    """Return the unique integer id of the variable called ``name``.

    The first lookup of a name takes the next value from ``self.ids`` and
    records it in ``self.names``; every later lookup returns the recorded
    id.

    Raises:
        AssertionError: if ``name`` has not been seen before and
            ``self.immutable`` is set.
    """
    if name not in self.names:
        assert not self.immutable, "Unknown replacement variable: " + name
        # The next() builtin works on Python 2.6+ and on Python 3; the
        # iterator's own .next() method only exists on Python 2.
        self.names[name] = next(self.ids)

    return self.names[name]
def create(val, name_base, varset):
    """Build the search value that corresponds to ``val``.

    Args:
        val: a tuple (wrapped in an Expression), an existing Expression
            (returned unchanged), a string (wrapped in a Variable) or a
            bool/int/float (wrapped in a Constant).
        name_base: name handed to the object that gets created.
        varset: variable set passed on to Expression and Variable.

    Returns:
        An Expression, Variable or Constant.

    Raises:
        TypeError: if ``val`` is of none of the supported kinds.
    """
    # ``unicode`` and ``long`` only exist on Python 2; on Python 3 ``str``
    # and ``int`` already cover those cases.
    try:
        string_types = (str, unicode)
        number_types = (bool, int, long, float)
    except NameError:
        string_types = (str,)
        number_types = (bool, int, float)

    if isinstance(val, tuple):
        return Expression(val, name_base, varset)
    if isinstance(val, Expression):
        # Already a fully built expression; use it as is.
        return val
    if isinstance(val, string_types):
        return Variable(val, name_base, varset)
    if isinstance(val, number_types):
        return Constant(val, name_base)

    # Fail here, where the offending value is known, instead of handing
    # None back to the caller.
    raise TypeError("Cannot create a search value from {0!r}".format(val))
64 __template
= mako
.template
.Template("""
65 static const ${val.c_type} ${val.name} = {
67 % if isinstance(val, Constant):
68 ${val.type()}, { ${hex(val)} /* ${val.value} */ },
69 % elif isinstance(val, Variable):
70 ${val.index}, /* ${val.var_name} */
71 ${'true' if val.is_constant else 'false'},
72 ${val.type() or 'nir_type_invalid' },
73 % elif isinstance(val, Expression):
74 ${'true' if val.inexact else 'false'},
76 { ${', '.join(src.c_ptr for src in val.sources)} },
def __init__(self, name, type_str):
    """Store the name and the kind of this search value.

    Args:
        name: kept as ``self.name``; the C-pointer expression of the
            value is built from it.
        type_str: kept as ``self.type_str``; used as the suffix of the
            ``nir_search_*`` names of the value.
    """
    self.name = name
    self.type_str = type_str
86 return "nir_search_value_" + self
.type_str
90 return "nir_search_" + self
.type_str
94 return "&{0}.value".format(self
.name
)
97 return self
.__template
.render(val
=self
,
100 Expression
=Expression
)
class Constant(Value):
    """A literal bool, integer or float that appears in a pattern."""

    # ``long`` only exists on Python 2; on Python 3 ``int`` covers it.
    try:
        _int_types = (int, long)
    except NameError:
        _int_types = (int,)

    def __init__(self, val, name):
        """Wrap the literal ``val`` as a search value called ``name``."""
        Value.__init__(self, name, "constant")
        self.value = val

    def __hex__(self):
        """Return the text used to initialise the constant in the C output.

        Booleans become ``NIR_TRUE``/``NIR_FALSE``, integers their hex
        form, and floats the hex form of their 64-bit bit pattern.

        NOTE(review): hex() only consults ``__hex__`` on Python 2.

        Raises:
            TypeError: if the wrapped value is of an unsupported type.
        """
        # bool is a subclass of int, so it has to be tested first.
        if isinstance(self.value, bool):
            return 'NIR_TRUE' if self.value else 'NIR_FALSE'
        if isinstance(self.value, self._int_types):
            return hex(self.value)
        if isinstance(self.value, float):
            # Reinterpret the 8 bytes of the double as an unsigned integer.
            return hex(struct.unpack('Q', struct.pack('d', self.value))[0])
        raise TypeError(
            "Unsupported constant type: " + type(self.value).__name__)

    def type(self):
        """Return the ``nir_type_*`` name for the value, or None."""
        # bool is a subclass of int, so it has to be tested first.
        if isinstance(self.value, bool):
            return "nir_type_bool32"
        if isinstance(self.value, self._int_types):
            return "nir_type_int"
        if isinstance(self.value, float):
            return "nir_type_float"
        return None
# Textual form of a pattern variable: an optional leading '#' (group
# "const"), the variable name (group "name") and an optional '@type'
# suffix (group "type").
_var_name_re = re.compile(
    r"(?P<const>#)?(?P<name>\w+)(?:@(?P<type>\w+))?"
)
class Variable(Value):
    """A named placeholder in a search or replace pattern.

    The textual form is ``[#]name[@type]``: a leading ``#`` sets
    ``is_constant`` and an ``@type`` suffix sets ``required_type``.
    """

    # Maps a required type to the nir_type_* name emitted for it.
    _nir_types = {
        'bool': "nir_type_bool32",
        'int': "nir_type_int",
        'uint': "nir_type_int",
        'float': "nir_type_float",
    }

    def __init__(self, val, name, varset):
        """Parse ``val`` and look the variable up in ``varset``.

        Args:
            val: textual form of the variable.
            name: name of this search value.
            varset: indexed with the variable name to obtain ``self.index``.

        Raises:
            AssertionError: if ``val`` does not start with a variable
                name, or names a type other than float, bool, int or uint.
        """
        Value.__init__(self, name, "variable")

        m = _var_name_re.match(val)
        assert m and m.group('name') is not None

        self.var_name = m.group('name')
        self.is_constant = m.group('const') is not None
        self.required_type = m.group('type')

        if self.required_type is not None:
            assert self.required_type in ('float', 'bool', 'int', 'uint')

        self.index = varset[self.var_name]

    def type(self):
        """Return the ``nir_type_*`` name of the required type, or None."""
        return self._nir_types.get(self.required_type)
# Textual form of an expression head: an optional leading '~' (group
# "inexact") followed by the opcode name (group "opcode").
_opcode_re = re.compile(
    r"(?P<inexact>~)?(?P<opcode>\w+)"
)
class Expression(Value):
    """An opcode applied to a list of source values.

    Built from a tuple whose first element is the opcode string,
    optionally prefixed with ``~`` to mark the expression as inexact, and
    whose remaining elements are the sources.
    """

    def __init__(self, expr, name_base, varset):
        """Parse the tuple ``expr`` and build a value for every source.

        Args:
            expr: tuple of the form ``(opcode, source, ...)``.
            name_base: name of this value; source number ``i`` is named
                ``"<name_base>_<i>"``.
            varset: variable set passed on to ``Value.create``.

        Raises:
            AssertionError: if ``expr`` is not a tuple or its first
                element does not start with an opcode name.
        """
        Value.__init__(self, name_base, "expression")
        assert isinstance(expr, tuple)

        m = _opcode_re.match(expr[0])
        assert m and m.group('opcode') is not None

        self.opcode = m.group('opcode')
        self.inexact = m.group('inexact') is not None
        self.sources = [
            Value.create(src, "{0}_{1}".format(name_base, i), varset)
            for (i, src) in enumerate(expr[1:])
        ]

    def render(self):
        """Return the rendering of all sources followed by this value's."""
        srcs = "\n".join(src.render() for src in self.sources)
        return srcs + super(Expression, self).render()
# Counter that hands out the id of each SearchAndReplace, starting at 0.
_optimization_ids = itertools.count(0)
# Distinct condition strings referenced by the transforms; SearchAndReplace
# appends to it and stores the position of its own condition.
condition_list = ["true"]
class SearchAndReplace(object):
    """One transformation: a search expression, its replacement and a condition."""

    def __init__(self, transform):
        """Parse ``transform`` into search and replace values.

        Args:
            transform: sequence ``(search, replace[, condition])``. The
                condition defaults to ``'true'``.

        The condition is added to the module-level ``condition_list`` if
        it is not there yet, and its position is kept in
        ``self.condition_index``.
        """
        # The next() builtin works on Python 2.6+ and on Python 3.
        self.id = next(_optimization_ids)

        search = transform[0]
        replace = transform[1]
        if len(transform) > 2:
            self.condition = transform[2]
        else:
            self.condition = 'true'

        if self.condition not in condition_list:
            condition_list.append(self.condition)
        self.condition_index = condition_list.index(self.condition)

        # NOTE(review): assumes the variable-set class defined earlier in
        # this module is called VarSet -- confirm.
        varset = VarSet()
        if isinstance(search, Expression):
            self.search = search
        else:
            self.search = Expression(search, "search{0}".format(self.id),
                                     varset)

        # From here on, looking up a name the search side did not
        # introduce fails with "Unknown replacement variable".
        varset.immutable = True

        if isinstance(replace, Value):
            self.replace = replace
        else:
            self.replace = Value.create(replace,
                                        "replace{0}".format(self.id), varset)
202 _algebraic_pass_template
= mako
.template
.Template("""
204 #include "nir_search.h"
206 #ifndef NIR_OPT_ALGEBRAIC_STRUCT_DEFS
207 #define NIR_OPT_ALGEBRAIC_STRUCT_DEFS
210 const nir_search_expression *search;
211 const nir_search_value *replace;
212 unsigned condition_offset;
218 const bool *condition_flags;
223 % for (opcode, xform_list) in xform_dict.iteritems():
224 % for xform in xform_list:
225 ${xform.search.render()}
226 ${xform.replace.render()}
229 static const struct transform ${pass_name}_${opcode}_xforms[] = {
230 % for xform in xform_list:
231 { &${xform.search.name}, ${xform.replace.c_ptr}, ${xform.condition_index} },
237 ${pass_name}_block(nir_block *block, void *void_state)
239 struct opt_state *state = void_state;
241 nir_foreach_instr_reverse_safe(block, instr) {
242 if (instr->type != nir_instr_type_alu)
245 nir_alu_instr *alu = nir_instr_as_alu(instr);
246 if (!alu->dest.dest.is_ssa)
250 % for opcode in xform_dict.keys():
251 case nir_op_${opcode}:
252 for (unsigned i = 0; i < ARRAY_SIZE(${pass_name}_${opcode}_xforms); i++) {
253 const struct transform *xform = &${pass_name}_${opcode}_xforms[i];
254 if (state->condition_flags[xform->condition_offset] &&
255 nir_replace_instr(alu, xform->search, xform->replace,
257 state->progress = true;
272 ${pass_name}_impl(nir_function_impl *impl, const bool *condition_flags)
274 struct opt_state state;
276 state.mem_ctx = ralloc_parent(impl);
277 state.progress = false;
278 state.condition_flags = condition_flags;
280 nir_foreach_block_reverse_call(impl, ${pass_name}_block, &state);
283 nir_metadata_preserve(impl, nir_metadata_block_index |
284 nir_metadata_dominance);
286 return state.progress;
291 ${pass_name}(nir_shader *shader)
293 bool progress = false;
294 bool condition_flags[${len(condition_list)}];
295 const nir_shader_compiler_options *options = shader->options;
298 % for index, condition in enumerate(condition_list):
299 condition_flags[${index}] = ${condition};
302 nir_foreach_function(shader, function) {
304 progress |= ${pass_name}_impl(function->impl, condition_flags);
class AlgebraicPass(object):
    """A named pass made of transformations grouped by search opcode."""

    def __init__(self, pass_name, transforms):
        """Parse ``transforms`` and group them by opcode.

        Args:
            pass_name: kept as ``self.pass_name`` and handed to the
                template by ``render``.
            transforms: iterable of SearchAndReplace objects, or of
                sequences from which a SearchAndReplace is built.

        Raises:
            SystemExit: with status 1, after every transformation has
                been processed, if at least one failed to parse.
        """
        self.xform_dict = {}
        self.pass_name = pass_name

        error = False

        for xform in transforms:
            if not isinstance(xform, SearchAndReplace):
                try:
                    xform = SearchAndReplace(xform)
                except Exception:
                    print("Failed to parse transformation:", file=sys.stderr)
                    print(" " + str(xform), file=sys.stderr)
                    traceback.print_exc(file=sys.stderr)
                    print('', file=sys.stderr)
                    # Keep going so that every bad transformation is
                    # reported in a single run.
                    error = True
                    continue

            self.xform_dict.setdefault(xform.search.opcode, []).append(xform)

        if error:
            sys.exit(1)

    def render(self):
        """Return the pass template rendered for this pass."""
        return _algebraic_pass_template.render(pass_name=self.pass_name,
                                               xform_dict=self.xform_dict,
                                               condition_list=condition_list)