*
*/
+#include <inttypes.h>
#include "nir_search.h"
struct match_state {
+ bool inexact_match;
+ bool has_exact_alu;
unsigned variables_seen;
nir_alu_src variables[NIR_SEARCH_MAX_VARIABLES];
};
for (unsigned i = 0; i < num_components; ++i)
new_swizzle[i] = instr->src[src].swizzle[swizzle[i]];
+ /* If the value has a specific bit size and it doesn't match, bail */
+ if (value->bit_size &&
+ nir_src_bit_size(instr->src[src].src) != value->bit_size)
+ return false;
+
switch (value->type) {
case nir_search_value_expression:
if (!instr->src[src].src.is_ssa)
if (instr->op != expr->opcode)
return false;
+ assert(instr->dest.dest.is_ssa);
+
+ if (expr->value.bit_size &&
+ instr->dest.dest.ssa.bit_size != expr->value.bit_size)
+ return false;
+
+ state->inexact_match = expr->inexact || state->inexact_match;
+ state->has_exact_alu = instr->exact || state->has_exact_alu;
+ if (state->inexact_match && state->has_exact_alu)
+ return false;
+
assert(!instr->dest.saturate);
assert(nir_op_infos[instr->op].num_inputs > 0);
}
}
+ if (value->bit_size) {
+ assert(!tree->is_dest_sized || tree->dest_size == value->bit_size);
+ tree->common_size = value->bit_size;
+ }
+
return tree;
}
alu->dest.write_mask = (1 << num_components) - 1;
alu->dest.saturate = false;
+ /* We have no way of knowing what values in a given search expression
+ * map to a particular replacement value. Therefore, if the
+ * expression we are replacing has any exact values, the entire
+ * replacement should be exact.
+ */
+ alu->exact = state->has_exact_alu;
+
for (unsigned i = 0; i < nir_op_infos[expr->opcode].num_inputs; i++) {
/* If the source is an explicitly sized source, then we need to reset
* the number of components to match.
case nir_search_value_constant: {
const nir_search_constant *c = nir_search_value_as_constant(value);
- nir_load_const_instr *load = nir_load_const_instr_create(mem_ctx, 1);
+ nir_load_const_instr *load =
+ nir_load_const_instr_create(mem_ctx, 1, bitsize->dest_size);
switch (c->type) {
case nir_type_float:
- load->def.name = ralloc_asprintf(mem_ctx, "%f", c->data.d);
+ load->def.name = ralloc_asprintf(load, "%f", c->data.d);
switch (bitsize->dest_size) {
case 32:
load->value.f32[0] = c->data.d;
break;
case nir_type_int:
- load->def.name = ralloc_asprintf(mem_ctx, "%ld", c->data.i);
+ load->def.name = ralloc_asprintf(load, "%" PRIi64, c->data.i);
switch (bitsize->dest_size) {
case 32:
load->value.i32[0] = c->data.i;
break;
case nir_type_uint:
- load->def.name = ralloc_asprintf(mem_ctx, "%lu", c->data.u);
+ load->def.name = ralloc_asprintf(load, "%" PRIu64, c->data.u);
switch (bitsize->dest_size) {
case 32:
load->value.u32[0] = c->data.u;
default:
unreachable("unknown bit size");
}
+ break;
case nir_type_bool32:
load->value.u32[0] = c->data.u;
unreachable("Invalid alu source type");
}
- load->def.bit_size = bitsize->dest_size;
-
nir_instr_insert_before(instr, &load->instr);
nir_alu_src val;
assert(instr->dest.dest.is_ssa);
struct match_state state;
+ state.inexact_match = false;
+ state.has_exact_alu = false;
state.variables_seen = 0;
if (!match_expression(search, instr, instr->dest.dest.ssa.num_components,
instr->dest.dest.ssa.bit_size, NULL);
mov->src[0] = construct_value(replace,
- instr->dest.dest.ssa.num_components,
- tree, &state, &instr->instr, mem_ctx);
+ instr->dest.dest.ssa.num_components, tree,
+ &state, &instr->instr, mem_ctx);
nir_instr_insert_before(&instr->instr, &mov->instr);
nir_ssa_def_rewrite_uses(&instr->dest.dest.ssa,