nir: Drop imov/fmov in favor of one mov instruction
[mesa.git] / src / compiler / nir / nir_validate.c
1 /*
2 * Copyright © 2014 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 * Authors:
24 * Connor Abbott (cwabbott0@gmail.com)
25 *
26 */
27
28 #include "nir.h"
29 #include "c11/threads.h"
30 #include <assert.h>
31
32 /*
33 * This file checks for invalid IR indicating a bug somewhere in the compiler.
34 */
35
36 /* Since this file is just a pile of asserts, don't bother compiling it if
37 * we're not building a debug build.
38 */
39 #ifndef NDEBUG
40
41 /*
42 * Per-register validation state.
43 */
44
45 typedef struct {
46 /*
47 * equivalent to the uses and defs in nir_register, but built up by the
48 * validator. At the end, we verify that the sets have the same entries.
49 */
50 struct set *uses, *if_uses, *defs;
51 nir_function_impl *where_defined; /* NULL for global registers */
52 } reg_validate_state;
53
/*
 * State shared by all validation routines while a shader is being checked.
 */
typedef struct {
   /* NOTE(review): not referenced in the visible part of this file;
    * presumably the ralloc parent of the validator's allocations - confirm.
    */
   void *mem_ctx;

   /* map of register -> validation state (reg_validate_state above) */
   struct hash_table *regs;

   /* the current shader being validated */
   nir_shader *shader;

   /* the current instruction being validated; NULL while no instruction is
    * being visited, in which case log_error() attributes failures to the
    * current variable or to the failed condition string instead
    */
   nir_instr *instr;

   /* the current variable being validated */
   nir_variable *var;

   /* the current basic block being validated */
   nir_block *block;

   /* the current if statement being validated */
   nir_if *if_stmt;

   /* the current loop being visited */
   nir_loop *loop;

   /* the parent of the current cf node being visited */
   nir_cf_node *parent_node;

   /* the current function implementation being validated */
   nir_function_impl *impl;

   /* Set of seen SSA sources.  validate_ssa_def() adds every entry of a
    * definition's use lists (if-uses are tagged with SET_PTR_BIT) and
    * validate_ssa_src() removes each entry when the source itself is
    * visited.
    */
   struct set *ssa_srcs;

   /* bitset of ssa definitions we have found; used to check uniqueness */
   BITSET_WORD *ssa_defs_found;

   /* bitset of registers we have currently found; used to check uniqueness */
   BITSET_WORD *regs_found;

   /* map of variable -> function implementation where it is defined or NULL
    * if it is a global variable
    */
   struct hash_table *var_defs;

   /* map of instruction/var/etc to failed assert string; filled in by
    * log_error()
    */
   struct hash_table *errors;
} validate_state;
101
102 static void
103 log_error(validate_state *state, const char *cond, const char *file, int line)
104 {
105 const void *obj;
106
107 if (state->instr)
108 obj = state->instr;
109 else if (state->var)
110 obj = state->var;
111 else
112 obj = cond;
113
114 char *msg = ralloc_asprintf(state->errors, "error: %s (%s:%d)",
115 cond, file, line);
116
117 _mesa_hash_table_insert(state->errors, obj, msg);
118 }
119
/*
 * Non-fatal assertion: when cond is false, the stringified condition and the
 * location of the check are handed to log_error() and execution continues.
 */
#define validate_assert(state, cond)                     \
   do {                                                  \
      if (!(cond)) {                                     \
         log_error(state, #cond, __FILE__, __LINE__);    \
      }                                                  \
   } while (0)
124
125 static void validate_src(nir_src *src, validate_state *state,
126 unsigned bit_sizes, unsigned num_components);
127
128 static void
129 validate_reg_src(nir_src *src, validate_state *state,
130 unsigned bit_sizes, unsigned num_components)
131 {
132 validate_assert(state, src->reg.reg != NULL);
133
134 struct hash_entry *entry;
135 entry = _mesa_hash_table_search(state->regs, src->reg.reg);
136 validate_assert(state, entry);
137
138 reg_validate_state *reg_state = (reg_validate_state *) entry->data;
139
140 if (state->instr) {
141 _mesa_set_add(reg_state->uses, src);
142 } else {
143 validate_assert(state, state->if_stmt);
144 _mesa_set_add(reg_state->if_uses, src);
145 }
146
147 validate_assert(state, reg_state->where_defined == state->impl &&
148 "using a register declared in a different function");
149
150 if (bit_sizes)
151 validate_assert(state, src->reg.reg->bit_size & bit_sizes);
152 if (num_components)
153 validate_assert(state, src->reg.reg->num_components == num_components);
154
155 validate_assert(state, (src->reg.reg->num_array_elems == 0 ||
156 src->reg.base_offset < src->reg.reg->num_array_elems) &&
157 "definitely out-of-bounds array access");
158
159 if (src->reg.indirect) {
160 validate_assert(state, src->reg.reg->num_array_elems != 0);
161 validate_assert(state, (src->reg.indirect->is_ssa ||
162 src->reg.indirect->reg.indirect == NULL) &&
163 "only one level of indirection allowed");
164 validate_src(src->reg.indirect, state, 32, 1);
165 }
166 }
167
/*
 * Evaluates to ptr, converted to void *, with bit number `bit` set in its
 * integer representation.  Both arguments are parenthesized so that
 * expression arguments (e.g. `a & b`) are evaluated before the shift.
 */
#define SET_PTR_BIT(ptr, bit) \
   ((void *)(((uintptr_t)(ptr)) | (((uintptr_t)1) << (bit))))
170
171 static void
172 validate_ssa_src(nir_src *src, validate_state *state,
173 unsigned bit_sizes, unsigned num_components)
174 {
175 validate_assert(state, src->ssa != NULL);
176
177 /* As we walk SSA defs, we add every use to this set. We need to make sure
178 * our use is seen in a use list.
179 */
180 struct set_entry *entry;
181 if (state->instr) {
182 entry = _mesa_set_search(state->ssa_srcs, src);
183 } else {
184 entry = _mesa_set_search(state->ssa_srcs, SET_PTR_BIT(src, 0));
185 }
186 validate_assert(state, entry);
187
188 /* This will let us prove that we've seen all the sources */
189 if (entry)
190 _mesa_set_remove(state->ssa_srcs, entry);
191
192 if (bit_sizes)
193 validate_assert(state, src->ssa->bit_size & bit_sizes);
194 if (num_components)
195 validate_assert(state, src->ssa->num_components == num_components);
196
197 /* TODO validate that the use is dominated by the definition */
198 }
199
200 static void
201 validate_src(nir_src *src, validate_state *state,
202 unsigned bit_sizes, unsigned num_components)
203 {
204 if (state->instr)
205 validate_assert(state, src->parent_instr == state->instr);
206 else
207 validate_assert(state, src->parent_if == state->if_stmt);
208
209 if (src->is_ssa)
210 validate_ssa_src(src, state, bit_sizes, num_components);
211 else
212 validate_reg_src(src, state, bit_sizes, num_components);
213 }
214
215 static void
216 validate_alu_src(nir_alu_instr *instr, unsigned index, validate_state *state)
217 {
218 nir_alu_src *src = &instr->src[index];
219
220 if (instr->op == nir_op_mov)
221 assert(!src->abs && !src->negate);
222
223 unsigned num_components = nir_src_num_components(src->src);
224 for (unsigned i = 0; i < NIR_MAX_VEC_COMPONENTS; i++) {
225 validate_assert(state, src->swizzle[i] < NIR_MAX_VEC_COMPONENTS);
226
227 if (nir_alu_instr_channel_used(instr, index, i))
228 validate_assert(state, src->swizzle[i] < num_components);
229 }
230
231 validate_src(&src->src, state, 0, 0);
232 }
233
234 static void
235 validate_reg_dest(nir_reg_dest *dest, validate_state *state,
236 unsigned bit_sizes, unsigned num_components)
237 {
238 validate_assert(state, dest->reg != NULL);
239
240 validate_assert(state, dest->parent_instr == state->instr);
241
242 struct hash_entry *entry2;
243 entry2 = _mesa_hash_table_search(state->regs, dest->reg);
244
245 validate_assert(state, entry2);
246
247 reg_validate_state *reg_state = (reg_validate_state *) entry2->data;
248 _mesa_set_add(reg_state->defs, dest);
249
250 validate_assert(state, reg_state->where_defined == state->impl &&
251 "writing to a register declared in a different function");
252
253 if (bit_sizes)
254 validate_assert(state, dest->reg->bit_size & bit_sizes);
255 if (num_components)
256 validate_assert(state, dest->reg->num_components == num_components);
257
258 validate_assert(state, (dest->reg->num_array_elems == 0 ||
259 dest->base_offset < dest->reg->num_array_elems) &&
260 "definitely out-of-bounds array access");
261
262 if (dest->indirect) {
263 validate_assert(state, dest->reg->num_array_elems != 0);
264 validate_assert(state, (dest->indirect->is_ssa || dest->indirect->reg.indirect == NULL) &&
265 "only one level of indirection allowed");
266 validate_src(dest->indirect, state, 32, 1);
267 }
268 }
269
270 static void
271 validate_ssa_def(nir_ssa_def *def, validate_state *state)
272 {
273 validate_assert(state, def->index < state->impl->ssa_alloc);
274 validate_assert(state, !BITSET_TEST(state->ssa_defs_found, def->index));
275 BITSET_SET(state->ssa_defs_found, def->index);
276
277 validate_assert(state, def->parent_instr == state->instr);
278
279 validate_assert(state, (def->num_components <= 4) ||
280 (def->num_components == 8) ||
281 (def->num_components == 16));
282
283 list_validate(&def->uses);
284 nir_foreach_use(src, def) {
285 validate_assert(state, src->is_ssa);
286 validate_assert(state, src->ssa == def);
287 bool already_seen = false;
288 _mesa_set_search_and_add(state->ssa_srcs, src, &already_seen);
289 /* A nir_src should only appear once and only in one SSA def use list */
290 validate_assert(state, !already_seen);
291 }
292
293 list_validate(&def->if_uses);
294 nir_foreach_if_use(src, def) {
295 validate_assert(state, src->is_ssa);
296 validate_assert(state, src->ssa == def);
297 bool already_seen = false;
298 _mesa_set_search_and_add(state->ssa_srcs, SET_PTR_BIT(src, 0),
299 &already_seen);
300 /* A nir_src should only appear once and only in one SSA def use list */
301 validate_assert(state, !already_seen);
302 }
303 }
304
305 static void
306 validate_dest(nir_dest *dest, validate_state *state,
307 unsigned bit_sizes, unsigned num_components)
308 {
309 if (dest->is_ssa) {
310 if (bit_sizes)
311 validate_assert(state, dest->ssa.bit_size & bit_sizes);
312 if (num_components)
313 validate_assert(state, dest->ssa.num_components == num_components);
314 validate_ssa_def(&dest->ssa, state);
315 } else {
316 validate_reg_dest(&dest->reg, state, bit_sizes, num_components);
317 }
318 }
319
320 static void
321 validate_alu_dest(nir_alu_instr *instr, validate_state *state)
322 {
323 nir_alu_dest *dest = &instr->dest;
324
325 if (instr->op == nir_op_mov)
326 assert(!dest->saturate);
327
328 unsigned dest_size = nir_dest_num_components(dest->dest);
329 /*
330 * validate that the instruction doesn't write to components not in the
331 * register/SSA value
332 */
333 validate_assert(state, !(dest->write_mask & ~((1 << dest_size) - 1)));
334
335 /* validate that saturate is only ever used on instructions with
336 * destinations of type float
337 */
338 nir_alu_instr *alu = nir_instr_as_alu(state->instr);
339 validate_assert(state,
340 (nir_alu_type_get_base_type(nir_op_infos[alu->op].output_type) ==
341 nir_type_float) ||
342 !dest->saturate);
343
344 validate_dest(&dest->dest, state, 0, 0);
345 }
346
347 static void
348 validate_alu_instr(nir_alu_instr *instr, validate_state *state)
349 {
350 validate_assert(state, instr->op < nir_num_opcodes);
351
352 unsigned instr_bit_size = 0;
353 for (unsigned i = 0; i < nir_op_infos[instr->op].num_inputs; i++) {
354 nir_alu_type src_type = nir_op_infos[instr->op].input_types[i];
355 unsigned src_bit_size = nir_src_bit_size(instr->src[i].src);
356 if (nir_alu_type_get_type_size(src_type)) {
357 validate_assert(state, src_bit_size == nir_alu_type_get_type_size(src_type));
358 } else if (instr_bit_size) {
359 validate_assert(state, src_bit_size == instr_bit_size);
360 } else {
361 instr_bit_size = src_bit_size;
362 }
363
364 if (nir_alu_type_get_base_type(src_type) == nir_type_float) {
365 /* 8-bit float isn't a thing */
366 validate_assert(state, src_bit_size == 16 || src_bit_size == 32 ||
367 src_bit_size == 64);
368 }
369
370 validate_alu_src(instr, i, state);
371 }
372
373 nir_alu_type dest_type = nir_op_infos[instr->op].output_type;
374 unsigned dest_bit_size = nir_dest_bit_size(instr->dest.dest);
375 if (nir_alu_type_get_type_size(dest_type)) {
376 validate_assert(state, dest_bit_size == nir_alu_type_get_type_size(dest_type));
377 } else if (instr_bit_size) {
378 validate_assert(state, dest_bit_size == instr_bit_size);
379 } else {
380 /* The only unsized thing is the destination so it's vacuously valid */
381 }
382
383 if (nir_alu_type_get_base_type(dest_type) == nir_type_float) {
384 /* 8-bit float isn't a thing */
385 validate_assert(state, dest_bit_size == 16 || dest_bit_size == 32 ||
386 dest_bit_size == 64);
387 }
388
389 validate_alu_dest(instr, state);
390 }
391
392 static void
393 validate_var_use(nir_variable *var, validate_state *state)
394 {
395 struct hash_entry *entry = _mesa_hash_table_search(state->var_defs, var);
396 validate_assert(state, entry);
397 if (entry && var->data.mode == nir_var_function_temp)
398 validate_assert(state, (nir_function_impl *) entry->data == state->impl);
399 }
400
401 static void
402 validate_deref_instr(nir_deref_instr *instr, validate_state *state)
403 {
404 if (instr->deref_type == nir_deref_type_var) {
405 /* Variable dereferences are stupid simple. */
406 validate_assert(state, instr->mode == instr->var->data.mode);
407 validate_assert(state, instr->type == instr->var->type);
408 validate_var_use(instr->var, state);
409 } else if (instr->deref_type == nir_deref_type_cast) {
410 /* For cast, we simply have to trust the instruction. It's up to
411 * lowering passes and front/back-ends to make them sane.
412 */
413 validate_src(&instr->parent, state, 0, 0);
414
415 /* We just validate that the type and mode are there */
416 validate_assert(state, instr->mode);
417 validate_assert(state, instr->type);
418 } else {
419 /* We require the parent to be SSA. This may be lifted in the future */
420 validate_assert(state, instr->parent.is_ssa);
421
422 /* The parent pointer value must have the same number of components
423 * as the destination.
424 */
425 validate_src(&instr->parent, state, nir_dest_bit_size(instr->dest),
426 nir_dest_num_components(instr->dest));
427
428 nir_instr *parent_instr = instr->parent.ssa->parent_instr;
429
430 /* The parent must come from another deref instruction */
431 validate_assert(state, parent_instr->type == nir_instr_type_deref);
432
433 nir_deref_instr *parent = nir_instr_as_deref(parent_instr);
434
435 validate_assert(state, instr->mode == parent->mode);
436
437 switch (instr->deref_type) {
438 case nir_deref_type_struct:
439 validate_assert(state, glsl_type_is_struct_or_ifc(parent->type));
440 validate_assert(state,
441 instr->strct.index < glsl_get_length(parent->type));
442 validate_assert(state, instr->type ==
443 glsl_get_struct_field(parent->type, instr->strct.index));
444 break;
445
446 case nir_deref_type_array:
447 case nir_deref_type_array_wildcard:
448 if (instr->mode == nir_var_mem_ubo ||
449 instr->mode == nir_var_mem_ssbo ||
450 instr->mode == nir_var_mem_shared ||
451 instr->mode == nir_var_mem_global) {
452 /* Shared variables and UBO/SSBOs have a bit more relaxed rules
453 * because we need to be able to handle array derefs on vectors.
454 * Fortunately, nir_lower_io handles these just fine.
455 */
456 validate_assert(state, glsl_type_is_array(parent->type) ||
457 glsl_type_is_matrix(parent->type) ||
458 glsl_type_is_vector(parent->type));
459 } else {
460 /* Most of NIR cannot handle array derefs on vectors */
461 validate_assert(state, glsl_type_is_array(parent->type) ||
462 glsl_type_is_matrix(parent->type));
463 }
464 validate_assert(state,
465 instr->type == glsl_get_array_element(parent->type));
466
467 if (instr->deref_type == nir_deref_type_array) {
468 validate_src(&instr->arr.index, state,
469 nir_dest_bit_size(instr->dest), 1);
470 }
471 break;
472
473 case nir_deref_type_ptr_as_array:
474 /* ptr_as_array derefs must have a parent that is either an array,
475 * ptr_as_array, or cast. If the parent is a cast, we get the stride
476 * information (if any) from the cast deref.
477 */
478 validate_assert(state,
479 parent->deref_type == nir_deref_type_array ||
480 parent->deref_type == nir_deref_type_ptr_as_array ||
481 parent->deref_type == nir_deref_type_cast);
482 validate_src(&instr->arr.index, state,
483 nir_dest_bit_size(instr->dest), 1);
484 break;
485
486 default:
487 unreachable("Invalid deref instruction type");
488 }
489 }
490
491 /* We intentionally don't validate the size of the destination because we
492 * want to let other compiler components such as SPIR-V decide how big
493 * pointers should be.
494 */
495 validate_dest(&instr->dest, state, 0, 0);
496
497 /* Deref instructions as if conditions don't make sense because if
498 * conditions expect well-formed Booleans. If you want to compare with
499 * NULL, an explicit comparison operation should be used.
500 */
501 validate_assert(state, list_empty(&instr->dest.ssa.if_uses));
502 }
503
504 static void
505 validate_intrinsic_instr(nir_intrinsic_instr *instr, validate_state *state)
506 {
507 unsigned dest_bit_size = 0;
508 unsigned src_bit_sizes[NIR_INTRINSIC_MAX_INPUTS] = { 0, };
509 switch (instr->intrinsic) {
510 case nir_intrinsic_load_param: {
511 unsigned param_idx = nir_intrinsic_param_idx(instr);
512 validate_assert(state, param_idx < state->impl->function->num_params);
513 nir_parameter *param = &state->impl->function->params[param_idx];
514 validate_assert(state, instr->num_components == param->num_components);
515 dest_bit_size = param->bit_size;
516 break;
517 }
518
519 case nir_intrinsic_load_deref: {
520 nir_deref_instr *src = nir_src_as_deref(instr->src[0]);
521 validate_assert(state, glsl_type_is_vector_or_scalar(src->type) ||
522 (src->mode == nir_var_uniform &&
523 glsl_get_base_type(src->type) == GLSL_TYPE_SUBROUTINE));
524 validate_assert(state, instr->num_components ==
525 glsl_get_vector_elements(src->type));
526 dest_bit_size = glsl_get_bit_size(src->type);
527 /* Also allow 32-bit boolean load operations */
528 if (glsl_type_is_boolean(src->type))
529 dest_bit_size |= 32;
530 break;
531 }
532
533 case nir_intrinsic_store_deref: {
534 nir_deref_instr *dst = nir_src_as_deref(instr->src[0]);
535 validate_assert(state, glsl_type_is_vector_or_scalar(dst->type));
536 validate_assert(state, instr->num_components ==
537 glsl_get_vector_elements(dst->type));
538 src_bit_sizes[1] = glsl_get_bit_size(dst->type);
539 /* Also allow 32-bit boolean store operations */
540 if (glsl_type_is_boolean(dst->type))
541 src_bit_sizes[1] |= 32;
542 validate_assert(state, (dst->mode & (nir_var_shader_in |
543 nir_var_uniform)) == 0);
544 validate_assert(state, (nir_intrinsic_write_mask(instr) & ~((1 << instr->num_components) - 1)) == 0);
545 break;
546 }
547
548 case nir_intrinsic_copy_deref: {
549 nir_deref_instr *dst = nir_src_as_deref(instr->src[0]);
550 nir_deref_instr *src = nir_src_as_deref(instr->src[1]);
551 validate_assert(state, glsl_get_bare_type(dst->type) ==
552 glsl_get_bare_type(src->type));
553 validate_assert(state, (dst->mode & (nir_var_shader_in |
554 nir_var_uniform)) == 0);
555 break;
556 }
557
558 default:
559 break;
560 }
561
562 unsigned num_srcs = nir_intrinsic_infos[instr->intrinsic].num_srcs;
563 for (unsigned i = 0; i < num_srcs; i++) {
564 unsigned components_read = nir_intrinsic_src_components(instr, i);
565
566 validate_assert(state, components_read > 0);
567
568 validate_src(&instr->src[i], state, src_bit_sizes[i], components_read);
569 }
570
571 if (nir_intrinsic_infos[instr->intrinsic].has_dest) {
572 unsigned components_written = nir_intrinsic_dest_components(instr);
573 unsigned bit_sizes = nir_intrinsic_infos[instr->intrinsic].dest_bit_sizes;
574
575 validate_assert(state, components_written > 0);
576
577 if (dest_bit_size && bit_sizes)
578 validate_assert(state, dest_bit_size & bit_sizes);
579 else
580 dest_bit_size = dest_bit_size ? dest_bit_size : bit_sizes;
581
582 validate_dest(&instr->dest, state, dest_bit_size, components_written);
583 }
584 }
585
586 static void
587 validate_tex_instr(nir_tex_instr *instr, validate_state *state)
588 {
589 bool src_type_seen[nir_num_tex_src_types];
590 for (unsigned i = 0; i < nir_num_tex_src_types; i++)
591 src_type_seen[i] = false;
592
593 for (unsigned i = 0; i < instr->num_srcs; i++) {
594 validate_assert(state, !src_type_seen[instr->src[i].src_type]);
595 src_type_seen[instr->src[i].src_type] = true;
596 validate_src(&instr->src[i].src, state,
597 0, nir_tex_instr_src_size(instr, i));
598
599 switch (instr->src[i].src_type) {
600 case nir_tex_src_texture_deref:
601 case nir_tex_src_sampler_deref:
602 validate_assert(state, instr->src[i].src.is_ssa);
603 validate_assert(state,
604 instr->src[i].src.ssa->parent_instr->type == nir_instr_type_deref);
605 break;
606 default:
607 break;
608 }
609 }
610
611 if (nir_tex_instr_has_explicit_tg4_offsets(instr)) {
612 validate_assert(state, instr->op == nir_texop_tg4);
613 validate_assert(state, !src_type_seen[nir_tex_src_offset]);
614 }
615
616 validate_dest(&instr->dest, state, 0, nir_tex_instr_dest_size(instr));
617 }
618
619 static void
620 validate_call_instr(nir_call_instr *instr, validate_state *state)
621 {
622 validate_assert(state, instr->num_params == instr->callee->num_params);
623
624 for (unsigned i = 0; i < instr->num_params; i++) {
625 validate_src(&instr->params[i], state,
626 instr->callee->params[i].bit_size,
627 instr->callee->params[i].num_components);
628 }
629 }
630
631 static void
632 validate_const_value(nir_const_value *val, unsigned bit_size,
633 validate_state *state)
634 {
635 /* In order for block copies to work properly for things like instruction
636 * comparisons and [de]serialization, we require the unused bits of the
637 * nir_const_value to be zero.
638 */
639 nir_const_value cmp_val;
640 memset(&cmp_val, 0, sizeof(cmp_val));
641 switch (bit_size) {
642 case 1:
643 cmp_val.b = val->b;
644 break;
645 case 8:
646 cmp_val.u8 = val->u8;
647 break;
648 case 16:
649 cmp_val.u16 = val->u16;
650 break;
651 case 32:
652 cmp_val.u32 = val->u32;
653 break;
654 case 64:
655 cmp_val.u64 = val->u64;
656 break;
657 default:
658 validate_assert(state, !"Invalid load_const bit size");
659 }
660 validate_assert(state, memcmp(val, &cmp_val, sizeof(cmp_val)) == 0);
661 }
662
663 static void
664 validate_load_const_instr(nir_load_const_instr *instr, validate_state *state)
665 {
666 validate_ssa_def(&instr->def, state);
667
668 for (unsigned i = 0; i < instr->def.num_components; i++)
669 validate_const_value(&instr->value[i], instr->def.bit_size, state);
670 }
671
672 static void
673 validate_ssa_undef_instr(nir_ssa_undef_instr *instr, validate_state *state)
674 {
675 validate_ssa_def(&instr->def, state);
676 }
677
678 static void
679 validate_phi_instr(nir_phi_instr *instr, validate_state *state)
680 {
681 /*
682 * don't validate the sources until we get to them from their predecessor
683 * basic blocks, to avoid validating an SSA use before its definition.
684 */
685
686 validate_dest(&instr->dest, state, 0, 0);
687
688 exec_list_validate(&instr->srcs);
689 validate_assert(state, exec_list_length(&instr->srcs) ==
690 state->block->predecessors->entries);
691 }
692
693 static void
694 validate_instr(nir_instr *instr, validate_state *state)
695 {
696 validate_assert(state, instr->block == state->block);
697
698 state->instr = instr;
699
700 switch (instr->type) {
701 case nir_instr_type_alu:
702 validate_alu_instr(nir_instr_as_alu(instr), state);
703 break;
704
705 case nir_instr_type_deref:
706 validate_deref_instr(nir_instr_as_deref(instr), state);
707 break;
708
709 case nir_instr_type_call:
710 validate_call_instr(nir_instr_as_call(instr), state);
711 break;
712
713 case nir_instr_type_intrinsic:
714 validate_intrinsic_instr(nir_instr_as_intrinsic(instr), state);
715 break;
716
717 case nir_instr_type_tex:
718 validate_tex_instr(nir_instr_as_tex(instr), state);
719 break;
720
721 case nir_instr_type_load_const:
722 validate_load_const_instr(nir_instr_as_load_const(instr), state);
723 break;
724
725 case nir_instr_type_phi:
726 validate_phi_instr(nir_instr_as_phi(instr), state);
727 break;
728
729 case nir_instr_type_ssa_undef:
730 validate_ssa_undef_instr(nir_instr_as_ssa_undef(instr), state);
731 break;
732
733 case nir_instr_type_jump:
734 break;
735
736 default:
737 validate_assert(state, !"Invalid ALU instruction type");
738 break;
739 }
740
741 state->instr = NULL;
742 }
743
744 static void
745 validate_phi_src(nir_phi_instr *instr, nir_block *pred, validate_state *state)
746 {
747 state->instr = &instr->instr;
748
749 validate_assert(state, instr->dest.is_ssa);
750
751 exec_list_validate(&instr->srcs);
752 nir_foreach_phi_src(src, instr) {
753 if (src->pred == pred) {
754 validate_assert(state, src->src.is_ssa);
755 validate_src(&src->src, state, instr->dest.ssa.bit_size,
756 instr->dest.ssa.num_components);
757 state->instr = NULL;
758 return;
759 }
760 }
761
762 abort();
763 }
764
765 static void
766 validate_phi_srcs(nir_block *block, nir_block *succ, validate_state *state)
767 {
768 nir_foreach_instr(instr, succ) {
769 if (instr->type != nir_instr_type_phi)
770 break;
771
772 validate_phi_src(nir_instr_as_phi(instr), block, state);
773 }
774 }
775
776 static void validate_cf_node(nir_cf_node *node, validate_state *state);
777
778 static void
779 validate_block(nir_block *block, validate_state *state)
780 {
781 validate_assert(state, block->cf_node.parent == state->parent_node);
782
783 state->block = block;
784
785 exec_list_validate(&block->instr_list);
786 nir_foreach_instr(instr, block) {
787 if (instr->type == nir_instr_type_phi) {
788 validate_assert(state, instr == nir_block_first_instr(block) ||
789 nir_instr_prev(instr)->type == nir_instr_type_phi);
790 }
791
792 if (instr->type == nir_instr_type_jump) {
793 validate_assert(state, instr == nir_block_last_instr(block));
794 }
795
796 validate_instr(instr, state);
797 }
798
799 validate_assert(state, block->successors[0] != NULL);
800 validate_assert(state, block->successors[0] != block->successors[1]);
801
802 for (unsigned i = 0; i < 2; i++) {
803 if (block->successors[i] != NULL) {
804 struct set_entry *entry =
805 _mesa_set_search(block->successors[i]->predecessors, block);
806 validate_assert(state, entry);
807
808 validate_phi_srcs(block, block->successors[i], state);
809 }
810 }
811
812 set_foreach(block->predecessors, entry) {
813 const nir_block *pred = entry->key;
814 validate_assert(state, pred->successors[0] == block ||
815 pred->successors[1] == block);
816 }
817
818 if (!exec_list_is_empty(&block->instr_list) &&
819 nir_block_last_instr(block)->type == nir_instr_type_jump) {
820 validate_assert(state, block->successors[1] == NULL);
821 nir_jump_instr *jump = nir_instr_as_jump(nir_block_last_instr(block));
822 switch (jump->type) {
823 case nir_jump_break: {
824 nir_block *after =
825 nir_cf_node_as_block(nir_cf_node_next(&state->loop->cf_node));
826 validate_assert(state, block->successors[0] == after);
827 break;
828 }
829
830 case nir_jump_continue: {
831 nir_block *first = nir_loop_first_block(state->loop);
832 validate_assert(state, block->successors[0] == first);
833 break;
834 }
835
836 case nir_jump_return:
837 validate_assert(state, block->successors[0] == state->impl->end_block);
838 break;
839
840 default:
841 unreachable("bad jump type");
842 }
843 } else {
844 nir_cf_node *next = nir_cf_node_next(&block->cf_node);
845 if (next == NULL) {
846 switch (state->parent_node->type) {
847 case nir_cf_node_loop: {
848 nir_block *first = nir_loop_first_block(state->loop);
849 validate_assert(state, block->successors[0] == first);
850 /* due to the hack for infinite loops, block->successors[1] may
851 * point to the block after the loop.
852 */
853 break;
854 }
855
856 case nir_cf_node_if: {
857 nir_block *after =
858 nir_cf_node_as_block(nir_cf_node_next(state->parent_node));
859 validate_assert(state, block->successors[0] == after);
860 validate_assert(state, block->successors[1] == NULL);
861 break;
862 }
863
864 case nir_cf_node_function:
865 validate_assert(state, block->successors[0] == state->impl->end_block);
866 validate_assert(state, block->successors[1] == NULL);
867 break;
868
869 default:
870 unreachable("unknown control flow node type");
871 }
872 } else {
873 if (next->type == nir_cf_node_if) {
874 nir_if *if_stmt = nir_cf_node_as_if(next);
875 validate_assert(state, block->successors[0] ==
876 nir_if_first_then_block(if_stmt));
877 validate_assert(state, block->successors[1] ==
878 nir_if_first_else_block(if_stmt));
879 } else {
880 validate_assert(state, next->type == nir_cf_node_loop);
881 nir_loop *loop = nir_cf_node_as_loop(next);
882 validate_assert(state, block->successors[0] ==
883 nir_loop_first_block(loop));
884 validate_assert(state, block->successors[1] == NULL);
885 }
886 }
887 }
888 }
889
890 static void
891 validate_if(nir_if *if_stmt, validate_state *state)
892 {
893 state->if_stmt = if_stmt;
894
895 validate_assert(state, !exec_node_is_head_sentinel(if_stmt->cf_node.node.prev));
896 nir_cf_node *prev_node = nir_cf_node_prev(&if_stmt->cf_node);
897 validate_assert(state, prev_node->type == nir_cf_node_block);
898
899 validate_assert(state, !exec_node_is_tail_sentinel(if_stmt->cf_node.node.next));
900 nir_cf_node *next_node = nir_cf_node_next(&if_stmt->cf_node);
901 validate_assert(state, next_node->type == nir_cf_node_block);
902
903 validate_src(&if_stmt->condition, state, 0, 1);
904
905 validate_assert(state, !exec_list_is_empty(&if_stmt->then_list));
906 validate_assert(state, !exec_list_is_empty(&if_stmt->else_list));
907
908 nir_cf_node *old_parent = state->parent_node;
909 state->parent_node = &if_stmt->cf_node;
910
911 exec_list_validate(&if_stmt->then_list);
912 foreach_list_typed(nir_cf_node, cf_node, node, &if_stmt->then_list) {
913 validate_cf_node(cf_node, state);
914 }
915
916 exec_list_validate(&if_stmt->else_list);
917 foreach_list_typed(nir_cf_node, cf_node, node, &if_stmt->else_list) {
918 validate_cf_node(cf_node, state);
919 }
920
921 state->parent_node = old_parent;
922 state->if_stmt = NULL;
923 }
924
925 static void
926 validate_loop(nir_loop *loop, validate_state *state)
927 {
928 validate_assert(state, !exec_node_is_head_sentinel(loop->cf_node.node.prev));
929 nir_cf_node *prev_node = nir_cf_node_prev(&loop->cf_node);
930 validate_assert(state, prev_node->type == nir_cf_node_block);
931
932 validate_assert(state, !exec_node_is_tail_sentinel(loop->cf_node.node.next));
933 nir_cf_node *next_node = nir_cf_node_next(&loop->cf_node);
934 validate_assert(state, next_node->type == nir_cf_node_block);
935
936 validate_assert(state, !exec_list_is_empty(&loop->body));
937
938 nir_cf_node *old_parent = state->parent_node;
939 state->parent_node = &loop->cf_node;
940 nir_loop *old_loop = state->loop;
941 state->loop = loop;
942
943 exec_list_validate(&loop->body);
944 foreach_list_typed(nir_cf_node, cf_node, node, &loop->body) {
945 validate_cf_node(cf_node, state);
946 }
947
948 state->parent_node = old_parent;
949 state->loop = old_loop;
950 }
951
952 static void
953 validate_cf_node(nir_cf_node *node, validate_state *state)
954 {
955 validate_assert(state, node->parent == state->parent_node);
956
957 switch (node->type) {
958 case nir_cf_node_block:
959 validate_block(nir_cf_node_as_block(node), state);
960 break;
961
962 case nir_cf_node_if:
963 validate_if(nir_cf_node_as_if(node), state);
964 break;
965
966 case nir_cf_node_loop:
967 validate_loop(nir_cf_node_as_loop(node), state);
968 break;
969
970 default:
971 unreachable("Invalid CF node type");
972 }
973 }
974
975 static void
976 prevalidate_reg_decl(nir_register *reg, validate_state *state)
977 {
978 validate_assert(state, reg->index < state->impl->reg_alloc);
979 validate_assert(state, !BITSET_TEST(state->regs_found, reg->index));
980 BITSET_SET(state->regs_found, reg->index);
981
982 list_validate(&reg->uses);
983 list_validate(&reg->defs);
984 list_validate(&reg->if_uses);
985
986 reg_validate_state *reg_state = ralloc(state->regs, reg_validate_state);
987 reg_state->uses = _mesa_pointer_set_create(reg_state);
988 reg_state->if_uses = _mesa_pointer_set_create(reg_state);
989 reg_state->defs = _mesa_pointer_set_create(reg_state);
990
991 reg_state->where_defined = state->impl;
992
993 _mesa_hash_table_insert(state->regs, reg, reg_state);
994 }
995
996 static void
997 postvalidate_reg_decl(nir_register *reg, validate_state *state)
998 {
999 struct hash_entry *entry = _mesa_hash_table_search(state->regs, reg);
1000
1001 assume(entry);
1002 reg_validate_state *reg_state = (reg_validate_state *) entry->data;
1003
1004 nir_foreach_use(src, reg) {
1005 struct set_entry *entry = _mesa_set_search(reg_state->uses, src);
1006 validate_assert(state, entry);
1007 _mesa_set_remove(reg_state->uses, entry);
1008 }
1009
1010 if (reg_state->uses->entries != 0) {
1011 printf("extra entries in register uses:\n");
1012 set_foreach(reg_state->uses, entry)
1013 printf("%p\n", entry->key);
1014
1015 abort();
1016 }
1017
1018 nir_foreach_if_use(src, reg) {
1019 struct set_entry *entry = _mesa_set_search(reg_state->if_uses, src);
1020 validate_assert(state, entry);
1021 _mesa_set_remove(reg_state->if_uses, entry);
1022 }
1023
1024 if (reg_state->if_uses->entries != 0) {
1025 printf("extra entries in register if_uses:\n");
1026 set_foreach(reg_state->if_uses, entry)
1027 printf("%p\n", entry->key);
1028
1029 abort();
1030 }
1031
1032 nir_foreach_def(src, reg) {
1033 struct set_entry *entry = _mesa_set_search(reg_state->defs, src);
1034 validate_assert(state, entry);
1035 _mesa_set_remove(reg_state->defs, entry);
1036 }
1037
1038 if (reg_state->defs->entries != 0) {
1039 printf("extra entries in register defs:\n");
1040 set_foreach(reg_state->defs, entry)
1041 printf("%p\n", entry->key);
1042
1043 abort();
1044 }
1045 }
1046
1047 static void
1048 validate_var_decl(nir_variable *var, bool is_global, validate_state *state)
1049 {
1050 state->var = var;
1051
1052 validate_assert(state, is_global == nir_variable_is_global(var));
1053
1054 /* Must have exactly one mode set */
1055 validate_assert(state, util_is_power_of_two_nonzero(var->data.mode));
1056
1057 if (var->data.compact) {
1058 /* The "compact" flag is only valid on arrays of scalars. */
1059 assert(glsl_type_is_array(var->type));
1060
1061 const struct glsl_type *type = glsl_get_array_element(var->type);
1062 if (nir_is_per_vertex_io(var, state->shader->info.stage)) {
1063 assert(glsl_type_is_array(type));
1064 assert(glsl_type_is_scalar(glsl_get_array_element(type)));
1065 } else {
1066 assert(glsl_type_is_scalar(type));
1067 }
1068 }
1069
1070 if (var->num_members > 0) {
1071 const struct glsl_type *without_array = glsl_without_array(var->type);
1072 validate_assert(state, glsl_type_is_struct_or_ifc(without_array));
1073 validate_assert(state, var->num_members == glsl_get_length(without_array));
1074 validate_assert(state, var->members != NULL);
1075 }
1076
1077 /*
1078 * TODO validate some things ir_validate.cpp does (requires more GLSL type
1079 * support)
1080 */
1081
1082 _mesa_hash_table_insert(state->var_defs, var,
1083 is_global ? NULL : state->impl);
1084
1085 state->var = NULL;
1086 }
1087
1088 static void
1089 validate_function_impl(nir_function_impl *impl, validate_state *state)
1090 {
1091 /* Resize the ssa_srcs set. It's likely that the size of this set will
1092 * never actually hit the number of SSA defs because we remove sources from
1093 * the set as we visit them. (It could actually be much larger because
1094 * each SSA def can be used more than once.) However, growing it now costs
1095 * us very little (the extra memory is already dwarfed by the SSA defs
1096 * themselves) and makes collisions much less likely.
1097 */
1098 _mesa_set_resize(state->ssa_srcs, impl->ssa_alloc);
1099
1100 validate_assert(state, impl->function->impl == impl);
1101 validate_assert(state, impl->cf_node.parent == NULL);
1102
1103 validate_assert(state, exec_list_is_empty(&impl->end_block->instr_list));
1104 validate_assert(state, impl->end_block->successors[0] == NULL);
1105 validate_assert(state, impl->end_block->successors[1] == NULL);
1106
1107 state->impl = impl;
1108 state->parent_node = &impl->cf_node;
1109
1110 exec_list_validate(&impl->locals);
1111 nir_foreach_variable(var, &impl->locals) {
1112 validate_var_decl(var, false, state);
1113 }
1114
1115 state->regs_found = reralloc(state->mem_ctx, state->regs_found,
1116 BITSET_WORD, BITSET_WORDS(impl->reg_alloc));
1117 memset(state->regs_found, 0, BITSET_WORDS(impl->reg_alloc) *
1118 sizeof(BITSET_WORD));
1119 exec_list_validate(&impl->registers);
1120 foreach_list_typed(nir_register, reg, node, &impl->registers) {
1121 prevalidate_reg_decl(reg, state);
1122 }
1123
1124 state->ssa_defs_found = reralloc(state->mem_ctx, state->ssa_defs_found,
1125 BITSET_WORD, BITSET_WORDS(impl->ssa_alloc));
1126 memset(state->ssa_defs_found, 0, BITSET_WORDS(impl->ssa_alloc) *
1127 sizeof(BITSET_WORD));
1128 exec_list_validate(&impl->body);
1129 foreach_list_typed(nir_cf_node, node, node, &impl->body) {
1130 validate_cf_node(node, state);
1131 }
1132
1133 foreach_list_typed(nir_register, reg, node, &impl->registers) {
1134 postvalidate_reg_decl(reg, state);
1135 }
1136
1137 if (state->ssa_srcs->entries != 0) {
1138 printf("extra dangling SSA sources:\n");
1139 set_foreach(state->ssa_srcs, entry)
1140 printf("%p\n", entry->key);
1141
1142 abort();
1143 }
1144 }
1145
1146 static void
1147 validate_function(nir_function *func, validate_state *state)
1148 {
1149 if (func->impl != NULL) {
1150 validate_assert(state, func->impl->function == func);
1151 validate_function_impl(func->impl, state);
1152 }
1153 }
1154
1155 static void
1156 init_validate_state(validate_state *state)
1157 {
1158 state->mem_ctx = ralloc_context(NULL);
1159 state->regs = _mesa_pointer_hash_table_create(state->mem_ctx);
1160 state->ssa_srcs = _mesa_pointer_set_create(state->mem_ctx);
1161 state->ssa_defs_found = NULL;
1162 state->regs_found = NULL;
1163 state->var_defs = _mesa_pointer_hash_table_create(state->mem_ctx);
1164 state->errors = _mesa_pointer_hash_table_create(state->mem_ctx);
1165
1166 state->loop = NULL;
1167 state->instr = NULL;
1168 state->var = NULL;
1169 }
1170
1171 static void
1172 destroy_validate_state(validate_state *state)
1173 {
1174 ralloc_free(state->mem_ctx);
1175 }
1176
1177 mtx_t fail_dump_mutex = _MTX_INITIALIZER_NP;
1178
1179 static void
1180 dump_errors(validate_state *state, const char *when)
1181 {
1182 struct hash_table *errors = state->errors;
1183
1184 /* Lock around dumping so that we get clean dumps in a multi-threaded
1185 * scenario
1186 */
1187 mtx_lock(&fail_dump_mutex);
1188
1189 if (when) {
1190 fprintf(stderr, "NIR validation failed %s\n", when);
1191 fprintf(stderr, "%d errors:\n", _mesa_hash_table_num_entries(errors));
1192 } else {
1193 fprintf(stderr, "NIR validation failed with %d errors:\n",
1194 _mesa_hash_table_num_entries(errors));
1195 }
1196
1197 nir_print_shader_annotated(state->shader, stderr, errors);
1198
1199 if (_mesa_hash_table_num_entries(errors) > 0) {
1200 fprintf(stderr, "%d additional errors:\n",
1201 _mesa_hash_table_num_entries(errors));
1202 hash_table_foreach(errors, entry) {
1203 fprintf(stderr, "%s\n", (char *)entry->data);
1204 }
1205 }
1206
1207 mtx_unlock(&fail_dump_mutex);
1208
1209 abort();
1210 }
1211
1212 void
1213 nir_validate_shader(nir_shader *shader, const char *when)
1214 {
1215 static int should_validate = -1;
1216 if (should_validate < 0)
1217 should_validate = env_var_as_boolean("NIR_VALIDATE", true);
1218 if (!should_validate)
1219 return;
1220
1221 validate_state state;
1222 init_validate_state(&state);
1223
1224 state.shader = shader;
1225
1226 exec_list_validate(&shader->uniforms);
1227 nir_foreach_variable(var, &shader->uniforms) {
1228 validate_var_decl(var, true, &state);
1229 }
1230
1231 exec_list_validate(&shader->inputs);
1232 nir_foreach_variable(var, &shader->inputs) {
1233 validate_var_decl(var, true, &state);
1234 }
1235
1236 exec_list_validate(&shader->outputs);
1237 nir_foreach_variable(var, &shader->outputs) {
1238 validate_var_decl(var, true, &state);
1239 }
1240
1241 exec_list_validate(&shader->shared);
1242 nir_foreach_variable(var, &shader->shared) {
1243 validate_var_decl(var, true, &state);
1244 }
1245
1246 exec_list_validate(&shader->globals);
1247 nir_foreach_variable(var, &shader->globals) {
1248 validate_var_decl(var, true, &state);
1249 }
1250
1251 exec_list_validate(&shader->system_values);
1252 nir_foreach_variable(var, &shader->system_values) {
1253 validate_var_decl(var, true, &state);
1254 }
1255
1256 exec_list_validate(&shader->functions);
1257 foreach_list_typed(nir_function, func, node, &shader->functions) {
1258 validate_function(func, &state);
1259 }
1260
1261 if (_mesa_hash_table_num_entries(state.errors) > 0)
1262 dump_errors(&state, when);
1263
1264 destroy_validate_state(&state);
1265 }
1266
1267 #endif /* NDEBUG */