2 * Copyright © 2014 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
24 * Connor Abbott (cwabbott0@gmail.com)
29 #include "compiler/shader_enums.h"
30 #include "util/half_float.h"
33 #include <inttypes.h> /* for PRIx64 macro */
36 print_tabs(unsigned num_tabs
, FILE *fp
)
38 for (unsigned i
= 0; i
< num_tabs
; i
++)
45 /** map from nir_variable -> printable name */
46 struct hash_table
*ht
;
48 /** set of names used so far for nir_variables */
51 /* an index used to make new non-conflicting names */
55 * Optional table of annotations mapping nir object
56 * (such as instr or var) to message to print.
58 struct hash_table
*annotations
;
62 print_annotation(print_state
*state
, void *obj
)
64 if (!state
->annotations
)
67 struct hash_entry
*entry
= _mesa_hash_table_search(state
->annotations
, obj
);
71 const char *note
= entry
->data
;
72 _mesa_hash_table_remove(state
->annotations
, entry
);
74 fprintf(stderr
, "%s\n\n", note
);
78 print_register(nir_register
*reg
, print_state
*state
)
81 if (reg
->name
!= NULL
)
82 fprintf(fp
, "/* %s */ ", reg
->name
);
84 fprintf(fp
, "gr%u", reg
->index
);
86 fprintf(fp
, "r%u", reg
->index
);
89 static const char *sizes
[] = { "error", "vec1", "vec2", "vec3", "vec4",
90 "error", "error", "error", "vec8",
91 "error", "error", "error", "error",
92 "error", "error", "error", "vec16"};
95 print_register_decl(nir_register
*reg
, print_state
*state
)
98 fprintf(fp
, "decl_reg %s %u ", sizes
[reg
->num_components
], reg
->bit_size
);
100 fprintf(fp
, "(packed) ");
101 print_register(reg
, state
);
102 if (reg
->num_array_elems
!= 0)
103 fprintf(fp
, "[%u]", reg
->num_array_elems
);
108 print_ssa_def(nir_ssa_def
*def
, print_state
*state
)
110 FILE *fp
= state
->fp
;
111 if (def
->name
!= NULL
)
112 fprintf(fp
, "/* %s */ ", def
->name
);
113 fprintf(fp
, "%s %u ssa_%u", sizes
[def
->num_components
], def
->bit_size
,
118 print_ssa_use(nir_ssa_def
*def
, print_state
*state
)
120 FILE *fp
= state
->fp
;
121 if (def
->name
!= NULL
)
122 fprintf(fp
, "/* %s */ ", def
->name
);
123 fprintf(fp
, "ssa_%u", def
->index
);
126 static void print_src(nir_src
*src
, print_state
*state
);
129 print_reg_src(nir_reg_src
*src
, print_state
*state
)
131 FILE *fp
= state
->fp
;
132 print_register(src
->reg
, state
);
133 if (src
->reg
->num_array_elems
!= 0) {
134 fprintf(fp
, "[%u", src
->base_offset
);
135 if (src
->indirect
!= NULL
) {
137 print_src(src
->indirect
, state
);
144 print_reg_dest(nir_reg_dest
*dest
, print_state
*state
)
146 FILE *fp
= state
->fp
;
147 print_register(dest
->reg
, state
);
148 if (dest
->reg
->num_array_elems
!= 0) {
149 fprintf(fp
, "[%u", dest
->base_offset
);
150 if (dest
->indirect
!= NULL
) {
152 print_src(dest
->indirect
, state
);
159 print_src(nir_src
*src
, print_state
*state
)
162 print_ssa_use(src
->ssa
, state
);
164 print_reg_src(&src
->reg
, state
);
168 print_dest(nir_dest
*dest
, print_state
*state
)
171 print_ssa_def(&dest
->ssa
, state
);
173 print_reg_dest(&dest
->reg
, state
);
177 print_alu_src(nir_alu_instr
*instr
, unsigned src
, print_state
*state
)
179 FILE *fp
= state
->fp
;
181 if (instr
->src
[src
].negate
)
183 if (instr
->src
[src
].abs
)
186 print_src(&instr
->src
[src
].src
, state
);
188 bool print_swizzle
= false;
189 nir_component_mask_t used_channels
= 0;
191 for (unsigned i
= 0; i
< NIR_MAX_VEC_COMPONENTS
; i
++) {
192 if (!nir_alu_instr_channel_used(instr
, src
, i
))
197 if (instr
->src
[src
].swizzle
[i
] != i
) {
198 print_swizzle
= true;
203 unsigned live_channels
= nir_src_num_components(instr
->src
[src
].src
);
205 if (print_swizzle
|| used_channels
!= live_channels
) {
207 for (unsigned i
= 0; i
< NIR_MAX_VEC_COMPONENTS
; i
++) {
208 if (!nir_alu_instr_channel_used(instr
, src
, i
))
211 fprintf(fp
, "%c", "xyzw"[instr
->src
[src
].swizzle
[i
]]);
215 if (instr
->src
[src
].abs
)
220 print_alu_dest(nir_alu_dest
*dest
, print_state
*state
)
222 FILE *fp
= state
->fp
;
223 /* we're going to print the saturate modifier later, after the opcode */
225 print_dest(&dest
->dest
, state
);
227 if (!dest
->dest
.is_ssa
&&
228 dest
->write_mask
!= (1 << dest
->dest
.reg
.reg
->num_components
) - 1) {
230 for (unsigned i
= 0; i
< NIR_MAX_VEC_COMPONENTS
; i
++)
231 if ((dest
->write_mask
>> i
) & 1)
232 fprintf(fp
, "%c", "xyzw"[i
]);
237 print_alu_instr(nir_alu_instr
*instr
, print_state
*state
)
239 FILE *fp
= state
->fp
;
241 print_alu_dest(&instr
->dest
, state
);
243 fprintf(fp
, " = %s", nir_op_infos
[instr
->op
].name
);
246 if (instr
->dest
.saturate
)
250 for (unsigned i
= 0; i
< nir_op_infos
[instr
->op
].num_inputs
; i
++) {
254 print_alu_src(instr
, i
, state
);
259 get_var_name(nir_variable
*var
, print_state
*state
)
261 if (state
->ht
== NULL
)
262 return var
->name
? var
->name
: "unnamed";
266 struct hash_entry
*entry
= _mesa_hash_table_search(state
->ht
, var
);
271 if (var
->name
== NULL
) {
272 name
= ralloc_asprintf(state
->syms
, "@%u", state
->index
++);
274 struct set_entry
*set_entry
= _mesa_set_search(state
->syms
, var
->name
);
275 if (set_entry
!= NULL
) {
276 /* we have a collision with another name, append an @ + a unique
278 name
= ralloc_asprintf(state
->syms
, "%s@%u", var
->name
,
281 /* Mark this one as seen */
282 _mesa_set_add(state
->syms
, var
->name
);
287 _mesa_hash_table_insert(state
->ht
, var
, name
);
293 print_constant(nir_constant
*c
, const struct glsl_type
*type
, print_state
*state
)
295 FILE *fp
= state
->fp
;
296 const unsigned rows
= glsl_get_vector_elements(type
);
297 const unsigned cols
= glsl_get_matrix_columns(type
);
300 switch (glsl_get_base_type(type
)) {
301 case GLSL_TYPE_UINT8
:
303 /* Only float base types can be matrices. */
306 for (i
= 0; i
< rows
; i
++) {
307 if (i
> 0) fprintf(fp
, ", ");
308 fprintf(fp
, "0x%02x", c
->values
[0].u8
[i
]);
312 case GLSL_TYPE_UINT16
:
313 case GLSL_TYPE_INT16
:
314 /* Only float base types can be matrices. */
317 for (i
= 0; i
< rows
; i
++) {
318 if (i
> 0) fprintf(fp
, ", ");
319 fprintf(fp
, "0x%04x", c
->values
[0].u16
[i
]);
326 /* Only float base types can be matrices. */
329 for (i
= 0; i
< rows
; i
++) {
330 if (i
> 0) fprintf(fp
, ", ");
331 fprintf(fp
, "0x%08x", c
->values
[0].u32
[i
]);
335 case GLSL_TYPE_FLOAT16
:
336 for (i
= 0; i
< cols
; i
++) {
337 for (j
= 0; j
< rows
; j
++) {
338 if (i
+ j
> 0) fprintf(fp
, ", ");
339 fprintf(fp
, "%f", _mesa_half_to_float(c
->values
[i
].u16
[j
]));
344 case GLSL_TYPE_FLOAT
:
345 for (i
= 0; i
< cols
; i
++) {
346 for (j
= 0; j
< rows
; j
++) {
347 if (i
+ j
> 0) fprintf(fp
, ", ");
348 fprintf(fp
, "%f", c
->values
[i
].f32
[j
]);
353 case GLSL_TYPE_DOUBLE
:
354 for (i
= 0; i
< cols
; i
++) {
355 for (j
= 0; j
< rows
; j
++) {
356 if (i
+ j
> 0) fprintf(fp
, ", ");
357 fprintf(fp
, "%f", c
->values
[i
].f64
[j
]);
362 case GLSL_TYPE_UINT64
:
363 case GLSL_TYPE_INT64
:
364 /* Only float base types can be matrices. */
367 for (i
= 0; i
< cols
; i
++) {
368 if (i
> 0) fprintf(fp
, ", ");
369 fprintf(fp
, "0x%08" PRIx64
, c
->values
[0].u64
[i
]);
373 case GLSL_TYPE_STRUCT
:
374 for (i
= 0; i
< c
->num_elements
; i
++) {
375 if (i
> 0) fprintf(fp
, ", ");
377 print_constant(c
->elements
[i
], glsl_get_struct_field(type
, i
), state
);
382 case GLSL_TYPE_ARRAY
:
383 for (i
= 0; i
< c
->num_elements
; i
++) {
384 if (i
> 0) fprintf(fp
, ", ");
386 print_constant(c
->elements
[i
], glsl_get_array_element(type
), state
);
392 unreachable("not reached");
397 get_variable_mode_str(nir_variable_mode mode
, bool want_local_global_mode
)
400 case nir_var_shader_in
:
402 case nir_var_shader_out
:
404 case nir_var_uniform
:
406 case nir_var_shader_storage
:
407 return "shader_storage";
408 case nir_var_system_value
:
413 return want_local_global_mode
? "global" : "";
415 return want_local_global_mode
? "local" : "";
422 print_var_decl(nir_variable
*var
, print_state
*state
)
424 FILE *fp
= state
->fp
;
426 fprintf(fp
, "decl_var ");
428 const char *const cent
= (var
->data
.centroid
) ? "centroid " : "";
429 const char *const samp
= (var
->data
.sample
) ? "sample " : "";
430 const char *const patch
= (var
->data
.patch
) ? "patch " : "";
431 const char *const inv
= (var
->data
.invariant
) ? "invariant " : "";
432 fprintf(fp
, "%s%s%s%s%s %s ",
433 cent
, samp
, patch
, inv
, get_variable_mode_str(var
->data
.mode
, false),
434 glsl_interp_mode_name(var
->data
.interpolation
));
436 const char *const coher
= (var
->data
.image
.coherent
) ? "coherent " : "";
437 const char *const volat
= (var
->data
.image
._volatile
) ? "volatile " : "";
438 const char *const restr
= (var
->data
.image
.restrict_flag
) ? "restrict " : "";
439 const char *const ronly
= (var
->data
.image
.read_only
) ? "readonly " : "";
440 const char *const wonly
= (var
->data
.image
.write_only
) ? "writeonly " : "";
441 fprintf(fp
, "%s%s%s%s%s", coher
, volat
, restr
, ronly
, wonly
);
443 fprintf(fp
, "%s %s", glsl_get_type_name(var
->type
),
444 get_var_name(var
, state
));
446 if (var
->data
.mode
== nir_var_shader_in
||
447 var
->data
.mode
== nir_var_shader_out
||
448 var
->data
.mode
== nir_var_uniform
||
449 var
->data
.mode
== nir_var_shader_storage
) {
450 const char *loc
= NULL
;
453 switch (state
->shader
->info
.stage
) {
454 case MESA_SHADER_VERTEX
:
455 if (var
->data
.mode
== nir_var_shader_in
)
456 loc
= gl_vert_attrib_name(var
->data
.location
);
457 else if (var
->data
.mode
== nir_var_shader_out
)
458 loc
= gl_varying_slot_name(var
->data
.location
);
460 case MESA_SHADER_GEOMETRY
:
461 if ((var
->data
.mode
== nir_var_shader_in
) ||
462 (var
->data
.mode
== nir_var_shader_out
))
463 loc
= gl_varying_slot_name(var
->data
.location
);
465 case MESA_SHADER_FRAGMENT
:
466 if (var
->data
.mode
== nir_var_shader_in
)
467 loc
= gl_varying_slot_name(var
->data
.location
);
468 else if (var
->data
.mode
== nir_var_shader_out
)
469 loc
= gl_frag_result_name(var
->data
.location
);
471 case MESA_SHADER_TESS_CTRL
:
472 case MESA_SHADER_TESS_EVAL
:
473 case MESA_SHADER_COMPUTE
:
480 snprintf(buf
, sizeof(buf
), "%u", var
->data
.location
);
484 /* For shader I/O vars that have been split to components or packed,
485 * print the fractional location within the input/output.
487 unsigned int num_components
=
488 glsl_get_components(glsl_without_array(var
->type
));
489 const char *components
= NULL
;
490 char components_local
[6] = {'.' /* the rest is 0-filled */};
491 switch (var
->data
.mode
) {
492 case nir_var_shader_in
:
493 case nir_var_shader_out
:
494 if (num_components
< 4 && num_components
!= 0) {
495 const char *xyzw
= "xyzw";
496 for (int i
= 0; i
< num_components
; i
++)
497 components_local
[i
+ 1] = xyzw
[i
+ var
->data
.location_frac
];
499 components
= components_local
;
506 fprintf(fp
, " (%s%s, %u, %u)%s", loc
,
507 components
? components
: "",
508 var
->data
.driver_location
, var
->data
.binding
,
509 var
->data
.compact
? " compact" : "");
512 if (var
->constant_initializer
) {
513 fprintf(fp
, " = { ");
514 print_constant(var
->constant_initializer
, var
->type
, state
);
519 print_annotation(state
, var
);
523 print_deref_link(nir_deref_instr
*instr
, bool whole_chain
, print_state
*state
)
525 FILE *fp
= state
->fp
;
527 if (instr
->deref_type
== nir_deref_type_var
) {
528 fprintf(fp
, "%s", get_var_name(instr
->var
, state
));
530 } else if (instr
->deref_type
== nir_deref_type_cast
) {
531 fprintf(fp
, "(%s *)", glsl_get_type_name(instr
->type
));
532 print_src(&instr
->parent
, state
);
536 assert(instr
->parent
.is_ssa
);
537 nir_deref_instr
*parent
=
538 nir_instr_as_deref(instr
->parent
.ssa
->parent_instr
);
540 /* Is the parent we're going to print a bare cast? */
541 const bool is_parent_cast
=
542 whole_chain
&& parent
->deref_type
== nir_deref_type_cast
;
544 /* If we're not printing the whole chain, the parent we print will be a SSA
545 * value that represents a pointer. The only deref type that naturally
546 * gives a pointer is a cast.
548 const bool is_parent_pointer
=
549 !whole_chain
|| parent
->deref_type
== nir_deref_type_cast
;
551 /* Struct derefs have a nice syntax that works on pointers, arrays derefs
554 const bool need_deref
=
555 is_parent_pointer
&& instr
->deref_type
!= nir_deref_type_struct
;
557 /* Cast need extra parens and so * dereferences */
558 if (is_parent_cast
|| need_deref
)
565 print_deref_link(parent
, whole_chain
, state
);
567 print_src(&instr
->parent
, state
);
570 if (is_parent_cast
|| need_deref
)
573 switch (instr
->deref_type
) {
574 case nir_deref_type_struct
:
575 fprintf(fp
, "%s%s", is_parent_pointer
? "->" : ".",
576 glsl_get_struct_elem_name(parent
->type
, instr
->strct
.index
));
579 case nir_deref_type_array
: {
580 nir_const_value
*const_index
= nir_src_as_const_value(instr
->arr
.index
);
582 fprintf(fp
, "[%u]", const_index
->u32
[0]);
585 print_src(&instr
->arr
.index
, state
);
591 case nir_deref_type_array_wildcard
:
596 unreachable("Invalid deref instruction type");
601 print_deref_instr(nir_deref_instr
*instr
, print_state
*state
)
603 FILE *fp
= state
->fp
;
605 print_dest(&instr
->dest
, state
);
607 switch (instr
->deref_type
) {
608 case nir_deref_type_var
:
609 fprintf(fp
, " = deref_var ");
611 case nir_deref_type_array
:
612 case nir_deref_type_array_wildcard
:
613 fprintf(fp
, " = deref_array ");
615 case nir_deref_type_struct
:
616 fprintf(fp
, " = deref_struct ");
618 case nir_deref_type_cast
:
619 fprintf(fp
, " = deref_cast ");
622 unreachable("Invalid deref instruction type");
625 /* Only casts naturally return a pointer type */
626 if (instr
->deref_type
!= nir_deref_type_cast
)
629 print_deref_link(instr
, false, state
);
631 fprintf(fp
, " (%s %s) ",
632 get_variable_mode_str(instr
->mode
, true),
633 glsl_get_type_name(instr
->type
));
635 if (instr
->deref_type
!= nir_deref_type_var
&&
636 instr
->deref_type
!= nir_deref_type_cast
) {
637 /* Print the entire chain as a comment */
639 print_deref_link(instr
, true, state
);
645 print_intrinsic_instr(nir_intrinsic_instr
*instr
, print_state
*state
)
647 const nir_intrinsic_info
*info
= &nir_intrinsic_infos
[instr
->intrinsic
];
648 unsigned num_srcs
= info
->num_srcs
;
649 FILE *fp
= state
->fp
;
651 if (info
->has_dest
) {
652 print_dest(&instr
->dest
, state
);
656 fprintf(fp
, "intrinsic %s (", info
->name
);
658 for (unsigned i
= 0; i
< num_srcs
; i
++) {
662 print_src(&instr
->src
[i
], state
);
667 for (unsigned i
= 0; i
< info
->num_indices
; i
++) {
671 fprintf(fp
, "%d", instr
->const_index
[i
]);
676 static const char *index_name
[NIR_INTRINSIC_NUM_INDEX_FLAGS
] = {
677 [NIR_INTRINSIC_BASE
] = "base",
678 [NIR_INTRINSIC_WRMASK
] = "wrmask",
679 [NIR_INTRINSIC_STREAM_ID
] = "stream-id",
680 [NIR_INTRINSIC_UCP_ID
] = "ucp-id",
681 [NIR_INTRINSIC_RANGE
] = "range",
682 [NIR_INTRINSIC_DESC_SET
] = "desc-set",
683 [NIR_INTRINSIC_BINDING
] = "binding",
684 [NIR_INTRINSIC_COMPONENT
] = "component",
685 [NIR_INTRINSIC_INTERP_MODE
] = "interp_mode",
686 [NIR_INTRINSIC_REDUCTION_OP
] = "reduction_op",
687 [NIR_INTRINSIC_CLUSTER_SIZE
] = "cluster_size",
688 [NIR_INTRINSIC_PARAM_IDX
] = "param_idx",
690 for (unsigned idx
= 1; idx
< NIR_INTRINSIC_NUM_INDEX_FLAGS
; idx
++) {
691 if (!info
->index_map
[idx
])
694 if (idx
== NIR_INTRINSIC_WRMASK
) {
695 /* special case wrmask to show it as a writemask.. */
696 unsigned wrmask
= nir_intrinsic_write_mask(instr
);
697 fprintf(fp
, " wrmask=");
698 for (unsigned i
= 0; i
< 4; i
++)
699 if ((wrmask
>> i
) & 1)
700 fprintf(fp
, "%c", "xyzw"[i
]);
701 } else if (idx
== NIR_INTRINSIC_REDUCTION_OP
) {
702 nir_op reduction_op
= nir_intrinsic_reduction_op(instr
);
703 fprintf(fp
, " reduction_op=%s", nir_op_infos
[reduction_op
].name
);
705 unsigned off
= info
->index_map
[idx
] - 1;
706 assert(index_name
[idx
]); /* forgot to update index_name table? */
707 fprintf(fp
, " %s=%d", index_name
[idx
], instr
->const_index
[off
]);
715 struct exec_list
*var_list
= NULL
;
717 switch (instr
->intrinsic
) {
718 case nir_intrinsic_load_uniform
:
719 var_list
= &state
->shader
->uniforms
;
721 case nir_intrinsic_load_input
:
722 case nir_intrinsic_load_per_vertex_input
:
723 var_list
= &state
->shader
->inputs
;
725 case nir_intrinsic_load_output
:
726 case nir_intrinsic_store_output
:
727 case nir_intrinsic_store_per_vertex_output
:
728 var_list
= &state
->shader
->outputs
;
734 nir_foreach_variable(var
, var_list
) {
735 if ((var
->data
.driver_location
== nir_intrinsic_base(instr
)) &&
736 (instr
->intrinsic
== nir_intrinsic_load_uniform
||
737 var
->data
.location_frac
== nir_intrinsic_component(instr
)) &&
739 fprintf(fp
, "\t/* %s */", var
->name
);
746 print_tex_instr(nir_tex_instr
*instr
, print_state
*state
)
748 FILE *fp
= state
->fp
;
750 print_dest(&instr
->dest
, state
);
770 case nir_texop_txf_ms
:
771 fprintf(fp
, "txf_ms ");
773 case nir_texop_txf_ms_mcs
:
774 fprintf(fp
, "txf_ms_mcs ");
785 case nir_texop_query_levels
:
786 fprintf(fp
, "query_levels ");
788 case nir_texop_texture_samples
:
789 fprintf(fp
, "texture_samples ");
791 case nir_texop_samples_identical
:
792 fprintf(fp
, "samples_identical ");
795 unreachable("Invalid texture operation");
799 bool has_texture_deref
= false, has_sampler_deref
= false;
800 for (unsigned i
= 0; i
< instr
->num_srcs
; i
++) {
801 print_src(&instr
->src
[i
].src
, state
);
805 switch(instr
->src
[i
].src_type
) {
806 case nir_tex_src_coord
:
807 fprintf(fp
, "(coord)");
809 case nir_tex_src_projector
:
810 fprintf(fp
, "(projector)");
812 case nir_tex_src_comparator
:
813 fprintf(fp
, "(comparator)");
815 case nir_tex_src_offset
:
816 fprintf(fp
, "(offset)");
818 case nir_tex_src_bias
:
819 fprintf(fp
, "(bias)");
821 case nir_tex_src_lod
:
822 fprintf(fp
, "(lod)");
824 case nir_tex_src_ms_index
:
825 fprintf(fp
, "(ms_index)");
827 case nir_tex_src_ms_mcs
:
828 fprintf(fp
, "(ms_mcs)");
830 case nir_tex_src_ddx
:
831 fprintf(fp
, "(ddx)");
833 case nir_tex_src_ddy
:
834 fprintf(fp
, "(ddy)");
836 case nir_tex_src_texture_deref
:
837 has_texture_deref
= true;
838 fprintf(fp
, "(texture_deref)");
840 case nir_tex_src_sampler_deref
:
841 has_sampler_deref
= true;
842 fprintf(fp
, "(sampler_deref)");
844 case nir_tex_src_texture_offset
:
845 fprintf(fp
, "(texture_offset)");
847 case nir_tex_src_sampler_offset
:
848 fprintf(fp
, "(sampler_offset)");
850 case nir_tex_src_plane
:
851 fprintf(fp
, "(plane)");
855 unreachable("Invalid texture source type");
862 if (instr
->op
== nir_texop_tg4
) {
863 fprintf(fp
, "%u (gather_component), ", instr
->component
);
866 if (!has_texture_deref
) {
867 fprintf(fp
, "%u (texture), ", instr
->texture_index
);
870 if (!has_sampler_deref
) {
871 fprintf(fp
, "%u (sampler), ", instr
->sampler_index
);
876 print_call_instr(nir_call_instr
*instr
, print_state
*state
)
878 FILE *fp
= state
->fp
;
880 fprintf(fp
, "call %s ", instr
->callee
->name
);
882 for (unsigned i
= 0; i
< instr
->num_params
; i
++) {
886 print_src(&instr
->params
[i
], state
);
891 print_load_const_instr(nir_load_const_instr
*instr
, print_state
*state
)
893 FILE *fp
= state
->fp
;
895 print_ssa_def(&instr
->def
, state
);
897 fprintf(fp
, " = load_const (");
899 for (unsigned i
= 0; i
< instr
->def
.num_components
; i
++) {
904 * we don't really know the type of the constant (if it will be used as a
905 * float or an int), so just print the raw constant in hex for fidelity
906 * and then print the float in a comment for readability.
909 switch (instr
->def
.bit_size
) {
911 fprintf(fp
, "0x%16" PRIx64
" /* %f */", instr
->value
.u64
[i
],
912 instr
->value
.f64
[i
]);
915 fprintf(fp
, "0x%08x /* %f */", instr
->value
.u32
[i
], instr
->value
.f32
[i
]);
918 fprintf(fp
, "0x%04x /* %f */", instr
->value
.u16
[i
],
919 _mesa_half_to_float(instr
->value
.u16
[i
]));
922 fprintf(fp
, "0x%02x", instr
->value
.u8
[i
]);
931 print_jump_instr(nir_jump_instr
*instr
, print_state
*state
)
933 FILE *fp
= state
->fp
;
935 switch (instr
->type
) {
937 fprintf(fp
, "break");
940 case nir_jump_continue
:
941 fprintf(fp
, "continue");
944 case nir_jump_return
:
945 fprintf(fp
, "return");
951 print_ssa_undef_instr(nir_ssa_undef_instr
* instr
, print_state
*state
)
953 FILE *fp
= state
->fp
;
954 print_ssa_def(&instr
->def
, state
);
955 fprintf(fp
, " = undefined");
959 print_phi_instr(nir_phi_instr
*instr
, print_state
*state
)
961 FILE *fp
= state
->fp
;
962 print_dest(&instr
->dest
, state
);
963 fprintf(fp
, " = phi ");
964 nir_foreach_phi_src(src
, instr
) {
965 if (&src
->node
!= exec_list_get_head(&instr
->srcs
))
968 fprintf(fp
, "block_%u: ", src
->pred
->index
);
969 print_src(&src
->src
, state
);
974 print_parallel_copy_instr(nir_parallel_copy_instr
*instr
, print_state
*state
)
976 FILE *fp
= state
->fp
;
977 nir_foreach_parallel_copy_entry(entry
, instr
) {
978 if (&entry
->node
!= exec_list_get_head(&instr
->entries
))
981 print_dest(&entry
->dest
, state
);
983 print_src(&entry
->src
, state
);
988 print_instr(const nir_instr
*instr
, print_state
*state
, unsigned tabs
)
990 FILE *fp
= state
->fp
;
991 print_tabs(tabs
, fp
);
993 switch (instr
->type
) {
994 case nir_instr_type_alu
:
995 print_alu_instr(nir_instr_as_alu(instr
), state
);
998 case nir_instr_type_deref
:
999 print_deref_instr(nir_instr_as_deref(instr
), state
);
1002 case nir_instr_type_call
:
1003 print_call_instr(nir_instr_as_call(instr
), state
);
1006 case nir_instr_type_intrinsic
:
1007 print_intrinsic_instr(nir_instr_as_intrinsic(instr
), state
);
1010 case nir_instr_type_tex
:
1011 print_tex_instr(nir_instr_as_tex(instr
), state
);
1014 case nir_instr_type_load_const
:
1015 print_load_const_instr(nir_instr_as_load_const(instr
), state
);
1018 case nir_instr_type_jump
:
1019 print_jump_instr(nir_instr_as_jump(instr
), state
);
1022 case nir_instr_type_ssa_undef
:
1023 print_ssa_undef_instr(nir_instr_as_ssa_undef(instr
), state
);
1026 case nir_instr_type_phi
:
1027 print_phi_instr(nir_instr_as_phi(instr
), state
);
1030 case nir_instr_type_parallel_copy
:
1031 print_parallel_copy_instr(nir_instr_as_parallel_copy(instr
), state
);
1035 unreachable("Invalid instruction type");
1041 compare_block_index(const void *p1
, const void *p2
)
1043 const nir_block
*block1
= *((const nir_block
**) p1
);
1044 const nir_block
*block2
= *((const nir_block
**) p2
);
1046 return (int) block1
->index
- (int) block2
->index
;
1049 static void print_cf_node(nir_cf_node
*node
, print_state
*state
,
1053 print_block(nir_block
*block
, print_state
*state
, unsigned tabs
)
1055 FILE *fp
= state
->fp
;
1057 print_tabs(tabs
, fp
);
1058 fprintf(fp
, "block block_%u:\n", block
->index
);
1060 /* sort the predecessors by index so we consistently print the same thing */
1063 malloc(block
->predecessors
->entries
* sizeof(nir_block
*));
1065 struct set_entry
*entry
;
1067 set_foreach(block
->predecessors
, entry
) {
1068 preds
[i
++] = (nir_block
*) entry
->key
;
1071 qsort(preds
, block
->predecessors
->entries
, sizeof(nir_block
*),
1072 compare_block_index
);
1074 print_tabs(tabs
, fp
);
1075 fprintf(fp
, "/* preds: ");
1076 for (unsigned i
= 0; i
< block
->predecessors
->entries
; i
++) {
1077 fprintf(fp
, "block_%u ", preds
[i
]->index
);
1079 fprintf(fp
, "*/\n");
1083 nir_foreach_instr(instr
, block
) {
1084 print_instr(instr
, state
, tabs
);
1086 print_annotation(state
, instr
);
1089 print_tabs(tabs
, fp
);
1090 fprintf(fp
, "/* succs: ");
1091 for (unsigned i
= 0; i
< 2; i
++)
1092 if (block
->successors
[i
]) {
1093 fprintf(fp
, "block_%u ", block
->successors
[i
]->index
);
1095 fprintf(fp
, "*/\n");
1099 print_if(nir_if
*if_stmt
, print_state
*state
, unsigned tabs
)
1101 FILE *fp
= state
->fp
;
1103 print_tabs(tabs
, fp
);
1105 print_src(&if_stmt
->condition
, state
);
1106 fprintf(fp
, " {\n");
1107 foreach_list_typed(nir_cf_node
, node
, node
, &if_stmt
->then_list
) {
1108 print_cf_node(node
, state
, tabs
+ 1);
1110 print_tabs(tabs
, fp
);
1111 fprintf(fp
, "} else {\n");
1112 foreach_list_typed(nir_cf_node
, node
, node
, &if_stmt
->else_list
) {
1113 print_cf_node(node
, state
, tabs
+ 1);
1115 print_tabs(tabs
, fp
);
1120 print_loop(nir_loop
*loop
, print_state
*state
, unsigned tabs
)
1122 FILE *fp
= state
->fp
;
1124 print_tabs(tabs
, fp
);
1125 fprintf(fp
, "loop {\n");
1126 foreach_list_typed(nir_cf_node
, node
, node
, &loop
->body
) {
1127 print_cf_node(node
, state
, tabs
+ 1);
1129 print_tabs(tabs
, fp
);
1134 print_cf_node(nir_cf_node
*node
, print_state
*state
, unsigned int tabs
)
1136 switch (node
->type
) {
1137 case nir_cf_node_block
:
1138 print_block(nir_cf_node_as_block(node
), state
, tabs
);
1141 case nir_cf_node_if
:
1142 print_if(nir_cf_node_as_if(node
), state
, tabs
);
1145 case nir_cf_node_loop
:
1146 print_loop(nir_cf_node_as_loop(node
), state
, tabs
);
1150 unreachable("Invalid CFG node type");
1155 print_function_impl(nir_function_impl
*impl
, print_state
*state
)
1157 FILE *fp
= state
->fp
;
1159 fprintf(fp
, "\nimpl %s ", impl
->function
->name
);
1163 nir_foreach_variable(var
, &impl
->locals
) {
1165 print_var_decl(var
, state
);
1168 foreach_list_typed(nir_register
, reg
, node
, &impl
->registers
) {
1170 print_register_decl(reg
, state
);
1173 nir_index_blocks(impl
);
1175 foreach_list_typed(nir_cf_node
, node
, node
, &impl
->body
) {
1176 print_cf_node(node
, state
, 1);
1179 fprintf(fp
, "\tblock block_%u:\n}\n\n", impl
->end_block
->index
);
1183 print_function(nir_function
*function
, print_state
*state
)
1185 FILE *fp
= state
->fp
;
1187 fprintf(fp
, "decl_function %s (%d params)", function
->name
,
1188 function
->num_params
);
1192 if (function
->impl
!= NULL
) {
1193 print_function_impl(function
->impl
, state
);
1199 init_print_state(print_state
*state
, nir_shader
*shader
, FILE *fp
)
1202 state
->shader
= shader
;
1203 state
->ht
= _mesa_hash_table_create(NULL
, _mesa_hash_pointer
,
1204 _mesa_key_pointer_equal
);
1205 state
->syms
= _mesa_set_create(NULL
, _mesa_key_hash_string
,
1206 _mesa_key_string_equal
);
1211 destroy_print_state(print_state
*state
)
1213 _mesa_hash_table_destroy(state
->ht
, NULL
);
1214 _mesa_set_destroy(state
->syms
, NULL
);
1218 nir_print_shader_annotated(nir_shader
*shader
, FILE *fp
,
1219 struct hash_table
*annotations
)
1222 init_print_state(&state
, shader
, fp
);
1224 state
.annotations
= annotations
;
1226 fprintf(fp
, "shader: %s\n", gl_shader_stage_name(shader
->info
.stage
));
1228 if (shader
->info
.name
)
1229 fprintf(fp
, "name: %s\n", shader
->info
.name
);
1231 if (shader
->info
.label
)
1232 fprintf(fp
, "label: %s\n", shader
->info
.label
);
1234 switch (shader
->info
.stage
) {
1235 case MESA_SHADER_COMPUTE
:
1236 fprintf(fp
, "local-size: %u, %u, %u%s\n",
1237 shader
->info
.cs
.local_size
[0],
1238 shader
->info
.cs
.local_size
[1],
1239 shader
->info
.cs
.local_size
[2],
1240 shader
->info
.cs
.local_size_variable
? " (variable)" : "");
1241 fprintf(fp
, "shared-size: %u\n", shader
->info
.cs
.shared_size
);
1247 fprintf(fp
, "inputs: %u\n", shader
->num_inputs
);
1248 fprintf(fp
, "outputs: %u\n", shader
->num_outputs
);
1249 fprintf(fp
, "uniforms: %u\n", shader
->num_uniforms
);
1250 fprintf(fp
, "shared: %u\n", shader
->num_shared
);
1252 nir_foreach_variable(var
, &shader
->uniforms
) {
1253 print_var_decl(var
, &state
);
1256 nir_foreach_variable(var
, &shader
->inputs
) {
1257 print_var_decl(var
, &state
);
1260 nir_foreach_variable(var
, &shader
->outputs
) {
1261 print_var_decl(var
, &state
);
1264 nir_foreach_variable(var
, &shader
->shared
) {
1265 print_var_decl(var
, &state
);
1268 nir_foreach_variable(var
, &shader
->globals
) {
1269 print_var_decl(var
, &state
);
1272 nir_foreach_variable(var
, &shader
->system_values
) {
1273 print_var_decl(var
, &state
);
1276 foreach_list_typed(nir_register
, reg
, node
, &shader
->registers
) {
1277 print_register_decl(reg
, &state
);
1280 foreach_list_typed(nir_function
, func
, node
, &shader
->functions
) {
1281 print_function(func
, &state
);
1284 destroy_print_state(&state
);
1288 nir_print_shader(nir_shader
*shader
, FILE *fp
)
1290 nir_print_shader_annotated(shader
, fp
, NULL
);
1294 nir_print_instr(const nir_instr
*instr
, FILE *fp
)
1296 print_state state
= {
1299 print_instr(instr
, &state
, 0);