2 * Copyright © 2014 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
24 * Connor Abbott (cwabbott0@gmail.com)
29 #include "compiler/shader_enums.h"
30 #include "util/half_float.h"
31 #include "vulkan/vulkan_core.h"
34 #include <inttypes.h> /* for PRIx64 macro */
37 print_tabs(unsigned num_tabs
, FILE *fp
)
39 for (unsigned i
= 0; i
< num_tabs
; i
++)
46 /** map from nir_variable -> printable name */
47 struct hash_table
*ht
;
49 /** set of names used so far for nir_variables */
52 /* an index used to make new non-conflicting names */
56 * Optional table of annotations mapping nir object
57 * (such as instr or var) to message to print.
59 struct hash_table
*annotations
;
63 print_annotation(print_state
*state
, void *obj
)
65 if (!state
->annotations
)
68 struct hash_entry
*entry
= _mesa_hash_table_search(state
->annotations
, obj
);
72 const char *note
= entry
->data
;
73 _mesa_hash_table_remove(state
->annotations
, entry
);
75 fprintf(stderr
, "%s\n\n", note
);
79 print_register(nir_register
*reg
, print_state
*state
)
82 if (reg
->name
!= NULL
)
83 fprintf(fp
, "/* %s */ ", reg
->name
);
84 fprintf(fp
, "r%u", reg
->index
);
87 static const char *sizes
[] = { "error", "vec1", "vec2", "vec3", "vec4",
88 "error", "error", "error", "vec8",
89 "error", "error", "error", "error",
90 "error", "error", "error", "vec16"};
93 print_register_decl(nir_register
*reg
, print_state
*state
)
96 fprintf(fp
, "decl_reg %s %u ", sizes
[reg
->num_components
], reg
->bit_size
);
97 print_register(reg
, state
);
98 if (reg
->num_array_elems
!= 0)
99 fprintf(fp
, "[%u]", reg
->num_array_elems
);
104 print_ssa_def(nir_ssa_def
*def
, print_state
*state
)
106 FILE *fp
= state
->fp
;
107 if (def
->name
!= NULL
)
108 fprintf(fp
, "/* %s */ ", def
->name
);
109 fprintf(fp
, "%s %u ssa_%u", sizes
[def
->num_components
], def
->bit_size
,
114 print_ssa_use(nir_ssa_def
*def
, print_state
*state
)
116 FILE *fp
= state
->fp
;
117 if (def
->name
!= NULL
)
118 fprintf(fp
, "/* %s */ ", def
->name
);
119 fprintf(fp
, "ssa_%u", def
->index
);
122 static void print_src(const nir_src
*src
, print_state
*state
);
125 print_reg_src(const nir_reg_src
*src
, print_state
*state
)
127 FILE *fp
= state
->fp
;
128 print_register(src
->reg
, state
);
129 if (src
->reg
->num_array_elems
!= 0) {
130 fprintf(fp
, "[%u", src
->base_offset
);
131 if (src
->indirect
!= NULL
) {
133 print_src(src
->indirect
, state
);
140 print_reg_dest(nir_reg_dest
*dest
, print_state
*state
)
142 FILE *fp
= state
->fp
;
143 print_register(dest
->reg
, state
);
144 if (dest
->reg
->num_array_elems
!= 0) {
145 fprintf(fp
, "[%u", dest
->base_offset
);
146 if (dest
->indirect
!= NULL
) {
148 print_src(dest
->indirect
, state
);
155 print_src(const nir_src
*src
, print_state
*state
)
158 print_ssa_use(src
->ssa
, state
);
160 print_reg_src(&src
->reg
, state
);
164 print_dest(nir_dest
*dest
, print_state
*state
)
167 print_ssa_def(&dest
->ssa
, state
);
169 print_reg_dest(&dest
->reg
, state
);
173 print_alu_src(nir_alu_instr
*instr
, unsigned src
, print_state
*state
)
175 FILE *fp
= state
->fp
;
177 if (instr
->src
[src
].negate
)
179 if (instr
->src
[src
].abs
)
182 print_src(&instr
->src
[src
].src
, state
);
184 bool print_swizzle
= false;
185 nir_component_mask_t used_channels
= 0;
187 for (unsigned i
= 0; i
< NIR_MAX_VEC_COMPONENTS
; i
++) {
188 if (!nir_alu_instr_channel_used(instr
, src
, i
))
193 if (instr
->src
[src
].swizzle
[i
] != i
) {
194 print_swizzle
= true;
199 unsigned live_channels
= nir_src_num_components(instr
->src
[src
].src
);
201 if (print_swizzle
|| used_channels
!= live_channels
) {
203 for (unsigned i
= 0; i
< NIR_MAX_VEC_COMPONENTS
; i
++) {
204 if (!nir_alu_instr_channel_used(instr
, src
, i
))
207 fprintf(fp
, "%c", "xyzw"[instr
->src
[src
].swizzle
[i
]]);
211 if (instr
->src
[src
].abs
)
216 print_alu_dest(nir_alu_dest
*dest
, print_state
*state
)
218 FILE *fp
= state
->fp
;
219 /* we're going to print the saturate modifier later, after the opcode */
221 print_dest(&dest
->dest
, state
);
223 if (!dest
->dest
.is_ssa
&&
224 dest
->write_mask
!= (1 << dest
->dest
.reg
.reg
->num_components
) - 1) {
226 for (unsigned i
= 0; i
< NIR_MAX_VEC_COMPONENTS
; i
++)
227 if ((dest
->write_mask
>> i
) & 1)
228 fprintf(fp
, "%c", "xyzw"[i
]);
233 print_alu_instr(nir_alu_instr
*instr
, print_state
*state
)
235 FILE *fp
= state
->fp
;
237 print_alu_dest(&instr
->dest
, state
);
239 fprintf(fp
, " = %s", nir_op_infos
[instr
->op
].name
);
242 if (instr
->dest
.saturate
)
246 for (unsigned i
= 0; i
< nir_op_infos
[instr
->op
].num_inputs
; i
++) {
250 print_alu_src(instr
, i
, state
);
255 get_var_name(nir_variable
*var
, print_state
*state
)
257 if (state
->ht
== NULL
)
258 return var
->name
? var
->name
: "unnamed";
262 struct hash_entry
*entry
= _mesa_hash_table_search(state
->ht
, var
);
267 if (var
->name
== NULL
) {
268 name
= ralloc_asprintf(state
->syms
, "@%u", state
->index
++);
270 struct set_entry
*set_entry
= _mesa_set_search(state
->syms
, var
->name
);
271 if (set_entry
!= NULL
) {
272 /* we have a collision with another name, append an @ + a unique
274 name
= ralloc_asprintf(state
->syms
, "%s@%u", var
->name
,
277 /* Mark this one as seen */
278 _mesa_set_add(state
->syms
, var
->name
);
283 _mesa_hash_table_insert(state
->ht
, var
, name
);
289 print_constant(nir_constant
*c
, const struct glsl_type
*type
, print_state
*state
)
291 FILE *fp
= state
->fp
;
292 const unsigned rows
= glsl_get_vector_elements(type
);
293 const unsigned cols
= glsl_get_matrix_columns(type
);
296 switch (glsl_get_base_type(type
)) {
298 /* Only float base types can be matrices. */
301 for (i
= 0; i
< rows
; i
++) {
302 if (i
> 0) fprintf(fp
, ", ");
303 fprintf(fp
, "%s", c
->values
[0].b
[i
] ? "true" : "false");
307 case GLSL_TYPE_UINT8
:
309 /* Only float base types can be matrices. */
312 for (i
= 0; i
< rows
; i
++) {
313 if (i
> 0) fprintf(fp
, ", ");
314 fprintf(fp
, "0x%02x", c
->values
[0].u8
[i
]);
318 case GLSL_TYPE_UINT16
:
319 case GLSL_TYPE_INT16
:
320 /* Only float base types can be matrices. */
323 for (i
= 0; i
< rows
; i
++) {
324 if (i
> 0) fprintf(fp
, ", ");
325 fprintf(fp
, "0x%04x", c
->values
[0].u16
[i
]);
331 /* Only float base types can be matrices. */
334 for (i
= 0; i
< rows
; i
++) {
335 if (i
> 0) fprintf(fp
, ", ");
336 fprintf(fp
, "0x%08x", c
->values
[0].u32
[i
]);
340 case GLSL_TYPE_FLOAT16
:
341 for (i
= 0; i
< cols
; i
++) {
342 for (j
= 0; j
< rows
; j
++) {
343 if (i
+ j
> 0) fprintf(fp
, ", ");
344 fprintf(fp
, "%f", _mesa_half_to_float(c
->values
[i
].u16
[j
]));
349 case GLSL_TYPE_FLOAT
:
350 for (i
= 0; i
< cols
; i
++) {
351 for (j
= 0; j
< rows
; j
++) {
352 if (i
+ j
> 0) fprintf(fp
, ", ");
353 fprintf(fp
, "%f", c
->values
[i
].f32
[j
]);
358 case GLSL_TYPE_DOUBLE
:
359 for (i
= 0; i
< cols
; i
++) {
360 for (j
= 0; j
< rows
; j
++) {
361 if (i
+ j
> 0) fprintf(fp
, ", ");
362 fprintf(fp
, "%f", c
->values
[i
].f64
[j
]);
367 case GLSL_TYPE_UINT64
:
368 case GLSL_TYPE_INT64
:
369 /* Only float base types can be matrices. */
372 for (i
= 0; i
< cols
; i
++) {
373 if (i
> 0) fprintf(fp
, ", ");
374 fprintf(fp
, "0x%08" PRIx64
, c
->values
[0].u64
[i
]);
378 case GLSL_TYPE_STRUCT
:
379 for (i
= 0; i
< c
->num_elements
; i
++) {
380 if (i
> 0) fprintf(fp
, ", ");
382 print_constant(c
->elements
[i
], glsl_get_struct_field(type
, i
), state
);
387 case GLSL_TYPE_ARRAY
:
388 for (i
= 0; i
< c
->num_elements
; i
++) {
389 if (i
> 0) fprintf(fp
, ", ");
391 print_constant(c
->elements
[i
], glsl_get_array_element(type
), state
);
397 unreachable("not reached");
402 get_variable_mode_str(nir_variable_mode mode
, bool want_local_global_mode
)
405 case nir_var_shader_in
:
407 case nir_var_shader_out
:
409 case nir_var_uniform
:
411 case nir_var_mem_ubo
:
413 case nir_var_system_value
:
415 case nir_var_mem_ssbo
:
417 case nir_var_mem_shared
:
419 case nir_var_mem_global
:
421 case nir_var_shader_temp
:
422 return want_local_global_mode
? "shader_temp" : "";
423 case nir_var_function_temp
:
424 return want_local_global_mode
? "function_temp" : "";
431 print_var_decl(nir_variable
*var
, print_state
*state
)
433 FILE *fp
= state
->fp
;
435 fprintf(fp
, "decl_var ");
437 const char *const cent
= (var
->data
.centroid
) ? "centroid " : "";
438 const char *const samp
= (var
->data
.sample
) ? "sample " : "";
439 const char *const patch
= (var
->data
.patch
) ? "patch " : "";
440 const char *const inv
= (var
->data
.invariant
) ? "invariant " : "";
441 fprintf(fp
, "%s%s%s%s%s %s ",
442 cent
, samp
, patch
, inv
, get_variable_mode_str(var
->data
.mode
, false),
443 glsl_interp_mode_name(var
->data
.interpolation
));
445 enum gl_access_qualifier access
= var
->data
.image
.access
;
446 const char *const coher
= (access
& ACCESS_COHERENT
) ? "coherent " : "";
447 const char *const volat
= (access
& ACCESS_VOLATILE
) ? "volatile " : "";
448 const char *const restr
= (access
& ACCESS_RESTRICT
) ? "restrict " : "";
449 const char *const ronly
= (access
& ACCESS_NON_WRITEABLE
) ? "readonly " : "";
450 const char *const wonly
= (access
& ACCESS_NON_READABLE
) ? "writeonly " : "";
451 fprintf(fp
, "%s%s%s%s%s", coher
, volat
, restr
, ronly
, wonly
);
453 #define FORMAT_CASE(x) case x: fprintf(stderr, #x " "); break
454 switch (var
->data
.image
.format
) {
455 FORMAT_CASE(GL_RGBA32F
);
456 FORMAT_CASE(GL_RGBA32UI
);
457 FORMAT_CASE(GL_RGBA32I
);
458 FORMAT_CASE(GL_R32F
);
459 FORMAT_CASE(GL_R32UI
);
460 FORMAT_CASE(GL_R32I
);
461 FORMAT_CASE(GL_RG32F
);
462 FORMAT_CASE(GL_RG32UI
);
463 FORMAT_CASE(GL_RG32I
);
466 FORMAT_CASE(GL_RGBA8
);
467 FORMAT_CASE(GL_R8_SNORM
);
468 FORMAT_CASE(GL_RG8_SNORM
);
469 FORMAT_CASE(GL_RGBA8_SNORM
);
471 FORMAT_CASE(GL_RG16
);
472 FORMAT_CASE(GL_RGBA16
);
473 FORMAT_CASE(GL_R16_SNORM
);
474 FORMAT_CASE(GL_RG16_SNORM
);
475 FORMAT_CASE(GL_RGBA16_SNORM
);
476 FORMAT_CASE(GL_R16F
);
477 FORMAT_CASE(GL_RG16F
);
478 FORMAT_CASE(GL_RGBA16F
);
479 FORMAT_CASE(GL_R8UI
);
481 FORMAT_CASE(GL_RG8UI
);
482 FORMAT_CASE(GL_RG8I
);
483 FORMAT_CASE(GL_RGBA8UI
);
484 FORMAT_CASE(GL_RGBA8I
);
485 FORMAT_CASE(GL_R16UI
);
486 FORMAT_CASE(GL_R16I
);
487 FORMAT_CASE(GL_RG16UI
);
488 FORMAT_CASE(GL_RG16I
);
489 FORMAT_CASE(GL_RGBA16UI
);
490 FORMAT_CASE(GL_RGBA16I
);
491 FORMAT_CASE(GL_R11F_G11F_B10F
);
492 FORMAT_CASE(GL_RGB9_E5
);
493 FORMAT_CASE(GL_RGB10_A2
);
494 FORMAT_CASE(GL_RGB10_A2UI
);
495 default: /* Including the normal GL_NONE */
500 fprintf(fp
, "%s %s", glsl_get_type_name(var
->type
),
501 get_var_name(var
, state
));
503 if (var
->data
.mode
== nir_var_shader_in
||
504 var
->data
.mode
== nir_var_shader_out
||
505 var
->data
.mode
== nir_var_uniform
||
506 var
->data
.mode
== nir_var_mem_ubo
||
507 var
->data
.mode
== nir_var_mem_ssbo
) {
508 const char *loc
= NULL
;
511 switch (state
->shader
->info
.stage
) {
512 case MESA_SHADER_VERTEX
:
513 if (var
->data
.mode
== nir_var_shader_in
)
514 loc
= gl_vert_attrib_name(var
->data
.location
);
515 else if (var
->data
.mode
== nir_var_shader_out
)
516 loc
= gl_varying_slot_name(var
->data
.location
);
518 case MESA_SHADER_GEOMETRY
:
519 if ((var
->data
.mode
== nir_var_shader_in
) ||
520 (var
->data
.mode
== nir_var_shader_out
))
521 loc
= gl_varying_slot_name(var
->data
.location
);
523 case MESA_SHADER_FRAGMENT
:
524 if (var
->data
.mode
== nir_var_shader_in
)
525 loc
= gl_varying_slot_name(var
->data
.location
);
526 else if (var
->data
.mode
== nir_var_shader_out
)
527 loc
= gl_frag_result_name(var
->data
.location
);
529 case MESA_SHADER_TESS_CTRL
:
530 case MESA_SHADER_TESS_EVAL
:
531 case MESA_SHADER_COMPUTE
:
532 case MESA_SHADER_KERNEL
:
539 snprintf(buf
, sizeof(buf
), "%u", var
->data
.location
);
543 /* For shader I/O vars that have been split to components or packed,
544 * print the fractional location within the input/output.
546 unsigned int num_components
=
547 glsl_get_components(glsl_without_array(var
->type
));
548 const char *components
= NULL
;
549 char components_local
[6] = {'.' /* the rest is 0-filled */};
550 switch (var
->data
.mode
) {
551 case nir_var_shader_in
:
552 case nir_var_shader_out
:
553 if (num_components
< 4 && num_components
!= 0) {
554 const char *xyzw
= "xyzw";
555 for (int i
= 0; i
< num_components
; i
++)
556 components_local
[i
+ 1] = xyzw
[i
+ var
->data
.location_frac
];
558 components
= components_local
;
565 fprintf(fp
, " (%s%s, %u, %u)%s", loc
,
566 components
? components
: "",
567 var
->data
.driver_location
, var
->data
.binding
,
568 var
->data
.compact
? " compact" : "");
571 if (var
->constant_initializer
) {
572 fprintf(fp
, " = { ");
573 print_constant(var
->constant_initializer
, var
->type
, state
);
578 print_annotation(state
, var
);
582 print_deref_link(const nir_deref_instr
*instr
, bool whole_chain
, print_state
*state
)
584 FILE *fp
= state
->fp
;
586 if (instr
->deref_type
== nir_deref_type_var
) {
587 fprintf(fp
, "%s", get_var_name(instr
->var
, state
));
589 } else if (instr
->deref_type
== nir_deref_type_cast
) {
590 fprintf(fp
, "(%s *)", glsl_get_type_name(instr
->type
));
591 print_src(&instr
->parent
, state
);
595 assert(instr
->parent
.is_ssa
);
596 nir_deref_instr
*parent
=
597 nir_instr_as_deref(instr
->parent
.ssa
->parent_instr
);
599 /* Is the parent we're going to print a bare cast? */
600 const bool is_parent_cast
=
601 whole_chain
&& parent
->deref_type
== nir_deref_type_cast
;
603 /* If we're not printing the whole chain, the parent we print will be a SSA
604 * value that represents a pointer. The only deref type that naturally
605 * gives a pointer is a cast.
607 const bool is_parent_pointer
=
608 !whole_chain
|| parent
->deref_type
== nir_deref_type_cast
;
610 /* Struct derefs have a nice syntax that works on pointers, arrays derefs
613 const bool need_deref
=
614 is_parent_pointer
&& instr
->deref_type
!= nir_deref_type_struct
;
616 /* Cast need extra parens and so * dereferences */
617 if (is_parent_cast
|| need_deref
)
624 print_deref_link(parent
, whole_chain
, state
);
626 print_src(&instr
->parent
, state
);
629 if (is_parent_cast
|| need_deref
)
632 switch (instr
->deref_type
) {
633 case nir_deref_type_struct
:
634 fprintf(fp
, "%s%s", is_parent_pointer
? "->" : ".",
635 glsl_get_struct_elem_name(parent
->type
, instr
->strct
.index
));
638 case nir_deref_type_array
:
639 case nir_deref_type_ptr_as_array
: {
640 nir_const_value
*const_index
= nir_src_as_const_value(instr
->arr
.index
);
642 fprintf(fp
, "[%u]", const_index
->u32
[0]);
645 print_src(&instr
->arr
.index
, state
);
651 case nir_deref_type_array_wildcard
:
656 unreachable("Invalid deref instruction type");
661 print_deref_instr(nir_deref_instr
*instr
, print_state
*state
)
663 FILE *fp
= state
->fp
;
665 print_dest(&instr
->dest
, state
);
667 switch (instr
->deref_type
) {
668 case nir_deref_type_var
:
669 fprintf(fp
, " = deref_var ");
671 case nir_deref_type_array
:
672 case nir_deref_type_array_wildcard
:
673 fprintf(fp
, " = deref_array ");
675 case nir_deref_type_struct
:
676 fprintf(fp
, " = deref_struct ");
678 case nir_deref_type_cast
:
679 fprintf(fp
, " = deref_cast ");
681 case nir_deref_type_ptr_as_array
:
682 fprintf(fp
, " = deref_ptr_as_array ");
685 unreachable("Invalid deref instruction type");
688 /* Only casts naturally return a pointer type */
689 if (instr
->deref_type
!= nir_deref_type_cast
)
692 print_deref_link(instr
, false, state
);
694 fprintf(fp
, " (%s %s) ",
695 get_variable_mode_str(instr
->mode
, true),
696 glsl_get_type_name(instr
->type
));
698 if (instr
->deref_type
!= nir_deref_type_var
&&
699 instr
->deref_type
!= nir_deref_type_cast
) {
700 /* Print the entire chain as a comment */
702 print_deref_link(instr
, true, state
);
708 vulkan_descriptor_type_name(VkDescriptorType type
)
711 case VK_DESCRIPTOR_TYPE_SAMPLER
: return "sampler";
712 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER
: return "texture+sampler";
713 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE
: return "texture";
714 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE
: return "image";
715 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER
: return "texture-buffer";
716 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER
: return "image-buffer";
717 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER
: return "UBO";
718 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER
: return "SSBO";
719 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC
: return "UBO";
720 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC
: return "SSBO";
721 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT
: return "input-att";
722 case VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK_EXT
: return "inline-UBO";
723 default: return "unknown";
728 print_intrinsic_instr(nir_intrinsic_instr
*instr
, print_state
*state
)
730 const nir_intrinsic_info
*info
= &nir_intrinsic_infos
[instr
->intrinsic
];
731 unsigned num_srcs
= info
->num_srcs
;
732 FILE *fp
= state
->fp
;
734 if (info
->has_dest
) {
735 print_dest(&instr
->dest
, state
);
739 fprintf(fp
, "intrinsic %s (", info
->name
);
741 for (unsigned i
= 0; i
< num_srcs
; i
++) {
745 print_src(&instr
->src
[i
], state
);
750 for (unsigned i
= 0; i
< info
->num_indices
; i
++) {
754 fprintf(fp
, "%d", instr
->const_index
[i
]);
759 static const char *index_name
[NIR_INTRINSIC_NUM_INDEX_FLAGS
] = {
760 [NIR_INTRINSIC_BASE
] = "base",
761 [NIR_INTRINSIC_WRMASK
] = "wrmask",
762 [NIR_INTRINSIC_STREAM_ID
] = "stream-id",
763 [NIR_INTRINSIC_UCP_ID
] = "ucp-id",
764 [NIR_INTRINSIC_RANGE
] = "range",
765 [NIR_INTRINSIC_DESC_SET
] = "desc-set",
766 [NIR_INTRINSIC_BINDING
] = "binding",
767 [NIR_INTRINSIC_COMPONENT
] = "component",
768 [NIR_INTRINSIC_INTERP_MODE
] = "interp_mode",
769 [NIR_INTRINSIC_REDUCTION_OP
] = "reduction_op",
770 [NIR_INTRINSIC_CLUSTER_SIZE
] = "cluster_size",
771 [NIR_INTRINSIC_PARAM_IDX
] = "param_idx",
772 [NIR_INTRINSIC_IMAGE_DIM
] = "image_dim",
773 [NIR_INTRINSIC_IMAGE_ARRAY
] = "image_array",
774 [NIR_INTRINSIC_ACCESS
] = "access",
775 [NIR_INTRINSIC_FORMAT
] = "format",
776 [NIR_INTRINSIC_ALIGN_MUL
] = "align_mul",
777 [NIR_INTRINSIC_ALIGN_OFFSET
] = "align_offset",
778 [NIR_INTRINSIC_DESC_TYPE
] = "desc_type",
780 for (unsigned idx
= 1; idx
< NIR_INTRINSIC_NUM_INDEX_FLAGS
; idx
++) {
781 if (!info
->index_map
[idx
])
784 if (idx
== NIR_INTRINSIC_WRMASK
) {
785 /* special case wrmask to show it as a writemask.. */
786 unsigned wrmask
= nir_intrinsic_write_mask(instr
);
787 fprintf(fp
, " wrmask=");
788 for (unsigned i
= 0; i
< 4; i
++)
789 if ((wrmask
>> i
) & 1)
790 fprintf(fp
, "%c", "xyzw"[i
]);
791 } else if (idx
== NIR_INTRINSIC_REDUCTION_OP
) {
792 nir_op reduction_op
= nir_intrinsic_reduction_op(instr
);
793 fprintf(fp
, " reduction_op=%s", nir_op_infos
[reduction_op
].name
);
794 } else if (idx
== NIR_INTRINSIC_IMAGE_DIM
) {
795 static const char *dim_name
[] = {
796 [GLSL_SAMPLER_DIM_1D
] = "1D",
797 [GLSL_SAMPLER_DIM_2D
] = "2D",
798 [GLSL_SAMPLER_DIM_3D
] = "3D",
799 [GLSL_SAMPLER_DIM_CUBE
] = "Cube",
800 [GLSL_SAMPLER_DIM_RECT
] = "Rect",
801 [GLSL_SAMPLER_DIM_BUF
] = "Buf",
802 [GLSL_SAMPLER_DIM_MS
] = "2D-MSAA",
803 [GLSL_SAMPLER_DIM_SUBPASS
] = "Subpass",
804 [GLSL_SAMPLER_DIM_SUBPASS_MS
] = "Subpass-MSAA",
806 enum glsl_sampler_dim dim
= nir_intrinsic_image_dim(instr
);
807 assert(dim
< ARRAY_SIZE(dim_name
) && dim_name
[dim
]);
808 fprintf(fp
, " image_dim=%s", dim_name
[dim
]);
809 } else if (idx
== NIR_INTRINSIC_IMAGE_ARRAY
) {
810 bool array
= nir_intrinsic_image_array(instr
);
811 fprintf(fp
, " image_array=%s", array
? "true" : "false");
812 } else if (idx
== NIR_INTRINSIC_DESC_TYPE
) {
813 VkDescriptorType desc_type
= nir_intrinsic_desc_type(instr
);
814 fprintf(fp
, " desc_type=%s", vulkan_descriptor_type_name(desc_type
));
816 unsigned off
= info
->index_map
[idx
] - 1;
817 assert(index_name
[idx
]); /* forgot to update index_name table? */
818 fprintf(fp
, " %s=%d", index_name
[idx
], instr
->const_index
[off
]);
826 struct exec_list
*var_list
= NULL
;
828 switch (instr
->intrinsic
) {
829 case nir_intrinsic_load_uniform
:
830 var_list
= &state
->shader
->uniforms
;
832 case nir_intrinsic_load_input
:
833 case nir_intrinsic_load_interpolated_input
:
834 case nir_intrinsic_load_per_vertex_input
:
835 var_list
= &state
->shader
->inputs
;
837 case nir_intrinsic_load_output
:
838 case nir_intrinsic_store_output
:
839 case nir_intrinsic_store_per_vertex_output
:
840 var_list
= &state
->shader
->outputs
;
846 nir_foreach_variable(var
, var_list
) {
847 if ((var
->data
.driver_location
== nir_intrinsic_base(instr
)) &&
848 (instr
->intrinsic
== nir_intrinsic_load_uniform
||
849 (nir_intrinsic_component(instr
) >= var
->data
.location_frac
&&
850 nir_intrinsic_component(instr
) <
851 (var
->data
.location_frac
+ glsl_get_components(var
->type
)))) &&
853 fprintf(fp
, "\t/* %s */", var
->name
);
860 print_tex_instr(nir_tex_instr
*instr
, print_state
*state
)
862 FILE *fp
= state
->fp
;
864 print_dest(&instr
->dest
, state
);
884 case nir_texop_txf_ms
:
885 fprintf(fp
, "txf_ms ");
887 case nir_texop_txf_ms_mcs
:
888 fprintf(fp
, "txf_ms_mcs ");
899 case nir_texop_query_levels
:
900 fprintf(fp
, "query_levels ");
902 case nir_texop_texture_samples
:
903 fprintf(fp
, "texture_samples ");
905 case nir_texop_samples_identical
:
906 fprintf(fp
, "samples_identical ");
909 unreachable("Invalid texture operation");
913 bool has_texture_deref
= false, has_sampler_deref
= false;
914 for (unsigned i
= 0; i
< instr
->num_srcs
; i
++) {
915 print_src(&instr
->src
[i
].src
, state
);
919 switch(instr
->src
[i
].src_type
) {
920 case nir_tex_src_coord
:
921 fprintf(fp
, "(coord)");
923 case nir_tex_src_projector
:
924 fprintf(fp
, "(projector)");
926 case nir_tex_src_comparator
:
927 fprintf(fp
, "(comparator)");
929 case nir_tex_src_offset
:
930 fprintf(fp
, "(offset)");
932 case nir_tex_src_bias
:
933 fprintf(fp
, "(bias)");
935 case nir_tex_src_lod
:
936 fprintf(fp
, "(lod)");
938 case nir_tex_src_min_lod
:
939 fprintf(fp
, "(min_lod)");
941 case nir_tex_src_ms_index
:
942 fprintf(fp
, "(ms_index)");
944 case nir_tex_src_ms_mcs
:
945 fprintf(fp
, "(ms_mcs)");
947 case nir_tex_src_ddx
:
948 fprintf(fp
, "(ddx)");
950 case nir_tex_src_ddy
:
951 fprintf(fp
, "(ddy)");
953 case nir_tex_src_texture_deref
:
954 has_texture_deref
= true;
955 fprintf(fp
, "(texture_deref)");
957 case nir_tex_src_sampler_deref
:
958 has_sampler_deref
= true;
959 fprintf(fp
, "(sampler_deref)");
961 case nir_tex_src_texture_offset
:
962 fprintf(fp
, "(texture_offset)");
964 case nir_tex_src_sampler_offset
:
965 fprintf(fp
, "(sampler_offset)");
967 case nir_tex_src_texture_handle
:
968 fprintf(fp
, "(texture_handle)");
970 case nir_tex_src_sampler_handle
:
971 fprintf(fp
, "(sampler_handle)");
973 case nir_tex_src_plane
:
974 fprintf(fp
, "(plane)");
978 unreachable("Invalid texture source type");
985 if (instr
->op
== nir_texop_tg4
) {
986 fprintf(fp
, "%u (gather_component), ", instr
->component
);
989 if (nir_tex_instr_has_explicit_tg4_offsets(instr
)) {
990 fprintf(fp
, "{ (%i, %i)", instr
->tg4_offsets
[0][0], instr
->tg4_offsets
[0][1]);
991 for (unsigned i
= 1; i
< 4; ++i
)
992 fprintf(fp
, ", (%i, %i)", instr
->tg4_offsets
[i
][0],
993 instr
->tg4_offsets
[i
][1]);
994 fprintf(fp
, " } (offsets), ");
997 if (!has_texture_deref
) {
998 fprintf(fp
, "%u (texture), ", instr
->texture_index
);
1001 if (!has_sampler_deref
) {
1002 fprintf(fp
, "%u (sampler), ", instr
->sampler_index
);
1007 print_call_instr(nir_call_instr
*instr
, print_state
*state
)
1009 FILE *fp
= state
->fp
;
1011 fprintf(fp
, "call %s ", instr
->callee
->name
);
1013 for (unsigned i
= 0; i
< instr
->num_params
; i
++) {
1017 print_src(&instr
->params
[i
], state
);
1022 print_load_const_instr(nir_load_const_instr
*instr
, print_state
*state
)
1024 FILE *fp
= state
->fp
;
1026 print_ssa_def(&instr
->def
, state
);
1028 fprintf(fp
, " = load_const (");
1030 for (unsigned i
= 0; i
< instr
->def
.num_components
; i
++) {
1035 * we don't really know the type of the constant (if it will be used as a
1036 * float or an int), so just print the raw constant in hex for fidelity
1037 * and then print the float in a comment for readability.
1040 switch (instr
->def
.bit_size
) {
1042 fprintf(fp
, "0x%16" PRIx64
" /* %f */", instr
->value
.u64
[i
],
1043 instr
->value
.f64
[i
]);
1046 fprintf(fp
, "0x%08x /* %f */", instr
->value
.u32
[i
], instr
->value
.f32
[i
]);
1049 fprintf(fp
, "0x%04x /* %f */", instr
->value
.u16
[i
],
1050 _mesa_half_to_float(instr
->value
.u16
[i
]));
1053 fprintf(fp
, "0x%02x", instr
->value
.u8
[i
]);
1056 fprintf(fp
, "%s", instr
->value
.b
[i
] ? "true" : "false");
1065 print_jump_instr(nir_jump_instr
*instr
, print_state
*state
)
1067 FILE *fp
= state
->fp
;
1069 switch (instr
->type
) {
1070 case nir_jump_break
:
1071 fprintf(fp
, "break");
1074 case nir_jump_continue
:
1075 fprintf(fp
, "continue");
1078 case nir_jump_return
:
1079 fprintf(fp
, "return");
1085 print_ssa_undef_instr(nir_ssa_undef_instr
* instr
, print_state
*state
)
1087 FILE *fp
= state
->fp
;
1088 print_ssa_def(&instr
->def
, state
);
1089 fprintf(fp
, " = undefined");
1093 print_phi_instr(nir_phi_instr
*instr
, print_state
*state
)
1095 FILE *fp
= state
->fp
;
1096 print_dest(&instr
->dest
, state
);
1097 fprintf(fp
, " = phi ");
1098 nir_foreach_phi_src(src
, instr
) {
1099 if (&src
->node
!= exec_list_get_head(&instr
->srcs
))
1102 fprintf(fp
, "block_%u: ", src
->pred
->index
);
1103 print_src(&src
->src
, state
);
1108 print_parallel_copy_instr(nir_parallel_copy_instr
*instr
, print_state
*state
)
1110 FILE *fp
= state
->fp
;
1111 nir_foreach_parallel_copy_entry(entry
, instr
) {
1112 if (&entry
->node
!= exec_list_get_head(&instr
->entries
))
1115 print_dest(&entry
->dest
, state
);
1117 print_src(&entry
->src
, state
);
1122 print_instr(const nir_instr
*instr
, print_state
*state
, unsigned tabs
)
1124 FILE *fp
= state
->fp
;
1125 print_tabs(tabs
, fp
);
1127 switch (instr
->type
) {
1128 case nir_instr_type_alu
:
1129 print_alu_instr(nir_instr_as_alu(instr
), state
);
1132 case nir_instr_type_deref
:
1133 print_deref_instr(nir_instr_as_deref(instr
), state
);
1136 case nir_instr_type_call
:
1137 print_call_instr(nir_instr_as_call(instr
), state
);
1140 case nir_instr_type_intrinsic
:
1141 print_intrinsic_instr(nir_instr_as_intrinsic(instr
), state
);
1144 case nir_instr_type_tex
:
1145 print_tex_instr(nir_instr_as_tex(instr
), state
);
1148 case nir_instr_type_load_const
:
1149 print_load_const_instr(nir_instr_as_load_const(instr
), state
);
1152 case nir_instr_type_jump
:
1153 print_jump_instr(nir_instr_as_jump(instr
), state
);
1156 case nir_instr_type_ssa_undef
:
1157 print_ssa_undef_instr(nir_instr_as_ssa_undef(instr
), state
);
1160 case nir_instr_type_phi
:
1161 print_phi_instr(nir_instr_as_phi(instr
), state
);
1164 case nir_instr_type_parallel_copy
:
1165 print_parallel_copy_instr(nir_instr_as_parallel_copy(instr
), state
);
1169 unreachable("Invalid instruction type");
1175 compare_block_index(const void *p1
, const void *p2
)
1177 const nir_block
*block1
= *((const nir_block
**) p1
);
1178 const nir_block
*block2
= *((const nir_block
**) p2
);
1180 return (int) block1
->index
- (int) block2
->index
;
1183 static void print_cf_node(nir_cf_node
*node
, print_state
*state
,
1187 print_block(nir_block
*block
, print_state
*state
, unsigned tabs
)
1189 FILE *fp
= state
->fp
;
1191 print_tabs(tabs
, fp
);
1192 fprintf(fp
, "block block_%u:\n", block
->index
);
1194 /* sort the predecessors by index so we consistently print the same thing */
1197 malloc(block
->predecessors
->entries
* sizeof(nir_block
*));
1200 set_foreach(block
->predecessors
, entry
) {
1201 preds
[i
++] = (nir_block
*) entry
->key
;
1204 qsort(preds
, block
->predecessors
->entries
, sizeof(nir_block
*),
1205 compare_block_index
);
1207 print_tabs(tabs
, fp
);
1208 fprintf(fp
, "/* preds: ");
1209 for (unsigned i
= 0; i
< block
->predecessors
->entries
; i
++) {
1210 fprintf(fp
, "block_%u ", preds
[i
]->index
);
1212 fprintf(fp
, "*/\n");
1216 nir_foreach_instr(instr
, block
) {
1217 print_instr(instr
, state
, tabs
);
1219 print_annotation(state
, instr
);
1222 print_tabs(tabs
, fp
);
1223 fprintf(fp
, "/* succs: ");
1224 for (unsigned i
= 0; i
< 2; i
++)
1225 if (block
->successors
[i
]) {
1226 fprintf(fp
, "block_%u ", block
->successors
[i
]->index
);
1228 fprintf(fp
, "*/\n");
1232 print_if(nir_if
*if_stmt
, print_state
*state
, unsigned tabs
)
1234 FILE *fp
= state
->fp
;
1236 print_tabs(tabs
, fp
);
1238 print_src(&if_stmt
->condition
, state
);
1239 fprintf(fp
, " {\n");
1240 foreach_list_typed(nir_cf_node
, node
, node
, &if_stmt
->then_list
) {
1241 print_cf_node(node
, state
, tabs
+ 1);
1243 print_tabs(tabs
, fp
);
1244 fprintf(fp
, "} else {\n");
1245 foreach_list_typed(nir_cf_node
, node
, node
, &if_stmt
->else_list
) {
1246 print_cf_node(node
, state
, tabs
+ 1);
1248 print_tabs(tabs
, fp
);
1253 print_loop(nir_loop
*loop
, print_state
*state
, unsigned tabs
)
1255 FILE *fp
= state
->fp
;
1257 print_tabs(tabs
, fp
);
1258 fprintf(fp
, "loop {\n");
1259 foreach_list_typed(nir_cf_node
, node
, node
, &loop
->body
) {
1260 print_cf_node(node
, state
, tabs
+ 1);
1262 print_tabs(tabs
, fp
);
1267 print_cf_node(nir_cf_node
*node
, print_state
*state
, unsigned int tabs
)
1269 switch (node
->type
) {
1270 case nir_cf_node_block
:
1271 print_block(nir_cf_node_as_block(node
), state
, tabs
);
1274 case nir_cf_node_if
:
1275 print_if(nir_cf_node_as_if(node
), state
, tabs
);
1278 case nir_cf_node_loop
:
1279 print_loop(nir_cf_node_as_loop(node
), state
, tabs
);
1283 unreachable("Invalid CFG node type");
1288 print_function_impl(nir_function_impl
*impl
, print_state
*state
)
1290 FILE *fp
= state
->fp
;
1292 fprintf(fp
, "\nimpl %s ", impl
->function
->name
);
1296 nir_foreach_variable(var
, &impl
->locals
) {
1298 print_var_decl(var
, state
);
1301 foreach_list_typed(nir_register
, reg
, node
, &impl
->registers
) {
1303 print_register_decl(reg
, state
);
1306 nir_index_blocks(impl
);
1308 foreach_list_typed(nir_cf_node
, node
, node
, &impl
->body
) {
1309 print_cf_node(node
, state
, 1);
1312 fprintf(fp
, "\tblock block_%u:\n}\n\n", impl
->end_block
->index
);
1316 print_function(nir_function
*function
, print_state
*state
)
1318 FILE *fp
= state
->fp
;
1320 fprintf(fp
, "decl_function %s (%d params)", function
->name
,
1321 function
->num_params
);
1325 if (function
->impl
!= NULL
) {
1326 print_function_impl(function
->impl
, state
);
1332 init_print_state(print_state
*state
, nir_shader
*shader
, FILE *fp
)
1335 state
->shader
= shader
;
1336 state
->ht
= _mesa_pointer_hash_table_create(NULL
);
1337 state
->syms
= _mesa_set_create(NULL
, _mesa_key_hash_string
,
1338 _mesa_key_string_equal
);
1343 destroy_print_state(print_state
*state
)
1345 _mesa_hash_table_destroy(state
->ht
, NULL
);
1346 _mesa_set_destroy(state
->syms
, NULL
);
1350 nir_print_shader_annotated(nir_shader
*shader
, FILE *fp
,
1351 struct hash_table
*annotations
)
1354 init_print_state(&state
, shader
, fp
);
1356 state
.annotations
= annotations
;
1358 fprintf(fp
, "shader: %s\n", gl_shader_stage_name(shader
->info
.stage
));
1360 if (shader
->info
.name
)
1361 fprintf(fp
, "name: %s\n", shader
->info
.name
);
1363 if (shader
->info
.label
)
1364 fprintf(fp
, "label: %s\n", shader
->info
.label
);
1366 if (gl_shader_stage_is_compute(shader
->info
.stage
)) {
1367 fprintf(fp
, "local-size: %u, %u, %u%s\n",
1368 shader
->info
.cs
.local_size
[0],
1369 shader
->info
.cs
.local_size
[1],
1370 shader
->info
.cs
.local_size
[2],
1371 shader
->info
.cs
.local_size_variable
? " (variable)" : "");
1372 fprintf(fp
, "shared-size: %u\n", shader
->info
.cs
.shared_size
);
1375 fprintf(fp
, "inputs: %u\n", shader
->num_inputs
);
1376 fprintf(fp
, "outputs: %u\n", shader
->num_outputs
);
1377 fprintf(fp
, "uniforms: %u\n", shader
->num_uniforms
);
1378 fprintf(fp
, "shared: %u\n", shader
->num_shared
);
1379 if (shader
->scratch_size
)
1380 fprintf(fp
, "scratch: %u\n", shader
->scratch_size
);
1382 nir_foreach_variable(var
, &shader
->uniforms
) {
1383 print_var_decl(var
, &state
);
1386 nir_foreach_variable(var
, &shader
->inputs
) {
1387 print_var_decl(var
, &state
);
1390 nir_foreach_variable(var
, &shader
->outputs
) {
1391 print_var_decl(var
, &state
);
1394 nir_foreach_variable(var
, &shader
->shared
) {
1395 print_var_decl(var
, &state
);
1398 nir_foreach_variable(var
, &shader
->globals
) {
1399 print_var_decl(var
, &state
);
1402 nir_foreach_variable(var
, &shader
->system_values
) {
1403 print_var_decl(var
, &state
);
1406 foreach_list_typed(nir_function
, func
, node
, &shader
->functions
) {
1407 print_function(func
, &state
);
1410 destroy_print_state(&state
);
1414 nir_print_shader(nir_shader
*shader
, FILE *fp
)
1416 nir_print_shader_annotated(shader
, fp
, NULL
);
1421 nir_print_instr(const nir_instr
*instr
, FILE *fp
)
1423 print_state state
= {
1426 print_instr(instr
, &state
, 0);
1431 nir_print_deref(const nir_deref_instr
*deref
, FILE *fp
)
1433 print_state state
= {
1436 print_deref_link(deref
, true, &state
);