1 /**************************************************************************
3 * Copyright 2009-2010 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE, INC AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 #include "pipe/p_screen.h"
30 #include "pipe/p_context.h"
31 #include "pipe/p_state.h"
32 #include "tgsi/tgsi_ureg.h"
33 #include "tgsi/tgsi_build.h"
34 #include "tgsi/tgsi_info.h"
35 #include "tgsi/tgsi_dump.h"
36 #include "tgsi/tgsi_sanity.h"
37 #include "util/u_debug.h"
38 #include "util/u_inlines.h"
39 #include "util/u_memory.h"
40 #include "util/u_math.h"
41 #include "util/u_bitmask.h"
43 union tgsi_any_token
{
44 struct tgsi_header header
;
45 struct tgsi_processor processor
;
46 struct tgsi_token token
;
47 struct tgsi_property prop
;
48 struct tgsi_property_data prop_data
;
49 struct tgsi_declaration decl
;
50 struct tgsi_declaration_range decl_range
;
51 struct tgsi_declaration_dimension decl_dim
;
52 struct tgsi_declaration_interp decl_interp
;
53 struct tgsi_declaration_image decl_image
;
54 struct tgsi_declaration_semantic decl_semantic
;
55 struct tgsi_declaration_sampler_view decl_sampler_view
;
56 struct tgsi_declaration_array array
;
57 struct tgsi_immediate imm
;
58 union tgsi_immediate_data imm_data
;
59 struct tgsi_instruction insn
;
60 struct tgsi_instruction_label insn_label
;
61 struct tgsi_instruction_texture insn_texture
;
62 struct tgsi_instruction_memory insn_memory
;
63 struct tgsi_texture_offset insn_texture_offset
;
64 struct tgsi_src_register src
;
65 struct tgsi_ind_register ind
;
66 struct tgsi_dimension dim
;
67 struct tgsi_dst_register dst
;
73 union tgsi_any_token
*tokens
;
79 #define UREG_MAX_INPUT (4 * PIPE_MAX_SHADER_INPUTS)
80 #define UREG_MAX_SYSTEM_VALUE PIPE_MAX_ATTRIBS
81 #define UREG_MAX_OUTPUT (4 * PIPE_MAX_SHADER_OUTPUTS)
82 #define UREG_MAX_CONSTANT_RANGE 32
83 #define UREG_MAX_HW_ATOMIC_RANGE 32
84 #define UREG_MAX_IMMEDIATE 4096
85 #define UREG_MAX_ADDR 3
86 #define UREG_MAX_ARRAY_TEMPS 256
92 } constant_range
[UREG_MAX_CONSTANT_RANGE
];
93 unsigned nr_constant_ranges
;
96 struct hw_atomic_decl
{
101 } hw_atomic_range
[UREG_MAX_HW_ATOMIC_RANGE
];
102 unsigned nr_hw_atomic_ranges
;
105 #define DOMAIN_DECL 0
106 #define DOMAIN_INSN 1
110 enum pipe_shader_type processor
;
111 bool supports_any_inout_decl_range
;
112 int next_shader_processor
;
115 enum tgsi_semantic semantic_name
;
116 unsigned semantic_index
;
117 enum tgsi_interpolate_mode interp
;
118 unsigned char cylindrical_wrap
;
119 unsigned char usage_mask
;
120 enum tgsi_interpolate_loc interp_location
;
124 } input
[UREG_MAX_INPUT
];
125 unsigned nr_inputs
, nr_input_regs
;
127 unsigned vs_inputs
[PIPE_MAX_ATTRIBS
/32];
130 enum tgsi_semantic semantic_name
;
131 unsigned semantic_index
;
132 } system_value
[UREG_MAX_SYSTEM_VALUE
];
133 unsigned nr_system_values
;
136 enum tgsi_semantic semantic_name
;
137 unsigned semantic_index
;
139 unsigned usage_mask
; /* = TGSI_WRITEMASK_* */
144 } output
[UREG_MAX_OUTPUT
];
145 unsigned nr_outputs
, nr_output_regs
;
155 } immediate
[UREG_MAX_IMMEDIATE
];
156 unsigned nr_immediates
;
158 struct ureg_src sampler
[PIPE_MAX_SAMPLERS
];
159 unsigned nr_samplers
;
163 enum tgsi_texture_type target
;
164 enum tgsi_return_type return_type_x
;
165 enum tgsi_return_type return_type_y
;
166 enum tgsi_return_type return_type_z
;
167 enum tgsi_return_type return_type_w
;
168 } sampler_view
[PIPE_MAX_SHADER_SAMPLER_VIEWS
];
169 unsigned nr_sampler_views
;
173 enum tgsi_texture_type target
;
174 enum pipe_format format
;
177 } image
[PIPE_MAX_SHADER_IMAGES
];
183 } buffer
[PIPE_MAX_SHADER_BUFFERS
];
186 struct util_bitmask
*free_temps
;
187 struct util_bitmask
*local_temps
;
188 struct util_bitmask
*decl_temps
;
191 unsigned array_temps
[UREG_MAX_ARRAY_TEMPS
];
192 unsigned nr_array_temps
;
194 struct const_decl const_decls
[PIPE_MAX_CONSTANT_BUFFERS
];
196 struct hw_atomic_decl hw_atomic_decls
[PIPE_MAX_HW_ATOMIC_BUFFERS
];
198 unsigned properties
[TGSI_PROPERTY_COUNT
];
201 unsigned nr_instructions
;
203 struct ureg_tokens domain
[2];
205 bool use_memory
[TGSI_MEMORY_TYPE_COUNT
];
208 static union tgsi_any_token error_tokens
[32];
210 static void tokens_error( struct ureg_tokens
*tokens
)
212 if (tokens
->tokens
&& tokens
->tokens
!= error_tokens
)
213 FREE(tokens
->tokens
);
215 tokens
->tokens
= error_tokens
;
216 tokens
->size
= ARRAY_SIZE(error_tokens
);
221 static void tokens_expand( struct ureg_tokens
*tokens
,
224 unsigned old_size
= tokens
->size
* sizeof(unsigned);
226 if (tokens
->tokens
== error_tokens
) {
230 while (tokens
->count
+ count
> tokens
->size
) {
231 tokens
->size
= (1 << ++tokens
->order
);
234 tokens
->tokens
= REALLOC(tokens
->tokens
,
236 tokens
->size
* sizeof(unsigned));
237 if (tokens
->tokens
== NULL
) {
238 tokens_error(tokens
);
242 static void set_bad( struct ureg_program
*ureg
)
244 tokens_error(&ureg
->domain
[0]);
249 static union tgsi_any_token
*get_tokens( struct ureg_program
*ureg
,
253 struct ureg_tokens
*tokens
= &ureg
->domain
[domain
];
254 union tgsi_any_token
*result
;
256 if (tokens
->count
+ count
> tokens
->size
)
257 tokens_expand(tokens
, count
);
259 result
= &tokens
->tokens
[tokens
->count
];
260 tokens
->count
+= count
;
265 static union tgsi_any_token
*retrieve_token( struct ureg_program
*ureg
,
269 if (ureg
->domain
[domain
].tokens
== error_tokens
)
270 return &error_tokens
[0];
272 return &ureg
->domain
[domain
].tokens
[nr
];
277 ureg_property(struct ureg_program
*ureg
, unsigned name
, unsigned value
)
279 assert(name
< ARRAY_SIZE(ureg
->properties
));
280 ureg
->properties
[name
] = value
;
284 ureg_DECL_fs_input_cyl_centroid_layout(struct ureg_program
*ureg
,
285 enum tgsi_semantic semantic_name
,
286 unsigned semantic_index
,
287 enum tgsi_interpolate_mode interp_mode
,
288 unsigned cylindrical_wrap
,
289 enum tgsi_interpolate_loc interp_location
,
297 assert(usage_mask
!= 0);
298 assert(usage_mask
<= TGSI_WRITEMASK_XYZW
);
300 for (i
= 0; i
< ureg
->nr_inputs
; i
++) {
301 if (ureg
->input
[i
].semantic_name
== semantic_name
&&
302 ureg
->input
[i
].semantic_index
== semantic_index
) {
303 assert(ureg
->input
[i
].interp
== interp_mode
);
304 assert(ureg
->input
[i
].cylindrical_wrap
== cylindrical_wrap
);
305 assert(ureg
->input
[i
].interp_location
== interp_location
);
306 if (ureg
->input
[i
].array_id
== array_id
) {
307 ureg
->input
[i
].usage_mask
|= usage_mask
;
310 assert((ureg
->input
[i
].usage_mask
& usage_mask
) == 0);
314 if (ureg
->nr_inputs
< UREG_MAX_INPUT
) {
315 assert(array_size
>= 1);
316 ureg
->input
[i
].semantic_name
= semantic_name
;
317 ureg
->input
[i
].semantic_index
= semantic_index
;
318 ureg
->input
[i
].interp
= interp_mode
;
319 ureg
->input
[i
].cylindrical_wrap
= cylindrical_wrap
;
320 ureg
->input
[i
].interp_location
= interp_location
;
321 ureg
->input
[i
].first
= index
;
322 ureg
->input
[i
].last
= index
+ array_size
- 1;
323 ureg
->input
[i
].array_id
= array_id
;
324 ureg
->input
[i
].usage_mask
= usage_mask
;
325 ureg
->nr_input_regs
= MAX2(ureg
->nr_input_regs
, index
+ array_size
);
332 return ureg_src_array_register(TGSI_FILE_INPUT
, ureg
->input
[i
].first
,
337 ureg_DECL_fs_input_cyl_centroid(struct ureg_program
*ureg
,
338 enum tgsi_semantic semantic_name
,
339 unsigned semantic_index
,
340 enum tgsi_interpolate_mode interp_mode
,
341 unsigned cylindrical_wrap
,
342 enum tgsi_interpolate_loc interp_location
,
346 return ureg_DECL_fs_input_cyl_centroid_layout(ureg
,
347 semantic_name
, semantic_index
, interp_mode
,
348 cylindrical_wrap
, interp_location
,
349 ureg
->nr_input_regs
, TGSI_WRITEMASK_XYZW
, array_id
, array_size
);
354 ureg_DECL_vs_input( struct ureg_program
*ureg
,
357 assert(ureg
->processor
== PIPE_SHADER_VERTEX
);
358 assert(index
/ 32 < ARRAY_SIZE(ureg
->vs_inputs
));
360 ureg
->vs_inputs
[index
/32] |= 1 << (index
% 32);
361 return ureg_src_register( TGSI_FILE_INPUT
, index
);
366 ureg_DECL_input_layout(struct ureg_program
*ureg
,
367 enum tgsi_semantic semantic_name
,
368 unsigned semantic_index
,
374 return ureg_DECL_fs_input_cyl_centroid_layout(ureg
,
375 semantic_name
, semantic_index
,
376 TGSI_INTERPOLATE_CONSTANT
, 0, TGSI_INTERPOLATE_LOC_CENTER
,
377 index
, usage_mask
, array_id
, array_size
);
382 ureg_DECL_input(struct ureg_program
*ureg
,
383 enum tgsi_semantic semantic_name
,
384 unsigned semantic_index
,
388 return ureg_DECL_fs_input_cyl_centroid(ureg
, semantic_name
, semantic_index
,
389 TGSI_INTERPOLATE_CONSTANT
, 0,
390 TGSI_INTERPOLATE_LOC_CENTER
,
391 array_id
, array_size
);
396 ureg_DECL_system_value(struct ureg_program
*ureg
,
397 enum tgsi_semantic semantic_name
,
398 unsigned semantic_index
)
402 for (i
= 0; i
< ureg
->nr_system_values
; i
++) {
403 if (ureg
->system_value
[i
].semantic_name
== semantic_name
&&
404 ureg
->system_value
[i
].semantic_index
== semantic_index
) {
409 if (ureg
->nr_system_values
< UREG_MAX_SYSTEM_VALUE
) {
410 ureg
->system_value
[ureg
->nr_system_values
].semantic_name
= semantic_name
;
411 ureg
->system_value
[ureg
->nr_system_values
].semantic_index
= semantic_index
;
412 i
= ureg
->nr_system_values
;
413 ureg
->nr_system_values
++;
419 return ureg_src_register(TGSI_FILE_SYSTEM_VALUE
, i
);
424 ureg_DECL_output_layout(struct ureg_program
*ureg
,
425 enum tgsi_semantic semantic_name
,
426 unsigned semantic_index
,
436 assert(usage_mask
!= 0);
437 assert(!(streams
& 0x03) || (usage_mask
& 1));
438 assert(!(streams
& 0x0c) || (usage_mask
& 2));
439 assert(!(streams
& 0x30) || (usage_mask
& 4));
440 assert(!(streams
& 0xc0) || (usage_mask
& 8));
442 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
443 if (ureg
->output
[i
].semantic_name
== semantic_name
&&
444 ureg
->output
[i
].semantic_index
== semantic_index
) {
445 if (ureg
->output
[i
].array_id
== array_id
) {
446 ureg
->output
[i
].usage_mask
|= usage_mask
;
449 assert((ureg
->output
[i
].usage_mask
& usage_mask
) == 0);
453 if (ureg
->nr_outputs
< UREG_MAX_OUTPUT
) {
454 ureg
->output
[i
].semantic_name
= semantic_name
;
455 ureg
->output
[i
].semantic_index
= semantic_index
;
456 ureg
->output
[i
].usage_mask
= usage_mask
;
457 ureg
->output
[i
].first
= index
;
458 ureg
->output
[i
].last
= index
+ array_size
- 1;
459 ureg
->output
[i
].array_id
= array_id
;
460 ureg
->output
[i
].invariant
= invariant
;
461 ureg
->nr_output_regs
= MAX2(ureg
->nr_output_regs
, index
+ array_size
);
470 ureg
->output
[i
].streams
|= streams
;
472 return ureg_dst_array_register(TGSI_FILE_OUTPUT
, ureg
->output
[i
].first
,
478 ureg_DECL_output_masked(struct ureg_program
*ureg
,
485 return ureg_DECL_output_layout(ureg
, name
, index
, 0,
486 ureg
->nr_output_regs
, usage_mask
, array_id
,
492 ureg_DECL_output(struct ureg_program
*ureg
,
493 enum tgsi_semantic name
,
496 return ureg_DECL_output_masked(ureg
, name
, index
, TGSI_WRITEMASK_XYZW
,
501 ureg_DECL_output_array(struct ureg_program
*ureg
,
502 enum tgsi_semantic semantic_name
,
503 unsigned semantic_index
,
507 return ureg_DECL_output_masked(ureg
, semantic_name
, semantic_index
,
509 array_id
, array_size
);
513 /* Returns a new constant register. Keep track of which have been
514 * referred to so that we can emit decls later.
516 * Constant operands declared with this function must be addressed
517 * with a two-dimensional index.
519 * There is nothing in this code to bind this constant to any tracked
520 * value or manage any constant_buffer contents -- that's the
521 * responsibility of the calling code.
524 ureg_DECL_constant2D(struct ureg_program
*ureg
,
529 struct const_decl
*decl
= &ureg
->const_decls
[index2D
];
531 assert(index2D
< PIPE_MAX_CONSTANT_BUFFERS
);
533 if (decl
->nr_constant_ranges
< UREG_MAX_CONSTANT_RANGE
) {
534 uint i
= decl
->nr_constant_ranges
++;
536 decl
->constant_range
[i
].first
= first
;
537 decl
->constant_range
[i
].last
= last
;
542 /* A one-dimensional, deprecated version of ureg_DECL_constant2D().
544 * Constant operands declared with this function must be addressed
545 * with a one-dimensional index.
548 ureg_DECL_constant(struct ureg_program
*ureg
,
551 struct const_decl
*decl
= &ureg
->const_decls
[0];
552 unsigned minconst
= index
, maxconst
= index
;
555 /* Inside existing range?
557 for (i
= 0; i
< decl
->nr_constant_ranges
; i
++) {
558 if (decl
->constant_range
[i
].first
<= index
&&
559 decl
->constant_range
[i
].last
>= index
) {
564 /* Extend existing range?
566 for (i
= 0; i
< decl
->nr_constant_ranges
; i
++) {
567 if (decl
->constant_range
[i
].last
== index
- 1) {
568 decl
->constant_range
[i
].last
= index
;
572 if (decl
->constant_range
[i
].first
== index
+ 1) {
573 decl
->constant_range
[i
].first
= index
;
577 minconst
= MIN2(minconst
, decl
->constant_range
[i
].first
);
578 maxconst
= MAX2(maxconst
, decl
->constant_range
[i
].last
);
583 if (decl
->nr_constant_ranges
< UREG_MAX_CONSTANT_RANGE
) {
584 i
= decl
->nr_constant_ranges
++;
585 decl
->constant_range
[i
].first
= index
;
586 decl
->constant_range
[i
].last
= index
;
590 /* Collapse all ranges down to one:
593 decl
->constant_range
[0].first
= minconst
;
594 decl
->constant_range
[0].last
= maxconst
;
595 decl
->nr_constant_ranges
= 1;
598 assert(i
< decl
->nr_constant_ranges
);
599 assert(decl
->constant_range
[i
].first
<= index
);
600 assert(decl
->constant_range
[i
].last
>= index
);
602 struct ureg_src src
= ureg_src_register(TGSI_FILE_CONSTANT
, index
);
603 return ureg_src_dimension(src
, 0);
607 /* Returns a new hw atomic register. Keep track of which have been
608 * referred to so that we can emit decls later.
611 ureg_DECL_hw_atomic(struct ureg_program
*ureg
,
617 struct hw_atomic_decl
*decl
= &ureg
->hw_atomic_decls
[buffer_id
];
619 if (decl
->nr_hw_atomic_ranges
< UREG_MAX_HW_ATOMIC_RANGE
) {
620 uint i
= decl
->nr_hw_atomic_ranges
++;
622 decl
->hw_atomic_range
[i
].first
= first
;
623 decl
->hw_atomic_range
[i
].last
= last
;
624 decl
->hw_atomic_range
[i
].array_id
= array_id
;
630 static struct ureg_dst
alloc_temporary( struct ureg_program
*ureg
,
635 /* Look for a released temporary.
637 for (i
= util_bitmask_get_first_index(ureg
->free_temps
);
638 i
!= UTIL_BITMASK_INVALID_INDEX
;
639 i
= util_bitmask_get_next_index(ureg
->free_temps
, i
+ 1)) {
640 if (util_bitmask_get(ureg
->local_temps
, i
) == local
)
644 /* Or allocate a new one.
646 if (i
== UTIL_BITMASK_INVALID_INDEX
) {
647 i
= ureg
->nr_temps
++;
650 util_bitmask_set(ureg
->local_temps
, i
);
652 /* Start a new declaration when the local flag changes */
653 if (!i
|| util_bitmask_get(ureg
->local_temps
, i
- 1) != local
)
654 util_bitmask_set(ureg
->decl_temps
, i
);
657 util_bitmask_clear(ureg
->free_temps
, i
);
659 return ureg_dst_register( TGSI_FILE_TEMPORARY
, i
);
662 struct ureg_dst
ureg_DECL_temporary( struct ureg_program
*ureg
)
664 return alloc_temporary(ureg
, FALSE
);
667 struct ureg_dst
ureg_DECL_local_temporary( struct ureg_program
*ureg
)
669 return alloc_temporary(ureg
, TRUE
);
672 struct ureg_dst
ureg_DECL_array_temporary( struct ureg_program
*ureg
,
676 unsigned i
= ureg
->nr_temps
;
677 struct ureg_dst dst
= ureg_dst_register( TGSI_FILE_TEMPORARY
, i
);
680 util_bitmask_set(ureg
->local_temps
, i
);
682 /* Always start a new declaration at the start */
683 util_bitmask_set(ureg
->decl_temps
, i
);
685 ureg
->nr_temps
+= size
;
687 /* and also at the end of the array */
688 util_bitmask_set(ureg
->decl_temps
, ureg
->nr_temps
);
690 if (ureg
->nr_array_temps
< UREG_MAX_ARRAY_TEMPS
) {
691 ureg
->array_temps
[ureg
->nr_array_temps
++] = i
;
692 dst
.ArrayID
= ureg
->nr_array_temps
;
698 void ureg_release_temporary( struct ureg_program
*ureg
,
699 struct ureg_dst tmp
)
701 if(tmp
.File
== TGSI_FILE_TEMPORARY
)
702 util_bitmask_set(ureg
->free_temps
, tmp
.Index
);
706 /* Allocate a new address register.
708 struct ureg_dst
ureg_DECL_address( struct ureg_program
*ureg
)
710 if (ureg
->nr_addrs
< UREG_MAX_ADDR
)
711 return ureg_dst_register( TGSI_FILE_ADDRESS
, ureg
->nr_addrs
++ );
714 return ureg_dst_register( TGSI_FILE_ADDRESS
, 0 );
717 /* Allocate a new sampler.
719 struct ureg_src
ureg_DECL_sampler( struct ureg_program
*ureg
,
724 for (i
= 0; i
< ureg
->nr_samplers
; i
++)
725 if (ureg
->sampler
[i
].Index
== (int)nr
)
726 return ureg
->sampler
[i
];
728 if (i
< PIPE_MAX_SAMPLERS
) {
729 ureg
->sampler
[i
] = ureg_src_register( TGSI_FILE_SAMPLER
, nr
);
731 return ureg
->sampler
[i
];
735 return ureg
->sampler
[0];
739 * Allocate a new shader sampler view.
742 ureg_DECL_sampler_view(struct ureg_program
*ureg
,
744 enum tgsi_texture_type target
,
745 enum tgsi_return_type return_type_x
,
746 enum tgsi_return_type return_type_y
,
747 enum tgsi_return_type return_type_z
,
748 enum tgsi_return_type return_type_w
)
750 struct ureg_src reg
= ureg_src_register(TGSI_FILE_SAMPLER_VIEW
, index
);
753 for (i
= 0; i
< ureg
->nr_sampler_views
; i
++) {
754 if (ureg
->sampler_view
[i
].index
== index
) {
759 if (i
< PIPE_MAX_SHADER_SAMPLER_VIEWS
) {
760 ureg
->sampler_view
[i
].index
= index
;
761 ureg
->sampler_view
[i
].target
= target
;
762 ureg
->sampler_view
[i
].return_type_x
= return_type_x
;
763 ureg
->sampler_view
[i
].return_type_y
= return_type_y
;
764 ureg
->sampler_view
[i
].return_type_z
= return_type_z
;
765 ureg
->sampler_view
[i
].return_type_w
= return_type_w
;
766 ureg
->nr_sampler_views
++;
774 /* Allocate a new image.
777 ureg_DECL_image(struct ureg_program
*ureg
,
779 enum tgsi_texture_type target
,
780 enum pipe_format format
,
784 struct ureg_src reg
= ureg_src_register(TGSI_FILE_IMAGE
, index
);
787 for (i
= 0; i
< ureg
->nr_images
; i
++)
788 if (ureg
->image
[i
].index
== index
)
791 if (i
< PIPE_MAX_SHADER_IMAGES
) {
792 ureg
->image
[i
].index
= index
;
793 ureg
->image
[i
].target
= target
;
794 ureg
->image
[i
].wr
= wr
;
795 ureg
->image
[i
].raw
= raw
;
796 ureg
->image
[i
].format
= format
;
805 /* Allocate a new buffer.
807 struct ureg_src
ureg_DECL_buffer(struct ureg_program
*ureg
, unsigned nr
,
810 struct ureg_src reg
= ureg_src_register(TGSI_FILE_BUFFER
, nr
);
813 for (i
= 0; i
< ureg
->nr_buffers
; i
++)
814 if (ureg
->buffer
[i
].index
== nr
)
817 if (i
< PIPE_MAX_SHADER_BUFFERS
) {
818 ureg
->buffer
[i
].index
= nr
;
819 ureg
->buffer
[i
].atomic
= atomic
;
828 /* Allocate a memory area.
830 struct ureg_src
ureg_DECL_memory(struct ureg_program
*ureg
,
831 unsigned memory_type
)
833 struct ureg_src reg
= ureg_src_register(TGSI_FILE_MEMORY
, memory_type
);
835 ureg
->use_memory
[memory_type
] = true;
840 match_or_expand_immediate64( const unsigned *v
,
846 unsigned nr2
= *pnr2
;
850 for (i
= 0; i
< nr
; i
+= 2) {
851 boolean found
= FALSE
;
853 for (j
= 0; j
< nr2
&& !found
; j
+= 2) {
854 if (v
[i
] == v2
[j
] && v
[i
+ 1] == v2
[j
+ 1]) {
855 *swizzle
|= (j
<< (i
* 2)) | ((j
+ 1) << ((i
+ 1) * 2));
865 v2
[nr2
+ 1] = v
[i
+ 1];
867 *swizzle
|= (nr2
<< (i
* 2)) | ((nr2
+ 1) << ((i
+ 1) * 2));
872 /* Actually expand immediate only when fully succeeded.
879 match_or_expand_immediate( const unsigned *v
,
886 unsigned nr2
= *pnr2
;
889 if (type
== TGSI_IMM_FLOAT64
||
890 type
== TGSI_IMM_UINT64
||
891 type
== TGSI_IMM_INT64
)
892 return match_or_expand_immediate64(v
, nr
, v2
, pnr2
, swizzle
);
896 for (i
= 0; i
< nr
; i
++) {
897 boolean found
= FALSE
;
899 for (j
= 0; j
< nr2
&& !found
; j
++) {
901 *swizzle
|= j
<< (i
* 2);
912 *swizzle
|= nr2
<< (i
* 2);
917 /* Actually expand immediate only when fully succeeded.
924 static struct ureg_src
925 decl_immediate( struct ureg_program
*ureg
,
931 unsigned swizzle
= 0;
933 /* Could do a first pass where we examine all existing immediates
937 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
938 if (ureg
->immediate
[i
].type
!= type
) {
941 if (match_or_expand_immediate(v
,
944 ureg
->immediate
[i
].value
.u
,
945 &ureg
->immediate
[i
].nr
,
951 if (ureg
->nr_immediates
< UREG_MAX_IMMEDIATE
) {
952 i
= ureg
->nr_immediates
++;
953 ureg
->immediate
[i
].type
= type
;
954 if (match_or_expand_immediate(v
,
957 ureg
->immediate
[i
].value
.u
,
958 &ureg
->immediate
[i
].nr
,
967 /* Make sure that all referenced elements are from this immediate.
968 * Has the effect of making size-one immediates into scalars.
970 if (type
== TGSI_IMM_FLOAT64
||
971 type
== TGSI_IMM_UINT64
||
972 type
== TGSI_IMM_INT64
) {
973 for (j
= nr
; j
< 4; j
+=2) {
974 swizzle
|= (swizzle
& 0xf) << (j
* 2);
977 for (j
= nr
; j
< 4; j
++) {
978 swizzle
|= (swizzle
& 0x3) << (j
* 2);
981 return ureg_swizzle(ureg_src_register(TGSI_FILE_IMMEDIATE
, i
),
982 (swizzle
>> 0) & 0x3,
983 (swizzle
>> 2) & 0x3,
984 (swizzle
>> 4) & 0x3,
985 (swizzle
>> 6) & 0x3);
990 ureg_DECL_immediate( struct ureg_program
*ureg
,
1000 for (i
= 0; i
< nr
; i
++) {
1004 return decl_immediate(ureg
, fu
.u
, nr
, TGSI_IMM_FLOAT32
);
1008 ureg_DECL_immediate_f64( struct ureg_program
*ureg
,
1018 assert((nr
/ 2) < 3);
1019 for (i
= 0; i
< nr
/ 2; i
++) {
1023 return decl_immediate(ureg
, fu
.u
, nr
, TGSI_IMM_FLOAT64
);
1027 ureg_DECL_immediate_uint( struct ureg_program
*ureg
,
1031 return decl_immediate(ureg
, v
, nr
, TGSI_IMM_UINT32
);
1036 ureg_DECL_immediate_block_uint( struct ureg_program
*ureg
,
1043 if (ureg
->nr_immediates
+ (nr
+ 3) / 4 > UREG_MAX_IMMEDIATE
) {
1045 return ureg_src_register(TGSI_FILE_IMMEDIATE
, 0);
1048 index
= ureg
->nr_immediates
;
1049 ureg
->nr_immediates
+= (nr
+ 3) / 4;
1051 for (i
= index
; i
< ureg
->nr_immediates
; i
++) {
1052 ureg
->immediate
[i
].type
= TGSI_IMM_UINT32
;
1053 ureg
->immediate
[i
].nr
= nr
> 4 ? 4 : nr
;
1054 memcpy(ureg
->immediate
[i
].value
.u
,
1055 &v
[(i
- index
) * 4],
1056 ureg
->immediate
[i
].nr
* sizeof(uint
));
1060 return ureg_src_register(TGSI_FILE_IMMEDIATE
, index
);
1065 ureg_DECL_immediate_int( struct ureg_program
*ureg
,
1069 return decl_immediate(ureg
, (const unsigned *)v
, nr
, TGSI_IMM_INT32
);
1073 ureg_DECL_immediate_uint64( struct ureg_program
*ureg
,
1083 assert((nr
/ 2) < 3);
1084 for (i
= 0; i
< nr
/ 2; i
++) {
1088 return decl_immediate(ureg
, fu
.u
, nr
, TGSI_IMM_UINT64
);
1092 ureg_DECL_immediate_int64( struct ureg_program
*ureg
,
1102 assert((nr
/ 2) < 3);
1103 for (i
= 0; i
< nr
/ 2; i
++) {
1107 return decl_immediate(ureg
, fu
.u
, nr
, TGSI_IMM_INT64
);
1111 ureg_emit_src( struct ureg_program
*ureg
,
1112 struct ureg_src src
)
1114 unsigned size
= 1 + (src
.Indirect
? 1 : 0) +
1115 (src
.Dimension
? (src
.DimIndirect
? 2 : 1) : 0);
1117 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
1120 assert(src
.File
!= TGSI_FILE_NULL
);
1121 assert(src
.File
< TGSI_FILE_COUNT
);
1124 out
[n
].src
.File
= src
.File
;
1125 out
[n
].src
.SwizzleX
= src
.SwizzleX
;
1126 out
[n
].src
.SwizzleY
= src
.SwizzleY
;
1127 out
[n
].src
.SwizzleZ
= src
.SwizzleZ
;
1128 out
[n
].src
.SwizzleW
= src
.SwizzleW
;
1129 out
[n
].src
.Index
= src
.Index
;
1130 out
[n
].src
.Negate
= src
.Negate
;
1131 out
[0].src
.Absolute
= src
.Absolute
;
1135 out
[0].src
.Indirect
= 1;
1137 out
[n
].ind
.File
= src
.IndirectFile
;
1138 out
[n
].ind
.Swizzle
= src
.IndirectSwizzle
;
1139 out
[n
].ind
.Index
= src
.IndirectIndex
;
1140 if (!ureg
->supports_any_inout_decl_range
&&
1141 (src
.File
== TGSI_FILE_INPUT
|| src
.File
== TGSI_FILE_OUTPUT
))
1142 out
[n
].ind
.ArrayID
= 0;
1144 out
[n
].ind
.ArrayID
= src
.ArrayID
;
1148 if (src
.Dimension
) {
1149 out
[0].src
.Dimension
= 1;
1150 out
[n
].dim
.Dimension
= 0;
1151 out
[n
].dim
.Padding
= 0;
1152 if (src
.DimIndirect
) {
1153 out
[n
].dim
.Indirect
= 1;
1154 out
[n
].dim
.Index
= src
.DimensionIndex
;
1157 out
[n
].ind
.File
= src
.DimIndFile
;
1158 out
[n
].ind
.Swizzle
= src
.DimIndSwizzle
;
1159 out
[n
].ind
.Index
= src
.DimIndIndex
;
1160 if (!ureg
->supports_any_inout_decl_range
&&
1161 (src
.File
== TGSI_FILE_INPUT
|| src
.File
== TGSI_FILE_OUTPUT
))
1162 out
[n
].ind
.ArrayID
= 0;
1164 out
[n
].ind
.ArrayID
= src
.ArrayID
;
1166 out
[n
].dim
.Indirect
= 0;
1167 out
[n
].dim
.Index
= src
.DimensionIndex
;
1177 ureg_emit_dst( struct ureg_program
*ureg
,
1178 struct ureg_dst dst
)
1180 unsigned size
= 1 + (dst
.Indirect
? 1 : 0) +
1181 (dst
.Dimension
? (dst
.DimIndirect
? 2 : 1) : 0);
1183 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
1186 assert(dst
.File
!= TGSI_FILE_NULL
);
1187 assert(dst
.File
!= TGSI_FILE_SAMPLER
);
1188 assert(dst
.File
!= TGSI_FILE_SAMPLER_VIEW
);
1189 assert(dst
.File
!= TGSI_FILE_IMMEDIATE
);
1190 assert(dst
.File
< TGSI_FILE_COUNT
);
1193 out
[n
].dst
.File
= dst
.File
;
1194 out
[n
].dst
.WriteMask
= dst
.WriteMask
;
1195 out
[n
].dst
.Indirect
= dst
.Indirect
;
1196 out
[n
].dst
.Index
= dst
.Index
;
1201 out
[n
].ind
.File
= dst
.IndirectFile
;
1202 out
[n
].ind
.Swizzle
= dst
.IndirectSwizzle
;
1203 out
[n
].ind
.Index
= dst
.IndirectIndex
;
1204 if (!ureg
->supports_any_inout_decl_range
&&
1205 (dst
.File
== TGSI_FILE_INPUT
|| dst
.File
== TGSI_FILE_OUTPUT
))
1206 out
[n
].ind
.ArrayID
= 0;
1208 out
[n
].ind
.ArrayID
= dst
.ArrayID
;
1212 if (dst
.Dimension
) {
1213 out
[0].dst
.Dimension
= 1;
1214 out
[n
].dim
.Dimension
= 0;
1215 out
[n
].dim
.Padding
= 0;
1216 if (dst
.DimIndirect
) {
1217 out
[n
].dim
.Indirect
= 1;
1218 out
[n
].dim
.Index
= dst
.DimensionIndex
;
1221 out
[n
].ind
.File
= dst
.DimIndFile
;
1222 out
[n
].ind
.Swizzle
= dst
.DimIndSwizzle
;
1223 out
[n
].ind
.Index
= dst
.DimIndIndex
;
1224 if (!ureg
->supports_any_inout_decl_range
&&
1225 (dst
.File
== TGSI_FILE_INPUT
|| dst
.File
== TGSI_FILE_OUTPUT
))
1226 out
[n
].ind
.ArrayID
= 0;
1228 out
[n
].ind
.ArrayID
= dst
.ArrayID
;
1230 out
[n
].dim
.Indirect
= 0;
1231 out
[n
].dim
.Index
= dst
.DimensionIndex
;
1240 static void validate( enum tgsi_opcode opcode
,
1245 const struct tgsi_opcode_info
*info
= tgsi_get_opcode_info( opcode
);
1248 assert(nr_dst
== info
->num_dst
);
1249 assert(nr_src
== info
->num_src
);
1254 struct ureg_emit_insn_result
1255 ureg_emit_insn(struct ureg_program
*ureg
,
1256 enum tgsi_opcode opcode
,
1262 union tgsi_any_token
*out
;
1264 struct ureg_emit_insn_result result
;
1266 validate( opcode
, num_dst
, num_src
);
1268 out
= get_tokens( ureg
, DOMAIN_INSN
, count
);
1269 out
[0].insn
= tgsi_default_instruction();
1270 out
[0].insn
.Opcode
= opcode
;
1271 out
[0].insn
.Saturate
= saturate
;
1272 out
[0].insn
.Precise
= precise
;
1273 out
[0].insn
.NumDstRegs
= num_dst
;
1274 out
[0].insn
.NumSrcRegs
= num_src
;
1276 result
.insn_token
= ureg
->domain
[DOMAIN_INSN
].count
- count
;
1277 result
.extended_token
= result
.insn_token
;
1279 ureg
->nr_instructions
++;
1286 * Emit a label token.
1287 * \param label_token returns a token number indicating where the label
1288 * needs to be patched later. Later, this value should be passed to the
1289 * ureg_fixup_label() function.
1292 ureg_emit_label(struct ureg_program
*ureg
,
1293 unsigned extended_token
,
1294 unsigned *label_token
)
1296 union tgsi_any_token
*out
, *insn
;
1301 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
1304 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
1305 insn
->insn
.Label
= 1;
1307 *label_token
= ureg
->domain
[DOMAIN_INSN
].count
- 1;
1310 /* Will return a number which can be used in a label to point to the
1311 * next instruction to be emitted.
1314 ureg_get_instruction_number( struct ureg_program
*ureg
)
1316 return ureg
->nr_instructions
;
1319 /* Patch a given label (expressed as a token number) to point to a
1320 * given instruction (expressed as an instruction number).
1323 ureg_fixup_label(struct ureg_program
*ureg
,
1324 unsigned label_token
,
1325 unsigned instruction_number
)
1327 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, label_token
);
1329 out
->insn_label
.Label
= instruction_number
;
1334 ureg_emit_texture(struct ureg_program
*ureg
,
1335 unsigned extended_token
,
1336 enum tgsi_texture_type target
,
1337 enum tgsi_return_type return_type
, unsigned num_offsets
)
1339 union tgsi_any_token
*out
, *insn
;
1341 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
1342 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
1344 insn
->insn
.Texture
= 1;
1347 out
[0].insn_texture
.Texture
= target
;
1348 out
[0].insn_texture
.NumOffsets
= num_offsets
;
1349 out
[0].insn_texture
.ReturnType
= return_type
;
1353 ureg_emit_texture_offset(struct ureg_program
*ureg
,
1354 const struct tgsi_texture_offset
*offset
)
1356 union tgsi_any_token
*out
;
1358 out
= get_tokens( ureg
, DOMAIN_INSN
, 1);
1361 out
[0].insn_texture_offset
= *offset
;
1365 ureg_emit_memory(struct ureg_program
*ureg
,
1366 unsigned extended_token
,
1368 enum tgsi_texture_type texture
,
1369 enum pipe_format format
)
1371 union tgsi_any_token
*out
, *insn
;
1373 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
1374 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
1376 insn
->insn
.Memory
= 1;
1379 out
[0].insn_memory
.Qualifier
= qualifier
;
1380 out
[0].insn_memory
.Texture
= texture
;
1381 out
[0].insn_memory
.Format
= format
;
1385 ureg_fixup_insn_size(struct ureg_program
*ureg
,
1388 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, insn
);
1390 assert(out
->insn
.Type
== TGSI_TOKEN_TYPE_INSTRUCTION
);
1391 out
->insn
.NrTokens
= ureg
->domain
[DOMAIN_INSN
].count
- insn
- 1;
1396 ureg_insn(struct ureg_program
*ureg
,
1397 enum tgsi_opcode opcode
,
1398 const struct ureg_dst
*dst
,
1400 const struct ureg_src
*src
,
1404 struct ureg_emit_insn_result insn
;
1408 if (nr_dst
&& ureg_dst_is_empty(dst
[0])) {
1412 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
1414 insn
= ureg_emit_insn(ureg
,
1421 for (i
= 0; i
< nr_dst
; i
++)
1422 ureg_emit_dst( ureg
, dst
[i
] );
1424 for (i
= 0; i
< nr_src
; i
++)
1425 ureg_emit_src( ureg
, src
[i
] );
1427 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
1431 ureg_tex_insn(struct ureg_program
*ureg
,
1432 enum tgsi_opcode opcode
,
1433 const struct ureg_dst
*dst
,
1435 enum tgsi_texture_type target
,
1436 enum tgsi_return_type return_type
,
1437 const struct tgsi_texture_offset
*texoffsets
,
1439 const struct ureg_src
*src
,
1442 struct ureg_emit_insn_result insn
;
1446 if (nr_dst
&& ureg_dst_is_empty(dst
[0])) {
1450 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
1452 insn
= ureg_emit_insn(ureg
,
1459 ureg_emit_texture( ureg
, insn
.extended_token
, target
, return_type
,
1462 for (i
= 0; i
< nr_offset
; i
++)
1463 ureg_emit_texture_offset( ureg
, &texoffsets
[i
]);
1465 for (i
= 0; i
< nr_dst
; i
++)
1466 ureg_emit_dst( ureg
, dst
[i
] );
1468 for (i
= 0; i
< nr_src
; i
++)
1469 ureg_emit_src( ureg
, src
[i
] );
1471 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
1476 ureg_memory_insn(struct ureg_program
*ureg
,
1477 enum tgsi_opcode opcode
,
1478 const struct ureg_dst
*dst
,
1480 const struct ureg_src
*src
,
1483 enum tgsi_texture_type texture
,
1484 enum pipe_format format
)
1486 struct ureg_emit_insn_result insn
;
1489 insn
= ureg_emit_insn(ureg
,
1496 ureg_emit_memory(ureg
, insn
.extended_token
, qualifier
, texture
, format
);
1498 for (i
= 0; i
< nr_dst
; i
++)
1499 ureg_emit_dst(ureg
, dst
[i
]);
1501 for (i
= 0; i
< nr_src
; i
++)
1502 ureg_emit_src(ureg
, src
[i
]);
1504 ureg_fixup_insn_size(ureg
, insn
.insn_token
);
1509 emit_decl_semantic(struct ureg_program
*ureg
,
1513 enum tgsi_semantic semantic_name
,
1514 unsigned semantic_index
,
1516 unsigned usage_mask
,
1520 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, array_id
? 4 : 3);
1523 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1524 out
[0].decl
.NrTokens
= 3;
1525 out
[0].decl
.File
= file
;
1526 out
[0].decl
.UsageMask
= usage_mask
;
1527 out
[0].decl
.Semantic
= 1;
1528 out
[0].decl
.Array
= array_id
!= 0;
1529 out
[0].decl
.Invariant
= invariant
;
1532 out
[1].decl_range
.First
= first
;
1533 out
[1].decl_range
.Last
= last
;
1536 out
[2].decl_semantic
.Name
= semantic_name
;
1537 out
[2].decl_semantic
.Index
= semantic_index
;
1538 out
[2].decl_semantic
.StreamX
= streams
& 3;
1539 out
[2].decl_semantic
.StreamY
= (streams
>> 2) & 3;
1540 out
[2].decl_semantic
.StreamZ
= (streams
>> 4) & 3;
1541 out
[2].decl_semantic
.StreamW
= (streams
>> 6) & 3;
1545 out
[3].array
.ArrayID
= array_id
;
1550 emit_decl_atomic_2d(struct ureg_program
*ureg
,
1556 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, array_id
? 4 : 3);
1559 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1560 out
[0].decl
.NrTokens
= 3;
1561 out
[0].decl
.File
= TGSI_FILE_HW_ATOMIC
;
1562 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1563 out
[0].decl
.Dimension
= 1;
1564 out
[0].decl
.Array
= array_id
!= 0;
1567 out
[1].decl_range
.First
= first
;
1568 out
[1].decl_range
.Last
= last
;
1571 out
[2].decl_dim
.Index2D
= index2D
;
1575 out
[3].array
.ArrayID
= array_id
;
1580 emit_decl_fs(struct ureg_program
*ureg
,
1584 enum tgsi_semantic semantic_name
,
1585 unsigned semantic_index
,
1586 enum tgsi_interpolate_mode interpolate
,
1587 unsigned cylindrical_wrap
,
1588 enum tgsi_interpolate_loc interpolate_location
,
1590 unsigned usage_mask
)
1592 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
,
1596 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1597 out
[0].decl
.NrTokens
= 4;
1598 out
[0].decl
.File
= file
;
1599 out
[0].decl
.UsageMask
= usage_mask
;
1600 out
[0].decl
.Interpolate
= 1;
1601 out
[0].decl
.Semantic
= 1;
1602 out
[0].decl
.Array
= array_id
!= 0;
1605 out
[1].decl_range
.First
= first
;
1606 out
[1].decl_range
.Last
= last
;
1609 out
[2].decl_interp
.Interpolate
= interpolate
;
1610 out
[2].decl_interp
.CylindricalWrap
= cylindrical_wrap
;
1611 out
[2].decl_interp
.Location
= interpolate_location
;
1614 out
[3].decl_semantic
.Name
= semantic_name
;
1615 out
[3].decl_semantic
.Index
= semantic_index
;
1619 out
[4].array
.ArrayID
= array_id
;
1624 emit_decl_temps( struct ureg_program
*ureg
,
1625 unsigned first
, unsigned last
,
1629 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
,
1633 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1634 out
[0].decl
.NrTokens
= 2;
1635 out
[0].decl
.File
= TGSI_FILE_TEMPORARY
;
1636 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1637 out
[0].decl
.Local
= local
;
1640 out
[1].decl_range
.First
= first
;
1641 out
[1].decl_range
.Last
= last
;
1644 out
[0].decl
.Array
= 1;
1646 out
[2].array
.ArrayID
= arrayid
;
1650 static void emit_decl_range( struct ureg_program
*ureg
,
1655 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 2 );
1658 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1659 out
[0].decl
.NrTokens
= 2;
1660 out
[0].decl
.File
= file
;
1661 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1662 out
[0].decl
.Semantic
= 0;
1665 out
[1].decl_range
.First
= first
;
1666 out
[1].decl_range
.Last
= first
+ count
- 1;
1670 emit_decl_range2D(struct ureg_program
*ureg
,
1676 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 3);
1679 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1680 out
[0].decl
.NrTokens
= 3;
1681 out
[0].decl
.File
= file
;
1682 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1683 out
[0].decl
.Dimension
= 1;
1686 out
[1].decl_range
.First
= first
;
1687 out
[1].decl_range
.Last
= last
;
1690 out
[2].decl_dim
.Index2D
= index2D
;
1694 emit_decl_sampler_view(struct ureg_program
*ureg
,
1696 enum tgsi_texture_type target
,
1697 enum tgsi_return_type return_type_x
,
1698 enum tgsi_return_type return_type_y
,
1699 enum tgsi_return_type return_type_z
,
1700 enum tgsi_return_type return_type_w
)
1702 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 3);
1705 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1706 out
[0].decl
.NrTokens
= 3;
1707 out
[0].decl
.File
= TGSI_FILE_SAMPLER_VIEW
;
1708 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1711 out
[1].decl_range
.First
= index
;
1712 out
[1].decl_range
.Last
= index
;
1715 out
[2].decl_sampler_view
.Resource
= target
;
1716 out
[2].decl_sampler_view
.ReturnTypeX
= return_type_x
;
1717 out
[2].decl_sampler_view
.ReturnTypeY
= return_type_y
;
1718 out
[2].decl_sampler_view
.ReturnTypeZ
= return_type_z
;
1719 out
[2].decl_sampler_view
.ReturnTypeW
= return_type_w
;
1723 emit_decl_image(struct ureg_program
*ureg
,
1725 enum tgsi_texture_type target
,
1726 enum pipe_format format
,
1730 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 3);
1733 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1734 out
[0].decl
.NrTokens
= 3;
1735 out
[0].decl
.File
= TGSI_FILE_IMAGE
;
1736 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1739 out
[1].decl_range
.First
= index
;
1740 out
[1].decl_range
.Last
= index
;
1743 out
[2].decl_image
.Resource
= target
;
1744 out
[2].decl_image
.Writable
= wr
;
1745 out
[2].decl_image
.Raw
= raw
;
1746 out
[2].decl_image
.Format
= format
;
1750 emit_decl_buffer(struct ureg_program
*ureg
,
1754 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 2);
1757 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1758 out
[0].decl
.NrTokens
= 2;
1759 out
[0].decl
.File
= TGSI_FILE_BUFFER
;
1760 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1761 out
[0].decl
.Atomic
= atomic
;
1764 out
[1].decl_range
.First
= index
;
1765 out
[1].decl_range
.Last
= index
;
1769 emit_decl_memory(struct ureg_program
*ureg
, unsigned memory_type
)
1771 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 2);
1774 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1775 out
[0].decl
.NrTokens
= 2;
1776 out
[0].decl
.File
= TGSI_FILE_MEMORY
;
1777 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1778 out
[0].decl
.MemType
= memory_type
;
1781 out
[1].decl_range
.First
= memory_type
;
1782 out
[1].decl_range
.Last
= memory_type
;
1786 emit_immediate( struct ureg_program
*ureg
,
1790 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 5 );
1793 out
[0].imm
.Type
= TGSI_TOKEN_TYPE_IMMEDIATE
;
1794 out
[0].imm
.NrTokens
= 5;
1795 out
[0].imm
.DataType
= type
;
1796 out
[0].imm
.Padding
= 0;
1798 out
[1].imm_data
.Uint
= v
[0];
1799 out
[2].imm_data
.Uint
= v
[1];
1800 out
[3].imm_data
.Uint
= v
[2];
1801 out
[4].imm_data
.Uint
= v
[3];
1805 emit_property(struct ureg_program
*ureg
,
1809 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 2);
1812 out
[0].prop
.Type
= TGSI_TOKEN_TYPE_PROPERTY
;
1813 out
[0].prop
.NrTokens
= 2;
1814 out
[0].prop
.PropertyName
= name
;
1816 out
[1].prop_data
.Data
= data
;
1820 static void emit_decls( struct ureg_program
*ureg
)
1824 for (i
= 0; i
< ARRAY_SIZE(ureg
->properties
); i
++)
1825 if (ureg
->properties
[i
] != ~0u)
1826 emit_property(ureg
, i
, ureg
->properties
[i
]);
1828 if (ureg
->processor
== PIPE_SHADER_VERTEX
) {
1829 for (i
= 0; i
< PIPE_MAX_ATTRIBS
; i
++) {
1830 if (ureg
->vs_inputs
[i
/32] & (1u << (i
%32))) {
1831 emit_decl_range( ureg
, TGSI_FILE_INPUT
, i
, 1 );
1834 } else if (ureg
->processor
== PIPE_SHADER_FRAGMENT
) {
1835 if (ureg
->supports_any_inout_decl_range
) {
1836 for (i
= 0; i
< ureg
->nr_inputs
; i
++) {
1839 ureg
->input
[i
].first
,
1840 ureg
->input
[i
].last
,
1841 ureg
->input
[i
].semantic_name
,
1842 ureg
->input
[i
].semantic_index
,
1843 ureg
->input
[i
].interp
,
1844 ureg
->input
[i
].cylindrical_wrap
,
1845 ureg
->input
[i
].interp_location
,
1846 ureg
->input
[i
].array_id
,
1847 ureg
->input
[i
].usage_mask
);
1851 for (i
= 0; i
< ureg
->nr_inputs
; i
++) {
1852 for (j
= ureg
->input
[i
].first
; j
<= ureg
->input
[i
].last
; j
++) {
1856 ureg
->input
[i
].semantic_name
,
1857 ureg
->input
[i
].semantic_index
+
1858 (j
- ureg
->input
[i
].first
),
1859 ureg
->input
[i
].interp
,
1860 ureg
->input
[i
].cylindrical_wrap
,
1861 ureg
->input
[i
].interp_location
, 0,
1862 ureg
->input
[i
].usage_mask
);
1867 if (ureg
->supports_any_inout_decl_range
) {
1868 for (i
= 0; i
< ureg
->nr_inputs
; i
++) {
1869 emit_decl_semantic(ureg
,
1871 ureg
->input
[i
].first
,
1872 ureg
->input
[i
].last
,
1873 ureg
->input
[i
].semantic_name
,
1874 ureg
->input
[i
].semantic_index
,
1876 TGSI_WRITEMASK_XYZW
,
1877 ureg
->input
[i
].array_id
,
1882 for (i
= 0; i
< ureg
->nr_inputs
; i
++) {
1883 for (j
= ureg
->input
[i
].first
; j
<= ureg
->input
[i
].last
; j
++) {
1884 emit_decl_semantic(ureg
,
1887 ureg
->input
[i
].semantic_name
,
1888 ureg
->input
[i
].semantic_index
+
1889 (j
- ureg
->input
[i
].first
),
1891 TGSI_WRITEMASK_XYZW
, 0, FALSE
);
1897 for (i
= 0; i
< ureg
->nr_system_values
; i
++) {
1898 emit_decl_semantic(ureg
,
1899 TGSI_FILE_SYSTEM_VALUE
,
1902 ureg
->system_value
[i
].semantic_name
,
1903 ureg
->system_value
[i
].semantic_index
,
1905 TGSI_WRITEMASK_XYZW
, 0, FALSE
);
1908 if (ureg
->supports_any_inout_decl_range
) {
1909 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
1910 emit_decl_semantic(ureg
,
1912 ureg
->output
[i
].first
,
1913 ureg
->output
[i
].last
,
1914 ureg
->output
[i
].semantic_name
,
1915 ureg
->output
[i
].semantic_index
,
1916 ureg
->output
[i
].streams
,
1917 ureg
->output
[i
].usage_mask
,
1918 ureg
->output
[i
].array_id
,
1919 ureg
->output
[i
].invariant
);
1923 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
1924 for (j
= ureg
->output
[i
].first
; j
<= ureg
->output
[i
].last
; j
++) {
1925 emit_decl_semantic(ureg
,
1928 ureg
->output
[i
].semantic_name
,
1929 ureg
->output
[i
].semantic_index
+
1930 (j
- ureg
->output
[i
].first
),
1931 ureg
->output
[i
].streams
,
1932 ureg
->output
[i
].usage_mask
,
1934 ureg
->output
[i
].invariant
);
1939 for (i
= 0; i
< ureg
->nr_samplers
; i
++) {
1940 emit_decl_range( ureg
,
1942 ureg
->sampler
[i
].Index
, 1 );
1945 for (i
= 0; i
< ureg
->nr_sampler_views
; i
++) {
1946 emit_decl_sampler_view(ureg
,
1947 ureg
->sampler_view
[i
].index
,
1948 ureg
->sampler_view
[i
].target
,
1949 ureg
->sampler_view
[i
].return_type_x
,
1950 ureg
->sampler_view
[i
].return_type_y
,
1951 ureg
->sampler_view
[i
].return_type_z
,
1952 ureg
->sampler_view
[i
].return_type_w
);
1955 for (i
= 0; i
< ureg
->nr_images
; i
++) {
1956 emit_decl_image(ureg
,
1957 ureg
->image
[i
].index
,
1958 ureg
->image
[i
].target
,
1959 ureg
->image
[i
].format
,
1961 ureg
->image
[i
].raw
);
1964 for (i
= 0; i
< ureg
->nr_buffers
; i
++) {
1965 emit_decl_buffer(ureg
, ureg
->buffer
[i
].index
, ureg
->buffer
[i
].atomic
);
1968 for (i
= 0; i
< TGSI_MEMORY_TYPE_COUNT
; i
++) {
1969 if (ureg
->use_memory
[i
])
1970 emit_decl_memory(ureg
, i
);
1973 for (i
= 0; i
< PIPE_MAX_CONSTANT_BUFFERS
; i
++) {
1974 struct const_decl
*decl
= &ureg
->const_decls
[i
];
1976 if (decl
->nr_constant_ranges
) {
1979 for (j
= 0; j
< decl
->nr_constant_ranges
; j
++) {
1980 emit_decl_range2D(ureg
,
1982 decl
->constant_range
[j
].first
,
1983 decl
->constant_range
[j
].last
,
1989 for (i
= 0; i
< PIPE_MAX_HW_ATOMIC_BUFFERS
; i
++) {
1990 struct hw_atomic_decl
*decl
= &ureg
->hw_atomic_decls
[i
];
1992 if (decl
->nr_hw_atomic_ranges
) {
1995 for (j
= 0; j
< decl
->nr_hw_atomic_ranges
; j
++) {
1996 emit_decl_atomic_2d(ureg
,
1997 decl
->hw_atomic_range
[j
].first
,
1998 decl
->hw_atomic_range
[j
].last
,
2000 decl
->hw_atomic_range
[j
].array_id
);
2005 if (ureg
->nr_temps
) {
2007 for (i
= 0; i
< ureg
->nr_temps
;) {
2008 boolean local
= util_bitmask_get(ureg
->local_temps
, i
);
2010 i
= util_bitmask_get_next_index(ureg
->decl_temps
, i
+ 1);
2011 if (i
== UTIL_BITMASK_INVALID_INDEX
)
2014 if (array
< ureg
->nr_array_temps
&& ureg
->array_temps
[array
] == first
)
2015 emit_decl_temps( ureg
, first
, i
- 1, local
, ++array
);
2017 emit_decl_temps( ureg
, first
, i
- 1, local
, 0 );
2021 if (ureg
->nr_addrs
) {
2022 emit_decl_range( ureg
,
2024 0, ureg
->nr_addrs
);
2027 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
2028 emit_immediate( ureg
,
2029 ureg
->immediate
[i
].value
.u
,
2030 ureg
->immediate
[i
].type
);
2034 /* Append the instruction tokens onto the declarations to build a
2035 * contiguous stream suitable to send to the driver.
2037 static void copy_instructions( struct ureg_program
*ureg
)
2039 unsigned nr_tokens
= ureg
->domain
[DOMAIN_INSN
].count
;
2040 union tgsi_any_token
*out
= get_tokens( ureg
,
2045 ureg
->domain
[DOMAIN_INSN
].tokens
,
2046 nr_tokens
* sizeof out
[0] );
2051 fixup_header_size(struct ureg_program
*ureg
)
2053 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_DECL
, 0 );
2055 out
->header
.BodySize
= ureg
->domain
[DOMAIN_DECL
].count
- 2;
2060 emit_header( struct ureg_program
*ureg
)
2062 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 2 );
2064 out
[0].header
.HeaderSize
= 2;
2065 out
[0].header
.BodySize
= 0;
2067 out
[1].processor
.Processor
= ureg
->processor
;
2068 out
[1].processor
.Padding
= 0;
2072 const struct tgsi_token
*ureg_finalize( struct ureg_program
*ureg
)
2074 const struct tgsi_token
*tokens
;
2076 switch (ureg
->processor
) {
2077 case PIPE_SHADER_VERTEX
:
2078 case PIPE_SHADER_TESS_EVAL
:
2079 ureg_property(ureg
, TGSI_PROPERTY_NEXT_SHADER
,
2080 ureg
->next_shader_processor
== -1 ?
2081 PIPE_SHADER_FRAGMENT
:
2082 ureg
->next_shader_processor
);
2088 emit_header( ureg
);
2090 copy_instructions( ureg
);
2091 fixup_header_size( ureg
);
2093 if (ureg
->domain
[0].tokens
== error_tokens
||
2094 ureg
->domain
[1].tokens
== error_tokens
) {
2095 debug_printf("%s: error in generated shader\n", __FUNCTION__
);
2100 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
2103 debug_printf("%s: emitted shader %d tokens:\n", __FUNCTION__
,
2104 ureg
->domain
[DOMAIN_DECL
].count
);
2105 tgsi_dump( tokens
, 0 );
2109 /* tgsi_sanity doesn't seem to return if there are too many constants. */
2110 bool too_many_constants
= false;
2111 for (unsigned i
= 0; i
< ARRAY_SIZE(ureg
->const_decls
); i
++) {
2112 for (unsigned j
= 0; j
< ureg
->const_decls
[i
].nr_constant_ranges
; j
++) {
2113 if (ureg
->const_decls
[i
].constant_range
[j
].last
> 4096) {
2114 too_many_constants
= true;
2120 if (tokens
&& !too_many_constants
&& !tgsi_sanity_check(tokens
)) {
2121 debug_printf("tgsi_ureg.c, sanity check failed on generated tokens:\n");
2122 tgsi_dump(tokens
, 0);
2132 void *ureg_create_shader( struct ureg_program
*ureg
,
2133 struct pipe_context
*pipe
,
2134 const struct pipe_stream_output_info
*so
)
2136 struct pipe_shader_state state
;
2138 pipe_shader_state_from_tgsi(&state
, ureg_finalize(ureg
));
2143 state
.stream_output
= *so
;
2145 switch (ureg
->processor
) {
2146 case PIPE_SHADER_VERTEX
:
2147 return pipe
->create_vs_state(pipe
, &state
);
2148 case PIPE_SHADER_TESS_CTRL
:
2149 return pipe
->create_tcs_state(pipe
, &state
);
2150 case PIPE_SHADER_TESS_EVAL
:
2151 return pipe
->create_tes_state(pipe
, &state
);
2152 case PIPE_SHADER_GEOMETRY
:
2153 return pipe
->create_gs_state(pipe
, &state
);
2154 case PIPE_SHADER_FRAGMENT
:
2155 return pipe
->create_fs_state(pipe
, &state
);
2162 const struct tgsi_token
*ureg_get_tokens( struct ureg_program
*ureg
,
2163 unsigned *nr_tokens
)
2165 const struct tgsi_token
*tokens
;
2167 ureg_finalize(ureg
);
2169 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
2172 *nr_tokens
= ureg
->domain
[DOMAIN_DECL
].count
;
2174 ureg
->domain
[DOMAIN_DECL
].tokens
= 0;
2175 ureg
->domain
[DOMAIN_DECL
].size
= 0;
2176 ureg
->domain
[DOMAIN_DECL
].order
= 0;
2177 ureg
->domain
[DOMAIN_DECL
].count
= 0;
2183 void ureg_free_tokens( const struct tgsi_token
*tokens
)
2185 FREE((struct tgsi_token
*)tokens
);
2189 struct ureg_program
*
2190 ureg_create(enum pipe_shader_type processor
)
2192 return ureg_create_with_screen(processor
, NULL
);
2196 struct ureg_program
*
2197 ureg_create_with_screen(enum pipe_shader_type processor
,
2198 struct pipe_screen
*screen
)
2201 struct ureg_program
*ureg
= CALLOC_STRUCT( ureg_program
);
2205 ureg
->processor
= processor
;
2206 ureg
->supports_any_inout_decl_range
=
2208 screen
->get_shader_param(screen
, processor
,
2209 PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE
) != 0;
2210 ureg
->next_shader_processor
= -1;
2212 for (i
= 0; i
< ARRAY_SIZE(ureg
->properties
); i
++)
2213 ureg
->properties
[i
] = ~0;
2215 ureg
->free_temps
= util_bitmask_create();
2216 if (ureg
->free_temps
== NULL
)
2219 ureg
->local_temps
= util_bitmask_create();
2220 if (ureg
->local_temps
== NULL
)
2221 goto no_local_temps
;
2223 ureg
->decl_temps
= util_bitmask_create();
2224 if (ureg
->decl_temps
== NULL
)
2230 util_bitmask_destroy(ureg
->local_temps
);
2232 util_bitmask_destroy(ureg
->free_temps
);
2241 ureg_set_next_shader_processor(struct ureg_program
*ureg
, unsigned processor
)
2243 ureg
->next_shader_processor
= processor
;
2248 ureg_get_nr_outputs( const struct ureg_program
*ureg
)
2252 return ureg
->nr_outputs
;
2256 void ureg_destroy( struct ureg_program
*ureg
)
2260 for (i
= 0; i
< ARRAY_SIZE(ureg
->domain
); i
++) {
2261 if (ureg
->domain
[i
].tokens
&&
2262 ureg
->domain
[i
].tokens
!= error_tokens
)
2263 FREE(ureg
->domain
[i
].tokens
);
2266 util_bitmask_destroy(ureg
->free_temps
);
2267 util_bitmask_destroy(ureg
->local_temps
);
2268 util_bitmask_destroy(ureg
->decl_temps
);