1 /**************************************************************************
3 * Copyright 2009 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE, INC AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 #include "pipe/p_context.h"
30 #include "pipe/p_state.h"
31 #include "tgsi/tgsi_ureg.h"
32 #include "tgsi/tgsi_build.h"
33 #include "tgsi/tgsi_info.h"
34 #include "tgsi/tgsi_dump.h"
35 #include "tgsi/tgsi_sanity.h"
36 #include "util/u_memory.h"
37 #include "util/u_math.h"
39 union tgsi_any_token
{
40 struct tgsi_version version
;
41 struct tgsi_header header
;
42 struct tgsi_processor processor
;
43 struct tgsi_token token
;
44 struct tgsi_declaration decl
;
45 struct tgsi_declaration_range decl_range
;
46 struct tgsi_declaration_semantic decl_semantic
;
47 struct tgsi_immediate imm
;
48 union tgsi_immediate_data imm_data
;
49 struct tgsi_instruction insn
;
50 struct tgsi_instruction_predicate insn_predicate
;
51 struct tgsi_instruction_ext_label insn_ext_label
;
52 struct tgsi_instruction_ext_texture insn_ext_texture
;
53 struct tgsi_src_register src
;
54 struct tgsi_src_register_ext_mod src_ext_mod
;
55 struct tgsi_dimension dim
;
56 struct tgsi_dst_register dst
;
57 struct tgsi_dst_register_ext_modulate dst_ext_mod
;
63 union tgsi_any_token
*tokens
;
69 #define UREG_MAX_INPUT PIPE_MAX_ATTRIBS
70 #define UREG_MAX_OUTPUT PIPE_MAX_ATTRIBS
71 #define UREG_MAX_CONSTANT_RANGE 32
72 #define UREG_MAX_IMMEDIATE 32
73 #define UREG_MAX_TEMP 256
74 #define UREG_MAX_ADDR 2
75 #define UREG_MAX_LOOP 1
76 #define UREG_MAX_PRED 1
84 struct pipe_context
*pipe
;
87 unsigned semantic_name
;
88 unsigned semantic_index
;
90 } fs_input
[UREG_MAX_INPUT
];
91 unsigned nr_fs_inputs
;
93 unsigned vs_inputs
[UREG_MAX_INPUT
/32];
96 unsigned semantic_name
;
97 unsigned semantic_index
;
98 } output
[UREG_MAX_OUTPUT
];
104 } immediate
[UREG_MAX_IMMEDIATE
];
105 unsigned nr_immediates
;
107 struct ureg_src sampler
[PIPE_MAX_SAMPLERS
];
108 unsigned nr_samplers
;
110 unsigned temps_active
[UREG_MAX_TEMP
/ 32];
116 } constant_range
[UREG_MAX_CONSTANT_RANGE
];
117 unsigned nr_constant_ranges
;
122 unsigned nr_instructions
;
124 struct ureg_tokens domain
[2];
127 static union tgsi_any_token error_tokens
[32];
129 static void tokens_error( struct ureg_tokens
*tokens
)
131 if (tokens
->tokens
&& tokens
->tokens
!= error_tokens
)
132 FREE(tokens
->tokens
);
134 tokens
->tokens
= error_tokens
;
135 tokens
->size
= Elements(error_tokens
);
140 static void tokens_expand( struct ureg_tokens
*tokens
,
143 unsigned old_size
= tokens
->size
* sizeof(unsigned);
145 if (tokens
->tokens
== error_tokens
) {
149 while (tokens
->count
+ count
> tokens
->size
) {
150 tokens
->size
= (1 << ++tokens
->order
);
153 tokens
->tokens
= REALLOC(tokens
->tokens
,
155 tokens
->size
* sizeof(unsigned));
156 if (tokens
->tokens
== NULL
) {
157 tokens_error(tokens
);
161 static void set_bad( struct ureg_program
*ureg
)
163 tokens_error(&ureg
->domain
[0]);
168 static union tgsi_any_token
*get_tokens( struct ureg_program
*ureg
,
172 struct ureg_tokens
*tokens
= &ureg
->domain
[domain
];
173 union tgsi_any_token
*result
;
175 if (tokens
->count
+ count
> tokens
->size
)
176 tokens_expand(tokens
, count
);
178 result
= &tokens
->tokens
[tokens
->count
];
179 tokens
->count
+= count
;
184 static union tgsi_any_token
*retrieve_token( struct ureg_program
*ureg
,
188 if (ureg
->domain
[domain
].tokens
== error_tokens
)
189 return &error_tokens
[0];
191 return &ureg
->domain
[domain
].tokens
[nr
];
196 static INLINE
struct ureg_dst
197 ureg_dst_register( unsigned file
,
203 dst
.WriteMask
= TGSI_WRITEMASK_XYZW
;
205 dst
.IndirectIndex
= 0;
206 dst
.IndirectSwizzle
= 0;
210 dst
.PredSwizzleX
= TGSI_SWIZZLE_X
;
211 dst
.PredSwizzleY
= TGSI_SWIZZLE_Y
;
212 dst
.PredSwizzleZ
= TGSI_SWIZZLE_Z
;
213 dst
.PredSwizzleW
= TGSI_SWIZZLE_W
;
219 static INLINE
struct ureg_src
220 ureg_src_register( unsigned file
,
226 src
.SwizzleX
= TGSI_SWIZZLE_X
;
227 src
.SwizzleY
= TGSI_SWIZZLE_Y
;
228 src
.SwizzleZ
= TGSI_SWIZZLE_Z
;
229 src
.SwizzleW
= TGSI_SWIZZLE_W
;
232 src
.IndirectIndex
= 0;
233 src
.IndirectSwizzle
= 0;
245 ureg_DECL_fs_input( struct ureg_program
*ureg
,
248 unsigned interp_mode
)
252 for (i
= 0; i
< ureg
->nr_fs_inputs
; i
++) {
253 if (ureg
->fs_input
[i
].semantic_name
== name
&&
254 ureg
->fs_input
[i
].semantic_index
== index
)
258 if (ureg
->nr_fs_inputs
< UREG_MAX_INPUT
) {
259 ureg
->fs_input
[i
].semantic_name
= name
;
260 ureg
->fs_input
[i
].semantic_index
= index
;
261 ureg
->fs_input
[i
].interp
= interp_mode
;
262 ureg
->nr_fs_inputs
++;
269 return ureg_src_register( TGSI_FILE_INPUT
, i
);
274 ureg_DECL_vs_input( struct ureg_program
*ureg
,
277 assert(ureg
->processor
== TGSI_PROCESSOR_VERTEX
);
279 ureg
->vs_inputs
[index
/32] |= 1 << (index
% 32);
280 return ureg_src_register( TGSI_FILE_INPUT
, index
);
285 ureg_DECL_output( struct ureg_program
*ureg
,
291 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
292 if (ureg
->output
[i
].semantic_name
== name
&&
293 ureg
->output
[i
].semantic_index
== index
)
297 if (ureg
->nr_outputs
< UREG_MAX_OUTPUT
) {
298 ureg
->output
[i
].semantic_name
= name
;
299 ureg
->output
[i
].semantic_index
= index
;
307 return ureg_dst_register( TGSI_FILE_OUTPUT
, i
);
311 /* Returns a new constant register. Keep track of which have been
312 * referred to so that we can emit decls later.
314 * There is nothing in this code to bind this constant to any tracked
315 * value or manage any constant_buffer contents -- that's the
316 * responsibility of the calling code.
318 struct ureg_src
ureg_DECL_constant(struct ureg_program
*ureg
,
321 unsigned minconst
= index
, maxconst
= index
;
324 /* Inside existing range?
326 for (i
= 0; i
< ureg
->nr_constant_ranges
; i
++) {
327 if (ureg
->constant_range
[i
].first
<= index
&&
328 ureg
->constant_range
[i
].last
>= index
)
332 /* Extend existing range?
334 for (i
= 0; i
< ureg
->nr_constant_ranges
; i
++) {
335 if (ureg
->constant_range
[i
].last
== index
- 1) {
336 ureg
->constant_range
[i
].last
= index
;
340 if (ureg
->constant_range
[i
].first
== index
+ 1) {
341 ureg
->constant_range
[i
].first
= index
;
345 minconst
= MIN2(minconst
, ureg
->constant_range
[i
].first
);
346 maxconst
= MAX2(maxconst
, ureg
->constant_range
[i
].last
);
351 if (ureg
->nr_constant_ranges
< UREG_MAX_CONSTANT_RANGE
) {
352 i
= ureg
->nr_constant_ranges
++;
353 ureg
->constant_range
[i
].first
= index
;
354 ureg
->constant_range
[i
].last
= index
;
357 /* Collapse all ranges down to one:
360 ureg
->constant_range
[0].first
= minconst
;
361 ureg
->constant_range
[0].last
= maxconst
;
362 ureg
->nr_constant_ranges
= 1;
365 assert(i
< ureg
->nr_constant_ranges
);
366 assert(ureg
->constant_range
[i
].first
<= index
);
367 assert(ureg
->constant_range
[i
].last
>= index
);
368 return ureg_src_register( TGSI_FILE_CONSTANT
, index
);
372 /* Allocate a new temporary. Temporaries with an index of UREG_MAX_TEMP
373 * or above are legal, but are not tracked and so will never be released.
375 struct ureg_dst
ureg_DECL_temporary( struct ureg_program
*ureg
)
379 for (i
= 0; i
< UREG_MAX_TEMP
; i
+= 32) {
380 int bit
= ffs(~ureg
->temps_active
[i
/32]);
387 /* No reusable temps, so allocate a new one:
389 i
= ureg
->nr_temps
++;
392 if (i
< UREG_MAX_TEMP
)
393 ureg
->temps_active
[i
/32] |= 1 << (i
% 32);
395 if (i
>= ureg
->nr_temps
)
396 ureg
->nr_temps
= i
+ 1;
398 return ureg_dst_register( TGSI_FILE_TEMPORARY
, i
);
402 void ureg_release_temporary( struct ureg_program
*ureg
,
403 struct ureg_dst tmp
)
405 if(tmp
.File
== TGSI_FILE_TEMPORARY
)
406 if (tmp
.Index
< UREG_MAX_TEMP
)
407 ureg
->temps_active
[tmp
.Index
/32] &= ~(1 << (tmp
.Index
% 32));
411 /* Allocate a new address register.
413 struct ureg_dst
ureg_DECL_address( struct ureg_program
*ureg
)
415 if (ureg
->nr_addrs
< UREG_MAX_ADDR
)
416 return ureg_dst_register( TGSI_FILE_ADDRESS
, ureg
->nr_addrs
++ );
419 return ureg_dst_register( TGSI_FILE_ADDRESS
, 0 );
422 /* Allocate a new loop register.
425 ureg_DECL_loop(struct ureg_program
*ureg
)
427 if (ureg
->nr_loops
< UREG_MAX_LOOP
) {
428 return ureg_dst_register(TGSI_FILE_LOOP
, ureg
->nr_loops
++);
432 return ureg_dst_register(TGSI_FILE_LOOP
, 0);
435 /* Allocate a new predicate register.
438 ureg_DECL_predicate(struct ureg_program
*ureg
)
440 if (ureg
->nr_preds
< UREG_MAX_PRED
) {
441 return ureg_dst_register(TGSI_FILE_PREDICATE
, ureg
->nr_preds
++);
445 return ureg_dst_register(TGSI_FILE_PREDICATE
, 0);
448 /* Allocate a new sampler.
450 struct ureg_src
ureg_DECL_sampler( struct ureg_program
*ureg
,
455 for (i
= 0; i
< ureg
->nr_samplers
; i
++)
456 if (ureg
->sampler
[i
].Index
== nr
)
457 return ureg
->sampler
[i
];
459 if (i
< PIPE_MAX_SAMPLERS
) {
460 ureg
->sampler
[i
] = ureg_src_register( TGSI_FILE_SAMPLER
, nr
);
462 return ureg
->sampler
[i
];
466 return ureg
->sampler
[0];
472 static int match_or_expand_immediate( const float *v
,
482 for (i
= 0; i
< nr
; i
++) {
483 boolean found
= FALSE
;
485 for (j
= 0; j
< *nr2
&& !found
; j
++) {
487 *swizzle
|= j
<< (i
* 2);
497 *swizzle
|= *nr2
<< (i
* 2);
508 struct ureg_src
ureg_DECL_immediate( struct ureg_program
*ureg
,
515 /* Could do a first pass where we examine all existing immediates
519 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
520 if (match_or_expand_immediate( v
,
522 ureg
->immediate
[i
].v
,
523 &ureg
->immediate
[i
].nr
,
528 if (ureg
->nr_immediates
< UREG_MAX_IMMEDIATE
) {
529 i
= ureg
->nr_immediates
++;
530 if (match_or_expand_immediate( v
,
532 ureg
->immediate
[i
].v
,
533 &ureg
->immediate
[i
].nr
,
541 /* Make sure that all referenced elements are from this immediate.
542 * Has the effect of making size-one immediates into scalars.
544 for (j
= nr
; j
< 4; j
++)
545 swizzle
|= (swizzle
& 0x3) << (j
* 2);
547 return ureg_swizzle( ureg_src_register( TGSI_FILE_IMMEDIATE
, i
),
548 (swizzle
>> 0) & 0x3,
549 (swizzle
>> 2) & 0x3,
550 (swizzle
>> 4) & 0x3,
551 (swizzle
>> 6) & 0x3);
556 ureg_emit_src( struct ureg_program
*ureg
,
557 struct ureg_src src
)
560 (src
.Absolute
? 1 : 0) +
561 (src
.Indirect
? 1 : 0));
563 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
566 assert(src
.File
!= TGSI_FILE_NULL
);
567 assert(src
.File
!= TGSI_FILE_OUTPUT
);
568 assert(src
.File
< TGSI_FILE_COUNT
);
571 out
[n
].src
.File
= src
.File
;
572 out
[n
].src
.SwizzleX
= src
.SwizzleX
;
573 out
[n
].src
.SwizzleY
= src
.SwizzleY
;
574 out
[n
].src
.SwizzleZ
= src
.SwizzleZ
;
575 out
[n
].src
.SwizzleW
= src
.SwizzleW
;
576 out
[n
].src
.Index
= src
.Index
;
577 out
[n
].src
.Negate
= src
.Negate
;
581 out
[0].src
.Extended
= 1;
582 out
[0].src
.Negate
= 0;
584 out
[n
].src_ext_mod
.Type
= TGSI_SRC_REGISTER_EXT_TYPE_MOD
;
585 out
[n
].src_ext_mod
.Absolute
= 1;
586 out
[n
].src_ext_mod
.Negate
= src
.Negate
;
591 out
[0].src
.Indirect
= 1;
593 out
[n
].src
.File
= TGSI_FILE_ADDRESS
;
594 out
[n
].src
.SwizzleX
= src
.IndirectSwizzle
;
595 out
[n
].src
.SwizzleY
= src
.IndirectSwizzle
;
596 out
[n
].src
.SwizzleZ
= src
.IndirectSwizzle
;
597 out
[n
].src
.SwizzleW
= src
.IndirectSwizzle
;
598 out
[n
].src
.Index
= src
.IndirectIndex
;
607 ureg_emit_dst( struct ureg_program
*ureg
,
608 struct ureg_dst dst
)
611 (dst
.Indirect
? 1 : 0));
613 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
616 assert(dst
.File
!= TGSI_FILE_NULL
);
617 assert(dst
.File
!= TGSI_FILE_CONSTANT
);
618 assert(dst
.File
!= TGSI_FILE_INPUT
);
619 assert(dst
.File
!= TGSI_FILE_SAMPLER
);
620 assert(dst
.File
!= TGSI_FILE_IMMEDIATE
);
621 assert(dst
.File
< TGSI_FILE_COUNT
);
624 out
[n
].dst
.File
= dst
.File
;
625 out
[n
].dst
.WriteMask
= dst
.WriteMask
;
626 out
[n
].dst
.Indirect
= dst
.Indirect
;
627 out
[n
].dst
.Index
= dst
.Index
;
632 out
[n
].src
.File
= TGSI_FILE_ADDRESS
;
633 out
[n
].src
.SwizzleX
= dst
.IndirectSwizzle
;
634 out
[n
].src
.SwizzleY
= dst
.IndirectSwizzle
;
635 out
[n
].src
.SwizzleZ
= dst
.IndirectSwizzle
;
636 out
[n
].src
.SwizzleW
= dst
.IndirectSwizzle
;
637 out
[n
].src
.Index
= dst
.IndirectIndex
;
645 static void validate( unsigned opcode
,
650 const struct tgsi_opcode_info
*info
= tgsi_get_opcode_info( opcode
);
653 assert(nr_dst
== info
->num_dst
);
654 assert(nr_src
== info
->num_src
);
659 struct ureg_emit_insn_result
660 ureg_emit_insn(struct ureg_program
*ureg
,
665 unsigned pred_swizzle_x
,
666 unsigned pred_swizzle_y
,
667 unsigned pred_swizzle_z
,
668 unsigned pred_swizzle_w
,
672 union tgsi_any_token
*out
;
673 uint count
= predicate
? 2 : 1;
674 struct ureg_emit_insn_result result
;
676 validate( opcode
, num_dst
, num_src
);
678 out
= get_tokens( ureg
, DOMAIN_INSN
, count
);
679 out
[0].insn
= tgsi_default_instruction();
680 out
[0].insn
.Opcode
= opcode
;
681 out
[0].insn
.Saturate
= saturate
;
682 out
[0].insn
.NumDstRegs
= num_dst
;
683 out
[0].insn
.NumSrcRegs
= num_src
;
685 result
.insn_token
= ureg
->domain
[DOMAIN_INSN
].count
- count
;
686 result
.extended_token
= result
.insn_token
;
689 out
[0].insn
.Predicate
= 1;
690 out
[1].insn_predicate
= tgsi_default_instruction_predicate();
691 out
[1].insn_predicate
.Negate
= pred_negate
;
692 out
[1].insn_predicate
.SwizzleX
= pred_swizzle_x
;
693 out
[1].insn_predicate
.SwizzleY
= pred_swizzle_y
;
694 out
[1].insn_predicate
.SwizzleZ
= pred_swizzle_z
;
695 out
[1].insn_predicate
.SwizzleW
= pred_swizzle_w
;
698 ureg
->nr_instructions
++;
705 ureg_emit_label(struct ureg_program
*ureg
,
706 unsigned extended_token
,
707 unsigned *label_token
)
709 union tgsi_any_token
*out
, *insn
;
714 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
715 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
717 insn
->token
.Extended
= 1;
720 out
[0].insn_ext_label
.Type
= TGSI_INSTRUCTION_EXT_TYPE_LABEL
;
722 *label_token
= ureg
->domain
[DOMAIN_INSN
].count
- 1;
725 /* Will return a number which can be used in a label to point to the
726 * next instruction to be emitted.
729 ureg_get_instruction_number( struct ureg_program
*ureg
)
731 return ureg
->nr_instructions
;
734 /* Patch a given label (expressed as a token number) to point to a
735 * given instruction (expressed as an instruction number).
738 ureg_fixup_label(struct ureg_program
*ureg
,
739 unsigned label_token
,
740 unsigned instruction_number
)
742 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, label_token
);
744 assert(out
->insn_ext_label
.Type
== TGSI_INSTRUCTION_EXT_TYPE_LABEL
);
745 out
->insn_ext_label
.Label
= instruction_number
;
750 ureg_emit_texture(struct ureg_program
*ureg
,
751 unsigned extended_token
,
754 union tgsi_any_token
*out
, *insn
;
756 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
757 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
759 insn
->token
.Extended
= 1;
762 out
[0].insn_ext_texture
.Type
= TGSI_INSTRUCTION_EXT_TYPE_TEXTURE
;
763 out
[0].insn_ext_texture
.Texture
= target
;
768 ureg_fixup_insn_size(struct ureg_program
*ureg
,
771 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, insn
);
773 assert(out
->insn
.Type
== TGSI_TOKEN_TYPE_INSTRUCTION
);
774 out
->insn
.NrTokens
= ureg
->domain
[DOMAIN_INSN
].count
- insn
- 1;
779 ureg_insn(struct ureg_program
*ureg
,
781 const struct ureg_dst
*dst
,
783 const struct ureg_src
*src
,
786 struct ureg_emit_insn_result insn
;
793 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
794 predicate
= nr_dst
? dst
[0].Predicate
: FALSE
;
796 negate
= dst
[0].PredNegate
;
797 swizzle
[0] = dst
[0].PredSwizzleX
;
798 swizzle
[1] = dst
[0].PredSwizzleY
;
799 swizzle
[2] = dst
[0].PredSwizzleZ
;
800 swizzle
[3] = dst
[0].PredSwizzleW
;
803 insn
= ureg_emit_insn(ureg
,
815 for (i
= 0; i
< nr_dst
; i
++)
816 ureg_emit_dst( ureg
, dst
[i
] );
818 for (i
= 0; i
< nr_src
; i
++)
819 ureg_emit_src( ureg
, src
[i
] );
821 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
825 ureg_tex_insn(struct ureg_program
*ureg
,
827 const struct ureg_dst
*dst
,
830 const struct ureg_src
*src
,
833 struct ureg_emit_insn_result insn
;
840 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
841 predicate
= nr_dst
? dst
[0].Predicate
: FALSE
;
843 negate
= dst
[0].PredNegate
;
844 swizzle
[0] = dst
[0].PredSwizzleX
;
845 swizzle
[1] = dst
[0].PredSwizzleY
;
846 swizzle
[2] = dst
[0].PredSwizzleZ
;
847 swizzle
[3] = dst
[0].PredSwizzleW
;
850 insn
= ureg_emit_insn(ureg
,
862 ureg_emit_texture( ureg
, insn
.extended_token
, target
);
864 for (i
= 0; i
< nr_dst
; i
++)
865 ureg_emit_dst( ureg
, dst
[i
] );
867 for (i
= 0; i
< nr_src
; i
++)
868 ureg_emit_src( ureg
, src
[i
] );
870 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
875 ureg_label_insn(struct ureg_program
*ureg
,
877 const struct ureg_src
*src
,
879 unsigned *label_token
)
881 struct ureg_emit_insn_result insn
;
884 insn
= ureg_emit_insn(ureg
,
896 ureg_emit_label( ureg
, insn
.extended_token
, label_token
);
898 for (i
= 0; i
< nr_src
; i
++)
899 ureg_emit_src( ureg
, src
[i
] );
901 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
906 static void emit_decl( struct ureg_program
*ureg
,
909 unsigned semantic_name
,
910 unsigned semantic_index
,
913 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 3 );
916 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
917 out
[0].decl
.NrTokens
= 3;
918 out
[0].decl
.File
= file
;
919 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
; /* FIXME! */
920 out
[0].decl
.Interpolate
= interp
;
921 out
[0].decl
.Semantic
= 1;
924 out
[1].decl_range
.First
=
925 out
[1].decl_range
.Last
= index
;
928 out
[2].decl_semantic
.SemanticName
= semantic_name
;
929 out
[2].decl_semantic
.SemanticIndex
= semantic_index
;
934 static void emit_decl_range( struct ureg_program
*ureg
,
939 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 2 );
942 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
943 out
[0].decl
.NrTokens
= 2;
944 out
[0].decl
.File
= file
;
945 out
[0].decl
.UsageMask
= 0xf;
946 out
[0].decl
.Interpolate
= TGSI_INTERPOLATE_CONSTANT
;
947 out
[0].decl
.Semantic
= 0;
950 out
[1].decl_range
.First
= first
;
951 out
[1].decl_range
.Last
= first
+ count
- 1;
954 static void emit_immediate( struct ureg_program
*ureg
,
957 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 5 );
960 out
[0].imm
.Type
= TGSI_TOKEN_TYPE_IMMEDIATE
;
961 out
[0].imm
.NrTokens
= 5;
962 out
[0].imm
.DataType
= TGSI_IMM_FLOAT32
;
963 out
[0].imm
.Padding
= 0;
964 out
[0].imm
.Extended
= 0;
966 out
[1].imm_data
.Float
= v
[0];
967 out
[2].imm_data
.Float
= v
[1];
968 out
[3].imm_data
.Float
= v
[2];
969 out
[4].imm_data
.Float
= v
[3];
975 static void emit_decls( struct ureg_program
*ureg
)
979 if (ureg
->processor
== TGSI_PROCESSOR_VERTEX
) {
980 for (i
= 0; i
< UREG_MAX_INPUT
; i
++) {
981 if (ureg
->vs_inputs
[i
/32] & (1 << (i
%32))) {
982 emit_decl_range( ureg
, TGSI_FILE_INPUT
, i
, 1 );
987 for (i
= 0; i
< ureg
->nr_fs_inputs
; i
++) {
991 ureg
->fs_input
[i
].semantic_name
,
992 ureg
->fs_input
[i
].semantic_index
,
993 ureg
->fs_input
[i
].interp
);
997 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
1001 ureg
->output
[i
].semantic_name
,
1002 ureg
->output
[i
].semantic_index
,
1003 TGSI_INTERPOLATE_CONSTANT
);
1006 for (i
= 0; i
< ureg
->nr_samplers
; i
++) {
1007 emit_decl_range( ureg
,
1009 ureg
->sampler
[i
].Index
, 1 );
1012 if (ureg
->nr_constant_ranges
) {
1013 for (i
= 0; i
< ureg
->nr_constant_ranges
; i
++)
1014 emit_decl_range( ureg
,
1016 ureg
->constant_range
[i
].first
,
1017 (ureg
->constant_range
[i
].last
+ 1 -
1018 ureg
->constant_range
[i
].first
) );
1021 if (ureg
->nr_temps
) {
1022 emit_decl_range( ureg
,
1023 TGSI_FILE_TEMPORARY
,
1024 0, ureg
->nr_temps
);
1027 if (ureg
->nr_addrs
) {
1028 emit_decl_range( ureg
,
1030 0, ureg
->nr_addrs
);
1033 if (ureg
->nr_loops
) {
1034 emit_decl_range(ureg
,
1040 if (ureg
->nr_preds
) {
1041 emit_decl_range(ureg
,
1042 TGSI_FILE_PREDICATE
,
1047 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
1048 emit_immediate( ureg
,
1049 ureg
->immediate
[i
].v
);
1053 /* Append the instruction tokens onto the declarations to build a
1054 * contiguous stream suitable to send to the driver.
1056 static void copy_instructions( struct ureg_program
*ureg
)
1058 unsigned nr_tokens
= ureg
->domain
[DOMAIN_INSN
].count
;
1059 union tgsi_any_token
*out
= get_tokens( ureg
,
1064 ureg
->domain
[DOMAIN_INSN
].tokens
,
1065 nr_tokens
* sizeof out
[0] );
1070 fixup_header_size(struct ureg_program
*ureg
)
1072 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_DECL
, 1 );
1074 out
->header
.BodySize
= ureg
->domain
[DOMAIN_DECL
].count
- 3;
1079 emit_header( struct ureg_program
*ureg
)
1081 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 3 );
1083 out
[0].version
.MajorVersion
= 1;
1084 out
[0].version
.MinorVersion
= 1;
1085 out
[0].version
.Padding
= 0;
1087 out
[1].header
.HeaderSize
= 2;
1088 out
[1].header
.BodySize
= 0;
1090 out
[2].processor
.Processor
= ureg
->processor
;
1091 out
[2].processor
.Padding
= 0;
1095 const struct tgsi_token
*ureg_finalize( struct ureg_program
*ureg
)
1097 const struct tgsi_token
*tokens
;
1099 emit_header( ureg
);
1101 copy_instructions( ureg
);
1102 fixup_header_size( ureg
);
1104 if (ureg
->domain
[0].tokens
== error_tokens
||
1105 ureg
->domain
[1].tokens
== error_tokens
) {
1106 debug_printf("%s: error in generated shader\n", __FUNCTION__
);
1111 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
1114 debug_printf("%s: emitted shader %d tokens:\n", __FUNCTION__
,
1115 ureg
->domain
[DOMAIN_DECL
].count
);
1116 tgsi_dump( tokens
, 0 );
1120 if (tokens
&& !tgsi_sanity_check(tokens
)) {
1121 debug_printf("tgsi_ureg.c, sanity check failed on generated tokens:\n");
1122 tgsi_dump(tokens
, 0);
1132 void *ureg_create_shader( struct ureg_program
*ureg
,
1133 struct pipe_context
*pipe
)
1135 struct pipe_shader_state state
;
1137 state
.tokens
= ureg_finalize(ureg
);
1141 if (ureg
->processor
== TGSI_PROCESSOR_VERTEX
)
1142 return pipe
->create_vs_state( pipe
, &state
);
1144 return pipe
->create_fs_state( pipe
, &state
);
1148 const struct tgsi_token
*ureg_get_tokens( struct ureg_program
*ureg
,
1149 unsigned *nr_tokens
)
1151 const struct tgsi_token
*tokens
;
1153 ureg_finalize(ureg
);
1155 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
1158 *nr_tokens
= ureg
->domain
[DOMAIN_DECL
].size
;
1160 ureg
->domain
[DOMAIN_DECL
].tokens
= 0;
1161 ureg
->domain
[DOMAIN_DECL
].size
= 0;
1162 ureg
->domain
[DOMAIN_DECL
].order
= 0;
1163 ureg
->domain
[DOMAIN_DECL
].count
= 0;
1169 struct ureg_program
*ureg_create( unsigned processor
)
1171 struct ureg_program
*ureg
= CALLOC_STRUCT( ureg_program
);
1175 ureg
->processor
= processor
;
1180 void ureg_destroy( struct ureg_program
*ureg
)
1184 for (i
= 0; i
< Elements(ureg
->domain
); i
++) {
1185 if (ureg
->domain
[i
].tokens
&&
1186 ureg
->domain
[i
].tokens
!= error_tokens
)
1187 FREE(ureg
->domain
[i
].tokens
);