1 /**************************************************************************
3 * Copyright 2009 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE, INC AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 #include "pipe/p_context.h"
30 #include "pipe/p_state.h"
31 #include "tgsi/tgsi_ureg.h"
32 #include "tgsi/tgsi_build.h"
33 #include "tgsi/tgsi_info.h"
34 #include "tgsi/tgsi_dump.h"
35 #include "tgsi/tgsi_sanity.h"
36 #include "util/u_memory.h"
37 #include "util/u_math.h"
39 union tgsi_any_token
{
40 struct tgsi_header header
;
41 struct tgsi_processor processor
;
42 struct tgsi_token token
;
43 struct tgsi_declaration decl
;
44 struct tgsi_declaration_range decl_range
;
45 struct tgsi_declaration_semantic decl_semantic
;
46 struct tgsi_immediate imm
;
47 union tgsi_immediate_data imm_data
;
48 struct tgsi_instruction insn
;
49 struct tgsi_instruction_predicate insn_predicate
;
50 struct tgsi_instruction_label insn_label
;
51 struct tgsi_instruction_texture insn_texture
;
52 struct tgsi_src_register src
;
53 struct tgsi_dimension dim
;
54 struct tgsi_dst_register dst
;
60 union tgsi_any_token
*tokens
;
66 #define UREG_MAX_INPUT PIPE_MAX_ATTRIBS
67 #define UREG_MAX_SYSTEM_VALUE PIPE_MAX_ATTRIBS
68 #define UREG_MAX_OUTPUT PIPE_MAX_ATTRIBS
69 #define UREG_MAX_CONSTANT_RANGE 32
70 #define UREG_MAX_IMMEDIATE 32
71 #define UREG_MAX_TEMP 256
72 #define UREG_MAX_ADDR 2
73 #define UREG_MAX_LOOP 1
74 #define UREG_MAX_PRED 1
82 struct pipe_context
*pipe
;
85 unsigned semantic_name
;
86 unsigned semantic_index
;
88 } fs_input
[UREG_MAX_INPUT
];
89 unsigned nr_fs_inputs
;
91 unsigned vs_inputs
[UREG_MAX_INPUT
/32];
95 } gs_input
[UREG_MAX_INPUT
];
96 unsigned nr_gs_inputs
;
100 unsigned semantic_name
;
101 unsigned semantic_index
;
102 } system_value
[UREG_MAX_SYSTEM_VALUE
];
103 unsigned nr_system_values
;
106 unsigned semantic_name
;
107 unsigned semantic_index
;
108 } output
[UREG_MAX_OUTPUT
];
119 } immediate
[UREG_MAX_IMMEDIATE
];
120 unsigned nr_immediates
;
122 struct ureg_src sampler
[PIPE_MAX_SAMPLERS
];
123 unsigned nr_samplers
;
125 unsigned temps_active
[UREG_MAX_TEMP
/ 32];
131 } constant_range
[UREG_MAX_CONSTANT_RANGE
];
132 unsigned nr_constant_ranges
;
137 unsigned nr_instructions
;
139 struct ureg_tokens domain
[2];
142 static union tgsi_any_token error_tokens
[32];
144 static void tokens_error( struct ureg_tokens
*tokens
)
146 if (tokens
->tokens
&& tokens
->tokens
!= error_tokens
)
147 FREE(tokens
->tokens
);
149 tokens
->tokens
= error_tokens
;
150 tokens
->size
= Elements(error_tokens
);
155 static void tokens_expand( struct ureg_tokens
*tokens
,
158 unsigned old_size
= tokens
->size
* sizeof(unsigned);
160 if (tokens
->tokens
== error_tokens
) {
164 while (tokens
->count
+ count
> tokens
->size
) {
165 tokens
->size
= (1 << ++tokens
->order
);
168 tokens
->tokens
= REALLOC(tokens
->tokens
,
170 tokens
->size
* sizeof(unsigned));
171 if (tokens
->tokens
== NULL
) {
172 tokens_error(tokens
);
176 static void set_bad( struct ureg_program
*ureg
)
178 tokens_error(&ureg
->domain
[0]);
183 static union tgsi_any_token
*get_tokens( struct ureg_program
*ureg
,
187 struct ureg_tokens
*tokens
= &ureg
->domain
[domain
];
188 union tgsi_any_token
*result
;
190 if (tokens
->count
+ count
> tokens
->size
)
191 tokens_expand(tokens
, count
);
193 result
= &tokens
->tokens
[tokens
->count
];
194 tokens
->count
+= count
;
199 static union tgsi_any_token
*retrieve_token( struct ureg_program
*ureg
,
203 if (ureg
->domain
[domain
].tokens
== error_tokens
)
204 return &error_tokens
[0];
206 return &ureg
->domain
[domain
].tokens
[nr
];
211 static INLINE
struct ureg_dst
212 ureg_dst_register( unsigned file
,
218 dst
.WriteMask
= TGSI_WRITEMASK_XYZW
;
220 dst
.IndirectIndex
= 0;
221 dst
.IndirectSwizzle
= 0;
225 dst
.PredSwizzleX
= TGSI_SWIZZLE_X
;
226 dst
.PredSwizzleY
= TGSI_SWIZZLE_Y
;
227 dst
.PredSwizzleZ
= TGSI_SWIZZLE_Z
;
228 dst
.PredSwizzleW
= TGSI_SWIZZLE_W
;
234 static INLINE
struct ureg_src
235 ureg_src_register( unsigned file
,
241 src
.SwizzleX
= TGSI_SWIZZLE_X
;
242 src
.SwizzleY
= TGSI_SWIZZLE_Y
;
243 src
.SwizzleZ
= TGSI_SWIZZLE_Z
;
244 src
.SwizzleW
= TGSI_SWIZZLE_W
;
247 src
.IndirectIndex
= 0;
248 src
.IndirectSwizzle
= 0;
260 ureg_DECL_fs_input( struct ureg_program
*ureg
,
263 unsigned interp_mode
)
267 for (i
= 0; i
< ureg
->nr_fs_inputs
; i
++) {
268 if (ureg
->fs_input
[i
].semantic_name
== name
&&
269 ureg
->fs_input
[i
].semantic_index
== index
)
273 if (ureg
->nr_fs_inputs
< UREG_MAX_INPUT
) {
274 ureg
->fs_input
[i
].semantic_name
= name
;
275 ureg
->fs_input
[i
].semantic_index
= index
;
276 ureg
->fs_input
[i
].interp
= interp_mode
;
277 ureg
->nr_fs_inputs
++;
284 return ureg_src_register( TGSI_FILE_INPUT
, i
);
289 ureg_DECL_vs_input( struct ureg_program
*ureg
,
292 assert(ureg
->processor
== TGSI_PROCESSOR_VERTEX
);
294 ureg
->vs_inputs
[index
/32] |= 1 << (index
% 32);
295 return ureg_src_register( TGSI_FILE_INPUT
, index
);
300 ureg_DECL_gs_input(struct ureg_program
*ureg
,
303 if (ureg
->nr_gs_inputs
< UREG_MAX_INPUT
) {
304 ureg
->gs_input
[ureg
->nr_gs_inputs
].index
= index
;
305 ureg
->nr_gs_inputs
++;
310 /* XXX: Add support for true 2D input registers. */
311 return ureg_src_register(TGSI_FILE_INPUT
, index
);
316 ureg_DECL_system_value(struct ureg_program
*ureg
,
318 unsigned semantic_name
,
319 unsigned semantic_index
)
321 if (ureg
->nr_system_values
< UREG_MAX_SYSTEM_VALUE
) {
322 ureg
->system_value
[ureg
->nr_system_values
].index
= index
;
323 ureg
->system_value
[ureg
->nr_system_values
].semantic_name
= semantic_name
;
324 ureg
->system_value
[ureg
->nr_system_values
].semantic_index
= semantic_index
;
325 ureg
->nr_system_values
++;
330 return ureg_src_register(TGSI_FILE_SYSTEM_VALUE
, index
);
335 ureg_DECL_output( struct ureg_program
*ureg
,
341 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
342 if (ureg
->output
[i
].semantic_name
== name
&&
343 ureg
->output
[i
].semantic_index
== index
)
347 if (ureg
->nr_outputs
< UREG_MAX_OUTPUT
) {
348 ureg
->output
[i
].semantic_name
= name
;
349 ureg
->output
[i
].semantic_index
= index
;
357 return ureg_dst_register( TGSI_FILE_OUTPUT
, i
);
361 /* Returns a new constant register. Keep track of which have been
362 * referred to so that we can emit decls later.
364 * There is nothing in this code to bind this constant to any tracked
365 * value or manage any constant_buffer contents -- that's the
366 * responsibility of the calling code.
368 struct ureg_src
ureg_DECL_constant(struct ureg_program
*ureg
,
371 unsigned minconst
= index
, maxconst
= index
;
374 /* Inside existing range?
376 for (i
= 0; i
< ureg
->nr_constant_ranges
; i
++) {
377 if (ureg
->constant_range
[i
].first
<= index
&&
378 ureg
->constant_range
[i
].last
>= index
)
382 /* Extend existing range?
384 for (i
= 0; i
< ureg
->nr_constant_ranges
; i
++) {
385 if (ureg
->constant_range
[i
].last
== index
- 1) {
386 ureg
->constant_range
[i
].last
= index
;
390 if (ureg
->constant_range
[i
].first
== index
+ 1) {
391 ureg
->constant_range
[i
].first
= index
;
395 minconst
= MIN2(minconst
, ureg
->constant_range
[i
].first
);
396 maxconst
= MAX2(maxconst
, ureg
->constant_range
[i
].last
);
401 if (ureg
->nr_constant_ranges
< UREG_MAX_CONSTANT_RANGE
) {
402 i
= ureg
->nr_constant_ranges
++;
403 ureg
->constant_range
[i
].first
= index
;
404 ureg
->constant_range
[i
].last
= index
;
408 /* Collapse all ranges down to one:
411 ureg
->constant_range
[0].first
= minconst
;
412 ureg
->constant_range
[0].last
= maxconst
;
413 ureg
->nr_constant_ranges
= 1;
416 assert(i
< ureg
->nr_constant_ranges
);
417 assert(ureg
->constant_range
[i
].first
<= index
);
418 assert(ureg
->constant_range
[i
].last
>= index
);
419 return ureg_src_register( TGSI_FILE_CONSTANT
, index
);
423 /* Allocate a new temporary. Temporaries greater than UREG_MAX_TEMP
424 * are legal, but will not be released.
426 struct ureg_dst
ureg_DECL_temporary( struct ureg_program
*ureg
)
430 for (i
= 0; i
< UREG_MAX_TEMP
; i
+= 32) {
431 int bit
= ffs(~ureg
->temps_active
[i
/32]);
438 /* No reusable temps, so allocate a new one:
440 i
= ureg
->nr_temps
++;
443 if (i
< UREG_MAX_TEMP
)
444 ureg
->temps_active
[i
/32] |= 1 << (i
% 32);
446 if (i
>= ureg
->nr_temps
)
447 ureg
->nr_temps
= i
+ 1;
449 return ureg_dst_register( TGSI_FILE_TEMPORARY
, i
);
453 void ureg_release_temporary( struct ureg_program
*ureg
,
454 struct ureg_dst tmp
)
456 if(tmp
.File
== TGSI_FILE_TEMPORARY
)
457 if (tmp
.Index
< UREG_MAX_TEMP
)
458 ureg
->temps_active
[tmp
.Index
/32] &= ~(1 << (tmp
.Index
% 32));
462 /* Allocate a new address register.
464 struct ureg_dst
ureg_DECL_address( struct ureg_program
*ureg
)
466 if (ureg
->nr_addrs
< UREG_MAX_ADDR
)
467 return ureg_dst_register( TGSI_FILE_ADDRESS
, ureg
->nr_addrs
++ );
470 return ureg_dst_register( TGSI_FILE_ADDRESS
, 0 );
473 /* Allocate a new loop register.
476 ureg_DECL_loop(struct ureg_program
*ureg
)
478 if (ureg
->nr_loops
< UREG_MAX_LOOP
) {
479 return ureg_dst_register(TGSI_FILE_LOOP
, ureg
->nr_loops
++);
483 return ureg_dst_register(TGSI_FILE_LOOP
, 0);
486 /* Allocate a new predicate register.
489 ureg_DECL_predicate(struct ureg_program
*ureg
)
491 if (ureg
->nr_preds
< UREG_MAX_PRED
) {
492 return ureg_dst_register(TGSI_FILE_PREDICATE
, ureg
->nr_preds
++);
496 return ureg_dst_register(TGSI_FILE_PREDICATE
, 0);
499 /* Allocate a new sampler.
501 struct ureg_src
ureg_DECL_sampler( struct ureg_program
*ureg
,
506 for (i
= 0; i
< ureg
->nr_samplers
; i
++)
507 if (ureg
->sampler
[i
].Index
== nr
)
508 return ureg
->sampler
[i
];
510 if (i
< PIPE_MAX_SAMPLERS
) {
511 ureg
->sampler
[i
] = ureg_src_register( TGSI_FILE_SAMPLER
, nr
);
513 return ureg
->sampler
[i
];
517 return ureg
->sampler
[0];
522 match_or_expand_immediate( const unsigned *v
,
528 unsigned nr2
= *pnr2
;
533 for (i
= 0; i
< nr
; i
++) {
534 boolean found
= FALSE
;
536 for (j
= 0; j
< nr2
&& !found
; j
++) {
538 *swizzle
|= j
<< (i
* 2);
549 *swizzle
|= nr2
<< (i
* 2);
554 /* Actually expand immediate only when fully succeeded.
561 static struct ureg_src
562 decl_immediate( struct ureg_program
*ureg
,
570 /* Could do a first pass where we examine all existing immediates
574 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
575 if (ureg
->immediate
[i
].type
!= type
) {
578 if (match_or_expand_immediate(v
,
580 ureg
->immediate
[i
].value
.u
,
581 &ureg
->immediate
[i
].nr
,
587 if (ureg
->nr_immediates
< UREG_MAX_IMMEDIATE
) {
588 i
= ureg
->nr_immediates
++;
589 ureg
->immediate
[i
].type
= type
;
590 if (match_or_expand_immediate(v
,
592 ureg
->immediate
[i
].value
.u
,
593 &ureg
->immediate
[i
].nr
,
602 /* Make sure that all referenced elements are from this immediate.
603 * Has the effect of making size-one immediates into scalars.
605 for (j
= nr
; j
< 4; j
++) {
606 swizzle
|= (swizzle
& 0x3) << (j
* 2);
609 return ureg_swizzle(ureg_src_register(TGSI_FILE_IMMEDIATE
, i
),
610 (swizzle
>> 0) & 0x3,
611 (swizzle
>> 2) & 0x3,
612 (swizzle
>> 4) & 0x3,
613 (swizzle
>> 6) & 0x3);
618 ureg_DECL_immediate( struct ureg_program
*ureg
,
628 for (i
= 0; i
< nr
; i
++) {
632 return decl_immediate(ureg
, fu
.u
, nr
, TGSI_IMM_FLOAT32
);
637 ureg_DECL_immediate_uint( struct ureg_program
*ureg
,
641 return decl_immediate(ureg
, v
, nr
, TGSI_IMM_UINT32
);
646 ureg_DECL_immediate_int( struct ureg_program
*ureg
,
650 return decl_immediate(ureg
, (const unsigned *)v
, nr
, TGSI_IMM_INT32
);
655 ureg_emit_src( struct ureg_program
*ureg
,
656 struct ureg_src src
)
658 unsigned size
= 1 + (src
.Indirect
? 1 : 0);
660 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
663 assert(src
.File
!= TGSI_FILE_NULL
);
664 assert(src
.File
!= TGSI_FILE_OUTPUT
);
665 assert(src
.File
< TGSI_FILE_COUNT
);
668 out
[n
].src
.File
= src
.File
;
669 out
[n
].src
.SwizzleX
= src
.SwizzleX
;
670 out
[n
].src
.SwizzleY
= src
.SwizzleY
;
671 out
[n
].src
.SwizzleZ
= src
.SwizzleZ
;
672 out
[n
].src
.SwizzleW
= src
.SwizzleW
;
673 out
[n
].src
.Index
= src
.Index
;
674 out
[n
].src
.Negate
= src
.Negate
;
675 out
[0].src
.Absolute
= src
.Absolute
;
679 out
[0].src
.Indirect
= 1;
681 out
[n
].src
.File
= TGSI_FILE_ADDRESS
;
682 out
[n
].src
.SwizzleX
= src
.IndirectSwizzle
;
683 out
[n
].src
.SwizzleY
= src
.IndirectSwizzle
;
684 out
[n
].src
.SwizzleZ
= src
.IndirectSwizzle
;
685 out
[n
].src
.SwizzleW
= src
.IndirectSwizzle
;
686 out
[n
].src
.Index
= src
.IndirectIndex
;
695 ureg_emit_dst( struct ureg_program
*ureg
,
696 struct ureg_dst dst
)
699 (dst
.Indirect
? 1 : 0));
701 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
704 assert(dst
.File
!= TGSI_FILE_NULL
);
705 assert(dst
.File
!= TGSI_FILE_CONSTANT
);
706 assert(dst
.File
!= TGSI_FILE_INPUT
);
707 assert(dst
.File
!= TGSI_FILE_SAMPLER
);
708 assert(dst
.File
!= TGSI_FILE_IMMEDIATE
);
709 assert(dst
.File
< TGSI_FILE_COUNT
);
712 out
[n
].dst
.File
= dst
.File
;
713 out
[n
].dst
.WriteMask
= dst
.WriteMask
;
714 out
[n
].dst
.Indirect
= dst
.Indirect
;
715 out
[n
].dst
.Index
= dst
.Index
;
720 out
[n
].src
.File
= TGSI_FILE_ADDRESS
;
721 out
[n
].src
.SwizzleX
= dst
.IndirectSwizzle
;
722 out
[n
].src
.SwizzleY
= dst
.IndirectSwizzle
;
723 out
[n
].src
.SwizzleZ
= dst
.IndirectSwizzle
;
724 out
[n
].src
.SwizzleW
= dst
.IndirectSwizzle
;
725 out
[n
].src
.Index
= dst
.IndirectIndex
;
733 static void validate( unsigned opcode
,
738 const struct tgsi_opcode_info
*info
= tgsi_get_opcode_info( opcode
);
741 assert(nr_dst
== info
->num_dst
);
742 assert(nr_src
== info
->num_src
);
747 struct ureg_emit_insn_result
748 ureg_emit_insn(struct ureg_program
*ureg
,
753 unsigned pred_swizzle_x
,
754 unsigned pred_swizzle_y
,
755 unsigned pred_swizzle_z
,
756 unsigned pred_swizzle_w
,
760 union tgsi_any_token
*out
;
761 uint count
= predicate
? 2 : 1;
762 struct ureg_emit_insn_result result
;
764 validate( opcode
, num_dst
, num_src
);
766 out
= get_tokens( ureg
, DOMAIN_INSN
, count
);
767 out
[0].insn
= tgsi_default_instruction();
768 out
[0].insn
.Opcode
= opcode
;
769 out
[0].insn
.Saturate
= saturate
;
770 out
[0].insn
.NumDstRegs
= num_dst
;
771 out
[0].insn
.NumSrcRegs
= num_src
;
773 result
.insn_token
= ureg
->domain
[DOMAIN_INSN
].count
- count
;
774 result
.extended_token
= result
.insn_token
;
777 out
[0].insn
.Predicate
= 1;
778 out
[1].insn_predicate
= tgsi_default_instruction_predicate();
779 out
[1].insn_predicate
.Negate
= pred_negate
;
780 out
[1].insn_predicate
.SwizzleX
= pred_swizzle_x
;
781 out
[1].insn_predicate
.SwizzleY
= pred_swizzle_y
;
782 out
[1].insn_predicate
.SwizzleZ
= pred_swizzle_z
;
783 out
[1].insn_predicate
.SwizzleW
= pred_swizzle_w
;
786 ureg
->nr_instructions
++;
793 ureg_emit_label(struct ureg_program
*ureg
,
794 unsigned extended_token
,
795 unsigned *label_token
)
797 union tgsi_any_token
*out
, *insn
;
802 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
805 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
806 insn
->insn
.Label
= 1;
808 *label_token
= ureg
->domain
[DOMAIN_INSN
].count
- 1;
811 /* Will return a number which can be used in a label to point to the
812 * next instruction to be emitted.
815 ureg_get_instruction_number( struct ureg_program
*ureg
)
817 return ureg
->nr_instructions
;
820 /* Patch a given label (expressed as a token number) to point to a
821 * given instruction (expressed as an instruction number).
824 ureg_fixup_label(struct ureg_program
*ureg
,
825 unsigned label_token
,
826 unsigned instruction_number
)
828 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, label_token
);
830 out
->insn_label
.Label
= instruction_number
;
835 ureg_emit_texture(struct ureg_program
*ureg
,
836 unsigned extended_token
,
839 union tgsi_any_token
*out
, *insn
;
841 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
842 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
844 insn
->insn
.Texture
= 1;
847 out
[0].insn_texture
.Texture
= target
;
852 ureg_fixup_insn_size(struct ureg_program
*ureg
,
855 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, insn
);
857 assert(out
->insn
.Type
== TGSI_TOKEN_TYPE_INSTRUCTION
);
858 out
->insn
.NrTokens
= ureg
->domain
[DOMAIN_INSN
].count
- insn
- 1;
863 ureg_insn(struct ureg_program
*ureg
,
865 const struct ureg_dst
*dst
,
867 const struct ureg_src
*src
,
870 struct ureg_emit_insn_result insn
;
874 boolean negate
= FALSE
;
875 unsigned swizzle
[4] = { 0 };
877 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
878 predicate
= nr_dst
? dst
[0].Predicate
: FALSE
;
880 negate
= dst
[0].PredNegate
;
881 swizzle
[0] = dst
[0].PredSwizzleX
;
882 swizzle
[1] = dst
[0].PredSwizzleY
;
883 swizzle
[2] = dst
[0].PredSwizzleZ
;
884 swizzle
[3] = dst
[0].PredSwizzleW
;
887 insn
= ureg_emit_insn(ureg
,
899 for (i
= 0; i
< nr_dst
; i
++)
900 ureg_emit_dst( ureg
, dst
[i
] );
902 for (i
= 0; i
< nr_src
; i
++)
903 ureg_emit_src( ureg
, src
[i
] );
905 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
909 ureg_tex_insn(struct ureg_program
*ureg
,
911 const struct ureg_dst
*dst
,
914 const struct ureg_src
*src
,
917 struct ureg_emit_insn_result insn
;
921 boolean negate
= FALSE
;
922 unsigned swizzle
[4] = { 0 };
924 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
925 predicate
= nr_dst
? dst
[0].Predicate
: FALSE
;
927 negate
= dst
[0].PredNegate
;
928 swizzle
[0] = dst
[0].PredSwizzleX
;
929 swizzle
[1] = dst
[0].PredSwizzleY
;
930 swizzle
[2] = dst
[0].PredSwizzleZ
;
931 swizzle
[3] = dst
[0].PredSwizzleW
;
934 insn
= ureg_emit_insn(ureg
,
946 ureg_emit_texture( ureg
, insn
.extended_token
, target
);
948 for (i
= 0; i
< nr_dst
; i
++)
949 ureg_emit_dst( ureg
, dst
[i
] );
951 for (i
= 0; i
< nr_src
; i
++)
952 ureg_emit_src( ureg
, src
[i
] );
954 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
959 ureg_label_insn(struct ureg_program
*ureg
,
961 const struct ureg_src
*src
,
963 unsigned *label_token
)
965 struct ureg_emit_insn_result insn
;
968 insn
= ureg_emit_insn(ureg
,
980 ureg_emit_label( ureg
, insn
.extended_token
, label_token
);
982 for (i
= 0; i
< nr_src
; i
++)
983 ureg_emit_src( ureg
, src
[i
] );
985 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
990 static void emit_decl( struct ureg_program
*ureg
,
993 unsigned semantic_name
,
994 unsigned semantic_index
,
997 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 3 );
1000 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1001 out
[0].decl
.NrTokens
= 3;
1002 out
[0].decl
.File
= file
;
1003 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
; /* FIXME! */
1004 out
[0].decl
.Interpolate
= interp
;
1005 out
[0].decl
.Semantic
= 1;
1008 out
[1].decl_range
.First
=
1009 out
[1].decl_range
.Last
= index
;
1012 out
[2].decl_semantic
.Name
= semantic_name
;
1013 out
[2].decl_semantic
.Index
= semantic_index
;
1018 static void emit_decl_range( struct ureg_program
*ureg
,
1023 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 2 );
1026 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1027 out
[0].decl
.NrTokens
= 2;
1028 out
[0].decl
.File
= file
;
1029 out
[0].decl
.UsageMask
= 0xf;
1030 out
[0].decl
.Interpolate
= TGSI_INTERPOLATE_CONSTANT
;
1031 out
[0].decl
.Semantic
= 0;
1034 out
[1].decl_range
.First
= first
;
1035 out
[1].decl_range
.Last
= first
+ count
- 1;
1039 emit_immediate( struct ureg_program
*ureg
,
1043 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 5 );
1046 out
[0].imm
.Type
= TGSI_TOKEN_TYPE_IMMEDIATE
;
1047 out
[0].imm
.NrTokens
= 5;
1048 out
[0].imm
.DataType
= type
;
1049 out
[0].imm
.Padding
= 0;
1051 out
[1].imm_data
.Uint
= v
[0];
1052 out
[2].imm_data
.Uint
= v
[1];
1053 out
[3].imm_data
.Uint
= v
[2];
1054 out
[4].imm_data
.Uint
= v
[3];
1060 static void emit_decls( struct ureg_program
*ureg
)
1064 if (ureg
->processor
== TGSI_PROCESSOR_VERTEX
) {
1065 for (i
= 0; i
< UREG_MAX_INPUT
; i
++) {
1066 if (ureg
->vs_inputs
[i
/32] & (1 << (i
%32))) {
1067 emit_decl_range( ureg
, TGSI_FILE_INPUT
, i
, 1 );
1070 } else if (ureg
->processor
== TGSI_PROCESSOR_FRAGMENT
) {
1071 for (i
= 0; i
< ureg
->nr_fs_inputs
; i
++) {
1075 ureg
->fs_input
[i
].semantic_name
,
1076 ureg
->fs_input
[i
].semantic_index
,
1077 ureg
->fs_input
[i
].interp
);
1080 for (i
= 0; i
< ureg
->nr_gs_inputs
; i
++) {
1081 emit_decl_range(ureg
,
1083 ureg
->gs_input
[i
].index
,
1088 for (i
= 0; i
< ureg
->nr_system_values
; i
++) {
1090 TGSI_FILE_SYSTEM_VALUE
,
1091 ureg
->system_value
[i
].index
,
1092 ureg
->system_value
[i
].semantic_name
,
1093 ureg
->system_value
[i
].semantic_index
,
1094 TGSI_INTERPOLATE_CONSTANT
);
1097 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
1101 ureg
->output
[i
].semantic_name
,
1102 ureg
->output
[i
].semantic_index
,
1103 TGSI_INTERPOLATE_CONSTANT
);
1106 for (i
= 0; i
< ureg
->nr_samplers
; i
++) {
1107 emit_decl_range( ureg
,
1109 ureg
->sampler
[i
].Index
, 1 );
1112 if (ureg
->nr_constant_ranges
) {
1113 for (i
= 0; i
< ureg
->nr_constant_ranges
; i
++)
1114 emit_decl_range( ureg
,
1116 ureg
->constant_range
[i
].first
,
1117 (ureg
->constant_range
[i
].last
+ 1 -
1118 ureg
->constant_range
[i
].first
) );
1121 if (ureg
->nr_temps
) {
1122 emit_decl_range( ureg
,
1123 TGSI_FILE_TEMPORARY
,
1124 0, ureg
->nr_temps
);
1127 if (ureg
->nr_addrs
) {
1128 emit_decl_range( ureg
,
1130 0, ureg
->nr_addrs
);
1133 if (ureg
->nr_loops
) {
1134 emit_decl_range(ureg
,
1140 if (ureg
->nr_preds
) {
1141 emit_decl_range(ureg
,
1142 TGSI_FILE_PREDICATE
,
1147 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
1148 emit_immediate( ureg
,
1149 ureg
->immediate
[i
].value
.u
,
1150 ureg
->immediate
[i
].type
);
1154 /* Append the instruction tokens onto the declarations to build a
1155 * contiguous stream suitable to send to the driver.
1157 static void copy_instructions( struct ureg_program
*ureg
)
1159 unsigned nr_tokens
= ureg
->domain
[DOMAIN_INSN
].count
;
1160 union tgsi_any_token
*out
= get_tokens( ureg
,
1165 ureg
->domain
[DOMAIN_INSN
].tokens
,
1166 nr_tokens
* sizeof out
[0] );
1171 fixup_header_size(struct ureg_program
*ureg
)
1173 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_DECL
, 0 );
1175 out
->header
.BodySize
= ureg
->domain
[DOMAIN_DECL
].count
- 2;
1180 emit_header( struct ureg_program
*ureg
)
1182 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 2 );
1184 out
[0].header
.HeaderSize
= 2;
1185 out
[0].header
.BodySize
= 0;
1187 out
[1].processor
.Processor
= ureg
->processor
;
1188 out
[1].processor
.Padding
= 0;
1192 const struct tgsi_token
*ureg_finalize( struct ureg_program
*ureg
)
1194 const struct tgsi_token
*tokens
;
1196 emit_header( ureg
);
1198 copy_instructions( ureg
);
1199 fixup_header_size( ureg
);
1201 if (ureg
->domain
[0].tokens
== error_tokens
||
1202 ureg
->domain
[1].tokens
== error_tokens
) {
1203 debug_printf("%s: error in generated shader\n", __FUNCTION__
);
1208 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
1211 debug_printf("%s: emitted shader %d tokens:\n", __FUNCTION__
,
1212 ureg
->domain
[DOMAIN_DECL
].count
);
1213 tgsi_dump( tokens
, 0 );
1217 if (tokens
&& !tgsi_sanity_check(tokens
)) {
1218 debug_printf("tgsi_ureg.c, sanity check failed on generated tokens:\n");
1219 tgsi_dump(tokens
, 0);
1229 void *ureg_create_shader( struct ureg_program
*ureg
,
1230 struct pipe_context
*pipe
)
1232 struct pipe_shader_state state
;
1234 state
.tokens
= ureg_finalize(ureg
);
1238 if (ureg
->processor
== TGSI_PROCESSOR_VERTEX
)
1239 return pipe
->create_vs_state( pipe
, &state
);
1241 return pipe
->create_fs_state( pipe
, &state
);
1245 const struct tgsi_token
*ureg_get_tokens( struct ureg_program
*ureg
,
1246 unsigned *nr_tokens
)
1248 const struct tgsi_token
*tokens
;
1250 ureg_finalize(ureg
);
1252 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
1255 *nr_tokens
= ureg
->domain
[DOMAIN_DECL
].size
;
1257 ureg
->domain
[DOMAIN_DECL
].tokens
= 0;
1258 ureg
->domain
[DOMAIN_DECL
].size
= 0;
1259 ureg
->domain
[DOMAIN_DECL
].order
= 0;
1260 ureg
->domain
[DOMAIN_DECL
].count
= 0;
1266 struct ureg_program
*ureg_create( unsigned processor
)
1268 struct ureg_program
*ureg
= CALLOC_STRUCT( ureg_program
);
1272 ureg
->processor
= processor
;
1277 void ureg_destroy( struct ureg_program
*ureg
)
1281 for (i
= 0; i
< Elements(ureg
->domain
); i
++) {
1282 if (ureg
->domain
[i
].tokens
&&
1283 ureg
->domain
[i
].tokens
!= error_tokens
)
1284 FREE(ureg
->domain
[i
].tokens
);