1 /**************************************************************************
3 * Copyright 2009-2010 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE, INC AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 #include "pipe/p_context.h"
30 #include "pipe/p_state.h"
31 #include "tgsi/tgsi_ureg.h"
32 #include "tgsi/tgsi_build.h"
33 #include "tgsi/tgsi_info.h"
34 #include "tgsi/tgsi_dump.h"
35 #include "tgsi/tgsi_sanity.h"
36 #include "util/u_debug.h"
37 #include "util/u_memory.h"
38 #include "util/u_math.h"
40 union tgsi_any_token
{
41 struct tgsi_header header
;
42 struct tgsi_processor processor
;
43 struct tgsi_token token
;
44 struct tgsi_property prop
;
45 struct tgsi_property_data prop_data
;
46 struct tgsi_declaration decl
;
47 struct tgsi_declaration_range decl_range
;
48 struct tgsi_declaration_dimension decl_dim
;
49 struct tgsi_declaration_semantic decl_semantic
;
50 struct tgsi_declaration_resource decl_resource
;
51 struct tgsi_immediate imm
;
52 union tgsi_immediate_data imm_data
;
53 struct tgsi_instruction insn
;
54 struct tgsi_instruction_predicate insn_predicate
;
55 struct tgsi_instruction_label insn_label
;
56 struct tgsi_instruction_texture insn_texture
;
57 struct tgsi_texture_offset insn_texture_offset
;
58 struct tgsi_src_register src
;
59 struct tgsi_dimension dim
;
60 struct tgsi_dst_register dst
;
66 union tgsi_any_token
*tokens
;
72 #define UREG_MAX_INPUT PIPE_MAX_ATTRIBS
73 #define UREG_MAX_SYSTEM_VALUE PIPE_MAX_ATTRIBS
74 #define UREG_MAX_OUTPUT PIPE_MAX_ATTRIBS
75 #define UREG_MAX_CONSTANT_RANGE 32
76 #define UREG_MAX_IMMEDIATE 256
77 #define UREG_MAX_TEMP 256
78 #define UREG_MAX_ADDR 2
79 #define UREG_MAX_PRED 1
85 } constant_range
[UREG_MAX_CONSTANT_RANGE
];
86 unsigned nr_constant_ranges
;
95 struct pipe_context
*pipe
;
98 unsigned semantic_name
;
99 unsigned semantic_index
;
101 unsigned char cylindrical_wrap
;
102 unsigned char centroid
;
103 } fs_input
[UREG_MAX_INPUT
];
104 unsigned nr_fs_inputs
;
106 unsigned vs_inputs
[UREG_MAX_INPUT
/32];
110 unsigned semantic_name
;
111 unsigned semantic_index
;
112 } gs_input
[UREG_MAX_INPUT
];
113 unsigned nr_gs_inputs
;
117 unsigned semantic_name
;
118 unsigned semantic_index
;
119 } system_value
[UREG_MAX_SYSTEM_VALUE
];
120 unsigned nr_system_values
;
123 unsigned semantic_name
;
124 unsigned semantic_index
;
125 } output
[UREG_MAX_OUTPUT
];
136 } immediate
[UREG_MAX_IMMEDIATE
];
137 unsigned nr_immediates
;
139 struct ureg_src sampler
[PIPE_MAX_SAMPLERS
];
140 unsigned nr_samplers
;
145 unsigned return_type_x
;
146 unsigned return_type_y
;
147 unsigned return_type_z
;
148 unsigned return_type_w
;
149 } resource
[PIPE_MAX_SHADER_RESOURCES
];
150 unsigned nr_resources
;
152 unsigned temps_active
[UREG_MAX_TEMP
/ 32];
155 struct const_decl const_decls
;
156 struct const_decl const_decls2D
[PIPE_MAX_CONSTANT_BUFFERS
];
158 unsigned property_gs_input_prim
;
159 unsigned property_gs_output_prim
;
160 unsigned property_gs_max_vertices
;
161 unsigned char property_fs_coord_origin
; /* = TGSI_FS_COORD_ORIGIN_* */
162 unsigned char property_fs_coord_pixel_center
; /* = TGSI_FS_COORD_PIXEL_CENTER_* */
163 unsigned char property_fs_color0_writes_all_cbufs
; /* = TGSI_FS_COLOR0_WRITES_ALL_CBUFS * */
167 unsigned nr_instructions
;
169 struct ureg_tokens domain
[2];
172 static union tgsi_any_token error_tokens
[32];
/*
 * Put a token buffer into the error state.
 *
 * Any buffer currently attached is released with FREE, unless the pointer
 * is NULL or already refers to the static error_tokens array.  The buffer
 * pointer is then aimed at error_tokens and the capacity (size) is set to
 * the element count of that array.
 */
174 static void tokens_error( struct ureg_tokens
*tokens
)
176 if (tokens
->tokens
&& tokens
->tokens
!= error_tokens
)
177 FREE(tokens
->tokens
);
179 tokens
->tokens
= error_tokens
;
180 tokens
->size
= Elements(error_tokens
);
/*
 * Grow a token buffer until `count` more tokens fit behind the ones that
 * are already stored (tokens->count).
 *
 * The byte size before growth is captured in old_size.  A buffer that is
 * already the static error_tokens array is checked for before any growth
 * happens.  The capacity is kept a power of two: tokens->order is
 * pre-incremented and tokens->size set to 1 << order until
 * tokens->count + count fits.  The buffer is then resized with REALLOC, and
 * a NULL result puts the buffer into the error state via tokens_error().
 *
 * NOTE(review): byte sizes are computed with sizeof(unsigned) although the
 * elements are union tgsi_any_token -- presumably every member is exactly
 * one unsigned wide; confirm.
 * NOTE(review): the REALLOC result overwrites tokens->tokens directly, and
 * tokens_error() only calls FREE on a non-NULL pointer, so a failed resize
 * looks like it drops the previous allocation -- confirm against the
 * failure semantics of REALLOC in util/u_memory.h.
 */
185 static void tokens_expand( struct ureg_tokens
*tokens
,
188 unsigned old_size
= tokens
->size
* sizeof(unsigned);
190 if (tokens
->tokens
== error_tokens
) {
194 while (tokens
->count
+ count
> tokens
->size
) {
195 tokens
->size
= (1 << ++tokens
->order
);
198 tokens
->tokens
= REALLOC(tokens
->tokens
,
200 tokens
->size
* sizeof(unsigned));
201 if (tokens
->tokens
== NULL
) {
202 tokens_error(tokens
);
206 static void set_bad( struct ureg_program
*ureg
)
208 tokens_error(&ureg
->domain
[0]);
213 static union tgsi_any_token
*get_tokens( struct ureg_program
*ureg
,
217 struct ureg_tokens
*tokens
= &ureg
->domain
[domain
];
218 union tgsi_any_token
*result
;
220 if (tokens
->count
+ count
> tokens
->size
)
221 tokens_expand(tokens
, count
);
223 result
= &tokens
->tokens
[tokens
->count
];
224 tokens
->count
+= count
;
229 static union tgsi_any_token
*retrieve_token( struct ureg_program
*ureg
,
233 if (ureg
->domain
[domain
].tokens
== error_tokens
)
234 return &error_tokens
[0];
236 return &ureg
->domain
[domain
].tokens
[nr
];
241 static INLINE
struct ureg_dst
242 ureg_dst_register( unsigned file
,
248 dst
.WriteMask
= TGSI_WRITEMASK_XYZW
;
250 dst
.IndirectIndex
= 0;
251 dst
.IndirectSwizzle
= 0;
255 dst
.PredSwizzleX
= TGSI_SWIZZLE_X
;
256 dst
.PredSwizzleY
= TGSI_SWIZZLE_Y
;
257 dst
.PredSwizzleZ
= TGSI_SWIZZLE_Z
;
258 dst
.PredSwizzleW
= TGSI_SWIZZLE_W
;
266 ureg_property_gs_input_prim(struct ureg_program
*ureg
,
269 ureg
->property_gs_input_prim
= input_prim
;
273 ureg_property_gs_output_prim(struct ureg_program
*ureg
,
274 unsigned output_prim
)
276 ureg
->property_gs_output_prim
= output_prim
;
280 ureg_property_gs_max_vertices(struct ureg_program
*ureg
,
281 unsigned max_vertices
)
283 ureg
->property_gs_max_vertices
= max_vertices
;
287 ureg_property_fs_coord_origin(struct ureg_program
*ureg
,
288 unsigned fs_coord_origin
)
290 ureg
->property_fs_coord_origin
= fs_coord_origin
;
294 ureg_property_fs_coord_pixel_center(struct ureg_program
*ureg
,
295 unsigned fs_coord_pixel_center
)
297 ureg
->property_fs_coord_pixel_center
= fs_coord_pixel_center
;
301 ureg_property_fs_color0_writes_all_cbufs(struct ureg_program
*ureg
,
302 unsigned fs_color0_writes_all_cbufs
)
304 ureg
->property_fs_color0_writes_all_cbufs
= fs_color0_writes_all_cbufs
;
308 ureg_DECL_fs_input_cyl_centroid(struct ureg_program
*ureg
,
309 unsigned semantic_name
,
310 unsigned semantic_index
,
311 unsigned interp_mode
,
312 unsigned cylindrical_wrap
,
317 for (i
= 0; i
< ureg
->nr_fs_inputs
; i
++) {
318 if (ureg
->fs_input
[i
].semantic_name
== semantic_name
&&
319 ureg
->fs_input
[i
].semantic_index
== semantic_index
) {
324 if (ureg
->nr_fs_inputs
< UREG_MAX_INPUT
) {
325 ureg
->fs_input
[i
].semantic_name
= semantic_name
;
326 ureg
->fs_input
[i
].semantic_index
= semantic_index
;
327 ureg
->fs_input
[i
].interp
= interp_mode
;
328 ureg
->fs_input
[i
].cylindrical_wrap
= cylindrical_wrap
;
329 ureg
->fs_input
[i
].centroid
= centroid
;
330 ureg
->nr_fs_inputs
++;
336 return ureg_src_register(TGSI_FILE_INPUT
, i
);
/*
 * Declare vertex shader input number `index`.
 *
 * Asserts that the program is a vertex program, records the input by
 * setting bit (index % 32) of word (index / 32) in the ureg->vs_inputs
 * bitmask, and returns a TGSI_FILE_INPUT source register for that index.
 *
 * NOTE(review): `1 << (index % 32)` shifts a signed int; when
 * index % 32 == 31 the shift reaches the sign bit, which ISO C leaves
 * undefined.  An unsigned constant (1u) would avoid that.
 * NOTE(review): no range check of `index` against UREG_MAX_INPUT is visible
 * before vs_inputs (UREG_MAX_INPUT/32 words) is indexed -- confirm that
 * callers guarantee the range.
 */
341 ureg_DECL_vs_input( struct ureg_program
*ureg
,
344 assert(ureg
->processor
== TGSI_PROCESSOR_VERTEX
);
346 ureg
->vs_inputs
[index
/32] |= 1 << (index
% 32);
347 return ureg_src_register( TGSI_FILE_INPUT
, index
);
352 ureg_DECL_gs_input(struct ureg_program
*ureg
,
354 unsigned semantic_name
,
355 unsigned semantic_index
)
357 if (ureg
->nr_gs_inputs
< UREG_MAX_INPUT
) {
358 ureg
->gs_input
[ureg
->nr_gs_inputs
].index
= index
;
359 ureg
->gs_input
[ureg
->nr_gs_inputs
].semantic_name
= semantic_name
;
360 ureg
->gs_input
[ureg
->nr_gs_inputs
].semantic_index
= semantic_index
;
361 ureg
->nr_gs_inputs
++;
366 /* XXX: Add support for true 2D input registers. */
367 return ureg_src_register(TGSI_FILE_INPUT
, index
);
372 ureg_DECL_system_value(struct ureg_program
*ureg
,
374 unsigned semantic_name
,
375 unsigned semantic_index
)
377 if (ureg
->nr_system_values
< UREG_MAX_SYSTEM_VALUE
) {
378 ureg
->system_value
[ureg
->nr_system_values
].index
= index
;
379 ureg
->system_value
[ureg
->nr_system_values
].semantic_name
= semantic_name
;
380 ureg
->system_value
[ureg
->nr_system_values
].semantic_index
= semantic_index
;
381 ureg
->nr_system_values
++;
386 return ureg_src_register(TGSI_FILE_SYSTEM_VALUE
, index
);
391 ureg_DECL_output( struct ureg_program
*ureg
,
397 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
398 if (ureg
->output
[i
].semantic_name
== name
&&
399 ureg
->output
[i
].semantic_index
== index
)
403 if (ureg
->nr_outputs
< UREG_MAX_OUTPUT
) {
404 ureg
->output
[i
].semantic_name
= name
;
405 ureg
->output
[i
].semantic_index
= index
;
413 return ureg_dst_register( TGSI_FILE_OUTPUT
, i
);
417 /* Returns a new constant register. Keep track of which have been
418 * referred to so that we can emit decls later.
420 * Constant operands declared with this function must be addressed
421 * with a two-dimensional index.
423 * There is nothing in this code to bind this constant to any tracked
424 * value or manage any constant_buffer contents -- that's the
425 * responsibility of the calling code.
/*
 * Record a constant range [first, last] for the constant buffer selected
 * by index2D.
 *
 * The per-buffer declaration is taken from ureg->const_decls2D[index2D].
 * While fewer than UREG_MAX_CONSTANT_RANGE ranges are stored, a new slot is
 * claimed by post-incrementing nr_constant_ranges and filled with `first`
 * and `last`.
 *
 * NOTE(review): the element address is formed from index2D before the
 * assert that checks index2D < PIPE_MAX_CONSTANT_BUFFERS, and the assert is
 * the only visible guard; with asserts compiled out an out-of-range index2D
 * would address memory past const_decls2D -- confirm callers validate it.
 */
428 ureg_DECL_constant2D(struct ureg_program
*ureg
,
433 struct const_decl
*decl
= &ureg
->const_decls2D
[index2D
];
435 assert(index2D
< PIPE_MAX_CONSTANT_BUFFERS
);
437 if (decl
->nr_constant_ranges
< UREG_MAX_CONSTANT_RANGE
) {
438 uint i
= decl
->nr_constant_ranges
++;
440 decl
->constant_range
[i
].first
= first
;
441 decl
->constant_range
[i
].last
= last
;
446 /* A one-dimensional, deprecated version of ureg_DECL_constant2D().
448 * Constant operands declared with this function must be addressed
449 * with a one-dimensional index.
452 ureg_DECL_constant(struct ureg_program
*ureg
,
455 struct const_decl
*decl
= &ureg
->const_decls
;
456 unsigned minconst
= index
, maxconst
= index
;
459 /* Inside existing range?
461 for (i
= 0; i
< decl
->nr_constant_ranges
; i
++) {
462 if (decl
->constant_range
[i
].first
<= index
&&
463 decl
->constant_range
[i
].last
>= index
) {
468 /* Extend existing range?
470 for (i
= 0; i
< decl
->nr_constant_ranges
; i
++) {
471 if (decl
->constant_range
[i
].last
== index
- 1) {
472 decl
->constant_range
[i
].last
= index
;
476 if (decl
->constant_range
[i
].first
== index
+ 1) {
477 decl
->constant_range
[i
].first
= index
;
481 minconst
= MIN2(minconst
, decl
->constant_range
[i
].first
);
482 maxconst
= MAX2(maxconst
, decl
->constant_range
[i
].last
);
487 if (decl
->nr_constant_ranges
< UREG_MAX_CONSTANT_RANGE
) {
488 i
= decl
->nr_constant_ranges
++;
489 decl
->constant_range
[i
].first
= index
;
490 decl
->constant_range
[i
].last
= index
;
494 /* Collapse all ranges down to one:
497 decl
->constant_range
[0].first
= minconst
;
498 decl
->constant_range
[0].last
= maxconst
;
499 decl
->nr_constant_ranges
= 1;
502 assert(i
< decl
->nr_constant_ranges
);
503 assert(decl
->constant_range
[i
].first
<= index
);
504 assert(decl
->constant_range
[i
].last
>= index
);
505 return ureg_src_register(TGSI_FILE_CONSTANT
, index
);
509 /* Allocate a new temporary. Temporaries greater than UREG_MAX_TEMP
510 * are legal, but will not be released.
512 struct ureg_dst
ureg_DECL_temporary( struct ureg_program
*ureg
)
516 for (i
= 0; i
< UREG_MAX_TEMP
; i
+= 32) {
517 int bit
= ffs(~ureg
->temps_active
[i
/32]);
524 /* No reusable temps, so allocate a new one:
526 i
= ureg
->nr_temps
++;
529 if (i
< UREG_MAX_TEMP
)
530 ureg
->temps_active
[i
/32] |= 1 << (i
% 32);
532 if (i
>= ureg
->nr_temps
)
533 ureg
->nr_temps
= i
+ 1;
535 return ureg_dst_register( TGSI_FILE_TEMPORARY
, i
);
/*
 * Mark a temporary register as no longer in use.
 *
 * Only acts when tmp.File is TGSI_FILE_TEMPORARY and tmp.Index is below
 * UREG_MAX_TEMP; in that case bit (Index % 32) of word (Index / 32) in
 * ureg->temps_active is cleared.  Any other register is left alone.
 *
 * NOTE(review): `1 << (tmp.Index % 32)` is a signed shift; for bit 31 it
 * reaches the sign bit, which ISO C leaves undefined.  An unsigned constant
 * (1u) would avoid that.
 */
539 void ureg_release_temporary( struct ureg_program
*ureg
,
540 struct ureg_dst tmp
)
542 if(tmp
.File
== TGSI_FILE_TEMPORARY
)
543 if (tmp
.Index
< UREG_MAX_TEMP
)
544 ureg
->temps_active
[tmp
.Index
/32] &= ~(1 << (tmp
.Index
% 32));
548 /* Allocate a new address register.
550 struct ureg_dst
ureg_DECL_address( struct ureg_program
*ureg
)
552 if (ureg
->nr_addrs
< UREG_MAX_ADDR
)
553 return ureg_dst_register( TGSI_FILE_ADDRESS
, ureg
->nr_addrs
++ );
556 return ureg_dst_register( TGSI_FILE_ADDRESS
, 0 );
559 /* Allocate a new predicate register.
562 ureg_DECL_predicate(struct ureg_program
*ureg
)
564 if (ureg
->nr_preds
< UREG_MAX_PRED
) {
565 return ureg_dst_register(TGSI_FILE_PREDICATE
, ureg
->nr_preds
++);
569 return ureg_dst_register(TGSI_FILE_PREDICATE
, 0);
572 /* Allocate a new sampler.
574 struct ureg_src
ureg_DECL_sampler( struct ureg_program
*ureg
,
579 for (i
= 0; i
< ureg
->nr_samplers
; i
++)
580 if (ureg
->sampler
[i
].Index
== nr
)
581 return ureg
->sampler
[i
];
583 if (i
< PIPE_MAX_SAMPLERS
) {
584 ureg
->sampler
[i
] = ureg_src_register( TGSI_FILE_SAMPLER
, nr
);
586 return ureg
->sampler
[i
];
590 return ureg
->sampler
[0];
594 * Allocate a new shader resource.
597 ureg_DECL_resource(struct ureg_program
*ureg
,
600 unsigned return_type_x
,
601 unsigned return_type_y
,
602 unsigned return_type_z
,
603 unsigned return_type_w
)
605 struct ureg_src reg
= ureg_src_register(TGSI_FILE_RESOURCE
, index
);
608 for (i
= 0; i
< ureg
->nr_resources
; i
++) {
609 if (ureg
->resource
[i
].index
== index
) {
614 if (i
< PIPE_MAX_SHADER_RESOURCES
) {
615 ureg
->resource
[i
].index
= index
;
616 ureg
->resource
[i
].target
= target
;
617 ureg
->resource
[i
].return_type_x
= return_type_x
;
618 ureg
->resource
[i
].return_type_y
= return_type_y
;
619 ureg
->resource
[i
].return_type_z
= return_type_z
;
620 ureg
->resource
[i
].return_type_w
= return_type_w
;
621 ureg
->nr_resources
++;
630 match_or_expand_immediate( const unsigned *v
,
636 unsigned nr2
= *pnr2
;
641 for (i
= 0; i
< nr
; i
++) {
642 boolean found
= FALSE
;
644 for (j
= 0; j
< nr2
&& !found
; j
++) {
646 *swizzle
|= j
<< (i
* 2);
657 *swizzle
|= nr2
<< (i
* 2);
662 /* Actually expand immediate only when fully succeeded.
669 static struct ureg_src
670 decl_immediate( struct ureg_program
*ureg
,
676 unsigned swizzle
= 0;
678 /* Could do a first pass where we examine all existing immediates
682 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
683 if (ureg
->immediate
[i
].type
!= type
) {
686 if (match_or_expand_immediate(v
,
688 ureg
->immediate
[i
].value
.u
,
689 &ureg
->immediate
[i
].nr
,
695 if (ureg
->nr_immediates
< UREG_MAX_IMMEDIATE
) {
696 i
= ureg
->nr_immediates
++;
697 ureg
->immediate
[i
].type
= type
;
698 if (match_or_expand_immediate(v
,
700 ureg
->immediate
[i
].value
.u
,
701 &ureg
->immediate
[i
].nr
,
710 /* Make sure that all referenced elements are from this immediate.
711 * Has the effect of making size-one immediates into scalars.
713 for (j
= nr
; j
< 4; j
++) {
714 swizzle
|= (swizzle
& 0x3) << (j
* 2);
717 return ureg_swizzle(ureg_src_register(TGSI_FILE_IMMEDIATE
, i
),
718 (swizzle
>> 0) & 0x3,
719 (swizzle
>> 2) & 0x3,
720 (swizzle
>> 4) & 0x3,
721 (swizzle
>> 6) & 0x3);
726 ureg_DECL_immediate( struct ureg_program
*ureg
,
736 for (i
= 0; i
< nr
; i
++) {
740 return decl_immediate(ureg
, fu
.u
, nr
, TGSI_IMM_FLOAT32
);
745 ureg_DECL_immediate_uint( struct ureg_program
*ureg
,
749 return decl_immediate(ureg
, v
, nr
, TGSI_IMM_UINT32
);
754 ureg_DECL_immediate_block_uint( struct ureg_program
*ureg
,
761 if (ureg
->nr_immediates
+ (nr
+ 3) / 4 > UREG_MAX_IMMEDIATE
) {
763 return ureg_src_register(TGSI_FILE_IMMEDIATE
, 0);
766 index
= ureg
->nr_immediates
;
767 ureg
->nr_immediates
+= (nr
+ 3) / 4;
769 for (i
= index
; i
< ureg
->nr_immediates
; i
++) {
770 ureg
->immediate
[i
].type
= TGSI_IMM_UINT32
;
771 ureg
->immediate
[i
].nr
= nr
> 4 ? 4 : nr
;
772 memcpy(ureg
->immediate
[i
].value
.u
,
774 ureg
->immediate
[i
].nr
* sizeof(uint
));
778 return ureg_src_register(TGSI_FILE_IMMEDIATE
, index
);
783 ureg_DECL_immediate_int( struct ureg_program
*ureg
,
787 return decl_immediate(ureg
, (const unsigned *)v
, nr
, TGSI_IMM_INT32
);
792 ureg_emit_src( struct ureg_program
*ureg
,
793 struct ureg_src src
)
795 unsigned size
= 1 + (src
.Indirect
? 1 : 0) +
796 (src
.Dimension
? (src
.DimIndirect
? 2 : 1) : 0);
798 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
801 assert(src
.File
!= TGSI_FILE_NULL
);
802 assert(src
.File
< TGSI_FILE_COUNT
);
805 out
[n
].src
.File
= src
.File
;
806 out
[n
].src
.SwizzleX
= src
.SwizzleX
;
807 out
[n
].src
.SwizzleY
= src
.SwizzleY
;
808 out
[n
].src
.SwizzleZ
= src
.SwizzleZ
;
809 out
[n
].src
.SwizzleW
= src
.SwizzleW
;
810 out
[n
].src
.Index
= src
.Index
;
811 out
[n
].src
.Negate
= src
.Negate
;
812 out
[0].src
.Absolute
= src
.Absolute
;
816 out
[0].src
.Indirect
= 1;
818 out
[n
].src
.File
= src
.IndirectFile
;
819 out
[n
].src
.SwizzleX
= src
.IndirectSwizzle
;
820 out
[n
].src
.SwizzleY
= src
.IndirectSwizzle
;
821 out
[n
].src
.SwizzleZ
= src
.IndirectSwizzle
;
822 out
[n
].src
.SwizzleW
= src
.IndirectSwizzle
;
823 out
[n
].src
.Index
= src
.IndirectIndex
;
828 if (src
.DimIndirect
) {
829 out
[0].src
.Dimension
= 1;
830 out
[n
].dim
.Indirect
= 1;
831 out
[n
].dim
.Dimension
= 0;
832 out
[n
].dim
.Padding
= 0;
833 out
[n
].dim
.Index
= src
.DimensionIndex
;
836 out
[n
].src
.File
= src
.DimIndFile
;
837 out
[n
].src
.SwizzleX
= src
.DimIndSwizzle
;
838 out
[n
].src
.SwizzleY
= src
.DimIndSwizzle
;
839 out
[n
].src
.SwizzleZ
= src
.DimIndSwizzle
;
840 out
[n
].src
.SwizzleW
= src
.DimIndSwizzle
;
841 out
[n
].src
.Index
= src
.DimIndIndex
;
843 out
[0].src
.Dimension
= 1;
844 out
[n
].dim
.Indirect
= 0;
845 out
[n
].dim
.Dimension
= 0;
846 out
[n
].dim
.Padding
= 0;
847 out
[n
].dim
.Index
= src
.DimensionIndex
;
857 ureg_emit_dst( struct ureg_program
*ureg
,
858 struct ureg_dst dst
)
861 (dst
.Indirect
? 1 : 0));
863 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_INSN
, size
);
866 assert(dst
.File
!= TGSI_FILE_NULL
);
867 assert(dst
.File
!= TGSI_FILE_CONSTANT
);
868 assert(dst
.File
!= TGSI_FILE_INPUT
);
869 assert(dst
.File
!= TGSI_FILE_SAMPLER
);
870 assert(dst
.File
!= TGSI_FILE_RESOURCE
);
871 assert(dst
.File
!= TGSI_FILE_IMMEDIATE
);
872 assert(dst
.File
< TGSI_FILE_COUNT
);
875 out
[n
].dst
.File
= dst
.File
;
876 out
[n
].dst
.WriteMask
= dst
.WriteMask
;
877 out
[n
].dst
.Indirect
= dst
.Indirect
;
878 out
[n
].dst
.Index
= dst
.Index
;
883 out
[n
].src
.File
= TGSI_FILE_ADDRESS
;
884 out
[n
].src
.SwizzleX
= dst
.IndirectSwizzle
;
885 out
[n
].src
.SwizzleY
= dst
.IndirectSwizzle
;
886 out
[n
].src
.SwizzleZ
= dst
.IndirectSwizzle
;
887 out
[n
].src
.SwizzleW
= dst
.IndirectSwizzle
;
888 out
[n
].src
.Index
= dst
.IndirectIndex
;
896 static void validate( unsigned opcode
,
901 const struct tgsi_opcode_info
*info
= tgsi_get_opcode_info( opcode
);
904 assert(nr_dst
== info
->num_dst
);
905 assert(nr_src
== info
->num_src
);
910 struct ureg_emit_insn_result
911 ureg_emit_insn(struct ureg_program
*ureg
,
916 unsigned pred_swizzle_x
,
917 unsigned pred_swizzle_y
,
918 unsigned pred_swizzle_z
,
919 unsigned pred_swizzle_w
,
923 union tgsi_any_token
*out
;
924 uint count
= predicate
? 2 : 1;
925 struct ureg_emit_insn_result result
;
927 validate( opcode
, num_dst
, num_src
);
929 out
= get_tokens( ureg
, DOMAIN_INSN
, count
);
930 out
[0].insn
= tgsi_default_instruction();
931 out
[0].insn
.Opcode
= opcode
;
932 out
[0].insn
.Saturate
= saturate
;
933 out
[0].insn
.NumDstRegs
= num_dst
;
934 out
[0].insn
.NumSrcRegs
= num_src
;
936 result
.insn_token
= ureg
->domain
[DOMAIN_INSN
].count
- count
;
937 result
.extended_token
= result
.insn_token
;
940 out
[0].insn
.Predicate
= 1;
941 out
[1].insn_predicate
= tgsi_default_instruction_predicate();
942 out
[1].insn_predicate
.Negate
= pred_negate
;
943 out
[1].insn_predicate
.SwizzleX
= pred_swizzle_x
;
944 out
[1].insn_predicate
.SwizzleY
= pred_swizzle_y
;
945 out
[1].insn_predicate
.SwizzleZ
= pred_swizzle_z
;
946 out
[1].insn_predicate
.SwizzleW
= pred_swizzle_w
;
949 ureg
->nr_instructions
++;
956 ureg_emit_label(struct ureg_program
*ureg
,
957 unsigned extended_token
,
958 unsigned *label_token
)
960 union tgsi_any_token
*out
, *insn
;
965 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
968 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
969 insn
->insn
.Label
= 1;
971 *label_token
= ureg
->domain
[DOMAIN_INSN
].count
- 1;
974 /* Will return a number which can be used in a label to point to the
975 * next instruction to be emitted.
978 ureg_get_instruction_number( struct ureg_program
*ureg
)
980 return ureg
->nr_instructions
;
983 /* Patch a given label (expressed as a token number) to point to a
984 * given instruction (expressed as an instruction number).
987 ureg_fixup_label(struct ureg_program
*ureg
,
988 unsigned label_token
,
989 unsigned instruction_number
)
991 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, label_token
);
993 out
->insn_label
.Label
= instruction_number
;
998 ureg_emit_texture(struct ureg_program
*ureg
,
999 unsigned extended_token
,
1000 unsigned target
, unsigned num_offsets
)
1002 union tgsi_any_token
*out
, *insn
;
1004 out
= get_tokens( ureg
, DOMAIN_INSN
, 1 );
1005 insn
= retrieve_token( ureg
, DOMAIN_INSN
, extended_token
);
1007 insn
->insn
.Texture
= 1;
1010 out
[0].insn_texture
.Texture
= target
;
1011 out
[0].insn_texture
.NumOffsets
= num_offsets
;
1015 ureg_emit_texture_offset(struct ureg_program
*ureg
,
1016 const struct tgsi_texture_offset
*offset
)
1018 union tgsi_any_token
*out
;
1020 out
= get_tokens( ureg
, DOMAIN_INSN
, 1);
1023 out
[0].insn_texture_offset
= *offset
;
1029 ureg_fixup_insn_size(struct ureg_program
*ureg
,
1032 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_INSN
, insn
);
1034 assert(out
->insn
.Type
== TGSI_TOKEN_TYPE_INSTRUCTION
);
1035 out
->insn
.NrTokens
= ureg
->domain
[DOMAIN_INSN
].count
- insn
- 1;
1040 ureg_insn(struct ureg_program
*ureg
,
1042 const struct ureg_dst
*dst
,
1044 const struct ureg_src
*src
,
1047 struct ureg_emit_insn_result insn
;
1051 boolean negate
= FALSE
;
1052 unsigned swizzle
[4] = { 0 };
1054 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
1055 predicate
= nr_dst
? dst
[0].Predicate
: FALSE
;
1057 negate
= dst
[0].PredNegate
;
1058 swizzle
[0] = dst
[0].PredSwizzleX
;
1059 swizzle
[1] = dst
[0].PredSwizzleY
;
1060 swizzle
[2] = dst
[0].PredSwizzleZ
;
1061 swizzle
[3] = dst
[0].PredSwizzleW
;
1064 insn
= ureg_emit_insn(ureg
,
1076 for (i
= 0; i
< nr_dst
; i
++)
1077 ureg_emit_dst( ureg
, dst
[i
] );
1079 for (i
= 0; i
< nr_src
; i
++)
1080 ureg_emit_src( ureg
, src
[i
] );
1082 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
1086 ureg_tex_insn(struct ureg_program
*ureg
,
1088 const struct ureg_dst
*dst
,
1091 const struct tgsi_texture_offset
*texoffsets
,
1093 const struct ureg_src
*src
,
1096 struct ureg_emit_insn_result insn
;
1100 boolean negate
= FALSE
;
1101 unsigned swizzle
[4] = { 0 };
1103 saturate
= nr_dst
? dst
[0].Saturate
: FALSE
;
1104 predicate
= nr_dst
? dst
[0].Predicate
: FALSE
;
1106 negate
= dst
[0].PredNegate
;
1107 swizzle
[0] = dst
[0].PredSwizzleX
;
1108 swizzle
[1] = dst
[0].PredSwizzleY
;
1109 swizzle
[2] = dst
[0].PredSwizzleZ
;
1110 swizzle
[3] = dst
[0].PredSwizzleW
;
1113 insn
= ureg_emit_insn(ureg
,
1125 ureg_emit_texture( ureg
, insn
.extended_token
, target
, nr_offset
);
1127 for (i
= 0; i
< nr_offset
; i
++)
1128 ureg_emit_texture_offset( ureg
, &texoffsets
[i
]);
1130 for (i
= 0; i
< nr_dst
; i
++)
1131 ureg_emit_dst( ureg
, dst
[i
] );
1133 for (i
= 0; i
< nr_src
; i
++)
1134 ureg_emit_src( ureg
, src
[i
] );
1136 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
1141 ureg_label_insn(struct ureg_program
*ureg
,
1143 const struct ureg_src
*src
,
1145 unsigned *label_token
)
1147 struct ureg_emit_insn_result insn
;
1150 insn
= ureg_emit_insn(ureg
,
1162 ureg_emit_label( ureg
, insn
.extended_token
, label_token
);
1164 for (i
= 0; i
< nr_src
; i
++)
1165 ureg_emit_src( ureg
, src
[i
] );
1167 ureg_fixup_insn_size( ureg
, insn
.insn_token
);
1172 emit_decl_semantic(struct ureg_program
*ureg
,
1175 unsigned semantic_name
,
1176 unsigned semantic_index
)
1178 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 3);
1181 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1182 out
[0].decl
.NrTokens
= 3;
1183 out
[0].decl
.File
= file
;
1184 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
; /* FIXME! */
1185 out
[0].decl
.Semantic
= 1;
1188 out
[1].decl_range
.First
= index
;
1189 out
[1].decl_range
.Last
= index
;
1192 out
[2].decl_semantic
.Name
= semantic_name
;
1193 out
[2].decl_semantic
.Index
= semantic_index
;
1198 emit_decl_fs(struct ureg_program
*ureg
,
1201 unsigned semantic_name
,
1202 unsigned semantic_index
,
1203 unsigned interpolate
,
1204 unsigned cylindrical_wrap
,
1207 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 3);
1210 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1211 out
[0].decl
.NrTokens
= 3;
1212 out
[0].decl
.File
= file
;
1213 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
; /* FIXME! */
1214 out
[0].decl
.Interpolate
= interpolate
;
1215 out
[0].decl
.Semantic
= 1;
1216 out
[0].decl
.CylindricalWrap
= cylindrical_wrap
;
1217 out
[0].decl
.Centroid
= centroid
;
1220 out
[1].decl_range
.First
= index
;
1221 out
[1].decl_range
.Last
= index
;
1224 out
[2].decl_semantic
.Name
= semantic_name
;
1225 out
[2].decl_semantic
.Index
= semantic_index
;
1229 static void emit_decl_range( struct ureg_program
*ureg
,
1234 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 2 );
1237 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1238 out
[0].decl
.NrTokens
= 2;
1239 out
[0].decl
.File
= file
;
1240 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1241 out
[0].decl
.Interpolate
= TGSI_INTERPOLATE_CONSTANT
;
1242 out
[0].decl
.Semantic
= 0;
1245 out
[1].decl_range
.First
= first
;
1246 out
[1].decl_range
.Last
= first
+ count
- 1;
1250 emit_decl_range2D(struct ureg_program
*ureg
,
1256 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 3);
1259 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1260 out
[0].decl
.NrTokens
= 3;
1261 out
[0].decl
.File
= file
;
1262 out
[0].decl
.UsageMask
= TGSI_WRITEMASK_XYZW
;
1263 out
[0].decl
.Interpolate
= TGSI_INTERPOLATE_CONSTANT
;
1264 out
[0].decl
.Dimension
= 1;
1267 out
[1].decl_range
.First
= first
;
1268 out
[1].decl_range
.Last
= last
;
1271 out
[2].decl_dim
.Index2D
= index2D
;
1275 emit_decl_resource(struct ureg_program
*ureg
,
1278 unsigned return_type_x
,
1279 unsigned return_type_y
,
1280 unsigned return_type_z
,
1281 unsigned return_type_w
)
1283 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 3);
1286 out
[0].decl
.Type
= TGSI_TOKEN_TYPE_DECLARATION
;
1287 out
[0].decl
.NrTokens
= 3;
1288 out
[0].decl
.File
= TGSI_FILE_RESOURCE
;
1289 out
[0].decl
.UsageMask
= 0xf;
1290 out
[0].decl
.Interpolate
= TGSI_INTERPOLATE_CONSTANT
;
1293 out
[1].decl_range
.First
= index
;
1294 out
[1].decl_range
.Last
= index
;
1297 out
[2].decl_resource
.Resource
= target
;
1298 out
[2].decl_resource
.ReturnTypeX
= return_type_x
;
1299 out
[2].decl_resource
.ReturnTypeY
= return_type_y
;
1300 out
[2].decl_resource
.ReturnTypeZ
= return_type_z
;
1301 out
[2].decl_resource
.ReturnTypeW
= return_type_w
;
1305 emit_immediate( struct ureg_program
*ureg
,
1309 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 5 );
1312 out
[0].imm
.Type
= TGSI_TOKEN_TYPE_IMMEDIATE
;
1313 out
[0].imm
.NrTokens
= 5;
1314 out
[0].imm
.DataType
= type
;
1315 out
[0].imm
.Padding
= 0;
1317 out
[1].imm_data
.Uint
= v
[0];
1318 out
[2].imm_data
.Uint
= v
[1];
1319 out
[3].imm_data
.Uint
= v
[2];
1320 out
[4].imm_data
.Uint
= v
[3];
1324 emit_property(struct ureg_program
*ureg
,
1328 union tgsi_any_token
*out
= get_tokens(ureg
, DOMAIN_DECL
, 2);
1331 out
[0].prop
.Type
= TGSI_TOKEN_TYPE_PROPERTY
;
1332 out
[0].prop
.NrTokens
= 2;
1333 out
[0].prop
.PropertyName
= name
;
1335 out
[1].prop_data
.Data
= data
;
1339 static void emit_decls( struct ureg_program
*ureg
)
1343 if (ureg
->property_gs_input_prim
!= ~0) {
1344 assert(ureg
->processor
== TGSI_PROCESSOR_GEOMETRY
);
1347 TGSI_PROPERTY_GS_INPUT_PRIM
,
1348 ureg
->property_gs_input_prim
);
1351 if (ureg
->property_gs_output_prim
!= ~0) {
1352 assert(ureg
->processor
== TGSI_PROCESSOR_GEOMETRY
);
1355 TGSI_PROPERTY_GS_OUTPUT_PRIM
,
1356 ureg
->property_gs_output_prim
);
1359 if (ureg
->property_gs_max_vertices
!= ~0) {
1360 assert(ureg
->processor
== TGSI_PROCESSOR_GEOMETRY
);
1363 TGSI_PROPERTY_GS_MAX_OUTPUT_VERTICES
,
1364 ureg
->property_gs_max_vertices
);
1367 if (ureg
->property_fs_coord_origin
) {
1368 assert(ureg
->processor
== TGSI_PROCESSOR_FRAGMENT
);
1371 TGSI_PROPERTY_FS_COORD_ORIGIN
,
1372 ureg
->property_fs_coord_origin
);
1375 if (ureg
->property_fs_coord_pixel_center
) {
1376 assert(ureg
->processor
== TGSI_PROCESSOR_FRAGMENT
);
1379 TGSI_PROPERTY_FS_COORD_PIXEL_CENTER
,
1380 ureg
->property_fs_coord_pixel_center
);
1383 if (ureg
->property_fs_color0_writes_all_cbufs
) {
1384 assert(ureg
->processor
== TGSI_PROCESSOR_FRAGMENT
);
1387 TGSI_PROPERTY_FS_COLOR0_WRITES_ALL_CBUFS
,
1388 ureg
->property_fs_color0_writes_all_cbufs
);
1391 if (ureg
->processor
== TGSI_PROCESSOR_VERTEX
) {
1392 for (i
= 0; i
< UREG_MAX_INPUT
; i
++) {
1393 if (ureg
->vs_inputs
[i
/32] & (1 << (i
%32))) {
1394 emit_decl_range( ureg
, TGSI_FILE_INPUT
, i
, 1 );
1397 } else if (ureg
->processor
== TGSI_PROCESSOR_FRAGMENT
) {
1398 for (i
= 0; i
< ureg
->nr_fs_inputs
; i
++) {
1402 ureg
->fs_input
[i
].semantic_name
,
1403 ureg
->fs_input
[i
].semantic_index
,
1404 ureg
->fs_input
[i
].interp
,
1405 ureg
->fs_input
[i
].cylindrical_wrap
,
1406 ureg
->fs_input
[i
].centroid
);
1409 for (i
= 0; i
< ureg
->nr_gs_inputs
; i
++) {
1410 emit_decl_semantic(ureg
,
1412 ureg
->gs_input
[i
].index
,
1413 ureg
->gs_input
[i
].semantic_name
,
1414 ureg
->gs_input
[i
].semantic_index
);
1418 for (i
= 0; i
< ureg
->nr_system_values
; i
++) {
1419 emit_decl_semantic(ureg
,
1420 TGSI_FILE_SYSTEM_VALUE
,
1421 ureg
->system_value
[i
].index
,
1422 ureg
->system_value
[i
].semantic_name
,
1423 ureg
->system_value
[i
].semantic_index
);
1426 for (i
= 0; i
< ureg
->nr_outputs
; i
++) {
1427 emit_decl_semantic(ureg
,
1430 ureg
->output
[i
].semantic_name
,
1431 ureg
->output
[i
].semantic_index
);
1434 for (i
= 0; i
< ureg
->nr_samplers
; i
++) {
1435 emit_decl_range( ureg
,
1437 ureg
->sampler
[i
].Index
, 1 );
1440 for (i
= 0; i
< ureg
->nr_resources
; i
++) {
1441 emit_decl_resource(ureg
,
1442 ureg
->resource
[i
].index
,
1443 ureg
->resource
[i
].target
,
1444 ureg
->resource
[i
].return_type_x
,
1445 ureg
->resource
[i
].return_type_y
,
1446 ureg
->resource
[i
].return_type_z
,
1447 ureg
->resource
[i
].return_type_w
);
1450 if (ureg
->const_decls
.nr_constant_ranges
) {
1451 for (i
= 0; i
< ureg
->const_decls
.nr_constant_ranges
; i
++) {
1452 emit_decl_range(ureg
,
1454 ureg
->const_decls
.constant_range
[i
].first
,
1455 ureg
->const_decls
.constant_range
[i
].last
- ureg
->const_decls
.constant_range
[i
].first
+ 1);
1459 for (i
= 0; i
< PIPE_MAX_CONSTANT_BUFFERS
; i
++) {
1460 struct const_decl
*decl
= &ureg
->const_decls2D
[i
];
1462 if (decl
->nr_constant_ranges
) {
1465 for (j
= 0; j
< decl
->nr_constant_ranges
; j
++) {
1466 emit_decl_range2D(ureg
,
1468 decl
->constant_range
[j
].first
,
1469 decl
->constant_range
[j
].last
,
1475 if (ureg
->nr_temps
) {
1476 emit_decl_range( ureg
,
1477 TGSI_FILE_TEMPORARY
,
1478 0, ureg
->nr_temps
);
1481 if (ureg
->nr_addrs
) {
1482 emit_decl_range( ureg
,
1484 0, ureg
->nr_addrs
);
1487 if (ureg
->nr_preds
) {
1488 emit_decl_range(ureg
,
1489 TGSI_FILE_PREDICATE
,
1494 for (i
= 0; i
< ureg
->nr_immediates
; i
++) {
1495 emit_immediate( ureg
,
1496 ureg
->immediate
[i
].value
.u
,
1497 ureg
->immediate
[i
].type
);
1501 /* Append the instruction tokens onto the declarations to build a
1502 * contiguous stream suitable to send to the driver.
1504 static void copy_instructions( struct ureg_program
*ureg
)
1506 unsigned nr_tokens
= ureg
->domain
[DOMAIN_INSN
].count
;
1507 union tgsi_any_token
*out
= get_tokens( ureg
,
1512 ureg
->domain
[DOMAIN_INSN
].tokens
,
1513 nr_tokens
* sizeof out
[0] );
1518 fixup_header_size(struct ureg_program
*ureg
)
1520 union tgsi_any_token
*out
= retrieve_token( ureg
, DOMAIN_DECL
, 0 );
1522 out
->header
.BodySize
= ureg
->domain
[DOMAIN_DECL
].count
- 2;
1527 emit_header( struct ureg_program
*ureg
)
1529 union tgsi_any_token
*out
= get_tokens( ureg
, DOMAIN_DECL
, 2 );
1531 out
[0].header
.HeaderSize
= 2;
1532 out
[0].header
.BodySize
= 0;
1534 out
[1].processor
.Processor
= ureg
->processor
;
1535 out
[1].processor
.Padding
= 0;
1539 const struct tgsi_token
*ureg_finalize( struct ureg_program
*ureg
)
1541 const struct tgsi_token
*tokens
;
1543 emit_header( ureg
);
1545 copy_instructions( ureg
);
1546 fixup_header_size( ureg
);
1548 if (ureg
->domain
[0].tokens
== error_tokens
||
1549 ureg
->domain
[1].tokens
== error_tokens
) {
1550 debug_printf("%s: error in generated shader\n", __FUNCTION__
);
1555 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
1558 debug_printf("%s: emitted shader %d tokens:\n", __FUNCTION__
,
1559 ureg
->domain
[DOMAIN_DECL
].count
);
1560 tgsi_dump( tokens
, 0 );
1564 if (tokens
&& !tgsi_sanity_check(tokens
)) {
1565 debug_printf("tgsi_ureg.c, sanity check failed on generated tokens:\n");
1566 tgsi_dump(tokens
, 0);
/*
 * Finalize the program and hand the resulting token stream to the driver.
 *
 * state.tokens receives the result of ureg_finalize().  A program whose
 * processor is TGSI_PROCESSOR_VERTEX is passed to pipe->create_vs_state();
 * the remaining visible path calls pipe->create_fs_state().
 *
 * NOTE(review): only TGSI_PROCESSOR_VERTEX is tested here, yet other parts
 * of this file handle TGSI_PROCESSOR_GEOMETRY programs as well; such a
 * program appears to end up in create_fs_state() -- confirm whether a
 * dedicated geometry path is needed.
 */
1576 void *ureg_create_shader( struct ureg_program
*ureg
,
1577 struct pipe_context
*pipe
)
1579 struct pipe_shader_state state
;
1581 state
.tokens
= ureg_finalize(ureg
);
1585 if (ureg
->processor
== TGSI_PROCESSOR_VERTEX
)
1586 return pipe
->create_vs_state( pipe
, &state
);
1588 return pipe
->create_fs_state( pipe
, &state
);
/*
 * Finalize the program and transfer its token buffer to the caller.
 *
 * After ureg_finalize() the address of the first token in the DOMAIN_DECL
 * buffer is taken, and that domain's `size` is stored through nr_tokens.
 * The domain's tokens, size, order and count fields are then zeroed, so
 * ureg_destroy() no longer sees (or frees) the buffer that was handed out;
 * presumably the caller releases it later with ureg_free_tokens().
 *
 * NOTE(review): `size` is the power-of-two capacity maintained by
 * tokens_expand(), whereas ureg_finalize() prints `count` as the number of
 * emitted tokens -- confirm that callers really expect the capacity here.
 * NOTE(review): the return value of ureg_finalize() is not used; if the
 * domain is in the error state the pointer taken here would refer to the
 * static error_tokens array, which must never reach FREE -- confirm there
 * is a guard for that case.
 */
1592 const struct tgsi_token
*ureg_get_tokens( struct ureg_program
*ureg
,
1593 unsigned *nr_tokens
)
1595 const struct tgsi_token
*tokens
;
1597 ureg_finalize(ureg
);
1599 tokens
= &ureg
->domain
[DOMAIN_DECL
].tokens
[0].token
;
1602 *nr_tokens
= ureg
->domain
[DOMAIN_DECL
].size
;
1604 ureg
->domain
[DOMAIN_DECL
].tokens
= 0;
1605 ureg
->domain
[DOMAIN_DECL
].size
= 0;
1606 ureg
->domain
[DOMAIN_DECL
].order
= 0;
1607 ureg
->domain
[DOMAIN_DECL
].count
= 0;
1613 void ureg_free_tokens( const struct tgsi_token
*tokens
)
1615 FREE((struct tgsi_token
*)tokens
);
1619 struct ureg_program
*ureg_create( unsigned processor
)
1621 struct ureg_program
*ureg
= CALLOC_STRUCT( ureg_program
);
1625 ureg
->processor
= processor
;
1626 ureg
->property_gs_input_prim
= ~0;
1627 ureg
->property_gs_output_prim
= ~0;
1628 ureg
->property_gs_max_vertices
= ~0;
1633 void ureg_destroy( struct ureg_program
*ureg
)
1637 for (i
= 0; i
< Elements(ureg
->domain
); i
++) {
1638 if (ureg
->domain
[i
].tokens
&&
1639 ureg
->domain
[i
].tokens
!= error_tokens
)
1640 FREE(ureg
->domain
[i
].tokens
);