1 /**************************************************************************
3 * Copyright 2007 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 * Keith Whitwell <keithw@vmware.com>
34 #include "main/imports.h"
35 #include "main/hash.h"
36 #include "main/mtypes.h"
37 #include "program/prog_parameter.h"
38 #include "program/prog_print.h"
39 #include "program/programopt.h"
41 #include "pipe/p_context.h"
42 #include "pipe/p_defines.h"
43 #include "pipe/p_shader_tokens.h"
44 #include "draw/draw_context.h"
45 #include "tgsi/tgsi_dump.h"
46 #include "tgsi/tgsi_emulate.h"
47 #include "tgsi/tgsi_parse.h"
48 #include "tgsi/tgsi_ureg.h"
51 #include "st_cb_bitmap.h"
52 #include "st_cb_drawpixels.h"
53 #include "st_context.h"
54 #include "st_program.h"
55 #include "st_mesa_to_tgsi.h"
56 #include "st_atifs_to_tgsi.h"
57 #include "cso_cache/cso_context.h"
62 * Delete a vertex program variant. Note the caller must unlink
63 * the variant from the linked list.
66 delete_vp_variant(struct st_context
*st
, struct st_vp_variant
*vpv
)
68 if (vpv
->driver_shader
)
69 cso_delete_vertex_shader(st
->cso_context
, vpv
->driver_shader
);
72 draw_delete_vertex_shader( st
->draw
, vpv
->draw_shader
);
75 ureg_free_tokens(vpv
->tgsi
.tokens
);
83 * Clean out any old compilations:
86 st_release_vp_variants( struct st_context
*st
,
87 struct st_vertex_program
*stvp
)
89 struct st_vp_variant
*vpv
;
91 for (vpv
= stvp
->variants
; vpv
; ) {
92 struct st_vp_variant
*next
= vpv
->next
;
93 delete_vp_variant(st
, vpv
);
97 stvp
->variants
= NULL
;
99 if (stvp
->tgsi
.tokens
) {
100 tgsi_free_tokens(stvp
->tgsi
.tokens
);
101 stvp
->tgsi
.tokens
= NULL
;
108 * Delete a fragment program variant. Note the caller must unlink
109 * the variant from the linked list.
112 delete_fp_variant(struct st_context
*st
, struct st_fp_variant
*fpv
)
114 if (fpv
->driver_shader
)
115 cso_delete_fragment_shader(st
->cso_context
, fpv
->driver_shader
);
121 * Free all variants of a fragment program.
124 st_release_fp_variants(struct st_context
*st
, struct st_fragment_program
*stfp
)
126 struct st_fp_variant
*fpv
;
128 for (fpv
= stfp
->variants
; fpv
; ) {
129 struct st_fp_variant
*next
= fpv
->next
;
130 delete_fp_variant(st
, fpv
);
134 stfp
->variants
= NULL
;
136 if (stfp
->tgsi
.tokens
) {
137 ureg_free_tokens(stfp
->tgsi
.tokens
);
138 stfp
->tgsi
.tokens
= NULL
;
144 * Delete a basic program variant. Note the caller must unlink
145 * the variant from the linked list.
148 delete_basic_variant(struct st_context
*st
, struct st_basic_variant
*v
,
151 if (v
->driver_shader
) {
153 case GL_TESS_CONTROL_PROGRAM_NV
:
154 cso_delete_tessctrl_shader(st
->cso_context
, v
->driver_shader
);
156 case GL_TESS_EVALUATION_PROGRAM_NV
:
157 cso_delete_tesseval_shader(st
->cso_context
, v
->driver_shader
);
159 case GL_GEOMETRY_PROGRAM_NV
:
160 cso_delete_geometry_shader(st
->cso_context
, v
->driver_shader
);
162 case GL_COMPUTE_PROGRAM_NV
:
163 cso_delete_compute_shader(st
->cso_context
, v
->driver_shader
);
166 assert(!"this shouldn't occur");
175 * Free all basic program variants.
178 st_release_basic_variants(struct st_context
*st
, GLenum target
,
179 struct st_basic_variant
**variants
,
180 struct pipe_shader_state
*tgsi
)
182 struct st_basic_variant
*v
;
184 for (v
= *variants
; v
; ) {
185 struct st_basic_variant
*next
= v
->next
;
186 delete_basic_variant(st
, v
, target
);
193 ureg_free_tokens(tgsi
->tokens
);
200 * Free all variants of a compute program.
203 st_release_cp_variants(struct st_context
*st
, struct st_compute_program
*stcp
)
205 struct st_basic_variant
**variants
= &stcp
->variants
;
206 struct st_basic_variant
*v
;
208 for (v
= *variants
; v
; ) {
209 struct st_basic_variant
*next
= v
->next
;
210 delete_basic_variant(st
, v
, stcp
->Base
.Base
.Target
);
216 if (stcp
->tgsi
.prog
) {
217 ureg_free_tokens(stcp
->tgsi
.prog
);
218 stcp
->tgsi
.prog
= NULL
;
224 * Translate a vertex program.
227 st_translate_vertex_program(struct st_context
*st
,
228 struct st_vertex_program
*stvp
)
230 struct ureg_program
*ureg
;
231 enum pipe_error error
;
232 unsigned num_outputs
= 0;
234 unsigned input_to_index
[VERT_ATTRIB_MAX
] = {0};
235 unsigned output_slot_to_attr
[VARYING_SLOT_MAX
] = {0};
236 ubyte output_semantic_name
[VARYING_SLOT_MAX
] = {0};
237 ubyte output_semantic_index
[VARYING_SLOT_MAX
] = {0};
239 stvp
->num_inputs
= 0;
241 if (stvp
->Base
.IsPositionInvariant
)
242 _mesa_insert_mvp_code(st
->ctx
, &stvp
->Base
);
245 * Determine number of inputs, the mappings between VERT_ATTRIB_x
246 * and TGSI generic input indexes, plus input attrib semantic info.
248 for (attr
= 0; attr
< VERT_ATTRIB_MAX
; attr
++) {
249 if ((stvp
->Base
.Base
.InputsRead
& BITFIELD64_BIT(attr
)) != 0) {
250 input_to_index
[attr
] = stvp
->num_inputs
;
251 stvp
->index_to_input
[stvp
->num_inputs
] = attr
;
253 if ((stvp
->Base
.Base
.DoubleInputsRead
& BITFIELD64_BIT(attr
)) != 0) {
254 /* add placeholder for second part of a double attribute */
255 stvp
->index_to_input
[stvp
->num_inputs
] = ST_DOUBLE_ATTRIB_PLACEHOLDER
;
260 /* bit of a hack, presetup potentially unused edgeflag input */
261 input_to_index
[VERT_ATTRIB_EDGEFLAG
] = stvp
->num_inputs
;
262 stvp
->index_to_input
[stvp
->num_inputs
] = VERT_ATTRIB_EDGEFLAG
;
264 /* Compute mapping of vertex program outputs to slots.
266 for (attr
= 0; attr
< VARYING_SLOT_MAX
; attr
++) {
267 if ((stvp
->Base
.Base
.OutputsWritten
& BITFIELD64_BIT(attr
)) == 0) {
268 stvp
->result_to_output
[attr
] = ~0;
271 unsigned slot
= num_outputs
++;
273 stvp
->result_to_output
[attr
] = slot
;
274 output_slot_to_attr
[slot
] = attr
;
277 case VARYING_SLOT_POS
:
278 output_semantic_name
[slot
] = TGSI_SEMANTIC_POSITION
;
279 output_semantic_index
[slot
] = 0;
281 case VARYING_SLOT_COL0
:
282 output_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
283 output_semantic_index
[slot
] = 0;
285 case VARYING_SLOT_COL1
:
286 output_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
287 output_semantic_index
[slot
] = 1;
289 case VARYING_SLOT_BFC0
:
290 output_semantic_name
[slot
] = TGSI_SEMANTIC_BCOLOR
;
291 output_semantic_index
[slot
] = 0;
293 case VARYING_SLOT_BFC1
:
294 output_semantic_name
[slot
] = TGSI_SEMANTIC_BCOLOR
;
295 output_semantic_index
[slot
] = 1;
297 case VARYING_SLOT_FOGC
:
298 output_semantic_name
[slot
] = TGSI_SEMANTIC_FOG
;
299 output_semantic_index
[slot
] = 0;
301 case VARYING_SLOT_PSIZ
:
302 output_semantic_name
[slot
] = TGSI_SEMANTIC_PSIZE
;
303 output_semantic_index
[slot
] = 0;
305 case VARYING_SLOT_CLIP_DIST0
:
306 output_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
307 output_semantic_index
[slot
] = 0;
309 case VARYING_SLOT_CLIP_DIST1
:
310 output_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
311 output_semantic_index
[slot
] = 1;
313 case VARYING_SLOT_EDGE
:
316 case VARYING_SLOT_CLIP_VERTEX
:
317 output_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPVERTEX
;
318 output_semantic_index
[slot
] = 0;
320 case VARYING_SLOT_LAYER
:
321 output_semantic_name
[slot
] = TGSI_SEMANTIC_LAYER
;
322 output_semantic_index
[slot
] = 0;
324 case VARYING_SLOT_VIEWPORT
:
325 output_semantic_name
[slot
] = TGSI_SEMANTIC_VIEWPORT_INDEX
;
326 output_semantic_index
[slot
] = 0;
329 case VARYING_SLOT_TEX0
:
330 case VARYING_SLOT_TEX1
:
331 case VARYING_SLOT_TEX2
:
332 case VARYING_SLOT_TEX3
:
333 case VARYING_SLOT_TEX4
:
334 case VARYING_SLOT_TEX5
:
335 case VARYING_SLOT_TEX6
:
336 case VARYING_SLOT_TEX7
:
337 if (st
->needs_texcoord_semantic
) {
338 output_semantic_name
[slot
] = TGSI_SEMANTIC_TEXCOORD
;
339 output_semantic_index
[slot
] = attr
- VARYING_SLOT_TEX0
;
343 case VARYING_SLOT_VAR0
:
345 assert(attr
>= VARYING_SLOT_VAR0
||
346 (attr
>= VARYING_SLOT_TEX0
&& attr
<= VARYING_SLOT_TEX7
));
347 output_semantic_name
[slot
] = TGSI_SEMANTIC_GENERIC
;
348 output_semantic_index
[slot
] =
349 st_get_generic_varying_index(st
, attr
);
354 /* similar hack to above, presetup potentially unused edgeflag output */
355 stvp
->result_to_output
[VARYING_SLOT_EDGE
] = num_outputs
;
356 output_semantic_name
[num_outputs
] = TGSI_SEMANTIC_EDGEFLAG
;
357 output_semantic_index
[num_outputs
] = 0;
359 if (!stvp
->glsl_to_tgsi
)
360 _mesa_remove_output_reads(&stvp
->Base
.Base
, PROGRAM_OUTPUT
);
362 ureg
= ureg_create_with_screen(TGSI_PROCESSOR_VERTEX
, st
->pipe
->screen
);
366 if (stvp
->Base
.Base
.ClipDistanceArraySize
)
367 ureg_property(ureg
, TGSI_PROPERTY_NUM_CLIPDIST_ENABLED
,
368 stvp
->Base
.Base
.ClipDistanceArraySize
);
370 if (ST_DEBUG
& DEBUG_MESA
) {
371 _mesa_print_program(&stvp
->Base
.Base
);
372 _mesa_print_program_parameters(st
->ctx
, &stvp
->Base
.Base
);
376 if (stvp
->glsl_to_tgsi
) {
377 error
= st_translate_program(st
->ctx
,
378 TGSI_PROCESSOR_VERTEX
,
385 NULL
, /* inputSlotToAttr */
386 NULL
, /* input semantic name */
387 NULL
, /* input semantic index */
388 NULL
, /* interp mode */
389 NULL
, /* interp location */
392 stvp
->result_to_output
,
394 output_semantic_name
,
395 output_semantic_index
);
397 st_translate_stream_output_info(stvp
->glsl_to_tgsi
,
398 stvp
->result_to_output
,
399 &stvp
->tgsi
.stream_output
);
401 free_glsl_to_tgsi_visitor(stvp
->glsl_to_tgsi
);
402 stvp
->glsl_to_tgsi
= NULL
;
404 error
= st_translate_mesa_program(st
->ctx
,
405 TGSI_PROCESSOR_VERTEX
,
411 NULL
, /* input semantic name */
412 NULL
, /* input semantic index */
416 stvp
->result_to_output
,
417 output_semantic_name
,
418 output_semantic_index
);
421 debug_printf("%s: failed to translate Mesa program:\n", __func__
);
422 _mesa_print_program(&stvp
->Base
.Base
);
427 stvp
->tgsi
.tokens
= ureg_get_tokens(ureg
, NULL
);
429 return stvp
->tgsi
.tokens
!= NULL
;
432 static struct st_vp_variant
*
433 st_create_vp_variant(struct st_context
*st
,
434 struct st_vertex_program
*stvp
,
435 const struct st_vp_variant_key
*key
)
437 struct st_vp_variant
*vpv
= CALLOC_STRUCT(st_vp_variant
);
438 struct pipe_context
*pipe
= st
->pipe
;
441 vpv
->tgsi
.tokens
= tgsi_dup_tokens(stvp
->tgsi
.tokens
);
442 vpv
->tgsi
.stream_output
= stvp
->tgsi
.stream_output
;
443 vpv
->num_inputs
= stvp
->num_inputs
;
445 /* Emulate features. */
446 if (key
->clamp_color
|| key
->passthrough_edgeflags
) {
447 const struct tgsi_token
*tokens
;
449 (key
->clamp_color
? TGSI_EMU_CLAMP_COLOR_OUTPUTS
: 0) |
450 (key
->passthrough_edgeflags
? TGSI_EMU_PASSTHROUGH_EDGEFLAG
: 0);
452 tokens
= tgsi_emulate(vpv
->tgsi
.tokens
, flags
);
455 tgsi_free_tokens(vpv
->tgsi
.tokens
);
456 vpv
->tgsi
.tokens
= tokens
;
458 if (key
->passthrough_edgeflags
)
461 fprintf(stderr
, "mesa: cannot emulate deprecated features\n");
464 if (ST_DEBUG
& DEBUG_TGSI
) {
465 tgsi_dump(vpv
->tgsi
.tokens
, 0);
469 vpv
->driver_shader
= pipe
->create_vs_state(pipe
, &vpv
->tgsi
);
475 * Find/create a vertex program variant.
477 struct st_vp_variant
*
478 st_get_vp_variant(struct st_context
*st
,
479 struct st_vertex_program
*stvp
,
480 const struct st_vp_variant_key
*key
)
482 struct st_vp_variant
*vpv
;
484 /* Search for existing variant */
485 for (vpv
= stvp
->variants
; vpv
; vpv
= vpv
->next
) {
486 if (memcmp(&vpv
->key
, key
, sizeof(*key
)) == 0) {
493 vpv
= st_create_vp_variant(st
, stvp
, key
);
495 /* insert into list */
496 vpv
->next
= stvp
->variants
;
497 stvp
->variants
= vpv
;
506 st_translate_interp(enum glsl_interp_qualifier glsl_qual
, bool is_color
)
509 case INTERP_QUALIFIER_NONE
:
511 return TGSI_INTERPOLATE_COLOR
;
512 return TGSI_INTERPOLATE_PERSPECTIVE
;
513 case INTERP_QUALIFIER_SMOOTH
:
514 return TGSI_INTERPOLATE_PERSPECTIVE
;
515 case INTERP_QUALIFIER_FLAT
:
516 return TGSI_INTERPOLATE_CONSTANT
;
517 case INTERP_QUALIFIER_NOPERSPECTIVE
:
518 return TGSI_INTERPOLATE_LINEAR
;
520 assert(0 && "unexpected interp mode in st_translate_interp()");
521 return TGSI_INTERPOLATE_PERSPECTIVE
;
527 * Translate a Mesa fragment shader into a TGSI shader.
530 st_translate_fragment_program(struct st_context
*st
,
531 struct st_fragment_program
*stfp
)
533 GLuint outputMapping
[FRAG_RESULT_MAX
];
534 GLuint inputMapping
[VARYING_SLOT_MAX
];
535 GLuint inputSlotToAttr
[VARYING_SLOT_MAX
];
536 GLuint interpMode
[PIPE_MAX_SHADER_INPUTS
]; /* XXX size? */
537 GLuint interpLocation
[PIPE_MAX_SHADER_INPUTS
];
539 GLbitfield64 inputsRead
;
540 struct ureg_program
*ureg
;
542 GLboolean write_all
= GL_FALSE
;
544 ubyte input_semantic_name
[PIPE_MAX_SHADER_INPUTS
];
545 ubyte input_semantic_index
[PIPE_MAX_SHADER_INPUTS
];
546 uint fs_num_inputs
= 0;
548 ubyte fs_output_semantic_name
[PIPE_MAX_SHADER_OUTPUTS
];
549 ubyte fs_output_semantic_index
[PIPE_MAX_SHADER_OUTPUTS
];
550 uint fs_num_outputs
= 0;
552 memset(inputSlotToAttr
, ~0, sizeof(inputSlotToAttr
));
554 if (!stfp
->glsl_to_tgsi
) {
555 _mesa_remove_output_reads(&stfp
->Base
.Base
, PROGRAM_OUTPUT
);
556 if (st
->ctx
->Const
.GLSLFragCoordIsSysVal
)
557 _mesa_program_fragment_position_to_sysval(&stfp
->Base
.Base
);
561 * Convert Mesa program inputs to TGSI input register semantics.
563 inputsRead
= stfp
->Base
.Base
.InputsRead
;
564 for (attr
= 0; attr
< VARYING_SLOT_MAX
; attr
++) {
565 if ((inputsRead
& BITFIELD64_BIT(attr
)) != 0) {
566 const GLuint slot
= fs_num_inputs
++;
568 inputMapping
[attr
] = slot
;
569 inputSlotToAttr
[slot
] = attr
;
570 if (stfp
->Base
.IsCentroid
& BITFIELD64_BIT(attr
))
571 interpLocation
[slot
] = TGSI_INTERPOLATE_LOC_CENTROID
;
572 else if (stfp
->Base
.IsSample
& BITFIELD64_BIT(attr
))
573 interpLocation
[slot
] = TGSI_INTERPOLATE_LOC_SAMPLE
;
575 interpLocation
[slot
] = TGSI_INTERPOLATE_LOC_CENTER
;
578 case VARYING_SLOT_POS
:
579 input_semantic_name
[slot
] = TGSI_SEMANTIC_POSITION
;
580 input_semantic_index
[slot
] = 0;
581 interpMode
[slot
] = TGSI_INTERPOLATE_LINEAR
;
583 case VARYING_SLOT_COL0
:
584 input_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
585 input_semantic_index
[slot
] = 0;
586 interpMode
[slot
] = st_translate_interp(stfp
->Base
.InterpQualifier
[attr
],
589 case VARYING_SLOT_COL1
:
590 input_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
591 input_semantic_index
[slot
] = 1;
592 interpMode
[slot
] = st_translate_interp(stfp
->Base
.InterpQualifier
[attr
],
595 case VARYING_SLOT_FOGC
:
596 input_semantic_name
[slot
] = TGSI_SEMANTIC_FOG
;
597 input_semantic_index
[slot
] = 0;
598 interpMode
[slot
] = TGSI_INTERPOLATE_PERSPECTIVE
;
600 case VARYING_SLOT_FACE
:
601 input_semantic_name
[slot
] = TGSI_SEMANTIC_FACE
;
602 input_semantic_index
[slot
] = 0;
603 interpMode
[slot
] = TGSI_INTERPOLATE_CONSTANT
;
605 case VARYING_SLOT_PRIMITIVE_ID
:
606 input_semantic_name
[slot
] = TGSI_SEMANTIC_PRIMID
;
607 input_semantic_index
[slot
] = 0;
608 interpMode
[slot
] = TGSI_INTERPOLATE_CONSTANT
;
610 case VARYING_SLOT_LAYER
:
611 input_semantic_name
[slot
] = TGSI_SEMANTIC_LAYER
;
612 input_semantic_index
[slot
] = 0;
613 interpMode
[slot
] = TGSI_INTERPOLATE_CONSTANT
;
615 case VARYING_SLOT_VIEWPORT
:
616 input_semantic_name
[slot
] = TGSI_SEMANTIC_VIEWPORT_INDEX
;
617 input_semantic_index
[slot
] = 0;
618 interpMode
[slot
] = TGSI_INTERPOLATE_CONSTANT
;
620 case VARYING_SLOT_CLIP_DIST0
:
621 input_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
622 input_semantic_index
[slot
] = 0;
623 interpMode
[slot
] = TGSI_INTERPOLATE_PERSPECTIVE
;
625 case VARYING_SLOT_CLIP_DIST1
:
626 input_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
627 input_semantic_index
[slot
] = 1;
628 interpMode
[slot
] = TGSI_INTERPOLATE_PERSPECTIVE
;
630 /* In most cases, there is nothing special about these
631 * inputs, so adopt a convention to use the generic
632 * semantic name and the mesa VARYING_SLOT_ number as the
635 * All that is required is that the vertex shader labels
636 * its own outputs similarly, and that the vertex shader
637 * generates at least every output required by the
638 * fragment shader plus fixed-function hardware (such as
641 * However, some drivers may need us to identify the PNTC and TEXi
642 * varyings if, for example, their capability to replace them with
643 * sprite coordinates is limited.
645 case VARYING_SLOT_PNTC
:
646 if (st
->needs_texcoord_semantic
) {
647 input_semantic_name
[slot
] = TGSI_SEMANTIC_PCOORD
;
648 input_semantic_index
[slot
] = 0;
649 interpMode
[slot
] = TGSI_INTERPOLATE_LINEAR
;
653 case VARYING_SLOT_TEX0
:
654 case VARYING_SLOT_TEX1
:
655 case VARYING_SLOT_TEX2
:
656 case VARYING_SLOT_TEX3
:
657 case VARYING_SLOT_TEX4
:
658 case VARYING_SLOT_TEX5
:
659 case VARYING_SLOT_TEX6
:
660 case VARYING_SLOT_TEX7
:
661 if (st
->needs_texcoord_semantic
) {
662 input_semantic_name
[slot
] = TGSI_SEMANTIC_TEXCOORD
;
663 input_semantic_index
[slot
] = attr
- VARYING_SLOT_TEX0
;
665 st_translate_interp(stfp
->Base
.InterpQualifier
[attr
], FALSE
);
669 case VARYING_SLOT_VAR0
:
671 /* Semantic indices should be zero-based because drivers may choose
672 * to assign a fixed slot determined by that index.
673 * This is useful because ARB_separate_shader_objects uses location
674 * qualifiers for linkage, and if the semantic index corresponds to
675 * these locations, linkage passes in the driver become unecessary.
677 * If needs_texcoord_semantic is true, no semantic indices will be
678 * consumed for the TEXi varyings, and we can base the locations of
679 * the user varyings on VAR0. Otherwise, we use TEX0 as base index.
681 assert(attr
>= VARYING_SLOT_VAR0
|| attr
== VARYING_SLOT_PNTC
||
682 (attr
>= VARYING_SLOT_TEX0
&& attr
<= VARYING_SLOT_TEX7
));
683 input_semantic_name
[slot
] = TGSI_SEMANTIC_GENERIC
;
684 input_semantic_index
[slot
] = st_get_generic_varying_index(st
, attr
);
685 if (attr
== VARYING_SLOT_PNTC
)
686 interpMode
[slot
] = TGSI_INTERPOLATE_LINEAR
;
688 interpMode
[slot
] = st_translate_interp(stfp
->Base
.InterpQualifier
[attr
],
694 inputMapping
[attr
] = -1;
699 * Semantics and mapping for outputs
703 GLbitfield64 outputsWritten
= stfp
->Base
.Base
.OutputsWritten
;
705 /* if z is written, emit that first */
706 if (outputsWritten
& BITFIELD64_BIT(FRAG_RESULT_DEPTH
)) {
707 fs_output_semantic_name
[fs_num_outputs
] = TGSI_SEMANTIC_POSITION
;
708 fs_output_semantic_index
[fs_num_outputs
] = 0;
709 outputMapping
[FRAG_RESULT_DEPTH
] = fs_num_outputs
;
711 outputsWritten
&= ~(1 << FRAG_RESULT_DEPTH
);
714 if (outputsWritten
& BITFIELD64_BIT(FRAG_RESULT_STENCIL
)) {
715 fs_output_semantic_name
[fs_num_outputs
] = TGSI_SEMANTIC_STENCIL
;
716 fs_output_semantic_index
[fs_num_outputs
] = 0;
717 outputMapping
[FRAG_RESULT_STENCIL
] = fs_num_outputs
;
719 outputsWritten
&= ~(1 << FRAG_RESULT_STENCIL
);
722 if (outputsWritten
& BITFIELD64_BIT(FRAG_RESULT_SAMPLE_MASK
)) {
723 fs_output_semantic_name
[fs_num_outputs
] = TGSI_SEMANTIC_SAMPLEMASK
;
724 fs_output_semantic_index
[fs_num_outputs
] = 0;
725 outputMapping
[FRAG_RESULT_SAMPLE_MASK
] = fs_num_outputs
;
727 outputsWritten
&= ~(1 << FRAG_RESULT_SAMPLE_MASK
);
730 /* handle remaining outputs (color) */
731 for (attr
= 0; attr
< FRAG_RESULT_MAX
; attr
++) {
732 if (outputsWritten
& BITFIELD64_BIT(attr
)) {
734 case FRAG_RESULT_DEPTH
:
735 case FRAG_RESULT_STENCIL
:
736 case FRAG_RESULT_SAMPLE_MASK
:
740 case FRAG_RESULT_COLOR
:
741 write_all
= GL_TRUE
; /* fallthrough */
743 assert(attr
== FRAG_RESULT_COLOR
||
744 (FRAG_RESULT_DATA0
<= attr
&& attr
< FRAG_RESULT_MAX
));
745 fs_output_semantic_name
[fs_num_outputs
] = TGSI_SEMANTIC_COLOR
;
746 fs_output_semantic_index
[fs_num_outputs
] = numColors
;
747 outputMapping
[attr
] = fs_num_outputs
;
757 ureg
= ureg_create_with_screen(TGSI_PROCESSOR_FRAGMENT
, st
->pipe
->screen
);
761 if (ST_DEBUG
& DEBUG_MESA
) {
762 _mesa_print_program(&stfp
->Base
.Base
);
763 _mesa_print_program_parameters(st
->ctx
, &stfp
->Base
.Base
);
766 if (write_all
== GL_TRUE
)
767 ureg_property(ureg
, TGSI_PROPERTY_FS_COLOR0_WRITES_ALL_CBUFS
, 1);
769 if (stfp
->Base
.FragDepthLayout
!= FRAG_DEPTH_LAYOUT_NONE
) {
770 switch (stfp
->Base
.FragDepthLayout
) {
771 case FRAG_DEPTH_LAYOUT_ANY
:
772 ureg_property(ureg
, TGSI_PROPERTY_FS_DEPTH_LAYOUT
,
773 TGSI_FS_DEPTH_LAYOUT_ANY
);
775 case FRAG_DEPTH_LAYOUT_GREATER
:
776 ureg_property(ureg
, TGSI_PROPERTY_FS_DEPTH_LAYOUT
,
777 TGSI_FS_DEPTH_LAYOUT_GREATER
);
779 case FRAG_DEPTH_LAYOUT_LESS
:
780 ureg_property(ureg
, TGSI_PROPERTY_FS_DEPTH_LAYOUT
,
781 TGSI_FS_DEPTH_LAYOUT_LESS
);
783 case FRAG_DEPTH_LAYOUT_UNCHANGED
:
784 ureg_property(ureg
, TGSI_PROPERTY_FS_DEPTH_LAYOUT
,
785 TGSI_FS_DEPTH_LAYOUT_UNCHANGED
);
792 if (stfp
->glsl_to_tgsi
) {
793 st_translate_program(st
->ctx
,
794 TGSI_PROCESSOR_FRAGMENT
,
803 input_semantic_index
,
810 fs_output_semantic_name
,
811 fs_output_semantic_index
);
813 free_glsl_to_tgsi_visitor(stfp
->glsl_to_tgsi
);
814 stfp
->glsl_to_tgsi
= NULL
;
815 } else if (stfp
->ati_fs
)
816 st_translate_atifs_program(ureg
,
823 input_semantic_index
,
828 fs_output_semantic_name
,
829 fs_output_semantic_index
);
831 st_translate_mesa_program(st
->ctx
,
832 TGSI_PROCESSOR_FRAGMENT
,
839 input_semantic_index
,
844 fs_output_semantic_name
,
845 fs_output_semantic_index
);
847 stfp
->tgsi
.tokens
= ureg_get_tokens(ureg
, NULL
);
849 return stfp
->tgsi
.tokens
!= NULL
;
852 static struct st_fp_variant
*
853 st_create_fp_variant(struct st_context
*st
,
854 struct st_fragment_program
*stfp
,
855 const struct st_fp_variant_key
*key
)
857 struct pipe_context
*pipe
= st
->pipe
;
858 struct st_fp_variant
*variant
= CALLOC_STRUCT(st_fp_variant
);
859 struct pipe_shader_state tgsi
= {0};
864 tgsi
.tokens
= stfp
->tgsi
.tokens
;
866 assert(!(key
->bitmap
&& key
->drawpixels
));
868 /* Fix texture targets and add fog for ATI_fs */
870 const struct tgsi_token
*tokens
= st_fixup_atifs(tgsi
.tokens
, key
);
873 tgsi
.tokens
= tokens
;
875 fprintf(stderr
, "mesa: cannot post-process ATI_fs\n");
878 /* Emulate features. */
879 if (key
->clamp_color
|| key
->persample_shading
) {
880 const struct tgsi_token
*tokens
;
882 (key
->clamp_color
? TGSI_EMU_CLAMP_COLOR_OUTPUTS
: 0) |
883 (key
->persample_shading
? TGSI_EMU_FORCE_PERSAMPLE_INTERP
: 0);
885 tokens
= tgsi_emulate(tgsi
.tokens
, flags
);
888 if (tgsi
.tokens
!= stfp
->tgsi
.tokens
)
889 tgsi_free_tokens(tgsi
.tokens
);
890 tgsi
.tokens
= tokens
;
892 fprintf(stderr
, "mesa: cannot emulate deprecated features\n");
897 const struct tgsi_token
*tokens
;
899 variant
->bitmap_sampler
= ffs(~stfp
->Base
.Base
.SamplersUsed
) - 1;
901 tokens
= st_get_bitmap_shader(tgsi
.tokens
,
903 variant
->bitmap_sampler
,
904 st
->needs_texcoord_semantic
,
905 st
->bitmap
.tex_format
==
906 PIPE_FORMAT_L8_UNORM
);
909 if (tgsi
.tokens
!= stfp
->tgsi
.tokens
)
910 tgsi_free_tokens(tgsi
.tokens
);
911 tgsi
.tokens
= tokens
;
913 fprintf(stderr
, "mesa: cannot create a shader for glBitmap\n");
916 /* glDrawPixels (color only) */
917 if (key
->drawpixels
) {
918 const struct tgsi_token
*tokens
;
919 unsigned scale_const
= 0, bias_const
= 0, texcoord_const
= 0;
920 struct gl_program_parameter_list
*params
= stfp
->Base
.Base
.Parameters
;
922 /* Find the first unused slot. */
923 variant
->drawpix_sampler
= ffs(~stfp
->Base
.Base
.SamplersUsed
) - 1;
925 if (key
->pixelMaps
) {
926 unsigned samplers_used
= stfp
->Base
.Base
.SamplersUsed
|
927 (1 << variant
->drawpix_sampler
);
929 variant
->pixelmap_sampler
= ffs(~samplers_used
) - 1;
932 if (key
->scaleAndBias
) {
933 static const gl_state_index scale_state
[STATE_LENGTH
] =
934 { STATE_INTERNAL
, STATE_PT_SCALE
};
935 static const gl_state_index bias_state
[STATE_LENGTH
] =
936 { STATE_INTERNAL
, STATE_PT_BIAS
};
938 scale_const
= _mesa_add_state_reference(params
, scale_state
);
939 bias_const
= _mesa_add_state_reference(params
, bias_state
);
943 static const gl_state_index state
[STATE_LENGTH
] =
944 { STATE_INTERNAL
, STATE_CURRENT_ATTRIB
, VERT_ATTRIB_TEX0
};
946 texcoord_const
= _mesa_add_state_reference(params
, state
);
949 tokens
= st_get_drawpix_shader(tgsi
.tokens
,
950 st
->needs_texcoord_semantic
,
951 key
->scaleAndBias
, scale_const
,
952 bias_const
, key
->pixelMaps
,
953 variant
->drawpix_sampler
,
954 variant
->pixelmap_sampler
,
955 texcoord_const
, st
->internal_target
);
958 if (tgsi
.tokens
!= stfp
->tgsi
.tokens
)
959 tgsi_free_tokens(tgsi
.tokens
);
960 tgsi
.tokens
= tokens
;
962 fprintf(stderr
, "mesa: cannot create a shader for glDrawPixels\n");
965 if (ST_DEBUG
& DEBUG_TGSI
) {
966 tgsi_dump(tgsi
.tokens
, 0);
970 /* fill in variant */
971 variant
->driver_shader
= pipe
->create_fs_state(pipe
, &tgsi
);
974 if (tgsi
.tokens
!= stfp
->tgsi
.tokens
)
975 tgsi_free_tokens(tgsi
.tokens
);
980 * Translate fragment program if needed.
982 struct st_fp_variant
*
983 st_get_fp_variant(struct st_context
*st
,
984 struct st_fragment_program
*stfp
,
985 const struct st_fp_variant_key
*key
)
987 struct st_fp_variant
*fpv
;
989 /* Search for existing variant */
990 for (fpv
= stfp
->variants
; fpv
; fpv
= fpv
->next
) {
991 if (memcmp(&fpv
->key
, key
, sizeof(*key
)) == 0) {
998 fpv
= st_create_fp_variant(st
, stfp
, key
);
1000 /* insert into list */
1001 fpv
->next
= stfp
->variants
;
1002 stfp
->variants
= fpv
;
1011 * Translate a program. This is common code for geometry and tessellation
1015 st_translate_program_common(struct st_context
*st
,
1016 struct gl_program
*prog
,
1017 struct glsl_to_tgsi_visitor
*glsl_to_tgsi
,
1018 struct ureg_program
*ureg
,
1019 unsigned tgsi_processor
,
1020 struct pipe_shader_state
*out_state
)
1022 GLuint inputSlotToAttr
[VARYING_SLOT_TESS_MAX
];
1023 GLuint inputMapping
[VARYING_SLOT_TESS_MAX
];
1024 GLuint outputSlotToAttr
[VARYING_SLOT_TESS_MAX
];
1025 GLuint outputMapping
[VARYING_SLOT_TESS_MAX
];
1028 ubyte input_semantic_name
[PIPE_MAX_SHADER_INPUTS
];
1029 ubyte input_semantic_index
[PIPE_MAX_SHADER_INPUTS
];
1030 uint num_inputs
= 0;
1032 ubyte output_semantic_name
[PIPE_MAX_SHADER_OUTPUTS
];
1033 ubyte output_semantic_index
[PIPE_MAX_SHADER_OUTPUTS
];
1034 uint num_outputs
= 0;
1038 memset(inputSlotToAttr
, 0, sizeof(inputSlotToAttr
));
1039 memset(inputMapping
, 0, sizeof(inputMapping
));
1040 memset(outputSlotToAttr
, 0, sizeof(outputSlotToAttr
));
1041 memset(outputMapping
, 0, sizeof(outputMapping
));
1042 memset(out_state
, 0, sizeof(*out_state
));
1044 if (prog
->ClipDistanceArraySize
)
1045 ureg_property(ureg
, TGSI_PROPERTY_NUM_CLIPDIST_ENABLED
,
1046 prog
->ClipDistanceArraySize
);
1049 * Convert Mesa program inputs to TGSI input register semantics.
1051 for (attr
= 0; attr
< VARYING_SLOT_MAX
; attr
++) {
1052 if ((prog
->InputsRead
& BITFIELD64_BIT(attr
)) != 0) {
1053 const GLuint slot
= num_inputs
++;
1055 inputMapping
[attr
] = slot
;
1056 inputSlotToAttr
[slot
] = attr
;
1059 case VARYING_SLOT_PRIMITIVE_ID
:
1060 assert(tgsi_processor
== TGSI_PROCESSOR_GEOMETRY
);
1061 input_semantic_name
[slot
] = TGSI_SEMANTIC_PRIMID
;
1062 input_semantic_index
[slot
] = 0;
1064 case VARYING_SLOT_POS
:
1065 input_semantic_name
[slot
] = TGSI_SEMANTIC_POSITION
;
1066 input_semantic_index
[slot
] = 0;
1068 case VARYING_SLOT_COL0
:
1069 input_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
1070 input_semantic_index
[slot
] = 0;
1072 case VARYING_SLOT_COL1
:
1073 input_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
1074 input_semantic_index
[slot
] = 1;
1076 case VARYING_SLOT_FOGC
:
1077 input_semantic_name
[slot
] = TGSI_SEMANTIC_FOG
;
1078 input_semantic_index
[slot
] = 0;
1080 case VARYING_SLOT_CLIP_VERTEX
:
1081 input_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPVERTEX
;
1082 input_semantic_index
[slot
] = 0;
1084 case VARYING_SLOT_CLIP_DIST0
:
1085 input_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
1086 input_semantic_index
[slot
] = 0;
1088 case VARYING_SLOT_CLIP_DIST1
:
1089 input_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
1090 input_semantic_index
[slot
] = 1;
1092 case VARYING_SLOT_PSIZ
:
1093 input_semantic_name
[slot
] = TGSI_SEMANTIC_PSIZE
;
1094 input_semantic_index
[slot
] = 0;
1096 case VARYING_SLOT_TEX0
:
1097 case VARYING_SLOT_TEX1
:
1098 case VARYING_SLOT_TEX2
:
1099 case VARYING_SLOT_TEX3
:
1100 case VARYING_SLOT_TEX4
:
1101 case VARYING_SLOT_TEX5
:
1102 case VARYING_SLOT_TEX6
:
1103 case VARYING_SLOT_TEX7
:
1104 if (st
->needs_texcoord_semantic
) {
1105 input_semantic_name
[slot
] = TGSI_SEMANTIC_TEXCOORD
;
1106 input_semantic_index
[slot
] = attr
- VARYING_SLOT_TEX0
;
1110 case VARYING_SLOT_VAR0
:
1112 assert(attr
>= VARYING_SLOT_VAR0
||
1113 (attr
>= VARYING_SLOT_TEX0
&& attr
<= VARYING_SLOT_TEX7
));
1114 input_semantic_name
[slot
] = TGSI_SEMANTIC_GENERIC
;
1115 input_semantic_index
[slot
] =
1116 st_get_generic_varying_index(st
, attr
);
1122 /* Also add patch inputs. */
1123 for (attr
= 0; attr
< 32; attr
++) {
1124 if (prog
->PatchInputsRead
& (1 << attr
)) {
1125 GLuint slot
= num_inputs
++;
1126 GLuint patch_attr
= VARYING_SLOT_PATCH0
+ attr
;
1128 inputMapping
[patch_attr
] = slot
;
1129 inputSlotToAttr
[slot
] = patch_attr
;
1130 input_semantic_name
[slot
] = TGSI_SEMANTIC_PATCH
;
1131 input_semantic_index
[slot
] = attr
;
1135 /* initialize output semantics to defaults */
1136 for (i
= 0; i
< PIPE_MAX_SHADER_OUTPUTS
; i
++) {
1137 output_semantic_name
[i
] = TGSI_SEMANTIC_GENERIC
;
1138 output_semantic_index
[i
] = 0;
1142 * Determine number of outputs, the (default) output register
1143 * mapping and the semantic information for each output.
1145 for (attr
= 0; attr
< VARYING_SLOT_MAX
; attr
++) {
1146 if (prog
->OutputsWritten
& BITFIELD64_BIT(attr
)) {
1147 GLuint slot
= num_outputs
++;
1149 outputMapping
[attr
] = slot
;
1150 outputSlotToAttr
[slot
] = attr
;
1153 case VARYING_SLOT_POS
:
1155 output_semantic_name
[slot
] = TGSI_SEMANTIC_POSITION
;
1156 output_semantic_index
[slot
] = 0;
1158 case VARYING_SLOT_COL0
:
1159 output_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
1160 output_semantic_index
[slot
] = 0;
1162 case VARYING_SLOT_COL1
:
1163 output_semantic_name
[slot
] = TGSI_SEMANTIC_COLOR
;
1164 output_semantic_index
[slot
] = 1;
1166 case VARYING_SLOT_BFC0
:
1167 output_semantic_name
[slot
] = TGSI_SEMANTIC_BCOLOR
;
1168 output_semantic_index
[slot
] = 0;
1170 case VARYING_SLOT_BFC1
:
1171 output_semantic_name
[slot
] = TGSI_SEMANTIC_BCOLOR
;
1172 output_semantic_index
[slot
] = 1;
1174 case VARYING_SLOT_FOGC
:
1175 output_semantic_name
[slot
] = TGSI_SEMANTIC_FOG
;
1176 output_semantic_index
[slot
] = 0;
1178 case VARYING_SLOT_PSIZ
:
1179 output_semantic_name
[slot
] = TGSI_SEMANTIC_PSIZE
;
1180 output_semantic_index
[slot
] = 0;
1182 case VARYING_SLOT_CLIP_VERTEX
:
1183 output_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPVERTEX
;
1184 output_semantic_index
[slot
] = 0;
1186 case VARYING_SLOT_CLIP_DIST0
:
1187 output_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
1188 output_semantic_index
[slot
] = 0;
1190 case VARYING_SLOT_CLIP_DIST1
:
1191 output_semantic_name
[slot
] = TGSI_SEMANTIC_CLIPDIST
;
1192 output_semantic_index
[slot
] = 1;
1194 case VARYING_SLOT_LAYER
:
1195 output_semantic_name
[slot
] = TGSI_SEMANTIC_LAYER
;
1196 output_semantic_index
[slot
] = 0;
1198 case VARYING_SLOT_PRIMITIVE_ID
:
1199 output_semantic_name
[slot
] = TGSI_SEMANTIC_PRIMID
;
1200 output_semantic_index
[slot
] = 0;
1202 case VARYING_SLOT_VIEWPORT
:
1203 output_semantic_name
[slot
] = TGSI_SEMANTIC_VIEWPORT_INDEX
;
1204 output_semantic_index
[slot
] = 0;
1206 case VARYING_SLOT_TESS_LEVEL_OUTER
:
1207 output_semantic_name
[slot
] = TGSI_SEMANTIC_TESSOUTER
;
1208 output_semantic_index
[slot
] = 0;
1210 case VARYING_SLOT_TESS_LEVEL_INNER
:
1211 output_semantic_name
[slot
] = TGSI_SEMANTIC_TESSINNER
;
1212 output_semantic_index
[slot
] = 0;
1214 case VARYING_SLOT_TEX0
:
1215 case VARYING_SLOT_TEX1
:
1216 case VARYING_SLOT_TEX2
:
1217 case VARYING_SLOT_TEX3
:
1218 case VARYING_SLOT_TEX4
:
1219 case VARYING_SLOT_TEX5
:
1220 case VARYING_SLOT_TEX6
:
1221 case VARYING_SLOT_TEX7
:
1222 if (st
->needs_texcoord_semantic
) {
1223 output_semantic_name
[slot
] = TGSI_SEMANTIC_TEXCOORD
;
1224 output_semantic_index
[slot
] = attr
- VARYING_SLOT_TEX0
;
1228 case VARYING_SLOT_VAR0
:
1230 assert(slot
< ARRAY_SIZE(output_semantic_name
));
1231 assert(attr
>= VARYING_SLOT_VAR0
||
1232 (attr
>= VARYING_SLOT_TEX0
&& attr
<= VARYING_SLOT_TEX7
));
1233 output_semantic_name
[slot
] = TGSI_SEMANTIC_GENERIC
;
1234 output_semantic_index
[slot
] =
1235 st_get_generic_varying_index(st
, attr
);
1241 /* Also add patch outputs. */
1242 for (attr
= 0; attr
< 32; attr
++) {
1243 if (prog
->PatchOutputsWritten
& (1 << attr
)) {
1244 GLuint slot
= num_outputs
++;
1245 GLuint patch_attr
= VARYING_SLOT_PATCH0
+ attr
;
1247 outputMapping
[patch_attr
] = slot
;
1248 outputSlotToAttr
[slot
] = patch_attr
;
1249 output_semantic_name
[slot
] = TGSI_SEMANTIC_PATCH
;
1250 output_semantic_index
[slot
] = attr
;
1254 st_translate_program(st
->ctx
,
1263 input_semantic_name
,
1264 input_semantic_index
,
1271 output_semantic_name
,
1272 output_semantic_index
);
1274 out_state
->tokens
= ureg_get_tokens(ureg
, NULL
);
1277 st_translate_stream_output_info(glsl_to_tgsi
,
1279 &out_state
->stream_output
);
1281 if ((ST_DEBUG
& DEBUG_TGSI
) && (ST_DEBUG
& DEBUG_MESA
)) {
1282 _mesa_print_program(prog
);
1286 if (ST_DEBUG
& DEBUG_TGSI
) {
1287 tgsi_dump(out_state
->tokens
, 0);
1294 * Translate a geometry program to create a new variant.
1297 st_translate_geometry_program(struct st_context
*st
,
1298 struct st_geometry_program
*stgp
)
1300 struct ureg_program
*ureg
;
1302 ureg
= ureg_create_with_screen(TGSI_PROCESSOR_GEOMETRY
, st
->pipe
->screen
);
1306 ureg_property(ureg
, TGSI_PROPERTY_GS_INPUT_PRIM
, stgp
->Base
.InputType
);
1307 ureg_property(ureg
, TGSI_PROPERTY_GS_OUTPUT_PRIM
, stgp
->Base
.OutputType
);
1308 ureg_property(ureg
, TGSI_PROPERTY_GS_MAX_OUTPUT_VERTICES
,
1309 stgp
->Base
.VerticesOut
);
1310 ureg_property(ureg
, TGSI_PROPERTY_GS_INVOCATIONS
, stgp
->Base
.Invocations
);
1312 st_translate_program_common(st
, &stgp
->Base
.Base
, stgp
->glsl_to_tgsi
, ureg
,
1313 TGSI_PROCESSOR_GEOMETRY
, &stgp
->tgsi
);
1315 free_glsl_to_tgsi_visitor(stgp
->glsl_to_tgsi
);
1316 stgp
->glsl_to_tgsi
= NULL
;
1322 * Get/create a basic program variant.
1324 struct st_basic_variant
*
1325 st_get_basic_variant(struct st_context
*st
,
1326 unsigned pipe_shader
,
1327 struct pipe_shader_state
*tgsi
,
1328 struct st_basic_variant
**variants
)
1330 struct pipe_context
*pipe
= st
->pipe
;
1331 struct st_basic_variant
*v
;
1332 struct st_basic_variant_key key
;
1334 memset(&key
, 0, sizeof(key
));
1335 key
.st
= st
->has_shareable_shaders
? NULL
: st
;
1337 /* Search for existing variant */
1338 for (v
= *variants
; v
; v
= v
->next
) {
1339 if (memcmp(&v
->key
, &key
, sizeof(key
)) == 0) {
1346 v
= CALLOC_STRUCT(st_basic_variant
);
1348 /* fill in new variant */
1349 switch (pipe_shader
) {
1350 case PIPE_SHADER_TESS_CTRL
:
1351 v
->driver_shader
= pipe
->create_tcs_state(pipe
, tgsi
);
1353 case PIPE_SHADER_TESS_EVAL
:
1354 v
->driver_shader
= pipe
->create_tes_state(pipe
, tgsi
);
1356 case PIPE_SHADER_GEOMETRY
:
1357 v
->driver_shader
= pipe
->create_gs_state(pipe
, tgsi
);
1360 assert(!"unhandled shader type");
1367 /* insert into list */
1368 v
->next
= *variants
;
1378 * Translate a tessellation control program to create a new variant.
1381 st_translate_tessctrl_program(struct st_context
*st
,
1382 struct st_tessctrl_program
*sttcp
)
1384 struct ureg_program
*ureg
;
1386 ureg
= ureg_create_with_screen(TGSI_PROCESSOR_TESS_CTRL
, st
->pipe
->screen
);
1390 ureg_property(ureg
, TGSI_PROPERTY_TCS_VERTICES_OUT
,
1391 sttcp
->Base
.VerticesOut
);
1393 st_translate_program_common(st
, &sttcp
->Base
.Base
, sttcp
->glsl_to_tgsi
,
1394 ureg
, TGSI_PROCESSOR_TESS_CTRL
, &sttcp
->tgsi
);
1396 free_glsl_to_tgsi_visitor(sttcp
->glsl_to_tgsi
);
1397 sttcp
->glsl_to_tgsi
= NULL
;
1403 * Translate a tessellation evaluation program to create a new variant.
1406 st_translate_tesseval_program(struct st_context
*st
,
1407 struct st_tesseval_program
*sttep
)
1409 struct ureg_program
*ureg
;
1411 ureg
= ureg_create_with_screen(TGSI_PROCESSOR_TESS_EVAL
, st
->pipe
->screen
);
1415 if (sttep
->Base
.PrimitiveMode
== GL_ISOLINES
)
1416 ureg_property(ureg
, TGSI_PROPERTY_TES_PRIM_MODE
, GL_LINES
);
1418 ureg_property(ureg
, TGSI_PROPERTY_TES_PRIM_MODE
, sttep
->Base
.PrimitiveMode
);
1420 switch (sttep
->Base
.Spacing
) {
1422 ureg_property(ureg
, TGSI_PROPERTY_TES_SPACING
, PIPE_TESS_SPACING_EQUAL
);
1424 case GL_FRACTIONAL_EVEN
:
1425 ureg_property(ureg
, TGSI_PROPERTY_TES_SPACING
,
1426 PIPE_TESS_SPACING_FRACTIONAL_EVEN
);
1428 case GL_FRACTIONAL_ODD
:
1429 ureg_property(ureg
, TGSI_PROPERTY_TES_SPACING
,
1430 PIPE_TESS_SPACING_FRACTIONAL_ODD
);
1436 ureg_property(ureg
, TGSI_PROPERTY_TES_VERTEX_ORDER_CW
,
1437 sttep
->Base
.VertexOrder
== GL_CW
);
1438 ureg_property(ureg
, TGSI_PROPERTY_TES_POINT_MODE
, sttep
->Base
.PointMode
);
1440 st_translate_program_common(st
, &sttep
->Base
.Base
, sttep
->glsl_to_tgsi
,
1441 ureg
, TGSI_PROCESSOR_TESS_EVAL
, &sttep
->tgsi
);
1443 free_glsl_to_tgsi_visitor(sttep
->glsl_to_tgsi
);
1444 sttep
->glsl_to_tgsi
= NULL
;
1450 * Translate a compute program to create a new variant.
1453 st_translate_compute_program(struct st_context
*st
,
1454 struct st_compute_program
*stcp
)
1456 struct ureg_program
*ureg
;
1457 struct pipe_shader_state prog
;
1459 ureg
= ureg_create_with_screen(TGSI_PROCESSOR_COMPUTE
, st
->pipe
->screen
);
1463 st_translate_program_common(st
, &stcp
->Base
.Base
, stcp
->glsl_to_tgsi
, ureg
,
1464 TGSI_PROCESSOR_COMPUTE
, &prog
);
1466 stcp
->tgsi
.ir_type
= PIPE_SHADER_IR_TGSI
;
1467 stcp
->tgsi
.prog
= prog
.tokens
;
1468 stcp
->tgsi
.req_local_mem
= stcp
->Base
.SharedSize
;
1469 stcp
->tgsi
.req_private_mem
= 0;
1470 stcp
->tgsi
.req_input_mem
= 0;
1472 free_glsl_to_tgsi_visitor(stcp
->glsl_to_tgsi
);
1473 stcp
->glsl_to_tgsi
= NULL
;
1479 * Get/create compute program variant.
1481 struct st_basic_variant
*
1482 st_get_cp_variant(struct st_context
*st
,
1483 struct pipe_compute_state
*tgsi
,
1484 struct st_basic_variant
**variants
)
1486 struct pipe_context
*pipe
= st
->pipe
;
1487 struct st_basic_variant
*v
;
1488 struct st_basic_variant_key key
;
1490 memset(&key
, 0, sizeof(key
));
1491 key
.st
= st
->has_shareable_shaders
? NULL
: st
;
1493 /* Search for existing variant */
1494 for (v
= *variants
; v
; v
= v
->next
) {
1495 if (memcmp(&v
->key
, &key
, sizeof(key
)) == 0) {
1502 v
= CALLOC_STRUCT(st_basic_variant
);
1504 /* fill in new variant */
1505 v
->driver_shader
= pipe
->create_compute_state(pipe
, tgsi
);
1508 /* insert into list */
1509 v
->next
= *variants
;
1519 * Vert/Geom/Frag programs have per-context variants. Free all the
1520 * variants attached to the given program which match the given context.
1523 destroy_program_variants(struct st_context
*st
, struct gl_program
*target
)
1525 if (!target
|| target
== &_mesa_DummyProgram
)
1528 switch (target
->Target
) {
1529 case GL_VERTEX_PROGRAM_ARB
:
1531 struct st_vertex_program
*stvp
= (struct st_vertex_program
*) target
;
1532 struct st_vp_variant
*vpv
, **prevPtr
= &stvp
->variants
;
1534 for (vpv
= stvp
->variants
; vpv
; ) {
1535 struct st_vp_variant
*next
= vpv
->next
;
1536 if (vpv
->key
.st
== st
) {
1537 /* unlink from list */
1539 /* destroy this variant */
1540 delete_vp_variant(st
, vpv
);
1543 prevPtr
= &vpv
->next
;
1549 case GL_FRAGMENT_PROGRAM_ARB
:
1551 struct st_fragment_program
*stfp
=
1552 (struct st_fragment_program
*) target
;
1553 struct st_fp_variant
*fpv
, **prevPtr
= &stfp
->variants
;
1555 for (fpv
= stfp
->variants
; fpv
; ) {
1556 struct st_fp_variant
*next
= fpv
->next
;
1557 if (fpv
->key
.st
== st
) {
1558 /* unlink from list */
1560 /* destroy this variant */
1561 delete_fp_variant(st
, fpv
);
1564 prevPtr
= &fpv
->next
;
1570 case GL_GEOMETRY_PROGRAM_NV
:
1571 case GL_TESS_CONTROL_PROGRAM_NV
:
1572 case GL_TESS_EVALUATION_PROGRAM_NV
:
1573 case GL_COMPUTE_PROGRAM_NV
:
1575 struct st_geometry_program
*gp
= (struct st_geometry_program
*)target
;
1576 struct st_tessctrl_program
*tcp
= (struct st_tessctrl_program
*)target
;
1577 struct st_tesseval_program
*tep
= (struct st_tesseval_program
*)target
;
1578 struct st_compute_program
*cp
= (struct st_compute_program
*)target
;
1579 struct st_basic_variant
**variants
=
1580 target
->Target
== GL_GEOMETRY_PROGRAM_NV
? &gp
->variants
:
1581 target
->Target
== GL_TESS_CONTROL_PROGRAM_NV
? &tcp
->variants
:
1582 target
->Target
== GL_TESS_EVALUATION_PROGRAM_NV
? &tep
->variants
:
1583 target
->Target
== GL_COMPUTE_PROGRAM_NV
? &cp
->variants
:
1585 struct st_basic_variant
*v
, **prevPtr
= variants
;
1587 for (v
= *variants
; v
; ) {
1588 struct st_basic_variant
*next
= v
->next
;
1589 if (v
->key
.st
== st
) {
1590 /* unlink from list */
1592 /* destroy this variant */
1593 delete_basic_variant(st
, v
, target
->Target
);
1603 _mesa_problem(NULL
, "Unexpected program target 0x%x in "
1604 "destroy_program_variants_cb()", target
->Target
);
1610 * Callback for _mesa_HashWalk. Free all the shader's program variants
1611 * which match the given context.
1614 destroy_shader_program_variants_cb(GLuint key
, void *data
, void *userData
)
1616 struct st_context
*st
= (struct st_context
*) userData
;
1617 struct gl_shader
*shader
= (struct gl_shader
*) data
;
1619 switch (shader
->Type
) {
1620 case GL_SHADER_PROGRAM_MESA
:
1622 struct gl_shader_program
*shProg
= (struct gl_shader_program
*) data
;
1625 for (i
= 0; i
< shProg
->NumShaders
; i
++) {
1626 destroy_program_variants(st
, shProg
->Shaders
[i
]->Program
);
1629 for (i
= 0; i
< ARRAY_SIZE(shProg
->_LinkedShaders
); i
++) {
1630 if (shProg
->_LinkedShaders
[i
])
1631 destroy_program_variants(st
, shProg
->_LinkedShaders
[i
]->Program
);
1635 case GL_VERTEX_SHADER
:
1636 case GL_FRAGMENT_SHADER
:
1637 case GL_GEOMETRY_SHADER
:
1638 case GL_TESS_CONTROL_SHADER
:
1639 case GL_TESS_EVALUATION_SHADER
:
1640 case GL_COMPUTE_SHADER
:
1642 destroy_program_variants(st
, shader
->Program
);
1652 * Callback for _mesa_HashWalk. Free all the program variants which match
1653 * the given context.
1656 destroy_program_variants_cb(GLuint key
, void *data
, void *userData
)
1658 struct st_context
*st
= (struct st_context
*) userData
;
1659 struct gl_program
*program
= (struct gl_program
*) data
;
1660 destroy_program_variants(st
, program
);
1665 * Walk over all shaders and programs to delete any variants which
1666 * belong to the given context.
1667 * This is called during context tear-down.
1670 st_destroy_program_variants(struct st_context
*st
)
1672 /* If shaders can be shared with other contexts, the last context will
1673 * call DeleteProgram on all shaders, releasing everything.
1675 if (st
->has_shareable_shaders
)
1678 /* ARB vert/frag program */
1679 _mesa_HashWalk(st
->ctx
->Shared
->Programs
,
1680 destroy_program_variants_cb
, st
);
1682 /* GLSL vert/frag/geom shaders */
1683 _mesa_HashWalk(st
->ctx
->Shared
->ShaderObjects
,
1684 destroy_shader_program_variants_cb
, st
);
1689 * For debugging, print/dump the current vertex program.
1692 st_print_current_vertex_program(void)
1694 GET_CURRENT_CONTEXT(ctx
);
1696 if (ctx
->VertexProgram
._Current
) {
1697 struct st_vertex_program
*stvp
=
1698 (struct st_vertex_program
*) ctx
->VertexProgram
._Current
;
1699 struct st_vp_variant
*stv
;
1701 debug_printf("Vertex program %u\n", stvp
->Base
.Base
.Id
);
1703 for (stv
= stvp
->variants
; stv
; stv
= stv
->next
) {
1704 debug_printf("variant %p\n", stv
);
1705 tgsi_dump(stv
->tgsi
.tokens
, 0);
1712 * Compile one shader variant.
1715 st_precompile_shader_variant(struct st_context
*st
,
1716 struct gl_program
*prog
)
1718 switch (prog
->Target
) {
1719 case GL_VERTEX_PROGRAM_ARB
: {
1720 struct st_vertex_program
*p
= (struct st_vertex_program
*)prog
;
1721 struct st_vp_variant_key key
;
1723 memset(&key
, 0, sizeof(key
));
1724 key
.st
= st
->has_shareable_shaders
? NULL
: st
;
1725 st_get_vp_variant(st
, p
, &key
);
1729 case GL_TESS_CONTROL_PROGRAM_NV
: {
1730 struct st_tessctrl_program
*p
= (struct st_tessctrl_program
*)prog
;
1731 st_get_basic_variant(st
, PIPE_SHADER_TESS_CTRL
, &p
->tgsi
, &p
->variants
);
1735 case GL_TESS_EVALUATION_PROGRAM_NV
: {
1736 struct st_tesseval_program
*p
= (struct st_tesseval_program
*)prog
;
1737 st_get_basic_variant(st
, PIPE_SHADER_TESS_EVAL
, &p
->tgsi
, &p
->variants
);
1741 case GL_GEOMETRY_PROGRAM_NV
: {
1742 struct st_geometry_program
*p
= (struct st_geometry_program
*)prog
;
1743 st_get_basic_variant(st
, PIPE_SHADER_GEOMETRY
, &p
->tgsi
, &p
->variants
);
1747 case GL_FRAGMENT_PROGRAM_ARB
: {
1748 struct st_fragment_program
*p
= (struct st_fragment_program
*)prog
;
1749 struct st_fp_variant_key key
;
1751 memset(&key
, 0, sizeof(key
));
1752 key
.st
= st
->has_shareable_shaders
? NULL
: st
;
1753 st_get_fp_variant(st
, p
, &key
);
1757 case GL_COMPUTE_PROGRAM_NV
: {
1758 struct st_compute_program
*p
= (struct st_compute_program
*)prog
;
1759 st_get_cp_variant(st
, &p
->tgsi
, &p
->variants
);