Merge branch 'gallium-docs'
[mesa.git] / src / mesa / state_tracker / st_program.c
1 /**************************************************************************
2 *
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keith@tungstengraphics.com>
30 * Brian Paul
31 */
32
33
34 #include "main/imports.h"
35 #include "main/mtypes.h"
36 #include "shader/prog_print.h"
37 #include "shader/programopt.h"
38
39 #include "pipe/p_context.h"
40 #include "pipe/p_defines.h"
41 #include "pipe/p_shader_tokens.h"
42 #include "draw/draw_context.h"
43 #include "tgsi/tgsi_dump.h"
44
45 #include "st_debug.h"
46 #include "st_context.h"
47 #include "st_atom.h"
48 #include "st_program.h"
49 #include "st_mesa_to_tgsi.h"
50 #include "cso_cache/cso_context.h"
51
52
53
54 /**
55 * Clean out any old compilations:
56 */
57 void
58 st_vp_release_varients( struct st_context *st,
59 struct st_vertex_program *stvp )
60 {
61 struct st_vp_varient *vpv;
62
63 for (vpv = stvp->varients; vpv; ) {
64 struct st_vp_varient *next = vpv->next;
65
66 if (vpv->driver_shader)
67 cso_delete_vertex_shader(st->cso_context, vpv->driver_shader);
68
69 if (vpv->draw_shader)
70 draw_delete_vertex_shader( st->draw, vpv->draw_shader );
71
72 if (vpv->state.tokens)
73 st_free_tokens(vpv->state.tokens);
74
75 FREE( vpv );
76
77 vpv = next;
78 }
79
80 stvp->varients = NULL;
81 }
82
83
84
85
86 /**
87 * Translate a Mesa vertex shader into a TGSI shader.
88 * \param outputMapping to map vertex program output registers (VERT_RESULT_x)
89 * to TGSI output slots
90 * \param tokensOut destination for TGSI tokens
91 * \return pointer to cached pipe_shader object.
92 */
93 void
94 st_prepare_vertex_program(struct st_context *st,
95 struct st_vertex_program *stvp)
96 {
97 GLuint attr;
98
99 stvp->num_inputs = 0;
100 stvp->num_outputs = 0;
101
102 if (stvp->Base.IsPositionInvariant)
103 _mesa_insert_mvp_code(st->ctx, &stvp->Base);
104
105 assert(stvp->Base.Base.NumInstructions > 1);
106
107 /*
108 * Determine number of inputs, the mappings between VERT_ATTRIB_x
109 * and TGSI generic input indexes, plus input attrib semantic info.
110 */
111 for (attr = 0; attr < VERT_ATTRIB_MAX; attr++) {
112 if (stvp->Base.Base.InputsRead & (1 << attr)) {
113 stvp->input_to_index[attr] = stvp->num_inputs;
114 stvp->index_to_input[stvp->num_inputs] = attr;
115 stvp->num_inputs++;
116 }
117 }
118 /* bit of a hack, presetup potentially unused edgeflag input */
119 stvp->input_to_index[VERT_ATTRIB_EDGEFLAG] = stvp->num_inputs;
120 stvp->index_to_input[stvp->num_inputs] = VERT_ATTRIB_EDGEFLAG;
121
122 /* Compute mapping of vertex program outputs to slots.
123 */
124 for (attr = 0; attr < VERT_RESULT_MAX; attr++) {
125 if ((stvp->Base.Base.OutputsWritten & (1 << attr)) == 0) {
126 stvp->result_to_output[attr] = ~0;
127 }
128 else {
129 unsigned slot = stvp->num_outputs++;
130
131 stvp->result_to_output[attr] = slot;
132
133 switch (attr) {
134 case VERT_RESULT_HPOS:
135 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_POSITION;
136 stvp->output_semantic_index[slot] = 0;
137 break;
138 case VERT_RESULT_COL0:
139 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
140 stvp->output_semantic_index[slot] = 0;
141 break;
142 case VERT_RESULT_COL1:
143 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
144 stvp->output_semantic_index[slot] = 1;
145 break;
146 case VERT_RESULT_BFC0:
147 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_BCOLOR;
148 stvp->output_semantic_index[slot] = 0;
149 break;
150 case VERT_RESULT_BFC1:
151 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_BCOLOR;
152 stvp->output_semantic_index[slot] = 1;
153 break;
154 case VERT_RESULT_FOGC:
155 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_FOG;
156 stvp->output_semantic_index[slot] = 0;
157 break;
158 case VERT_RESULT_PSIZ:
159 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_PSIZE;
160 stvp->output_semantic_index[slot] = 0;
161 break;
162 case VERT_RESULT_EDGE:
163 assert(0);
164 break;
165
166 case VERT_RESULT_TEX0:
167 case VERT_RESULT_TEX1:
168 case VERT_RESULT_TEX2:
169 case VERT_RESULT_TEX3:
170 case VERT_RESULT_TEX4:
171 case VERT_RESULT_TEX5:
172 case VERT_RESULT_TEX6:
173 case VERT_RESULT_TEX7:
174 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
175 stvp->output_semantic_index[slot] = attr - VERT_RESULT_TEX0;
176 break;
177
178 case VERT_RESULT_VAR0:
179 default:
180 assert(attr < VERT_RESULT_MAX);
181 stvp->output_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
182 stvp->output_semantic_index[slot] = (FRAG_ATTRIB_VAR0 -
183 FRAG_ATTRIB_TEX0 +
184 attr -
185 VERT_RESULT_VAR0);
186 break;
187 }
188 }
189 }
190 /* similar hack to above, presetup potentially unused edgeflag output */
191 stvp->result_to_output[VERT_RESULT_EDGE] = stvp->num_outputs;
192 stvp->output_semantic_name[stvp->num_outputs] = TGSI_SEMANTIC_EDGEFLAG;
193 stvp->output_semantic_index[stvp->num_outputs] = 0;
194 }
195
196
197 struct st_vp_varient *
198 st_translate_vertex_program(struct st_context *st,
199 struct st_vertex_program *stvp,
200 const struct st_vp_varient_key *key)
201 {
202 struct st_vp_varient *vpv = CALLOC_STRUCT(st_vp_varient);
203 struct pipe_context *pipe = st->pipe;
204 struct ureg_program *ureg;
205 enum pipe_error error;
206 unsigned num_outputs;
207
208 ureg = ureg_create( TGSI_PROCESSOR_VERTEX );
209 if (ureg == NULL)
210 return NULL;
211
212 vpv->num_inputs = stvp->num_inputs;
213 num_outputs = stvp->num_outputs;
214 if (key->passthrough_edgeflags) {
215 vpv->num_inputs++;
216 num_outputs++;
217 }
218
219 error =
220 st_translate_mesa_program(st->ctx,
221 TGSI_PROCESSOR_VERTEX,
222 ureg,
223 &stvp->Base.Base,
224 /* inputs */
225 vpv->num_inputs,
226 stvp->input_to_index,
227 NULL, /* input semantic name */
228 NULL, /* input semantic index */
229 NULL,
230 /* outputs */
231 num_outputs,
232 stvp->result_to_output,
233 stvp->output_semantic_name,
234 stvp->output_semantic_index,
235 key->passthrough_edgeflags );
236
237 if (error)
238 goto fail;
239
240 vpv->state.tokens = ureg_get_tokens( ureg, NULL );
241 if (!vpv->state.tokens)
242 goto fail;
243
244 ureg_destroy( ureg );
245
246 vpv->driver_shader = pipe->create_vs_state(pipe, &vpv->state);
247
248 if ((ST_DEBUG & DEBUG_TGSI) && (ST_DEBUG & DEBUG_MESA)) {
249 _mesa_print_program(&stvp->Base.Base);
250 debug_printf("\n");
251 }
252
253 if (ST_DEBUG & DEBUG_TGSI) {
254 tgsi_dump( vpv->state.tokens, 0 );
255 debug_printf("\n");
256 }
257
258 return vpv;
259
260 fail:
261 debug_printf("%s: failed to translate Mesa program:\n", __FUNCTION__);
262 _mesa_print_program(&stvp->Base.Base);
263 debug_assert(0);
264
265 ureg_destroy( ureg );
266 return NULL;
267 }
268
269
270
271 /**
272 * Translate a Mesa fragment shader into a TGSI shader.
273 * \param inputMapping to map fragment program input registers to TGSI
274 * input slots
275 * \return pointer to cached pipe_shader object.
276 */
277 void
278 st_translate_fragment_program(struct st_context *st,
279 struct st_fragment_program *stfp,
280 const GLuint inputMapping[])
281 {
282 struct pipe_context *pipe = st->pipe;
283 GLuint outputMapping[FRAG_RESULT_MAX];
284 GLuint defaultInputMapping[FRAG_ATTRIB_MAX];
285 GLuint interpMode[16]; /* XXX size? */
286 GLuint attr;
287 enum pipe_error error;
288 const GLbitfield inputsRead = stfp->Base.Base.InputsRead;
289 struct ureg_program *ureg;
290 GLuint vslot = 0;
291
292 uint fs_num_inputs = 0;
293
294 ubyte fs_output_semantic_name[PIPE_MAX_SHADER_OUTPUTS];
295 ubyte fs_output_semantic_index[PIPE_MAX_SHADER_OUTPUTS];
296 uint fs_num_outputs = 0;
297
298 /* which vertex output goes to the first fragment input: */
299 if (inputsRead & FRAG_BIT_WPOS)
300 vslot = 0;
301 else
302 vslot = 1;
303
304 /*
305 * Convert Mesa program inputs to TGSI input register semantics.
306 */
307 for (attr = 0; attr < FRAG_ATTRIB_MAX; attr++) {
308 if (inputsRead & (1 << attr)) {
309 const GLuint slot = fs_num_inputs;
310
311 defaultInputMapping[attr] = slot;
312
313 stfp->input_map[slot] = vslot++;
314
315 fs_num_inputs++;
316
317 switch (attr) {
318 case FRAG_ATTRIB_WPOS:
319 stfp->input_semantic_name[slot] = TGSI_SEMANTIC_POSITION;
320 stfp->input_semantic_index[slot] = 0;
321 interpMode[slot] = TGSI_INTERPOLATE_LINEAR;
322 break;
323 case FRAG_ATTRIB_COL0:
324 stfp->input_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
325 stfp->input_semantic_index[slot] = 0;
326 interpMode[slot] = TGSI_INTERPOLATE_LINEAR;
327 break;
328 case FRAG_ATTRIB_COL1:
329 stfp->input_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
330 stfp->input_semantic_index[slot] = 1;
331 interpMode[slot] = TGSI_INTERPOLATE_LINEAR;
332 break;
333 case FRAG_ATTRIB_FOGC:
334 stfp->input_semantic_name[slot] = TGSI_SEMANTIC_FOG;
335 stfp->input_semantic_index[slot] = 0;
336 interpMode[slot] = TGSI_INTERPOLATE_PERSPECTIVE;
337 break;
338 case FRAG_ATTRIB_FACE:
339 stfp->input_semantic_name[slot] = TGSI_SEMANTIC_FACE;
340 stfp->input_semantic_index[slot] = 0;
341 interpMode[slot] = TGSI_INTERPOLATE_CONSTANT;
342 break;
343
344 /* In most cases, there is nothing special about these
345 * inputs, so adopt a convention to use the generic
346 * semantic name and the mesa FRAG_ATTRIB_ number as the
347 * index.
348 *
349 * All that is required is that the vertex shader labels
350 * its own outputs similarly, and that the vertex shader
351 * generates at least every output required by the
352 * fragment shader plus fixed-function hardware (such as
353 * BFC).
354 *
355 * There is no requirement that semantic indexes start at
356 * zero or be restricted to a particular range -- nobody
357 * should be building tables based on semantic index.
358 */
359 case FRAG_ATTRIB_TEX0:
360 case FRAG_ATTRIB_TEX1:
361 case FRAG_ATTRIB_TEX2:
362 case FRAG_ATTRIB_TEX3:
363 case FRAG_ATTRIB_TEX4:
364 case FRAG_ATTRIB_TEX5:
365 case FRAG_ATTRIB_TEX6:
366 case FRAG_ATTRIB_TEX7:
367 case FRAG_ATTRIB_PNTC:
368 case FRAG_ATTRIB_VAR0:
369 default:
370 /* Actually, let's try and zero-base this just for
371 * readability of the generated TGSI.
372 */
373 assert(attr >= FRAG_ATTRIB_TEX0);
374 stfp->input_semantic_index[slot] = (attr - FRAG_ATTRIB_TEX0);
375 stfp->input_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
376 interpMode[slot] = TGSI_INTERPOLATE_PERSPECTIVE;
377 break;
378 }
379 }
380 }
381
382 /*
383 * Semantics and mapping for outputs
384 */
385 {
386 uint numColors = 0;
387 GLbitfield64 outputsWritten = stfp->Base.Base.OutputsWritten;
388
389 /* if z is written, emit that first */
390 if (outputsWritten & (1 << FRAG_RESULT_DEPTH)) {
391 fs_output_semantic_name[fs_num_outputs] = TGSI_SEMANTIC_POSITION;
392 fs_output_semantic_index[fs_num_outputs] = 0;
393 outputMapping[FRAG_RESULT_DEPTH] = fs_num_outputs;
394 fs_num_outputs++;
395 outputsWritten &= ~(1 << FRAG_RESULT_DEPTH);
396 }
397
398 /* handle remaning outputs (color) */
399 for (attr = 0; attr < FRAG_RESULT_MAX; attr++) {
400 if (outputsWritten & (1 << attr)) {
401 switch (attr) {
402 case FRAG_RESULT_DEPTH:
403 /* handled above */
404 assert(0);
405 break;
406 default:
407 assert(attr == FRAG_RESULT_COLOR ||
408 (FRAG_RESULT_DATA0 <= attr && attr < FRAG_RESULT_MAX));
409 fs_output_semantic_name[fs_num_outputs] = TGSI_SEMANTIC_COLOR;
410 fs_output_semantic_index[fs_num_outputs] = numColors;
411 outputMapping[attr] = fs_num_outputs;
412 numColors++;
413 break;
414 }
415
416 fs_num_outputs++;
417 }
418 }
419 }
420
421 if (!inputMapping)
422 inputMapping = defaultInputMapping;
423
424 ureg = ureg_create( TGSI_PROCESSOR_FRAGMENT );
425 if (ureg == NULL)
426 return;
427
428
429 error =
430 st_translate_mesa_program(st->ctx,
431 TGSI_PROCESSOR_FRAGMENT,
432 ureg,
433 &stfp->Base.Base,
434 /* inputs */
435 fs_num_inputs,
436 inputMapping,
437 stfp->input_semantic_name,
438 stfp->input_semantic_index,
439 interpMode,
440 /* outputs */
441 fs_num_outputs,
442 outputMapping,
443 fs_output_semantic_name,
444 fs_output_semantic_index, FALSE );
445
446 stfp->state.tokens = ureg_get_tokens( ureg, NULL );
447 ureg_destroy( ureg );
448 stfp->driver_shader = pipe->create_fs_state(pipe, &stfp->state);
449
450 if ((ST_DEBUG & DEBUG_TGSI) && (ST_DEBUG & DEBUG_MESA)) {
451 _mesa_print_program(&stfp->Base.Base);
452 debug_printf("\n");
453 }
454
455 if (ST_DEBUG & DEBUG_TGSI) {
456 tgsi_dump( stfp->state.tokens, 0/*TGSI_DUMP_VERBOSE*/ );
457 debug_printf("\n");
458 }
459 }
460
461
462 /**
463 * Debug- print current shader text
464 */
465 void
466 st_print_shaders(GLcontext *ctx)
467 {
468 struct gl_shader_program *shProg = ctx->Shader.CurrentProgram;
469 if (shProg) {
470 GLuint i;
471 for (i = 0; i < shProg->NumShaders; i++) {
472 printf("GLSL shader %u of %u:\n", i, shProg->NumShaders);
473 printf("%s\n", shProg->Shaders[i]->Source);
474 }
475 }
476 }