gallium: interface changes necessary to implement transform feedback (v5)
[mesa.git] / src / gallium / state_trackers / vega / shaders_cache.c
1 /**************************************************************************
2 *
3 * Copyright 2009 VMware, Inc. All Rights Reserved.
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the
7 * "Software"), to deal in the Software without restriction, including
8 * without limitation the rights to use, copy, modify, merge, publish,
9 * distribute, sub license, and/or sell copies of the Software, and to
10 * permit persons to whom the Software is furnished to do so, subject to
11 * the following conditions:
12 *
13 * The above copyright notice and this permission notice (including the
14 * next paragraph) shall be included in all copies or substantial portions
15 * of the Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
18 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
19 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
20 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
21 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
22 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
23 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
24 *
25 **************************************************************************/
26
27 #include "shaders_cache.h"
28
29 #include "vg_context.h"
30
31 #include "pipe/p_context.h"
32 #include "pipe/p_defines.h"
33 #include "pipe/p_shader_tokens.h"
34
35 #include "tgsi/tgsi_build.h"
36 #include "tgsi/tgsi_dump.h"
37 #include "tgsi/tgsi_parse.h"
38 #include "tgsi/tgsi_util.h"
39 #include "tgsi/tgsi_text.h"
40
41 #include "util/u_memory.h"
42 #include "util/u_math.h"
43 #include "util/u_debug.h"
44 #include "cso_cache/cso_hash.h"
45 #include "cso_cache/cso_context.h"
46
47 #include "VG/openvg.h"
48
49 #include "asm_fill.h"
50
51 /* Essentially we construct an ubber-shader based on the state
52 * of the pipeline. The stages are:
53 * 1) Paint generation (color/gradient/pattern)
54 * 2) Image composition (normal/multiply/stencil)
55 * 3) Color transform
56 * 4) Per-channel alpha generation
57 * 5) Extended blend (multiply/screen/darken/lighten)
58 * 6) Mask
59 * 7) Premultiply/Unpremultiply
60 * 8) Color transform (to black and white)
61 */
62 #define SHADER_STAGES 8
63
64 struct cached_shader {
65 void *driver_shader;
66 struct pipe_shader_state state;
67 };
68
69 struct shaders_cache {
70 struct vg_context *pipe;
71
72 struct cso_hash *hash;
73 };
74
75
76 static INLINE struct tgsi_token *tokens_from_assembly(const char *txt, int num_tokens)
77 {
78 struct tgsi_token *tokens;
79
80 tokens = (struct tgsi_token *) MALLOC(num_tokens * sizeof(tokens[0]));
81
82 tgsi_text_translate(txt, tokens, num_tokens);
83
84 #if DEBUG_SHADERS
85 tgsi_dump(tokens, 0);
86 #endif
87
88 return tokens;
89 }
90
91 /*
92 static const char max_shader_preamble[] =
93 "FRAG\n"
94 "DCL IN[0], POSITION, LINEAR\n"
95 "DCL IN[1], GENERIC[0], PERSPECTIVE\n"
96 "DCL OUT[0], COLOR, CONSTANT\n"
97 "DCL CONST[0..9], CONSTANT\n"
98 "DCL TEMP[0..9], CONSTANT\n"
99 "DCL SAMP[0..9], CONSTANT\n";
100
101 max_shader_preamble strlen == 175
102 */
103 #define MAX_PREAMBLE 175
104
105 static INLINE VGint range_min(VGint min, VGint current)
106 {
107 if (min < 0)
108 min = current;
109 else
110 min = MIN2(min, current);
111 return min;
112 }
113
114 static INLINE VGint range_max(VGint max, VGint current)
115 {
116 return MAX2(max, current);
117 }
118
119 static void *
120 combine_shaders(const struct shader_asm_info *shaders[SHADER_STAGES], int num_shaders,
121 struct pipe_context *pipe,
122 struct pipe_shader_state *shader)
123 {
124 VGboolean declare_input = VG_FALSE;
125 VGint start_const = -1, end_const = 0;
126 VGint start_temp = -1, end_temp = 0;
127 VGint start_sampler = -1, end_sampler = 0;
128 VGint i, current_shader = 0;
129 VGint num_consts, num_temps, num_samplers;
130 struct ureg_program *ureg;
131 struct ureg_src in[2];
132 struct ureg_src *sampler = NULL;
133 struct ureg_src *constant = NULL;
134 struct ureg_dst out, *temp = NULL;
135 void *p = NULL;
136
137 for (i = 0; i < num_shaders; ++i) {
138 if (shaders[i]->num_consts)
139 start_const = range_min(start_const, shaders[i]->start_const);
140 if (shaders[i]->num_temps)
141 start_temp = range_min(start_temp, shaders[i]->start_temp);
142 if (shaders[i]->num_samplers)
143 start_sampler = range_min(start_sampler, shaders[i]->start_sampler);
144
145 end_const = range_max(end_const, shaders[i]->start_const +
146 shaders[i]->num_consts);
147 end_temp = range_max(end_temp, shaders[i]->start_temp +
148 shaders[i]->num_temps);
149 end_sampler = range_max(end_sampler, shaders[i]->start_sampler +
150 shaders[i]->num_samplers);
151 if (shaders[i]->needs_position)
152 declare_input = VG_TRUE;
153 }
154 /* if they're still unitialized, initialize them */
155 if (start_const < 0)
156 start_const = 0;
157 if (start_temp < 0)
158 start_temp = 0;
159 if (start_sampler < 0)
160 start_sampler = 0;
161
162 num_consts = end_const - start_const;
163 num_temps = end_temp - start_temp;
164 num_samplers = end_sampler - start_sampler;
165
166 ureg = ureg_create(TGSI_PROCESSOR_FRAGMENT);
167 if (!ureg)
168 return NULL;
169
170 if (declare_input) {
171 in[0] = ureg_DECL_fs_input(ureg,
172 TGSI_SEMANTIC_POSITION,
173 0,
174 TGSI_INTERPOLATE_LINEAR);
175 in[1] = ureg_DECL_fs_input(ureg,
176 TGSI_SEMANTIC_GENERIC,
177 0,
178 TGSI_INTERPOLATE_PERSPECTIVE);
179 }
180
181 /* we always have a color output */
182 out = ureg_DECL_output(ureg, TGSI_SEMANTIC_COLOR, 0);
183
184 if (num_consts >= 1) {
185 constant = (struct ureg_src *) malloc(sizeof(struct ureg_src) * end_const);
186 for (i = start_const; i < end_const; i++) {
187 constant[i] = ureg_DECL_constant(ureg, i);
188 }
189
190 }
191
192 if (num_temps >= 1) {
193 temp = (struct ureg_dst *) malloc(sizeof(struct ureg_dst) * end_temp);
194 for (i = start_temp; i < end_temp; i++) {
195 temp[i] = ureg_DECL_temporary(ureg);
196 }
197 }
198
199 if (num_samplers >= 1) {
200 sampler = (struct ureg_src *) malloc(sizeof(struct ureg_src) * end_sampler);
201 for (i = start_sampler; i < end_sampler; i++) {
202 sampler[i] = ureg_DECL_sampler(ureg, i);
203 }
204 }
205
206 while (current_shader < num_shaders) {
207 if ((current_shader + 1) == num_shaders) {
208 shaders[current_shader]->func(ureg,
209 &out,
210 in,
211 sampler,
212 temp,
213 constant);
214 } else {
215 shaders[current_shader]->func(ureg,
216 &temp[0],
217 in,
218 sampler,
219 temp,
220 constant);
221 }
222 current_shader++;
223 }
224
225 ureg_END(ureg);
226
227 shader->tokens = ureg_finalize(ureg);
228 if(!shader->tokens)
229 return NULL;
230
231 p = pipe->create_fs_state(pipe, shader);
232
233 if (num_temps >= 1) {
234 for (i = start_temp; i < end_temp; i++) {
235 ureg_release_temporary(ureg, temp[i]);
236 }
237 }
238
239 ureg_destroy(ureg);
240
241 if (temp)
242 free(temp);
243 if (constant)
244 free(constant);
245 if (sampler)
246 free(sampler);
247
248 return p;
249 }
250
251 static void *
252 create_shader(struct pipe_context *pipe,
253 int id,
254 struct pipe_shader_state *shader)
255 {
256 int idx = 0, sh;
257 const struct shader_asm_info * shaders[SHADER_STAGES];
258
259 /* first stage */
260 sh = SHADERS_GET_PAINT_SHADER(id);
261 switch (sh << SHADERS_PAINT_SHIFT) {
262 case VEGA_SOLID_FILL_SHADER:
263 case VEGA_LINEAR_GRADIENT_SHADER:
264 case VEGA_RADIAL_GRADIENT_SHADER:
265 case VEGA_PATTERN_SHADER:
266 case VEGA_PAINT_DEGENERATE_SHADER:
267 shaders[idx] = &shaders_paint_asm[(sh >> SHADERS_PAINT_SHIFT) - 1];
268 assert(shaders[idx]->id == sh);
269 idx++;
270 break;
271 default:
272 break;
273 }
274
275 /* second stage */
276 sh = SHADERS_GET_IMAGE_SHADER(id);
277 switch (sh) {
278 case VEGA_IMAGE_NORMAL_SHADER:
279 case VEGA_IMAGE_MULTIPLY_SHADER:
280 case VEGA_IMAGE_STENCIL_SHADER:
281 shaders[idx] = &shaders_image_asm[(sh >> SHADERS_IMAGE_SHIFT) - 1];
282 assert(shaders[idx]->id == sh);
283 idx++;
284 break;
285 default:
286 break;
287 }
288
289 /* sanity check */
290 assert(idx == ((!sh || sh == VEGA_IMAGE_NORMAL_SHADER) ? 1 : 2));
291
292 /* third stage */
293 sh = SHADERS_GET_COLOR_TRANSFORM_SHADER(id);
294 switch (sh) {
295 case VEGA_COLOR_TRANSFORM_SHADER:
296 shaders[idx] = &shaders_color_transform_asm[
297 (sh >> SHADERS_COLOR_TRANSFORM_SHIFT) - 1];
298 assert(shaders[idx]->id == sh);
299 idx++;
300 break;
301 default:
302 break;
303 }
304
305 /* fourth stage */
306 sh = SHADERS_GET_ALPHA_SHADER(id);
307 switch (sh) {
308 case VEGA_ALPHA_NORMAL_SHADER:
309 case VEGA_ALPHA_PER_CHANNEL_SHADER:
310 shaders[idx] = &shaders_alpha_asm[
311 (sh >> SHADERS_ALPHA_SHIFT) - 1];
312 assert(shaders[idx]->id == sh);
313 idx++;
314 break;
315 default:
316 break;
317 }
318
319 /* fifth stage */
320 sh = SHADERS_GET_BLEND_SHADER(id);
321 switch (sh) {
322 case VEGA_BLEND_SRC_SHADER:
323 case VEGA_BLEND_SRC_OVER_SHADER:
324 case VEGA_BLEND_DST_OVER_SHADER:
325 case VEGA_BLEND_SRC_IN_SHADER:
326 case VEGA_BLEND_DST_IN_SHADER:
327 case VEGA_BLEND_MULTIPLY_SHADER:
328 case VEGA_BLEND_SCREEN_SHADER:
329 case VEGA_BLEND_DARKEN_SHADER:
330 case VEGA_BLEND_LIGHTEN_SHADER:
331 case VEGA_BLEND_ADDITIVE_SHADER:
332 shaders[idx] = &shaders_blend_asm[(sh >> SHADERS_BLEND_SHIFT) - 1];
333 assert(shaders[idx]->id == sh);
334 idx++;
335 break;
336 default:
337 break;
338 }
339
340 /* sixth stage */
341 sh = SHADERS_GET_MASK_SHADER(id);
342 switch (sh) {
343 case VEGA_MASK_SHADER:
344 shaders[idx] = &shaders_mask_asm[(sh >> SHADERS_MASK_SHIFT) - 1];
345 assert(shaders[idx]->id == sh);
346 idx++;
347 break;
348 default:
349 break;
350 }
351
352 /* seventh stage */
353 sh = SHADERS_GET_PREMULTIPLY_SHADER(id);
354 switch (sh) {
355 case VEGA_PREMULTIPLY_SHADER:
356 case VEGA_UNPREMULTIPLY_SHADER:
357 shaders[idx] = &shaders_premultiply_asm[
358 (sh >> SHADERS_PREMULTIPLY_SHIFT) - 1];
359 assert(shaders[idx]->id == sh);
360 idx++;
361 break;
362 default:
363 break;
364 }
365
366 /* eighth stage */
367 sh = SHADERS_GET_BW_SHADER(id);
368 switch (sh) {
369 case VEGA_BW_SHADER:
370 shaders[idx] = &shaders_bw_asm[(sh >> SHADERS_BW_SHIFT) - 1];
371 assert(shaders[idx]->id == sh);
372 idx++;
373 break;
374 default:
375 break;
376 }
377
378 return combine_shaders(shaders, idx, pipe, shader);
379 }
380
381 /*************************************************/
382
383 struct shaders_cache * shaders_cache_create(struct vg_context *vg)
384 {
385 struct shaders_cache *sc = CALLOC_STRUCT(shaders_cache);
386
387 sc->pipe = vg;
388 sc->hash = cso_hash_create();
389
390 return sc;
391 }
392
393 void shaders_cache_destroy(struct shaders_cache *sc)
394 {
395 struct cso_hash_iter iter = cso_hash_first_node(sc->hash);
396
397 while (!cso_hash_iter_is_null(iter)) {
398 struct cached_shader *cached =
399 (struct cached_shader *)cso_hash_iter_data(iter);
400 cso_delete_fragment_shader(sc->pipe->cso_context,
401 cached->driver_shader);
402 iter = cso_hash_erase(sc->hash, iter);
403 }
404
405 cso_hash_delete(sc->hash);
406 FREE(sc);
407 }
408
409 void * shaders_cache_fill(struct shaders_cache *sc,
410 int shader_key)
411 {
412 VGint key = shader_key;
413 struct cached_shader *cached;
414 struct cso_hash_iter iter = cso_hash_find(sc->hash, key);
415
416 if (cso_hash_iter_is_null(iter)) {
417 cached = CALLOC_STRUCT(cached_shader);
418 cached->driver_shader = create_shader(sc->pipe->pipe, key, &cached->state);
419
420 cso_hash_insert(sc->hash, key, cached);
421
422 return cached->driver_shader;
423 }
424
425 cached = (struct cached_shader *)cso_hash_iter_data(iter);
426
427 assert(cached->driver_shader);
428 return cached->driver_shader;
429 }
430
431 struct vg_shader * shader_create_from_text(struct pipe_context *pipe,
432 const char *txt, int num_tokens,
433 int type)
434 {
435 struct vg_shader *shader = (struct vg_shader *)MALLOC(
436 sizeof(struct vg_shader));
437 struct tgsi_token *tokens = tokens_from_assembly(txt, num_tokens);
438 struct pipe_shader_state state;
439
440 debug_assert(type == PIPE_SHADER_VERTEX ||
441 type == PIPE_SHADER_FRAGMENT);
442
443 state.tokens = tokens;
444 memset(&state.stream_output, 0, sizeof(state.stream_output));
445 shader->type = type;
446 shader->tokens = tokens;
447
448 if (type == PIPE_SHADER_FRAGMENT)
449 shader->driver = pipe->create_fs_state(pipe, &state);
450 else
451 shader->driver = pipe->create_vs_state(pipe, &state);
452 return shader;
453 }
454
455 void vg_shader_destroy(struct vg_context *ctx, struct vg_shader *shader)
456 {
457 if (shader->type == PIPE_SHADER_FRAGMENT)
458 cso_delete_fragment_shader(ctx->cso_context, shader->driver);
459 else
460 cso_delete_vertex_shader(ctx->cso_context, shader->driver);
461 FREE(shader->tokens);
462 FREE(shader);
463 }