Revert "st/mesa: call nir_serialize only once per shader"
[mesa.git] / src / mesa / state_tracker / st_program.h
1 /**************************************************************************
2 *
3 * Copyright 2003 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /*
29 * Authors:
30 * Keith Whitwell <keithw@vmware.com>
31 */
32
33
34 #ifndef ST_PROGRAM_H
35 #define ST_PROGRAM_H
36
37 #include "main/mtypes.h"
38 #include "main/atifragshader.h"
39 #include "program/program.h"
40 #include "pipe/p_state.h"
41 #include "tgsi/tgsi_from_mesa.h"
42 #include "st_context.h"
43 #include "st_texture.h"
44 #include "st_glsl_to_tgsi.h"
45
46 #ifdef __cplusplus
47 extern "C" {
48 #endif
49
50 #define ST_DOUBLE_ATTRIB_PLACEHOLDER 0xff
51
52 struct st_external_sampler_key
53 {
54 GLuint lower_nv12; /**< bitmask of 2 plane YUV samplers */
55 GLuint lower_iyuv; /**< bitmask of 3 plane YUV samplers */
56 GLuint lower_xy_uxvx; /**< bitmask of 2 plane YUV samplers */
57 GLuint lower_yx_xuxv; /**< bitmask of 2 plane YUV samplers */
58 GLuint lower_ayuv;
59 GLuint lower_xyuv;
60 };
61
62 static inline struct st_external_sampler_key
63 st_get_external_sampler_key(struct st_context *st, struct gl_program *prog)
64 {
65 unsigned mask = prog->ExternalSamplersUsed;
66 struct st_external_sampler_key key;
67
68 memset(&key, 0, sizeof(key));
69
70 while (unlikely(mask)) {
71 unsigned unit = u_bit_scan(&mask);
72 struct st_texture_object *stObj =
73 st_get_texture_object(st->ctx, prog, unit);
74
75 switch (st_get_view_format(stObj)) {
76 case PIPE_FORMAT_NV12:
77 case PIPE_FORMAT_P016:
78 key.lower_nv12 |= (1 << unit);
79 break;
80 case PIPE_FORMAT_IYUV:
81 key.lower_iyuv |= (1 << unit);
82 break;
83 case PIPE_FORMAT_YUYV:
84 key.lower_yx_xuxv |= (1 << unit);
85 break;
86 case PIPE_FORMAT_UYVY:
87 key.lower_xy_uxvx |= (1 << unit);
88 break;
89 case PIPE_FORMAT_AYUV:
90 key.lower_ayuv |= (1 << unit);
91 break;
92 case PIPE_FORMAT_XYUV:
93 key.lower_xyuv |= (1 << unit);
94 break;
95 default:
96 printf("mesa: st_get_external_sampler_key: unhandled pipe format %u\n",
97 st_get_view_format(stObj));
98 break;
99 }
100 }
101
102 return key;
103 }
104
105 /** Fragment program variant key */
106 struct st_fp_variant_key
107 {
108 struct st_context *st; /**< variants are per-context */
109
110 /** for glBitmap */
111 GLuint bitmap:1; /**< glBitmap variant? */
112
113 /** for glDrawPixels */
114 GLuint drawpixels:1; /**< glDrawPixels variant */
115 GLuint scaleAndBias:1; /**< glDrawPixels w/ scale and/or bias? */
116 GLuint pixelMaps:1; /**< glDrawPixels w/ pixel lookup map? */
117
118 /** for ARB_color_buffer_float */
119 GLuint clamp_color:1;
120
121 /** for ARB_sample_shading */
122 GLuint persample_shading:1;
123
124 /** needed for ATI_fragment_shader */
125 GLuint fog:2;
126
127 /** for ARB_depth_clamp */
128 GLuint lower_depth_clamp:1;
129
130 /** for OpenGL 1.0 on modern hardware */
131 GLuint lower_two_sided_color:1;
132
133 GLuint lower_flatshade:1;
134 enum compare_func lower_alpha_func:3;
135
136 /** needed for ATI_fragment_shader */
137 char texture_targets[MAX_NUM_FRAGMENT_REGISTERS_ATI];
138
139 struct st_external_sampler_key external;
140 };
141
142
143 /**
144 * Variant of a fragment program.
145 */
146 struct st_fp_variant
147 {
148 /** Parameters which generated this version of fragment program */
149 struct st_fp_variant_key key;
150
151 /** Driver's compiled shader */
152 void *driver_shader;
153
154 /** For glBitmap variants */
155 uint bitmap_sampler;
156
157 /** For glDrawPixels variants */
158 unsigned drawpix_sampler;
159 unsigned pixelmap_sampler;
160
161 /** next in linked list */
162 struct st_fp_variant *next;
163 };
164
165
/**
 * Shader key shared by other shaders.
 *
 * Used as the key of both st_vp_variant and st_common_variant.  All flags
 * are plain C99 \c bool so that any non-zero value stored into them is
 * normalized to 1.
 */
struct st_common_variant_key
{
   struct st_context *st;          /**< variants are per-context */
   bool passthrough_edgeflags;

   /** for ARB_color_buffer_float */
   bool clamp_color;

   /** both for ARB_depth_clamp */
   bool lower_depth_clamp;
   bool clip_negative_one_to_one;

   /** lower glPointSize to gl_PointSize */
   bool lower_point_size;

   /* for user-defined clip-planes */
   uint8_t lower_ucp;
};
185
186
187 /**
188 * This represents a vertex program, especially translated to match
189 * the inputs of a particular fragment shader.
190 */
191 struct st_vp_variant
192 {
193 /* Parameters which generated this translated version of a vertex
194 * shader:
195 */
196 struct st_common_variant_key key;
197
198 /**
199 * The shader variant saved for the draw module to later emulate
200 * selection/feedback/rasterpos.
201 */
202 const struct tgsi_token *tokens;
203
204 /** Driver's compiled shader */
205 void *driver_shader;
206
207 /** For using our private draw module (glRasterPos) */
208 struct draw_vertex_shader *draw_shader;
209
210 /** Next in linked list */
211 struct st_vp_variant *next;
212
213 /** similar to that in st_vertex_program, but with edgeflags info too */
214 GLuint num_inputs;
215
216 /** Bitfield of VERT_BIT_* bits of mesa vertex processing inputs */
217 GLbitfield vert_attrib_mask;
218 };
219
220
221 /**
222 * Geometry program variant.
223 */
224 struct st_common_variant
225 {
226 /* Parameters which generated this variant. */
227 struct st_common_variant_key key;
228
229 void *driver_shader;
230
231 struct st_common_variant *next;
232 };
233
234
235 /**
236 * Derived from Mesa gl_program:
237 */
238 struct st_program
239 {
240 struct gl_program Base;
241 struct pipe_shader_state state;
242 struct glsl_to_tgsi_visitor* glsl_to_tgsi;
243 struct ati_fragment_shader *ati_fs;
244 uint64_t affected_states; /**< ST_NEW_* flags to mark dirty when binding */
245
246 void *nir_binary;
247 unsigned nir_size;
248
249 /* used when bypassing glsl_to_tgsi: */
250 struct gl_shader_program *shader_program;
251
252 union {
253 struct st_common_variant *variants;
254 struct st_vp_variant *vp_variants;
255 struct st_fp_variant *fp_variants;
256 };
257 };
258
259
260 struct st_vertex_program
261 {
262 struct st_program Base;
263
264 /** maps a TGSI input index back to a Mesa VERT_ATTRIB_x */
265 ubyte index_to_input[PIPE_MAX_ATTRIBS];
266 ubyte num_inputs;
267 /** Reverse mapping of the above */
268 ubyte input_to_index[VERT_ATTRIB_MAX];
269
270 /** Maps VARYING_SLOT_x to slot */
271 ubyte result_to_output[VARYING_SLOT_MAX];
272 };
273
274
/**
 * Cast a gl_program pointer to the st_program that contains it.
 *
 * \param cp  program pointer; returned unchanged, only retyped
 */
static inline struct st_program *
st_program(struct gl_program *cp)
{
   struct st_program *stp = (struct st_program *)cp;

   return stp;
}
280
281 static inline void
282 st_reference_prog(struct st_context *st,
283 struct st_program **ptr,
284 struct st_program *prog)
285 {
286 _mesa_reference_program(st->ctx,
287 (struct gl_program **) ptr,
288 (struct gl_program *) prog);
289 }
290
291 /**
292 * This defines mapping from Mesa VARYING_SLOTs to TGSI GENERIC slots.
293 */
294 static inline unsigned
295 st_get_generic_varying_index(struct st_context *st, GLuint attr)
296 {
297 return tgsi_get_generic_gl_varying_index((gl_varying_slot)attr,
298 st->needs_texcoord_semantic);
299 }
300
/* Function declarations have external linkage by default, so the
 * "extern" keyword is omitted throughout.
 */

void
st_set_prog_affected_state_flags(struct gl_program *prog);

/* --- Variant lookup: one entry point per variant/key type --- */

struct st_vp_variant *
st_get_vp_variant(struct st_context *st,
                  struct st_program *stvp,
                  const struct st_common_variant_key *key);

struct st_fp_variant *
st_get_fp_variant(struct st_context *st,
                  struct st_program *stfp,
                  const struct st_fp_variant_key *key);

struct st_common_variant *
st_get_common_variant(struct st_context *st,
                      struct st_program *p,
                      const struct st_common_variant_key *key);

/* --- Variant release / destruction --- */

void
st_release_vp_variants(struct st_context *st, struct st_program *stvp);

void
st_release_fp_variants(struct st_context *st, struct st_program *stfp);

void
st_release_common_variants(struct st_context *st, struct st_program *p);

void
st_destroy_program_variants(struct st_context *st);

/* --- Program preparation and translation --- */

void
st_finalize_nir_before_variants(struct nir_shader *nir);

void
st_prepare_vertex_program(struct st_program *stvp);

void
st_translate_stream_output_info(struct gl_program *prog);

bool
st_translate_vertex_program(struct st_context *st, struct st_program *stvp);

bool
st_translate_fragment_program(struct st_context *st, struct st_program *stfp);

bool
st_translate_common_program(struct st_context *st, struct st_program *stp);

void
st_finalize_program(struct st_context *st, struct gl_program *prog);
357
358 #ifdef __cplusplus
359 }
360 #endif
361
362 #endif