r300: Clean emit code.
[mesa.git] / src / mesa / drivers / dri / r300 / r300_context.h
1 /*
2 Copyright (C) The Weather Channel, Inc. 2002. All Rights Reserved.
3
4 The Weather Channel (TM) funded Tungsten Graphics to develop the
5 initial release of the Radeon 8500 driver under the XFree86 license.
6 This notice must be preserved.
7
8 Permission is hereby granted, free of charge, to any person obtaining
9 a copy of this software and associated documentation files (the
10 "Software"), to deal in the Software without restriction, including
11 without limitation the rights to use, copy, modify, merge, publish,
12 distribute, sublicense, and/or sell copies of the Software, and to
13 permit persons to whom the Software is furnished to do so, subject to
14 the following conditions:
15
16 The above copyright notice and this permission notice (including the
17 next paragraph) shall be included in all copies or substantial
18 portions of the Software.
19
20 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
21 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
22 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
23 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
24 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
25 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
26 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27
28 **************************************************************************/
29
30 /**
31 * \file
32 *
33 * \author Keith Whitwell <keith@tungstengraphics.com>
34 * \author Nicolai Haehnle <prefect_@gmx.net>
35 */
36
37 #ifndef __R300_CONTEXT_H__
38 #define __R300_CONTEXT_H__
39
40 #include "drm.h"
41 #include "radeon_drm.h"
42 #include "dri_util.h"
43 #include "radeon_common.h"
44
45 #include "main/mtypes.h"
46 #include "shader/prog_instruction.h"
47 #include "compiler/radeon_code.h"
48
49 struct r300_context;
50 typedef struct r300_context r300ContextRec;
51 typedef struct r300_context *r300ContextPtr;
52
53
54 #include "r300_vertprog.h"
55
56
57 /* The blit width for texture uploads
58 */
59 #define R300_BLIT_WIDTH_BYTES 1024
60 #define R300_MAX_TEXTURE_UNITS 8
61
62
63
64 #define R300_VPT_CMD_0 0
65 #define R300_VPT_XSCALE 1
66 #define R300_VPT_XOFFSET 2
67 #define R300_VPT_YSCALE 3
68 #define R300_VPT_YOFFSET 4
69 #define R300_VPT_ZSCALE 5
70 #define R300_VPT_ZOFFSET 6
71 #define R300_VPT_CMDSIZE 7
72
73 #define R300_VIR_CMD_0 0 /* vir is variable size (at least 1) */
74 #define R300_VIR_CNTL_0 1
75 #define R300_VIR_CNTL_1 2
76 #define R300_VIR_CNTL_2 3
77 #define R300_VIR_CNTL_3 4
78 #define R300_VIR_CNTL_4 5
79 #define R300_VIR_CNTL_5 6
80 #define R300_VIR_CNTL_6 7
81 #define R300_VIR_CNTL_7 8
82 #define R300_VIR_CMDSIZE 9
83
84 #define R300_VIC_CMD_0 0
85 #define R300_VIC_CNTL_0 1
86 #define R300_VIC_CNTL_1 2
87 #define R300_VIC_CMDSIZE 3
88
89 #define R300_VOF_CMD_0 0
90 #define R300_VOF_CNTL_0 1
91 #define R300_VOF_CNTL_1 2
92 #define R300_VOF_CMDSIZE 3
93
94 #define R300_PVS_CMD_0 0
95 #define R300_PVS_CNTL_1 1
96 #define R300_PVS_CNTL_2 2
97 #define R300_PVS_CNTL_3 3
98 #define R300_PVS_CMDSIZE 4
99
100 #define R300_GB_MISC_CMD_0 0
101 #define R300_GB_MISC_MSPOS_0 1
102 #define R300_GB_MISC_MSPOS_1 2
103 #define R300_GB_MISC_TILE_CONFIG 3
104 #define R300_GB_MISC_CMDSIZE 4
105 #define R300_GB_MISC2_CMD_0 0
106 #define R300_GB_MISC2_SELECT 1
107 #define R300_GB_MISC2_AA_CONFIG 2
108 #define R300_GB_MISC2_CMDSIZE 3
109
110 #define R300_TXE_CMD_0 0
111 #define R300_TXE_ENABLE 1
112 #define R300_TXE_CMDSIZE 2
113
114 #define R300_PS_CMD_0 0
115 #define R300_PS_POINTSIZE 1
116 #define R300_PS_CMDSIZE 2
117
118 #define R300_ZBS_CMD_0 0
119 #define R300_ZBS_T_FACTOR 1
120 #define R300_ZBS_T_CONSTANT 2
121 #define R300_ZBS_W_FACTOR 3
122 #define R300_ZBS_W_CONSTANT 4
123 #define R300_ZBS_CMDSIZE 5
124
125 #define R300_CUL_CMD_0 0
126 #define R300_CUL_CULL 1
127 #define R300_CUL_CMDSIZE 2
128
129 #define R300_RC_CMD_0 0
130 #define R300_RC_CNTL_0 1
131 #define R300_RC_CNTL_1 2
132 #define R300_RC_CMDSIZE 3
133
134 #define R300_RI_CMD_0 0
135 #define R300_RI_INTERP_0 1
136 #define R300_RI_INTERP_1 2
137 #define R300_RI_INTERP_2 3
138 #define R300_RI_INTERP_3 4
139 #define R300_RI_INTERP_4 5
140 #define R300_RI_INTERP_5 6
141 #define R300_RI_INTERP_6 7
142 #define R300_RI_INTERP_7 8
143 #define R300_RI_CMDSIZE 9
144
145 #define R500_RI_CMDSIZE 17
146
147 #define R300_RR_CMD_0 0 /* rr is variable size (at least 1) */
148 #define R300_RR_INST_0 1
149 #define R300_RR_INST_1 2
150 #define R300_RR_INST_2 3
151 #define R300_RR_INST_3 4
152 #define R300_RR_INST_4 5
153 #define R300_RR_INST_5 6
154 #define R300_RR_INST_6 7
155 #define R300_RR_INST_7 8
156 #define R300_RR_CMDSIZE 9
157
158 #define R300_FP_CMD_0 0
159 #define R300_FP_CNTL0 1
160 #define R300_FP_CNTL1 2
161 #define R300_FP_CNTL2 3
162 #define R300_FP_CMD_1 4
163 #define R300_FP_NODE0 5
164 #define R300_FP_NODE1 6
165 #define R300_FP_NODE2 7
166 #define R300_FP_NODE3 8
167 #define R300_FP_CMDSIZE 9
168
169 #define R500_FP_CMD_0 0
170 #define R500_FP_CNTL 1
171 #define R500_FP_PIXSIZE 2
172 #define R500_FP_CMD_1 3
173 #define R500_FP_CODE_ADDR 4
174 #define R500_FP_CODE_RANGE 5
175 #define R500_FP_CODE_OFFSET 6
176 #define R500_FP_CMD_2 7
177 #define R500_FP_FC_CNTL 8
178 #define R500_FP_CMDSIZE 9
179
180 #define R300_FPT_CMD_0 0
181 #define R300_FPT_INSTR_0 1
182 #define R300_FPT_CMDSIZE 65
183
184 #define R300_FPI_CMD_0 0
185 #define R300_FPI_INSTR_0 1
186 #define R300_FPI_CMDSIZE 65
187 /* R500 has space for 512 instructions - 6 dwords per instruction */
188 #define R500_FPI_CMDSIZE (512*6+1)
189
190 #define R300_FPP_CMD_0 0
191 #define R300_FPP_PARAM_0 1
192 #define R300_FPP_CMDSIZE (32*4+1)
193 /* R500 has spcae for 256 constants - 4 dwords per constant */
194 #define R500_FPP_CMDSIZE (256*4+1)
195
196 #define R300_FOGS_CMD_0 0
197 #define R300_FOGS_STATE 1
198 #define R300_FOGS_CMDSIZE 2
199
200 #define R300_FOGC_CMD_0 0
201 #define R300_FOGC_R 1
202 #define R300_FOGC_G 2
203 #define R300_FOGC_B 3
204 #define R300_FOGC_CMDSIZE 4
205
206 #define R300_FOGP_CMD_0 0
207 #define R300_FOGP_SCALE 1
208 #define R300_FOGP_START 2
209 #define R300_FOGP_CMDSIZE 3
210
211 #define R300_AT_CMD_0 0
212 #define R300_AT_ALPHA_TEST 1
213 #define R300_AT_UNKNOWN 2
214 #define R300_AT_CMDSIZE 3
215
216 #define R300_BLD_CMD_0 0
217 #define R300_BLD_CBLEND 1
218 #define R300_BLD_ABLEND 2
219 #define R300_BLD_CMDSIZE 3
220
221 #define R300_CMK_CMD_0 0
222 #define R300_CMK_COLORMASK 1
223 #define R300_CMK_CMDSIZE 2
224
225 #define R300_CB_CMD_0 0
226 #define R300_CB_OFFSET 1
227 #define R300_CB_CMD_1 2
228 #define R300_CB_PITCH 3
229 #define R300_CB_CMDSIZE 4
230
231 #define R300_ZS_CMD_0 0
232 #define R300_ZS_CNTL_0 1
233 #define R300_ZS_CNTL_1 2
234 #define R300_ZS_CNTL_2 3
235 #define R300_ZS_CMDSIZE 4
236
237 #define R300_ZB_CMD_0 0
238 #define R300_ZB_OFFSET 1
239 #define R300_ZB_PITCH 2
240 #define R300_ZB_CMDSIZE 3
241
242 #define R300_VAP_CNTL_FLUSH 0
243 #define R300_VAP_CNTL_FLUSH_1 1
244 #define R300_VAP_CNTL_CMD 2
245 #define R300_VAP_CNTL_INSTR 3
246 #define R300_VAP_CNTL_SIZE 4
247
248 #define R300_VPI_CMD_0 0
249 #define R300_VPI_INSTR_0 1
250 #define R300_VPI_CMDSIZE 1025 /* 256 16 byte instructions */
251
252 #define R300_VPP_CMD_0 0
253 #define R300_VPP_PARAM_0 1
254 #define R300_VPP_CMDSIZE 1025 /* 256 4-component parameters */
255
256 #define R300_VPUCP_CMD_0 0
257 #define R300_VPUCP_X 1
258 #define R300_VPUCP_Y 2
259 #define R300_VPUCP_Z 3
260 #define R300_VPUCP_W 4
261 #define R300_VPUCP_CMDSIZE 5 /* 256 4-component parameters */
262
263 #define R300_VPS_CMD_0 0
264 #define R300_VPS_ZERO_0 1
265 #define R300_VPS_ZERO_1 2
266 #define R300_VPS_POINTSIZE 3
267 #define R300_VPS_ZERO_3 4
268 #define R300_VPS_CMDSIZE 5
269
270 /* the layout is common for all fields inside tex */
271 #define R300_TEX_CMD_0 0
272 #define R300_TEX_VALUE_0 1
273 /* We don't really use this, instead specify mtu+1 dynamically
274 #define R300_TEX_CMDSIZE (MAX_TEXTURE_UNITS+1)
275 */
276
277 #define R300_QUERYOBJ_CMD_0 0
278 #define R300_QUERYOBJ_DATA_0 1
279 #define R300_QUERYOBJ_CMD_1 2
280 #define R300_QUERYOBJ_DATA_1 3
281 #define R300_QUERYOBJ_CMDSIZE 4
282
283 /**
284 * Cache for hardware register state.
285 */
286 struct r300_hw_state {
287 struct radeon_state_atom vpt; /* viewport (1D98) */
288 struct radeon_state_atom vap_cntl;
289 struct radeon_state_atom vap_index_offset; /* 0x208c r5xx only */
290 struct radeon_state_atom vof; /* VAP output format register 0x2090 */
291 struct radeon_state_atom vte; /* (20B0) */
292 struct radeon_state_atom vap_vf_max_vtx_indx; /* Maximum Vertex Indx Clamp (2134) */
293 struct radeon_state_atom vap_cntl_status;
294 struct radeon_state_atom vir[2]; /* vap input route (2150/21E0) */
295 struct radeon_state_atom vic; /* vap input control (2180) */
296 struct radeon_state_atom vap_psc_sgn_norm_cntl; /* Programmable Stream Control Signed Normalize Control (21DC) */
297 struct radeon_state_atom vap_clip_cntl;
298 struct radeon_state_atom vap_clip;
299 struct radeon_state_atom vap_pvs_vtx_timeout_reg; /* Vertex timeout register (2288) */
300 struct radeon_state_atom pvs; /* pvs_cntl (22D0) */
301 struct radeon_state_atom gb_enable; /* (4008) */
302 struct radeon_state_atom gb_misc; /* Multisampling position shifts ? (4010) */
303 struct radeon_state_atom gb_misc2; /* Multisampling position shifts ? (4010) */
304 struct radeon_state_atom ga_point_s0; /* S Texture Coordinate of Vertex 0 for Point texture stuffing (LLC) (4200) */
305 struct radeon_state_atom ga_triangle_stipple; /* (4214) */
306 struct radeon_state_atom ps; /* pointsize (421C) */
307 struct radeon_state_atom ga_point_minmax; /* (4230) */
308 struct radeon_state_atom lcntl; /* line control */
309 struct radeon_state_atom ga_line_stipple; /* (4260) */
310 struct radeon_state_atom shade;
311 struct radeon_state_atom shade2;
312 struct radeon_state_atom polygon_mode;
313 struct radeon_state_atom fogp; /* fog parameters (4294) */
314 struct radeon_state_atom ga_soft_reset; /* (429C) */
315 struct radeon_state_atom zbias_cntl;
316 struct radeon_state_atom zbs; /* zbias (42A4) */
317 struct radeon_state_atom occlusion_cntl;
318 struct radeon_state_atom cul; /* cull cntl (42B8) */
319 struct radeon_state_atom su_depth_scale; /* (42C0) */
320 struct radeon_state_atom rc; /* rs control (4300) */
321 struct radeon_state_atom ri; /* rs interpolators (4310) */
322 struct radeon_state_atom rr; /* rs route (4330) */
323 struct radeon_state_atom sc_hyperz; /* (43A4) */
324 struct radeon_state_atom sc_screendoor; /* (43E8) */
325 struct radeon_state_atom fp; /* fragment program cntl + nodes (4600) */
326 struct radeon_state_atom fpt; /* texi - (4620) */
327 struct radeon_state_atom us_out_fmt; /* (46A4) */
328 struct radeon_state_atom r500fp; /* r500 fp instructions */
329 struct radeon_state_atom r500fp_const; /* r500 fp constants */
330 struct radeon_state_atom fpi[4]; /* fp instructions (46C0/47C0/48C0/49C0) */
331 struct radeon_state_atom fogs; /* fog state (4BC0) */
332 struct radeon_state_atom fogc; /* fog color (4BC8) */
333 struct radeon_state_atom at; /* alpha test (4BD4) */
334 struct radeon_state_atom fg_depth_src; /* (4BD8) */
335 struct radeon_state_atom fpp; /* 0x4C00 and following */
336 struct radeon_state_atom rb3d_cctl; /* (4E00) */
337 struct radeon_state_atom bld; /* blending (4E04) */
338 struct radeon_state_atom cmk; /* colormask (4E0C) */
339 struct radeon_state_atom blend_color; /* constant blend color */
340 struct radeon_state_atom rop; /* ropcntl */
341 struct radeon_state_atom cb; /* colorbuffer (4E28) */
342 struct radeon_state_atom rb3d_dither_ctl; /* (4E50) */
343 struct radeon_state_atom rb3d_aaresolve_ctl; /* (4E88) */
344 struct radeon_state_atom rb3d_discard_src_pixel_lte_threshold; /* (4E88) I saw it only written on RV350 hardware.. */
345 struct radeon_state_atom zs; /* zstencil control (4F00) */
346 struct radeon_state_atom zstencil_format;
347 struct radeon_state_atom zb; /* z buffer (4F20) */
348 struct radeon_state_atom zb_depthclearvalue; /* (4F28) */
349 struct radeon_state_atom zb_zmask; /* (4F30) */
350 struct radeon_state_atom zb_hiz_offset; /* (4F44) */
351 struct radeon_state_atom zb_hiz_pitch; /* (4F54) */
352
353 struct radeon_state_atom vap_flush;
354 struct radeon_state_atom vpi; /* vp instructions */
355 struct radeon_state_atom vpp; /* vp parameters */
356 struct radeon_state_atom vps; /* vertex point size (?) */
357 struct radeon_state_atom vpucp[6]; /* vp user clip plane - 6 */
358 /* 8 texture units */
359 /* the state is grouped by function and not by
360 texture unit. This makes single unit updates
361 really awkward - we are much better off
362 updating the whole thing at once */
363 struct {
364 struct radeon_state_atom filter;
365 struct radeon_state_atom filter_1;
366 struct radeon_state_atom size;
367 struct radeon_state_atom format;
368 struct radeon_state_atom pitch;
369 struct radeon_state_atom offset;
370 struct radeon_state_atom chroma_key;
371 struct radeon_state_atom border_color;
372 } tex;
373 struct radeon_state_atom txe; /* tex enable (4104) */
374 radeonTexObj *textures[R300_MAX_TEXTURE_UNITS];
375 };
376
377 /**
378 * State cache
379 */
380
381 /* Vertex shader state */
382
383 #define COLOR_IS_RGBA
384 #define TAG(x) r300##x
385 #include "tnl_dd/t_dd_vertex.h"
386 #undef TAG
387
388 struct r300_vertex_program_key {
389 GLbitfield FpReads;
390 GLuint FogAttr;
391 GLuint WPosAttr;
392 };
393
394 struct r300_vertex_program {
395 struct gl_vertex_program *Base;
396 struct r300_vertex_program *next;
397
398 struct r300_vertex_program_key key;
399 struct r300_vertex_program_code code;
400
401 GLboolean error;
402 };
403
404 struct r300_vertex_program_cont {
405 /* This is the unmodified vertex program mesa provided us with.
406 * We need to keep it unchanged because we may need to create another
407 * hw specific vertex program based on this.
408 */
409 struct gl_vertex_program mesa_program;
410 /* This is the list of hw specific vertex programs derived from mesa_program */
411 struct r300_vertex_program *progs;
412 };
413
414
415 /**
416 * Store everything about a fragment program that is needed
417 * to render with that program.
418 */
419 struct r300_fragment_program {
420 GLboolean error;
421 struct r300_fragment_program *next;
422 struct r300_fragment_program_external_state state;
423
424 struct rX00_fragment_program_code code;
425 GLbitfield InputsRead;
426
427 /* attribute that we are sending the WPOS in */
428 gl_frag_attrib wpos_attr;
429 /* attribute that we are sending the fog coordinate in */
430 gl_frag_attrib fog_attr;
431 };
432
433 struct r300_fragment_program_cont {
434 /* This is the unmodified fragment program mesa provided us with.
435 * We need to keep it unchanged because we may need to create another
436 * hw specific fragment program based on this.
437 */
438 struct gl_fragment_program Base;
439 /* This is the list of hw specific fragment programs derived from Base */
440 struct r300_fragment_program *progs;
441 };
442
443
444 #define R300_MAX_AOS_ARRAYS 16
445
446
447 /* r300_swtcl.c
448 */
449 struct r300_swtcl_info {
450 /*
451 * Offset of the 4UB color data within a hardware (swtcl) vertex.
452 */
453 GLuint coloroffset;
454
455 /**
456 * Offset of the 3UB specular color data within a hardware (swtcl) vertex.
457 */
458 GLuint specoffset;
459 };
460
461 struct r300_vtable {
462 void (* SetupRSUnit)(GLcontext *ctx);
463 void (* SetupFragmentShaderTextures)(GLcontext *ctx, int *tmu_mappings);
464 void (* SetupPixelShader)(GLcontext *ctx);
465 };
466
467 struct r300_vertex_buffer {
468 struct vertex_attribute {
469 /* generic */
470 GLubyte element;
471 GLuint stride;
472 GLuint dwords;
473 GLubyte size; /* number of components */
474 GLboolean is_named_bo;
475 struct radeon_bo *bo;
476 GLint bo_offset;
477
478 /* hw specific */
479 uint32_t data_type:4;
480 uint32_t dst_loc:5;
481 uint32_t _signed:1;
482 uint32_t normalize:1;
483 uint32_t swizzle:12;
484 uint32_t write_mask:4;
485 } attribs[VERT_ATTRIB_MAX];
486
487 GLubyte num_attribs;
488 };
489
490 struct r300_index_buffer {
491 struct radeon_bo *bo;
492 int bo_offset;
493
494 GLboolean is_32bit;
495 GLuint count;
496 };
497
498
499 /**
500 * \brief R300 context structure.
501 */
502 struct r300_context {
503 struct radeon_context radeon; /* parent class, must be first */
504
505 struct r300_vtable vtbl;
506
507 struct r300_hw_state hw;
508
509 struct r300_vertex_program *selected_vp;
510 struct r300_fragment_program *selected_fp;
511
512 /* Vertex buffers
513 */
514 GLvector4f dummy_attrib[_TNL_ATTRIB_MAX];
515 GLvector4f *temp_attrib[_TNL_ATTRIB_MAX];
516
517 struct r300_options {
518 uint32_t conformance_mode:1;
519 uint32_t hw_tcl_enabled:1;
520 uint32_t s3tc_force_enabled:1;
521 uint32_t s3tc_force_disabled:1;
522 uint32_t stencil_two_side_disabled:1;
523 } options;
524
525 struct r300_swtcl_info swtcl;
526 struct r300_vertex_buffer vbuf;
527 struct r300_index_buffer ind_buf;
528
529 uint32_t fallback;
530
531 DECLARE_RENDERINPUTS(render_inputs_bitset);
532 int num_z_pipes;
533 };
534
535 #define R300_CONTEXT(ctx) ((r300ContextPtr)(ctx->DriverCtx))
536
537 extern void r300DestroyContext(__DRIcontextPrivate * driContextPriv);
538 extern GLboolean r300CreateContext(const __GLcontextModes * glVisual,
539 __DRIcontextPrivate * driContextPriv,
540 void *sharedContextPrivate);
541
542 extern void r300InitShaderFuncs(struct dd_function_table *functions);
543
544 extern void r300InitShaderFunctions(r300ContextPtr r300);
545
546 extern void r300InitDraw(GLcontext *ctx);
547
548 #define r300PackFloat32 radeonPackFloat32
549 #define r300PackFloat24 radeonPackFloat24
550
551 #endif /* __R300_CONTEXT_H__ */