Looks like masking masking t->filter isnt needed anymore.
[mesa.git] / src / mesa / drivers / dri / r300 / r300_state.c
1 /*
2 Copyright (C) The Weather Channel, Inc. 2002.
3 Copyright (C) 2004 Nicolai Haehnle.
4 All Rights Reserved.
5
6 The Weather Channel (TM) funded Tungsten Graphics to develop the
7 initial release of the Radeon 8500 driver under the XFree86 license.
8 This notice must be preserved.
9
10 Permission is hereby granted, free of charge, to any person obtaining
11 a copy of this software and associated documentation files (the
12 "Software"), to deal in the Software without restriction, including
13 without limitation the rights to use, copy, modify, merge, publish,
14 distribute, sublicense, and/or sell copies of the Software, and to
15 permit persons to whom the Software is furnished to do so, subject to
16 the following conditions:
17
18 The above copyright notice and this permission notice (including the
19 next paragraph) shall be included in all copies or substantial
20 portions of the Software.
21
22 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
23 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
24 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
25 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
26 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
27 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
28 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
29
30 **************************************************************************/
31
32 /*
33 * Authors:
34 * Nicolai Haehnle <prefect_@gmx.net>
35 */
36
37 #include "glheader.h"
38 #include "state.h"
39 #include "imports.h"
40 #include "enums.h"
41 #include "macros.h"
42 #include "context.h"
43 #include "dd.h"
44 #include "simple_list.h"
45
46 #include "api_arrayelt.h"
47 #include "swrast/swrast.h"
48 #include "swrast_setup/swrast_setup.h"
49 #include "array_cache/acache.h"
50 #include "tnl/tnl.h"
51 #include "texformat.h"
52
53 #include "radeon_ioctl.h"
54 #include "radeon_state.h"
55 #include "r300_context.h"
56 #include "r300_ioctl.h"
57 #include "r300_state.h"
58 #include "r300_reg.h"
59 #include "r300_program.h"
60 #include "r300_emit.h"
61 #include "r300_fixed_pipelines.h"
62
63 static void r300AlphaFunc(GLcontext * ctx, GLenum func, GLfloat ref)
64 {
65 r300ContextPtr rmesa = R300_CONTEXT(ctx);
66 int pp_misc = rmesa->hw.at.cmd[R300_AT_ALPHA_TEST];
67 GLubyte refByte;
68
69 CLAMPED_FLOAT_TO_UBYTE(refByte, ref);
70
71 R300_STATECHANGE(rmesa, at);
72
73 pp_misc &= ~(R300_ALPHA_TEST_OP_MASK | R300_REF_ALPHA_MASK);
74 pp_misc |= (refByte & R300_REF_ALPHA_MASK);
75
76 switch (func) {
77 case GL_NEVER:
78 pp_misc |= R300_ALPHA_TEST_FAIL;
79 break;
80 case GL_LESS:
81 pp_misc |= R300_ALPHA_TEST_LESS;
82 break;
83 case GL_EQUAL:
84 pp_misc |= R300_ALPHA_TEST_EQUAL;
85 break;
86 case GL_LEQUAL:
87 pp_misc |= R300_ALPHA_TEST_LEQUAL;
88 break;
89 case GL_GREATER:
90 pp_misc |= R300_ALPHA_TEST_GREATER;
91 break;
92 case GL_NOTEQUAL:
93 pp_misc |= R300_ALPHA_TEST_NEQUAL;
94 break;
95 case GL_GEQUAL:
96 pp_misc |= R300_ALPHA_TEST_GEQUAL;
97 break;
98 case GL_ALWAYS:
99 pp_misc |= R300_ALPHA_TEST_PASS;
100 break;
101 }
102
103 rmesa->hw.at.cmd[R300_AT_ALPHA_TEST] = pp_misc;
104 }
105
106 static void r300BlendColor(GLcontext * ctx, const GLfloat cf[4])
107 {
108 GLubyte color[4];
109 r300ContextPtr rmesa = R300_CONTEXT(ctx);
110 fprintf(stderr, "%s:%s is not implemented yet. Fixme !\n", __FILE__, __FUNCTION__);
111 #if 0
112 R200_STATECHANGE(rmesa, ctx);
113 CLAMPED_FLOAT_TO_UBYTE(color[0], cf[0]);
114 CLAMPED_FLOAT_TO_UBYTE(color[1], cf[1]);
115 CLAMPED_FLOAT_TO_UBYTE(color[2], cf[2]);
116 CLAMPED_FLOAT_TO_UBYTE(color[3], cf[3]);
117 if (rmesa->radeon.radeonScreen->drmSupportsBlendColor)
118 rmesa->hw.ctx.cmd[CTX_RB3D_BLENDCOLOR] =
119 radeonPackColor(4, color[0], color[1], color[2], color[3]);
120 #endif
121 }
122
123 /**
124 * Calculate the hardware blend factor setting. This same function is used
125 * for source and destination of both alpha and RGB.
126 *
127 * \returns
128 * The hardware register value for the specified blend factor. This value
129 * will need to be shifted into the correct position for either source or
130 * destination factor.
131 *
132 * \todo
133 * Since the two cases where source and destination are handled differently
134 * are essentially error cases, they should never happen. Determine if these
135 * cases can be removed.
136 */
137 static int blend_factor(GLenum factor, GLboolean is_src)
138 {
139 int func;
140
141 switch (factor) {
142 case GL_ZERO:
143 func = R200_BLEND_GL_ZERO;
144 break;
145 case GL_ONE:
146 func = R200_BLEND_GL_ONE;
147 break;
148 case GL_DST_COLOR:
149 func = R200_BLEND_GL_DST_COLOR;
150 break;
151 case GL_ONE_MINUS_DST_COLOR:
152 func = R200_BLEND_GL_ONE_MINUS_DST_COLOR;
153 break;
154 case GL_SRC_COLOR:
155 func = R200_BLEND_GL_SRC_COLOR;
156 break;
157 case GL_ONE_MINUS_SRC_COLOR:
158 func = R200_BLEND_GL_ONE_MINUS_SRC_COLOR;
159 break;
160 case GL_SRC_ALPHA:
161 func = R200_BLEND_GL_SRC_ALPHA;
162 break;
163 case GL_ONE_MINUS_SRC_ALPHA:
164 func = R200_BLEND_GL_ONE_MINUS_SRC_ALPHA;
165 break;
166 case GL_DST_ALPHA:
167 func = R200_BLEND_GL_DST_ALPHA;
168 break;
169 case GL_ONE_MINUS_DST_ALPHA:
170 func = R200_BLEND_GL_ONE_MINUS_DST_ALPHA;
171 break;
172 case GL_SRC_ALPHA_SATURATE:
173 func =
174 (is_src) ? R200_BLEND_GL_SRC_ALPHA_SATURATE :
175 R200_BLEND_GL_ZERO;
176 break;
177 case GL_CONSTANT_COLOR:
178 func = R200_BLEND_GL_CONST_COLOR;
179 break;
180 case GL_ONE_MINUS_CONSTANT_COLOR:
181 func = R200_BLEND_GL_ONE_MINUS_CONST_COLOR;
182 break;
183 case GL_CONSTANT_ALPHA:
184 func = R200_BLEND_GL_CONST_ALPHA;
185 break;
186 case GL_ONE_MINUS_CONSTANT_ALPHA:
187 func = R200_BLEND_GL_ONE_MINUS_CONST_ALPHA;
188 break;
189 default:
190 func = (is_src) ? R200_BLEND_GL_ONE : R200_BLEND_GL_ZERO;
191 }
192 return func;
193 }
194
195 /**
196 * Sets both the blend equation and the blend function.
197 * This is done in a single
198 * function because some blend equations (i.e., \c GL_MIN and \c GL_MAX)
199 * change the interpretation of the blend function.
200 * Also, make sure that blend function and blend equation are set to their default
201 * value if color blending is not enabled, since at least blend equations GL_MIN
202 * and GL_FUNC_REVERSE_SUBTRACT will cause wrong results otherwise for
203 * unknown reasons.
204 */
205
206 /* helper function */
207 static void r300_set_blend_cntl(r300ContextPtr rmesa, int func, int eqn, int cbits, int funcA, int eqnA)
208 {
209 GLuint new_ablend, new_cblend;
210
211 new_ablend = eqnA | funcA;
212 new_cblend = eqn | func | cbits;
213 if(rmesa->hw.bld.cmd[R300_BLD_ABLEND] == rmesa->hw.bld.cmd[R300_BLD_CBLEND]){
214 new_cblend |= R300_BLEND_NO_SEPARATE;
215 }
216 if((new_ablend != rmesa->hw.bld.cmd[R300_BLD_ABLEND])
217 || (new_cblend != rmesa->hw.bld.cmd[R300_BLD_CBLEND])){
218 R300_STATECHANGE(rmesa, bld);
219 rmesa->hw.bld.cmd[R300_BLD_ABLEND]=new_ablend;
220 rmesa->hw.bld.cmd[R300_BLD_CBLEND]=new_cblend;
221 }
222 }
223
224 static void r300_set_blend_state(GLcontext * ctx)
225 {
226 r300ContextPtr rmesa = R300_CONTEXT(ctx);
227 #if 0
228 GLuint cntl = rmesa->hw.ctx.cmd[CTX_RB3D_CNTL] &
229 ~(R300_ROP_ENABLE | R300_ALPHA_BLEND_ENABLE |
230 R300_SEPARATE_ALPHA_ENABLE);
231 #endif
232
233 int func = (R200_BLEND_GL_ONE << R200_SRC_BLEND_SHIFT) |
234 (R200_BLEND_GL_ZERO << R200_DST_BLEND_SHIFT);
235 int eqn = R200_COMB_FCN_ADD_CLAMP;
236 int funcA = (R200_BLEND_GL_ONE << R200_SRC_BLEND_SHIFT) |
237 (R200_BLEND_GL_ZERO << R200_DST_BLEND_SHIFT);
238 int eqnA = R200_COMB_FCN_ADD_CLAMP;
239
240
241 if (rmesa->radeon.radeonScreen->drmSupportsBlendColor) {
242 if (ctx->Color._LogicOpEnabled) {
243 #if 0
244 rmesa->hw.ctx.cmd[CTX_RB3D_CNTL] =
245 cntl | R300_ROP_ENABLE;
246 #endif
247 r300_set_blend_cntl(rmesa,
248 func, eqn, 0,
249 func, eqn);
250 return;
251 } else if (ctx->Color.BlendEnabled) {
252 #if 0
253 rmesa->hw.ctx.cmd[CTX_RB3D_CNTL] =
254 cntl | R300_ALPHA_BLEND_ENABLE |
255 R300_SEPARATE_ALPHA_ENABLE;
256 #endif
257 } else {
258 #if 0
259 rmesa->hw.ctx.cmd[CTX_RB3D_CNTL] = cntl;
260 #endif
261 r300_set_blend_cntl(rmesa,
262 func, eqn, 0,
263 func, eqn);
264 return;
265 }
266 } else {
267 if (ctx->Color._LogicOpEnabled) {
268 #if 0
269 rmesa->hw.ctx.cmd[CTX_RB3D_CNTL] =
270 cntl | R300_ROP_ENABLE;
271 rmesa->hw.ctx.cmd[CTX_RB3D_BLENDCNTL] = eqn | func;
272 #endif
273 return;
274 } else if (ctx->Color.BlendEnabled) {
275 #if 0
276 rmesa->hw.ctx.cmd[CTX_RB3D_CNTL] =
277 cntl | R300_ALPHA_BLEND_ENABLE;
278 #endif
279 } else {
280 #if 0
281 rmesa->hw.ctx.cmd[CTX_RB3D_CNTL] = cntl;
282 rmesa->hw.ctx.cmd[CTX_RB3D_BLENDCNTL] = eqn | func;
283 #endif
284 r300_set_blend_cntl(rmesa,
285 func, eqn, 0,
286 func, eqn);
287 return;
288 }
289 }
290
291 func =
292 (blend_factor(ctx->Color.BlendSrcRGB, GL_TRUE) <<
293 R200_SRC_BLEND_SHIFT) | (blend_factor(ctx->Color.BlendDstRGB,
294 GL_FALSE) <<
295 R200_DST_BLEND_SHIFT);
296
297 switch (ctx->Color.BlendEquationRGB) {
298 case GL_FUNC_ADD:
299 eqn = R300_COMB_FCN_ADD_CLAMP;
300 break;
301
302 case GL_FUNC_SUBTRACT:
303 eqn = R300_COMB_FCN_SUB_CLAMP;
304 break;
305
306 case GL_FUNC_REVERSE_SUBTRACT:
307 eqn = R200_COMB_FCN_RSUB_CLAMP;
308 break;
309
310 case GL_MIN:
311 eqn = R200_COMB_FCN_MIN;
312 func = (R200_BLEND_GL_ONE << R200_SRC_BLEND_SHIFT) |
313 (R200_BLEND_GL_ONE << R200_DST_BLEND_SHIFT);
314 break;
315
316 case GL_MAX:
317 eqn = R200_COMB_FCN_MAX;
318 func = (R200_BLEND_GL_ONE << R200_SRC_BLEND_SHIFT) |
319 (R200_BLEND_GL_ONE << R200_DST_BLEND_SHIFT);
320 break;
321
322 default:
323 fprintf(stderr,
324 "[%s:%u] Invalid RGB blend equation (0x%04x).\n",
325 __func__, __LINE__, ctx->Color.BlendEquationRGB);
326 return;
327 }
328
329 if (!rmesa->radeon.radeonScreen->drmSupportsBlendColor) {
330 #if 0
331 rmesa->hw.ctx.cmd[CTX_RB3D_BLENDCNTL] = eqn | func;
332 #endif
333 return;
334 }
335
336 funcA =
337 (blend_factor(ctx->Color.BlendSrcA, GL_TRUE) <<
338 R200_SRC_BLEND_SHIFT) | (blend_factor(ctx->Color.BlendDstA,
339 GL_FALSE) <<
340 R200_DST_BLEND_SHIFT);
341
342 switch (ctx->Color.BlendEquationA) {
343 case GL_FUNC_ADD:
344 eqnA = R300_COMB_FCN_ADD_CLAMP;
345 break;
346
347 case GL_FUNC_SUBTRACT:
348 eqnA = R300_COMB_FCN_SUB_CLAMP;
349 break;
350
351 case GL_FUNC_REVERSE_SUBTRACT:
352 eqnA = R200_COMB_FCN_RSUB_CLAMP;
353 break;
354
355 case GL_MIN:
356 eqnA = R200_COMB_FCN_MIN;
357 funcA = (R200_BLEND_GL_ONE << R200_SRC_BLEND_SHIFT) |
358 (R200_BLEND_GL_ONE << R200_DST_BLEND_SHIFT);
359 break;
360
361 case GL_MAX:
362 eqnA = R200_COMB_FCN_MAX;
363 funcA = (R200_BLEND_GL_ONE << R200_SRC_BLEND_SHIFT) |
364 (R200_BLEND_GL_ONE << R200_DST_BLEND_SHIFT);
365 break;
366
367 default:
368 fprintf(stderr, "[%s:%u] Invalid A blend equation (0x%04x).\n",
369 __func__, __LINE__, ctx->Color.BlendEquationA);
370 return;
371 }
372
373 r300_set_blend_cntl(rmesa,
374 func, eqn, R300_BLEND_UNKNOWN | R300_BLEND_ENABLE,
375 funcA, eqnA);
376 r300_set_blend_cntl(rmesa,
377 func, eqn, R300_BLEND_UNKNOWN | R300_BLEND_ENABLE,
378 funcA, eqnA);
379 }
380
381 static void r300BlendEquationSeparate(GLcontext * ctx,
382 GLenum modeRGB, GLenum modeA)
383 {
384 r300_set_blend_state(ctx);
385 }
386
387 static void r300BlendFuncSeparate(GLcontext * ctx,
388 GLenum sfactorRGB, GLenum dfactorRGB,
389 GLenum sfactorA, GLenum dfactorA)
390 {
391 r300_set_blend_state(ctx);
392 }
393
394 /**
395 * Update our tracked culling state based on Mesa's state.
396 */
397 static void r300UpdateCulling(GLcontext* ctx)
398 {
399 r300ContextPtr r300 = R300_CONTEXT(ctx);
400 uint32_t val = 0;
401
402 R300_STATECHANGE(r300, cul);
403 if (ctx->Polygon.CullFlag) {
404 if (ctx->Polygon.CullFaceMode == GL_FRONT_AND_BACK)
405 val = R300_CULL_FRONT|R300_CULL_BACK;
406 else if (ctx->Polygon.CullFaceMode == GL_FRONT)
407 val = R300_CULL_FRONT;
408 else
409 val = R300_CULL_BACK;
410
411 if (ctx->Polygon.FrontFace == GL_CW)
412 val |= R300_FRONT_FACE_CW;
413 else
414 val |= R300_FRONT_FACE_CCW;
415 }
416
417 r300->hw.cul.cmd[R300_CUL_CULL] = val;
418 }
419
420
421 /**
422 * Handle glEnable()/glDisable().
423 *
424 * \note Mesa already filters redundant calls to glEnable/glDisable.
425 */
426 static void r300Enable(GLcontext* ctx, GLenum cap, GLboolean state)
427 {
428 r300ContextPtr r300 = R300_CONTEXT(ctx);
429 uint32_t newval;
430
431 if (RADEON_DEBUG & DEBUG_STATE)
432 fprintf(stderr, "%s( %s = %s )\n", __FUNCTION__,
433 _mesa_lookup_enum_by_nr(cap),
434 state ? "GL_TRUE" : "GL_FALSE");
435
436 switch (cap) {
437 /* Fast track this one...
438 */
439 case GL_TEXTURE_1D:
440 case GL_TEXTURE_2D:
441 case GL_TEXTURE_3D:
442 break;
443
444 case GL_ALPHA_TEST:
445 R200_STATECHANGE(r300, at);
446 if (state) {
447 r300->hw.at.cmd[R300_AT_ALPHA_TEST] |=
448 R300_ALPHA_TEST_ENABLE;
449 } else {
450 r300->hw.at.cmd[R300_AT_ALPHA_TEST] |=
451 ~R300_ALPHA_TEST_ENABLE;
452 }
453 break;
454
455 case GL_BLEND:
456 case GL_COLOR_LOGIC_OP:
457 r300_set_blend_state(ctx);
458 break;
459
460 case GL_DEPTH_TEST:
461 R300_STATECHANGE(r300, zs);
462
463 if (state) {
464 if (ctx->Depth.Mask)
465 newval = R300_RB3D_Z_TEST_AND_WRITE;
466 else
467 newval = R300_RB3D_Z_TEST;
468 } else
469 newval = 0;
470
471 r300->hw.zs.cmd[R300_ZS_CNTL_0] = newval;
472 break;
473
474 case GL_STENCIL_TEST:
475 if (r300->state.hw_stencil) {
476 R300_STATECHANGE(r300, zs);
477 if (state) {
478 r300->hw.zs.cmd[R300_ZS_CNTL_0] |=
479 R300_STENCIL_ENABLE;
480 } else {
481 r300->hw.zs.cmd[R300_ZS_CNTL_0] &=
482 ~R300_STENCIL_ENABLE;
483 }
484 } else {
485 FALLBACK(&r300->radeon, RADEON_FALLBACK_STENCIL, state);
486 }
487 break;
488
489 case GL_CULL_FACE:
490 r300UpdateCulling(ctx);
491 break;
492
493 default:
494 radeonEnable(ctx, cap, state);
495 return;
496 }
497 }
498
499
500 /**
501 * Change the culling mode.
502 *
503 * \note Mesa already filters redundant calls to this function.
504 */
505 static void r300CullFace(GLcontext* ctx, GLenum mode)
506 {
507 (void)mode;
508
509 r300UpdateCulling(ctx);
510 }
511
512
513 /**
514 * Change the polygon orientation.
515 *
516 * \note Mesa already filters redundant calls to this function.
517 */
518 static void r300FrontFace(GLcontext* ctx, GLenum mode)
519 {
520 (void)mode;
521
522 r300UpdateCulling(ctx);
523 }
524
525
526 /**
527 * Change the depth testing function.
528 *
529 * \note Mesa already filters redundant calls to this function.
530 */
531 static void r300DepthFunc(GLcontext* ctx, GLenum func)
532 {
533 r300ContextPtr r300 = R300_CONTEXT(ctx);
534
535 R300_STATECHANGE(r300, zs);
536
537 r300->hw.zs.cmd[R300_ZS_CNTL_1] &= ~(R300_ZS_MASK << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT);
538
539 switch(func) {
540 case GL_NEVER:
541 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_NEVER << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
542 break;
543 case GL_LESS:
544 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_LESS << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
545 break;
546 case GL_EQUAL:
547 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_EQUAL << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
548 break;
549 case GL_LEQUAL:
550 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_LEQUAL << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
551 break;
552 case GL_GREATER:
553 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_GREATER << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
554 break;
555 case GL_NOTEQUAL:
556 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_NOTEQUAL << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
557 break;
558 case GL_GEQUAL:
559 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_GEQUAL << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
560 break;
561 case GL_ALWAYS:
562 r300->hw.zs.cmd[R300_ZS_CNTL_1] |= R300_ZS_ALWAYS << R300_RB3D_ZS1_DEPTH_FUNC_SHIFT;
563 break;
564 }
565
566 }
567
568
569 /**
570 * Enable/Disable depth writing.
571 *
572 * \note Mesa already filters redundant calls to this function.
573 */
574 static void r300DepthMask(GLcontext* ctx, GLboolean mask)
575 {
576 r300ContextPtr r300 = R300_CONTEXT(ctx);
577
578 if (!ctx->Depth.Test)
579 return;
580
581 R300_STATECHANGE(r300, zs);
582 r300->hw.zs.cmd[R300_ZS_CNTL_0] = mask
583 ? R300_RB3D_Z_TEST_AND_WRITE : R300_RB3D_Z_TEST;
584 }
585
586
587 /**
588 * Handle glColorMask()
589 */
590 static void r300ColorMask(GLcontext* ctx,
591 GLboolean r, GLboolean g, GLboolean b, GLboolean a)
592 {
593 r300ContextPtr r300 = R300_CONTEXT(ctx);
594 int mask = (b << 0) | (g << 1) | (r << 2) | (a << 3);
595
596 if (mask != r300->hw.cmk.cmd[R300_CMK_COLORMASK]) {
597 R300_STATECHANGE(r300, cmk);
598 r300->hw.cmk.cmd[R300_CMK_COLORMASK] = mask;
599 }
600 }
601
602 /* =============================================================
603 * Point state
604 */
605 static void r300PointSize(GLcontext * ctx, GLfloat size)
606 {
607 r300ContextPtr r300 = R300_CONTEXT(ctx);
608
609 /* This might need fixing later */
610 R300_STATECHANGE(r300, vps);
611 r300->hw.vps.cmd[R300_VPS_POINTSIZE] = r300PackFloat32(1.0);
612 }
613 /* =============================================================
614 * Stencil
615 */
616
617 static void r300StencilFunc(GLcontext * ctx, GLenum func,
618 GLint ref, GLuint mask)
619 {
620 r300ContextPtr rmesa = R300_CONTEXT(ctx);
621 GLuint refmask = ((ctx->Stencil.Ref[0] << R300_RB3D_ZS2_STENCIL_REF_SHIFT) |
622 (ctx->Stencil.
623 ValueMask[0] << R300_RB3D_ZS2_STENCIL_MASK_SHIFT));
624
625 R200_STATECHANGE(rmesa, zs);
626
627 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] &= ~(R300_ZS_MASK << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT);
628 rmesa->hw.zs.cmd[R300_ZS_CNTL_2] &= ~((R300_ZS_MASK << R300_RB3D_ZS2_STENCIL_REF_SHIFT) |
629 (R300_ZS_MASK << R300_RB3D_ZS2_STENCIL_MASK_SHIFT));
630
631 switch (ctx->Stencil.Function[0]) {
632 case GL_NEVER:
633 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
634 R300_ZS_NEVER << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
635 break;
636 case GL_LESS:
637 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
638 R300_ZS_LESS << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
639 break;
640 case GL_EQUAL:
641 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
642 R300_ZS_EQUAL << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
643 break;
644 case GL_LEQUAL:
645 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
646 R300_ZS_LEQUAL << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
647 break;
648 case GL_GREATER:
649 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
650 R300_ZS_GREATER << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
651 break;
652 case GL_NOTEQUAL:
653 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
654 R300_ZS_NOTEQUAL << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
655 break;
656 case GL_GEQUAL:
657 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
658 R300_ZS_GEQUAL << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
659 break;
660 case GL_ALWAYS:
661 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
662 R300_ZS_ALWAYS << R300_RB3D_ZS1_STENCIL_FUNC_SHIFT;
663 break;
664 }
665
666 rmesa->hw.zs.cmd[R300_ZS_CNTL_2] |= refmask;
667 }
668
669 static void r300StencilMask(GLcontext * ctx, GLuint mask)
670 {
671 r300ContextPtr rmesa = R300_CONTEXT(ctx);
672
673 R200_STATECHANGE(rmesa, zs);
674 rmesa->hw.zs.cmd[R300_ZS_CNTL_2] &= ~(R300_ZS_MASK << R300_RB3D_ZS2_STENCIL_WRITE_MASK_SHIFT);
675 rmesa->hw.zs.cmd[R300_ZS_CNTL_2] |= ctx->Stencil.WriteMask[0] << R300_RB3D_ZS2_STENCIL_WRITE_MASK_SHIFT;
676 }
677
678 static int translate_stencil_op(int op)
679 {
680 switch (op) {
681 case GL_KEEP:
682 return R300_ZS_KEEP;
683 case GL_ZERO:
684 return R300_ZS_ZERO;
685 case GL_REPLACE:
686 return R300_ZS_REPLACE;
687 case GL_INCR:
688 return R300_ZS_INCR;
689 case GL_DECR:
690 return R300_ZS_DECR;
691 case GL_INCR_WRAP_EXT:
692 return R300_ZS_INCR_WRAP;
693 case GL_DECR_WRAP_EXT:
694 return R300_ZS_DECR_WRAP;
695 case GL_INVERT:
696 return R300_ZS_INVERT;
697 }
698 }
699
700 static void r300StencilOp(GLcontext * ctx, GLenum fail,
701 GLenum zfail, GLenum zpass)
702 {
703 r300ContextPtr rmesa = R300_CONTEXT(ctx);
704
705 R200_STATECHANGE(rmesa, zs);
706 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] &= ~((R300_ZS_MASK << R300_RB3D_ZS1_STENCIL_FAIL_OP_SHIFT)
707 | (R300_ZS_MASK << R300_RB3D_ZS1_STENCIL_ZPASS_OP_SHIFT)
708 | (R300_ZS_MASK << R300_RB3D_ZS1_STENCIL_ZFAIL_OP_SHIFT)
709 );
710
711 rmesa->hw.zs.cmd[R300_ZS_CNTL_1] |=
712 (translate_stencil_op(ctx->Stencil.FailFunc[0]) << R300_RB3D_ZS1_STENCIL_FAIL_OP_SHIFT)
713 |(translate_stencil_op(ctx->Stencil.ZFailFunc[0]) << R300_RB3D_ZS1_STENCIL_ZFAIL_OP_SHIFT)
714 |(translate_stencil_op(ctx->Stencil.ZPassFunc[0]) << R300_RB3D_ZS1_STENCIL_ZPASS_OP_SHIFT);
715
716 }
717
718 static void r300ClearStencil(GLcontext * ctx, GLint s)
719 {
720 r300ContextPtr rmesa = R300_CONTEXT(ctx);
721
722 /* Not sure whether this is correct.. */
723 R200_STATECHANGE(rmesa, zs);
724 rmesa->hw.zs.cmd[R300_ZS_CNTL_2] =
725 ((GLuint) ctx->Stencil.Clear |
726 (0xff << R200_STENCIL_MASK_SHIFT) |
727 (ctx->Stencil.WriteMask[0] << R200_STENCIL_WRITEMASK_SHIFT));
728 }
729
730 /* =============================================================
731 * Window position and viewport transformation
732 */
733
734 /*
735 * To correctly position primitives:
736 */
737 #define SUBPIXEL_X 0.125
738 #define SUBPIXEL_Y 0.125
739
740 void r300UpdateWindow(GLcontext * ctx)
741 {
742 r300ContextPtr rmesa = R300_CONTEXT(ctx);
743 __DRIdrawablePrivate *dPriv = rmesa->radeon.dri.drawable;
744 GLfloat xoffset = dPriv ? (GLfloat) dPriv->x : 0;
745 GLfloat yoffset = dPriv ? (GLfloat) dPriv->y + dPriv->h : 0;
746 const GLfloat *v = ctx->Viewport._WindowMap.m;
747
748 GLfloat sx = v[MAT_SX];
749 GLfloat tx = v[MAT_TX] + xoffset + SUBPIXEL_X;
750 GLfloat sy = -v[MAT_SY];
751 GLfloat ty = (-v[MAT_TY]) + yoffset + SUBPIXEL_Y;
752 GLfloat sz = v[MAT_SZ] * rmesa->state.depth.scale;
753 GLfloat tz = v[MAT_TZ] * rmesa->state.depth.scale;
754
755 R300_FIREVERTICES(rmesa);
756 R300_STATECHANGE(rmesa, vpt);
757
758 rmesa->hw.vpt.cmd[R300_VPT_XSCALE] = r300PackFloat32(sx);
759 rmesa->hw.vpt.cmd[R300_VPT_XOFFSET] = r300PackFloat32(tx);
760 rmesa->hw.vpt.cmd[R300_VPT_YSCALE] = r300PackFloat32(sy);
761 rmesa->hw.vpt.cmd[R300_VPT_YOFFSET] = r300PackFloat32(ty);
762 rmesa->hw.vpt.cmd[R300_VPT_ZSCALE] = r300PackFloat32(sz);
763 rmesa->hw.vpt.cmd[R300_VPT_ZOFFSET] = r300PackFloat32(tz);
764 }
765
766 static void r300Viewport(GLcontext * ctx, GLint x, GLint y,
767 GLsizei width, GLsizei height)
768 {
769 /* Don't pipeline viewport changes, conflict with window offset
770 * setting below. Could apply deltas to rescue pipelined viewport
771 * values, or keep the originals hanging around.
772 */
773 R200_FIREVERTICES(R200_CONTEXT(ctx));
774 r300UpdateWindow(ctx);
775 }
776
777 static void r300DepthRange(GLcontext * ctx, GLclampd nearval, GLclampd farval)
778 {
779 r300UpdateWindow(ctx);
780 }
781
782 /* Routing and texture-related */
783
784 void r300_setup_routing(GLcontext *ctx, GLboolean immediate)
785 {
786 int i, count=0,reg=0;
787 GLuint dw, mask;
788 TNLcontext *tnl = TNL_CONTEXT(ctx);
789 struct vertex_buffer *VB = &tnl->vb;
790 r300ContextPtr r300 = R300_CONTEXT(ctx);
791
792
793 /* Stage 1 - input to VAP */
794
795 /* Assign register number automatically, retaining it in rmesa->state.reg */
796
797 /* Note: immediate vertex data includes all coordinates.
798 To save bandwidth use either VBUF or state-based vertex generation */
799
800 #define CONFIGURE_AOS(v, o, r, f) \
801 {\
802 if(immediate){ \
803 r300->state.aos[count].element_size=4; \
804 r300->state.aos[count].stride=4; \
805 r300->state.aos[count].ncomponents=4; \
806 } else { \
807 r300->state.aos[count].element_size=v->size; \
808 r300->state.aos[count].stride=v->size; \
809 r300->state.aos[count].ncomponents=v->size; \
810 } \
811 r300->state.aos[count].offset=o; \
812 r300->state.aos[count].reg=reg; \
813 r300->state.aos[count].format=(f); \
814 r300->state.vap_reg.r=reg; \
815 count++; \
816 reg++; \
817 }
818
819 /* All offsets are 0 - for use by immediate mode.
820 Should change later to handle vertex buffers */
821 CONFIGURE_AOS(VB->ObjPtr, 0, i_coords, AOS_FORMAT_FLOAT);
822 CONFIGURE_AOS(VB->ColorPtr[0], 0, i_color[0], AOS_FORMAT_FLOAT_COLOR);
823 for(i=0;i < ctx->Const.MaxTextureUnits;i++)
824 if(ctx->Texture.Unit[i].Enabled)
825 CONFIGURE_AOS(VB->TexCoordPtr[i], 0, i_tex[i], AOS_FORMAT_FLOAT);
826
827 r300->state.aos_count=count;
828
829 if (RADEON_DEBUG & DEBUG_STATE)
830 fprintf(stderr, "aos_count=%d\n", count);
831
832 if(count>R300_MAX_AOS_ARRAYS){
833 fprintf(stderr, "Aieee ! AOS array count exceeded !\n");
834 exit(-1);
835 }
836
837 /* Implement AOS */
838
839 /* setup INPUT_ROUTE */
840 R300_STATECHANGE(r300, vir[0]);
841 for(i=0;i+1<count;i+=2){
842 dw=(r300->state.aos[i].ncomponents-1)
843 | ((r300->state.aos[i].reg)<<8)
844 | (r300->state.aos[i].format<<14)
845 | (((r300->state.aos[i+1].ncomponents-1)
846 | ((r300->state.aos[i+1].reg)<<8)
847 | (r300->state.aos[i+1].format<<14))<<16);
848
849 if(i+2==count){
850 dw|=(1<<(13+16));
851 }
852 r300->hw.vir[0].cmd[R300_VIR_CNTL_0+(i>>1)]=dw;
853 }
854 if(count & 1){
855 dw=(r300->state.aos[count-1].ncomponents-1)
856 | (r300->state.aos[count-1].format<<14)
857 | ((r300->state.aos[count-1].reg)<<8)
858 | (1<<13);
859 r300->hw.vir[0].cmd[R300_VIR_CNTL_0+(count>>1)]=dw;
860 //fprintf(stderr, "vir0 dw=%08x\n", dw);
861 }
862 /* Set the rest of INPUT_ROUTE_0 to 0 */
863 //for(i=((count+1)>>1); i<8; i++)r300->hw.vir[0].cmd[R300_VIR_CNTL_0+i]=(0x0);
864 ((drm_r300_cmd_header_t*)r300->hw.vir[0].cmd)->unchecked_state.count = (count+1)>>1;
865
866
867 /* Mesa assumes that all missing components are from (0, 0, 0, 1) */
868 #define ALL_COMPONENTS ((R300_INPUT_ROUTE_SELECT_X<<R300_INPUT_ROUTE_X_SHIFT) \
869 | (R300_INPUT_ROUTE_SELECT_Y<<R300_INPUT_ROUTE_Y_SHIFT) \
870 | (R300_INPUT_ROUTE_SELECT_Z<<R300_INPUT_ROUTE_Z_SHIFT) \
871 | (R300_INPUT_ROUTE_SELECT_W<<R300_INPUT_ROUTE_W_SHIFT))
872
873 #define ALL_DEFAULT ((R300_INPUT_ROUTE_SELECT_ZERO<<R300_INPUT_ROUTE_X_SHIFT) \
874 | (R300_INPUT_ROUTE_SELECT_ZERO<<R300_INPUT_ROUTE_Y_SHIFT) \
875 | (R300_INPUT_ROUTE_SELECT_ZERO<<R300_INPUT_ROUTE_Z_SHIFT) \
876 | (R300_INPUT_ROUTE_SELECT_ONE<<R300_INPUT_ROUTE_W_SHIFT))
877
878 R300_STATECHANGE(r300, vir[1]);
879
880 for(i=0;i+1<count;i+=2){
881 /* do i first.. */
882 mask=(1<<(r300->state.aos[i].ncomponents*3))-1;
883 dw=(ALL_COMPONENTS & mask)
884 | (ALL_DEFAULT & ~mask)
885 | R300_INPUT_ROUTE_ENABLE;
886
887 /* i+1 */
888 mask=(1<<(r300->state.aos[i+1].ncomponents*3))-1;
889 dw|=(
890 (ALL_COMPONENTS & mask)
891 | (ALL_DEFAULT & ~mask)
892 | R300_INPUT_ROUTE_ENABLE
893 )<<16;
894
895 r300->hw.vir[1].cmd[R300_VIR_CNTL_0+(i>>1)]=dw;
896 }
897 if(count & 1){
898 mask=(1<<(r300->state.aos[count-1].ncomponents*3))-1;
899 dw=(ALL_COMPONENTS & mask)
900 | (ALL_DEFAULT & ~mask)
901 | R300_INPUT_ROUTE_ENABLE;
902 r300->hw.vir[1].cmd[R300_VIR_CNTL_0+(count>>1)]=dw;
903 //fprintf(stderr, "vir1 dw=%08x\n", dw);
904 }
905 /* Set the rest of INPUT_ROUTE_1 to 0 */
906 //for(i=((count+1)>>1); i<8; i++)r300->hw.vir[1].cmd[R300_VIR_CNTL_0+i]=0x0;
907 ((drm_r300_cmd_header_t*)r300->hw.vir[1].cmd)->unchecked_state.count = (count+1)>>1;
908
909 /* Set up input_cntl */
910
911 R300_STATECHANGE(r300, vic);
912 r300->hw.vic.cmd[R300_VIC_CNTL_0]=0x5555; /* Hard coded value, no idea what it means */
913
914 r300->hw.vic.cmd[R300_VIC_CNTL_1]=R300_INPUT_CNTL_POS
915 | R300_INPUT_CNTL_COLOR;
916
917 for(i=0;i < ctx->Const.MaxTextureUnits;i++)
918 if(ctx->Texture.Unit[i].Enabled)
919 r300->hw.vic.cmd[R300_VIC_CNTL_1]|=(R300_INPUT_CNTL_TC0<<i);
920
921 /* Stage 3: VAP output */
922 R300_STATECHANGE(r300, vof);
923 r300->hw.vof.cmd[R300_VOF_CNTL_0]=R300_VAP_OUTPUT_VTX_FMT_0__POS_PRESENT
924 | R300_VAP_OUTPUT_VTX_FMT_0__COLOR_PRESENT;
925
926 r300->hw.vof.cmd[R300_VOF_CNTL_1]=0;
927 for(i=0;i < ctx->Const.MaxTextureUnits;i++)
928 if(ctx->Texture.Unit[i].Enabled)
929 r300->hw.vof.cmd[R300_VOF_CNTL_1]|=(4<<(3*i));
930
931 }
932
933 static r300TexObj default_tex_obj={
934 filter:R300_TX_MAG_FILTER_LINEAR | R300_TX_MIN_FILTER_LINEAR,
935 pitch: 0x8000,
936 size: (0xff << R300_TX_WIDTHMASK_SHIFT)
937 | (0xff << R300_TX_HEIGHTMASK_SHIFT)
938 | (0x8 << R300_TX_SIZE_SHIFT),
939 format: 0x88a0c,
940 offset: 0x0,
941 unknown4: 0x0,
942 unknown5: 0x0
943 };
944
945 /* there is probably a system to these value, but, for now,
946 we just try by hand */
947
948 static int inline translate_src(int src)
949 {
950 switch (src) {
951 case GL_TEXTURE:
952 return 1;
953 break;
954 case GL_CONSTANT:
955 return 2;
956 break;
957 case GL_PRIMARY_COLOR:
958 return 3;
959 break;
960 case GL_PREVIOUS:
961 return 4;
962 break;
963 case GL_ZERO:
964 return 5;
965 break;
966 case GL_ONE:
967 return 6;
968 break;
969 default:
970 return 0;
971 }
972 }
973
974 /* I think 357 and 457 are prime numbers.. wiggle them if you get coincidences */
975 #define FORMAT_HASH(opRGB, srcRGB, modeRGB, opA, srcA, modeA, format, intFormat) ( \
976 (\
977 ((opRGB)<<30) | ((opA)<<28) | \
978 ((srcRGB)<< 25) | ((srcA)<<22) | \
979 ((modeRGB)) \
980 ) \
981 ^ ((modeA)*357) \
982 ^ (((format)) *457) \
983 ^ ((intFormat) * 7) \
984 )
985
986
987 static GLuint translate_texture_format(GLcontext *ctx, GLint tex_unit, GLuint format, GLint IntFormat,
988 struct gl_texture_format *tex_format)
989 {
990 const struct gl_texture_unit *texUnit= &ctx->Texture.Unit[tex_unit];
991 int i=0; /* number of alpha args .. */
992 GLuint fmt;
993
994 #if 0
995 fprintf(stderr, "_ReallyEnabled=%d EnvMode=%s\n",
996 texUnit->_ReallyEnabled,
997 _mesa_lookup_enum_by_nr(texUnit->EnvMode));
998 #endif
999
1000 if(tex_format==NULL){
1001 fprintf(stderr, "Aeiii ! tex_format==NULL !!\n");
1002 return 0;
1003 }
1004
1005 switch(tex_format->MesaFormat){
1006 case MESA_FORMAT_RGBA8888:
1007 return R300_EASY_TX_FORMAT(Y, Z, W, X, W8Z8Y8X8);
1008 default:
1009 fprintf(stderr, "Do not know format %s\n", _mesa_lookup_enum_by_nr(tex_format->MesaFormat));
1010 return 0;
1011 }
1012
1013 switch(IntFormat){
1014 case 4:
1015 case GL_RGBA:
1016 case GL_RGBA8:
1017 break;
1018 case 3:
1019 case GL_RGB8:
1020 fmt=R300_EASY_TX_FORMAT(Y, Z, W, ONE, W8Z8Y8X8);
1021 break;
1022 default:
1023 return 0;
1024 }
1025 #if 1
1026 //fmt &= 0x00fff;
1027 //fmt |= ((format) & 0xff00)<<4;
1028 fprintf(stderr, "NumArgsRGB=%d NumArgsA=%d\n",
1029 texUnit->_CurrentCombine->_NumArgsRGB,
1030 texUnit->_CurrentCombine->_NumArgsA);
1031
1032 fprintf(stderr, "fmt=%08x\n", fmt);
1033 #endif
1034 return fmt;
1035 /* Size field in format specific first */
1036 switch(FORMAT_HASH(
1037 texUnit->_CurrentCombine->OperandRGB[i] -GL_SRC_COLOR,
1038 translate_src(texUnit->_CurrentCombine->SourceRGB[i]),
1039 texUnit->_CurrentCombine->ModeRGB,
1040 texUnit->_CurrentCombine->OperandA[i] -GL_SRC_ALPHA,
1041 translate_src(texUnit->_CurrentCombine->SourceA[i]),
1042 texUnit->_CurrentCombine->ModeA,
1043 format,
1044 IntFormat
1045 )){
1046 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x0008847, GL_RGBA):
1047 /* tested with:
1048 kfiresaver.kss
1049 */
1050 return R300_EASY_TX_FORMAT(X, X, CUT_W, W, W8Z8Y8X8);
1051 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x0008847, GL_RGBA8):
1052 /* tested with:
1053 Quake3demo
1054 */
1055 /* Quake3demo -small font on the bottom */
1056 return fmt;
1057 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x00005547, GL_RGBA8):
1058 /* Quake3demo - mouse cursor*/
1059 return fmt;
1060 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x00007747, 4):
1061 /* tested with:
1062 kfiresaver.kss
1063 */
1064 return R300_EASY_TX_FORMAT(Y, Z, W, ONE, W8Z8Y8X8);
1065 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x00005547, 4):
1066 /* tested with:
1067 kfiresaver.kss
1068 kfountain.kss
1069 */
1070 return R300_EASY_TX_FORMAT(Y, Z, W, ONE, W8Z8Y8X8);
1071 case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x00008847, 3):
1072 /* tested with
1073 lesson 06
1074 lesson 07
1075 */
1076 case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x00007747, 0x00000003):
1077 /* Tested with NeHe lesson 08 */
1078 //case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x0005547, 0):
1079 /* Can't remember what I tested this with..
1080 try putting return 0 of you see broken textures which
1081 are not being complained about */
1082 case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x00009947, GL_RGB8):
1083 case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x00007747, GL_RGB8):
1084 case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x00003347, GL_RGB8):
1085 case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x00008947, 3):
1086 /* Tested with:
1087 Quake3demo
1088 */
1089 return R300_EASY_TX_FORMAT(Y, Z, W, ONE, W8Z8Y8X8);
1090 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x00007847, GL_RGBA8):
1091 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x00006747, GL_RGBA8):
1092 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x00006647, GL_RGBA8):
1093 case FORMAT_HASH(0, 1, 0x2100, 0, 4, 0x1e01, 0x00008947, GL_RGBA8):
1094 /* Tested with:
1095 Quake3demo
1096 */
1097 return R300_EASY_TX_FORMAT(Y, Z, W, W, W8Z8Y8X8);
1098 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x00007747, GL_RGBA8):
1099 return R300_EASY_TX_FORMAT(Z, Y, X, W, W8Z8Y8X8) ;
1100 case FORMAT_HASH(0, 1, 0x2100, 0, 1, 0x2100, 0x0008845, 0x00008056):
1101 //return 0;
1102 fprintf(stderr, "***\n");
1103 return R300_EASY_TX_FORMAT(Y, Z, W, W, W8Z8Y8X8);
1104 }
1105
1106
1107 {
1108 static int warn_once=1;
1109 if(warn_once){
1110 fprintf(stderr, "%s:%s Do not know how to translate texture format - help me !\n",
1111 __FILE__, __FUNCTION__);
1112 warn_once=0;
1113 }
1114 }
1115 return 0;
1116 }
1117
1118 void r300_setup_textures(GLcontext *ctx)
1119 {
1120 int i, mtu;
1121 struct r300_tex_obj *t;
1122 r300ContextPtr r300 = R300_CONTEXT(ctx);
1123 int max_texture_unit=-1; /* -1 translates into no setup costs for fields */
1124 struct gl_texture_unit *texUnit;
1125
1126 R300_STATECHANGE(r300, txe);
1127 R300_STATECHANGE(r300, tex.filter);
1128 R300_STATECHANGE(r300, tex.unknown1);
1129 R300_STATECHANGE(r300, tex.size);
1130 R300_STATECHANGE(r300, tex.format);
1131 R300_STATECHANGE(r300, tex.offset);
1132 R300_STATECHANGE(r300, tex.unknown4);
1133 R300_STATECHANGE(r300, tex.unknown5);
1134 R300_STATECHANGE(r300, tex.border_color);
1135
1136 r300->state.texture.tc_count=0;
1137
1138 r300->hw.txe.cmd[R300_TXE_ENABLE]=0x0;
1139
1140 mtu = r300->radeon.glCtx->Const.MaxTextureUnits;
1141 if (RADEON_DEBUG & DEBUG_STATE)
1142 fprintf(stderr, "mtu=%d\n", mtu);
1143
1144 if(mtu>R300_MAX_TEXTURE_UNITS){
1145 fprintf(stderr, "Aiiee ! mtu=%d is greater than R300_MAX_TEXTURE_UNITS=%d\n",
1146 mtu, R300_MAX_TEXTURE_UNITS);
1147 exit(-1);
1148 }
1149 for(i=0;i<mtu;i++){
1150 if(ctx->Texture.Unit[i].Enabled){
1151 t=r300->state.texture.unit[i].texobj;
1152 fprintf(stderr, "format=%08x\n", r300->state.texture.unit[i].format);
1153 r300->state.texture.tc_count++;
1154 if(t==NULL){
1155 fprintf(stderr, "Texture unit %d enabled, but corresponding texobj is NULL, using default object.\n", i);
1156 //exit(-1);
1157 t=&default_tex_obj;
1158 }
1159 if (RADEON_DEBUG & DEBUG_STATE)
1160 fprintf(stderr, "Activating texture unit %d\n", i);
1161 max_texture_unit=i;
1162 r300->hw.txe.cmd[R300_TXE_ENABLE]|=(1<<i);
1163
1164 r300->hw.tex.filter.cmd[R300_TEX_VALUE_0+i]=t->filter;
1165
1166 /* No idea why linear filtered textures shake when puting random data */
1167 /*r300->hw.tex.unknown1.cmd[R300_TEX_VALUE_0+i]=(rand()%0xffffffff) & (~0x1fff);*/
1168 r300->hw.tex.size.cmd[R300_TEX_VALUE_0+i]=t->size;
1169 r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=t->format;
1170 //fprintf(stderr, "t->format=%08x\n", t->format);
1171 r300->hw.tex.offset.cmd[R300_TEX_VALUE_0+i]=r300->radeon.radeonScreen->fbLocation+t->offset;
1172 r300->hw.tex.unknown4.cmd[R300_TEX_VALUE_0+i]=0x0;
1173 r300->hw.tex.unknown5.cmd[R300_TEX_VALUE_0+i]=0x0;
1174 r300->hw.tex.border_color.cmd[R300_TEX_VALUE_0+i]=t->pp_border_color;
1175
1176 /* We don't know how to set this yet */
1177 //value from r300_lib.c for RGB24
1178 //r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=0x88a0c;
1179 #if 0
1180 r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=translate_texture_format(ctx, i, t->format,
1181 r300->state.texture.unit[i].texobj!=NULL?t->base.tObj->Image[0][0]->IntFormat:3,
1182 r300->state.texture.unit[i].texobj!=NULL?t->base.tObj->Image[0][0]->TexFormat:NULL);
1183 #endif
1184
1185 #if 0
1186 fprintf(stderr, "Format=%s IntFormat=%08x MesaFormat=%08x BaseFormat=%s IsCompressed=%d Target=%s\n",
1187 _mesa_lookup_enum_by_nr(t->base.tObj->Image[0][0]->Format),
1188 t->base.tObj->Image[0][0]->IntFormat,
1189 t->base.tObj->Image[0][0]->TexFormat->MesaFormat,
1190 _mesa_lookup_enum_by_nr(t->base.tObj->Image[0][0]->TexFormat->BaseFormat),
1191 t->base.tObj->Image[0][0]->IsCompressed,
1192 _mesa_lookup_enum_by_nr(t->base.tObj->Target));
1193
1194 fprintf(stderr, "pitch=%08x filter=%08x format=%08x\n", t->pitch, t->filter, r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]);
1195 fprintf(stderr, "unknown1=%08x size=%08x\n", r300->hw.tex.unknown1.cmd[R300_TEX_VALUE_0+i],
1196 r300->hw.tex.size.cmd[R300_TEX_VALUE_0+i]);
1197 #endif
1198 /* Use the code below to quickly find matching texture
1199 formats. Requires an app that displays the same texture
1200 repeatedly */
1201 #if 0
1202 if(r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]==0){
1203 static int fmt=0x0;
1204 static int k=0;
1205 k++;
1206 if(k>20){
1207 k=0;
1208 fmt++;
1209 texUnit = &ctx->Texture.Unit[i];
1210 fprintf(stderr, "Want to set FORMAT_HASH(%d, %d, 0x%04x, %d, %d, 0x%04x, 0x%08x, %s(%08x))\n",
1211 texUnit->_CurrentCombine->OperandRGB[0] -GL_SRC_COLOR,
1212 translate_src(texUnit->_CurrentCombine->SourceRGB[0]),
1213 texUnit->_CurrentCombine->ModeRGB,
1214 texUnit->_CurrentCombine->OperandA[0] -GL_SRC_ALPHA,
1215 translate_src(texUnit->_CurrentCombine->SourceA[0]),
1216 texUnit->_CurrentCombine->ModeA,
1217 t->format,
1218 _mesa_lookup_enum_by_nr(t->base.tObj->Image[0][0]->IntFormat),
1219 t->base.tObj->Image[0][0]->IntFormat
1220 );
1221 fprintf(stderr, "Also known: format_x=%08x border_color=%08x cubic_faces=%08x\n", t->format_x, t->pp_border_color, t->pp_cubic_faces);
1222 fprintf(stderr, "\t_ReallyEnabled=%08x EnvMode=%08x IntFormat=%08x\n", texUnit->_ReallyEnabled, texUnit->EnvMode, t->base.tObj->Image[0][0]->IntFormat);
1223 if(fmt>0xfff){
1224 fmt=0;
1225 }
1226 //sleep(1);
1227 fprintf(stderr, "Now trying format %08x\n",
1228 fmt);
1229 fprintf(stderr, "size=%08x\n", t->size);
1230 }
1231 //r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=known_formats[fmt];
1232 r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=
1233 R300_EASY_TX_FORMAT(Z, Y, X, W, W8Z8Y8X8) | (fmt<<24);
1234 //r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=0x08a0c | (fmt<<16);
1235 //r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=0x58a00 | (fmt);
1236 //r300->hw.tex.format.cmd[R300_TEX_VALUE_0+i]=0x53a0c | (fmt<<24);
1237 }
1238 #endif
1239
1240 }
1241
1242 }
1243 ((drm_r300_cmd_header_t*)r300->hw.tex.filter.cmd)->unchecked_state.count = max_texture_unit+1;
1244 ((drm_r300_cmd_header_t*)r300->hw.tex.unknown1.cmd)->unchecked_state.count = max_texture_unit+1;
1245 ((drm_r300_cmd_header_t*)r300->hw.tex.size.cmd)->unchecked_state.count = max_texture_unit+1;
1246 ((drm_r300_cmd_header_t*)r300->hw.tex.format.cmd)->unchecked_state.count = max_texture_unit+1;
1247 ((drm_r300_cmd_header_t*)r300->hw.tex.offset.cmd)->unchecked_state.count = max_texture_unit+1;
1248 ((drm_r300_cmd_header_t*)r300->hw.tex.unknown4.cmd)->unchecked_state.count = max_texture_unit+1;
1249 ((drm_r300_cmd_header_t*)r300->hw.tex.unknown5.cmd)->unchecked_state.count = max_texture_unit+1;
1250 ((drm_r300_cmd_header_t*)r300->hw.tex.border_color.cmd)->unchecked_state.count = max_texture_unit+1;
1251
1252 if (RADEON_DEBUG & DEBUG_STATE)
1253 fprintf(stderr, "TX_ENABLE: %08x max_texture_unit=%d\n", r300->hw.txe.cmd[R300_TXE_ENABLE], max_texture_unit);
1254 }
1255
1256 void r300_setup_rs_unit(GLcontext *ctx)
1257 {
1258 r300ContextPtr r300 = R300_CONTEXT(ctx);
1259 int i;
1260
1261 /* This needs to be rewritten - it is a hack at best */
1262
1263 R300_STATECHANGE(r300, ri);
1264 R300_STATECHANGE(r300, rc);
1265 R300_STATECHANGE(r300, rr);
1266
1267 for(i = 1; i <= 8; ++i)
1268 r300->hw.ri.cmd[i] = 0x00d10000;
1269 r300->hw.ri.cmd[R300_RI_INTERP_1] |= R300_RS_INTERP_1_UNKNOWN;
1270 r300->hw.ri.cmd[R300_RI_INTERP_2] |= R300_RS_INTERP_2_UNKNOWN;
1271 r300->hw.ri.cmd[R300_RI_INTERP_3] |= R300_RS_INTERP_3_UNKNOWN;
1272
1273 #if 1
1274 for(i = 2; i <= 8; ++i)
1275 r300->hw.ri.cmd[i] |= 4;
1276 #endif
1277
1278 for(i = 1; i <= 8; ++i)
1279 r300->hw.rr.cmd[i] = 0;
1280 /* textures enabled ? */
1281 if(r300->state.texture.tc_count>0){
1282
1283 /* This code only really works with one set of texture coordinates */
1284
1285 /* The second constant is needed to get glxgears display anything .. */
1286 r300->hw.rc.cmd[1] = R300_RS_CNTL_0_UNKNOWN_7
1287 | R300_RS_CNTL_0_UNKNOWN_18
1288 | (r300->state.texture.tc_count<<R300_RS_CNTL_TC_CNT_SHIFT);
1289 r300->hw.rc.cmd[2] = 0xc0;
1290
1291
1292 ((drm_r300_cmd_header_t*)r300->hw.rr.cmd)->unchecked_state.count = 1;
1293 r300->hw.rr.cmd[R300_RR_ROUTE_0] = 0x24008;
1294
1295 } else {
1296
1297 /* The second constant is needed to get glxgears display anything .. */
1298 r300->hw.rc.cmd[1] = R300_RS_CNTL_0_UNKNOWN_7 | R300_RS_CNTL_0_UNKNOWN_18;
1299 r300->hw.rc.cmd[2] = 0;
1300
1301 ((drm_r300_cmd_header_t*)r300->hw.rr.cmd)->unchecked_state.count = 1;
1302 r300->hw.rr.cmd[R300_RR_ROUTE_0] = 0x4000;
1303
1304 }
1305 }
1306
1307 #define vpucount(ptr) (((drm_r300_cmd_header_t*)(ptr))->vpu.count)
1308
1309 #define bump_vpu_count(ptr, new_count) do{\
1310 drm_r300_cmd_header_t* _p=((drm_r300_cmd_header_t*)(ptr));\
1311 int _nc=(new_count)/4; \
1312 if(_nc>_p->vpu.count)_p->vpu.count=_nc;\
1313 }while(0)
1314
1315 void static inline setup_vertex_shader_fragment(r300ContextPtr r300, int dest, struct r300_vertex_shader_fragment *vsf)
1316 {
1317 int i;
1318
1319 if(vsf->length==0)return;
1320
1321 if(vsf->length & 0x3){
1322 fprintf(stderr,"VERTEX_SHADER_FRAGMENT must have length divisible by 4\n");
1323 exit(-1);
1324 }
1325
1326 switch((dest>>8) & 0xf){
1327 case 0:
1328 R300_STATECHANGE(r300, vpi);
1329 for(i=0;i<vsf->length;i++)
1330 r300->hw.vpi.cmd[R300_VPI_INSTR_0+i+4*(dest & 0xff)]=(vsf->body.d[i]);
1331 bump_vpu_count(r300->hw.vpi.cmd, vsf->length+4*(dest & 0xff));
1332 break;
1333
1334 case 2:
1335 R300_STATECHANGE(r300, vpp);
1336 for(i=0;i<vsf->length;i++)
1337 r300->hw.vpp.cmd[R300_VPP_PARAM_0+i+4*(dest & 0xff)]=(vsf->body.d[i]);
1338 bump_vpu_count(r300->hw.vpp.cmd, vsf->length+4*(dest & 0xff));
1339 break;
1340 case 4:
1341 R300_STATECHANGE(r300, vps);
1342 for(i=0;i<vsf->length;i++)
1343 r300->hw.vps.cmd[1+i+4*(dest & 0xff)]=(vsf->body.d[i]);
1344 bump_vpu_count(r300->hw.vps.cmd, vsf->length+4*(dest & 0xff));
1345 break;
1346 default:
1347 fprintf(stderr, "%s:%s don't know how to handle dest %04x\n", __FILE__, __FUNCTION__, dest);
1348 exit(-1);
1349 }
1350 }
1351
1352
1353 void r300SetupVertexShader(r300ContextPtr rmesa)
1354 {
1355 GLcontext* ctx = rmesa->radeon.glCtx;
1356
1357 /* Reset state, in case we don't use something */
1358 ((drm_r300_cmd_header_t*)rmesa->hw.vpp.cmd)->vpu.count = 0;
1359 ((drm_r300_cmd_header_t*)rmesa->hw.vpi.cmd)->vpu.count = 0;
1360 ((drm_r300_cmd_header_t*)rmesa->hw.vps.cmd)->vpu.count = 0;
1361
1362
1363 /* This needs to be replaced by vertex shader generation code */
1364
1365
1366 /* textures enabled ? */
1367 if(rmesa->state.texture.tc_count>0){
1368 rmesa->state.vertex_shader=SINGLE_TEXTURE_VERTEX_SHADER;
1369 } else {
1370 rmesa->state.vertex_shader=FLAT_COLOR_VERTEX_SHADER;
1371 }
1372
1373
1374 rmesa->state.vertex_shader.matrix[0].length=16;
1375 memcpy(rmesa->state.vertex_shader.matrix[0].body.f, ctx->_ModelProjectMatrix.m, 16*4);
1376
1377 setup_vertex_shader_fragment(rmesa, VSF_DEST_PROGRAM, &(rmesa->state.vertex_shader.program));
1378
1379 setup_vertex_shader_fragment(rmesa, VSF_DEST_MATRIX0, &(rmesa->state.vertex_shader.matrix[0]));
1380 #if 0
1381 setup_vertex_shader_fragment(rmesa, VSF_DEST_MATRIX1, &(rmesa->state.vertex_shader.matrix[0]));
1382 setup_vertex_shader_fragment(rmesa, VSF_DEST_MATRIX2, &(rmesa->state.vertex_shader.matrix[0]));
1383
1384 setup_vertex_shader_fragment(rmesa, VSF_DEST_VECTOR0, &(rmesa->state.vertex_shader.vector[0]));
1385 setup_vertex_shader_fragment(rmesa, VSF_DEST_VECTOR1, &(rmesa->state.vertex_shader.vector[1]));
1386 #endif
1387
1388 #if 0
1389 setup_vertex_shader_fragment(rmesa, VSF_DEST_UNKNOWN1, &(rmesa->state.vertex_shader.unknown1));
1390 setup_vertex_shader_fragment(rmesa, VSF_DEST_UNKNOWN2, &(rmesa->state.vertex_shader.unknown2));
1391 #endif
1392
1393 R300_STATECHANGE(rmesa, pvs);
1394 rmesa->hw.pvs.cmd[R300_PVS_CNTL_1]=(rmesa->state.vertex_shader.program_start << R300_PVS_CNTL_1_PROGRAM_START_SHIFT)
1395 | (rmesa->state.vertex_shader.unknown_ptr1 << R300_PVS_CNTL_1_UNKNOWN_SHIFT)
1396 | (rmesa->state.vertex_shader.program_end << R300_PVS_CNTL_1_PROGRAM_END_SHIFT);
1397 rmesa->hw.pvs.cmd[R300_PVS_CNTL_2]=(rmesa->state.vertex_shader.param_offset << R300_PVS_CNTL_2_PARAM_OFFSET_SHIFT)
1398 | (rmesa->state.vertex_shader.param_count << R300_PVS_CNTL_2_PARAM_COUNT_SHIFT);
1399 rmesa->hw.pvs.cmd[R300_PVS_CNTL_3]=(rmesa->state.vertex_shader.unknown_ptr2 << R300_PVS_CNTL_3_PROGRAM_UNKNOWN_SHIFT)
1400 | (rmesa->state.vertex_shader.unknown_ptr3 << 0);
1401
1402 /* This is done for vertex shader fragments, but also needs to be done for vap_pvs,
1403 so I leave it as a reminder */
1404 #if 0
1405 reg_start(R300_VAP_PVS_WAITIDLE,0);
1406 e32(0x00000000);
1407 #endif
1408 }
1409
1410 void r300SetupPixelShader(r300ContextPtr rmesa)
1411 {
1412 int i,k;
1413
1414 /* This needs to be replaced by pixel shader generation code */
1415
1416 /* textures enabled ? */
1417 if(rmesa->state.texture.tc_count>0){
1418 rmesa->state.pixel_shader=SINGLE_TEXTURE_PIXEL_SHADER;
1419 } else {
1420 rmesa->state.pixel_shader=FLAT_COLOR_PIXEL_SHADER;
1421 }
1422
1423 R300_STATECHANGE(rmesa, fpt);
1424 for(i=0;i<rmesa->state.pixel_shader.program.tex.length;i++)
1425 rmesa->hw.fpt.cmd[R300_FPT_INSTR_0+i]=rmesa->state.pixel_shader.program.tex.inst[i];
1426 rmesa->hw.fpt.cmd[R300_FPT_CMD_0]=cmducs(R300_PFS_TEXI_0, rmesa->state.pixel_shader.program.tex.length);
1427
1428 #define OUTPUT_FIELD(st, reg, field) \
1429 R300_STATECHANGE(rmesa, st); \
1430 for(i=0;i<rmesa->state.pixel_shader.program.alu.length;i++) \
1431 rmesa->hw.st.cmd[R300_FPI_INSTR_0+i]=rmesa->state.pixel_shader.program.alu.inst[i].field;\
1432 rmesa->hw.st.cmd[R300_FPI_CMD_0]=cmducs(reg, rmesa->state.pixel_shader.program.alu.length);
1433
1434 OUTPUT_FIELD(fpi[0], R300_PFS_INSTR0_0, inst0);
1435 OUTPUT_FIELD(fpi[1], R300_PFS_INSTR1_0, inst1);
1436 OUTPUT_FIELD(fpi[2], R300_PFS_INSTR2_0, inst2);
1437 OUTPUT_FIELD(fpi[3], R300_PFS_INSTR3_0, inst3);
1438 #undef OUTPUT_FIELD
1439
1440 R300_STATECHANGE(rmesa, fp);
1441 for(i=0;i<4;i++){
1442 rmesa->hw.fp.cmd[R300_FP_NODE0+i]=
1443 (rmesa->state.pixel_shader.program.node[i].alu_offset << R300_PFS_NODE_ALU_OFFSET_SHIFT)
1444 | (rmesa->state.pixel_shader.program.node[i].alu_end << R300_PFS_NODE_ALU_END_SHIFT)
1445 | (rmesa->state.pixel_shader.program.node[i].tex_offset << R300_PFS_NODE_TEX_OFFSET_SHIFT)
1446 | (rmesa->state.pixel_shader.program.node[i].tex_end << R300_PFS_NODE_TEX_END_SHIFT)
1447 | ( (i==3) ? R300_PFS_NODE_LAST_NODE : 0);
1448 }
1449
1450 /* PFS_CNTL_0 */
1451 rmesa->hw.fp.cmd[R300_FP_CNTL0]=
1452 (rmesa->state.pixel_shader.program.active_nodes-1)
1453 | (rmesa->state.pixel_shader.program.first_node_has_tex<<3);
1454 /* PFS_CNTL_1 */
1455 rmesa->hw.fp.cmd[R300_FP_CNTL1]=rmesa->state.pixel_shader.program.temp_register_count;
1456 /* PFS_CNTL_2 */
1457 rmesa->hw.fp.cmd[R300_FP_CNTL2]=
1458 (rmesa->state.pixel_shader.program.alu_offset << R300_PFS_CNTL_ALU_OFFSET_SHIFT)
1459 | (rmesa->state.pixel_shader.program.alu_end << R300_PFS_CNTL_ALU_END_SHIFT)
1460 | (rmesa->state.pixel_shader.program.tex_offset << R300_PFS_CNTL_TEX_OFFSET_SHIFT)
1461 | (rmesa->state.pixel_shader.program.tex_end << R300_PFS_CNTL_TEX_END_SHIFT);
1462
1463 R300_STATECHANGE(rmesa, fpp);
1464 for(i=0;i<rmesa->state.pixel_shader.param_length;i++){
1465 rmesa->hw.fpp.cmd[R300_FPP_PARAM_0+4*i+0]=r300PackFloat32(rmesa->state.pixel_shader.param[i].x);
1466 rmesa->hw.fpp.cmd[R300_FPP_PARAM_0+4*i+1]=r300PackFloat32(rmesa->state.pixel_shader.param[i].y);
1467 rmesa->hw.fpp.cmd[R300_FPP_PARAM_0+4*i+2]=r300PackFloat32(rmesa->state.pixel_shader.param[i].z);
1468 rmesa->hw.fpp.cmd[R300_FPP_PARAM_0+4*i+3]=r300PackFloat32(rmesa->state.pixel_shader.param[i].w);
1469 }
1470 rmesa->hw.fpp.cmd[R300_FPP_CMD_0]=cmducs(R300_PFS_PARAM_0_X, rmesa->state.pixel_shader.param_length);
1471
1472 }
1473
1474 /**
1475 * Called by Mesa after an internal state update.
1476 */
1477 static void r300InvalidateState(GLcontext * ctx, GLuint new_state)
1478 {
1479 r300ContextPtr r300 = R300_CONTEXT(ctx);
1480
1481 _swrast_InvalidateState(ctx, new_state);
1482 _swsetup_InvalidateState(ctx, new_state);
1483 _ac_InvalidateState(ctx, new_state);
1484 _tnl_InvalidateState(ctx, new_state);
1485 _ae_invalidate_state(ctx, new_state);
1486
1487 /* Go inefficiency! */
1488 r300ResetHwState(r300);
1489 }
1490
1491
1492 /**
1493 * Completely recalculates hardware state based on the Mesa state.
1494 */
1495 void r300ResetHwState(r300ContextPtr r300)
1496 {
1497 GLcontext* ctx = r300->radeon.glCtx;
1498 int i;
1499
1500 if (RADEON_DEBUG & DEBUG_STATE)
1501 fprintf(stderr, "%s\n", __FUNCTION__);
1502
1503 /* This is a place to initialize registers which
1504 have bitfields accessed by different functions
1505 and not all bits are used */
1506 #if 0
1507 r300->hw.zs.cmd[R300_ZS_CNTL_0] = 0;
1508 r300->hw.zs.cmd[R300_ZS_CNTL_1] = 0;
1509 r300->hw.zs.cmd[R300_ZS_CNTL_2] = 0xffff00;
1510 #endif
1511
1512 /* go and compute register values from GL state */
1513
1514 r300UpdateWindow(ctx);
1515
1516 r300ColorMask(ctx,
1517 ctx->Color.ColorMask[RCOMP],
1518 ctx->Color.ColorMask[GCOMP],
1519 ctx->Color.ColorMask[BCOMP],
1520 ctx->Color.ColorMask[ACOMP]);
1521
1522 r300Enable(ctx, GL_DEPTH_TEST, ctx->Depth.Test);
1523 r300DepthMask(ctx, ctx->Depth.Mask);
1524 r300DepthFunc(ctx, ctx->Depth.Func);
1525
1526 r300UpdateCulling(ctx);
1527
1528 r300_setup_routing(ctx, GL_TRUE);
1529
1530 r300UpdateTextureState(ctx);
1531 r300_setup_textures(ctx);
1532 r300_setup_rs_unit(ctx);
1533
1534 r300SetupVertexShader(r300);
1535 r300SetupPixelShader(r300);
1536
1537 r300_set_blend_state(ctx);
1538 r300AlphaFunc(ctx, ctx->Color.AlphaFunc, ctx->Color.AlphaRef);
1539
1540 /* Initialize magic registers
1541 TODO : learn what they really do, or get rid of
1542 those we don't have to touch */
1543 r300->hw.unk2080.cmd[1] = 0x0030045A;
1544
1545 r300->hw.vte.cmd[1] = R300_VPORT_X_SCALE_ENA
1546 | R300_VPORT_X_OFFSET_ENA
1547 | R300_VPORT_Y_SCALE_ENA
1548 | R300_VPORT_Y_OFFSET_ENA
1549 | R300_VPORT_Z_SCALE_ENA
1550 | R300_VPORT_Z_OFFSET_ENA
1551 | R300_VTX_W0_FMT;
1552 r300->hw.vte.cmd[2] = 0x00000008;
1553
1554 r300->hw.unk2134.cmd[1] = 0x00FFFFFF;
1555 r300->hw.unk2134.cmd[2] = 0x00000000;
1556
1557 r300->hw.unk2140.cmd[1] = 0x00000000;
1558
1559 #if 0 /* Done in setup routing */
1560 ((drm_r300_cmd_header_t*)r300->hw.vir[0].cmd)->unchecked_state.count = 1;
1561 r300->hw.vir[0].cmd[1] = 0x21030003;
1562
1563 ((drm_r300_cmd_header_t*)r300->hw.vir[1].cmd)->unchecked_state.count = 1;
1564 r300->hw.vir[1].cmd[1] = 0xF688F688;
1565
1566 r300->hw.vic.cmd[R300_VIR_CNTL_0] = 0x00000001;
1567 r300->hw.vic.cmd[R300_VIR_CNTL_1] = 0x00000405;
1568 #endif
1569
1570 r300->hw.unk21DC.cmd[1] = 0xAAAAAAAA;
1571
1572 r300->hw.unk221C.cmd[1] = R300_221C_NORMAL;
1573
1574 r300->hw.unk2220.cmd[1] = r300PackFloat32(1.0);
1575 r300->hw.unk2220.cmd[2] = r300PackFloat32(1.0);
1576 r300->hw.unk2220.cmd[3] = r300PackFloat32(1.0);
1577 r300->hw.unk2220.cmd[4] = r300PackFloat32(1.0);
1578
1579 if (GET_CHIP(r300->radeon.radeonScreen) == RADEON_CHIP_R300)
1580 r300->hw.unk2288.cmd[1] = R300_2288_R300;
1581 else
1582 r300->hw.unk2288.cmd[1] = R300_2288_RV350;
1583
1584 #if 0
1585 r300->hw.vof.cmd[R300_VOF_CNTL_0] = R300_VAP_OUTPUT_VTX_FMT_0__POS_PRESENT
1586 | R300_VAP_OUTPUT_VTX_FMT_0__COLOR_PRESENT;
1587 r300->hw.vof.cmd[R300_VOF_CNTL_1] = 0; /* no textures */
1588
1589
1590 r300->hw.pvs.cmd[R300_PVS_CNTL_1] = 0;
1591 r300->hw.pvs.cmd[R300_PVS_CNTL_2] = 0;
1592 r300->hw.pvs.cmd[R300_PVS_CNTL_3] = 0;
1593 #endif
1594
1595 r300->hw.gb_enable.cmd[1] = R300_GB_POINT_STUFF_ENABLE
1596 | R300_GB_LINE_STUFF_ENABLE
1597 | R300_GB_TRIANGLE_STUFF_ENABLE;
1598
1599 r300->hw.gb_misc.cmd[R300_GB_MISC_MSPOS_0] = 0x66666666;
1600 r300->hw.gb_misc.cmd[R300_GB_MISC_MSPOS_1] = 0x06666666;
1601 if (GET_CHIP(r300->radeon.radeonScreen) == RADEON_CHIP_R300)
1602 r300->hw.gb_misc.cmd[R300_GB_MISC_TILE_CONFIG] = R300_GB_TILE_ENABLE
1603 | R300_GB_TILE_PIPE_COUNT_R300
1604 | R300_GB_TILE_SIZE_16;
1605 else
1606 r300->hw.gb_misc.cmd[R300_GB_MISC_TILE_CONFIG] = R300_GB_TILE_ENABLE
1607 | R300_GB_TILE_PIPE_COUNT_RV300
1608 | R300_GB_TILE_SIZE_16;
1609 r300->hw.gb_misc.cmd[R300_GB_MISC_SELECT] = 0x00000000;
1610 r300->hw.gb_misc.cmd[R300_GB_MISC_AA_CONFIG] = 0x00000000; /* No antialiasing */
1611
1612 //r300->hw.txe.cmd[R300_TXE_ENABLE] = 0;
1613
1614 r300->hw.unk4200.cmd[1] = r300PackFloat32(0.0);
1615 r300->hw.unk4200.cmd[2] = r300PackFloat32(0.0);
1616 r300->hw.unk4200.cmd[3] = r300PackFloat32(1.0);
1617 r300->hw.unk4200.cmd[4] = r300PackFloat32(1.0);
1618
1619 r300->hw.unk4214.cmd[1] = 0x00050005;
1620
1621 r300->hw.ps.cmd[R300_PS_POINTSIZE] = (6 << R300_POINTSIZE_X_SHIFT) |
1622 (6 << R300_POINTSIZE_Y_SHIFT);
1623
1624 r300->hw.unk4230.cmd[1] = 0x01800000;
1625 r300->hw.unk4230.cmd[2] = 0x00020006;
1626 r300->hw.unk4230.cmd[3] = r300PackFloat32(1.0 / 192.0);
1627
1628 r300->hw.unk4260.cmd[1] = 0;
1629 r300->hw.unk4260.cmd[2] = r300PackFloat32(0.0);
1630 r300->hw.unk4260.cmd[3] = r300PackFloat32(1.0);
1631
1632 r300->hw.unk4274.cmd[1] = 0x00000002;
1633 r300->hw.unk4274.cmd[2] = 0x0003AAAA;
1634 r300->hw.unk4274.cmd[3] = 0x00000000;
1635 r300->hw.unk4274.cmd[4] = 0x00000000;
1636
1637 r300->hw.unk4288.cmd[1] = 0x00000000;
1638 r300->hw.unk4288.cmd[2] = 0x00000001;
1639 r300->hw.unk4288.cmd[3] = 0x00000000;
1640 r300->hw.unk4288.cmd[4] = 0x00000000;
1641 r300->hw.unk4288.cmd[5] = 0x00000000;
1642
1643 r300->hw.unk42A0.cmd[1] = 0x00000000;
1644
1645 r300->hw.unk42B4.cmd[1] = 0x00000000;
1646
1647 r300->hw.unk42C0.cmd[1] = 0x4B7FFFFF;
1648 r300->hw.unk42C0.cmd[2] = 0x00000000;
1649
1650
1651 r300->hw.unk43A4.cmd[1] = 0x0000001C;
1652 r300->hw.unk43A4.cmd[2] = 0x2DA49525;
1653
1654 r300->hw.unk43E8.cmd[1] = 0x00FFFFFF;
1655
1656 #if 0
1657 r300->hw.fp.cmd[R300_FP_CNTL0] = 0;
1658 r300->hw.fp.cmd[R300_FP_CNTL1] = 0;
1659 r300->hw.fp.cmd[R300_FP_CNTL2] = 0;
1660 r300->hw.fp.cmd[R300_FP_NODE0] = 0;
1661 r300->hw.fp.cmd[R300_FP_NODE1] = 0;
1662 r300->hw.fp.cmd[R300_FP_NODE2] = 0;
1663 r300->hw.fp.cmd[R300_FP_NODE3] = 0;
1664 #endif
1665
1666 r300->hw.unk46A4.cmd[1] = 0x00001B01;
1667 r300->hw.unk46A4.cmd[2] = 0x00001B0F;
1668 r300->hw.unk46A4.cmd[3] = 0x00001B0F;
1669 r300->hw.unk46A4.cmd[4] = 0x00001B0F;
1670 r300->hw.unk46A4.cmd[5] = 0x00000001;
1671
1672 #if 0
1673 for(i = 1; i <= 64; ++i) {
1674 /* create NOP instructions */
1675 r300->hw.fpi[0].cmd[i] = FP_INSTRC(MAD, FP_ARGC(SRC0C_XYZ), FP_ARGC(ONE), FP_ARGC(ZERO));
1676 r300->hw.fpi[1].cmd[i] = FP_SELC(0,XYZ,NO,FP_TMP(0),0,0);
1677 r300->hw.fpi[2].cmd[i] = FP_INSTRA(MAD, FP_ARGA(SRC0A), FP_ARGA(ONE), FP_ARGA(ZERO));
1678 r300->hw.fpi[3].cmd[i] = FP_SELA(0,W,NO,FP_TMP(0),0,0);
1679 }
1680 #endif
1681
1682 r300->hw.unk4BC0.cmd[1] = 0;
1683
1684 r300->hw.unk4BC8.cmd[1] = 0;
1685 r300->hw.unk4BC8.cmd[2] = 0;
1686 r300->hw.unk4BC8.cmd[3] = 0;
1687
1688 #if 0
1689 r300->hw.at.cmd[R300_AT_ALPHA_TEST] = 0;
1690 #endif
1691
1692 r300->hw.unk4BD8.cmd[1] = 0;
1693
1694 r300->hw.unk4E00.cmd[1] = 0;
1695
1696 #if 0
1697 r300->hw.bld.cmd[R300_BLD_CBLEND] = 0;
1698 r300->hw.bld.cmd[R300_BLD_ABLEND] = 0;
1699 #endif
1700
1701 r300->hw.unk4E10.cmd[1] = 0;
1702 r300->hw.unk4E10.cmd[2] = 0;
1703 r300->hw.unk4E10.cmd[3] = 0;
1704
1705 r300->hw.cb.cmd[R300_CB_OFFSET] =
1706 r300->radeon.radeonScreen->backOffset +
1707 r300->radeon.radeonScreen->fbLocation;
1708 r300->hw.cb.cmd[R300_CB_PITCH] = r300->radeon.radeonScreen->backPitch
1709 | R300_COLOR_UNKNOWN_22_23;
1710
1711 r300->hw.unk4E50.cmd[1] = 0;
1712 r300->hw.unk4E50.cmd[2] = 0;
1713 r300->hw.unk4E50.cmd[3] = 0;
1714 r300->hw.unk4E50.cmd[4] = 0;
1715 r300->hw.unk4E50.cmd[5] = 0;
1716 r300->hw.unk4E50.cmd[6] = 0;
1717 r300->hw.unk4E50.cmd[7] = 0;
1718 r300->hw.unk4E50.cmd[8] = 0;
1719 r300->hw.unk4E50.cmd[9] = 0;
1720
1721 r300->hw.unk4E88.cmd[1] = 0;
1722
1723 r300->hw.unk4EA0.cmd[1] = 0x00000000;
1724 r300->hw.unk4EA0.cmd[2] = 0xffffffff;
1725
1726 r300->hw.unk4F10.cmd[1] = 0x00000002; // depthbuffer format?
1727 r300->hw.unk4F10.cmd[2] = 0x00000000;
1728 r300->hw.unk4F10.cmd[3] = 0x00000003;
1729 r300->hw.unk4F10.cmd[4] = 0x00000000;
1730
1731 r300->hw.zb.cmd[R300_ZB_OFFSET] =
1732 r300->radeon.radeonScreen->depthOffset +
1733 r300->radeon.radeonScreen->fbLocation;
1734 r300->hw.zb.cmd[R300_ZB_PITCH] = r300->radeon.radeonScreen->depthPitch;
1735
1736 r300->hw.unk4F28.cmd[1] = 0;
1737
1738 r300->hw.unk4F30.cmd[1] = 0;
1739 r300->hw.unk4F30.cmd[2] = 0;
1740
1741 r300->hw.unk4F44.cmd[1] = 0;
1742
1743 r300->hw.unk4F54.cmd[1] = 0;
1744
1745 #if 0
1746 ((drm_r300_cmd_header_t*)r300->hw.vpi.cmd)->vpu.count = 0;
1747 for(i = 1; i < R300_VPI_CMDSIZE; i += 4) {
1748 /* MOV t0, t0 */
1749 r300->hw.vpi.cmd[i+0] = VP_OUT(ADD,TMP,0,XYZW);
1750 r300->hw.vpi.cmd[i+1] = VP_IN(TMP,0);
1751 r300->hw.vpi.cmd[i+2] = VP_ZERO();
1752 r300->hw.vpi.cmd[i+3] = VP_ZERO();
1753 }
1754
1755 ((drm_r300_cmd_header_t*)r300->hw.vpp.cmd)->vpu.count = 0;
1756 for(i = 1; i < R300_VPP_CMDSIZE; ++i)
1757 r300->hw.vpp.cmd[i] = 0;
1758 #endif
1759
1760 r300->hw.vps.cmd[R300_VPS_ZERO_0] = 0;
1761 r300->hw.vps.cmd[R300_VPS_ZERO_1] = 0;
1762 r300->hw.vps.cmd[R300_VPS_POINTSIZE] = r300PackFloat32(1.0);
1763 r300->hw.vps.cmd[R300_VPS_ZERO_3] = 0;
1764
1765 //END: TODO
1766
1767 r300->hw.all_dirty = GL_TRUE;
1768 }
1769
1770
1771
1772 /**
1773 * Calculate initial hardware state and register state functions.
1774 * Assumes that the command buffer and state atoms have been
1775 * initialized already.
1776 */
1777 void r300InitState(r300ContextPtr r300)
1778 {
1779 GLcontext *ctx = r300->radeon.glCtx;
1780 GLuint depth_fmt;
1781
1782 radeonInitState(&r300->radeon);
1783
1784 switch (ctx->Visual.depthBits) {
1785 case 16:
1786 r300->state.depth.scale = 1.0 / (GLfloat) 0xffff;
1787 depth_fmt = R200_DEPTH_FORMAT_16BIT_INT_Z;
1788 //r300->state.stencil.clear = 0x00000000;
1789 break;
1790 case 24:
1791 r300->state.depth.scale = 1.0 / (GLfloat) 0xffffff;
1792 depth_fmt = R200_DEPTH_FORMAT_24BIT_INT_Z;
1793 //r300->state.stencil.clear = 0xff000000;
1794 break;
1795 default:
1796 fprintf(stderr, "Error: Unsupported depth %d... exiting\n",
1797 ctx->Visual.depthBits);
1798 exit(-1);
1799 }
1800
1801 /* Only have hw stencil when depth buffer is 24 bits deep */
1802 r300->state.hw_stencil = (ctx->Visual.stencilBits > 0 &&
1803 ctx->Visual.depthBits == 24);
1804
1805 memset(&(r300->state.texture), 0, sizeof(r300->state.texture));
1806
1807 r300ResetHwState(r300);
1808 }
1809
1810
1811
1812 /**
1813 * Initialize driver's state callback functions
1814 */
1815 void r300InitStateFuncs(struct dd_function_table* functions)
1816 {
1817 radeonInitStateFuncs(functions);
1818
1819 functions->UpdateState = r300InvalidateState;
1820 functions->AlphaFunc = r300AlphaFunc;
1821 functions->BlendColor = r300BlendColor;
1822 functions->BlendEquationSeparate = r300BlendEquationSeparate;
1823 functions->BlendFuncSeparate = r300BlendFuncSeparate;
1824 functions->Enable = r300Enable;
1825 functions->ColorMask = r300ColorMask;
1826 functions->DepthFunc = r300DepthFunc;
1827 functions->DepthMask = r300DepthMask;
1828 functions->CullFace = r300CullFace;
1829 functions->FrontFace = r300FrontFace;
1830
1831 /* Stencil related */
1832 functions->ClearStencil = r300ClearStencil;
1833 functions->StencilFunc = r300StencilFunc;
1834 functions->StencilMask = r300StencilMask;
1835 functions->StencilOp = r300StencilOp;
1836
1837 /* Viewport related */
1838 functions->Viewport = r300Viewport;
1839 functions->DepthRange = r300DepthRange;
1840 functions->PointSize = r300PointSize;
1841 }
1842