1 /* $XFree86: xc/lib/GL/mesa/src/drv/radeon/radeon_texstate.c,v 1.6 2002/12/16 16:18:59 dawes Exp $ */
2 /**************************************************************************
4 Copyright 2000, 2001 ATI Technologies Inc., Ontario, Canada, and
5 VA Linux Systems Inc., Fremont, California.
9 Permission is hereby granted, free of charge, to any person obtaining
10 a copy of this software and associated documentation files (the
11 "Software"), to deal in the Software without restriction, including
12 without limitation the rights to use, copy, modify, merge, publish,
13 distribute, sublicense, and/or sell copies of the Software, and to
14 permit persons to whom the Software is furnished to do so, subject to
15 the following conditions:
17 The above copyright notice and this permission notice (including the
18 next paragraph) shall be included in all copies or substantial
19 portions of the Software.
21 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
22 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
23 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
24 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
25 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
26 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
27 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
29 **************************************************************************/
33 * Kevin E. Martin <martin@valinux.com>
34 * Gareth Hughes <gareth@valinux.com>
42 #include "texformat.h"
45 #include "radeon_context.h"
46 #include "radeon_state.h"
47 #include "radeon_ioctl.h"
48 #include "radeon_swtcl.h"
49 #include "radeon_tex.h"
50 #include "radeon_tcl.h"
53 #define RADEON_TXFORMAT_AL88 RADEON_TXFORMAT_AI88
54 #define RADEON_TXFORMAT_YCBCR RADEON_TXFORMAT_YVYU422
55 #define RADEON_TXFORMAT_YCBCR_REV RADEON_TXFORMAT_VYUY422
58 [ MESA_FORMAT_ ## f ] = { RADEON_TXFORMAT_ ## f, 0 }
60 [ MESA_FORMAT_ ## f ] = { RADEON_TXFORMAT_ ## f | RADEON_TXFORMAT_ALPHA_IN_MAP, 0 }
62 [ MESA_FORMAT_ ## f ] = { RADEON_TXFORMAT_ ## f, RADEON_YUV_TO_RGB }
64 [ MESA_FORMAT_ ## f ] = { 0xffffffff, 0 }
65 #define VALID_FORMAT(f) ( ((f) <= MESA_FORMAT_YCBCR_REV) \
66 && (tx_table[f].format != 0xffffffff) )
69 GLuint format
, filter
;
93 * This function computes the number of bytes of storage needed for
94 * the given texture object (all mipmap levels, all cube faces).
95 * The \c image[face][level].x/y/width/height parameters for upload/blitting
96 * are computed here. \c pp_txfilter, \c pp_txformat, etc. will be set here
99 * \param rmesa Context pointer
100 * \param tObj GL texture object whose images are to be posted to
103 static void radeonSetTexImages( radeonContextPtr rmesa
,
104 struct gl_texture_object
*tObj
)
106 radeonTexObjPtr t
= (radeonTexObjPtr
)tObj
->DriverData
;
107 const struct gl_texture_image
*baseImage
= tObj
->Image
[0][tObj
->BaseLevel
];
111 GLint log2Width
, log2Height
, log2Depth
;
113 /* Set the hardware texture format
116 t
->pp_txformat
&= ~(RADEON_TXFORMAT_FORMAT_MASK
|
117 RADEON_TXFORMAT_ALPHA_IN_MAP
);
118 t
->pp_txfilter
&= ~RADEON_YUV_TO_RGB
;
120 if ( VALID_FORMAT( baseImage
->TexFormat
->MesaFormat
) ) {
121 t
->pp_txformat
|= tx_table
[ baseImage
->TexFormat
->MesaFormat
].format
;
122 t
->pp_txfilter
|= tx_table
[ baseImage
->TexFormat
->MesaFormat
].filter
;
125 _mesa_problem(NULL
, "unexpected texture format in %s", __FUNCTION__
);
130 /* Compute which mipmap levels we really want to send to the hardware.
133 driCalculateTextureFirstLastLevel( (driTextureObject
*) t
);
134 log2Width
= tObj
->Image
[0][t
->base
.firstLevel
]->WidthLog2
;
135 log2Height
= tObj
->Image
[0][t
->base
.firstLevel
]->HeightLog2
;
136 log2Depth
= tObj
->Image
[0][t
->base
.firstLevel
]->DepthLog2
;
138 numLevels
= t
->base
.lastLevel
- t
->base
.firstLevel
+ 1;
140 assert(numLevels
<= RADEON_MAX_TEXTURE_LEVELS
);
142 /* Calculate mipmap offsets and dimensions for blitting (uploading)
143 * The idea is that we lay out the mipmap levels within a block of
144 * memory organized as a rectangle of width BLIT_WIDTH_BYTES.
148 for (i
= 0; i
< numLevels
; i
++) {
149 const struct gl_texture_image
*texImage
;
152 texImage
= tObj
->Image
[0][i
+ t
->base
.firstLevel
];
156 /* find image size in bytes */
157 if (texImage
->IsCompressed
) {
158 size
= texImage
->CompressedSize
;
160 else if (tObj
->Target
== GL_TEXTURE_RECTANGLE_NV
) {
161 size
= ((texImage
->Width
* texImage
->TexFormat
->TexelBytes
+ 63)
162 & ~63) * texImage
->Height
;
165 int w
= texImage
->Width
* texImage
->TexFormat
->TexelBytes
;
168 size
= w
* texImage
->Height
* texImage
->Depth
;
173 /* Align to 32-byte offset. It is faster to do this unconditionally
174 * (no branch penalty).
177 curOffset
= (curOffset
+ 0x1f) & ~0x1f;
179 t
->image
[0][i
].x
= curOffset
% BLIT_WIDTH_BYTES
;
180 t
->image
[0][i
].y
= curOffset
/ BLIT_WIDTH_BYTES
;
181 t
->image
[0][i
].width
= MIN2(size
, BLIT_WIDTH_BYTES
);
182 t
->image
[0][i
].height
= size
/ t
->image
[0][i
].width
;
185 /* for debugging only and only applicable to non-rectangle targets */
186 assert(size
% t
->image
[0][i
].width
== 0);
187 assert(t
->image
[0][i
].x
== 0
188 || (size
< BLIT_WIDTH_BYTES
&& t
->image
[0][i
].height
== 1));
193 "level %d: %dx%d x=%d y=%d w=%d h=%d size=%d at %d\n",
194 i
, texImage
->Width
, texImage
->Height
,
195 t
->image
[0][i
].x
, t
->image
[0][i
].y
,
196 t
->image
[0][i
].width
, t
->image
[0][i
].height
, size
, curOffset
);
202 /* Align the total size of texture memory block.
204 t
->base
.totalSize
= (curOffset
+ RADEON_OFFSET_MASK
) & ~RADEON_OFFSET_MASK
;
208 t
->pp_txfilter
&= ~RADEON_MAX_MIP_LEVEL_MASK
;
209 t
->pp_txfilter
|= (numLevels
- 1) << RADEON_MAX_MIP_LEVEL_SHIFT
;
211 t
->pp_txformat
&= ~(RADEON_TXFORMAT_WIDTH_MASK
|
212 RADEON_TXFORMAT_HEIGHT_MASK
|
213 RADEON_TXFORMAT_CUBIC_MAP_ENABLE
);
214 t
->pp_txformat
|= ((log2Width
<< RADEON_TXFORMAT_WIDTH_SHIFT
) |
215 (log2Height
<< RADEON_TXFORMAT_HEIGHT_SHIFT
));
217 t
->pp_txsize
= (((tObj
->Image
[0][t
->base
.firstLevel
]->Width
- 1) << 0) |
218 ((tObj
->Image
[0][t
->base
.firstLevel
]->Height
- 1) << 16));
220 /* Only need to round to nearest 32 for textures, but the blitter
221 * requires 64-byte aligned pitches, and we may/may not need the
222 * blitter. NPOT only!
224 if (baseImage
->IsCompressed
)
225 t
->pp_txpitch
= (tObj
->Image
[0][t
->base
.firstLevel
]->Width
+ 63) & ~(63);
227 t
->pp_txpitch
= ((tObj
->Image
[0][t
->base
.firstLevel
]->Width
* baseImage
->TexFormat
->TexelBytes
) + 63) & ~(63);
230 t
->dirty_state
= TEX_ALL
;
232 /* FYI: radeonUploadTexImages( rmesa, t ); used to be called here */
237 /* ================================================================
238 * Texture combine functions
241 /* GL_ARB_texture_env_combine support
244 /* The color tables have combine functions for GL_SRC_COLOR,
245 * GL_ONE_MINUS_SRC_COLOR, GL_SRC_ALPHA and GL_ONE_MINUS_SRC_ALPHA.
247 static GLuint radeon_texture_color
[][RADEON_MAX_TEXTURE_UNITS
] =
250 RADEON_COLOR_ARG_A_T0_COLOR
,
251 RADEON_COLOR_ARG_A_T1_COLOR
,
252 RADEON_COLOR_ARG_A_T2_COLOR
255 RADEON_COLOR_ARG_A_T0_COLOR
| RADEON_COMP_ARG_A
,
256 RADEON_COLOR_ARG_A_T1_COLOR
| RADEON_COMP_ARG_A
,
257 RADEON_COLOR_ARG_A_T2_COLOR
| RADEON_COMP_ARG_A
260 RADEON_COLOR_ARG_A_T0_ALPHA
,
261 RADEON_COLOR_ARG_A_T1_ALPHA
,
262 RADEON_COLOR_ARG_A_T2_ALPHA
265 RADEON_COLOR_ARG_A_T0_ALPHA
| RADEON_COMP_ARG_A
,
266 RADEON_COLOR_ARG_A_T1_ALPHA
| RADEON_COMP_ARG_A
,
267 RADEON_COLOR_ARG_A_T2_ALPHA
| RADEON_COMP_ARG_A
271 static GLuint radeon_tfactor_color
[] =
273 RADEON_COLOR_ARG_A_TFACTOR_COLOR
,
274 RADEON_COLOR_ARG_A_TFACTOR_COLOR
| RADEON_COMP_ARG_A
,
275 RADEON_COLOR_ARG_A_TFACTOR_ALPHA
,
276 RADEON_COLOR_ARG_A_TFACTOR_ALPHA
| RADEON_COMP_ARG_A
279 static GLuint radeon_primary_color
[] =
281 RADEON_COLOR_ARG_A_DIFFUSE_COLOR
,
282 RADEON_COLOR_ARG_A_DIFFUSE_COLOR
| RADEON_COMP_ARG_A
,
283 RADEON_COLOR_ARG_A_DIFFUSE_ALPHA
,
284 RADEON_COLOR_ARG_A_DIFFUSE_ALPHA
| RADEON_COMP_ARG_A
287 static GLuint radeon_previous_color
[] =
289 RADEON_COLOR_ARG_A_CURRENT_COLOR
,
290 RADEON_COLOR_ARG_A_CURRENT_COLOR
| RADEON_COMP_ARG_A
,
291 RADEON_COLOR_ARG_A_CURRENT_ALPHA
,
292 RADEON_COLOR_ARG_A_CURRENT_ALPHA
| RADEON_COMP_ARG_A
295 /* GL_ZERO table - indices 0-3
296 * GL_ONE table - indices 1-4
298 static GLuint radeon_zero_color
[] =
300 RADEON_COLOR_ARG_A_ZERO
,
301 RADEON_COLOR_ARG_A_ZERO
| RADEON_COMP_ARG_A
,
302 RADEON_COLOR_ARG_A_ZERO
,
303 RADEON_COLOR_ARG_A_ZERO
| RADEON_COMP_ARG_A
,
304 RADEON_COLOR_ARG_A_ZERO
308 /* The alpha tables only have GL_SRC_ALPHA and GL_ONE_MINUS_SRC_ALPHA.
310 static GLuint radeon_texture_alpha
[][RADEON_MAX_TEXTURE_UNITS
] =
313 RADEON_ALPHA_ARG_A_T0_ALPHA
,
314 RADEON_ALPHA_ARG_A_T1_ALPHA
,
315 RADEON_ALPHA_ARG_A_T2_ALPHA
318 RADEON_ALPHA_ARG_A_T0_ALPHA
| RADEON_COMP_ARG_A
,
319 RADEON_ALPHA_ARG_A_T1_ALPHA
| RADEON_COMP_ARG_A
,
320 RADEON_ALPHA_ARG_A_T2_ALPHA
| RADEON_COMP_ARG_A
324 static GLuint radeon_tfactor_alpha
[] =
326 RADEON_ALPHA_ARG_A_TFACTOR_ALPHA
,
327 RADEON_ALPHA_ARG_A_TFACTOR_ALPHA
| RADEON_COMP_ARG_A
330 static GLuint radeon_primary_alpha
[] =
332 RADEON_ALPHA_ARG_A_DIFFUSE_ALPHA
,
333 RADEON_ALPHA_ARG_A_DIFFUSE_ALPHA
| RADEON_COMP_ARG_A
336 static GLuint radeon_previous_alpha
[] =
338 RADEON_ALPHA_ARG_A_CURRENT_ALPHA
,
339 RADEON_ALPHA_ARG_A_CURRENT_ALPHA
| RADEON_COMP_ARG_A
342 /* GL_ZERO table - indices 0-1
343 * GL_ONE table - indices 1-2
345 static GLuint radeon_zero_alpha
[] =
347 RADEON_ALPHA_ARG_A_ZERO
,
348 RADEON_ALPHA_ARG_A_ZERO
| RADEON_COMP_ARG_A
,
349 RADEON_ALPHA_ARG_A_ZERO
353 /* Extract the arg from slot A, shift it into the correct argument slot
354 * and set the corresponding complement bit.
356 #define RADEON_COLOR_ARG( n, arg ) \
359 ((color_arg[n] & RADEON_COLOR_ARG_MASK) \
360 << RADEON_COLOR_ARG_##arg##_SHIFT); \
362 ((color_arg[n] >> RADEON_COMP_ARG_SHIFT) \
363 << RADEON_COMP_ARG_##arg##_SHIFT); \
366 #define RADEON_ALPHA_ARG( n, arg ) \
369 ((alpha_arg[n] & RADEON_ALPHA_ARG_MASK) \
370 << RADEON_ALPHA_ARG_##arg##_SHIFT); \
372 ((alpha_arg[n] >> RADEON_COMP_ARG_SHIFT) \
373 << RADEON_COMP_ARG_##arg##_SHIFT); \
377 /* ================================================================
378 * Texture unit state management
381 static GLboolean
radeonUpdateTextureEnv( GLcontext
*ctx
, int unit
)
383 radeonContextPtr rmesa
= RADEON_CONTEXT(ctx
);
384 const struct gl_texture_unit
*texUnit
= &ctx
->Texture
.Unit
[unit
];
385 GLuint color_combine
, alpha_combine
;
386 const GLuint color_combine0
= RADEON_COLOR_ARG_A_ZERO
| RADEON_COLOR_ARG_B_ZERO
387 | RADEON_COLOR_ARG_C_CURRENT_COLOR
| RADEON_BLEND_CTL_ADD
388 | RADEON_SCALE_1X
| RADEON_CLAMP_TX
;
389 const GLuint alpha_combine0
= RADEON_ALPHA_ARG_A_ZERO
| RADEON_ALPHA_ARG_B_ZERO
390 | RADEON_ALPHA_ARG_C_CURRENT_ALPHA
| RADEON_BLEND_CTL_ADD
391 | RADEON_SCALE_1X
| RADEON_CLAMP_TX
;
394 /* texUnit->_Current can be NULL if and only if the texture unit is
395 * not actually enabled.
397 assert( (texUnit
->_ReallyEnabled
== 0)
398 || (texUnit
->_Current
!= NULL
) );
400 if ( RADEON_DEBUG
& DEBUG_TEXTURE
) {
401 fprintf( stderr
, "%s( %p, %d )\n", __FUNCTION__
, (void *)ctx
, unit
);
404 /* Set the texture environment state. Isn't this nice and clean?
405 * The chip will automagically set the texture alpha to 0xff when
406 * the texture format does not include an alpha component. This
407 * reduces the amount of special-casing we have to do, alpha-only
408 * textures being a notable exception.
410 /* Don't cache these results.
412 rmesa
->state
.texture
.unit
[unit
].format
= 0;
413 rmesa
->state
.texture
.unit
[unit
].envMode
= 0;
415 if ( !texUnit
->_ReallyEnabled
) {
416 color_combine
= color_combine0
;
417 alpha_combine
= alpha_combine0
;
420 GLuint color_arg
[3], alpha_arg
[3];
422 const GLuint numColorArgs
= texUnit
->_CurrentCombine
->_NumArgsRGB
;
423 const GLuint numAlphaArgs
= texUnit
->_CurrentCombine
->_NumArgsA
;
424 GLuint RGBshift
= texUnit
->_CurrentCombine
->ScaleShiftRGB
;
425 GLuint Ashift
= texUnit
->_CurrentCombine
->ScaleShiftA
;
429 * Extract the color and alpha combine function arguments.
431 for ( i
= 0 ; i
< numColorArgs
; i
++ ) {
432 const GLint op
= texUnit
->_CurrentCombine
->OperandRGB
[i
] - GL_SRC_COLOR
;
433 const GLuint srcRGBi
= texUnit
->_CurrentCombine
->SourceRGB
[i
];
438 color_arg
[i
] = radeon_texture_color
[op
][unit
];
441 color_arg
[i
] = radeon_tfactor_color
[op
];
443 case GL_PRIMARY_COLOR
:
444 color_arg
[i
] = radeon_primary_color
[op
];
447 color_arg
[i
] = radeon_previous_color
[op
];
450 color_arg
[i
] = radeon_zero_color
[op
];
453 color_arg
[i
] = radeon_zero_color
[op
+1];
458 /* implement ogl 1.4/1.5 core spec here, not specification of
459 * GL_ARB_texture_env_crossbar (which would require disabling blending
460 * instead of undefined results when referencing not enabled texunit) */
461 color_arg
[i
] = radeon_texture_color
[op
][srcRGBi
- GL_TEXTURE0
];
468 for ( i
= 0 ; i
< numAlphaArgs
; i
++ ) {
469 const GLint op
= texUnit
->_CurrentCombine
->OperandA
[i
] - GL_SRC_ALPHA
;
470 const GLuint srcAi
= texUnit
->_CurrentCombine
->SourceA
[i
];
475 alpha_arg
[i
] = radeon_texture_alpha
[op
][unit
];
478 alpha_arg
[i
] = radeon_tfactor_alpha
[op
];
480 case GL_PRIMARY_COLOR
:
481 alpha_arg
[i
] = radeon_primary_alpha
[op
];
484 alpha_arg
[i
] = radeon_previous_alpha
[op
];
487 alpha_arg
[i
] = radeon_zero_alpha
[op
];
490 alpha_arg
[i
] = radeon_zero_alpha
[op
+1];
495 alpha_arg
[i
] = radeon_texture_alpha
[op
][srcAi
- GL_TEXTURE0
];
503 * Build up the color and alpha combine functions.
505 switch ( texUnit
->_CurrentCombine
->ModeRGB
) {
507 color_combine
= (RADEON_COLOR_ARG_A_ZERO
|
508 RADEON_COLOR_ARG_B_ZERO
|
509 RADEON_BLEND_CTL_ADD
|
511 RADEON_COLOR_ARG( 0, C
);
514 color_combine
= (RADEON_COLOR_ARG_C_ZERO
|
515 RADEON_BLEND_CTL_ADD
|
517 RADEON_COLOR_ARG( 0, A
);
518 RADEON_COLOR_ARG( 1, B
);
521 color_combine
= (RADEON_COLOR_ARG_B_ZERO
|
523 RADEON_BLEND_CTL_ADD
|
525 RADEON_COLOR_ARG( 0, A
);
526 RADEON_COLOR_ARG( 1, C
);
529 color_combine
= (RADEON_COLOR_ARG_B_ZERO
|
531 RADEON_BLEND_CTL_ADDSIGNED
|
533 RADEON_COLOR_ARG( 0, A
);
534 RADEON_COLOR_ARG( 1, C
);
537 color_combine
= (RADEON_COLOR_ARG_B_ZERO
|
539 RADEON_BLEND_CTL_SUBTRACT
|
541 RADEON_COLOR_ARG( 0, A
);
542 RADEON_COLOR_ARG( 1, C
);
545 color_combine
= (RADEON_BLEND_CTL_BLEND
|
547 RADEON_COLOR_ARG( 0, B
);
548 RADEON_COLOR_ARG( 1, A
);
549 RADEON_COLOR_ARG( 2, C
);
552 case GL_DOT3_RGB_EXT
:
553 case GL_DOT3_RGBA_EXT
:
554 /* The EXT version of the DOT3 extension does not support the
555 * scale factor, but the ARB version (and the version in OpenGL
564 /* The R100 / RV200 only support a 1X multiplier in hardware
567 if ( RGBshift
!= (RADEON_SCALE_1X
>> RADEON_SCALE_SHIFT
) ) {
574 color_combine
= (RADEON_COLOR_ARG_C_ZERO
|
575 RADEON_BLEND_CTL_DOT3
|
577 RADEON_COLOR_ARG( 0, A
);
578 RADEON_COLOR_ARG( 1, B
);
581 case GL_MODULATE_ADD_ATI
:
582 color_combine
= (RADEON_BLEND_CTL_ADD
|
584 RADEON_COLOR_ARG( 0, A
);
585 RADEON_COLOR_ARG( 1, C
);
586 RADEON_COLOR_ARG( 2, B
);
588 case GL_MODULATE_SIGNED_ADD_ATI
:
589 color_combine
= (RADEON_BLEND_CTL_ADDSIGNED
|
591 RADEON_COLOR_ARG( 0, A
);
592 RADEON_COLOR_ARG( 1, C
);
593 RADEON_COLOR_ARG( 2, B
);
595 case GL_MODULATE_SUBTRACT_ATI
:
596 color_combine
= (RADEON_BLEND_CTL_SUBTRACT
|
598 RADEON_COLOR_ARG( 0, A
);
599 RADEON_COLOR_ARG( 1, C
);
600 RADEON_COLOR_ARG( 2, B
);
606 switch ( texUnit
->_CurrentCombine
->ModeA
) {
608 alpha_combine
= (RADEON_ALPHA_ARG_A_ZERO
|
609 RADEON_ALPHA_ARG_B_ZERO
|
610 RADEON_BLEND_CTL_ADD
|
612 RADEON_ALPHA_ARG( 0, C
);
615 alpha_combine
= (RADEON_ALPHA_ARG_C_ZERO
|
616 RADEON_BLEND_CTL_ADD
|
618 RADEON_ALPHA_ARG( 0, A
);
619 RADEON_ALPHA_ARG( 1, B
);
622 alpha_combine
= (RADEON_ALPHA_ARG_B_ZERO
|
624 RADEON_BLEND_CTL_ADD
|
626 RADEON_ALPHA_ARG( 0, A
);
627 RADEON_ALPHA_ARG( 1, C
);
630 alpha_combine
= (RADEON_ALPHA_ARG_B_ZERO
|
632 RADEON_BLEND_CTL_ADDSIGNED
|
634 RADEON_ALPHA_ARG( 0, A
);
635 RADEON_ALPHA_ARG( 1, C
);
638 alpha_combine
= (RADEON_COLOR_ARG_B_ZERO
|
640 RADEON_BLEND_CTL_SUBTRACT
|
642 RADEON_ALPHA_ARG( 0, A
);
643 RADEON_ALPHA_ARG( 1, C
);
646 alpha_combine
= (RADEON_BLEND_CTL_BLEND
|
648 RADEON_ALPHA_ARG( 0, B
);
649 RADEON_ALPHA_ARG( 1, A
);
650 RADEON_ALPHA_ARG( 2, C
);
653 case GL_MODULATE_ADD_ATI
:
654 alpha_combine
= (RADEON_BLEND_CTL_ADD
|
656 RADEON_ALPHA_ARG( 0, A
);
657 RADEON_ALPHA_ARG( 1, C
);
658 RADEON_ALPHA_ARG( 2, B
);
660 case GL_MODULATE_SIGNED_ADD_ATI
:
661 alpha_combine
= (RADEON_BLEND_CTL_ADDSIGNED
|
663 RADEON_ALPHA_ARG( 0, A
);
664 RADEON_ALPHA_ARG( 1, C
);
665 RADEON_ALPHA_ARG( 2, B
);
667 case GL_MODULATE_SUBTRACT_ATI
:
668 alpha_combine
= (RADEON_BLEND_CTL_SUBTRACT
|
670 RADEON_ALPHA_ARG( 0, A
);
671 RADEON_ALPHA_ARG( 1, C
);
672 RADEON_ALPHA_ARG( 2, B
);
678 if ( (texUnit
->_CurrentCombine
->ModeRGB
== GL_DOT3_RGB_EXT
)
679 || (texUnit
->_CurrentCombine
->ModeRGB
== GL_DOT3_RGB
) ) {
680 alpha_combine
|= RADEON_DOT_ALPHA_DONT_REPLICATE
;
684 * Apply the scale factor.
686 color_combine
|= (RGBshift
<< RADEON_SCALE_SHIFT
);
687 alpha_combine
|= (Ashift
<< RADEON_SCALE_SHIFT
);
693 if ( rmesa
->hw
.tex
[unit
].cmd
[TEX_PP_TXCBLEND
] != color_combine
||
694 rmesa
->hw
.tex
[unit
].cmd
[TEX_PP_TXABLEND
] != alpha_combine
) {
695 RADEON_STATECHANGE( rmesa
, tex
[unit
] );
696 rmesa
->hw
.tex
[unit
].cmd
[TEX_PP_TXCBLEND
] = color_combine
;
697 rmesa
->hw
.tex
[unit
].cmd
[TEX_PP_TXABLEND
] = alpha_combine
;
703 #define TEXOBJ_TXFILTER_MASK (RADEON_MAX_MIP_LEVEL_MASK | \
704 RADEON_MIN_FILTER_MASK | \
705 RADEON_MAG_FILTER_MASK | \
706 RADEON_MAX_ANISO_MASK | \
707 RADEON_YUV_TO_RGB | \
708 RADEON_YUV_TEMPERATURE_MASK | \
709 RADEON_CLAMP_S_MASK | \
710 RADEON_CLAMP_T_MASK | \
711 RADEON_BORDER_MODE_D3D )
713 #define TEXOBJ_TXFORMAT_MASK (RADEON_TXFORMAT_WIDTH_MASK | \
714 RADEON_TXFORMAT_HEIGHT_MASK | \
715 RADEON_TXFORMAT_FORMAT_MASK | \
716 RADEON_TXFORMAT_F5_WIDTH_MASK | \
717 RADEON_TXFORMAT_F5_HEIGHT_MASK | \
718 RADEON_TXFORMAT_ALPHA_IN_MAP | \
719 RADEON_TXFORMAT_CUBIC_MAP_ENABLE | \
720 RADEON_TXFORMAT_NON_POWER2)
723 static void import_tex_obj_state( radeonContextPtr rmesa
,
725 radeonTexObjPtr texobj
)
727 GLuint
*cmd
= RADEON_DB_STATE( tex
[unit
] );
729 cmd
[TEX_PP_TXFILTER
] &= ~TEXOBJ_TXFILTER_MASK
;
730 cmd
[TEX_PP_TXFILTER
] |= texobj
->pp_txfilter
& TEXOBJ_TXFILTER_MASK
;
731 cmd
[TEX_PP_TXFORMAT
] &= ~TEXOBJ_TXFORMAT_MASK
;
732 cmd
[TEX_PP_TXFORMAT
] |= texobj
->pp_txformat
& TEXOBJ_TXFORMAT_MASK
;
733 cmd
[TEX_PP_TXOFFSET
] = texobj
->pp_txoffset
;
734 cmd
[TEX_PP_BORDER_COLOR
] = texobj
->pp_border_color
;
735 RADEON_DB_STATECHANGE( rmesa
, &rmesa
->hw
.tex
[unit
] );
737 if (texobj
->base
.tObj
->Target
== GL_TEXTURE_RECTANGLE_NV
) {
738 GLuint
*txr_cmd
= RADEON_DB_STATE( txr
[unit
] );
739 txr_cmd
[TXR_PP_TEX_SIZE
] = texobj
->pp_txsize
; /* NPOT only! */
740 txr_cmd
[TXR_PP_TEX_PITCH
] = texobj
->pp_txpitch
; /* NPOT only! */
741 RADEON_DB_STATECHANGE( rmesa
, &rmesa
->hw
.txr
[unit
] );
744 texobj
->dirty_state
&= ~(1<<unit
);
750 static void set_texgen_matrix( radeonContextPtr rmesa
,
752 const GLfloat
*s_plane
,
753 const GLfloat
*t_plane
)
755 static const GLfloat scale_identity
[4] = { 1,1,1,1 };
757 if (!TEST_EQ_4V( s_plane
, scale_identity
) ||
758 !TEST_EQ_4V( t_plane
, scale_identity
)) {
759 rmesa
->TexGenEnabled
|= RADEON_TEXMAT_0_ENABLE
<<unit
;
760 rmesa
->TexGenMatrix
[unit
].m
[0] = s_plane
[0];
761 rmesa
->TexGenMatrix
[unit
].m
[4] = s_plane
[1];
762 rmesa
->TexGenMatrix
[unit
].m
[8] = s_plane
[2];
763 rmesa
->TexGenMatrix
[unit
].m
[12] = s_plane
[3];
765 rmesa
->TexGenMatrix
[unit
].m
[1] = t_plane
[0];
766 rmesa
->TexGenMatrix
[unit
].m
[5] = t_plane
[1];
767 rmesa
->TexGenMatrix
[unit
].m
[9] = t_plane
[2];
768 rmesa
->TexGenMatrix
[unit
].m
[13] = t_plane
[3];
769 rmesa
->NewGLState
|= _NEW_TEXTURE_MATRIX
;
773 /* Ignoring the Q texcoord for now.
775 * Returns GL_FALSE if fallback required.
777 static GLboolean
radeon_validate_texgen( GLcontext
*ctx
, GLuint unit
)
779 radeonContextPtr rmesa
= RADEON_CONTEXT(ctx
);
780 struct gl_texture_unit
*texUnit
= &ctx
->Texture
.Unit
[unit
];
781 GLuint inputshift
= RADEON_TEXGEN_0_INPUT_SHIFT
+ unit
*4;
782 GLuint tmp
= rmesa
->TexGenEnabled
;
784 rmesa
->TexGenEnabled
&= ~(RADEON_TEXGEN_TEXMAT_0_ENABLE
<<unit
);
785 rmesa
->TexGenEnabled
&= ~(RADEON_TEXMAT_0_ENABLE
<<unit
);
786 rmesa
->TexGenEnabled
&= ~(RADEON_TEXGEN_INPUT_MASK
<<inputshift
);
787 rmesa
->TexGenNeedNormals
[unit
] = 0;
789 if ((texUnit
->TexGenEnabled
& (S_BIT
|T_BIT
)) == 0) {
790 /* Disabled, no fallback:
792 rmesa
->TexGenEnabled
|=
793 (RADEON_TEXGEN_INPUT_TEXCOORD_0
+unit
) << inputshift
;
796 else if (texUnit
->TexGenEnabled
& Q_BIT
) {
797 /* Very easy to do this, in fact would remove a fallback case
798 * elsewhere, but I haven't done it yet... Fallback:
800 fprintf(stderr
, "fallback Q_BIT\n");
803 else if ((texUnit
->TexGenEnabled
& (S_BIT
|T_BIT
)) != (S_BIT
|T_BIT
) ||
804 texUnit
->GenModeS
!= texUnit
->GenModeT
) {
805 /* Mixed modes, fallback:
807 /* fprintf(stderr, "fallback mixed texgen\n"); */
811 rmesa
->TexGenEnabled
|= RADEON_TEXGEN_TEXMAT_0_ENABLE
<< unit
;
813 switch (texUnit
->GenModeS
) {
814 case GL_OBJECT_LINEAR
:
815 rmesa
->TexGenEnabled
|= RADEON_TEXGEN_INPUT_OBJ
<< inputshift
;
816 set_texgen_matrix( rmesa
, unit
,
817 texUnit
->ObjectPlaneS
,
818 texUnit
->ObjectPlaneT
);
822 rmesa
->TexGenEnabled
|= RADEON_TEXGEN_INPUT_EYE
<< inputshift
;
823 set_texgen_matrix( rmesa
, unit
,
828 case GL_REFLECTION_MAP_NV
:
829 rmesa
->TexGenNeedNormals
[unit
] = GL_TRUE
;
830 rmesa
->TexGenEnabled
|= RADEON_TEXGEN_INPUT_EYE_REFLECT
<<inputshift
;
833 case GL_NORMAL_MAP_NV
:
834 rmesa
->TexGenNeedNormals
[unit
] = GL_TRUE
;
835 rmesa
->TexGenEnabled
|= RADEON_TEXGEN_INPUT_EYE_NORMAL
<<inputshift
;
840 /* Unsupported mode, fallback:
842 /* fprintf(stderr, "fallback unsupported texgen\n"); */
846 if (tmp
!= rmesa
->TexGenEnabled
) {
847 rmesa
->NewGLState
|= _NEW_TEXTURE_MATRIX
;
854 static void disable_tex( GLcontext
*ctx
, int unit
)
856 radeonContextPtr rmesa
= RADEON_CONTEXT(ctx
);
858 if (rmesa
->hw
.ctx
.cmd
[CTX_PP_CNTL
] & (RADEON_TEX_0_ENABLE
<<unit
)) {
859 /* Texture unit disabled */
860 if ( rmesa
->state
.texture
.unit
[unit
].texobj
!= NULL
) {
861 /* The old texture is no longer bound to this texture unit.
865 rmesa
->state
.texture
.unit
[unit
].texobj
->base
.bound
&= ~(1UL << unit
);
866 rmesa
->state
.texture
.unit
[unit
].texobj
= NULL
;
869 RADEON_STATECHANGE( rmesa
, ctx
);
870 rmesa
->hw
.ctx
.cmd
[CTX_PP_CNTL
] &=
871 ~((RADEON_TEX_0_ENABLE
| RADEON_TEX_BLEND_0_ENABLE
) << unit
);
873 RADEON_STATECHANGE( rmesa
, tcl
);
876 rmesa
->hw
.tcl
.cmd
[TCL_OUTPUT_VTXFMT
] &= ~(RADEON_TCL_VTX_ST0
|
880 rmesa
->hw
.tcl
.cmd
[TCL_OUTPUT_VTXFMT
] &= ~(RADEON_TCL_VTX_ST1
|
888 if (rmesa
->TclFallback
& (RADEON_TCL_FALLBACK_TEXGEN_0
<<unit
)) {
889 TCL_FALLBACK( ctx
, (RADEON_TCL_FALLBACK_TEXGEN_0
<<unit
), GL_FALSE
);
890 rmesa
->recheck_texgen
[unit
] = GL_TRUE
;
896 GLuint inputshift
= RADEON_TEXGEN_0_INPUT_SHIFT
+ unit
*4;
897 GLuint tmp
= rmesa
->TexGenEnabled
;
899 rmesa
->TexGenEnabled
&= ~(RADEON_TEXGEN_TEXMAT_0_ENABLE
<<unit
);
900 rmesa
->TexGenEnabled
&= ~(RADEON_TEXMAT_0_ENABLE
<<unit
);
901 rmesa
->TexGenEnabled
&= ~(RADEON_TEXGEN_INPUT_MASK
<<inputshift
);
902 rmesa
->TexGenNeedNormals
[unit
] = 0;
903 rmesa
->TexGenEnabled
|=
904 (RADEON_TEXGEN_INPUT_TEXCOORD_0
+unit
) << inputshift
;
906 if (tmp
!= rmesa
->TexGenEnabled
) {
907 rmesa
->recheck_texgen
[unit
] = GL_TRUE
;
908 rmesa
->NewGLState
|= _NEW_TEXTURE_MATRIX
;
914 static GLboolean
enable_tex_2d( GLcontext
*ctx
, int unit
)
916 radeonContextPtr rmesa
= RADEON_CONTEXT(ctx
);
917 struct gl_texture_unit
*texUnit
= &ctx
->Texture
.Unit
[unit
];
918 struct gl_texture_object
*tObj
= texUnit
->_Current
;
919 radeonTexObjPtr t
= (radeonTexObjPtr
) tObj
->DriverData
;
921 /* Need to load the 2d images associated with this unit.
923 if (t
->pp_txformat
& RADEON_TXFORMAT_NON_POWER2
) {
924 t
->pp_txformat
&= ~RADEON_TXFORMAT_NON_POWER2
;
925 t
->base
.dirty_images
[0] = ~0;
928 ASSERT(tObj
->Target
== GL_TEXTURE_2D
|| tObj
->Target
== GL_TEXTURE_1D
);
930 if ( t
->base
.dirty_images
[0] ) {
931 RADEON_FIREVERTICES( rmesa
);
932 radeonSetTexImages( rmesa
, tObj
);
933 radeonUploadTexImages( rmesa
, (radeonTexObjPtr
) tObj
->DriverData
, 0 );
934 if ( !t
->base
.memBlock
)
941 static GLboolean
enable_tex_rect( GLcontext
*ctx
, int unit
)
943 radeonContextPtr rmesa
= RADEON_CONTEXT(ctx
);
944 struct gl_texture_unit
*texUnit
= &ctx
->Texture
.Unit
[unit
];
945 struct gl_texture_object
*tObj
= texUnit
->_Current
;
946 radeonTexObjPtr t
= (radeonTexObjPtr
) tObj
->DriverData
;
948 if (!(t
->pp_txformat
& RADEON_TXFORMAT_NON_POWER2
)) {
949 t
->pp_txformat
|= RADEON_TXFORMAT_NON_POWER2
;
950 t
->base
.dirty_images
[0] = ~0;
953 ASSERT(tObj
->Target
== GL_TEXTURE_RECTANGLE_NV
);
955 if ( t
->base
.dirty_images
[0] ) {
956 RADEON_FIREVERTICES( rmesa
);
957 radeonSetTexImages( rmesa
, tObj
);
958 radeonUploadTexImages( rmesa
, (radeonTexObjPtr
) tObj
->DriverData
, 0 );
959 if ( !t
->base
.memBlock
/* && !rmesa->prefer_gart_client_texturing FIXME */ ) {
960 fprintf(stderr
, "%s: upload failed\n", __FUNCTION__
);
969 static GLboolean
update_tex_common( GLcontext
*ctx
, int unit
)
971 radeonContextPtr rmesa
= RADEON_CONTEXT(ctx
);
972 struct gl_texture_unit
*texUnit
= &ctx
->Texture
.Unit
[unit
];
973 struct gl_texture_object
*tObj
= texUnit
->_Current
;
974 radeonTexObjPtr t
= (radeonTexObjPtr
) tObj
->DriverData
;
977 /* Fallback if there's a texture border */
978 if ( tObj
->Image
[0][tObj
->BaseLevel
]->Border
> 0 ) {
979 fprintf(stderr
, "%s: border\n", __FUNCTION__
);
983 /* Update state if this is a different texture object to last
986 if ( rmesa
->state
.texture
.unit
[unit
].texobj
!= t
) {
987 if ( rmesa
->state
.texture
.unit
[unit
].texobj
!= NULL
) {
988 /* The old texture is no longer bound to this texture unit.
992 rmesa
->state
.texture
.unit
[unit
].texobj
->base
.bound
&=
996 rmesa
->state
.texture
.unit
[unit
].texobj
= t
;
997 t
->base
.bound
|= (1UL << unit
);
998 t
->dirty_state
|= 1<<unit
;
999 driUpdateTextureLRU( (driTextureObject
*) t
); /* XXX: should be locked! */
1005 if ( !(rmesa
->hw
.ctx
.cmd
[CTX_PP_CNTL
] & (RADEON_TEX_0_ENABLE
<<unit
))) {
1006 RADEON_STATECHANGE( rmesa
, ctx
);
1007 rmesa
->hw
.ctx
.cmd
[CTX_PP_CNTL
] |=
1008 (RADEON_TEX_0_ENABLE
| RADEON_TEX_BLEND_0_ENABLE
) << unit
;
1010 RADEON_STATECHANGE( rmesa
, tcl
);
1013 rmesa
->hw
.tcl
.cmd
[TCL_OUTPUT_VTXFMT
] |= RADEON_TCL_VTX_ST0
;
1015 rmesa
->hw
.tcl
.cmd
[TCL_OUTPUT_VTXFMT
] |= RADEON_TCL_VTX_ST1
;
1017 rmesa
->recheck_texgen
[unit
] = GL_TRUE
;
1020 if (t
->dirty_state
& (1<<unit
)) {
1021 import_tex_obj_state( rmesa
, unit
, t
);
1024 if (rmesa
->recheck_texgen
[unit
]) {
1025 GLboolean fallback
= !radeon_validate_texgen( ctx
, unit
);
1026 TCL_FALLBACK( ctx
, (RADEON_TCL_FALLBACK_TEXGEN_0
<<unit
), fallback
);
1027 rmesa
->recheck_texgen
[unit
] = 0;
1028 rmesa
->NewGLState
|= _NEW_TEXTURE_MATRIX
;
1031 format
= tObj
->Image
[0][tObj
->BaseLevel
]->Format
;
1032 if ( rmesa
->state
.texture
.unit
[unit
].format
!= format
||
1033 rmesa
->state
.texture
.unit
[unit
].envMode
!= texUnit
->EnvMode
) {
1034 rmesa
->state
.texture
.unit
[unit
].format
= format
;
1035 rmesa
->state
.texture
.unit
[unit
].envMode
= texUnit
->EnvMode
;
1036 if ( ! radeonUpdateTextureEnv( ctx
, unit
) ) {
1041 FALLBACK( rmesa
, RADEON_FALLBACK_BORDER_MODE
, t
->border_fallback
);
1042 return !t
->border_fallback
;
1047 static GLboolean
radeonUpdateTextureUnit( GLcontext
*ctx
, int unit
)
1049 struct gl_texture_unit
*texUnit
= &ctx
->Texture
.Unit
[unit
];
1051 TCL_FALLBACK( ctx
, RADEON_TCL_FALLBACK_TEXRECT_0
<< unit
, 0 );
1053 if ( texUnit
->_ReallyEnabled
& (TEXTURE_RECT_BIT
) ) {
1054 TCL_FALLBACK( ctx
, RADEON_TCL_FALLBACK_TEXRECT_0
<< unit
, 1 );
1056 return (enable_tex_rect( ctx
, unit
) &&
1057 update_tex_common( ctx
, unit
));
1059 else if ( texUnit
->_ReallyEnabled
& (TEXTURE_1D_BIT
| TEXTURE_2D_BIT
) ) {
1060 return (enable_tex_2d( ctx
, unit
) &&
1061 update_tex_common( ctx
, unit
));
1063 else if ( texUnit
->_ReallyEnabled
) {
1067 disable_tex( ctx
, unit
);
1072 void radeonUpdateTextureState( GLcontext
*ctx
)
1074 radeonContextPtr rmesa
= RADEON_CONTEXT(ctx
);
1077 ok
= (radeonUpdateTextureUnit( ctx
, 0 ) &&
1078 radeonUpdateTextureUnit( ctx
, 1 ));
1080 FALLBACK( rmesa
, RADEON_FALLBACK_TEXTURE
, !ok
);
1082 if (rmesa
->TclFallback
)
1083 radeonChooseVertexState( ctx
);