2 * (C) Copyright IBM Corporation 2004
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * IBM AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE.
26 * \file via_texcombine.c
27 * Calculate texture combine hardware state.
29 * \author Ian Romanick <idr@us.ibm.com>
42 #include "via_context.h"
43 #include "via_state.h"
46 #include "via_ioctl.h"
48 #include "swrast/swrast.h"
49 #include "array_cache/acache.h"
51 #include "swrast_setup/swrast_setup.h"
53 #include "tnl/t_pipeline.h"
55 #define VIA_USE_ALPHA (HC_XTC_Adif - HC_XTC_Dif)
57 #define INPUT_A_SHIFT 14
58 #define INPUT_B_SHIFT 7
59 #define INPUT_C_SHIFT 0
60 #define INPUT_CBias_SHIFT 14
62 #define CONST_ONE (HC_XTC_0 | HC_XTC_InvTOPC)
64 static const unsigned color_operand_modifier
[4] = {
68 VIA_USE_ALPHA
| HC_XTC_InvTOPC
,
71 static const unsigned alpha_operand_modifier
[2] = {
75 static const unsigned bias_alpha_operand_modifier
[2] = {
76 0, HC_HTXnTBLAbias_Inv
80 static const unsigned c_shift_table
[3] = {
81 HC_HTXnTBLCshift_No
, HC_HTXnTBLCshift_1
, HC_HTXnTBLCshift_2
84 static const unsigned a_shift_table
[3] = {
85 HC_HTXnTBLAshift_No
, HC_HTXnTBLAshift_1
, HC_HTXnTBLAshift_2
90 * Calculate the hardware state for the specified texture combine mode
93 * For the alpha combine, \c GL_CONSTANT is still probably wrong.
96 * All forms of DOT3 bumpmapping are completely untested, and are most
100 * This code still fails progs/demos/texenv for all modes with \c GL_ALPHA
101 * textures. This was also the case with the code that Via supplied. It
102 * also fails for \c GL_REPLACE with \c GL_RGBA textures. Everything else
103 * that texenv tests looks good.
106 * KW: needs attention to the case where texunit 1 is enabled but
110 viaTexCombineState( viaContextPtr vmesa
,
111 const struct gl_tex_env_combine_state
* combine
,
114 unsigned color_arg
[3];
115 unsigned alpha_arg
[3];
116 unsigned bias_alpha_arg
[3];
117 unsigned color
= HC_HTXnTBLCsat_MASK
;
118 unsigned alpha
= HC_HTXnTBLAsat_MASK
;
121 unsigned a_shift
= combine
->ScaleShiftA
;
122 unsigned c_shift
= combine
->ScaleShiftRGB
;
124 unsigned constant_color
[3];
125 unsigned ordered_constant_color
[4];
126 unsigned constant_alpha
[3];
127 unsigned bias_alpha
= 0;
128 unsigned abc_alpha
= 0;
129 const struct gl_texture_unit
const * texUnit
= & vmesa
->glCtx
->Texture
.Unit
[unit
];
130 unsigned env_color
[4];
132 /* It seems that the color clamping can be overwhelmed at the 4x
133 * scale settings, necessitating this fallback:
135 if (c_shift
== 2 || a_shift
== 2) {
139 CLAMPED_FLOAT_TO_UBYTE(env_color
[0], texUnit
->EnvColor
[0]);
140 CLAMPED_FLOAT_TO_UBYTE(env_color
[1], texUnit
->EnvColor
[1]);
141 CLAMPED_FLOAT_TO_UBYTE(env_color
[2], texUnit
->EnvColor
[2]);
142 CLAMPED_FLOAT_TO_UBYTE(env_color
[3], texUnit
->EnvColor
[3]);
144 (void) memset( constant_color
, 0, sizeof( constant_color
) );
145 (void) memset( ordered_constant_color
, 0, sizeof( ordered_constant_color
) );
146 (void) memset( constant_alpha
, 0, sizeof( constant_alpha
) );
148 for ( i
= 0 ; i
< combine
->_NumArgsRGB
; i
++ ) {
149 const GLint op
= combine
->OperandRGB
[i
] - GL_SRC_COLOR
;
151 switch ( combine
->SourceRGB
[i
] ) {
153 color_arg
[i
] = HC_XTC_Tex
;
154 color_arg
[i
] += color_operand_modifier
[op
];
157 color_arg
[i
] = HC_XTC_HTXnTBLRC
;
160 case 0: /* GL_SRC_COLOR */
161 constant_color
[i
] = ((env_color
[0] << 16) |
162 (env_color
[1] << 8) |
165 case 1: /* GL_ONE_MINUS_SRC_COLOR */
166 constant_color
[i
] = ~((env_color
[0] << 16) |
167 (env_color
[1] << 8) |
168 env_color
[2]) & 0x00ffffff;
170 case 2: /* GL_SRC_ALPHA */
171 constant_color
[i
] = ((env_color
[3] << 16) |
172 (env_color
[3] << 8) |
175 case 3: /* GL_ONE_MINUS_SRC_ALPHA */
176 constant_color
[i
] = ~((env_color
[3] << 16) |
177 (env_color
[3] << 8) |
178 env_color
[3]) & 0x00ffffff;
182 case GL_PRIMARY_COLOR
:
183 color_arg
[i
] = HC_XTC_Dif
;
184 color_arg
[i
] += color_operand_modifier
[op
];
187 color_arg
[i
] = (unit
== 0) ? HC_XTC_Dif
: HC_XTC_Cur
;
188 color_arg
[i
] += color_operand_modifier
[op
];
194 /* On the Unichrome, all combine operations take on some form of:
196 * (xA * (xB op xC) + xBias) << xShift
198 * 'op' can be selected as add, subtract, min, max, or mask. The min, max
199 * and mask modes are currently unused. With the exception of DOT3, all
200 * standard GL_COMBINE modes can be implemented simply by selecting the
201 * correct inputs for A, B, C, and Bias and the correct operation for op.
203 * NOTE: xBias (when read from the constant registers) is signed,
204 * and scaled to fit -255..255 in 8 bits, ie 0x1 == 2.
207 switch( combine
->ModeRGB
) {
208 /* Ca = 1.0, Cb = arg0, Cc = 0, Cbias = 0
211 color
|= ((CONST_ONE
<< INPUT_A_SHIFT
) |
212 (color_arg
[0] << INPUT_B_SHIFT
));
214 ordered_constant_color
[1] = constant_color
[0];
217 /* Ca = arg[0], Cb = arg[1], Cc = 0, Cbias = 0
220 color
|= ((color_arg
[0] << INPUT_A_SHIFT
) |
221 (color_arg
[1] << INPUT_B_SHIFT
));
223 ordered_constant_color
[0] = constant_color
[0];
224 ordered_constant_color
[1] = constant_color
[1];
227 /* Ca = 1.0, Cb = arg[0], Cc = arg[1], Cbias = 0
231 if ( combine
->ModeRGB
== GL_SUBTRACT
) {
232 op
|= HC_HTXnTBLCop_Sub
;
235 color
|= ((CONST_ONE
<< INPUT_A_SHIFT
) |
236 (color_arg
[0] << INPUT_B_SHIFT
) |
237 (color_arg
[1] << INPUT_C_SHIFT
));
239 ordered_constant_color
[1] = constant_color
[0];
240 ordered_constant_color
[2] = constant_color
[1];
243 /* Ca = 1.0, Cb = arg[0], Cc = arg[1], Cbias = -0.5
246 color
|= ((CONST_ONE
<< INPUT_A_SHIFT
) |
247 (color_arg
[0] << INPUT_B_SHIFT
) |
248 (color_arg
[1] << INPUT_C_SHIFT
));
250 bias
|= HC_HTXnTBLCbias_HTXnTBLRC
;
252 ordered_constant_color
[1] = constant_color
[0];
253 ordered_constant_color
[2] = constant_color
[1];
254 ordered_constant_color
[3] = 0x00bfbfbf; /* -.5 */
257 /* Ca = arg[2], Cb = arg[0], Cc = arg[1], Cbias = arg[1]
260 op
|= HC_HTXnTBLCop_Sub
;
262 color
|= ((color_arg
[2] << INPUT_A_SHIFT
) |
263 (color_arg
[0] << INPUT_B_SHIFT
) |
264 (color_arg
[1] << INPUT_C_SHIFT
));
266 bias
|= (color_arg
[1] << INPUT_CBias_SHIFT
);
268 ordered_constant_color
[0] = constant_color
[2];
269 ordered_constant_color
[1] = constant_color
[0];
270 ordered_constant_color
[2] = constant_color
[1];
271 ordered_constant_color
[3] = (constant_color
[1] >> 1) & 0x7f7f7f;
275 /* At this point this code is completely untested. It appears that the
276 * Unichrome has the same limitation as the Radeon R100. The only
277 * supported post-scale when doing DOT3 bumpmapping is 1x.
279 case GL_DOT3_RGB_EXT
:
280 case GL_DOT3_RGBA_EXT
:
285 color
|= ((color_arg
[0] << INPUT_A_SHIFT
) |
286 (color_arg
[1] << INPUT_B_SHIFT
));
287 op
|= HC_HTXnTBLDOT4
;
299 /* The alpha blend stage has the annoying quirk of not having a
300 * hard-wired 0 input, like the color stage. As a result, we have
301 * to program the constant register with 0 and use that as our
304 * (xA * (xB op xC) + xBias) << xShift
308 for ( i
= 0 ; i
< combine
->_NumArgsA
; i
++ ) {
309 const GLint op
= combine
->OperandA
[i
] - GL_SRC_ALPHA
;
311 switch ( combine
->SourceA
[i
] ) {
313 alpha_arg
[i
] = HC_XTA_Atex
;
314 alpha_arg
[i
] += alpha_operand_modifier
[op
];
315 bias_alpha_arg
[i
] = HC_HTXnTBLAbias_Atex
;
316 bias_alpha_arg
[i
] += bias_alpha_operand_modifier
[op
];
319 alpha_arg
[i
] = HC_XTA_HTXnTBLRA
;
320 bias_alpha_arg
[i
] = HC_HTXnTBLAbias_HTXnTBLRAbias
;
321 constant_alpha
[i
] = (op
== 0) ? env_color
[3] : (~env_color
[3] & 0xff);
323 case GL_PRIMARY_COLOR
:
324 alpha_arg
[i
] = HC_XTA_Adif
;
325 alpha_arg
[i
] += alpha_operand_modifier
[op
];
326 bias_alpha_arg
[i
] = HC_HTXnTBLAbias_Adif
;
327 bias_alpha_arg
[i
] += bias_alpha_operand_modifier
[op
];
330 alpha_arg
[i
] = (unit
== 0) ? HC_XTA_Adif
: HC_XTA_Acur
;
331 alpha_arg
[i
] += alpha_operand_modifier
[op
];
332 bias_alpha_arg
[i
] = (unit
== 0) ? HC_HTXnTBLAbias_Adif
: HC_HTXnTBLAbias_Acur
;
333 bias_alpha_arg
[i
] += bias_alpha_operand_modifier
[op
];
338 switch( combine
->ModeA
) {
339 /* Aa = 0, Ab = 0, Ac = 0, Abias = arg0
342 alpha
|= ((HC_XTA_HTXnTBLRA
<< INPUT_A_SHIFT
) |
343 (HC_XTA_HTXnTBLRA
<< INPUT_B_SHIFT
) |
344 (HC_XTA_HTXnTBLRA
<< INPUT_C_SHIFT
));
347 bias
|= bias_alpha_arg
[0];
348 bias_alpha
= constant_alpha
[0] >> 1;
351 /* Aa = arg[0], Ab = arg[1], Ac = 0, Abias = 0
354 alpha
|= ((alpha_arg
[1] << INPUT_A_SHIFT
) |
355 (alpha_arg
[0] << INPUT_B_SHIFT
) |
356 (HC_XTA_HTXnTBLRA
<< INPUT_C_SHIFT
));
358 abc_alpha
= ((constant_alpha
[1] << HC_HTXnTBLRAa_SHIFT
) |
359 (constant_alpha
[0] << HC_HTXnTBLRAb_SHIFT
) |
360 (0 << HC_HTXnTBLRAc_SHIFT
));
362 bias
|= HC_HTXnTBLAbias_HTXnTBLRAbias
;
366 /* Aa = 1.0, Ab = arg[0], Ac = arg[1], Abias = 0
370 if ( combine
->ModeA
== GL_SUBTRACT
) {
371 op
|= HC_HTXnTBLAop_Sub
;
374 alpha
|= ((HC_XTA_HTXnTBLRA
<< INPUT_A_SHIFT
) |
375 (alpha_arg
[0] << INPUT_B_SHIFT
) |
376 (alpha_arg
[1] << INPUT_C_SHIFT
));
378 abc_alpha
= ((0xff << HC_HTXnTBLRAa_SHIFT
) |
379 (constant_alpha
[0] << HC_HTXnTBLRAb_SHIFT
) |
380 (constant_alpha
[1] << HC_HTXnTBLRAc_SHIFT
));
382 bias
|= HC_HTXnTBLAbias_HTXnTBLRAbias
;
386 /* Aa = 1.0, Ab = arg[0], Ac = arg[1], Abias = -0.5
389 alpha
|= ((HC_XTA_HTXnTBLRA
<< INPUT_A_SHIFT
) |
390 (alpha_arg
[0] << INPUT_B_SHIFT
) |
391 (alpha_arg
[1] << INPUT_C_SHIFT
));
392 abc_alpha
= ((0xff << HC_HTXnTBLRAa_SHIFT
) |
393 (constant_alpha
[0] << HC_HTXnTBLRAb_SHIFT
) |
394 (constant_alpha
[1] << HC_HTXnTBLRAc_SHIFT
));
396 bias
|= HC_HTXnTBLAbias_HTXnTBLRAbias
;
400 /* Aa = arg[2], Ab = arg[0], Ac = arg[1], Abias = arg[1]
403 op
|= HC_HTXnTBLAop_Sub
;
405 alpha
|= ((alpha_arg
[2] << INPUT_A_SHIFT
) |
406 (alpha_arg
[0] << INPUT_B_SHIFT
) |
407 (alpha_arg
[1] << INPUT_C_SHIFT
));
408 abc_alpha
= ((constant_alpha
[2] << HC_HTXnTBLRAa_SHIFT
) |
409 (constant_alpha
[0] << HC_HTXnTBLRAb_SHIFT
) |
410 (constant_alpha
[1] << HC_HTXnTBLRAc_SHIFT
));
412 bias
|= bias_alpha_arg
[1];
413 bias_alpha
= constant_alpha
[1] >> 1;
418 op
|= c_shift_table
[ c_shift
] | a_shift_table
[ a_shift
];
422 vmesa
->regHTXnTBLMPfog_0
= HC_HTXnTBLMPfog_Fog
;
424 vmesa
->regHTXnTBLCsat_0
= color
;
425 vmesa
->regHTXnTBLAsat_0
= alpha
;
426 vmesa
->regHTXnTBLCop_0
= op
| bias
;
427 vmesa
->regHTXnTBLRAa_0
= abc_alpha
;
428 vmesa
->regHTXnTBLRFog_0
= bias_alpha
;
430 vmesa
->regHTXnTBLRCa_0
= ordered_constant_color
[0];
431 vmesa
->regHTXnTBLRCb_0
= ordered_constant_color
[1];
432 vmesa
->regHTXnTBLRCc_0
= ordered_constant_color
[2];
433 vmesa
->regHTXnTBLRCbias_0
= ordered_constant_color
[3];
436 vmesa
->regHTXnTBLMPfog_1
= HC_HTXnTBLMPfog_Fog
;
438 vmesa
->regHTXnTBLCsat_1
= color
;
439 vmesa
->regHTXnTBLAsat_1
= alpha
;
440 vmesa
->regHTXnTBLCop_1
= op
| bias
;
441 vmesa
->regHTXnTBLRAa_1
= abc_alpha
;
442 vmesa
->regHTXnTBLRFog_1
= bias_alpha
;
444 vmesa
->regHTXnTBLRCa_1
= ordered_constant_color
[0];
445 vmesa
->regHTXnTBLRCb_1
= ordered_constant_color
[1];
446 vmesa
->regHTXnTBLRCc_1
= ordered_constant_color
[2];
447 vmesa
->regHTXnTBLRCbias_1
= ordered_constant_color
[3];