2 Copyright (C) The Weather Channel, Inc. 2002.
3 Copyright (C) 2004 Nicolai Haehnle.
6 The Weather Channel (TM) funded Tungsten Graphics to develop the
7 initial release of the Radeon 8500 driver under the XFree86 license.
8 This notice must be preserved.
10 Permission is hereby granted, free of charge, to any person obtaining
11 a copy of this software and associated documentation files (the
12 "Software"), to deal in the Software without restriction, including
13 without limitation the rights to use, copy, modify, merge, publish,
14 distribute, sublicense, and/or sell copies of the Software, and to
15 permit persons to whom the Software is furnished to do so, subject to
16 the following conditions:
18 The above copyright notice and this permission notice (including the
19 next paragraph) shall be included in all copies or substantial
20 portions of the Software.
22 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
23 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
24 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
25 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
26 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
27 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
28 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
30 **************************************************************************/
35 * \author Keith Whitwell <keith@tungstengraphics.com>
37 * \author Nicolai Haehnle <prefect_@gmx.net>
43 #include "main/glheader.h"
44 #include "main/imports.h"
45 #include "main/macros.h"
46 #include "main/context.h"
47 #include "main/simple_list.h"
48 #include "swrast/swrast.h"
50 #include "radeon_common.h"
51 #include "radeon_lock.h"
52 #include "r300_context.h"
53 #include "r300_ioctl.h"
54 #include "r300_cmdbuf.h"
55 #include "r300_state.h"
56 #include "r300_vertprog.h"
57 #include "radeon_reg.h"
58 #include "r300_emit.h"
59 #include "r300_context.h"
63 #define R200_3D_DRAW_IMMD_2 0xC0003500
65 #define CLEARBUFFER_COLOR 0x1
66 #define CLEARBUFFER_DEPTH 0x2
67 #define CLEARBUFFER_STENCIL 0x4
72 * Fragment program helper macros
75 /* Produce unshifted source selectors */
76 #define FP_TMP(idx) (idx)
77 #define FP_CONST(idx) ((idx) | (1 << 5))
79 /* Produce source/dest selector dword */
80 #define FP_SELC_MASK_NO 0
81 #define FP_SELC_MASK_X 1
82 #define FP_SELC_MASK_Y 2
83 #define FP_SELC_MASK_XY 3
84 #define FP_SELC_MASK_Z 4
85 #define FP_SELC_MASK_XZ 5
86 #define FP_SELC_MASK_YZ 6
87 #define FP_SELC_MASK_XYZ 7
89 #define FP_SELC(destidx,regmask,outmask,src0,src1,src2) \
90 (((destidx) << R300_ALU_DSTC_SHIFT) | \
91 (FP_SELC_MASK_##regmask << 23) | \
92 (FP_SELC_MASK_##outmask << 26) | \
93 ((src0) << R300_ALU_SRC0C_SHIFT) | \
94 ((src1) << R300_ALU_SRC1C_SHIFT) | \
95 ((src2) << R300_ALU_SRC2C_SHIFT))
97 #define FP_SELA_MASK_NO 0
98 #define FP_SELA_MASK_W 1
100 #define FP_SELA(destidx,regmask,outmask,src0,src1,src2) \
101 (((destidx) << R300_ALU_DSTA_SHIFT) | \
102 (FP_SELA_MASK_##regmask << 23) | \
103 (FP_SELA_MASK_##outmask << 24) | \
104 ((src0) << R300_ALU_SRC0A_SHIFT) | \
105 ((src1) << R300_ALU_SRC1A_SHIFT) | \
106 ((src2) << R300_ALU_SRC2A_SHIFT))
108 /* Produce unshifted argument selectors */
109 #define FP_ARGC(source) R300_ALU_ARGC_##source
110 #define FP_ARGA(source) R300_ALU_ARGA_##source
111 #define FP_ABS(arg) ((arg) | (1 << 6))
112 #define FP_NEG(arg) ((arg) ^ (1 << 5))
114 /* Produce instruction dword */
115 #define FP_INSTRC(opcode,arg0,arg1,arg2) \
116 (R300_ALU_OUTC_##opcode | \
117 ((arg0) << R300_ALU_ARG0C_SHIFT) | \
118 ((arg1) << R300_ALU_ARG1C_SHIFT) | \
119 ((arg2) << R300_ALU_ARG2C_SHIFT))
121 #define FP_INSTRA(opcode,arg0,arg1,arg2) \
122 (R300_ALU_OUTA_##opcode | \
123 ((arg0) << R300_ALU_ARG0A_SHIFT) | \
124 ((arg1) << R300_ALU_ARG1A_SHIFT) | \
125 ((arg2) << R300_ALU_ARG2A_SHIFT))
129 static void r300EmitClearState(GLcontext
* ctx
);
131 static void r300ClearBuffer(r300ContextPtr r300
, int flags
,
132 struct radeon_renderbuffer
*rrb
,
133 struct radeon_renderbuffer
*rrbd
)
135 BATCH_LOCALS(&r300
->radeon
);
136 GLcontext
*ctx
= r300
->radeon
.glCtx
;
137 __DRIdrawablePrivate
*dPriv
= radeon_get_drawable(&r300
->radeon
);
139 r300ContextPtr rmesa
= r300
;
141 if (RADEON_DEBUG
& DEBUG_IOCTL
)
142 fprintf(stderr
, "%s: buffer %p (%i,%i %ix%i)\n",
143 __FUNCTION__
, rrb
, dPriv
->x
, dPriv
->y
,
147 cbpitch
= (rrb
->pitch
/ rrb
->cpp
);
149 cbpitch
|= R300_COLOR_FORMAT_ARGB8888
;
151 cbpitch
|= R300_COLOR_FORMAT_RGB565
;
153 if (rrb
->bo
->flags
& RADEON_BO_FLAGS_MACRO_TILE
){
154 cbpitch
|= R300_COLOR_TILE_ENABLE
;
159 cp_wait(&r300
->radeon
, R300_WAIT_3D
| R300_WAIT_3D_CLEAN
);
160 end_3d(&rmesa
->radeon
);
162 if (flags
& CLEARBUFFER_COLOR
) {
164 BEGIN_BATCH_NO_AUTOSTATE(6);
165 OUT_BATCH_REGSEQ(R300_RB3D_COLOROFFSET0
, 1);
166 OUT_BATCH_RELOC(0, rrb
->bo
, 0, 0, RADEON_GEM_DOMAIN_VRAM
, 0);
167 OUT_BATCH_REGVAL(R300_RB3D_COLORPITCH0
, cbpitch
);
171 if (flags
& (CLEARBUFFER_DEPTH
| CLEARBUFFER_STENCIL
)) {
172 uint32_t zbpitch
= (rrbd
->pitch
/ rrbd
->cpp
);
173 if (rrbd
->bo
->flags
& RADEON_BO_FLAGS_MACRO_TILE
){
174 zbpitch
|= R300_DEPTHMACROTILE_ENABLE
;
176 if (rrbd
->bo
->flags
& RADEON_BO_FLAGS_MICRO_TILE
){
177 zbpitch
|= R300_DEPTHMICROTILE_TILED
;
179 BEGIN_BATCH_NO_AUTOSTATE(6);
180 OUT_BATCH_REGSEQ(R300_ZB_DEPTHOFFSET
, 1);
181 OUT_BATCH_RELOC(0, rrbd
->bo
, 0, 0, RADEON_GEM_DOMAIN_VRAM
, 0);
182 OUT_BATCH_REGSEQ(R300_ZB_DEPTHPITCH
, 1);
183 if (!r300
->radeon
.radeonScreen
->kernel_mm
)
186 OUT_BATCH_RELOC(zbpitch
, rrbd
->bo
, zbpitch
, 0, RADEON_GEM_DOMAIN_VRAM
, 0);
190 BEGIN_BATCH_NO_AUTOSTATE(6);
191 OUT_BATCH_REGSEQ(RB3D_COLOR_CHANNEL_MASK
, 1);
192 if (flags
& CLEARBUFFER_COLOR
) {
193 OUT_BATCH((ctx
->Color
.ColorMask
[BCOMP
] ? RB3D_COLOR_CHANNEL_MASK_BLUE_MASK0
: 0) |
194 (ctx
->Color
.ColorMask
[GCOMP
] ? RB3D_COLOR_CHANNEL_MASK_GREEN_MASK0
: 0) |
195 (ctx
->Color
.ColorMask
[RCOMP
] ? RB3D_COLOR_CHANNEL_MASK_RED_MASK0
: 0) |
196 (ctx
->Color
.ColorMask
[ACOMP
] ? RB3D_COLOR_CHANNEL_MASK_ALPHA_MASK0
: 0));
208 if (flags
& CLEARBUFFER_DEPTH
) {
209 t1
|= R300_Z_ENABLE
| R300_Z_WRITE_ENABLE
;
211 (R300_ZS_ALWAYS
<< R300_Z_FUNC_SHIFT
);
214 if (flags
& CLEARBUFFER_STENCIL
) {
215 t1
|= R300_STENCIL_ENABLE
;
218 R300_S_FRONT_FUNC_SHIFT
) |
220 R300_S_FRONT_SFAIL_OP_SHIFT
) |
222 R300_S_FRONT_ZPASS_OP_SHIFT
) |
224 R300_S_FRONT_ZFAIL_OP_SHIFT
);
227 OUT_BATCH_REGSEQ(R300_ZB_CNTL
, 3);
230 OUT_BATCH(((ctx
->Stencil
.WriteMask
[0] & R300_STENCILREF_MASK
) <<
231 R300_STENCILWRITEMASK_SHIFT
) |
232 (ctx
->Stencil
.Clear
& R300_STENCILREF_MASK
));
236 if (!rmesa
->radeon
.radeonScreen
->kernel_mm
) {
237 BEGIN_BATCH_NO_AUTOSTATE(9);
238 OUT_BATCH(cmdpacket3(r300
->radeon
.radeonScreen
, R300_CMD_PACKET3_CLEAR
));
239 OUT_BATCH_FLOAT32(dPriv
->w
/ 2.0);
240 OUT_BATCH_FLOAT32(dPriv
->h
/ 2.0);
241 OUT_BATCH_FLOAT32(ctx
->Depth
.Clear
);
242 OUT_BATCH_FLOAT32(1.0);
243 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[0]);
244 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[1]);
245 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[2]);
246 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[3]);
249 OUT_BATCH(CP_PACKET3(R200_3D_DRAW_IMMD_2
, 8));
250 OUT_BATCH(R300_PRIM_TYPE_POINT
| R300_PRIM_WALK_RING
|
251 (1 << R300_PRIM_NUM_VERTICES_SHIFT
));
252 OUT_BATCH_FLOAT32(dPriv
->w
/ 2.0);
253 OUT_BATCH_FLOAT32(dPriv
->h
/ 2.0);
254 OUT_BATCH_FLOAT32(ctx
->Depth
.Clear
);
255 OUT_BATCH_FLOAT32(1.0);
256 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[0]);
257 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[1]);
258 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[2]);
259 OUT_BATCH_FLOAT32(ctx
->Color
.ClearColor
[3]);
262 r300EmitCacheFlush(rmesa
);
263 cp_wait(&r300
->radeon
, R300_WAIT_3D
| R300_WAIT_3D_CLEAN
);
265 R300_STATECHANGE(r300
, cb
);
266 R300_STATECHANGE(r300
, cmk
);
267 R300_STATECHANGE(r300
, zs
);
270 static void r300EmitClearState(GLcontext
* ctx
)
272 r300ContextPtr r300
= R300_CONTEXT(ctx
);
273 BATCH_LOCALS(&r300
->radeon
);
274 __DRIdrawablePrivate
*dPriv
= radeon_get_drawable(&r300
->radeon
);
280 has_tcl
= r300
->options
.hw_tcl_enabled
;
282 if (r300
->radeon
.radeonScreen
->chip_family
>= CHIP_FAMILY_RV515
)
285 /* State atom dirty tracking is a little subtle here.
287 * On the one hand, we need to make sure base state is emitted
288 * here if we start with an empty batch buffer, otherwise clear
289 * works incorrectly with multiple processes. Therefore, the first
290 * BEGIN_BATCH cannot be a BEGIN_BATCH_NO_AUTOSTATE.
292 * On the other hand, implicit state emission clears the state atom
293 * dirty bits, so we have to call R300_STATECHANGE later than the
296 * The final trickiness is that, because we change state, we need
297 * to ensure that any stored swtcl primitives are flushed properly
298 * before we start changing state. See the R300_NEWPRIM in r300Clear
302 OUT_BATCH_REGSEQ(R300_VAP_PROG_STREAM_CNTL_0
, 1);
304 OUT_BATCH(((((0 << R300_DST_VEC_LOC_SHIFT
) | R300_DATA_TYPE_FLOAT_4
) << R300_DATA_TYPE_0_SHIFT
) |
305 ((R300_LAST_VEC
| (2 << R300_DST_VEC_LOC_SHIFT
) | R300_DATA_TYPE_FLOAT_4
) << R300_DATA_TYPE_1_SHIFT
)));
307 OUT_BATCH(((((0 << R300_DST_VEC_LOC_SHIFT
) | R300_DATA_TYPE_FLOAT_4
) << R300_DATA_TYPE_0_SHIFT
) |
308 ((R300_LAST_VEC
| (1 << R300_DST_VEC_LOC_SHIFT
) | R300_DATA_TYPE_FLOAT_4
) << R300_DATA_TYPE_1_SHIFT
)));
310 OUT_BATCH_REGVAL(R300_FG_FOG_BLEND
, 0);
311 OUT_BATCH_REGVAL(R300_VAP_PROG_STREAM_CNTL_EXT_0
,
312 ((((R300_SWIZZLE_SELECT_X
<< R300_SWIZZLE_SELECT_X_SHIFT
) |
313 (R300_SWIZZLE_SELECT_Y
<< R300_SWIZZLE_SELECT_Y_SHIFT
) |
314 (R300_SWIZZLE_SELECT_Z
<< R300_SWIZZLE_SELECT_Z_SHIFT
) |
315 (R300_SWIZZLE_SELECT_W
<< R300_SWIZZLE_SELECT_W_SHIFT
) |
316 ((R300_WRITE_ENA_X
| R300_WRITE_ENA_Y
| R300_WRITE_ENA_Z
| R300_WRITE_ENA_W
) << R300_WRITE_ENA_SHIFT
))
317 << R300_SWIZZLE0_SHIFT
) |
318 (((R300_SWIZZLE_SELECT_X
<< R300_SWIZZLE_SELECT_X_SHIFT
) |
319 (R300_SWIZZLE_SELECT_Y
<< R300_SWIZZLE_SELECT_Y_SHIFT
) |
320 (R300_SWIZZLE_SELECT_Z
<< R300_SWIZZLE_SELECT_Z_SHIFT
) |
321 (R300_SWIZZLE_SELECT_W
<< R300_SWIZZLE_SELECT_W_SHIFT
) |
322 ((R300_WRITE_ENA_X
| R300_WRITE_ENA_Y
| R300_WRITE_ENA_Z
| R300_WRITE_ENA_W
) << R300_WRITE_ENA_SHIFT
))
323 << R300_SWIZZLE1_SHIFT
)));
325 /* R300_VAP_INPUT_CNTL_0, R300_VAP_INPUT_CNTL_1 */
326 OUT_BATCH_REGSEQ(R300_VAP_VTX_STATE_CNTL
, 2);
327 OUT_BATCH((R300_SEL_USER_COLOR_0
<< R300_COLOR_0_ASSEMBLY_SHIFT
));
328 OUT_BATCH(R300_INPUT_CNTL_POS
| R300_INPUT_CNTL_COLOR
| R300_INPUT_CNTL_TC0
);
330 /* comes from fglrx startup of clear */
331 OUT_BATCH_REGSEQ(R300_SE_VTE_CNTL
, 2);
332 OUT_BATCH(R300_VTX_W0_FMT
| R300_VPORT_X_SCALE_ENA
|
333 R300_VPORT_X_OFFSET_ENA
| R300_VPORT_Y_SCALE_ENA
|
334 R300_VPORT_Y_OFFSET_ENA
| R300_VPORT_Z_SCALE_ENA
|
335 R300_VPORT_Z_OFFSET_ENA
);
338 OUT_BATCH_REGVAL(R300_VAP_PSC_SGN_NORM_CNTL
, 0xaaaaaaaa);
340 OUT_BATCH_REGSEQ(R300_VAP_OUTPUT_VTX_FMT_0
, 2);
341 OUT_BATCH(R300_VAP_OUTPUT_VTX_FMT_0__POS_PRESENT
|
342 R300_VAP_OUTPUT_VTX_FMT_0__COLOR_0_PRESENT
);
343 OUT_BATCH(0); /* no textures */
345 OUT_BATCH_REGVAL(R300_TX_ENABLE
, 0);
347 OUT_BATCH_REGSEQ(R300_SE_VPORT_XSCALE
, 6);
348 OUT_BATCH_FLOAT32(1.0);
349 OUT_BATCH_FLOAT32(dPriv
->x
);
350 OUT_BATCH_FLOAT32(1.0);
351 OUT_BATCH_FLOAT32(dPriv
->y
);
352 OUT_BATCH_FLOAT32(1.0);
353 OUT_BATCH_FLOAT32(0.0);
355 OUT_BATCH_REGVAL(R300_FG_ALPHA_FUNC
, 0);
357 OUT_BATCH_REGSEQ(R300_RB3D_CBLEND
, 2);
362 R300_STATECHANGE(r300
, vir
[0]);
363 R300_STATECHANGE(r300
, fogs
);
364 R300_STATECHANGE(r300
, vir
[1]);
365 R300_STATECHANGE(r300
, vic
);
366 R300_STATECHANGE(r300
, vte
);
367 R300_STATECHANGE(r300
, vof
);
368 R300_STATECHANGE(r300
, txe
);
369 R300_STATECHANGE(r300
, vpt
);
370 R300_STATECHANGE(r300
, at
);
371 R300_STATECHANGE(r300
, bld
);
372 R300_STATECHANGE(r300
, ps
);
375 R300_STATECHANGE(r300
, vap_clip_cntl
);
377 BEGIN_BATCH_NO_AUTOSTATE(2);
378 OUT_BATCH_REGVAL(R300_VAP_CLIP_CNTL
, R300_PS_UCP_MODE_CLIP_AS_TRIFAN
| R300_CLIP_DISABLE
);
382 BEGIN_BATCH_NO_AUTOSTATE(2);
383 OUT_BATCH_REGVAL(R300_GA_POINT_SIZE
,
384 ((dPriv
->w
* 6) << R300_POINTSIZE_X_SHIFT
) |
385 ((dPriv
->h
* 6) << R300_POINTSIZE_Y_SHIFT
));
389 R300_STATECHANGE(r300
, ri
);
390 R300_STATECHANGE(r300
, rc
);
391 R300_STATECHANGE(r300
, rr
);
394 OUT_BATCH_REGSEQ(R300_RS_IP_0
, 8);
395 for (i
= 0; i
< 8; ++i
)
396 OUT_BATCH(R300_RS_SEL_T(1) | R300_RS_SEL_R(2) | R300_RS_SEL_Q(3));
398 OUT_BATCH_REGSEQ(R300_RS_COUNT
, 2);
399 OUT_BATCH((1 << R300_IC_COUNT_SHIFT
) | R300_HIRES_EN
);
402 OUT_BATCH_REGVAL(R300_RS_INST_0
, R300_RS_INST_COL_CN_WRITE
);
405 R300_STATECHANGE(r300
, ri
);
406 R300_STATECHANGE(r300
, rc
);
407 R300_STATECHANGE(r300
, rr
);
410 OUT_BATCH_REGSEQ(R500_RS_IP_0
, 8);
411 for (i
= 0; i
< 8; ++i
) {
412 OUT_BATCH((R500_RS_IP_PTR_K0
<< R500_RS_IP_TEX_PTR_S_SHIFT
) |
413 (R500_RS_IP_PTR_K0
<< R500_RS_IP_TEX_PTR_T_SHIFT
) |
414 (R500_RS_IP_PTR_K0
<< R500_RS_IP_TEX_PTR_R_SHIFT
) |
415 (R500_RS_IP_PTR_K1
<< R500_RS_IP_TEX_PTR_Q_SHIFT
));
418 OUT_BATCH_REGSEQ(R300_RS_COUNT
, 2);
419 OUT_BATCH((1 << R300_IC_COUNT_SHIFT
) | R300_HIRES_EN
);
422 OUT_BATCH_REGVAL(R500_RS_INST_0
, R500_RS_INST_COL_CN_WRITE
);
427 R300_STATECHANGE(r300
, fp
);
428 R300_STATECHANGE(r300
, fpi
[0]);
429 R300_STATECHANGE(r300
, fpi
[1]);
430 R300_STATECHANGE(r300
, fpi
[2]);
431 R300_STATECHANGE(r300
, fpi
[3]);
434 OUT_BATCH_REGSEQ(R300_US_CONFIG
, 3);
438 OUT_BATCH_REGSEQ(R300_US_CODE_ADDR_0
, 4);
442 OUT_BATCH(R300_RGBA_OUT
);
444 OUT_BATCH_REGVAL(R300_US_ALU_RGB_INST_0
,
445 FP_INSTRC(MAD
, FP_ARGC(SRC0C_XYZ
), FP_ARGC(ONE
), FP_ARGC(ZERO
)));
446 OUT_BATCH_REGVAL(R300_US_ALU_RGB_ADDR_0
,
447 FP_SELC(0, NO
, XYZ
, FP_TMP(0), 0, 0));
448 OUT_BATCH_REGVAL(R300_US_ALU_ALPHA_INST_0
,
449 FP_INSTRA(MAD
, FP_ARGA(SRC0A
), FP_ARGA(ONE
), FP_ARGA(ZERO
)));
450 OUT_BATCH_REGVAL(R300_US_ALU_ALPHA_ADDR_0
,
451 FP_SELA(0, NO
, W
, FP_TMP(0), 0, 0));
454 struct radeon_state_atom r500fp
;
457 R300_STATECHANGE(r300
, fp
);
458 R300_STATECHANGE(r300
, r500fp
);
461 OUT_BATCH_REGSEQ(R500_US_CONFIG
, 2);
462 OUT_BATCH(R500_ZERO_TIMES_ANYTHING_EQUALS_ZERO
);
464 OUT_BATCH_REGSEQ(R500_US_CODE_ADDR
, 3);
465 OUT_BATCH(R500_US_CODE_START_ADDR(0) | R500_US_CODE_END_ADDR(1));
466 OUT_BATCH(R500_US_CODE_RANGE_ADDR(0) | R500_US_CODE_RANGE_SIZE(1));
467 OUT_BATCH(R500_US_CODE_OFFSET_ADDR(0));
470 r500fp
.check
= check_r500fp
;
472 r500fp
.cmd
[0] = cmdr500fp(r300
->radeon
.radeonScreen
, 0, 1, 0, 0);
473 r500fp
.cmd
[1] = R500_INST_TYPE_OUT
|
474 R500_INST_TEX_SEM_WAIT
|
476 R500_INST_RGB_OMASK_R
|
477 R500_INST_RGB_OMASK_G
|
478 R500_INST_RGB_OMASK_B
|
479 R500_INST_ALPHA_OMASK
|
480 R500_INST_RGB_CLAMP
|
481 R500_INST_ALPHA_CLAMP
;
482 r500fp
.cmd
[2] = R500_RGB_ADDR0(0) |
484 R500_RGB_ADDR1_CONST
|
486 R500_RGB_ADDR2_CONST
;
487 r500fp
.cmd
[3] = R500_ALPHA_ADDR0(0) |
488 R500_ALPHA_ADDR1(0) |
489 R500_ALPHA_ADDR1_CONST
|
490 R500_ALPHA_ADDR2(0) |
491 R500_ALPHA_ADDR2_CONST
;
492 r500fp
.cmd
[4] = R500_ALU_RGB_SEL_A_SRC0
|
493 R500_ALU_RGB_R_SWIZ_A_R
|
494 R500_ALU_RGB_G_SWIZ_A_G
|
495 R500_ALU_RGB_B_SWIZ_A_B
|
496 R500_ALU_RGB_SEL_B_SRC0
|
497 R500_ALU_RGB_R_SWIZ_B_R
|
498 R500_ALU_RGB_B_SWIZ_B_G
|
499 R500_ALU_RGB_G_SWIZ_B_B
;
500 r500fp
.cmd
[5] = R500_ALPHA_OP_CMP
|
501 R500_ALPHA_SWIZ_A_A
|
503 r500fp
.cmd
[6] = R500_ALU_RGBA_OP_CMP
|
504 R500_ALU_RGBA_R_SWIZ_0
|
505 R500_ALU_RGBA_G_SWIZ_0
|
506 R500_ALU_RGBA_B_SWIZ_0
|
507 R500_ALU_RGBA_A_SWIZ_0
;
510 emit_r500fp(ctx
, &r500fp
);
514 OUT_BATCH_REGVAL(R300_VAP_PVS_STATE_FLUSH_REG
, 0);
518 vap_cntl
= ((10 << R300_PVS_NUM_SLOTS_SHIFT
) |
519 (5 << R300_PVS_NUM_CNTLRS_SHIFT
) |
520 (12 << R300_VF_MAX_VTX_NUM_SHIFT
));
521 if (r300
->radeon
.radeonScreen
->chip_family
>= CHIP_FAMILY_RV515
)
522 vap_cntl
|= R500_TCL_STATE_OPTIMIZATION
;
524 vap_cntl
= ((10 << R300_PVS_NUM_SLOTS_SHIFT
) |
525 (5 << R300_PVS_NUM_CNTLRS_SHIFT
) |
526 (5 << R300_VF_MAX_VTX_NUM_SHIFT
));
529 if (r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_RV515
)
530 vap_cntl
|= (2 << R300_PVS_NUM_FPUS_SHIFT
);
531 else if ((r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_RV530
) ||
532 (r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_RV560
) ||
533 (r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_RV570
))
534 vap_cntl
|= (5 << R300_PVS_NUM_FPUS_SHIFT
);
535 else if ((r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_RV410
) ||
536 (r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_R420
))
537 vap_cntl
|= (6 << R300_PVS_NUM_FPUS_SHIFT
);
538 else if ((r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_R520
) ||
539 (r300
->radeon
.radeonScreen
->chip_family
== CHIP_FAMILY_R580
))
540 vap_cntl
|= (8 << R300_PVS_NUM_FPUS_SHIFT
);
542 vap_cntl
|= (4 << R300_PVS_NUM_FPUS_SHIFT
);
544 R300_STATECHANGE(r300
, vap_cntl
);
547 OUT_BATCH_REGVAL(R300_VAP_CNTL
, vap_cntl
);
551 struct radeon_state_atom vpu
;
553 R300_STATECHANGE(r300
, pvs
);
554 R300_STATECHANGE(r300
, vpi
);
557 OUT_BATCH_REGSEQ(R300_VAP_PVS_CODE_CNTL_0
, 3);
558 OUT_BATCH((0 << R300_PVS_FIRST_INST_SHIFT
) |
559 (0 << R300_PVS_XYZW_VALID_INST_SHIFT
) |
560 (1 << R300_PVS_LAST_INST_SHIFT
));
561 OUT_BATCH((0 << R300_PVS_CONST_BASE_OFFSET_SHIFT
) |
562 (0 << R300_PVS_MAX_CONST_ADDR_SHIFT
));
563 OUT_BATCH(1 << R300_PVS_LAST_VTX_SRC_INST_SHIFT
);
566 vpu
.check
= check_vpu
;
568 vpu
.cmd
[0] = cmdvpu(r300
->radeon
.radeonScreen
, 0, 2);
570 vpu
.cmd
[1] = PVS_OP_DST_OPERAND(VE_ADD
, GL_FALSE
, GL_FALSE
,
571 0, 0xf, PVS_DST_REG_OUT
);
572 vpu
.cmd
[2] = PVS_SRC_OPERAND(0, PVS_SRC_SELECT_X
, PVS_SRC_SELECT_Y
,
573 PVS_SRC_SELECT_Z
, PVS_SRC_SELECT_W
,
574 PVS_SRC_REG_INPUT
, NEGATE_NONE
);
575 vpu
.cmd
[3] = PVS_SRC_OPERAND(0, PVS_SRC_SELECT_FORCE_0
,
576 PVS_SRC_SELECT_FORCE_0
,
577 PVS_SRC_SELECT_FORCE_0
,
578 PVS_SRC_SELECT_FORCE_0
,
579 PVS_SRC_REG_INPUT
, NEGATE_NONE
);
582 vpu
.cmd
[5] = PVS_OP_DST_OPERAND(VE_ADD
, GL_FALSE
, GL_FALSE
, 1, 0xf,
584 vpu
.cmd
[6] = PVS_SRC_OPERAND(1, PVS_SRC_SELECT_X
,
585 PVS_SRC_SELECT_Y
, PVS_SRC_SELECT_Z
,
586 PVS_SRC_SELECT_W
, PVS_SRC_REG_INPUT
,
588 vpu
.cmd
[7] = PVS_SRC_OPERAND(1, PVS_SRC_SELECT_FORCE_0
,
589 PVS_SRC_SELECT_FORCE_0
,
590 PVS_SRC_SELECT_FORCE_0
,
591 PVS_SRC_SELECT_FORCE_0
,
592 PVS_SRC_REG_INPUT
, NEGATE_NONE
);
595 r300
->vap_flush_needed
= GL_TRUE
;
600 static int r300KernelClear(GLcontext
*ctx
, GLuint flags
)
602 r300ContextPtr r300
= R300_CONTEXT(ctx
);
603 __DRIdrawablePrivate
*dPriv
= radeon_get_drawable(&r300
->radeon
);
604 struct radeon_framebuffer
*rfb
= dPriv
->driverPrivate
;
605 struct radeon_renderbuffer
*rrb
;
606 struct radeon_renderbuffer
*rrbd
;
609 /* Make sure it fits there. */
610 radeon_cs_space_reset_bos(r300
->radeon
.cmdbuf
.cs
);
612 if (flags
& BUFFER_BIT_COLOR0
) {
613 rrb
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_COLOR0
);
614 radeon_cs_space_add_persistent_bo(r300
->radeon
.cmdbuf
.cs
,
615 rrb
->bo
, 0, RADEON_GEM_DOMAIN_VRAM
);
618 if (flags
& BUFFER_BIT_FRONT_LEFT
) {
619 rrb
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_FRONT_LEFT
);
620 radeon_cs_space_add_persistent_bo(r300
->radeon
.cmdbuf
.cs
,
621 rrb
->bo
, 0, RADEON_GEM_DOMAIN_VRAM
);
624 if (flags
& BUFFER_BIT_BACK_LEFT
) {
625 rrb
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_BACK_LEFT
);
626 radeon_cs_space_add_persistent_bo(r300
->radeon
.cmdbuf
.cs
,
627 rrb
->bo
, 0, RADEON_GEM_DOMAIN_VRAM
);
630 rrbd
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_DEPTH
);
632 radeon_cs_space_add_persistent_bo(r300
->radeon
.cmdbuf
.cs
,
633 rrbd
->bo
, 0, RADEON_GEM_DOMAIN_VRAM
);
636 ret
= radeon_cs_space_check(r300
->radeon
.cmdbuf
.cs
);
640 rcommonEnsureCmdBufSpace(&r300
->radeon
, 421 * 3, __FUNCTION__
);
642 r300EmitClearState(ctx
);
644 rrbd
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_DEPTH
);
645 if (rrbd
&& (flags
& BUFFER_BIT_DEPTH
))
646 bits
|= CLEARBUFFER_DEPTH
;
648 if (rrbd
&& (flags
& BUFFER_BIT_STENCIL
))
649 bits
|= CLEARBUFFER_STENCIL
;
651 if (flags
& BUFFER_BIT_COLOR0
) {
652 rrb
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_COLOR0
);
653 r300ClearBuffer(r300
, CLEARBUFFER_COLOR
, rrb
, NULL
);
657 if (flags
& BUFFER_BIT_FRONT_LEFT
) {
658 rrb
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_FRONT_LEFT
);
659 r300ClearBuffer(r300
, bits
| CLEARBUFFER_COLOR
, rrb
, rrbd
);
663 if (flags
& BUFFER_BIT_BACK_LEFT
) {
664 rrb
= radeon_get_renderbuffer(&rfb
->base
, BUFFER_BACK_LEFT
);
665 r300ClearBuffer(r300
, bits
| CLEARBUFFER_COLOR
, rrb
, rrbd
);
670 r300ClearBuffer(r300
, bits
, NULL
, rrbd
);
679 static void r300Clear(GLcontext
* ctx
, GLbitfield mask
)
681 r300ContextPtr r300
= R300_CONTEXT(ctx
);
682 __DRIdrawablePrivate
*dPriv
= radeon_get_drawable(&r300
->radeon
);
683 const GLuint colorMask
= *((GLuint
*) & ctx
->Color
.ColorMask
);
684 GLbitfield swrast_mask
= 0, tri_mask
= 0;
686 struct gl_framebuffer
*fb
= ctx
->DrawBuffer
;
688 if (RADEON_DEBUG
& DEBUG_IOCTL
)
689 fprintf(stderr
, "r300Clear\n");
691 if (!r300
->radeon
.radeonScreen
->driScreen
->dri2
.enabled
) {
692 LOCK_HARDWARE(&r300
->radeon
);
693 UNLOCK_HARDWARE(&r300
->radeon
);
694 if (dPriv
->numClipRects
== 0)
698 /* Flush swtcl vertices if necessary, because we will change hardware
699 * state during clear. See also the state-related comment in
700 * r300EmitClearState.
705 tri_mask
|= (mask
& BUFFER_BITS_COLOR
);
707 tri_mask
|= (mask
& (BUFFER_BIT_FRONT_LEFT
| BUFFER_BIT_BACK_LEFT
));
711 if (mask
& BUFFER_BIT_STENCIL
) {
712 tri_mask
|= BUFFER_BIT_STENCIL
;
716 if (mask
& BUFFER_BIT_DEPTH
) {
717 tri_mask
|= BUFFER_BIT_DEPTH
;
720 /* If we're doing a tri pass for depth/stencil, include a likely color
724 for (i
= 0; i
< BUFFER_COUNT
; i
++) {
725 GLuint bufBit
= 1 << i
;
726 if ((tri_mask
) & bufBit
) {
727 if (!fb
->Attachment
[i
].Renderbuffer
->ClassID
) {
729 swrast_mask
|= bufBit
;
734 /* SW fallback clearing */
735 swrast_mask
= mask
& ~tri_mask
;
739 if (r300
->radeon
.radeonScreen
->kernel_mm
)
740 radeonUserClear(ctx
, tri_mask
);
742 /* if kernel clear fails due to size restraints fallback */
743 ret
= r300KernelClear(ctx
, tri_mask
);
745 swrast_mask
|= tri_mask
;
750 if (RADEON_DEBUG
& DEBUG_FALLBACKS
)
751 fprintf(stderr
, "%s: swrast clear, mask: %x\n",
752 __FUNCTION__
, swrast_mask
);
753 _swrast_Clear(ctx
, swrast_mask
);
757 void r300InitIoctlFuncs(struct dd_function_table
*functions
)
759 functions
->Clear
= r300Clear
;
760 functions
->Finish
= radeonFinish
;
761 functions
->Flush
= radeonFlush
;