1 /**************************************************************************
3 Copyright (C) 2004 Nicolai Haehnle.
7 Permission is hereby granted, free of charge, to any person obtaining a
8 copy of this software and associated documentation files (the "Software"),
9 to deal in the Software without restriction, including without limitation
10 on the rights to use, copy, modify, merge, publish, distribute, sub
11 license, and/or sell copies of the Software, and to permit persons to whom
12 the Software is furnished to do so, subject to the following conditions:
14 The above copyright notice and this permission notice (including the next
15 paragraph) shall be included in all copies or substantial portions of the
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
21 ATI, VA LINUX SYSTEMS AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
22 DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
23 OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
24 USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
30 * Nicolai Haehnle <prefect_@gmx.net>
40 #include "simple_list.h"
42 #include "api_arrayelt.h"
43 #include "swrast/swrast.h"
44 #include "swrast_setup/swrast_setup.h"
47 #include "tnl/t_vp_build.h"
49 #include "radeon_reg.h"
50 #include "radeon_macros.h"
51 #include "radeon_ioctl.h"
52 #include "radeon_state.h"
53 #include "r300_context.h"
54 #include "r300_ioctl.h"
55 #include "r300_state.h"
57 #include "r300_program.h"
59 #include "r300_maos.h"
60 #include "r300_emit.h"
/* Declared here and defined in another translation unit.
 * r300_run_tcl_render() copies this value into hw_tcl_on on entry. */
62 extern int future_hw_tcl_on
;
64 /**********************************************************************
65 * Hardware rasterization
67 * When we fell back to software TCL, we still try to use the
68 * rasterization hardware for rendering.
69 **********************************************************************/
/*
 * Translate the GL primitive mode held in (prim & PRIM_MODE_MASK) into the
 * corresponding R300_VAP_VF_CNTL__PRIM_xxx hardware value, which is stored
 * in `type`.
 *
 * A mode that is not handled prints a "Do not know how to handle primitive"
 * diagnostic to stderr.
 *
 * rmesa and ctx are not referenced in the lines visible here.
 *
 * NOTE(review): most case labels, the declaration of `type` and the return
 * statements are not visible in this view.  The caller
 * r300_render_vb_primitive() skips the primitive when the result is < 0, so
 * the unhandled-mode path presumably returns a negative value -- confirm.
 */
71 static int r300_get_primitive_type(r300ContextPtr rmesa
, GLcontext
*ctx
, int prim
)
75 switch (prim
& PRIM_MODE_MASK
) {
77 type
=R300_VAP_VF_CNTL__PRIM_POINTS
;
80 type
=R300_VAP_VF_CNTL__PRIM_LINES
;
83 type
=R300_VAP_VF_CNTL__PRIM_LINE_STRIP
;
86 type
=R300_VAP_VF_CNTL__PRIM_LINE_LOOP
;
89 type
=R300_VAP_VF_CNTL__PRIM_TRIANGLES
;
91 case GL_TRIANGLE_STRIP
:
92 type
=R300_VAP_VF_CNTL__PRIM_TRIANGLE_STRIP
;
95 type
=R300_VAP_VF_CNTL__PRIM_TRIANGLE_FAN
;
98 type
=R300_VAP_VF_CNTL__PRIM_QUADS
;
101 type
=R300_VAP_VF_CNTL__PRIM_QUAD_STRIP
;
104 type
=R300_VAP_VF_CNTL__PRIM_POLYGON
;
107 fprintf(stderr
, "%s:%s Do not know how to handle primitive %02x - help me !\n",
108 __FILE__
, __FUNCTION__
,
109 prim
& PRIM_MODE_MASK
);
/*
 * Compute how many of the num_verts supplied vertices are usable for the
 * primitive mode in (prim & PRIM_MODE_MASK).
 *
 * The switch sets verts_off to the number of vertices to drop: either a
 * remainder (num_verts % 2, % 3 or % 4) or num_verts itself.  The normal
 * result is num_verts - verts_off.
 *
 * When RADEON_DEBUG has DEBUG_VERTS set, a one-time warning is issued if no
 * usable vertices remain; a second one-time warning reports an invalid
 * vertex count.
 *
 * rmesa is not referenced in the lines visible here.
 *
 * NOTE(review): most case labels, the conditions guarding the
 * "verts_off = num_verts" assignments, the values assigned to `name`, the
 * condition of the second warning and any early returns are not visible in
 * this view.  The caller treats a result <= 0 as "nothing to draw".
 */
116 int r300_get_num_verts(r300ContextPtr rmesa
, int num_verts
, int prim
)
119 char *name
="UNKNOWN";
121 switch (prim
& PRIM_MODE_MASK
) {
128 verts_off
= num_verts
% 2;
133 verts_off
= num_verts
;
138 verts_off
= num_verts
;
142 verts_off
= num_verts
% 3;
144 case GL_TRIANGLE_STRIP
:
147 verts_off
= num_verts
;
149 case GL_TRIANGLE_FAN
:
152 verts_off
= num_verts
;
156 verts_off
= num_verts
% 4;
161 verts_off
= num_verts
;
163 verts_off
= num_verts
% 2;
168 verts_off
= num_verts
;
171 fprintf(stderr
, "%s:%s Do not know how to handle primitive %02x - help me !\n",
172 __FILE__
, __FUNCTION__
,
173 prim
& PRIM_MODE_MASK
);
178 if (RADEON_DEBUG
& DEBUG_VERTS
) {
179 if (num_verts
- verts_off
== 0) {
180 WARN_ONCE("user error: Need more than %d vertices to draw primitive %s !\n", num_verts
, name
);
185 WARN_ONCE("user error: %d is not a valid number of vertices for primitive %s !\n", num_verts
, name
);
/* Usable vertex count: the total minus the vertices dropped above. */
189 return num_verts
- verts_off
;
192 /* Immediate implementation has been removed from CVS. */
194 /* vertex buffer implementation */
/*
 * Emit the command packets for an indexed draw of vertex_count elements
 * taken from the element buffer at addr.
 *
 *   rmesa         driver context; supplies the GL context pointer.
 *   addr          element buffer address; a one-time warning is issued when
 *                 it is not a multiple of elt_size.
 *   vertex_count  number of indices; placed in bits 16 and up of the
 *                 VAP_VF_CNTL word.
 *   type          hardware primitive type bits OR-ed into VAP_VF_CNTL.
 *   elt_size      must be 2 or 4 (asserted).
 *
 * Each emitted sequence is a RADEON_CP_PACKET3_3D_DRAW_INDX_2 packet carrying
 * the VAP_VF_CNTL word, followed by a RADEON_CP_PACKET3_INDX_BUFFER packet
 * carrying an R300_EB_UNK1/R300_EB_UNK2 word, the buffer address and a count.
 *
 * NOTE(review): the sequence appears twice below, once using
 * magic_1/magic_2/t_addr and once without.  The conditionals selecting
 * between the two copies, and between the INDEX_SIZE_32bit and plain
 * VAP_VF_CNTL words (presumably keyed on elt_size == 4), are not visible in
 * this view.  cmd_reserved and cmd are presumably consumed by the
 * start_packet3()/e32() macros -- confirm.
 */
196 static void inline fire_EB(r300ContextPtr rmesa
, unsigned long addr
, int vertex_count
, int type
, int elt_size
)
198 int cmd_reserved
= 0;
200 drm_radeon_cmd_header_t
*cmd
= NULL
;
201 unsigned long t_addr
;
202 unsigned long magic_1
, magic_2
;
204 ctx
= rmesa
->radeon
.glCtx
;
/* Only element sizes of 2 or 4 are accepted. */
206 assert(elt_size
== 2 || elt_size
== 4);
/* elt_size is a power of two here, so this tests addr % elt_size != 0. */
208 if(addr
& (elt_size
-1)){
209 WARN_ONCE("Badly aligned buffer\n");
213 magic_1
= (addr
% 32) / 4;
214 t_addr
= addr
& (~0x1d);
215 magic_2
= (vertex_count
+ 1 + (t_addr
& 0x2)) / 2 + magic_1
;
219 start_packet3(RADEON_CP_PACKET3_3D_DRAW_INDX_2
, 0);
221 e32(R300_VAP_VF_CNTL__PRIM_WALK_INDICES
| (vertex_count
<<16) | type
| R300_VAP_VF_CNTL__INDEX_SIZE_32bit
);
223 e32(R300_VAP_VF_CNTL__PRIM_WALK_INDICES
| (vertex_count
<<16) | type
);
226 start_packet3(RADEON_CP_PACKET3_INDX_BUFFER
, 2);
228 e32(R300_EB_UNK1
| (0 << 16) | R300_EB_UNK2
);
229 e32(addr
/*& 0xffffffe3*/);
231 e32(R300_EB_UNK1
| (magic_1
<< 16) | R300_EB_UNK2
);
236 e32(vertex_count
); /* Total number of dwords needed? */
238 e32(magic_2
); /* Total number of dwords needed? */
240 //cp_delay(rmesa, 1);
/* Evaluate the values as discarded expressions; presumably this silences
 * unused-variable warnings in the variant that does not need them. */
242 (void)magic_2
, (void)magic_1
, (void)t_addr
;
246 start_packet3(RADEON_CP_PACKET3_3D_DRAW_INDX_2
, 0);
248 e32(R300_VAP_VF_CNTL__PRIM_WALK_INDICES
| (vertex_count
<<16) | type
| R300_VAP_VF_CNTL__INDEX_SIZE_32bit
);
250 e32(R300_VAP_VF_CNTL__PRIM_WALK_INDICES
| (vertex_count
<<16) | type
);
253 start_packet3(RADEON_CP_PACKET3_INDX_BUFFER
, 2);
254 e32(R300_EB_UNK1
| (0 << 16) | R300_EB_UNK2
);
255 e32(addr
/*& 0xffffffe3*/);
258 e32(vertex_count
); /* Total number of dwords needed? */
260 e32((vertex_count
+1)/2); /* Total number of dwords needed? */
262 //cp_delay(rmesa, 1);
/*
 * Render one primitive from the current vertex buffer.
 *
 * The hardware primitive type comes from r300_get_primitive_type() and the
 * usable vertex count from r300_get_num_verts() applied to (end - start).
 * Nothing is drawn when the type is negative or the count is <= 0.
 *
 * If rmesa->state.VB.Elts is set, the draw is indexed: the vertex arrays are
 * emitted with r300EmitAOS(), the indices with r300EmitElts(), and the draw
 * is fired with fire_EB().  More than 65535 indices is reported once as
 * "Too many elts" (marked "not implemented yet").
 *
 * The remaining r300EmitAOS()/fire_AOS() pair is the non-indexed draw.
 *
 * NOTE(review): the rest of the parameter list (ctx, start, end and prim are
 * used below), the local declarations, the statement following the
 * "Too many elts" warning and the else/brace structure are not visible in
 * this view.
 */
266 static void r300_render_vb_primitive(r300ContextPtr rmesa
,
274 type
=r300_get_primitive_type(rmesa
, ctx
, prim
);
275 num_verts
=r300_get_num_verts(rmesa
, end
-start
, prim
);
277 if(type
<0 || num_verts
<= 0)return;
279 if(rmesa
->state
.VB
.Elts
){
280 r300EmitAOS(rmesa
, rmesa
->state
.aos_count
, /*0*/start
);
281 if(num_verts
> 65535){ /* not implemented yet */
282 WARN_ONCE("Too many elts\n");
285 r300EmitElts(ctx
, rmesa
->state
.VB
.Elts
, num_verts
, rmesa
->state
.VB
.elt_size
);
286 fire_EB(rmesa
, rmesa
->state
.elt_dma
.aos_offset
, num_verts
, type
, rmesa
->state
.VB
.elt_size
);
288 r300EmitAOS(rmesa
, rmesa
->state
.aos_count
, start
);
289 fire_AOS(rmesa
, num_verts
, type
);
/*
 * Render the current vertex buffer with the hardware.
 *
 * Visible sequence:
 *   1. Optional trace of the function name when RADEON_DEBUG has DEBUG_PRIMS.
 *   2. radeon_vb_to_rvb() fills rmesa->state.VB from the TNL context's vb.
 *   3. r300UpdateShaders(), then r300EmitArrays(); a non-zero result from
 *      r300EmitArrays() is handled by a statement not visible here.
 *   4. r300UpdateShaderStates().
 *   5. One value each is written to R300_RB3D_DSTCACHE_CTLSTAT and
 *      R300_RB3D_ZCACHE_CTLSTAT, followed by r300EmitState().
 *   6. Every entry of VB->Primitive (VB->PrimitiveCount of them) is drawn via
 *      r300_render_vb_primitive() over the range [start, start + count).
 *   7. The same two cache registers are written again and the arrays are
 *      released with r300ReleaseArrays().
 *
 * NOTE(review): the return statements, the declaration of `i`, and any
 * condition around the radeon_vb_to_rvb() call are not visible in this view;
 * `stage` is not referenced in the visible lines.  cmd_reserved and cmd are
 * presumably consumed by the reg_start()/e32() macros -- confirm.
 */
293 GLboolean
r300_run_vb_render(GLcontext
*ctx
,
294 struct tnl_pipeline_stage
*stage
)
296 r300ContextPtr rmesa
= R300_CONTEXT(ctx
);
297 struct radeon_vertex_buffer
*VB
= &rmesa
->state
.VB
;
299 int cmd_reserved
= 0;
301 drm_radeon_cmd_header_t
*cmd
= NULL
;
304 if (RADEON_DEBUG
& DEBUG_PRIMS
)
305 fprintf(stderr
, "%s\n", __FUNCTION__
);
308 TNLcontext
*tnl
= TNL_CONTEXT(ctx
);
309 radeon_vb_to_rvb(rmesa
, VB
, &tnl
->vb
);
312 r300UpdateShaders(rmesa
);
313 if (r300EmitArrays(ctx
))
316 r300UpdateShaderStates(rmesa
);
318 reg_start(R300_RB3D_DSTCACHE_CTLSTAT
,0);
319 e32(R300_RB3D_DSTCACHE_UNKNOWN_0A
);
321 reg_start(R300_RB3D_ZCACHE_CTLSTAT
,0);
322 e32(R300_RB3D_ZCACHE_UNKNOWN_03
);
324 r300EmitState(rmesa
);
/* Draw each primitive recorded in the vertex buffer. */
326 for(i
=0; i
< VB
->PrimitiveCount
; i
++){
327 GLuint prim
= _tnl_translate_prim(&VB
->Primitive
[i
]);
328 GLuint start
= VB
->Primitive
[i
].start
;
329 GLuint length
= VB
->Primitive
[i
].count
;
331 r300_render_vb_primitive(rmesa
, ctx
, start
, start
+ length
, prim
);
334 reg_start(R300_RB3D_DSTCACHE_CTLSTAT
,0);
335 e32(R300_RB3D_DSTCACHE_UNKNOWN_0A
/*R300_RB3D_DSTCACHE_UNKNOWN_02*/);
337 reg_start(R300_RB3D_ZCACHE_CTLSTAT
,0);
338 e32(R300_RB3D_ZCACHE_UNKNOWN_03
/*R300_RB3D_ZCACHE_UNKNOWN_01*/);
343 r300ReleaseArrays(ctx
);
/*
 * FALLBACK_IF(expr): on the path shown, emit a one-time
 * "Software fallback:" warning and make the enclosing function return
 * R300_FALLBACK_RAST.  Because it expands to a return statement it can only
 * be used inside a function returning an int-compatible value.
 *
 * The "1 ||" makes the debug test always true, so the warning does not
 * depend on DEBUG_FALLBACKS being set.
 *
 * NOTE(review): the lines that test `expr`, supply the warning argument and
 * close the macro are not visible in this view.
 */
347 #define FALLBACK_IF(expr) \
350 if (1 || RADEON_DEBUG & DEBUG_FALLBACKS) \
351 WARN_ONCE("Software fallback:%s\n", \
353 return R300_FALLBACK_RAST; \
/*
 * Decide whether the current GL state can be drawn by the hardware.
 *
 * Returns R300_FALLBACK_NONE when none of the checks below fires.  Each
 * check is written with FALLBACK_IF(), which returns R300_FALLBACK_RAST from
 * this function.
 *
 * Checks, in order of appearance:
 *   - the current fragment program, after r300_translate_fragment_shader()
 *     has been called on it, is not marked translated;
 *   - ctx->RenderMode is not GL_RENDER;
 *   - two-sided stencil is active and the front/back Ref, ValueMask or
 *     WriteMask differ;
 *   - polygon offset for points or lines, polygon stipple, multisampling,
 *     line stipple, line smoothing, point smoothing;
 *   - color logic op enabled;
 *   - point sprites enabled, tested only when the NV_point_sprite or
 *     ARB_point_sprite extension flag is set.
 *
 * NOTE(review): the block opened by "if(!r300->disable_lowimpact_fallback)"
 * has no visible closing brace, so which of the checks it covers cannot be
 * determined from this view.  Any guard around the fragment program
 * translation (for example a NULL check on rp) is likewise not visible.
 */
357 int r300Fallback(GLcontext
*ctx
)
359 r300ContextPtr r300
= R300_CONTEXT(ctx
);
360 struct r300_fragment_program
*rp
=
361 (struct r300_fragment_program
*)
362 (char *)ctx
->FragmentProgram
._Current
;
366 r300_translate_fragment_shader(r300
, rp
);
368 FALLBACK_IF(!rp
->translated
);
371 /* We do not do SELECT or FEEDBACK (yet ?)
372 * Is it worth doing them ?
374 FALLBACK_IF(ctx
->RenderMode
!= GL_RENDER
);
376 FALLBACK_IF(ctx
->Stencil
._TestTwoSide
&&
377 (ctx
->Stencil
.Ref
[0] != ctx
->Stencil
.Ref
[1] ||
378 ctx
->Stencil
.ValueMask
[0] != ctx
->Stencil
.ValueMask
[1] ||
379 ctx
->Stencil
.WriteMask
[0] != ctx
->Stencil
.WriteMask
[1]));
381 if(!r300
->disable_lowimpact_fallback
){
382 /* GL_POLYGON_OFFSET_POINT */
383 FALLBACK_IF(ctx
->Polygon
.OffsetPoint
);
384 /* GL_POLYGON_OFFSET_LINE */
385 FALLBACK_IF(ctx
->Polygon
.OffsetLine
);
386 /* GL_POLYGON_STIPPLE */
387 FALLBACK_IF(ctx
->Polygon
.StippleFlag
);
388 /* GL_MULTISAMPLE_ARB */
389 FALLBACK_IF(ctx
->Multisample
.Enabled
);
391 FALLBACK_IF(ctx
->Line
.StippleFlag
);
393 FALLBACK_IF(ctx
->Line
.SmoothFlag
);
394 /* GL_POINT_SMOOTH */
395 FALLBACK_IF(ctx
->Point
.SmoothFlag
);
398 /* Fallback for LOGICOP */
399 FALLBACK_IF(ctx
->Color
.ColorLogicOpEnabled
);
401 /* Rest could be done with vertex fragments */
402 if (ctx
->Extensions
.NV_point_sprite
||
403 ctx
->Extensions
.ARB_point_sprite
)
404 /* GL_POINT_SPRITE_NV */
405 FALLBACK_IF(ctx
->Point
.PointSprite
);
407 return R300_FALLBACK_NONE
;
411 * Called by the pipeline manager to render a batch of primitives.
412 * We can return true to pass on to the next stage (i.e. software
413 * rasterization) or false to indicate that the pipeline has finished
414 * after we render something.
/*
 * Run hook of _r300_render_stage.
 *
 * Optionally traces the function name (RADEON_DEBUG & DEBUG_PRIMS), then
 * consults r300Fallback(): a result of R300_FALLBACK_RAST or higher takes the
 * fallback path, otherwise the result of r300_run_vb_render() is returned.
 *
 * NOTE(review): the statement executed on the fallback path is not visible
 * in this view.
 */
416 static GLboolean
r300_run_render(GLcontext
*ctx
,
417 struct tnl_pipeline_stage
*stage
)
419 if (RADEON_DEBUG
& DEBUG_PRIMS
)
420 fprintf(stderr
, "%s\n", __FUNCTION__
);
422 if (r300Fallback(ctx
) >= R300_FALLBACK_RAST
)
425 return r300_run_vb_render(ctx
, stage
);
/* Pipeline stage descriptor whose run hook is r300_run_render().
 * NOTE(review): the other initializer fields are not visible in this view. */
428 const struct tnl_pipeline_stage _r300_render_stage
= {
434 r300_run_render
/* run */
/*
 * Run hook of _r300_tcl_stage.
 *
 * Visible sequence:
 *   1. hw_tcl_on is loaded from future_hw_tcl_on.
 *   2. Optional trace of the function name (RADEON_DEBUG & DEBUG_PRIMS).
 *   3. If hw_tcl_on is GL_FALSE, a statement not visible here is executed.
 *   4. If r300Fallback() reports R300_FALLBACK_TCL or higher, hw_tcl_on is
 *      cleared.
 *   5. r300UpdateShaders() is called and the current vertex shader fetched;
 *      if it is not native, hw_tcl_on is cleared.
 *   6. Otherwise the result of r300_run_vb_render() is returned.
 *
 * hw_tcl_on is not declared in the lines visible here.
 *
 * NOTE(review): the statements that follow each "hw_tcl_on = GL_FALSE" and
 * the one under the first hw_tcl_on test (presumably early returns) are not
 * visible in this view.
 */
437 static GLboolean
r300_run_tcl_render(GLcontext
*ctx
,
438 struct tnl_pipeline_stage
*stage
)
440 r300ContextPtr rmesa
= R300_CONTEXT(ctx
);
441 struct r300_vertex_program
*vp
;
443 hw_tcl_on
=future_hw_tcl_on
;
445 if (RADEON_DEBUG
& DEBUG_PRIMS
)
446 fprintf(stderr
, "%s\n", __FUNCTION__
);
447 if(hw_tcl_on
== GL_FALSE
)
450 if (r300Fallback(ctx
) >= R300_FALLBACK_TCL
) {
451 hw_tcl_on
= GL_FALSE
;
455 r300UpdateShaders(rmesa
);
457 vp
= (struct r300_vertex_program
*)CURRENT_VERTEX_SHADER(ctx
);
458 if (vp
->native
== GL_FALSE
) {
459 hw_tcl_on
= GL_FALSE
;
463 //r300UpdateShaderStates(rmesa);
465 return r300_run_vb_render(ctx
, stage
);
/* Pipeline stage descriptor whose run hook is r300_run_tcl_render().
 * NOTE(review): the other initializer fields are not visible in this view. */
468 const struct tnl_pipeline_stage _r300_tcl_stage
= {
474 r300_run_tcl_render
/* run */