src/mesa/drivers/dri/r200/r200_tcl.c

   1 /*
   2 Copyright (C) The Weather Channel, Inc.  2002.  All Rights Reserved.
   3
   4 The Weather Channel (TM) funded Tungsten Graphics to develop the
   5 initial release of the Radeon 8500 driver under the XFree86 license.
   6 This notice must be preserved.
   7
   8 Permission is hereby granted, free of charge, to any person obtaining
   9 a copy of this software and associated documentation files (the
  10 "Software"), to deal in the Software without restriction, including
  11 without limitation the rights to use, copy, modify, merge, publish,
  12 distribute, sublicense, and/or sell copies of the Software, and to
  13 permit persons to whom the Software is furnished to do so, subject to
  14 the following conditions:
  15
  16 The above copyright notice and this permission notice (including the
  17 next paragraph) shall be included in all copies or substantial
  18 portions of the Software.
  19
  20 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  21 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  22 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
  23 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
  24 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
  25 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
  26 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  27
  28 **************************************************************************/
  29
  30 /*
  31  * Authors:
  32  *   Keith Whitwell <keithw@vmware.com>
  33  */
  34
  35 #include "main/glheader.h"
  36 #include "main/imports.h"
  37 #include "main/mtypes.h"
  38 #include "main/enums.h"
  39 #include "main/light.h"
  40 #include "main/state.h"
  41
  42 #include "vbo/vbo.h"
  43 #include "tnl/tnl.h"
  44 #include "tnl/t_pipeline.h"
  45
  46 #include "r200_context.h"
  47 #include "r200_state.h"
  48 #include "r200_ioctl.h"
  49 #include "r200_tcl.h"
  50 #include "r200_swtcl.h"
  51 #include "r200_maos.h"
  52
  53 #include "radeon_common_context.h"
  54
  55
  56
/* Capability switches, one per primitive kind.  They are presumably
 * read by the tnl_dd/t_dd_dmatmp2.h template included further down in
 * this file -- TODO confirm against that header.  Line loops are the
 * only kind marked as unavailable.
 */
#define HAVE_POINTS      1
#define HAVE_LINES       1
#define HAVE_LINE_LOOP   0
#define HAVE_LINE_STRIPS 1
#define HAVE_TRIANGLES   1
#define HAVE_TRI_STRIPS  1
#define HAVE_TRI_FANS    1
#define HAVE_QUADS       1
#define HAVE_QUAD_STRIPS 1
#define HAVE_POLYGONS    1
#define HAVE_ELTS        1


/* Hardware primitive codes that go with the switches above.
 *
 * HW_POINTS is an expression, not a constant: it reads
 * ctx->Point.SmoothFlag, so a `ctx` must be in scope wherever it is
 * expanded.  It yields R200_VF_PRIM_POINT_SPRITES when point smoothing
 * is off and R200_VF_PRIM_POINTS when it is on.
 *
 * HW_LINE_LOOP and HW_TRIANGLE_STRIP_1 are defined as 0.
 */
#define HW_POINTS           ((!ctx->Point.SmoothFlag) ? \
                                R200_VF_PRIM_POINT_SPRITES : R200_VF_PRIM_POINTS)
#define HW_LINES            R200_VF_PRIM_LINES
#define HW_LINE_LOOP        0
#define HW_LINE_STRIP       R200_VF_PRIM_LINE_STRIP
#define HW_TRIANGLES        R200_VF_PRIM_TRIANGLES
#define HW_TRIANGLE_STRIP_0 R200_VF_PRIM_TRIANGLE_STRIP
#define HW_TRIANGLE_STRIP_1 0
#define HW_TRIANGLE_FAN     R200_VF_PRIM_TRIANGLE_FAN
#define HW_QUADS            R200_VF_PRIM_QUADS
#define HW_QUAD_STRIP       R200_VF_PRIM_QUAD_STRIP
#define HW_POLYGON          R200_VF_PRIM_POLYGON
  82
  83
  84 static GLboolean discrete_prim[0x10] = {
  85    0,                           /* 0 none */
  86    1,                           /* 1 points */
  87    1,                           /* 2 lines */
  88    0,                           /* 3 line_strip */
  89    1,                           /* 4 tri_list */
  90    0,                           /* 5 tri_fan */
  91    0,                           /* 6 tri_strip */
  92    0,                           /* 7 tri_w_flags */
  93    1,                           /* 8 rect list (unused) */
  94    1,                           /* 9 3vert point */
  95    1,                           /* a 3vert line */
  96    0,                           /* b point sprite */
  97    0,                           /* c line loop */
  98    1,                           /* d quads */
  99    0,                           /* e quad strip */
 100    0,                           /* f polygon */
 101 };
 102
 103
/* Declares `rmesa`, the r200 context obtained from `ctx`.  The other
 * macros in this group refer to `rmesa` and/or `ctx`, so both must be in
 * scope where they are expanded.
 */
#define LOCAL_VARS r200ContextPtr rmesa = R200_CONTEXT(ctx)
/* Type of one element (vertex index). */
#define ELT_TYPE  GLushort

/* Select an indexed primitive: hw_prim is or'ed with
 * R200_VF_PRIM_WALK_IND and handed to r200TclPrimitive().
 */
#define ELT_INIT(prim, hw_prim) \
   r200TclPrimitive( ctx, prim, hw_prim | R200_VF_PRIM_WALK_IND )

/* The element array of the current tnl vertex buffer. */
#define GET_MESA_ELTS() TNL_CONTEXT(ctx)->vb.Elts


/* Don't really know how many elts will fit in what's left of cmdbuf,
 * as there is state to emit, etc:
 */

/* Testing on isosurf shows a maximum around here.  Don't know if it's
 * the card or driver or kernel module that is causing the behaviour.
 */
/* Besides any use by the render template, this value also feeds the
 * size prediction in r200EnsureEmitSize().
 */
#define GET_MAX_HW_ELTS() 300

/* Flag the `lin` state atom via R200_STATECHANGE and emit state
 * immediately.
 */
#define RESET_STIPPLE() do {                    \
   R200_STATECHANGE( rmesa, lin );              \
   radeonEmitState(&rmesa->radeon);                     \
} while (0)

/* Set (mode non-zero) or clear (mode zero) R200_LINE_PATTERN_AUTO_RESET
 * in the LIN_RE_LINE_PATTERN word of the `lin` atom, then emit state
 * immediately.
 */
#define AUTO_STIPPLE( mode )  do {              \
   R200_STATECHANGE( rmesa, lin );              \
   if (mode)                                    \
      rmesa->hw.lin.cmd[LIN_RE_LINE_PATTERN] |= \
         R200_LINE_PATTERN_AUTO_RESET;  \
   else                                         \
      rmesa->hw.lin.cmd[LIN_RE_LINE_PATTERN] &= \
         ~R200_LINE_PATTERN_AUTO_RESET; \
   radeonEmitState(&rmesa->radeon);                     \
} while (0)


/* Reserve room for `nr` elements; see r200AllocElts() below. */
#define ALLOC_ELTS(nr)  r200AllocElts( rmesa, nr )
 140
 141 static GLushort *r200AllocElts( r200ContextPtr rmesa, GLuint nr )
 142 {
 143    if (rmesa->radeon.dma.flush == r200FlushElts &&
 144        rmesa->tcl.elt_used + nr*2 < R200_ELT_BUF_SZ) {
 145
 146       GLushort *dest = (GLushort *)(rmesa->radeon.tcl.elt_dma_bo->ptr +
 147                                     rmesa->radeon.tcl.elt_dma_offset + rmesa->tcl.elt_used);
 148
 149       rmesa->tcl.elt_used += nr*2;
 150
 151       return dest;
 152    }
 153    else {
 154       if (rmesa->radeon.dma.flush)
 155          rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
 156
 157       r200EmitAOS( rmesa,
 158                    rmesa->radeon.tcl.aos_count, 0 );
 159
 160       r200EmitMaxVtxIndex(rmesa, rmesa->radeon.tcl.aos[0].count);
 161       return r200AllocEltsOpenEnded( rmesa, rmesa->tcl.hw_primitive, nr );
 162    }
 163 }
 164
 165
/* Nothing is executed when closing an element run: the R200_NEWPRIM
 * call sits behind `if (0)`.  The expansion still names `rmesa`, so that
 * variable must be in scope at the point of use.
 */
#define CLOSE_ELTS()                            \
do {                                            \
   if (0) R200_NEWPRIM( rmesa );                \
}                                               \
while (0)
 171
 172
 173 /* TODO: Try to extend existing primitive if both are identical,
 174  * discrete and there are no intervening state changes.  (Somewhat
 175  * duplicates changes to DrawArrays code)
 176  */
 177 static void r200EmitPrim( struct gl_context *ctx,
 178                           GLenum prim,
 179                           GLuint hwprim,
 180                           GLuint start,
 181                           GLuint count)
 182 {
 183    r200ContextPtr rmesa = R200_CONTEXT( ctx );
 184    r200TclPrimitive( ctx, prim, hwprim );
 185
 186    //   fprintf(stderr,"Emit prim %d\n", rmesa->radeon.tcl.aos_count);
 187
 188    r200EmitAOS( rmesa,
 189                 rmesa->radeon.tcl.aos_count,
 190                 start );
 191
 192    /* Why couldn't this packet have taken an offset param?
 193     */
 194    r200EmitVbufPrim( rmesa,
 195                      rmesa->tcl.hw_primitive,
 196                      count - start );
 197 }
 198
/* Forward to r200EmitPrim().  The `(void) rmesa` only references the
 * local so that it counts as used.
 */
#define EMIT_PRIM(ctx, prim, hwprim, start, count) do {         \
   r200EmitPrim( ctx, prim, hwprim, start, count );             \
   (void) rmesa; } while (0)

/* Primitives with fewer vertices than this may be converted to elts by
 * the rendering code; r200EnsureEmitSize() relies on the same threshold
 * for its size prediction.
 */
#define MAX_CONVERSION_SIZE 40
/* Try & join small primitives
 */
#if 0
#define PREFER_DISCRETE_ELT_PRIM( NR, PRIM ) 0
#else
/* True when NR is below 20, or when NR is below 40 and the current
 * hardware primitive already is PRIM in its indexed, TCL-output form.
 */
#define PREFER_DISCRETE_ELT_PRIM( NR, PRIM )                    \
  ((NR) < 20 ||                                                 \
   ((NR) < 40 &&                                                \
    rmesa->tcl.hw_primitive == (PRIM|                           \
                            R200_VF_TCL_OUTPUT_VTX_ENABLE|      \
                                R200_VF_PRIM_WALK_IND)))
#endif

/* EMIT_ELT stores element x as a GLushort at index `offset` of dest.
 *
 * On big-endian builds the two 16-bit halves of every 32-bit word are
 * swapped: dest is rounded down to a 4-byte boundary, the index is
 * corrected for that rounding, and even/odd indices are exchanged
 * (off + 1 - 2 * (off & 1)).
 */
#ifdef MESA_BIG_ENDIAN
/* We could do without (most of) this ugliness if dest was always 32 bit word aligned... */
#define EMIT_ELT(dest, offset, x) do {                          \
        int off = offset + ( ( (uintptr_t)dest & 0x2 ) >> 1 );     \
        GLushort *des = (GLushort *)( (uintptr_t)dest & ~0x2 );    \
        (des)[ off + 1 - 2 * ( off & 1 ) ] = (GLushort)(x);     \
        (void)rmesa; } while (0)
#else
#define EMIT_ELT(dest, offset, x) do {                          \
        (dest)[offset] = (GLushort) (x);                        \
        (void)rmesa; } while (0)
#endif

/* Store two elements with a single 32-bit write at dest+offset: x in
 * the low 16 bits, y in the high 16 bits.
 * NOTE(review): `offset` is not parenthesised, x and y are not masked to
 * 16 bits, and the expansion already ends in a semicolon -- callers are
 * expected to pass simple arguments and use it as a plain statement.
 */
#define EMIT_TWO_ELTS(dest, offset, x, y)  *(GLuint *)((dest)+offset) = ((y)<<16)|(x);



/* Instantiate the render template.  TAG prefixes the generated names
 * with tcl_; tcl_render_tab_verts and tcl_render_tab_elts, used by the
 * entry points below, are such names.
 */
#define TAG(x) tcl_##x
#include "tnl_dd/t_dd_dmatmp2.h"
 236
 237 /**********************************************************************/
 238 /*                          External entrypoints                     */
 239 /**********************************************************************/
 240
 241 void r200EmitPrimitive( struct gl_context *ctx,
 242                           GLuint first,
 243                           GLuint last,
 244                           GLuint flags )
 245 {
 246    tcl_render_tab_verts[flags&PRIM_MODE_MASK]( ctx, first, last, flags );
 247 }
 248
 249 void r200EmitEltPrimitive( struct gl_context *ctx,
 250                              GLuint first,
 251                              GLuint last,
 252                              GLuint flags )
 253 {
 254    tcl_render_tab_elts[flags&PRIM_MODE_MASK]( ctx, first, last, flags );
 255 }
 256
 257 void r200TclPrimitive( struct gl_context *ctx,
 258                          GLenum prim,
 259                          int hw_prim )
 260 {
 261    r200ContextPtr rmesa = R200_CONTEXT(ctx);
 262    GLuint newprim = hw_prim | R200_VF_TCL_OUTPUT_VTX_ENABLE;
 263
 264    radeon_prepare_render(&rmesa->radeon);
 265    if (rmesa->radeon.NewGLState)
 266       r200ValidateState( ctx );
 267
 268    if (newprim != rmesa->tcl.hw_primitive ||
 269        !discrete_prim[hw_prim&0xf]) {
 270       /* need to disable perspective-correct texturing for point sprites */
 271       if ((prim & PRIM_MODE_MASK) == GL_POINTS && ctx->Point.PointSprite) {
 272          if (rmesa->hw.set.cmd[SET_RE_CNTL] & R200_PERSPECTIVE_ENABLE) {
 273             R200_STATECHANGE( rmesa, set );
 274             rmesa->hw.set.cmd[SET_RE_CNTL] &= ~R200_PERSPECTIVE_ENABLE;
 275          }
 276       }
 277       else if (!(rmesa->hw.set.cmd[SET_RE_CNTL] & R200_PERSPECTIVE_ENABLE)) {
 278          R200_STATECHANGE( rmesa, set );
 279          rmesa->hw.set.cmd[SET_RE_CNTL] |= R200_PERSPECTIVE_ENABLE;
 280       }
 281       R200_NEWPRIM( rmesa );
 282       rmesa->tcl.hw_primitive = newprim;
 283    }
 284 }
 285
 286 /**
 287  * Predict total emit size for next rendering operation so there is no flush in middle of rendering
 288  * Prediction has to aim towards the best possible value that is worse than worst case scenario
 289  */
 290 static GLuint r200EnsureEmitSize( struct gl_context * ctx , GLubyte* vimap_rev )
 291 {
 292   r200ContextPtr rmesa = R200_CONTEXT(ctx);
 293   TNLcontext *tnl = TNL_CONTEXT(ctx);
 294   struct vertex_buffer *VB = &tnl->vb;
 295   GLuint space_required;
 296   GLuint state_size;
 297   GLuint nr_aos = 0;
 298   int i;
 299   /* predict number of aos to emit */
 300   for (i = 0; i < 15; ++i)
 301   {
 302     if (vimap_rev[i] != 255)
 303     {
 304       ++nr_aos;
 305     }
 306   }
 307
 308   {
 309     /* count the prediction for state size */
 310     space_required = 0;
 311     state_size = radeonCountStateEmitSize( &rmesa->radeon );
 312     /* vtx may be changed in r200EmitArrays so account for it if not dirty */
 313     if (!rmesa->hw.vtx.dirty)
 314       state_size += rmesa->hw.vtx.check(&rmesa->radeon.glCtx, &rmesa->hw.vtx);
 315     /* predict size for elements */
 316     for (i = 0; i < VB->PrimitiveCount; ++i)
 317     {
 318       if (!VB->Primitive[i].count)
 319         continue;
 320       /* If primitive.count is less than MAX_CONVERSION_SIZE
 321          rendering code may decide convert to elts.
 322          In that case we have to make pessimistic prediction.
 323          and use larger of 2 paths. */
 324       const GLuint elt_count =(VB->Primitive[i].count/GET_MAX_HW_ELTS() + 1);
 325       const GLuint elts = ELTS_BUFSZ(nr_aos) * elt_count;
 326       const GLuint index = INDEX_BUFSZ * elt_count;
 327       const GLuint vbuf = VBUF_BUFSZ;
 328       if ( (!VB->Elts && VB->Primitive[i].count >= MAX_CONVERSION_SIZE)
 329           || vbuf > index + elts)
 330         space_required += vbuf;
 331       else
 332         space_required += index + elts;
 333       space_required += AOS_BUFSZ(nr_aos);
 334     }
 335   }
 336
 337   radeon_print(RADEON_RENDER,RADEON_VERBOSE,
 338       "%s space %u, aos %d\n",
 339       __func__, space_required, AOS_BUFSZ(nr_aos) );
 340   /* flush the buffer in case we need more than is left. */
 341   if (rcommonEnsureCmdBufSpace(&rmesa->radeon, space_required + state_size, __func__))
 342     return space_required + radeonCountStateEmitSize( &rmesa->radeon );
 343   else
 344     return space_required + state_size;
 345 }
 346
 347
 348 /**********************************************************************/
 349 /*                          Render pipeline stage                     */
 350 /**********************************************************************/
 351
 352
 353 /* TCL render.
 354  */
 355 static GLboolean r200_run_tcl_render( struct gl_context *ctx,
 356                                       struct tnl_pipeline_stage *stage )
 357 {
 358    r200ContextPtr rmesa = R200_CONTEXT(ctx);
 359    TNLcontext *tnl = TNL_CONTEXT(ctx);
 360    struct vertex_buffer *VB = &tnl->vb;
 361    GLuint i;
 362    GLubyte *vimap_rev;
 363 /* use hw fixed order for simplicity, pos 0, weight 1, normal 2, fog 3,
 364    color0 - color3 4-7, texcoord0 - texcoord5 8-13, pos 1 14. Must not use
 365    more than 12 of those at the same time. */
 366    GLubyte map_rev_fixed[15] = {255, 255, 255, 255, 255, 255, 255, 255,
 367                             255, 255, 255, 255, 255, 255, 255};
 368
 369
 370    /* TODO: separate this from the swtnl pipeline
 371     */
 372    if (rmesa->radeon.TclFallback)
 373       return GL_TRUE;   /* fallback to software t&l */
 374
 375    radeon_print(RADEON_RENDER, RADEON_NORMAL, "%s\n", __func__);
 376
 377    if (VB->Count == 0)
 378       return GL_FALSE;
 379
 380    /* Validate state:
 381     */
 382    if (rmesa->radeon.NewGLState)
 383       if (!r200ValidateState( ctx ))
 384          return GL_TRUE; /* fallback to sw t&l */
 385
 386    if (!_mesa_arb_vertex_program_enabled(ctx)) {
 387    /* NOTE: inputs != tnl->render_inputs - these are the untransformed
 388     * inputs.
 389     */
 390       map_rev_fixed[0] = VERT_ATTRIB_POS;
 391       /* technically there is no reason we always need VA_COLOR0. In theory
 392          could disable it depending on lighting, color materials, texturing... */
 393       map_rev_fixed[4] = VERT_ATTRIB_COLOR0;
 394
 395       if (ctx->Light.Enabled) {
 396          map_rev_fixed[2] = VERT_ATTRIB_NORMAL;
 397       }
 398
 399       /* this also enables VA_COLOR1 when using separate specular
 400          lighting model, which is unnecessary.
 401          FIXME: OTOH, we're missing the case where a ATI_fragment_shader accesses
 402          the secondary color (if lighting is disabled). The chip seems
 403          misconfigured for that though elsewhere (tcl output, might lock up) */
 404       if (_mesa_need_secondary_color(ctx)) {
 405          map_rev_fixed[5] = VERT_ATTRIB_COLOR1;
 406       }
 407
 408       if ( (ctx->Fog.FogCoordinateSource == GL_FOG_COORD) && ctx->Fog.Enabled ) {
 409          map_rev_fixed[3] = VERT_ATTRIB_FOG;
 410       }
 411
 412       for (i = 0 ; i < ctx->Const.MaxTextureUnits; i++) {
 413          if (ctx->Texture.Unit[i]._Current) {
 414             if (rmesa->TexGenNeedNormals[i]) {
 415                map_rev_fixed[2] = VERT_ATTRIB_NORMAL;
 416             }
 417             map_rev_fixed[8 + i] = VERT_ATTRIB_TEX0 + i;
 418          }
 419       }
 420       vimap_rev = &map_rev_fixed[0];
 421    }
 422    else {
 423       /* vtx_tcl_output_vtxfmt_0/1 need to match configuration of "fragment
 424          part", since using some vertex interpolator later which is not in
 425          out_vtxfmt0/1 will lock up. It seems to be ok to write in vertex
 426          prog to a not enabled output however, so just don't mess with it.
 427          We only need to change compsel. */
 428       GLuint out_compsel = 0;
 429       const GLbitfield64 vp_out =
 430          rmesa->curr_vp_hw->mesa_program.info.outputs_written;
 431
 432       vimap_rev = &rmesa->curr_vp_hw->inputmap_rev[0];
 433       assert(vp_out & BITFIELD64_BIT(VARYING_SLOT_POS));
 434       out_compsel = R200_OUTPUT_XYZW;
 435       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_COL0)) {
 436          out_compsel |= R200_OUTPUT_COLOR_0;
 437       }
 438       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_COL1)) {
 439          out_compsel |= R200_OUTPUT_COLOR_1;
 440       }
 441       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_FOGC)) {
 442          out_compsel |= R200_OUTPUT_DISCRETE_FOG;
 443       }
 444       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_PSIZ)) {
 445          out_compsel |= R200_OUTPUT_PT_SIZE;
 446       }
 447       for (i = VARYING_SLOT_TEX0; i < VARYING_SLOT_TEX6; i++) {
 448          if (vp_out & BITFIELD64_BIT(i)) {
 449             out_compsel |= R200_OUTPUT_TEX_0 << (i - VARYING_SLOT_TEX0);
 450          }
 451       }
 452       if (rmesa->hw.vtx.cmd[VTX_TCL_OUTPUT_COMPSEL] != out_compsel) {
 453          R200_STATECHANGE( rmesa, vtx );
 454          rmesa->hw.vtx.cmd[VTX_TCL_OUTPUT_COMPSEL] = out_compsel;
 455       }
 456    }
 457
 458    /* Do the actual work:
 459     */
 460    radeonReleaseArrays( ctx, ~0 /* stage->changed_inputs */ );
 461    GLuint emit_end = r200EnsureEmitSize( ctx, vimap_rev )
 462      + rmesa->radeon.cmdbuf.cs->cdw;
 463    r200EmitArrays( ctx, vimap_rev );
 464
 465    for (i = 0 ; i < VB->PrimitiveCount ; i++)
 466    {
 467       GLuint prim = _tnl_translate_prim(&VB->Primitive[i]);
 468       GLuint start = VB->Primitive[i].start;
 469       GLuint length = VB->Primitive[i].count;
 470
 471       if (!length)
 472          continue;
 473
 474       if (VB->Elts)
 475          r200EmitEltPrimitive( ctx, start, start+length, prim );
 476       else
 477          r200EmitPrimitive( ctx, start, start+length, prim );
 478    }
 479    if ( emit_end < rmesa->radeon.cmdbuf.cs->cdw )
 480      WARN_ONCE("Rendering was %d commands larger than predicted size."
 481          " We might overflow  command buffer.\n", rmesa->radeon.cmdbuf.cs->cdw - emit_end);
 482
 483    return GL_FALSE;             /* finished the pipe */
 484 }
 485
 486
 487
/* Initial state for tcl stage.
 *
 * The initializer is positional.  The first entry is the stage name and
 * the last is the run callback; the three unlabelled NULLs in between
 * are presumably the other optional stage hooks -- TODO confirm against
 * the struct tnl_pipeline_stage declaration.
 */
const struct tnl_pipeline_stage _r200_tcl_stage =
{
   "r200 render",
   NULL,                        /*  private */
   NULL,
   NULL,
   NULL,
   r200_run_tcl_render  /* run */
};
 499
 500
 501
 502 /**********************************************************************/
 503 /*                 Validate state at pipeline start                   */
 504 /**********************************************************************/
 505
 506
 507 /*-----------------------------------------------------------------------
 508  * Manage TCL fallbacks
 509  */
 510
 511
 512 static void transition_to_swtnl( struct gl_context *ctx )
 513 {
 514    r200ContextPtr rmesa = R200_CONTEXT(ctx);
 515    TNLcontext *tnl = TNL_CONTEXT(ctx);
 516
 517    R200_NEWPRIM( rmesa );
 518
 519    r200ChooseVertexState( ctx );
 520    r200ChooseRenderState( ctx );
 521
 522    _tnl_validate_shine_tables( ctx );
 523
 524    tnl->Driver.NotifyMaterialChange =
 525       _tnl_validate_shine_tables;
 526
 527    radeonReleaseArrays( ctx, ~0 );
 528
 529    /* Still using the D3D based hardware-rasterizer from the radeon;
 530     * need to put the card into D3D mode to make it work:
 531     */
 532    R200_STATECHANGE( rmesa, vap );
 533    rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] &= ~(R200_VAP_TCL_ENABLE|R200_VAP_PROG_VTX_SHADER_ENABLE);
 534 }
 535
 536 static void transition_to_hwtnl( struct gl_context *ctx )
 537 {
 538    r200ContextPtr rmesa = R200_CONTEXT(ctx);
 539    TNLcontext *tnl = TNL_CONTEXT(ctx);
 540
 541    _tnl_need_projected_coords( ctx, GL_FALSE );
 542
 543    r200UpdateMaterial( ctx );
 544
 545    tnl->Driver.NotifyMaterialChange = r200UpdateMaterial;
 546
 547    if ( rmesa->radeon.dma.flush )
 548       rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
 549
 550    rmesa->radeon.dma.flush = NULL;
 551
 552    R200_STATECHANGE( rmesa, vap );
 553    rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] |= R200_VAP_TCL_ENABLE;
 554    rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] &= ~R200_VAP_FORCE_W_TO_ONE;
 555
 556    if (_mesa_arb_vertex_program_enabled(ctx)) {
 557       rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] |= R200_VAP_PROG_VTX_SHADER_ENABLE;
 558    }
 559
 560    if ( ((rmesa->hw.ctx.cmd[CTX_PP_FOG_COLOR] & R200_FOG_USE_MASK)
 561       == R200_FOG_USE_SPEC_ALPHA) &&
 562       (ctx->Fog.FogCoordinateSource == GL_FOG_COORD )) {
 563       R200_STATECHANGE( rmesa, ctx );
 564       rmesa->hw.ctx.cmd[CTX_PP_FOG_COLOR] &= ~R200_FOG_USE_MASK;
 565       rmesa->hw.ctx.cmd[CTX_PP_FOG_COLOR] |= R200_FOG_USE_VTX_FOG;
 566    }
 567
 568    R200_STATECHANGE( rmesa, vte );
 569    rmesa->hw.vte.cmd[VTE_SE_VTE_CNTL] &= ~(R200_VTX_XY_FMT|R200_VTX_Z_FMT);
 570    rmesa->hw.vte.cmd[VTE_SE_VTE_CNTL] |= R200_VTX_W0_FMT;
 571
 572    if (R200_DEBUG & RADEON_FALLBACKS)
 573       fprintf(stderr, "R200 end tcl fallback\n");
 574 }
 575
 576
 577 static char *fallbackStrings[] = {
 578    "Rasterization fallback",
 579    "Unfilled triangles",
 580    "Twosided lighting, differing materials",
 581    "Materials in VB (maybe between begin/end)",
 582    "Texgen unit 0",
 583    "Texgen unit 1",
 584    "Texgen unit 2",
 585    "Texgen unit 3",
 586    "Texgen unit 4",
 587    "Texgen unit 5",
 588    "User disable",
 589    "Bitmap as points",
 590    "Vertex program"
 591 };
 592
 593
 594 static char *getFallbackString(GLuint bit)
 595 {
 596    int i = 0;
 597    while (bit > 1) {
 598       i++;
 599       bit >>= 1;
 600    }
 601    return fallbackStrings[i];
 602 }
 603
 604
 605
 606 void r200TclFallback( struct gl_context *ctx, GLuint bit, GLboolean mode )
 607 {
 608         r200ContextPtr rmesa = R200_CONTEXT(ctx);
 609         GLuint oldfallback = rmesa->radeon.TclFallback;
 610
 611         if (mode) {
 612                 if (oldfallback == 0) {
 613                         /* We have to flush before transition */
 614                         if ( rmesa->radeon.dma.flush )
 615                                 rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
 616
 617                         if (R200_DEBUG & RADEON_FALLBACKS)
 618                                 fprintf(stderr, "R200 begin tcl fallback %s\n",
 619                                                 getFallbackString( bit ));
 620                         rmesa->radeon.TclFallback |= bit;
 621                         transition_to_swtnl( ctx );
 622                 } else
 623                         rmesa->radeon.TclFallback |= bit;
 624         } else {
 625                 if (oldfallback == bit) {
 626                         /* We have to flush before transition */
 627                         if ( rmesa->radeon.dma.flush )
 628                                 rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
 629
 630                         if (R200_DEBUG & RADEON_FALLBACKS)
 631                                 fprintf(stderr, "R200 end tcl fallback %s\n",
 632                                                 getFallbackString( bit ));
 633                         rmesa->radeon.TclFallback &= ~bit;
 634                         transition_to_hwtnl( ctx );
 635                 } else
 636                         rmesa->radeon.TclFallback &= ~bit;
 637         }
 638 }