/*
 Copyright (C) Intel Corp. 2006. All Rights Reserved.
 Intel funded Tungsten Graphics (http://www.tungstengraphics.com) to
 develop this 3D driver.

 Permission is hereby granted, free of charge, to any person obtaining
 a copy of this software and associated documentation files (the
 "Software"), to deal in the Software without restriction, including
 without limitation the rights to use, copy, modify, merge, publish,
 distribute, sublicense, and/or sell copies of the Software, and to
 permit persons to whom the Software is furnished to do so, subject to
 the following conditions:

 The above copyright notice and this permission notice (including the
 next paragraph) shall be included in all copies or substantial
 portions of the Software.

 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.

 **********************************************************************/
/*
 * Authors:
 *   Keith Whitwell <keith@tungstengraphics.com>
 */


#include "intel_batchbuffer.h"
#include "intel_fbo.h"
#include "intel_regions.h"

#include "brw_context.h"
#include "brw_state.h"
#include "brw_defines.h"
/* Constant single cliprect for framebuffer object or DRI2 drawing */
static void upload_drawing_rect(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;
   struct gl_context *ctx = &intel->ctx;
   BEGIN_BATCH(4);
   OUT_BATCH(_3DSTATE_DRAWRECT_INFO_I965);
   OUT_BATCH(0); /* xmin, ymin */
   OUT_BATCH(((ctx->DrawBuffer->Width - 1) & 0xffff) |
             ((ctx->DrawBuffer->Height - 1) << 16));
   OUT_BATCH(0);
   ADVANCE_BATCH();
}

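/* State atom: the drawing rectangle is re-emitted whenever the
 * framebuffer bindings change (_NEW_BUFFERS) or a new context starts
 * emitting state (BRW_NEW_CONTEXT).
 */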
const struct brw_tracked_state brw_drawing_rect = {
   .dirty = {
      .mesa = _NEW_BUFFERS,
      .brw = BRW_NEW_CONTEXT,
      .cache = 0
   },
   .emit = upload_drawing_rect
};

/**
 * Upload the binding table pointers, which point to each stage's array of
 * surface state pointers.
 *
 * The binding table pointers are relative to the surface state base address,
 * which points at the batchbuffer containing the streamed batch state.
 */
static void upload_binding_table_pointers(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;

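   /* The dword-length field in a 3D state packet header is biased by two,
    * hence the (6 - 2) below for this six-dword packet.
    */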
   BEGIN_BATCH(6);
   OUT_BATCH(_3DSTATE_BINDING_TABLE_POINTERS << 16 | (6 - 2));
   OUT_BATCH(brw->vs.bind_bo_offset);
   OUT_BATCH(0); /* gs */
   OUT_BATCH(0); /* clip */
   OUT_BATCH(0); /* sf */
   OUT_BATCH(brw->wm.bind_bo_offset);
   ADVANCE_BATCH();
}

const struct brw_tracked_state brw_binding_table_pointers = {
   .dirty = {
      .mesa = 0,
      .brw = (BRW_NEW_BATCH |
              BRW_NEW_STATE_BASE_ADDRESS |
              BRW_NEW_VS_BINDING_TABLE |
              BRW_NEW_GS_BINDING_TABLE |
              BRW_NEW_PS_BINDING_TABLE),
      .cache = 0,
   },
   .emit = upload_binding_table_pointers,
};

/**
 * Upload the binding table pointers, which point to each stage's array of
 * surface state pointers.
 *
 * The binding table pointers are relative to the surface state base address,
 * which points at the batchbuffer containing the streamed batch state.
 */
static void upload_gen6_binding_table_pointers(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;

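   /* On gen6 the packet header carries per-stage modify-enable bits, so
    * only the stages flagged there have their binding table pointers
    * updated.
    */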
   BEGIN_BATCH(4);
   OUT_BATCH(_3DSTATE_BINDING_TABLE_POINTERS << 16 |
             GEN6_BINDING_TABLE_MODIFY_VS |
             GEN6_BINDING_TABLE_MODIFY_GS |
             GEN6_BINDING_TABLE_MODIFY_PS |
             (4 - 2));
   OUT_BATCH(brw->vs.bind_bo_offset); /* vs */
   OUT_BATCH(0); /* gs */
   OUT_BATCH(brw->wm.bind_bo_offset); /* wm/ps */
   ADVANCE_BATCH();
}

const struct brw_tracked_state gen6_binding_table_pointers = {
   .dirty = {
      .mesa = 0,
      .brw = (BRW_NEW_BATCH |
              BRW_NEW_STATE_BASE_ADDRESS |
              BRW_NEW_VS_BINDING_TABLE |
              BRW_NEW_GS_BINDING_TABLE |
              BRW_NEW_PS_BINDING_TABLE),
      .cache = 0,
   },
   .emit = upload_gen6_binding_table_pointers,
};

/**
 * Upload pointers to the per-stage state.
 *
 * The state pointers in this packet are all relative to the general state
 * base address set by CMD_STATE_BASE_ADDRESS, which is 0.
 */
static void upload_pipelined_state_pointers(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;

   if (intel->gen == 5) {
      /* Need to flush before changing clip max threads for errata. */
      BEGIN_BATCH(1);
      OUT_BATCH(MI_FLUSH);
      ADVANCE_BATCH();
   }

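   /* Bit 0 of the GS and clip state pointers is that unit's enable bit,
    * which is why those offsets are ORed with 1 below.
    */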
   BEGIN_BATCH(7);
   OUT_BATCH(_3DSTATE_PIPELINED_POINTERS << 16 | (7 - 2));
   OUT_RELOC(intel->batch.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
             brw->vs.state_offset);
   if (brw->gs.prog_active)
      OUT_RELOC(brw->intel.batch.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
                brw->gs.state_offset | 1);
   else
      OUT_BATCH(0);
   OUT_RELOC(brw->intel.batch.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
             brw->clip.state_offset | 1);
   OUT_RELOC(brw->intel.batch.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
             brw->sf.state_offset);
   OUT_RELOC(brw->intel.batch.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
             brw->wm.state_offset);
   OUT_RELOC(brw->intel.batch.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
             brw->cc.state_offset);
   ADVANCE_BATCH();

   brw->state.dirty.brw |= BRW_NEW_PSP;
}

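/* The pipelined state pointers, URB fence, and constant-buffer URB state
 * are emitted together by a single atom so they stay consistent with each
 * other.
 */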
static void upload_psp_urb_cbs(struct brw_context *brw)
{
   upload_pipelined_state_pointers(brw);
   brw_upload_urb_fence(brw);
   brw_upload_cs_urb_state(brw);
}

const struct brw_tracked_state brw_psp_urb_cbs = {
   .dirty = {
      .mesa = 0,
      .brw = (BRW_NEW_URB_FENCE |
              BRW_NEW_BATCH |
              BRW_NEW_STATE_BASE_ADDRESS),
      .cache = (CACHE_NEW_VS_UNIT |
                CACHE_NEW_GS_UNIT |
                CACHE_NEW_GS_PROG |
                CACHE_NEW_CLIP_UNIT |
                CACHE_NEW_SF_UNIT |
                CACHE_NEW_WM_UNIT |
                CACHE_NEW_CC_UNIT)
   },
   .emit = upload_psp_urb_cbs,
};

static void prepare_depthbuffer(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;
   struct gl_context *ctx = &intel->ctx;
   struct gl_framebuffer *fb = ctx->DrawBuffer;
   struct intel_renderbuffer *drb = intel_get_renderbuffer(fb, BUFFER_DEPTH);
   struct intel_renderbuffer *srb = intel_get_renderbuffer(fb, BUFFER_STENCIL);

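   /* Add the depth, hiz, and stencil BOs to the batch's validation list
    * up front, so the aperture space check that runs before emit accounts
    * for them.
    */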
   if (drb)
      brw_add_validated_bo(brw, drb->region->buffer);
   if (drb && drb->hiz_region)
      brw_add_validated_bo(brw, drb->hiz_region->buffer);
   if (srb)
      brw_add_validated_bo(brw, srb->region->buffer);
}

static void emit_depthbuffer(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;
   struct gl_context *ctx = &intel->ctx;
   struct gl_framebuffer *fb = ctx->DrawBuffer;
   /* _NEW_BUFFERS */
   struct intel_renderbuffer *depth_irb = intel_get_renderbuffer(fb, BUFFER_DEPTH);
   struct intel_renderbuffer *stencil_irb = intel_get_renderbuffer(fb, BUFFER_STENCIL);
   struct intel_region *hiz_region = depth_irb ? depth_irb->hiz_region : NULL;
   unsigned int len;

   /* 3DSTATE_DEPTH_BUFFER and 3DSTATE_STENCIL_BUFFER are both
    * non-pipelined state that will need the PIPE_CONTROL workaround.
    */
   if (intel->gen == 6)
      intel_emit_post_sync_nonzero_flush(intel);

   /*
    * If either the depth or stencil buffer has a packed depth/stencil
    * format, then don't use separate stencil. Emit only a depth buffer.
    */
   if (depth_irb && depth_irb->Base.Format == MESA_FORMAT_S8_Z24) {
      stencil_irb = NULL;
   } else if (!depth_irb && stencil_irb
              && stencil_irb->Base.Format == MESA_FORMAT_S8_Z24) {
      depth_irb = stencil_irb;
      stencil_irb = NULL;
   }

   if (intel->gen >= 6)
      len = 7;
   else if (intel->is_g4x || intel->gen == 5)
      len = 6;
   else
      len = 5;

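   /* 3DSTATE_DEPTH_BUFFER grew over the generations: g4x and gen5 added
    * a dword carrying the intra-tile x/y offsets, and gen6 added one
    * more dword on top of that (emitted as zero here).
    */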
   if (!depth_irb && !stencil_irb) {
      BEGIN_BATCH(len);
      OUT_BATCH(_3DSTATE_DEPTH_BUFFER << 16 | (len - 2));
      OUT_BATCH((BRW_DEPTHFORMAT_D32_FLOAT << 18) |
                (BRW_SURFACE_NULL << 29));
      OUT_BATCH(0);
      OUT_BATCH(0);
      OUT_BATCH(0);

      if (intel->is_g4x || intel->gen >= 5)
         OUT_BATCH(0);

      if (intel->gen >= 6)
         OUT_BATCH(0);

      ADVANCE_BATCH();

   } else if (!depth_irb && stencil_irb) {
      /*
       * There exists a separate stencil buffer but no depth buffer.
       *
       * The stencil buffer inherits most of its fields from
       * 3DSTATE_DEPTH_BUFFER: namely the tile walk, surface type, width, and
       * height.
       *
       * Since the stencil buffer has quirky pitch requirements, its region
       * was allocated with half height and double cpp. So we need
       * a multiplier of 2 to obtain the surface's real height.
       *
       * Enable the hiz bit because it and the separate stencil bit must have
       * the same value. From Section 2.11.5.6.1.1 3DSTATE_DEPTH_BUFFER, Bit
       * 1.21 "Separate Stencil Enable":
       *     [DevIL]: If this field is enabled, Hierarchical Depth Buffer
       *     Enable must also be enabled.
       *
       *     [DevGT]: This field must be set to the same value (enabled or
       *     disabled) as Hierarchical Depth Buffer Enable
       */
      assert(intel->has_separate_stencil);
      assert(stencil_irb->Base.Format == MESA_FORMAT_S8);

      BEGIN_BATCH(len);
      OUT_BATCH(_3DSTATE_DEPTH_BUFFER << 16 | (len - 2));
      OUT_BATCH((BRW_DEPTHFORMAT_D32_FLOAT << 18) |
                (1 << 21) | /* separate stencil enable */
                (1 << 22) | /* hiz enable */
                (BRW_TILEWALK_YMAJOR << 26) |
                (BRW_SURFACE_2D << 29));
      OUT_BATCH(0);
      OUT_BATCH(((stencil_irb->region->width - 1) << 6) |
                ((2 * stencil_irb->region->height - 1) << 19));
      OUT_BATCH(0);
      OUT_BATCH(0);

      if (intel->gen >= 6)
         OUT_BATCH(0);

      ADVANCE_BATCH();

   } else {
      struct intel_region *region = depth_irb->region;
      unsigned int format;
      uint32_t tile_x, tile_y, offset;

      /* If using separate stencil, hiz must be enabled. */
      assert(!stencil_irb || hiz_region);

      switch (region->cpp) {
      case 2:
         format = BRW_DEPTHFORMAT_D16_UNORM;
         break;
      case 4:
         if (intel->depth_buffer_is_float)
            format = BRW_DEPTHFORMAT_D32_FLOAT;
         else if (hiz_region)
            format = BRW_DEPTHFORMAT_D24_UNORM_X8_UINT;
         else
            format = BRW_DEPTHFORMAT_D24_UNORM_S8_UINT;
         break;
      default:
         assert(0);
         return;
      }

      offset = intel_renderbuffer_tile_offsets(depth_irb, &tile_x, &tile_y);

      assert(intel->gen < 6 || region->tiling == I915_TILING_Y);
      assert(!hiz_region || region->tiling == I915_TILING_Y);

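      /* g4x and later have a packet field for an intra-tile (x, y) draw
       * offset; older parts have no such field, so there the buffer must
       * start exactly on a tile boundary (asserted below).
       */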
      BEGIN_BATCH(len);
      OUT_BATCH(_3DSTATE_DEPTH_BUFFER << 16 | (len - 2));
      OUT_BATCH(((region->pitch * region->cpp) - 1) |
                (format << 18) |
                ((hiz_region ? 1 : 0) << 21) | /* separate stencil enable */
                ((hiz_region ? 1 : 0) << 22) | /* hiz enable */
                (BRW_TILEWALK_YMAJOR << 26) |
                ((region->tiling != I915_TILING_NONE) << 27) |
                (BRW_SURFACE_2D << 29));
      OUT_RELOC(region->buffer,
                I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER,
                offset);
      OUT_BATCH((BRW_SURFACE_MIPMAPLAYOUT_BELOW << 1) |
                ((region->width - 1) << 6) |
                ((region->height - 1) << 19));
      OUT_BATCH(0);

      if (intel->is_g4x || intel->gen >= 5)
         OUT_BATCH(tile_x | (tile_y << 16));
      else
         assert(tile_x == 0 && tile_y == 0);

      if (intel->gen >= 6)
         OUT_BATCH(0);

      ADVANCE_BATCH();
   }

   if (hiz_region || stencil_irb) {
      /*
       * In the 3DSTATE_DEPTH_BUFFER batch emitted above, the 'separate
       * stencil enable' and 'hiz enable' bits were set. Therefore we must
       * emit 3DSTATE_HIER_DEPTH_BUFFER and 3DSTATE_STENCIL_BUFFER. Even if
       * there is no stencil buffer, 3DSTATE_STENCIL_BUFFER must be emitted;
       * failure to do so causes hangs on gen5 and a stall on gen6.
       */

      /* Emit hiz buffer. */
      if (hiz_region) {
         BEGIN_BATCH(3);
         OUT_BATCH((_3DSTATE_HIER_DEPTH_BUFFER << 16) | (3 - 2));
         OUT_BATCH(hiz_region->pitch * hiz_region->cpp - 1);
         OUT_RELOC(hiz_region->buffer,
                   I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER,
                   0);
         ADVANCE_BATCH();
      } else {
         BEGIN_BATCH(3);
         OUT_BATCH((_3DSTATE_HIER_DEPTH_BUFFER << 16) | (3 - 2));
         OUT_BATCH(0);
         OUT_BATCH(0);
         ADVANCE_BATCH();
      }

      /* Emit stencil buffer. */
      if (stencil_irb) {
         BEGIN_BATCH(3);
         OUT_BATCH((_3DSTATE_STENCIL_BUFFER << 16) | (3 - 2));
         OUT_BATCH(stencil_irb->region->pitch * stencil_irb->region->cpp - 1);
         OUT_RELOC(stencil_irb->region->buffer,
                   I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER,
                   0);
         ADVANCE_BATCH();
      } else {
         BEGIN_BATCH(3);
         OUT_BATCH((_3DSTATE_STENCIL_BUFFER << 16) | (3 - 2));
         OUT_BATCH(0);
         OUT_BATCH(0);
         ADVANCE_BATCH();
      }
   }

   /*
    * On Gen >= 6, emit clear params for safety. If using hiz, then clear
    * params must be emitted.
    *
    * From Section 2.11.5.6.4.1 3DSTATE_CLEAR_PARAMS:
    *     3DSTATE_CLEAR_PARAMS packet must follow the DEPTH_BUFFER_STATE
    *     packet when HiZ is enabled and the DEPTH_BUFFER_STATE changes.
    */
   if (intel->gen >= 6 || hiz_region) {
      if (intel->gen == 6)
         intel_emit_post_sync_nonzero_flush(intel);

      BEGIN_BATCH(2);
      OUT_BATCH(_3DSTATE_CLEAR_PARAMS << 16 | (2 - 2));
      OUT_BATCH(0);
      ADVANCE_BATCH();
   }
}

const struct brw_tracked_state brw_depthbuffer = {
   .dirty = {
      .mesa = _NEW_BUFFERS,
      .brw = BRW_NEW_BATCH,
      .cache = 0,
   },
   .prepare = prepare_depthbuffer,
   .emit = emit_depthbuffer,
};


/***********************************************************************
 * Polygon stipple packet
 */

static void upload_polygon_stipple(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;
   struct gl_context *ctx = &brw->intel.ctx;
   GLuint i;

   if (!ctx->Polygon.StippleFlag)
      return;

   if (intel->gen == 6)
      intel_emit_post_sync_nonzero_flush(intel);

   BEGIN_BATCH(33);
   OUT_BATCH(_3DSTATE_POLY_STIPPLE_PATTERN << 16 | (33 - 2));

   /* Polygon stipple is provided in OpenGL order, i.e. bottom
    * row first. If we're rendering to a window (i.e. the
    * default frame buffer object, 0), then we need to invert
    * it to match our pixel layout. But if we're rendering
    * to an FBO (i.e. any named frame buffer object), we *don't*
    * need to invert - we already match the layout.
    */
   if (ctx->DrawBuffer->Name == 0) {
      for (i = 0; i < 32; i++)
         OUT_BATCH(ctx->PolygonStipple[31 - i]); /* invert */
   } else {
      for (i = 0; i < 32; i++)
         OUT_BATCH(ctx->PolygonStipple[i]);
   }
   CACHED_BATCH();
}

const struct brw_tracked_state brw_polygon_stipple = {
   .dirty = {
      .mesa = _NEW_POLYGONSTIPPLE,
      .brw = BRW_NEW_CONTEXT,
      .cache = 0
   },
   .emit = upload_polygon_stipple
};


/***********************************************************************
 * Polygon stipple offset packet
 */

static void upload_polygon_stipple_offset(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;
   struct gl_context *ctx = &brw->intel.ctx;

   if (!ctx->Polygon.StippleFlag)
      return;

   if (intel->gen == 6)
      intel_emit_post_sync_nonzero_flush(intel);

   BEGIN_BATCH(2);
   OUT_BATCH(_3DSTATE_POLY_STIPPLE_OFFSET << 16 | (2 - 2));

   /* If we're drawing to a system window (ctx->DrawBuffer->Name == 0),
    * we have to invert the Y axis in order to match the OpenGL
    * pixel coordinate system, and our offset must be matched
    * to the window position. If we're drawing to an FBO
    * (ctx->DrawBuffer->Name != 0), then our native pixel coordinate
    * system works just fine, and there's no window system to
    * worry about.
    */
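   /* The pattern repeats every 32 rows, so offsetting by the window
    * height modulo 32 is enough to keep it anchored to the bottom of
    * the drawable.
    */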
   if (brw->intel.ctx.DrawBuffer->Name == 0)
      OUT_BATCH((32 - (ctx->DrawBuffer->Height & 31)) & 31);
   else
      OUT_BATCH(0);
   CACHED_BATCH();
}

#define _NEW_WINDOW_POS 0x40000000

const struct brw_tracked_state brw_polygon_stipple_offset = {
   .dirty = {
      .mesa = _NEW_WINDOW_POS | _NEW_POLYGONSTIPPLE,
      .brw = BRW_NEW_CONTEXT,
      .cache = 0
   },
   .emit = upload_polygon_stipple_offset
};

/**********************************************************************
 * AA Line parameters
 */
static void upload_aa_line_parameters(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;
   struct gl_context *ctx = &brw->intel.ctx;

   if (!ctx->Line.SmoothFlag || !brw->has_aa_line_parameters)
      return;

   if (intel->gen == 6)
      intel_emit_post_sync_nonzero_flush(intel);

   /* Reserve the three dwords before emitting them; the packet header
    * below declares a three-dword packet via (3 - 2).
    */
   BEGIN_BATCH(3);
   OUT_BATCH(_3DSTATE_AA_LINE_PARAMETERS << 16 | (3 - 2));
   /* use legacy aa line coverage computation */
   OUT_BATCH(0);
   OUT_BATCH(0);
   CACHED_BATCH();
}

const struct brw_tracked_state brw_aa_line_parameters = {
   .dirty = {
      .mesa = _NEW_LINE,
      .brw = BRW_NEW_CONTEXT,
      .cache = 0
   },
   .emit = upload_aa_line_parameters
};

/***********************************************************************
 * Line stipple packet
 */

static void upload_line_stipple(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;
   struct gl_context *ctx = &brw->intel.ctx;
   GLfloat tmp;
   GLint tmpi;

   if (!ctx->Line.StippleFlag)
      return;

   if (intel->gen == 6)
      intel_emit_post_sync_nonzero_flush(intel);

   BEGIN_BATCH(3);
   OUT_BATCH(_3DSTATE_LINE_STIPPLE_PATTERN << 16 | (3 - 2));
   OUT_BATCH(ctx->Line.StipplePattern);
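   /* The inverse repeat count is a fixed-point value with 13 fractional
    * bits, packed into the high half of the same dword as the integer
    * repeat factor.
    */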
   tmp = 1.0 / (GLfloat) ctx->Line.StippleFactor;
   tmpi = tmp * (1 << 13);
   OUT_BATCH(tmpi << 16 | ctx->Line.StippleFactor);
   CACHED_BATCH();
}

const struct brw_tracked_state brw_line_stipple = {
   .dirty = {
      .mesa = _NEW_LINE,
      .brw = BRW_NEW_CONTEXT,
      .cache = 0
   },
   .emit = upload_line_stipple
};


/***********************************************************************
 * Misc invariant state packets
 */

static void upload_invarient_state(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;

   /* 3DSTATE_SIP, 3DSTATE_MULTISAMPLE, etc. are nonpipelined. */
   if (intel->gen == 6)
      intel_emit_post_sync_nonzero_flush(intel);

   {
      /* 0x61040000  Pipeline Select */
      /* PipelineSelect            : 0 */
      struct brw_pipeline_select ps;

      memset(&ps, 0, sizeof(ps));
      ps.header.opcode = brw->CMD_PIPELINE_SELECT;
      ps.header.pipeline_select = 0;
      BRW_BATCH_STRUCT(brw, &ps);
   }

   if (intel->gen < 6) {
      struct brw_global_depth_offset_clamp gdo;
      memset(&gdo, 0, sizeof(gdo));

      /* Disable depth offset clamping. */
      gdo.header.opcode = _3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP;
      gdo.header.length = sizeof(gdo) / 4 - 2;
      gdo.depth_offset_clamp = 0.0;

      BRW_BATCH_STRUCT(brw, &gdo);
   }

   if (intel->gen >= 6) {
      int i;
      int len = intel->gen >= 7 ? 4 : 3;

      BEGIN_BATCH(len);
      OUT_BATCH(_3DSTATE_MULTISAMPLE << 16 | (len - 2));
      OUT_BATCH(MS_PIXEL_LOCATION_CENTER |
                MS_NUMSAMPLES_1);
      OUT_BATCH(0); /* positions for 4/8-sample */
      if (intel->gen >= 7)
         OUT_BATCH(0);
      ADVANCE_BATCH();

      BEGIN_BATCH(2);
      OUT_BATCH(_3DSTATE_SAMPLE_MASK << 16 | (2 - 2));
      OUT_BATCH(1);
      ADVANCE_BATCH();

      if (intel->gen < 7) {
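         /* Initialize each of the four streamed-vertex-buffer indices to
          * zero, with a maximum index of 0xffffffff so SVB writes are
          * never clamped.
          */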
         for (i = 0; i < 4; i++) {
            BEGIN_BATCH(4);
            OUT_BATCH(_3DSTATE_GS_SVB_INDEX << 16 | (4 - 2));
            OUT_BATCH(i << SVB_INDEX_SHIFT);
            OUT_BATCH(0);
            OUT_BATCH(0xffffffff);
            ADVANCE_BATCH();
         }
      }
   }

   /* 0x61020000  State Instruction Pointer */
   {
      struct brw_system_instruction_pointer sip;
      memset(&sip, 0, sizeof(sip));

      sip.header.opcode = CMD_STATE_INSN_POINTER;
      sip.header.length = 0;
      sip.bits0.pad = 0;
      sip.bits0.system_instruction_pointer = 0;

      BRW_BATCH_STRUCT(brw, &sip);
   }


   {
      struct brw_vf_statistics vfs;
      memset(&vfs, 0, sizeof(vfs));

      vfs.opcode = brw->CMD_VF_STATISTICS;
      if (unlikely(INTEL_DEBUG & DEBUG_STATS))
         vfs.statistics_enable = 1;

      BRW_BATCH_STRUCT(brw, &vfs);
   }
}

const struct brw_tracked_state brw_invarient_state = {
   .dirty = {
      .mesa = 0,
      .brw = BRW_NEW_CONTEXT,
      .cache = 0
   },
   .emit = upload_invarient_state
};

/**
 * Define the base addresses which some state is referenced from.
 *
 * This allows us to avoid having to emit relocations for the objects,
 * and is actually required for binding table pointers on gen6.
 *
 * Surface state base address covers binding table pointers and
 * surface state objects, but not the surfaces that the surface state
 * objects point to.
 */
static void upload_state_base_address(struct brw_context *brw)
{
   struct intel_context *intel = &brw->intel;

   /* FINISHME: According to section 3.6.1 "STATE_BASE_ADDRESS" of
    * vol1a of the G45 PRM, MI_FLUSH with the ISC invalidate should be
    * programmed prior to STATE_BASE_ADDRESS.
    *
    * However, given that the instruction SBA (general state base
    * address) on this chipset is always set to 0 across X and GL,
    * maybe this isn't required for us in particular.
    */

   if (intel->gen >= 6) {
      if (intel->gen == 6)
         intel_emit_post_sync_nonzero_flush(intel);

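      /* Bit 0 of each address dword is a modify-enable flag, so the bare
       * OUT_BATCH(1)s below program a base address (or upper bound) of
       * zero with the modify bit set, and the relocation deltas of 1 set
       * the same bit on the relocated addresses.
       */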
      BEGIN_BATCH(10);
      OUT_BATCH(CMD_STATE_BASE_ADDRESS << 16 | (10 - 2));
      /* General state base address: stateless DP read/write requests */
      OUT_BATCH(1);
      /* Surface state base address:
       * BINDING_TABLE_STATE
       * SURFACE_STATE
       */
      OUT_RELOC(intel->batch.bo, I915_GEM_DOMAIN_SAMPLER, 0, 1);
      /* Dynamic state base address:
       * SAMPLER_STATE
       * SAMPLER_BORDER_COLOR_STATE
       * CLIP, SF, WM/CC viewport state
       * COLOR_CALC_STATE
       * DEPTH_STENCIL_STATE
       * BLEND_STATE
       * Push constants (when INSTPM: CONSTANT_BUFFER Address Offset
       * Disable is clear, which we rely on)
       */
      OUT_RELOC(intel->batch.bo, (I915_GEM_DOMAIN_RENDER |
                                  I915_GEM_DOMAIN_INSTRUCTION), 0, 1);

      OUT_BATCH(1); /* Indirect object base address: MEDIA_OBJECT data */
      OUT_RELOC(brw->cache.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
                1); /* Instruction base address: shader kernels (incl. SIP) */

      OUT_BATCH(1); /* General state upper bound */
      OUT_BATCH(1); /* Dynamic state upper bound */
      OUT_BATCH(1); /* Indirect object upper bound */
      OUT_BATCH(1); /* Instruction access upper bound */
      ADVANCE_BATCH();
   } else if (intel->gen == 5) {
      BEGIN_BATCH(8);
      OUT_BATCH(CMD_STATE_BASE_ADDRESS << 16 | (8 - 2));
      OUT_BATCH(1); /* General state base address */
      OUT_RELOC(intel->batch.bo, I915_GEM_DOMAIN_SAMPLER, 0,
                1); /* Surface state base address */
      OUT_BATCH(1); /* Indirect object base address */
      OUT_RELOC(brw->cache.bo, I915_GEM_DOMAIN_INSTRUCTION, 0,
                1); /* Instruction base address */
      OUT_BATCH(1); /* General state upper bound */
      OUT_BATCH(1); /* Indirect object upper bound */
      OUT_BATCH(1); /* Instruction access upper bound */
      ADVANCE_BATCH();
   } else {
      BEGIN_BATCH(6);
      OUT_BATCH(CMD_STATE_BASE_ADDRESS << 16 | (6 - 2));
      OUT_BATCH(1); /* General state base address */
      OUT_RELOC(intel->batch.bo, I915_GEM_DOMAIN_SAMPLER, 0,
                1); /* Surface state base address */
      OUT_BATCH(1); /* Indirect object base address */
      OUT_BATCH(1); /* General state upper bound */
      OUT_BATCH(1); /* Indirect object upper bound */
      ADVANCE_BATCH();
   }

   /* According to section 3.6.1 of VOL1 of the 965 PRM,
    * STATE_BASE_ADDRESS updates require a reissue of:
    *
    * 3DSTATE_PIPELINED_POINTERS
    * 3DSTATE_BINDING_TABLE_POINTERS
    * MEDIA_STATE_POINTERS
    *
    * and this continues through Ironlake. The Sandy Bridge PRM, vol
    * 1 part 1 says that the following packets must be reissued:
    *
    * 3DSTATE_CC_POINTERS
    * 3DSTATE_BINDING_TABLE_POINTERS
    * 3DSTATE_SAMPLER_STATE_POINTERS
    * 3DSTATE_VIEWPORT_STATE_POINTERS
    * MEDIA_STATE_POINTERS
    *
    * Those are always reissued following SBA updates anyway (new
    * batch time), except in the case of the program cache BO
    * changing. Having a separate state flag makes the sequence more
    * obvious.
    */

   brw->state.dirty.brw |= BRW_NEW_STATE_BASE_ADDRESS;
}

const struct brw_tracked_state brw_state_base_address = {
   .dirty = {
      .mesa = 0,
      .brw = (BRW_NEW_BATCH |
              BRW_NEW_PROGRAM_CACHE),
      .cache = 0,
   },
   .emit = upload_state_base_address
};