i965: Resolve color for non-coherent FB fetch at UpdateState time.
[mesa.git] / src / mesa / drivers / dri / i965 / brw_context.c
1 /*
2 Copyright 2003 VMware, Inc.
3 Copyright (C) Intel Corp. 2006. All Rights Reserved.
4 Intel funded Tungsten Graphics to
5 develop this 3D driver.
6
7 Permission is hereby granted, free of charge, to any person obtaining
8 a copy of this software and associated documentation files (the
9 "Software"), to deal in the Software without restriction, including
10 without limitation the rights to use, copy, modify, merge, publish,
11 distribute, sublicense, and/or sell copies of the Software, and to
12 permit persons to whom the Software is furnished to do so, subject to
13 the following conditions:
14
15 The above copyright notice and this permission notice (including the
16 next paragraph) shall be included in all copies or substantial
17 portions of the Software.
18
19 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
20 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
22 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
23 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
24 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
25 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26
27 **********************************************************************/
28 /*
29 * Authors:
30 * Keith Whitwell <keithw@vmware.com>
31 */
32
33
34 #include "main/api_exec.h"
35 #include "main/context.h"
36 #include "main/fbobject.h"
37 #include "main/extensions.h"
38 #include "main/imports.h"
39 #include "main/macros.h"
40 #include "main/points.h"
41 #include "main/version.h"
42 #include "main/vtxfmt.h"
43 #include "main/texobj.h"
44 #include "main/framebuffer.h"
45
46 #include "vbo/vbo_context.h"
47
48 #include "drivers/common/driverfuncs.h"
49 #include "drivers/common/meta.h"
50 #include "utils.h"
51
52 #include "brw_context.h"
53 #include "brw_defines.h"
54 #include "brw_compiler.h"
55 #include "brw_draw.h"
56 #include "brw_state.h"
57
58 #include "intel_batchbuffer.h"
59 #include "intel_buffer_objects.h"
60 #include "intel_buffers.h"
61 #include "intel_fbo.h"
62 #include "intel_mipmap_tree.h"
63 #include "intel_pixel.h"
64 #include "intel_image.h"
65 #include "intel_tex.h"
66 #include "intel_tex_obj.h"
67
68 #include "swrast_setup/swrast_setup.h"
69 #include "tnl/tnl.h"
70 #include "tnl/t_pipeline.h"
71 #include "util/ralloc.h"
72 #include "util/debug.h"
73 #include "isl/isl.h"
74
75 /***************************************
76 * Mesa's Driver Functions
77 ***************************************/
78
79 const char *const brw_vendor_string = "Intel Open Source Technology Center";
80
81 static const char *
82 get_bsw_model(const struct intel_screen *intelScreen)
83 {
84 switch (intelScreen->eu_total) {
85 case 16:
86 return "405";
87 case 12:
88 return "400";
89 default:
90 return "   "; /* three spaces: the memcpy() below copies 3 bytes */
91 }
92 }
93
94 const char *
95 brw_get_renderer_string(const struct intel_screen *intelScreen)
96 {
97 const char *chipset;
98 static char buffer[128];
99 char *bsw = NULL;
100
101 switch (intelScreen->deviceID) {
102 #undef CHIPSET
103 #define CHIPSET(id, symbol, str) case id: chipset = str; break;
104 #include "pci_ids/i965_pci_ids.h"
105 default:
106 chipset = "Unknown Intel Chipset";
107 break;
108 }
109
110 /* Braswell branding is funny, so we have to fix it up here */
111 if (intelScreen->deviceID == 0x22B1) {
112 bsw = strdup(chipset);
113 char *needle = strstr(bsw, "XXX");
114 if (needle) {
115 memcpy(needle, get_bsw_model(intelScreen), 3);
116 chipset = bsw;
117 }
118 }
119
120 (void) driGetRendererString(buffer, chipset, 0);
121 free(bsw);
122 return buffer;
123 }
124
125 static const GLubyte *
126 intel_get_string(struct gl_context * ctx, GLenum name)
127 {
128 const struct brw_context *const brw = brw_context(ctx);
129
130 switch (name) {
131 case GL_VENDOR:
132 return (GLubyte *) brw_vendor_string;
133
134 case GL_RENDERER:
135 return
136 (GLubyte *) brw_get_renderer_string(brw->intelScreen);
137
138 default:
139 return NULL;
140 }
141 }
142
143 static void
144 intel_viewport(struct gl_context *ctx)
145 {
146 struct brw_context *brw = brw_context(ctx);
147 __DRIcontext *driContext = brw->driContext;
148
149 if (_mesa_is_winsys_fbo(ctx->DrawBuffer)) {
150 if (driContext->driDrawablePriv)
151 dri2InvalidateDrawable(driContext->driDrawablePriv);
152 if (driContext->driReadablePriv)
153 dri2InvalidateDrawable(driContext->driReadablePriv);
154 }
155 }
156
157 static void
158 intel_update_framebuffer(struct gl_context *ctx,
159 struct gl_framebuffer *fb)
160 {
161 struct brw_context *brw = brw_context(ctx);
162
163 /* Quantize the derived default number of samples
164 */
165 fb->DefaultGeometry._NumSamples =
166 intel_quantize_num_samples(brw->intelScreen,
167 fb->DefaultGeometry.NumSamples);
168 }
169
170 /* On Gen9 color buffers may be compressed by the hardware (lossless
171  * compression). There are, however, format restrictions, and care needs to
172  * be taken that the sampler engine is capable of re-interpreting a buffer
173  * with a format different from the one it was originally written with.
174 *
175 * For example, SRGB formats are not compressible and the sampler engine isn't
176 * capable of treating RGBA_UNORM as SRGB_ALPHA. In such a case the underlying
177 * color buffer needs to be resolved so that the sampling surface can be
178 * sampled as non-compressed (i.e., without the auxiliary MCS buffer being
179 * set).
180 */
181 static bool
182 intel_texture_view_requires_resolve(struct brw_context *brw,
183 struct intel_texture_object *intel_tex)
184 {
185 if (brw->gen < 9 ||
186 !intel_miptree_is_lossless_compressed(brw, intel_tex->mt))
187 return false;
188
189 const uint32_t brw_format = brw_format_for_mesa_format(intel_tex->_Format);
190
191 if (isl_format_supports_lossless_compression(brw->intelScreen->devinfo,
192 brw_format))
193 return false;
194
195 perf_debug("Incompatible sampling format (%s) for rbc (%s)\n",
196 _mesa_get_format_name(intel_tex->_Format),
197 _mesa_get_format_name(intel_tex->mt->format));
198
199 return true;
200 }
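/* A sketch of the intended use, mirroring intel_update_state() below: when
 * the view format cannot be decompressed by the sampler, the CCS_E resolve
 * must not be skipped.
 *
 *    const int flags = intel_texture_view_requires_resolve(brw, tex_obj) ?
 *       0 : INTEL_MIPTREE_IGNORE_CCS_E;
 *    intel_miptree_resolve_color(brw, tex_obj->mt, flags);
 *
 * For example (hypothetical case), a miptree written as RGBA_UNORM but
 * sampled through an SRGB_ALPHA view returns true here, so the full
 * resolve (flags == 0) is performed.
 */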
201
202 static void
203 intel_update_state(struct gl_context * ctx, GLuint new_state)
204 {
205 struct brw_context *brw = brw_context(ctx);
206 struct intel_texture_object *tex_obj;
207 struct intel_renderbuffer *depth_irb;
208
209 if (ctx->swrast_context)
210 _swrast_InvalidateState(ctx, new_state);
211 _vbo_InvalidateState(ctx, new_state);
212
213 brw->NewGLState |= new_state;
214
215 _mesa_unlock_context_textures(ctx);
216
217 /* Resolve the depth buffer's HiZ buffer. */
218 depth_irb = intel_get_renderbuffer(ctx->DrawBuffer, BUFFER_DEPTH);
219 if (depth_irb)
220 intel_renderbuffer_resolve_hiz(brw, depth_irb);
221
222 /* Resolve depth buffer and render cache of each enabled texture. */
223 int maxEnabledUnit = ctx->Texture._MaxEnabledTexImageUnit;
224 for (int i = 0; i <= maxEnabledUnit; i++) {
225 if (!ctx->Texture.Unit[i]._Current)
226 continue;
227 tex_obj = intel_texture_object(ctx->Texture.Unit[i]._Current);
228 if (!tex_obj || !tex_obj->mt)
229 continue;
230 intel_miptree_all_slices_resolve_depth(brw, tex_obj->mt);
231 /* The sampling engine understands lossless compression, so resolving
232  * such surfaces should be skipped for performance reasons.
233 */
234 const int flags = intel_texture_view_requires_resolve(brw, tex_obj) ?
235 0 : INTEL_MIPTREE_IGNORE_CCS_E;
236 intel_miptree_resolve_color(brw, tex_obj->mt, flags);
237 brw_render_cache_set_check_flush(brw, tex_obj->mt->bo);
238 }
239
240 /* Resolve color for each active shader image. */
241 for (unsigned i = 0; i < MESA_SHADER_STAGES; i++) {
242 const struct gl_linked_shader *shader =
243 ctx->_Shader->CurrentProgram[i] ?
244 ctx->_Shader->CurrentProgram[i]->_LinkedShaders[i] : NULL;
245
246 if (unlikely(shader && shader->NumImages)) {
247 for (unsigned j = 0; j < shader->NumImages; j++) {
248 struct gl_image_unit *u = &ctx->ImageUnits[shader->ImageUnits[j]];
249 tex_obj = intel_texture_object(u->TexObj);
250
251 if (tex_obj && tex_obj->mt) {
252 /* Access to images is implemented using indirect messages
253  * against the data port. Normal render target writes understand
254 * lossless compression but unfortunately the typed/untyped
255 * read/write interface doesn't. Therefore the compressed
256 * surfaces need to be resolved prior to accessing them.
257 */
258 intel_miptree_resolve_color(brw, tex_obj->mt, 0);
259 brw_render_cache_set_check_flush(brw, tex_obj->mt->bo);
260 }
261 }
262 }
263 }
264
265 /* Resolve color buffers for non-coherent framebuffer fetch. */
266 if (!ctx->Extensions.MESA_shader_framebuffer_fetch &&
267 ctx->FragmentProgram._Current &&
268 ctx->FragmentProgram._Current->Base.OutputsRead) {
269 const struct gl_framebuffer *fb = ctx->DrawBuffer;
270
271 for (unsigned i = 0; i < fb->_NumColorDrawBuffers; i++) {
272 const struct intel_renderbuffer *irb =
273 intel_renderbuffer(fb->_ColorDrawBuffers[i]);
274
275 if (irb &&
276 intel_miptree_resolve_color(brw, irb->mt,
277 INTEL_MIPTREE_IGNORE_CCS_E))
278 brw_render_cache_set_check_flush(brw, irb->mt->bo);
279 }
280 }
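/* Sketch of the per-buffer step above for a single (hypothetical) draw
 * buffer index 0:
 *
 *    const struct intel_renderbuffer *irb =
 *       intel_renderbuffer(fb->_ColorDrawBuffers[0]);
 *    if (irb && intel_miptree_resolve_color(brw, irb->mt,
 *                                           INTEL_MIPTREE_IGNORE_CCS_E))
 *       brw_render_cache_set_check_flush(brw, irb->mt->bo);
 *
 * INTEL_MIPTREE_IGNORE_CCS_E skips the lossless-compression resolve here;
 * presumably the fetch reads the buffer in the same format it was rendered
 * with, so only fast-clear state has to be resolved before the flush.
 */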
281
282 /* If FRAMEBUFFER_SRGB is used on Gen9+ then we need to resolve any of the
283 * single-sampled color renderbuffers because the CCS buffer isn't
284 * supported for SRGB formats. This only matters if FRAMEBUFFER_SRGB is
285 * enabled because otherwise the surface state will be programmed with the
286 * linear equivalent format anyway.
287 */
288 if (brw->gen >= 9 && ctx->Color.sRGBEnabled) {
289 struct gl_framebuffer *fb = ctx->DrawBuffer;
290 for (int i = 0; i < fb->_NumColorDrawBuffers; i++) {
291 struct gl_renderbuffer *rb = fb->_ColorDrawBuffers[i];
292
293 if (rb == NULL)
294 continue;
295
296 struct intel_renderbuffer *irb = intel_renderbuffer(rb);
297 struct intel_mipmap_tree *mt = irb->mt;
298
299 if (mt == NULL ||
300 mt->num_samples > 1 ||
301 _mesa_get_srgb_format_linear(mt->format) == mt->format)
302 continue;
303
304 /* Lossless compression is not supported for SRGB formats, it
305 * should be impossible to get here with such surfaces.
306 */
307 assert(!intel_miptree_is_lossless_compressed(brw, mt));
308 intel_miptree_resolve_color(brw, mt, 0);
309 brw_render_cache_set_check_flush(brw, mt->bo);
310 }
311 }
312
313 _mesa_lock_context_textures(ctx);
314
315 if (new_state & _NEW_BUFFERS) {
316 intel_update_framebuffer(ctx, ctx->DrawBuffer);
317 if (ctx->DrawBuffer != ctx->ReadBuffer)
318 intel_update_framebuffer(ctx, ctx->ReadBuffer);
319 }
320 }
321
322 #define flushFront(screen) ((screen)->image.loader ? (screen)->image.loader->flushFrontBuffer : (screen)->dri2.loader->flushFrontBuffer)
323
324 static void
325 intel_flush_front(struct gl_context *ctx)
326 {
327 struct brw_context *brw = brw_context(ctx);
328 __DRIcontext *driContext = brw->driContext;
329 __DRIdrawable *driDrawable = driContext->driDrawablePriv;
330 __DRIscreen *const screen = brw->intelScreen->driScrnPriv;
331
332 if (brw->front_buffer_dirty && _mesa_is_winsys_fbo(ctx->DrawBuffer)) {
333 if (flushFront(screen) && driDrawable &&
334 driDrawable->loaderPrivate) {
335
336 /* Resolve before flushing FAKE_FRONT_LEFT to FRONT_LEFT.
337 *
338  * This potentially resolves both the front and back buffers. It
339 * is unnecessary to resolve the back, but harms nothing except
340 * performance. And no one cares about front-buffer render
341 * performance.
342 */
343 intel_resolve_for_dri2_flush(brw, driDrawable);
344 intel_batchbuffer_flush(brw);
345
346 flushFront(screen)(driDrawable, driDrawable->loaderPrivate);
347
348 /* We set the dirty bit in intel_prepare_render() if we're
349 * front buffer rendering once we get there.
350 */
351 brw->front_buffer_dirty = false;
352 }
353 }
354 }
355
356 static void
357 intel_glFlush(struct gl_context *ctx)
358 {
359 struct brw_context *brw = brw_context(ctx);
360
361 intel_batchbuffer_flush(brw);
362 intel_flush_front(ctx);
363
364 brw->need_flush_throttle = true;
365 }
366
367 static void
368 intel_finish(struct gl_context * ctx)
369 {
370 struct brw_context *brw = brw_context(ctx);
371
372 intel_glFlush(ctx);
373
374 if (brw->batch.last_bo)
375 drm_intel_bo_wait_rendering(brw->batch.last_bo);
376 }
377
378 static void
379 brw_init_driver_functions(struct brw_context *brw,
380 struct dd_function_table *functions)
381 {
382 _mesa_init_driver_functions(functions);
383
384 /* GLX uses DRI2 invalidate events to handle window resizing.
385 * Unfortunately, EGL does not - libEGL is written in XCB (not Xlib),
386 * which doesn't provide a mechanism for snooping the event queues.
387 *
388 * So EGL still relies on viewport hacks to handle window resizing.
389 * This should go away with DRI3000.
390 */
391 if (!brw->driContext->driScreenPriv->dri2.useInvalidate)
392 functions->Viewport = intel_viewport;
393
394 functions->Flush = intel_glFlush;
395 functions->Finish = intel_finish;
396 functions->GetString = intel_get_string;
397 functions->UpdateState = intel_update_state;
398
399 intelInitTextureFuncs(functions);
400 intelInitTextureImageFuncs(functions);
401 intelInitTextureSubImageFuncs(functions);
402 intelInitTextureCopyImageFuncs(functions);
403 intelInitCopyImageFuncs(functions);
404 intelInitClearFuncs(functions);
405 intelInitBufferFuncs(functions);
406 intelInitPixelFuncs(functions);
407 intelInitBufferObjectFuncs(functions);
408 intel_init_syncobj_functions(functions);
409 brw_init_object_purgeable_functions(functions);
410
411 brwInitFragProgFuncs( functions );
412 brw_init_common_queryobj_functions(functions);
413 if (brw->gen >= 8 || brw->is_haswell)
414 hsw_init_queryobj_functions(functions);
415 else if (brw->gen >= 6)
416 gen6_init_queryobj_functions(functions);
417 else
418 gen4_init_queryobj_functions(functions);
419 brw_init_compute_functions(functions);
420 if (brw->gen >= 7)
421 brw_init_conditional_render_functions(functions);
422
423 functions->QueryInternalFormat = brw_query_internal_format;
424
425 functions->NewTransformFeedback = brw_new_transform_feedback;
426 functions->DeleteTransformFeedback = brw_delete_transform_feedback;
427 if (brw->intelScreen->has_mi_math_and_lrr) {
428 functions->BeginTransformFeedback = hsw_begin_transform_feedback;
429 functions->EndTransformFeedback = hsw_end_transform_feedback;
430 functions->PauseTransformFeedback = hsw_pause_transform_feedback;
431 functions->ResumeTransformFeedback = hsw_resume_transform_feedback;
432 } else if (brw->gen >= 7) {
433 functions->BeginTransformFeedback = gen7_begin_transform_feedback;
434 functions->EndTransformFeedback = gen7_end_transform_feedback;
435 functions->PauseTransformFeedback = gen7_pause_transform_feedback;
436 functions->ResumeTransformFeedback = gen7_resume_transform_feedback;
437 functions->GetTransformFeedbackVertexCount =
438 brw_get_transform_feedback_vertex_count;
439 } else {
440 functions->BeginTransformFeedback = brw_begin_transform_feedback;
441 functions->EndTransformFeedback = brw_end_transform_feedback;
442 }
443
444 if (brw->gen >= 6)
445 functions->GetSamplePosition = gen6_get_sample_position;
446 }
447
448 static void
449 brw_initialize_context_constants(struct brw_context *brw)
450 {
451 struct gl_context *ctx = &brw->ctx;
452 const struct brw_compiler *compiler = brw->intelScreen->compiler;
453
454 const bool stage_exists[MESA_SHADER_STAGES] = {
455 [MESA_SHADER_VERTEX] = true,
456 [MESA_SHADER_TESS_CTRL] = brw->gen >= 7,
457 [MESA_SHADER_TESS_EVAL] = brw->gen >= 7,
458 [MESA_SHADER_GEOMETRY] = brw->gen >= 6,
459 [MESA_SHADER_FRAGMENT] = true,
460 [MESA_SHADER_COMPUTE] =
461 (ctx->API == API_OPENGL_CORE &&
462 ctx->Const.MaxComputeWorkGroupSize[0] >= 1024) ||
463 (ctx->API == API_OPENGLES2 &&
464 ctx->Const.MaxComputeWorkGroupSize[0] >= 128) ||
465 _mesa_extension_override_enables.ARB_compute_shader,
466 };
467
468 unsigned num_stages = 0;
469 for (int i = 0; i < MESA_SHADER_STAGES; i++) {
470 if (stage_exists[i])
471 num_stages++;
472 }
473
474 unsigned max_samplers =
475 brw->gen >= 8 || brw->is_haswell ? BRW_MAX_TEX_UNIT : 16;
476
477 ctx->Const.MaxDualSourceDrawBuffers = 1;
478 ctx->Const.MaxDrawBuffers = BRW_MAX_DRAW_BUFFERS;
479 ctx->Const.MaxCombinedShaderOutputResources =
480 MAX_IMAGE_UNITS + BRW_MAX_DRAW_BUFFERS;
481
482 ctx->Const.QueryCounterBits.Timestamp = 36;
483
484 ctx->Const.MaxTextureCoordUnits = 8; /* Mesa limit */
485 ctx->Const.MaxImageUnits = MAX_IMAGE_UNITS;
486 ctx->Const.MaxRenderbufferSize = 8192;
487 ctx->Const.MaxTextureLevels = MIN2(14 /* 8192 */, MAX_TEXTURE_LEVELS);
488
489 /* On Sandy Bridge and prior, the "Render Target View Extent" field of
490 * RENDER_SURFACE_STATE is only 9 bits so the largest 3-D texture we can do
491 * a layered render into has a depth of 512. On Iron Lake and earlier, we
492 * don't support layered rendering and we use manual offsetting to render
493 * into the different layers so this doesn't matter. On Sandy Bridge,
494 * however, we do support layered rendering so this is a problem.
495 */
496 ctx->Const.Max3DTextureLevels = brw->gen == 6 ? 10 /* 512 */ : 12; /* 2048 */
497
498 ctx->Const.MaxCubeTextureLevels = 14; /* 8192 */
499 ctx->Const.MaxArrayTextureLayers = brw->gen >= 7 ? 2048 : 512;
500 ctx->Const.MaxTextureMbytes = 1536;
501 ctx->Const.MaxTextureRectSize = 1 << 12;
502 ctx->Const.MaxTextureMaxAnisotropy = 16.0;
503 ctx->Const.StripTextureBorder = true;
504 if (brw->gen >= 7)
505 ctx->Const.MaxProgramTextureGatherComponents = 4;
506 else if (brw->gen == 6)
507 ctx->Const.MaxProgramTextureGatherComponents = 1;
508
509 ctx->Const.MaxUniformBlockSize = 65536;
510
511 for (int i = 0; i < MESA_SHADER_STAGES; i++) {
512 struct gl_program_constants *prog = &ctx->Const.Program[i];
513
514 if (!stage_exists[i])
515 continue;
516
517 prog->MaxTextureImageUnits = max_samplers;
518
519 prog->MaxUniformBlocks = BRW_MAX_UBO;
520 prog->MaxCombinedUniformComponents =
521 prog->MaxUniformComponents +
522 ctx->Const.MaxUniformBlockSize / 4 * prog->MaxUniformBlocks;
523
524 prog->MaxAtomicCounters = MAX_ATOMIC_COUNTERS;
525 prog->MaxAtomicBuffers = BRW_MAX_ABO;
526 prog->MaxImageUniforms = compiler->scalar_stage[i] ? BRW_MAX_IMAGES : 0;
527 prog->MaxShaderStorageBlocks = BRW_MAX_SSBO;
528 }
529
530 ctx->Const.MaxTextureUnits =
531 MIN2(ctx->Const.MaxTextureCoordUnits,
532 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxTextureImageUnits);
533
534 ctx->Const.MaxUniformBufferBindings = num_stages * BRW_MAX_UBO;
535 ctx->Const.MaxCombinedUniformBlocks = num_stages * BRW_MAX_UBO;
536 ctx->Const.MaxCombinedAtomicBuffers = num_stages * BRW_MAX_ABO;
537 ctx->Const.MaxCombinedShaderStorageBlocks = num_stages * BRW_MAX_SSBO;
538 ctx->Const.MaxShaderStorageBufferBindings = num_stages * BRW_MAX_SSBO;
539 ctx->Const.MaxCombinedTextureImageUnits = num_stages * max_samplers;
540 ctx->Const.MaxCombinedImageUniforms = num_stages * BRW_MAX_IMAGES;
541
542
543 /* Hardware only supports a limited number of transform feedback buffers.
544 * So we need to override the Mesa default (which is based only on software
545 * limits).
546 */
547 ctx->Const.MaxTransformFeedbackBuffers = BRW_MAX_SOL_BUFFERS;
548
549 /* On Gen6, in the worst case, we use up one binding table entry per
550 * transform feedback component (see comments above the definition of
551 * BRW_MAX_SOL_BINDINGS, in brw_context.h), so we need to advertise a value
552 * for MAX_TRANSFORM_FEEDBACK_INTERLEAVED_COMPONENTS equal to
553 * BRW_MAX_SOL_BINDINGS.
554 *
555 * In "separate components" mode, we need to divide this value by
556 * BRW_MAX_SOL_BUFFERS, so that the total number of binding table entries
557 * used up by all buffers will not exceed BRW_MAX_SOL_BINDINGS.
558 */
559 ctx->Const.MaxTransformFeedbackInterleavedComponents = BRW_MAX_SOL_BINDINGS;
560 ctx->Const.MaxTransformFeedbackSeparateComponents =
561 BRW_MAX_SOL_BINDINGS / BRW_MAX_SOL_BUFFERS;
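/* Worked example, assuming the definitions in brw_context.h at the time of
 * writing (BRW_MAX_SOL_BINDINGS = 64, BRW_MAX_SOL_BUFFERS = 4): interleaved
 * mode may spend all 64 binding table entries on a single buffer, while
 * separate mode advertises 64 / 4 = 16 components per buffer so that four
 * buffers together can never exceed the 64-entry budget.
 */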
562
563 ctx->Const.AlwaysUseGetTransformFeedbackVertexCount =
564 !brw->intelScreen->has_mi_math_and_lrr;
565
566 int max_samples;
567 const int *msaa_modes = intel_supported_msaa_modes(brw->intelScreen);
568 const int clamp_max_samples =
569 driQueryOptioni(&brw->optionCache, "clamp_max_samples");
570
571 if (clamp_max_samples < 0) {
572 max_samples = msaa_modes[0];
573 } else {
574 /* Select the largest supported MSAA mode that does not exceed
575 * clamp_max_samples.
576 */
577 max_samples = 0;
578 for (int i = 0; msaa_modes[i] != 0; ++i) {
579 if (msaa_modes[i] <= clamp_max_samples) {
580 max_samples = msaa_modes[i];
581 break;
582 }
583 }
584 }
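/* For example (hypothetical values): with msaa_modes = {8, 4, 2, 0} and
 * clamp_max_samples = 6, the loop above picks 4, the largest supported mode
 * not exceeding the clamp; with clamp_max_samples = 1 no mode qualifies and
 * max_samples stays 0, i.e. multisampling is effectively disabled.
 */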
585
586 ctx->Const.MaxSamples = max_samples;
587 ctx->Const.MaxColorTextureSamples = max_samples;
588 ctx->Const.MaxDepthTextureSamples = max_samples;
589 ctx->Const.MaxIntegerSamples = max_samples;
590 ctx->Const.MaxImageSamples = 0;
591
592 /* gen6_set_sample_maps() sets SampleMap{2,4,8}x variables which are used
593 * to map indices of rectangular grid to sample numbers within a pixel.
594 * These variables are used by GL_EXT_framebuffer_multisample_blit_scaled
595 * extension implementation. For more details see the comment above
596 * gen6_set_sample_maps() definition.
597 */
598 gen6_set_sample_maps(ctx);
599
600 ctx->Const.MinLineWidth = 1.0;
601 ctx->Const.MinLineWidthAA = 1.0;
602 if (brw->gen >= 6) {
603 ctx->Const.MaxLineWidth = 7.375;
604 ctx->Const.MaxLineWidthAA = 7.375;
605 ctx->Const.LineWidthGranularity = 0.125;
606 } else {
607 ctx->Const.MaxLineWidth = 7.0;
608 ctx->Const.MaxLineWidthAA = 7.0;
609 ctx->Const.LineWidthGranularity = 0.5;
610 }
611
612 /* For non-antialiased lines, we have to round the line width to the
613 * nearest whole number. Make sure that we don't advertise a line
614 * width that, when rounded, will be beyond the actual hardware
615 * maximum.
616 */
617 assert(roundf(ctx->Const.MaxLineWidth) <= ctx->Const.MaxLineWidth);
618
619 ctx->Const.MinPointSize = 1.0;
620 ctx->Const.MinPointSizeAA = 1.0;
621 ctx->Const.MaxPointSize = 255.0;
622 ctx->Const.MaxPointSizeAA = 255.0;
623 ctx->Const.PointSizeGranularity = 1.0;
624
625 if (brw->gen >= 5 || brw->is_g4x)
626 ctx->Const.MaxClipPlanes = 8;
627
628 ctx->Const.LowerTessLevel = true;
629 ctx->Const.LowerTCSPatchVerticesIn = brw->gen >= 8;
630 ctx->Const.LowerTESPatchVerticesIn = true;
631 ctx->Const.PrimitiveRestartForPatches = true;
632
633 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeInstructions = 16 * 1024;
634 ctx->Const.Program[MESA_SHADER_VERTEX].MaxAluInstructions = 0;
635 ctx->Const.Program[MESA_SHADER_VERTEX].MaxTexInstructions = 0;
636 ctx->Const.Program[MESA_SHADER_VERTEX].MaxTexIndirections = 0;
637 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeAluInstructions = 0;
638 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeTexInstructions = 0;
639 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeTexIndirections = 0;
640 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeAttribs = 16;
641 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeTemps = 256;
642 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeAddressRegs = 1;
643 ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeParameters = 1024;
644 ctx->Const.Program[MESA_SHADER_VERTEX].MaxEnvParams =
645 MIN2(ctx->Const.Program[MESA_SHADER_VERTEX].MaxNativeParameters,
646 ctx->Const.Program[MESA_SHADER_VERTEX].MaxEnvParams);
647
648 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeInstructions = 1024;
649 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeAluInstructions = 1024;
650 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeTexInstructions = 1024;
651 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeTexIndirections = 1024;
652 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeAttribs = 12;
653 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeTemps = 256;
654 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeAddressRegs = 0;
655 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeParameters = 1024;
656 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxEnvParams =
657 MIN2(ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxNativeParameters,
658 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxEnvParams);
659
660 /* Fragment shaders use real, 32-bit two's-complement integers for all
661 * integer types.
662 */
663 ctx->Const.Program[MESA_SHADER_FRAGMENT].LowInt.RangeMin = 31;
664 ctx->Const.Program[MESA_SHADER_FRAGMENT].LowInt.RangeMax = 30;
665 ctx->Const.Program[MESA_SHADER_FRAGMENT].LowInt.Precision = 0;
666 ctx->Const.Program[MESA_SHADER_FRAGMENT].HighInt = ctx->Const.Program[MESA_SHADER_FRAGMENT].LowInt;
667 ctx->Const.Program[MESA_SHADER_FRAGMENT].MediumInt = ctx->Const.Program[MESA_SHADER_FRAGMENT].LowInt;
668
669 ctx->Const.Program[MESA_SHADER_VERTEX].LowInt.RangeMin = 31;
670 ctx->Const.Program[MESA_SHADER_VERTEX].LowInt.RangeMax = 30;
671 ctx->Const.Program[MESA_SHADER_VERTEX].LowInt.Precision = 0;
672 ctx->Const.Program[MESA_SHADER_VERTEX].HighInt = ctx->Const.Program[MESA_SHADER_VERTEX].LowInt;
673 ctx->Const.Program[MESA_SHADER_VERTEX].MediumInt = ctx->Const.Program[MESA_SHADER_VERTEX].LowInt;
674
675 /* Gen6 converts quads to polygons at the beginning of the 3D pipeline,
676  * but we're not sure how this is done with respect to vertex order,
677  * which affects the provoking vertex decision. Always use the last-vertex
678  * convention for quad primitives, which works as expected for now.
679 */
680 if (brw->gen >= 6)
681 ctx->Const.QuadsFollowProvokingVertexConvention = false;
682
683 ctx->Const.NativeIntegers = true;
684 ctx->Const.VertexID_is_zero_based = true;
685
686 /* Regarding the CMP instruction, the Ivybridge PRM says:
687 *
688 * "For each enabled channel 0b or 1b is assigned to the appropriate flag
689 * bit and 0/all zeros or all ones (e.g, byte 0xFF, word 0xFFFF, DWord
690 * 0xFFFFFFFF) is assigned to dst."
691 *
692 * but PRMs for earlier generations say
693 *
694 * "In dword format, one GRF may store up to 8 results. When the register
695 * is used later as a vector of Booleans, as only LSB at each channel
696 * contains meaning [sic] data, software should make sure all higher bits
697 * are masked out (e.g. by 'and-ing' an [sic] 0x01 constant)."
698 *
699 * We select the representation of a true boolean uniform to be ~0, and fix
700 * the results of Gen <= 5 CMP instruction's with -(result & 1).
701  * the results of Gen <= 5 CMP instructions with -(result & 1).
702 ctx->Const.UniformBooleanTrue = ~0;
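/* Worked example of the Gen <= 5 fixup: only the LSB of each CMP result
 * channel is defined there, so a raw channel value of 0x00000001 is
 * normalized with -(result & 1) = -1 = 0xFFFFFFFF, matching the ~0
 * representation of true chosen above; any channel with LSB 0 maps to 0.
 */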
703
704 /* From the gen4 PRM, volume 4 page 127:
705 *
706 * "For SURFTYPE_BUFFER non-rendertarget surfaces, this field specifies
707 * the base address of the first element of the surface, computed in
708 * software by adding the surface base address to the byte offset of
709 * the element in the buffer."
710 *
711 * However, unaligned accesses are slower, so enforce buffer alignment.
712 */
713 ctx->Const.UniformBufferOffsetAlignment = 16;
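/* Consequence for API users (illustrative, standard GL usage): offsets
 * passed to glBindBufferRange(GL_UNIFORM_BUFFER, ...) must be multiples of
 * GL_UNIFORM_BUFFER_OFFSET_ALIGNMENT, i.e. of 16 here:
 *
 *    glBindBufferRange(GL_UNIFORM_BUFFER, 0, ubo, 0,  256);   ok
 *    glBindBufferRange(GL_UNIFORM_BUFFER, 1, ubo, 16, 256);   ok
 *    glBindBufferRange(GL_UNIFORM_BUFFER, 2, ubo, 8,  256);   GL_INVALID_VALUE
 */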
714
715 /* ShaderStorageBufferOffsetAlignment should be a cacheline (64 bytes) so
716 * that we can safely have the CPU and GPU writing the same SSBO on
717  * non-cache-coherent systems (our Atom CPUs). With UBOs, the GPU never
718 * writes, so there's no problem. For an SSBO, the GPU and the CPU can
719 * be updating disjoint regions of the buffer simultaneously and that will
720 * break if the regions overlap the same cacheline.
721 */
722 ctx->Const.ShaderStorageBufferOffsetAlignment = 64;
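/* Failure mode this avoids (illustrative): if a CPU write to bytes 0..31
 * and a GPU write to bytes 32..63 of an SSBO shared one 64-byte cacheline,
 * whichever cache flushed last would clobber the other's data on a
 * non-cache-coherent system. A 64-byte binding alignment keeps disjoint
 * bindings on disjoint cachelines.
 */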
723 ctx->Const.TextureBufferOffsetAlignment = 16;
724 ctx->Const.MaxTextureBufferSize = 128 * 1024 * 1024;
725
726 if (brw->gen >= 6) {
727 ctx->Const.MaxVarying = 32;
728 ctx->Const.Program[MESA_SHADER_VERTEX].MaxOutputComponents = 128;
729 ctx->Const.Program[MESA_SHADER_GEOMETRY].MaxInputComponents = 64;
730 ctx->Const.Program[MESA_SHADER_GEOMETRY].MaxOutputComponents = 128;
731 ctx->Const.Program[MESA_SHADER_FRAGMENT].MaxInputComponents = 128;
732 ctx->Const.Program[MESA_SHADER_TESS_CTRL].MaxInputComponents = 128;
733 ctx->Const.Program[MESA_SHADER_TESS_CTRL].MaxOutputComponents = 128;
734 ctx->Const.Program[MESA_SHADER_TESS_EVAL].MaxInputComponents = 128;
735 ctx->Const.Program[MESA_SHADER_TESS_EVAL].MaxOutputComponents = 128;
736 }
737
738 /* We want the GLSL compiler to emit code that uses condition codes */
739 for (int i = 0; i < MESA_SHADER_STAGES; i++) {
740 ctx->Const.ShaderCompilerOptions[i] =
741 brw->intelScreen->compiler->glsl_compiler_options[i];
742 }
743
744 if (brw->gen >= 7) {
745 ctx->Const.MaxViewportWidth = 32768;
746 ctx->Const.MaxViewportHeight = 32768;
747 }
748
749 /* ARB_viewport_array */
750 if (brw->gen >= 6 && ctx->API == API_OPENGL_CORE) {
751 ctx->Const.MaxViewports = GEN6_NUM_VIEWPORTS;
752 ctx->Const.ViewportSubpixelBits = 0;
753
754 /* Cast to float before negating because MaxViewportWidth is unsigned.
755 */
756 ctx->Const.ViewportBounds.Min = -(float)ctx->Const.MaxViewportWidth;
757 ctx->Const.ViewportBounds.Max = ctx->Const.MaxViewportWidth;
758 }
759
760 /* ARB_gpu_shader5 */
761 if (brw->gen >= 7)
762 ctx->Const.MaxVertexStreams = MIN2(4, MAX_VERTEX_STREAMS);
763
764 /* ARB_framebuffer_no_attachments */
765 ctx->Const.MaxFramebufferWidth = 16384;
766 ctx->Const.MaxFramebufferHeight = 16384;
767 ctx->Const.MaxFramebufferLayers = ctx->Const.MaxArrayTextureLayers;
768 ctx->Const.MaxFramebufferSamples = max_samples;
769 }
770
771 static void
772 brw_initialize_cs_context_constants(struct brw_context *brw, unsigned max_threads)
773 {
774 struct gl_context *ctx = &brw->ctx;
775 /* Maximum number of scalar compute shader invocations that can be run in
776 * parallel in the same subslice assuming SIMD32 dispatch.
777 */
778 const uint32_t max_invocations = 32 * max_threads;
779 ctx->Const.MaxComputeWorkGroupSize[0] = max_invocations;
780 ctx->Const.MaxComputeWorkGroupSize[1] = max_invocations;
781 ctx->Const.MaxComputeWorkGroupSize[2] = max_invocations;
782 ctx->Const.MaxComputeWorkGroupInvocations = max_invocations;
783 ctx->Const.MaxComputeSharedMemorySize = 64 * 1024;
784 }
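/* Worked example (hypothetical thread count): with max_threads = 64 the
 * function above advertises 32 * 64 = 2048 for
 * GL_MAX_COMPUTE_WORK_GROUP_INVOCATIONS and for each dimension of
 * GL_MAX_COMPUTE_WORK_GROUP_SIZE, i.e. one subslice's worth of SIMD32
 * invocations.
 */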
785
786 /**
787 * Process driconf (drirc) options, setting appropriate context flags.
788 *
789 * intelInitExtensions still pokes at optionCache directly, in order to
790 * avoid advertising various extensions. No flags are set, so it makes
791 * sense to continue doing that there.
792 */
793 static void
794 brw_process_driconf_options(struct brw_context *brw)
795 {
796 struct gl_context *ctx = &brw->ctx;
797
798 driOptionCache *options = &brw->optionCache;
799 driParseConfigFiles(options, &brw->intelScreen->optionCache,
800 brw->driContext->driScreenPriv->myNum, "i965");
801
802 int bo_reuse_mode = driQueryOptioni(options, "bo_reuse");
803 switch (bo_reuse_mode) {
804 case DRI_CONF_BO_REUSE_DISABLED:
805 break;
806 case DRI_CONF_BO_REUSE_ALL:
807 intel_bufmgr_gem_enable_reuse(brw->bufmgr);
808 break;
809 }
810
811 if (!driQueryOptionb(options, "hiz")) {
812 brw->has_hiz = false;
813 /* On gen6, you can only do separate stencil with HIZ. */
814 if (brw->gen == 6)
815 brw->has_separate_stencil = false;
816 }
817
818 if (driQueryOptionb(options, "always_flush_batch")) {
819 fprintf(stderr, "flushing batchbuffer before/after each draw call\n");
820 brw->always_flush_batch = true;
821 }
822
823 if (driQueryOptionb(options, "always_flush_cache")) {
824 fprintf(stderr, "flushing GPU caches before/after each draw call\n");
825 brw->always_flush_cache = true;
826 }
827
828 if (driQueryOptionb(options, "disable_throttling")) {
829 fprintf(stderr, "disabling flush throttling\n");
830 brw->disable_throttling = true;
831 }
832
833 brw->precompile = driQueryOptionb(&brw->optionCache, "shader_precompile");
834
835 if (driQueryOptionb(&brw->optionCache, "precise_trig"))
836 brw->intelScreen->compiler->precise_trig = true;
837
838 ctx->Const.ForceGLSLExtensionsWarn =
839 driQueryOptionb(options, "force_glsl_extensions_warn");
840
841 ctx->Const.DisableGLSLLineContinuations =
842 driQueryOptionb(options, "disable_glsl_line_continuations");
843
844 ctx->Const.AllowGLSLExtensionDirectiveMidShader =
845 driQueryOptionb(options, "allow_glsl_extension_directive_midshader");
846
847 ctx->Const.GLSLZeroInit = driQueryOptionb(options, "glsl_zero_init");
848
849 brw->dual_color_blend_by_location =
850 driQueryOptionb(options, "dual_color_blend_by_location");
851 }
852
853 GLboolean
854 brwCreateContext(gl_api api,
855 const struct gl_config *mesaVis,
856 __DRIcontext *driContextPriv,
857 unsigned major_version,
858 unsigned minor_version,
859 uint32_t flags,
860 bool notify_reset,
861 unsigned *dri_ctx_error,
862 void *sharedContextPrivate)
863 {
864 __DRIscreen *sPriv = driContextPriv->driScreenPriv;
865 struct gl_context *shareCtx = (struct gl_context *) sharedContextPrivate;
866 struct intel_screen *screen = sPriv->driverPrivate;
867 const struct brw_device_info *devinfo = screen->devinfo;
868 struct dd_function_table functions;
869
870 /* Only allow the __DRI_CTX_FLAG_ROBUST_BUFFER_ACCESS flag if the kernel
871 * provides us with context reset notifications.
872 */
873 uint32_t allowed_flags = __DRI_CTX_FLAG_DEBUG
874 | __DRI_CTX_FLAG_FORWARD_COMPATIBLE;
875
876 if (screen->has_context_reset_notification)
877 allowed_flags |= __DRI_CTX_FLAG_ROBUST_BUFFER_ACCESS;
878
879 if (flags & ~allowed_flags) {
880 *dri_ctx_error = __DRI_CTX_ERROR_UNKNOWN_FLAG;
881 return false;
882 }
883
884 struct brw_context *brw = rzalloc(NULL, struct brw_context);
885 if (!brw) {
886 fprintf(stderr, "%s: failed to alloc context\n", __func__);
887 *dri_ctx_error = __DRI_CTX_ERROR_NO_MEMORY;
888 return false;
889 }
890
891 driContextPriv->driverPrivate = brw;
892 brw->driContext = driContextPriv;
893 brw->intelScreen = screen;
894 brw->bufmgr = screen->bufmgr;
895
896 brw->gen = devinfo->gen;
897 brw->gt = devinfo->gt;
898 brw->is_g4x = devinfo->is_g4x;
899 brw->is_baytrail = devinfo->is_baytrail;
900 brw->is_haswell = devinfo->is_haswell;
901 brw->is_cherryview = devinfo->is_cherryview;
902 brw->is_broxton = devinfo->is_broxton;
903 brw->has_llc = devinfo->has_llc;
904 brw->has_hiz = devinfo->has_hiz_and_separate_stencil;
905 brw->has_separate_stencil = devinfo->has_hiz_and_separate_stencil;
906 brw->has_pln = devinfo->has_pln;
907 brw->has_compr4 = devinfo->has_compr4;
908 brw->has_surface_tile_offset = devinfo->has_surface_tile_offset;
909 brw->has_negative_rhw_bug = devinfo->has_negative_rhw_bug;
910 brw->needs_unlit_centroid_workaround =
911 devinfo->needs_unlit_centroid_workaround;
912
913 brw->must_use_separate_stencil = devinfo->must_use_separate_stencil;
914 brw->has_swizzling = screen->hw_has_swizzling;
915
916 isl_device_init(&brw->isl_dev, devinfo, screen->hw_has_swizzling);
917
918 brw->vs.base.stage = MESA_SHADER_VERTEX;
919 brw->tcs.base.stage = MESA_SHADER_TESS_CTRL;
920 brw->tes.base.stage = MESA_SHADER_TESS_EVAL;
921 brw->gs.base.stage = MESA_SHADER_GEOMETRY;
922 brw->wm.base.stage = MESA_SHADER_FRAGMENT;
923 if (brw->gen >= 8) {
924 gen8_init_vtable_surface_functions(brw);
925 brw->vtbl.emit_depth_stencil_hiz = gen8_emit_depth_stencil_hiz;
926 } else if (brw->gen >= 7) {
927 gen7_init_vtable_surface_functions(brw);
928 brw->vtbl.emit_depth_stencil_hiz = gen7_emit_depth_stencil_hiz;
929 } else if (brw->gen >= 6) {
930 gen6_init_vtable_surface_functions(brw);
931 brw->vtbl.emit_depth_stencil_hiz = gen6_emit_depth_stencil_hiz;
932 } else {
933 gen4_init_vtable_surface_functions(brw);
934 brw->vtbl.emit_depth_stencil_hiz = brw_emit_depth_stencil_hiz;
935 }
936
937 brw_init_driver_functions(brw, &functions);
938
939 if (notify_reset)
940 functions.GetGraphicsResetStatus = brw_get_graphics_reset_status;
941
942 struct gl_context *ctx = &brw->ctx;
943
944 if (!_mesa_initialize_context(ctx, api, mesaVis, shareCtx, &functions)) {
945 *dri_ctx_error = __DRI_CTX_ERROR_NO_MEMORY;
946 fprintf(stderr, "%s: failed to init mesa context\n", __func__);
947 intelDestroyContext(driContextPriv);
948 return false;
949 }
950
951 driContextSetFlags(ctx, flags);
952
953 /* Initialize the software rasterizer and helper modules.
954 *
955 * As of GL 3.1 core, the gen4+ driver doesn't need the swrast context for
956 * software fallbacks (which we have to support on legacy GL to do weird
957 * glDrawPixels(), glBitmap(), and other functions).
958 */
959 if (api != API_OPENGL_CORE && api != API_OPENGLES2) {
960 _swrast_CreateContext(ctx);
961 }
962
963 _vbo_CreateContext(ctx);
964 if (ctx->swrast_context) {
965 _tnl_CreateContext(ctx);
966 TNL_CONTEXT(ctx)->Driver.RunPipeline = _tnl_run_pipeline;
967 _swsetup_CreateContext(ctx);
968
969 /* Configure swrast to match hardware characteristics: */
970 _swrast_allow_pixel_fog(ctx, false);
971 _swrast_allow_vertex_fog(ctx, true);
972 }
973
974 _mesa_meta_init(ctx);
975
976 brw_process_driconf_options(brw);
977
978 if (INTEL_DEBUG & DEBUG_PERF)
979 brw->perf_debug = true;
980
981 brw_initialize_cs_context_constants(brw, devinfo->max_cs_threads);
982 brw_initialize_context_constants(brw);
983
984 ctx->Const.ResetStrategy = notify_reset
985 ? GL_LOSE_CONTEXT_ON_RESET_ARB : GL_NO_RESET_NOTIFICATION_ARB;
986
987 /* Reinitialize the context point state. It depends on ctx->Const values. */
988 _mesa_init_point(ctx);
989
990 intel_fbo_init(brw);
991
992 intel_batchbuffer_init(brw);
993
994 if (brw->gen >= 6) {
995 /* Create a new hardware context. Using a hardware context means that
996 * our GPU state will be saved/restored on context switch, allowing us
997 * to assume that the GPU is in the same state we left it in.
998 *
999 * This is required for transform feedback buffer offsets, query objects,
1000 * and also allows us to reduce how much state we have to emit.
1001 */
1002 brw->hw_ctx = drm_intel_gem_context_create(brw->bufmgr);
1003
1004 if (!brw->hw_ctx) {
1005 fprintf(stderr, "Gen6+ requires Kernel 3.6 or later.\n");
1006 intelDestroyContext(driContextPriv);
1007 return false;
1008 }
1009 }
1010
1011 if (brw_init_pipe_control(brw, devinfo)) {
1012 *dri_ctx_error = __DRI_CTX_ERROR_NO_MEMORY;
1013 intelDestroyContext(driContextPriv);
1014 return false;
1015 }
1016
1017 brw_init_state(brw);
1018
1019 intelInitExtensions(ctx);
1020
1021 brw_init_surface_formats(brw);
1022
1023 brw->max_vs_threads = devinfo->max_vs_threads;
1024 brw->max_hs_threads = devinfo->max_hs_threads;
1025 brw->max_ds_threads = devinfo->max_ds_threads;
1026 brw->max_gs_threads = devinfo->max_gs_threads;
1027 brw->max_wm_threads = devinfo->max_wm_threads;
1028 /* FINISHME: Do this for all platforms that the kernel supports */
1029 if (brw->is_cherryview &&
1030 screen->subslice_total > 0 && screen->eu_total > 0) {
1031 /* Logical CS threads = EUs per subslice * 7 threads per EU */
1032 brw->max_cs_threads = screen->eu_total / screen->subslice_total * 7;
1033
1034 /* Fuse configurations may give more threads than expected, never less. */
1035 if (brw->max_cs_threads < devinfo->max_cs_threads)
1036 brw->max_cs_threads = devinfo->max_cs_threads;
1037 } else {
1038 brw->max_cs_threads = devinfo->max_cs_threads;
1039 }
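/* Worked example (hypothetical fuse configuration): a Cherryview part with
 * eu_total = 16 and subslice_total = 2 yields 16 / 2 * 7 = 56 logical CS
 * threads; if the fused count ever computed below devinfo->max_cs_threads,
 * the check above raises it back to that documented minimum.
 */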
1040 brw->urb.size = devinfo->urb.size;
1041 brw->urb.min_vs_entries = devinfo->urb.min_vs_entries;
1042 brw->urb.max_vs_entries = devinfo->urb.max_vs_entries;
1043 brw->urb.max_hs_entries = devinfo->urb.max_hs_entries;
1044 brw->urb.max_ds_entries = devinfo->urb.max_ds_entries;
1045 brw->urb.max_gs_entries = devinfo->urb.max_gs_entries;
1046
1047 /* Estimate the size of the mappable aperture into the GTT. There's an
1048 * ioctl to get the whole GTT size, but not one to get the mappable subset.
1049 * It turns out it's basically always 256MB, though some ancient hardware
1050 * was smaller.
1051 */
1052 uint32_t gtt_size = 256 * 1024 * 1024;
1053
1054 /* We don't want to map two objects such that a memcpy between them would
1055 * just fault one mapping in and then the other over and over forever. So
1056 * we would need to divide the GTT size by 2. Additionally, some GTT is
1057 * taken up by things like the framebuffer and the ringbuffer and such, so
1058 * be more conservative.
1059 */
1060 brw->max_gtt_map_object_size = gtt_size / 4;
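/* With the 256MB estimate above this caps individual mappable objects at
 * 64MB, leaving headroom for a source and a destination mapping plus
 * scanout and ring buffers.
 */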
1061
1062 if (brw->gen == 6)
1063 brw->urb.gs_present = false;
1064
1065 brw->prim_restart.in_progress = false;
1066 brw->prim_restart.enable_cut_index = false;
1067 brw->gs.enabled = false;
1068 brw->sf.viewport_transform_enable = true;
1069
1070 brw->predicate.state = BRW_PREDICATE_STATE_RENDER;
1071
1072 brw->use_resource_streamer = screen->has_resource_streamer &&
1073 (env_var_as_boolean("INTEL_USE_HW_BT", false) ||
1074 env_var_as_boolean("INTEL_USE_GATHER", false));
1075
1076 ctx->VertexProgram._MaintainTnlProgram = true;
1077 ctx->FragmentProgram._MaintainTexEnvProgram = true;
1078
1079 brw_draw_init( brw );
1080
1081 if ((flags & __DRI_CTX_FLAG_DEBUG) != 0) {
1082 /* Turn on some extra GL_ARB_debug_output generation. */
1083 brw->perf_debug = true;
1084 }
1085
1086 if ((flags & __DRI_CTX_FLAG_ROBUST_BUFFER_ACCESS) != 0)
1087 ctx->Const.ContextFlags |= GL_CONTEXT_FLAG_ROBUST_ACCESS_BIT_ARB;
1088
1089 if (INTEL_DEBUG & DEBUG_SHADER_TIME)
1090 brw_init_shader_time(brw);
1091
1092 _mesa_compute_version(ctx);
1093
1094 _mesa_initialize_dispatch_tables(ctx);
1095 _mesa_initialize_vbo_vtxfmt(ctx);
1096
1097 if (ctx->Extensions.AMD_performance_monitor) {
1098 brw_init_performance_monitors(brw);
1099 }
1100
1101 vbo_use_buffer_objects(ctx);
1102 vbo_always_unmap_buffers(ctx);
1103
1104 return true;
1105 }
1106
1107 void
1108 intelDestroyContext(__DRIcontext * driContextPriv)
1109 {
1110 struct brw_context *brw =
1111 (struct brw_context *) driContextPriv->driverPrivate;
1112 struct gl_context *ctx = &brw->ctx;
1113
1114 /* Dump a final BMP in case the application doesn't call SwapBuffers */
1115 if (INTEL_DEBUG & DEBUG_AUB) {
1116 intel_batchbuffer_flush(brw);
1117 aub_dump_bmp(&brw->ctx);
1118 }
1119
1120 _mesa_meta_free(&brw->ctx);
1121
1122 if (INTEL_DEBUG & DEBUG_SHADER_TIME) {
1123 /* Force a report. */
1124 brw->shader_time.report_time = 0;
1125
1126 brw_collect_and_report_shader_time(brw);
1127 brw_destroy_shader_time(brw);
1128 }
1129
1130 brw_destroy_state(brw);
1131 brw_draw_destroy(brw);
1132
1133 drm_intel_bo_unreference(brw->curbe.curbe_bo);
1134 if (brw->vs.base.scratch_bo)
1135 drm_intel_bo_unreference(brw->vs.base.scratch_bo);
1136 if (brw->tcs.base.scratch_bo)
1137 drm_intel_bo_unreference(brw->tcs.base.scratch_bo);
1138 if (brw->tes.base.scratch_bo)
1139 drm_intel_bo_unreference(brw->tes.base.scratch_bo);
1140 if (brw->gs.base.scratch_bo)
1141 drm_intel_bo_unreference(brw->gs.base.scratch_bo);
1142 if (brw->wm.base.scratch_bo)
1143 drm_intel_bo_unreference(brw->wm.base.scratch_bo);
1144
1145 gen7_reset_hw_bt_pool_offsets(brw);
1146 drm_intel_bo_unreference(brw->hw_bt_pool.bo);
1147 brw->hw_bt_pool.bo = NULL;
1148
1149 drm_intel_gem_context_destroy(brw->hw_ctx);
1150
1151 if (ctx->swrast_context) {
1152 _swsetup_DestroyContext(&brw->ctx);
1153 _tnl_DestroyContext(&brw->ctx);
1154 }
1155 _vbo_DestroyContext(&brw->ctx);
1156
1157 if (ctx->swrast_context)
1158 _swrast_DestroyContext(&brw->ctx);
1159
1160 brw_fini_pipe_control(brw);
1161 intel_batchbuffer_free(brw);
1162
1163 drm_intel_bo_unreference(brw->throttle_batch[1]);
1164 drm_intel_bo_unreference(brw->throttle_batch[0]);
1165 brw->throttle_batch[1] = NULL;
1166 brw->throttle_batch[0] = NULL;
1167
1168 driDestroyOptionCache(&brw->optionCache);
1169
1170 /* free the Mesa context */
1171 _mesa_free_context_data(&brw->ctx);
1172
1173 ralloc_free(brw);
1174 driContextPriv->driverPrivate = NULL;
1175 }
1176
1177 GLboolean
1178 intelUnbindContext(__DRIcontext * driContextPriv)
1179 {
1180 /* Unset the current context and dispatch table */
1181 _mesa_make_current(NULL, NULL, NULL);
1182
1183 return true;
1184 }
1185
1186 /**
1187  * Fixes up the context for GLES2/3 with our default-to-sRGB-capable behavior
1188 * on window system framebuffers.
1189 *
1190 * Desktop GL is fairly reasonable in its handling of sRGB: You can ask if
1191 * your renderbuffer can do sRGB encode, and you can flip a switch that does
1192 * sRGB encode if the renderbuffer can handle it. You can ask specifically
1193 * for a visual where you're guaranteed to be capable, but it turns out that
1194 * everyone just makes all their ARGB8888 visuals capable and doesn't offer
1195 * incapable ones, because there's no difference between the two in resources
1196 * used. Applications thus get built that accidentally rely on the default
1197 * visual choice being sRGB, so we make ours sRGB capable. Everything sounds
1198 * great...
1199 *
1200 * But for GLES2/3, they decided that it was silly to not turn on sRGB encode
1201 * for sRGB renderbuffers you made with the GL_EXT_texture_sRGB equivalent.
1202 * So they removed the enable knob and made it "if the renderbuffer is sRGB
1203 * capable, do sRGB encode". Then, for your window system renderbuffers, you
1204 * can ask for sRGB visuals and get sRGB encode, or not ask for sRGB visuals
1205 * and get no sRGB encode (assuming that both kinds of visual are available).
1206 * Thus our choice to support sRGB by default on our visuals for desktop would
1207 * result in broken rendering of GLES apps that aren't expecting sRGB encode.
1208 *
1209 * Unfortunately, renderbuffer setup happens before a context is created. So
1210 * in intel_screen.c we always set up sRGB, and here, if you're a GLES2/3
1211 * context (without an sRGB visual, though we don't have sRGB visuals exposed
1212 * yet), we go turn that back off before anyone finds out.
1213 */
1214 static void
1215 intel_gles3_srgb_workaround(struct brw_context *brw,
1216 struct gl_framebuffer *fb)
1217 {
1218 struct gl_context *ctx = &brw->ctx;
1219
1220 if (_mesa_is_desktop_gl(ctx) || !fb->Visual.sRGBCapable)
1221 return;
1222
1223 /* Some day when we support the sRGB capable bit on visuals available for
1224 * GLES, we'll need to respect that and not disable things here.
1225 */
1226 fb->Visual.sRGBCapable = false;
1227 for (int i = 0; i < BUFFER_COUNT; i++) {
1228 struct gl_renderbuffer *rb = fb->Attachment[i].Renderbuffer;
1229 if (rb)
1230 rb->Format = _mesa_get_srgb_format_linear(rb->Format);
1231 }
1232 }
1233
1234 GLboolean
1235 intelMakeCurrent(__DRIcontext * driContextPriv,
1236 __DRIdrawable * driDrawPriv,
1237 __DRIdrawable * driReadPriv)
1238 {
1239 struct brw_context *brw;
1240 GET_CURRENT_CONTEXT(curCtx);
1241
1242 if (driContextPriv)
1243 brw = (struct brw_context *) driContextPriv->driverPrivate;
1244 else
1245 brw = NULL;
1246
1247 /* According to the glXMakeCurrent() man page: "Pending commands to
1248 * the previous context, if any, are flushed before it is released."
1249 * But only flush if we're actually changing contexts.
1250 */
1251 if (brw_context(curCtx) && brw_context(curCtx) != brw) {
1252 _mesa_flush(curCtx);
1253 }
1254
1255 if (driContextPriv) {
1256 struct gl_context *ctx = &brw->ctx;
1257 struct gl_framebuffer *fb, *readFb;
1258
1259 if (driDrawPriv == NULL) {
1260 fb = _mesa_get_incomplete_framebuffer();
1261 } else {
1262 fb = driDrawPriv->driverPrivate;
1263 driContextPriv->dri2.draw_stamp = driDrawPriv->dri2.stamp - 1;
1264 }
1265
1266 if (driReadPriv == NULL) {
1267 readFb = _mesa_get_incomplete_framebuffer();
1268 } else {
1269 readFb = driReadPriv->driverPrivate;
1270 driContextPriv->dri2.read_stamp = driReadPriv->dri2.stamp - 1;
1271 }
1272
1273 /* The sRGB workaround changes the renderbuffer's format. We must change
1274  * the format before the renderbuffer's miptree gets allocated, otherwise
1275 * the formats of the renderbuffer and its miptree will differ.
1276 */
1277 intel_gles3_srgb_workaround(brw, fb);
1278 intel_gles3_srgb_workaround(brw, readFb);
1279
1280 /* If the context viewport hasn't been initialized, force a call out to
1281 * the loader to get buffers so we have a drawable size for the initial
1282 * viewport. */
1283 if (!brw->ctx.ViewportInitialized)
1284 intel_prepare_render(brw);
1285
1286 _mesa_make_current(ctx, fb, readFb);
1287 } else {
1288 _mesa_make_current(NULL, NULL, NULL);
1289 }
1290
1291 return true;
1292 }
1293
1294 void
1295 intel_resolve_for_dri2_flush(struct brw_context *brw,
1296 __DRIdrawable *drawable)
1297 {
1298 if (brw->gen < 6) {
1299 /* MSAA and fast color clear are not supported, so don't waste time
1300 * checking whether a resolve is needed.
1301 */
1302 return;
1303 }
1304
1305 struct gl_framebuffer *fb = drawable->driverPrivate;
1306 struct intel_renderbuffer *rb;
1307
1308 /* Usually, only the back buffer will need to be downsampled. However,
1309 * the front buffer will also need it if the user has rendered into it.
1310 */
1311 static const gl_buffer_index buffers[2] = {
1312 BUFFER_BACK_LEFT,
1313 BUFFER_FRONT_LEFT,
1314 };
1315
1316 for (int i = 0; i < 2; ++i) {
1317 rb = intel_get_renderbuffer(fb, buffers[i]);
1318 if (rb == NULL || rb->mt == NULL)
1319 continue;
1320 if (rb->mt->num_samples <= 1)
1321 intel_miptree_resolve_color(brw, rb->mt, 0);
1322 else
1323 intel_renderbuffer_downsample(brw, rb);
1324 }
1325 }
1326
1327 static unsigned
1328 intel_bits_per_pixel(const struct intel_renderbuffer *rb)
1329 {
1330 return _mesa_get_format_bytes(intel_rb_format(rb)) * 8;
1331 }
1332
1333 static void
1334 intel_query_dri2_buffers(struct brw_context *brw,
1335 __DRIdrawable *drawable,
1336 __DRIbuffer **buffers,
1337 int *count);
1338
1339 static void
1340 intel_process_dri2_buffer(struct brw_context *brw,
1341 __DRIdrawable *drawable,
1342 __DRIbuffer *buffer,
1343 struct intel_renderbuffer *rb,
1344 const char *buffer_name);
1345
1346 static void
1347 intel_update_image_buffers(struct brw_context *brw, __DRIdrawable *drawable);
1348
1349 static void
1350 intel_update_dri2_buffers(struct brw_context *brw, __DRIdrawable *drawable)
1351 {
1352 struct gl_framebuffer *fb = drawable->driverPrivate;
1353 struct intel_renderbuffer *rb;
1354 __DRIbuffer *buffers = NULL;
1355 int i, count;
1356 const char *region_name;
1357
1358 /* Set this up front, so that in case our buffers get invalidated
1359 * while we're getting new buffers, we don't clobber the stamp and
1360 * thus ignore the invalidate. */
1361 drawable->lastStamp = drawable->dri2.stamp;
1362
1363 if (unlikely(INTEL_DEBUG & DEBUG_DRI))
1364 fprintf(stderr, "enter %s, drawable %p\n", __func__, drawable);
1365
1366 intel_query_dri2_buffers(brw, drawable, &buffers, &count);
1367
1368 if (buffers == NULL)
1369 return;
1370
1371 for (i = 0; i < count; i++) {
1372 switch (buffers[i].attachment) {
1373 case __DRI_BUFFER_FRONT_LEFT:
1374 rb = intel_get_renderbuffer(fb, BUFFER_FRONT_LEFT);
1375 region_name = "dri2 front buffer";
1376 break;
1377
1378 case __DRI_BUFFER_FAKE_FRONT_LEFT:
1379 rb = intel_get_renderbuffer(fb, BUFFER_FRONT_LEFT);
1380 region_name = "dri2 fake front buffer";
1381 break;
1382
1383 case __DRI_BUFFER_BACK_LEFT:
1384 rb = intel_get_renderbuffer(fb, BUFFER_BACK_LEFT);
1385 region_name = "dri2 back buffer";
1386 break;
1387
1388 case __DRI_BUFFER_DEPTH:
1389 case __DRI_BUFFER_HIZ:
1390 case __DRI_BUFFER_DEPTH_STENCIL:
1391 case __DRI_BUFFER_STENCIL:
1392 case __DRI_BUFFER_ACCUM:
1393 default:
1394 fprintf(stderr,
1395 "unhandled buffer attach event, attachment type %d\n",
1396 buffers[i].attachment);
1397 return;
1398 }
1399
1400 intel_process_dri2_buffer(brw, drawable, &buffers[i], rb, region_name);
1401 }
1402
1403 }
1404
1405 void
1406 intel_update_renderbuffers(__DRIcontext *context, __DRIdrawable *drawable)
1407 {
1408 struct brw_context *brw = context->driverPrivate;
1409 __DRIscreen *screen = brw->intelScreen->driScrnPriv;
1410
1411 /* Set this up front, so that in case our buffers get invalidated
1412 * while we're getting new buffers, we don't clobber the stamp and
1413 * thus ignore the invalidate. */
1414 drawable->lastStamp = drawable->dri2.stamp;
1415
1416 if (unlikely(INTEL_DEBUG & DEBUG_DRI))
1417 fprintf(stderr, "enter %s, drawable %p\n", __func__, drawable);
1418
1419 if (screen->image.loader)
1420 intel_update_image_buffers(brw, drawable);
1421 else
1422 intel_update_dri2_buffers(brw, drawable);
1423
1424 driUpdateFramebufferSize(&brw->ctx, drawable);
1425 }
1426
1427 /**
1428  * intel_prepare_render should be called anywhere that current read/drawbuffer
1429 * state is required.
1430 */
1431 void
1432 intel_prepare_render(struct brw_context *brw)
1433 {
1434 struct gl_context *ctx = &brw->ctx;
1435 __DRIcontext *driContext = brw->driContext;
1436 __DRIdrawable *drawable;
1437
1438 drawable = driContext->driDrawablePriv;
1439 if (drawable && drawable->dri2.stamp != driContext->dri2.draw_stamp) {
1440 if (drawable->lastStamp != drawable->dri2.stamp)
1441 intel_update_renderbuffers(driContext, drawable);
1442 driContext->dri2.draw_stamp = drawable->dri2.stamp;
1443 }
1444
1445 drawable = driContext->driReadablePriv;
1446 if (drawable && drawable->dri2.stamp != driContext->dri2.read_stamp) {
1447 if (drawable->lastStamp != drawable->dri2.stamp)
1448 intel_update_renderbuffers(driContext, drawable);
1449 driContext->dri2.read_stamp = drawable->dri2.stamp;
1450 }
1451
1452 /* If we're currently rendering to the front buffer, the rendering
1453 * that will happen next will probably dirty the front buffer. So
1454 * mark it as dirty here.
1455 */
1456 if (_mesa_is_front_buffer_drawing(ctx->DrawBuffer))
1457 brw->front_buffer_dirty = true;
1458 }
1459
1460 /**
1461 * \brief Query DRI2 to obtain a DRIdrawable's buffers.
1462 *
1463 * To determine which DRI buffers to request, examine the renderbuffers
1464 * attached to the drawable's framebuffer. Then request the buffers with
1465 * DRI2GetBuffers() or DRI2GetBuffersWithFormat().
1466 *
1467 * This is called from intel_update_renderbuffers().
1468 *
1469 * \param drawable Drawable whose buffers are queried.
1470 * \param buffers [out] List of buffers returned by DRI2 query.
1471 * \param buffer_count [out] Number of buffers returned.
1472 *
1473 * \see intel_update_renderbuffers()
1474 * \see DRI2GetBuffers()
1475 * \see DRI2GetBuffersWithFormat()
1476 */
1477 static void
1478 intel_query_dri2_buffers(struct brw_context *brw,
1479 __DRIdrawable *drawable,
1480 __DRIbuffer **buffers,
1481 int *buffer_count)
1482 {
1483 __DRIscreen *screen = brw->intelScreen->driScrnPriv;
1484 struct gl_framebuffer *fb = drawable->driverPrivate;
1485 int i = 0;
1486 unsigned attachments[8];
1487
1488 struct intel_renderbuffer *front_rb;
1489 struct intel_renderbuffer *back_rb;
1490
1491 front_rb = intel_get_renderbuffer(fb, BUFFER_FRONT_LEFT);
1492 back_rb = intel_get_renderbuffer(fb, BUFFER_BACK_LEFT);
1493
1494 memset(attachments, 0, sizeof(attachments));
1495 if ((_mesa_is_front_buffer_drawing(fb) ||
1496 _mesa_is_front_buffer_reading(fb) ||
1497 !back_rb) && front_rb) {
1498 /* If a fake front buffer is in use, then querying for
1499 * __DRI_BUFFER_FRONT_LEFT will cause the server to copy the image from
1500 * the real front buffer to the fake front buffer. So before doing the
1501 * query, we need to make sure all the pending drawing has landed in the
1502 * real front buffer.
1503 */
1504 intel_batchbuffer_flush(brw);
1505 intel_flush_front(&brw->ctx);
1506
1507 attachments[i++] = __DRI_BUFFER_FRONT_LEFT;
1508 attachments[i++] = intel_bits_per_pixel(front_rb);
1509 } else if (front_rb && brw->front_buffer_dirty) {
1510 /* We have pending front buffer rendering, but we aren't querying for a
1511 * front buffer. If the front buffer we have is a fake front buffer,
1512 * the X server is going to throw it away when it processes the query.
1513 * So before doing the query, make sure all the pending drawing has
1514 * landed in the real front buffer.
1515 */
1516 intel_batchbuffer_flush(brw);
1517 intel_flush_front(&brw->ctx);
1518 }
1519
1520 if (back_rb) {
1521 attachments[i++] = __DRI_BUFFER_BACK_LEFT;
1522 attachments[i++] = intel_bits_per_pixel(back_rb);
1523 }
1524
1525 assert(i <= ARRAY_SIZE(attachments));
1526
1527 *buffers = screen->dri2.loader->getBuffersWithFormat(drawable,
1528 &drawable->w,
1529 &drawable->h,
1530 attachments, i / 2,
1531 buffer_count,
1532 drawable->loaderPrivate);
1533 }
1534
1535 /**
1536 * \brief Assign a DRI buffer's DRM region to a renderbuffer.
1537 *
1538 * This is called from intel_update_renderbuffers().
1539 *
1540 * \par Note:
1541 * DRI buffers whose attachment point is DRI2BufferStencil or
1542 * DRI2BufferDepthStencil are handled as special cases.
1543 *
1544 * \param buffer_name is a human readable name, such as "dri2 front buffer",
1545 * that is passed to drm_intel_bo_gem_create_from_name().
1546 *
1547 * \see intel_update_renderbuffers()
1548 */
1549 static void
1550 intel_process_dri2_buffer(struct brw_context *brw,
1551 __DRIdrawable *drawable,
1552 __DRIbuffer *buffer,
1553 struct intel_renderbuffer *rb,
1554 const char *buffer_name)
1555 {
1556 struct gl_framebuffer *fb = drawable->driverPrivate;
1557 drm_intel_bo *bo;
1558
1559 if (!rb)
1560 return;
1561
1562 unsigned num_samples = rb->Base.Base.NumSamples;
1563
1564 /* We try to avoid closing and reopening the same BO name, because the first
1565 * use of a mapping of the buffer involves a bunch of page faulting which is
1566 * moderately expensive.
1567 */
1568 struct intel_mipmap_tree *last_mt;
1569 if (num_samples == 0)
1570 last_mt = rb->mt;
1571 else
1572 last_mt = rb->singlesample_mt;
1573
1574 uint32_t old_name = 0;
1575 if (last_mt) {
1576 /* The bo already has a name because the miptree was created by a
1577 * previous call to intel_process_dri2_buffer(). If a bo already has a
1578 * name, then drm_intel_bo_flink() is a low-cost getter. It does not
1579 * create a new name.
1580 */
1581 drm_intel_bo_flink(last_mt->bo, &old_name);
1582 }
1583
1584 if (old_name == buffer->name)
1585 return;
1586
1587 if (unlikely(INTEL_DEBUG & DEBUG_DRI)) {
1588 fprintf(stderr,
1589 "attaching buffer %d, at %d, cpp %d, pitch %d\n",
1590 buffer->name, buffer->attachment,
1591 buffer->cpp, buffer->pitch);
1592 }
1593
1594 bo = drm_intel_bo_gem_create_from_name(brw->bufmgr, buffer_name,
1595 buffer->name);
1596 if (!bo) {
1597 fprintf(stderr,
1598 "Failed to open BO for returned DRI2 buffer "
1599 "(%dx%d, %s, named %d).\n"
1600 "This is likely a bug in the X Server that will lead to a "
1601 "crash soon.\n",
1602 drawable->w, drawable->h, buffer_name, buffer->name);
1603 return;
1604 }
1605
1606 intel_update_winsys_renderbuffer_miptree(brw, rb, bo,
1607 drawable->w, drawable->h,
1608 buffer->pitch);
1609
1610 if (_mesa_is_front_buffer_drawing(fb) &&
1611 (buffer->attachment == __DRI_BUFFER_FRONT_LEFT ||
1612 buffer->attachment == __DRI_BUFFER_FAKE_FRONT_LEFT) &&
1613 rb->Base.Base.NumSamples > 1) {
1614 intel_renderbuffer_upsample(brw, rb);
1615 }
1616
1617 assert(rb->mt);
1618
1619 drm_intel_bo_unreference(bo);
1620 }
1621
1622 /**
1623 * \brief Query DRI image loader to obtain a DRIdrawable's buffers.
1624 *
1625 * To determine which DRI buffers to request, examine the renderbuffers
1626 * attached to the drawable's framebuffer. Then request the buffers from
1627  * the image loader.
1628 *
1629 * This is called from intel_update_renderbuffers().
1630 *
1631 * \param drawable Drawable whose buffers are queried.
1632 * \param buffers [out] List of buffers returned by DRI2 query.
1633 * \param buffer_count [out] Number of buffers returned.
1634 *
1635 * \see intel_update_renderbuffers()
1636 */
1637
1638 static void
1639 intel_update_image_buffer(struct brw_context *intel,
1640 __DRIdrawable *drawable,
1641 struct intel_renderbuffer *rb,
1642 __DRIimage *buffer,
1643 enum __DRIimageBufferMask buffer_type)
1644 {
1645 struct gl_framebuffer *fb = drawable->driverPrivate;
1646
1647 if (!rb || !buffer->bo)
1648 return;
1649
1650 unsigned num_samples = rb->Base.Base.NumSamples;
1651
1652 /* Check and see if we're already bound to the right
1653 * buffer object
1654 */
1655 struct intel_mipmap_tree *last_mt;
1656 if (num_samples == 0)
1657 last_mt = rb->mt;
1658 else
1659 last_mt = rb->singlesample_mt;
1660
1661 if (last_mt && last_mt->bo == buffer->bo)
1662 return;
1663
1664 intel_update_winsys_renderbuffer_miptree(intel, rb, buffer->bo,
1665 buffer->width, buffer->height,
1666 buffer->pitch);
1667
1668 if (_mesa_is_front_buffer_drawing(fb) &&
1669 buffer_type == __DRI_IMAGE_BUFFER_FRONT &&
1670 rb->Base.Base.NumSamples > 1) {
1671 intel_renderbuffer_upsample(intel, rb);
1672 }
1673 }
1674
1675 static void
1676 intel_update_image_buffers(struct brw_context *brw, __DRIdrawable *drawable)
1677 {
1678 struct gl_framebuffer *fb = drawable->driverPrivate;
1679 __DRIscreen *screen = brw->intelScreen->driScrnPriv;
1680 struct intel_renderbuffer *front_rb;
1681 struct intel_renderbuffer *back_rb;
1682 struct __DRIimageList images;
1683 unsigned int format;
1684 uint32_t buffer_mask = 0;
1685 int ret;
1686
1687 front_rb = intel_get_renderbuffer(fb, BUFFER_FRONT_LEFT);
1688 back_rb = intel_get_renderbuffer(fb, BUFFER_BACK_LEFT);
1689
1690 if (back_rb)
1691 format = intel_rb_format(back_rb);
1692 else if (front_rb)
1693 format = intel_rb_format(front_rb);
1694 else
1695 return;
1696
1697 if (front_rb && (_mesa_is_front_buffer_drawing(fb) ||
1698 _mesa_is_front_buffer_reading(fb) || !back_rb)) {
1699 buffer_mask |= __DRI_IMAGE_BUFFER_FRONT;
1700 }
1701
1702 if (back_rb)
1703 buffer_mask |= __DRI_IMAGE_BUFFER_BACK;
1704
1705 ret = screen->image.loader->getBuffers(drawable,
1706 driGLFormatToImageFormat(format),
1707 &drawable->dri2.stamp,
1708 drawable->loaderPrivate,
1709 buffer_mask,
1710 &images);
1711 if (!ret)
1712 return;
1713
1714 if (images.image_mask & __DRI_IMAGE_BUFFER_FRONT) {
1715 drawable->w = images.front->width;
1716 drawable->h = images.front->height;
1717 intel_update_image_buffer(brw,
1718 drawable,
1719 front_rb,
1720 images.front,
1721 __DRI_IMAGE_BUFFER_FRONT);
1722 }
1723 if (images.image_mask & __DRI_IMAGE_BUFFER_BACK) {
1724 drawable->w = images.back->width;
1725 drawable->h = images.back->height;
1726 intel_update_image_buffer(brw,
1727 drawable,
1728 back_rb,
1729 images.back,
1730 __DRI_IMAGE_BUFFER_BACK);
1731 }
1732 }