src/mesa/drivers/dri/i965/brw_program.c

   1 /*
   2  Copyright (C) Intel Corp.  2006.  All Rights Reserved.
   3  Intel funded Tungsten Graphics to
   4  develop this 3D driver.
   5
   6  Permission is hereby granted, free of charge, to any person obtaining
   7  a copy of this software and associated documentation files (the
   8  "Software"), to deal in the Software without restriction, including
   9  without limitation the rights to use, copy, modify, merge, publish,
  10  distribute, sublicense, and/or sell copies of the Software, and to
  11  permit persons to whom the Software is furnished to do so, subject to
  12  the following conditions:
  13
  14  The above copyright notice and this permission notice (including the
  15  next paragraph) shall be included in all copies or substantial
  16  portions of the Software.
  17
  18  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  19  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  20  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
  21  IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
  22  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
  23  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
  24  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  25
  26  **********************************************************************/
  27  /*
  28   * Authors:
  29   *   Keith Whitwell <keithw@vmware.com>
  30   */
  31
  32 #include <pthread.h>
  33 #include "main/imports.h"
  34 #include "program/prog_parameter.h"
  35 #include "program/prog_print.h"
  36 #include "program/prog_to_nir.h"
  37 #include "program/program.h"
  38 #include "program/programopt.h"
  39 #include "tnl/tnl.h"
  40 #include "util/ralloc.h"
  41 #include "compiler/glsl/ir.h"
  42 #include "compiler/glsl/glsl_to_nir.h"
  43
  44 #include "brw_program.h"
  45 #include "brw_context.h"
  46 #include "brw_shader.h"
  47 #include "brw_nir.h"
  48 #include "intel_batchbuffer.h"
  49
  50 static void
  51 brw_nir_lower_uniforms(nir_shader *nir, bool is_scalar)
  52 {
  53    if (is_scalar) {
  54       nir_assign_var_locations(&nir->uniforms, &nir->num_uniforms,
  55                                type_size_scalar_bytes);
  56       nir_lower_io(nir, nir_var_uniform, type_size_scalar_bytes, 0);
  57    } else {
  58       nir_assign_var_locations(&nir->uniforms, &nir->num_uniforms,
  59                                type_size_vec4_bytes);
  60       nir_lower_io(nir, nir_var_uniform, type_size_vec4_bytes, 0);
  61    }
  62 }
  63
  64 nir_shader *
  65 brw_create_nir(struct brw_context *brw,
  66                const struct gl_shader_program *shader_prog,
  67                const struct gl_program *prog,
  68                gl_shader_stage stage,
  69                bool is_scalar)
  70 {
  71    struct gl_context *ctx = &brw->ctx;
  72    const nir_shader_compiler_options *options =
  73       ctx->Const.ShaderCompilerOptions[stage].NirOptions;
  74    bool progress;
  75    nir_shader *nir;
  76
  77    /* First, lower the GLSL IR or Mesa IR to NIR */
  78    if (shader_prog) {
  79       nir = glsl_to_nir(shader_prog, stage, options);
  80       nir_remove_dead_variables(nir, nir_var_shader_in | nir_var_shader_out);
  81       NIR_PASS_V(nir, nir_lower_io_to_temporaries,
  82                  nir_shader_get_entrypoint(nir), true, false);
  83    } else {
  84       nir = prog_to_nir(prog, options);
  85       NIR_PASS_V(nir, nir_convert_to_ssa); /* turn registers into SSA */
  86    }
  87    nir_validate_shader(nir);
  88
  89    (void)progress;
  90
  91    nir = brw_preprocess_nir(brw->screen->compiler, nir);
  92
  93    if (stage == MESA_SHADER_FRAGMENT) {
  94       static const struct nir_lower_wpos_ytransform_options wpos_options = {
  95          .state_tokens = {STATE_INTERNAL, STATE_FB_WPOS_Y_TRANSFORM, 0, 0, 0},
  96          .fs_coord_pixel_center_integer = 1,
  97          .fs_coord_origin_upper_left = 1,
  98       };
  99       _mesa_add_state_reference(prog->Parameters,
 100                                 (gl_state_index *) wpos_options.state_tokens);
 101
 102       NIR_PASS(progress, nir, nir_lower_wpos_ytransform, &wpos_options);
 103    }
 104
 105    NIR_PASS(progress, nir, nir_lower_system_values);
 106    NIR_PASS_V(nir, brw_nir_lower_uniforms, is_scalar);
 107
 108    if (shader_prog) {
 109       NIR_PASS_V(nir, nir_lower_samplers, shader_prog);
 110       NIR_PASS_V(nir, nir_lower_atomics, shader_prog);
 111    }
 112
 113    return nir;
 114 }
 115
 116 static unsigned
 117 get_new_program_id(struct intel_screen *screen)
 118 {
 119    static pthread_mutex_t m = PTHREAD_MUTEX_INITIALIZER;
 120    pthread_mutex_lock(&m);
 121    unsigned id = screen->program_id++;
 122    pthread_mutex_unlock(&m);
 123    return id;
 124 }
 125
 126 static struct gl_program *brwNewProgram( struct gl_context *ctx,
 127                                       GLenum target,
 128                                       GLuint id )
 129 {
 130    struct brw_context *brw = brw_context(ctx);
 131
 132    switch (target) {
 133    case GL_VERTEX_PROGRAM_ARB:
 134    case GL_TESS_CONTROL_PROGRAM_NV:
 135    case GL_TESS_EVALUATION_PROGRAM_NV:
 136    case GL_GEOMETRY_PROGRAM_NV:
 137    case GL_COMPUTE_PROGRAM_NV: {
 138       struct brw_program *prog = rzalloc(NULL, struct brw_program);
 139       if (prog) {
 140          prog->id = get_new_program_id(brw->screen);
 141
 142          return _mesa_init_gl_program(&prog->program, target, id);
 143       }
 144       else
 145          return NULL;
 146    }
 147
 148    case GL_FRAGMENT_PROGRAM_ARB: {
 149       struct brw_program *prog;
 150       if (brw->gen < 6) {
 151          struct gen4_fragment_program *g4_prog =
 152             rzalloc(NULL, struct gen4_fragment_program);
 153          prog = &g4_prog->base;
 154       } else {
 155          prog = rzalloc(NULL, struct brw_program);
 156       }
 157
 158       if (prog) {
 159          prog->id = get_new_program_id(brw->screen);
 160
 161          return _mesa_init_gl_program(&prog->program, target, id);
 162       }
 163       else
 164          return NULL;
 165    }
 166
 167    default:
 168       unreachable("Unsupported target in brwNewProgram()");
 169    }
 170 }
 171
 /* DeleteProgram driver hook: forwards straight to _mesa_delete_program(). */
 static void
 brwDeleteProgram(struct gl_context *ctx, struct gl_program *prog)
 {
    _mesa_delete_program(ctx, prog);
 }
 177
 178
 179 static GLboolean
 180 brwProgramStringNotify(struct gl_context *ctx,
 181                        GLenum target,
 182                        struct gl_program *prog)
 183 {
 184    assert(target == GL_VERTEX_PROGRAM_ARB || !prog->IsPositionInvariant);
 185
 186    struct brw_context *brw = brw_context(ctx);
 187    const struct brw_compiler *compiler = brw->screen->compiler;
 188
 189    switch (target) {
 190    case GL_FRAGMENT_PROGRAM_ARB: {
 191       struct brw_program *newFP = brw_program(prog);
 192       const struct brw_program *curFP =
 193          brw_program_const(brw->fragment_program);
 194
 195       if (newFP == curFP)
 196          brw->ctx.NewDriverState |= BRW_NEW_FRAGMENT_PROGRAM;
 197       newFP->id = get_new_program_id(brw->screen);
 198
 199       brw_add_texrect_params(prog);
 200
 201       prog->nir = brw_create_nir(brw, NULL, prog, MESA_SHADER_FRAGMENT, true);
 202
 203       brw_fs_precompile(ctx, NULL, prog);
 204       break;
 205    }
 206    case GL_VERTEX_PROGRAM_ARB: {
 207       struct brw_program *newVP = brw_program(prog);
 208       const struct brw_program *curVP =
 209          brw_program_const(brw->vertex_program);
 210
 211       if (newVP == curVP)
 212          brw->ctx.NewDriverState |= BRW_NEW_VERTEX_PROGRAM;
 213       if (newVP->program.IsPositionInvariant) {
 214          _mesa_insert_mvp_code(ctx, &newVP->program);
 215       }
 216       newVP->id = get_new_program_id(brw->screen);
 217
 218       /* Also tell tnl about it:
 219        */
 220       _tnl_program_string(ctx, target, prog);
 221
 222       brw_add_texrect_params(prog);
 223
 224       prog->nir = brw_create_nir(brw, NULL, prog, MESA_SHADER_VERTEX,
 225                                  compiler->scalar_stage[MESA_SHADER_VERTEX]);
 226
 227       brw_vs_precompile(ctx, NULL, prog);
 228       break;
 229    }
 230    default:
 231       /*
 232        * driver->ProgramStringNotify is only called for ARB programs, fixed
 233        * function vertex programs, and ir_to_mesa (which isn't used by the
 234        * i965 back-end).  Therefore, even after geometry shaders are added,
 235        * this function should only ever be called with a target of
 236        * GL_VERTEX_PROGRAM_ARB or GL_FRAGMENT_PROGRAM_ARB.
 237        */
 238       unreachable("Unexpected target in brwProgramStringNotify");
 239    }
 240
 241    return true;
 242 }
 243
 244 static void
 245 brw_memory_barrier(struct gl_context *ctx, GLbitfield barriers)
 246 {
 247    struct brw_context *brw = brw_context(ctx);
 248    unsigned bits = (PIPE_CONTROL_DATA_CACHE_FLUSH |
 249                     PIPE_CONTROL_NO_WRITE |
 250                     PIPE_CONTROL_CS_STALL);
 251    assert(brw->gen >= 7 && brw->gen <= 9);
 252
 253    if (barriers & (GL_VERTEX_ATTRIB_ARRAY_BARRIER_BIT |
 254                    GL_ELEMENT_ARRAY_BARRIER_BIT |
 255                    GL_COMMAND_BARRIER_BIT))
 256       bits |= PIPE_CONTROL_VF_CACHE_INVALIDATE;
 257
 258    if (barriers & GL_UNIFORM_BARRIER_BIT)
 259       bits |= (PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE |
 260                PIPE_CONTROL_CONST_CACHE_INVALIDATE);
 261
 262    if (barriers & GL_TEXTURE_FETCH_BARRIER_BIT)
 263       bits |= PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE;
 264
 265    if (barriers & GL_TEXTURE_UPDATE_BARRIER_BIT)
 266       bits |= PIPE_CONTROL_RENDER_TARGET_FLUSH;
 267
 268    if (barriers & GL_FRAMEBUFFER_BARRIER_BIT)
 269       bits |= (PIPE_CONTROL_DEPTH_CACHE_FLUSH |
 270                PIPE_CONTROL_RENDER_TARGET_FLUSH);
 271
 272    /* Typed surface messages are handled by the render cache on IVB, so we
 273     * need to flush it too.
 274     */
 275    if (brw->gen == 7 && !brw->is_haswell)
 276       bits |= PIPE_CONTROL_RENDER_TARGET_FLUSH;
 277
 278    brw_emit_pipe_control_flush(brw, bits);
 279 }
 280
 281 static void
 282 brw_blend_barrier(struct gl_context *ctx)
 283 {
 284    struct brw_context *brw = brw_context(ctx);
 285
 286    if (!ctx->Extensions.MESA_shader_framebuffer_fetch) {
 287       if (brw->gen >= 6) {
 288          brw_emit_pipe_control_flush(brw,
 289                                      PIPE_CONTROL_RENDER_TARGET_FLUSH |
 290                                      PIPE_CONTROL_CS_STALL);
 291          brw_emit_pipe_control_flush(brw,
 292                                      PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE);
 293       } else {
 294          brw_emit_pipe_control_flush(brw,
 295                                      PIPE_CONTROL_RENDER_TARGET_FLUSH);
 296       }
 297    }
 298 }
 299
 300 void
 301 brw_add_texrect_params(struct gl_program *prog)
 302 {
 303    for (int texunit = 0; texunit < BRW_MAX_TEX_UNIT; texunit++) {
 304       if (!(prog->TexturesUsed[texunit] & (1 << TEXTURE_RECT_INDEX)))
 305          continue;
 306
 307       int tokens[STATE_LENGTH] = {
 308          STATE_INTERNAL,
 309          STATE_TEXRECT_SCALE,
 310          texunit,
 311          0,
 312          0
 313       };
 314
 315       _mesa_add_state_reference(prog->Parameters, (gl_state_index *)tokens);
 316    }
 317 }
 318
 319 void
 320 brw_get_scratch_bo(struct brw_context *brw,
 321                    drm_intel_bo **scratch_bo, int size)
 322 {
 323    drm_intel_bo *old_bo = *scratch_bo;
 324
 325    if (old_bo && old_bo->size < size) {
 326       drm_intel_bo_unreference(old_bo);
 327       old_bo = NULL;
 328    }
 329
 330    if (!old_bo) {
 331       *scratch_bo = drm_intel_bo_alloc(brw->bufmgr, "scratch bo", size, 4096);
 332    }
 333 }
 334
 335 /**
 336  * Reserve enough scratch space for the given stage to hold \p per_thread_size
 337  * bytes times the given \p thread_count.
 338  */
 339 void
 340 brw_alloc_stage_scratch(struct brw_context *brw,
 341                         struct brw_stage_state *stage_state,
 342                         unsigned per_thread_size,
 343                         unsigned thread_count)
 344 {
 345    if (stage_state->per_thread_scratch < per_thread_size) {
 346       stage_state->per_thread_scratch = per_thread_size;
 347
 348       if (stage_state->scratch_bo)
 349          drm_intel_bo_unreference(stage_state->scratch_bo);
 350
 351       stage_state->scratch_bo =
 352          drm_intel_bo_alloc(brw->bufmgr, "shader scratch space",
 353                             per_thread_size * thread_count, 4096);
 354    }
 355 }
 356
 357 void brwInitFragProgFuncs( struct dd_function_table *functions )
 358 {
 359    assert(functions->ProgramStringNotify == _tnl_program_string);
 360
 361    functions->NewProgram = brwNewProgram;
 362    functions->DeleteProgram = brwDeleteProgram;
 363    functions->ProgramStringNotify = brwProgramStringNotify;
 364
 365    functions->NewShader = brw_new_shader;
 366    functions->LinkShader = brw_link_shader;
 367
 368    functions->MemoryBarrier = brw_memory_barrier;
 369    functions->BlendBarrier = brw_blend_barrier;
 370 }
 371
 /* Running totals kept per shader-time entry; each field accumulates one of
  * the three values read back from the shader time buffer for that entry.
  */
 struct shader_times {
    uint64_t time;    /* summed from the entry's first slot */
    uint64_t written; /* summed from the entry's second slot */
    uint64_t reset;   /* summed from the entry's third slot */
 };
 377
 378 void
 379 brw_init_shader_time(struct brw_context *brw)
 380 {
 381    const int max_entries = 2048;
 382    brw->shader_time.bo =
 383       drm_intel_bo_alloc(brw->bufmgr, "shader time",
 384                          max_entries * SHADER_TIME_STRIDE * 3, 4096);
 385    brw->shader_time.names = rzalloc_array(brw, const char *, max_entries);
 386    brw->shader_time.ids = rzalloc_array(brw, int, max_entries);
 387    brw->shader_time.types = rzalloc_array(brw, enum shader_time_shader_type,
 388                                           max_entries);
 389    brw->shader_time.cumulative = rzalloc_array(brw, struct shader_times,
 390                                                max_entries);
 391    brw->shader_time.max_entries = max_entries;
 392 }
 393
 /* qsort() comparator over an array of pointers to uint64_t values: orders
  * the pointed-to values ascending and returns -1, 0 or 1.
  */
 static int
 compare_time(const void *a, const void *b)
 {
    const uint64_t lhs = **(uint64_t * const *)a;
    const uint64_t rhs = **(uint64_t * const *)b;

    /* Compare rather than subtract: a 64-bit difference would not fit the
     * int return value.
     */
    return (lhs > rhs) - (lhs < rhs);
 }
 408
 /**
  * Print one line of the shader time report to stderr.
  *
  * \param stage       label for the first column
  * \param name        label for the second column
  * \param shader_num  ID to print; 0 leaves the ID column blank
  * \param time        cycle count for this line
  * \param total       cycle count the percentage is computed against
  */
 static void
 print_shader_time_line(const char *stage, const char *name,
                        int shader_num, uint64_t time, uint64_t total)
 {
    const double cycles = (double)time;

    fprintf(stderr, "%-6s%-18s", stage, name);

    if (shader_num == 0)
       fprintf(stderr, "    : ");
    else
       fprintf(stderr, "%4d: ", shader_num);

    fprintf(stderr, "%16lld (%7.2f Gcycles)      %4.1f%%\n",
            (long long)time,
            cycles / 1000000000.0,
            cycles / total * 100.0);
 }
 425
 426 static void
 427 brw_report_shader_time(struct brw_context *brw)
 428 {
 429    if (!brw->shader_time.bo || !brw->shader_time.num_entries)
 430       return;
 431
 432    uint64_t scaled[brw->shader_time.num_entries];
 433    uint64_t *sorted[brw->shader_time.num_entries];
 434    uint64_t total_by_type[ST_CS + 1];
 435    memset(total_by_type, 0, sizeof(total_by_type));
 436    double total = 0;
 437    for (int i = 0; i < brw->shader_time.num_entries; i++) {
 438       uint64_t written = 0, reset = 0;
 439       enum shader_time_shader_type type = brw->shader_time.types[i];
 440
 441       sorted[i] = &scaled[i];
 442
 443       switch (type) {
 444       case ST_VS:
 445       case ST_TCS:
 446       case ST_TES:
 447       case ST_GS:
 448       case ST_FS8:
 449       case ST_FS16:
 450       case ST_CS:
 451          written = brw->shader_time.cumulative[i].written;
 452          reset = brw->shader_time.cumulative[i].reset;
 453          break;
 454
 455       default:
 456          /* I sometimes want to print things that aren't the 3 shader times.
 457           * Just print the sum in that case.
 458           */
 459          written = 1;
 460          reset = 0;
 461          break;
 462       }
 463
 464       uint64_t time = brw->shader_time.cumulative[i].time;
 465       if (written) {
 466          scaled[i] = time / written * (written + reset);
 467       } else {
 468          scaled[i] = time;
 469       }
 470
 471       switch (type) {
 472       case ST_VS:
 473       case ST_TCS:
 474       case ST_TES:
 475       case ST_GS:
 476       case ST_FS8:
 477       case ST_FS16:
 478       case ST_CS:
 479          total_by_type[type] += scaled[i];
 480          break;
 481       default:
 482          break;
 483       }
 484
 485       total += scaled[i];
 486    }
 487
 488    if (total == 0) {
 489       fprintf(stderr, "No shader time collected yet\n");
 490       return;
 491    }
 492
 493    qsort(sorted, brw->shader_time.num_entries, sizeof(sorted[0]), compare_time);
 494
 495    fprintf(stderr, "\n");
 496    fprintf(stderr, "type          ID                  cycles spent                   %% of total\n");
 497    for (int s = 0; s < brw->shader_time.num_entries; s++) {
 498       const char *stage;
 499       /* Work back from the sorted pointers times to a time to print. */
 500       int i = sorted[s] - scaled;
 501
 502       if (scaled[i] == 0)
 503          continue;
 504
 505       int shader_num = brw->shader_time.ids[i];
 506       const char *shader_name = brw->shader_time.names[i];
 507
 508       switch (brw->shader_time.types[i]) {
 509       case ST_VS:
 510          stage = "vs";
 511          break;
 512       case ST_TCS:
 513          stage = "tcs";
 514          break;
 515       case ST_TES:
 516          stage = "tes";
 517          break;
 518       case ST_GS:
 519          stage = "gs";
 520          break;
 521       case ST_FS8:
 522          stage = "fs8";
 523          break;
 524       case ST_FS16:
 525          stage = "fs16";
 526          break;
 527       case ST_CS:
 528          stage = "cs";
 529          break;
 530       default:
 531          stage = "other";
 532          break;
 533       }
 534
 535       print_shader_time_line(stage, shader_name, shader_num,
 536                              scaled[i], total);
 537    }
 538
 539    fprintf(stderr, "\n");
 540    print_shader_time_line("total", "vs", 0, total_by_type[ST_VS], total);
 541    print_shader_time_line("total", "tcs", 0, total_by_type[ST_TCS], total);
 542    print_shader_time_line("total", "tes", 0, total_by_type[ST_TES], total);
 543    print_shader_time_line("total", "gs", 0, total_by_type[ST_GS], total);
 544    print_shader_time_line("total", "fs8", 0, total_by_type[ST_FS8], total);
 545    print_shader_time_line("total", "fs16", 0, total_by_type[ST_FS16], total);
 546    print_shader_time_line("total", "cs", 0, total_by_type[ST_CS], total);
 547 }
 548
 549 static void
 550 brw_collect_shader_time(struct brw_context *brw)
 551 {
 552    if (!brw->shader_time.bo)
 553       return;
 554
 555    /* This probably stalls on the last rendering.  We could fix that by
 556     * delaying reading the reports, but it doesn't look like it's a big
 557     * overhead compared to the cost of tracking the time in the first place.
 558     */
 559    drm_intel_bo_map(brw->shader_time.bo, true);
 560    void *bo_map = brw->shader_time.bo->virtual;
 561
 562    for (int i = 0; i < brw->shader_time.num_entries; i++) {
 563       uint32_t *times = bo_map + i * 3 * SHADER_TIME_STRIDE;
 564
 565       brw->shader_time.cumulative[i].time += times[SHADER_TIME_STRIDE * 0 / 4];
 566       brw->shader_time.cumulative[i].written += times[SHADER_TIME_STRIDE * 1 / 4];
 567       brw->shader_time.cumulative[i].reset += times[SHADER_TIME_STRIDE * 2 / 4];
 568    }
 569
 570    /* Zero the BO out to clear it out for our next collection.
 571     */
 572    memset(bo_map, 0, brw->shader_time.bo->size);
 573    drm_intel_bo_unmap(brw->shader_time.bo);
 574 }
 575
 576 void
 577 brw_collect_and_report_shader_time(struct brw_context *brw)
 578 {
 579    brw_collect_shader_time(brw);
 580
 581    if (brw->shader_time.report_time == 0 ||
 582        get_time() - brw->shader_time.report_time >= 1.0) {
 583       brw_report_shader_time(brw);
 584       brw->shader_time.report_time = get_time();
 585    }
 586 }
 587
 588 /**
 589  * Chooses an index in the shader_time buffer and sets up tracking information
 590  * for our printouts.
 591  *
 592  * Note that this holds on to references to the underlying programs, which may
 593  * change their lifetimes compared to normal operation.
 594  */
 595 int
 596 brw_get_shader_time_index(struct brw_context *brw,
 597                           struct gl_shader_program *shader_prog,
 598                           struct gl_program *prog,
 599                           enum shader_time_shader_type type)
 600 {
 601    int shader_time_index = brw->shader_time.num_entries++;
 602    assert(shader_time_index < brw->shader_time.max_entries);
 603    brw->shader_time.types[shader_time_index] = type;
 604
 605    int id = shader_prog ? shader_prog->Name : prog->Id;
 606    const char *name;
 607    if (id == 0) {
 608       name = "ff";
 609    } else if (!shader_prog) {
 610       name = "prog";
 611    } else if (shader_prog->Label) {
 612       name = ralloc_strdup(brw->shader_time.names, shader_prog->Label);
 613    } else {
 614       name = "glsl";
 615    }
 616
 617    brw->shader_time.names[shader_time_index] = name;
 618    brw->shader_time.ids[shader_time_index] = id;
 619
 620    return shader_time_index;
 621 }
 622
 623 void
 624 brw_destroy_shader_time(struct brw_context *brw)
 625 {
 626    drm_intel_bo_unreference(brw->shader_time.bo);
 627    brw->shader_time.bo = NULL;
 628 }
 629
 630 void
 631 brw_stage_prog_data_free(const void *p)
 632 {
 633    struct brw_stage_prog_data *prog_data = (struct brw_stage_prog_data *)p;
 634
 635    ralloc_free(prog_data->param);
 636    ralloc_free(prog_data->pull_param);
 637    ralloc_free(prog_data->image_param);
 638 }
 639
 640 void
 641 brw_dump_ir(const char *stage, struct gl_shader_program *shader_prog,
 642             struct gl_linked_shader *shader, struct gl_program *prog)
 643 {
 644    if (shader_prog) {
 645       if (shader->ir) {
 646          fprintf(stderr,
 647                  "GLSL IR for native %s shader %d:\n",
 648                  stage, shader_prog->Name);
 649          _mesa_print_ir(stderr, shader->ir, NULL);
 650          fprintf(stderr, "\n\n");
 651       }
 652    } else {
 653       fprintf(stderr, "ARB_%s_program %d ir for native %s shader\n",
 654               stage, prog->Id, stage);
 655       _mesa_print_program(prog);
 656    }
 657 }
 658
 659 void
 660 brw_setup_tex_for_precompile(struct brw_context *brw,
 661                              struct brw_sampler_prog_key_data *tex,
 662                              struct gl_program *prog)
 663 {
 664    const bool has_shader_channel_select = brw->is_haswell || brw->gen >= 8;
 665    unsigned sampler_count = util_last_bit(prog->SamplersUsed);
 666    for (unsigned i = 0; i < sampler_count; i++) {
 667       if (!has_shader_channel_select && (prog->ShadowSamplers & (1 << i))) {
 668          /* Assume DEPTH_TEXTURE_MODE is the default: X, X, X, 1 */
 669          tex->swizzles[i] =
 670             MAKE_SWIZZLE4(SWIZZLE_X, SWIZZLE_X, SWIZZLE_X, SWIZZLE_ONE);
 671       } else {
 672          /* Color sampler: assume no swizzling. */
 673          tex->swizzles[i] = SWIZZLE_XYZW;
 674       }
 675    }
 676 }