src/mesa/state_tracker/st_program.c

   1 /**************************************************************************
   2  *
   3  * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
   4  * All Rights Reserved.
   5  *
   6  * Permission is hereby granted, free of charge, to any person obtaining a
   7  * copy of this software and associated documentation files (the
   8  * "Software"), to deal in the Software without restriction, including
   9  * without limitation the rights to use, copy, modify, merge, publish,
  10  * distribute, sub license, and/or sell copies of the Software, and to
  11  * permit persons to whom the Software is furnished to do so, subject to
  12  * the following conditions:
  13  *
  14  * The above copyright notice and this permission notice (including the
  15  * next paragraph) shall be included in all copies or substantial portions
  16  * of the Software.
  17  *
  18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  19  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
  21  * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
  22  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
  23  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
  24  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  25  *
  26  **************************************************************************/
  27  /*
  28   * Authors:
  29   *   Keith Whitwell <keith@tungstengraphics.com>
  30   *   Brian Paul
  31   */
  32
  33
  34 #include "main/imports.h"
  35 #include "main/mtypes.h"
  36 #include "shader/prog_print.h"
  37 #include "shader/programopt.h"
  38
  39 #include "pipe/p_context.h"
  40 #include "pipe/p_defines.h"
  41 #include "pipe/p_shader_tokens.h"
  42 #include "draw/draw_context.h"
  43 #include "tgsi/tgsi_dump.h"
  44
  45 #include "st_debug.h"
  46 #include "st_context.h"
  47 #include "st_atom.h"
  48 #include "st_program.h"
  49 #include "st_mesa_to_tgsi.h"
  50 #include "cso_cache/cso_context.h"
  51
  52
  53
  54 /**
  55  * Clean out any old compilations:
  56  */
  57 void
  58 st_vp_release_varients( struct st_context *st,
  59                         struct st_vertex_program *stvp )
  60 {
  61    struct st_vp_varient *vpv;
  62
  63    for (vpv = stvp->varients; vpv; ) {
  64       struct st_vp_varient *next = vpv->next;
  65
  66       if (vpv->driver_shader)
  67          cso_delete_vertex_shader(st->cso_context, vpv->driver_shader);
  68
  69       if (vpv->draw_shader)
  70          draw_delete_vertex_shader( st->draw, vpv->draw_shader );
  71
  72       if (vpv->state.tokens)
  73          st_free_tokens(vpv->state.tokens);
  74
  75       FREE( vpv );
  76
  77       vpv = next;
  78    }
  79
  80    stvp->varients = NULL;
  81 }
  82
  83
  84
  85
  86 /**
  87  * Translate a Mesa vertex shader into a TGSI shader.
  88  * \param outputMapping  to map vertex program output registers (VERT_RESULT_x)
  89  *       to TGSI output slots
  90  * \param tokensOut  destination for TGSI tokens
  91  * \return  pointer to cached pipe_shader object.
  92  */
  93 void
  94 st_prepare_vertex_program(struct st_context *st,
  95                             struct st_vertex_program *stvp)
  96 {
  97    GLuint attr;
  98
  99    stvp->num_inputs = 0;
 100    stvp->num_outputs = 0;
 101
 102    if (stvp->Base.IsPositionInvariant)
 103       _mesa_insert_mvp_code(st->ctx, &stvp->Base);
 104
 105    assert(stvp->Base.Base.NumInstructions > 1);
 106
 107    /*
 108     * Determine number of inputs, the mappings between VERT_ATTRIB_x
 109     * and TGSI generic input indexes, plus input attrib semantic info.
 110     */
 111    for (attr = 0; attr < VERT_ATTRIB_MAX; attr++) {
 112       if (stvp->Base.Base.InputsRead & (1 << attr)) {
 113          stvp->input_to_index[attr] = stvp->num_inputs;
 114          stvp->index_to_input[stvp->num_inputs] = attr;
 115          stvp->num_inputs++;
 116       }
 117    }
 118    /* bit of a hack, presetup potentially unused edgeflag input */
 119    stvp->input_to_index[VERT_ATTRIB_EDGEFLAG] = stvp->num_inputs;
 120    stvp->index_to_input[stvp->num_inputs] = VERT_ATTRIB_EDGEFLAG;
 121
 122    /* Compute mapping of vertex program outputs to slots.
 123     */
 124    for (attr = 0; attr < VERT_RESULT_MAX; attr++) {
 125       if ((stvp->Base.Base.OutputsWritten & (1 << attr)) == 0) {
 126          stvp->result_to_output[attr] = ~0;
 127       }
 128       else {
 129          unsigned slot = stvp->num_outputs++;
 130
 131          stvp->result_to_output[attr] = slot;
 132
 133          switch (attr) {
 134          case VERT_RESULT_HPOS:
 135             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_POSITION;
 136             stvp->output_semantic_index[slot] = 0;
 137             break;
 138          case VERT_RESULT_COL0:
 139             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
 140             stvp->output_semantic_index[slot] = 0;
 141             break;
 142          case VERT_RESULT_COL1:
 143             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
 144             stvp->output_semantic_index[slot] = 1;
 145             break;
 146          case VERT_RESULT_BFC0:
 147             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_BCOLOR;
 148             stvp->output_semantic_index[slot] = 0;
 149             break;
 150          case VERT_RESULT_BFC1:
 151             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_BCOLOR;
 152             stvp->output_semantic_index[slot] = 1;
 153             break;
 154          case VERT_RESULT_FOGC:
 155             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_FOG;
 156             stvp->output_semantic_index[slot] = 0;
 157             break;
 158          case VERT_RESULT_PSIZ:
 159             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_PSIZE;
 160             stvp->output_semantic_index[slot] = 0;
 161             break;
 162          case VERT_RESULT_EDGE:
 163             assert(0);
 164             break;
 165
 166          case VERT_RESULT_TEX0:
 167          case VERT_RESULT_TEX1:
 168          case VERT_RESULT_TEX2:
 169          case VERT_RESULT_TEX3:
 170          case VERT_RESULT_TEX4:
 171          case VERT_RESULT_TEX5:
 172          case VERT_RESULT_TEX6:
 173          case VERT_RESULT_TEX7:
 174             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
 175             stvp->output_semantic_index[slot] = attr - VERT_RESULT_TEX0;
 176             break;
 177
 178          case VERT_RESULT_VAR0:
 179          default:
 180             assert(attr < VERT_RESULT_MAX);
 181             stvp->output_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
 182             stvp->output_semantic_index[slot] = (FRAG_ATTRIB_VAR0 -
 183                                                 FRAG_ATTRIB_TEX0 +
 184                                                 attr -
 185                                                 VERT_RESULT_VAR0);
 186             break;
 187          }
 188       }
 189    }
 190    /* similar hack to above, presetup potentially unused edgeflag output */
 191    stvp->result_to_output[VERT_RESULT_EDGE] = stvp->num_outputs;
 192    stvp->output_semantic_name[stvp->num_outputs] = TGSI_SEMANTIC_EDGEFLAG;
 193    stvp->output_semantic_index[stvp->num_outputs] = 0;
 194 }
 195
 196
 197 struct st_vp_varient *
 198 st_translate_vertex_program(struct st_context *st,
 199                             struct st_vertex_program *stvp,
 200                             const struct st_vp_varient_key *key)
 201 {
 202    struct st_vp_varient *vpv = CALLOC_STRUCT(st_vp_varient);
 203    struct pipe_context *pipe = st->pipe;
 204    struct ureg_program *ureg;
 205    enum pipe_error error;
 206    unsigned num_outputs;
 207
 208    ureg = ureg_create( TGSI_PROCESSOR_VERTEX );
 209    if (ureg == NULL)
 210       return NULL;
 211
 212    vpv->num_inputs = stvp->num_inputs;
 213    num_outputs = stvp->num_outputs;
 214    if (key->passthrough_edgeflags) {
 215       vpv->num_inputs++;
 216       num_outputs++;
 217    }
 218
 219    error =
 220       st_translate_mesa_program(st->ctx,
 221                                 TGSI_PROCESSOR_VERTEX,
 222                                 ureg,
 223                                 &stvp->Base.Base,
 224                                 /* inputs */
 225                                 vpv->num_inputs,
 226                                 stvp->input_to_index,
 227                                 NULL, /* input semantic name */
 228                                 NULL, /* input semantic index */
 229                                 NULL,
 230                                 /* outputs */
 231                                 num_outputs,
 232                                 stvp->result_to_output,
 233                                 stvp->output_semantic_name,
 234                                 stvp->output_semantic_index,
 235                                 key->passthrough_edgeflags );
 236
 237    if (error)
 238       goto fail;
 239
 240    vpv->state.tokens = ureg_get_tokens( ureg, NULL );
 241    if (!vpv->state.tokens)
 242       goto fail;
 243
 244    ureg_destroy( ureg );
 245
 246    vpv->driver_shader = pipe->create_vs_state(pipe, &vpv->state);
 247
 248    if ((ST_DEBUG & DEBUG_TGSI) && (ST_DEBUG & DEBUG_MESA)) {
 249       _mesa_print_program(&stvp->Base.Base);
 250       debug_printf("\n");
 251    }
 252
 253    if (ST_DEBUG & DEBUG_TGSI) {
 254       tgsi_dump( vpv->state.tokens, 0 );
 255       debug_printf("\n");
 256    }
 257
 258    return vpv;
 259
 260 fail:
 261    debug_printf("%s: failed to translate Mesa program:\n", __FUNCTION__);
 262    _mesa_print_program(&stvp->Base.Base);
 263    debug_assert(0);
 264
 265    ureg_destroy( ureg );
 266    return NULL;
 267 }
 268
 269
 270
 271 /**
 272  * Translate a Mesa fragment shader into a TGSI shader.
 273  * \param inputMapping  to map fragment program input registers to TGSI
 274  *                      input slots
 275  * \return  pointer to cached pipe_shader object.
 276  */
 277 void
 278 st_translate_fragment_program(struct st_context *st,
 279                               struct st_fragment_program *stfp,
 280                               const GLuint inputMapping[])
 281 {
 282    struct pipe_context *pipe = st->pipe;
 283    GLuint outputMapping[FRAG_RESULT_MAX];
 284    GLuint defaultInputMapping[FRAG_ATTRIB_MAX];
 285    GLuint interpMode[16];  /* XXX size? */
 286    GLuint attr;
 287    enum pipe_error error;
 288    const GLbitfield inputsRead = stfp->Base.Base.InputsRead;
 289    struct ureg_program *ureg;
 290    GLuint vslot = 0;
 291
 292    uint fs_num_inputs = 0;
 293
 294    ubyte fs_output_semantic_name[PIPE_MAX_SHADER_OUTPUTS];
 295    ubyte fs_output_semantic_index[PIPE_MAX_SHADER_OUTPUTS];
 296    uint fs_num_outputs = 0;
 297
 298    /* which vertex output goes to the first fragment input: */
 299    if (inputsRead & FRAG_BIT_WPOS)
 300       vslot = 0;
 301    else
 302       vslot = 1;
 303
 304    /*
 305     * Convert Mesa program inputs to TGSI input register semantics.
 306     */
 307    for (attr = 0; attr < FRAG_ATTRIB_MAX; attr++) {
 308       if (inputsRead & (1 << attr)) {
 309          const GLuint slot = fs_num_inputs;
 310
 311          defaultInputMapping[attr] = slot;
 312
 313          stfp->input_map[slot] = vslot++;
 314
 315          fs_num_inputs++;
 316
 317          switch (attr) {
 318          case FRAG_ATTRIB_WPOS:
 319             stfp->input_semantic_name[slot] = TGSI_SEMANTIC_POSITION;
 320             stfp->input_semantic_index[slot] = 0;
 321             interpMode[slot] = TGSI_INTERPOLATE_LINEAR;
 322             break;
 323          case FRAG_ATTRIB_COL0:
 324             stfp->input_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
 325             stfp->input_semantic_index[slot] = 0;
 326             interpMode[slot] = TGSI_INTERPOLATE_LINEAR;
 327             break;
 328          case FRAG_ATTRIB_COL1:
 329             stfp->input_semantic_name[slot] = TGSI_SEMANTIC_COLOR;
 330             stfp->input_semantic_index[slot] = 1;
 331             interpMode[slot] = TGSI_INTERPOLATE_LINEAR;
 332             break;
 333          case FRAG_ATTRIB_FOGC:
 334             stfp->input_semantic_name[slot] = TGSI_SEMANTIC_FOG;
 335             stfp->input_semantic_index[slot] = 0;
 336             interpMode[slot] = TGSI_INTERPOLATE_PERSPECTIVE;
 337             break;
 338          case FRAG_ATTRIB_FACE:
 339             stfp->input_semantic_name[slot] = TGSI_SEMANTIC_FACE;
 340             stfp->input_semantic_index[slot] = 0;
 341             interpMode[slot] = TGSI_INTERPOLATE_CONSTANT;
 342             break;
 343
 344             /* In most cases, there is nothing special about these
 345              * inputs, so adopt a convention to use the generic
 346              * semantic name and the mesa FRAG_ATTRIB_ number as the
 347              * index.
 348              *
 349              * All that is required is that the vertex shader labels
 350              * its own outputs similarly, and that the vertex shader
 351              * generates at least every output required by the
 352              * fragment shader plus fixed-function hardware (such as
 353              * BFC).
 354              *
 355              * There is no requirement that semantic indexes start at
 356              * zero or be restricted to a particular range -- nobody
 357              * should be building tables based on semantic index.
 358              */
 359          case FRAG_ATTRIB_TEX0:
 360          case FRAG_ATTRIB_TEX1:
 361          case FRAG_ATTRIB_TEX2:
 362          case FRAG_ATTRIB_TEX3:
 363          case FRAG_ATTRIB_TEX4:
 364          case FRAG_ATTRIB_TEX5:
 365          case FRAG_ATTRIB_TEX6:
 366          case FRAG_ATTRIB_TEX7:
 367          case FRAG_ATTRIB_PNTC:
 368          case FRAG_ATTRIB_VAR0:
 369          default:
 370             /* Actually, let's try and zero-base this just for
 371              * readability of the generated TGSI.
 372              */
 373             assert(attr >= FRAG_ATTRIB_TEX0);
 374             stfp->input_semantic_index[slot] = (attr - FRAG_ATTRIB_TEX0);
 375             stfp->input_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
 376             interpMode[slot] = TGSI_INTERPOLATE_PERSPECTIVE;
 377             break;
 378          }
 379       }
 380    }
 381
 382    /*
 383     * Semantics and mapping for outputs
 384     */
 385    {
 386       uint numColors = 0;
 387       GLbitfield64 outputsWritten = stfp->Base.Base.OutputsWritten;
 388
 389       /* if z is written, emit that first */
 390       if (outputsWritten & (1 << FRAG_RESULT_DEPTH)) {
 391          fs_output_semantic_name[fs_num_outputs] = TGSI_SEMANTIC_POSITION;
 392          fs_output_semantic_index[fs_num_outputs] = 0;
 393          outputMapping[FRAG_RESULT_DEPTH] = fs_num_outputs;
 394          fs_num_outputs++;
 395          outputsWritten &= ~(1 << FRAG_RESULT_DEPTH);
 396       }
 397
 398       /* handle remaning outputs (color) */
 399       for (attr = 0; attr < FRAG_RESULT_MAX; attr++) {
 400          if (outputsWritten & (1 << attr)) {
 401             switch (attr) {
 402             case FRAG_RESULT_DEPTH:
 403                /* handled above */
 404                assert(0);
 405                break;
 406             default:
 407                assert(attr == FRAG_RESULT_COLOR ||
 408                       (FRAG_RESULT_DATA0 <= attr && attr < FRAG_RESULT_MAX));
 409                fs_output_semantic_name[fs_num_outputs] = TGSI_SEMANTIC_COLOR;
 410                fs_output_semantic_index[fs_num_outputs] = numColors;
 411                outputMapping[attr] = fs_num_outputs;
 412                numColors++;
 413                break;
 414             }
 415
 416             fs_num_outputs++;
 417          }
 418       }
 419    }
 420
 421    if (!inputMapping)
 422       inputMapping = defaultInputMapping;
 423
 424    ureg = ureg_create( TGSI_PROCESSOR_FRAGMENT );
 425    if (ureg == NULL)
 426       return;
 427
 428
 429    error =
 430       st_translate_mesa_program(st->ctx,
 431                                 TGSI_PROCESSOR_FRAGMENT,
 432                                 ureg,
 433                                 &stfp->Base.Base,
 434                                 /* inputs */
 435                                 fs_num_inputs,
 436                                 inputMapping,
 437                                 stfp->input_semantic_name,
 438                                 stfp->input_semantic_index,
 439                                 interpMode,
 440                                 /* outputs */
 441                                 fs_num_outputs,
 442                                 outputMapping,
 443                                 fs_output_semantic_name,
 444                                 fs_output_semantic_index, FALSE );
 445
 446    stfp->state.tokens = ureg_get_tokens( ureg, NULL );
 447    ureg_destroy( ureg );
 448    stfp->driver_shader = pipe->create_fs_state(pipe, &stfp->state);
 449
 450    if ((ST_DEBUG & DEBUG_TGSI) && (ST_DEBUG & DEBUG_MESA)) {
 451       _mesa_print_program(&stfp->Base.Base);
 452       debug_printf("\n");
 453    }
 454
 455    if (ST_DEBUG & DEBUG_TGSI) {
 456       tgsi_dump( stfp->state.tokens, 0/*TGSI_DUMP_VERBOSE*/ );
 457       debug_printf("\n");
 458    }
 459 }
 460
 461
 462 /**
 463  * Debug- print current shader text
 464  */
 465 void
 466 st_print_shaders(GLcontext *ctx)
 467 {
 468    struct gl_shader_program *shProg = ctx->Shader.CurrentProgram;
 469    if (shProg) {
 470       GLuint i;
 471       for (i = 0; i < shProg->NumShaders; i++) {
 472          printf("GLSL shader %u of %u:\n", i, shProg->NumShaders);
 473          printf("%s\n", shProg->Shaders[i]->Source);
 474       }
 475    }
 476 }