src/gallium/drivers/svga/svga_state_framebuffer.c

   1 /**********************************************************
   2  * Copyright 2008-2009 VMware, Inc.  All rights reserved.
   3  *
   4  * Permission is hereby granted, free of charge, to any person
   5  * obtaining a copy of this software and associated documentation
   6  * files (the "Software"), to deal in the Software without
   7  * restriction, including without limitation the rights to use, copy,
   8  * modify, merge, publish, distribute, sublicense, and/or sell copies
   9  * of the Software, and to permit persons to whom the Software is
  10  * furnished to do so, subject to the following conditions:
  11  *
  12  * The above copyright notice and this permission notice shall be
  13  * included in all copies or substantial portions of the Software.
  14  *
  15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  16  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  17  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  18  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  19  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  20  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  21  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  22  * SOFTWARE.
  23  *
  24  **********************************************************/
  25
  26 #include "util/u_inlines.h"
  27 #include "pipe/p_defines.h"
  28 #include "util/u_math.h"
  29
  30 #include "svga_context.h"
  31 #include "svga_state.h"
  32 #include "svga_cmd.h"
  33 #include "svga_debug.h"
  34 #include "svga_screen.h"
  35
  36
  37 /*
  38  * flush our command buffer after the 8th distinct render target
  39  *
  40  * This helps improve the surface cache behaviour in the face of the
  41  * large number of single-use render targets generated by EXA and the xorg
  42  * state tracker.  Without this we can reference hundreds of individual
  43  * render targets from a command buffer, which leaves little scope for
  44  * sharing or reuse of those targets.
  45  */
  46 #define MAX_RT_PER_BATCH 8
  47
  48
  49 /***********************************************************************
  50  * Hardware state update
  51  */
  52
  53
  54 static enum pipe_error
  55 emit_framebuffer( struct svga_context *svga,
  56                   unsigned dirty )
  57 {
  58    struct svga_screen *svgascreen = svga_screen(svga->pipe.screen);
  59    const struct pipe_framebuffer_state *curr = &svga->curr.framebuffer;
  60    struct pipe_framebuffer_state *hw = &svga->state.hw_clear.framebuffer;
  61    boolean reemit = svga->rebind.rendertargets;
  62    unsigned i;
  63    enum pipe_error ret;
  64
  65    /*
  66     * We need to reemit non-null surface bindings, even when they are not
  67     * dirty, to ensure that the resources are paged in.
  68     */
  69
  70    for (i = 0; i < svgascreen->max_color_buffers; i++) {
  71       if (curr->cbufs[i] != hw->cbufs[i] ||
  72           (reemit && hw->cbufs[i])) {
  73          if (svga->curr.nr_fbs++ > MAX_RT_PER_BATCH)
  74             return PIPE_ERROR_OUT_OF_MEMORY;
  75
  76          ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_COLOR0 + i,
  77                                       curr->cbufs[i]);
  78          if (ret != PIPE_OK)
  79             return ret;
  80
  81          pipe_surface_reference(&hw->cbufs[i], curr->cbufs[i]);
  82       }
  83    }
  84
  85    if (curr->zsbuf != hw->zsbuf ||
  86        (reemit && hw->zsbuf)) {
  87       ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_DEPTH, curr->zsbuf);
  88       if (ret != PIPE_OK)
  89          return ret;
  90
  91       if (curr->zsbuf &&
  92           curr->zsbuf->format == PIPE_FORMAT_S8_UINT_Z24_UNORM) {
  93          ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_STENCIL,
  94                                       curr->zsbuf);
  95          if (ret != PIPE_OK)
  96             return ret;
  97       }
  98       else {
  99          ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_STENCIL, NULL);
 100          if (ret != PIPE_OK)
 101             return ret;
 102       }
 103
 104       pipe_surface_reference(&hw->zsbuf, curr->zsbuf);
 105    }
 106
 107    svga->rebind.rendertargets = FALSE;
 108
 109    return PIPE_OK;
 110 }
 111
 112
 113 /*
 114  * Rebind rendertargets.
 115  *
 116  * Similar to emit_framebuffer, but without any state checking/update.
 117  *
 118  * Called at the beginning of every new command buffer to ensure that
 119  * non-dirty rendertargets are properly paged-in.
 120  */
 121 enum pipe_error
 122 svga_reemit_framebuffer_bindings(struct svga_context *svga)
 123 {
 124    struct svga_screen *svgascreen = svga_screen(svga->pipe.screen);
 125    struct pipe_framebuffer_state *hw = &svga->state.hw_clear.framebuffer;
 126    unsigned i;
 127    enum pipe_error ret;
 128
 129    assert(svga->rebind.rendertargets);
 130
 131    for (i = 0; i < svgascreen->max_color_buffers; i++) {
 132       if (hw->cbufs[i]) {
 133          ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_COLOR0 + i,
 134                                       hw->cbufs[i]);
 135          if (ret != PIPE_OK) {
 136             return ret;
 137          }
 138       }
 139    }
 140
 141    if (hw->zsbuf) {
 142       ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_DEPTH, hw->zsbuf);
 143       if (ret != PIPE_OK) {
 144          return ret;
 145       }
 146
 147       if (hw->zsbuf &&
 148           hw->zsbuf->format == PIPE_FORMAT_S8_UINT_Z24_UNORM) {
 149          ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_STENCIL, hw->zsbuf);
 150          if (ret != PIPE_OK) {
 151             return ret;
 152          }
 153       }
 154       else {
 155          ret = SVGA3D_SetRenderTarget(svga->swc, SVGA3D_RT_STENCIL, NULL);
 156          if (ret != PIPE_OK) {
 157             return ret;
 158          }
 159       }
 160    }
 161
 162    svga->rebind.rendertargets = FALSE;
 163
 164    return PIPE_OK;
 165 }
 166
 167
 168 struct svga_tracked_state svga_hw_framebuffer =
 169 {
 170    "hw framebuffer state",
 171    SVGA_NEW_FRAME_BUFFER,
 172    emit_framebuffer
 173 };
 174
 175
 176
 177
 178 /***********************************************************************
 179  */
 180
 181 static enum pipe_error
 182 emit_viewport( struct svga_context *svga,
 183                unsigned dirty )
 184 {
 185    const struct pipe_viewport_state *viewport = &svga->curr.viewport;
 186    struct svga_prescale prescale;
 187    SVGA3dRect rect;
 188    /* Not sure if this state is relevant with POSITIONT.  Probably
 189     * not, but setting to 0,1 avoids some state pingponging.
 190     */
 191    float range_min = 0.0;
 192    float range_max = 1.0;
 193    float flip = -1.0;
 194    boolean degenerate = FALSE;
 195    boolean invertY = FALSE;
 196    enum pipe_error ret;
 197
 198    float fb_width = (float) svga->curr.framebuffer.width;
 199    float fb_height = (float) svga->curr.framebuffer.height;
 200
 201    float fx =        viewport->scale[0] * -1.0f + viewport->translate[0];
 202    float fy = flip * viewport->scale[1] * -1.0f + viewport->translate[1];
 203    float fw =        viewport->scale[0] * 2.0f;
 204    float fh = flip * viewport->scale[1] * 2.0f;
 205
 206    memset( &prescale, 0, sizeof(prescale) );
 207
 208    /* Examine gallium viewport transformation and produce a screen
 209     * rectangle and possibly vertex shader pre-transformation to
 210     * get the same results.
 211     */
 212
 213    SVGA_DBG(DEBUG_VIEWPORT,
 214             "\ninitial %f,%f %fx%f\n",
 215             fx,
 216             fy,
 217             fw,
 218             fh);
 219
 220    prescale.scale[0] = 1.0;
 221    prescale.scale[1] = 1.0;
 222    prescale.scale[2] = 1.0;
 223    prescale.scale[3] = 1.0;
 224    prescale.translate[0] = 0;
 225    prescale.translate[1] = 0;
 226    prescale.translate[2] = 0;
 227    prescale.translate[3] = 0;
 228    prescale.enabled = TRUE;
 229
 230    if (fw < 0) {
 231       prescale.scale[0] *= -1.0f;
 232       prescale.translate[0] += -fw;
 233       fw = -fw;
 234       fx = viewport->scale[0] * 1.0f + viewport->translate[0];
 235    }
 236
 237    if (fh < 0.0) {
 238       prescale.translate[1] = fh - 1.0f + fy * 2.0f;
 239       fh = -fh;
 240       fy -= fh;
 241       prescale.scale[1] = -1.0f;
 242       invertY = TRUE;
 243    }
 244
 245    if (fx < 0) {
 246       prescale.translate[0] += fx;
 247       prescale.scale[0] *= fw / (fw + fx);
 248       fw += fx;
 249       fx = 0.0f;
 250    }
 251
 252    if (fy < 0) {
 253       if (invertY) {
 254          prescale.translate[1] -= fy;
 255       }
 256       else {
 257          prescale.translate[1] += fy;
 258       }
 259       prescale.scale[1] *= fh / (fh + fy);
 260       fh += fy;
 261       fy = 0.0f;
 262    }
 263
 264    if (fx + fw > fb_width) {
 265       prescale.scale[0] *= fw / (fb_width - fx);
 266       prescale.translate[0] -= fx * (fw / (fb_width - fx));
 267       prescale.translate[0] += fx;
 268       fw = fb_width - fx;
 269    }
 270
 271    if (fy + fh > fb_height) {
 272       prescale.scale[1] *= fh / (fb_height - fy);
 273       if (invertY) {
 274          float in = fb_height - fy;       /* number of vp pixels inside view */
 275          float out = fy + fh - fb_height; /* number of vp pixels out of view */
 276          prescale.translate[1] += fy * out / in;
 277       }
 278       else {
 279          prescale.translate[1] -= fy * (fh / (fb_height - fy));
 280          prescale.translate[1] += fy;
 281       }
 282       fh = fb_height - fy;
 283    }
 284
 285    if (fw < 0 || fh < 0) {
 286       fw = fh = fx = fy = 0;
 287       degenerate = TRUE;
 288       goto out;
 289    }
 290
 291    /* D3D viewport is integer space.  Convert fx,fy,etc. to
 292     * integers.
 293     *
 294     * TODO: adjust pretranslate correct for any subpixel error
 295     * introduced converting to integers.
 296     */
 297    rect.x = (uint32) fx;
 298    rect.y = (uint32) fy;
 299    rect.w = (uint32) fw;
 300    rect.h = (uint32) fh;
 301
 302    SVGA_DBG(DEBUG_VIEWPORT,
 303             "viewport error %f,%f %fx%f\n",
 304             fabs((float)rect.x - fx),
 305             fabs((float)rect.y - fy),
 306             fabs((float)rect.w - fw),
 307             fabs((float)rect.h - fh));
 308
 309    SVGA_DBG(DEBUG_VIEWPORT,
 310             "viewport %d,%d %dx%d\n",
 311             rect.x,
 312             rect.y,
 313             rect.w,
 314             rect.h);
 315
 316    /* Finally, to get GL rasterization rules, need to tweak the
 317     * screen-space coordinates slightly relative to D3D which is
 318     * what hardware implements natively.
 319     */
 320    if (svga->curr.rast->templ.half_pixel_center) {
 321       float adjust_x = 0.0;
 322       float adjust_y = 0.0;
 323
 324       switch (svga->curr.reduced_prim) {
 325       case PIPE_PRIM_POINTS:
 326          adjust_x = -0.375;
 327          adjust_y = -0.75;
 328          break;
 329       case PIPE_PRIM_LINES:
 330          adjust_x = -0.5;
 331          adjust_y = 0;
 332          break;
 333       case PIPE_PRIM_TRIANGLES:
 334          adjust_x = -0.5;
 335          adjust_y = -0.5;
 336          break;
 337       }
 338
 339       if (invertY)
 340          adjust_y = -adjust_y;
 341
 342       prescale.translate[0] += adjust_x;
 343       prescale.translate[1] += adjust_y;
 344       prescale.translate[2] = 0.5; /* D3D clip space */
 345       prescale.scale[2]     = 0.5; /* D3D clip space */
 346    }
 347
 348    range_min = viewport->scale[2] * -1.0f + viewport->translate[2];
 349    range_max = viewport->scale[2] *  1.0f + viewport->translate[2];
 350
 351    /* D3D (and by implication SVGA) doesn't like dealing with zmax
 352     * less than zmin.  Detect that case, flip the depth range and
 353     * invert our z-scale factor to achieve the same effect.
 354     */
 355    if (range_min > range_max) {
 356       float range_tmp;
 357       range_tmp = range_min;
 358       range_min = range_max;
 359       range_max = range_tmp;
 360       prescale.scale[2] = -prescale.scale[2];
 361    }
 362
 363    if (prescale.enabled) {
 364       float H[2];
 365       float J[2];
 366       int i;
 367
 368       SVGA_DBG(DEBUG_VIEWPORT,
 369                "prescale %f,%f %fx%f\n",
 370                prescale.translate[0],
 371                prescale.translate[1],
 372                prescale.scale[0],
 373                prescale.scale[1]);
 374
 375       H[0] = (float)rect.w / 2.0f;
 376       H[1] = -(float)rect.h / 2.0f;
 377       J[0] = (float)rect.x + (float)rect.w / 2.0f;
 378       J[1] = (float)rect.y + (float)rect.h / 2.0f;
 379
 380       SVGA_DBG(DEBUG_VIEWPORT,
 381                "H %f,%f\n"
 382                "J %fx%f\n",
 383                H[0],
 384                H[1],
 385                J[0],
 386                J[1]);
 387
 388       /* Adjust prescale to take into account the fact that it is
 389        * going to be applied prior to the perspective divide and
 390        * viewport transformation.
 391        *
 392        * Vwin = H(Vc/Vc.w) + J
 393        *
 394        * We want to tweak Vwin with scale and translation from above,
 395        * as in:
 396        *
 397        * Vwin' = S Vwin + T
 398        *
 399        * But we can only modify the values at Vc.  Plugging all the
 400        * above together, and rearranging, eventually we get:
 401        *
 402        *   Vwin' = H(Vc'/Vc'.w) + J
 403        * where:
 404        *   Vc' = SVc + KVc.w
 405        *   K = (T + (S-1)J) / H
 406        *
 407        * Overwrite prescale.translate with values for K:
 408        */
 409       for (i = 0; i < 2; i++) {
 410          prescale.translate[i] = ((prescale.translate[i] +
 411                                    (prescale.scale[i] - 1.0f) * J[i]) / H[i]);
 412       }
 413
 414       SVGA_DBG(DEBUG_VIEWPORT,
 415                "clipspace %f,%f %fx%f\n",
 416                prescale.translate[0],
 417                prescale.translate[1],
 418                prescale.scale[0],
 419                prescale.scale[1]);
 420    }
 421
 422 out:
 423    if (degenerate) {
 424       rect.x = 0;
 425       rect.y = 0;
 426       rect.w = 1;
 427       rect.h = 1;
 428       prescale.enabled = FALSE;
 429    }
 430
 431    if (memcmp(&rect, &svga->state.hw_clear.viewport, sizeof(rect)) != 0) {
 432       ret = SVGA3D_SetViewport(svga->swc, &rect);
 433       if(ret != PIPE_OK)
 434          return ret;
 435
 436       memcpy(&svga->state.hw_clear.viewport, &rect, sizeof(rect));
 437       assert(sizeof(rect) == sizeof(svga->state.hw_clear.viewport));
 438    }
 439
 440    if (svga->state.hw_clear.depthrange.zmin != range_min ||
 441        svga->state.hw_clear.depthrange.zmax != range_max) {
 442       ret = SVGA3D_SetZRange(svga->swc, range_min, range_max );
 443       if(ret != PIPE_OK)
 444          return ret;
 445
 446       svga->state.hw_clear.depthrange.zmin = range_min;
 447       svga->state.hw_clear.depthrange.zmax = range_max;
 448    }
 449
 450    if (memcmp(&prescale, &svga->state.hw_clear.prescale, sizeof prescale) != 0) {
 451       svga->dirty |= SVGA_NEW_PRESCALE;
 452       svga->state.hw_clear.prescale = prescale;
 453    }
 454
 455    return PIPE_OK;
 456 }
 457
 458
 459 struct svga_tracked_state svga_hw_viewport =
 460 {
 461    "hw viewport state",
 462    ( SVGA_NEW_FRAME_BUFFER |
 463      SVGA_NEW_VIEWPORT |
 464      SVGA_NEW_RAST |
 465      SVGA_NEW_REDUCED_PRIMITIVE ),
 466    emit_viewport
 467 };
 468
 469
 470 /***********************************************************************
 471  * Scissor state
 472  */
 473 static enum pipe_error
 474 emit_scissor_rect( struct svga_context *svga,
 475                    unsigned dirty )
 476 {
 477    const struct pipe_scissor_state *scissor = &svga->curr.scissor;
 478    SVGA3dRect rect;
 479
 480    rect.x = scissor->minx;
 481    rect.y = scissor->miny;
 482    rect.w = scissor->maxx - scissor->minx; /* + 1 ?? */
 483    rect.h = scissor->maxy - scissor->miny; /* + 1 ?? */
 484
 485    return SVGA3D_SetScissorRect(svga->swc, &rect);
 486 }
 487
 488
 489 struct svga_tracked_state svga_hw_scissor =
 490 {
 491    "hw scissor state",
 492    SVGA_NEW_SCISSOR,
 493    emit_scissor_rect
 494 };
 495
 496
 497 /***********************************************************************
 498  * Userclip state
 499  */
 500
 501 static enum pipe_error
 502 emit_clip_planes( struct svga_context *svga,
 503                   unsigned dirty )
 504 {
 505    unsigned i;
 506    enum pipe_error ret;
 507
 508    /* TODO: just emit directly from svga_set_clip_state()?
 509     */
 510    for (i = 0; i < SVGA3D_MAX_CLIP_PLANES; i++) {
 511       /* need to express the plane in D3D-style coordinate space.
 512        * GL coords get converted to D3D coords with the matrix:
 513        * [ 1  0  0  0 ]
 514        * [ 0 -1  0  0 ]
 515        * [ 0  0  2  0 ]
 516        * [ 0  0 -1  1 ]
 517        * Apply that matrix to our plane equation, and invert Y.
 518        */
 519       float a = svga->curr.clip.ucp[i][0];
 520       float b = svga->curr.clip.ucp[i][1];
 521       float c = svga->curr.clip.ucp[i][2];
 522       float d = svga->curr.clip.ucp[i][3];
 523       float plane[4];
 524
 525       plane[0] = a;
 526       plane[1] = b;
 527       plane[2] = 2.0f * c;
 528       plane[3] = d - c;
 529
 530       ret = SVGA3D_SetClipPlane(svga->swc, i, plane);
 531       if(ret != PIPE_OK)
 532          return ret;
 533    }
 534
 535    return PIPE_OK;
 536 }
 537
 538
 539 struct svga_tracked_state svga_hw_clip_planes =
 540 {
 541    "hw viewport state",
 542    SVGA_NEW_CLIP,
 543    emit_clip_planes
 544 };