src/mesa/drivers/dri/i965/brw_tex_layout.c

   1 /*
   2  * Copyright 2006 VMware, Inc.
   3  * Copyright © 2006 Intel Corporation
   4  *
   5  * Permission is hereby granted, free of charge, to any person obtaining
   6  * a copy of this software and associated documentation files (the
   7  * "Software"), to deal in the Software without restriction, including
   8  * without limitation the rights to use, copy, modify, merge, publish,
   9  * distribute, sublicense, and/or sell copies of the Software, and to
  10  * permit persons to whom the Software is furnished to do so, subject to
  11  * the following conditions:
  12  *
  13  * The above copyright notice and this permission notice (including the
  14  * next paragraph) shall be included in all copies or substantial
  15  * portions of the Software.
  16  *
  17  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  18  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  19  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
  20  * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
  21  * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
  22  * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
  23  * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  24  */
  25
  26 /**
  27  * \file brw_tex_layout.cpp
  28  *
  29  * Code to lay out images in a mipmap tree.
  30  *
  31  * \author Keith Whitwell <keithw@vmware.com>
  32  * \author Michel Dänzer <daenzer@vmware.com>
  33  */
  34
  35 #include "intel_mipmap_tree.h"
  36 #include "brw_context.h"
  37 #include "main/macros.h"
  38 #include "main/glformats.h"
  39
  40 #define FILE_DEBUG_FLAG DEBUG_MIPTREE
  41
  42 static unsigned int
  43 tr_mode_horizontal_texture_alignment(const struct intel_mipmap_tree *mt)
  44 {
  45    unsigned ret_align, divisor, multiplier_ys;
  46
  47    /* Values in below tables specifiy the horizontal alignment requirement
  48     * in elements for TRMODE_YF surface. An element is defined as a pixel in
  49     * uncompressed surface formats, and as a compression block in compressed
  50     * surface formats. For MSFMT_DEPTH_STENCIL type multisampled surfaces, an
  51     * element is a sample.
  52     */
  53    const unsigned align_1d_yf[] = {4096, 2048, 1024, 512, 256};
  54    const unsigned align_2d_yf[] = {64, 64, 32, 32, 16};
  55    const unsigned align_3d_yf[] = {16, 8, 8, 8, 4};
  56
  57    assert(mt->tr_mode != INTEL_MIPTREE_TRMODE_NONE);
  58
  59    /* Alignment computations below assume a power of 2 cpp. */
  60    assert (mt->cpp >= 1 && mt->cpp <= 16 && _mesa_is_pow_two(mt->cpp));
  61    /* Compute array index. */
  62    const int i = ffs(mt->cpp) - 1;
  63
  64    switch(mt->target) {
  65    case GL_TEXTURE_1D:
  66    case GL_TEXTURE_1D_ARRAY:
  67       ret_align = align_1d_yf[i];
  68       multiplier_ys = 16;
  69       break;
  70    case GL_TEXTURE_2D:
  71    case GL_TEXTURE_RECTANGLE:
  72    case GL_TEXTURE_2D_ARRAY:
  73    case GL_TEXTURE_CUBE_MAP:
  74    case GL_TEXTURE_CUBE_MAP_ARRAY:
  75    case GL_TEXTURE_2D_MULTISAMPLE:
  76    case GL_TEXTURE_2D_MULTISAMPLE_ARRAY:
  77       ret_align = align_2d_yf[i];
  78       multiplier_ys = 4;
  79       break;
  80    case GL_TEXTURE_3D:
  81       ret_align = align_3d_yf[i];
  82       multiplier_ys = 4;
  83       break;
  84    default:
  85       unreachable("not reached");
  86    }
  87
  88    if (mt->tr_mode == INTEL_MIPTREE_TRMODE_YS)
  89       ret_align *= multiplier_ys;
  90
  91    assert(_mesa_is_pow_two(mt->num_samples));
  92
  93    switch (mt->num_samples) {
  94    case 2:
  95    case 4:
  96       divisor = 2;
  97       break;
  98    case 8:
  99    case 16:
 100       divisor = 4;
 101       break;
 102    default:
 103       divisor = 1;
 104       break;
 105    }
 106    return ret_align / divisor;
 107 }
 108
 109
 110 static unsigned int
 111 intel_horizontal_texture_alignment_unit(struct brw_context *brw,
 112                                         struct intel_mipmap_tree *mt,
 113                                         uint32_t layout_flags)
 114 {
 115    if (layout_flags & MIPTREE_LAYOUT_FORCE_HALIGN16)
 116       return 16;
 117
 118    /**
 119     * +----------------------------------------------------------------------+
 120     * |                                        | alignment unit width  ("i") |
 121     * | Surface Property                       |-----------------------------|
 122     * |                                        | 915 | 965 | ILK | SNB | IVB |
 123     * +----------------------------------------------------------------------+
 124     * | YUV 4:2:2 format                       |  8  |  4  |  4  |  4  |  4  |
 125     * | BC1-5 compressed format (DXTn/S3TC)    |  4  |  4  |  4  |  4  |  4  |
 126     * | FXT1  compressed format                |  8  |  8  |  8  |  8  |  8  |
 127     * | Depth Buffer (16-bit)                  |  4  |  4  |  4  |  4  |  8  |
 128     * | Depth Buffer (other)                   |  4  |  4  |  4  |  4  |  4  |
 129     * | Separate Stencil Buffer                | N/A | N/A |  8  |  8  |  8  |
 130     * | All Others                             |  4  |  4  |  4  |  4  |  4  |
 131     * +----------------------------------------------------------------------+
 132     *
 133     * On IVB+, non-special cases can be overridden by setting the SURFACE_STATE
 134     * "Surface Horizontal Alignment" field to HALIGN_4 or HALIGN_8.
 135     */
 136
 137    if (brw->gen >= 7 && mt->format == MESA_FORMAT_Z_UNORM16)
 138       return 8;
 139
 140    return 4;
 141 }
 142
 143 static unsigned int
 144 tr_mode_vertical_texture_alignment(const struct intel_mipmap_tree *mt)
 145 {
 146    unsigned ret_align, divisor, multiplier_ys;
 147
 148    /* Vertical alignment tables for TRMODE_YF */
 149    const unsigned align_2d_yf[] = {64, 32, 32, 16, 16};
 150    const unsigned align_3d_yf[] = {16, 16, 16, 8, 8};
 151
 152    assert(mt->tr_mode != INTEL_MIPTREE_TRMODE_NONE);
 153
 154    /* Alignment computations below assume a power of 2 cpp. */
 155    assert (mt->cpp >= 1 && mt->cpp <= 16 && _mesa_is_pow_two(mt->cpp)) ;
 156    /* Compute array index. */
 157    const int i = ffs(mt->cpp) - 1;
 158
 159    switch(mt->target) {
 160    case GL_TEXTURE_2D:
 161    case GL_TEXTURE_RECTANGLE:
 162    case GL_TEXTURE_2D_ARRAY:
 163    case GL_TEXTURE_CUBE_MAP:
 164    case GL_TEXTURE_CUBE_MAP_ARRAY:
 165    case GL_TEXTURE_2D_MULTISAMPLE:
 166    case GL_TEXTURE_2D_MULTISAMPLE_ARRAY:
 167       ret_align = align_2d_yf[i];
 168       multiplier_ys = 4;
 169       break;
 170    case GL_TEXTURE_3D:
 171       ret_align = align_3d_yf[i];
 172       multiplier_ys = 2;
 173       break;
 174    case GL_TEXTURE_1D:
 175    case GL_TEXTURE_1D_ARRAY:
 176    default:
 177       unreachable("Unexpected miptree target");
 178    }
 179
 180    if (mt->tr_mode == INTEL_MIPTREE_TRMODE_YS)
 181       ret_align *= multiplier_ys;
 182
 183    assert(_mesa_is_pow_two(mt->num_samples));
 184
 185    switch (mt->num_samples) {
 186    case 4:
 187    case 8:
 188       divisor = 2;
 189       break;
 190    case 16:
 191       divisor = 4;
 192       break;
 193    default:
 194       divisor = 1;
 195       break;
 196    }
 197    return ret_align / divisor;
 198 }
 199
 200 static unsigned int
 201 intel_vertical_texture_alignment_unit(struct brw_context *brw,
 202                                       const struct intel_mipmap_tree *mt)
 203 {
 204    /**
 205     * +----------------------------------------------------------------------+
 206     * |                                        | alignment unit height ("j") |
 207     * | Surface Property                       |-----------------------------|
 208     * |                                        | 915 | 965 | ILK | SNB | IVB |
 209     * +----------------------------------------------------------------------+
 210     * | BC1-5 compressed format (DXTn/S3TC)    |  4  |  4  |  4  |  4  |  4  |
 211     * | FXT1  compressed format                |  4  |  4  |  4  |  4  |  4  |
 212     * | Depth Buffer                           |  2  |  2  |  2  |  4  |  4  |
 213     * | Separate Stencil Buffer                | N/A | N/A | N/A |  4  |  8  |
 214     * | Multisampled (4x or 8x) render target  | N/A | N/A | N/A |  4  |  4  |
 215     * | All Others                             |  2  |  2  |  2  |  *  |  *  |
 216     * +----------------------------------------------------------------------+
 217     *
 218     * Where "*" means either VALIGN_2 or VALIGN_4 depending on the setting of
 219     * the SURFACE_STATE "Surface Vertical Alignment" field.
 220     */
 221
 222    /* Broadwell only supports VALIGN of 4, 8, and 16.  The BSpec says 4
 223     * should always be used, except for stencil buffers, which should be 8.
 224     */
 225    if (brw->gen >= 8)
 226       return 4;
 227
 228    if (mt->num_samples > 1)
 229       return 4;
 230
 231    GLenum base_format = _mesa_get_format_base_format(mt->format);
 232
 233    if (brw->gen >= 6 &&
 234        (base_format == GL_DEPTH_COMPONENT ||
 235         base_format == GL_DEPTH_STENCIL)) {
 236       return 4;
 237    }
 238
 239    if (brw->gen == 7) {
 240       /* On Gen7, we prefer a vertical alignment of 4 when possible, because
 241        * that allows Y tiled render targets.
 242        *
 243        * From the Ivy Bridge PRM, Vol4 Part1 2.12.2.1 (SURFACE_STATE for most
 244        * messages), on p64, under the heading "Surface Vertical Alignment":
 245        *
 246        *     Value of 1 [VALIGN_4] is not supported for format YCRCB_NORMAL
 247        *     (0x182), YCRCB_SWAPUVY (0x183), YCRCB_SWAPUV (0x18f), YCRCB_SWAPY
 248        *     (0x190)
 249        *
 250        *     VALIGN_4 is not supported for surface format R32G32B32_FLOAT.
 251        */
 252       if (base_format == GL_YCBCR_MESA || mt->format == MESA_FORMAT_RGB_FLOAT32)
 253          return 2;
 254
 255       return 4;
 256    }
 257
 258    return 2;
 259 }
 260
 261 static void
 262 gen9_miptree_layout_1d(struct intel_mipmap_tree *mt)
 263 {
 264    unsigned x = 0;
 265    unsigned width = mt->physical_width0;
 266    unsigned depth = mt->physical_depth0; /* number of array layers. */
 267
 268    /* When this layout is used the horizontal alignment is fixed at 64 and the
 269     * hardware ignores the value given in the surface state
 270     */
 271    const unsigned int halign = 64;
 272
 273    mt->total_height = mt->physical_height0;
 274    mt->total_width = 0;
 275
 276    for (unsigned level = mt->first_level; level <= mt->last_level; level++) {
 277       unsigned img_width;
 278
 279       intel_miptree_set_level_info(mt, level, x, 0, depth);
 280
 281       img_width = ALIGN(width, halign);
 282
 283       mt->total_width = MAX2(mt->total_width, x + img_width);
 284
 285       x += img_width;
 286
 287       width = minify(width, 1);
 288    }
 289 }
 290
 291 static void
 292 brw_miptree_layout_2d(struct intel_mipmap_tree *mt)
 293 {
 294    unsigned x = 0;
 295    unsigned y = 0;
 296    unsigned width = mt->physical_width0;
 297    unsigned height = mt->physical_height0;
 298    unsigned depth = mt->physical_depth0; /* number of array layers. */
 299    unsigned int bw, bh;
 300
 301    _mesa_get_format_block_size(mt->format, &bw, &bh);
 302
 303    mt->total_width = mt->physical_width0;
 304
 305    if (mt->compressed)
 306        mt->total_width = ALIGN_NPOT(mt->total_width, bw);
 307
 308    /* May need to adjust width to accommodate the placement of
 309     * the 2nd mipmap.  This occurs when the alignment
 310     * constraints of mipmap placement push the right edge of the
 311     * 2nd mipmap out past the width of its parent.
 312     */
 313    if (mt->first_level != mt->last_level) {
 314        unsigned mip1_width;
 315
 316        if (mt->compressed) {
 317           mip1_width = ALIGN_NPOT(minify(mt->physical_width0, 1), mt->halign) +
 318              ALIGN_NPOT(minify(mt->physical_width0, 2), bw);
 319        } else {
 320           mip1_width = ALIGN_NPOT(minify(mt->physical_width0, 1), mt->halign) +
 321              minify(mt->physical_width0, 2);
 322        }
 323
 324        if (mip1_width > mt->total_width) {
 325            mt->total_width = mip1_width;
 326        }
 327    }
 328
 329    mt->total_width /= bw;
 330    mt->total_height = 0;
 331
 332    for (unsigned level = mt->first_level; level <= mt->last_level; level++) {
 333       unsigned img_height;
 334
 335       intel_miptree_set_level_info(mt, level, x, y, depth);
 336
 337       img_height = ALIGN_NPOT(height, mt->valign);
 338       if (mt->compressed)
 339          img_height /= bh;
 340
 341       if (mt->array_layout == ALL_SLICES_AT_EACH_LOD) {
 342          /* Compact arrays with separated miplevels */
 343          img_height *= depth;
 344       }
 345
 346       /* Because the images are packed better, the final offset
 347        * might not be the maximal one:
 348        */
 349       mt->total_height = MAX2(mt->total_height, y + img_height);
 350
 351       /* Layout_below: step right after second mipmap.
 352        */
 353       if (level == mt->first_level + 1) {
 354          x += ALIGN_NPOT(width, mt->halign) / bw;
 355       } else {
 356          y += img_height;
 357       }
 358
 359       width  = minify(width, 1);
 360       height = minify(height, 1);
 361
 362       if (mt->target == GL_TEXTURE_3D)
 363          depth = minify(depth, 1);
 364    }
 365 }
 366
 367 unsigned
 368 brw_miptree_get_horizontal_slice_pitch(const struct brw_context *brw,
 369                                        const struct intel_mipmap_tree *mt,
 370                                        unsigned level)
 371 {
 372    if ((brw->gen < 9 && mt->target == GL_TEXTURE_3D) ||
 373        (brw->gen == 4 && mt->target == GL_TEXTURE_CUBE_MAP)) {
 374       return ALIGN_NPOT(minify(mt->physical_width0, level), mt->halign);
 375    } else {
 376       return 0;
 377    }
 378 }
 379
 380 unsigned
 381 brw_miptree_get_vertical_slice_pitch(const struct brw_context *brw,
 382                                      const struct intel_mipmap_tree *mt,
 383                                      unsigned level)
 384 {
 385    if (brw->gen >= 9) {
 386       /* ALL_SLICES_AT_EACH_LOD isn't supported on Gen8+ but this code will
 387        * effectively end up with a packed qpitch anyway whenever
 388        * mt->first_level == mt->last_level.
 389        */
 390       assert(mt->array_layout != ALL_SLICES_AT_EACH_LOD);
 391
 392       /* On Gen9 we can pick whatever qpitch we like as long as it's aligned
 393        * to the vertical alignment so we don't need to add any extra rows.
 394        */
 395       unsigned qpitch = mt->total_height;
 396
 397       /* If the surface might be used as a stencil buffer or HiZ buffer then
 398        * it needs to be a multiple of 8.
 399        */
 400       const GLenum base_format = _mesa_get_format_base_format(mt->format);
 401       if (_mesa_is_depth_or_stencil_format(base_format))
 402          qpitch = ALIGN(qpitch, 8);
 403
 404       /* 3D textures need to be aligned to the tile height. At this point we
 405        * don't know which tiling will be used so let's just align it to 32
 406        */
 407       if (mt->target == GL_TEXTURE_3D)
 408          qpitch = ALIGN(qpitch, 32);
 409
 410       return qpitch;
 411
 412    } else if (mt->target == GL_TEXTURE_3D ||
 413               (brw->gen == 4 && mt->target == GL_TEXTURE_CUBE_MAP) ||
 414               mt->array_layout == ALL_SLICES_AT_EACH_LOD) {
 415       return ALIGN_NPOT(minify(mt->physical_height0, level), mt->valign);
 416
 417    } else {
 418       const unsigned h0 = ALIGN_NPOT(mt->physical_height0, mt->valign);
 419       const unsigned h1 = ALIGN_NPOT(minify(mt->physical_height0, 1), mt->valign);
 420
 421       return h0 + h1 + (brw->gen >= 7 ? 12 : 11) * mt->valign;
 422    }
 423 }
 424
 425 static void
 426 align_cube(struct intel_mipmap_tree *mt)
 427 {
 428    /* The 965's sampler lays cachelines out according to how accesses
 429     * in the texture surfaces run, so they may be "vertical" through
 430     * memory.  As a result, the docs say in Surface Padding Requirements:
 431     * Sampling Engine Surfaces that two extra rows of padding are required.
 432     */
 433    if (mt->target == GL_TEXTURE_CUBE_MAP)
 434       mt->total_height += 2;
 435 }
 436
 437 bool
 438 gen9_use_linear_1d_layout(const struct brw_context *brw,
 439                           const struct intel_mipmap_tree *mt)
 440 {
 441    /* On Gen9+ the mipmap levels of a 1D surface are all laid out in a
 442     * horizontal line. This isn't done for depth/stencil buffers however
 443     * because those will be using a tiled layout
 444     */
 445    if (brw->gen >= 9 &&
 446        (mt->target == GL_TEXTURE_1D ||
 447         mt->target == GL_TEXTURE_1D_ARRAY)) {
 448       GLenum base_format = _mesa_get_format_base_format(mt->format);
 449
 450       if (base_format != GL_DEPTH_COMPONENT &&
 451           base_format != GL_DEPTH_STENCIL &&
 452           base_format != GL_STENCIL_INDEX)
 453          return true;
 454    }
 455
 456    return false;
 457 }
 458
 459 static void
 460 brw_miptree_layout_texture_array(struct brw_context *brw,
 461                                  struct intel_mipmap_tree *mt)
 462 {
 463    unsigned height = mt->physical_height0;
 464    bool layout_1d = gen9_use_linear_1d_layout(brw, mt);
 465    int physical_qpitch;
 466
 467    if (layout_1d)
 468       gen9_miptree_layout_1d(mt);
 469    else
 470       brw_miptree_layout_2d(mt);
 471
 472    if (layout_1d) {
 473       physical_qpitch = 1;
 474       /* When using the horizontal layout the qpitch specifies the distance in
 475        * pixels between array slices. The total_width is forced to be a
 476        * multiple of the horizontal alignment in brw_miptree_layout_1d (in
 477        * this case it's always 64). The vertical alignment is ignored.
 478        */
 479       mt->qpitch = mt->total_width;
 480    } else {
 481       mt->qpitch = brw_miptree_get_vertical_slice_pitch(brw, mt, 0);
 482       /* Unlike previous generations the qpitch is a multiple of the
 483        * compressed block size on Gen9 so physical_qpitch matches mt->qpitch.
 484        */
 485       physical_qpitch = (mt->compressed && brw->gen < 9 ? mt->qpitch / 4 :
 486                          mt->qpitch);
 487    }
 488
 489    for (unsigned level = mt->first_level; level <= mt->last_level; level++) {
 490       unsigned img_height;
 491       img_height = ALIGN_NPOT(height, mt->valign);
 492       if (mt->compressed)
 493          img_height /= mt->valign;
 494
 495       for (unsigned q = 0; q < mt->level[level].depth; q++) {
 496          if (mt->array_layout == ALL_SLICES_AT_EACH_LOD) {
 497             intel_miptree_set_image_offset(mt, level, q, 0, q * img_height);
 498          } else {
 499             intel_miptree_set_image_offset(mt, level, q, 0, q * physical_qpitch);
 500          }
 501       }
 502       height = minify(height, 1);
 503    }
 504    if (mt->array_layout == ALL_LOD_IN_EACH_SLICE)
 505       mt->total_height = physical_qpitch * mt->physical_depth0;
 506
 507    align_cube(mt);
 508 }
 509
 510 static void
 511 brw_miptree_layout_texture_3d(struct brw_context *brw,
 512                               struct intel_mipmap_tree *mt)
 513 {
 514    mt->total_width = 0;
 515    mt->total_height = 0;
 516
 517    unsigned ysum = 0;
 518    unsigned bh, bw;
 519
 520    _mesa_get_format_block_size(mt->format, &bw, &bh);
 521
 522    for (unsigned level = mt->first_level; level <= mt->last_level; level++) {
 523       unsigned WL = MAX2(mt->physical_width0 >> level, 1);
 524       unsigned HL = MAX2(mt->physical_height0 >> level, 1);
 525       unsigned DL = MAX2(mt->physical_depth0 >> level, 1);
 526       unsigned wL = ALIGN_NPOT(WL, mt->halign);
 527       unsigned hL = ALIGN_NPOT(HL, mt->valign);
 528
 529       if (mt->target == GL_TEXTURE_CUBE_MAP)
 530          DL = 6;
 531
 532       intel_miptree_set_level_info(mt, level, 0, 0, DL);
 533
 534       for (unsigned q = 0; q < DL; q++) {
 535          unsigned x = (q % (1 << level)) * wL;
 536          unsigned y = ysum + (q >> level) * hL;
 537
 538          intel_miptree_set_image_offset(mt, level, q, x / bw, y / bh);
 539          mt->total_width = MAX2(mt->total_width, (x + wL) / bw);
 540          mt->total_height = MAX2(mt->total_height, (y + hL) / bh);
 541       }
 542
 543       ysum += ALIGN(DL, 1 << level) / (1 << level) * hL;
 544    }
 545
 546    align_cube(mt);
 547 }
 548
 549 /**
 550  * \brief Helper function for intel_miptree_create().
 551  */
 552 static uint32_t
 553 brw_miptree_choose_tiling(struct brw_context *brw,
 554                           const struct intel_mipmap_tree *mt,
 555                           uint32_t layout_flags)
 556 {
 557    if (mt->format == MESA_FORMAT_S_UINT8) {
 558       /* The stencil buffer is W tiled. However, we request from the kernel a
 559        * non-tiled buffer because the GTT is incapable of W fencing.
 560        */
 561       return I915_TILING_NONE;
 562    }
 563
 564    /* Do not support changing the tiling for miptrees with pre-allocated BOs. */
 565    assert((layout_flags & MIPTREE_LAYOUT_FOR_BO) == 0);
 566
 567    /* Some usages may want only one type of tiling, like depth miptrees (Y
 568     * tiled), or temporary BOs for uploading data once (linear).
 569     */
 570    switch (layout_flags & MIPTREE_LAYOUT_TILING_ANY) {
 571    case MIPTREE_LAYOUT_TILING_ANY:
 572       break;
 573    case MIPTREE_LAYOUT_TILING_Y:
 574       return I915_TILING_Y;
 575    case MIPTREE_LAYOUT_TILING_NONE:
 576       return I915_TILING_NONE;
 577    }
 578
 579    if (mt->num_samples > 1) {
 580       /* From p82 of the Sandy Bridge PRM, dw3[1] of SURFACE_STATE ("Tiled
 581        * Surface"):
 582        *
 583        *   [DevSNB+]: For multi-sample render targets, this field must be
 584        *   1. MSRTs can only be tiled.
 585        *
 586        * Our usual reason for preferring X tiling (fast blits using the
 587        * blitting engine) doesn't apply to MSAA, since we'll generally be
 588        * downsampling or upsampling when blitting between the MSAA buffer
 589        * and another buffer, and the blitting engine doesn't support that.
 590        * So use Y tiling, since it makes better use of the cache.
 591        */
 592       return I915_TILING_Y;
 593    }
 594
 595    GLenum base_format = _mesa_get_format_base_format(mt->format);
 596    if (base_format == GL_DEPTH_COMPONENT ||
 597        base_format == GL_DEPTH_STENCIL_EXT)
 598       return I915_TILING_Y;
 599
 600    /* 1D textures (and 1D array textures) don't get any benefit from tiling,
 601     * in fact it leads to a less efficient use of memory space and bandwidth
 602     * due to tile alignment.
 603     */
 604    if (mt->logical_height0 == 1)
 605       return I915_TILING_NONE;
 606
 607    int minimum_pitch = mt->total_width * mt->cpp;
 608
 609    /* If the width is much smaller than a tile, don't bother tiling. */
 610    if (minimum_pitch < 64)
 611       return I915_TILING_NONE;
 612
 613    if (ALIGN(minimum_pitch, 512) >= 32768) {
 614       perf_debug("%dx%d miptree too large to blit, falling back to untiled",
 615                  mt->total_width, mt->total_height);
 616       return I915_TILING_NONE;
 617    }
 618
 619    /* Pre-gen6 doesn't have BLORP to handle Y-tiling, so use X-tiling. */
 620    if (brw->gen < 6)
 621       return I915_TILING_X;
 622
 623    /* From the Sandybridge PRM, Volume 1, Part 2, page 32:
 624     * "NOTE: 128BPE Format Color Buffer ( render target ) MUST be either TileX
 625     *  or Linear."
 626     * 128 bits per pixel translates to 16 bytes per pixel. This is necessary
 627     * all the way back to 965, but is permitted on Gen7+.
 628     */
 629    if (brw->gen < 7 && mt->cpp >= 16)
 630       return I915_TILING_X;
 631
 632    /* From the Ivy Bridge PRM, Vol4 Part1 2.12.2.1 (SURFACE_STATE for most
 633     * messages), on p64, under the heading "Surface Vertical Alignment":
 634     *
 635     *     This field must be set to VALIGN_4 for all tiled Y Render Target
 636     *     surfaces.
 637     *
 638     * So if the surface is renderable and uses a vertical alignment of 2,
 639     * force it to be X tiled.  This is somewhat conservative (it's possible
 640     * that the client won't ever render to this surface), but it's difficult
 641     * to know that ahead of time.  And besides, since we use a vertical
 642     * alignment of 4 as often as we can, this shouldn't happen very often.
 643     */
 644    if (brw->gen == 7 && mt->valign == 2 &&
 645        brw->format_supported_as_render_target[mt->format]) {
 646       return I915_TILING_X;
 647    }
 648
 649    return I915_TILING_Y | I915_TILING_X;
 650 }
 651
 652 static void
 653 intel_miptree_set_total_width_height(struct brw_context *brw,
 654                                      struct intel_mipmap_tree *mt)
 655 {
 656    switch (mt->target) {
 657    case GL_TEXTURE_CUBE_MAP:
 658       if (brw->gen == 4) {
 659          /* Gen4 stores cube maps as 3D textures. */
 660          assert(mt->physical_depth0 == 6);
 661          brw_miptree_layout_texture_3d(brw, mt);
 662       } else {
 663          /* All other hardware stores cube maps as 2D arrays. */
 664          brw_miptree_layout_texture_array(brw, mt);
 665       }
 666       break;
 667
 668    case GL_TEXTURE_3D:
 669       if (brw->gen >= 9)
 670          brw_miptree_layout_texture_array(brw, mt);
 671       else
 672          brw_miptree_layout_texture_3d(brw, mt);
 673       break;
 674
 675    case GL_TEXTURE_1D_ARRAY:
 676    case GL_TEXTURE_2D_ARRAY:
 677    case GL_TEXTURE_2D_MULTISAMPLE_ARRAY:
 678    case GL_TEXTURE_CUBE_MAP_ARRAY:
 679       brw_miptree_layout_texture_array(brw, mt);
 680       break;
 681
 682    default:
 683       switch (mt->msaa_layout) {
 684       case INTEL_MSAA_LAYOUT_UMS:
 685       case INTEL_MSAA_LAYOUT_CMS:
 686          brw_miptree_layout_texture_array(brw, mt);
 687          break;
 688       case INTEL_MSAA_LAYOUT_NONE:
 689       case INTEL_MSAA_LAYOUT_IMS:
 690          if (gen9_use_linear_1d_layout(brw, mt))
 691             gen9_miptree_layout_1d(mt);
 692          else
 693             brw_miptree_layout_2d(mt);
 694          break;
 695       }
 696       break;
 697    }
 698
 699    DBG("%s: %dx%dx%d\n", __func__,
 700        mt->total_width, mt->total_height, mt->cpp);
 701 }
 702
 703 static void
 704 intel_miptree_set_alignment(struct brw_context *brw,
 705                             struct intel_mipmap_tree *mt,
 706                             uint32_t layout_flags)
 707 {
 708    /**
 709     * From the "Alignment Unit Size" section of various specs, namely:
 710     * - Gen3 Spec: "Memory Data Formats" Volume,         Section 1.20.1.4
 711     * - i965 and G45 PRMs:             Volume 1,         Section 6.17.3.4.
 712     * - Ironlake and Sandybridge PRMs: Volume 1, Part 1, Section 7.18.3.4
 713     * - BSpec (for Ivybridge and slight variations in separate stencil)
 714     */
 715    bool gen6_hiz_or_stencil = false;
 716
 717    if (brw->gen == 6 && mt->array_layout == ALL_SLICES_AT_EACH_LOD) {
 718       const GLenum base_format = _mesa_get_format_base_format(mt->format);
 719       gen6_hiz_or_stencil = _mesa_is_depth_or_stencil_format(base_format);
 720    }
 721
 722    if (gen6_hiz_or_stencil) {
 723       /* On gen6, we use ALL_SLICES_AT_EACH_LOD for stencil/hiz because the
 724        * hardware doesn't support multiple mip levels on stencil/hiz.
 725        *
 726        * PRM Vol 2, Part 1, 7.5.3 Hierarchical Depth Buffer:
 727        * "The hierarchical depth buffer does not support the LOD field"
 728        *
 729        * PRM Vol 2, Part 1, 7.5.4.1 Separate Stencil Buffer:
 730        * "The stencil depth buffer does not support the LOD field"
 731        */
 732       if (mt->format == MESA_FORMAT_S_UINT8) {
 733          /* Stencil uses W tiling, so we force W tiling alignment for the
 734           * ALL_SLICES_AT_EACH_LOD miptree layout.
 735           */
 736          mt->halign = 64;
 737          mt->valign = 64;
 738          assert((layout_flags & MIPTREE_LAYOUT_FORCE_HALIGN16) == 0);
 739       } else {
 740          /* Depth uses Y tiling, so we force need Y tiling alignment for the
 741           * ALL_SLICES_AT_EACH_LOD miptree layout.
 742           */
 743          mt->halign = 128 / mt->cpp;
 744          mt->valign = 32;
 745       }
 746    } else if (mt->compressed) {
 747        /* The hardware alignment requirements for compressed textures
 748         * happen to match the block boundaries.
 749         */
 750       _mesa_get_format_block_size(mt->format, &mt->halign, &mt->valign);
 751
 752       /* On Gen9+ we can pick our own alignment for compressed textures but it
 753        * has to be a multiple of the block size. The minimum alignment we can
 754        * pick is 4 so we effectively have to align to 4 times the block
 755        * size
 756        */
 757       if (brw->gen >= 9) {
 758          mt->halign *= 4;
 759          mt->valign *= 4;
 760       }
 761    } else if (mt->format == MESA_FORMAT_S_UINT8) {
 762       mt->halign = 8;
 763       mt->valign = brw->gen >= 7 ? 8 : 4;
 764    } else if (brw->gen >= 9 && mt->tr_mode != INTEL_MIPTREE_TRMODE_NONE) {
 765       mt->halign = tr_mode_horizontal_texture_alignment(mt);
 766       mt->valign = tr_mode_vertical_texture_alignment(mt);
 767    } else {
 768       mt->halign =
 769          intel_horizontal_texture_alignment_unit(brw, mt, layout_flags);
 770       mt->valign = intel_vertical_texture_alignment_unit(brw, mt);
 771    }
 772 }
 773
 774 void
 775 brw_miptree_layout(struct brw_context *brw,
 776                    struct intel_mipmap_tree *mt,
 777                    uint32_t layout_flags)
 778 {
 779    mt->tr_mode = INTEL_MIPTREE_TRMODE_NONE;
 780
 781    intel_miptree_set_alignment(brw, mt, layout_flags);
 782    intel_miptree_set_total_width_height(brw, mt);
 783
 784    if (!mt->total_width || !mt->total_height) {
 785       intel_miptree_release(&mt);
 786       return;
 787    }
 788
 789    /* On Gen9+ the alignment values are expressed in multiples of the block
 790     * size
 791     */
 792    if (brw->gen >= 9) {
 793       unsigned int i, j;
 794       _mesa_get_format_block_size(mt->format, &i, &j);
 795       mt->halign /= i;
 796       mt->valign /= j;
 797    }
 798
 799    if ((layout_flags & MIPTREE_LAYOUT_FOR_BO) == 0)
 800       mt->tiling = brw_miptree_choose_tiling(brw, mt, layout_flags);
 801 }
 802