anv: Don't delete fragment shaders that write sample mask

[mesa.git] / src / intel / isl / isl.c
diff --git a/src/intel/isl/isl.c b/src/intel/isl/isl.c

index eaaa28014a39c1312518c4f83107aeb1931bd8b4..7c0d3c4dacd65dbf3ec8b857f4325ca483db4f2f 100644 (file)
--- a/src/intel/isl/isl.c
+++ b/src/intel/isl/isl.c
@@ -33,6 +33,7 @@
  #include "isl_gen7.h"
  #include "isl_gen8.h"
  #include "isl_gen9.h"
+#include "isl_gen12.h"
  #include "isl_priv.h"
  
  void
@@ -122,7 +123,8 @@ isl_device_init(struct isl_device *dev,
     dev->ss.size = RENDER_SURFACE_STATE_length(info) * 4;
     dev->ss.align = isl_align(dev->ss.size, 32);
  
-   dev->ss.clear_color_state_size = CLEAR_COLOR_length(info) * 4;
+   dev->ss.clear_color_state_size =
+      isl_align(CLEAR_COLOR_length(info) * 4, 64);
     dev->ss.clear_color_state_offset =
        RENDER_SURFACE_STATE_ClearValueAddress_start(info) / 32 * 4;
  
@@ -309,6 +311,29 @@ isl_tiling_get_info(enum isl_tiling tiling,
        phys_B = isl_extent2d(128, 32);
        break;
  
+   case ISL_TILING_GEN12_CCS:
+      /* From the Bspec, Gen Graphics > Gen12 > Memory Data Formats > Memory
+       * Compression > Memory Compression - Gen12:
+       *
+       *    4 bits of auxiliary plane data are required for 2 cachelines of
+       *    main surface data. This results in a single cacheline of auxiliary
+       *    plane data mapping to 4 4K pages of main surface data for the 4K
+       *    pages (tile Y ) and 1 64K Tile Ys page.
+       *
+       * The Y-tiled pairing bit of 9 shown in the table below that Bspec
+       * section expresses that the 2 cachelines of main surface data are
+       * horizontally adjacent.
+       *
+       * TODO: Handle Ys, Yf and their pairing bits.
+       *
+       * Therefore, each CCS cacheline represents a 512Bx32 row area and each
+       * element represents a 32Bx4 row area.
+       */
+      assert(format_bpb == 4);
+      logical_el = isl_extent2d(16, 8);
+      phys_B = isl_extent2d(64, 1);
+      break;
+
     default:
        unreachable("not reached");
     } /* end switch */
@@ -382,15 +407,19 @@ isl_surf_choose_tiling(const struct isl_device *dev,
     if (info->usage & ISL_SURF_USAGE_HIZ_BIT) {
        assert(info->format == ISL_FORMAT_HIZ);
        assert(tiling_flags == ISL_TILING_HIZ_BIT);
-      *tiling = ISL_TILING_HIZ;
+      *tiling = isl_tiling_flag_to_enum(tiling_flags);
        return true;
     }
  
     /* CCS surfaces always use the CCS tiling */
     if (info->usage & ISL_SURF_USAGE_CCS_BIT) {
        assert(isl_format_get_layout(info->format)->txc == ISL_TXC_CCS);
-      assert(tiling_flags == ISL_TILING_CCS_BIT);
-      *tiling = ISL_TILING_CCS;
+      UNUSED bool ivb_ccs = ISL_DEV_GEN(dev) < 12 &&
+                            tiling_flags == ISL_TILING_CCS_BIT;
+      UNUSED bool tgl_ccs = ISL_DEV_GEN(dev) >= 12 &&
+                            tiling_flags == ISL_TILING_GEN12_CCS_BIT;
+      assert(ivb_ccs != tgl_ccs);
+      *tiling = isl_tiling_flag_to_enum(tiling_flags);
        return true;
     }
  
@@ -627,16 +656,25 @@ isl_choose_image_alignment_el(const struct isl_device *dev,
        if (ISL_DEV_GEN(dev) == 6) {
           /* HiZ surfaces on Sandy Bridge are packed tightly. */
           *image_align_el = isl_extent3d(1, 1, 1);
-      } else {
+      } else if (ISL_DEV_GEN(dev) < 12) {
           /* On gen7+, HiZ surfaces are always aligned to 16x8 pixels in the
            * primary surface which works out to 2x2 HiZ elments.
            */
           *image_align_el = isl_extent3d(2, 2, 1);
+      } else {
+         /* On gen12+, HiZ surfaces are always aligned to 16x16 pixels in the
+          * primary surface which works out to 2x4 HiZ elments.
+          * TODO: Verify
+          */
+         *image_align_el = isl_extent3d(2, 4, 1);
        }
        return;
     }
  
-   if (ISL_DEV_GEN(dev) >= 9) {
+   if (ISL_DEV_GEN(dev) >= 12) {
+      isl_gen12_choose_image_alignment_el(dev, info, tiling, dim_layout,
+                                          msaa_layout, image_align_el);
+   } else if (ISL_DEV_GEN(dev) >= 9) {
        isl_gen9_choose_image_alignment_el(dev, info, tiling, dim_layout,
                                           msaa_layout, image_align_el);
     } else if (ISL_DEV_GEN(dev) >= 8) {
@@ -716,7 +754,7 @@ isl_surf_choose_dim_layout(const struct isl_device *dev,
  
  /**
   * Calculate the physical extent of the surface's first level, in units of
- * surface samples. The result is aligned to the format's compression block.
+ * surface samples.
   */
  static void
  isl_calc_phys_level0_extent_sa(const struct isl_device *dev,
@@ -745,8 +783,8 @@ isl_calc_phys_level0_extent_sa(const struct isl_device *dev,
        case ISL_DIM_LAYOUT_GEN4_2D:
        case ISL_DIM_LAYOUT_GEN6_STENCIL_HIZ:
           *phys_level0_sa = (struct isl_extent4d) {
-            .w = isl_align_npot(info->width, fmtl->bw),
-            .h = fmtl->bh,
+            .w = info->width,
+            .h = 1,
              .d = 1,
              .a = info->array_len,
           };
@@ -770,8 +808,8 @@ isl_calc_phys_level0_extent_sa(const struct isl_device *dev,
           assert(info->samples == 1);
  
           *phys_level0_sa = (struct isl_extent4d) {
-            .w = isl_align_npot(info->width, fmtl->bw),
-            .h = isl_align_npot(info->height, fmtl->bh),
+            .w = info->width,
+            .h = info->height,
              .d = 1,
              .a = info->array_len,
           };
@@ -806,9 +844,6 @@ isl_calc_phys_level0_extent_sa(const struct isl_device *dev,
           isl_msaa_interleaved_scale_px_to_sa(info->samples,
                                               &phys_level0_sa->w,
                                               &phys_level0_sa->h);
-
-         phys_level0_sa->w = isl_align(phys_level0_sa->w, fmtl->bw);
-         phys_level0_sa->h = isl_align(phys_level0_sa->h, fmtl->bh);
           break;
        }
        break;
@@ -831,8 +866,8 @@ isl_calc_phys_level0_extent_sa(const struct isl_device *dev,
           assert(ISL_DEV_GEN(dev) >= 9);
  
           *phys_level0_sa = (struct isl_extent4d) {
-            .w = isl_align_npot(info->width, fmtl->bw),
-            .h = isl_align_npot(info->height, fmtl->bh),
+            .w = info->width,
+            .h = info->height,
              .d = 1,
              .a = info->depth,
           };
@@ -841,8 +876,8 @@ isl_calc_phys_level0_extent_sa(const struct isl_device *dev,
        case ISL_DIM_LAYOUT_GEN4_3D:
           assert(ISL_DEV_GEN(dev) < 9);
           *phys_level0_sa = (struct isl_extent4d) {
-            .w = isl_align(info->width, fmtl->bw),
-            .h = isl_align(info->height, fmtl->bh),
+            .w = info->width,
+            .h = info->height,
              .d = info->depth,
              .a = 1,
           };
@@ -917,7 +952,8 @@ isl_calc_array_pitch_el_rows_gen4_2d(
     assert(pitch_sa_rows % fmtl->bh == 0);
     uint32_t pitch_el_rows = pitch_sa_rows / fmtl->bh;
  
-   if (ISL_DEV_GEN(dev) >= 9 && fmtl->txc == ISL_TXC_CCS) {
+   if (ISL_DEV_GEN(dev) >= 9 && ISL_DEV_GEN(dev) <= 11 &&
+       fmtl->txc == ISL_TXC_CCS) {
        /*
         * From the Sky Lake PRM Vol 7, "MCS Buffer for Render Target(s)" (p. 632):
         *
@@ -935,6 +971,8 @@ isl_calc_array_pitch_el_rows_gen4_2d(
         * The first restriction is already handled by isl_choose_image_alignment_el
         * but the second restriction, which is an extension of the first, only
         * applies to qpitch and must be applied here.
+       *
+       * The second restriction disappears on Gen12.
         */
        assert(fmtl->bh == 4);
        pitch_el_rows = isl_align(pitch_el_rows, 256 / 4);
@@ -967,13 +1005,10 @@ isl_calc_phys_slice0_extent_sa_gen4_2d(
        const struct isl_extent4d *phys_level0_sa,
        struct isl_extent2d *phys_slice0_sa)
  {
-   const struct isl_format_layout *fmtl = isl_format_get_layout(info->format);
-
     assert(phys_level0_sa->depth == 1);
  
     if (info->levels == 1) {
-      /* Do not pad the surface to the image alignment. Instead, pad it only
-       * to the pixel format's block alignment.
+      /* Do not pad the surface to the image alignment.
         *
         * For tiled surfaces, using a reduced alignment here avoids wasting CPU
         * cycles on the below mipmap layout caluclations. Reducing the
@@ -988,8 +1023,8 @@ isl_calc_phys_slice0_extent_sa_gen4_2d(
         * VkBufferImageCopy::bufferRowLength.
         */
        *phys_slice0_sa = (struct isl_extent2d) {
-         .w = isl_align_npot(phys_level0_sa->w, fmtl->bw),
-         .h = isl_align_npot(phys_level0_sa->h, fmtl->bh),
+         .w = phys_level0_sa->w,
+         .h = phys_level0_sa->h,
        };
        return;
     }
@@ -1054,9 +1089,9 @@ isl_calc_phys_total_extent_el_gen4_2d(
                                             array_pitch_span,
                                             &phys_slice0_sa);
     *total_extent_el = (struct isl_extent2d) {
-      .w = isl_assert_div(phys_slice0_sa.w, fmtl->bw),
+      .w = isl_align_div_npot(phys_slice0_sa.w, fmtl->bw),
        .h = *array_pitch_el_rows * (phys_level0_sa->array_len - 1) +
-           isl_assert_div(phys_slice0_sa.h, fmtl->bh),
+           isl_align_div_npot(phys_slice0_sa.h, fmtl->bh),
     };
  }
  
@@ -1198,9 +1233,9 @@ isl_calc_phys_total_extent_el_gen9_1d(
        uint32_t *array_pitch_el_rows,
        struct isl_extent2d *phys_total_el)
  {
-   MAYBE_UNUSED const struct isl_format_layout *fmtl = isl_format_get_layout(info->format);
+   const struct isl_format_layout *fmtl = isl_format_get_layout(info->format);
  
-   assert(phys_level0_sa->height / fmtl->bh == 1);
+   assert(phys_level0_sa->height == 1);
     assert(phys_level0_sa->depth == 1);
     assert(info->samples == 1);
     assert(image_align_sa->w >= fmtl->bw);
@@ -1269,6 +1304,8 @@ isl_calc_phys_total_extent_el(const struct isl_device *dev,
                                              total_extent_el);
        return;
     }
+
+   unreachable("invalid value for dim_layout");
  }
  
  static uint32_t
@@ -1381,36 +1418,30 @@ isl_calc_row_pitch(const struct isl_device *dev,
     uint32_t alignment_B =
        isl_calc_row_pitch_alignment(surf_info, tile_info);
  
-   /* If pitch isn't given and it can be chosen freely, align it by cache line
-    * allowing one to use blit engine on the surface.
-    */
-   if (surf_info->row_pitch_B == 0 && tile_info->tiling == ISL_TILING_LINEAR) {
-      /* From the Broadwell PRM docs for XY_SRC_COPY_BLT::SourceBaseAddress:
-       *
-       *    "Base address of the destination surface: X=0, Y=0. Lower 32bits
-       *    of the 48bit addressing. When Src Tiling is enabled (Bit_15
-       *    enabled), this address must be 4KB-aligned. When Tiling is not
-       *    enabled, this address should be CL (64byte) aligned."
-       */
-      alignment_B = MAX2(alignment_B, 64);
-   }
-
     const uint32_t min_row_pitch_B =
        isl_calc_min_row_pitch(dev, surf_info, tile_info, phys_total_el,
                               alignment_B);
  
-   uint32_t row_pitch_B = min_row_pitch_B;
-
     if (surf_info->row_pitch_B != 0) {
-      row_pitch_B = surf_info->row_pitch_B;
-
-      if (row_pitch_B < min_row_pitch_B)
+      if (surf_info->row_pitch_B < min_row_pitch_B)
           return false;
  
-      if (row_pitch_B % alignment_B != 0)
+      if (surf_info->row_pitch_B % alignment_B != 0)
           return false;
     }
  
+   const uint32_t row_pitch_B =
+      surf_info->row_pitch_B != 0 ?
+         surf_info->row_pitch_B :
+      /* According to BSpec: 44930, Gen12's CCS-compressed surface pitches
+       * must be 512B-aligned.
+       */
+      ISL_DEV_GEN(dev) >= 12 &&
+      isl_format_supports_ccs_e(dev->info, surf_info->format) ?
+         isl_align(min_row_pitch_B, 512) :
+      /* Else */
+         min_row_pitch_B;
+
     const uint32_t row_pitch_tl = row_pitch_B / tile_info->phys_extent_B.width;
  
     if (row_pitch_B == 0)
@@ -1491,8 +1522,6 @@ isl_surf_init_s(const struct isl_device *dev,
     struct isl_extent4d phys_level0_sa;
     isl_calc_phys_level0_extent_sa(dev, info, dim_layout, tiling, msaa_layout,
                                    &phys_level0_sa);
-   assert(phys_level0_sa.w % fmtl->bw == 0);
-   assert(phys_level0_sa.h % fmtl->bh == 0);
  
     enum isl_array_pitch_span array_pitch_span =
        isl_choose_array_pitch_span(dev, info, dim_layout, &phys_level0_sa);
@@ -1533,6 +1562,14 @@ isl_surf_init_s(const struct isl_device *dev,
           }
        }
        base_alignment_B = isl_round_up_to_power_of_two(base_alignment_B);
+
+      /* From the Skylake PRM Vol 2c, PLANE_STRIDE::Stride:
+       *
+       *     "For Linear memory, this field specifies the stride in chunks of
+       *     64 bytes (1 cache line)."
+       */
+      if (isl_surf_usage_is_display(info->usage))
+         base_alignment_B = MAX(base_alignment_B, 64);
     } else {
        const uint32_t total_h_tl =
           isl_align_div(phys_total_el.h, tile_info.logical_extent_el.height);
@@ -1543,6 +1580,19 @@ isl_surf_init_s(const struct isl_device *dev,
                                     tile_info.phys_extent_B.height;
        assert(isl_is_pow2(info->min_alignment_B) && isl_is_pow2(tile_size_B));
        base_alignment_B = MAX(info->min_alignment_B, tile_size_B);
+
+      /* The diagram in the Bspec section Memory Compression - Gen12, shows
+       * that the CCS is indexed in 256B chunks. However, the
+       * PLANE_AUX_DIST::Auxiliary Surface Distance field is in units of 4K
+       * pages. We currently don't assign the usage field like we do for main
+       * surfaces, so just use 4K for now.
+       */
+      if (tiling == ISL_TILING_GEN12_CCS)
+         base_alignment_B = MAX(base_alignment_B, 4096);
+   }
+
+   if (ISL_DEV_GEN(dev) >= 12) {
+      base_alignment_B = MAX(base_alignment_B, 64 * 1024);
     }
  
     if (ISL_DEV_GEN(dev) < 9) {
@@ -1612,6 +1662,34 @@ isl_surf_get_hiz_surf(const struct isl_device *dev,
  {
     assert(ISL_DEV_GEN(dev) >= 5 && ISL_DEV_USE_SEPARATE_STENCIL(dev));
  
+   if (!isl_surf_usage_is_depth(surf->usage))
+      return false;
+
+   /* HiZ only works with Y-tiled depth buffers */
+   if (!isl_tiling_is_any_y(surf->tiling))
+      return false;
+
+   /* On SNB+, compressed depth buffers cannot be interleaved with stencil. */
+   switch (surf->format) {
+   case ISL_FORMAT_R24_UNORM_X8_TYPELESS:
+      if (isl_surf_usage_is_depth_and_stencil(surf->usage)) {
+         assert(ISL_DEV_GEN(dev) == 5);
+         unreachable("This should work, but is untested");
+      }
+      /* Fall through */
+   case ISL_FORMAT_R16_UNORM:
+   case ISL_FORMAT_R32_FLOAT:
+      break;
+   case ISL_FORMAT_R32_FLOAT_X8X24_TYPELESS:
+      if (ISL_DEV_GEN(dev) == 5) {
+         assert(isl_surf_usage_is_depth_and_stencil(surf->usage));
+         unreachable("This should work, but is untested");
+      }
+      /* Fall through */
+   default:
+      return false;
+   }
+
     /* Multisampled depth is always interleaved */
     assert(surf->msaa_layout == ISL_MSAA_LAYOUT_NONE ||
            surf->msaa_layout == ISL_MSAA_LAYOUT_INTERLEAVED);
@@ -1691,16 +1769,33 @@ isl_surf_get_mcs_surf(const struct isl_device *dev,
                        const struct isl_surf *surf,
                        struct isl_surf *mcs_surf)
  {
-   assert(ISL_DEV_GEN(dev) >= 7);
-
     /* It must be multisampled with an array layout */
-   assert(surf->samples > 1 && surf->msaa_layout == ISL_MSAA_LAYOUT_ARRAY);
+   if (surf->msaa_layout != ISL_MSAA_LAYOUT_ARRAY)
+      return false;
+
+   if (mcs_surf->size_B > 0)
+      return false;
  
     /* The following are true of all multisampled surfaces */
+   assert(surf->samples > 1);
     assert(surf->dim == ISL_SURF_DIM_2D);
     assert(surf->levels == 1);
     assert(surf->logical_level0_px.depth == 1);
  
+   /* From the Ivy Bridge PRM, Vol4 Part1 p77 ("MCS Enable"):
+    *
+    *   This field must be set to 0 for all SINT MSRTs when all RT channels
+    *   are not written
+    *
+    * In practice this means that we have to disable MCS for all signed
+    * integer MSAA buffers.  The alternative, to disable MCS only when one
+    * of the render target channels is disabled, is impractical because it
+    * would require converting between CMS and UMS MSAA layouts on the fly,
+    * which is expensive.
+    */
+   if (ISL_DEV_GEN(dev) == 7 && isl_format_has_sint_channel(surf->format))
+      return false;
+
     /* The "Auxiliary Surface Pitch" field in RENDER_SURFACE_STATE is only 9
      * bits which means the maximum pitch of a compression surface is 512
      * tiles or 64KB (since MCS is always Y-tiled).  Since a 16x MCS buffer is
@@ -1737,15 +1832,49 @@ isl_surf_get_mcs_surf(const struct isl_device *dev,
  bool
  isl_surf_get_ccs_surf(const struct isl_device *dev,
                        const struct isl_surf *surf,
-                      struct isl_surf *ccs_surf,
+                      struct isl_surf *aux_surf,
+                      struct isl_surf *extra_aux_surf,
                        uint32_t row_pitch_B)
  {
-   assert(surf->samples == 1 && surf->msaa_layout == ISL_MSAA_LAYOUT_NONE);
-   assert(ISL_DEV_GEN(dev) >= 7);
+   assert(aux_surf);
+
+   /* An uninitialized surface is needed to get a CCS surface. */
+   if (aux_surf->size_B > 0 &&
+       (extra_aux_surf == NULL || extra_aux_surf->size_B > 0)) {
+      return false;
+   }
+
+   /* A surface can't have two CCS surfaces. */
+   if (aux_surf->usage & ISL_SURF_USAGE_CCS_BIT)
+      return false;
+
+   if (ISL_DEV_GEN(dev) < 12 && surf->samples > 1)
+      return false;
+
+   /* CCS support does not exist prior to Gen7 */
+   if (ISL_DEV_GEN(dev) <= 6)
+      return false;
  
     if (surf->usage & ISL_SURF_USAGE_DISABLE_AUX_BIT)
        return false;
  
+   /* Allow CCS for single-sampled stencil buffers Gen12+. */
+   if (isl_surf_usage_is_stencil(surf->usage) &&
+       (ISL_DEV_GEN(dev) < 12 || surf->samples > 1))
+      return false;
+
+   /* [TGL+] CCS can only be added to a non-D16-formatted depth buffer if it
+    * has HiZ. If not for GEN:BUG:1406512483 "deprecate compression enable
+    * states", D16 would be supported. Supporting D16 requires being able to
+    * specify that the control surface is present and simultaneously disabling
+    * compression. The above bug makes it so that it's not possible to specify
+    * this configuration.
+    */
+   if (isl_surf_usage_is_depth(surf->usage) && (aux_surf->size_B == 0 ||
+       ISL_DEV_GEN(dev) < 12 || surf->format == ISL_FORMAT_R16_UNORM)) {
+      return false;
+   }
+
     /* The PRM doesn't say this explicitly, but fast-clears don't appear to
      * work for 3D textures until gen9 where the layout of 3D textures changes
      * to match 2D array textures.
@@ -1770,13 +1899,66 @@ isl_surf_get_ccs_surf(const struct isl_device *dev,
         (surf->levels > 1 || surf->logical_level0_px.array_len > 1))
        return false;
  
+   /* On Gen12, 8BPP surfaces cannot be compressed if any level is not
+    * 32Bx4row-aligned. For now, just reject the cases where alignment
+    * matters.
+    */
+   if (ISL_DEV_GEN(dev) >= 12 &&
+       isl_format_get_layout(surf->format)->bpb == 8 && surf->levels >= 3) {
+      isl_finishme("%s:%s: CCS for 8BPP textures with 3+ miplevels is "
+                   "disabled, but support for more levels is possible.",
+                   __FILE__, __func__);
+      return false;
+   }
+
+   /* On Gen12, all CCS-compressed surface pitches must be multiples of 512B.
+    */
+   if (ISL_DEV_GEN(dev) >= 12 && surf->row_pitch_B % 512 != 0)
+      return false;
+
     if (isl_format_is_compressed(surf->format))
        return false;
  
+   /* According to GEN:BUG:1406738321, 3D textures need a blit to a new
+    * surface in order to perform a resolve. For now, just disable CCS.
+    */
+   if (ISL_DEV_GEN(dev) >= 12 && surf->dim == ISL_SURF_DIM_3D) {
+      isl_finishme("%s:%s: CCS for 3D textures is disabled, but a workaround"
+                   " is available.", __FILE__, __func__);
+      return false;
+   }
+
     /* TODO: More conditions where it can fail. */
  
+   /* From the Ivy Bridge PRM, Vol2 Part1 11.7 "MCS Buffer for Render
+    * Target(s)", beneath the "Fast Color Clear" bullet (p326):
+    *
+    *     - Support is limited to tiled render targets.
+    *     - MCS buffer for non-MSRT is supported only for RT formats 32bpp,
+    *       64bpp, and 128bpp.
+    *
+    * From the Skylake documentation, it is made clear that X-tiling is no
+    * longer supported:
+    *
+    *     - MCS and Lossless compression is supported for
+    *     TiledY/TileYs/TileYf non-MSRTs only.
+    */
     enum isl_format ccs_format;
-   if (ISL_DEV_GEN(dev) >= 9) {
+   if (ISL_DEV_GEN(dev) >= 12) {
+      /* TODO: Handle the other tiling formats */
+      if (surf->tiling != ISL_TILING_Y0)
+         return false;
+
+      switch (isl_format_get_layout(surf->format)->bpb) {
+      case 8:     ccs_format = ISL_FORMAT_GEN12_CCS_8BPP_Y0;    break;
+      case 16:    ccs_format = ISL_FORMAT_GEN12_CCS_16BPP_Y0;   break;
+      case 32:    ccs_format = ISL_FORMAT_GEN12_CCS_32BPP_Y0;   break;
+      case 64:    ccs_format = ISL_FORMAT_GEN12_CCS_64BPP_Y0;   break;
+      case 128:   ccs_format = ISL_FORMAT_GEN12_CCS_128BPP_Y0;  break;
+      default:
+         return false;
+      }
+   } else if (ISL_DEV_GEN(dev) >= 9) {
        if (!isl_tiling_is_any_y(surf->tiling))
           return false;
  
@@ -1807,18 +1989,41 @@ isl_surf_get_ccs_surf(const struct isl_device *dev,
        return false;
     }
  
-   return isl_surf_init(dev, ccs_surf,
-                        .dim = surf->dim,
-                        .format = ccs_format,
-                        .width = surf->logical_level0_px.width,
-                        .height = surf->logical_level0_px.height,
-                        .depth = surf->logical_level0_px.depth,
-                        .levels = surf->levels,
-                        .array_len = surf->logical_level0_px.array_len,
-                        .samples = 1,
-                        .row_pitch_B = row_pitch_B,
-                        .usage = ISL_SURF_USAGE_CCS_BIT,
-                        .tiling_flags = ISL_TILING_CCS_BIT);
+   if (ISL_DEV_GEN(dev) >= 12) {
+      /* On Gen12, the CCS is a scaled-down version of the main surface. We
+       * model this as the CCS compressing a 2D-view of the entire surface.
+       */
+      struct isl_surf *ccs_surf =
+         aux_surf->size_B > 0 ? extra_aux_surf : aux_surf;
+      const bool ok =
+         isl_surf_init(dev, ccs_surf,
+                       .dim = ISL_SURF_DIM_2D,
+                       .format = ccs_format,
+                       .width = isl_surf_get_row_pitch_el(surf),
+                       .height = surf->size_B / surf->row_pitch_B,
+                       .depth = 1,
+                       .levels = 1,
+                       .array_len = 1,
+                       .samples = 1,
+                       .row_pitch_B = row_pitch_B,
+                       .usage = ISL_SURF_USAGE_CCS_BIT,
+                       .tiling_flags = ISL_TILING_GEN12_CCS_BIT);
+      assert(!ok || ccs_surf->size_B == surf->size_B / 256);
+      return ok;
+   } else {
+      return isl_surf_init(dev, aux_surf,
+                           .dim = surf->dim,
+                           .format = ccs_format,
+                           .width = surf->logical_level0_px.width,
+                           .height = surf->logical_level0_px.height,
+                           .depth = surf->logical_level0_px.depth,
+                           .levels = surf->levels,
+                           .array_len = surf->logical_level0_px.array_len,
+                           .samples = 1,
+                           .row_pitch_B = row_pitch_B,
+                           .usage = ISL_SURF_USAGE_CCS_BIT,
+                           .tiling_flags = ISL_TILING_CCS_BIT);
+   }
  }
  
  #define isl_genX_call(dev, func, ...)              \
@@ -1856,6 +2061,9 @@ isl_surf_get_ccs_surf(const struct isl_device *dev,
     case 11:                                        \
        isl_gen11_##func(__VA_ARGS__);               \
        break;                                       \
+   case 12:                                        \
+      isl_gen12_##func(__VA_ARGS__);               \
+      break;                                       \
     default:                                        \
        assert(!"Unknown hardware generation");      \
     }
@@ -2374,6 +2582,16 @@ isl_surf_get_depth_format(const struct isl_device *dev,
     }
  }
  
+bool
+isl_surf_supports_hiz_ccs_wt(const struct gen_device_info *dev,
+                             const struct isl_surf *surf,
+                             enum isl_aux_usage aux_usage)
+{
+   return aux_usage == ISL_AUX_USAGE_HIZ_CCS &&
+          surf->samples == 1 &&
+          surf->usage & ISL_SURF_USAGE_TEXTURE_BIT;
+}
+
  bool
  isl_swizzle_supports_rendering(const struct gen_device_info *devinfo,
                                 struct isl_swizzle swizzle)