* Rob Clark <robclark@freedesktop.org>
*/
+#include "drm-uapi/drm_fourcc.h"
+
#include "fd6_resource.h"
#include "fd6_format.h"
#include "a6xx.xml.h"
-/* indexed by cpp, including msaa 2x and 4x: */
-static const struct {
- unsigned pitchalign;
- unsigned heightalign;
-} tile_alignment[] = {
- [1] = { 128, 32 },
- [2] = { 64, 32 },
- [3] = { 64, 32 },
- [4] = { 64, 16 },
- [6] = { 64, 16 },
- [8] = { 64, 16 },
- [12] = { 64, 16 },
- [16] = { 64, 16 },
- [24] = { 64, 16 },
- [32] = { 64, 16 },
- [48] = { 64, 16 },
- [64] = { 64, 16 },
-
- /* special cases for r16: */
- [0] = { 128, 16 },
-};
-
-/* NOTE: good way to test this is: (for example)
- * piglit/bin/texelFetch fs sampler3D 100x100x8
- */
-static uint32_t
-setup_slices(struct fd_resource *rsc, uint32_t alignment, enum pipe_format format)
-{
- struct pipe_resource *prsc = &rsc->base;
- struct fd_screen *screen = fd_screen(prsc->screen);
- enum util_format_layout layout = util_format_description(format)->layout;
- uint32_t pitchalign = screen->gmem_alignw;
- uint32_t level, size = 0;
- uint32_t depth = prsc->depth0;
- /* linear dimensions: */
- uint32_t lwidth = prsc->width0;
- uint32_t lheight = prsc->height0;
- /* tile_mode dimensions: */
- uint32_t twidth = util_next_power_of_two(lwidth);
- uint32_t theight = util_next_power_of_two(lheight);
- /* in layer_first layout, the level (slice) contains just one
- * layer (since in fact the layer contains the slices)
- */
- uint32_t layers_in_level = rsc->layer_first ? 1 : prsc->array_size;
- int ta = rsc->cpp;
-
- /* The z16/r16 formats seem to not play by the normal tiling rules: */
- if ((rsc->cpp == 2) && (util_format_get_nr_components(format) == 1))
- ta = 0;
-
- debug_assert(ta < ARRAY_SIZE(tile_alignment));
- debug_assert(tile_alignment[ta].pitchalign);
-
- for (level = 0; level <= prsc->last_level; level++) {
- struct fd_resource_slice *slice = fd_resource_slice(rsc, level);
- bool linear_level = fd_resource_level_linear(prsc, level);
- uint32_t width, height;
-
- /* tiled levels of 3D textures are rounded up to PoT dimensions: */
- if ((prsc->target == PIPE_TEXTURE_3D) && rsc->tile_mode && !linear_level) {
- width = twidth;
- height = theight;
- } else {
- width = lwidth;
- height = lheight;
- }
- uint32_t aligned_height = height;
- uint32_t blocks;
-
- if (rsc->tile_mode && !linear_level) {
- pitchalign = tile_alignment[ta].pitchalign;
- aligned_height = align(aligned_height,
- tile_alignment[ta].heightalign);
- } else {
- pitchalign = 64;
- }
-
- /* The blits used for mem<->gmem work at a granularity of
- * 32x32, which can cause faults due to over-fetch on the
- * last level. The simple solution is to over-allocate a
- * bit the last level to ensure any over-fetch is harmless.
- * The pitch is already sufficiently aligned, but height
- * may not be:
- */
- if ((level == prsc->last_level) && (prsc->target != PIPE_BUFFER))
- aligned_height = align(aligned_height, 32);
-
- if (layout == UTIL_FORMAT_LAYOUT_ASTC)
- slice->pitch =
- util_align_npot(width, pitchalign * util_format_get_blockwidth(format));
- else
- slice->pitch = align(width, pitchalign);
-
- slice->offset = size;
- blocks = util_format_get_nblocks(format, slice->pitch, aligned_height);
-
- /* 1d array and 2d array textures must all have the same layer size
- * for each miplevel on a6xx. 3d textures can have different layer
- * sizes for high levels, but the hw auto-sizer is buggy (or at least
- * different than what this code does), so as soon as the layer size
- * range gets into range, we stop reducing it.
- */
- if (prsc->target == PIPE_TEXTURE_3D) {
- if (level < 1 || (rsc->slices[level - 1].size0 > 0xf000)) {
- slice->size0 = align(blocks * rsc->cpp, alignment);
- } else {
- slice->size0 = rsc->slices[level - 1].size0;
- }
- } else {
- slice->size0 = align(blocks * rsc->cpp, alignment);
- }
-
- size += slice->size0 * depth * layers_in_level;
-
-#if 0
- debug_printf("%s: %ux%ux%u@%u:\t%2u: stride=%4u, size=%6u,%7u, aligned_height=%3u, blocks=%u, offset=0x%x\n",
- util_format_name(prsc->format),
- width, height, depth, rsc->cpp,
- level, slice->pitch * rsc->cpp,
- slice->size0, size, aligned_height, blocks,
- slice->offset);
-#endif
-
- depth = u_minify(depth, 1);
- lwidth = u_minify(lwidth, 1);
- lheight = u_minify(lheight, 1);
- twidth = u_minify(twidth, 1);
- theight = u_minify(theight, 1);
- }
-
- return size;
-}
-
/* A subset of the valid tiled formats can be compressed. We do
* already require tiled in order to be compressed, but just because
* it can be tiled doesn't mean it can be compressed.
*/
static bool
-ok_ubwc_format(enum pipe_format pfmt)
+ok_ubwc_format(struct fd_resource *rsc, enum pipe_format pfmt)
{
/* NOTE: both x24s8 and z24s8 map to RB6_X8Z24_UNORM, but UBWC
* does not seem to work properly when sampling x24s8.. possibly
if (pfmt == PIPE_FORMAT_X24S8_UINT)
return false;
+ /* We don't fully understand what's going wrong with Z24_UNORM_S8_UINT on
+ * non-2D targets, but we haven't been able to make it work. It's enough
+ * of a corner-case that we can just disable UBWC for these resources.
+ */
+ if (rsc->base.target != PIPE_TEXTURE_2D &&
+ pfmt == PIPE_FORMAT_Z24_UNORM_S8_UINT)
+ return false;
+
switch (fd6_pipe2color(pfmt)) {
- case RB6_R10G10B10A2_UINT:
- case RB6_R10G10B10A2_UNORM:
- case RB6_R11G11B10_FLOAT:
- case RB6_R16_FLOAT:
- case RB6_R16G16B16A16_FLOAT:
- case RB6_R16G16B16A16_SINT:
- case RB6_R16G16B16A16_UINT:
- case RB6_R16G16_FLOAT:
- case RB6_R16G16_SINT:
- case RB6_R16G16_UINT:
- case RB6_R16_SINT:
- case RB6_R16_UINT:
- case RB6_R32G32B32A32_SINT:
- case RB6_R32G32B32A32_UINT:
- case RB6_R32G32_SINT:
- case RB6_R32G32_UINT:
- case RB6_R5G6B5_UNORM:
- case RB6_R8G8B8A8_SINT:
- case RB6_R8G8B8A8_UINT:
- case RB6_R8G8B8A8_UNORM:
- case RB6_R8G8B8_UNORM:
- case RB6_R8G8_SINT:
- case RB6_R8G8_UINT:
- case RB6_R8G8_UNORM:
- case RB6_Z24_UNORM_S8_UINT:
- case RB6_Z24_UNORM_S8_UINT_AS_R8G8B8A8:
+ case FMT6_10_10_10_2_UINT:
+ case FMT6_10_10_10_2_UNORM_DEST:
+ case FMT6_11_11_10_FLOAT:
+ case FMT6_16_FLOAT:
+ case FMT6_16_16_16_16_FLOAT:
+ case FMT6_16_16_16_16_SINT:
+ case FMT6_16_16_16_16_UINT:
+ case FMT6_16_16_FLOAT:
+ case FMT6_16_16_SINT:
+ case FMT6_16_16_UINT:
+ case FMT6_16_SINT:
+ case FMT6_16_UINT:
+ case FMT6_32_32_32_32_SINT:
+ case FMT6_32_32_32_32_UINT:
+ case FMT6_32_32_SINT:
+ case FMT6_32_32_UINT:
+ case FMT6_5_6_5_UNORM:
+ case FMT6_8_8_8_8_SINT:
+ case FMT6_8_8_8_8_UINT:
+ case FMT6_8_8_8_8_UNORM:
+ case FMT6_8_8_8_X8_UNORM:
+ case FMT6_8_8_SINT:
+ case FMT6_8_8_UINT:
+ case FMT6_8_8_UNORM:
+ case FMT6_Z24_UNORM_S8_UINT:
+ case FMT6_Z24_UNORM_S8_UINT_AS_R8G8B8A8:
return true;
default:
return false;
}
}
-uint32_t
-fd6_fill_ubwc_buffer_sizes(struct fd_resource *rsc)
-{
-#define RBG_TILE_WIDTH_ALIGNMENT 64
-#define RGB_TILE_HEIGHT_ALIGNMENT 16
-#define UBWC_PLANE_SIZE_ALIGNMENT 4096
-
- struct pipe_resource *prsc = &rsc->base;
- uint32_t width = prsc->width0;
- uint32_t height = prsc->height0;
-
- if (!ok_ubwc_format(prsc->format))
- return 0;
-
- /* limit things to simple single level 2d for now: */
- if ((prsc->depth0 != 1) || (prsc->array_size != 1) || (prsc->last_level != 0))
- return 0;
-
- uint32_t block_width, block_height;
- switch (rsc->cpp) {
- case 2:
- case 4:
- block_width = 16;
- block_height = 4;
- break;
- case 8:
- block_width = 8;
- block_height = 4;
- break;
- case 16:
- block_width = 4;
- block_height = 4;
- break;
- default:
- return 0;
- }
-
- uint32_t meta_stride =
- ALIGN_POT(DIV_ROUND_UP(width, block_width), RBG_TILE_WIDTH_ALIGNMENT);
- uint32_t meta_height =
- ALIGN_POT(DIV_ROUND_UP(height, block_height), RGB_TILE_HEIGHT_ALIGNMENT);
- uint32_t meta_size =
- ALIGN_POT(meta_stride * meta_height, UBWC_PLANE_SIZE_ALIGNMENT);
-
- /* UBWC goes first, then color data.. this constraint is mainly only
- * because it is what the kernel expects for scanout. For non-2D we
- * could just use a separate UBWC buffer..
- */
- rsc->ubwc_offset = 0;
- rsc->offset = meta_size;
- rsc->ubwc_pitch = meta_stride;
- rsc->ubwc_size = meta_size >> 2; /* in dwords??? */
- rsc->tile_mode = TILE6_3;
-
- return meta_size;
-}
-
/**
* Ensure the rsc is in an ok state to be used with the specified format.
* This handles the case of UBWC buffers used with non-UBWC compatible
fd6_validate_format(struct fd_context *ctx, struct fd_resource *rsc,
enum pipe_format format)
{
- if (!rsc->ubwc_size)
+ if (!rsc->layout.ubwc)
return;
- if (ok_ubwc_format(format))
+ if (ok_ubwc_format(rsc, format))
return;
fd_resource_uncompress(ctx, rsc);
}
-uint32_t
+static void /* Size and allocate the LRZ buffer for a resource.
+ *
+ * Starts from the resource's base width/height, scales them for 2x/4x
+ * multisampling, derives the LRZ pitch and height at one unit per 8 pixels
+ * in each dimension (aligned to 32 and 16 respectively), records the
+ * dimensions on rsc and allocates rsc->lrz with fd_bo_new().
+ *
+ * NOTE(review): the fd_bo_new() result is stored without being checked
+ * here -- confirm that users of rsc->lrz cope with a NULL buffer.
+ */
+setup_lrz(struct fd_resource *rsc)
+{
+ struct fd_screen *screen = fd_screen(rsc->base.screen);
+ const uint32_t flags = DRM_FREEDRENO_GEM_CACHE_WCOMBINE |
+ DRM_FREEDRENO_GEM_TYPE_KMEM; /* TODO */
+ unsigned width0 = rsc->base.width0;
+ unsigned height0 = rsc->base.height0;
+
+ /* LRZ buffer is super-sampled: 4x doubles both width and height (the
+ * case falls through into the 2x case), 2x doubles only the height, and
+ * any other sample count leaves the dimensions untouched.
+ */
+ switch (rsc->base.nr_samples) {
+ case 4:
+ width0 *= 2;
+ /* fallthru */
+ case 2:
+ height0 *= 2;
+ }
+
+ unsigned lrz_pitch = align(DIV_ROUND_UP(width0, 8), 32);
+ unsigned lrz_height = align(DIV_ROUND_UP(height0, 8), 16);
+
+ unsigned size = lrz_pitch * lrz_height * 2; /* presumably 2 bytes per LRZ entry -- TODO confirm */
+
+ rsc->lrz_height = lrz_height;
+ rsc->lrz_width = lrz_pitch; /* width is recorded as the aligned pitch, not the unaligned width */
+ rsc->lrz_pitch = lrz_pitch;
+ rsc->lrz = fd_bo_new(screen->dev, size, flags, "lrz");
+}
+
+static uint32_t /* Compute the memory layout of rsc and return its total size.
+ *
+ * Before laying out, this allocates the LRZ buffer for depth formats
+ * (unless FD_DBG_NOLRZ is set in fd_mesa_debug) and clears layout.ubwc
+ * when the resource's format fails ok_ubwc_format().
+ *
+ * Returns rsc->layout.size as it stands after fdl6_layout() has run.
+ */
fd6_setup_slices(struct fd_resource *rsc)
{
- uint32_t alignment;
+ struct pipe_resource *prsc = &rsc->base;
+
+ if (!(fd_mesa_debug & FD_DBG_NOLRZ) && has_depth(rsc->base.format))
+ setup_lrz(rsc);
+
+ if (rsc->layout.ubwc && !ok_ubwc_format(rsc, rsc->base.format))
+ rsc->layout.ubwc = false; /* requested UBWC is dropped for unsupported formats */
+
+ fdl6_layout(&rsc->layout, prsc->format, fd_resource_nr_samples(prsc),
+ prsc->width0, prsc->height0, prsc->depth0,
+ prsc->last_level + 1, prsc->array_size,
+ prsc->target == PIPE_TEXTURE_3D); /* last argument is true only for 3D textures */
+
+ return rsc->layout.size;
+}
- switch (rsc->base.target) {
- case PIPE_TEXTURE_3D:
- rsc->layer_first = false;
- alignment = 4096;
- break;
+static int /* Re-layout an existing resource as UBWC-compressed.
+ *
+ * Only single-level, non-array, depth-1 PIPE_TEXTURE_2D resources whose
+ * format passes ok_ubwc_format() are accepted. The slice 0 pitch/offset
+ * present on entry are saved; after fdl6_layout() recomputes the layout
+ * the new pitch must match the saved one, the saved offset is added to the
+ * color and UBWC slice offsets and to the total size, and the result must
+ * fit inside rsc->bo.
+ *
+ * Returns 0 on success, -1 if any check fails.
+ *
+ * NOTE(review): layout.ubwc and layout.tile_mode are set (and the layout
+ * is recomputed) before the pitch and size checks, so a -1 from those
+ * checks leaves rsc->layout modified -- confirm callers discard rsc on
+ * failure.
+ */
+fill_ubwc_buffer_sizes(struct fd_resource *rsc)
+{
+ struct pipe_resource *prsc = &rsc->base;
+ struct fdl_slice slice = *fd_resource_slice(rsc, 0); /* by-value copy of slice 0 as it was on entry */
+
+ /* limit things to simple single level 2d for now: */
+ if ((prsc->depth0 != 1) || (prsc->array_size != 1) || (prsc->last_level != 0))
+ return -1;
+ if (prsc->target != PIPE_TEXTURE_2D)
+ return -1;
+ if (!ok_ubwc_format(rsc, prsc->format))
+ return -1;
+
+ rsc->layout.ubwc = true;
+ rsc->layout.tile_mode = TILE6_3;
+
+ fdl6_layout(&rsc->layout, prsc->format, fd_resource_nr_samples(prsc),
+ prsc->width0, prsc->height0, prsc->depth0,
+ prsc->last_level + 1, prsc->array_size, false);
+
+ if (fd_resource_slice(rsc, 0)->pitch != slice.pitch) /* recomputed pitch must equal the pitch saved on entry */
+ return -1;
+
+ /* The imported buffer may specify an offset, add that in here. */
+ rsc->layout.slices[0].offset += slice.offset;
+ rsc->layout.ubwc_slices[0].offset += slice.offset;
+ rsc->layout.size += slice.offset;
+
+ if (rsc->layout.size > fd_bo_size(rsc->bo)) /* layout must fit in the existing buffer object */
+ return -1;
+
+ return 0;
+}
+
+static int /* Apply a DRM format modifier to the layout of rsc.
+ *
+ * DRM_FORMAT_MOD_QCOM_COMPRESSED defers to fill_ubwc_buffer_sizes();
+ * DRM_FORMAT_MOD_LINEAR and DRM_FORMAT_MOD_INVALID leave rsc untouched and
+ * succeed; every other modifier is rejected.
+ *
+ * Returns 0 on success, -1 on failure.
+ */
+fd6_layout_resource_for_modifier(struct fd_resource *rsc, uint64_t modifier)
+{
+ switch (modifier) {
+ case DRM_FORMAT_MOD_QCOM_COMPRESSED:
+ return fill_ubwc_buffer_sizes(rsc);
+ case DRM_FORMAT_MOD_LINEAR:
+ case DRM_FORMAT_MOD_INVALID:
+ return 0;
default:
- rsc->layer_first = true;
- alignment = 1;
- break;
+ return -1;
}
+}
+
+static const uint64_t supported_modifiers[] = { /* installed as screen->supported_modifiers by fd6_resource_screen_init() */
+ DRM_FORMAT_MOD_LINEAR,
+ DRM_FORMAT_MOD_QCOM_COMPRESSED,
+};
+
+void /* Hook the fd6 resource-layout callbacks into the screen.
+ *
+ * Sets the screen's setup_slices and layout_resource_for_modifier function
+ * pointers to the fd6 implementations and publishes the supported modifier
+ * table together with its element count.
+ */
+fd6_resource_screen_init(struct pipe_screen *pscreen)
+{
+ struct fd_screen *screen = fd_screen(pscreen);
- return setup_slices(rsc, alignment, rsc->base.format);
+ screen->setup_slices = fd6_setup_slices;
+ screen->layout_resource_for_modifier = fd6_layout_resource_for_modifier;
+ screen->supported_modifiers = supported_modifiers;
+ screen->num_supported_modifiers = ARRAY_SIZE(supported_modifiers);
}