gallium: implement get_device_vendor() for existing drivers
[mesa.git] / src / gallium / drivers / radeon / r600_texture.c
index 8eb48678f07f5696cde64821a9f8bc0856675f92..ab8ce7bd7136d9be8d0f6cd2173dc4c3b6c70ce5 100644 (file)
@@ -80,12 +80,8 @@ static void r600_copy_to_staging_texture(struct pipe_context *ctx, struct r600_t
                return;
        }
 
-       if (!rctx->dma_copy(ctx, dst, 0, 0, 0, 0,
-                             src, transfer->level,
-                             &transfer->box)) {
-               ctx->resource_copy_region(ctx, dst, 0, 0, 0, 0,
-                                         src, transfer->level, &transfer->box);
-       }
+       rctx->dma_copy(ctx, dst, 0, 0, 0, 0, src, transfer->level,
+                      &transfer->box);
 }
 
 /* Copy from a transfer's staging texture to a full GPU one. */
@@ -106,13 +102,9 @@ static void r600_copy_from_staging_texture(struct pipe_context *ctx, struct r600
                return;
        }
 
-       if (!rctx->dma_copy(ctx, dst, transfer->level,
-                             transfer->box.x, transfer->box.y, transfer->box.z,
-                             src, 0, &sbox)) {
-               ctx->resource_copy_region(ctx, dst, transfer->level,
-                                         transfer->box.x, transfer->box.y, transfer->box.z,
-                                         src, 0, &sbox);
-       }
+       rctx->dma_copy(ctx, dst, transfer->level,
+                      transfer->box.x, transfer->box.y, transfer->box.z,
+                      src, 0, &sbox);
 }
 
 static unsigned r600_texture_get_offset(struct r600_texture *rtex, unsigned level,
@@ -297,6 +289,12 @@ void r600_texture_get_fmask_info(struct r600_common_screen *rscreen,
        fmask.nsamples = 1;
        fmask.flags |= RADEON_SURF_FMASK;
 
+       /* Force 2D tiling if it wasn't set. This may occur when creating
+        * FMASK for MSAA resolve on R6xx. On R6xx, the single-sample
+        * destination buffer must have an FMASK too. */
+       fmask.flags = RADEON_SURF_CLR(fmask.flags, MODE);
+       fmask.flags |= RADEON_SURF_SET(RADEON_SURF_MODE_2D, MODE);
+
        if (rscreen->chip_class >= SI) {
                fmask.flags |= RADEON_SURF_HAS_TILE_MODE_INDEX;
        }
@@ -382,7 +380,8 @@ void r600_texture_get_cmask_info(struct r600_common_screen *rscreen,
 
        out->slice_tile_max = ((pitch_elements * height) / (128*128)) - 1;
        out->alignment = MAX2(256, base_align);
-       out->size = rtex->surface.array_size * align(slice_bytes, base_align);
+       out->size = (util_max_layer(&rtex->resource.b.b, 0) + 1) *
+                   align(slice_bytes, base_align);
 }
 
 static void si_texture_get_cmask_info(struct r600_common_screen *rscreen,
@@ -429,7 +428,8 @@ static void si_texture_get_cmask_info(struct r600_common_screen *rscreen,
                out->slice_tile_max -= 1;
 
        out->alignment = MAX2(256, base_align);
-       out->size = rtex->surface.array_size * align(slice_bytes, base_align);
+       out->size = (util_max_layer(&rtex->resource.b.b, 0) + 1) *
+                   align(slice_bytes, base_align);
 }
 
 static void r600_texture_allocate_cmask(struct r600_common_screen *rscreen,
@@ -473,8 +473,7 @@ static void r600_texture_alloc_cmask_separate(struct r600_common_screen *rscreen
        }
 
        /* update colorbuffer state bits */
-       rtex->cmask.base_address_reg =
-               r600_resource_va(&rscreen->b, &rtex->cmask_buffer->b.b) >> 8;
+       rtex->cmask.base_address_reg = rtex->cmask_buffer->gpu_address >> 8;
 
        if (rscreen->chip_class >= SI)
                rtex->cb_color_info |= SI_S_028C70_FAST_CLEAR(1);
@@ -482,19 +481,34 @@ static void r600_texture_alloc_cmask_separate(struct r600_common_screen *rscreen
                rtex->cb_color_info |= EG_S_028C70_FAST_CLEAR(1);
 }
 
-static unsigned si_texture_htile_alloc_size(struct r600_common_screen *rscreen,
+static unsigned r600_texture_get_htile_size(struct r600_common_screen *rscreen,
                                            struct r600_texture *rtex)
 {
        unsigned cl_width, cl_height, width, height;
        unsigned slice_elements, slice_bytes, pipe_interleave_bytes, base_align;
        unsigned num_pipes = rscreen->tiling_info.num_channels;
 
-       /* HTILE doesn't work with 1D tiling (there's massive corruption
-        * in glxgears). */
-       if (rtex->surface.level[0].mode != RADEON_SURF_MODE_2D)
+       if (rscreen->chip_class <= EVERGREEN &&
+           rscreen->info.drm_minor < 26)
+               return 0;
+
+       /* HW bug on R6xx. */
+       if (rscreen->chip_class == R600 &&
+           (rtex->surface.level[0].npix_x > 7680 ||
+            rtex->surface.level[0].npix_y > 7680))
+               return 0;
+
+       /* HTILE is broken with 1D tiling on old kernels and CIK. */
+       if (rscreen->chip_class >= CIK &&
+           rtex->surface.level[0].mode == RADEON_SURF_MODE_1D &&
+           rscreen->info.drm_minor < 38)
                return 0;
 
        switch (num_pipes) {
+       case 1:
+               cl_width = 32;
+               cl_height = 16;
+               break;
        case 2:
                cl_width = 32;
                cl_height = 32;
@@ -525,48 +539,18 @@ static unsigned si_texture_htile_alloc_size(struct r600_common_screen *rscreen,
        pipe_interleave_bytes = rscreen->tiling_info.group_bytes;
        base_align = num_pipes * pipe_interleave_bytes;
 
-       return rtex->surface.array_size * align(slice_bytes, base_align);
-}
-
-static unsigned r600_texture_htile_alloc_size(struct r600_common_screen *rscreen,
-                                             struct r600_texture *rtex)
-{
-       unsigned sw = rtex->surface.level[0].nblk_x * rtex->surface.blk_w;
-       unsigned sh = rtex->surface.level[0].nblk_y * rtex->surface.blk_h;
-       unsigned npipes = rscreen->info.r600_num_tile_pipes;
-       unsigned htile_size;
-
-       /* XXX also use it for other texture targets */
-       if (rscreen->info.drm_minor < 26 ||
-           rtex->resource.b.b.target != PIPE_TEXTURE_2D ||
-           rtex->surface.level[0].nblk_x < 32 ||
-           rtex->surface.level[0].nblk_y < 32) {
-               return 0;
-       }
-
-       /* this alignment and htile size only apply to linear htile buffer */
-       sw = align(sw, 16 << 3);
-       sh = align(sh, npipes << 3);
-       htile_size = (sw >> 3) * (sh >> 3) * 4;
-       /* must be aligned with 2K * npipes */
-       htile_size = align(htile_size, (2 << 10) * npipes);
-       return htile_size;
+       return (util_max_layer(&rtex->resource.b.b, 0) + 1) *
+               align(slice_bytes, base_align);
 }
 
 static void r600_texture_allocate_htile(struct r600_common_screen *rscreen,
                                        struct r600_texture *rtex)
 {
-       unsigned htile_size;
-       if (rscreen->chip_class >= SI) {
-               htile_size = si_texture_htile_alloc_size(rscreen, rtex);
-       } else {
-               htile_size = r600_texture_htile_alloc_size(rscreen, rtex);
-       }
+       unsigned htile_size = r600_texture_get_htile_size(rscreen, rtex);
 
        if (!htile_size)
                return;
 
-       /* XXX don't allocate it separately */
        rtex->htile_buffer = (struct r600_resource*)
                             pipe_buffer_create(&rscreen->b, PIPE_BIND_CUSTOM,
                                                PIPE_USAGE_DEFAULT, htile_size);
@@ -575,7 +559,8 @@ static void r600_texture_allocate_htile(struct r600_common_screen *rscreen,
                 * without htile buffer */
                R600_ERR("Failed to create buffer object for htile buffer.\n");
        } else {
-               r600_screen_clear_buffer(rscreen, &rtex->htile_buffer->b.b, 0, htile_size, 0);
+               r600_screen_clear_buffer(rscreen, &rtex->htile_buffer->b.b, 0,
+                                        htile_size, 0, true);
        }
 }
 
@@ -590,7 +575,6 @@ r600_texture_create_object(struct pipe_screen *screen,
        struct r600_texture *rtex;
        struct r600_resource *resource;
        struct r600_common_screen *rscreen = (struct r600_common_screen*)screen;
-       uint64_t va;
 
        rtex = CALLOC_STRUCT(r600_texture);
        if (rtex == NULL)
@@ -620,7 +604,7 @@ r600_texture_create_object(struct pipe_screen *screen,
        if (rtex->is_depth) {
                if (!(base->flags & (R600_RESOURCE_FLAG_TRANSFER |
                                     R600_RESOURCE_FLAG_FLUSHED_DEPTH)) &&
-                   (rscreen->debug_flags & DBG_HYPERZ)) {
+                   !(rscreen->debug_flags & DBG_NO_HYPERZ)) {
 
                        r600_texture_allocate_htile(rscreen, rtex);
                }
@@ -641,30 +625,32 @@ r600_texture_create_object(struct pipe_screen *screen,
        /* Now create the backing buffer. */
        if (!buf) {
                if (!r600_init_resource(rscreen, resource, rtex->size,
-                                       rtex->surface.bo_alignment, FALSE)) {
+                                       rtex->surface.bo_alignment, TRUE)) {
                        FREE(rtex);
                        return NULL;
                }
        } else {
                resource->buf = buf;
                resource->cs_buf = rscreen->ws->buffer_get_cs_handle(buf);
-               resource->domains = RADEON_DOMAIN_GTT | RADEON_DOMAIN_VRAM;
+               resource->gpu_address = rscreen->ws->buffer_get_virtual_address(resource->cs_buf);
+               resource->domains = rscreen->ws->buffer_get_initial_domain(resource->cs_buf);
        }
 
        if (rtex->cmask.size) {
                /* Initialize the cmask to 0xCC (= compressed state). */
                r600_screen_clear_buffer(rscreen, &rtex->cmask_buffer->b.b,
-                                        rtex->cmask.offset, rtex->cmask.size, 0xCCCCCCCC);
+                                        rtex->cmask.offset, rtex->cmask.size,
+                                        0xCCCCCCCC, true);
        }
 
        /* Initialize the CMASK base register value. */
-       va = r600_resource_va(&rscreen->b, &rtex->resource.b.b);
-       rtex->cmask.base_address_reg = (va + rtex->cmask.offset) >> 8;
+       rtex->cmask.base_address_reg =
+               (rtex->resource.gpu_address + rtex->cmask.offset) >> 8;
 
        if (rscreen->debug_flags & DBG_VM) {
-               fprintf(stderr, "VM start=0x%"PRIu64"  end=0x%"PRIu64" | Texture %ix%ix%i, %i levels, %i samples, %s\n",
-                       r600_resource_va(screen, &rtex->resource.b.b),
-                       r600_resource_va(screen, &rtex->resource.b.b) + rtex->resource.buf->size,
+               fprintf(stderr, "VM start=0x%"PRIX64"  end=0x%"PRIX64" | Texture %ix%ix%i, %i levels, %i samples, %s\n",
+                       rtex->resource.gpu_address,
+                       rtex->resource.gpu_address + rtex->resource.buf->size,
                        base->width0, base->height0, util_max_layer(base, 0)+1, base->last_level+1,
                        base->nr_samples ? base->nr_samples : 1, util_format_short_name(base->format));
        }
@@ -733,9 +719,15 @@ static unsigned r600_choose_tiling(struct r600_common_screen *rscreen,
         * Compressed textures must always be tiled. */
        if (!(templ->flags & R600_RESOURCE_FLAG_FORCE_TILING) &&
            !util_format_is_compressed(templ->format)) {
-               /* Tiling doesn't work with the 422 (SUBSAMPLED) formats on R600-Cayman. */
-               if (rscreen->chip_class <= CAYMAN &&
-                   desc->layout == UTIL_FORMAT_LAYOUT_SUBSAMPLED)
+               /* Not everything can be linear, so we cannot enforce it
+                * for all textures. */
+               if ((rscreen->debug_flags & DBG_NO_TILING) &&
+                   (!util_format_is_depth_or_stencil(templ->format) ||
+                    !(templ->flags & R600_RESOURCE_FLAG_FLUSHED_DEPTH)))
+                       return RADEON_SURF_MODE_LINEAR_ALIGNED;
+
+               /* Tiling doesn't work with the 422 (SUBSAMPLED) formats on R600+. */
+               if (desc->layout == UTIL_FORMAT_LAYOUT_SUBSAMPLED)
                        return RADEON_SURF_MODE_LINEAR_ALIGNED;
 
                /* Cursors are linear on SI.
@@ -760,7 +752,8 @@ static unsigned r600_choose_tiling(struct r600_common_screen *rscreen,
        }
 
        /* Make small textures 1D tiled. */
-       if (templ->width0 <= 16 || templ->height0 <= 16)
+       if (templ->width0 <= 16 || templ->height0 <= 16 ||
+           (rscreen->debug_flags & DBG_NO_2D_TILING))
                return RADEON_SURF_MODE_1D;
 
        /* The allocator will switch to 1D if needed. */
@@ -933,19 +926,16 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
         * the CPU is much happier reading out of cached system memory
         * than uncached VRAM.
         */
-       if (rtex->surface.level[level].mode >= RADEON_SURF_MODE_1D)
+       if (rtex->surface.level[0].mode >= RADEON_SURF_MODE_1D) {
                use_staging_texture = TRUE;
-
-       /* Untiled buffers in VRAM, which is slow for CPU reads and writes */
-       if (!(usage & PIPE_TRANSFER_MAP_DIRECTLY) &&
+       } else if ((usage & PIPE_TRANSFER_READ) && !(usage & PIPE_TRANSFER_MAP_DIRECTLY) &&
            (rtex->resource.domains == RADEON_DOMAIN_VRAM)) {
+               /* Untiled buffers in VRAM, which is slow for CPU reads */
                use_staging_texture = TRUE;
-       }
-
-       /* Use a staging texture for uploads if the underlying BO is busy. */
-       if (!(usage & PIPE_TRANSFER_READ) &&
+       } else if (!(usage & PIPE_TRANSFER_READ) &&
            (r600_rings_is_buffer_referenced(rctx, rtex->resource.cs_buf, RADEON_USAGE_READWRITE) ||
             rctx->ws->buffer_is_busy(rtex->resource.buf, RADEON_USAGE_READWRITE))) {
+               /* Use a staging texture for uploads if the underlying BO is busy. */
                use_staging_texture = TRUE;
        }
 
@@ -1024,6 +1014,8 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
 
                r600_init_temp_resource_from_box(&resource, texture, box, level,
                                                 R600_RESOURCE_FLAG_TRANSFER);
+               resource.usage = (usage & PIPE_TRANSFER_READ) ?
+                       PIPE_USAGE_STAGING : PIPE_USAGE_STREAM;
 
                /* Create the temporary texture. */
                staging = (struct r600_texture*)ctx->screen->resource_create(ctx->screen, &resource);
@@ -1047,6 +1039,8 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
 
        if (trans->staging) {
                buf = trans->staging;
+               if (!rtex->is_depth && !(usage & PIPE_TRANSFER_READ))
+                       usage |= PIPE_TRANSFER_UNSYNCHRONIZED;
        } else {
                buf = &rtex->resource;
        }
@@ -1229,6 +1223,9 @@ void evergreen_do_fast_color_clear(struct r600_common_context *rctx,
 {
        int i;
 
+       if (rctx->current_render_cond)
+               return;
+
        for (i = 0; i < fb->nr_cbufs; i++) {
                struct r600_texture *tex;
                unsigned clear_bit = PIPE_CLEAR_COLOR0 << i;
@@ -1263,6 +1260,12 @@ void evergreen_do_fast_color_clear(struct r600_common_context *rctx,
                        continue;
                }
 
+               /* fast color clear with 1D tiling doesn't work on old kernels and CIK */
+               if (tex->surface.level[0].mode == RADEON_SURF_MODE_1D &&
+                   rctx->chip_class >= CIK && rctx->screen->info.drm_minor < 38) {
+                       continue;
+               }
+
                /* ensure CMASK is enabled */
                r600_texture_alloc_cmask_separate(rctx->screen, tex);
                if (tex->cmask.size == 0) {
@@ -1272,7 +1275,7 @@ void evergreen_do_fast_color_clear(struct r600_common_context *rctx,
                /* Do the fast clear. */
                evergreen_set_clear_color(tex, fb->cbufs[i]->format, color);
                rctx->clear_buffer(&rctx->b, &tex->cmask_buffer->b.b,
-                                  tex->cmask.offset, tex->cmask.size, 0);
+                                  tex->cmask.offset, tex->cmask.size, 0, true);
 
                tex->dirty_level_mask |= 1 << fb->cbufs[i]->u.tex.level;
                fb_state->dirty = true;