X-Git-Url: https://git.libre-soc.org/?a=blobdiff_plain;f=src%2Fgallium%2Fdrivers%2Fr300%2Fr300_blit.c;h=33344982c1ea53e1dd983fa1065902e96b3a82be;hb=882ca6dfb0f3d17e0f8bc917307d915ab1718069;hp=46578318af2c51bd1f677a69b9069a4db17e41f0;hpb=8ed6b1400bc8a78f46340f41aaf2e88b24c23267;p=mesa.git diff --git a/src/gallium/drivers/r300/r300_blit.c b/src/gallium/drivers/r300/r300_blit.c index 46578318af2..33344982c1e 100644 --- a/src/gallium/drivers/r300/r300_blit.c +++ b/src/gallium/drivers/r300/r300_blit.c @@ -25,7 +25,8 @@ #include "r300_texture.h" #include "r300_reg.h" -#include "util/u_format.h" +#include "util/format/u_format.h" +#include "util/u_half.h" #include "util/u_pack_color.h" #include "util/u_surface.h" @@ -44,7 +45,7 @@ enum r300_blitter_op /* bitmask */ R300_SAVE_TEXTURES | R300_IGNORE_RENDER_COND, R300_BLIT = R300_STOP_QUERY | R300_SAVE_FRAMEBUFFER | - R300_SAVE_TEXTURES | R300_IGNORE_RENDER_COND, + R300_SAVE_TEXTURES, R300_DECOMPRESS = R300_STOP_QUERY | R300_IGNORE_RENDER_COND, }; @@ -117,7 +118,7 @@ static uint32_t r300_depth_clear_cb_value(enum pipe_format format, util_pack_color(rgba, format, &uc); if (util_format_get_blocksizebits(format) == 32) - return uc.ui; + return uc.ui[0]; else return uc.us | (uc.us << 16); } @@ -129,13 +130,14 @@ static boolean r300_cbzb_clear_allowed(struct r300_context *r300, (struct pipe_framebuffer_state*)r300->fb_state.state; /* Only color clear allowed, and only one colorbuffer. */ - if (clear_buffers != PIPE_CLEAR_COLOR || fb->nr_cbufs != 1) + if ((clear_buffers & ~PIPE_CLEAR_COLOR) != 0 || fb->nr_cbufs != 1 || !fb->cbufs[0]) return FALSE; return r300_surface(fb->cbufs[0])->cbzb_allowed; } -static boolean r300_fast_zclear_allowed(struct r300_context *r300) +static boolean r300_fast_zclear_allowed(struct r300_context *r300, + unsigned clear_buffers) { struct pipe_framebuffer_state *fb = (struct pipe_framebuffer_state*)r300->fb_state.state; @@ -175,6 +177,26 @@ static uint32_t r300_hiz_clear_value(double depth) return r | (r << 8) | (r << 16) | (r << 24); } +static void r300_set_clear_color(struct r300_context *r300, + const union pipe_color_union *color) +{ + struct pipe_framebuffer_state *fb = + (struct pipe_framebuffer_state*)r300->fb_state.state; + union util_color uc; + + memset(&uc, 0, sizeof(uc)); + util_pack_color(color->f, fb->cbufs[0]->format, &uc); + + if (fb->cbufs[0]->format == PIPE_FORMAT_R16G16B16A16_FLOAT || + fb->cbufs[0]->format == PIPE_FORMAT_R16G16B16X16_FLOAT) { + /* (0,1,2,3) maps to (B,G,R,A) */ + r300->color_clear_value_gb = uc.h[0] | ((uint32_t)uc.h[1] << 16); + r300->color_clear_value_ar = uc.h[2] | ((uint32_t)uc.h[3] << 16); + } else { + r300->color_clear_value = uc.ui[0]; + } +} + DEBUG_GET_ONCE_BOOL_OPTION(hyperz, "RADEON_HYPERZ", FALSE) /* Clear currently bound buffers. */ @@ -237,13 +259,20 @@ static void r300_clear(struct pipe_context* pipe, uint32_t height = fb->height; uint32_t hyperz_dcv = hyperz->zb_depthclearvalue; - /* Enable fast Z clear. + /* Use fast Z clear. * The zbuffer must be in micro-tiled mode, otherwise it locks up. */ if (buffers & PIPE_CLEAR_DEPTHSTENCIL) { boolean zmask_clear, hiz_clear; - zmask_clear = r300_fast_zclear_allowed(r300); - hiz_clear = r300_hiz_clear_allowed(r300); + /* If both depth and stencil are present, they must be cleared together. */ + if (fb->zsbuf->texture->format == PIPE_FORMAT_S8_UINT_Z24_UNORM && + (buffers & PIPE_CLEAR_DEPTHSTENCIL) != PIPE_CLEAR_DEPTHSTENCIL) { + zmask_clear = FALSE; + hiz_clear = FALSE; + } else { + zmask_clear = r300_fast_zclear_allowed(r300, buffers); + hiz_clear = r300_hiz_clear_allowed(r300); + } /* If we need Hyper-Z. */ if (zmask_clear || hiz_clear) { @@ -262,28 +291,64 @@ static void r300_clear(struct pipe_context* pipe, /* Setup Hyper-Z clears. */ if (r300->hyperz_enabled) { - DBG(r300, DBG_HYPERZ, "r300: Clear memory: %s%s\n", - zmask_clear ? "ZMASK " : "", hiz_clear ? "HIZ" : ""); - if (zmask_clear) { hyperz_dcv = hyperz->zb_depthclearvalue = r300_depth_clear_value(fb->zsbuf->format, depth, stencil); r300_mark_atom_dirty(r300, &r300->zmask_clear); + r300_mark_atom_dirty(r300, &r300->gpu_flush); buffers &= ~PIPE_CLEAR_DEPTHSTENCIL; } if (hiz_clear) { r300->hiz_clear_value = r300_hiz_clear_value(depth); r300_mark_atom_dirty(r300, &r300->hiz_clear); + r300_mark_atom_dirty(r300, &r300->gpu_flush); } r300->num_z_clears++; } } } + /* Use fast color clear for an AA colorbuffer. + * The CMASK is shared between all colorbuffers, so we use it + * if there is only one colorbuffer bound. */ + if ((buffers & PIPE_CLEAR_COLOR) && fb->nr_cbufs == 1 && fb->cbufs[0] && + r300_resource(fb->cbufs[0]->texture)->tex.cmask_dwords) { + /* Try to obtain the access to the CMASK if we don't have one. */ + if (!r300->cmask_access) { + r300->cmask_access = + r300->rws->cs_request_feature(r300->cs, + RADEON_FID_R300_CMASK_ACCESS, + TRUE); + } + + /* Setup the clear. */ + if (r300->cmask_access) { + /* Pair the resource with the CMASK to avoid other resources + * accessing it. */ + if (!r300->screen->cmask_resource) { + mtx_lock(&r300->screen->cmask_mutex); + /* Double checking (first unlocked, then locked). */ + if (!r300->screen->cmask_resource) { + /* Don't reference this, so that the texture can be + * destroyed while set in cmask_resource. + * Then in texture_destroy, we set cmask_resource to NULL. */ + r300->screen->cmask_resource = fb->cbufs[0]->texture; + } + mtx_unlock(&r300->screen->cmask_mutex); + } + + if (r300->screen->cmask_resource == fb->cbufs[0]->texture) { + r300_set_clear_color(r300, color); + r300_mark_atom_dirty(r300, &r300->cmask_clear); + r300_mark_atom_dirty(r300, &r300->gpu_flush); + buffers &= ~PIPE_CLEAR_COLOR; + } + } + } /* Enable CBZB clear. */ - if (r300_cbzb_clear_allowed(r300, buffers)) { + else if (r300_cbzb_clear_allowed(r300, buffers)) { struct r300_surface *surf = r300_surface(fb->cbufs[0]); hyperz->zb_depthclearvalue = @@ -298,30 +363,34 @@ static void r300_clear(struct pipe_context* pipe, /* Clear. */ if (buffers) { - enum pipe_format cformat = fb->nr_cbufs ? fb->cbufs[0]->format : PIPE_FORMAT_NONE; /* Clear using the blitter. */ r300_blitter_begin(r300, R300_CLEAR); - util_blitter_clear(r300->blitter, - width, - height, - fb->nr_cbufs, - buffers, cformat, color, depth, stencil); + util_blitter_clear(r300->blitter, width, height, 1, + buffers, color, depth, stencil, + util_framebuffer_get_num_samples(fb) > 1); r300_blitter_end(r300); - } else if (r300->zmask_clear.dirty || r300->hiz_clear.dirty) { + } else if (r300->zmask_clear.dirty || + r300->hiz_clear.dirty || + r300->cmask_clear.dirty) { /* Just clear zmask and hiz now, this does not use the standard draw * procedure. */ /* Calculate zmask_clear and hiz_clear atom sizes. */ unsigned dwords = + r300->gpu_flush.size + (r300->zmask_clear.dirty ? r300->zmask_clear.size : 0) + (r300->hiz_clear.dirty ? r300->hiz_clear.size : 0) + + (r300->cmask_clear.dirty ? r300->cmask_clear.size : 0) + r300_get_num_cs_end_dwords(r300); /* Reserve CS space. */ - if (dwords > (RADEON_MAX_CMDBUF_DWORDS - r300->cs->cdw)) { - r300_flush(&r300->context, RADEON_FLUSH_ASYNC, NULL); + if (!r300->rws->cs_check_space(r300->cs, dwords, false)) { + r300_flush(&r300->context, PIPE_FLUSH_ASYNC, NULL); } /* Emit clear packets. */ + r300_emit_gpu_flush(r300, r300->gpu_flush.size, r300->gpu_flush.state); + r300->gpu_flush.dirty = FALSE; + if (r300->zmask_clear.dirty) { r300_emit_zmask_clear(r300, r300->zmask_clear.size, r300->zmask_clear.state); @@ -332,6 +401,11 @@ static void r300_clear(struct pipe_context* pipe, r300->hiz_clear.state); r300->hiz_clear.dirty = FALSE; } + if (r300->cmask_clear.dirty) { + r300_emit_cmask_clear(r300, r300->cmask_clear.size, + r300->cmask_clear.state); + r300->cmask_clear.dirty = FALSE; + } } else { assert(0); } @@ -357,11 +431,13 @@ static void r300_clear_render_target(struct pipe_context *pipe, struct pipe_surface *dst, const union pipe_color_union *color, unsigned dstx, unsigned dsty, - unsigned width, unsigned height) + unsigned width, unsigned height, + bool render_condition_enabled) { struct r300_context *r300 = r300_context(pipe); - r300_blitter_begin(r300, R300_CLEAR_SURFACE); + r300_blitter_begin(r300, R300_CLEAR_SURFACE | + (render_condition_enabled ? 0 : R300_IGNORE_RENDER_COND)); util_blitter_clear_render_target(r300->blitter, dst, color, dstx, dsty, width, height); r300_blitter_end(r300); @@ -374,7 +450,8 @@ static void r300_clear_depth_stencil(struct pipe_context *pipe, double depth, unsigned stencil, unsigned dstx, unsigned dsty, - unsigned width, unsigned height) + unsigned width, unsigned height, + bool render_condition_enabled) { struct r300_context *r300 = r300_context(pipe); struct pipe_framebuffer_state *fb = @@ -387,7 +464,8 @@ static void r300_clear_depth_stencil(struct pipe_context *pipe, } /* XXX Do not decompress ZMask of the currently-set zbuffer. */ - r300_blitter_begin(r300, R300_CLEAR_SURFACE); + r300_blitter_begin(r300, R300_CLEAR_SURFACE | + (render_condition_enabled ? 0 : R300_IGNORE_RENDER_COND)); util_blitter_clear_depth_stencil(r300->blitter, dst, clear_flags, depth, stencil, dstx, dsty, width, height); r300_blitter_end(r300); @@ -490,17 +568,17 @@ static void r300_resource_copy_region(struct pipe_context *pipe, * colorbuffers. */ util_blitter_default_dst_texture(&dst_templ, dst, dst_level, dstz); - util_blitter_default_src_texture(&src_templ, src, src_level); + util_blitter_default_src_texture(r300->blitter, &src_templ, src, src_level); layout = util_format_description(dst_templ.format)->layout; /* Handle non-renderable plain formats. */ if (layout == UTIL_FORMAT_LAYOUT_PLAIN && (!screen->is_format_supported(screen, src_templ.format, src->target, - src->nr_samples, + src->nr_samples, src->nr_storage_samples, PIPE_BIND_SAMPLER_VIEW) || !screen->is_format_supported(screen, dst_templ.format, dst->target, - dst->nr_samples, + dst->nr_samples, dst->nr_storage_samples, PIPE_BIND_RENDER_TARGET))) { switch (util_format_get_blocksize(dst_templ.format)) { case 1: @@ -567,9 +645,11 @@ static void r300_resource_copy_region(struct pipe_context *pipe, /* Fallback for textures. */ if (!screen->is_format_supported(screen, dst_templ.format, dst->target, dst->nr_samples, + dst->nr_storage_samples, PIPE_BIND_RENDER_TARGET) || !screen->is_format_supported(screen, src_templ.format, src->target, src->nr_samples, + src->nr_storage_samples, PIPE_BIND_SAMPLER_VIEW)) { assert(0 && "this shouldn't happen, update r300_is_blit_supported"); util_resource_copy_region(pipe, dst, dst_level, dstx, dsty, dstz, @@ -607,7 +687,9 @@ static boolean r300_is_simple_msaa_resolve(const struct pipe_blit_info *info) unsigned dst_width = u_minify(info->dst.resource->width0, info->dst.level); unsigned dst_height = u_minify(info->dst.resource->height0, info->dst.level); - return info->dst.resource->format == info->src.resource->format && + return info->src.resource->nr_samples > 1 && + info->dst.resource->nr_samples <= 1 && + info->dst.resource->format == info->src.resource->format && info->dst.resource->format == info->dst.format && info->src.resource->format == info->src.format && !info->scissor_enable && @@ -621,7 +703,9 @@ static boolean r300_is_simple_msaa_resolve(const struct pipe_blit_info *info) info->src.box.x == 0 && info->src.box.y == 0 && info->src.box.width == dst_width && - info->src.box.height == dst_height; + info->src.box.height == dst_height && + (r300_resource(info->dst.resource)->tex.microtile != RADEON_LAYOUT_LINEAR || + r300_resource(info->dst.resource)->tex.macrotile[info->dst.level] != RADEON_LAYOUT_LINEAR); } static void r300_simple_msaa_resolve(struct pipe_context *pipe, @@ -698,7 +782,8 @@ static void r300_msaa_resolve(struct pipe_context *pipe, templ.height0 = info->src.resource->height0; templ.depth0 = 1; templ.array_size = 1; - templ.usage = PIPE_USAGE_STATIC; + templ.usage = PIPE_USAGE_DEFAULT; + templ.flags = R300_RESOURCE_FORCE_MICROTILING; tmp = screen->resource_create(screen, &templ); @@ -711,7 +796,7 @@ static void r300_msaa_resolve(struct pipe_context *pipe, blit.src.resource = tmp; blit.src.box.z = 0; - r300_blitter_begin(r300, R300_BLIT); + r300_blitter_begin(r300, R300_BLIT | R300_IGNORE_RENDER_COND); util_blitter_blit(r300->blitter, &blit); r300_blitter_end(r300); @@ -726,9 +811,17 @@ static void r300_blit(struct pipe_context *pipe, (struct pipe_framebuffer_state*)r300->fb_state.state; struct pipe_blit_info info = *blit; + /* The driver supports sRGB textures but not framebuffers. Blitting + * from sRGB to sRGB should be the same as blitting from linear + * to linear, so use that, This avoids incorrect linearization. + */ + if (util_format_is_srgb(info.src.format)) { + info.src.format = util_format_linear(info.src.format); + info.dst.format = util_format_linear(info.dst.format); + } + /* MSAA resolve. */ if (info.src.resource->nr_samples > 1 && - info.dst.resource->nr_samples <= 1 && !util_format_is_depth_or_stencil(info.src.resource->format)) { r300_msaa_resolve(pipe, &info); return; @@ -770,11 +863,17 @@ static void r300_blit(struct pipe_context *pipe, } } - r300_blitter_begin(r300, R300_BLIT); + r300_blitter_begin(r300, R300_BLIT | + (info.render_condition_enable ? 0 : R300_IGNORE_RENDER_COND)); util_blitter_blit(r300->blitter, &info); r300_blitter_end(r300); } +static void r300_flush_resource(struct pipe_context *ctx, + struct pipe_resource *resource) +{ +} + void r300_init_blit_functions(struct r300_context *r300) { r300->context.clear = r300_clear; @@ -782,4 +881,5 @@ void r300_init_blit_functions(struct r300_context *r300) r300->context.clear_depth_stencil = r300_clear_depth_stencil; r300->context.resource_copy_region = r300_resource_copy_region; r300->context.blit = r300_blit; + r300->context.flush_resource = r300_flush_resource; }