/*
 * Copyright 2009 Marek Olšák <maraeo@gmail.com>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * on the rights to use, copy, modify, merge, publish, distribute, sub
 * license, and/or sell copies of the Software, and to permit persons to whom
 * the Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23 #include "r300_context.h"
24 #include "r300_emit.h"
25 #include "r300_hyperz.h"
26 #include "r300_texture.h"
27 #include "r300_winsys.h"
29 #include "util/u_format.h"
30 #include "util/u_pack_color.h"
/* Kinds of blitter operation; a bitmask, so values may be tested with '&'.
 * r300_blitter_begin() uses it to decide which extra state must be saved. */
enum r300_blitter_op
{
    /* NOTE(review): only R300_CLEAR_SURFACE = 2 is visible in the listing;
     * the other two enumerators are used in this file and are restored here
     * as the remaining low bits - confirm the values. */
    R300_CLEAR         = 1,
    R300_CLEAR_SURFACE = 2,
    R300_COPY          = 4
};
39 static void r300_blitter_begin(struct r300_context
* r300
, enum r300_blitter_op op
)
41 if (r300
->query_current
) {
42 r300
->blitter_saved_query
= r300
->query_current
;
43 r300_stop_query(r300
);
46 /* Yeah we have to save all those states to ensure the blitter operation
47 * is really transparent. The states will be restored by the blitter once
49 util_blitter_save_blend(r300
->blitter
, r300
->blend_state
.state
);
50 util_blitter_save_depth_stencil_alpha(r300
->blitter
, r300
->dsa_state
.state
);
51 util_blitter_save_stencil_ref(r300
->blitter
, &(r300
->stencil_ref
));
52 util_blitter_save_rasterizer(r300
->blitter
, r300
->rs_state
.state
);
53 util_blitter_save_fragment_shader(r300
->blitter
, r300
->fs
.state
);
54 util_blitter_save_vertex_shader(r300
->blitter
, r300
->vs_state
.state
);
55 util_blitter_save_viewport(r300
->blitter
, &r300
->viewport
);
56 util_blitter_save_clip(r300
->blitter
, (struct pipe_clip_state
*)r300
->clip_state
.state
);
57 util_blitter_save_vertex_elements(r300
->blitter
, r300
->velems
);
58 util_blitter_save_vertex_buffers(r300
->blitter
, r300
->vertex_buffer_count
,
61 if (op
& (R300_CLEAR_SURFACE
| R300_COPY
))
62 util_blitter_save_framebuffer(r300
->blitter
, r300
->fb_state
.state
);
65 struct r300_textures_state
* state
=
66 (struct r300_textures_state
*)r300
->textures_state
.state
;
68 util_blitter_save_fragment_sampler_states(
69 r300
->blitter
, state
->sampler_state_count
,
70 (void**)state
->sampler_states
);
72 util_blitter_save_fragment_sampler_views(
73 r300
->blitter
, state
->sampler_view_count
,
74 (struct pipe_sampler_view
**)state
->sampler_views
);
78 static void r300_blitter_end(struct r300_context
*r300
)
80 if (r300
->blitter_saved_query
) {
81 r300_resume_query(r300
, r300
->blitter_saved_query
);
82 r300
->blitter_saved_query
= NULL
;
86 static uint32_t r300_depth_clear_cb_value(enum pipe_format format
,
90 util_pack_color(rgba
, format
, &uc
);
92 if (util_format_get_blocksizebits(format
) == 32)
95 return uc
.us
| (uc
.us
<< 16);
98 static boolean
r300_cbzb_clear_allowed(struct r300_context
*r300
,
99 unsigned clear_buffers
)
101 struct pipe_framebuffer_state
*fb
=
102 (struct pipe_framebuffer_state
*)r300
->fb_state
.state
;
104 /* Only color clear allowed, and only one colorbuffer. */
105 if (clear_buffers
!= PIPE_CLEAR_COLOR
|| fb
->nr_cbufs
!= 1)
108 return r300_surface(fb
->cbufs
[0])->cbzb_allowed
;
111 static uint32_t r300_depth_clear_value(enum pipe_format format
,
112 double depth
, unsigned stencil
)
115 case PIPE_FORMAT_Z16_UNORM
:
116 case PIPE_FORMAT_X8Z24_UNORM
:
117 return util_pack_z(format
, depth
);
119 case PIPE_FORMAT_S8_USCALED_Z24_UNORM
:
120 return util_pack_z_stencil(format
, depth
, stencil
);
128 /* Clear currently bound buffers. */
129 static void r300_clear(struct pipe_context
* pipe
,
135 /* My notes about fastfill:
137 * 1) Only the zbuffer is cleared.
139 * 2) The zbuffer must be micro-tiled and whole microtiles must be
140 * written. If microtiling is disabled, it locks up.
142 * 3) There is Z Mask RAM which contains a compressed zbuffer and
143 * it interacts with fastfill. We should figure out how to use it
144 * to get more performance.
145 * This is what we know about the Z Mask:
147 * Each dword of the Z Mask contains compression information
148 * for 16 4x4 pixel blocks, that is 2 bits for each block.
149 * On chips with 2 Z pipes, every other dword maps to a different
152 * 4) ZB_DEPTHCLEARVALUE is used to clear the zbuffer and the Z Mask must
153 * be equal to 0. (clear the Z Mask RAM with zeros)
155 * 5) For 16-bit zbuffer, compression causes a hung with one or
156 * two samples and should not be used.
158 * 6) FORCE_COMPRESSED_STENCIL_VALUE should be enabled for stencil clears
159 * to avoid needless decompression.
161 * 7) Fastfill must not be used if reading of compressed Z data is disabled
162 * and writing of compressed Z data is enabled (RD/WR_COMP_ENABLE),
163 * i.e. it cannot be used to compress the zbuffer.
165 * 8) ZB_CB_CLEAR does not interact with fastfill in any way.
170 struct r300_context
* r300
= r300_context(pipe
);
171 struct pipe_framebuffer_state
*fb
=
172 (struct pipe_framebuffer_state
*)r300
->fb_state
.state
;
173 struct r300_hyperz_state
*hyperz
=
174 (struct r300_hyperz_state
*)r300
->hyperz_state
.state
;
175 struct r300_texture
*zstex
=
176 fb
->zsbuf
? r300_texture(fb
->zsbuf
->texture
) : NULL
;
177 uint32_t width
= fb
->width
;
178 uint32_t height
= fb
->height
;
179 boolean has_hyperz
= r300
->rws
->get_value(r300
->rws
, R300_CAN_HYPERZ
);
180 uint32_t hyperz_dcv
= hyperz
->zb_depthclearvalue
;
182 /* Enable fast Z clear.
183 * The zbuffer must be in micro-tiled mode, otherwise it locks up. */
184 if ((buffers
& PIPE_CLEAR_DEPTHSTENCIL
) && has_hyperz
) {
185 hyperz_dcv
= hyperz
->zb_depthclearvalue
=
186 r300_depth_clear_value(fb
->zsbuf
->format
, depth
, stencil
);
188 r300_mark_fb_state_dirty(r300
, R300_CHANGED_ZCLEAR_FLAG
);
189 if (zstex
->zmask_mem
[fb
->zsbuf
->level
]) {
190 r300
->zmask_clear
.dirty
= TRUE
;
191 buffers
&= ~PIPE_CLEAR_DEPTHSTENCIL
;
193 if (zstex
->hiz_mem
[fb
->zsbuf
->level
])
194 r300
->hiz_clear
.dirty
= TRUE
;
197 /* Enable CBZB clear. */
198 if (r300_cbzb_clear_allowed(r300
, buffers
)) {
199 struct r300_surface
*surf
= r300_surface(fb
->cbufs
[0]);
201 hyperz
->zb_depthclearvalue
=
202 r300_depth_clear_cb_value(surf
->base
.format
, rgba
);
204 width
= surf
->cbzb_width
;
205 height
= surf
->cbzb_height
;
207 r300
->cbzb_clear
= TRUE
;
208 r300_mark_fb_state_dirty(r300
, R300_CHANGED_CBZB_FLAG
);
213 /* Clear using the blitter. */
214 r300_blitter_begin(r300
, R300_CLEAR
);
215 util_blitter_clear(r300
->blitter
,
219 buffers
, rgba
, depth
, stencil
);
220 r300_blitter_end(r300
);
221 } else if (r300
->zmask_clear
.dirty
) {
222 /* Just clear zmask and hiz now, this does not use a standard draw
226 /* Calculate zmask_clear and hiz_clear atom sizes. */
227 r300_update_hyperz_state(r300
);
228 dwords
= r300
->zmask_clear
.size
+
229 (r300
->hiz_clear
.dirty
? r300
->hiz_clear
.size
: 0) +
230 r300_get_num_cs_end_dwords(r300
);
232 /* Reserve CS space. */
233 if (dwords
> (r300
->cs
->ndw
- r300
->cs
->cdw
)) {
234 r300
->context
.flush(&r300
->context
, 0, NULL
);
237 /* Emit clear packets. */
238 r300_emit_zmask_clear(r300
, r300
->zmask_clear
.size
,
239 r300
->zmask_clear
.state
);
240 r300
->zmask_clear
.dirty
= FALSE
;
241 if (r300
->hiz_clear
.dirty
) {
242 r300_emit_hiz_clear(r300
, r300
->hiz_clear
.size
,
243 r300
->hiz_clear
.state
);
244 r300
->hiz_clear
.dirty
= FALSE
;
250 /* Disable CBZB clear. */
251 if (r300
->cbzb_clear
) {
252 r300
->cbzb_clear
= FALSE
;
253 hyperz
->zb_depthclearvalue
= hyperz_dcv
;
254 r300_mark_fb_state_dirty(r300
, R300_CHANGED_CBZB_FLAG
);
257 /* Enable fastfill and/or hiz.
259 * If we cleared zmask/hiz, it's in use now. The Hyper-Z state update
260 * looks if zmask/hiz is in use and enables fastfill accordingly. */
262 (zstex
->zmask_in_use
[fb
->zsbuf
->level
] ||
263 zstex
->hiz_in_use
[fb
->zsbuf
->level
])) {
264 r300
->hyperz_state
.dirty
= TRUE
;
267 /* XXX this flush "fixes" a hardlock in the cubestorm xscreensaver */
268 if (r300
->flush_counter
== 0)
269 pipe
->flush(pipe
, 0, NULL
);
272 /* Clear a region of a color surface to a constant value. */
273 static void r300_clear_render_target(struct pipe_context
*pipe
,
274 struct pipe_surface
*dst
,
276 unsigned dstx
, unsigned dsty
,
277 unsigned width
, unsigned height
)
279 struct r300_context
*r300
= r300_context(pipe
);
281 r300_blitter_begin(r300
, R300_CLEAR_SURFACE
);
282 util_blitter_clear_render_target(r300
->blitter
, dst
, rgba
,
283 dstx
, dsty
, width
, height
);
284 r300_blitter_end(r300
);
287 /* Clear a region of a depth stencil surface. */
288 static void r300_clear_depth_stencil(struct pipe_context
*pipe
,
289 struct pipe_surface
*dst
,
290 unsigned clear_flags
,
293 unsigned dstx
, unsigned dsty
,
294 unsigned width
, unsigned height
)
296 struct r300_context
*r300
= r300_context(pipe
);
298 r300_blitter_begin(r300
, R300_CLEAR_SURFACE
);
299 util_blitter_clear_depth_stencil(r300
->blitter
, dst
, clear_flags
, depth
, stencil
,
300 dstx
, dsty
, width
, height
);
301 r300_blitter_end(r300
);
304 /* Flush a depth stencil buffer. */
305 void r300_flush_depth_stencil(struct pipe_context
*pipe
,
306 struct pipe_resource
*dst
,
307 struct pipe_subresource subdst
,
310 struct r300_context
*r300
= r300_context(pipe
);
311 struct pipe_surface
*dstsurf
;
312 struct r300_texture
*tex
= r300_texture(dst
);
314 if (!tex
->zmask_mem
[subdst
.level
])
316 if (!tex
->zmask_in_use
[subdst
.level
])
319 dstsurf
= pipe
->screen
->get_tex_surface(pipe
->screen
, dst
,
320 subdst
.face
, subdst
.level
, zslice
,
321 PIPE_BIND_DEPTH_STENCIL
);
322 r300
->z_decomp_rd
= TRUE
;
323 r300_blitter_begin(r300
, R300_CLEAR_SURFACE
);
324 util_blitter_flush_depth_stencil(r300
->blitter
, dstsurf
);
325 r300_blitter_end(r300
);
326 r300
->z_decomp_rd
= FALSE
;
328 tex
->zmask_in_use
[subdst
.level
] = FALSE
;
331 /* Copy a block of pixels from one surface to another using HW. */
332 static void r300_hw_copy_region(struct pipe_context
* pipe
,
333 struct pipe_resource
*dst
,
334 struct pipe_subresource subdst
,
335 unsigned dstx
, unsigned dsty
, unsigned dstz
,
336 struct pipe_resource
*src
,
337 struct pipe_subresource subsrc
,
338 unsigned srcx
, unsigned srcy
, unsigned srcz
,
339 unsigned width
, unsigned height
)
341 struct r300_context
* r300
= r300_context(pipe
);
343 r300_blitter_begin(r300
, R300_COPY
);
344 util_blitter_copy_region(r300
->blitter
, dst
, subdst
, dstx
, dsty
, dstz
,
345 src
, subsrc
, srcx
, srcy
, srcz
, width
, height
,
347 r300_blitter_end(r300
);
350 /* Copy a block of pixels from one surface to another. */
351 static void r300_resource_copy_region(struct pipe_context
*pipe
,
352 struct pipe_resource
*dst
,
353 struct pipe_subresource subdst
,
354 unsigned dstx
, unsigned dsty
, unsigned dstz
,
355 struct pipe_resource
*src
,
356 struct pipe_subresource subsrc
,
357 unsigned srcx
, unsigned srcy
, unsigned srcz
,
358 unsigned width
, unsigned height
)
360 enum pipe_format old_format
= dst
->format
;
361 enum pipe_format new_format
= old_format
;
363 if (!pipe
->screen
->is_format_supported(pipe
->screen
,
364 old_format
, src
->target
,
366 PIPE_BIND_RENDER_TARGET
|
367 PIPE_BIND_SAMPLER_VIEW
, 0) &&
368 util_format_is_plain(old_format
)) {
369 switch (util_format_get_blocksize(old_format
)) {
371 new_format
= PIPE_FORMAT_I8_UNORM
;
374 new_format
= PIPE_FORMAT_B4G4R4A4_UNORM
;
377 new_format
= PIPE_FORMAT_B8G8R8A8_UNORM
;
380 new_format
= PIPE_FORMAT_R16G16B16A16_UNORM
;
383 debug_printf("r300: surface_copy: Unhandled format: %s. Falling back to software.\n"
384 "r300: surface_copy: Software fallback doesn't work for tiled textures.\n",
385 util_format_short_name(old_format
));
389 is_depth
= util_format_get_component_bits(src
->format
, UTIL_FORMAT_COLORSPACE_ZS
, 0) != 0;
391 r300_flush_depth_stencil(pipe
, src
, subsrc
, srcz
);
393 if (old_format
!= new_format
) {
394 dst
->format
= new_format
;
395 src
->format
= new_format
;
397 r300_texture_reinterpret_format(pipe
->screen
,
399 r300_texture_reinterpret_format(pipe
->screen
,
403 r300_hw_copy_region(pipe
, dst
, subdst
, dstx
, dsty
, dstz
,
404 src
, subsrc
, srcx
, srcy
, srcz
, width
, height
);
406 if (old_format
!= new_format
) {
407 dst
->format
= old_format
;
408 src
->format
= old_format
;
410 r300_texture_reinterpret_format(pipe
->screen
,
412 r300_texture_reinterpret_format(pipe
->screen
,
417 void r300_init_blit_functions(struct r300_context
*r300
)
419 r300
->context
.clear
= r300_clear
;
420 r300
->context
.clear_render_target
= r300_clear_render_target
;
421 r300
->context
.clear_depth_stencil
= r300_clear_depth_stencil
;
422 r300
->context
.resource_copy_region
= r300_resource_copy_region
;