1 /* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
/*
 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Rob Clark <robclark@freedesktop.org>
 */

29 #include "pipe/p_state.h"
30 #include "util/u_string.h"
31 #include "util/u_memory.h"
32 #include "util/u_prim.h"
33 #include "util/u_format.h"
34 #include "util/u_helpers.h"
36 #include "freedreno_draw.h"
37 #include "freedreno_context.h"
38 #include "freedreno_state.h"
39 #include "freedreno_resource.h"
40 #include "freedreno_query_acc.h"
41 #include "freedreno_query_hw.h"
42 #include "freedreno_util.h"
/**
 * Record that @batch reads from @prsc.
 *
 * Forwards to fd_batch_resource_used() with its last argument set to false.
 * Callers in this file pass optional resources without checking them first
 * (for example ctx->indexbuf.buffer is marked on every draw), so a NULL
 * @prsc is accepted and silently ignored rather than being handed to
 * fd_resource().
 */
static void
resource_read(struct fd_batch *batch, struct pipe_resource *prsc)
{
	if (!prsc)
		return;

	fd_batch_resource_used(batch, fd_resource(prsc), false);
}

/**
 * Record that @batch writes to @prsc.
 *
 * Forwards to fd_batch_resource_used() with its last argument set to true.
 * Callers in this file pass optional resources without checking them first
 * (for example batch->query_buf), so a NULL @prsc is accepted and silently
 * ignored rather than being handed to fd_resource().
 */
static void
resource_written(struct fd_batch *batch, struct pipe_resource *prsc)
{
	if (!prsc)
		return;

	fd_batch_resource_used(batch, fd_resource(prsc), true);
}

61 fd_draw_vbo(struct pipe_context
*pctx
, const struct pipe_draw_info
*info
)
63 struct fd_context
*ctx
= fd_context(pctx
);
64 struct fd_batch
*batch
= ctx
->batch
;
65 struct pipe_framebuffer_state
*pfb
= &batch
->framebuffer
;
66 struct pipe_scissor_state
*scissor
= fd_context_get_scissor(ctx
);
67 unsigned i
, prims
, buffers
= 0;
69 if (!info
->count_from_stream_output
&& !info
->indirect
&&
70 !info
->primitive_restart
&&
71 !u_trim_pipe_prim(info
->mode
, (unsigned*)&info
->count
))
74 /* if we supported transform feedback, we'd have to disable this: */
75 if (((scissor
->maxx
- scissor
->minx
) *
76 (scissor
->maxy
- scissor
->miny
)) == 0) {
80 /* TODO: push down the region versions into the tiles */
81 if (!fd_render_condition_check(pctx
))
84 /* emulate unsupported primitives: */
85 if (!fd_supported_prim(ctx
, info
->mode
)) {
86 if (ctx
->streamout
.num_targets
> 0)
87 debug_error("stream-out with emulated prims");
88 util_primconvert_save_index_buffer(ctx
->primconvert
, &ctx
->indexbuf
);
89 util_primconvert_save_rasterizer_state(ctx
->primconvert
, ctx
->rasterizer
);
90 util_primconvert_draw_vbo(ctx
->primconvert
, info
);
94 /* Upload a user index buffer. */
95 struct pipe_index_buffer ibuffer_saved
= {};
96 if (info
->indexed
&& ctx
->indexbuf
.user_buffer
&&
97 !util_save_and_upload_index_buffer(pctx
, info
, &ctx
->indexbuf
,
103 fd_batch_reset(batch
);
104 fd_context_all_dirty(ctx
);
107 batch
->blit
= ctx
->in_blit
;
108 batch
->back_blit
= ctx
->in_shadow
;
110 /* NOTE: needs to be before resource_written(batch->query_buf), otherwise
111 * query_buf may not be created yet.
113 fd_batch_set_stage(batch
, FD_STAGE_DRAW
);
116 * Figure out the buffers/features we need:
119 mtx_lock(&ctx
->screen
->lock
);
121 if (fd_depth_enabled(ctx
)) {
122 buffers
|= FD_BUFFER_DEPTH
;
123 resource_written(batch
, pfb
->zsbuf
->texture
);
124 batch
->gmem_reason
|= FD_GMEM_DEPTH_ENABLED
;
127 if (fd_stencil_enabled(ctx
)) {
128 buffers
|= FD_BUFFER_STENCIL
;
129 resource_written(batch
, pfb
->zsbuf
->texture
);
130 batch
->gmem_reason
|= FD_GMEM_STENCIL_ENABLED
;
133 if (fd_logicop_enabled(ctx
))
134 batch
->gmem_reason
|= FD_GMEM_LOGICOP_ENABLED
;
136 for (i
= 0; i
< pfb
->nr_cbufs
; i
++) {
137 struct pipe_resource
*surf
;
142 surf
= pfb
->cbufs
[i
]->texture
;
144 resource_written(batch
, surf
);
145 buffers
|= PIPE_CLEAR_COLOR0
<< i
;
147 if (surf
->nr_samples
> 1)
148 batch
->gmem_reason
|= FD_GMEM_MSAA_ENABLED
;
150 if (fd_blend_enabled(ctx
, i
))
151 batch
->gmem_reason
|= FD_GMEM_BLEND_ENABLED
;
154 /* Mark SSBOs as being written.. we don't actually know which ones are
155 * read vs written, so just assume the worst
157 foreach_bit(i
, ctx
->shaderbuf
[PIPE_SHADER_FRAGMENT
].enabled_mask
)
158 resource_read(batch
, ctx
->shaderbuf
[PIPE_SHADER_FRAGMENT
].sb
[i
].buffer
);
160 foreach_bit(i
, ctx
->constbuf
[PIPE_SHADER_VERTEX
].enabled_mask
)
161 resource_read(batch
, ctx
->constbuf
[PIPE_SHADER_VERTEX
].cb
[i
].buffer
);
162 foreach_bit(i
, ctx
->constbuf
[PIPE_SHADER_FRAGMENT
].enabled_mask
)
163 resource_read(batch
, ctx
->constbuf
[PIPE_SHADER_FRAGMENT
].cb
[i
].buffer
);
165 /* Mark VBOs as being read */
166 foreach_bit(i
, ctx
->vtx
.vertexbuf
.enabled_mask
) {
167 assert(!ctx
->vtx
.vertexbuf
.vb
[i
].user_buffer
);
168 resource_read(batch
, ctx
->vtx
.vertexbuf
.vb
[i
].buffer
);
171 /* Mark index buffer as being read */
172 resource_read(batch
, ctx
->indexbuf
.buffer
);
174 /* Mark textures as being read */
175 foreach_bit(i
, ctx
->tex
[PIPE_SHADER_VERTEX
].valid_textures
)
176 resource_read(batch
, ctx
->tex
[PIPE_SHADER_VERTEX
].textures
[i
]->texture
);
177 foreach_bit(i
, ctx
->tex
[PIPE_SHADER_FRAGMENT
].valid_textures
)
178 resource_read(batch
, ctx
->tex
[PIPE_SHADER_FRAGMENT
].textures
[i
]->texture
);
180 /* Mark streamout buffers as being written.. */
181 for (i
= 0; i
< ctx
->streamout
.num_targets
; i
++)
182 if (ctx
->streamout
.targets
[i
])
183 resource_written(batch
, ctx
->streamout
.targets
[i
]->buffer
);
185 resource_written(batch
, batch
->query_buf
);
187 list_for_each_entry(struct fd_acc_query
, aq
, &ctx
->acc_active_queries
, node
)
188 resource_written(batch
, aq
->prsc
);
190 mtx_unlock(&ctx
->screen
->lock
);
194 prims
= u_reduced_prims_for_vertices(info
->mode
, info
->count
);
196 ctx
->stats
.draw_calls
++;
198 /* TODO prims_emitted should be clipped when the stream-out buffer is
199 * not large enough. See max_tf_vtx().. probably need to move that
200 * into common code. Although a bit more annoying since a2xx doesn't
201 * use ir3 so no common way to get at the pipe_stream_output_info
202 * which is needed for this calculation.
204 if (ctx
->streamout
.num_targets
> 0)
205 ctx
->stats
.prims_emitted
+= prims
;
206 ctx
->stats
.prims_generated
+= prims
;
208 /* any buffers that haven't been cleared yet, we need to restore: */
209 batch
->restore
|= buffers
& (FD_BUFFER_ALL
& ~batch
->cleared
);
210 /* and any buffers used, need to be resolved: */
211 batch
->resolve
|= buffers
;
213 DBG("%p: %x %ux%u num_draws=%u (%s/%s)", batch
, buffers
,
214 pfb
->width
, pfb
->height
, batch
->num_draws
,
215 util_format_short_name(pipe_surface_format(pfb
->cbufs
[0])),
216 util_format_short_name(pipe_surface_format(pfb
->zsbuf
)));
218 if (ctx
->draw_vbo(ctx
, info
))
219 batch
->needs_flush
= true;
221 for (i
= 0; i
< ctx
->streamout
.num_targets
; i
++)
222 ctx
->streamout
.offsets
[i
] += info
->count
;
224 if (fd_mesa_debug
& FD_DBG_DDRAW
)
225 fd_context_all_dirty(ctx
);
227 fd_batch_check_size(batch
);
229 if (info
->indexed
&& ibuffer_saved
.user_buffer
)
230 pctx
->set_index_buffer(pctx
, &ibuffer_saved
);
233 /* Generic clear implementation (partially) using u_blitter: */
235 fd_blitter_clear(struct pipe_context
*pctx
, unsigned buffers
,
236 const union pipe_color_union
*color
, double depth
, unsigned stencil
)
238 struct fd_context
*ctx
= fd_context(pctx
);
239 struct pipe_framebuffer_state
*pfb
= &ctx
->batch
->framebuffer
;
240 struct blitter_context
*blitter
= ctx
->blitter
;
242 fd_blitter_pipe_begin(ctx
, false, true, FD_STAGE_CLEAR
);
244 util_blitter_common_clear_setup(blitter
, pfb
->width
, pfb
->height
,
245 buffers
, NULL
, NULL
);
247 struct pipe_stencil_ref sr
= {
248 .ref_value
= { stencil
& 0xff }
250 pctx
->set_stencil_ref(pctx
, &sr
);
252 struct pipe_constant_buffer cb
= {
254 .user_buffer
= &color
->ui
,
256 pctx
->set_constant_buffer(pctx
, PIPE_SHADER_FRAGMENT
, 0, &cb
);
258 if (!ctx
->clear_rs_state
) {
259 const struct pipe_rasterizer_state tmpl
= {
260 .cull_face
= PIPE_FACE_NONE
,
261 .half_pixel_center
= 1,
262 .bottom_edge_rule
= 1,
266 ctx
->clear_rs_state
= pctx
->create_rasterizer_state(pctx
, &tmpl
);
268 pctx
->bind_rasterizer_state(pctx
, ctx
->clear_rs_state
);
270 struct pipe_viewport_state vp
= {
271 .scale
= { 0.5f
* pfb
->width
, -0.5f
* pfb
->height
, depth
},
272 .translate
= { 0.5f
* pfb
->width
, 0.5f
* pfb
->height
, 0.0f
},
274 pctx
->set_viewport_states(pctx
, 0, 1, &vp
);
276 pctx
->bind_vertex_elements_state(pctx
, ctx
->solid_vbuf_state
.vtx
);
277 pctx
->set_vertex_buffers(pctx
, blitter
->vb_slot
, 1,
278 &ctx
->solid_vbuf_state
.vertexbuf
.vb
[0]);
279 pctx
->set_stream_output_targets(pctx
, 0, NULL
, NULL
);
280 pctx
->bind_vs_state(pctx
, ctx
->solid_prog
.vp
);
281 pctx
->bind_fs_state(pctx
, ctx
->solid_prog
.fp
);
283 struct pipe_draw_info info
= {
284 .mode
= PIPE_PRIM_MAX
, /* maps to DI_PT_RECTLIST */
289 ctx
->draw_vbo(ctx
, &info
);
291 util_blitter_restore_constant_buffer_state(blitter
);
292 util_blitter_restore_vertex_states(blitter
);
293 util_blitter_restore_fragment_states(blitter
);
294 util_blitter_restore_textures(blitter
);
295 util_blitter_restore_fb_state(blitter
);
296 util_blitter_restore_render_cond(blitter
);
297 util_blitter_unset_running_flag(blitter
);
299 fd_blitter_pipe_end(ctx
);
302 /* TODO figure out how to make better use of existing state mechanism
303 * for clear (and possibly gmem->mem / mem->gmem) so we can (a) keep
304 * track of what state really actually changes, and (b) reduce the code
305 * in the a2xx/a3xx parts.
309 fd_clear(struct pipe_context
*pctx
, unsigned buffers
,
310 const union pipe_color_union
*color
, double depth
, unsigned stencil
)
312 struct fd_context
*ctx
= fd_context(pctx
);
313 struct fd_batch
*batch
= ctx
->batch
;
314 struct pipe_framebuffer_state
*pfb
= &batch
->framebuffer
;
315 struct pipe_scissor_state
*scissor
= fd_context_get_scissor(ctx
);
316 unsigned cleared_buffers
;
319 /* TODO: push down the region versions into the tiles */
320 if (!fd_render_condition_check(pctx
))
324 fd_batch_reset(batch
);
325 fd_context_all_dirty(ctx
);
328 /* for bookkeeping about which buffers have been cleared (and thus
329 * can fully or partially skip mem2gmem) we need to ignore buffers
330 * that have already had a draw, in case apps do silly things like
331 * clear after draw (ie. if you only clear the color buffer, but
332 * something like alpha-test causes side effects from the draw in
333 * the depth buffer, etc)
335 cleared_buffers
= buffers
& (FD_BUFFER_ALL
& ~batch
->restore
);
337 /* do we have full-screen scissor? */
338 if (!memcmp(scissor
, &ctx
->disabled_scissor
, sizeof(*scissor
))) {
339 batch
->cleared
|= cleared_buffers
;
341 batch
->partial_cleared
|= cleared_buffers
;
342 if (cleared_buffers
& PIPE_CLEAR_COLOR
)
343 batch
->cleared_scissor
.color
= *scissor
;
344 if (cleared_buffers
& PIPE_CLEAR_DEPTH
)
345 batch
->cleared_scissor
.depth
= *scissor
;
346 if (cleared_buffers
& PIPE_CLEAR_STENCIL
)
347 batch
->cleared_scissor
.stencil
= *scissor
;
349 batch
->resolve
|= buffers
;
350 batch
->needs_flush
= true;
352 mtx_lock(&ctx
->screen
->lock
);
354 if (buffers
& PIPE_CLEAR_COLOR
)
355 for (i
= 0; i
< pfb
->nr_cbufs
; i
++)
356 if (buffers
& (PIPE_CLEAR_COLOR0
<< i
))
357 resource_written(batch
, pfb
->cbufs
[i
]->texture
);
359 if (buffers
& (PIPE_CLEAR_DEPTH
| PIPE_CLEAR_STENCIL
)) {
360 resource_written(batch
, pfb
->zsbuf
->texture
);
361 batch
->gmem_reason
|= FD_GMEM_CLEARS_DEPTH_STENCIL
;
364 resource_written(batch
, batch
->query_buf
);
366 list_for_each_entry(struct fd_acc_query
, aq
, &ctx
->acc_active_queries
, node
)
367 resource_written(batch
, aq
->prsc
);
369 mtx_unlock(&ctx
->screen
->lock
);
371 DBG("%p: %x %ux%u depth=%f, stencil=%u (%s/%s)", batch
, buffers
,
372 pfb
->width
, pfb
->height
, depth
, stencil
,
373 util_format_short_name(pipe_surface_format(pfb
->cbufs
[0])),
374 util_format_short_name(pipe_surface_format(pfb
->zsbuf
)));
376 /* if per-gen backend doesn't implement ctx->clear() generic
380 fd_blitter_clear(pctx
, buffers
, color
, depth
, stencil
);
384 fd_batch_set_stage(batch
, FD_STAGE_CLEAR
);
386 ctx
->clear(ctx
, buffers
, color
, depth
, stencil
);
388 if (fd_mesa_debug
& FD_DBG_DCLEAR
)
389 fd_context_all_dirty(ctx
);
/**
 * Placeholder installed as pctx->clear_render_target by fd_draw_init().
 *
 * Not implemented: it only logs the requested rectangle via DBG() and
 * leaves the surface untouched.  @pctx, @ps, @color and
 * @render_condition_enabled are currently unused.
 */
static void
fd_clear_render_target(struct pipe_context *pctx, struct pipe_surface *ps,
		const union pipe_color_union *color,
		unsigned x, unsigned y, unsigned w, unsigned h,
		bool render_condition_enabled)
{
	DBG("TODO: x=%u, y=%u, w=%u, h=%u", x, y, w, h);
}

/**
 * Placeholder installed as pctx->clear_depth_stencil by fd_draw_init().
 *
 * Not implemented: it only logs the request (buffer mask, clear values and
 * rectangle) via DBG() and leaves the surface untouched.  @pctx, @ps and
 * @render_condition_enabled are currently unused.
 */
static void
fd_clear_depth_stencil(struct pipe_context *pctx, struct pipe_surface *ps,
		unsigned buffers, double depth, unsigned stencil,
		unsigned x, unsigned y, unsigned w, unsigned h,
		bool render_condition_enabled)
{
	DBG("TODO: buffers=%u, depth=%f, stencil=%u, x=%u, y=%u, w=%u, h=%u",
		buffers, depth, stencil, x, y, w, h);
}

412 fd_draw_init(struct pipe_context
*pctx
)
414 pctx
->draw_vbo
= fd_draw_vbo
;
415 pctx
->clear
= fd_clear
;
416 pctx
->clear_render_target
= fd_clear_render_target
;
417 pctx
->clear_depth_stencil
= fd_clear_depth_stencil
;