2 * Copyright 2010 Red Hat Inc.
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE.
24 * Authors: Dave Airlie <airlied@redhat.com>
25 * Jerome Glisse <jglisse@redhat.com>
27 #include "r600_formats.h"
30 #include "util/u_draw_quad.h"
31 #include "util/u_upload_mgr.h"
32 #include "tgsi/tgsi_parse.h"
35 #define R600_PRIM_RECTANGLE_LIST PIPE_PRIM_MAX
37 static void r600_emit_command_buffer(struct r600_context
*rctx
, struct r600_atom
*atom
)
39 struct radeon_winsys_cs
*cs
= rctx
->cs
;
40 struct r600_command_buffer
*cb
= (struct r600_command_buffer
*)atom
;
42 assert(cs
->cdw
+ cb
->atom
.num_dw
<= RADEON_MAX_CMDBUF_DWORDS
);
43 memcpy(cs
->buf
+ cs
->cdw
, cb
->buf
, 4 * cb
->atom
.num_dw
);
44 cs
->cdw
+= cb
->atom
.num_dw
;
47 void r600_init_command_buffer(struct r600_context
*rctx
, struct r600_command_buffer
*cb
, unsigned id
, unsigned num_dw
)
49 r600_init_atom(rctx
, &cb
->atom
, id
, r600_emit_command_buffer
, 0);
50 cb
->buf
= CALLOC(1, 4 * num_dw
);
51 cb
->max_num_dw
= num_dw
;
54 void r600_release_command_buffer(struct r600_command_buffer
*cb
)
59 static void r600_emit_surface_sync(struct r600_context
*rctx
, struct r600_atom
*atom
)
61 struct radeon_winsys_cs
*cs
= rctx
->cs
;
62 struct r600_surface_sync_cmd
*a
= (struct r600_surface_sync_cmd
*)atom
;
64 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_SURFACE_SYNC
, 3, 0);
65 cs
->buf
[cs
->cdw
++] = a
->flush_flags
; /* CP_COHER_CNTL */
66 cs
->buf
[cs
->cdw
++] = 0xffffffff; /* CP_COHER_SIZE */
67 cs
->buf
[cs
->cdw
++] = 0; /* CP_COHER_BASE */
68 cs
->buf
[cs
->cdw
++] = 0x0000000A; /* POLL_INTERVAL */
73 static void r600_emit_r6xx_flush_and_inv(struct r600_context
*rctx
, struct r600_atom
*atom
)
75 struct radeon_winsys_cs
*cs
= rctx
->cs
;
76 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_EVENT_WRITE
, 0, 0);
77 cs
->buf
[cs
->cdw
++] = EVENT_TYPE(EVENT_TYPE_CACHE_FLUSH_AND_INV_EVENT
) | EVENT_INDEX(0);
80 void r600_init_atom(struct r600_context
*rctx
,
81 struct r600_atom
*atom
,
83 void (*emit
)(struct r600_context
*ctx
, struct r600_atom
*state
),
86 assert(id
< R600_MAX_ATOM
);
87 assert(rctx
->atoms
[id
] == NULL
);
88 rctx
->atoms
[id
] = atom
;
91 atom
->num_dw
= num_dw
;
95 void r600_emit_alphatest_state(struct r600_context
*rctx
, struct r600_atom
*atom
)
97 struct radeon_winsys_cs
*cs
= rctx
->cs
;
98 struct r600_alphatest_state
*a
= (struct r600_alphatest_state
*)atom
;
99 unsigned alpha_ref
= a
->sx_alpha_ref
;
101 if (rctx
->chip_class
>= EVERGREEN
&& a
->cb0_export_16bpc
) {
102 alpha_ref
&= ~0x1FFF;
105 r600_write_context_reg(cs
, R_028410_SX_ALPHA_TEST_CONTROL
,
106 a
->sx_alpha_test_control
|
107 S_028410_ALPHA_TEST_BYPASS(a
->bypass
));
108 r600_write_context_reg(cs
, R_028438_SX_ALPHA_REF
, alpha_ref
);
111 void r600_init_common_atoms(struct r600_context
*rctx
)
113 r600_init_atom(rctx
, &rctx
->r6xx_flush_and_inv_cmd
, 2, r600_emit_r6xx_flush_and_inv
, 2);
114 r600_init_atom(rctx
, &rctx
->surface_sync_cmd
.atom
, 3, r600_emit_surface_sync
, 5);
117 unsigned r600_get_cb_flush_flags(struct r600_context
*rctx
)
121 if (rctx
->framebuffer
.nr_cbufs
) {
122 flags
|= S_0085F0_CB_ACTION_ENA(1) |
123 (((1 << rctx
->framebuffer
.nr_cbufs
) - 1) << S_0085F0_CB0_DEST_BASE_ENA_SHIFT
);
126 /* Workaround for broken flushing on some R6xx chipsets. */
127 if (rctx
->family
== CHIP_RV670
||
128 rctx
->family
== CHIP_RS780
||
129 rctx
->family
== CHIP_RS880
) {
130 flags
|= S_0085F0_CB1_DEST_BASE_ENA(1) |
131 S_0085F0_DEST_BASE_0_ENA(1);
136 void r600_texture_barrier(struct pipe_context
*ctx
)
138 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
140 rctx
->surface_sync_cmd
.flush_flags
|= S_0085F0_TC_ACTION_ENA(1) | r600_get_cb_flush_flags(rctx
);
141 r600_atom_dirty(rctx
, &rctx
->surface_sync_cmd
.atom
);
144 static bool r600_conv_pipe_prim(unsigned pprim
, unsigned *prim
)
146 static const int prim_conv
[] = {
147 V_008958_DI_PT_POINTLIST
,
148 V_008958_DI_PT_LINELIST
,
149 V_008958_DI_PT_LINELOOP
,
150 V_008958_DI_PT_LINESTRIP
,
151 V_008958_DI_PT_TRILIST
,
152 V_008958_DI_PT_TRISTRIP
,
153 V_008958_DI_PT_TRIFAN
,
154 V_008958_DI_PT_QUADLIST
,
155 V_008958_DI_PT_QUADSTRIP
,
156 V_008958_DI_PT_POLYGON
,
161 V_008958_DI_PT_RECTLIST
164 *prim
= prim_conv
[pprim
];
166 fprintf(stderr
, "%s:%d unsupported %d\n", __func__
, __LINE__
, pprim
);
172 /* common state between evergreen and r600 */
174 static void r600_bind_blend_state_internal(struct r600_context
*rctx
,
175 struct r600_pipe_blend
*blend
)
177 struct r600_pipe_state
*rstate
;
178 bool update_cb
= false;
180 rstate
= &blend
->rstate
;
181 rctx
->states
[rstate
->id
] = rstate
;
182 r600_context_pipe_state_set(rctx
, rstate
);
184 if (rctx
->cb_misc_state
.blend_colormask
!= blend
->cb_target_mask
) {
185 rctx
->cb_misc_state
.blend_colormask
= blend
->cb_target_mask
;
188 if (rctx
->chip_class
<= R700
&&
189 rctx
->cb_misc_state
.cb_color_control
!= blend
->cb_color_control
) {
190 rctx
->cb_misc_state
.cb_color_control
= blend
->cb_color_control
;
193 if (rctx
->cb_misc_state
.dual_src_blend
!= blend
->dual_src_blend
) {
194 rctx
->cb_misc_state
.dual_src_blend
= blend
->dual_src_blend
;
198 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
202 void r600_bind_blend_state(struct pipe_context
*ctx
, void *state
)
204 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
205 struct r600_pipe_blend
*blend
= (struct r600_pipe_blend
*)state
;
211 rctx
->alpha_to_one
= blend
->alpha_to_one
;
212 rctx
->dual_src_blend
= blend
->dual_src_blend
;
214 if (!rctx
->blend_override
)
215 r600_bind_blend_state_internal(rctx
, blend
);
218 void r600_set_blend_color(struct pipe_context
*ctx
,
219 const struct pipe_blend_color
*state
)
221 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
222 struct r600_pipe_state
*rstate
= CALLOC_STRUCT(r600_pipe_state
);
227 rstate
->id
= R600_PIPE_STATE_BLEND_COLOR
;
228 r600_pipe_state_add_reg(rstate
, R_028414_CB_BLEND_RED
, fui(state
->color
[0]));
229 r600_pipe_state_add_reg(rstate
, R_028418_CB_BLEND_GREEN
, fui(state
->color
[1]));
230 r600_pipe_state_add_reg(rstate
, R_02841C_CB_BLEND_BLUE
, fui(state
->color
[2]));
231 r600_pipe_state_add_reg(rstate
, R_028420_CB_BLEND_ALPHA
, fui(state
->color
[3]));
233 free(rctx
->states
[R600_PIPE_STATE_BLEND_COLOR
]);
234 rctx
->states
[R600_PIPE_STATE_BLEND_COLOR
] = rstate
;
235 r600_context_pipe_state_set(rctx
, rstate
);
238 static void r600_set_stencil_ref(struct pipe_context
*ctx
,
239 const struct r600_stencil_ref
*state
)
241 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
242 struct r600_pipe_state
*rstate
= CALLOC_STRUCT(r600_pipe_state
);
247 rstate
->id
= R600_PIPE_STATE_STENCIL_REF
;
248 r600_pipe_state_add_reg(rstate
,
249 R_028430_DB_STENCILREFMASK
,
250 S_028430_STENCILREF(state
->ref_value
[0]) |
251 S_028430_STENCILMASK(state
->valuemask
[0]) |
252 S_028430_STENCILWRITEMASK(state
->writemask
[0]));
253 r600_pipe_state_add_reg(rstate
,
254 R_028434_DB_STENCILREFMASK_BF
,
255 S_028434_STENCILREF_BF(state
->ref_value
[1]) |
256 S_028434_STENCILMASK_BF(state
->valuemask
[1]) |
257 S_028434_STENCILWRITEMASK_BF(state
->writemask
[1]));
259 free(rctx
->states
[R600_PIPE_STATE_STENCIL_REF
]);
260 rctx
->states
[R600_PIPE_STATE_STENCIL_REF
] = rstate
;
261 r600_context_pipe_state_set(rctx
, rstate
);
264 void r600_set_pipe_stencil_ref(struct pipe_context
*ctx
,
265 const struct pipe_stencil_ref
*state
)
267 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
268 struct r600_pipe_dsa
*dsa
= (struct r600_pipe_dsa
*)rctx
->states
[R600_PIPE_STATE_DSA
];
269 struct r600_stencil_ref ref
;
271 rctx
->stencil_ref
= *state
;
276 ref
.ref_value
[0] = state
->ref_value
[0];
277 ref
.ref_value
[1] = state
->ref_value
[1];
278 ref
.valuemask
[0] = dsa
->valuemask
[0];
279 ref
.valuemask
[1] = dsa
->valuemask
[1];
280 ref
.writemask
[0] = dsa
->writemask
[0];
281 ref
.writemask
[1] = dsa
->writemask
[1];
283 r600_set_stencil_ref(ctx
, &ref
);
286 void r600_bind_dsa_state(struct pipe_context
*ctx
, void *state
)
288 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
289 struct r600_pipe_dsa
*dsa
= state
;
290 struct r600_pipe_state
*rstate
;
291 struct r600_stencil_ref ref
;
295 rstate
= &dsa
->rstate
;
296 rctx
->states
[rstate
->id
] = rstate
;
297 r600_context_pipe_state_set(rctx
, rstate
);
299 ref
.ref_value
[0] = rctx
->stencil_ref
.ref_value
[0];
300 ref
.ref_value
[1] = rctx
->stencil_ref
.ref_value
[1];
301 ref
.valuemask
[0] = dsa
->valuemask
[0];
302 ref
.valuemask
[1] = dsa
->valuemask
[1];
303 ref
.writemask
[0] = dsa
->writemask
[0];
304 ref
.writemask
[1] = dsa
->writemask
[1];
306 r600_set_stencil_ref(ctx
, &ref
);
308 /* Update alphatest state. */
309 if (rctx
->alphatest_state
.sx_alpha_test_control
!= dsa
->sx_alpha_test_control
||
310 rctx
->alphatest_state
.sx_alpha_ref
!= dsa
->alpha_ref
) {
311 rctx
->alphatest_state
.sx_alpha_test_control
= dsa
->sx_alpha_test_control
;
312 rctx
->alphatest_state
.sx_alpha_ref
= dsa
->alpha_ref
;
313 r600_atom_dirty(rctx
, &rctx
->alphatest_state
.atom
);
317 void r600_set_max_scissor(struct r600_context
*rctx
)
319 /* Set a scissor state such that it doesn't do anything. */
320 struct pipe_scissor_state scissor
;
326 r600_set_scissor_state(rctx
, &scissor
);
329 void r600_bind_rs_state(struct pipe_context
*ctx
, void *state
)
331 struct r600_pipe_rasterizer
*rs
= (struct r600_pipe_rasterizer
*)state
;
332 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
337 rctx
->sprite_coord_enable
= rs
->sprite_coord_enable
;
338 rctx
->two_side
= rs
->two_side
;
339 rctx
->pa_sc_line_stipple
= rs
->pa_sc_line_stipple
;
340 rctx
->pa_cl_clip_cntl
= rs
->pa_cl_clip_cntl
;
341 rctx
->multisample_enable
= rs
->multisample_enable
;
343 rctx
->rasterizer
= rs
;
345 rctx
->states
[rs
->rstate
.id
] = &rs
->rstate
;
346 r600_context_pipe_state_set(rctx
, &rs
->rstate
);
348 if (rctx
->chip_class
>= EVERGREEN
) {
349 evergreen_polygon_offset_update(rctx
);
351 r600_polygon_offset_update(rctx
);
354 /* Workaround for a missing scissor enable on r600. */
355 if (rctx
->chip_class
== R600
) {
356 if (rs
->scissor_enable
!= rctx
->scissor_enable
) {
357 rctx
->scissor_enable
= rs
->scissor_enable
;
359 if (rs
->scissor_enable
) {
360 r600_set_scissor_state(rctx
, &rctx
->scissor_state
);
362 r600_set_max_scissor(rctx
);
368 void r600_delete_rs_state(struct pipe_context
*ctx
, void *state
)
370 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
371 struct r600_pipe_rasterizer
*rs
= (struct r600_pipe_rasterizer
*)state
;
373 if (rctx
->rasterizer
== rs
) {
374 rctx
->rasterizer
= NULL
;
376 if (rctx
->states
[rs
->rstate
.id
] == &rs
->rstate
) {
377 rctx
->states
[rs
->rstate
.id
] = NULL
;
382 void r600_sampler_view_destroy(struct pipe_context
*ctx
,
383 struct pipe_sampler_view
*state
)
385 struct r600_pipe_sampler_view
*resource
= (struct r600_pipe_sampler_view
*)state
;
387 pipe_resource_reference(&state
->texture
, NULL
);
391 static void r600_bind_samplers(struct pipe_context
*pipe
,
394 unsigned count
, void **states
)
396 struct r600_context
*rctx
= (struct r600_context
*)pipe
;
397 struct r600_textures_info
*dst
;
398 int seamless_cube_map
= -1;
401 assert(start
== 0); /* XXX fix below */
404 case PIPE_SHADER_VERTEX
:
405 dst
= &rctx
->vs_samplers
;
407 case PIPE_SHADER_FRAGMENT
:
408 dst
= &rctx
->ps_samplers
;
411 debug_error("bad shader in r600_bind_samplers()");
415 memcpy(dst
->samplers
, states
, sizeof(void*) * count
);
416 dst
->n_samplers
= count
;
417 dst
->atom_sampler
.num_dw
= 0;
419 for (i
= 0; i
< count
; i
++) {
420 struct r600_pipe_sampler_state
*sampler
= states
[i
];
422 if (sampler
== NULL
) {
425 if (sampler
->border_color_use
) {
426 dst
->atom_sampler
.num_dw
+= 11;
427 rctx
->flags
|= R600_PARTIAL_FLUSH
;
429 dst
->atom_sampler
.num_dw
+= 5;
431 seamless_cube_map
= sampler
->seamless_cube_map
;
433 if (rctx
->chip_class
<= R700
&& seamless_cube_map
!= -1 && seamless_cube_map
!= rctx
->seamless_cube_map
.enabled
) {
434 /* change in TA_CNTL_AUX need a pipeline flush */
435 rctx
->flags
|= R600_PARTIAL_FLUSH
;
436 rctx
->seamless_cube_map
.enabled
= seamless_cube_map
;
437 r600_atom_dirty(rctx
, &rctx
->seamless_cube_map
.atom
);
439 if (dst
->atom_sampler
.num_dw
) {
440 r600_atom_dirty(rctx
, &dst
->atom_sampler
);
444 void r600_bind_vs_samplers(struct pipe_context
*ctx
, unsigned count
, void **states
)
446 r600_bind_samplers(ctx
, PIPE_SHADER_VERTEX
, 0, count
, states
);
449 void r600_bind_ps_samplers(struct pipe_context
*ctx
, unsigned count
, void **states
)
451 r600_bind_samplers(ctx
, PIPE_SHADER_FRAGMENT
, 0, count
, states
);
454 void r600_delete_sampler(struct pipe_context
*ctx
, void *state
)
459 void r600_delete_state(struct pipe_context
*ctx
, void *state
)
461 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
462 struct r600_pipe_state
*rstate
= (struct r600_pipe_state
*)state
;
464 if (rctx
->states
[rstate
->id
] == rstate
) {
465 rctx
->states
[rstate
->id
] = NULL
;
467 for (int i
= 0; i
< rstate
->nregs
; i
++) {
468 pipe_resource_reference((struct pipe_resource
**)&rstate
->regs
[i
].bo
, NULL
);
473 void r600_bind_vertex_elements(struct pipe_context
*ctx
, void *state
)
475 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
476 struct r600_vertex_element
*v
= (struct r600_vertex_element
*)state
;
478 rctx
->vertex_elements
= v
;
480 r600_inval_shader_cache(rctx
);
482 rctx
->states
[v
->rstate
.id
] = &v
->rstate
;
483 r600_context_pipe_state_set(rctx
, &v
->rstate
);
487 void r600_delete_vertex_element(struct pipe_context
*ctx
, void *state
)
489 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
490 struct r600_vertex_element
*v
= (struct r600_vertex_element
*)state
;
492 if (rctx
->states
[v
->rstate
.id
] == &v
->rstate
) {
493 rctx
->states
[v
->rstate
.id
] = NULL
;
495 if (rctx
->vertex_elements
== state
)
496 rctx
->vertex_elements
= NULL
;
498 pipe_resource_reference((struct pipe_resource
**)&v
->fetch_shader
, NULL
);
502 void r600_set_index_buffer(struct pipe_context
*ctx
,
503 const struct pipe_index_buffer
*ib
)
505 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
508 pipe_resource_reference(&rctx
->index_buffer
.buffer
, ib
->buffer
);
509 memcpy(&rctx
->index_buffer
, ib
, sizeof(*ib
));
511 pipe_resource_reference(&rctx
->index_buffer
.buffer
, NULL
);
515 void r600_vertex_buffers_dirty(struct r600_context
*rctx
)
517 if (rctx
->vertex_buffer_state
.dirty_mask
) {
518 r600_inval_vertex_cache(rctx
);
519 rctx
->vertex_buffer_state
.atom
.num_dw
= (rctx
->chip_class
>= EVERGREEN
? 12 : 11) *
520 util_bitcount(rctx
->vertex_buffer_state
.dirty_mask
);
521 r600_atom_dirty(rctx
, &rctx
->vertex_buffer_state
.atom
);
525 void r600_set_vertex_buffers(struct pipe_context
*ctx
, unsigned count
,
526 const struct pipe_vertex_buffer
*input
)
528 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
529 struct r600_vertexbuf_state
*state
= &rctx
->vertex_buffer_state
;
530 struct pipe_vertex_buffer
*vb
= state
->vb
;
532 /* This sets 1-bit for buffers with index >= count. */
533 uint32_t disable_mask
= ~((1ull << count
) - 1);
534 /* These are the new buffers set by this function. */
535 uint32_t new_buffer_mask
= 0;
537 /* Set buffers with index >= count to NULL. */
538 uint32_t remaining_buffers_mask
=
539 rctx
->vertex_buffer_state
.enabled_mask
& disable_mask
;
541 while (remaining_buffers_mask
) {
542 i
= u_bit_scan(&remaining_buffers_mask
);
543 pipe_resource_reference(&vb
[i
].buffer
, NULL
);
546 /* Set vertex buffers. */
547 for (i
= 0; i
< count
; i
++) {
548 if (memcmp(&input
[i
], &vb
[i
], sizeof(struct pipe_vertex_buffer
))) {
549 if (input
[i
].buffer
) {
550 vb
[i
].stride
= input
[i
].stride
;
551 vb
[i
].buffer_offset
= input
[i
].buffer_offset
;
552 pipe_resource_reference(&vb
[i
].buffer
, input
[i
].buffer
);
553 new_buffer_mask
|= 1 << i
;
555 pipe_resource_reference(&vb
[i
].buffer
, NULL
);
556 disable_mask
|= 1 << i
;
561 rctx
->vertex_buffer_state
.enabled_mask
&= ~disable_mask
;
562 rctx
->vertex_buffer_state
.dirty_mask
&= rctx
->vertex_buffer_state
.enabled_mask
;
563 rctx
->vertex_buffer_state
.enabled_mask
|= new_buffer_mask
;
564 rctx
->vertex_buffer_state
.dirty_mask
|= new_buffer_mask
;
566 r600_vertex_buffers_dirty(rctx
);
569 void r600_sampler_views_dirty(struct r600_context
*rctx
,
570 struct r600_samplerview_state
*state
)
572 if (state
->dirty_mask
) {
573 r600_inval_texture_cache(rctx
);
574 state
->atom
.num_dw
= (rctx
->chip_class
>= EVERGREEN
? 14 : 13) *
575 util_bitcount(state
->dirty_mask
);
576 r600_atom_dirty(rctx
, &state
->atom
);
580 void r600_set_sampler_views(struct pipe_context
*pipe
,
584 struct pipe_sampler_view
**views
)
586 struct r600_context
*rctx
= (struct r600_context
*) pipe
;
587 struct r600_textures_info
*dst
;
588 struct r600_pipe_sampler_view
**rviews
= (struct r600_pipe_sampler_view
**)views
;
590 /* This sets 1-bit for textures with index >= count. */
591 uint32_t disable_mask
= ~((1ull << count
) - 1);
592 /* These are the new textures set by this function. */
593 uint32_t new_mask
= 0;
595 /* Set textures with index >= count to NULL. */
596 uint32_t remaining_mask
;
598 assert(start
== 0); /* XXX fix below */
601 case PIPE_SHADER_VERTEX
:
602 dst
= &rctx
->vs_samplers
;
604 case PIPE_SHADER_FRAGMENT
:
605 dst
= &rctx
->ps_samplers
;
608 debug_error("bad shader in r600_set_sampler_views()");
612 remaining_mask
= dst
->views
.enabled_mask
& disable_mask
;
614 while (remaining_mask
) {
615 i
= u_bit_scan(&remaining_mask
);
616 assert(dst
->views
.views
[i
]);
618 pipe_sampler_view_reference((struct pipe_sampler_view
**)&dst
->views
.views
[i
], NULL
);
621 for (i
= 0; i
< count
; i
++) {
622 if (rviews
[i
] == dst
->views
.views
[i
]) {
627 struct r600_texture
*rtex
=
628 (struct r600_texture
*)rviews
[i
]->base
.texture
;
630 if (rtex
->is_depth
&& !rtex
->is_flushing_texture
) {
631 dst
->views
.compressed_depthtex_mask
|= 1 << i
;
633 dst
->views
.compressed_depthtex_mask
&= ~(1 << i
);
636 /* Track compressed colorbuffers for Evergreen (Cayman doesn't need this). */
637 if (rctx
->chip_class
!= CAYMAN
&& rtex
->cmask_size
&& rtex
->fmask_size
) {
638 dst
->views
.compressed_colortex_mask
|= 1 << i
;
640 dst
->views
.compressed_colortex_mask
&= ~(1 << i
);
643 /* Changing from array to non-arrays textures and vice
644 * versa requires updating TEX_ARRAY_OVERRIDE on R6xx-R7xx. */
645 if (rctx
->chip_class
<= R700
&&
646 (rviews
[i
]->base
.texture
->target
== PIPE_TEXTURE_1D_ARRAY
||
647 rviews
[i
]->base
.texture
->target
== PIPE_TEXTURE_2D_ARRAY
) != dst
->is_array_sampler
[i
]) {
648 r600_atom_dirty(rctx
, &dst
->atom_sampler
);
651 pipe_sampler_view_reference((struct pipe_sampler_view
**)&dst
->views
.views
[i
], views
[i
]);
654 pipe_sampler_view_reference((struct pipe_sampler_view
**)&dst
->views
.views
[i
], NULL
);
655 disable_mask
|= 1 << i
;
659 dst
->views
.enabled_mask
&= ~disable_mask
;
660 dst
->views
.dirty_mask
&= dst
->views
.enabled_mask
;
661 dst
->views
.enabled_mask
|= new_mask
;
662 dst
->views
.dirty_mask
|= new_mask
;
663 dst
->views
.compressed_depthtex_mask
&= dst
->views
.enabled_mask
;
664 dst
->views
.compressed_colortex_mask
&= dst
->views
.enabled_mask
;
666 r600_sampler_views_dirty(rctx
, &dst
->views
);
669 void *r600_create_vertex_elements(struct pipe_context
*ctx
,
671 const struct pipe_vertex_element
*elements
)
673 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
674 struct r600_vertex_element
*v
= CALLOC_STRUCT(r600_vertex_element
);
681 memcpy(v
->elements
, elements
, sizeof(struct pipe_vertex_element
) * count
);
683 if (r600_vertex_elements_build_fetch_shader(rctx
, v
)) {
691 /* Compute the key for the hw shader variant */
692 static INLINE
unsigned r600_shader_selector_key(struct pipe_context
* ctx
,
693 struct r600_pipe_shader_selector
* sel
)
695 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
698 if (sel
->type
== PIPE_SHADER_FRAGMENT
) {
699 key
= rctx
->two_side
|
700 ((rctx
->alpha_to_one
&& rctx
->multisample_enable
&& !rctx
->cb0_is_integer
) << 1) |
701 (MIN2(sel
->nr_ps_max_color_exports
, rctx
->nr_cbufs
+ rctx
->dual_src_blend
) << 2);
708 /* Select the hw shader variant depending on the current state.
709 * (*dirty) is set to 1 if current variant was changed */
710 static int r600_shader_select(struct pipe_context
*ctx
,
711 struct r600_pipe_shader_selector
* sel
,
715 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
716 struct r600_pipe_shader
* shader
= NULL
;
719 key
= r600_shader_selector_key(ctx
, sel
);
721 /* Check if we don't need to change anything.
722 * This path is also used for most shaders that don't need multiple
723 * variants, it will cost just a computation of the key and this
725 if (likely(sel
->current
&& sel
->current
->key
== key
)) {
729 /* lookup if we have other variants in the list */
730 if (sel
->num_shaders
> 1) {
731 struct r600_pipe_shader
*p
= sel
->current
, *c
= p
->next_variant
;
733 while (c
&& c
->key
!= key
) {
739 p
->next_variant
= c
->next_variant
;
744 if (unlikely(!shader
)) {
745 shader
= CALLOC(1, sizeof(struct r600_pipe_shader
));
746 shader
->selector
= sel
;
748 r
= r600_pipe_shader_create(ctx
, shader
);
750 R600_ERR("Failed to build shader variant (type=%u, key=%u) %d\n",
756 /* We don't know the value of nr_ps_max_color_exports until we built
757 * at least one variant, so we may need to recompute the key after
758 * building first variant. */
759 if (sel
->type
== PIPE_SHADER_FRAGMENT
&&
760 sel
->num_shaders
== 0) {
761 sel
->nr_ps_max_color_exports
= shader
->shader
.nr_ps_max_color_exports
;
762 key
= r600_shader_selector_key(ctx
, sel
);
772 shader
->next_variant
= sel
->current
;
773 sel
->current
= shader
;
775 if (rctx
->chip_class
< EVERGREEN
&& rctx
->ps_shader
&& rctx
->vs_shader
) {
776 r600_adjust_gprs(rctx
);
779 if (rctx
->ps_shader
&&
780 rctx
->cb_misc_state
.nr_ps_color_outputs
!= rctx
->ps_shader
->current
->nr_ps_color_outputs
) {
781 rctx
->cb_misc_state
.nr_ps_color_outputs
= rctx
->ps_shader
->current
->nr_ps_color_outputs
;
782 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
787 static void *r600_create_shader_state(struct pipe_context
*ctx
,
788 const struct pipe_shader_state
*state
,
789 unsigned pipe_shader_type
)
791 struct r600_pipe_shader_selector
*sel
= CALLOC_STRUCT(r600_pipe_shader_selector
);
794 sel
->type
= pipe_shader_type
;
795 sel
->tokens
= tgsi_dup_tokens(state
->tokens
);
796 sel
->so
= state
->stream_output
;
798 r
= r600_shader_select(ctx
, sel
, NULL
);
805 void *r600_create_shader_state_ps(struct pipe_context
*ctx
,
806 const struct pipe_shader_state
*state
)
808 return r600_create_shader_state(ctx
, state
, PIPE_SHADER_FRAGMENT
);
811 void *r600_create_shader_state_vs(struct pipe_context
*ctx
,
812 const struct pipe_shader_state
*state
)
814 return r600_create_shader_state(ctx
, state
, PIPE_SHADER_VERTEX
);
817 void r600_bind_ps_shader(struct pipe_context
*ctx
, void *state
)
819 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
822 state
= rctx
->dummy_pixel_shader
;
824 rctx
->ps_shader
= (struct r600_pipe_shader_selector
*)state
;
825 r600_context_pipe_state_set(rctx
, &rctx
->ps_shader
->current
->rstate
);
827 if (rctx
->chip_class
<= R700
) {
828 bool multiwrite
= rctx
->ps_shader
->current
->shader
.fs_write_all
;
830 if (rctx
->cb_misc_state
.multiwrite
!= multiwrite
) {
831 rctx
->cb_misc_state
.multiwrite
= multiwrite
;
832 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
836 r600_adjust_gprs(rctx
);
839 if (rctx
->cb_misc_state
.nr_ps_color_outputs
!= rctx
->ps_shader
->current
->nr_ps_color_outputs
) {
840 rctx
->cb_misc_state
.nr_ps_color_outputs
= rctx
->ps_shader
->current
->nr_ps_color_outputs
;
841 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
845 void r600_bind_vs_shader(struct pipe_context
*ctx
, void *state
)
847 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
849 rctx
->vs_shader
= (struct r600_pipe_shader_selector
*)state
;
851 r600_context_pipe_state_set(rctx
, &rctx
->vs_shader
->current
->rstate
);
853 if (rctx
->chip_class
< EVERGREEN
&& rctx
->ps_shader
)
854 r600_adjust_gprs(rctx
);
858 static void r600_delete_shader_selector(struct pipe_context
*ctx
,
859 struct r600_pipe_shader_selector
*sel
)
861 struct r600_pipe_shader
*p
= sel
->current
, *c
;
864 r600_pipe_shader_destroy(ctx
, p
);
874 void r600_delete_ps_shader(struct pipe_context
*ctx
, void *state
)
876 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
877 struct r600_pipe_shader_selector
*sel
= (struct r600_pipe_shader_selector
*)state
;
879 if (rctx
->ps_shader
== sel
) {
880 rctx
->ps_shader
= NULL
;
883 r600_delete_shader_selector(ctx
, sel
);
886 void r600_delete_vs_shader(struct pipe_context
*ctx
, void *state
)
888 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
889 struct r600_pipe_shader_selector
*sel
= (struct r600_pipe_shader_selector
*)state
;
891 if (rctx
->vs_shader
== sel
) {
892 rctx
->vs_shader
= NULL
;
895 r600_delete_shader_selector(ctx
, sel
);
898 void r600_constant_buffers_dirty(struct r600_context
*rctx
, struct r600_constbuf_state
*state
)
900 if (state
->dirty_mask
) {
901 r600_inval_shader_cache(rctx
);
902 state
->atom
.num_dw
= rctx
->chip_class
>= EVERGREEN
? util_bitcount(state
->dirty_mask
)*20
903 : util_bitcount(state
->dirty_mask
)*19;
904 r600_atom_dirty(rctx
, &state
->atom
);
908 void r600_set_constant_buffer(struct pipe_context
*ctx
, uint shader
, uint index
,
909 struct pipe_constant_buffer
*input
)
911 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
912 struct r600_constbuf_state
*state
;
913 struct pipe_constant_buffer
*cb
;
917 case PIPE_SHADER_VERTEX
:
918 state
= &rctx
->vs_constbuf_state
;
920 case PIPE_SHADER_FRAGMENT
:
921 state
= &rctx
->ps_constbuf_state
;
927 /* Note that the state tracker can unbind constant buffers by
930 if (unlikely(!input
)) {
931 state
->enabled_mask
&= ~(1 << index
);
932 state
->dirty_mask
&= ~(1 << index
);
933 pipe_resource_reference(&state
->cb
[index
].buffer
, NULL
);
937 cb
= &state
->cb
[index
];
938 cb
->buffer_size
= input
->buffer_size
;
940 ptr
= input
->user_buffer
;
943 /* Upload the user buffer. */
944 if (R600_BIG_ENDIAN
) {
946 unsigned i
, size
= input
->buffer_size
;
948 if (!(tmpPtr
= malloc(size
))) {
949 R600_ERR("Failed to allocate BE swap buffer.\n");
953 for (i
= 0; i
< size
/ 4; ++i
) {
954 tmpPtr
[i
] = bswap_32(((uint32_t *)ptr
)[i
]);
957 u_upload_data(rctx
->uploader
, 0, size
, tmpPtr
, &cb
->buffer_offset
, &cb
->buffer
);
960 u_upload_data(rctx
->uploader
, 0, input
->buffer_size
, ptr
, &cb
->buffer_offset
, &cb
->buffer
);
963 /* Setup the hw buffer. */
964 cb
->buffer_offset
= input
->buffer_offset
;
965 pipe_resource_reference(&cb
->buffer
, input
->buffer
);
968 state
->enabled_mask
|= 1 << index
;
969 state
->dirty_mask
|= 1 << index
;
970 r600_constant_buffers_dirty(rctx
, state
);
973 struct pipe_stream_output_target
*
974 r600_create_so_target(struct pipe_context
*ctx
,
975 struct pipe_resource
*buffer
,
976 unsigned buffer_offset
,
977 unsigned buffer_size
)
979 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
980 struct r600_so_target
*t
;
983 t
= CALLOC_STRUCT(r600_so_target
);
988 t
->b
.reference
.count
= 1;
990 pipe_resource_reference(&t
->b
.buffer
, buffer
);
991 t
->b
.buffer_offset
= buffer_offset
;
992 t
->b
.buffer_size
= buffer_size
;
994 t
->filled_size
= (struct r600_resource
*)
995 pipe_buffer_create(ctx
->screen
, PIPE_BIND_CUSTOM
, PIPE_USAGE_STATIC
, 4);
996 ptr
= rctx
->ws
->buffer_map(t
->filled_size
->cs_buf
, rctx
->cs
, PIPE_TRANSFER_WRITE
);
997 memset(ptr
, 0, t
->filled_size
->buf
->size
);
998 rctx
->ws
->buffer_unmap(t
->filled_size
->cs_buf
);
1003 void r600_so_target_destroy(struct pipe_context
*ctx
,
1004 struct pipe_stream_output_target
*target
)
1006 struct r600_so_target
*t
= (struct r600_so_target
*)target
;
1007 pipe_resource_reference(&t
->b
.buffer
, NULL
);
1008 pipe_resource_reference((struct pipe_resource
**)&t
->filled_size
, NULL
);
1012 void r600_set_so_targets(struct pipe_context
*ctx
,
1013 unsigned num_targets
,
1014 struct pipe_stream_output_target
**targets
,
1015 unsigned append_bitmask
)
1017 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
1020 /* Stop streamout. */
1021 if (rctx
->num_so_targets
&& !rctx
->streamout_start
) {
1022 r600_context_streamout_end(rctx
);
1025 /* Set the new targets. */
1026 for (i
= 0; i
< num_targets
; i
++) {
1027 pipe_so_target_reference((struct pipe_stream_output_target
**)&rctx
->so_targets
[i
], targets
[i
]);
1029 for (; i
< rctx
->num_so_targets
; i
++) {
1030 pipe_so_target_reference((struct pipe_stream_output_target
**)&rctx
->so_targets
[i
], NULL
);
1033 rctx
->num_so_targets
= num_targets
;
1034 rctx
->streamout_start
= num_targets
!= 0;
1035 rctx
->streamout_append_bitmask
= append_bitmask
;
1038 void r600_set_sample_mask(struct pipe_context
*pipe
, unsigned sample_mask
)
1040 struct r600_context
*rctx
= (struct r600_context
*)pipe
;
1042 if (rctx
->sample_mask
.sample_mask
== (uint16_t)sample_mask
)
1045 rctx
->sample_mask
.sample_mask
= sample_mask
;
1046 r600_atom_dirty(rctx
, &rctx
->sample_mask
.atom
);
1049 static void r600_update_derived_state(struct r600_context
*rctx
)
1051 struct pipe_context
* ctx
= (struct pipe_context
*)rctx
;
1052 unsigned ps_dirty
= 0, blend_override
;
1054 if (!rctx
->blitter
->running
) {
1055 /* Decompress textures if needed. */
1056 if (rctx
->vs_samplers
.views
.compressed_depthtex_mask
) {
1057 r600_decompress_depth_textures(rctx
, &rctx
->vs_samplers
.views
);
1059 if (rctx
->ps_samplers
.views
.compressed_depthtex_mask
) {
1060 r600_decompress_depth_textures(rctx
, &rctx
->ps_samplers
.views
);
1062 if (rctx
->vs_samplers
.views
.compressed_colortex_mask
) {
1063 r600_decompress_color_textures(rctx
, &rctx
->vs_samplers
.views
);
1065 if (rctx
->ps_samplers
.views
.compressed_colortex_mask
) {
1066 r600_decompress_color_textures(rctx
, &rctx
->ps_samplers
.views
);
1070 r600_shader_select(ctx
, rctx
->ps_shader
, &ps_dirty
);
1072 if (rctx
->ps_shader
&& ((rctx
->sprite_coord_enable
&&
1073 (rctx
->ps_shader
->current
->sprite_coord_enable
!= rctx
->sprite_coord_enable
)) ||
1074 (rctx
->rasterizer
&& rctx
->rasterizer
->flatshade
!= rctx
->ps_shader
->current
->flatshade
))) {
1076 if (rctx
->chip_class
>= EVERGREEN
)
1077 evergreen_pipe_shader_ps(ctx
, rctx
->ps_shader
->current
);
1079 r600_pipe_shader_ps(ctx
, rctx
->ps_shader
->current
);
1085 r600_context_pipe_state_set(rctx
, &rctx
->ps_shader
->current
->rstate
);
1087 blend_override
= (rctx
->dual_src_blend
&&
1088 rctx
->ps_shader
->current
->nr_ps_color_outputs
< 2);
1090 if (blend_override
!= rctx
->blend_override
) {
1091 rctx
->blend_override
= blend_override
;
1092 r600_bind_blend_state_internal(rctx
,
1093 blend_override
? rctx
->no_blend
: rctx
->blend
);
1096 if (rctx
->chip_class
>= EVERGREEN
) {
1097 evergreen_update_dual_export_state(rctx
);
1099 r600_update_dual_export_state(rctx
);
1103 static unsigned r600_conv_prim_to_gs_out(unsigned mode
)
1105 static const int prim_conv
[] = {
1106 V_028A6C_OUTPRIM_TYPE_POINTLIST
,
1107 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1108 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1109 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1110 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1111 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1112 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1113 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1114 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1115 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1116 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1117 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1118 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1119 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1120 V_028A6C_OUTPRIM_TYPE_TRISTRIP
1122 assert(mode
< Elements(prim_conv
));
1124 return prim_conv
[mode
];
1127 void r600_draw_vbo(struct pipe_context
*ctx
, const struct pipe_draw_info
*dinfo
)
1129 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
1130 struct pipe_draw_info info
= *dinfo
;
1131 struct pipe_index_buffer ib
= {};
1132 unsigned prim
, ls_mask
= 0, i
;
1133 struct r600_block
*dirty_block
= NULL
, *next_block
= NULL
;
1134 struct radeon_winsys_cs
*cs
= rctx
->cs
;
1138 if ((!info
.count
&& (info
.indexed
|| !info
.count_from_stream_output
)) ||
1139 !r600_conv_pipe_prim(info
.mode
, &prim
)) {
1144 if (!rctx
->vs_shader
) {
1149 r600_update_derived_state(rctx
);
1151 /* partial flush triggered by border color change */
1152 if (rctx
->flags
& R600_PARTIAL_FLUSH
) {
1153 rctx
->flags
&= ~R600_PARTIAL_FLUSH
;
1154 r600_write_value(cs
, PKT3(PKT3_EVENT_WRITE
, 0, 0));
1155 r600_write_value(cs
, EVENT_TYPE(EVENT_TYPE_PS_PARTIAL_FLUSH
) | EVENT_INDEX(4));
1159 /* Initialize the index buffer struct. */
1160 pipe_resource_reference(&ib
.buffer
, rctx
->index_buffer
.buffer
);
1161 ib
.user_buffer
= rctx
->index_buffer
.user_buffer
;
1162 ib
.index_size
= rctx
->index_buffer
.index_size
;
1163 ib
.offset
= rctx
->index_buffer
.offset
+ info
.start
* ib
.index_size
;
1165 /* Translate or upload, if needed. */
1166 r600_translate_index_buffer(rctx
, &ib
, info
.count
);
1168 ptr
= (uint8_t*)ib
.user_buffer
;
1169 if (!ib
.buffer
&& ptr
) {
1170 u_upload_data(rctx
->uploader
, 0, info
.count
* ib
.index_size
,
1171 ptr
, &ib
.offset
, &ib
.buffer
);
1174 info
.index_bias
= info
.start
;
1177 if (rctx
->vgt
.id
!= R600_PIPE_STATE_VGT
) {
1178 rctx
->vgt
.id
= R600_PIPE_STATE_VGT
;
1179 rctx
->vgt
.nregs
= 0;
1180 r600_pipe_state_add_reg(&rctx
->vgt
, R_008958_VGT_PRIMITIVE_TYPE
, prim
);
1181 r600_pipe_state_add_reg(&rctx
->vgt
, R_028A6C_VGT_GS_OUT_PRIM_TYPE
, 0);
1182 r600_pipe_state_add_reg(&rctx
->vgt
, R_028408_VGT_INDX_OFFSET
, info
.index_bias
);
1183 r600_pipe_state_add_reg(&rctx
->vgt
, R_02840C_VGT_MULTI_PRIM_IB_RESET_INDX
, info
.restart_index
);
1184 r600_pipe_state_add_reg(&rctx
->vgt
, R_028A94_VGT_MULTI_PRIM_IB_RESET_EN
, info
.primitive_restart
);
1185 r600_pipe_state_add_reg(&rctx
->vgt
, R_03CFF4_SQ_VTX_START_INST_LOC
, info
.start_instance
);
1186 r600_pipe_state_add_reg(&rctx
->vgt
, R_028A0C_PA_SC_LINE_STIPPLE
, 0);
1187 r600_pipe_state_add_reg(&rctx
->vgt
, R_02881C_PA_CL_VS_OUT_CNTL
, 0);
1188 r600_pipe_state_add_reg(&rctx
->vgt
, R_028810_PA_CL_CLIP_CNTL
, 0);
1191 rctx
->vgt
.nregs
= 0;
1192 r600_pipe_state_mod_reg(&rctx
->vgt
, prim
);
1193 r600_pipe_state_mod_reg(&rctx
->vgt
, r600_conv_prim_to_gs_out(info
.mode
));
1194 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.index_bias
);
1195 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.restart_index
);
1196 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.primitive_restart
);
1197 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.start_instance
);
1199 if (prim
== V_008958_DI_PT_LINELIST
)
1201 else if (prim
== V_008958_DI_PT_LINESTRIP
||
1202 prim
== V_008958_DI_PT_LINELOOP
)
1204 r600_pipe_state_mod_reg(&rctx
->vgt
, S_028A0C_AUTO_RESET_CNTL(ls_mask
) | rctx
->pa_sc_line_stipple
);
1205 r600_pipe_state_mod_reg(&rctx
->vgt
,
1206 rctx
->vs_shader
->current
->pa_cl_vs_out_cntl
|
1207 (rctx
->rasterizer
->clip_plane_enable
& rctx
->vs_shader
->current
->shader
.clip_dist_write
));
1208 r600_pipe_state_mod_reg(&rctx
->vgt
,
1209 rctx
->pa_cl_clip_cntl
|
1210 (rctx
->vs_shader
->current
->shader
.clip_dist_write
||
1211 rctx
->vs_shader
->current
->shader
.vs_prohibit_ucps
?
1212 0 : rctx
->rasterizer
->clip_plane_enable
& 0x3F));
1214 r600_context_pipe_state_set(rctx
, &rctx
->vgt
);
1216 /* Enable stream out if needed. */
1217 if (rctx
->streamout_start
) {
1218 r600_context_streamout_begin(rctx
);
1219 rctx
->streamout_start
= FALSE
;
1222 /* Emit states (the function expects that we emit at most 17 dwords here). */
1223 r600_need_cs_space(rctx
, 0, TRUE
);
1225 for (i
= 0; i
< R600_MAX_ATOM
; i
++) {
1226 if (rctx
->atoms
[i
] == NULL
|| !rctx
->atoms
[i
]->dirty
) {
1229 r600_emit_atom(rctx
, rctx
->atoms
[i
]);
1231 LIST_FOR_EACH_ENTRY_SAFE(dirty_block
, next_block
, &rctx
->dirty
,list
) {
1232 r600_context_block_emit_dirty(rctx
, dirty_block
, 0 /* pkt_flags */);
1234 rctx
->pm4_dirty_cdwords
= 0;
1237 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_NUM_INSTANCES
, 0, rctx
->predicate_drawing
);
1238 cs
->buf
[cs
->cdw
++] = info
.instance_count
;
1240 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_INDEX_TYPE
, 0, rctx
->predicate_drawing
);
1241 cs
->buf
[cs
->cdw
++] = ib
.index_size
== 4 ?
1242 (VGT_INDEX_32
| (R600_BIG_ENDIAN
? VGT_DMA_SWAP_32_BIT
: 0)) :
1243 (VGT_INDEX_16
| (R600_BIG_ENDIAN
? VGT_DMA_SWAP_16_BIT
: 0));
1245 va
= r600_resource_va(ctx
->screen
, ib
.buffer
);
1247 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_DRAW_INDEX
, 3, rctx
->predicate_drawing
);
1248 cs
->buf
[cs
->cdw
++] = va
;
1249 cs
->buf
[cs
->cdw
++] = (va
>> 32UL) & 0xFF;
1250 cs
->buf
[cs
->cdw
++] = info
.count
;
1251 cs
->buf
[cs
->cdw
++] = V_0287F0_DI_SRC_SEL_DMA
;
1252 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_NOP
, 0, rctx
->predicate_drawing
);
1253 cs
->buf
[cs
->cdw
++] = r600_context_bo_reloc(rctx
, (struct r600_resource
*)ib
.buffer
, RADEON_USAGE_READ
);
1255 if (info
.count_from_stream_output
) {
1256 struct r600_so_target
*t
= (struct r600_so_target
*)info
.count_from_stream_output
;
1257 uint64_t va
= r600_resource_va(&rctx
->screen
->screen
, (void*)t
->filled_size
);
1259 r600_write_context_reg(cs
, R_028B30_VGT_STRMOUT_DRAW_OPAQUE_VERTEX_STRIDE
, t
->stride_in_dw
);
1261 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_COPY_DW
, 4, 0);
1262 cs
->buf
[cs
->cdw
++] = COPY_DW_SRC_IS_MEM
| COPY_DW_DST_IS_REG
;
1263 cs
->buf
[cs
->cdw
++] = va
& 0xFFFFFFFFUL
; /* src address lo */
1264 cs
->buf
[cs
->cdw
++] = (va
>> 32UL) & 0xFFUL
; /* src address hi */
1265 cs
->buf
[cs
->cdw
++] = R_028B2C_VGT_STRMOUT_DRAW_OPAQUE_BUFFER_FILLED_SIZE
>> 2; /* dst register */
1266 cs
->buf
[cs
->cdw
++] = 0; /* unused */
1268 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_NOP
, 0, 0);
1269 cs
->buf
[cs
->cdw
++] = r600_context_bo_reloc(rctx
, t
->filled_size
, RADEON_USAGE_READ
);
1272 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_DRAW_INDEX_AUTO
, 1, rctx
->predicate_drawing
);
1273 cs
->buf
[cs
->cdw
++] = info
.count
;
1274 cs
->buf
[cs
->cdw
++] = V_0287F0_DI_SRC_SEL_AUTO_INDEX
|
1275 (info
.count_from_stream_output
? S_0287F0_USE_OPAQUE(1) : 0);
1278 rctx
->flags
|= R600_CONTEXT_DST_CACHES_DIRTY
| R600_CONTEXT_DRAW_PENDING
;
1280 /* Set the depth buffer as dirty. */
1281 if (rctx
->framebuffer
.zsbuf
) {
1282 struct pipe_surface
*surf
= rctx
->framebuffer
.zsbuf
;
1283 struct r600_texture
*rtex
= (struct r600_texture
*)surf
->texture
;
1285 rtex
->dirty_level_mask
|= 1 << surf
->u
.tex
.level
;
1287 if (rctx
->compressed_cb_mask
) {
1288 struct pipe_surface
*surf
;
1289 struct r600_texture
*rtex
;
1290 unsigned mask
= rctx
->compressed_cb_mask
;
1293 unsigned i
= u_bit_scan(&mask
);
1294 surf
= rctx
->framebuffer
.cbufs
[i
];
1295 rtex
= (struct r600_texture
*)surf
->texture
;
1297 rtex
->dirty_level_mask
|= 1 << surf
->u
.tex
.level
;
1302 pipe_resource_reference(&ib
.buffer
, NULL
);
1305 void r600_draw_rectangle(struct blitter_context
*blitter
,
1306 unsigned x1
, unsigned y1
, unsigned x2
, unsigned y2
, float depth
,
1307 enum blitter_attrib_type type
, const union pipe_color_union
*attrib
)
1309 struct r600_context
*rctx
= (struct r600_context
*)util_blitter_get_pipe(blitter
);
1310 struct pipe_viewport_state viewport
;
1311 struct pipe_resource
*buf
= NULL
;
1312 unsigned offset
= 0;
1315 if (type
== UTIL_BLITTER_ATTRIB_TEXCOORD
) {
1316 util_blitter_draw_rectangle(blitter
, x1
, y1
, x2
, y2
, depth
, type
, attrib
);
1320 /* Some operations (like color resolve on r6xx) don't work
1321 * with the conventional primitive types.
1322 * One that works is PT_RECTLIST, which we use here. */
1324 /* setup viewport */
1325 viewport
.scale
[0] = 1.0f
;
1326 viewport
.scale
[1] = 1.0f
;
1327 viewport
.scale
[2] = 1.0f
;
1328 viewport
.scale
[3] = 1.0f
;
1329 viewport
.translate
[0] = 0.0f
;
1330 viewport
.translate
[1] = 0.0f
;
1331 viewport
.translate
[2] = 0.0f
;
1332 viewport
.translate
[3] = 0.0f
;
1333 rctx
->context
.set_viewport_state(&rctx
->context
, &viewport
);
1335 /* Upload vertices. The hw rectangle has only 3 vertices,
1336 * I guess the 4th one is derived from the first 3.
1337 * The vertex specification should match u_blitter's vertex element state. */
1338 u_upload_alloc(rctx
->uploader
, 0, sizeof(float) * 24, &offset
, &buf
, (void**)&vb
);
1355 memcpy(vb
+4, attrib
->f
, sizeof(float)*4);
1356 memcpy(vb
+12, attrib
->f
, sizeof(float)*4);
1357 memcpy(vb
+20, attrib
->f
, sizeof(float)*4);
1361 util_draw_vertex_buffer(&rctx
->context
, NULL
, buf
, offset
,
1362 R600_PRIM_RECTANGLE_LIST
, 3, 2);
1363 pipe_resource_reference(&buf
, NULL
);
1366 void _r600_pipe_state_add_reg_bo(struct r600_context
*ctx
,
1367 struct r600_pipe_state
*state
,
1368 uint32_t offset
, uint32_t value
,
1369 uint32_t range_id
, uint32_t block_id
,
1370 struct r600_resource
*bo
,
1371 enum radeon_bo_usage usage
)
1374 struct r600_range
*range
;
1375 struct r600_block
*block
;
1377 if (bo
) assert(usage
);
1379 range
= &ctx
->range
[range_id
];
1380 block
= range
->blocks
[block_id
];
1381 state
->regs
[state
->nregs
].block
= block
;
1382 state
->regs
[state
->nregs
].id
= (offset
- block
->start_offset
) >> 2;
1384 state
->regs
[state
->nregs
].value
= value
;
1385 state
->regs
[state
->nregs
].bo
= bo
;
1386 state
->regs
[state
->nregs
].bo_usage
= usage
;
1389 assert(state
->nregs
< R600_BLOCK_MAX_REG
);
1392 void _r600_pipe_state_add_reg(struct r600_context
*ctx
,
1393 struct r600_pipe_state
*state
,
1394 uint32_t offset
, uint32_t value
,
1395 uint32_t range_id
, uint32_t block_id
)
1397 _r600_pipe_state_add_reg_bo(ctx
, state
, offset
, value
,
1398 range_id
, block_id
, NULL
, 0);
1401 uint32_t r600_translate_stencil_op(int s_op
)
1404 case PIPE_STENCIL_OP_KEEP
:
1405 return V_028800_STENCIL_KEEP
;
1406 case PIPE_STENCIL_OP_ZERO
:
1407 return V_028800_STENCIL_ZERO
;
1408 case PIPE_STENCIL_OP_REPLACE
:
1409 return V_028800_STENCIL_REPLACE
;
1410 case PIPE_STENCIL_OP_INCR
:
1411 return V_028800_STENCIL_INCR
;
1412 case PIPE_STENCIL_OP_DECR
:
1413 return V_028800_STENCIL_DECR
;
1414 case PIPE_STENCIL_OP_INCR_WRAP
:
1415 return V_028800_STENCIL_INCR_WRAP
;
1416 case PIPE_STENCIL_OP_DECR_WRAP
:
1417 return V_028800_STENCIL_DECR_WRAP
;
1418 case PIPE_STENCIL_OP_INVERT
:
1419 return V_028800_STENCIL_INVERT
;
1421 R600_ERR("Unknown stencil op %d", s_op
);
1428 uint32_t r600_translate_fill(uint32_t func
)
1431 case PIPE_POLYGON_MODE_FILL
:
1433 case PIPE_POLYGON_MODE_LINE
:
1435 case PIPE_POLYGON_MODE_POINT
:
1443 unsigned r600_tex_wrap(unsigned wrap
)
1447 case PIPE_TEX_WRAP_REPEAT
:
1448 return V_03C000_SQ_TEX_WRAP
;
1449 case PIPE_TEX_WRAP_CLAMP
:
1450 return V_03C000_SQ_TEX_CLAMP_HALF_BORDER
;
1451 case PIPE_TEX_WRAP_CLAMP_TO_EDGE
:
1452 return V_03C000_SQ_TEX_CLAMP_LAST_TEXEL
;
1453 case PIPE_TEX_WRAP_CLAMP_TO_BORDER
:
1454 return V_03C000_SQ_TEX_CLAMP_BORDER
;
1455 case PIPE_TEX_WRAP_MIRROR_REPEAT
:
1456 return V_03C000_SQ_TEX_MIRROR
;
1457 case PIPE_TEX_WRAP_MIRROR_CLAMP
:
1458 return V_03C000_SQ_TEX_MIRROR_ONCE_HALF_BORDER
;
1459 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE
:
1460 return V_03C000_SQ_TEX_MIRROR_ONCE_LAST_TEXEL
;
1461 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER
:
1462 return V_03C000_SQ_TEX_MIRROR_ONCE_BORDER
;
1466 unsigned r600_tex_filter(unsigned filter
)
1470 case PIPE_TEX_FILTER_NEAREST
:
1471 return V_03C000_SQ_TEX_XY_FILTER_POINT
;
1472 case PIPE_TEX_FILTER_LINEAR
:
1473 return V_03C000_SQ_TEX_XY_FILTER_BILINEAR
;
1477 unsigned r600_tex_mipfilter(unsigned filter
)
1480 case PIPE_TEX_MIPFILTER_NEAREST
:
1481 return V_03C000_SQ_TEX_Z_FILTER_POINT
;
1482 case PIPE_TEX_MIPFILTER_LINEAR
:
1483 return V_03C000_SQ_TEX_Z_FILTER_LINEAR
;
1485 case PIPE_TEX_MIPFILTER_NONE
:
1486 return V_03C000_SQ_TEX_Z_FILTER_NONE
;
1490 unsigned r600_tex_compare(unsigned compare
)
1494 case PIPE_FUNC_NEVER
:
1495 return V_03C000_SQ_TEX_DEPTH_COMPARE_NEVER
;
1496 case PIPE_FUNC_LESS
:
1497 return V_03C000_SQ_TEX_DEPTH_COMPARE_LESS
;
1498 case PIPE_FUNC_EQUAL
:
1499 return V_03C000_SQ_TEX_DEPTH_COMPARE_EQUAL
;
1500 case PIPE_FUNC_LEQUAL
:
1501 return V_03C000_SQ_TEX_DEPTH_COMPARE_LESSEQUAL
;
1502 case PIPE_FUNC_GREATER
:
1503 return V_03C000_SQ_TEX_DEPTH_COMPARE_GREATER
;
1504 case PIPE_FUNC_NOTEQUAL
:
1505 return V_03C000_SQ_TEX_DEPTH_COMPARE_NOTEQUAL
;
1506 case PIPE_FUNC_GEQUAL
:
1507 return V_03C000_SQ_TEX_DEPTH_COMPARE_GREATEREQUAL
;
1508 case PIPE_FUNC_ALWAYS
:
1509 return V_03C000_SQ_TEX_DEPTH_COMPARE_ALWAYS
;