2 * Copyright 2010 Red Hat Inc.
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE.
24 * Authors: Dave Airlie <airlied@redhat.com>
25 * Jerome Glisse <jglisse@redhat.com>
27 #include "r600_formats.h"
30 #include "util/u_draw_quad.h"
31 #include "util/u_upload_mgr.h"
32 #include "tgsi/tgsi_parse.h"
35 #define R600_PRIM_RECTANGLE_LIST PIPE_PRIM_MAX
/* Atom emit callback for a pre-built command buffer.
 *
 * The atom pointer is cast to struct r600_command_buffer. 4 * cb->atom.num_dw
 * bytes are copied from cb->buf to cs->buf + cs->cdw, and cs->cdw is then
 * advanced by cb->atom.num_dw. The assert checks that the write position
 * stays within RADEON_MAX_CMDBUF_DWORDS.
 */
37 static void r600_emit_command_buffer(struct r600_context
*rctx
, struct r600_atom
*atom
)
39 struct radeon_winsys_cs
*cs
= rctx
->cs
;
40 struct r600_command_buffer
*cb
= (struct r600_command_buffer
*)atom
;
42 assert(cs
->cdw
+ cb
->atom
.num_dw
<= RADEON_MAX_CMDBUF_DWORDS
);
43 memcpy(cs
->buf
+ cs
->cdw
, cb
->buf
, 4 * cb
->atom
.num_dw
);
44 cs
->cdw
+= cb
->atom
.num_dw
;
/* Initializes a command buffer with room for num_dw entries.
 *
 * Registers cb->atom under `id` through r600_init_atom with
 * r600_emit_command_buffer as its emit callback (the trailing 0 is
 * presumably the initial num_dw -- confirm against r600_init_atom), then
 * allocates cb->buf with CALLOC(1, 4 * num_dw) and records num_dw in
 * cb->max_num_dw.
 * NOTE(review): no check of the CALLOC result is visible in this listing.
 */
47 void r600_init_command_buffer(struct r600_context
*rctx
, struct r600_command_buffer
*cb
, unsigned id
, unsigned num_dw
)
49 r600_init_atom(rctx
, &cb
->atom
, id
, r600_emit_command_buffer
, 0);
50 cb
->buf
= CALLOC(1, 4 * num_dw
);
51 cb
->max_num_dw
= num_dw
;
/* NOTE(review): only the signature of this function is visible in this
 * listing; presumably it releases the storage owned by cb -- confirm
 * against the full source. */
54 void r600_release_command_buffer(struct r600_command_buffer
*cb
)
/* Registers a state atom in the context's atom table.
 *
 * Asserts that id is below R600_MAX_ATOM and that rctx->atoms[id] is still
 * NULL, stores the atom in that slot and sets atom->num_dw from num_dw.
 * NOTE(review): the `id` and `num_dw` parameter declarations, and any
 * further field assignments, are not visible in this listing.
 */
59 void r600_init_atom(struct r600_context
*rctx
,
60 struct r600_atom
*atom
,
62 void (*emit
)(struct r600_context
*ctx
, struct r600_atom
*state
),
65 assert(id
< R600_MAX_ATOM
);
66 assert(rctx
->atoms
[id
] == NULL
);
67 rctx
->atoms
[id
] = atom
;
70 atom
->num_dw
= num_dw
;
/* Emits the alpha-test registers for the given atom.
 *
 * The atom is cast to struct r600_alphatest_state. Two context registers
 * are written: SX_ALPHA_TEST_CONTROL gets a->sx_alpha_test_control OR'ed
 * with S_028410_ALPHA_TEST_BYPASS(a->bypass), and SX_ALPHA_REF gets
 * alpha_ref, which starts out as a->sx_alpha_ref.
 */
74 void r600_emit_alphatest_state(struct r600_context
*rctx
, struct r600_atom
*atom
)
76 struct radeon_winsys_cs
*cs
= rctx
->cs
;
77 struct r600_alphatest_state
*a
= (struct r600_alphatest_state
*)atom
;
78 unsigned alpha_ref
= a
->sx_alpha_ref
;
80 if (rctx
->chip_class
>= EVERGREEN
&& a
->cb0_export_16bpc
) {
/* NOTE(review): the body of this Evergreen+/16bpc-export branch is not
 * visible in this listing. */
84 r600_write_context_reg(cs
, R_028410_SX_ALPHA_TEST_CONTROL
,
85 a
->sx_alpha_test_control
|
86 S_028410_ALPHA_TEST_BYPASS(a
->bypass
));
87 r600_write_context_reg(cs
, R_028438_SX_ALPHA_REF
, alpha_ref
);
/* Texture barrier hook: requests cache flushes through rctx->flags.
 *
 * R600_CONTEXT_CB_FLUSH and R600_CONTEXT_TEX_FLUSH are always set; when
 * chip_class is R600, R600_CONTEXT_FLUSH_AND_INV is set as well.
 */
90 static void r600_texture_barrier(struct pipe_context
*ctx
)
92 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
94 rctx
->flags
|= R600_CONTEXT_CB_FLUSH
| R600_CONTEXT_TEX_FLUSH
;
97 if (rctx
->chip_class
== R600
) {
98 rctx
->flags
|= R600_CONTEXT_FLUSH_AND_INV
;
/* Translates a pipe primitive type into a V_008958_DI_PT_* hardware value.
 *
 * pprim indexes the static prim_conv table and the result is stored in
 * *prim. An "unsupported" diagnostic naming pprim is printed to stderr.
 * NOTE(review): some table entries, the condition guarding the diagnostic,
 * and the return statements are not visible in this listing; no bounds
 * check on pprim is visible either.
 */
102 static bool r600_conv_pipe_prim(unsigned pprim
, unsigned *prim
)
104 static const int prim_conv
[] = {
105 V_008958_DI_PT_POINTLIST
,
106 V_008958_DI_PT_LINELIST
,
107 V_008958_DI_PT_LINELOOP
,
108 V_008958_DI_PT_LINESTRIP
,
109 V_008958_DI_PT_TRILIST
,
110 V_008958_DI_PT_TRISTRIP
,
111 V_008958_DI_PT_TRIFAN
,
112 V_008958_DI_PT_QUADLIST
,
113 V_008958_DI_PT_QUADSTRIP
,
114 V_008958_DI_PT_POLYGON
,
119 V_008958_DI_PT_RECTLIST
122 *prim
= prim_conv
[pprim
];
124 fprintf(stderr
, "%s:%d unsupported %d\n", __func__
, __LINE__
, pprim
);
130 /* common state between evergreen and r600 */
/* Makes `blend` the active blend state in the hardware context.
 *
 * blend->rstate is stored in rctx->states[rstate->id] and pushed with
 * r600_context_pipe_state_set. The cached cb_misc_state fields
 * (blend_colormask, cb_color_control on chip_class <= R700, and
 * dual_src_blend) are refreshed when they differ from the blend object,
 * and the cb_misc_state atom is marked dirty.
 * NOTE(review): update_cb is declared here, but the statements that set or
 * test it are not visible in this listing.
 */
132 static void r600_bind_blend_state_internal(struct r600_context
*rctx
,
133 struct r600_pipe_blend
*blend
)
135 struct r600_pipe_state
*rstate
;
136 bool update_cb
= false;
138 rstate
= &blend
->rstate
;
139 rctx
->states
[rstate
->id
] = rstate
;
140 r600_context_pipe_state_set(rctx
, rstate
);
142 if (rctx
->cb_misc_state
.blend_colormask
!= blend
->cb_target_mask
) {
143 rctx
->cb_misc_state
.blend_colormask
= blend
->cb_target_mask
;
146 if (rctx
->chip_class
<= R700
&&
147 rctx
->cb_misc_state
.cb_color_control
!= blend
->cb_color_control
) {
148 rctx
->cb_misc_state
.cb_color_control
= blend
->cb_color_control
;
151 if (rctx
->cb_misc_state
.dual_src_blend
!= blend
->dual_src_blend
) {
152 rctx
->cb_misc_state
.dual_src_blend
= blend
->dual_src_blend
;
156 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
/* Blend-state bind hook.
 *
 * Caches blend->alpha_to_one and blend->dual_src_blend in the context and,
 * unless rctx->blend_override is set, forwards the blend object to
 * r600_bind_blend_state_internal.
 * NOTE(review): handling of a NULL state is not visible in this listing.
 */
160 static void r600_bind_blend_state(struct pipe_context
*ctx
, void *state
)
162 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
163 struct r600_pipe_blend
*blend
= (struct r600_pipe_blend
*)state
;
169 rctx
->alpha_to_one
= blend
->alpha_to_one
;
170 rctx
->dual_src_blend
= blend
->dual_src_blend
;
172 if (!rctx
->blend_override
)
173 r600_bind_blend_state_internal(rctx
, blend
);
/* Sets the constant blend color.
 *
 * Allocates a fresh r600_pipe_state with id R600_PIPE_STATE_BLEND_COLOR and
 * adds the four CB_BLEND_{RED,GREEN,BLUE,ALPHA} registers, each holding
 * fui(state->color[i]). The state previously stored in
 * rctx->states[R600_PIPE_STATE_BLEND_COLOR] is freed, the new one takes its
 * place and is pushed with r600_context_pipe_state_set.
 * NOTE(review): a check of the CALLOC_STRUCT result is not visible in this
 * listing.
 */
176 static void r600_set_blend_color(struct pipe_context
*ctx
,
177 const struct pipe_blend_color
*state
)
179 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
180 struct r600_pipe_state
*rstate
= CALLOC_STRUCT(r600_pipe_state
);
185 rstate
->id
= R600_PIPE_STATE_BLEND_COLOR
;
186 r600_pipe_state_add_reg(rstate
, R_028414_CB_BLEND_RED
, fui(state
->color
[0]));
187 r600_pipe_state_add_reg(rstate
, R_028418_CB_BLEND_GREEN
, fui(state
->color
[1]));
188 r600_pipe_state_add_reg(rstate
, R_02841C_CB_BLEND_BLUE
, fui(state
->color
[2]));
189 r600_pipe_state_add_reg(rstate
, R_028420_CB_BLEND_ALPHA
, fui(state
->color
[3]));
191 free(rctx
->states
[R600_PIPE_STATE_BLEND_COLOR
]);
192 rctx
->states
[R600_PIPE_STATE_BLEND_COLOR
] = rstate
;
193 r600_context_pipe_state_set(rctx
, rstate
);
/* Builds and installs the stencil reference/mask register state.
 *
 * A new r600_pipe_state with id R600_PIPE_STATE_STENCIL_REF is allocated.
 * DB_STENCILREFMASK is composed from element [0] of ref_value, valuemask
 * and writemask; DB_STENCILREFMASK_BF from element [1]. The previous state
 * in rctx->states[R600_PIPE_STATE_STENCIL_REF] is freed, replaced, and the
 * new state is pushed with r600_context_pipe_state_set.
 * NOTE(review): a check of the CALLOC_STRUCT result is not visible in this
 * listing.
 */
196 static void r600_set_stencil_ref(struct pipe_context
*ctx
,
197 const struct r600_stencil_ref
*state
)
199 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
200 struct r600_pipe_state
*rstate
= CALLOC_STRUCT(r600_pipe_state
);
205 rstate
->id
= R600_PIPE_STATE_STENCIL_REF
;
206 r600_pipe_state_add_reg(rstate
,
207 R_028430_DB_STENCILREFMASK
,
208 S_028430_STENCILREF(state
->ref_value
[0]) |
209 S_028430_STENCILMASK(state
->valuemask
[0]) |
210 S_028430_STENCILWRITEMASK(state
->writemask
[0]));
211 r600_pipe_state_add_reg(rstate
,
212 R_028434_DB_STENCILREFMASK_BF
,
213 S_028434_STENCILREF_BF(state
->ref_value
[1]) |
214 S_028434_STENCILMASK_BF(state
->valuemask
[1]) |
215 S_028434_STENCILWRITEMASK_BF(state
->writemask
[1]));
217 free(rctx
->states
[R600_PIPE_STATE_STENCIL_REF
]);
218 rctx
->states
[R600_PIPE_STATE_STENCIL_REF
] = rstate
;
219 r600_context_pipe_state_set(rctx
, rstate
);
/* Stencil-reference hook taking the generic pipe_stencil_ref.
 *
 * Saves *state in rctx->stencil_ref, then builds an r600_stencil_ref whose
 * ref_value entries come from `state` and whose valuemask/writemask entries
 * come from the DSA state stored in rctx->states[R600_PIPE_STATE_DSA], and
 * passes it to r600_set_stencil_ref.
 * NOTE(review): dsa is dereferenced below; a NULL check for the case where
 * no DSA state is bound is not visible in this listing -- confirm.
 */
222 static void r600_set_pipe_stencil_ref(struct pipe_context
*ctx
,
223 const struct pipe_stencil_ref
*state
)
225 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
226 struct r600_pipe_dsa
*dsa
= (struct r600_pipe_dsa
*)rctx
->states
[R600_PIPE_STATE_DSA
];
227 struct r600_stencil_ref ref
;
229 rctx
->stencil_ref
= *state
;
234 ref
.ref_value
[0] = state
->ref_value
[0];
235 ref
.ref_value
[1] = state
->ref_value
[1];
236 ref
.valuemask
[0] = dsa
->valuemask
[0];
237 ref
.valuemask
[1] = dsa
->valuemask
[1];
238 ref
.writemask
[0] = dsa
->writemask
[0];
239 ref
.writemask
[1] = dsa
->writemask
[1];
241 r600_set_stencil_ref(ctx
, &ref
);
/* Depth/stencil/alpha state bind hook.
 *
 * Installs dsa->rstate in rctx->states[] and pushes it with
 * r600_context_pipe_state_set. The stencil reference state is then rebuilt
 * from the cached rctx->stencil_ref values combined with this DSA's
 * valuemask/writemask and handed to r600_set_stencil_ref. Finally the
 * alphatest atom is refreshed and marked dirty when sx_alpha_test_control
 * or the alpha reference differs from the cached values.
 * NOTE(review): handling of a NULL state is not visible in this listing.
 */
244 static void r600_bind_dsa_state(struct pipe_context
*ctx
, void *state
)
246 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
247 struct r600_pipe_dsa
*dsa
= state
;
248 struct r600_pipe_state
*rstate
;
249 struct r600_stencil_ref ref
;
253 rstate
= &dsa
->rstate
;
254 rctx
->states
[rstate
->id
] = rstate
;
255 r600_context_pipe_state_set(rctx
, rstate
);
257 ref
.ref_value
[0] = rctx
->stencil_ref
.ref_value
[0];
258 ref
.ref_value
[1] = rctx
->stencil_ref
.ref_value
[1];
259 ref
.valuemask
[0] = dsa
->valuemask
[0];
260 ref
.valuemask
[1] = dsa
->valuemask
[1];
261 ref
.writemask
[0] = dsa
->writemask
[0];
262 ref
.writemask
[1] = dsa
->writemask
[1];
264 r600_set_stencil_ref(ctx
, &ref
);
266 /* Update alphatest state. */
267 if (rctx
->alphatest_state
.sx_alpha_test_control
!= dsa
->sx_alpha_test_control
||
268 rctx
->alphatest_state
.sx_alpha_ref
!= dsa
->alpha_ref
) {
269 rctx
->alphatest_state
.sx_alpha_test_control
= dsa
->sx_alpha_test_control
;
270 rctx
->alphatest_state
.sx_alpha_ref
= dsa
->alpha_ref
;
271 r600_atom_dirty(rctx
, &rctx
->alphatest_state
.atom
);
/* Applies a scissor rectangle intended to have no clipping effect by
 * passing a local pipe_scissor_state to r600_set_scissor_state.
 * NOTE(review): the statements that fill in the scissor fields are not
 * visible in this listing. */
275 void r600_set_max_scissor(struct r600_context
*rctx
)
277 /* Set a scissor state such that it doesn't do anything. */
278 struct pipe_scissor_state scissor
;
284 r600_set_scissor_state(rctx
, &scissor
);
/* Rasterizer state bind hook.
 *
 * Copies sprite_coord_enable, two_side, pa_sc_line_stipple,
 * pa_cl_clip_cntl and multisample_enable from the rasterizer object into
 * the context, records it as rctx->rasterizer, installs rs->rstate in
 * rctx->states[] and pushes it with r600_context_pipe_state_set.
 * The polygon offset is refreshed through evergreen_polygon_offset_update
 * on chip_class >= EVERGREEN; r600_polygon_offset_update is presumably the
 * else branch (the `else` itself is not visible in this listing).
 * On R600 a change of scissor_enable re-applies either the saved
 * rctx->scissor_state or the maximum scissor.
 * NOTE(review): handling of a NULL state is not visible in this listing.
 */
287 static void r600_bind_rs_state(struct pipe_context
*ctx
, void *state
)
289 struct r600_pipe_rasterizer
*rs
= (struct r600_pipe_rasterizer
*)state
;
290 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
295 rctx
->sprite_coord_enable
= rs
->sprite_coord_enable
;
296 rctx
->two_side
= rs
->two_side
;
297 rctx
->pa_sc_line_stipple
= rs
->pa_sc_line_stipple
;
298 rctx
->pa_cl_clip_cntl
= rs
->pa_cl_clip_cntl
;
299 rctx
->multisample_enable
= rs
->multisample_enable
;
301 rctx
->rasterizer
= rs
;
303 rctx
->states
[rs
->rstate
.id
] = &rs
->rstate
;
304 r600_context_pipe_state_set(rctx
, &rs
->rstate
);
306 if (rctx
->chip_class
>= EVERGREEN
) {
307 evergreen_polygon_offset_update(rctx
);
309 r600_polygon_offset_update(rctx
);
312 /* Workaround for a missing scissor enable on r600. */
313 if (rctx
->chip_class
== R600
) {
314 if (rs
->scissor_enable
!= rctx
->scissor_enable
) {
315 rctx
->scissor_enable
= rs
->scissor_enable
;
317 if (rs
->scissor_enable
) {
318 r600_set_scissor_state(rctx
, &rctx
->scissor_state
);
320 r600_set_max_scissor(rctx
);
/* Rasterizer state delete hook.
 *
 * Clears rctx->rasterizer when it points at this object and clears the
 * rctx->states[] slot when it still refers to rs->rstate, so the context
 * does not keep pointers to the state being deleted.
 * NOTE(review): the statement that frees the object is not visible in this
 * listing.
 */
326 static void r600_delete_rs_state(struct pipe_context
*ctx
, void *state
)
328 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
329 struct r600_pipe_rasterizer
*rs
= (struct r600_pipe_rasterizer
*)state
;
331 if (rctx
->rasterizer
== rs
) {
332 rctx
->rasterizer
= NULL
;
334 if (rctx
->states
[rs
->rstate
.id
] == &rs
->rstate
) {
335 rctx
->states
[rs
->rstate
.id
] = NULL
;
/* Sampler view destroy hook.
 *
 * Drops the view's texture reference by passing NULL to
 * pipe_resource_reference for state->texture.
 * NOTE(review): `resource` is the driver-specific cast of the view; the
 * statement that uses it (presumably to free the view) is not visible in
 * this listing.
 */
340 static void r600_sampler_view_destroy(struct pipe_context
*ctx
,
341 struct pipe_sampler_view
*state
)
343 struct r600_pipe_sampler_view
*resource
= (struct r600_pipe_sampler_view
*)state
;
345 pipe_resource_reference(&state
->texture
, NULL
);
/* Binds `count` sampler states for one shader stage.
 *
 * dst is rctx->vs_samplers for PIPE_SHADER_VERTEX and rctx->ps_samplers for
 * PIPE_SHADER_FRAGMENT; other values report "bad shader" via debug_error.
 * The state pointers are copied into dst->samplers, n_samplers is set to
 * count, and the sampler atom's num_dw is recomputed from zero: 11 is added
 * for a sampler with border_color_use (which also requests
 * R600_CONTEXT_PS_PARTIAL_FLUSH) and 5 is added as well (presumably for the
 * other samplers -- the `else` is not visible in this listing).
 * seamless_cube_map is taken from the samplers visited.
 * On chip_class <= R700 a change of the seamless cube map setting requests
 * a partial flush and dirties the seamless_cube_map atom. The sampler atom
 * is marked dirty when its num_dw is non-zero.
 * NOTE(review): the `shader` and `start` parameters, the declaration of i,
 * the switch statement, and the handling of NULL samplers are not visible
 * in this listing.
 */
349 static void r600_bind_sampler_states(struct pipe_context
*pipe
,
352 unsigned count
, void **states
)
354 struct r600_context
*rctx
= (struct r600_context
*)pipe
;
355 struct r600_textures_info
*dst
;
356 int seamless_cube_map
= -1;
359 assert(start
== 0); /* XXX fix below */
362 case PIPE_SHADER_VERTEX
:
363 dst
= &rctx
->vs_samplers
;
365 case PIPE_SHADER_FRAGMENT
:
366 dst
= &rctx
->ps_samplers
;
369 debug_error("bad shader in r600_bind_samplers()");
373 memcpy(dst
->samplers
, states
, sizeof(void*) * count
);
374 dst
->n_samplers
= count
;
375 dst
->atom_sampler
.num_dw
= 0;
377 for (i
= 0; i
< count
; i
++) {
378 struct r600_pipe_sampler_state
*sampler
= states
[i
];
380 if (sampler
== NULL
) {
383 if (sampler
->border_color_use
) {
384 dst
->atom_sampler
.num_dw
+= 11;
385 rctx
->flags
|= R600_CONTEXT_PS_PARTIAL_FLUSH
;
387 dst
->atom_sampler
.num_dw
+= 5;
389 seamless_cube_map
= sampler
->seamless_cube_map
;
391 if (rctx
->chip_class
<= R700
&& seamless_cube_map
!= -1 && seamless_cube_map
!= rctx
->seamless_cube_map
.enabled
) {
392 /* change in TA_CNTL_AUX need a pipeline flush */
393 rctx
->flags
|= R600_CONTEXT_PS_PARTIAL_FLUSH
;
394 rctx
->seamless_cube_map
.enabled
= seamless_cube_map
;
395 r600_atom_dirty(rctx
, &rctx
->seamless_cube_map
.atom
);
397 if (dst
->atom_sampler
.num_dw
) {
398 r600_atom_dirty(rctx
, &dst
->atom_sampler
);
/* Vertex-shader wrapper: forwards to r600_bind_sampler_states with
 * PIPE_SHADER_VERTEX and a start slot of 0. */
402 static void r600_bind_vs_sampler_states(struct pipe_context
*ctx
, unsigned count
, void **states
)
404 r600_bind_sampler_states(ctx
, PIPE_SHADER_VERTEX
, 0, count
, states
);
/* Fragment-shader wrapper: forwards to r600_bind_sampler_states with
 * PIPE_SHADER_FRAGMENT and a start slot of 0. */
407 static void r600_bind_ps_sampler_states(struct pipe_context
*ctx
, unsigned count
, void **states
)
409 r600_bind_sampler_states(ctx
, PIPE_SHADER_FRAGMENT
, 0, count
, states
);
/* NOTE(review): only the signature of this sampler-state delete hook is
 * visible in this listing; presumably it frees `state` -- confirm against
 * the full source. */
412 static void r600_delete_sampler_state(struct pipe_context
*ctx
, void *state
)
/* Generic delete hook for objects that are an r600_pipe_state.
 *
 * Clears the rctx->states[] slot when it still points at this state, then
 * walks the rstate->nregs register entries and drops each entry's bo
 * reference with pipe_resource_reference(..., NULL).
 * NOTE(review): the statement that frees rstate itself is not visible in
 * this listing.
 */
417 static void r600_delete_state(struct pipe_context
*ctx
, void *state
)
419 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
420 struct r600_pipe_state
*rstate
= (struct r600_pipe_state
*)state
;
422 if (rctx
->states
[rstate
->id
] == rstate
) {
423 rctx
->states
[rstate
->id
] = NULL
;
425 for (int i
= 0; i
< rstate
->nregs
; i
++) {
426 pipe_resource_reference((struct pipe_resource
**)&rstate
->regs
[i
].bo
, NULL
);
/* Vertex-elements bind hook.
 *
 * Records the object in rctx->vertex_elements, installs v->rstate in
 * rctx->states[] and pushes it with r600_context_pipe_state_set.
 * NOTE(review): v is dereferenced below; any guard against a NULL state is
 * not visible in this listing.
 */
431 static void r600_bind_vertex_elements(struct pipe_context
*ctx
, void *state
)
433 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
434 struct r600_vertex_element
*v
= (struct r600_vertex_element
*)state
;
436 rctx
->vertex_elements
= v
;
438 rctx
->states
[v
->rstate
.id
] = &v
->rstate
;
439 r600_context_pipe_state_set(rctx
, &v
->rstate
);
/* Vertex-elements delete hook.
 *
 * Clears the rctx->states[] slot and rctx->vertex_elements when they still
 * refer to this object, then drops the reference held in v->fetch_shader.
 * NOTE(review): the statement that frees the object is not visible in this
 * listing.
 */
443 static void r600_delete_vertex_elements(struct pipe_context
*ctx
, void *state
)
445 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
446 struct r600_vertex_element
*v
= (struct r600_vertex_element
*)state
;
448 if (rctx
->states
[v
->rstate
.id
] == &v
->rstate
) {
449 rctx
->states
[v
->rstate
.id
] = NULL
;
451 if (rctx
->vertex_elements
== state
)
452 rctx
->vertex_elements
= NULL
;
454 pipe_resource_reference((struct pipe_resource
**)&v
->fetch_shader
, NULL
);
/* Index buffer hook.
 *
 * Two paths are visible: one takes a reference on ib->buffer into
 * rctx->index_buffer.buffer and then copies the whole *ib structure into
 * rctx->index_buffer; the other drops the currently held buffer reference.
 * NOTE(review): the condition selecting between them (presumably whether
 * ib is non-NULL) is not visible in this listing.
 */
458 static void r600_set_index_buffer(struct pipe_context
*ctx
,
459 const struct pipe_index_buffer
*ib
)
461 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
464 pipe_resource_reference(&rctx
->index_buffer
.buffer
, ib
->buffer
);
465 memcpy(&rctx
->index_buffer
, ib
, sizeof(*ib
));
467 pipe_resource_reference(&rctx
->index_buffer
.buffer
, NULL
);
/* Schedules re-emission of the dirty vertex buffers.
 *
 * When dirty_mask is non-zero: requests R600_CONTEXT_VTX_FLUSH if the
 * context has a vertex cache, R600_CONTEXT_TEX_FLUSH otherwise; sizes the
 * atom at 12 dwords (chip_class >= EVERGREEN) or 11 dwords per dirty
 * buffer; and marks the vertex buffer atom dirty.
 */
471 void r600_vertex_buffers_dirty(struct r600_context
*rctx
)
473 if (rctx
->vertex_buffer_state
.dirty_mask
) {
474 rctx
->flags
|= rctx
->has_vertex_cache
? R600_CONTEXT_VTX_FLUSH
: R600_CONTEXT_TEX_FLUSH
;
475 rctx
->vertex_buffer_state
.atom
.num_dw
= (rctx
->chip_class
>= EVERGREEN
? 12 : 11) *
476 util_bitcount(rctx
->vertex_buffer_state
.dirty_mask
);
477 r600_atom_dirty(rctx
, &rctx
->vertex_buffer_state
.atom
);
/* Vertex buffer hook: replaces the first `count` vertex buffer bindings.
 *
 * Buffers that are currently enabled at indices >= count are unreferenced.
 * For each index below count whose input differs (memcmp) from the stored
 * binding: a non-NULL input buffer has its stride, offset and buffer
 * reference copied and its bit added to new_buffer_mask; the NULL path
 * drops the stored reference and adds the bit to disable_mask.
 * enabled_mask and dirty_mask are then updated from those masks and
 * r600_vertex_buffers_dirty is called.
 * NOTE(review): the declaration of i and the `else` separating the two
 * per-buffer paths are not visible in this listing.
 */
481 static void r600_set_vertex_buffers(struct pipe_context
*ctx
, unsigned count
,
482 const struct pipe_vertex_buffer
*input
)
484 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
485 struct r600_vertexbuf_state
*state
= &rctx
->vertex_buffer_state
;
486 struct pipe_vertex_buffer
*vb
= state
->vb
;
488 /* This sets 1-bit for buffers with index >= count. */
489 uint32_t disable_mask
= ~((1ull << count
) - 1);
490 /* These are the new buffers set by this function. */
491 uint32_t new_buffer_mask
= 0;
493 /* Set buffers with index >= count to NULL. */
494 uint32_t remaining_buffers_mask
=
495 rctx
->vertex_buffer_state
.enabled_mask
& disable_mask
;
497 while (remaining_buffers_mask
) {
498 i
= u_bit_scan(&remaining_buffers_mask
);
499 pipe_resource_reference(&vb
[i
].buffer
, NULL
);
502 /* Set vertex buffers. */
503 for (i
= 0; i
< count
; i
++) {
504 if (memcmp(&input
[i
], &vb
[i
], sizeof(struct pipe_vertex_buffer
))) {
505 if (input
[i
].buffer
) {
506 vb
[i
].stride
= input
[i
].stride
;
507 vb
[i
].buffer_offset
= input
[i
].buffer_offset
;
508 pipe_resource_reference(&vb
[i
].buffer
, input
[i
].buffer
);
509 new_buffer_mask
|= 1 << i
;
511 pipe_resource_reference(&vb
[i
].buffer
, NULL
);
512 disable_mask
|= 1 << i
;
517 rctx
->vertex_buffer_state
.enabled_mask
&= ~disable_mask
;
518 rctx
->vertex_buffer_state
.dirty_mask
&= rctx
->vertex_buffer_state
.enabled_mask
;
519 rctx
->vertex_buffer_state
.enabled_mask
|= new_buffer_mask
;
520 rctx
->vertex_buffer_state
.dirty_mask
|= new_buffer_mask
;
522 r600_vertex_buffers_dirty(rctx
);
/* Schedules re-emission of the dirty sampler views in `state`.
 *
 * When dirty_mask is non-zero: requests R600_CONTEXT_TEX_FLUSH, sizes the
 * atom at 14 dwords (chip_class >= EVERGREEN) or 13 dwords per dirty view,
 * and marks the atom dirty.
 */
525 void r600_sampler_views_dirty(struct r600_context
*rctx
,
526 struct r600_samplerview_state
*state
)
528 if (state
->dirty_mask
) {
529 rctx
->flags
|= R600_CONTEXT_TEX_FLUSH
;
530 state
->atom
.num_dw
= (rctx
->chip_class
>= EVERGREEN
? 14 : 13) *
531 util_bitcount(state
->dirty_mask
);
532 r600_atom_dirty(rctx
, &state
->atom
);
/* Replaces the first `count` sampler views of one shader stage.
 *
 * dst is rctx->vs_samplers for PIPE_SHADER_VERTEX and rctx->ps_samplers for
 * PIPE_SHADER_FRAGMENT; other values report "bad shader" via debug_error.
 * Views currently enabled at indices >= count are unreferenced. For each
 * index below count the new view is compared with the stored one; for a
 * view being set, the per-slot bits in compressed_depthtex_mask (depth
 * texture that is not a flushing texture) and compressed_colortex_mask
 * (non-Cayman texture with both cmask_size and fmask_size) are updated, the
 * sampler atom is dirtied on chip_class <= R700 when the array-ness of the
 * texture target differs from dst->is_array_sampler[i], and the view
 * reference is stored. The NULL path drops the stored reference and adds
 * the bit to disable_mask. The enabled/dirty/compressed masks are then
 * recombined and r600_sampler_views_dirty is called.
 * NOTE(review): the declaration of i, the switch statement, the branch
 * structure inside the loop (including what happens for an unchanged view)
 * and the statement that sets bits in new_mask are not visible in this
 * listing.
 */
536 static void r600_set_sampler_views(struct pipe_context
*pipe
, unsigned shader
,
537 unsigned start
, unsigned count
,
538 struct pipe_sampler_view
**views
)
540 struct r600_context
*rctx
= (struct r600_context
*) pipe
;
541 struct r600_textures_info
*dst
;
542 struct r600_pipe_sampler_view
**rviews
= (struct r600_pipe_sampler_view
**)views
;
544 /* This sets 1-bit for textures with index >= count. */
545 uint32_t disable_mask
= ~((1ull << count
) - 1);
546 /* These are the new textures set by this function. */
547 uint32_t new_mask
= 0;
549 /* Set textures with index >= count to NULL. */
550 uint32_t remaining_mask
;
552 assert(start
== 0); /* XXX fix below */
555 case PIPE_SHADER_VERTEX
:
556 dst
= &rctx
->vs_samplers
;
558 case PIPE_SHADER_FRAGMENT
:
559 dst
= &rctx
->ps_samplers
;
562 debug_error("bad shader in r600_set_sampler_views()");
566 remaining_mask
= dst
->views
.enabled_mask
& disable_mask
;
568 while (remaining_mask
) {
569 i
= u_bit_scan(&remaining_mask
);
570 assert(dst
->views
.views
[i
]);
572 pipe_sampler_view_reference((struct pipe_sampler_view
**)&dst
->views
.views
[i
], NULL
);
575 for (i
= 0; i
< count
; i
++) {
576 if (rviews
[i
] == dst
->views
.views
[i
]) {
581 struct r600_texture
*rtex
=
582 (struct r600_texture
*)rviews
[i
]->base
.texture
;
584 if (rtex
->is_depth
&& !rtex
->is_flushing_texture
) {
585 dst
->views
.compressed_depthtex_mask
|= 1 << i
;
587 dst
->views
.compressed_depthtex_mask
&= ~(1 << i
);
590 /* Track compressed colorbuffers for Evergreen (Cayman doesn't need this). */
591 if (rctx
->chip_class
!= CAYMAN
&& rtex
->cmask_size
&& rtex
->fmask_size
) {
592 dst
->views
.compressed_colortex_mask
|= 1 << i
;
594 dst
->views
.compressed_colortex_mask
&= ~(1 << i
);
597 /* Changing from array to non-arrays textures and vice
598 * versa requires updating TEX_ARRAY_OVERRIDE on R6xx-R7xx. */
599 if (rctx
->chip_class
<= R700
&&
600 (rviews
[i
]->base
.texture
->target
== PIPE_TEXTURE_1D_ARRAY
||
601 rviews
[i
]->base
.texture
->target
== PIPE_TEXTURE_2D_ARRAY
) != dst
->is_array_sampler
[i
]) {
602 r600_atom_dirty(rctx
, &dst
->atom_sampler
);
605 pipe_sampler_view_reference((struct pipe_sampler_view
**)&dst
->views
.views
[i
], views
[i
]);
608 pipe_sampler_view_reference((struct pipe_sampler_view
**)&dst
->views
.views
[i
], NULL
);
609 disable_mask
|= 1 << i
;
613 dst
->views
.enabled_mask
&= ~disable_mask
;
614 dst
->views
.dirty_mask
&= dst
->views
.enabled_mask
;
615 dst
->views
.enabled_mask
|= new_mask
;
616 dst
->views
.dirty_mask
|= new_mask
;
617 dst
->views
.compressed_depthtex_mask
&= dst
->views
.enabled_mask
;
618 dst
->views
.compressed_colortex_mask
&= dst
->views
.enabled_mask
;
620 r600_sampler_views_dirty(rctx
, &dst
->views
);
/* Vertex-shader wrapper: forwards to r600_set_sampler_views with
 * PIPE_SHADER_VERTEX and a start slot of 0. */
623 static void r600_set_vs_sampler_views(struct pipe_context
*ctx
, unsigned count
,
624 struct pipe_sampler_view
**views
)
626 r600_set_sampler_views(ctx
, PIPE_SHADER_VERTEX
, 0, count
, views
);
/* Fragment-shader wrapper: forwards to r600_set_sampler_views with
 * PIPE_SHADER_FRAGMENT and a start slot of 0. */
629 static void r600_set_ps_sampler_views(struct pipe_context
*ctx
, unsigned count
,
630 struct pipe_sampler_view
**views
)
632 r600_set_sampler_views(ctx
, PIPE_SHADER_FRAGMENT
, 0, count
, views
);
/* Viewport hook.
 *
 * Saves *state in rctx->viewport and builds a new r600_pipe_state with id
 * R600_PIPE_STATE_VIEWPORT holding the six PA_CL_VPORT_* scale and offset
 * registers, each written as fui() of the matching scale[]/translate[]
 * component. The previous state in rctx->states[R600_PIPE_STATE_VIEWPORT]
 * is freed, replaced, and the new state is pushed with
 * r600_context_pipe_state_set.
 * NOTE(review): a check of the CALLOC_STRUCT result is not visible in this
 * listing.
 */
635 static void r600_set_viewport_state(struct pipe_context
*ctx
,
636 const struct pipe_viewport_state
*state
)
638 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
639 struct r600_pipe_state
*rstate
= CALLOC_STRUCT(r600_pipe_state
);
644 rctx
->viewport
= *state
;
645 rstate
->id
= R600_PIPE_STATE_VIEWPORT
;
646 r600_pipe_state_add_reg(rstate
, R_02843C_PA_CL_VPORT_XSCALE_0
, fui(state
->scale
[0]));
647 r600_pipe_state_add_reg(rstate
, R_028444_PA_CL_VPORT_YSCALE_0
, fui(state
->scale
[1]));
648 r600_pipe_state_add_reg(rstate
, R_02844C_PA_CL_VPORT_ZSCALE_0
, fui(state
->scale
[2]));
649 r600_pipe_state_add_reg(rstate
, R_028440_PA_CL_VPORT_XOFFSET_0
, fui(state
->translate
[0]));
650 r600_pipe_state_add_reg(rstate
, R_028448_PA_CL_VPORT_YOFFSET_0
, fui(state
->translate
[1]));
651 r600_pipe_state_add_reg(rstate
, R_028450_PA_CL_VPORT_ZOFFSET_0
, fui(state
->translate
[2]));
653 free(rctx
->states
[R600_PIPE_STATE_VIEWPORT
]);
654 rctx
->states
[R600_PIPE_STATE_VIEWPORT
] = rstate
;
655 r600_context_pipe_state_set(rctx
, rstate
);
/* Creates a vertex-elements state object.
 *
 * Allocates an r600_vertex_element, copies `count` pipe_vertex_element
 * entries into v->elements and calls
 * r600_vertex_elements_build_fetch_shader, whose result is tested.
 * NOTE(review): the allocation check, any bound on `count`, the error path
 * and the return statements are not visible in this listing.
 */
658 static void *r600_create_vertex_elements(struct pipe_context
*ctx
, unsigned count
,
659 const struct pipe_vertex_element
*elements
)
661 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
662 struct r600_vertex_element
*v
= CALLOC_STRUCT(r600_vertex_element
);
669 memcpy(v
->elements
, elements
, sizeof(struct pipe_vertex_element
) * count
);
671 if (r600_vertex_elements_build_fetch_shader(rctx
, v
)) {
/* For a fragment shader selector the key packs three pieces of context
 * state: rctx->two_side in bit 0; (alpha_to_one && multisample_enable &&
 * !cb0_is_integer) in bit 1; and
 * MIN2(sel->nr_ps_max_color_exports, nr_cbufs + dual_src_blend) shifted
 * left by 2.
 * NOTE(review): the declaration of key, the value used for other shader
 * types and the return statement are not visible in this listing. */
679 /* Compute the key for the hw shader variant */
680 static INLINE
unsigned r600_shader_selector_key(struct pipe_context
* ctx
,
681 struct r600_pipe_shader_selector
* sel
)
683 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
686 if (sel
->type
== PIPE_SHADER_FRAGMENT
) {
687 key
= rctx
->two_side
|
688 ((rctx
->alpha_to_one
&& rctx
->multisample_enable
&& !rctx
->cb0_is_integer
) << 1) |
689 (MIN2(sel
->nr_ps_max_color_exports
, rctx
->nr_cbufs
+ rctx
->dual_src_blend
) << 2);
/* Outline of the visible steps:
 *  - compute the variant key with r600_shader_selector_key and compare it
 *    with sel->current->key;
 *  - when the selector holds more than one variant, walk the next_variant
 *    list starting at sel->current looking for a matching key and unlink
 *    the match from its predecessor;
 *  - when no variant was found, allocate one with CALLOC, point it at the
 *    selector and build it with r600_pipe_shader_create (a failure is
 *    reported through R600_ERR);
 *  - for the first fragment variant, copy nr_ps_max_color_exports from the
 *    built shader and recompute the key;
 *  - put the chosen variant at the head of the list (sel->current);
 *  - on chip_class < EVERGREEN with both ps and vs shaders bound, call
 *    r600_adjust_gprs;
 *  - refresh cb_misc_state.nr_ps_color_outputs from the bound pixel shader
 *    and dirty the cb_misc_state atom when it changed.
 * NOTE(review): the `dirty` parameter, the declarations of key and r, the
 * early-return paths, the error cleanup and the return statements are not
 * visible in this listing. */
696 /* Select the hw shader variant depending on the current state.
697 * (*dirty) is set to 1 if current variant was changed */
698 static int r600_shader_select(struct pipe_context
*ctx
,
699 struct r600_pipe_shader_selector
* sel
,
703 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
704 struct r600_pipe_shader
* shader
= NULL
;
707 key
= r600_shader_selector_key(ctx
, sel
);
709 /* Check if we don't need to change anything.
710 * This path is also used for most shaders that don't need multiple
711 * variants, it will cost just a computation of the key and this
713 if (likely(sel
->current
&& sel
->current
->key
== key
)) {
717 /* lookup if we have other variants in the list */
718 if (sel
->num_shaders
> 1) {
719 struct r600_pipe_shader
*p
= sel
->current
, *c
= p
->next_variant
;
721 while (c
&& c
->key
!= key
) {
727 p
->next_variant
= c
->next_variant
;
732 if (unlikely(!shader
)) {
733 shader
= CALLOC(1, sizeof(struct r600_pipe_shader
));
734 shader
->selector
= sel
;
736 r
= r600_pipe_shader_create(ctx
, shader
);
738 R600_ERR("Failed to build shader variant (type=%u, key=%u) %d\n",
744 /* We don't know the value of nr_ps_max_color_exports until we built
745 * at least one variant, so we may need to recompute the key after
746 * building first variant. */
747 if (sel
->type
== PIPE_SHADER_FRAGMENT
&&
748 sel
->num_shaders
== 0) {
749 sel
->nr_ps_max_color_exports
= shader
->shader
.nr_ps_max_color_exports
;
750 key
= r600_shader_selector_key(ctx
, sel
);
760 shader
->next_variant
= sel
->current
;
761 sel
->current
= shader
;
763 if (rctx
->chip_class
< EVERGREEN
&& rctx
->ps_shader
&& rctx
->vs_shader
) {
764 r600_adjust_gprs(rctx
);
767 if (rctx
->ps_shader
&&
768 rctx
->cb_misc_state
.nr_ps_color_outputs
!= rctx
->ps_shader
->current
->nr_ps_color_outputs
) {
769 rctx
->cb_misc_state
.nr_ps_color_outputs
= rctx
->ps_shader
->current
->nr_ps_color_outputs
;
770 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
/* Creates a shader selector for the given shader type.
 *
 * Allocates an r600_pipe_shader_selector, records pipe_shader_type,
 * duplicates the TGSI tokens with tgsi_dup_tokens, copies the stream output
 * description and builds the initial variant by calling r600_shader_select
 * with a NULL dirty pointer.
 * NOTE(review): the declaration of r, the handling of a failed select and
 * the return statements are not visible in this listing.
 */
775 static void *r600_create_shader_state(struct pipe_context
*ctx
,
776 const struct pipe_shader_state
*state
,
777 unsigned pipe_shader_type
)
779 struct r600_pipe_shader_selector
*sel
= CALLOC_STRUCT(r600_pipe_shader_selector
);
782 sel
->type
= pipe_shader_type
;
783 sel
->tokens
= tgsi_dup_tokens(state
->tokens
);
784 sel
->so
= state
->stream_output
;
786 r
= r600_shader_select(ctx
, sel
, NULL
);
/* Pixel-shader create hook: returns the result of
 * r600_create_shader_state for PIPE_SHADER_FRAGMENT. */
793 static void *r600_create_ps_state(struct pipe_context
*ctx
,
794 const struct pipe_shader_state
*state
)
796 return r600_create_shader_state(ctx
, state
, PIPE_SHADER_FRAGMENT
);
/* Vertex-shader create hook: returns the result of
 * r600_create_shader_state for PIPE_SHADER_VERTEX. */
799 static void *r600_create_vs_state(struct pipe_context
*ctx
,
800 const struct pipe_shader_state
*state
)
802 return r600_create_shader_state(ctx
, state
, PIPE_SHADER_VERTEX
);
/* Pixel-shader bind hook.
 *
 * `state` can be replaced by rctx->dummy_pixel_shader (NOTE(review): the
 * guarding condition, presumably a NULL state, is not visible in this
 * listing). The selector becomes rctx->ps_shader and its current variant's
 * rstate is pushed with r600_context_pipe_state_set. On chip_class <= R700
 * the cached multiwrite flag is refreshed from the variant's fs_write_all
 * (dirtying the cb_misc_state atom on change) and r600_adjust_gprs is
 * called (NOTE(review): its guarding condition, if any, is not visible
 * either). Finally cb_misc_state.nr_ps_color_outputs is refreshed and the
 * atom dirtied when it changed.
 */
805 static void r600_bind_ps_state(struct pipe_context
*ctx
, void *state
)
807 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
810 state
= rctx
->dummy_pixel_shader
;
812 rctx
->ps_shader
= (struct r600_pipe_shader_selector
*)state
;
813 r600_context_pipe_state_set(rctx
, &rctx
->ps_shader
->current
->rstate
);
815 if (rctx
->chip_class
<= R700
) {
816 bool multiwrite
= rctx
->ps_shader
->current
->shader
.fs_write_all
;
818 if (rctx
->cb_misc_state
.multiwrite
!= multiwrite
) {
819 rctx
->cb_misc_state
.multiwrite
= multiwrite
;
820 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
824 r600_adjust_gprs(rctx
);
827 if (rctx
->cb_misc_state
.nr_ps_color_outputs
!= rctx
->ps_shader
->current
->nr_ps_color_outputs
) {
828 rctx
->cb_misc_state
.nr_ps_color_outputs
= rctx
->ps_shader
->current
->nr_ps_color_outputs
;
829 r600_atom_dirty(rctx
, &rctx
->cb_misc_state
.atom
);
/* Vertex-shader bind hook.
 *
 * Stores the selector in rctx->vs_shader and pushes the current variant's
 * rstate with r600_context_pipe_state_set. On chip_class < EVERGREEN with a
 * pixel shader bound, r600_adjust_gprs is called.
 * NOTE(review): any guard against a NULL state between the assignment and
 * the dereference is not visible in this listing.
 */
833 static void r600_bind_vs_state(struct pipe_context
*ctx
, void *state
)
835 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
837 rctx
->vs_shader
= (struct r600_pipe_shader_selector
*)state
;
839 r600_context_pipe_state_set(rctx
, &rctx
->vs_shader
->current
->rstate
);
841 if (rctx
->chip_class
< EVERGREEN
&& rctx
->ps_shader
)
842 r600_adjust_gprs(rctx
);
/* Destroys the shader variants owned by a selector.
 *
 * Starts from sel->current and calls r600_pipe_shader_destroy on variant p.
 * NOTE(review): the loop over the variant list (using c) and the freeing of
 * the variants, tokens and selector are not visible in this listing.
 */
846 static void r600_delete_shader_selector(struct pipe_context
*ctx
,
847 struct r600_pipe_shader_selector
*sel
)
849 struct r600_pipe_shader
*p
= sel
->current
, *c
;
852 r600_pipe_shader_destroy(ctx
, p
);
/* Pixel-shader delete hook: unbinds the selector from rctx->ps_shader when
 * it is the one currently bound, then destroys it with
 * r600_delete_shader_selector. */
862 static void r600_delete_ps_state(struct pipe_context
*ctx
, void *state
)
864 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
865 struct r600_pipe_shader_selector
*sel
= (struct r600_pipe_shader_selector
*)state
;
867 if (rctx
->ps_shader
== sel
) {
868 rctx
->ps_shader
= NULL
;
871 r600_delete_shader_selector(ctx
, sel
);
/* Vertex-shader delete hook: unbinds the selector from rctx->vs_shader when
 * it is the one currently bound, then destroys it with
 * r600_delete_shader_selector. */
874 static void r600_delete_vs_state(struct pipe_context
*ctx
, void *state
)
876 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
877 struct r600_pipe_shader_selector
*sel
= (struct r600_pipe_shader_selector
*)state
;
879 if (rctx
->vs_shader
== sel
) {
880 rctx
->vs_shader
= NULL
;
883 r600_delete_shader_selector(ctx
, sel
);
/* Schedules re-emission of the dirty constant buffers in `state`.
 *
 * When dirty_mask is non-zero: requests R600_CONTEXT_SHADERCONST_FLUSH,
 * sizes the atom at 20 dwords (chip_class >= EVERGREEN) or 19 dwords per
 * dirty buffer, and marks the atom dirty.
 */
886 void r600_constant_buffers_dirty(struct r600_context
*rctx
, struct r600_constbuf_state
*state
)
888 if (state
->dirty_mask
) {
889 rctx
->flags
|= R600_CONTEXT_SHADERCONST_FLUSH
;
890 state
->atom
.num_dw
= rctx
->chip_class
>= EVERGREEN
? util_bitcount(state
->dirty_mask
)*20
891 : util_bitcount(state
->dirty_mask
)*19;
892 r600_atom_dirty(rctx
, &state
->atom
);
/* Constant buffer hook for slot `index` of shader stage `shader`.
 *
 * With a NULL input the slot's enabled and dirty bits are cleared and its
 * buffer reference is dropped. Otherwise buffer_size is copied into the
 * slot. Data supplied through input->user_buffer is uploaded with
 * u_upload_data; when R600_BIG_ENDIAN is set it is first byte-swapped one
 * 32-bit word at a time into a malloc'ed temporary. A hardware buffer is
 * instead referenced together with its buffer_offset. The slot is then
 * marked enabled and dirty and r600_constant_buffers_dirty is called.
 * NOTE(review): the declarations of ptr and tmpPtr, the conditions that
 * choose between the user-buffer and hardware-buffer paths, the early
 * returns and the release of the temporary are not visible in this listing.
 */
896 static void r600_set_constant_buffer(struct pipe_context
*ctx
, uint shader
, uint index
,
897 struct pipe_constant_buffer
*input
)
899 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
900 struct r600_constbuf_state
*state
= &rctx
->constbuf_state
[shader
];
901 struct pipe_constant_buffer
*cb
;
904 /* Note that the state tracker can unbind constant buffers by
907 if (unlikely(!input
)) {
908 state
->enabled_mask
&= ~(1 << index
);
909 state
->dirty_mask
&= ~(1 << index
);
910 pipe_resource_reference(&state
->cb
[index
].buffer
, NULL
);
914 cb
= &state
->cb
[index
];
915 cb
->buffer_size
= input
->buffer_size
;
917 ptr
= input
->user_buffer
;
920 /* Upload the user buffer. */
921 if (R600_BIG_ENDIAN
) {
923 unsigned i
, size
= input
->buffer_size
;
925 if (!(tmpPtr
= malloc(size
))) {
926 R600_ERR("Failed to allocate BE swap buffer.\n");
930 for (i
= 0; i
< size
/ 4; ++i
) {
931 tmpPtr
[i
] = bswap_32(((uint32_t *)ptr
)[i
]);
934 u_upload_data(rctx
->uploader
, 0, size
, tmpPtr
, &cb
->buffer_offset
, &cb
->buffer
);
937 u_upload_data(rctx
->uploader
, 0, input
->buffer_size
, ptr
, &cb
->buffer_offset
, &cb
->buffer
);
940 /* Setup the hw buffer. */
941 cb
->buffer_offset
= input
->buffer_offset
;
942 pipe_resource_reference(&cb
->buffer
, input
->buffer
);
945 state
->enabled_mask
|= 1 << index
;
946 state
->dirty_mask
|= 1 << index
;
947 r600_constant_buffers_dirty(rctx
, state
);
/* Creates a stream-output target for a range of `buffer`.
 *
 * Allocates an r600_so_target, sets its reference count to 1, takes a
 * reference on `buffer` and records buffer_offset and buffer_size. A
 * 4-byte buffer is created for t->filled_size, mapped for writing through
 * the winsys, zero-filled over its full size and unmapped.
 * NOTE(review): the declaration of ptr, the checks of the allocation and
 * mapping results, and the return statement are not visible in this
 * listing.
 */
950 static struct pipe_stream_output_target
*
951 r600_create_so_target(struct pipe_context
*ctx
,
952 struct pipe_resource
*buffer
,
953 unsigned buffer_offset
,
954 unsigned buffer_size
)
956 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
957 struct r600_so_target
*t
;
960 t
= CALLOC_STRUCT(r600_so_target
);
965 t
->b
.reference
.count
= 1;
967 pipe_resource_reference(&t
->b
.buffer
, buffer
);
968 t
->b
.buffer_offset
= buffer_offset
;
969 t
->b
.buffer_size
= buffer_size
;
971 t
->filled_size
= (struct r600_resource
*)
972 pipe_buffer_create(ctx
->screen
, PIPE_BIND_CUSTOM
, PIPE_USAGE_STATIC
, 4);
973 ptr
= rctx
->ws
->buffer_map(t
->filled_size
->cs_buf
, rctx
->cs
, PIPE_TRANSFER_WRITE
);
974 memset(ptr
, 0, t
->filled_size
->buf
->size
);
975 rctx
->ws
->buffer_unmap(t
->filled_size
->cs_buf
);
/* Stream-output target destroy hook: drops the references held on the
 * target's buffer and on its filled_size buffer.
 * NOTE(review): the statement that frees the target itself is not visible
 * in this listing. */
980 static void r600_so_target_destroy(struct pipe_context
*ctx
,
981 struct pipe_stream_output_target
*target
)
983 struct r600_so_target
*t
= (struct r600_so_target
*)target
;
984 pipe_resource_reference(&t
->b
.buffer
, NULL
);
985 pipe_resource_reference((struct pipe_resource
**)&t
->filled_size
, NULL
);
/* Stream-output targets hook.
 *
 * If targets are bound and streamout_start is clear, the running streamout
 * is ended with r600_context_streamout_end. The first num_targets slots of
 * rctx->so_targets then take references on the new targets and the
 * remaining previously used slots are released. num_so_targets,
 * streamout_start (true when num_targets is non-zero) and
 * streamout_append_bitmask are updated.
 * NOTE(review): the declaration of i is not visible in this listing.
 */
989 static void r600_set_so_targets(struct pipe_context
*ctx
,
990 unsigned num_targets
,
991 struct pipe_stream_output_target
**targets
,
992 unsigned append_bitmask
)
994 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
997 /* Stop streamout. */
998 if (rctx
->num_so_targets
&& !rctx
->streamout_start
) {
999 r600_context_streamout_end(rctx
);
1002 /* Set the new targets. */
1003 for (i
= 0; i
< num_targets
; i
++) {
1004 pipe_so_target_reference((struct pipe_stream_output_target
**)&rctx
->so_targets
[i
], targets
[i
]);
1006 for (; i
< rctx
->num_so_targets
; i
++) {
1007 pipe_so_target_reference((struct pipe_stream_output_target
**)&rctx
->so_targets
[i
], NULL
);
1010 rctx
->num_so_targets
= num_targets
;
1011 rctx
->streamout_start
= num_targets
!= 0;
1012 rctx
->streamout_append_bitmask
= append_bitmask
;
/* Sample mask hook.
 *
 * Compares the cached mask with sample_mask truncated to 16 bits, stores
 * the new value and marks the sample_mask atom dirty.
 * NOTE(review): the statement under the equality test (presumably an early
 * return) is not visible in this listing.
 */
1015 static void r600_set_sample_mask(struct pipe_context
*pipe
, unsigned sample_mask
)
1017 struct r600_context
*rctx
= (struct r600_context
*)pipe
;
1019 if (rctx
->sample_mask
.sample_mask
== (uint16_t)sample_mask
)
1022 rctx
->sample_mask
.sample_mask
= sample_mask
;
1023 r600_atom_dirty(rctx
, &rctx
->sample_mask
.atom
);
/* Brings state derived from several bound objects up to date.
 *
 * Visible steps:
 *  - when the blitter is not running, decompress depth and color textures
 *    for the vs/ps sampler views whose compressed masks are non-zero;
 *  - reselect the pixel shader variant with r600_shader_select, collecting
 *    the change flag in ps_dirty;
 *  - when the bound pixel shader's sprite_coord_enable or flatshade setting
 *    disagrees with the context/rasterizer, rebuild the pixel shader state
 *    with evergreen_pipe_shader_ps (chip_class >= EVERGREEN) or
 *    r600_pipe_shader_ps;
 *  - push the current pixel shader rstate;
 *  - compute blend_override (dual source blending requested while the
 *    shader has fewer than 2 color outputs) and, on change, rebind either
 *    rctx->no_blend or rctx->blend;
 *  - update the dual export state with the evergreen or r600 variant.
 * NOTE(review): several `else` keywords and the conditions guarding the
 * rstate push are not visible in this listing.
 */
1026 static void r600_update_derived_state(struct r600_context
*rctx
)
1028 struct pipe_context
* ctx
= (struct pipe_context
*)rctx
;
1029 unsigned ps_dirty
= 0, blend_override
;
1031 if (!rctx
->blitter
->running
) {
1032 /* Decompress textures if needed. */
1033 if (rctx
->vs_samplers
.views
.compressed_depthtex_mask
) {
1034 r600_decompress_depth_textures(rctx
, &rctx
->vs_samplers
.views
);
1036 if (rctx
->ps_samplers
.views
.compressed_depthtex_mask
) {
1037 r600_decompress_depth_textures(rctx
, &rctx
->ps_samplers
.views
);
1039 if (rctx
->vs_samplers
.views
.compressed_colortex_mask
) {
1040 r600_decompress_color_textures(rctx
, &rctx
->vs_samplers
.views
);
1042 if (rctx
->ps_samplers
.views
.compressed_colortex_mask
) {
1043 r600_decompress_color_textures(rctx
, &rctx
->ps_samplers
.views
);
1047 r600_shader_select(ctx
, rctx
->ps_shader
, &ps_dirty
);
1049 if (rctx
->ps_shader
&& ((rctx
->sprite_coord_enable
&&
1050 (rctx
->ps_shader
->current
->sprite_coord_enable
!= rctx
->sprite_coord_enable
)) ||
1051 (rctx
->rasterizer
&& rctx
->rasterizer
->flatshade
!= rctx
->ps_shader
->current
->flatshade
))) {
1053 if (rctx
->chip_class
>= EVERGREEN
)
1054 evergreen_pipe_shader_ps(ctx
, rctx
->ps_shader
->current
);
1056 r600_pipe_shader_ps(ctx
, rctx
->ps_shader
->current
);
1062 r600_context_pipe_state_set(rctx
, &rctx
->ps_shader
->current
->rstate
);
1064 blend_override
= (rctx
->dual_src_blend
&&
1065 rctx
->ps_shader
->current
->nr_ps_color_outputs
< 2);
1067 if (blend_override
!= rctx
->blend_override
) {
1068 rctx
->blend_override
= blend_override
;
1069 r600_bind_blend_state_internal(rctx
,
1070 blend_override
? rctx
->no_blend
: rctx
->blend
);
1073 if (rctx
->chip_class
>= EVERGREEN
) {
1074 evergreen_update_dual_export_state(rctx
);
1076 r600_update_dual_export_state(rctx
);
1080 static unsigned r600_conv_prim_to_gs_out(unsigned mode
)
1082 static const int prim_conv
[] = {
1083 V_028A6C_OUTPRIM_TYPE_POINTLIST
,
1084 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1085 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1086 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1087 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1088 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1089 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1090 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1091 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1092 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1093 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1094 V_028A6C_OUTPRIM_TYPE_LINESTRIP
,
1095 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1096 V_028A6C_OUTPRIM_TYPE_TRISTRIP
,
1097 V_028A6C_OUTPRIM_TYPE_TRISTRIP
1099 assert(mode
< Elements(prim_conv
));
1101 return prim_conv
[mode
];
1104 static void r600_draw_vbo(struct pipe_context
*ctx
, const struct pipe_draw_info
*dinfo
)
1106 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
1107 struct pipe_draw_info info
= *dinfo
;
1108 struct pipe_index_buffer ib
= {};
1109 unsigned prim
, ls_mask
= 0, i
;
1110 struct r600_block
*dirty_block
= NULL
, *next_block
= NULL
;
1111 struct radeon_winsys_cs
*cs
= rctx
->cs
;
1115 if ((!info
.count
&& (info
.indexed
|| !info
.count_from_stream_output
)) ||
1116 !r600_conv_pipe_prim(info
.mode
, &prim
)) {
1121 if (!rctx
->vs_shader
) {
1126 r600_update_derived_state(rctx
);
1129 /* Initialize the index buffer struct. */
1130 pipe_resource_reference(&ib
.buffer
, rctx
->index_buffer
.buffer
);
1131 ib
.user_buffer
= rctx
->index_buffer
.user_buffer
;
1132 ib
.index_size
= rctx
->index_buffer
.index_size
;
1133 ib
.offset
= rctx
->index_buffer
.offset
+ info
.start
* ib
.index_size
;
1135 /* Translate or upload, if needed. */
1136 r600_translate_index_buffer(rctx
, &ib
, info
.count
);
1138 ptr
= (uint8_t*)ib
.user_buffer
;
1139 if (!ib
.buffer
&& ptr
) {
1140 u_upload_data(rctx
->uploader
, 0, info
.count
* ib
.index_size
,
1141 ptr
, &ib
.offset
, &ib
.buffer
);
1144 info
.index_bias
= info
.start
;
1147 if (rctx
->vgt
.id
!= R600_PIPE_STATE_VGT
) {
1148 rctx
->vgt
.id
= R600_PIPE_STATE_VGT
;
1149 rctx
->vgt
.nregs
= 0;
1150 r600_pipe_state_add_reg(&rctx
->vgt
, R_008958_VGT_PRIMITIVE_TYPE
, prim
);
1151 r600_pipe_state_add_reg(&rctx
->vgt
, R_028A6C_VGT_GS_OUT_PRIM_TYPE
, 0);
1152 r600_pipe_state_add_reg(&rctx
->vgt
, R_028408_VGT_INDX_OFFSET
, info
.index_bias
);
1153 r600_pipe_state_add_reg(&rctx
->vgt
, R_02840C_VGT_MULTI_PRIM_IB_RESET_INDX
, info
.restart_index
);
1154 r600_pipe_state_add_reg(&rctx
->vgt
, R_028A94_VGT_MULTI_PRIM_IB_RESET_EN
, info
.primitive_restart
);
1155 r600_pipe_state_add_reg(&rctx
->vgt
, R_03CFF4_SQ_VTX_START_INST_LOC
, info
.start_instance
);
1156 r600_pipe_state_add_reg(&rctx
->vgt
, R_028A0C_PA_SC_LINE_STIPPLE
, 0);
1157 r600_pipe_state_add_reg(&rctx
->vgt
, R_02881C_PA_CL_VS_OUT_CNTL
, 0);
1158 r600_pipe_state_add_reg(&rctx
->vgt
, R_028810_PA_CL_CLIP_CNTL
, 0);
1161 rctx
->vgt
.nregs
= 0;
1162 r600_pipe_state_mod_reg(&rctx
->vgt
, prim
);
1163 r600_pipe_state_mod_reg(&rctx
->vgt
, r600_conv_prim_to_gs_out(info
.mode
));
1164 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.index_bias
);
1165 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.restart_index
);
1166 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.primitive_restart
);
1167 r600_pipe_state_mod_reg(&rctx
->vgt
, info
.start_instance
);
1169 if (prim
== V_008958_DI_PT_LINELIST
)
1171 else if (prim
== V_008958_DI_PT_LINESTRIP
||
1172 prim
== V_008958_DI_PT_LINELOOP
)
1174 r600_pipe_state_mod_reg(&rctx
->vgt
, S_028A0C_AUTO_RESET_CNTL(ls_mask
) | rctx
->pa_sc_line_stipple
);
1175 r600_pipe_state_mod_reg(&rctx
->vgt
,
1176 rctx
->vs_shader
->current
->pa_cl_vs_out_cntl
|
1177 (rctx
->rasterizer
->clip_plane_enable
& rctx
->vs_shader
->current
->shader
.clip_dist_write
));
1178 r600_pipe_state_mod_reg(&rctx
->vgt
,
1179 rctx
->pa_cl_clip_cntl
|
1180 (rctx
->vs_shader
->current
->shader
.clip_dist_write
||
1181 rctx
->vs_shader
->current
->shader
.vs_prohibit_ucps
?
1182 0 : rctx
->rasterizer
->clip_plane_enable
& 0x3F));
1184 r600_context_pipe_state_set(rctx
, &rctx
->vgt
);
1186 /* Enable stream out if needed. */
1187 if (rctx
->streamout_start
) {
1188 r600_context_streamout_begin(rctx
);
1189 rctx
->streamout_start
= FALSE
;
1192 /* Emit states (the function expects that we emit at most 17 dwords here). */
1193 r600_need_cs_space(rctx
, 0, TRUE
);
1194 r600_flush_emit(rctx
);
1196 for (i
= 0; i
< R600_MAX_ATOM
; i
++) {
1197 if (rctx
->atoms
[i
] == NULL
|| !rctx
->atoms
[i
]->dirty
) {
1200 r600_emit_atom(rctx
, rctx
->atoms
[i
]);
1202 LIST_FOR_EACH_ENTRY_SAFE(dirty_block
, next_block
, &rctx
->dirty
,list
) {
1203 r600_context_block_emit_dirty(rctx
, dirty_block
, 0 /* pkt_flags */);
1205 rctx
->pm4_dirty_cdwords
= 0;
1208 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_NUM_INSTANCES
, 0, rctx
->predicate_drawing
);
1209 cs
->buf
[cs
->cdw
++] = info
.instance_count
;
1211 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_INDEX_TYPE
, 0, rctx
->predicate_drawing
);
1212 cs
->buf
[cs
->cdw
++] = ib
.index_size
== 4 ?
1213 (VGT_INDEX_32
| (R600_BIG_ENDIAN
? VGT_DMA_SWAP_32_BIT
: 0)) :
1214 (VGT_INDEX_16
| (R600_BIG_ENDIAN
? VGT_DMA_SWAP_16_BIT
: 0));
1216 va
= r600_resource_va(ctx
->screen
, ib
.buffer
);
1218 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_DRAW_INDEX
, 3, rctx
->predicate_drawing
);
1219 cs
->buf
[cs
->cdw
++] = va
;
1220 cs
->buf
[cs
->cdw
++] = (va
>> 32UL) & 0xFF;
1221 cs
->buf
[cs
->cdw
++] = info
.count
;
1222 cs
->buf
[cs
->cdw
++] = V_0287F0_DI_SRC_SEL_DMA
;
1223 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_NOP
, 0, rctx
->predicate_drawing
);
1224 cs
->buf
[cs
->cdw
++] = r600_context_bo_reloc(rctx
, (struct r600_resource
*)ib
.buffer
, RADEON_USAGE_READ
);
1226 if (info
.count_from_stream_output
) {
1227 struct r600_so_target
*t
= (struct r600_so_target
*)info
.count_from_stream_output
;
1228 uint64_t va
= r600_resource_va(&rctx
->screen
->screen
, (void*)t
->filled_size
);
1230 r600_write_context_reg(cs
, R_028B30_VGT_STRMOUT_DRAW_OPAQUE_VERTEX_STRIDE
, t
->stride_in_dw
);
1232 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_COPY_DW
, 4, 0);
1233 cs
->buf
[cs
->cdw
++] = COPY_DW_SRC_IS_MEM
| COPY_DW_DST_IS_REG
;
1234 cs
->buf
[cs
->cdw
++] = va
& 0xFFFFFFFFUL
; /* src address lo */
1235 cs
->buf
[cs
->cdw
++] = (va
>> 32UL) & 0xFFUL
; /* src address hi */
1236 cs
->buf
[cs
->cdw
++] = R_028B2C_VGT_STRMOUT_DRAW_OPAQUE_BUFFER_FILLED_SIZE
>> 2; /* dst register */
1237 cs
->buf
[cs
->cdw
++] = 0; /* unused */
1239 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_NOP
, 0, 0);
1240 cs
->buf
[cs
->cdw
++] = r600_context_bo_reloc(rctx
, t
->filled_size
, RADEON_USAGE_READ
);
1243 cs
->buf
[cs
->cdw
++] = PKT3(PKT3_DRAW_INDEX_AUTO
, 1, rctx
->predicate_drawing
);
1244 cs
->buf
[cs
->cdw
++] = info
.count
;
1245 cs
->buf
[cs
->cdw
++] = V_0287F0_DI_SRC_SEL_AUTO_INDEX
|
1246 (info
.count_from_stream_output
? S_0287F0_USE_OPAQUE(1) : 0);
1249 /* Set the depth buffer as dirty. */
1250 if (rctx
->framebuffer
.zsbuf
) {
1251 struct pipe_surface
*surf
= rctx
->framebuffer
.zsbuf
;
1252 struct r600_texture
*rtex
= (struct r600_texture
*)surf
->texture
;
1254 rtex
->dirty_level_mask
|= 1 << surf
->u
.tex
.level
;
1256 if (rctx
->compressed_cb_mask
) {
1257 struct pipe_surface
*surf
;
1258 struct r600_texture
*rtex
;
1259 unsigned mask
= rctx
->compressed_cb_mask
;
1262 unsigned i
= u_bit_scan(&mask
);
1263 surf
= rctx
->framebuffer
.cbufs
[i
];
1264 rtex
= (struct r600_texture
*)surf
->texture
;
1266 rtex
->dirty_level_mask
|= 1 << surf
->u
.tex
.level
;
1271 pipe_resource_reference(&ib
.buffer
, NULL
);
1274 void r600_draw_rectangle(struct blitter_context
*blitter
,
1275 unsigned x1
, unsigned y1
, unsigned x2
, unsigned y2
, float depth
,
1276 enum blitter_attrib_type type
, const union pipe_color_union
*attrib
)
1278 struct r600_context
*rctx
= (struct r600_context
*)util_blitter_get_pipe(blitter
);
1279 struct pipe_viewport_state viewport
;
1280 struct pipe_resource
*buf
= NULL
;
1281 unsigned offset
= 0;
1284 if (type
== UTIL_BLITTER_ATTRIB_TEXCOORD
) {
1285 util_blitter_draw_rectangle(blitter
, x1
, y1
, x2
, y2
, depth
, type
, attrib
);
1289 /* Some operations (like color resolve on r6xx) don't work
1290 * with the conventional primitive types.
1291 * One that works is PT_RECTLIST, which we use here. */
1293 /* setup viewport */
1294 viewport
.scale
[0] = 1.0f
;
1295 viewport
.scale
[1] = 1.0f
;
1296 viewport
.scale
[2] = 1.0f
;
1297 viewport
.scale
[3] = 1.0f
;
1298 viewport
.translate
[0] = 0.0f
;
1299 viewport
.translate
[1] = 0.0f
;
1300 viewport
.translate
[2] = 0.0f
;
1301 viewport
.translate
[3] = 0.0f
;
1302 rctx
->context
.set_viewport_state(&rctx
->context
, &viewport
);
1304 /* Upload vertices. The hw rectangle has only 3 vertices,
1305 * I guess the 4th one is derived from the first 3.
1306 * The vertex specification should match u_blitter's vertex element state. */
1307 u_upload_alloc(rctx
->uploader
, 0, sizeof(float) * 24, &offset
, &buf
, (void**)&vb
);
1324 memcpy(vb
+4, attrib
->f
, sizeof(float)*4);
1325 memcpy(vb
+12, attrib
->f
, sizeof(float)*4);
1326 memcpy(vb
+20, attrib
->f
, sizeof(float)*4);
1330 util_draw_vertex_buffer(&rctx
->context
, NULL
, buf
, offset
,
1331 R600_PRIM_RECTANGLE_LIST
, 3, 2);
1332 pipe_resource_reference(&buf
, NULL
);
1335 void _r600_pipe_state_add_reg_bo(struct r600_context
*ctx
,
1336 struct r600_pipe_state
*state
,
1337 uint32_t offset
, uint32_t value
,
1338 uint32_t range_id
, uint32_t block_id
,
1339 struct r600_resource
*bo
,
1340 enum radeon_bo_usage usage
)
1343 struct r600_range
*range
;
1344 struct r600_block
*block
;
1346 if (bo
) assert(usage
);
1348 range
= &ctx
->range
[range_id
];
1349 block
= range
->blocks
[block_id
];
1350 state
->regs
[state
->nregs
].block
= block
;
1351 state
->regs
[state
->nregs
].id
= (offset
- block
->start_offset
) >> 2;
1353 state
->regs
[state
->nregs
].value
= value
;
1354 state
->regs
[state
->nregs
].bo
= bo
;
1355 state
->regs
[state
->nregs
].bo_usage
= usage
;
1358 assert(state
->nregs
< R600_BLOCK_MAX_REG
);
/**
 * Append one register write that has no buffer object attached.
 *
 * Forwards to _r600_pipe_state_add_reg_bo() with a NULL buffer and a usage
 * of 0; all other arguments are passed through unchanged.
 */
void _r600_pipe_state_add_reg(struct r600_context *ctx,
			      struct r600_pipe_state *state,
			      uint32_t offset, uint32_t value,
			      uint32_t range_id, uint32_t block_id)
{
	_r600_pipe_state_add_reg_bo(ctx, state,
				    offset, value,
				    range_id, block_id,
				    NULL /* bo */, 0 /* usage */);
}
1370 uint32_t r600_translate_stencil_op(int s_op
)
1373 case PIPE_STENCIL_OP_KEEP
:
1374 return V_028800_STENCIL_KEEP
;
1375 case PIPE_STENCIL_OP_ZERO
:
1376 return V_028800_STENCIL_ZERO
;
1377 case PIPE_STENCIL_OP_REPLACE
:
1378 return V_028800_STENCIL_REPLACE
;
1379 case PIPE_STENCIL_OP_INCR
:
1380 return V_028800_STENCIL_INCR
;
1381 case PIPE_STENCIL_OP_DECR
:
1382 return V_028800_STENCIL_DECR
;
1383 case PIPE_STENCIL_OP_INCR_WRAP
:
1384 return V_028800_STENCIL_INCR_WRAP
;
1385 case PIPE_STENCIL_OP_DECR_WRAP
:
1386 return V_028800_STENCIL_DECR_WRAP
;
1387 case PIPE_STENCIL_OP_INVERT
:
1388 return V_028800_STENCIL_INVERT
;
1390 R600_ERR("Unknown stencil op %d", s_op
);
1397 uint32_t r600_translate_fill(uint32_t func
)
1400 case PIPE_POLYGON_MODE_FILL
:
1402 case PIPE_POLYGON_MODE_LINE
:
1404 case PIPE_POLYGON_MODE_POINT
:
1412 unsigned r600_tex_wrap(unsigned wrap
)
1416 case PIPE_TEX_WRAP_REPEAT
:
1417 return V_03C000_SQ_TEX_WRAP
;
1418 case PIPE_TEX_WRAP_CLAMP
:
1419 return V_03C000_SQ_TEX_CLAMP_HALF_BORDER
;
1420 case PIPE_TEX_WRAP_CLAMP_TO_EDGE
:
1421 return V_03C000_SQ_TEX_CLAMP_LAST_TEXEL
;
1422 case PIPE_TEX_WRAP_CLAMP_TO_BORDER
:
1423 return V_03C000_SQ_TEX_CLAMP_BORDER
;
1424 case PIPE_TEX_WRAP_MIRROR_REPEAT
:
1425 return V_03C000_SQ_TEX_MIRROR
;
1426 case PIPE_TEX_WRAP_MIRROR_CLAMP
:
1427 return V_03C000_SQ_TEX_MIRROR_ONCE_HALF_BORDER
;
1428 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE
:
1429 return V_03C000_SQ_TEX_MIRROR_ONCE_LAST_TEXEL
;
1430 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER
:
1431 return V_03C000_SQ_TEX_MIRROR_ONCE_BORDER
;
1435 unsigned r600_tex_filter(unsigned filter
)
1439 case PIPE_TEX_FILTER_NEAREST
:
1440 return V_03C000_SQ_TEX_XY_FILTER_POINT
;
1441 case PIPE_TEX_FILTER_LINEAR
:
1442 return V_03C000_SQ_TEX_XY_FILTER_BILINEAR
;
1446 unsigned r600_tex_mipfilter(unsigned filter
)
1449 case PIPE_TEX_MIPFILTER_NEAREST
:
1450 return V_03C000_SQ_TEX_Z_FILTER_POINT
;
1451 case PIPE_TEX_MIPFILTER_LINEAR
:
1452 return V_03C000_SQ_TEX_Z_FILTER_LINEAR
;
1454 case PIPE_TEX_MIPFILTER_NONE
:
1455 return V_03C000_SQ_TEX_Z_FILTER_NONE
;
1459 unsigned r600_tex_compare(unsigned compare
)
1463 case PIPE_FUNC_NEVER
:
1464 return V_03C000_SQ_TEX_DEPTH_COMPARE_NEVER
;
1465 case PIPE_FUNC_LESS
:
1466 return V_03C000_SQ_TEX_DEPTH_COMPARE_LESS
;
1467 case PIPE_FUNC_EQUAL
:
1468 return V_03C000_SQ_TEX_DEPTH_COMPARE_EQUAL
;
1469 case PIPE_FUNC_LEQUAL
:
1470 return V_03C000_SQ_TEX_DEPTH_COMPARE_LESSEQUAL
;
1471 case PIPE_FUNC_GREATER
:
1472 return V_03C000_SQ_TEX_DEPTH_COMPARE_GREATER
;
1473 case PIPE_FUNC_NOTEQUAL
:
1474 return V_03C000_SQ_TEX_DEPTH_COMPARE_NOTEQUAL
;
1475 case PIPE_FUNC_GEQUAL
:
1476 return V_03C000_SQ_TEX_DEPTH_COMPARE_GREATEREQUAL
;
1477 case PIPE_FUNC_ALWAYS
:
1478 return V_03C000_SQ_TEX_DEPTH_COMPARE_ALWAYS
;
1482 /* keep this at the end of this file, please */
1483 void r600_init_common_state_functions(struct r600_context
*rctx
)
1485 rctx
->context
.create_fs_state
= r600_create_ps_state
;
1486 rctx
->context
.create_vs_state
= r600_create_vs_state
;
1487 rctx
->context
.create_vertex_elements_state
= r600_create_vertex_elements
;
1488 rctx
->context
.bind_blend_state
= r600_bind_blend_state
;
1489 rctx
->context
.bind_depth_stencil_alpha_state
= r600_bind_dsa_state
;
1490 rctx
->context
.bind_fragment_sampler_states
= r600_bind_ps_sampler_states
;
1491 rctx
->context
.bind_fs_state
= r600_bind_ps_state
;
1492 rctx
->context
.bind_rasterizer_state
= r600_bind_rs_state
;
1493 rctx
->context
.bind_vertex_elements_state
= r600_bind_vertex_elements
;
1494 rctx
->context
.bind_vertex_sampler_states
= r600_bind_vs_sampler_states
;
1495 rctx
->context
.bind_vs_state
= r600_bind_vs_state
;
1496 rctx
->context
.delete_blend_state
= r600_delete_state
;
1497 rctx
->context
.delete_depth_stencil_alpha_state
= r600_delete_state
;
1498 rctx
->context
.delete_fs_state
= r600_delete_ps_state
;
1499 rctx
->context
.delete_rasterizer_state
= r600_delete_rs_state
;
1500 rctx
->context
.delete_sampler_state
= r600_delete_sampler_state
;
1501 rctx
->context
.delete_vertex_elements_state
= r600_delete_vertex_elements
;
1502 rctx
->context
.delete_vs_state
= r600_delete_vs_state
;
1503 rctx
->context
.set_blend_color
= r600_set_blend_color
;
1504 rctx
->context
.set_constant_buffer
= r600_set_constant_buffer
;
1505 rctx
->context
.set_sample_mask
= r600_set_sample_mask
;
1506 rctx
->context
.set_stencil_ref
= r600_set_pipe_stencil_ref
;
1507 rctx
->context
.set_viewport_state
= r600_set_viewport_state
;
1508 rctx
->context
.set_vertex_buffers
= r600_set_vertex_buffers
;
1509 rctx
->context
.set_index_buffer
= r600_set_index_buffer
;
1510 rctx
->context
.set_fragment_sampler_views
= r600_set_ps_sampler_views
;
1511 rctx
->context
.set_vertex_sampler_views
= r600_set_vs_sampler_views
;
1512 rctx
->context
.sampler_view_destroy
= r600_sampler_view_destroy
;
1513 rctx
->context
.texture_barrier
= r600_texture_barrier
;
1514 rctx
->context
.create_stream_output_target
= r600_create_so_target
;
1515 rctx
->context
.stream_output_target_destroy
= r600_so_target_destroy
;
1516 rctx
->context
.set_stream_output_targets
= r600_set_so_targets
;
1517 rctx
->context
.draw_vbo
= r600_draw_vbo
;