/*
 * Copyright (c) 2014-2015 Etnaviv Project
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sub license,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 *
 * Authors:
 *    Wladimir J. van der Laan <laanwj@gmail.com>
 */
27 #include "etnaviv_emit.h"
29 #include "etnaviv_blend.h"
30 #include "etnaviv_compiler.h"
31 #include "etnaviv_context.h"
32 #include "etnaviv_rasterizer.h"
33 #include "etnaviv_resource.h"
34 #include "etnaviv_rs.h"
35 #include "etnaviv_screen.h"
36 #include "etnaviv_shader.h"
37 #include "etnaviv_texture.h"
38 #include "etnaviv_translate.h"
39 #include "etnaviv_uniforms.h"
40 #include "etnaviv_util.h"
41 #include "etnaviv_zsa.h"
42 #include "hw/common.xml.h"
43 #include "hw/state.xml.h"
44 #include "hw/state_blt.xml.h"
45 #include "util/u_math.h"
47 /* Queue a STALL command (queues 2 words) */
49 CMD_STALL(struct etna_cmd_stream
*stream
, uint32_t from
, uint32_t to
)
51 etna_cmd_stream_emit(stream
, VIV_FE_STALL_HEADER_OP_STALL
);
52 etna_cmd_stream_emit(stream
, VIV_FE_STALL_TOKEN_FROM(from
) | VIV_FE_STALL_TOKEN_TO(to
));
56 etna_stall(struct etna_cmd_stream
*stream
, uint32_t from
, uint32_t to
)
58 bool blt
= (from
== SYNC_RECIPIENT_BLT
) || (to
== SYNC_RECIPIENT_BLT
);
59 etna_cmd_stream_reserve(stream
, blt
? 8 : 4);
62 etna_emit_load_state(stream
, VIVS_BLT_ENABLE
>> 2, 1, 0);
63 etna_cmd_stream_emit(stream
, 1);
66 /* TODO: set bit 28/29 of token after BLT COPY_BUFFER */
67 etna_emit_load_state(stream
, VIVS_GL_SEMAPHORE_TOKEN
>> 2, 1, 0);
68 etna_cmd_stream_emit(stream
, VIVS_GL_SEMAPHORE_TOKEN_FROM(from
) | VIVS_GL_SEMAPHORE_TOKEN_TO(to
));
70 if (from
== SYNC_RECIPIENT_FE
) {
71 /* if the frontend is to be stalled, queue a STALL frontend command */
72 CMD_STALL(stream
, from
, to
);
74 /* otherwise, load the STALL token state */
75 etna_emit_load_state(stream
, VIVS_GL_STALL_TOKEN
>> 2, 1, 0);
76 etna_cmd_stream_emit(stream
, VIVS_GL_STALL_TOKEN_FROM(from
) | VIVS_GL_STALL_TOKEN_TO(to
));
80 etna_emit_load_state(stream
, VIVS_BLT_ENABLE
>> 2, 1, 0);
81 etna_cmd_stream_emit(stream
, 0);
/* Shorthand for the coalescing emit helpers.  Each macro prefixes the
 * register name with VIVS_ and expects locals named `stream` and `coalesce`
 * to be in scope where it is used. */
#define EMIT_STATE(state_name, src_value) \
   etna_coalsence_emit(stream, &coalesce, VIVS_##state_name, src_value)

#define EMIT_STATE_FIXP(state_name, src_value) \
   etna_coalsence_emit_fixp(stream, &coalesce, VIVS_##state_name, src_value)

#define EMIT_STATE_RELOC(state_name, src_value) \
   etna_coalsence_emit_reloc(stream, &coalesce, VIVS_##state_name, src_value)

/* Starting value of the stream size estimate in required_stream_size().
 * Keep this number above "Total state updates (fixed)" from the
 * gen_weave_state tool. */
#define ETNA_3D_CONTEXT_SIZE (400)
/* Estimate the command stream space to reserve before emitting state.
 *
 * Starts from ETNA_3D_CONTEXT_SIZE and adds terms that depend on the bound
 * vertex elements, the VS/FS immediate uniform counts and the VS/PS
 * instruction memory sizes.  The result is passed to
 * etna_cmd_stream_reserve() by etna_emit_state().
 *
 * NOTE(review): this block looks truncated by extraction.  The return type,
 * the braces, the statements belonging to the last two comments and the
 * final return are not present here, and source line numbers are fused into
 * the text.  Restore the missing lines from the project history rather than
 * guessing the constants.
 */
97 required_stream_size(struct etna_context
*ctx
)
99 unsigned size
= ETNA_3D_CONTEXT_SIZE
;
104 /* vertex elements */
105 size
+= ctx
->vertex_elements
->num_elements
+ 1;
107 /* uniforms - worst case (2 words per uniform load) */
108 size
+= ctx
->shader
.vs
->uniforms
.imm_count
* 2;
109 size
+= ctx
->shader
.fs
->uniforms
.imm_count
* 2;
/* VS and PS instruction memory sizes, plus one extra word each */
112 size
+= ctx
->shader_state
.vs_inst_mem_size
+ 1;
113 size
+= ctx
->shader_state
.ps_inst_mem_size
+ 1;
115 /* DRAW_INDEXED_PRIMITIVES command */
118 /* reserve for alignment etc. */
/* NOTE(review): no statement follows either of the two comments above */
124 /* Emit state that only exists on HALTI5+ */
126 emit_halti5_only_state(struct etna_context
*ctx
, int vs_output_count
)
128 struct etna_cmd_stream
*stream
= ctx
->stream
;
129 uint32_t dirty
= ctx
->dirty
;
130 struct etna_coalesce coalesce
;
132 etna_coalesce_start(stream
, &coalesce
);
133 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
134 /* Magic states (load balancing, inter-unit sync, buffers) */
135 /*007C4*/ EMIT_STATE(FE_HALTI5_ID_CONFIG
, ctx
->shader_state
.FE_HALTI5_ID_CONFIG
);
136 /*00870*/ EMIT_STATE(VS_HALTI5_OUTPUT_COUNT
, vs_output_count
| ((vs_output_count
* 0x10) << 8));
137 /*008A0*/ EMIT_STATE(VS_HALTI5_UNK008A0
, 0x0001000e | ((0x110/vs_output_count
) << 20));
138 for (int x
= 0; x
< 4; ++x
) {
139 /*008E0*/ EMIT_STATE(VS_HALTI5_OUTPUT(x
), ctx
->shader_state
.VS_OUTPUT
[x
]);
142 if (unlikely(dirty
& (ETNA_DIRTY_VERTEX_ELEMENTS
| ETNA_DIRTY_SHADER
))) {
143 for (int x
= 0; x
< 4; ++x
) {
144 /*008C0*/ EMIT_STATE(VS_HALTI5_INPUT(x
), ctx
->shader_state
.VS_INPUT
[x
]);
147 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
148 /*00A90*/ EMIT_STATE(PA_VARYING_NUM_COMPONENTS(0), ctx
->shader_state
.GL_VARYING_NUM_COMPONENTS
[0]);
149 /*00A94*/ EMIT_STATE(PA_VARYING_NUM_COMPONENTS(1), ctx
->shader_state
.GL_VARYING_NUM_COMPONENTS
[1]);
150 /*00AA8*/ EMIT_STATE(PA_VS_OUTPUT_COUNT
, vs_output_count
);
151 /*01080*/ EMIT_STATE(PS_VARYING_NUM_COMPONENTS(0), ctx
->shader_state
.GL_VARYING_NUM_COMPONENTS
[0]);
152 /*01084*/ EMIT_STATE(PS_VARYING_NUM_COMPONENTS(1), ctx
->shader_state
.GL_VARYING_NUM_COMPONENTS
[1]);
153 /*03888*/ EMIT_STATE(GL_HALTI5_SH_SPECIALS
, ctx
->shader_state
.GL_HALTI5_SH_SPECIALS
);
155 etna_coalesce_end(stream
, &coalesce
);
158 /* Emit state that no longer exists on HALTI5 */
160 emit_pre_halti5_state(struct etna_context
*ctx
)
162 struct etna_cmd_stream
*stream
= ctx
->stream
;
163 uint32_t dirty
= ctx
->dirty
;
164 struct etna_coalesce coalesce
;
166 etna_coalesce_start(stream
, &coalesce
);
167 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
168 /*00800*/ EMIT_STATE(VS_END_PC
, ctx
->shader_state
.VS_END_PC
);
170 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
171 for (int x
= 0; x
< 4; ++x
) {
172 /*00810*/ EMIT_STATE(VS_OUTPUT(x
), ctx
->shader_state
.VS_OUTPUT
[x
]);
175 if (unlikely(dirty
& (ETNA_DIRTY_VERTEX_ELEMENTS
| ETNA_DIRTY_SHADER
))) {
176 for (int x
= 0; x
< 4; ++x
) {
177 /*00820*/ EMIT_STATE(VS_INPUT(x
), ctx
->shader_state
.VS_INPUT
[x
]);
180 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
181 /*00838*/ EMIT_STATE(VS_START_PC
, ctx
->shader_state
.VS_START_PC
);
183 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
184 for (int x
= 0; x
< 10; ++x
) {
185 /*00A40*/ EMIT_STATE(PA_SHADER_ATTRIBUTES(x
), ctx
->shader_state
.PA_SHADER_ATTRIBUTES
[x
]);
188 if (unlikely(dirty
& (ETNA_DIRTY_FRAMEBUFFER
))) {
189 /*00E04*/ EMIT_STATE(RA_MULTISAMPLE_UNK00E04
, ctx
->framebuffer
.RA_MULTISAMPLE_UNK00E04
);
190 for (int x
= 0; x
< 4; ++x
) {
191 /*00E10*/ EMIT_STATE(RA_MULTISAMPLE_UNK00E10(x
), ctx
->framebuffer
.RA_MULTISAMPLE_UNK00E10
[x
]);
193 for (int x
= 0; x
< 16; ++x
) {
194 /*00E40*/ EMIT_STATE(RA_CENTROID_TABLE(x
), ctx
->framebuffer
.RA_CENTROID_TABLE
[x
]);
197 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
| ETNA_DIRTY_FRAMEBUFFER
))) {
198 /*01000*/ EMIT_STATE(PS_END_PC
, ctx
->shader_state
.PS_END_PC
);
200 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
| ETNA_DIRTY_FRAMEBUFFER
))) {
201 /*01018*/ EMIT_STATE(PS_START_PC
, ctx
->shader_state
.PS_START_PC
);
203 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
204 /*03820*/ EMIT_STATE(GL_VARYING_NUM_COMPONENTS
, ctx
->shader_state
.GL_VARYING_NUM_COMPONENTS
[0]);
205 for (int x
= 0; x
< 2; ++x
) {
206 /*03828*/ EMIT_STATE(GL_VARYING_COMPONENT_USE(x
), ctx
->shader_state
.GL_VARYING_COMPONENT_USE
[x
]);
208 /*03834*/ EMIT_STATE(GL_VARYING_NUM_COMPONENTS2
, ctx
->shader_state
.GL_VARYING_NUM_COMPONENTS
[1]);
210 etna_coalesce_end(stream
, &coalesce
);
/* Weave state before draw operation. This function merges all the compiled
 * state blocks under the context into one device register state. Parts of
 * this state that have changed since the last call (dirty) will be uploaded
 * as state changes in the command buffer. */
/* Emit the context's dirty state into ctx->stream ahead of a draw.
 *
 * Steps visible here, in order: reserve stream space using
 * required_stream_size(); build a cache-flush mask from the dirty bits and
 * write it to VIVS_GL_FLUSH_CACHE, then call etna_stall(RA, PE); flush the TS
 * cache when ETNA_DIRTY_TS is set; write the vertex element state; emit the
 * address-ordered register updates through the EMIT_STATE* coalescing
 * macros; call the architecture-specific emit helpers; stall FE on PE when
 * shader, constant buffer or sampler state is dirty; call
 * ctx->emit_texture_state(); finally program shader code and uniforms.
 *
 * NOTE(review): this block appears to have lost lines in extraction.  The
 * return type, braces and several `else` arms are absent, a few block
 * comments are unterminated, at least one expression is cut short (the
 * VIVS_PS_RANGE value ends in a dangling `|`), and source line numbers are
 * fused into the text.  The code is left untouched here; restore it from the
 * project history before building.
 */
218 etna_emit_state(struct etna_context
*ctx
)
220 struct etna_cmd_stream
*stream
= ctx
->stream
;
221 struct etna_screen
*screen
= ctx
->screen
;
222 unsigned ccw
= ctx
->rasterizer
->front_ccw
;
225 /* Pre-reserve the command buffer space which we are likely to need.
226 * This must cover all the state emitted below, and the following
228 etna_cmd_stream_reserve(stream
, required_stream_size(ctx
));
230 uint32_t dirty
= ctx
->dirty
;
232 /* Pre-processing: see what caches we need to flush before making state changes. */
233 uint32_t to_flush
= 0;
234 if (unlikely(dirty
& (ETNA_DIRTY_BLEND
)))
235 to_flush
|= VIVS_GL_FLUSH_CACHE_COLOR
;
236 if (unlikely(dirty
& (ETNA_DIRTY_TEXTURE_CACHES
)))
237 to_flush
|= VIVS_GL_FLUSH_CACHE_TEXTURE
;
238 if (unlikely(dirty
& (ETNA_DIRTY_FRAMEBUFFER
))) /* Framebuffer config changed? */
239 to_flush
|= VIVS_GL_FLUSH_CACHE_COLOR
| VIVS_GL_FLUSH_CACHE_DEPTH
;
240 if (DBG_ENABLED(ETNA_DBG_CFLUSH_ALL
))
241 to_flush
|= VIVS_GL_FLUSH_CACHE_TEXTURE
| VIVS_GL_FLUSH_CACHE_COLOR
| VIVS_GL_FLUSH_CACHE_DEPTH
;
244 etna_set_state(stream
, VIVS_GL_FLUSH_CACHE
, to_flush
);
245 etna_stall(stream
, SYNC_RECIPIENT_RA
, SYNC_RECIPIENT_PE
);
248 /* Flush TS cache before changing TS configuration. */
249 if (unlikely(dirty
& ETNA_DIRTY_TS
)) {
250 etna_set_state(stream
, VIVS_TS_FLUSH_CACHE
, VIVS_TS_FLUSH_CACHE_FLUSH
);
253 /* Update vertex elements. This is different from any of the other states, in that
254 * a) the number of vertex elements written matters: so write only active ones
255 * b) the vertex element states must all be written: do not skip entries that stay the same */
256 if (dirty
& (ETNA_DIRTY_VERTEX_ELEMENTS
)) {
257 if (screen
->specs
.halti
>= 5) {
258 /*17800*/ etna_set_state_multi(stream
, VIVS_NFE_GENERIC_ATTRIB_CONFIG0(0),
259 ctx
->vertex_elements
->num_elements
,
260 ctx
->vertex_elements
->NFE_GENERIC_ATTRIB_CONFIG0
);
261 /*17A00*/ etna_set_state_multi(stream
, VIVS_NFE_GENERIC_ATTRIB_SCALE(0),
262 ctx
->vertex_elements
->num_elements
,
263 ctx
->vertex_elements
->NFE_GENERIC_ATTRIB_SCALE
);
264 /*17A80*/ etna_set_state_multi(stream
, VIVS_NFE_GENERIC_ATTRIB_CONFIG1(0),
265 ctx
->vertex_elements
->num_elements
,
266 ctx
->vertex_elements
->NFE_GENERIC_ATTRIB_CONFIG1
);
268 /* Special case: vertex elements must always be sent in full if changed */
269 /*00600*/ etna_set_state_multi(stream
, VIVS_FE_VERTEX_ELEMENT_CONFIG(0),
270 ctx
->vertex_elements
->num_elements
,
271 ctx
->vertex_elements
->FE_VERTEX_ELEMENT_CONFIG
);
272 if (screen
->specs
.halti
>= 2) {
273 /*00780*/ etna_set_state_multi(stream
, VIVS_FE_GENERIC_ATTRIB_SCALE(0),
274 ctx
->vertex_elements
->num_elements
,
275 ctx
->vertex_elements
->NFE_GENERIC_ATTRIB_SCALE
);
/* Pick the VS output count: the _PSIZE variant when the rasterizer state has
 * point_size_per_vertex set, the plain one otherwise. */
279 unsigned vs_output_count
= etna_rasterizer_state(ctx
->rasterizer
)->point_size_per_vertex
280 ? ctx
->shader_state
.VS_OUTPUT_COUNT_PSIZE
281 : ctx
->shader_state
.VS_OUTPUT_COUNT
;
283 /* The following code is originally generated by gen_merge_state.py, to
284 * emit state in increasing order of address (this makes it possible to merge
285 * consecutive register updates into one SET_STATE command)
287 * There have been some manual changes, where the weaving operation is not
290 * - num vertex elements
295 * - removed ETNA_DIRTY_BASE_SETUP statements -- these are guaranteed to not
297 * - PS / framebuffer interaction for MSAA
298 * - move update of GL_MULTI_SAMPLE_CONFIG first
299 * - add unlikely()/likely()
301 struct etna_coalesce coalesce
;
303 etna_coalesce_start(stream
, &coalesce
);
305 /* begin only EMIT_STATE -- make sure no new etna_reserve calls are done here
308 /* multi sample config is set first, and outside of the normal sorting
309 * order, as changing the multisample state clobbers PS.INPUT_COUNT (and
310 * possibly PS.TEMP_REGISTER_CONTROL).
312 if (unlikely(dirty
& (ETNA_DIRTY_FRAMEBUFFER
| ETNA_DIRTY_SAMPLE_MASK
))) {
313 uint32_t val
= VIVS_GL_MULTI_SAMPLE_CONFIG_MSAA_ENABLES(ctx
->sample_mask
);
314 val
|= ctx
->framebuffer
.GL_MULTI_SAMPLE_CONFIG
;
316 /*03818*/ EMIT_STATE(GL_MULTI_SAMPLE_CONFIG
, val
);
318 if (likely(dirty
& (ETNA_DIRTY_INDEX_BUFFER
))) {
319 /*00644*/ EMIT_STATE_RELOC(FE_INDEX_STREAM_BASE_ADDR
, &ctx
->index_buffer
.FE_INDEX_STREAM_BASE_ADDR
);
320 /*00648*/ EMIT_STATE(FE_INDEX_STREAM_CONTROL
, ctx
->index_buffer
.FE_INDEX_STREAM_CONTROL
);
322 if (likely(dirty
& (ETNA_DIRTY_INDEX_BUFFER
))) {
323 /*00674*/ EMIT_STATE(FE_PRIMITIVE_RESTART_INDEX
, ctx
->index_buffer
.FE_PRIMITIVE_RESTART_INDEX
);
325 if (likely(dirty
& (ETNA_DIRTY_VERTEX_BUFFERS
))) {
326 if (screen
->specs
.halti
>= 2) { /* HALTI2+: NFE_VERTEX_STREAMS */
327 for (int x
= 0; x
< ctx
->vertex_buffer
.count
; ++x
) {
328 /*14600*/ EMIT_STATE_RELOC(NFE_VERTEX_STREAMS_BASE_ADDR(x
), &ctx
->vertex_buffer
.cvb
[x
].FE_VERTEX_STREAM_BASE_ADDR
);
330 for (int x
= 0; x
< ctx
->vertex_buffer
.count
; ++x
) {
331 if (ctx
->vertex_buffer
.cvb
[x
].FE_VERTEX_STREAM_BASE_ADDR
.bo
) {
332 /*14640*/ EMIT_STATE(NFE_VERTEX_STREAMS_CONTROL(x
), ctx
->vertex_buffer
.cvb
[x
].FE_VERTEX_STREAM_CONTROL
);
335 } else if(screen
->specs
.stream_count
> 1) { /* hw w/ multiple vertex streams */
336 for (int x
= 0; x
< ctx
->vertex_buffer
.count
; ++x
) {
337 /*00680*/ EMIT_STATE_RELOC(FE_VERTEX_STREAMS_BASE_ADDR(x
), &ctx
->vertex_buffer
.cvb
[x
].FE_VERTEX_STREAM_BASE_ADDR
);
339 for (int x
= 0; x
< ctx
->vertex_buffer
.count
; ++x
) {
340 if (ctx
->vertex_buffer
.cvb
[x
].FE_VERTEX_STREAM_BASE_ADDR
.bo
) {
341 /*006A0*/ EMIT_STATE(FE_VERTEX_STREAMS_CONTROL(x
), ctx
->vertex_buffer
.cvb
[x
].FE_VERTEX_STREAM_CONTROL
);
344 } else { /* hw w/ single vertex stream */
345 /*0064C*/ EMIT_STATE_RELOC(FE_VERTEX_STREAM_BASE_ADDR
, &ctx
->vertex_buffer
.cvb
[0].FE_VERTEX_STREAM_BASE_ADDR
);
346 /*00650*/ EMIT_STATE(FE_VERTEX_STREAM_CONTROL
, ctx
->vertex_buffer
.cvb
[0].FE_VERTEX_STREAM_CONTROL
);
349 /* gallium has instance divisor as part of elements state */
350 if ((dirty
& (ETNA_DIRTY_VERTEX_ELEMENTS
)) && screen
->specs
.halti
>= 2) {
351 for (int x
= 0; x
< ctx
->vertex_elements
->num_buffers
; ++x
) {
352 /*14680*/ EMIT_STATE(NFE_VERTEX_STREAMS_VERTEX_DIVISOR(x
), ctx
->vertex_elements
->NFE_VERTEX_STREAMS_VERTEX_DIVISOR
[x
]);
356 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
| ETNA_DIRTY_RASTERIZER
))) {
358 /*00804*/ EMIT_STATE(VS_OUTPUT_COUNT
, vs_output_count
);
360 if (unlikely(dirty
& (ETNA_DIRTY_VERTEX_ELEMENTS
| ETNA_DIRTY_SHADER
))) {
361 /*00808*/ EMIT_STATE(VS_INPUT_COUNT
, ctx
->shader_state
.VS_INPUT_COUNT
);
362 /*0080C*/ EMIT_STATE(VS_TEMP_REGISTER_CONTROL
, ctx
->shader_state
.VS_TEMP_REGISTER_CONTROL
);
364 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
365 /*00830*/ EMIT_STATE(VS_LOAD_BALANCING
, ctx
->shader_state
.VS_LOAD_BALANCING
);
367 if (unlikely(dirty
& (ETNA_DIRTY_VIEWPORT
))) {
368 /*00A00*/ EMIT_STATE_FIXP(PA_VIEWPORT_SCALE_X
, ctx
->viewport
.PA_VIEWPORT_SCALE_X
);
369 /*00A04*/ EMIT_STATE_FIXP(PA_VIEWPORT_SCALE_Y
, ctx
->viewport
.PA_VIEWPORT_SCALE_Y
);
370 /*00A08*/ EMIT_STATE(PA_VIEWPORT_SCALE_Z
, ctx
->viewport
.PA_VIEWPORT_SCALE_Z
);
371 /*00A0C*/ EMIT_STATE_FIXP(PA_VIEWPORT_OFFSET_X
, ctx
->viewport
.PA_VIEWPORT_OFFSET_X
);
372 /*00A10*/ EMIT_STATE_FIXP(PA_VIEWPORT_OFFSET_Y
, ctx
->viewport
.PA_VIEWPORT_OFFSET_Y
);
373 /*00A14*/ EMIT_STATE(PA_VIEWPORT_OFFSET_Z
, ctx
->viewport
.PA_VIEWPORT_OFFSET_Z
);
375 if (unlikely(dirty
& (ETNA_DIRTY_RASTERIZER
))) {
376 struct etna_rasterizer_state
*rasterizer
= etna_rasterizer_state(ctx
->rasterizer
);
378 /*00A18*/ EMIT_STATE(PA_LINE_WIDTH
, rasterizer
->PA_LINE_WIDTH
);
379 /*00A1C*/ EMIT_STATE(PA_POINT_SIZE
, rasterizer
->PA_POINT_SIZE
);
380 /*00A28*/ EMIT_STATE(PA_SYSTEM_MODE
, rasterizer
->PA_SYSTEM_MODE
);
382 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
383 /*00A30*/ EMIT_STATE(PA_ATTRIBUTE_ELEMENT_COUNT
, ctx
->shader_state
.PA_ATTRIBUTE_ELEMENT_COUNT
);
385 if (unlikely(dirty
& (ETNA_DIRTY_RASTERIZER
| ETNA_DIRTY_SHADER
))) {
386 uint32_t val
= etna_rasterizer_state(ctx
->rasterizer
)->PA_CONFIG
;
387 /*00A34*/ EMIT_STATE(PA_CONFIG
, val
& ctx
->shader_state
.PA_CONFIG
);
389 if (unlikely(dirty
& (ETNA_DIRTY_RASTERIZER
))) {
390 struct etna_rasterizer_state
*rasterizer
= etna_rasterizer_state(ctx
->rasterizer
);
391 /*00A38*/ EMIT_STATE(PA_WIDE_LINE_WIDTH0
, rasterizer
->PA_LINE_WIDTH
);
392 /*00A3C*/ EMIT_STATE(PA_WIDE_LINE_WIDTH1
, rasterizer
->PA_LINE_WIDTH
);
394 if (unlikely(dirty
& (ETNA_DIRTY_SCISSOR_CLIP
))) {
395 /*00C00*/ EMIT_STATE_FIXP(SE_SCISSOR_LEFT
, ctx
->clipping
.minx
<< 16);
396 /*00C04*/ EMIT_STATE_FIXP(SE_SCISSOR_TOP
, ctx
->clipping
.miny
<< 16);
397 /*00C08*/ EMIT_STATE_FIXP(SE_SCISSOR_RIGHT
, (ctx
->clipping
.maxx
<< 16) + ETNA_SE_SCISSOR_MARGIN_RIGHT
);
398 /*00C0C*/ EMIT_STATE_FIXP(SE_SCISSOR_BOTTOM
, (ctx
->clipping
.maxy
<< 16) + ETNA_SE_SCISSOR_MARGIN_BOTTOM
);
400 if (unlikely(dirty
& (ETNA_DIRTY_RASTERIZER
))) {
401 struct etna_rasterizer_state
*rasterizer
= etna_rasterizer_state(ctx
->rasterizer
);
403 /*00C10*/ EMIT_STATE(SE_DEPTH_SCALE
, rasterizer
->SE_DEPTH_SCALE
);
404 /*00C14*/ EMIT_STATE(SE_DEPTH_BIAS
, rasterizer
->SE_DEPTH_BIAS
);
405 /*00C18*/ EMIT_STATE(SE_CONFIG
, rasterizer
->SE_CONFIG
);
407 if (unlikely(dirty
& (ETNA_DIRTY_SCISSOR_CLIP
))) {
408 /*00C20*/ EMIT_STATE_FIXP(SE_CLIP_RIGHT
, (ctx
->clipping
.maxx
<< 16) + ETNA_SE_CLIP_MARGIN_RIGHT
);
409 /*00C24*/ EMIT_STATE_FIXP(SE_CLIP_BOTTOM
, (ctx
->clipping
.maxy
<< 16) + ETNA_SE_CLIP_MARGIN_BOTTOM
);
411 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
412 /*00E00*/ EMIT_STATE(RA_CONTROL
, ctx
->shader_state
.RA_CONTROL
);
414 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
| ETNA_DIRTY_FRAMEBUFFER
))) {
415 /*01004*/ EMIT_STATE(PS_OUTPUT_REG
, ctx
->shader_state
.PS_OUTPUT_REG
);
416 /*01008*/ EMIT_STATE(PS_INPUT_COUNT
,
417 ctx
->framebuffer
.msaa_mode
418 ? ctx
->shader_state
.PS_INPUT_COUNT_MSAA
419 : ctx
->shader_state
.PS_INPUT_COUNT
);
420 /*0100C*/ EMIT_STATE(PS_TEMP_REGISTER_CONTROL
,
421 ctx
->framebuffer
.msaa_mode
422 ? ctx
->shader_state
.PS_TEMP_REGISTER_CONTROL_MSAA
423 : ctx
->shader_state
.PS_TEMP_REGISTER_CONTROL
);
424 /*01010*/ EMIT_STATE(PS_CONTROL
, ctx
->framebuffer
.PS_CONTROL
);
425 /*01030*/ EMIT_STATE(PS_CONTROL_EXT
, ctx
->framebuffer
.PS_CONTROL_EXT
);
427 if (unlikely(dirty
& (ETNA_DIRTY_ZSA
| ETNA_DIRTY_FRAMEBUFFER
| ETNA_DIRTY_SHADER
))) {
428 /*01400*/ EMIT_STATE(PE_DEPTH_CONFIG
, (etna_zsa_state(ctx
->zsa
)->PE_DEPTH_CONFIG
|
429 ctx
->framebuffer
.PE_DEPTH_CONFIG
) &
430 ctx
->shader_state
.PE_DEPTH_CONFIG
);
432 if (unlikely(dirty
& (ETNA_DIRTY_VIEWPORT
))) {
433 /*01404*/ EMIT_STATE(PE_DEPTH_NEAR
, ctx
->viewport
.PE_DEPTH_NEAR
);
434 /*01408*/ EMIT_STATE(PE_DEPTH_FAR
, ctx
->viewport
.PE_DEPTH_FAR
);
436 if (unlikely(dirty
& (ETNA_DIRTY_FRAMEBUFFER
))) {
437 /*0140C*/ EMIT_STATE(PE_DEPTH_NORMALIZE
, ctx
->framebuffer
.PE_DEPTH_NORMALIZE
);
439 if (screen
->specs
.pixel_pipes
== 1) {
440 /*01410*/ EMIT_STATE_RELOC(PE_DEPTH_ADDR
, &ctx
->framebuffer
.PE_DEPTH_ADDR
);
443 /*01414*/ EMIT_STATE(PE_DEPTH_STRIDE
, ctx
->framebuffer
.PE_DEPTH_STRIDE
);
446 if (unlikely(dirty
& (ETNA_DIRTY_ZSA
| ETNA_DIRTY_RASTERIZER
))) {
447 uint32_t val
= etna_zsa_state(ctx
->zsa
)->PE_STENCIL_OP
[ccw
];
448 /*01418*/ EMIT_STATE(PE_STENCIL_OP
, val
);
450 if (unlikely(dirty
& (ETNA_DIRTY_ZSA
| ETNA_DIRTY_STENCIL_REF
| ETNA_DIRTY_RASTERIZER
))) {
451 uint32_t val
= etna_zsa_state(ctx
->zsa
)->PE_STENCIL_CONFIG
[ccw
];
452 /*0141C*/ EMIT_STATE(PE_STENCIL_CONFIG
, val
| ctx
->stencil_ref
.PE_STENCIL_CONFIG
[ccw
]);
454 if (unlikely(dirty
& (ETNA_DIRTY_ZSA
))) {
455 uint32_t val
= etna_zsa_state(ctx
->zsa
)->PE_ALPHA_OP
;
456 /*01420*/ EMIT_STATE(PE_ALPHA_OP
, val
);
458 if (unlikely(dirty
& (ETNA_DIRTY_BLEND_COLOR
))) {
459 /*01424*/ EMIT_STATE(PE_ALPHA_BLEND_COLOR
, ctx
->blend_color
.PE_ALPHA_BLEND_COLOR
);
461 if (unlikely(dirty
& (ETNA_DIRTY_BLEND
))) {
462 uint32_t val
= etna_blend_state(ctx
->blend
)->PE_ALPHA_CONFIG
;
463 /*01428*/ EMIT_STATE(PE_ALPHA_CONFIG
, val
);
465 if (unlikely(dirty
& (ETNA_DIRTY_BLEND
| ETNA_DIRTY_FRAMEBUFFER
))) {
467 /* Use the components and overwrite bits in framebuffer.PE_COLOR_FORMAT
468 * as a mask to enable the bits from blend PE_COLOR_FORMAT */
469 val
= ~(VIVS_PE_COLOR_FORMAT_COMPONENTS__MASK
|
470 VIVS_PE_COLOR_FORMAT_OVERWRITE
);
471 val
|= etna_blend_state(ctx
->blend
)->PE_COLOR_FORMAT
;
472 val
&= ctx
->framebuffer
.PE_COLOR_FORMAT
;
473 /*0142C*/ EMIT_STATE(PE_COLOR_FORMAT
, val
);
475 if (unlikely(dirty
& (ETNA_DIRTY_FRAMEBUFFER
))) {
476 if (screen
->specs
.pixel_pipes
== 1) {
477 /*01430*/ EMIT_STATE_RELOC(PE_COLOR_ADDR
, &ctx
->framebuffer
.PE_COLOR_ADDR
);
478 /*01434*/ EMIT_STATE(PE_COLOR_STRIDE
, ctx
->framebuffer
.PE_COLOR_STRIDE
);
479 /*01454*/ EMIT_STATE(PE_HDEPTH_CONTROL
, ctx
->framebuffer
.PE_HDEPTH_CONTROL
);
480 } else if (screen
->specs
.pixel_pipes
== 2) {
481 /*01434*/ EMIT_STATE(PE_COLOR_STRIDE
, ctx
->framebuffer
.PE_COLOR_STRIDE
);
482 /*01454*/ EMIT_STATE(PE_HDEPTH_CONTROL
, ctx
->framebuffer
.PE_HDEPTH_CONTROL
);
483 /*01460*/ EMIT_STATE_RELOC(PE_PIPE_COLOR_ADDR(0), &ctx
->framebuffer
.PE_PIPE_COLOR_ADDR
[0]);
484 /*01464*/ EMIT_STATE_RELOC(PE_PIPE_COLOR_ADDR(1), &ctx
->framebuffer
.PE_PIPE_COLOR_ADDR
[1]);
485 /*01480*/ EMIT_STATE_RELOC(PE_PIPE_DEPTH_ADDR(0), &ctx
->framebuffer
.PE_PIPE_DEPTH_ADDR
[0]);
486 /*01484*/ EMIT_STATE_RELOC(PE_PIPE_DEPTH_ADDR(1), &ctx
->framebuffer
.PE_PIPE_DEPTH_ADDR
[1]);
491 if (unlikely(dirty
& (ETNA_DIRTY_STENCIL_REF
| ETNA_DIRTY_RASTERIZER
| ETNA_DIRTY_ZSA
))) {
492 uint32_t val
= etna_zsa_state(ctx
->zsa
)->PE_STENCIL_CONFIG_EXT
;
493 /*014A0*/ EMIT_STATE(PE_STENCIL_CONFIG_EXT
, val
| ctx
->stencil_ref
.PE_STENCIL_CONFIG_EXT
[ccw
]);
495 if (unlikely(dirty
& (ETNA_DIRTY_BLEND
| ETNA_DIRTY_FRAMEBUFFER
))) {
496 struct etna_blend_state
*blend
= etna_blend_state(ctx
->blend
);
497 /*014A4*/ EMIT_STATE(PE_LOGIC_OP
, blend
->PE_LOGIC_OP
| ctx
->framebuffer
.PE_LOGIC_OP
);
499 if (unlikely(dirty
& (ETNA_DIRTY_BLEND
))) {
500 struct etna_blend_state
*blend
= etna_blend_state(ctx
->blend
);
501 for (int x
= 0; x
< 2; ++x
) {
502 /*014A8*/ EMIT_STATE(PE_DITHER(x
), blend
->PE_DITHER
[x
]);
505 if (unlikely(dirty
& (ETNA_DIRTY_BLEND_COLOR
)) &&
506 VIV_FEATURE(screen
, chipMinorFeatures1
, HALF_FLOAT
)) {
507 /*014B0*/ EMIT_STATE(PE_ALPHA_COLOR_EXT0
, ctx
->blend_color
.PE_ALPHA_COLOR_EXT0
);
508 /*014B4*/ EMIT_STATE(PE_ALPHA_COLOR_EXT1
, ctx
->blend_color
.PE_ALPHA_COLOR_EXT1
);
510 if (unlikely(dirty
& (ETNA_DIRTY_ZSA
| ETNA_DIRTY_RASTERIZER
))) {
511 /*014B8*/ EMIT_STATE(PE_STENCIL_CONFIG_EXT2
, etna_zsa_state(ctx
->zsa
)->PE_STENCIL_CONFIG_EXT2
[ccw
]);
513 if (unlikely(dirty
& (ETNA_DIRTY_FRAMEBUFFER
)) && screen
->specs
.halti
>= 3)
514 /*014BC*/ EMIT_STATE(PE_MEM_CONFIG
, ctx
->framebuffer
.PE_MEM_CONFIG
);
515 if (unlikely(dirty
& (ETNA_DIRTY_FRAMEBUFFER
| ETNA_DIRTY_TS
))) {
516 /*01654*/ EMIT_STATE(TS_MEM_CONFIG
, ctx
->framebuffer
.TS_MEM_CONFIG
);
517 /*01658*/ EMIT_STATE_RELOC(TS_COLOR_STATUS_BASE
, &ctx
->framebuffer
.TS_COLOR_STATUS_BASE
);
518 /*0165C*/ EMIT_STATE_RELOC(TS_COLOR_SURFACE_BASE
, &ctx
->framebuffer
.TS_COLOR_SURFACE_BASE
);
519 /*01660*/ EMIT_STATE(TS_COLOR_CLEAR_VALUE
, ctx
->framebuffer
.TS_COLOR_CLEAR_VALUE
);
520 /*01664*/ EMIT_STATE_RELOC(TS_DEPTH_STATUS_BASE
, &ctx
->framebuffer
.TS_DEPTH_STATUS_BASE
);
521 /*01668*/ EMIT_STATE_RELOC(TS_DEPTH_SURFACE_BASE
, &ctx
->framebuffer
.TS_DEPTH_SURFACE_BASE
);
522 /*0166C*/ EMIT_STATE(TS_DEPTH_CLEAR_VALUE
, ctx
->framebuffer
.TS_DEPTH_CLEAR_VALUE
);
523 /*016BC*/ EMIT_STATE(TS_COLOR_CLEAR_VALUE_EXT
, ctx
->framebuffer
.TS_COLOR_CLEAR_VALUE_EXT
);
525 if (unlikely(dirty
& (ETNA_DIRTY_SHADER
))) {
526 /*0381C*/ EMIT_STATE(GL_VARYING_TOTAL_COMPONENTS
, ctx
->shader_state
.GL_VARYING_TOTAL_COMPONENTS
);
528 etna_coalesce_end(stream
, &coalesce
);
529 /* end only EMIT_STATE */
531 /* Emit strongly architecture-specific state */
532 if (screen
->specs
.halti
>= 5)
533 emit_halti5_only_state(ctx
, vs_output_count
);
535 emit_pre_halti5_state(ctx
);
537 /* Beginning from Halti0 some of the new shader and sampler states are not
538 * self-synchronizing anymore. Thus we need to stall the FE on PE completion
539 * before loading the new states to avoid corrupting the state of the
542 if (screen
->specs
.halti
>= 0 &&
543 (ctx
->dirty
& (ETNA_DIRTY_SHADER
| ETNA_DIRTY_CONSTBUF
|
544 ETNA_DIRTY_SAMPLERS
| ETNA_DIRTY_SAMPLER_VIEWS
)))
545 etna_stall(ctx
->stream
, SYNC_RECIPIENT_FE
, SYNC_RECIPIENT_PE
);
547 ctx
->emit_texture_state(ctx
);
549 /* We need to update the uniform cache only if one of the following bits are
551 * - ETNA_DIRTY_SHADER
552 * - ETNA_DIRTY_CONSTBUF
553 * - uniforms_dirty_bits
555 * In case of ETNA_DIRTY_SHADER we need load all uniforms from the cache. In
557 * other cases we can load on the changed uniforms.
559 static const uint32_t uniform_dirty_bits
=
560 ETNA_DIRTY_SHADER
| ETNA_DIRTY_CONSTBUF
;
562 /**** Large dynamically-sized state ****/
/* The VIVS_VS_UNIFORM_CACHE flush writes below are all gated on this flag,
 * which is set only when halti < 5. */
563 bool do_uniform_flush
= screen
->specs
.halti
< 5;
564 if (dirty
& (ETNA_DIRTY_SHADER
)) {
565 /* Special case: a new shader was loaded; simply re-load all uniforms and
566 * shader code at once */
567 /* This sequence is special, do not change ordering unless necessary. According to comment
568 snippets in the Vivante kernel driver a process called "steering" goes on while programming
569 shader state. This (as I understand it) means certain unified states are "steered"
570 toward a specific shader unit (VS/PS/...) based on either explicit flags in register
571 00860, or what other state is written before "auto-steering". So this means some
572 state can legitimately be programmed multiple times.
575 if (screen
->specs
.halti
>= 5) { /* ICACHE (HALTI5) */
576 assert(ctx
->shader_state
.VS_INST_ADDR
.bo
&& ctx
->shader_state
.PS_INST_ADDR
.bo
);
577 /* Set icache (VS) */
578 etna_set_state(stream
, VIVS_VS_NEWRANGE_LOW
, 0);
579 etna_set_state(stream
, VIVS_VS_NEWRANGE_HIGH
, ctx
->shader_state
.vs_inst_mem_size
/ 4);
580 assert(ctx
->shader_state
.VS_INST_ADDR
.bo
);
581 etna_set_state_reloc(stream
, VIVS_VS_INST_ADDR
, &ctx
->shader_state
.VS_INST_ADDR
);
582 etna_set_state(stream
, VIVS_SH_CONFIG
, 0x00000002);
583 etna_set_state(stream
, VIVS_VS_ICACHE_CONTROL
, VIVS_VS_ICACHE_CONTROL_ENABLE
);
584 etna_set_state(stream
, VIVS_VS_ICACHE_COUNT
, ctx
->shader_state
.vs_inst_mem_size
/ 4 - 1);
586 /* Set icache (PS) */
587 etna_set_state(stream
, VIVS_PS_NEWRANGE_LOW
, 0);
588 etna_set_state(stream
, VIVS_PS_NEWRANGE_HIGH
, ctx
->shader_state
.ps_inst_mem_size
/ 4);
589 assert(ctx
->shader_state
.PS_INST_ADDR
.bo
);
590 etna_set_state_reloc(stream
, VIVS_PS_INST_ADDR
, &ctx
->shader_state
.PS_INST_ADDR
);
591 etna_set_state(stream
, VIVS_SH_CONFIG
, 0x00000002);
592 etna_set_state(stream
, VIVS_VS_ICACHE_CONTROL
, VIVS_VS_ICACHE_CONTROL_ENABLE
);
593 etna_set_state(stream
, VIVS_PS_ICACHE_COUNT
, ctx
->shader_state
.ps_inst_mem_size
/ 4 - 1);
595 } else if (ctx
->shader_state
.VS_INST_ADDR
.bo
|| ctx
->shader_state
.PS_INST_ADDR
.bo
) {
596 /* ICACHE (pre-HALTI5) */
597 assert(screen
->specs
.has_icache
&& screen
->specs
.has_shader_range_registers
);
598 /* Set icache (VS) */
599 etna_set_state(stream
, VIVS_VS_RANGE
, (ctx
->shader_state
.vs_inst_mem_size
/ 4 - 1) << 16);
600 etna_set_state(stream
, VIVS_VS_ICACHE_CONTROL
,
601 VIVS_VS_ICACHE_CONTROL_ENABLE
|
602 VIVS_VS_ICACHE_CONTROL_FLUSH_VS
);
603 assert(ctx
->shader_state
.VS_INST_ADDR
.bo
);
604 etna_set_state_reloc(stream
, VIVS_VS_INST_ADDR
, &ctx
->shader_state
.VS_INST_ADDR
);
606 /* Set icache (PS) */
607 etna_set_state(stream
, VIVS_PS_RANGE
, (ctx
->shader_state
.ps_inst_mem_size
/ 4 - 1) << 16);
608 etna_set_state(stream
, VIVS_VS_ICACHE_CONTROL
,
609 VIVS_VS_ICACHE_CONTROL_ENABLE
|
610 VIVS_VS_ICACHE_CONTROL_FLUSH_PS
);
611 assert(ctx
->shader_state
.PS_INST_ADDR
.bo
);
612 etna_set_state_reloc(stream
, VIVS_PS_INST_ADDR
, &ctx
->shader_state
.PS_INST_ADDR
);
614 /* Upload shader directly, first flushing and disabling icache if
615 * supported on this hw */
616 if (screen
->specs
.has_icache
) {
617 etna_set_state(stream
, VIVS_VS_ICACHE_CONTROL
,
618 VIVS_VS_ICACHE_CONTROL_FLUSH_PS
|
619 VIVS_VS_ICACHE_CONTROL_FLUSH_VS
);
621 if (screen
->specs
.has_shader_range_registers
) {
622 etna_set_state(stream
, VIVS_VS_RANGE
, (ctx
->shader_state
.vs_inst_mem_size
/ 4 - 1) << 16);
623 etna_set_state(stream
, VIVS_PS_RANGE
, ((ctx
->shader_state
.ps_inst_mem_size
/ 4 - 1 + 0x100) << 16) |
626 etna_set_state_multi(stream
, screen
->specs
.vs_offset
,
627 ctx
->shader_state
.vs_inst_mem_size
,
628 ctx
->shader_state
.VS_INST_MEM
);
629 etna_set_state_multi(stream
, screen
->specs
.ps_offset
,
630 ctx
->shader_state
.ps_inst_mem_size
,
631 ctx
->shader_state
.PS_INST_MEM
);
634 if (screen
->specs
.has_unified_uniforms
) {
635 etna_set_state(stream
, VIVS_VS_UNIFORM_BASE
, 0);
636 etna_set_state(stream
, VIVS_PS_UNIFORM_BASE
, screen
->specs
.max_vs_uniforms
);
639 if (do_uniform_flush
)
640 etna_set_state(stream
, VIVS_VS_UNIFORM_CACHE
, VIVS_VS_UNIFORM_CACHE_FLUSH
);
642 etna_uniforms_write(ctx
, ctx
->shader
.vs
, ctx
->constant_buffer
[PIPE_SHADER_VERTEX
].cb
);
644 if (do_uniform_flush
)
645 etna_set_state(stream
, VIVS_VS_UNIFORM_CACHE
, VIVS_VS_UNIFORM_CACHE_FLUSH
| VIVS_VS_UNIFORM_CACHE_PS
);
647 etna_uniforms_write(ctx
, ctx
->shader
.fs
, ctx
->constant_buffer
[PIPE_SHADER_FRAGMENT
].cb
);
649 if (screen
->specs
.halti
>= 5) {
650 /* HALTI5 needs to be prompted to pre-fetch shaders */
651 etna_set_state(stream
, VIVS_VS_ICACHE_PREFETCH
, 0x00000000);
652 etna_set_state(stream
, VIVS_PS_ICACHE_PREFETCH
, 0x00000000);
653 etna_stall(stream
, SYNC_RECIPIENT_RA
, SYNC_RECIPIENT_PE
);
656 /* ideally this cache would only be flushed if there are VS uniform changes */
657 if (do_uniform_flush
)
658 etna_set_state(stream
, VIVS_VS_UNIFORM_CACHE
, VIVS_VS_UNIFORM_CACHE_FLUSH
);
660 if (dirty
& (uniform_dirty_bits
| ctx
->shader
.vs
->uniforms_dirty_bits
))
661 etna_uniforms_write(ctx
, ctx
->shader
.vs
, ctx
->constant_buffer
[PIPE_SHADER_VERTEX
].cb
);
663 /* ideally this cache would only be flushed if there are PS uniform changes */
664 if (do_uniform_flush
)
665 etna_set_state(stream
, VIVS_VS_UNIFORM_CACHE
, VIVS_VS_UNIFORM_CACHE_FLUSH
| VIVS_VS_UNIFORM_CACHE_PS
);
667 if (dirty
& (uniform_dirty_bits
| ctx
->shader
.fs
->uniforms_dirty_bits
))
668 etna_uniforms_write(ctx
, ctx
->shader
.fs
, ctx
->constant_buffer
[PIPE_SHADER_FRAGMENT
].cb
);
670 /**** End of state update ****/
672 #undef EMIT_STATE_FIXP
673 #undef EMIT_STATE_RELOC
675 ctx
->dirty_sampler_views
= 0;