etnaviv: fix blend color for RB swapped rendertargets
[mesa.git] / src / gallium / drivers / etnaviv / etnaviv_state.c
1 /*
2 * Copyright (c) 2012-2015 Etnaviv Project
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
13 * of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 *
23 * Authors:
24 * Wladimir J. van der Laan <laanwj@gmail.com>
25 * Christian Gmeiner <christian.gmeiner@gmail.com>
26 */
27
28 #include "etnaviv_state.h"
29
30 #include "hw/common.xml.h"
31
32 #include "etnaviv_blend.h"
33 #include "etnaviv_clear_blit.h"
34 #include "etnaviv_context.h"
35 #include "etnaviv_format.h"
36 #include "etnaviv_shader.h"
37 #include "etnaviv_surface.h"
38 #include "etnaviv_translate.h"
39 #include "etnaviv_util.h"
40 #include "util/u_helpers.h"
41 #include "util/u_inlines.h"
42 #include "util/u_math.h"
43 #include "util/u_memory.h"
44
45 static void
46 etna_set_stencil_ref(struct pipe_context *pctx, const struct pipe_stencil_ref *sr)
47 {
48 struct etna_context *ctx = etna_context(pctx);
49 struct compiled_stencil_ref *cs = &ctx->stencil_ref;
50
51 ctx->stencil_ref_s = *sr;
52
53 cs->PE_STENCIL_CONFIG = VIVS_PE_STENCIL_CONFIG_REF_FRONT(sr->ref_value[0]);
54 /* rest of bits weaved in from depth_stencil_alpha */
55 cs->PE_STENCIL_CONFIG_EXT =
56 VIVS_PE_STENCIL_CONFIG_EXT_REF_BACK(sr->ref_value[0]);
57 ctx->dirty |= ETNA_DIRTY_STENCIL_REF;
58 }
59
/**
 * pipe_context::set_clip_state hook. Intentionally does nothing: the clip
 * state handed in is ignored by this driver.
 */
static void
etna_set_clip_state(struct pipe_context *pctx, const struct pipe_clip_state *pcs)
{
   /* NOOP */
   (void)pctx;
   (void)pcs;
}
65
66 static void
67 etna_set_sample_mask(struct pipe_context *pctx, unsigned sample_mask)
68 {
69 struct etna_context *ctx = etna_context(pctx);
70
71 ctx->sample_mask = sample_mask;
72 ctx->dirty |= ETNA_DIRTY_SAMPLE_MASK;
73 }
74
75 static void
76 etna_set_constant_buffer(struct pipe_context *pctx,
77 enum pipe_shader_type shader, uint index,
78 const struct pipe_constant_buffer *cb)
79 {
80 struct etna_context *ctx = etna_context(pctx);
81
82 if (unlikely(index > 0)) {
83 DBG("Unhandled buffer index %i", index);
84 return;
85 }
86
87
88 util_copy_constant_buffer(&ctx->constant_buffer[shader], cb);
89
90 /* Note that the state tracker can unbind constant buffers by
91 * passing NULL here. */
92 if (unlikely(!cb))
93 return;
94
95 /* there is no support for ARB_uniform_buffer_object */
96 assert(cb->buffer == NULL && cb->user_buffer != NULL);
97
98 ctx->dirty |= ETNA_DIRTY_CONSTBUF;
99 }
100
101 static void
102 etna_update_render_resource(struct pipe_context *pctx, struct pipe_resource *pres)
103 {
104 struct etna_resource *res = etna_resource(pres);
105
106 if (res->texture && etna_resource_older(res, etna_resource(res->texture))) {
107 /* The render buffer is older than the texture buffer. Copy it over. */
108 etna_copy_resource(pctx, pres, res->texture, 0, pres->last_level);
109 res->seqno = etna_resource(res->texture)->seqno;
110 }
111 }
112
113 static void
114 etna_set_framebuffer_state(struct pipe_context *pctx,
115 const struct pipe_framebuffer_state *sv)
116 {
117 struct etna_context *ctx = etna_context(pctx);
118 struct compiled_framebuffer_state *cs = &ctx->framebuffer;
119 int nr_samples_color = -1;
120 int nr_samples_depth = -1;
121
122 /* Set up TS as well. Warning: this state is used by both the RS and PE */
123 uint32_t ts_mem_config = 0;
124
125 if (sv->nr_cbufs > 0) { /* at least one color buffer? */
126 struct etna_surface *cbuf = etna_surface(sv->cbufs[0]);
127 struct etna_resource *res = etna_resource(cbuf->base.texture);
128 bool color_supertiled = (res->layout & ETNA_LAYOUT_BIT_SUPER) != 0;
129
130 assert(res->layout & ETNA_LAYOUT_BIT_TILE); /* Cannot render to linear surfaces */
131 etna_update_render_resource(pctx, cbuf->base.texture);
132
133 pipe_surface_reference(&cs->cbuf, &cbuf->base);
134 cs->PE_COLOR_FORMAT =
135 VIVS_PE_COLOR_FORMAT_FORMAT(translate_rs_format(cbuf->base.format)) |
136 VIVS_PE_COLOR_FORMAT_COMPONENTS__MASK |
137 VIVS_PE_COLOR_FORMAT_OVERWRITE |
138 COND(color_supertiled, VIVS_PE_COLOR_FORMAT_SUPER_TILED);
139 /* VIVS_PE_COLOR_FORMAT_COMPONENTS() and
140 * VIVS_PE_COLOR_FORMAT_OVERWRITE comes from blend_state
141 * but only if we set the bits above. */
142 /* merged with depth_stencil_alpha */
143 if ((cbuf->surf.offset & 63) ||
144 (((cbuf->surf.stride * 4) & 63) && cbuf->surf.height > 4)) {
145 /* XXX Must make temporary surface here.
146 * Need the same mechanism on gc2000 when we want to do mipmap
147 * generation by
148 * rendering to levels > 1 due to multitiled / tiled conversion. */
149 BUG("Alignment error, trying to render to offset %08x with tile "
150 "stride %i",
151 cbuf->surf.offset, cbuf->surf.stride * 4);
152 }
153
154 if (ctx->specs.pixel_pipes == 1) {
155 cs->PE_COLOR_ADDR = cbuf->reloc[0];
156 cs->PE_COLOR_ADDR.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
157 } else {
158 /* Rendered textures must always be multi-tiled, or single-buffer mode must be supported */
159 assert((res->layout & ETNA_LAYOUT_BIT_MULTI) || ctx->specs.single_buffer);
160 for (int i = 0; i < ctx->specs.pixel_pipes; i++) {
161 cs->PE_PIPE_COLOR_ADDR[i] = cbuf->reloc[i];
162 cs->PE_PIPE_COLOR_ADDR[i].flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
163 }
164 }
165 cs->PE_COLOR_STRIDE = cbuf->surf.stride;
166
167 if (cbuf->surf.ts_size) {
168 ts_mem_config |= VIVS_TS_MEM_CONFIG_COLOR_FAST_CLEAR;
169 cs->TS_COLOR_CLEAR_VALUE = cbuf->level->clear_value;
170
171 cs->TS_COLOR_STATUS_BASE = cbuf->ts_reloc;
172 cs->TS_COLOR_STATUS_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
173
174 cs->TS_COLOR_SURFACE_BASE = cbuf->reloc[0];
175 cs->TS_COLOR_SURFACE_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
176 }
177
178 /* MSAA */
179 if (cbuf->base.texture->nr_samples > 1)
180 ts_mem_config |=
181 VIVS_TS_MEM_CONFIG_MSAA | translate_msaa_format(cbuf->base.format);
182
183 nr_samples_color = cbuf->base.texture->nr_samples;
184 } else {
185 pipe_surface_reference(&cs->cbuf, NULL);
186 /* Clearing VIVS_PE_COLOR_FORMAT_COMPONENTS__MASK and
187 * VIVS_PE_COLOR_FORMAT_OVERWRITE prevents us from overwriting the
188 * color target */
189 cs->PE_COLOR_FORMAT = 0;
190 cs->PE_COLOR_STRIDE = 0;
191 cs->TS_COLOR_STATUS_BASE.bo = NULL;
192 cs->TS_COLOR_SURFACE_BASE.bo = NULL;
193
194 for (int i = 0; i < ETNA_MAX_PIXELPIPES; i++)
195 cs->PE_PIPE_COLOR_ADDR[i].bo = NULL;
196 }
197
198 if (sv->zsbuf != NULL) {
199 struct etna_surface *zsbuf = etna_surface(sv->zsbuf);
200 struct etna_resource *res = etna_resource(zsbuf->base.texture);
201
202 etna_update_render_resource(pctx, zsbuf->base.texture);
203
204 pipe_surface_reference(&cs->zsbuf, &zsbuf->base);
205 assert(res->layout &ETNA_LAYOUT_BIT_TILE); /* Cannot render to linear surfaces */
206
207 uint32_t depth_format = translate_depth_format(zsbuf->base.format);
208 unsigned depth_bits =
209 depth_format == VIVS_PE_DEPTH_CONFIG_DEPTH_FORMAT_D16 ? 16 : 24;
210 bool depth_supertiled = (res->layout & ETNA_LAYOUT_BIT_SUPER) != 0;
211
212 cs->PE_DEPTH_CONFIG =
213 depth_format |
214 COND(depth_supertiled, VIVS_PE_DEPTH_CONFIG_SUPER_TILED) |
215 VIVS_PE_DEPTH_CONFIG_DEPTH_MODE_Z;
216 /* VIVS_PE_DEPTH_CONFIG_ONLY_DEPTH */
217 /* merged with depth_stencil_alpha */
218
219 if (ctx->specs.pixel_pipes == 1) {
220 cs->PE_DEPTH_ADDR = zsbuf->reloc[0];
221 cs->PE_DEPTH_ADDR.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
222 } else {
223 for (int i = 0; i < ctx->specs.pixel_pipes; i++) {
224 cs->PE_PIPE_DEPTH_ADDR[i] = zsbuf->reloc[i];
225 cs->PE_PIPE_DEPTH_ADDR[i].flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
226 }
227 }
228
229 cs->PE_DEPTH_STRIDE = zsbuf->surf.stride;
230 cs->PE_HDEPTH_CONTROL = VIVS_PE_HDEPTH_CONTROL_FORMAT_DISABLED;
231 cs->PE_DEPTH_NORMALIZE = fui(exp2f(depth_bits) - 1.0f);
232
233 if (zsbuf->surf.ts_size) {
234 ts_mem_config |= VIVS_TS_MEM_CONFIG_DEPTH_FAST_CLEAR;
235 cs->TS_DEPTH_CLEAR_VALUE = zsbuf->level->clear_value;
236
237 cs->TS_DEPTH_STATUS_BASE = zsbuf->ts_reloc;
238 cs->TS_DEPTH_STATUS_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
239
240 cs->TS_DEPTH_SURFACE_BASE = zsbuf->reloc[0];
241 cs->TS_DEPTH_SURFACE_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
242 }
243
244 ts_mem_config |= COND(depth_bits == 16, VIVS_TS_MEM_CONFIG_DEPTH_16BPP);
245
246 /* MSAA */
247 if (zsbuf->base.texture->nr_samples > 1)
248 /* XXX VIVS_TS_MEM_CONFIG_DEPTH_COMPRESSION;
249 * Disable without MSAA for now, as it causes corruption in glquake. */
250 ts_mem_config |= VIVS_TS_MEM_CONFIG_DEPTH_COMPRESSION;
251
252 nr_samples_depth = zsbuf->base.texture->nr_samples;
253 } else {
254 pipe_surface_reference(&cs->zsbuf, NULL);
255 cs->PE_DEPTH_CONFIG = VIVS_PE_DEPTH_CONFIG_DEPTH_MODE_NONE;
256 cs->PE_DEPTH_ADDR.bo = NULL;
257 cs->PE_DEPTH_STRIDE = 0;
258 cs->TS_DEPTH_STATUS_BASE.bo = NULL;
259 cs->TS_DEPTH_SURFACE_BASE.bo = NULL;
260
261 for (int i = 0; i < ETNA_MAX_PIXELPIPES; i++)
262 cs->PE_PIPE_DEPTH_ADDR[i].bo = NULL;
263 }
264
265 /* MSAA setup */
266 if (nr_samples_depth != -1 && nr_samples_color != -1 &&
267 nr_samples_depth != nr_samples_color) {
268 BUG("Number of samples in color and depth texture must match (%i and %i respectively)",
269 nr_samples_color, nr_samples_depth);
270 }
271
272 switch (MAX2(nr_samples_depth, nr_samples_color)) {
273 case 0:
274 case 1: /* Are 0 and 1 samples allowed? */
275 cs->GL_MULTI_SAMPLE_CONFIG =
276 VIVS_GL_MULTI_SAMPLE_CONFIG_MSAA_SAMPLES_NONE;
277 cs->msaa_mode = false;
278 break;
279 case 2:
280 cs->GL_MULTI_SAMPLE_CONFIG = VIVS_GL_MULTI_SAMPLE_CONFIG_MSAA_SAMPLES_2X;
281 cs->msaa_mode = true; /* Add input to PS */
282 cs->RA_MULTISAMPLE_UNK00E04 = 0x0;
283 cs->RA_MULTISAMPLE_UNK00E10[0] = 0x0000aa22;
284 cs->RA_CENTROID_TABLE[0] = 0x66aa2288;
285 cs->RA_CENTROID_TABLE[1] = 0x88558800;
286 cs->RA_CENTROID_TABLE[2] = 0x88881100;
287 cs->RA_CENTROID_TABLE[3] = 0x33888800;
288 break;
289 case 4:
290 cs->GL_MULTI_SAMPLE_CONFIG = VIVS_GL_MULTI_SAMPLE_CONFIG_MSAA_SAMPLES_4X;
291 cs->msaa_mode = true; /* Add input to PS */
292 cs->RA_MULTISAMPLE_UNK00E04 = 0x0;
293 cs->RA_MULTISAMPLE_UNK00E10[0] = 0xeaa26e26;
294 cs->RA_MULTISAMPLE_UNK00E10[1] = 0xe6ae622a;
295 cs->RA_MULTISAMPLE_UNK00E10[2] = 0xaaa22a22;
296 cs->RA_CENTROID_TABLE[0] = 0x4a6e2688;
297 cs->RA_CENTROID_TABLE[1] = 0x888888a2;
298 cs->RA_CENTROID_TABLE[2] = 0x888888ea;
299 cs->RA_CENTROID_TABLE[3] = 0x888888c6;
300 cs->RA_CENTROID_TABLE[4] = 0x46622a88;
301 cs->RA_CENTROID_TABLE[5] = 0x888888ae;
302 cs->RA_CENTROID_TABLE[6] = 0x888888e6;
303 cs->RA_CENTROID_TABLE[7] = 0x888888ca;
304 cs->RA_CENTROID_TABLE[8] = 0x262a2288;
305 cs->RA_CENTROID_TABLE[9] = 0x886688a2;
306 cs->RA_CENTROID_TABLE[10] = 0x888866aa;
307 cs->RA_CENTROID_TABLE[11] = 0x668888a6;
308 break;
309 }
310
311 /* Scissor setup */
312 cs->SE_SCISSOR_LEFT = 0; /* affected by rasterizer and scissor state as well */
313 cs->SE_SCISSOR_TOP = 0;
314 cs->SE_SCISSOR_RIGHT = (sv->width << 16) + ETNA_SE_SCISSOR_MARGIN_RIGHT;
315 cs->SE_SCISSOR_BOTTOM = (sv->height << 16) + ETNA_SE_SCISSOR_MARGIN_BOTTOM;
316 cs->SE_CLIP_RIGHT = (sv->width << 16) + ETNA_SE_CLIP_MARGIN_RIGHT;
317 cs->SE_CLIP_BOTTOM = (sv->height << 16) + ETNA_SE_CLIP_MARGIN_BOTTOM;
318
319 cs->TS_MEM_CONFIG = ts_mem_config;
320
321 /* Single buffer setup. There is only one switch for this, not a separate
322 * one per color buffer / depth buffer. To keep the logic simple always use
323 * single buffer when this feature is available.
324 */
325 cs->PE_LOGIC_OP = VIVS_PE_LOGIC_OP_SINGLE_BUFFER(ctx->specs.single_buffer ? 2 : 0);
326
327 ctx->framebuffer_s = *sv; /* keep copy of original structure */
328 ctx->dirty |= ETNA_DIRTY_FRAMEBUFFER;
329 }
330
/**
 * pipe_context::set_polygon_stipple hook. The stipple pattern is ignored;
 * this function has no effect.
 */
static void
etna_set_polygon_stipple(struct pipe_context *pctx,
                         const struct pipe_poly_stipple *stipple)
{
   /* NOP */
   (void)pctx;
   (void)stipple;
}
337
338 static void
339 etna_set_scissor_states(struct pipe_context *pctx, unsigned start_slot,
340 unsigned num_scissors, const struct pipe_scissor_state *ss)
341 {
342 struct etna_context *ctx = etna_context(pctx);
343 struct compiled_scissor_state *cs = &ctx->scissor;
344 assert(ss->minx <= ss->maxx);
345 assert(ss->miny <= ss->maxy);
346
347 /* note that this state is only used when rasterizer_state->scissor is on */
348 ctx->scissor_s = *ss;
349 cs->SE_SCISSOR_LEFT = (ss->minx << 16);
350 cs->SE_SCISSOR_TOP = (ss->miny << 16);
351 cs->SE_SCISSOR_RIGHT = (ss->maxx << 16) + ETNA_SE_SCISSOR_MARGIN_RIGHT;
352 cs->SE_SCISSOR_BOTTOM = (ss->maxy << 16) + ETNA_SE_SCISSOR_MARGIN_BOTTOM;
353 cs->SE_CLIP_RIGHT = (ss->maxx << 16) + ETNA_SE_CLIP_MARGIN_RIGHT;
354 cs->SE_CLIP_BOTTOM = (ss->maxy << 16) + ETNA_SE_CLIP_MARGIN_BOTTOM;
355
356 ctx->dirty |= ETNA_DIRTY_SCISSOR;
357 }
358
359 static void
360 etna_set_viewport_states(struct pipe_context *pctx, unsigned start_slot,
361 unsigned num_scissors, const struct pipe_viewport_state *vs)
362 {
363 struct etna_context *ctx = etna_context(pctx);
364 struct compiled_viewport_state *cs = &ctx->viewport;
365
366 ctx->viewport_s = *vs;
367 /**
368 * For Vivante GPU, viewport z transformation is 0..1 to 0..1 instead of
369 * -1..1 to 0..1.
370 * scaling and translation to 0..1 already happened, so remove that
371 *
372 * z' = (z * 2 - 1) * scale + translate
373 * = z * (2 * scale) + (translate - scale)
374 *
375 * scale' = 2 * scale
376 * translate' = translate - scale
377 */
378
379 /* must be fixp as v4 state deltas assume it is */
380 cs->PA_VIEWPORT_SCALE_X = etna_f32_to_fixp16(vs->scale[0]);
381 cs->PA_VIEWPORT_SCALE_Y = etna_f32_to_fixp16(vs->scale[1]);
382 cs->PA_VIEWPORT_SCALE_Z = fui(vs->scale[2] * 2.0f);
383 cs->PA_VIEWPORT_OFFSET_X = etna_f32_to_fixp16(vs->translate[0]);
384 cs->PA_VIEWPORT_OFFSET_Y = etna_f32_to_fixp16(vs->translate[1]);
385 cs->PA_VIEWPORT_OFFSET_Z = fui(vs->translate[2] - vs->scale[2]);
386
387 /* Compute scissor rectangle (fixp) from viewport.
388 * Make sure left is always < right and top always < bottom.
389 */
390 cs->SE_SCISSOR_LEFT = etna_f32_to_fixp16(MAX2(vs->translate[0] - fabsf(vs->scale[0]), 0.0f));
391 cs->SE_SCISSOR_TOP = etna_f32_to_fixp16(MAX2(vs->translate[1] - fabsf(vs->scale[1]), 0.0f));
392 uint32_t right_fixp = etna_f32_to_fixp16(MAX2(vs->translate[0] + fabsf(vs->scale[0]), 0.0f));
393 uint32_t bottom_fixp = etna_f32_to_fixp16(MAX2(vs->translate[1] + fabsf(vs->scale[1]), 0.0f));
394 cs->SE_SCISSOR_RIGHT = right_fixp + ETNA_SE_SCISSOR_MARGIN_RIGHT;
395 cs->SE_SCISSOR_BOTTOM = bottom_fixp + ETNA_SE_SCISSOR_MARGIN_BOTTOM;
396 cs->SE_CLIP_RIGHT = right_fixp + ETNA_SE_CLIP_MARGIN_RIGHT;
397 cs->SE_CLIP_BOTTOM = bottom_fixp + ETNA_SE_CLIP_MARGIN_BOTTOM;
398
399 cs->PE_DEPTH_NEAR = fui(0.0); /* not affected if depth mode is Z (as in GL) */
400 cs->PE_DEPTH_FAR = fui(1.0);
401 ctx->dirty |= ETNA_DIRTY_VIEWPORT;
402 }
403
404 static void
405 etna_set_vertex_buffers(struct pipe_context *pctx, unsigned start_slot,
406 unsigned num_buffers, const struct pipe_vertex_buffer *vb)
407 {
408 struct etna_context *ctx = etna_context(pctx);
409 struct etna_vertexbuf_state *so = &ctx->vertex_buffer;
410
411 util_set_vertex_buffers_mask(so->vb, &so->enabled_mask, vb, start_slot, num_buffers);
412 so->count = util_last_bit(so->enabled_mask);
413
414 for (unsigned idx = start_slot; idx < start_slot + num_buffers; ++idx) {
415 struct compiled_set_vertex_buffer *cs = &so->cvb[idx];
416 struct pipe_vertex_buffer *vbi = &so->vb[idx];
417
418 assert(!vbi->is_user_buffer); /* XXX support user_buffer using
419 etna_usermem_map */
420
421 if (vbi->buffer.resource) { /* GPU buffer */
422 cs->FE_VERTEX_STREAM_BASE_ADDR.bo = etna_resource(vbi->buffer.resource)->bo;
423 cs->FE_VERTEX_STREAM_BASE_ADDR.offset = vbi->buffer_offset;
424 cs->FE_VERTEX_STREAM_BASE_ADDR.flags = ETNA_RELOC_READ;
425 cs->FE_VERTEX_STREAM_CONTROL =
426 FE_VERTEX_STREAM_CONTROL_VERTEX_STRIDE(vbi->stride);
427 } else {
428 cs->FE_VERTEX_STREAM_BASE_ADDR.bo = NULL;
429 cs->FE_VERTEX_STREAM_CONTROL = 0;
430 }
431 }
432
433 ctx->dirty |= ETNA_DIRTY_VERTEX_BUFFERS;
434 }
435
436 static void
437 etna_blend_state_bind(struct pipe_context *pctx, void *bs)
438 {
439 struct etna_context *ctx = etna_context(pctx);
440
441 ctx->blend = bs;
442 ctx->dirty |= ETNA_DIRTY_BLEND;
443 }
444
/** Release a blend state object by handing it to FREE(). */
static void
etna_blend_state_delete(struct pipe_context *pctx, void *bs)
{
   (void)pctx; /* the context is not needed to free the object */
   FREE(bs);
}
450
451 static void
452 etna_rasterizer_state_bind(struct pipe_context *pctx, void *rs)
453 {
454 struct etna_context *ctx = etna_context(pctx);
455
456 ctx->rasterizer = rs;
457 ctx->dirty |= ETNA_DIRTY_RASTERIZER;
458 }
459
/** Release a rasterizer state object by handing it to FREE(). */
static void
etna_rasterizer_state_delete(struct pipe_context *pctx, void *rs)
{
   (void)pctx; /* the context is not needed to free the object */
   FREE(rs);
}
465
466 static void
467 etna_zsa_state_bind(struct pipe_context *pctx, void *zs)
468 {
469 struct etna_context *ctx = etna_context(pctx);
470
471 ctx->zsa = zs;
472 ctx->dirty |= ETNA_DIRTY_ZSA;
473 }
474
/** Release a depth/stencil/alpha state object by handing it to FREE(). */
static void
etna_zsa_state_delete(struct pipe_context *pctx, void *zs)
{
   (void)pctx; /* the context is not needed to free the object */
   FREE(zs);
}
480
481 /** Create vertex element states, which define a layout for fetching
482 * vertices for rendering.
483 */
484 static void *
485 etna_vertex_elements_state_create(struct pipe_context *pctx,
486 unsigned num_elements, const struct pipe_vertex_element *elements)
487 {
488 struct etna_context *ctx = etna_context(pctx);
489 struct compiled_vertex_elements_state *cs = CALLOC_STRUCT(compiled_vertex_elements_state);
490
491 if (!cs)
492 return NULL;
493
494 if (num_elements > ctx->specs.vertex_max_elements) {
495 BUG("number of elements (%u) exceeds chip maximum (%u)", num_elements,
496 ctx->specs.vertex_max_elements);
497 return NULL;
498 }
499
500 /* XXX could minimize number of consecutive stretches here by sorting, and
501 * permuting the inputs in shader or does Mesa do this already? */
502
503 /* Check that vertex element binding is compatible with hardware; thus
504 * elements[idx].vertex_buffer_index are < stream_count. If not, the binding
505 * uses more streams than is supported, and u_vbuf should have done some
506 * reorganization for compatibility. */
507
508 /* TODO: does mesa this for us? */
509 bool incompatible = false;
510 for (unsigned idx = 0; idx < num_elements; ++idx) {
511 if (elements[idx].vertex_buffer_index >= ctx->specs.stream_count || elements[idx].instance_divisor > 0)
512 incompatible = true;
513 }
514
515 cs->num_elements = num_elements;
516 if (incompatible || num_elements == 0) {
517 DBG("Error: zero vertex elements, or more vertex buffers used than supported");
518 FREE(cs);
519 return NULL;
520 }
521
522 unsigned start_offset = 0; /* start of current consecutive stretch */
523 bool nonconsecutive = true; /* previous value of nonconsecutive */
524
525 for (unsigned idx = 0; idx < num_elements; ++idx) {
526 unsigned element_size = util_format_get_blocksize(elements[idx].src_format);
527 unsigned end_offset = elements[idx].src_offset + element_size;
528 uint32_t format_type, normalize;
529
530 if (nonconsecutive)
531 start_offset = elements[idx].src_offset;
532
533 /* maximum vertex size is 256 bytes */
534 assert(element_size != 0 && end_offset <= 256);
535
536 /* check whether next element is consecutive to this one */
537 nonconsecutive = (idx == (num_elements - 1)) ||
538 elements[idx + 1].vertex_buffer_index != elements[idx].vertex_buffer_index ||
539 end_offset != elements[idx + 1].src_offset;
540
541 format_type = translate_vertex_format_type(elements[idx].src_format);
542 normalize = translate_vertex_format_normalize(elements[idx].src_format);
543
544 assert(format_type != ETNA_NO_MATCH);
545 assert(normalize != ETNA_NO_MATCH);
546
547 cs->FE_VERTEX_ELEMENT_CONFIG[idx] =
548 COND(nonconsecutive, VIVS_FE_VERTEX_ELEMENT_CONFIG_NONCONSECUTIVE) |
549 format_type |
550 VIVS_FE_VERTEX_ELEMENT_CONFIG_NUM(util_format_get_nr_components(elements[idx].src_format)) |
551 normalize | VIVS_FE_VERTEX_ELEMENT_CONFIG_ENDIAN(ENDIAN_MODE_NO_SWAP) |
552 VIVS_FE_VERTEX_ELEMENT_CONFIG_STREAM(elements[idx].vertex_buffer_index) |
553 VIVS_FE_VERTEX_ELEMENT_CONFIG_START(elements[idx].src_offset) |
554 VIVS_FE_VERTEX_ELEMENT_CONFIG_END(end_offset - start_offset);
555 }
556
557 return cs;
558 }
559
/** Release a vertex elements state object by handing it to FREE(). */
static void
etna_vertex_elements_state_delete(struct pipe_context *pctx, void *ve)
{
   (void)pctx; /* the context is not needed to free the object */
   FREE(ve);
}
565
566 static void
567 etna_vertex_elements_state_bind(struct pipe_context *pctx, void *ve)
568 {
569 struct etna_context *ctx = etna_context(pctx);
570
571 ctx->vertex_elements = ve;
572 ctx->dirty |= ETNA_DIRTY_VERTEX_ELEMENTS;
573 }
574
/**
 * One entry of the derived-state update table: a callback together with the
 * set of dirty bits that trigger it.
 */
struct etna_state_updater {
   /* Update callback; a false return aborts etna_state_update(). */
   bool (*update)(struct etna_context *ctx);
   /* Mask of ETNA_DIRTY_* bits; the callback runs if any of them is set. */
   uint32_t dirty;
};
579
580 static const struct etna_state_updater etna_state_updates[] = {
581 {
582 etna_shader_update_vertex, ETNA_DIRTY_SHADER | ETNA_DIRTY_VERTEX_ELEMENTS,
583 },
584 {
585 etna_shader_link, ETNA_DIRTY_SHADER,
586 },
587 {
588 etna_update_blend, ETNA_DIRTY_BLEND | ETNA_DIRTY_FRAMEBUFFER
589 },
590 {
591 etna_update_blend_color, ETNA_DIRTY_BLEND_COLOR | ETNA_DIRTY_FRAMEBUFFER,
592 }
593 };
594
595 bool
596 etna_state_update(struct etna_context *ctx)
597 {
598 for (unsigned int i = 0; i < ARRAY_SIZE(etna_state_updates); i++)
599 if (ctx->dirty & etna_state_updates[i].dirty)
600 if (!etna_state_updates[i].update(ctx))
601 return false;
602
603 return true;
604 }
605
606 void
607 etna_state_init(struct pipe_context *pctx)
608 {
609 pctx->set_blend_color = etna_set_blend_color;
610 pctx->set_stencil_ref = etna_set_stencil_ref;
611 pctx->set_clip_state = etna_set_clip_state;
612 pctx->set_sample_mask = etna_set_sample_mask;
613 pctx->set_constant_buffer = etna_set_constant_buffer;
614 pctx->set_framebuffer_state = etna_set_framebuffer_state;
615 pctx->set_polygon_stipple = etna_set_polygon_stipple;
616 pctx->set_scissor_states = etna_set_scissor_states;
617 pctx->set_viewport_states = etna_set_viewport_states;
618
619 pctx->set_vertex_buffers = etna_set_vertex_buffers;
620
621 pctx->bind_blend_state = etna_blend_state_bind;
622 pctx->delete_blend_state = etna_blend_state_delete;
623
624 pctx->bind_rasterizer_state = etna_rasterizer_state_bind;
625 pctx->delete_rasterizer_state = etna_rasterizer_state_delete;
626
627 pctx->bind_depth_stencil_alpha_state = etna_zsa_state_bind;
628 pctx->delete_depth_stencil_alpha_state = etna_zsa_state_delete;
629
630 pctx->create_vertex_elements_state = etna_vertex_elements_state_create;
631 pctx->delete_vertex_elements_state = etna_vertex_elements_state_delete;
632 pctx->bind_vertex_elements_state = etna_vertex_elements_state_bind;
633 }