panfrost: Move streamout offset update out of panfrost_draw_vbo()
[mesa.git] / src / gallium / drivers / panfrost / pan_context.c
1 /*
2 * © Copyright 2018 Alyssa Rosenzweig
3 * Copyright © 2014-2017 Broadcom
4 * Copyright (C) 2017 Intel Corporation
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice (including the next
14 * paragraph) shall be included in all copies or substantial portions of the
15 * Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23 * SOFTWARE.
24 *
25 */
26
27 #include <sys/poll.h>
28 #include <errno.h>
29
30 #include "pan_bo.h"
31 #include "pan_context.h"
32 #include "pan_minmax_cache.h"
33 #include "panfrost-quirks.h"
34
35 #include "util/macros.h"
36 #include "util/format/u_format.h"
37 #include "util/u_inlines.h"
38 #include "util/u_upload_mgr.h"
39 #include "util/u_memory.h"
40 #include "util/u_vbuf.h"
41 #include "util/half_float.h"
42 #include "util/u_helpers.h"
43 #include "util/format/u_format.h"
44 #include "util/u_prim.h"
45 #include "util/u_prim_restart.h"
46 #include "indices/u_primconvert.h"
47 #include "tgsi/tgsi_parse.h"
48 #include "tgsi/tgsi_from_mesa.h"
49 #include "util/u_math.h"
50
51 #include "pan_screen.h"
52 #include "pan_blending.h"
53 #include "pan_blend_shaders.h"
54 #include "pan_cmdstream.h"
55 #include "pan_util.h"
56 #include "pandecode/decode.h"
57
58 struct midgard_tiler_descriptor
59 panfrost_emit_midg_tiler(struct panfrost_batch *batch, unsigned vertex_count)
60 {
61 struct panfrost_screen *screen = pan_screen(batch->ctx->base.screen);
62 bool hierarchy = !(screen->quirks & MIDGARD_NO_HIER_TILING);
63 struct midgard_tiler_descriptor t = {0};
64 unsigned height = batch->key.height;
65 unsigned width = batch->key.width;
66
67 t.hierarchy_mask =
68 panfrost_choose_hierarchy_mask(width, height, vertex_count, hierarchy);
69
70 /* Compute the polygon header size and use that to offset the body */
71
72 unsigned header_size = panfrost_tiler_header_size(
73 width, height, t.hierarchy_mask, hierarchy);
74
75 t.polygon_list_size = panfrost_tiler_full_size(
76 width, height, t.hierarchy_mask, hierarchy);
77
78 /* Sanity check */
79
80 if (vertex_count) {
81 struct panfrost_bo *tiler_heap;
82
83 tiler_heap = panfrost_batch_get_tiler_heap(batch);
84 t.polygon_list = panfrost_batch_get_polygon_list(batch,
85 header_size +
86 t.polygon_list_size);
87
88
89 /* Allow the entire tiler heap */
90 t.heap_start = tiler_heap->gpu;
91 t.heap_end = tiler_heap->gpu + tiler_heap->size;
92 } else {
93 struct panfrost_bo *tiler_dummy;
94
95 tiler_dummy = panfrost_batch_get_tiler_dummy(batch);
96 header_size = MALI_TILER_MINIMUM_HEADER_SIZE;
97
98 /* The tiler is disabled, so don't allow the tiler heap */
99 t.heap_start = tiler_dummy->gpu;
100 t.heap_end = t.heap_start;
101
102 /* Use a dummy polygon list */
103 t.polygon_list = tiler_dummy->gpu;
104
105 /* Disable the tiler */
106 if (hierarchy)
107 t.hierarchy_mask |= MALI_TILER_DISABLED;
108 else {
109 t.hierarchy_mask = MALI_TILER_USER;
110 t.polygon_list_size = MALI_TILER_MINIMUM_HEADER_SIZE + 4;
111
112 /* We don't have a WRITE_VALUE job, so write the polygon list manually */
113 uint32_t *polygon_list_body = (uint32_t *) (tiler_dummy->cpu + header_size);
114 polygon_list_body[0] = 0xa0000000; /* TODO: Just that? */
115 }
116 }
117
118 t.polygon_list_body =
119 t.polygon_list + header_size;
120
121 return t;
122 }
123
124 static void
125 panfrost_clear(
126 struct pipe_context *pipe,
127 unsigned buffers,
128 const union pipe_color_union *color,
129 double depth, unsigned stencil)
130 {
131 struct panfrost_context *ctx = pan_context(pipe);
132
133 /* TODO: panfrost_get_fresh_batch_for_fbo() instantiates a new batch if
134 * the existing batch targeting this FBO has draws. We could probably
135 * avoid that by replacing plain clears by quad-draws with a specific
136 * color/depth/stencil value, thus avoiding the generation of extra
137 * fragment jobs.
138 */
139 struct panfrost_batch *batch = panfrost_get_fresh_batch_for_fbo(ctx);
140
141 panfrost_batch_add_fbo_bos(batch);
142 panfrost_batch_clear(batch, buffers, color, depth, stencil);
143 }
144
145 /* Reset per-frame context, called on context initialisation as well as after
146 * flushing a frame */
147
148 void
149 panfrost_invalidate_frame(struct panfrost_context *ctx)
150 {
151 for (unsigned i = 0; i < PIPE_SHADER_TYPES; ++i)
152 ctx->payloads[i].postfix.shared_memory = 0;
153
154 /* TODO: When does this need to be handled? */
155 ctx->active_queries = true;
156 }
157
158 /* In practice, every field of these payloads should be configurable
159 * arbitrarily, which means these functions are basically catch-all's for
160 * as-of-yet unwavering unknowns */
161
162 static void
163 panfrost_emit_vertex_payload(struct panfrost_context *ctx)
164 {
165 /* 0x2 bit clear on 32-bit T6XX */
166
167 struct midgard_payload_vertex_tiler payload = {
168 .gl_enables = 0x4 | 0x2,
169 };
170
171 /* Vertex and compute are closely coupled, so share a payload */
172
173 memcpy(&ctx->payloads[PIPE_SHADER_VERTEX], &payload, sizeof(payload));
174 memcpy(&ctx->payloads[PIPE_SHADER_COMPUTE], &payload, sizeof(payload));
175 }
176
177 bool
178 panfrost_writes_point_size(struct panfrost_context *ctx)
179 {
180 assert(ctx->shader[PIPE_SHADER_VERTEX]);
181 struct panfrost_shader_state *vs = panfrost_get_shader_state(ctx, PIPE_SHADER_VERTEX);
182
183 return vs->writes_point_size && ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.draw_mode == MALI_POINTS;
184 }
185
186 void
187 panfrost_vertex_state_upd_attr_offs(struct panfrost_context *ctx,
188 struct midgard_payload_vertex_tiler *vp)
189 {
190 if (!ctx->vertex)
191 return;
192
193 struct panfrost_vertex_state *so = ctx->vertex;
194
195 /* Fixup offsets for the second pass. Recall that the hardware
196 * calculates attribute addresses as:
197 *
198 * addr = base + (stride * vtx) + src_offset;
199 *
200 * However, on Mali, base must be aligned to 64-bytes, so we
201 * instead let:
202 *
203 * base' = base & ~63 = base - (base & 63)
204 *
205 * To compensate when using base' (see emit_vertex_data), we have
206 * to adjust src_offset by the masked off piece:
207 *
208 * addr' = base' + (stride * vtx) + (src_offset + (base & 63))
209 * = base - (base & 63) + (stride * vtx) + src_offset + (base & 63)
210 * = base + (stride * vtx) + src_offset
211 * = addr;
212 *
213 * QED.
214 */
215
216 unsigned start = vp->offset_start;
217
218 for (unsigned i = 0; i < so->num_elements; ++i) {
219 unsigned vbi = so->pipe[i].vertex_buffer_index;
220 struct pipe_vertex_buffer *buf = &ctx->vertex_buffers[vbi];
221
222 /* Adjust by the masked off bits of the offset. Make sure we
223 * read src_offset from so->hw (which is not GPU visible)
224 * rather than target (which is) due to caching effects */
225
226 unsigned src_offset = so->pipe[i].src_offset;
227
228 /* BOs aligned to 4k so guaranteed aligned to 64 */
229 src_offset += (buf->buffer_offset & 63);
230
231 /* Also, somewhat obscurely per-instance data needs to be
232 * offset in response to a delayed start in an indexed draw */
233
234 if (so->pipe[i].instance_divisor && ctx->instance_count > 1 && start)
235 src_offset -= buf->stride * start;
236
237 so->hw[i].src_offset = src_offset;
238 }
239 }
240
241 /* Compute number of UBOs active (more specifically, compute the highest UBO
242 * number addressable -- if there are gaps, include them in the count anyway).
243 * We always include UBO #0 in the count, since we *need* uniforms enabled for
244 * sysvals. */
245
246 unsigned
247 panfrost_ubo_count(struct panfrost_context *ctx, enum pipe_shader_type stage)
248 {
249 unsigned mask = ctx->constant_buffer[stage].enabled_mask | 1;
250 return 32 - __builtin_clz(mask);
251 }
252
253 /* Go through dirty flags and actualise them in the cmdstream. */
254
255 static void
256 panfrost_emit_for_draw(struct panfrost_context *ctx)
257 {
258 struct panfrost_batch *batch = panfrost_get_batch_for_fbo(ctx);
259
260 panfrost_batch_add_fbo_bos(batch);
261
262 for (int i = 0; i <= PIPE_SHADER_FRAGMENT; ++i)
263 panfrost_vt_attach_framebuffer(ctx, &ctx->payloads[i]);
264
265 panfrost_emit_vertex_data(batch);
266
267 /* Varyings emitted for -all- geometry */
268 unsigned total_count = ctx->padded_count * ctx->instance_count;
269 panfrost_emit_varying_descriptor(ctx, total_count);
270
271 panfrost_batch_set_requirements(batch);
272
273 panfrost_vt_update_rasterizer(ctx, &ctx->payloads[PIPE_SHADER_FRAGMENT]);
274 panfrost_vt_update_occlusion_query(ctx, &ctx->payloads[PIPE_SHADER_FRAGMENT]);
275
276 panfrost_emit_shader_meta(batch, PIPE_SHADER_VERTEX,
277 &ctx->payloads[PIPE_SHADER_VERTEX]);
278 panfrost_emit_shader_meta(batch, PIPE_SHADER_FRAGMENT,
279 &ctx->payloads[PIPE_SHADER_FRAGMENT]);
280
281 panfrost_emit_vertex_attr_meta(batch,
282 &ctx->payloads[PIPE_SHADER_VERTEX]);
283
284 for (int i = 0; i <= PIPE_SHADER_FRAGMENT; ++i) {
285 panfrost_emit_sampler_descriptors(batch, i, &ctx->payloads[i]);
286 panfrost_emit_texture_descriptors(batch, i, &ctx->payloads[i]);
287 panfrost_emit_const_buf(batch, i, &ctx->payloads[i]);
288 }
289
290 /* TODO: Upload the viewport somewhere more appropriate */
291
292 panfrost_emit_viewport(batch, &ctx->payloads[PIPE_SHADER_FRAGMENT]);
293 }
294
295 /* Corresponds to exactly one draw, but does not submit anything */
296
297 static void
298 panfrost_queue_draw(struct panfrost_context *ctx)
299 {
300 /* Handle dirty flags now */
301 panfrost_emit_for_draw(ctx);
302
303 struct panfrost_batch *batch = panfrost_get_batch_for_fbo(ctx);
304
305 panfrost_emit_vertex_tiler_jobs(batch,
306 &ctx->payloads[PIPE_SHADER_VERTEX],
307 &ctx->payloads[PIPE_SHADER_FRAGMENT]);
308 panfrost_batch_adjust_stack_size(batch);
309 }
310
311 /* The entire frame is in memory -- send it off to the kernel! */
312
313 void
314 panfrost_flush(
315 struct pipe_context *pipe,
316 struct pipe_fence_handle **fence,
317 unsigned flags)
318 {
319 struct panfrost_context *ctx = pan_context(pipe);
320 struct util_dynarray fences;
321
322 /* We must collect the fences before the flush is done, otherwise we'll
323 * lose track of them.
324 */
325 if (fence) {
326 util_dynarray_init(&fences, NULL);
327 hash_table_foreach(ctx->batches, hentry) {
328 struct panfrost_batch *batch = hentry->data;
329
330 panfrost_batch_fence_reference(batch->out_sync);
331 util_dynarray_append(&fences,
332 struct panfrost_batch_fence *,
333 batch->out_sync);
334 }
335 }
336
337 /* Submit all pending jobs */
338 panfrost_flush_all_batches(ctx, false);
339
340 if (fence) {
341 struct panfrost_fence *f = panfrost_fence_create(ctx, &fences);
342 pipe->screen->fence_reference(pipe->screen, fence, NULL);
343 *fence = (struct pipe_fence_handle *)f;
344
345 util_dynarray_foreach(&fences, struct panfrost_batch_fence *, fence)
346 panfrost_batch_fence_unreference(*fence);
347
348 util_dynarray_fini(&fences);
349 }
350
351 if (pan_debug & PAN_DBG_TRACE)
352 pandecode_next_frame();
353 }
354
355 #define DEFINE_CASE(c) case PIPE_PRIM_##c: return MALI_##c;
356
357 static int
358 g2m_draw_mode(enum pipe_prim_type mode)
359 {
360 switch (mode) {
361 DEFINE_CASE(POINTS);
362 DEFINE_CASE(LINES);
363 DEFINE_CASE(LINE_LOOP);
364 DEFINE_CASE(LINE_STRIP);
365 DEFINE_CASE(TRIANGLES);
366 DEFINE_CASE(TRIANGLE_STRIP);
367 DEFINE_CASE(TRIANGLE_FAN);
368 DEFINE_CASE(QUADS);
369 DEFINE_CASE(QUAD_STRIP);
370 DEFINE_CASE(POLYGON);
371
372 default:
373 unreachable("Invalid draw mode");
374 }
375 }
376
377 #undef DEFINE_CASE
378
379 static unsigned
380 panfrost_translate_index_size(unsigned size)
381 {
382 switch (size) {
383 case 1:
384 return MALI_DRAW_INDEXED_UINT8;
385
386 case 2:
387 return MALI_DRAW_INDEXED_UINT16;
388
389 case 4:
390 return MALI_DRAW_INDEXED_UINT32;
391
392 default:
393 unreachable("Invalid index size");
394 }
395 }
396
397 /* Gets a GPU address for the associated index buffer. Only gauranteed to be
398 * good for the duration of the draw (transient), could last longer. Also get
399 * the bounds on the index buffer for the range accessed by the draw. We do
400 * these operations together because there are natural optimizations which
401 * require them to be together. */
402
403 static mali_ptr
404 panfrost_get_index_buffer_bounded(struct panfrost_context *ctx, const struct pipe_draw_info *info, unsigned *min_index, unsigned *max_index)
405 {
406 struct panfrost_resource *rsrc = (struct panfrost_resource *) (info->index.resource);
407
408 off_t offset = info->start * info->index_size;
409 struct panfrost_batch *batch = panfrost_get_batch_for_fbo(ctx);
410 mali_ptr out = 0;
411
412 bool needs_indices = true;
413
414 if (info->max_index != ~0u) {
415 *min_index = info->min_index;
416 *max_index = info->max_index;
417 needs_indices = false;
418 }
419
420 if (!info->has_user_indices) {
421 /* Only resources can be directly mapped */
422 panfrost_batch_add_bo(batch, rsrc->bo,
423 PAN_BO_ACCESS_SHARED |
424 PAN_BO_ACCESS_READ |
425 PAN_BO_ACCESS_VERTEX_TILER);
426 out = rsrc->bo->gpu + offset;
427
428 /* Check the cache */
429 needs_indices = !panfrost_minmax_cache_get(rsrc->index_cache, info->start, info->count,
430 min_index, max_index);
431 } else {
432 /* Otherwise, we need to upload to transient memory */
433 const uint8_t *ibuf8 = (const uint8_t *) info->index.user;
434 out = panfrost_upload_transient(batch, ibuf8 + offset, info->count * info->index_size);
435 }
436
437 if (needs_indices) {
438 /* Fallback */
439 u_vbuf_get_minmax_index(&ctx->base, info, min_index, max_index);
440
441 if (!info->has_user_indices) {
442 panfrost_minmax_cache_add(rsrc->index_cache, info->start, info->count,
443 *min_index, *max_index);
444 }
445 }
446
447
448 return out;
449 }
450
451 static bool
452 panfrost_scissor_culls_everything(struct panfrost_context *ctx)
453 {
454 const struct pipe_scissor_state *ss = &ctx->scissor;
455
456 /* Check if we're scissoring at all */
457
458 if (!(ctx->rasterizer && ctx->rasterizer->base.scissor))
459 return false;
460
461 return (ss->minx == ss->maxx) || (ss->miny == ss->maxy);
462 }
463
464 /* Count generated primitives (when there is no geom/tess shaders) for
465 * transform feedback */
466
467 static void
468 panfrost_statistics_record(
469 struct panfrost_context *ctx,
470 const struct pipe_draw_info *info)
471 {
472 if (!ctx->active_queries)
473 return;
474
475 uint32_t prims = u_prims_for_vertices(info->mode, info->count);
476 ctx->prims_generated += prims;
477
478 if (!ctx->streamout.num_targets)
479 return;
480
481 ctx->tf_prims_generated += prims;
482 }
483
484 static void
485 panfrost_update_streamout_offsets(struct panfrost_context *ctx)
486 {
487 for (unsigned i = 0; i < ctx->streamout.num_targets; ++i) {
488 unsigned count;
489
490 count = u_stream_outputs_for_vertices(ctx->active_prim,
491 ctx->vertex_count);
492 ctx->streamout.offsets[i] += count;
493 }
494 }
495
496 static void
497 panfrost_draw_vbo(
498 struct pipe_context *pipe,
499 const struct pipe_draw_info *info)
500 {
501 struct panfrost_context *ctx = pan_context(pipe);
502
503 /* First of all, check the scissor to see if anything is drawn at all.
504 * If it's not, we drop the draw (mostly a conformance issue;
505 * well-behaved apps shouldn't hit this) */
506
507 if (panfrost_scissor_culls_everything(ctx))
508 return;
509
510 int mode = info->mode;
511
512 /* Fallback unsupported restart index */
513 unsigned primitive_index = (1 << (info->index_size * 8)) - 1;
514
515 if (info->primitive_restart && info->index_size
516 && info->restart_index != primitive_index) {
517 util_draw_vbo_without_prim_restart(pipe, info);
518 return;
519 }
520
521 /* Fallback for unsupported modes */
522
523 assert(ctx->rasterizer != NULL);
524
525 if (!(ctx->draw_modes & (1 << mode))) {
526 if (mode == PIPE_PRIM_QUADS && info->count == 4 && !ctx->rasterizer->base.flatshade) {
527 mode = PIPE_PRIM_TRIANGLE_FAN;
528 } else {
529 if (info->count < 4) {
530 /* Degenerate case? */
531 return;
532 }
533
534 util_primconvert_save_rasterizer_state(ctx->primconvert, &ctx->rasterizer->base);
535 util_primconvert_draw_vbo(ctx->primconvert, info);
536 return;
537 }
538 }
539
540 ctx->payloads[PIPE_SHADER_VERTEX].offset_start = info->start;
541 ctx->payloads[PIPE_SHADER_FRAGMENT].offset_start = info->start;
542
543 /* Now that we have a guaranteed terminating path, find the job.
544 * Assignment commented out to prevent unused warning */
545
546 /* struct panfrost_batch *batch = */ panfrost_get_batch_for_fbo(ctx);
547
548 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.draw_mode = g2m_draw_mode(mode);
549
550 /* Take into account a negative bias */
551 ctx->vertex_count = info->count + abs(info->index_bias);
552 ctx->instance_count = info->instance_count;
553 ctx->active_prim = info->mode;
554
555 /* For non-indexed draws, they're the same */
556 unsigned vertex_count = ctx->vertex_count;
557
558 unsigned draw_flags = 0;
559
560 /* The draw flags interpret how primitive size is interpreted */
561
562 if (panfrost_writes_point_size(ctx))
563 draw_flags |= MALI_DRAW_VARYING_SIZE;
564
565 if (info->primitive_restart)
566 draw_flags |= MALI_DRAW_PRIMITIVE_RESTART_FIXED_INDEX;
567
568 /* These doesn't make much sense */
569
570 draw_flags |= 0x3000;
571
572 if (ctx->rasterizer && ctx->rasterizer->base.flatshade_first)
573 draw_flags |= MALI_DRAW_FLATSHADE_FIRST;
574
575 panfrost_statistics_record(ctx, info);
576
577 if (info->index_size) {
578 unsigned min_index = 0, max_index = 0;
579 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.indices =
580 panfrost_get_index_buffer_bounded(ctx, info, &min_index, &max_index);
581
582 /* Use the corresponding values */
583 vertex_count = max_index - min_index + 1;
584 ctx->payloads[PIPE_SHADER_VERTEX].offset_start = min_index + info->index_bias;
585 ctx->payloads[PIPE_SHADER_FRAGMENT].offset_start = min_index + info->index_bias;
586
587 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.offset_bias_correction = -min_index;
588 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.index_count = MALI_POSITIVE(info->count);
589
590 draw_flags |= panfrost_translate_index_size(info->index_size);
591 } else {
592 /* Index count == vertex count, if no indexing is applied, as
593 * if it is internally indexed in the expected order */
594
595 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.offset_bias_correction = 0;
596 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.index_count = MALI_POSITIVE(ctx->vertex_count);
597
598 /* Reverse index state */
599 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.indices = (mali_ptr) 0;
600 }
601
602 /* Dispatch "compute jobs" for the vertex/tiler pair as (1,
603 * vertex_count, 1) */
604
605 panfrost_pack_work_groups_fused(
606 &ctx->payloads[PIPE_SHADER_VERTEX].prefix,
607 &ctx->payloads[PIPE_SHADER_FRAGMENT].prefix,
608 1, vertex_count, info->instance_count,
609 1, 1, 1);
610
611 ctx->payloads[PIPE_SHADER_FRAGMENT].prefix.unknown_draw = draw_flags;
612
613 /* Encode the padded vertex count */
614
615 if (info->instance_count > 1) {
616 ctx->padded_count = panfrost_padded_vertex_count(vertex_count);
617
618 unsigned shift = __builtin_ctz(ctx->padded_count);
619 unsigned k = ctx->padded_count >> (shift + 1);
620
621 ctx->payloads[PIPE_SHADER_VERTEX].instance_shift = shift;
622 ctx->payloads[PIPE_SHADER_FRAGMENT].instance_shift = shift;
623
624 ctx->payloads[PIPE_SHADER_VERTEX].instance_odd = k;
625 ctx->payloads[PIPE_SHADER_FRAGMENT].instance_odd = k;
626 } else {
627 ctx->padded_count = vertex_count;
628
629 /* Reset instancing state */
630 ctx->payloads[PIPE_SHADER_VERTEX].instance_shift = 0;
631 ctx->payloads[PIPE_SHADER_VERTEX].instance_odd = 0;
632 ctx->payloads[PIPE_SHADER_FRAGMENT].instance_shift = 0;
633 ctx->payloads[PIPE_SHADER_FRAGMENT].instance_odd = 0;
634 }
635
636 /* Fire off the draw itself */
637 panfrost_queue_draw(ctx);
638
639 /* Increment transform feedback offsets */
640 panfrost_update_streamout_offsets(ctx);
641 }
642
643 /* CSO state */
644
645 static void
646 panfrost_generic_cso_delete(struct pipe_context *pctx, void *hwcso)
647 {
648 free(hwcso);
649 }
650
651 static void *
652 panfrost_create_rasterizer_state(
653 struct pipe_context *pctx,
654 const struct pipe_rasterizer_state *cso)
655 {
656 struct panfrost_rasterizer *so = CALLOC_STRUCT(panfrost_rasterizer);
657
658 so->base = *cso;
659
660 return so;
661 }
662
663 static void
664 panfrost_bind_rasterizer_state(
665 struct pipe_context *pctx,
666 void *hwcso)
667 {
668 struct panfrost_context *ctx = pan_context(pctx);
669
670 ctx->rasterizer = hwcso;
671
672 if (!hwcso)
673 return;
674
675 /* Gauranteed with the core GL call, so don't expose ARB_polygon_offset */
676 assert(ctx->rasterizer->base.offset_clamp == 0.0);
677
678 /* Point sprites are emulated */
679
680 struct panfrost_shader_state *variant = panfrost_get_shader_state(ctx, PIPE_SHADER_FRAGMENT);
681
682 if (ctx->rasterizer->base.sprite_coord_enable || (variant && variant->point_sprite_mask))
683 ctx->base.bind_fs_state(&ctx->base, ctx->shader[PIPE_SHADER_FRAGMENT]);
684 }
685
686 static void *
687 panfrost_create_vertex_elements_state(
688 struct pipe_context *pctx,
689 unsigned num_elements,
690 const struct pipe_vertex_element *elements)
691 {
692 struct panfrost_vertex_state *so = CALLOC_STRUCT(panfrost_vertex_state);
693
694 so->num_elements = num_elements;
695 memcpy(so->pipe, elements, sizeof(*elements) * num_elements);
696
697 for (int i = 0; i < num_elements; ++i) {
698 so->hw[i].index = i;
699
700 enum pipe_format fmt = elements[i].src_format;
701 const struct util_format_description *desc = util_format_description(fmt);
702 so->hw[i].unknown1 = 0x2;
703 so->hw[i].swizzle = panfrost_get_default_swizzle(desc->nr_channels);
704
705 so->hw[i].format = panfrost_find_format(desc);
706 }
707
708 /* Let's also prepare vertex builtins */
709 so->hw[PAN_VERTEX_ID].format = MALI_R32UI;
710 so->hw[PAN_VERTEX_ID].swizzle = panfrost_get_default_swizzle(1);
711 so->hw[PAN_INSTANCE_ID].format = MALI_R32UI;
712 so->hw[PAN_INSTANCE_ID].swizzle = panfrost_get_default_swizzle(1);
713
714 return so;
715 }
716
717 static void
718 panfrost_bind_vertex_elements_state(
719 struct pipe_context *pctx,
720 void *hwcso)
721 {
722 struct panfrost_context *ctx = pan_context(pctx);
723 ctx->vertex = hwcso;
724 }
725
726 static void *
727 panfrost_create_shader_state(
728 struct pipe_context *pctx,
729 const struct pipe_shader_state *cso,
730 enum pipe_shader_type stage)
731 {
732 struct panfrost_shader_variants *so = CALLOC_STRUCT(panfrost_shader_variants);
733 so->base = *cso;
734
735 /* Token deep copy to prevent memory corruption */
736
737 if (cso->type == PIPE_SHADER_IR_TGSI)
738 so->base.tokens = tgsi_dup_tokens(so->base.tokens);
739
740 /* Precompile for shader-db if we need to */
741 if (unlikely((pan_debug & PAN_DBG_PRECOMPILE) && cso->type == PIPE_SHADER_IR_NIR)) {
742 struct panfrost_context *ctx = pan_context(pctx);
743
744 struct panfrost_shader_state state;
745 uint64_t outputs_written;
746
747 panfrost_shader_compile(ctx, PIPE_SHADER_IR_NIR,
748 so->base.ir.nir,
749 tgsi_processor_to_shader_stage(stage),
750 &state, &outputs_written);
751 }
752
753 return so;
754 }
755
756 static void
757 panfrost_delete_shader_state(
758 struct pipe_context *pctx,
759 void *so)
760 {
761 struct panfrost_shader_variants *cso = (struct panfrost_shader_variants *) so;
762
763 if (cso->base.type == PIPE_SHADER_IR_TGSI) {
764 DBG("Deleting TGSI shader leaks duplicated tokens\n");
765 }
766
767 for (unsigned i = 0; i < cso->variant_count; ++i) {
768 struct panfrost_shader_state *shader_state = &cso->variants[i];
769 panfrost_bo_unreference(shader_state->bo);
770 shader_state->bo = NULL;
771 }
772 free(cso->variants);
773
774 free(so);
775 }
776
777 static void *
778 panfrost_create_sampler_state(
779 struct pipe_context *pctx,
780 const struct pipe_sampler_state *cso)
781 {
782 struct panfrost_sampler_state *so = CALLOC_STRUCT(panfrost_sampler_state);
783 so->base = *cso;
784
785 panfrost_sampler_desc_init(cso, &so->hw);
786
787 return so;
788 }
789
790 static void
791 panfrost_bind_sampler_states(
792 struct pipe_context *pctx,
793 enum pipe_shader_type shader,
794 unsigned start_slot, unsigned num_sampler,
795 void **sampler)
796 {
797 assert(start_slot == 0);
798
799 struct panfrost_context *ctx = pan_context(pctx);
800
801 /* XXX: Should upload, not just copy? */
802 ctx->sampler_count[shader] = num_sampler;
803 memcpy(ctx->samplers[shader], sampler, num_sampler * sizeof (void *));
804 }
805
806 static bool
807 panfrost_variant_matches(
808 struct panfrost_context *ctx,
809 struct panfrost_shader_state *variant,
810 enum pipe_shader_type type)
811 {
812 struct pipe_rasterizer_state *rasterizer = &ctx->rasterizer->base;
813 struct pipe_alpha_state *alpha = &ctx->depth_stencil->alpha;
814
815 bool is_fragment = (type == PIPE_SHADER_FRAGMENT);
816
817 if (is_fragment && (alpha->enabled || variant->alpha_state.enabled)) {
818 /* Make sure enable state is at least the same */
819 if (alpha->enabled != variant->alpha_state.enabled) {
820 return false;
821 }
822
823 /* Check that the contents of the test are the same */
824 bool same_func = alpha->func == variant->alpha_state.func;
825 bool same_ref = alpha->ref_value == variant->alpha_state.ref_value;
826
827 if (!(same_func && same_ref)) {
828 return false;
829 }
830 }
831
832 if (is_fragment && rasterizer && (rasterizer->sprite_coord_enable |
833 variant->point_sprite_mask)) {
834 /* Ensure the same varyings are turned to point sprites */
835 if (rasterizer->sprite_coord_enable != variant->point_sprite_mask)
836 return false;
837
838 /* Ensure the orientation is correct */
839 bool upper_left =
840 rasterizer->sprite_coord_mode ==
841 PIPE_SPRITE_COORD_UPPER_LEFT;
842
843 if (variant->point_sprite_upper_left != upper_left)
844 return false;
845 }
846
847 /* Otherwise, we're good to go */
848 return true;
849 }
850
851 /**
852 * Fix an uncompiled shader's stream output info, and produce a bitmask
853 * of which VARYING_SLOT_* are captured for stream output.
854 *
855 * Core Gallium stores output->register_index as a "slot" number, where
856 * slots are assigned consecutively to all outputs in info->outputs_written.
857 * This naive packing of outputs doesn't work for us - we too have slots,
858 * but the layout is defined by the VUE map, which we won't have until we
859 * compile a specific shader variant. So, we remap these and simply store
860 * VARYING_SLOT_* in our copy's output->register_index fields.
861 *
862 * We then produce a bitmask of outputs which are used for SO.
863 *
864 * Implementation from iris.
865 */
866
867 static uint64_t
868 update_so_info(struct pipe_stream_output_info *so_info,
869 uint64_t outputs_written)
870 {
871 uint64_t so_outputs = 0;
872 uint8_t reverse_map[64] = {0};
873 unsigned slot = 0;
874
875 while (outputs_written)
876 reverse_map[slot++] = u_bit_scan64(&outputs_written);
877
878 for (unsigned i = 0; i < so_info->num_outputs; i++) {
879 struct pipe_stream_output *output = &so_info->output[i];
880
881 /* Map Gallium's condensed "slots" back to real VARYING_SLOT_* enums */
882 output->register_index = reverse_map[output->register_index];
883
884 so_outputs |= 1ull << output->register_index;
885 }
886
887 return so_outputs;
888 }
889
890 static void
891 panfrost_bind_shader_state(
892 struct pipe_context *pctx,
893 void *hwcso,
894 enum pipe_shader_type type)
895 {
896 struct panfrost_context *ctx = pan_context(pctx);
897 ctx->shader[type] = hwcso;
898
899 if (!hwcso) return;
900
901 /* Match the appropriate variant */
902
903 signed variant = -1;
904 struct panfrost_shader_variants *variants = (struct panfrost_shader_variants *) hwcso;
905
906 for (unsigned i = 0; i < variants->variant_count; ++i) {
907 if (panfrost_variant_matches(ctx, &variants->variants[i], type)) {
908 variant = i;
909 break;
910 }
911 }
912
913 if (variant == -1) {
914 /* No variant matched, so create a new one */
915 variant = variants->variant_count++;
916
917 if (variants->variant_count > variants->variant_space) {
918 unsigned old_space = variants->variant_space;
919
920 variants->variant_space *= 2;
921 if (variants->variant_space == 0)
922 variants->variant_space = 1;
923
924 /* Arbitrary limit to stop runaway programs from
925 * creating an unbounded number of shader variants. */
926 assert(variants->variant_space < 1024);
927
928 unsigned msize = sizeof(struct panfrost_shader_state);
929 variants->variants = realloc(variants->variants,
930 variants->variant_space * msize);
931
932 memset(&variants->variants[old_space], 0,
933 (variants->variant_space - old_space) * msize);
934 }
935
936 struct panfrost_shader_state *v =
937 &variants->variants[variant];
938
939 if (type == PIPE_SHADER_FRAGMENT) {
940 v->alpha_state = ctx->depth_stencil->alpha;
941
942 if (ctx->rasterizer) {
943 v->point_sprite_mask = ctx->rasterizer->base.sprite_coord_enable;
944 v->point_sprite_upper_left =
945 ctx->rasterizer->base.sprite_coord_mode ==
946 PIPE_SPRITE_COORD_UPPER_LEFT;
947 }
948 }
949 }
950
951 /* Select this variant */
952 variants->active_variant = variant;
953
954 struct panfrost_shader_state *shader_state = &variants->variants[variant];
955 assert(panfrost_variant_matches(ctx, shader_state, type));
956
957 /* We finally have a variant, so compile it */
958
959 if (!shader_state->compiled) {
960 uint64_t outputs_written = 0;
961
962 panfrost_shader_compile(ctx, variants->base.type,
963 variants->base.type == PIPE_SHADER_IR_NIR ?
964 variants->base.ir.nir :
965 variants->base.tokens,
966 tgsi_processor_to_shader_stage(type),
967 shader_state,
968 &outputs_written);
969
970 shader_state->compiled = true;
971
972 /* Fixup the stream out information, since what Gallium returns
973 * normally is mildly insane */
974
975 shader_state->stream_output = variants->base.stream_output;
976 shader_state->so_mask =
977 update_so_info(&shader_state->stream_output, outputs_written);
978 }
979 }
980
981 static void *
982 panfrost_create_vs_state(struct pipe_context *pctx, const struct pipe_shader_state *hwcso)
983 {
984 return panfrost_create_shader_state(pctx, hwcso, PIPE_SHADER_VERTEX);
985 }
986
987 static void *
988 panfrost_create_fs_state(struct pipe_context *pctx, const struct pipe_shader_state *hwcso)
989 {
990 return panfrost_create_shader_state(pctx, hwcso, PIPE_SHADER_FRAGMENT);
991 }
992
993 static void
994 panfrost_bind_vs_state(struct pipe_context *pctx, void *hwcso)
995 {
996 panfrost_bind_shader_state(pctx, hwcso, PIPE_SHADER_VERTEX);
997 }
998
999 static void
1000 panfrost_bind_fs_state(struct pipe_context *pctx, void *hwcso)
1001 {
1002 panfrost_bind_shader_state(pctx, hwcso, PIPE_SHADER_FRAGMENT);
1003 }
1004
1005 static void
1006 panfrost_set_vertex_buffers(
1007 struct pipe_context *pctx,
1008 unsigned start_slot,
1009 unsigned num_buffers,
1010 const struct pipe_vertex_buffer *buffers)
1011 {
1012 struct panfrost_context *ctx = pan_context(pctx);
1013
1014 util_set_vertex_buffers_mask(ctx->vertex_buffers, &ctx->vb_mask, buffers, start_slot, num_buffers);
1015 }
1016
1017 static void
1018 panfrost_set_constant_buffer(
1019 struct pipe_context *pctx,
1020 enum pipe_shader_type shader, uint index,
1021 const struct pipe_constant_buffer *buf)
1022 {
1023 struct panfrost_context *ctx = pan_context(pctx);
1024 struct panfrost_constant_buffer *pbuf = &ctx->constant_buffer[shader];
1025
1026 util_copy_constant_buffer(&pbuf->cb[index], buf);
1027
1028 unsigned mask = (1 << index);
1029
1030 if (unlikely(!buf)) {
1031 pbuf->enabled_mask &= ~mask;
1032 pbuf->dirty_mask &= ~mask;
1033 return;
1034 }
1035
1036 pbuf->enabled_mask |= mask;
1037 pbuf->dirty_mask |= mask;
1038 }
1039
1040 static void
1041 panfrost_set_stencil_ref(
1042 struct pipe_context *pctx,
1043 const struct pipe_stencil_ref *ref)
1044 {
1045 struct panfrost_context *ctx = pan_context(pctx);
1046 ctx->stencil_ref = *ref;
1047 }
1048
1049 static enum mali_texture_type
1050 panfrost_translate_texture_type(enum pipe_texture_target t) {
1051 switch (t)
1052 {
1053 case PIPE_BUFFER:
1054 case PIPE_TEXTURE_1D:
1055 case PIPE_TEXTURE_1D_ARRAY:
1056 return MALI_TEX_1D;
1057
1058 case PIPE_TEXTURE_2D:
1059 case PIPE_TEXTURE_2D_ARRAY:
1060 case PIPE_TEXTURE_RECT:
1061 return MALI_TEX_2D;
1062
1063 case PIPE_TEXTURE_3D:
1064 return MALI_TEX_3D;
1065
1066 case PIPE_TEXTURE_CUBE:
1067 case PIPE_TEXTURE_CUBE_ARRAY:
1068 return MALI_TEX_CUBE;
1069
1070 default:
1071 unreachable("Unknown target");
1072 }
1073 }
1074
1075 static struct pipe_sampler_view *
1076 panfrost_create_sampler_view(
1077 struct pipe_context *pctx,
1078 struct pipe_resource *texture,
1079 const struct pipe_sampler_view *template)
1080 {
1081 struct panfrost_screen *screen = pan_screen(pctx->screen);
1082 struct panfrost_sampler_view *so = rzalloc(pctx, struct panfrost_sampler_view);
1083
1084 pipe_reference(NULL, &texture->reference);
1085
1086 struct panfrost_resource *prsrc = (struct panfrost_resource *) texture;
1087 assert(prsrc->bo);
1088
1089 so->base = *template;
1090 so->base.texture = texture;
1091 so->base.reference.count = 1;
1092 so->base.context = pctx;
1093
1094 unsigned char user_swizzle[4] = {
1095 template->swizzle_r,
1096 template->swizzle_g,
1097 template->swizzle_b,
1098 template->swizzle_a
1099 };
1100
1101 /* In the hardware, array_size refers specifically to array textures,
1102 * whereas in Gallium, it also covers cubemaps */
1103
1104 unsigned array_size = texture->array_size;
1105
1106 if (template->target == PIPE_TEXTURE_CUBE) {
1107 /* TODO: Cubemap arrays */
1108 assert(array_size == 6);
1109 array_size /= 6;
1110 }
1111
1112 enum mali_texture_type type =
1113 panfrost_translate_texture_type(template->target);
1114
1115 unsigned size = panfrost_estimate_texture_size(
1116 template->u.tex.first_level,
1117 template->u.tex.last_level,
1118 template->u.tex.first_layer,
1119 template->u.tex.last_layer,
1120 type, prsrc->layout);
1121
1122 so->bo = panfrost_bo_create(screen, size, 0);
1123
1124 panfrost_new_texture(
1125 so->bo->cpu,
1126 texture->width0, texture->height0,
1127 texture->depth0, array_size,
1128 template->format,
1129 type, prsrc->layout,
1130 template->u.tex.first_level,
1131 template->u.tex.last_level,
1132 template->u.tex.first_layer,
1133 template->u.tex.last_layer,
1134 prsrc->cubemap_stride,
1135 panfrost_translate_swizzle_4(user_swizzle),
1136 prsrc->bo->gpu,
1137 prsrc->slices);
1138
1139 return (struct pipe_sampler_view *) so;
1140 }
1141
1142 static void
1143 panfrost_set_sampler_views(
1144 struct pipe_context *pctx,
1145 enum pipe_shader_type shader,
1146 unsigned start_slot, unsigned num_views,
1147 struct pipe_sampler_view **views)
1148 {
1149 struct panfrost_context *ctx = pan_context(pctx);
1150 unsigned new_nr = 0;
1151 unsigned i;
1152
1153 assert(start_slot == 0);
1154
1155 for (i = 0; i < num_views; ++i) {
1156 if (views[i])
1157 new_nr = i + 1;
1158 pipe_sampler_view_reference((struct pipe_sampler_view **)&ctx->sampler_views[shader][i],
1159 views[i]);
1160 }
1161
1162 for (; i < ctx->sampler_view_count[shader]; i++) {
1163 pipe_sampler_view_reference((struct pipe_sampler_view **)&ctx->sampler_views[shader][i],
1164 NULL);
1165 }
1166 ctx->sampler_view_count[shader] = new_nr;
1167 }
1168
1169 static void
1170 panfrost_sampler_view_destroy(
1171 struct pipe_context *pctx,
1172 struct pipe_sampler_view *pview)
1173 {
1174 struct panfrost_sampler_view *view = (struct panfrost_sampler_view *) pview;
1175
1176 pipe_resource_reference(&pview->texture, NULL);
1177 panfrost_bo_unreference(view->bo);
1178 ralloc_free(view);
1179 }
1180
1181 static void
1182 panfrost_set_shader_buffers(
1183 struct pipe_context *pctx,
1184 enum pipe_shader_type shader,
1185 unsigned start, unsigned count,
1186 const struct pipe_shader_buffer *buffers,
1187 unsigned writable_bitmask)
1188 {
1189 struct panfrost_context *ctx = pan_context(pctx);
1190
1191 util_set_shader_buffers_mask(ctx->ssbo[shader], &ctx->ssbo_mask[shader],
1192 buffers, start, count);
1193 }
1194
1195 /* Hints that a framebuffer should use AFBC where possible */
1196
1197 static void
1198 panfrost_hint_afbc(
1199 struct panfrost_screen *screen,
1200 const struct pipe_framebuffer_state *fb)
1201 {
1202 /* AFBC implemenation incomplete; hide it */
1203 if (!(pan_debug & PAN_DBG_AFBC)) return;
1204
1205 /* Hint AFBC to the resources bound to each color buffer */
1206
1207 for (unsigned i = 0; i < fb->nr_cbufs; ++i) {
1208 struct pipe_surface *surf = fb->cbufs[i];
1209 struct panfrost_resource *rsrc = pan_resource(surf->texture);
1210 panfrost_resource_hint_layout(screen, rsrc, MALI_TEXTURE_AFBC, 1);
1211 }
1212
1213 /* Also hint it to the depth buffer */
1214
1215 if (fb->zsbuf) {
1216 struct panfrost_resource *rsrc = pan_resource(fb->zsbuf->texture);
1217 panfrost_resource_hint_layout(screen, rsrc, MALI_TEXTURE_AFBC, 1);
1218 }
1219 }
1220
1221 static void
1222 panfrost_set_framebuffer_state(struct pipe_context *pctx,
1223 const struct pipe_framebuffer_state *fb)
1224 {
1225 struct panfrost_context *ctx = pan_context(pctx);
1226
1227 panfrost_hint_afbc(pan_screen(pctx->screen), fb);
1228 util_copy_framebuffer_state(&ctx->pipe_framebuffer, fb);
1229 ctx->batch = NULL;
1230 panfrost_invalidate_frame(ctx);
1231 }
1232
1233 static void *
1234 panfrost_create_depth_stencil_state(struct pipe_context *pipe,
1235 const struct pipe_depth_stencil_alpha_state *depth_stencil)
1236 {
1237 return mem_dup(depth_stencil, sizeof(*depth_stencil));
1238 }
1239
1240 static void
1241 panfrost_bind_depth_stencil_state(struct pipe_context *pipe,
1242 void *cso)
1243 {
1244 struct panfrost_context *ctx = pan_context(pipe);
1245 struct pipe_depth_stencil_alpha_state *depth_stencil = cso;
1246 ctx->depth_stencil = depth_stencil;
1247
1248 if (!depth_stencil)
1249 return;
1250
1251 /* Alpha does not exist in the hardware (it's not in ES3), so it's
1252 * emulated in the fragment shader */
1253
1254 if (depth_stencil->alpha.enabled) {
1255 /* We need to trigger a new shader (maybe) */
1256 ctx->base.bind_fs_state(&ctx->base, ctx->shader[PIPE_SHADER_FRAGMENT]);
1257 }
1258
1259 /* Bounds test not implemented */
1260 assert(!depth_stencil->depth.bounds_test);
1261 }
1262
1263 static void
1264 panfrost_delete_depth_stencil_state(struct pipe_context *pipe, void *depth)
1265 {
1266 free( depth );
1267 }
1268
1269 static void
1270 panfrost_set_sample_mask(struct pipe_context *pipe,
1271 unsigned sample_mask)
1272 {
1273 }
1274
1275 static void
1276 panfrost_set_clip_state(struct pipe_context *pipe,
1277 const struct pipe_clip_state *clip)
1278 {
1279 //struct panfrost_context *panfrost = pan_context(pipe);
1280 }
1281
1282 static void
1283 panfrost_set_viewport_states(struct pipe_context *pipe,
1284 unsigned start_slot,
1285 unsigned num_viewports,
1286 const struct pipe_viewport_state *viewports)
1287 {
1288 struct panfrost_context *ctx = pan_context(pipe);
1289
1290 assert(start_slot == 0);
1291 assert(num_viewports == 1);
1292
1293 ctx->pipe_viewport = *viewports;
1294 }
1295
1296 static void
1297 panfrost_set_scissor_states(struct pipe_context *pipe,
1298 unsigned start_slot,
1299 unsigned num_scissors,
1300 const struct pipe_scissor_state *scissors)
1301 {
1302 struct panfrost_context *ctx = pan_context(pipe);
1303
1304 assert(start_slot == 0);
1305 assert(num_scissors == 1);
1306
1307 ctx->scissor = *scissors;
1308 }
1309
1310 static void
1311 panfrost_set_polygon_stipple(struct pipe_context *pipe,
1312 const struct pipe_poly_stipple *stipple)
1313 {
1314 //struct panfrost_context *panfrost = pan_context(pipe);
1315 }
1316
1317 static void
1318 panfrost_set_active_query_state(struct pipe_context *pipe,
1319 bool enable)
1320 {
1321 struct panfrost_context *ctx = pan_context(pipe);
1322 ctx->active_queries = enable;
1323 }
1324
1325 static void
1326 panfrost_destroy(struct pipe_context *pipe)
1327 {
1328 struct panfrost_context *panfrost = pan_context(pipe);
1329
1330 if (panfrost->blitter)
1331 util_blitter_destroy(panfrost->blitter);
1332
1333 if (panfrost->blitter_wallpaper)
1334 util_blitter_destroy(panfrost->blitter_wallpaper);
1335
1336 util_unreference_framebuffer_state(&panfrost->pipe_framebuffer);
1337 u_upload_destroy(pipe->stream_uploader);
1338
1339 ralloc_free(pipe);
1340 }
1341
1342 static struct pipe_query *
1343 panfrost_create_query(struct pipe_context *pipe,
1344 unsigned type,
1345 unsigned index)
1346 {
1347 struct panfrost_query *q = rzalloc(pipe, struct panfrost_query);
1348
1349 q->type = type;
1350 q->index = index;
1351
1352 return (struct pipe_query *) q;
1353 }
1354
1355 static void
1356 panfrost_destroy_query(struct pipe_context *pipe, struct pipe_query *q)
1357 {
1358 struct panfrost_query *query = (struct panfrost_query *) q;
1359
1360 if (query->bo) {
1361 panfrost_bo_unreference(query->bo);
1362 query->bo = NULL;
1363 }
1364
1365 ralloc_free(q);
1366 }
1367
1368 static bool
1369 panfrost_begin_query(struct pipe_context *pipe, struct pipe_query *q)
1370 {
1371 struct panfrost_context *ctx = pan_context(pipe);
1372 struct panfrost_query *query = (struct panfrost_query *) q;
1373
1374 switch (query->type) {
1375 case PIPE_QUERY_OCCLUSION_COUNTER:
1376 case PIPE_QUERY_OCCLUSION_PREDICATE:
1377 case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
1378 /* Allocate a bo for the query results to be stored */
1379 if (!query->bo) {
1380 query->bo = panfrost_bo_create(
1381 pan_screen(ctx->base.screen),
1382 sizeof(unsigned), 0);
1383 }
1384
1385 unsigned *result = (unsigned *)query->bo->cpu;
1386 *result = 0; /* Default to 0 if nothing at all drawn. */
1387 ctx->occlusion_query = query;
1388 break;
1389
1390 /* Geometry statistics are computed in the driver. XXX: geom/tess
1391 * shaders.. */
1392
1393 case PIPE_QUERY_PRIMITIVES_GENERATED:
1394 query->start = ctx->prims_generated;
1395 break;
1396 case PIPE_QUERY_PRIMITIVES_EMITTED:
1397 query->start = ctx->tf_prims_generated;
1398 break;
1399
1400 default:
1401 DBG("Skipping query %u\n", query->type);
1402 break;
1403 }
1404
1405 return true;
1406 }
1407
1408 static bool
1409 panfrost_end_query(struct pipe_context *pipe, struct pipe_query *q)
1410 {
1411 struct panfrost_context *ctx = pan_context(pipe);
1412 struct panfrost_query *query = (struct panfrost_query *) q;
1413
1414 switch (query->type) {
1415 case PIPE_QUERY_OCCLUSION_COUNTER:
1416 case PIPE_QUERY_OCCLUSION_PREDICATE:
1417 case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
1418 ctx->occlusion_query = NULL;
1419 break;
1420 case PIPE_QUERY_PRIMITIVES_GENERATED:
1421 query->end = ctx->prims_generated;
1422 break;
1423 case PIPE_QUERY_PRIMITIVES_EMITTED:
1424 query->end = ctx->tf_prims_generated;
1425 break;
1426 }
1427
1428 return true;
1429 }
1430
1431 static bool
1432 panfrost_get_query_result(struct pipe_context *pipe,
1433 struct pipe_query *q,
1434 bool wait,
1435 union pipe_query_result *vresult)
1436 {
1437 struct panfrost_query *query = (struct panfrost_query *) q;
1438 struct panfrost_context *ctx = pan_context(pipe);
1439
1440
1441 switch (query->type) {
1442 case PIPE_QUERY_OCCLUSION_COUNTER:
1443 case PIPE_QUERY_OCCLUSION_PREDICATE:
1444 case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
1445 /* Flush first */
1446 panfrost_flush_all_batches(ctx, true);
1447
1448 /* Read back the query results */
1449 unsigned *result = (unsigned *) query->bo->cpu;
1450 unsigned passed = *result;
1451
1452 if (query->type == PIPE_QUERY_OCCLUSION_COUNTER) {
1453 vresult->u64 = passed;
1454 } else {
1455 vresult->b = !!passed;
1456 }
1457
1458 break;
1459
1460 case PIPE_QUERY_PRIMITIVES_GENERATED:
1461 case PIPE_QUERY_PRIMITIVES_EMITTED:
1462 panfrost_flush_all_batches(ctx, true);
1463 vresult->u64 = query->end - query->start;
1464 break;
1465
1466 default:
1467 DBG("Skipped query get %u\n", query->type);
1468 break;
1469 }
1470
1471 return true;
1472 }
1473
1474 static struct pipe_stream_output_target *
1475 panfrost_create_stream_output_target(struct pipe_context *pctx,
1476 struct pipe_resource *prsc,
1477 unsigned buffer_offset,
1478 unsigned buffer_size)
1479 {
1480 struct pipe_stream_output_target *target;
1481
1482 target = rzalloc(pctx, struct pipe_stream_output_target);
1483
1484 if (!target)
1485 return NULL;
1486
1487 pipe_reference_init(&target->reference, 1);
1488 pipe_resource_reference(&target->buffer, prsc);
1489
1490 target->context = pctx;
1491 target->buffer_offset = buffer_offset;
1492 target->buffer_size = buffer_size;
1493
1494 return target;
1495 }
1496
1497 static void
1498 panfrost_stream_output_target_destroy(struct pipe_context *pctx,
1499 struct pipe_stream_output_target *target)
1500 {
1501 pipe_resource_reference(&target->buffer, NULL);
1502 ralloc_free(target);
1503 }
1504
1505 static void
1506 panfrost_set_stream_output_targets(struct pipe_context *pctx,
1507 unsigned num_targets,
1508 struct pipe_stream_output_target **targets,
1509 const unsigned *offsets)
1510 {
1511 struct panfrost_context *ctx = pan_context(pctx);
1512 struct panfrost_streamout *so = &ctx->streamout;
1513
1514 assert(num_targets <= ARRAY_SIZE(so->targets));
1515
1516 for (unsigned i = 0; i < num_targets; i++) {
1517 if (offsets[i] != -1)
1518 so->offsets[i] = offsets[i];
1519
1520 pipe_so_target_reference(&so->targets[i], targets[i]);
1521 }
1522
1523 for (unsigned i = 0; i < so->num_targets; i++)
1524 pipe_so_target_reference(&so->targets[i], NULL);
1525
1526 so->num_targets = num_targets;
1527 }
1528
1529 struct pipe_context *
1530 panfrost_create_context(struct pipe_screen *screen, void *priv, unsigned flags)
1531 {
1532 struct panfrost_context *ctx = rzalloc(screen, struct panfrost_context);
1533 struct pipe_context *gallium = (struct pipe_context *) ctx;
1534
1535 gallium->screen = screen;
1536
1537 gallium->destroy = panfrost_destroy;
1538
1539 gallium->set_framebuffer_state = panfrost_set_framebuffer_state;
1540
1541 gallium->flush = panfrost_flush;
1542 gallium->clear = panfrost_clear;
1543 gallium->draw_vbo = panfrost_draw_vbo;
1544
1545 gallium->set_vertex_buffers = panfrost_set_vertex_buffers;
1546 gallium->set_constant_buffer = panfrost_set_constant_buffer;
1547 gallium->set_shader_buffers = panfrost_set_shader_buffers;
1548
1549 gallium->set_stencil_ref = panfrost_set_stencil_ref;
1550
1551 gallium->create_sampler_view = panfrost_create_sampler_view;
1552 gallium->set_sampler_views = panfrost_set_sampler_views;
1553 gallium->sampler_view_destroy = panfrost_sampler_view_destroy;
1554
1555 gallium->create_rasterizer_state = panfrost_create_rasterizer_state;
1556 gallium->bind_rasterizer_state = panfrost_bind_rasterizer_state;
1557 gallium->delete_rasterizer_state = panfrost_generic_cso_delete;
1558
1559 gallium->create_vertex_elements_state = panfrost_create_vertex_elements_state;
1560 gallium->bind_vertex_elements_state = panfrost_bind_vertex_elements_state;
1561 gallium->delete_vertex_elements_state = panfrost_generic_cso_delete;
1562
1563 gallium->create_fs_state = panfrost_create_fs_state;
1564 gallium->delete_fs_state = panfrost_delete_shader_state;
1565 gallium->bind_fs_state = panfrost_bind_fs_state;
1566
1567 gallium->create_vs_state = panfrost_create_vs_state;
1568 gallium->delete_vs_state = panfrost_delete_shader_state;
1569 gallium->bind_vs_state = panfrost_bind_vs_state;
1570
1571 gallium->create_sampler_state = panfrost_create_sampler_state;
1572 gallium->delete_sampler_state = panfrost_generic_cso_delete;
1573 gallium->bind_sampler_states = panfrost_bind_sampler_states;
1574
1575 gallium->create_depth_stencil_alpha_state = panfrost_create_depth_stencil_state;
1576 gallium->bind_depth_stencil_alpha_state = panfrost_bind_depth_stencil_state;
1577 gallium->delete_depth_stencil_alpha_state = panfrost_delete_depth_stencil_state;
1578
1579 gallium->set_sample_mask = panfrost_set_sample_mask;
1580
1581 gallium->set_clip_state = panfrost_set_clip_state;
1582 gallium->set_viewport_states = panfrost_set_viewport_states;
1583 gallium->set_scissor_states = panfrost_set_scissor_states;
1584 gallium->set_polygon_stipple = panfrost_set_polygon_stipple;
1585 gallium->set_active_query_state = panfrost_set_active_query_state;
1586
1587 gallium->create_query = panfrost_create_query;
1588 gallium->destroy_query = panfrost_destroy_query;
1589 gallium->begin_query = panfrost_begin_query;
1590 gallium->end_query = panfrost_end_query;
1591 gallium->get_query_result = panfrost_get_query_result;
1592
1593 gallium->create_stream_output_target = panfrost_create_stream_output_target;
1594 gallium->stream_output_target_destroy = panfrost_stream_output_target_destroy;
1595 gallium->set_stream_output_targets = panfrost_set_stream_output_targets;
1596
1597 panfrost_resource_context_init(gallium);
1598 panfrost_blend_context_init(gallium);
1599 panfrost_compute_context_init(gallium);
1600
1601 /* XXX: leaks */
1602 gallium->stream_uploader = u_upload_create_default(gallium);
1603 gallium->const_uploader = gallium->stream_uploader;
1604 assert(gallium->stream_uploader);
1605
1606 /* Midgard supports ES modes, plus QUADS/QUAD_STRIPS/POLYGON */
1607 ctx->draw_modes = (1 << (PIPE_PRIM_POLYGON + 1)) - 1;
1608
1609 ctx->primconvert = util_primconvert_create(gallium, ctx->draw_modes);
1610
1611 ctx->blitter = util_blitter_create(gallium);
1612 ctx->blitter_wallpaper = util_blitter_create(gallium);
1613
1614 assert(ctx->blitter);
1615 assert(ctx->blitter_wallpaper);
1616
1617 /* Prepare for render! */
1618
1619 panfrost_batch_init(ctx);
1620 panfrost_emit_vertex_payload(ctx);
1621 panfrost_invalidate_frame(ctx);
1622
1623 return gallium;
1624 }