panfrost: Disable tiled formats on SFBD systems
[mesa.git] / src / gallium / drivers / panfrost / pan_resource.c
1 /*
2 * Copyright (C) 2008 VMware, Inc.
3 * Copyright (C) 2014 Broadcom
4 * Copyright (C) 2018-2019 Alyssa Rosenzweig
5 * Copyright (C) 2019 Collabora, Ltd.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the "Software"),
9 * to deal in the Software without restriction, including without limitation
10 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
11 * and/or sell copies of the Software, and to permit persons to whom the
12 * Software is furnished to do so, subject to the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the next
15 * paragraph) shall be included in all copies or substantial portions of the
16 * Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
21 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
23 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * SOFTWARE.
25 *
26 * Authors (Collabora):
27 * Tomeu Vizoso <tomeu.vizoso@collabora.com>
28 * Alyssa Rosenzweig <alyssa.rosenzweig@collabora.com>
29 *
30 */
31
32 #include <xf86drm.h>
33 #include <fcntl.h>
34 #include "drm-uapi/drm_fourcc.h"
35
36 #include "state_tracker/winsys_handle.h"
37 #include "util/u_format.h"
38 #include "util/u_memory.h"
39 #include "util/u_surface.h"
40 #include "util/u_transfer.h"
41 #include "util/u_transfer_helper.h"
42 #include "util/u_gen_mipmap.h"
43
44 #include "pan_context.h"
45 #include "pan_screen.h"
46 #include "pan_resource.h"
47 #include "pan_util.h"
48 #include "pan_tiling.h"
49
50 static struct pipe_resource *
51 panfrost_resource_from_handle(struct pipe_screen *pscreen,
52 const struct pipe_resource *templat,
53 struct winsys_handle *whandle,
54 unsigned usage)
55 {
56 struct panfrost_screen *screen = pan_screen(pscreen);
57 struct panfrost_resource *rsc;
58 struct pipe_resource *prsc;
59
60 assert(whandle->type == WINSYS_HANDLE_TYPE_FD);
61
62 rsc = rzalloc(pscreen, struct panfrost_resource);
63 if (!rsc)
64 return NULL;
65
66 prsc = &rsc->base;
67
68 *prsc = *templat;
69
70 pipe_reference_init(&prsc->reference, 1);
71 prsc->screen = pscreen;
72
73 rsc->bo = panfrost_drm_import_bo(screen, whandle->handle);
74 rsc->slices[0].stride = whandle->stride;
75 rsc->slices[0].initialized = true;
76
77 if (screen->ro) {
78 rsc->scanout =
79 renderonly_create_gpu_import_for_resource(prsc, screen->ro, NULL);
80 /* failure is expected in some cases.. */
81 }
82
83 return prsc;
84 }
85
86 static bool
87 panfrost_resource_get_handle(struct pipe_screen *pscreen,
88 struct pipe_context *ctx,
89 struct pipe_resource *pt,
90 struct winsys_handle *handle,
91 unsigned usage)
92 {
93 struct panfrost_screen *screen = pan_screen(pscreen);
94 struct panfrost_resource *rsrc = (struct panfrost_resource *) pt;
95 struct renderonly_scanout *scanout = rsrc->scanout;
96
97 handle->modifier = DRM_FORMAT_MOD_INVALID;
98
99 if (handle->type == WINSYS_HANDLE_TYPE_SHARED) {
100 return false;
101 } else if (handle->type == WINSYS_HANDLE_TYPE_KMS) {
102 if (renderonly_get_handle(scanout, handle))
103 return true;
104
105 handle->handle = rsrc->bo->gem_handle;
106 handle->stride = rsrc->slices[0].stride;
107 return TRUE;
108 } else if (handle->type == WINSYS_HANDLE_TYPE_FD) {
109 if (scanout) {
110 struct drm_prime_handle args = {
111 .handle = scanout->handle,
112 .flags = DRM_CLOEXEC,
113 };
114
115 int ret = drmIoctl(screen->ro->kms_fd, DRM_IOCTL_PRIME_HANDLE_TO_FD, &args);
116 if (ret == -1)
117 return false;
118
119 handle->stride = scanout->stride;
120 handle->handle = args.fd;
121
122 return true;
123 } else {
124 int fd = panfrost_drm_export_bo(screen, rsrc->bo);
125
126 if (fd < 0)
127 return false;
128
129 handle->handle = fd;
130 handle->stride = rsrc->slices[0].stride;
131 return true;
132 }
133 }
134
135 return false;
136 }
137
138 static void
139 panfrost_flush_resource(struct pipe_context *pctx, struct pipe_resource *prsc)
140 {
141 //DBG("TODO %s\n", __func__);
142 }
143
144 static struct pipe_surface *
145 panfrost_create_surface(struct pipe_context *pipe,
146 struct pipe_resource *pt,
147 const struct pipe_surface *surf_tmpl)
148 {
149 struct pipe_surface *ps = NULL;
150
151 ps = rzalloc(pipe, struct pipe_surface);
152
153 if (ps) {
154 pipe_reference_init(&ps->reference, 1);
155 pipe_resource_reference(&ps->texture, pt);
156 ps->context = pipe;
157 ps->format = surf_tmpl->format;
158
159 if (pt->target != PIPE_BUFFER) {
160 assert(surf_tmpl->u.tex.level <= pt->last_level);
161 ps->width = u_minify(pt->width0, surf_tmpl->u.tex.level);
162 ps->height = u_minify(pt->height0, surf_tmpl->u.tex.level);
163 ps->u.tex.level = surf_tmpl->u.tex.level;
164 ps->u.tex.first_layer = surf_tmpl->u.tex.first_layer;
165 ps->u.tex.last_layer = surf_tmpl->u.tex.last_layer;
166 } else {
167 /* setting width as number of elements should get us correct renderbuffer width */
168 ps->width = surf_tmpl->u.buf.last_element - surf_tmpl->u.buf.first_element + 1;
169 ps->height = pt->height0;
170 ps->u.buf.first_element = surf_tmpl->u.buf.first_element;
171 ps->u.buf.last_element = surf_tmpl->u.buf.last_element;
172 assert(ps->u.buf.first_element <= ps->u.buf.last_element);
173 assert(ps->u.buf.last_element < ps->width);
174 }
175 }
176
177 return ps;
178 }
179
180 static void
181 panfrost_surface_destroy(struct pipe_context *pipe,
182 struct pipe_surface *surf)
183 {
184 assert(surf->texture);
185 pipe_resource_reference(&surf->texture, NULL);
186 ralloc_free(surf);
187 }
188
189 static struct pipe_resource *
190 panfrost_create_scanout_res(struct pipe_screen *screen,
191 const struct pipe_resource *template)
192 {
193 struct panfrost_screen *pscreen = pan_screen(screen);
194 struct pipe_resource scanout_templat = *template;
195 struct renderonly_scanout *scanout;
196 struct winsys_handle handle;
197 struct pipe_resource *res;
198
199 scanout = renderonly_scanout_for_resource(&scanout_templat,
200 pscreen->ro, &handle);
201 if (!scanout)
202 return NULL;
203
204 assert(handle.type == WINSYS_HANDLE_TYPE_FD);
205 /* TODO: handle modifiers? */
206 res = screen->resource_from_handle(screen, template, &handle,
207 PIPE_HANDLE_USAGE_FRAMEBUFFER_WRITE);
208 close(handle.handle);
209 if (!res)
210 return NULL;
211
212 struct panfrost_resource *pres = pan_resource(res);
213
214 pres->scanout = scanout;
215
216 return res;
217 }
218
219 /* Computes sizes for checksumming, which is 8 bytes per 16x16 tile */
220
221 #define CHECKSUM_TILE_WIDTH 16
222 #define CHECKSUM_TILE_HEIGHT 16
223 #define CHECKSUM_BYTES_PER_TILE 8
224
225 static unsigned
226 panfrost_compute_checksum_sizes(
227 struct panfrost_slice *slice,
228 unsigned width,
229 unsigned height)
230 {
231 unsigned aligned_width = ALIGN_POT(width, CHECKSUM_TILE_WIDTH);
232 unsigned aligned_height = ALIGN_POT(height, CHECKSUM_TILE_HEIGHT);
233
234 unsigned tile_count_x = aligned_width / CHECKSUM_TILE_WIDTH;
235 unsigned tile_count_y = aligned_height / CHECKSUM_TILE_HEIGHT;
236
237 slice->checksum_stride = tile_count_x * CHECKSUM_BYTES_PER_TILE;
238
239 return slice->checksum_stride * tile_count_y;
240 }
241
242 /* Setup the mip tree given a particular layout, possibly with checksumming */
243
244 static void
245 panfrost_setup_slices(struct panfrost_resource *pres, size_t *bo_size)
246 {
247 struct pipe_resource *res = &pres->base;
248 unsigned width = res->width0;
249 unsigned height = res->height0;
250 unsigned depth = res->depth0;
251 unsigned bytes_per_pixel = util_format_get_blocksize(res->format);
252
253 assert(depth > 0);
254
255 /* Tiled operates blockwise; linear is packed. Also, anything
256 * we render to has to be tile-aligned. Maybe not strictly
257 * necessary, but we're not *that* pressed for memory and it
258 * makes code a lot simpler */
259
260 bool renderable = res->bind &
261 (PIPE_BIND_RENDER_TARGET | PIPE_BIND_DEPTH_STENCIL);
262 bool afbc = pres->layout == PAN_AFBC;
263 bool tiled = pres->layout == PAN_TILED;
264 bool should_align = renderable || tiled;
265
266 /* We don't know how to specify a 2D stride for 3D textures */
267
268 bool can_align_stride =
269 res->target != PIPE_TEXTURE_3D;
270
271 should_align &= can_align_stride;
272
273 unsigned offset = 0;
274 unsigned size_2d = 0;
275
276 for (unsigned l = 0; l <= res->last_level; ++l) {
277 struct panfrost_slice *slice = &pres->slices[l];
278
279 unsigned effective_width = width;
280 unsigned effective_height = height;
281 unsigned effective_depth = depth;
282
283 if (should_align) {
284 effective_width = ALIGN_POT(effective_width, 16);
285 effective_height = ALIGN_POT(effective_height, 16);
286
287 /* We don't need to align depth */
288 }
289
290 /* Align levels to cache-line as a performance improvement for
291 * linear/tiled and as a requirement for AFBC */
292
293 offset = ALIGN_POT(offset, 64);
294
295 slice->offset = offset;
296
297 /* Compute the would-be stride */
298 unsigned stride = bytes_per_pixel * effective_width;
299
300 /* ..but cache-line align it for performance */
301 if (can_align_stride && pres->layout == PAN_LINEAR)
302 stride = ALIGN_POT(stride, 64);
303
304 slice->stride = stride;
305
306 unsigned slice_one_size = slice->stride * effective_height;
307 unsigned slice_full_size = slice_one_size * effective_depth;
308
309 /* Report 2D size for 3D texturing */
310
311 if (l == 0)
312 size_2d = slice_one_size;
313
314 /* Compute AFBC sizes if necessary */
315 if (afbc) {
316 slice->header_size =
317 panfrost_afbc_header_size(width, height);
318
319 offset += slice->header_size;
320 }
321
322 offset += slice_full_size;
323
324 /* Add a checksum region if necessary */
325 if (pres->checksummed) {
326 slice->checksum_offset = offset;
327
328 unsigned size = panfrost_compute_checksum_sizes(
329 slice, width, height);
330
331 offset += size;
332 }
333
334 width = u_minify(width, 1);
335 height = u_minify(height, 1);
336 depth = u_minify(depth, 1);
337 }
338
339 assert(res->array_size);
340
341 if (res->target != PIPE_TEXTURE_3D) {
342 /* Arrays and cubemaps have the entire miptree duplicated */
343
344 pres->cubemap_stride = ALIGN_POT(offset, 64);
345 *bo_size = ALIGN_POT(pres->cubemap_stride * res->array_size, 4096);
346 } else {
347 /* 3D strides across the 2D layers */
348 assert(res->array_size == 1);
349
350 pres->cubemap_stride = size_2d;
351 *bo_size = ALIGN_POT(offset, 4096);
352 }
353 }
354
355 static void
356 panfrost_resource_create_bo(struct panfrost_screen *screen, struct panfrost_resource *pres)
357 {
358 struct pipe_resource *res = &pres->base;
359
360 /* Based on the usage, figure out what storing will be used. There are
361 * various tradeoffs:
362 *
363 * Linear: the basic format, bad for memory bandwidth, bad for cache
364 * use. Zero-copy, though. Renderable.
365 *
366 * Tiled: Not compressed, but cache-optimized. Expensive to write into
367 * (due to software tiling), but cheap to sample from. Ideal for most
368 * textures.
369 *
370 * AFBC: Compressed and renderable (so always desirable for non-scanout
371 * rendertargets). Cheap to sample from. The format is black box, so we
372 * can't read/write from software.
373 */
374
375 /* Tiling textures is almost always faster, unless we only use it once */
376
377 bool is_texture = (res->bind & PIPE_BIND_SAMPLER_VIEW);
378 bool is_2d = res->depth0 == 1 && res->array_size == 1;
379 bool is_streaming = (res->usage != PIPE_USAGE_STREAM);
380
381 /* TODO: Reenable tiling on SFBD systems when we support rendering to
382 * tiled formats with SFBD */
383 bool should_tile = is_streaming && is_texture && is_2d && !screen->require_sfbd;
384
385 /* Depth/stencil can't be tiled, only linear or AFBC */
386 should_tile &= !(res->bind & PIPE_BIND_DEPTH_STENCIL);
387
388 /* FBOs we would like to checksum, if at all possible */
389 bool can_checksum = !(res->bind & (PIPE_BIND_SCANOUT | PIPE_BIND_SHARED));
390 bool should_checksum = res->bind & PIPE_BIND_RENDER_TARGET;
391
392 pres->checksummed = can_checksum && should_checksum;
393
394 /* Set the layout appropriately */
395 pres->layout = should_tile ? PAN_TILED : PAN_LINEAR;
396
397 size_t bo_size;
398
399 panfrost_setup_slices(pres, &bo_size);
400
401 /* We create a BO immediately but don't bother mapping, since we don't
402 * care to map e.g. FBOs which the CPU probably won't touch */
403 pres->bo = panfrost_drm_create_bo(screen, bo_size, PAN_ALLOCATE_DELAY_MMAP);
404 }
405
406 static struct pipe_resource *
407 panfrost_resource_create(struct pipe_screen *screen,
408 const struct pipe_resource *template)
409 {
410 /* Make sure we're familiar */
411 switch (template->target) {
412 case PIPE_BUFFER:
413 case PIPE_TEXTURE_1D:
414 case PIPE_TEXTURE_2D:
415 case PIPE_TEXTURE_3D:
416 case PIPE_TEXTURE_CUBE:
417 case PIPE_TEXTURE_RECT:
418 case PIPE_TEXTURE_2D_ARRAY:
419 break;
420 default:
421 DBG("Unknown texture target %d\n", template->target);
422 assert(0);
423 }
424
425 if (template->bind &
426 (PIPE_BIND_DISPLAY_TARGET | PIPE_BIND_SCANOUT | PIPE_BIND_SHARED))
427 return panfrost_create_scanout_res(screen, template);
428
429 struct panfrost_resource *so = rzalloc(screen, struct panfrost_resource);
430 struct panfrost_screen *pscreen = (struct panfrost_screen *) screen;
431
432 so->base = *template;
433 so->base.screen = screen;
434
435 pipe_reference_init(&so->base.reference, 1);
436
437 util_range_init(&so->valid_buffer_range);
438
439 panfrost_resource_create_bo(pscreen, so);
440 return (struct pipe_resource *)so;
441 }
442
443 void
444 panfrost_bo_reference(struct panfrost_bo *bo)
445 {
446 pipe_reference(NULL, &bo->reference);
447 }
448
449 void
450 panfrost_bo_unreference(struct pipe_screen *screen, struct panfrost_bo *bo)
451 {
452 /* When the reference count goes to zero, we need to cleanup */
453
454 if (pipe_reference(&bo->reference, NULL))
455 panfrost_drm_release_bo(pan_screen(screen), bo, true);
456 }
457
458 static void
459 panfrost_resource_destroy(struct pipe_screen *screen,
460 struct pipe_resource *pt)
461 {
462 struct panfrost_screen *pscreen = pan_screen(screen);
463 struct panfrost_resource *rsrc = (struct panfrost_resource *) pt;
464
465 if (rsrc->scanout)
466 renderonly_scanout_destroy(rsrc->scanout, pscreen->ro);
467
468 if (rsrc->bo)
469 panfrost_bo_unreference(screen, rsrc->bo);
470
471 util_range_destroy(&rsrc->valid_buffer_range);
472 ralloc_free(rsrc);
473 }
474
475 static void *
476 panfrost_transfer_map(struct pipe_context *pctx,
477 struct pipe_resource *resource,
478 unsigned level,
479 unsigned usage, /* a combination of PIPE_TRANSFER_x */
480 const struct pipe_box *box,
481 struct pipe_transfer **out_transfer)
482 {
483 int bytes_per_pixel = util_format_get_blocksize(resource->format);
484 struct panfrost_resource *rsrc = pan_resource(resource);
485 struct panfrost_bo *bo = rsrc->bo;
486
487 struct panfrost_gtransfer *transfer = rzalloc(pctx, struct panfrost_gtransfer);
488 transfer->base.level = level;
489 transfer->base.usage = usage;
490 transfer->base.box = *box;
491
492 pipe_resource_reference(&transfer->base.resource, resource);
493
494 *out_transfer = &transfer->base;
495
496 /* If we haven't already mmaped, now's the time */
497
498 if (!bo->cpu) {
499 struct panfrost_screen *screen = pan_screen(pctx->screen);
500 panfrost_drm_mmap_bo(screen, bo);
501 }
502
503 /* Check if we're bound for rendering and this is a read pixels. If so,
504 * we need to flush */
505
506 struct panfrost_context *ctx = pan_context(pctx);
507 struct pipe_framebuffer_state *fb = &ctx->pipe_framebuffer;
508
509 bool is_bound = false;
510
511 for (unsigned c = 0; c < fb->nr_cbufs; ++c) {
512 /* If cbufs is NULL, we're definitely not bound here */
513
514 if (fb->cbufs[c])
515 is_bound |= fb->cbufs[c]->texture == resource;
516 }
517
518 if (is_bound && (usage & PIPE_TRANSFER_READ)) {
519 assert(level == 0);
520 panfrost_flush(pctx, NULL, PIPE_FLUSH_END_OF_FRAME);
521 }
522
523 /* TODO: Respect usage flags */
524
525 if (usage & PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE) {
526 /* TODO: reallocate */
527 //printf("debug: Missed reallocate\n");
528 } else if ((usage & PIPE_TRANSFER_WRITE)
529 && resource->target == PIPE_BUFFER
530 && !util_ranges_intersect(&rsrc->valid_buffer_range, box->x, box->x + box->width)) {
531 /* No flush for writes to uninitialized */
532 } else if (!(usage & PIPE_TRANSFER_UNSYNCHRONIZED)) {
533 if (usage & PIPE_TRANSFER_WRITE) {
534 /* STUB: flush reading */
535 //printf("debug: missed reading flush %d\n", resource->target);
536 } else if (usage & PIPE_TRANSFER_READ) {
537 /* STUB: flush writing */
538 //printf("debug: missed writing flush %d (%d-%d)\n", resource->target, box->x, box->x + box->width);
539 } else {
540 /* Why are you even mapping?! */
541 }
542 }
543
544 if (rsrc->layout != PAN_LINEAR) {
545 /* Non-linear resources need to be indirectly mapped */
546
547 if (usage & PIPE_TRANSFER_MAP_DIRECTLY)
548 return NULL;
549
550 transfer->base.stride = box->width * bytes_per_pixel;
551 transfer->base.layer_stride = transfer->base.stride * box->height;
552 transfer->map = rzalloc_size(transfer, transfer->base.layer_stride * box->depth);
553 assert(box->depth == 1);
554
555 if ((usage & PIPE_TRANSFER_READ) && rsrc->slices[level].initialized) {
556 if (rsrc->layout == PAN_AFBC) {
557 DBG("Unimplemented: reads from AFBC");
558 } else if (rsrc->layout == PAN_TILED) {
559 panfrost_load_tiled_image(
560 transfer->map,
561 bo->cpu + rsrc->slices[level].offset,
562 box,
563 transfer->base.stride,
564 rsrc->slices[level].stride,
565 util_format_get_blocksize(resource->format));
566 }
567 }
568
569 return transfer->map;
570 } else {
571 transfer->base.stride = rsrc->slices[level].stride;
572 transfer->base.layer_stride = rsrc->cubemap_stride;
573
574 /* By mapping direct-write, we're implicitly already
575 * initialized (maybe), so be conservative */
576
577 if ((usage & PIPE_TRANSFER_WRITE) && (usage & PIPE_TRANSFER_MAP_DIRECTLY))
578 rsrc->slices[level].initialized = true;
579
580 return bo->cpu
581 + rsrc->slices[level].offset
582 + transfer->base.box.z * rsrc->cubemap_stride
583 + transfer->base.box.y * rsrc->slices[level].stride
584 + transfer->base.box.x * bytes_per_pixel;
585 }
586 }
587
588 static void
589 panfrost_transfer_unmap(struct pipe_context *pctx,
590 struct pipe_transfer *transfer)
591 {
592 /* Gallium expects writeback here, so we tile */
593
594 struct panfrost_gtransfer *trans = pan_transfer(transfer);
595 struct panfrost_resource *prsrc = (struct panfrost_resource *) transfer->resource;
596
597 /* Mark whatever we wrote as written */
598 if (transfer->usage & PIPE_TRANSFER_WRITE)
599 prsrc->slices[transfer->level].initialized = true;
600
601 if (trans->map) {
602 struct panfrost_bo *bo = prsrc->bo;
603
604 if (transfer->usage & PIPE_TRANSFER_WRITE) {
605 if (prsrc->layout == PAN_AFBC) {
606 DBG("Unimplemented: writes to AFBC\n");
607 } else if (prsrc->layout == PAN_TILED) {
608 assert(transfer->box.depth == 1);
609
610 panfrost_store_tiled_image(
611 bo->cpu + prsrc->slices[transfer->level].offset,
612 trans->map,
613 &transfer->box,
614 prsrc->slices[transfer->level].stride,
615 transfer->stride,
616 util_format_get_blocksize(prsrc->base.format));
617 }
618 }
619 }
620
621
622 util_range_add(&prsrc->valid_buffer_range,
623 transfer->box.x,
624 transfer->box.x + transfer->box.width);
625
626 /* Derefence the resource */
627 pipe_resource_reference(&transfer->resource, NULL);
628
629 /* Transfer itself is RALLOCed at the moment */
630 ralloc_free(transfer);
631 }
632
633 static void
634 panfrost_transfer_flush_region(struct pipe_context *pctx,
635 struct pipe_transfer *transfer,
636 const struct pipe_box *box)
637 {
638 struct panfrost_resource *rsc = pan_resource(transfer->resource);
639
640 if (transfer->resource->target == PIPE_BUFFER) {
641 util_range_add(&rsc->valid_buffer_range,
642 transfer->box.x + box->x,
643 transfer->box.x + box->x + box->width);
644 } else {
645 unsigned level = transfer->level;
646 rsc->slices[level].initialized = true;
647 }
648 }
649
650 static void
651 panfrost_invalidate_resource(struct pipe_context *pctx, struct pipe_resource *prsc)
652 {
653 //DBG("TODO %s\n", __func__);
654 }
655
656 static enum pipe_format
657 panfrost_resource_get_internal_format(struct pipe_resource *prsrc) {
658 return prsrc->format;
659 }
660
661 static bool
662 panfrost_generate_mipmap(
663 struct pipe_context *pctx,
664 struct pipe_resource *prsrc,
665 enum pipe_format format,
666 unsigned base_level,
667 unsigned last_level,
668 unsigned first_layer,
669 unsigned last_layer)
670 {
671 struct panfrost_context *ctx = pan_context(pctx);
672 struct panfrost_resource *rsrc = pan_resource(prsrc);
673
674 /* Generating a mipmap invalidates the written levels, so make that
675 * explicit so we don't try to wallpaper them back and end up with
676 * u_blitter recursion */
677
678 assert(rsrc->bo);
679 for (unsigned l = base_level + 1; l <= last_level; ++l)
680 rsrc->slices[l].initialized = false;
681
682 /* Beyond that, we just delegate the hard stuff. We're careful to
683 * include flushes on both ends to make sure the data is really valid.
684 * We could be doing a lot better perf-wise, especially once we have
685 * reorder-type optimizations in place. But for now prioritize
686 * correctness. */
687
688 struct panfrost_job *job = panfrost_get_job_for_fbo(ctx);
689 bool has_draws = job->last_job.gpu;
690
691 if (has_draws)
692 panfrost_flush(pctx, NULL, PIPE_FLUSH_END_OF_FRAME);
693
694 /* We've flushed the original buffer if needed, now trigger a blit */
695
696 bool blit_res = util_gen_mipmap(
697 pctx, prsrc, format,
698 base_level, last_level,
699 first_layer, last_layer,
700 PIPE_TEX_FILTER_LINEAR);
701
702 /* If the blit was successful, flush once more. If it wasn't, well, let
703 * the state tracker deal with it. */
704
705 if (blit_res)
706 panfrost_flush(pctx, NULL, PIPE_FLUSH_END_OF_FRAME);
707
708 return blit_res;
709 }
710
711 /* Computes the address to a texture at a particular slice */
712
713 mali_ptr
714 panfrost_get_texture_address(
715 struct panfrost_resource *rsrc,
716 unsigned level, unsigned face)
717 {
718 unsigned level_offset = rsrc->slices[level].offset;
719 unsigned face_offset = face * rsrc->cubemap_stride;
720
721 return rsrc->bo->gpu + level_offset + face_offset;
722 }
723
724 /* Given a resource that has already been allocated, hint that it should use a
725 * given layout. These are suggestions, not commands; it is perfectly legal to
726 * stub out this function, but there will be performance implications. */
727
728 void
729 panfrost_resource_hint_layout(
730 struct panfrost_screen *screen,
731 struct panfrost_resource *rsrc,
732 enum panfrost_memory_layout layout,
733 signed weight)
734 {
735 /* Nothing to do, although a sophisticated implementation might store
736 * the hint */
737
738 if (rsrc->layout == layout)
739 return;
740
741 /* We don't use the weight yet, but we should check that it's positive
742 * (semantically meaning that we should choose the given `layout`) */
743
744 if (weight <= 0)
745 return;
746
747 /* Check if the preferred layout is legal for this buffer */
748
749 if (layout == PAN_AFBC) {
750 bool can_afbc = panfrost_format_supports_afbc(rsrc->base.format);
751 bool is_scanout = rsrc->base.bind &
752 (PIPE_BIND_DISPLAY_TARGET | PIPE_BIND_SCANOUT | PIPE_BIND_SHARED);
753
754 if (!can_afbc || is_scanout)
755 return;
756 }
757
758 /* Simple heuristic so far: if the resource is uninitialized, switch to
759 * the hinted layout. If it is initialized, keep the original layout.
760 * This misses some cases where it would be beneficial to switch and
761 * blit. */
762
763 bool is_initialized = false;
764
765 for (unsigned i = 0; i < MAX_MIP_LEVELS; ++i)
766 is_initialized |= rsrc->slices[i].initialized;
767
768 if (is_initialized)
769 return;
770
771 /* We're uninitialized, so do a layout switch. Reinitialize slices. */
772
773 size_t new_size;
774 rsrc->layout = layout;
775 panfrost_setup_slices(rsrc, &new_size);
776
777 /* If we grew in size, reallocate the BO */
778 if (new_size > rsrc->bo->size) {
779 panfrost_drm_release_bo(screen, rsrc->bo, true);
780 rsrc->bo = panfrost_drm_create_bo(screen, new_size, PAN_ALLOCATE_DELAY_MMAP);
781 }
782 }
783
784 static void
785 panfrost_resource_set_stencil(struct pipe_resource *prsrc,
786 struct pipe_resource *stencil)
787 {
788 pan_resource(prsrc)->separate_stencil = pan_resource(stencil);
789 }
790
791 static struct pipe_resource *
792 panfrost_resource_get_stencil(struct pipe_resource *prsrc)
793 {
794 return &pan_resource(prsrc)->separate_stencil->base;
795 }
796
797 static const struct u_transfer_vtbl transfer_vtbl = {
798 .resource_create = panfrost_resource_create,
799 .resource_destroy = panfrost_resource_destroy,
800 .transfer_map = panfrost_transfer_map,
801 .transfer_unmap = panfrost_transfer_unmap,
802 .transfer_flush_region = panfrost_transfer_flush_region,
803 .get_internal_format = panfrost_resource_get_internal_format,
804 .set_stencil = panfrost_resource_set_stencil,
805 .get_stencil = panfrost_resource_get_stencil,
806 };
807
808 void
809 panfrost_resource_screen_init(struct panfrost_screen *pscreen)
810 {
811 //pscreen->base.resource_create_with_modifiers =
812 // panfrost_resource_create_with_modifiers;
813 pscreen->base.resource_create = u_transfer_helper_resource_create;
814 pscreen->base.resource_destroy = u_transfer_helper_resource_destroy;
815 pscreen->base.resource_from_handle = panfrost_resource_from_handle;
816 pscreen->base.resource_get_handle = panfrost_resource_get_handle;
817 pscreen->base.transfer_helper = u_transfer_helper_create(&transfer_vtbl,
818 true, false,
819 true, true);
820 }
821
822 void
823 panfrost_resource_context_init(struct pipe_context *pctx)
824 {
825 pctx->transfer_map = u_transfer_helper_transfer_map;
826 pctx->transfer_flush_region = u_transfer_helper_transfer_flush_region;
827 pctx->transfer_unmap = u_transfer_helper_transfer_unmap;
828 pctx->buffer_subdata = u_default_buffer_subdata;
829 pctx->create_surface = panfrost_create_surface;
830 pctx->surface_destroy = panfrost_surface_destroy;
831 pctx->resource_copy_region = util_resource_copy_region;
832 pctx->blit = panfrost_blit;
833 pctx->generate_mipmap = panfrost_generate_mipmap;
834 pctx->flush_resource = panfrost_flush_resource;
835 pctx->invalidate_resource = panfrost_invalidate_resource;
836 pctx->transfer_flush_region = u_transfer_helper_transfer_flush_region;
837 pctx->buffer_subdata = u_default_buffer_subdata;
838 pctx->texture_subdata = u_default_texture_subdata;
839 }