panfrost: Size tiled temp buffers correctly
[mesa.git] / src / gallium / drivers / panfrost / pan_resource.c
1 /**************************************************************************
2 *
3 * Copyright 2008 VMware, Inc.
4 * Copyright 2014 Broadcom
5 * Copyright 2018 Alyssa Rosenzweig
6 * All Rights Reserved.
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a
9 * copy of this software and associated documentation files (the
10 * "Software"), to deal in the Software without restriction, including
11 * without limitation the rights to use, copy, modify, merge, publish,
12 * distribute, sub license, and/or sell copies of the Software, and to
13 * permit persons to whom the Software is furnished to do so, subject to
14 * the following conditions:
15 *
16 * The above copyright notice and this permission notice (including the
17 * next paragraph) shall be included in all copies or substantial portions
18 * of the Software.
19 *
20 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
21 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
22 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
23 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
24 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
25 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
26 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27 *
28 **************************************************************************/
29
30 #include <xf86drm.h>
31 #include <fcntl.h>
32 #include "drm-uapi/drm_fourcc.h"
33
34 #include "state_tracker/winsys_handle.h"
35 #include "util/u_format.h"
36 #include "util/u_memory.h"
37 #include "util/u_surface.h"
38 #include "util/u_transfer.h"
39 #include "util/u_transfer_helper.h"
40
41 #include "pan_context.h"
42 #include "pan_screen.h"
43 #include "pan_resource.h"
44 #include "pan_swizzle.h"
45 #include "pan_util.h"
46
47 static struct pipe_resource *
48 panfrost_resource_from_handle(struct pipe_screen *pscreen,
49 const struct pipe_resource *templat,
50 struct winsys_handle *whandle,
51 unsigned usage)
52 {
53 struct panfrost_screen *screen = pan_screen(pscreen);
54 struct panfrost_resource *rsc;
55 struct pipe_resource *prsc;
56
57 assert(whandle->type == WINSYS_HANDLE_TYPE_FD);
58
59 rsc = CALLOC_STRUCT(panfrost_resource);
60 if (!rsc)
61 return NULL;
62
63 prsc = &rsc->base;
64
65 *prsc = *templat;
66
67 pipe_reference_init(&prsc->reference, 1);
68 prsc->screen = pscreen;
69
70 rsc->bo = screen->driver->import_bo(screen, whandle);
71 rsc->bo->slices[0].stride = whandle->stride;
72
73 if (screen->ro) {
74 rsc->scanout =
75 renderonly_create_gpu_import_for_resource(prsc, screen->ro, NULL);
76 /* failure is expected in some cases.. */
77 }
78
79 return prsc;
80 }
81
82 static boolean
83 panfrost_resource_get_handle(struct pipe_screen *pscreen,
84 struct pipe_context *ctx,
85 struct pipe_resource *pt,
86 struct winsys_handle *handle,
87 unsigned usage)
88 {
89 struct panfrost_screen *screen = pan_screen(pscreen);
90 struct panfrost_resource *rsrc = (struct panfrost_resource *) pt;
91 struct renderonly_scanout *scanout = rsrc->scanout;
92
93 handle->modifier = DRM_FORMAT_MOD_INVALID;
94
95 if (handle->type == WINSYS_HANDLE_TYPE_SHARED) {
96 return FALSE;
97 } else if (handle->type == WINSYS_HANDLE_TYPE_KMS) {
98 if (renderonly_get_handle(scanout, handle))
99 return TRUE;
100
101 handle->handle = rsrc->bo->gem_handle;
102 handle->stride = rsrc->bo->slices[0].stride;
103 return TRUE;
104 } else if (handle->type == WINSYS_HANDLE_TYPE_FD) {
105 if (scanout) {
106 struct drm_prime_handle args = {
107 .handle = scanout->handle,
108 .flags = DRM_CLOEXEC,
109 };
110
111 int ret = drmIoctl(screen->ro->kms_fd, DRM_IOCTL_PRIME_HANDLE_TO_FD, &args);
112 if (ret == -1)
113 return FALSE;
114
115 handle->stride = scanout->stride;
116 handle->handle = args.fd;
117
118 return TRUE;
119 } else
120 return screen->driver->export_bo(screen, rsrc->bo->gem_handle, rsrc->bo->slices[0].stride, handle);
121 }
122
123 return FALSE;
124 }
125
/* flush_resource hook: not implemented yet, so this does nothing. */
static void
panfrost_flush_resource(struct pipe_context *pctx, struct pipe_resource *prsc)
{
        /* TODO */
        (void) pctx;
        (void) prsc;
}
131
/*
 * blit hook: only blits that util_try_blit_via_copy_region() can express as a
 * plain region copy are handled; anything else is reported through DBG and
 * otherwise ignored.
 */
static void
panfrost_blit(struct pipe_context *pipe,
              const struct pipe_blit_info *info)
{
        if (!util_try_blit_via_copy_region(pipe, info)) {
                /* TODO */
                DBG("Unhandled blit.\n");
        }
}
144
145 static struct pipe_surface *
146 panfrost_create_surface(struct pipe_context *pipe,
147 struct pipe_resource *pt,
148 const struct pipe_surface *surf_tmpl)
149 {
150 struct pipe_surface *ps = NULL;
151
152 ps = CALLOC_STRUCT(pipe_surface);
153
154 if (ps) {
155 pipe_reference_init(&ps->reference, 1);
156 pipe_resource_reference(&ps->texture, pt);
157 ps->context = pipe;
158 ps->format = surf_tmpl->format;
159
160 if (pt->target != PIPE_BUFFER) {
161 assert(surf_tmpl->u.tex.level <= pt->last_level);
162 ps->width = u_minify(pt->width0, surf_tmpl->u.tex.level);
163 ps->height = u_minify(pt->height0, surf_tmpl->u.tex.level);
164 ps->u.tex.level = surf_tmpl->u.tex.level;
165 ps->u.tex.first_layer = surf_tmpl->u.tex.first_layer;
166 ps->u.tex.last_layer = surf_tmpl->u.tex.last_layer;
167 } else {
168 /* setting width as number of elements should get us correct renderbuffer width */
169 ps->width = surf_tmpl->u.buf.last_element - surf_tmpl->u.buf.first_element + 1;
170 ps->height = pt->height0;
171 ps->u.buf.first_element = surf_tmpl->u.buf.first_element;
172 ps->u.buf.last_element = surf_tmpl->u.buf.last_element;
173 assert(ps->u.buf.first_element <= ps->u.buf.last_element);
174 assert(ps->u.buf.last_element < ps->width);
175 }
176 }
177
178 return ps;
179 }
180
181 static void
182 panfrost_surface_destroy(struct pipe_context *pipe,
183 struct pipe_surface *surf)
184 {
185 assert(surf->texture);
186 pipe_resource_reference(&surf->texture, NULL);
187 free(surf);
188 }
189
190 static void
191 panfrost_setup_slices(const struct pipe_resource *tmpl, struct panfrost_bo *bo)
192 {
193 unsigned width = tmpl->width0;
194 unsigned height = tmpl->height0;
195 unsigned bytes_per_pixel = util_format_get_blocksize(tmpl->format);
196
197 unsigned offset = 0;
198
199 for (unsigned l = 0; l <= tmpl->last_level; ++l) {
200 struct panfrost_slice *slice = &bo->slices[l];
201
202 unsigned effective_width = width;
203 unsigned effective_height = height;
204
205 /* Tiled operates blockwise; linear is packed */
206
207 if (bo->layout == PAN_TILED) {
208 effective_width = ALIGN(effective_width, 16);
209 effective_height = ALIGN(effective_height, 16);
210 }
211
212 slice->offset = offset;
213 slice->stride = bytes_per_pixel * effective_width;
214
215 offset += slice->stride * effective_height;
216
217 width = u_minify(width, 1);
218 height = u_minify(height, 1);
219 }
220
221 assert(tmpl->array_size);
222
223 bo->cubemap_stride = ALIGN(offset, 64);
224 bo->size = ALIGN(bo->cubemap_stride * tmpl->array_size, 4096);
225 }
226
227 static struct panfrost_bo *
228 panfrost_create_bo(struct panfrost_screen *screen, const struct pipe_resource *template)
229 {
230 struct panfrost_bo *bo = CALLOC_STRUCT(panfrost_bo);
231
232 /* Based on the usage, figure out what storing will be used. There are
233 * various tradeoffs:
234 *
235 * Linear: the basic format, bad for memory bandwidth, bad for cache
236 * use. Zero-copy, though. Renderable.
237 *
238 * Tiled: Not compressed, but cache-optimized. Expensive to write into
239 * (due to software tiling), but cheap to sample from. Ideal for most
240 * textures.
241 *
242 * AFBC: Compressed and renderable (so always desirable for non-scanout
243 * rendertargets). Cheap to sample from. The format is black box, so we
244 * can't read/write from software.
245 */
246
247 /* Tiling textures is almost always faster, unless we only use it once */
248 bool should_tile = (template->usage != PIPE_USAGE_STREAM) && (template->bind & PIPE_BIND_SAMPLER_VIEW);
249
250 /* For unclear reasons, depth/stencil is faster linear than AFBC, so
251 * make sure it's linear */
252
253 if (template->bind & PIPE_BIND_DEPTH_STENCIL)
254 should_tile = false;
255
256 /* Set the layout appropriately */
257 bo->layout = should_tile ? PAN_TILED : PAN_LINEAR;
258
259 panfrost_setup_slices(template, bo);
260
261 if (bo->layout == PAN_TILED || bo->layout == PAN_LINEAR) {
262 struct panfrost_memory mem;
263
264 screen->driver->allocate_slab(screen, &mem, bo->size / 4096, true, 0, 0, 0);
265
266 bo->cpu = mem.cpu;
267 bo->gpu = mem.gpu;
268 bo->gem_handle = mem.gem_handle;
269 }
270
271 return bo;
272 }
273
274 static struct pipe_resource *
275 panfrost_resource_create(struct pipe_screen *screen,
276 const struct pipe_resource *template)
277 {
278 struct panfrost_resource *so = CALLOC_STRUCT(panfrost_resource);
279 struct panfrost_screen *pscreen = (struct panfrost_screen *) screen;
280
281 so->base = *template;
282 so->base.screen = screen;
283
284 pipe_reference_init(&so->base.reference, 1);
285
286 /* Make sure we're familiar */
287 switch (template->target) {
288 case PIPE_BUFFER:
289 case PIPE_TEXTURE_1D:
290 case PIPE_TEXTURE_2D:
291 case PIPE_TEXTURE_3D:
292 case PIPE_TEXTURE_CUBE:
293 case PIPE_TEXTURE_RECT:
294 break;
295 default:
296 DBG("Unknown texture target %d\n", template->target);
297 assert(0);
298 }
299
300 if (template->bind & PIPE_BIND_DISPLAY_TARGET ||
301 template->bind & PIPE_BIND_SCANOUT ||
302 template->bind & PIPE_BIND_SHARED) {
303 struct pipe_resource scanout_templat = *template;
304 struct renderonly_scanout *scanout;
305 struct winsys_handle handle;
306
307 scanout = renderonly_scanout_for_resource(&scanout_templat,
308 pscreen->ro, &handle);
309 if (!scanout)
310 return NULL;
311
312 assert(handle.type == WINSYS_HANDLE_TYPE_FD);
313 /* TODO: handle modifiers? */
314 so = pan_resource(screen->resource_from_handle(screen, template,
315 &handle,
316 PIPE_HANDLE_USAGE_FRAMEBUFFER_WRITE));
317 close(handle.handle);
318 if (!so)
319 return NULL;
320
321 so->scanout = scanout;
322 pscreen->display_target = so;
323 } else {
324 so->bo = panfrost_create_bo(pscreen, template);
325 }
326
327 return (struct pipe_resource *)so;
328 }
329
330 static void
331 panfrost_destroy_bo(struct panfrost_screen *screen, struct panfrost_bo *pbo)
332 {
333 struct panfrost_bo *bo = (struct panfrost_bo *)pbo;
334
335 if ((bo->layout == PAN_LINEAR || bo->layout == PAN_TILED) &&
336 !bo->imported) {
337 struct panfrost_memory mem = {
338 .cpu = bo->cpu,
339 .gpu = bo->gpu,
340 .size = bo->size,
341 .gem_handle = bo->gem_handle,
342 };
343
344 screen->driver->free_slab(screen, &mem);
345 }
346
347 if (bo->layout == PAN_AFBC) {
348 /* TODO */
349 DBG("--leaking afbc (%d bytes)--\n", bo->afbc_metadata_size);
350 }
351
352 if (bo->has_checksum) {
353 /* TODO */
354 DBG("--leaking checksum (%zd bytes)--\n", bo->checksum_slab.size);
355 }
356
357 if (bo->imported) {
358 screen->driver->free_imported_bo(screen, bo);
359 }
360 }
361
362 static void
363 panfrost_resource_destroy(struct pipe_screen *screen,
364 struct pipe_resource *pt)
365 {
366 struct panfrost_screen *pscreen = pan_screen(screen);
367 struct panfrost_resource *rsrc = (struct panfrost_resource *) pt;
368
369 if (rsrc->scanout)
370 renderonly_scanout_destroy(rsrc->scanout, pscreen->ro);
371
372 if (rsrc->bo)
373 panfrost_destroy_bo(pscreen, rsrc->bo);
374
375 FREE(rsrc);
376 }
377
378 static void *
379 panfrost_transfer_map(struct pipe_context *pctx,
380 struct pipe_resource *resource,
381 unsigned level,
382 unsigned usage, /* a combination of PIPE_TRANSFER_x */
383 const struct pipe_box *box,
384 struct pipe_transfer **out_transfer)
385 {
386 int bytes_per_pixel = util_format_get_blocksize(resource->format);
387 struct panfrost_bo *bo = pan_resource(resource)->bo;
388
389 struct panfrost_gtransfer *transfer = CALLOC_STRUCT(panfrost_gtransfer);
390 transfer->base.level = level;
391 transfer->base.usage = usage;
392 transfer->base.box = *box;
393
394 pipe_resource_reference(&transfer->base.resource, resource);
395
396 *out_transfer = &transfer->base;
397
398 if (resource->bind & PIPE_BIND_DISPLAY_TARGET ||
399 resource->bind & PIPE_BIND_SCANOUT ||
400 resource->bind & PIPE_BIND_SHARED) {
401 /* Mipmapped readpixels?! */
402 assert(level == 0);
403
404 /* Force a flush -- kill the pipeline */
405 panfrost_flush(pctx, NULL, PIPE_FLUSH_END_OF_FRAME);
406 }
407
408 if (bo->layout != PAN_LINEAR) {
409 /* Non-linear resources need to be indirectly mapped */
410
411 if (usage & PIPE_TRANSFER_MAP_DIRECTLY)
412 return NULL;
413
414 transfer->base.stride = box->width * bytes_per_pixel;
415 transfer->base.layer_stride = transfer->base.stride * box->height;
416
417 /* TODO: Reads */
418 transfer->map = malloc(transfer->base.layer_stride * box->depth);
419
420 return transfer->map;
421 } else {
422 transfer->base.stride = bo->slices[level].stride;
423 transfer->base.layer_stride = bo->cubemap_stride;
424
425 return bo->cpu
426 + bo->slices[level].offset
427 + transfer->base.box.z * bo->cubemap_stride
428 + transfer->base.box.y * bo->slices[level].stride
429 + transfer->base.box.x * bytes_per_pixel;
430 }
431 }
432
433 static void
434 panfrost_tile_texture(struct panfrost_screen *screen, struct panfrost_resource *rsrc, struct panfrost_gtransfer *trans)
435 {
436 struct panfrost_bo *bo = (struct panfrost_bo *)rsrc->bo;
437
438 unsigned level = trans->base.level;
439
440 panfrost_texture_swizzle(
441 trans->base.box.x,
442 trans->base.box.y,
443 trans->base.box.width,
444 trans->base.box.height,
445 util_format_get_blocksize(rsrc->base.format),
446 u_minify(rsrc->base.width0, level),
447 trans->map,
448 bo->cpu
449 + bo->slices[level].offset
450 + bo->cubemap_stride * trans->base.box.z
451 );
452 }
453
454 static void
455 panfrost_transfer_unmap(struct pipe_context *pctx,
456 struct pipe_transfer *transfer)
457 {
458 struct panfrost_context *ctx = pan_context(pctx);
459
460 /* Gallium expects writeback here, so we tile */
461
462 struct panfrost_gtransfer *trans = pan_transfer(transfer);
463
464 if (trans->map) {
465 struct panfrost_resource *prsrc = (struct panfrost_resource *) transfer->resource;
466 struct panfrost_bo *bo = prsrc->bo;
467
468 if (transfer->usage & PIPE_TRANSFER_WRITE) {
469
470 if (bo->layout == PAN_AFBC) {
471 DBG("Unimplemented: writes to AFBC\n");
472 } else if (bo->layout == PAN_TILED) {
473 struct pipe_context *gallium = (struct pipe_context *) ctx;
474 struct panfrost_screen *screen = pan_screen(gallium->screen);
475 assert(transfer->box.depth == 1);
476 panfrost_tile_texture(screen, prsrc, trans);
477 }
478 }
479
480 free(trans->map);
481 }
482
483 /* Derefence the resource */
484 pipe_resource_reference(&transfer->resource, NULL);
485
486 /* Transfer itself is CALLOCed at the moment */
487 free(transfer);
488 }
489
490 static struct pb_slab *
491 panfrost_slab_alloc(void *priv, unsigned heap, unsigned entry_size, unsigned group_index)
492 {
493 struct panfrost_screen *screen = (struct panfrost_screen *) priv;
494 struct panfrost_memory *mem = CALLOC_STRUCT(panfrost_memory);
495
496 size_t slab_size = (1 << (MAX_SLAB_ENTRY_SIZE + 1));
497
498 mem->slab.num_entries = slab_size / entry_size;
499 mem->slab.num_free = mem->slab.num_entries;
500
501 LIST_INITHEAD(&mem->slab.free);
502 for (unsigned i = 0; i < mem->slab.num_entries; ++i) {
503 /* Create a slab entry */
504 struct panfrost_memory_entry *entry = CALLOC_STRUCT(panfrost_memory_entry);
505 entry->offset = entry_size * i;
506
507 entry->base.slab = &mem->slab;
508 entry->base.group_index = group_index;
509
510 LIST_ADDTAIL(&entry->base.head, &mem->slab.free);
511 }
512
513 /* Actually allocate the memory from kernel-space. Mapped, same_va, no
514 * special flags */
515
516 screen->driver->allocate_slab(screen, mem, slab_size / 4096, true, 0, 0, 0);
517
518 return &mem->slab;
519 }
520
521 static bool
522 panfrost_slab_can_reclaim(void *priv, struct pb_slab_entry *entry)
523 {
524 struct panfrost_memory_entry *p_entry = (struct panfrost_memory_entry *) entry;
525 return p_entry->freed;
526 }
527
528 static void
529 panfrost_slab_free(void *priv, struct pb_slab *slab)
530 {
531 struct panfrost_memory *mem = (struct panfrost_memory *) slab;
532 struct panfrost_screen *screen = (struct panfrost_screen *) priv;
533
534 screen->driver->free_slab(screen, mem);
535 }
536
/* invalidate_resource hook: not implemented yet, so this does nothing. */
static void
panfrost_invalidate_resource(struct pipe_context *pctx, struct pipe_resource *prsc)
{
        /* TODO */
        (void) pctx;
        (void) prsc;
}
542
543 static enum pipe_format
544 panfrost_resource_get_internal_format(struct pipe_resource *prsrc)
545 {
546 return prsrc->format;
547 }
548
549 static void
550 panfrost_resource_set_stencil(struct pipe_resource *prsrc,
551 struct pipe_resource *stencil)
552 {
553 pan_resource(prsrc)->separate_stencil = pan_resource(stencil);
554 }
555
556 static struct pipe_resource *
557 panfrost_resource_get_stencil(struct pipe_resource *prsrc)
558 {
559 return &pan_resource(prsrc)->separate_stencil->base;
560 }
561
562 static const struct u_transfer_vtbl transfer_vtbl = {
563 .resource_create = panfrost_resource_create,
564 .resource_destroy = panfrost_resource_destroy,
565 .transfer_map = panfrost_transfer_map,
566 .transfer_unmap = panfrost_transfer_unmap,
567 .transfer_flush_region = u_default_transfer_flush_region,
568 .get_internal_format = panfrost_resource_get_internal_format,
569 .set_stencil = panfrost_resource_set_stencil,
570 .get_stencil = panfrost_resource_get_stencil,
571 };
572
573 void
574 panfrost_resource_screen_init(struct panfrost_screen *pscreen)
575 {
576 //pscreen->base.resource_create_with_modifiers =
577 // panfrost_resource_create_with_modifiers;
578 pscreen->base.resource_create = u_transfer_helper_resource_create;
579 pscreen->base.resource_destroy = u_transfer_helper_resource_destroy;
580 pscreen->base.resource_from_handle = panfrost_resource_from_handle;
581 pscreen->base.resource_get_handle = panfrost_resource_get_handle;
582 pscreen->base.transfer_helper = u_transfer_helper_create(&transfer_vtbl,
583 true, false,
584 true, true);
585
586 pb_slabs_init(&pscreen->slabs,
587 MIN_SLAB_ENTRY_SIZE,
588 MAX_SLAB_ENTRY_SIZE,
589
590 3, /* Number of heaps */
591
592 pscreen,
593
594 panfrost_slab_can_reclaim,
595 panfrost_slab_alloc,
596 panfrost_slab_free);
597 }
598
599 void
600 panfrost_resource_context_init(struct pipe_context *pctx)
601 {
602 pctx->transfer_map = u_transfer_helper_transfer_map;
603 pctx->transfer_flush_region = u_transfer_helper_transfer_flush_region;
604 pctx->transfer_unmap = u_transfer_helper_transfer_unmap;
605 pctx->buffer_subdata = u_default_buffer_subdata;
606 pctx->create_surface = panfrost_create_surface;
607 pctx->surface_destroy = panfrost_surface_destroy;
608 pctx->resource_copy_region = util_resource_copy_region;
609 pctx->blit = panfrost_blit;
610 pctx->flush_resource = panfrost_flush_resource;
611 pctx->invalidate_resource = panfrost_invalidate_resource;
612 pctx->transfer_flush_region = u_transfer_helper_transfer_flush_region;
613 pctx->buffer_subdata = u_default_buffer_subdata;
614 pctx->texture_subdata = u_default_texture_subdata;
615 }