2 * Copyright (C) 2008 VMware, Inc.
3 * Copyright (C) 2014 Broadcom
4 * Copyright (C) 2018-2019 Alyssa Rosenzweig
5 * Copyright (C) 2019 Collabora
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the "Software"),
9 * to deal in the Software without restriction, including without limitation
10 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
11 * and/or sell copies of the Software, and to permit persons to whom the
12 * Software is furnished to do so, subject to the following conditions:
14 * The above copyright notice and this permission notice (including the next
15 * paragraph) shall be included in all copies or substantial portions of the
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
21 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
23 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
26 * Authors (Collabora):
27 * Tomeu Vizoso <tomeu.vizoso@collabora.com>
28 * Alyssa Rosenzweig <alyssa.rosenzweig@collabora.com>
34 #include "drm-uapi/drm_fourcc.h"
36 #include "state_tracker/winsys_handle.h"
37 #include "util/u_format.h"
38 #include "util/u_memory.h"
39 #include "util/u_surface.h"
40 #include "util/u_transfer.h"
41 #include "util/u_transfer_helper.h"
43 #include "pan_context.h"
44 #include "pan_screen.h"
45 #include "pan_resource.h"
46 #include "pan_swizzle.h"
49 static struct pipe_resource
*
50 panfrost_resource_from_handle(struct pipe_screen
*pscreen
,
51 const struct pipe_resource
*templat
,
52 struct winsys_handle
*whandle
,
55 struct panfrost_screen
*screen
= pan_screen(pscreen
);
56 struct panfrost_resource
*rsc
;
57 struct pipe_resource
*prsc
;
59 assert(whandle
->type
== WINSYS_HANDLE_TYPE_FD
);
61 rsc
= CALLOC_STRUCT(panfrost_resource
);
69 pipe_reference_init(&prsc
->reference
, 1);
70 prsc
->screen
= pscreen
;
72 rsc
->bo
= screen
->driver
->import_bo(screen
, whandle
);
73 rsc
->bo
->slices
[0].stride
= whandle
->stride
;
77 renderonly_create_gpu_import_for_resource(prsc
, screen
->ro
, NULL
);
78 /* failure is expected in some cases.. */
85 panfrost_resource_get_handle(struct pipe_screen
*pscreen
,
86 struct pipe_context
*ctx
,
87 struct pipe_resource
*pt
,
88 struct winsys_handle
*handle
,
91 struct panfrost_screen
*screen
= pan_screen(pscreen
);
92 struct panfrost_resource
*rsrc
= (struct panfrost_resource
*) pt
;
93 struct renderonly_scanout
*scanout
= rsrc
->scanout
;
95 handle
->modifier
= DRM_FORMAT_MOD_INVALID
;
97 if (handle
->type
== WINSYS_HANDLE_TYPE_SHARED
) {
99 } else if (handle
->type
== WINSYS_HANDLE_TYPE_KMS
) {
100 if (renderonly_get_handle(scanout
, handle
))
103 handle
->handle
= rsrc
->bo
->gem_handle
;
104 handle
->stride
= rsrc
->bo
->slices
[0].stride
;
106 } else if (handle
->type
== WINSYS_HANDLE_TYPE_FD
) {
108 struct drm_prime_handle args
= {
109 .handle
= scanout
->handle
,
110 .flags
= DRM_CLOEXEC
,
113 int ret
= drmIoctl(screen
->ro
->kms_fd
, DRM_IOCTL_PRIME_HANDLE_TO_FD
, &args
);
117 handle
->stride
= scanout
->stride
;
118 handle
->handle
= args
.fd
;
122 return screen
->driver
->export_bo(screen
, rsrc
->bo
->gem_handle
, rsrc
->bo
->slices
[0].stride
, handle
);
129 panfrost_flush_resource(struct pipe_context
*pctx
, struct pipe_resource
*prsc
)
131 //DBG("TODO %s\n", __func__);
134 static struct pipe_surface
*
135 panfrost_create_surface(struct pipe_context
*pipe
,
136 struct pipe_resource
*pt
,
137 const struct pipe_surface
*surf_tmpl
)
139 struct pipe_surface
*ps
= NULL
;
141 ps
= CALLOC_STRUCT(pipe_surface
);
144 pipe_reference_init(&ps
->reference
, 1);
145 pipe_resource_reference(&ps
->texture
, pt
);
147 ps
->format
= surf_tmpl
->format
;
149 if (pt
->target
!= PIPE_BUFFER
) {
150 assert(surf_tmpl
->u
.tex
.level
<= pt
->last_level
);
151 ps
->width
= u_minify(pt
->width0
, surf_tmpl
->u
.tex
.level
);
152 ps
->height
= u_minify(pt
->height0
, surf_tmpl
->u
.tex
.level
);
153 ps
->u
.tex
.level
= surf_tmpl
->u
.tex
.level
;
154 ps
->u
.tex
.first_layer
= surf_tmpl
->u
.tex
.first_layer
;
155 ps
->u
.tex
.last_layer
= surf_tmpl
->u
.tex
.last_layer
;
157 /* setting width as number of elements should get us correct renderbuffer width */
158 ps
->width
= surf_tmpl
->u
.buf
.last_element
- surf_tmpl
->u
.buf
.first_element
+ 1;
159 ps
->height
= pt
->height0
;
160 ps
->u
.buf
.first_element
= surf_tmpl
->u
.buf
.first_element
;
161 ps
->u
.buf
.last_element
= surf_tmpl
->u
.buf
.last_element
;
162 assert(ps
->u
.buf
.first_element
<= ps
->u
.buf
.last_element
);
163 assert(ps
->u
.buf
.last_element
< ps
->width
);
171 panfrost_surface_destroy(struct pipe_context
*pipe
,
172 struct pipe_surface
*surf
)
174 assert(surf
->texture
);
175 pipe_resource_reference(&surf
->texture
, NULL
);
180 panfrost_setup_slices(const struct pipe_resource
*tmpl
, struct panfrost_bo
*bo
)
182 unsigned width
= tmpl
->width0
;
183 unsigned height
= tmpl
->height0
;
184 unsigned bytes_per_pixel
= util_format_get_blocksize(tmpl
->format
);
186 /* Tiled operates blockwise; linear is packed. Also, anything
187 * we render to has to be tile-aligned. Maybe not strictly
188 * necessary, but we're not *that* pressed for memory and it
189 * makes code a lot simpler */
191 bool renderable
= tmpl
->bind
& PIPE_BIND_RENDER_TARGET
;
192 bool tiled
= bo
->layout
== PAN_TILED
;
193 bool should_align
= renderable
|| tiled
;
197 for (unsigned l
= 0; l
<= tmpl
->last_level
; ++l
) {
198 struct panfrost_slice
*slice
= &bo
->slices
[l
];
200 unsigned effective_width
= width
;
201 unsigned effective_height
= height
;
204 effective_width
= ALIGN(effective_width
, 16);
205 effective_height
= ALIGN(effective_height
, 16);
208 slice
->offset
= offset
;
210 /* Compute the would-be stride */
211 unsigned stride
= bytes_per_pixel
* effective_width
;
213 /* ..but cache-line align it for performance */
214 stride
= ALIGN(stride
, 64);
215 slice
->stride
= stride
;
217 offset
+= slice
->stride
* effective_height
;
219 width
= u_minify(width
, 1);
220 height
= u_minify(height
, 1);
223 assert(tmpl
->array_size
);
225 bo
->cubemap_stride
= ALIGN(offset
, 64);
226 bo
->size
= ALIGN(bo
->cubemap_stride
* tmpl
->array_size
, 4096);
229 static struct panfrost_bo
*
230 panfrost_create_bo(struct panfrost_screen
*screen
, const struct pipe_resource
*template)
232 struct panfrost_bo
*bo
= CALLOC_STRUCT(panfrost_bo
);
233 pipe_reference_init(&bo
->reference
, 1);
235 /* Based on the usage, figure out what storing will be used. There are
238 * Linear: the basic format, bad for memory bandwidth, bad for cache
239 * use. Zero-copy, though. Renderable.
241 * Tiled: Not compressed, but cache-optimized. Expensive to write into
242 * (due to software tiling), but cheap to sample from. Ideal for most
245 * AFBC: Compressed and renderable (so always desirable for non-scanout
246 * rendertargets). Cheap to sample from. The format is black box, so we
247 * can't read/write from software.
250 /* Tiling textures is almost always faster, unless we only use it once */
251 bool should_tile
= (template->usage
!= PIPE_USAGE_STREAM
) && (template->bind
& PIPE_BIND_SAMPLER_VIEW
);
253 /* For unclear reasons, depth/stencil is faster linear than AFBC, so
254 * make sure it's linear */
256 if (template->bind
& PIPE_BIND_DEPTH_STENCIL
)
259 /* Set the layout appropriately */
260 bo
->layout
= should_tile
? PAN_TILED
: PAN_LINEAR
;
262 panfrost_setup_slices(template, bo
);
264 if (bo
->layout
== PAN_TILED
|| bo
->layout
== PAN_LINEAR
) {
265 struct panfrost_memory mem
;
267 screen
->driver
->allocate_slab(screen
, &mem
, bo
->size
/ 4096, true, 0, 0, 0);
271 bo
->gem_handle
= mem
.gem_handle
;
277 static struct pipe_resource
*
278 panfrost_resource_create(struct pipe_screen
*screen
,
279 const struct pipe_resource
*template)
281 struct panfrost_resource
*so
= CALLOC_STRUCT(panfrost_resource
);
282 struct panfrost_screen
*pscreen
= (struct panfrost_screen
*) screen
;
284 so
->base
= *template;
285 so
->base
.screen
= screen
;
287 pipe_reference_init(&so
->base
.reference
, 1);
289 /* Make sure we're familiar */
290 switch (template->target
) {
292 case PIPE_TEXTURE_1D
:
293 case PIPE_TEXTURE_2D
:
294 case PIPE_TEXTURE_3D
:
295 case PIPE_TEXTURE_CUBE
:
296 case PIPE_TEXTURE_RECT
:
299 DBG("Unknown texture target %d\n", template->target
);
303 util_range_init(&so
->valid_buffer_range
);
305 if (template->bind
& PIPE_BIND_DISPLAY_TARGET
||
306 template->bind
& PIPE_BIND_SCANOUT
||
307 template->bind
& PIPE_BIND_SHARED
) {
308 struct pipe_resource scanout_templat
= *template;
309 struct renderonly_scanout
*scanout
;
310 struct winsys_handle handle
;
312 scanout
= renderonly_scanout_for_resource(&scanout_templat
,
313 pscreen
->ro
, &handle
);
317 assert(handle
.type
== WINSYS_HANDLE_TYPE_FD
);
318 /* TODO: handle modifiers? */
319 so
= pan_resource(screen
->resource_from_handle(screen
, template,
321 PIPE_HANDLE_USAGE_FRAMEBUFFER_WRITE
));
322 close(handle
.handle
);
326 so
->scanout
= scanout
;
327 pscreen
->display_target
= so
;
329 so
->bo
= panfrost_create_bo(pscreen
, template);
332 return (struct pipe_resource
*)so
;
336 panfrost_destroy_bo(struct panfrost_screen
*screen
, struct panfrost_bo
*pbo
)
338 struct panfrost_bo
*bo
= (struct panfrost_bo
*)pbo
;
340 if ((bo
->layout
== PAN_LINEAR
|| bo
->layout
== PAN_TILED
) &&
342 struct panfrost_memory mem
= {
346 .gem_handle
= bo
->gem_handle
,
349 screen
->driver
->free_slab(screen
, &mem
);
352 if (bo
->layout
== PAN_AFBC
) {
354 DBG("--leaking afbc (%d bytes)--\n", bo
->afbc_metadata_size
);
357 if (bo
->has_checksum
) {
358 struct panfrost_memory mem
= {
359 .cpu
= bo
->checksum_slab
.cpu
,
360 .gpu
= bo
->checksum_slab
.gpu
,
361 .size
= bo
->checksum_slab
.size
,
362 .gem_handle
= bo
->checksum_slab
.gem_handle
,
365 screen
->driver
->free_slab(screen
, &mem
);
369 screen
->driver
->free_imported_bo(screen
, bo
);
374 panfrost_bo_reference(struct panfrost_bo
*bo
)
376 pipe_reference(NULL
, &bo
->reference
);
380 panfrost_bo_unreference(struct pipe_screen
*screen
, struct panfrost_bo
*bo
)
382 /* When the reference count goes to zero, we need to cleanup */
384 if (pipe_reference(&bo
->reference
, NULL
)) {
385 panfrost_destroy_bo(pan_screen(screen
), bo
);
390 panfrost_resource_destroy(struct pipe_screen
*screen
,
391 struct pipe_resource
*pt
)
393 struct panfrost_screen
*pscreen
= pan_screen(screen
);
394 struct panfrost_resource
*rsrc
= (struct panfrost_resource
*) pt
;
397 renderonly_scanout_destroy(rsrc
->scanout
, pscreen
->ro
);
400 panfrost_bo_unreference(screen
, rsrc
->bo
);
402 util_range_destroy(&rsrc
->valid_buffer_range
);
407 panfrost_transfer_map(struct pipe_context
*pctx
,
408 struct pipe_resource
*resource
,
410 unsigned usage
, /* a combination of PIPE_TRANSFER_x */
411 const struct pipe_box
*box
,
412 struct pipe_transfer
**out_transfer
)
414 int bytes_per_pixel
= util_format_get_blocksize(resource
->format
);
415 struct panfrost_resource
*rsrc
= pan_resource(resource
);
416 struct panfrost_bo
*bo
= rsrc
->bo
;
418 struct panfrost_gtransfer
*transfer
= CALLOC_STRUCT(panfrost_gtransfer
);
419 transfer
->base
.level
= level
;
420 transfer
->base
.usage
= usage
;
421 transfer
->base
.box
= *box
;
423 pipe_resource_reference(&transfer
->base
.resource
, resource
);
425 *out_transfer
= &transfer
->base
;
427 /* Check if we're bound for rendering and this is a read pixels. If so,
428 * we need to flush */
430 struct panfrost_context
*ctx
= pan_context(pctx
);
431 struct pipe_framebuffer_state
*fb
= &ctx
->pipe_framebuffer
;
433 bool is_bound
= false;
435 for (unsigned c
= 0; c
< fb
->nr_cbufs
; ++c
) {
436 is_bound
|= fb
->cbufs
[c
]->texture
== resource
;
439 if (is_bound
&& (usage
& PIPE_TRANSFER_READ
)) {
441 panfrost_flush(pctx
, NULL
, PIPE_FLUSH_END_OF_FRAME
);
444 /* TODO: Respect usage flags */
446 if (usage
& PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE
) {
447 /* TODO: reallocate */
448 //printf("debug: Missed reallocate\n");
449 } else if ((usage
& PIPE_TRANSFER_WRITE
)
450 && resource
->target
== PIPE_BUFFER
451 && !util_ranges_intersect(&rsrc
->valid_buffer_range
, box
->x
, box
->x
+ box
->width
)) {
452 /* No flush for writes to uninitialized */
453 } else if (!(usage
& PIPE_TRANSFER_UNSYNCHRONIZED
)) {
454 if (usage
& PIPE_TRANSFER_WRITE
) {
455 /* STUB: flush reading */
456 //printf("debug: missed reading flush %d\n", resource->target);
457 } else if (usage
& PIPE_TRANSFER_READ
) {
458 /* STUB: flush writing */
459 //printf("debug: missed writing flush %d (%d-%d)\n", resource->target, box->x, box->x + box->width);
461 /* Why are you even mapping?! */
465 if (bo
->layout
!= PAN_LINEAR
) {
466 /* Non-linear resources need to be indirectly mapped */
468 if (usage
& PIPE_TRANSFER_MAP_DIRECTLY
)
471 transfer
->base
.stride
= box
->width
* bytes_per_pixel
;
472 transfer
->base
.layer_stride
= transfer
->base
.stride
* box
->height
;
475 transfer
->map
= malloc(transfer
->base
.layer_stride
* box
->depth
);
477 return transfer
->map
;
479 transfer
->base
.stride
= bo
->slices
[level
].stride
;
480 transfer
->base
.layer_stride
= bo
->cubemap_stride
;
483 + bo
->slices
[level
].offset
484 + transfer
->base
.box
.z
* bo
->cubemap_stride
485 + transfer
->base
.box
.y
* bo
->slices
[level
].stride
486 + transfer
->base
.box
.x
* bytes_per_pixel
;
491 panfrost_tile_texture(struct panfrost_screen
*screen
, struct panfrost_resource
*rsrc
, struct panfrost_gtransfer
*trans
)
493 struct panfrost_bo
*bo
= (struct panfrost_bo
*)rsrc
->bo
;
495 unsigned level
= trans
->base
.level
;
497 panfrost_texture_swizzle(
500 trans
->base
.box
.width
,
501 trans
->base
.box
.height
,
502 util_format_get_blocksize(rsrc
->base
.format
),
503 u_minify(rsrc
->base
.width0
, level
),
506 + bo
->slices
[level
].offset
507 + bo
->cubemap_stride
* trans
->base
.box
.z
512 panfrost_transfer_unmap(struct pipe_context
*pctx
,
513 struct pipe_transfer
*transfer
)
515 struct panfrost_context
*ctx
= pan_context(pctx
);
517 /* Gallium expects writeback here, so we tile */
519 struct panfrost_gtransfer
*trans
= pan_transfer(transfer
);
520 struct panfrost_resource
*prsrc
= (struct panfrost_resource
*) transfer
->resource
;
523 struct panfrost_bo
*bo
= prsrc
->bo
;
525 if (transfer
->usage
& PIPE_TRANSFER_WRITE
) {
527 if (bo
->layout
== PAN_AFBC
) {
528 DBG("Unimplemented: writes to AFBC\n");
529 } else if (bo
->layout
== PAN_TILED
) {
530 struct pipe_context
*gallium
= (struct pipe_context
*) ctx
;
531 struct panfrost_screen
*screen
= pan_screen(gallium
->screen
);
532 assert(transfer
->box
.depth
== 1);
533 panfrost_tile_texture(screen
, prsrc
, trans
);
541 util_range_add(&prsrc
->valid_buffer_range
,
543 transfer
->box
.x
+ transfer
->box
.width
);
545 /* Derefence the resource */
546 pipe_resource_reference(&transfer
->resource
, NULL
);
548 /* Transfer itself is CALLOCed at the moment */
553 panfrost_transfer_flush_region(struct pipe_context
*pctx
,
554 struct pipe_transfer
*transfer
,
555 const struct pipe_box
*box
)
557 struct panfrost_resource
*rsc
= pan_resource(transfer
->resource
);
559 if (transfer
->resource
->target
== PIPE_BUFFER
) {
560 util_range_add(&rsc
->valid_buffer_range
,
561 transfer
->box
.x
+ box
->x
,
562 transfer
->box
.x
+ box
->x
+ box
->width
);
566 static struct pb_slab
*
567 panfrost_slab_alloc(void *priv
, unsigned heap
, unsigned entry_size
, unsigned group_index
)
569 struct panfrost_screen
*screen
= (struct panfrost_screen
*) priv
;
570 struct panfrost_memory
*mem
= CALLOC_STRUCT(panfrost_memory
);
572 size_t slab_size
= (1 << (MAX_SLAB_ENTRY_SIZE
+ 1));
574 mem
->slab
.num_entries
= slab_size
/ entry_size
;
575 mem
->slab
.num_free
= mem
->slab
.num_entries
;
577 LIST_INITHEAD(&mem
->slab
.free
);
578 for (unsigned i
= 0; i
< mem
->slab
.num_entries
; ++i
) {
579 /* Create a slab entry */
580 struct panfrost_memory_entry
*entry
= CALLOC_STRUCT(panfrost_memory_entry
);
581 entry
->offset
= entry_size
* i
;
583 entry
->base
.slab
= &mem
->slab
;
584 entry
->base
.group_index
= group_index
;
586 LIST_ADDTAIL(&entry
->base
.head
, &mem
->slab
.free
);
589 /* Actually allocate the memory from kernel-space. Mapped, same_va, no
592 screen
->driver
->allocate_slab(screen
, mem
, slab_size
/ 4096, true, 0, 0, 0);
598 panfrost_slab_can_reclaim(void *priv
, struct pb_slab_entry
*entry
)
600 struct panfrost_memory_entry
*p_entry
= (struct panfrost_memory_entry
*) entry
;
601 return p_entry
->freed
;
605 panfrost_slab_free(void *priv
, struct pb_slab
*slab
)
607 struct panfrost_memory
*mem
= (struct panfrost_memory
*) slab
;
608 struct panfrost_screen
*screen
= (struct panfrost_screen
*) priv
;
610 screen
->driver
->free_slab(screen
, mem
);
614 panfrost_invalidate_resource(struct pipe_context
*pctx
, struct pipe_resource
*prsc
)
616 //DBG("TODO %s\n", __func__);
619 static enum pipe_format
620 panfrost_resource_get_internal_format(struct pipe_resource
*prsrc
)
622 return prsrc
->format
;
626 panfrost_resource_set_stencil(struct pipe_resource
*prsrc
,
627 struct pipe_resource
*stencil
)
629 pan_resource(prsrc
)->separate_stencil
= pan_resource(stencil
);
632 static struct pipe_resource
*
633 panfrost_resource_get_stencil(struct pipe_resource
*prsrc
)
635 return &pan_resource(prsrc
)->separate_stencil
->base
;
638 static const struct u_transfer_vtbl transfer_vtbl
= {
639 .resource_create
= panfrost_resource_create
,
640 .resource_destroy
= panfrost_resource_destroy
,
641 .transfer_map
= panfrost_transfer_map
,
642 .transfer_unmap
= panfrost_transfer_unmap
,
643 .transfer_flush_region
= panfrost_transfer_flush_region
,
644 .get_internal_format
= panfrost_resource_get_internal_format
,
645 .set_stencil
= panfrost_resource_set_stencil
,
646 .get_stencil
= panfrost_resource_get_stencil
,
650 panfrost_resource_screen_init(struct panfrost_screen
*pscreen
)
652 //pscreen->base.resource_create_with_modifiers =
653 // panfrost_resource_create_with_modifiers;
654 pscreen
->base
.resource_create
= u_transfer_helper_resource_create
;
655 pscreen
->base
.resource_destroy
= u_transfer_helper_resource_destroy
;
656 pscreen
->base
.resource_from_handle
= panfrost_resource_from_handle
;
657 pscreen
->base
.resource_get_handle
= panfrost_resource_get_handle
;
658 pscreen
->base
.transfer_helper
= u_transfer_helper_create(&transfer_vtbl
,
662 pb_slabs_init(&pscreen
->slabs
,
666 3, /* Number of heaps */
670 panfrost_slab_can_reclaim
,
676 panfrost_resource_context_init(struct pipe_context
*pctx
)
678 pctx
->transfer_map
= u_transfer_helper_transfer_map
;
679 pctx
->transfer_flush_region
= u_transfer_helper_transfer_flush_region
;
680 pctx
->transfer_unmap
= u_transfer_helper_transfer_unmap
;
681 pctx
->buffer_subdata
= u_default_buffer_subdata
;
682 pctx
->create_surface
= panfrost_create_surface
;
683 pctx
->surface_destroy
= panfrost_surface_destroy
;
684 pctx
->resource_copy_region
= util_resource_copy_region
;
685 pctx
->blit
= panfrost_blit
;
686 pctx
->flush_resource
= panfrost_flush_resource
;
687 pctx
->invalidate_resource
= panfrost_invalidate_resource
;
688 pctx
->transfer_flush_region
= u_transfer_helper_transfer_flush_region
;
689 pctx
->buffer_subdata
= u_default_buffer_subdata
;
690 pctx
->texture_subdata
= u_default_texture_subdata
;