2 * Copyright © 2014-2017 Broadcom
3 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
25 #include "pipe/p_defines.h"
26 #include "util/u_blit.h"
27 #include "util/u_memory.h"
28 #include "util/u_format.h"
29 #include "util/u_inlines.h"
30 #include "util/u_surface.h"
31 #include "util/u_transfer_helper.h"
32 #include "util/u_upload_mgr.h"
33 #include "util/u_format_zs.h"
34 #include "util/u_drm.h"
36 #include "drm-uapi/drm_fourcc.h"
37 #include "v3d_screen.h"
38 #include "v3d_context.h"
39 #include "v3d_resource.h"
40 #include "v3d_tiling.h"
41 #include "broadcom/cle/v3d_packet_v33_pack.h"
44 v3d_debug_resource_layout(struct v3d_resource
*rsc
, const char *caller
)
46 if (!(V3D_DEBUG
& V3D_DEBUG_SURFACE
))
49 struct pipe_resource
*prsc
= &rsc
->base
;
51 if (prsc
->target
== PIPE_BUFFER
) {
53 "rsc %s %p (format %s), %dx%d buffer @0x%08x-0x%08x\n",
55 util_format_short_name(prsc
->format
),
56 prsc
->width0
, prsc
->height0
,
58 rsc
->bo
->offset
+ rsc
->bo
->size
- 1);
62 static const char *const tiling_descriptions
[] = {
63 [VC5_TILING_RASTER
] = "R",
64 [VC5_TILING_LINEARTILE
] = "LT",
65 [VC5_TILING_UBLINEAR_1_COLUMN
] = "UB1",
66 [VC5_TILING_UBLINEAR_2_COLUMN
] = "UB2",
67 [VC5_TILING_UIF_NO_XOR
] = "UIF",
68 [VC5_TILING_UIF_XOR
] = "UIF^",
71 for (int i
= 0; i
<= prsc
->last_level
; i
++) {
72 struct v3d_resource_slice
*slice
= &rsc
->slices
[i
];
74 int level_width
= slice
->stride
/ rsc
->cpp
;
75 int level_height
= slice
->padded_height
;
77 u_minify(util_next_power_of_two(prsc
->depth0
), i
);
80 "rsc %s %p (format %s), %dx%d: "
81 "level %d (%s) %dx%dx%d -> %dx%dx%d, stride %d@0x%08x\n",
83 util_format_short_name(prsc
->format
),
84 prsc
->width0
, prsc
->height0
,
85 i
, tiling_descriptions
[slice
->tiling
],
86 u_minify(prsc
->width0
, i
),
87 u_minify(prsc
->height0
, i
),
88 u_minify(prsc
->depth0
, i
),
93 rsc
->bo
->offset
+ slice
->offset
);
98 v3d_resource_bo_alloc(struct v3d_resource
*rsc
)
100 struct pipe_resource
*prsc
= &rsc
->base
;
101 struct pipe_screen
*pscreen
= prsc
->screen
;
104 bo
= v3d_bo_alloc(v3d_screen(pscreen
), rsc
->size
, "resource");
106 v3d_bo_unreference(&rsc
->bo
);
108 v3d_debug_resource_layout(rsc
, "alloc");
116 v3d_resource_transfer_unmap(struct pipe_context
*pctx
,
117 struct pipe_transfer
*ptrans
)
119 struct v3d_context
*v3d
= v3d_context(pctx
);
120 struct v3d_transfer
*trans
= v3d_transfer(ptrans
);
123 struct v3d_resource
*rsc
= v3d_resource(ptrans
->resource
);
124 struct v3d_resource_slice
*slice
= &rsc
->slices
[ptrans
->level
];
126 if (ptrans
->usage
& PIPE_TRANSFER_WRITE
) {
127 for (int z
= 0; z
< ptrans
->box
.depth
; z
++) {
128 void *dst
= rsc
->bo
->map
+
129 v3d_layer_offset(&rsc
->base
,
132 v3d_store_tiled_image(dst
,
136 ptrans
->box
.height
* z
),
138 slice
->tiling
, rsc
->cpp
,
139 slice
->padded_height
,
146 pipe_resource_reference(&ptrans
->resource
, NULL
);
147 slab_free(&v3d
->transfer_pool
, ptrans
);
151 v3d_map_usage_prep(struct pipe_context
*pctx
,
152 struct pipe_resource
*prsc
,
155 struct v3d_context
*v3d
= v3d_context(pctx
);
156 struct v3d_resource
*rsc
= v3d_resource(prsc
);
158 if (usage
& PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE
) {
159 if (v3d_resource_bo_alloc(rsc
)) {
160 /* If it might be bound as one of our vertex buffers
161 * or UBOs, make sure we re-emit vertex buffer state
164 if (prsc
->bind
& PIPE_BIND_VERTEX_BUFFER
)
165 v3d
->dirty
|= VC5_DIRTY_VTXBUF
;
166 if (prsc
->bind
& PIPE_BIND_CONSTANT_BUFFER
)
167 v3d
->dirty
|= VC5_DIRTY_CONSTBUF
;
169 /* If we failed to reallocate, flush users so that we
170 * don't violate any syncing requirements.
172 v3d_flush_jobs_reading_resource(v3d
, prsc
);
174 } else if (!(usage
& PIPE_TRANSFER_UNSYNCHRONIZED
)) {
175 /* If we're writing and the buffer is being used by the CL, we
176 * have to flush the CL first. If we're only reading, we need
177 * to flush if the CL has written our buffer.
179 if (usage
& PIPE_TRANSFER_WRITE
)
180 v3d_flush_jobs_reading_resource(v3d
, prsc
);
182 v3d_flush_jobs_writing_resource(v3d
, prsc
);
185 if (usage
& PIPE_TRANSFER_WRITE
) {
187 rsc
->initialized_buffers
= ~0;
192 v3d_resource_transfer_map(struct pipe_context
*pctx
,
193 struct pipe_resource
*prsc
,
194 unsigned level
, unsigned usage
,
195 const struct pipe_box
*box
,
196 struct pipe_transfer
**pptrans
)
198 struct v3d_context
*v3d
= v3d_context(pctx
);
199 struct v3d_resource
*rsc
= v3d_resource(prsc
);
200 struct v3d_transfer
*trans
;
201 struct pipe_transfer
*ptrans
;
202 enum pipe_format format
= prsc
->format
;
205 /* MSAA maps should have been handled by u_transfer_helper. */
206 assert(prsc
->nr_samples
<= 1);
208 /* Upgrade DISCARD_RANGE to WHOLE_RESOURCE if the whole resource is
211 if ((usage
& PIPE_TRANSFER_DISCARD_RANGE
) &&
212 !(usage
& PIPE_TRANSFER_UNSYNCHRONIZED
) &&
213 !(prsc
->flags
& PIPE_RESOURCE_FLAG_MAP_PERSISTENT
) &&
214 prsc
->last_level
== 0 &&
215 prsc
->width0
== box
->width
&&
216 prsc
->height0
== box
->height
&&
217 prsc
->depth0
== box
->depth
&&
218 prsc
->array_size
== 1 &&
220 usage
|= PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE
;
223 v3d_map_usage_prep(pctx
, prsc
, usage
);
225 trans
= slab_alloc(&v3d
->transfer_pool
);
229 /* XXX: Handle DONTBLOCK, DISCARD_RANGE, PERSISTENT, COHERENT. */
231 /* slab_alloc_st() doesn't zero: */
232 memset(trans
, 0, sizeof(*trans
));
233 ptrans
= &trans
->base
;
235 pipe_resource_reference(&ptrans
->resource
, prsc
);
236 ptrans
->level
= level
;
237 ptrans
->usage
= usage
;
240 /* Note that the current kernel implementation is synchronous, so no
241 * need to do syncing stuff here yet.
244 if (usage
& PIPE_TRANSFER_UNSYNCHRONIZED
)
245 buf
= v3d_bo_map_unsynchronized(rsc
->bo
);
247 buf
= v3d_bo_map(rsc
->bo
);
249 fprintf(stderr
, "Failed to map bo\n");
255 /* Our load/store routines work on entire compressed blocks. */
256 ptrans
->box
.x
/= util_format_get_blockwidth(format
);
257 ptrans
->box
.y
/= util_format_get_blockheight(format
);
258 ptrans
->box
.width
= DIV_ROUND_UP(ptrans
->box
.width
,
259 util_format_get_blockwidth(format
));
260 ptrans
->box
.height
= DIV_ROUND_UP(ptrans
->box
.height
,
261 util_format_get_blockheight(format
));
263 struct v3d_resource_slice
*slice
= &rsc
->slices
[level
];
265 /* No direct mappings of tiled, since we need to manually
268 if (usage
& PIPE_TRANSFER_MAP_DIRECTLY
)
271 ptrans
->stride
= ptrans
->box
.width
* rsc
->cpp
;
272 ptrans
->layer_stride
= ptrans
->stride
* ptrans
->box
.height
;
274 trans
->map
= malloc(ptrans
->layer_stride
* ptrans
->box
.depth
);
276 if (usage
& PIPE_TRANSFER_READ
) {
277 for (int z
= 0; z
< ptrans
->box
.depth
; z
++) {
278 void *src
= rsc
->bo
->map
+
279 v3d_layer_offset(&rsc
->base
,
282 v3d_load_tiled_image((trans
->map
+
284 ptrans
->box
.height
* z
),
288 slice
->tiling
, rsc
->cpp
,
289 slice
->padded_height
,
295 ptrans
->stride
= slice
->stride
;
296 ptrans
->layer_stride
= rsc
->cube_map_stride
;
298 return buf
+ slice
->offset
+
299 ptrans
->box
.y
* ptrans
->stride
+
300 ptrans
->box
.x
* rsc
->cpp
+
301 ptrans
->box
.z
* rsc
->cube_map_stride
;
306 v3d_resource_transfer_unmap(pctx
, ptrans
);
311 v3d_texture_subdata(struct pipe_context
*pctx
,
312 struct pipe_resource
*prsc
,
315 const struct pipe_box
*box
,
318 unsigned layer_stride
)
320 struct v3d_resource
*rsc
= v3d_resource(prsc
);
321 struct v3d_resource_slice
*slice
= &rsc
->slices
[level
];
323 /* For a direct mapping, we can just take the u_transfer path. */
325 return u_default_texture_subdata(pctx
, prsc
, level
, usage
, box
,
326 data
, stride
, layer_stride
);
329 /* Otherwise, map and store the texture data directly into the tiled
330 * texture. Note that gallium's texture_subdata may be called with
331 * obvious usage flags missing!
333 v3d_map_usage_prep(pctx
, prsc
, usage
| (PIPE_TRANSFER_WRITE
|
334 PIPE_TRANSFER_DISCARD_RANGE
));
337 if (usage
& PIPE_TRANSFER_UNSYNCHRONIZED
)
338 buf
= v3d_bo_map_unsynchronized(rsc
->bo
);
340 buf
= v3d_bo_map(rsc
->bo
);
342 for (int i
= 0; i
< box
->depth
; i
++) {
343 v3d_store_tiled_image(buf
+
344 v3d_layer_offset(&rsc
->base
,
348 (void *)data
+ layer_stride
* i
,
350 slice
->tiling
, rsc
->cpp
, slice
->padded_height
,
356 v3d_resource_destroy(struct pipe_screen
*pscreen
,
357 struct pipe_resource
*prsc
)
359 struct v3d_screen
*screen
= v3d_screen(pscreen
);
360 struct v3d_resource
*rsc
= v3d_resource(prsc
);
363 renderonly_scanout_destroy(rsc
->scanout
, screen
->ro
);
365 v3d_bo_unreference(&rsc
->bo
);
370 v3d_resource_get_handle(struct pipe_screen
*pscreen
,
371 struct pipe_context
*pctx
,
372 struct pipe_resource
*prsc
,
373 struct winsys_handle
*whandle
,
376 struct v3d_screen
*screen
= v3d_screen(pscreen
);
377 struct v3d_resource
*rsc
= v3d_resource(prsc
);
378 struct v3d_bo
*bo
= rsc
->bo
;
380 whandle
->stride
= rsc
->slices
[0].stride
;
383 /* If we're passing some reference to our BO out to some other part of
384 * the system, then we can't do any optimizations about only us being
385 * the ones seeing it (like BO caching).
390 /* A shared tiled buffer should always be allocated as UIF,
391 * not UBLINEAR or LT.
393 assert(rsc
->slices
[0].tiling
== VC5_TILING_UIF_XOR
||
394 rsc
->slices
[0].tiling
== VC5_TILING_UIF_NO_XOR
);
395 whandle
->modifier
= DRM_FORMAT_MOD_BROADCOM_UIF
;
397 whandle
->modifier
= DRM_FORMAT_MOD_LINEAR
;
400 switch (whandle
->type
) {
401 case WINSYS_HANDLE_TYPE_SHARED
:
402 return v3d_bo_flink(bo
, &whandle
->handle
);
403 case WINSYS_HANDLE_TYPE_KMS
:
405 assert(rsc
->scanout
);
406 bool ok
= renderonly_get_handle(rsc
->scanout
, whandle
);
407 whandle
->stride
= rsc
->slices
[0].stride
;
410 whandle
->handle
= bo
->handle
;
412 case WINSYS_HANDLE_TYPE_FD
:
413 whandle
->handle
= v3d_bo_get_dmabuf(bo
);
414 return whandle
->handle
!= -1;
420 #define PAGE_UB_ROWS (VC5_UIFCFG_PAGE_SIZE / VC5_UIFBLOCK_ROW_SIZE)
421 #define PAGE_UB_ROWS_TIMES_1_5 ((PAGE_UB_ROWS * 3) >> 1)
422 #define PAGE_CACHE_UB_ROWS (VC5_PAGE_CACHE_SIZE / VC5_UIFBLOCK_ROW_SIZE)
423 #define PAGE_CACHE_MINUS_1_5_UB_ROWS (PAGE_CACHE_UB_ROWS - PAGE_UB_ROWS_TIMES_1_5)
426 * Computes the HW's UIFblock padding for a given height/cpp.
428 * The goal of the padding is to keep pages of the same color (bank number) at
429 * least half a page away from each other vertically when crossing between
430 * between columns of UIF blocks.
433 v3d_get_ub_pad(struct v3d_resource
*rsc
, uint32_t height
)
435 uint32_t utile_h
= v3d_utile_height(rsc
->cpp
);
436 uint32_t uif_block_h
= utile_h
* 2;
437 uint32_t height_ub
= height
/ uif_block_h
;
439 uint32_t height_offset_in_pc
= height_ub
% PAGE_CACHE_UB_ROWS
;
441 /* For the perfectly-aligned-for-UIF-XOR case, don't add any pad. */
442 if (height_offset_in_pc
== 0)
445 /* Try padding up to where we're offset by at least half a page. */
446 if (height_offset_in_pc
< PAGE_UB_ROWS_TIMES_1_5
) {
447 /* If we fit entirely in the page cache, don't pad. */
448 if (height_ub
< PAGE_CACHE_UB_ROWS
)
451 return PAGE_UB_ROWS_TIMES_1_5
- height_offset_in_pc
;
454 /* If we're close to being aligned to page cache size, then round up
457 if (height_offset_in_pc
> PAGE_CACHE_MINUS_1_5_UB_ROWS
)
458 return PAGE_CACHE_UB_ROWS
- height_offset_in_pc
;
460 /* Otherwise, we're far enough away (top and bottom) to not need any
467 v3d_setup_slices(struct v3d_resource
*rsc
, uint32_t winsys_stride
,
470 struct pipe_resource
*prsc
= &rsc
->base
;
471 uint32_t width
= prsc
->width0
;
472 uint32_t height
= prsc
->height0
;
473 uint32_t depth
= prsc
->depth0
;
474 /* Note that power-of-two padding is based on level 1. These are not
475 * equivalent to just util_next_power_of_two(dimension), because at a
476 * level 0 dimension of 9, the level 1 power-of-two padded value is 4,
479 uint32_t pot_width
= 2 * util_next_power_of_two(u_minify(width
, 1));
480 uint32_t pot_height
= 2 * util_next_power_of_two(u_minify(height
, 1));
481 uint32_t pot_depth
= 2 * util_next_power_of_two(u_minify(depth
, 1));
483 uint32_t utile_w
= v3d_utile_width(rsc
->cpp
);
484 uint32_t utile_h
= v3d_utile_height(rsc
->cpp
);
485 uint32_t uif_block_w
= utile_w
* 2;
486 uint32_t uif_block_h
= utile_h
* 2;
487 uint32_t block_width
= util_format_get_blockwidth(prsc
->format
);
488 uint32_t block_height
= util_format_get_blockheight(prsc
->format
);
489 bool msaa
= prsc
->nr_samples
> 1;
491 /* MSAA textures/renderbuffers are always laid out as single-level
496 /* Check some easy mistakes to make in a resource_create() call that
497 * will break our setup.
499 assert(prsc
->array_size
!= 0);
500 assert(prsc
->depth0
!= 0);
502 for (int i
= prsc
->last_level
; i
>= 0; i
--) {
503 struct v3d_resource_slice
*slice
= &rsc
->slices
[i
];
505 uint32_t level_width
, level_height
, level_depth
;
507 level_width
= u_minify(width
, i
);
508 level_height
= u_minify(height
, i
);
510 level_width
= u_minify(pot_width
, i
);
511 level_height
= u_minify(pot_height
, i
);
514 level_depth
= u_minify(depth
, i
);
516 level_depth
= u_minify(pot_depth
, i
);
523 level_width
= DIV_ROUND_UP(level_width
, block_width
);
524 level_height
= DIV_ROUND_UP(level_height
, block_height
);
527 slice
->tiling
= VC5_TILING_RASTER
;
528 if (prsc
->target
== PIPE_TEXTURE_1D
)
529 level_width
= align(level_width
, 64 / rsc
->cpp
);
531 if ((i
!= 0 || !uif_top
) &&
532 (level_width
<= utile_w
||
533 level_height
<= utile_h
)) {
534 slice
->tiling
= VC5_TILING_LINEARTILE
;
535 level_width
= align(level_width
, utile_w
);
536 level_height
= align(level_height
, utile_h
);
537 } else if ((i
!= 0 || !uif_top
) &&
538 level_width
<= uif_block_w
) {
539 slice
->tiling
= VC5_TILING_UBLINEAR_1_COLUMN
;
540 level_width
= align(level_width
, uif_block_w
);
541 level_height
= align(level_height
, uif_block_h
);
542 } else if ((i
!= 0 || !uif_top
) &&
543 level_width
<= 2 * uif_block_w
) {
544 slice
->tiling
= VC5_TILING_UBLINEAR_2_COLUMN
;
545 level_width
= align(level_width
, 2 * uif_block_w
);
546 level_height
= align(level_height
, uif_block_h
);
548 /* We align the width to a 4-block column of
549 * UIF blocks, but we only align height to UIF
552 level_width
= align(level_width
,
554 level_height
= align(level_height
,
557 slice
->ub_pad
= v3d_get_ub_pad(rsc
,
559 level_height
+= slice
->ub_pad
* uif_block_h
;
561 /* If the padding set us to to be aligned to
562 * the page cache size, then the HW will use
563 * the XOR bit on odd columns to get us
564 * perfectly misaligned
566 if ((level_height
/ uif_block_h
) %
567 (VC5_PAGE_CACHE_SIZE
/
568 VC5_UIFBLOCK_ROW_SIZE
) == 0) {
569 slice
->tiling
= VC5_TILING_UIF_XOR
;
571 slice
->tiling
= VC5_TILING_UIF_NO_XOR
;
576 slice
->offset
= offset
;
578 slice
->stride
= winsys_stride
;
580 slice
->stride
= level_width
* rsc
->cpp
;
581 slice
->padded_height
= level_height
;
582 slice
->size
= level_height
* slice
->stride
;
584 uint32_t slice_total_size
= slice
->size
* level_depth
;
586 /* The HW aligns level 1's base to a page if any of level 1 or
587 * below could be UIF XOR. The lower levels then inherit the
588 * alignment for as long as necesary, thanks to being power of
592 level_width
> 4 * uif_block_w
&&
593 level_height
> PAGE_CACHE_MINUS_1_5_UB_ROWS
* uif_block_h
) {
594 slice_total_size
= align(slice_total_size
,
595 VC5_UIFCFG_PAGE_SIZE
);
598 offset
+= slice_total_size
;
603 /* UIF/UBLINEAR levels need to be aligned to UIF-blocks, and LT only
604 * needs to be aligned to utile boundaries. Since tiles are laid out
605 * from small to big in memory, we need to align the later UIF slices
606 * to UIF blocks, if they were preceded by non-UIF-block-aligned LT
609 * We additionally align to 4k, which improves UIF XOR performance.
611 uint32_t page_align_offset
= (align(rsc
->slices
[0].offset
, 4096) -
612 rsc
->slices
[0].offset
);
613 if (page_align_offset
) {
614 rsc
->size
+= page_align_offset
;
615 for (int i
= 0; i
<= prsc
->last_level
; i
++)
616 rsc
->slices
[i
].offset
+= page_align_offset
;
619 /* Arrays and cube textures have a stride which is the distance from
620 * one full mipmap tree to the next (64b aligned). For 3D textures,
621 * we need to program the stride between slices of miplevel 0.
623 if (prsc
->target
!= PIPE_TEXTURE_3D
) {
624 rsc
->cube_map_stride
= align(rsc
->slices
[0].offset
+
625 rsc
->slices
[0].size
, 64);
626 rsc
->size
+= rsc
->cube_map_stride
* (prsc
->array_size
- 1);
628 rsc
->cube_map_stride
= rsc
->slices
[0].size
;
633 v3d_layer_offset(struct pipe_resource
*prsc
, uint32_t level
, uint32_t layer
)
635 struct v3d_resource
*rsc
= v3d_resource(prsc
);
636 struct v3d_resource_slice
*slice
= &rsc
->slices
[level
];
638 if (prsc
->target
== PIPE_TEXTURE_3D
)
639 return slice
->offset
+ layer
* slice
->size
;
641 return slice
->offset
+ layer
* rsc
->cube_map_stride
;
644 static struct v3d_resource
*
645 v3d_resource_setup(struct pipe_screen
*pscreen
,
646 const struct pipe_resource
*tmpl
)
648 struct v3d_screen
*screen
= v3d_screen(pscreen
);
649 struct v3d_resource
*rsc
= CALLOC_STRUCT(v3d_resource
);
652 struct pipe_resource
*prsc
= &rsc
->base
;
656 pipe_reference_init(&prsc
->reference
, 1);
657 prsc
->screen
= pscreen
;
659 if (prsc
->nr_samples
<= 1 ||
660 screen
->devinfo
.ver
>= 40 ||
661 util_format_is_depth_or_stencil(prsc
->format
)) {
662 rsc
->cpp
= util_format_get_blocksize(prsc
->format
);
663 if (screen
->devinfo
.ver
< 40 && prsc
->nr_samples
> 1)
664 rsc
->cpp
*= prsc
->nr_samples
;
666 assert(v3d_rt_format_supported(&screen
->devinfo
, prsc
->format
));
667 uint32_t output_image_format
=
668 v3d_get_rt_format(&screen
->devinfo
, prsc
->format
);
669 uint32_t internal_type
;
670 uint32_t internal_bpp
;
671 v3d_get_internal_type_bpp_for_output_format(&screen
->devinfo
,
675 switch (internal_bpp
) {
676 case V3D_INTERNAL_BPP_32
:
679 case V3D_INTERNAL_BPP_64
:
682 case V3D_INTERNAL_BPP_128
:
693 static struct pipe_resource
*
694 v3d_resource_create_with_modifiers(struct pipe_screen
*pscreen
,
695 const struct pipe_resource
*tmpl
,
696 const uint64_t *modifiers
,
699 struct v3d_screen
*screen
= v3d_screen(pscreen
);
701 bool linear_ok
= drm_find_modifier(DRM_FORMAT_MOD_LINEAR
, modifiers
, count
);
702 struct v3d_resource
*rsc
= v3d_resource_setup(pscreen
, tmpl
);
703 struct pipe_resource
*prsc
= &rsc
->base
;
704 /* Use a tiled layout if we can, for better 3D performance. */
705 bool should_tile
= true;
707 /* VBOs/PBOs are untiled (and 1 height). */
708 if (tmpl
->target
== PIPE_BUFFER
)
711 /* Cursors are always linear, and the user can request linear as well.
713 if (tmpl
->bind
& (PIPE_BIND_LINEAR
| PIPE_BIND_CURSOR
))
716 /* 1D and 1D_ARRAY textures are always raster-order. */
717 if (tmpl
->target
== PIPE_TEXTURE_1D
||
718 tmpl
->target
== PIPE_TEXTURE_1D_ARRAY
)
721 /* Scanout BOs for simulator need to be linear for interaction with
724 if (using_v3d_simulator
&&
725 tmpl
->bind
& (PIPE_BIND_SHARED
| PIPE_BIND_SCANOUT
))
728 /* If using the old-school SCANOUT flag, we don't know what the screen
729 * might support other than linear. Just force linear.
731 if (tmpl
->bind
& PIPE_BIND_SCANOUT
)
734 /* No user-specified modifier; determine our own. */
735 if (count
== 1 && modifiers
[0] == DRM_FORMAT_MOD_INVALID
) {
737 rsc
->tiled
= should_tile
;
738 } else if (should_tile
&&
739 drm_find_modifier(DRM_FORMAT_MOD_BROADCOM_UIF
,
742 } else if (linear_ok
) {
745 fprintf(stderr
, "Unsupported modifier requested\n");
749 rsc
->internal_format
= prsc
->format
;
751 v3d_setup_slices(rsc
, 0, tmpl
->bind
& PIPE_BIND_SHARED
);
753 /* If we're in a renderonly setup, use the other device to perform our
754 * allocation and just import it to v3d. The other device may be
755 * using CMA, and V3D can import from CMA but doesn't do CMA
756 * allocations on its own.
758 * We always allocate this way for SHARED, because get_handle will
759 * need a resource on the display fd.
761 if (screen
->ro
&& (tmpl
->bind
& (PIPE_BIND_SCANOUT
|
762 PIPE_BIND_SHARED
))) {
763 struct winsys_handle handle
;
764 struct pipe_resource scanout_tmpl
= {
765 .target
= prsc
->target
,
766 .format
= PIPE_FORMAT_RGBA8888_UNORM
,
767 .width0
= 1024, /* one page */
768 .height0
= align(rsc
->size
, 4096) / 4096,
774 renderonly_scanout_for_resource(&scanout_tmpl
,
779 fprintf(stderr
, "Failed to create scanout resource\n");
782 assert(handle
.type
== WINSYS_HANDLE_TYPE_FD
);
783 rsc
->bo
= v3d_bo_open_dmabuf(screen
, handle
.handle
);
784 close(handle
.handle
);
789 v3d_debug_resource_layout(rsc
, "renderonly");
793 if (!v3d_resource_bo_alloc(rsc
))
799 v3d_resource_destroy(pscreen
, prsc
);
803 struct pipe_resource
*
804 v3d_resource_create(struct pipe_screen
*pscreen
,
805 const struct pipe_resource
*tmpl
)
807 const uint64_t mod
= DRM_FORMAT_MOD_INVALID
;
808 return v3d_resource_create_with_modifiers(pscreen
, tmpl
, &mod
, 1);
811 static struct pipe_resource
*
812 v3d_resource_from_handle(struct pipe_screen
*pscreen
,
813 const struct pipe_resource
*tmpl
,
814 struct winsys_handle
*whandle
,
817 struct v3d_screen
*screen
= v3d_screen(pscreen
);
818 struct v3d_resource
*rsc
= v3d_resource_setup(pscreen
, tmpl
);
819 struct pipe_resource
*prsc
= &rsc
->base
;
820 struct v3d_resource_slice
*slice
= &rsc
->slices
[0];
825 switch (whandle
->modifier
) {
826 case DRM_FORMAT_MOD_LINEAR
:
829 case DRM_FORMAT_MOD_BROADCOM_UIF
:
832 case DRM_FORMAT_MOD_INVALID
:
833 rsc
->tiled
= screen
->ro
== NULL
;
837 "Attempt to import unsupported modifier 0x%llx\n",
838 (long long)whandle
->modifier
);
842 if (whandle
->offset
!= 0) {
844 "Attempt to import unsupported winsys offset %u\n",
849 switch (whandle
->type
) {
850 case WINSYS_HANDLE_TYPE_SHARED
:
851 rsc
->bo
= v3d_bo_open_name(screen
, whandle
->handle
);
853 case WINSYS_HANDLE_TYPE_FD
:
854 rsc
->bo
= v3d_bo_open_dmabuf(screen
, whandle
->handle
);
858 "Attempt to import unsupported handle type %d\n",
866 rsc
->internal_format
= prsc
->format
;
868 v3d_setup_slices(rsc
, whandle
->stride
, true);
869 v3d_debug_resource_layout(rsc
, "import");
872 /* Make sure that renderonly has a handle to our buffer in the
873 * display's fd, so that a later renderonly_get_handle()
874 * returns correct handles or GEM names.
877 renderonly_create_gpu_import_for_resource(prsc
,
881 fprintf(stderr
, "Failed to create scanout resource.\n");
886 if (whandle
->stride
!= slice
->stride
) {
887 static bool warned
= false;
891 "Attempting to import %dx%d %s with "
892 "unsupported stride %d instead of %d\n",
893 prsc
->width0
, prsc
->height0
,
894 util_format_short_name(prsc
->format
),
904 v3d_resource_destroy(pscreen
, prsc
);
909 v3d_update_shadow_texture(struct pipe_context
*pctx
,
910 struct pipe_sampler_view
*pview
)
912 struct v3d_context
*v3d
= v3d_context(pctx
);
913 struct v3d_sampler_view
*view
= v3d_sampler_view(pview
);
914 struct v3d_resource
*shadow
= v3d_resource(view
->texture
);
915 struct v3d_resource
*orig
= v3d_resource(pview
->texture
);
917 assert(view
->texture
!= pview
->texture
);
919 if (shadow
->writes
== orig
->writes
&& orig
->bo
->private)
922 perf_debug("Updating %dx%d@%d shadow for linear texture\n",
923 orig
->base
.width0
, orig
->base
.height0
,
924 pview
->u
.tex
.first_level
);
926 for (int i
= 0; i
<= shadow
->base
.last_level
; i
++) {
927 unsigned width
= u_minify(shadow
->base
.width0
, i
);
928 unsigned height
= u_minify(shadow
->base
.height0
, i
);
929 struct pipe_blit_info info
= {
931 .resource
= &shadow
->base
,
941 .format
= shadow
->base
.format
,
944 .resource
= &orig
->base
,
945 .level
= pview
->u
.tex
.first_level
+ i
,
954 .format
= orig
->base
.format
,
956 .mask
= util_format_get_mask(orig
->base
.format
),
958 pctx
->blit(pctx
, &info
);
961 shadow
->writes
= orig
->writes
;
964 static struct pipe_surface
*
965 v3d_create_surface(struct pipe_context
*pctx
,
966 struct pipe_resource
*ptex
,
967 const struct pipe_surface
*surf_tmpl
)
969 struct v3d_context
*v3d
= v3d_context(pctx
);
970 struct v3d_screen
*screen
= v3d
->screen
;
971 struct v3d_surface
*surface
= CALLOC_STRUCT(v3d_surface
);
972 struct v3d_resource
*rsc
= v3d_resource(ptex
);
977 assert(surf_tmpl
->u
.tex
.first_layer
== surf_tmpl
->u
.tex
.last_layer
);
979 struct pipe_surface
*psurf
= &surface
->base
;
980 unsigned level
= surf_tmpl
->u
.tex
.level
;
981 struct v3d_resource_slice
*slice
= &rsc
->slices
[level
];
983 pipe_reference_init(&psurf
->reference
, 1);
984 pipe_resource_reference(&psurf
->texture
, ptex
);
986 psurf
->context
= pctx
;
987 psurf
->format
= surf_tmpl
->format
;
988 psurf
->width
= u_minify(ptex
->width0
, level
);
989 psurf
->height
= u_minify(ptex
->height0
, level
);
990 psurf
->u
.tex
.level
= level
;
991 psurf
->u
.tex
.first_layer
= surf_tmpl
->u
.tex
.first_layer
;
992 psurf
->u
.tex
.last_layer
= surf_tmpl
->u
.tex
.last_layer
;
994 surface
->offset
= v3d_layer_offset(ptex
, level
,
995 psurf
->u
.tex
.first_layer
);
996 surface
->tiling
= slice
->tiling
;
998 surface
->format
= v3d_get_rt_format(&screen
->devinfo
, psurf
->format
);
1000 const struct util_format_description
*desc
=
1001 util_format_description(psurf
->format
);
1003 surface
->swap_rb
= (desc
->swizzle
[0] == PIPE_SWIZZLE_Z
&&
1004 psurf
->format
!= PIPE_FORMAT_B5G6R5_UNORM
);
1006 if (util_format_is_depth_or_stencil(psurf
->format
)) {
1007 switch (psurf
->format
) {
1008 case PIPE_FORMAT_Z16_UNORM
:
1009 surface
->internal_type
= V3D_INTERNAL_TYPE_DEPTH_16
;
1011 case PIPE_FORMAT_Z32_FLOAT
:
1012 case PIPE_FORMAT_Z32_FLOAT_S8X24_UINT
:
1013 surface
->internal_type
= V3D_INTERNAL_TYPE_DEPTH_32F
;
1016 surface
->internal_type
= V3D_INTERNAL_TYPE_DEPTH_24
;
1020 v3d_get_internal_type_bpp_for_output_format(&screen
->devinfo
,
1023 surface
->internal_type
= type
;
1024 surface
->internal_bpp
= bpp
;
1027 if (surface
->tiling
== VC5_TILING_UIF_NO_XOR
||
1028 surface
->tiling
== VC5_TILING_UIF_XOR
) {
1029 surface
->padded_height_of_output_image_in_uif_blocks
=
1030 (slice
->padded_height
/
1031 (2 * v3d_utile_height(rsc
->cpp
)));
1034 if (rsc
->separate_stencil
) {
1035 surface
->separate_stencil
=
1036 v3d_create_surface(pctx
, &rsc
->separate_stencil
->base
,
1040 return &surface
->base
;
1044 v3d_surface_destroy(struct pipe_context
*pctx
, struct pipe_surface
*psurf
)
1046 struct v3d_surface
*surf
= v3d_surface(psurf
);
1048 if (surf
->separate_stencil
)
1049 pipe_surface_reference(&surf
->separate_stencil
, NULL
);
1051 pipe_resource_reference(&psurf
->texture
, NULL
);
1056 v3d_flush_resource(struct pipe_context
*pctx
, struct pipe_resource
*resource
)
1058 /* All calls to flush_resource are followed by a flush of the context,
1059 * so there's nothing to do.
1063 static enum pipe_format
1064 v3d_resource_get_internal_format(struct pipe_resource
*prsc
)
1066 return v3d_resource(prsc
)->internal_format
;
1070 v3d_resource_set_stencil(struct pipe_resource
*prsc
,
1071 struct pipe_resource
*stencil
)
1073 v3d_resource(prsc
)->separate_stencil
= v3d_resource(stencil
);
1076 static struct pipe_resource
*
1077 v3d_resource_get_stencil(struct pipe_resource
*prsc
)
1079 struct v3d_resource
*rsc
= v3d_resource(prsc
);
1081 return &rsc
->separate_stencil
->base
;
1084 static const struct u_transfer_vtbl transfer_vtbl
= {
1085 .resource_create
= v3d_resource_create
,
1086 .resource_destroy
= v3d_resource_destroy
,
1087 .transfer_map
= v3d_resource_transfer_map
,
1088 .transfer_unmap
= v3d_resource_transfer_unmap
,
1089 .transfer_flush_region
= u_default_transfer_flush_region
,
1090 .get_internal_format
= v3d_resource_get_internal_format
,
1091 .set_stencil
= v3d_resource_set_stencil
,
1092 .get_stencil
= v3d_resource_get_stencil
,
1096 v3d_resource_screen_init(struct pipe_screen
*pscreen
)
1098 pscreen
->resource_create_with_modifiers
=
1099 v3d_resource_create_with_modifiers
;
1100 pscreen
->resource_create
= u_transfer_helper_resource_create
;
1101 pscreen
->resource_from_handle
= v3d_resource_from_handle
;
1102 pscreen
->resource_get_handle
= v3d_resource_get_handle
;
1103 pscreen
->resource_destroy
= u_transfer_helper_resource_destroy
;
1104 pscreen
->transfer_helper
= u_transfer_helper_create(&transfer_vtbl
,
1110 v3d_resource_context_init(struct pipe_context
*pctx
)
1112 pctx
->transfer_map
= u_transfer_helper_transfer_map
;
1113 pctx
->transfer_flush_region
= u_transfer_helper_transfer_flush_region
;
1114 pctx
->transfer_unmap
= u_transfer_helper_transfer_unmap
;
1115 pctx
->buffer_subdata
= u_default_buffer_subdata
;
1116 pctx
->texture_subdata
= v3d_texture_subdata
;
1117 pctx
->create_surface
= v3d_create_surface
;
1118 pctx
->surface_destroy
= v3d_surface_destroy
;
1119 pctx
->resource_copy_region
= util_resource_copy_region
;
1120 pctx
->blit
= v3d_blit
;
1121 pctx
->generate_mipmap
= v3d_generate_mipmap
;
1122 pctx
->flush_resource
= v3d_flush_resource
;