/*
 * Copyright © 2014-2015 Broadcom
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */
29 #include <xf86drmMode.h>
31 #include "util/u_hash_table.h"
32 #include "util/u_memory.h"
33 #include "util/ralloc.h"
35 #include "vc4_context.h"
36 #include "vc4_screen.h"
/* Compile-time switch for the BO bookkeeping diagnostics: the stale-BO sweep
 * checks it before printing to stderr and calling vc4_bo_dump_stats().
 */
static bool dump_stats = false;

/* Forward declaration: vc4_bo_alloc() empties the cache before retrying a
 * failed kernel allocation, and the definition appears later in the file.
 * NOTE(review): the "static void" line is restored from a gap in the
 * extracted listing -- confirm against the definition.
 */
static void
vc4_bo_cache_free_all(struct vc4_bo_cache *cache);
52 vc4_bo_dump_stats(struct vc4_screen
*screen
)
54 struct vc4_bo_cache
*cache
= &screen
->bo_cache
;
56 fprintf(stderr
, " BOs allocated: %d\n", screen
->bo_count
);
57 fprintf(stderr
, " BOs size: %dkb\n", screen
->bo_size
/ 1024);
58 fprintf(stderr
, " BOs cached: %d\n", cache
->bo_count
);
59 fprintf(stderr
, " BOs cached size: %dkb\n", cache
->bo_size
/ 1024);
61 if (!list_empty(&cache
->time_list
)) {
62 struct vc4_bo
*first
= LIST_ENTRY(struct vc4_bo
,
63 cache
->time_list
.next
,
65 struct vc4_bo
*last
= LIST_ENTRY(struct vc4_bo
,
66 cache
->time_list
.prev
,
69 fprintf(stderr
, " oldest cache time: %ld\n",
70 (long)first
->free_time
);
71 fprintf(stderr
, " newest cache time: %ld\n",
72 (long)last
->free_time
);
75 clock_gettime(CLOCK_MONOTONIC
, &time
);
76 fprintf(stderr
, " now: %ld\n",
82 vc4_bo_remove_from_cache(struct vc4_bo_cache
*cache
, struct vc4_bo
*bo
)
84 list_del(&bo
->time_list
);
85 list_del(&bo
->size_list
);
87 cache
->bo_size
-= bo
->size
;
90 static struct vc4_bo
*
91 vc4_bo_from_cache(struct vc4_screen
*screen
, uint32_t size
, const char *name
)
93 struct vc4_bo_cache
*cache
= &screen
->bo_cache
;
94 uint32_t page_index
= size
/ 4096 - 1;
96 if (cache
->size_list_size
<= page_index
)
99 struct vc4_bo
*bo
= NULL
;
100 pipe_mutex_lock(cache
->lock
);
101 if (!list_empty(&cache
->size_list
[page_index
])) {
102 bo
= LIST_ENTRY(struct vc4_bo
, cache
->size_list
[page_index
].next
,
105 /* Check that the BO has gone idle. If not, then we want to
106 * allocate something new instead, since we assume that the
107 * user will proceed to CPU map it and fill it with stuff.
109 if (!vc4_bo_wait(bo
, 0, NULL
)) {
110 pipe_mutex_unlock(cache
->lock
);
114 pipe_reference_init(&bo
->reference
, 1);
115 vc4_bo_remove_from_cache(cache
, bo
);
119 pipe_mutex_unlock(cache
->lock
);
124 vc4_bo_alloc(struct vc4_screen
*screen
, uint32_t size
, const char *name
)
129 size
= align(size
, 4096);
131 bo
= vc4_bo_from_cache(screen
, size
, name
);
134 fprintf(stderr
, "Allocated %s %dkb from cache:\n",
136 vc4_bo_dump_stats(screen
);
141 bo
= CALLOC_STRUCT(vc4_bo
);
145 pipe_reference_init(&bo
->reference
, 1);
151 bool cleared_and_retried
= false;
153 if (!using_vc4_simulator
) {
154 struct drm_vc4_create_bo create
;
155 memset(&create
, 0, sizeof(create
));
159 ret
= drmIoctl(screen
->fd
, DRM_IOCTL_VC4_CREATE_BO
, &create
);
160 bo
->handle
= create
.handle
;
162 struct drm_mode_create_dumb create
;
163 memset(&create
, 0, sizeof(create
));
167 create
.height
= (size
+ 127) / 128;
169 ret
= drmIoctl(screen
->fd
, DRM_IOCTL_MODE_CREATE_DUMB
, &create
);
170 bo
->handle
= create
.handle
;
171 assert(create
.size
>= size
);
174 if (!list_empty(&screen
->bo_cache
.time_list
) &&
175 !cleared_and_retried
) {
176 cleared_and_retried
= true;
177 vc4_bo_cache_free_all(&screen
->bo_cache
);
186 screen
->bo_size
+= bo
->size
;
188 fprintf(stderr
, "Allocated %s %dkb:\n", name
, size
/ 1024);
189 vc4_bo_dump_stats(screen
);
196 vc4_bo_last_unreference(struct vc4_bo
*bo
)
198 struct vc4_screen
*screen
= bo
->screen
;
200 struct timespec time
;
201 clock_gettime(CLOCK_MONOTONIC
, &time
);
202 pipe_mutex_lock(screen
->bo_cache
.lock
);
203 vc4_bo_last_unreference_locked_timed(bo
, time
.tv_sec
);
204 pipe_mutex_unlock(screen
->bo_cache
.lock
);
208 vc4_bo_free(struct vc4_bo
*bo
)
210 struct vc4_screen
*screen
= bo
->screen
;
213 #ifdef USE_VC4_SIMULATOR
214 if (bo
->simulator_winsys_map
) {
216 bo
->map
= bo
->simulator_winsys_map
;
219 munmap(bo
->map
, bo
->size
);
220 VG(VALGRIND_FREELIKE_BLOCK(bo
->map
, 0));
223 struct drm_gem_close c
;
224 memset(&c
, 0, sizeof(c
));
225 c
.handle
= bo
->handle
;
226 int ret
= drmIoctl(screen
->fd
, DRM_IOCTL_GEM_CLOSE
, &c
);
228 fprintf(stderr
, "close object %d: %s\n", bo
->handle
, strerror(errno
));
231 screen
->bo_size
-= bo
->size
;
234 fprintf(stderr
, "Freed %s%s%dkb:\n",
235 bo
->name
? bo
->name
: "",
238 vc4_bo_dump_stats(screen
);
245 free_stale_bos(struct vc4_screen
*screen
, time_t time
)
247 struct vc4_bo_cache
*cache
= &screen
->bo_cache
;
248 bool freed_any
= false;
250 list_for_each_entry_safe(struct vc4_bo
, bo
, &cache
->time_list
,
252 if (dump_stats
&& !freed_any
) {
253 fprintf(stderr
, "Freeing stale BOs:\n");
254 vc4_bo_dump_stats(screen
);
258 /* If it's more than a second old, free it. */
259 if (time
- bo
->free_time
> 2) {
260 vc4_bo_remove_from_cache(cache
, bo
);
267 if (dump_stats
&& freed_any
) {
268 fprintf(stderr
, "Freed stale BOs:\n");
269 vc4_bo_dump_stats(screen
);
274 vc4_bo_cache_free_all(struct vc4_bo_cache
*cache
)
276 pipe_mutex_lock(cache
->lock
);
277 list_for_each_entry_safe(struct vc4_bo
, bo
, &cache
->time_list
,
279 vc4_bo_remove_from_cache(cache
, bo
);
282 pipe_mutex_unlock(cache
->lock
);
286 vc4_bo_last_unreference_locked_timed(struct vc4_bo
*bo
, time_t time
)
288 struct vc4_screen
*screen
= bo
->screen
;
289 struct vc4_bo_cache
*cache
= &screen
->bo_cache
;
290 uint32_t page_index
= bo
->size
/ 4096 - 1;
297 if (cache
->size_list_size
<= page_index
) {
298 struct list_head
*new_list
=
299 ralloc_array(screen
, struct list_head
, page_index
+ 1);
301 /* Move old list contents over (since the array has moved, and
302 * therefore the pointers to the list heads have to change).
304 for (int i
= 0; i
< cache
->size_list_size
; i
++) {
305 struct list_head
*old_head
= &cache
->size_list
[i
];
306 if (list_empty(old_head
))
307 list_inithead(&new_list
[i
]);
309 new_list
[i
].next
= old_head
->next
;
310 new_list
[i
].prev
= old_head
->prev
;
311 new_list
[i
].next
->prev
= &new_list
[i
];
312 new_list
[i
].prev
->next
= &new_list
[i
];
315 for (int i
= cache
->size_list_size
; i
< page_index
+ 1; i
++)
316 list_inithead(&new_list
[i
]);
318 cache
->size_list
= new_list
;
319 cache
->size_list_size
= page_index
+ 1;
322 bo
->free_time
= time
;
323 list_addtail(&bo
->size_list
, &cache
->size_list
[page_index
]);
324 list_addtail(&bo
->time_list
, &cache
->time_list
);
326 cache
->bo_size
+= bo
->size
;
328 fprintf(stderr
, "Freed %s %dkb to cache:\n",
329 bo
->name
, bo
->size
/ 1024);
330 vc4_bo_dump_stats(screen
);
334 free_stale_bos(screen
, time
);
337 static struct vc4_bo
*
338 vc4_bo_open_handle(struct vc4_screen
*screen
,
339 uint32_t winsys_stride
,
340 uint32_t handle
, uint32_t size
)
346 pipe_mutex_lock(screen
->bo_handles_mutex
);
348 bo
= util_hash_table_get(screen
->bo_handles
, (void*)(uintptr_t)handle
);
350 pipe_reference(NULL
, &bo
->reference
);
354 bo
= CALLOC_STRUCT(vc4_bo
);
355 pipe_reference_init(&bo
->reference
, 1);
362 #ifdef USE_VC4_SIMULATOR
364 bo
->simulator_winsys_map
= bo
->map
;
365 bo
->simulator_winsys_stride
= winsys_stride
;
366 bo
->map
= malloc(bo
->size
);
369 util_hash_table_set(screen
->bo_handles
, (void *)(uintptr_t)handle
, bo
);
372 pipe_mutex_unlock(screen
->bo_handles_mutex
);
377 vc4_bo_open_name(struct vc4_screen
*screen
, uint32_t name
,
378 uint32_t winsys_stride
)
380 struct drm_gem_open o
= {
383 int ret
= drmIoctl(screen
->fd
, DRM_IOCTL_GEM_OPEN
, &o
);
385 fprintf(stderr
, "Failed to open bo %d: %s\n",
386 name
, strerror(errno
));
390 return vc4_bo_open_handle(screen
, winsys_stride
, o
.handle
, o
.size
);
394 vc4_bo_open_dmabuf(struct vc4_screen
*screen
, int fd
, uint32_t winsys_stride
)
397 int ret
= drmPrimeFDToHandle(screen
->fd
, fd
, &handle
);
400 fprintf(stderr
, "Failed to get vc4 handle for dmabuf %d\n", fd
);
404 /* Determine the size of the bo we were handed. */
405 size
= lseek(fd
, 0, SEEK_END
);
407 fprintf(stderr
, "Couldn't get size of dmabuf fd %d.\n", fd
);
411 return vc4_bo_open_handle(screen
, winsys_stride
, handle
, size
);
415 vc4_bo_get_dmabuf(struct vc4_bo
*bo
)
418 int ret
= drmPrimeHandleToFD(bo
->screen
->fd
, bo
->handle
,
421 fprintf(stderr
, "Failed to export gem bo %d to dmabuf\n",
426 pipe_mutex_lock(bo
->screen
->bo_handles_mutex
);
428 util_hash_table_set(bo
->screen
->bo_handles
, (void *)(uintptr_t)bo
->handle
, bo
);
429 pipe_mutex_unlock(bo
->screen
->bo_handles_mutex
);
435 vc4_bo_alloc_shader(struct vc4_screen
*screen
, const void *data
, uint32_t size
)
440 bo
= CALLOC_STRUCT(vc4_bo
);
444 pipe_reference_init(&bo
->reference
, 1);
446 bo
->size
= align(size
, 4096);
448 bo
->private = false; /* Make sure it doesn't go back to the cache. */
450 if (!using_vc4_simulator
) {
451 struct drm_vc4_create_shader_bo create
= {
453 .data
= (uintptr_t)data
,
456 ret
= drmIoctl(screen
->fd
, DRM_IOCTL_VC4_CREATE_SHADER_BO
,
458 bo
->handle
= create
.handle
;
460 struct drm_mode_create_dumb create
;
461 memset(&create
, 0, sizeof(create
));
465 create
.height
= (size
+ 127) / 128;
467 ret
= drmIoctl(screen
->fd
, DRM_IOCTL_MODE_CREATE_DUMB
, &create
);
468 bo
->handle
= create
.handle
;
469 assert(create
.size
>= size
);
472 memcpy(bo
->map
, data
, size
);
475 fprintf(stderr
, "create shader ioctl failure\n");
480 screen
->bo_size
+= bo
->size
;
482 fprintf(stderr
, "Allocated shader %dkb:\n", bo
->size
/ 1024);
483 vc4_bo_dump_stats(screen
);
490 vc4_bo_flink(struct vc4_bo
*bo
, uint32_t *name
)
492 struct drm_gem_flink flink
= {
493 .handle
= bo
->handle
,
495 int ret
= drmIoctl(bo
->screen
->fd
, DRM_IOCTL_GEM_FLINK
, &flink
);
497 fprintf(stderr
, "Failed to flink bo %d: %s\n",
498 bo
->handle
, strerror(errno
));
509 static int vc4_wait_seqno_ioctl(int fd
, uint64_t seqno
, uint64_t timeout_ns
)
511 if (using_vc4_simulator
)
514 struct drm_vc4_wait_seqno wait
= {
516 .timeout_ns
= timeout_ns
,
518 int ret
= drmIoctl(fd
, DRM_IOCTL_VC4_WAIT_SEQNO
, &wait
);
527 vc4_wait_seqno(struct vc4_screen
*screen
, uint64_t seqno
, uint64_t timeout_ns
,
530 if (screen
->finished_seqno
>= seqno
)
533 if (unlikely(vc4_debug
& VC4_DEBUG_PERF
) && timeout_ns
&& reason
) {
534 if (vc4_wait_seqno_ioctl(screen
->fd
, seqno
, 0) == -ETIME
) {
535 fprintf(stderr
, "Blocking on seqno %lld for %s\n",
536 (long long)seqno
, reason
);
540 int ret
= vc4_wait_seqno_ioctl(screen
->fd
, seqno
, timeout_ns
);
543 fprintf(stderr
, "wait failed: %d\n", ret
);
550 screen
->finished_seqno
= seqno
;
554 static int vc4_wait_bo_ioctl(int fd
, uint32_t handle
, uint64_t timeout_ns
)
556 if (using_vc4_simulator
)
559 struct drm_vc4_wait_bo wait
= {
561 .timeout_ns
= timeout_ns
,
563 int ret
= drmIoctl(fd
, DRM_IOCTL_VC4_WAIT_BO
, &wait
);
572 vc4_bo_wait(struct vc4_bo
*bo
, uint64_t timeout_ns
, const char *reason
)
574 struct vc4_screen
*screen
= bo
->screen
;
576 if (unlikely(vc4_debug
& VC4_DEBUG_PERF
) && timeout_ns
&& reason
) {
577 if (vc4_wait_bo_ioctl(screen
->fd
, bo
->handle
, 0) == -ETIME
) {
578 fprintf(stderr
, "Blocking on %s BO for %s\n",
583 int ret
= vc4_wait_bo_ioctl(screen
->fd
, bo
->handle
, timeout_ns
);
586 fprintf(stderr
, "wait failed: %d\n", ret
);
597 vc4_bo_map_unsynchronized(struct vc4_bo
*bo
)
605 if (!using_vc4_simulator
) {
606 struct drm_vc4_mmap_bo map
;
607 memset(&map
, 0, sizeof(map
));
608 map
.handle
= bo
->handle
;
609 ret
= drmIoctl(bo
->screen
->fd
, DRM_IOCTL_VC4_MMAP_BO
, &map
);
612 struct drm_mode_map_dumb map
;
613 memset(&map
, 0, sizeof(map
));
614 map
.handle
= bo
->handle
;
615 ret
= drmIoctl(bo
->screen
->fd
, DRM_IOCTL_MODE_MAP_DUMB
, &map
);
619 fprintf(stderr
, "map ioctl failure\n");
623 bo
->map
= mmap(NULL
, bo
->size
, PROT_READ
| PROT_WRITE
, MAP_SHARED
,
624 bo
->screen
->fd
, offset
);
625 if (bo
->map
== MAP_FAILED
) {
626 fprintf(stderr
, "mmap of bo %d (offset 0x%016llx, size %d) failed\n",
627 bo
->handle
, (long long)offset
, bo
->size
);
630 VG(VALGRIND_MALLOCLIKE_BLOCK(bo
->map
, bo
->size
, 0, false));
636 vc4_bo_map(struct vc4_bo
*bo
)
638 void *map
= vc4_bo_map_unsynchronized(bo
);
640 bool ok
= vc4_bo_wait(bo
, PIPE_TIMEOUT_INFINITE
, "bo map");
642 fprintf(stderr
, "BO wait for map failed\n");
650 vc4_bufmgr_destroy(struct pipe_screen
*pscreen
)
652 struct vc4_screen
*screen
= vc4_screen(pscreen
);
653 struct vc4_bo_cache
*cache
= &screen
->bo_cache
;
655 vc4_bo_cache_free_all(cache
);
658 fprintf(stderr
, "BO stats after screen destroy:\n");
659 vc4_bo_dump_stats(screen
);