#include "drm-uapi/lima_drm.h"
#include "util/u_hash_table.h"
+#include "util/u_math.h"
#include "util/os_time.h"
#include "os/os_mman.h"
#include "lima_screen.h"
#include "lima_bo.h"
+#include "lima_util.h"
#define PTR_TO_UINT(x) ((unsigned)((intptr_t)(x)))
return false;
}
+bool lima_bo_cache_init(struct lima_screen *screen)
+{
+ mtx_init(&screen->bo_cache_lock, mtx_plain);
+ list_inithead(&screen->bo_cache_time);
+ for (int i = 0; i < NR_BO_CACHE_BUCKETS; i++)
+ list_inithead(&screen->bo_cache_buckets[i]);
+
+ return true;
+}
+
void lima_bo_table_fini(struct lima_screen *screen)
{
mtx_destroy(&screen->bo_table_lock);
util_hash_table_destroy(screen->bo_flink_names);
}
+static void
+lima_bo_cache_remove(struct lima_bo *bo)
+{
+ list_del(&bo->size_list);
+ list_del(&bo->time_list);
+}
+
static void lima_close_kms_handle(struct lima_screen *screen, uint32_t handle)
{
struct drm_gem_close args = {
drmIoctl(screen->fd, DRM_IOCTL_GEM_CLOSE, &args);
}
+static void
+lima_bo_free(struct lima_bo *bo)
+{
+ struct lima_screen *screen = bo->screen;
+ mtx_lock(&screen->bo_table_lock);
+ util_hash_table_remove(screen->bo_handles,
+ (void *)(uintptr_t)bo->handle);
+ if (bo->flink_name)
+ util_hash_table_remove(screen->bo_flink_names,
+ (void *)(uintptr_t)bo->flink_name);
+ mtx_unlock(&screen->bo_table_lock);
+
+ if (bo->map)
+ lima_bo_unmap(bo);
+
+ lima_close_kms_handle(screen, bo->handle);
+ free(bo);
+}
+
+void lima_bo_cache_fini(struct lima_screen *screen)
+{
+ mtx_destroy(&screen->bo_cache_lock);
+
+ list_for_each_entry_safe(struct lima_bo, entry,
+ &screen->bo_cache_time, time_list) {
+ lima_bo_cache_remove(entry);
+ lima_bo_free(entry);
+ }
+}
+
static bool lima_bo_get_info(struct lima_bo *bo)
{
struct drm_lima_gem_info req = {
return true;
}
+static unsigned
+lima_bucket_index(unsigned size)
+{
+ /* Round down to POT to compute a bucket index */
+
+ unsigned bucket_index = util_logbase2(size);
+
+ /* Clamp the bucket index; all huge allocations will be
+ * sorted into the largest bucket */
+ bucket_index = CLAMP(bucket_index, MIN_BO_CACHE_BUCKET,
+ MAX_BO_CACHE_BUCKET);
+
+ /* Reindex from 0 */
+ return (bucket_index - MIN_BO_CACHE_BUCKET);
+}
+
+static struct list_head *
+lima_bo_cache_get_bucket(struct lima_screen *screen, unsigned size)
+{
+ return &screen->bo_cache_buckets[lima_bucket_index(size)];
+}
+
+static void
+lima_bo_cache_free_stale_bos(struct lima_screen *screen, time_t time)
+{
+ list_for_each_entry_safe(struct lima_bo, entry,
+ &screen->bo_cache_time, time_list) {
+ /* Free BOs that are sitting idle for longer than 5 seconds */
+ if (time - entry->free_time > 6) {
+ lima_bo_cache_remove(entry);
+ lima_bo_free(entry);
+ } else
+ break;
+ }
+}
+
+static bool
+lima_bo_cache_put(struct lima_bo *bo)
+{
+ if (!bo->cacheable)
+ return false;
+
+ struct lima_screen *screen = bo->screen;
+
+ mtx_lock(&screen->bo_cache_lock);
+ struct list_head *bucket = lima_bo_cache_get_bucket(screen, bo->size);
+
+ if (!bucket) {
+ mtx_unlock(&screen->bo_cache_lock);
+ return false;
+ }
+
+ struct timespec time;
+ clock_gettime(CLOCK_MONOTONIC, &time);
+ bo->free_time = time.tv_sec;
+ list_addtail(&bo->size_list, bucket);
+ list_addtail(&bo->time_list, &screen->bo_cache_time);
+ lima_bo_cache_free_stale_bos(screen, time.tv_sec);
+ mtx_unlock(&screen->bo_cache_lock);
+
+ return true;
+}
+
+static struct lima_bo *
+lima_bo_cache_get(struct lima_screen *screen, uint32_t size, uint32_t flags)
+{
+ struct lima_bo *bo = NULL;
+ mtx_lock(&screen->bo_cache_lock);
+ struct list_head *bucket = lima_bo_cache_get_bucket(screen, size);
+
+ if (!bucket) {
+ mtx_unlock(&screen->bo_cache_lock);
+ return false;
+ }
+
+ list_for_each_entry_safe(struct lima_bo, entry, bucket, size_list) {
+ if (entry->size >= size &&
+ entry->flags == flags) {
+ /* Check if BO is idle. If it's not it's better to allocate new one */
+ if (!lima_bo_wait(entry, LIMA_GEM_WAIT_WRITE, 0))
+ break;
+
+ lima_bo_cache_remove(entry);
+ p_atomic_set(&entry->refcnt, 1);
+ bo = entry;
+ break;
+ }
+ }
+
+ mtx_unlock(&screen->bo_cache_lock);
+
+ return bo;
+}
+
struct lima_bo *lima_bo_create(struct lima_screen *screen,
uint32_t size, uint32_t flags)
{
struct lima_bo *bo;
+
+ /* Try to get bo from cache first */
+ bo = lima_bo_cache_get(screen, size, flags);
+ if (bo)
+ return bo;
+
+ size = align(size, LIMA_PAGE_SIZE);
+
struct drm_lima_gem_create req = {
.size = size,
.flags = flags,
if (!(bo = calloc(1, sizeof(*bo))))
return NULL;
+ list_inithead(&bo->time_list);
+ list_inithead(&bo->size_list);
+
if (drmIoctl(screen->fd, DRM_IOCTL_LIMA_GEM_CREATE, &req))
goto err_out0;
bo->screen = screen;
bo->size = req.size;
+ bo->flags = req.flags;
bo->handle = req.handle;
+ bo->cacheable = !(lima_debug & LIMA_DEBUG_NO_BO_CACHE);
p_atomic_set(&bo->refcnt, 1);
if (!lima_bo_get_info(bo))
return NULL;
}
-void lima_bo_free(struct lima_bo *bo)
+void lima_bo_unreference(struct lima_bo *bo)
{
if (!p_atomic_dec_zero(&bo->refcnt))
return;
- struct lima_screen *screen = bo->screen;
- mtx_lock(&screen->bo_table_lock);
- util_hash_table_remove(screen->bo_handles,
- (void *)(uintptr_t)bo->handle);
- if (bo->flink_name)
- util_hash_table_remove(screen->bo_flink_names,
- (void *)(uintptr_t)bo->flink_name);
- mtx_unlock(&screen->bo_table_lock);
-
- if (bo->map)
- lima_bo_unmap(bo);
+ /* Try to put it into cache */
+ if (lima_bo_cache_put(bo))
+ return;
- lima_close_kms_handle(screen, bo->handle);
- free(bo);
+ lima_bo_free(bo);
}
void *lima_bo_map(struct lima_bo *bo)
{
struct lima_screen *screen = bo->screen;
+ /* Don't cache exported BOs */
+ bo->cacheable = false;
+
switch (handle->type) {
case WINSYS_HANDLE_TYPE_SHARED:
if (!bo->flink_name) {
if (bo) {
p_atomic_inc(&bo->refcnt);
+ /* Don't cache imported BOs */
+ bo->cacheable = false;
mtx_unlock(&screen->bo_table_lock);
return bo;
}
return NULL;
}
+ /* Don't cache imported BOs */
+ bo->cacheable = false;
+ list_inithead(&bo->time_list);
+ list_inithead(&bo->size_list);
bo->screen = screen;
p_atomic_set(&bo->refcnt, 1);
free(screen->ro);
if (screen->pp_buffer)
- lima_bo_free(screen->pp_buffer);
+ lima_bo_unreference(screen->pp_buffer);
+ lima_bo_cache_fini(screen);
lima_bo_table_fini(screen);
ralloc_free(screen);
}
"dump GPU command stream to $PWD/lima.dump" },
{ "shaderdb", LIMA_DEBUG_SHADERDB,
"print shader information for shaderdb" },
+ { "nobocache", LIMA_DEBUG_NO_BO_CACHE,
+ "disable BO cache" },
{ NULL }
};
if (!lima_screen_query_info(screen))
goto err_out0;
- if (!lima_bo_table_init(screen))
+ if (!lima_bo_cache_init(screen))
goto err_out0;
+ if (!lima_bo_table_init(screen))
+ goto err_out1;
+
screen->pp_ra = ppir_regalloc_init(screen);
if (!screen->pp_ra)
- goto err_out1;
+ goto err_out2;
screen->pp_buffer = lima_bo_create(screen, pp_buffer_size, 0);
if (!screen->pp_buffer)
- goto err_out1;
+ goto err_out2;
+ screen->pp_buffer->cacheable = false;
/* fs program for clear buffer?
* const0 1 0 0 -1.67773, mov.v0 $0 ^const0.xxxx, stop
screen->ro = renderonly_dup(ro);
if (!screen->ro) {
fprintf(stderr, "Failed to dup renderonly object\n");
- goto err_out2;
+ goto err_out3;
}
}
return &screen->base;
+err_out3:
+ lima_bo_unreference(screen->pp_buffer);
err_out2:
- lima_bo_free(screen->pp_buffer);
-err_out1:
lima_bo_table_fini(screen);
+err_out1:
+ lima_bo_cache_fini(screen);
err_out0:
ralloc_free(screen);
return NULL;