Since almost all BOs (buffer objects) will be in one CL (command list) at a
time, this cache will almost always hit, except for the first use of the BO
in each CL.
This didn't show up as statistically significant on the minetest trace
(n=340), but if I lop off the throttled lobe of the bimodal distribution,
the improvement is very clearly significant (0.74731% +/- 0.162093%,
n=269).
        uint32_t handle;
        uint32_t size;
+       /* This will be read/written by multiple threads without a lock -- you
+        * should take a snapshot and use it to see if you happen to be in the
+        * CL's handles at this position, to make most lookups O(1). It's
+        * volatile to make sure that the compiler doesn't emit multiple loads
+        * from the address, which would make the lookup racy.
+        */
+       volatile uint32_t last_hindex;
+
        /** Entry in the linked list of buffers freed, by age. */
        struct list_head time_list;
        /** Entry in the per-page-count linked list of buffers freed (by age). */
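
The comment on last_hindex describes the lockless snapshot idiom briefly;
the following standalone sketch spells it out (shared_index, hit_racy, and
hit_snapshot are hypothetical names, not driver code). Reading the shared
index twice lets another thread change it between the bounds check and the
array access; copying it into a local first guarantees both use the same
value.

#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

static volatile uint32_t shared_index; /* stands in for bo->last_hindex */

/* RACY: two reads of the shared index.  Another thread can change it
 * between the bounds check and the array access, so the check no longer
 * protects the access. */
static bool
hit_racy(const uint32_t *handles, uint32_t count, uint32_t handle)
{
        return shared_index < count && handles[shared_index] == handle;
}

/* SAFE: one read into a local snapshot; the bounds check and the array
 * access are guaranteed to see the same value. */
static bool
hit_snapshot(const uint32_t *handles, uint32_t count, uint32_t handle)
{
        uint32_t snap = shared_index;
        return snap < count && handles[snap] == handle;
}

int
main(void)
{
        uint32_t handles[] = { 7, 42, 9 };

        shared_index = 1;
        printf("racy: %d, snapshot: %d\n",
               hit_racy(handles, 3, 42), hit_snapshot(handles, 3, 42));
        return 0;
}

A C11 atomic_load_explicit() with memory_order_relaxed would express the
same single-load intent more explicitly; volatile achieves it here without
pulling in stdatomic.
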
vc4_gem_hindex(struct vc4_job *job, struct vc4_bo *bo)
{
        uint32_t hindex;
        uint32_t *current_handles = job->bo_handles.base;
+       uint32_t cl_hindex_count = cl_offset(&job->bo_handles) / 4;
+       uint32_t last_hindex = bo->last_hindex; /* volatile read! */

-       for (hindex = 0; hindex < cl_offset(&job->bo_handles) / 4; hindex++) {
-               if (current_handles[hindex] == bo->handle)
+       /* Fast path: the cached index still points at this BO's handle. */
+       if (last_hindex < cl_hindex_count &&
+           current_handles[last_hindex] == bo->handle) {
+               return last_hindex;
+       }
+
+       /* Slow path: linear scan, caching the hit for the next lookup. */
+       for (hindex = 0; hindex < cl_hindex_count; hindex++) {
+               if (current_handles[hindex] == bo->handle) {
+                       bo->last_hindex = hindex;
                        return hindex;
+               }
        }

        struct vc4_cl_out *out;

...

        job->bo_space += bo->size;
+       /* The handle was just appended at index hindex; cache that slot. */
+       bo->last_hindex = hindex;
        return hindex;
}
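
Putting it together, here is a self-contained sketch of the same
cached-lookup pattern with simplified stand-ins for the driver types
(fake_bo, fake_job, and hindex_lookup are hypothetical names, not the Mesa
API, and the CL bookkeeping is reduced to a plain array): the first lookup
appends the handle and caches its slot, the second returns in O(1) without
scanning.

#include <assert.h>
#include <stdint.h>
#include <stdio.h>

struct fake_bo {
        uint32_t handle;
        volatile uint32_t last_hindex; /* cached position in the CL */
};

struct fake_job {
        uint32_t handles[64]; /* the CL's GEM handle table */
        uint32_t count;       /* handles currently in the table */
};

static uint32_t
hindex_lookup(struct fake_job *job, struct fake_bo *bo)
{
        uint32_t last = bo->last_hindex; /* snapshot the volatile */

        /* Fast path: the cached index still points at this handle. */
        if (last < job->count && job->handles[last] == bo->handle)
                return last;

        /* Slow path: linear scan, caching the result for next time. */
        for (uint32_t i = 0; i < job->count; i++) {
                if (job->handles[i] == bo->handle) {
                        bo->last_hindex = i;
                        return i;
                }
        }

        /* Not present: append the handle and cache the new slot. */
        assert(job->count < 64);
        job->handles[job->count] = bo->handle;
        bo->last_hindex = job->count;
        return job->count++;
}

int
main(void)
{
        struct fake_job job = { .count = 0 };
        struct fake_bo bo = { .handle = 42, .last_hindex = 0 };

        uint32_t first = hindex_lookup(&job, &bo);  /* appends: slot 0 */
        uint32_t second = hindex_lookup(&job, &bo); /* cache hit */

        assert(first == second && bo.last_hindex == first);
        printf("handle %u at hindex %u\n", bo.handle, first);
        return 0;
}

Note that the cache is only a hint: a stale last_hindex can at worst miss
and fall back to the scan, never return a wrong index, because the snapshot
is re-validated against the current handle table before being trusted.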