gallium: add PIPE_SHADER_CAP_GLSL_16BIT_TEMPS for LowerPrecisionTemporaries

[mesa.git] / src / gallium / drivers / svga / svga_screen_cache.c
diff --git a/src/gallium/drivers/svga/svga_screen_cache.c b/src/gallium/drivers/svga/svga_screen_cache.c

index 4344a87348c9737a743fbb08c2c6d4255deb0a9d..aba6e304fbdec86e679d22d099aeed40ef70d5cb 100644 (file)
--- a/src/gallium/drivers/svga/svga_screen_cache.c
+++ b/src/gallium/drivers/svga/svga_screen_cache.c
@@ -25,14 +25,15 @@
  
  #include "util/u_math.h"
  #include "util/u_memory.h"
-#include "util/u_hash.h"
+#include "util/crc32.h"
  
  #include "svga_debug.h"
  #include "svga_format.h"
  #include "svga_winsys.h"
  #include "svga_screen.h"
  #include "svga_screen_cache.h"
-
+#include "svga_context.h"
+#include "svga_cmd.h"
  
  #define SVGA_SURFACE_CACHE_ENABLED 1
  
@@ -40,13 +41,14 @@
  /**
   * Return the size of the surface described by the key (in bytes).
   */
-static unsigned
-surface_size(const struct svga_host_surface_cache_key *key)
+unsigned
+svga_surface_size(const struct svga_host_surface_cache_key *key)
  {
     unsigned bw, bh, bpb, total_size, i;
  
     assert(key->numMipLevels > 0);
     assert(key->numFaces > 0);
+   assert(key->arraySize > 0);
  
     if (key->format == SVGA3D_BUFFER) {
        /* Special case: we don't want to count vertex/index buffers
@@ -67,7 +69,7 @@ surface_size(const struct svga_host_surface_cache_key *key)
        total_size += img_size;
     }
  
-   total_size *= key->numFaces;
+   total_size *= key->numFaces * key->arraySize * MAX2(1, key->sampleCount);
  
     return total_size;
  }
@@ -104,7 +106,7 @@ svga_screen_cache_lookup(struct svga_screen *svgascreen,
  
     bucket = svga_screen_cache_bucket(key);
  
-   pipe_mutex_lock(cache->mutex);
+   mtx_lock(&cache->mutex);
  
     curr = cache->bucket[bucket].next;
     next = curr->next;
@@ -131,16 +133,16 @@ svga_screen_cache_lookup(struct svga_screen *svgascreen,
           entry->handle = NULL;
  
           /* Remove from hash table */
-         LIST_DEL(&entry->bucket_head);
+         list_del(&entry->bucket_head);
  
           /* remove from LRU list */
-         LIST_DEL(&entry->head);
+         list_del(&entry->head);
  
           /* Add the cache entry (but not the surface!) to the empty list */
-         LIST_ADD(&entry->head, &cache->empty);
+         list_add(&entry->head, &cache->empty);
  
           /* update the cache size */
-         surf_size = surface_size(&entry->key);
+         surf_size = svga_surface_size(&entry->key);
           assert(surf_size <= cache->total_size);
           if (surf_size > cache->total_size)
              cache->total_size = 0; /* should never happen, but be safe */
@@ -154,7 +156,7 @@ svga_screen_cache_lookup(struct svga_screen *svgascreen,
        next = curr->next;
     }
  
-   pipe_mutex_unlock(cache->mutex);
+   mtx_unlock(&cache->mutex);
  
     if (SVGA_DEBUG & DEBUG_DMA)
        debug_printf("%s: cache %s after %u tries (bucket %d)\n", __FUNCTION__,
@@ -185,14 +187,14 @@ svga_screen_cache_shrink(struct svga_screen *svgascreen,
        if (entry->key.format != SVGA3D_BUFFER) {
           /* we don't want to discard vertex/index buffers */
  
-         cache->total_size -= surface_size(&entry->key);
+         cache->total_size -= svga_surface_size(&entry->key);
  
           assert(entry->handle);
           sws->surface_reference(sws, &entry->handle, NULL);
  
-         LIST_DEL(&entry->bucket_head);
-         LIST_DEL(&entry->head);
-         LIST_ADD(&entry->head, &cache->empty);
+         list_del(&entry->bucket_head);
+         list_del(&entry->head);
+         list_add(&entry->head, &cache->empty);
  
           if (cache->total_size <= target_size) {
              /* all done */
@@ -223,15 +225,15 @@ svga_screen_cache_add(struct svga_screen *svgascreen,
     if (!handle)
        return;
  
-   surf_size = surface_size(key);
+   surf_size = svga_surface_size(key);
  
     *p_handle = NULL;
-   pipe_mutex_lock(cache->mutex);
+   mtx_lock(&cache->mutex);
  
     if (surf_size >= SVGA_HOST_SURFACE_CACHE_BYTES) {
        /* this surface is too large to cache, just free it */
        sws->surface_reference(sws, &handle, NULL);
-      pipe_mutex_unlock(cache->mutex);
+      mtx_unlock(&cache->mutex);
        return;
     }
  
@@ -249,12 +251,12 @@ svga_screen_cache_add(struct svga_screen *svgascreen,
            * just discard this surface.
            */
           sws->surface_reference(sws, &handle, NULL);
-         pipe_mutex_unlock(cache->mutex);
+         mtx_unlock(&cache->mutex);
           return;
        }
     }
  
-   if (!LIST_IS_EMPTY(&cache->empty)) {
+   if (!list_is_empty(&cache->empty)) {
        /* An empty entry has no surface associated with it.
         * Use the first empty entry.
         */
@@ -262,24 +264,24 @@ svga_screen_cache_add(struct svga_screen *svgascreen,
                           cache->empty.next, head);
  
        /* Remove from LRU list */
-      LIST_DEL(&entry->head);
+      list_del(&entry->head);
     }
-   else if (!LIST_IS_EMPTY(&cache->unused)) {
+   else if (!list_is_empty(&cache->unused)) {
        /* free the last used buffer and reuse its entry */
        entry = LIST_ENTRY(struct svga_host_surface_cache_entry,
                           cache->unused.prev, head);
        SVGA_DBG(DEBUG_CACHE|DEBUG_DMA,
                 "unref sid %p (make space)\n", entry->handle);
  
-      cache->total_size -= surface_size(&entry->key);
+      cache->total_size -= svga_surface_size(&entry->key);
  
        sws->surface_reference(sws, &entry->handle, NULL);
  
        /* Remove from hash table */
-      LIST_DEL(&entry->bucket_head);
+      list_del(&entry->bucket_head);
  
        /* Remove from LRU list */
-      LIST_DEL(&entry->head);
+      list_del(&entry->head);
     }
  
     if (entry) {
@@ -289,7 +291,12 @@ svga_screen_cache_add(struct svga_screen *svgascreen,
  
        SVGA_DBG(DEBUG_CACHE|DEBUG_DMA,
                 "cache sid %p\n", entry->handle);
-      LIST_ADD(&entry->head, &cache->validated);
+
+      /* If we don't have gb objects, we don't need to invalidate. */
+      if (sws->have_gb_objects)
+         list_add(&entry->head, &cache->validated);
+      else
+         list_add(&entry->head, &cache->invalidated);
  
        cache->total_size += surf_size;
     }
@@ -300,16 +307,20 @@ svga_screen_cache_add(struct svga_screen *svgascreen,
        sws->surface_reference(sws, &handle, NULL);
     }
  
-   pipe_mutex_unlock(cache->mutex);
+   mtx_unlock(&cache->mutex);
  }
  
  
+/* Maximum number of invalidate surface commands in a command buffer */
+# define SVGA_MAX_SURFACE_TO_INVALIDATE 1000
+
  /**
   * Called during the screen flush to move all buffers not in a validate list
   * into the unused list.
   */
  void
  svga_screen_cache_flush(struct svga_screen *svgascreen,
+                        struct svga_context *svga,
                          struct pipe_fence_handle *fence)
  {
     struct svga_host_surface_cache *cache = &svgascreen->cache;
@@ -318,7 +329,7 @@ svga_screen_cache_flush(struct svga_screen *svgascreen,
     struct list_head *curr, *next;
     unsigned bucket;
  
-   pipe_mutex_lock(cache->mutex);
+   mtx_lock(&cache->mutex);
  
     /* Loop over entries in the invalidated list */
     curr = cache->invalidated.next;
@@ -330,45 +341,79 @@ svga_screen_cache_flush(struct svga_screen *svgascreen,
  
        if (sws->surface_is_flushed(sws, entry->handle)) {
           /* remove entry from the invalidated list */
-         LIST_DEL(&entry->head);
+         list_del(&entry->head);
  
-         svgascreen->sws->fence_reference(svgascreen->sws, &entry->fence, fence);
+         sws->fence_reference(sws, &entry->fence, fence);
  
           /* Add entry to the unused list */
-         LIST_ADD(&entry->head, &cache->unused);
+         list_add(&entry->head, &cache->unused);
  
           /* Add entry to the hash table bucket */
           bucket = svga_screen_cache_bucket(&entry->key);
-         LIST_ADD(&entry->bucket_head, &cache->bucket[bucket]);
+         list_add(&entry->bucket_head, &cache->bucket[bucket]);
        }
  
        curr = next;
        next = curr->next;
     }
  
+   unsigned nsurf = 0;
     curr = cache->validated.next;
     next = curr->next;
     while (curr != &cache->validated) {
        entry = LIST_ENTRY(struct svga_host_surface_cache_entry, curr, head);
  
        assert(entry->handle);
+      assert(svga_have_gb_objects(svga));
  
        if (sws->surface_is_flushed(sws, entry->handle)) {
           /* remove entry from the validated list */
-         LIST_DEL(&entry->head);
+         list_del(&entry->head);
  
-         /* it is now safe to invalidate the surface content. */
-         sws->surface_invalidate(sws, entry->handle);
+         /* It is now safe to invalidate the surface content.
+          * It will be done using the current context.
+          */
+         if (SVGA_TRY(SVGA3D_InvalidateGBSurface(svga->swc, entry->handle))
+             != PIPE_OK) {
+            ASSERTED enum pipe_error ret;
+
+            /* Even though surface invalidation here is done after the command
+             * buffer is flushed, it is still possible for it to fail:
+             * the invalidate commands emitted so far in this loop may by
+             * themselves have filled up the command buffer. In that case
+             * we call the winsys flush directly to flush the buffer.
+             * Note, we don't want to call svga_context_flush() here because
+             * this function itself is called inside svga_context_flush().
+             */
+            svga_retry_enter(svga);
+            svga->swc->flush(svga->swc, NULL);
+            nsurf = 0;
+            ret = SVGA3D_InvalidateGBSurface(svga->swc, entry->handle);
+            svga_retry_exit(svga);
+            assert(ret == PIPE_OK);
+         }
  
           /* add the entry to the invalidated list */
-         LIST_ADD(&entry->head, &cache->invalidated);
+
+         list_add(&entry->head, &cache->invalidated);
+         nsurf++;
        }
  
        curr = next;
        next = curr->next;
     }
  
-   pipe_mutex_unlock(cache->mutex);
+   mtx_unlock(&cache->mutex);
+
+   /**
+    * In some rare cases (when running ARK survival), we hit the max number
+    * of surface relocations with invalidated surfaces during context flush.
+    * So if the number of invalidated surfaces exceeds a certain limit (1000),
+    * we'll do another winsys flush.
+    */
+   if (nsurf > SVGA_MAX_SURFACE_TO_INVALIDATE) {
+      svga->swc->flush(svga->swc, NULL);
+   }
  }
  
  
@@ -389,15 +434,14 @@ svga_screen_cache_cleanup(struct svga_screen *svgascreen)
                    "unref sid %p (shutdown)\n", cache->entries[i].handle);
          sws->surface_reference(sws, &cache->entries[i].handle, NULL);
  
-         cache->total_size -= surface_size(&cache->entries[i].key);
+         cache->total_size -= svga_surface_size(&cache->entries[i].key);
        }
  
        if (cache->entries[i].fence)
-         svgascreen->sws->fence_reference(svgascreen->sws,
-                                          &cache->entries[i].fence, NULL);
+         sws->fence_reference(sws, &cache->entries[i].fence, NULL);
     }
  
-   pipe_mutex_destroy(cache->mutex);
+   mtx_destroy(&cache->mutex);
  }
  
  
@@ -409,20 +453,20 @@ svga_screen_cache_init(struct svga_screen *svgascreen)
  
     assert(cache->total_size == 0);
  
-   pipe_mutex_init(cache->mutex);
+   (void) mtx_init(&cache->mutex, mtx_plain);
  
     for (i = 0; i < SVGA_HOST_SURFACE_CACHE_BUCKETS; ++i)
-      LIST_INITHEAD(&cache->bucket[i]);
+      list_inithead(&cache->bucket[i]);
  
-   LIST_INITHEAD(&cache->unused);
+   list_inithead(&cache->unused);
  
-   LIST_INITHEAD(&cache->validated);
+   list_inithead(&cache->validated);
  
-   LIST_INITHEAD(&cache->invalidated);
+   list_inithead(&cache->invalidated);
  
-   LIST_INITHEAD(&cache->empty);
+   list_inithead(&cache->empty);
     for (i = 0; i < SVGA_HOST_SURFACE_CACHE_SIZE; ++i)
-      LIST_ADDTAIL(&cache->entries[i].head, &cache->empty);
+      list_addtail(&cache->entries[i].head, &cache->empty);
  
     return PIPE_OK;
  }
@@ -434,10 +478,12 @@ svga_screen_cache_init(struct svga_screen *svgascreen)
   * allocate a new surface.
   * \param bind_flags  bitmask of PIPE_BIND_x flags
   * \param usage  one of PIPE_USAGE_x values
+ * \param validated  set to TRUE if the returned surface was recycled from the cache, FALSE if it was newly allocated
   */
  struct svga_winsys_surface *
  svga_screen_surface_create(struct svga_screen *svgascreen,
                             unsigned bind_flags, enum pipe_resource_usage usage,
+                           boolean *validated,
                             struct svga_host_surface_cache_key *key)
  {
     struct svga_winsys_screen *sws = svgascreen->sws;
@@ -456,8 +502,9 @@ svga_screen_surface_create(struct svga_screen *svgascreen,
              key->cachable);
  
     if (cachable) {
+      /* Try to re-cycle a previously freed, cached surface */
        if (key->format == SVGA3D_BUFFER) {
-         SVGA3dSurfaceFlags hint_flag;
+         SVGA3dSurfaceAllFlags hint_flag;
  
           /* For buffers, round the buffer size up to the nearest power
            * of two to increase the probability of cache hits.  Keep
@@ -511,16 +558,20 @@ svga_screen_surface_create(struct svga_screen *svgascreen,
                       key->numMipLevels,
                       key->numFaces,
                       key->arraySize);
+         *validated = TRUE;
        }
     }
  
     if (!handle) {
+      /* Unable to recycle surface, allocate a new one */
        unsigned usage = 0;
  
        if (!key->cachable)
           usage |= SVGA_SURFACE_USAGE_SHARED;
        if (key->scanout)
           usage |= SVGA_SURFACE_USAGE_SCANOUT;
+      if (key->coherent)
+         usage |= SVGA_SURFACE_USAGE_COHERENT;
  
        handle = sws->surface_create(sws,
                                     key->flags,
@@ -537,6 +588,8 @@ svga_screen_surface_create(struct svga_screen *svgascreen,
                    key->size.width,
                    key->size.height,
                    key->size.depth);
+
+      *validated = FALSE;
     }
  
     return handle;
@@ -559,11 +612,6 @@ svga_screen_surface_destroy(struct svga_screen *svgascreen,
      * that case.
      */
     if (SVGA_SURFACE_CACHE_ENABLED && key->cachable) {
-
-      /* Invalidate the surface before putting it into the recycle pool */
-      if (key->format != SVGA3D_BUFFER)
-         sws->surface_invalidate(sws, *p_handle);
-
        svga_screen_cache_add(svgascreen, key, p_handle);
     }
     else {