amdgpu: use simple mtx
src/gallium/winsys/amdgpu/drm/amdgpu_cs.c
index 0a657f7505d02ba3204815272388ea1bf4e0b270..0f36cc5ae6307f578331b6ff9a967a3ddfd00847 100644
  * next paragraph) shall be included in all copies or substantial portions
  * of the Software.
  */
-/*
- * Authors:
- *      Marek Olšák <maraeo@gmail.com>
- */
 
 #include "amdgpu_cs.h"
 #include "os/os_time.h"
@@ -542,7 +538,7 @@ static int amdgpu_lookup_or_add_sparse_buffer(struct amdgpu_cs *acs,
    /* We delay adding the backing buffers until we really have to. However,
     * we cannot delay accounting for memory use.
     */
-   mtx_lock(&bo->u.sparse.commit_lock);
+   simple_mtx_lock(&bo->u.sparse.commit_lock);
 
    list_for_each_entry(struct amdgpu_sparse_backing, backing, &bo->u.sparse.backing, list) {
       if (bo->initial_domain & RADEON_DOMAIN_VRAM)
@@ -551,7 +547,7 @@ static int amdgpu_lookup_or_add_sparse_buffer(struct amdgpu_cs *acs,
          acs->main.base.used_gart += backing->bo->base.size;
    }
 
-   mtx_unlock(&bo->u.sparse.commit_lock);
+   simple_mtx_unlock(&bo->u.sparse.commit_lock);
 
    return idx;
 }
@@ -616,7 +612,8 @@ static unsigned amdgpu_cs_add_buffer(struct radeon_winsys_cs *rcs,
    return index;
 }
 
-static bool amdgpu_ib_new_buffer(struct amdgpu_winsys *ws, struct amdgpu_ib *ib)
+static bool amdgpu_ib_new_buffer(struct amdgpu_winsys *ws, struct amdgpu_ib *ib,
+                                 enum ring_type ring_type)
 {
    struct pb_buffer *pb;
    uint8_t *mapped;
@@ -646,7 +643,11 @@ static bool amdgpu_ib_new_buffer(struct amdgpu_winsys *ws, struct amdgpu_ib *ib)
    pb = ws->base.buffer_create(&ws->base, buffer_size,
                                ws->info.gart_page_size,
                                RADEON_DOMAIN_GTT,
-                               RADEON_FLAG_NO_INTERPROCESS_SHARING);
+                               RADEON_FLAG_NO_INTERPROCESS_SHARING |
+                               (ring_type == RING_GFX ||
+                                ring_type == RING_COMPUTE ||
+                                ring_type == RING_DMA ?
+                                   RADEON_FLAG_GTT_WC : 0));
    if (!pb)
       return false;
 
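
The IB buffer allocation now receives the ring type so that command buffers written by the CPU for the GFX, compute and SDMA rings are placed in write-combined GTT, while the remaining rings keep plain GTT. A hedged sketch of the same flag selection, factored into a helper purely for readability (the helper name is hypothetical):

/* Hypothetical helper restating the flag choice made above:
 * CPU-written IBs for GFX/compute/SDMA benefit from write-combined
 * GTT; other rings keep the default caching. */
static unsigned ib_buffer_flags(enum ring_type ring_type)
{
   unsigned flags = RADEON_FLAG_NO_INTERPROCESS_SHARING;

   if (ring_type == RING_GFX ||
       ring_type == RING_COMPUTE ||
       ring_type == RING_DMA)
      flags |= RADEON_FLAG_GTT_WC;

   return flags;
}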
@@ -716,7 +717,7 @@ static bool amdgpu_get_new_ib(struct radeon_winsys *ws, struct amdgpu_cs *cs,
    /* Allocate a new buffer for IBs if the current buffer is all used. */
    if (!ib->big_ib_buffer ||
        ib->used_ib_space + ib_size > ib->big_ib_buffer->size) {
-      if (!amdgpu_ib_new_buffer(aws, ib))
+      if (!amdgpu_ib_new_buffer(aws, ib, cs->ring_type))
          return false;
    }
 
@@ -926,7 +927,7 @@ static bool amdgpu_cs_check_space(struct radeon_winsys_cs *rcs, unsigned dw)
       rcs->max_prev = new_max_prev;
    }
 
-   if (!amdgpu_ib_new_buffer(cs->ctx->ws, ib))
+   if (!amdgpu_ib_new_buffer(cs->ctx->ws, ib, cs->ring_type))
       return false;
 
    assert(ib->used_ib_space == 0);
@@ -1145,7 +1146,7 @@ static bool amdgpu_add_sparse_backing_buffers(struct amdgpu_cs_context *cs)
       struct amdgpu_cs_buffer *buffer = &cs->sparse_buffers[i];
       struct amdgpu_winsys_bo *bo = buffer->bo;
 
-      mtx_lock(&bo->u.sparse.commit_lock);
+      simple_mtx_lock(&bo->u.sparse.commit_lock);
 
       list_for_each_entry(struct amdgpu_sparse_backing, backing, &bo->u.sparse.backing, list) {
          /* We can directly add the buffer here, because we know that each
@@ -1154,7 +1155,7 @@ static bool amdgpu_add_sparse_backing_buffers(struct amdgpu_cs_context *cs)
          int idx = amdgpu_do_add_real_buffer(cs, backing->bo);
          if (idx < 0) {
             fprintf(stderr, "%s: failed to add buffer\n", __FUNCTION__);
-            mtx_unlock(&bo->u.sparse.commit_lock);
+            simple_mtx_unlock(&bo->u.sparse.commit_lock);
             return false;
          }
 
@@ -1163,7 +1164,7 @@ static bool amdgpu_add_sparse_backing_buffers(struct amdgpu_cs_context *cs)
          p_atomic_inc(&backing->bo->num_active_ioctls);
       }
 
-      mtx_unlock(&bo->u.sparse.commit_lock);
+      simple_mtx_unlock(&bo->u.sparse.commit_lock);
    }
 
    return true;
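
Every early return inside these locked regions has to drop commit_lock explicitly, which is why the failure path above unlocks before bailing out. A condensed sketch of the pattern (illustrative, not a literal copy of the function):

/* Condensed sketch of the pattern above: commit_lock must be
 * released on the failure path as well as on the normal exit. */
simple_mtx_lock(&bo->u.sparse.commit_lock);
list_for_each_entry(struct amdgpu_sparse_backing, backing,
                    &bo->u.sparse.backing, list) {
   if (amdgpu_do_add_real_buffer(cs, backing->bo) < 0) {
      simple_mtx_unlock(&bo->u.sparse.commit_lock);
      return false;   /* early exit still releases the lock */
   }
   p_atomic_inc(&backing->bo->num_active_ioctls);
}
simple_mtx_unlock(&bo->u.sparse.commit_lock);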
@@ -1187,11 +1188,11 @@ void amdgpu_cs_submit_ib(void *job, int thread_index)
       amdgpu_bo_handle *handles;
       unsigned num = 0;
 
-      mtx_lock(&ws->global_bo_list_lock);
+      simple_mtx_lock(&ws->global_bo_list_lock);
 
       handles = malloc(sizeof(handles[0]) * ws->num_buffers);
       if (!handles) {
-         mtx_unlock(&ws->global_bo_list_lock);
+         simple_mtx_unlock(&ws->global_bo_list_lock);
          amdgpu_cs_context_cleanup(cs);
          cs->error_code = -ENOMEM;
          return;
@@ -1205,7 +1206,7 @@ void amdgpu_cs_submit_ib(void *job, int thread_index)
       r = amdgpu_bo_list_create(ws->dev, ws->num_buffers,
                                 handles, NULL, &bo_list);
       free(handles);
-      mtx_unlock(&ws->global_bo_list_lock);
+      simple_mtx_unlock(&ws->global_bo_list_lock);
    } else {
       unsigned num_handles;
 
@@ -1418,6 +1419,7 @@ static int amdgpu_cs_flush(struct radeon_winsys_cs *rcs,
          while (rcs->current.cdw & 7)
             radeon_emit(rcs, 0xffff1000); /* type3 nop packet */
       }
+      ws->gfx_ib_size_counter += (rcs->prev_dw + rcs->current.cdw) * 4;
       break;
    case RING_UVD:
       while (rcs->current.cdw & 15)
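
The new gfx_ib_size_counter accumulates the size of every flushed GFX IB in bytes: prev_dw counts the dwords of previously chained chunks, current.cdw the dwords of the active chunk, and each dword is 4 bytes. For example, an IB with 3000 dwords in chained chunks plus 500 dwords in the current chunk adds (3000 + 500) * 4 = 14000 bytes. Presumably the winsys exposes this running total so callers can derive an average GFX IB size, though that consumer is not part of this diff.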
@@ -1467,7 +1469,7 @@ static int amdgpu_cs_flush(struct radeon_winsys_cs *rcs,
        * that the order of fence dependency updates matches the order of
        * submissions.
        */
-      mtx_lock(&ws->bo_fence_lock);
+      simple_mtx_lock(&ws->bo_fence_lock);
       amdgpu_add_fence_dependencies_bo_lists(cs);
 
       /* Swap command streams. "cst" is going to be submitted. */
@@ -1478,7 +1480,7 @@ static int amdgpu_cs_flush(struct radeon_winsys_cs *rcs,
       util_queue_add_job(&ws->cs_queue, cs, &cs->flush_completed,
                          amdgpu_cs_submit_ib, NULL);
       /* The submission has been queued, unlock the fence now. */
-      mtx_unlock(&ws->bo_fence_lock);
+      simple_mtx_unlock(&ws->bo_fence_lock);
 
       if (!(flags & RADEON_FLUSH_ASYNC)) {
          amdgpu_cs_sync_flush(rcs);
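
The fence bookkeeping keeps its ordering guarantee after the lock swap: bo_fence_lock is held from the point where fence dependencies are recorded until the submission job has been queued, so two threads flushing at the same time cannot update per-BO fences in one order and submit in another. A condensed sketch of that window (the command-stream swap is elided):

/* Condensed sketch of the ordering guarantee above: the fence lock
 * covers dependency bookkeeping and job queueing, so fence-update
 * order matches submission order across threads. */
simple_mtx_lock(&ws->bo_fence_lock);
amdgpu_add_fence_dependencies_bo_lists(cs);        /* record dependencies */
/* ... swap cs->csc / cs->cst so "cst" gets submitted ... */
util_queue_add_job(&ws->cs_queue, cs, &cs->flush_completed,
                   amdgpu_cs_submit_ib, NULL);     /* queue the submission */
simple_mtx_unlock(&ws->bo_fence_lock);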