amd,radeonsi: rename radeon_winsys_cs -> radeon_cmdbuf

[mesa.git] / src / gallium / winsys / amdgpu / drm / amdgpu_cs.h
diff --git a/src/gallium/winsys/amdgpu/drm/amdgpu_cs.h b/src/gallium/winsys/amdgpu/drm/amdgpu_cs.h

index a2fb44a4b0efff7290c87759f712fc350e4cbb57..5f96193750bcc82872b27e0305b08c4c55893055 100644 (file)
--- a/src/gallium/winsys/amdgpu/drm/amdgpu_cs.h
+++ b/src/gallium/winsys/amdgpu/drm/amdgpu_cs.h
@@ -24,16 +24,13 @@
   * next paragraph) shall be included in all copies or substantial portions
   * of the Software.
   */
-/*
- * Authors:
- *      Marek Olšák <maraeo@gmail.com>
- */
  
  #ifndef AMDGPU_CS_H
  #define AMDGPU_CS_H
  
  #include "amdgpu_bo.h"
  #include "util/u_memory.h"
+#include <amdgpu_drm.h>
  
  struct amdgpu_ctx {
     struct amdgpu_winsys *ws;
@@ -41,59 +38,129 @@ struct amdgpu_ctx {
     amdgpu_bo_handle user_fence_bo;
     uint64_t *user_fence_cpu_address_base;
     int refcount;
+   unsigned initial_num_total_rejected_cs;
+   unsigned num_rejected_cs;
  };
  
  struct amdgpu_cs_buffer {
     struct amdgpu_winsys_bo *bo;
-   uint64_t priority_usage;
+   union {
+      struct {
+         uint64_t priority_usage;
+      } real;
+      struct {
+         uint32_t real_idx; /* index of underlying real BO */
+      } slab;
+   } u;
     enum radeon_bo_usage usage;
-   enum radeon_bo_domain domains;
  };
  
+enum ib_type {
+   IB_MAIN,
+   IB_NUM,
+};
  
-struct amdgpu_cs {
-   struct radeon_winsys_cs base;
-   struct amdgpu_ctx *ctx;
-
-   /* Flush CS. */
-   void (*flush_cs)(void *ctx, unsigned flags, struct pipe_fence_handle **fence);
-   void *flush_data;
+struct amdgpu_ib {
+   struct radeon_cmdbuf base;
  
     /* A buffer out of which new IBs are allocated. */
-   struct pb_buffer *big_ib_buffer; /* for holding the reference */
-   struct amdgpu_winsys_bo *big_ib_winsys_buffer;
-   uint8_t *ib_mapped;
-   unsigned used_ib_space;
+   struct pb_buffer        *big_ib_buffer;
+   uint8_t                 *ib_mapped;
+   unsigned                used_ib_space;
+   unsigned                max_ib_size;
+   uint32_t                *ptr_ib_size;
+   bool                    ptr_ib_size_inside_ib;
+   enum ib_type            ib_type;
+};
  
-   /* amdgpu_cs_submit parameters */
-   struct amdgpu_cs_request    request;
-   struct amdgpu_cs_ib_info    ib;
+struct amdgpu_cs_context {
+   struct drm_amdgpu_cs_chunk_ib ib[IB_NUM];
  
     /* Buffers. */
-   unsigned                    max_num_buffers;
-   unsigned                    num_buffers;
+   unsigned                    max_real_buffers;
+   unsigned                    num_real_buffers;
+   struct amdgpu_cs_buffer     *real_buffers;
+
+   unsigned                    max_real_submit;
     amdgpu_bo_handle            *handles;
     uint8_t                     *flags;
-   struct amdgpu_cs_buffer     *buffers;
+
+   unsigned                    num_slab_buffers;
+   unsigned                    max_slab_buffers;
+   struct amdgpu_cs_buffer     *slab_buffers;
+
+   unsigned                    num_sparse_buffers;
+   unsigned                    max_sparse_buffers;
+   struct amdgpu_cs_buffer     *sparse_buffers;
  
     int                         buffer_indices_hashlist[4096];
  
-   uint64_t                    used_vram;
-   uint64_t                    used_gart;
+   struct amdgpu_winsys_bo     *last_added_bo;
+   unsigned                    last_added_bo_index;
+   unsigned                    last_added_bo_usage;
+   uint64_t                    last_added_bo_priority_usage;
+
+   struct pipe_fence_handle    **fence_dependencies;
+   unsigned                    num_fence_dependencies;
+   unsigned                    max_fence_dependencies;
  
-   unsigned                    max_dependencies;
+   struct pipe_fence_handle    **syncobj_to_signal;
+   unsigned                    num_syncobj_to_signal;
+   unsigned                    max_syncobj_to_signal;
+
+   struct pipe_fence_handle    *fence;
+
+   /* the error returned from cs_flush for non-async submissions */
+   int                         error_code;
+};
+
+struct amdgpu_cs {
+   struct amdgpu_ib main; /* must be first because this is inherited */
+   struct amdgpu_ctx *ctx;
+   enum ring_type ring_type;
+   struct drm_amdgpu_cs_chunk_fence fence_chunk;
+
+   /* We flip between these two CS. While one is being consumed
+    * by the kernel in another thread, the other one is being filled
+    * by the pipe driver. */
+   struct amdgpu_cs_context csc1;
+   struct amdgpu_cs_context csc2;
+   /* The currently-used CS. */
+   struct amdgpu_cs_context *csc;
+   /* The CS being currently-owned by the other thread. */
+   struct amdgpu_cs_context *cst;
+
+   /* Flush CS. */
+   void (*flush_cs)(void *ctx, unsigned flags, struct pipe_fence_handle **fence);
+   void *flush_data;
+
+   struct util_queue_fence flush_completed;
+   struct pipe_fence_handle *next_fence;
  };
  
  struct amdgpu_fence {
     struct pipe_reference reference;
+   /* If ctx == NULL, this fence is syncobj-based. */
+   uint32_t syncobj;
  
+   struct amdgpu_winsys *ws;
     struct amdgpu_ctx *ctx;  /* submission context */
     struct amdgpu_cs_fence fence;
     uint64_t *user_fence_cpu_address;
  
+   /* If the fence has been submitted. This is unsignalled for deferred fences
+    * (cs->next_fence) and while an IB is still being submitted in the submit
+    * thread. */
+   struct util_queue_fence submitted;
+
     volatile int signalled;              /* bool (int for atomicity) */
  };
  
+static inline bool amdgpu_fence_is_syncobj(struct amdgpu_fence *fence)
+{
+   return fence->ctx == NULL;
+}
+
  static inline void amdgpu_ctx_unref(struct amdgpu_ctx *ctx)
  {
     if (p_atomic_dec_zero(&ctx->refcount)) {
@@ -110,47 +177,80 @@ static inline void amdgpu_fence_reference(struct pipe_fence_handle **dst,
     struct amdgpu_fence *rsrc = (struct amdgpu_fence *)src;
  
     if (pipe_reference(&(*rdst)->reference, &rsrc->reference)) {
-      amdgpu_ctx_unref((*rdst)->ctx);
-      FREE(*rdst);
+      struct amdgpu_fence *fence = *rdst;
+
+      if (amdgpu_fence_is_syncobj(fence))
+         amdgpu_cs_destroy_syncobj(fence->ws->dev, fence->syncobj);
+      else
+         amdgpu_ctx_unref(fence->ctx);
+
+      util_queue_fence_destroy(&fence->submitted);
+      FREE(fence);
     }
     *rdst = rsrc;
  }
  
-int amdgpu_lookup_buffer(struct amdgpu_cs *csc, struct amdgpu_winsys_bo *bo);
+int amdgpu_lookup_buffer(struct amdgpu_cs_context *cs, struct amdgpu_winsys_bo *bo);
+
+static inline struct amdgpu_ib *
+amdgpu_ib(struct radeon_cmdbuf *base)
+{
+   return (struct amdgpu_ib *)base;
+}
  
  static inline struct amdgpu_cs *
-amdgpu_cs(struct radeon_winsys_cs *base)
+amdgpu_cs(struct radeon_cmdbuf *base)
  {
+   assert(amdgpu_ib(base)->ib_type == IB_MAIN);
     return (struct amdgpu_cs*)base;
  }
  
-static inline boolean
+#define get_container(member_ptr, container_type, container_member) \
+   (container_type *)((char *)(member_ptr) - offsetof(container_type, container_member))
+
+static inline struct amdgpu_cs *
+amdgpu_cs_from_ib(struct amdgpu_ib *ib)
+{
+   switch (ib->ib_type) {
+   case IB_MAIN:
+      return get_container(ib, struct amdgpu_cs, main);
+   default:
+      unreachable("bad ib_type");
+   }
+}
+
+static inline bool
  amdgpu_bo_is_referenced_by_cs(struct amdgpu_cs *cs,
                                struct amdgpu_winsys_bo *bo)
  {
     int num_refs = bo->num_cs_references;
     return num_refs == bo->ws->num_cs ||
-         (num_refs && amdgpu_lookup_buffer(cs, bo) != -1);
+         (num_refs && amdgpu_lookup_buffer(cs->csc, bo) != -1);
  }
  
-static inline boolean
+static inline bool
  amdgpu_bo_is_referenced_by_cs_with_usage(struct amdgpu_cs *cs,
                                           struct amdgpu_winsys_bo *bo,
                                           enum radeon_bo_usage usage)
  {
     int index;
+   struct amdgpu_cs_buffer *buffer;
  
     if (!bo->num_cs_references)
-      return FALSE;
+      return false;
  
-   index = amdgpu_lookup_buffer(cs, bo);
+   index = amdgpu_lookup_buffer(cs->csc, bo);
     if (index == -1)
-      return FALSE;
+      return false;
+
+   buffer = bo->bo ? &cs->csc->real_buffers[index] :
+            bo->sparse ? &cs->csc->sparse_buffers[index] :
+            &cs->csc->slab_buffers[index];
  
-   return (cs->buffers[index].usage & usage) != 0;
+   return (buffer->usage & usage) != 0;
  }
  
-static inline boolean
+static inline bool
  amdgpu_bo_is_referenced_by_any_cs(struct amdgpu_winsys_bo *bo)
  {
     return bo->num_cs_references != 0;
@@ -158,6 +258,11 @@ amdgpu_bo_is_referenced_by_any_cs(struct amdgpu_winsys_bo *bo)
  
  bool amdgpu_fence_wait(struct pipe_fence_handle *fence, uint64_t timeout,
                         bool absolute);
+void amdgpu_add_fences(struct amdgpu_winsys_bo *bo,
+                       unsigned num_fences,
+                       struct pipe_fence_handle **fences);
+void amdgpu_cs_sync_flush(struct radeon_cmdbuf *rcs);
  void amdgpu_cs_init_functions(struct amdgpu_winsys *ws);
+void amdgpu_cs_submit_ib(void *job, int thread_index);
  
  #endif