iris: Annotate all BO uses with domain and sequence number information.

[mesa.git] / src / gallium / drivers / iris / iris_batch.h
diff --git a/src/gallium/drivers/iris/iris_batch.h b/src/gallium/drivers/iris/iris_batch.h

index 771fb48ced127d207e05de2300407284b34fbb65..bfea20d268cc66d9c25f49eccd55f716ad2f1ef7 100644 (file)
--- a/src/gallium/drivers/iris/iris_batch.h
+++ b/src/gallium/drivers/iris/iris_batch.h
@@ -26,47 +26,60 @@
  
  #include <stdint.h>
  #include <stdbool.h>
+#include <string.h>
+
+#include "util/u_dynarray.h"
+
+#include "drm-uapi/i915_drm.h"
+#include "common/gen_decoder.h"
+
+#include "iris_fence.h"
+#include "iris_fine_fence.h"
+
+struct iris_context;
  
  /* The kernel assumes batchbuffers are smaller than 256kB. */
  #define MAX_BATCH_SIZE (256 * 1024)
  
-/* 3DSTATE_BINDING_TABLE_POINTERS has a U16 offset from Surface State Base
- * Address, which means that we can't put binding tables beyond 64kB.  This
- * effectively limits the maximum statebuffer size to 64kB.
+/* Terminating the batch takes either 4 bytes for MI_BATCH_BUFFER_END
+ * or 12 bytes for MI_BATCH_BUFFER_START (when chaining).  Plus another
+ * 24 bytes for the seqno write (using PIPE_CONTROL).
   */
-#define MAX_STATE_SIZE (64 * 1024)
+#define BATCH_RESERVED 36
  
-struct iris_address {
-   struct iris_bo *bo;
-   unsigned reloc_flags;
-   uint64_t offset;
-};
+/* Our target batch size - flush approximately at this point. */
+#define BATCH_SZ (64 * 1024 - BATCH_RESERVED)
  
-struct iris_batch_buffer {
-   struct iris_bo *bo;
-   void *map;
-   void *map_next;
-
-   struct iris_bo *partial_bo;
-   unsigned partial_bytes;
+enum iris_batch_name {
+   IRIS_BATCH_RENDER,
+   IRIS_BATCH_COMPUTE,
  };
  
+#define IRIS_BATCH_COUNT 2
+
  struct iris_batch {
     struct iris_screen *screen;
     struct pipe_debug_callback *dbg;
+   struct pipe_device_reset_callback *reset;
+
+   /** What batch is this? (e.g. IRIS_BATCH_RENDER/COMPUTE) */
+   enum iris_batch_name name;
  
     /** Current batchbuffer being queued up. */
-   struct iris_batch_buffer cmdbuf;
+   struct iris_bo *bo;
+   void *map;
+   void *map_next;
  
-   /** Last BO submitted to the hardware.  Used for glFinish(). */
-   struct iris_bo *last_cmd_bo;
+   /** Size of the primary batch being submitted to execbuf (in bytes). */
+   unsigned primary_batch_size;
  
-   uint32_t hw_ctx_id;
+   /** Total size of all chained batches (in bytes). */
+   unsigned total_chained_batch_size;
  
-   /** Which ring this batch targets - a I915_EXEC_RING_MASK value */
-   uint8_t ring;
+   /** Last Surface State Base Address set in this hardware context. */
+   uint64_t last_surface_base_address;
  
-   bool no_wrap;
+   uint32_t hw_ctx_id;
  
     /** The validation list */
     struct drm_i915_gem_exec_object2 *validation_list;
@@ -74,38 +87,226 @@ struct iris_batch {
     int exec_count;
     int exec_array_size;
  
+   /** Whether INTEL_BLACKHOLE_RENDER is enabled in the batch (i.e. the
+    * first instruction is an MI_BATCH_BUFFER_END).
+    */
+   bool noop_enabled;
+
+   /**
+    * A list of iris_syncobjs associated with this batch.
+    *
+    * The first list entry will always be a signalling sync-point, indicating
+    * that this batch has completed.  The others are likely to be sync-points
+    * to wait on before executing the batch.
+    */
+   struct util_dynarray syncobjs;
+
+   /** A list of drm_i915_exec_fences to have execbuf signal or wait on */
+   struct util_dynarray exec_fences;
+
     /** The amount of aperture space (in bytes) used by all exec_bos */
     int aperture_space;
  
-   /** Map from batch offset to iris_alloc_state data (with DEBUG_BATCH) */
-   struct hash_table *state_sizes;
+   struct {
+      /** Uploader to use for sequence numbers */
+      struct u_upload_mgr *uploader;
  
-   void (*emit_state_base_address)(struct iris_batch *batch);
-};
+      /** GPU buffer and CPU map where our seqnos will be written. */
+      struct iris_state_ref ref;
+      uint32_t *map;
  
-void iris_init_batch(struct iris_batch *batch,
-                     struct iris_screen *screen,
-                     struct pipe_debug_callback *dbg,
-                     uint8_t ring);
-void iris_batch_free(struct iris_batch *batch);
-void iris_require_command_space(struct iris_batch *batch, unsigned size);
-void iris_batch_emit(struct iris_batch *batch, const void *data, unsigned size);
+      /** The sequence number to write the next time we add a fence. */
+      uint32_t next;
+   } fine_fences;
  
-int _iris_batch_flush_fence(struct iris_batch *batch,
-                            int in_fence_fd, int *out_fence_fd,
-                            const char *file, int line);
+   /** A seqno (and syncobj) for the last batch that was submitted. */
+   struct iris_fine_fence *last_fence;
  
+   /** List of other batches which we might need to flush to use a BO */
+   struct iris_batch *other_batches[IRIS_BATCH_COUNT - 1];
  
-#define iris_batch_flush_fence(batch, in_fence_fd, out_fence_fd) \
-   _iris_batch_flush_fence((batch), (in_fence_fd), (out_fence_fd), \
-                           __FILE__, __LINE__)
+   struct {
+      /**
+       * Set of struct iris_bo * that have been rendered to within this
+       * batchbuffer and would need flushing before being used from another
+       * cache domain that isn't coherent with it (i.e. the sampler).
+       */
+      struct hash_table *render;
  
-#define iris_batch_flush(batch) iris_batch_flush_fence((batch), -1, NULL)
+      /**
+       * Set of struct iris_bo * that have been used as a depth buffer within
+       * this batchbuffer and would need flushing before being used from
+       * another cache domain that isn't coherent with it (i.e. the sampler).
+       */
+      struct set *depth;
+   } cache;
+
+   struct gen_batch_decode_ctx decoder;
+   struct hash_table_u64 *state_sizes;
+
+   /**
+    * Sequence number used to track the completion of any subsequent memory
+    * operations in the batch until the next sync boundary.
+    */
+   uint64_t next_seqno;
+
+   /** Have we emitted any draw calls to this batch? */
+   bool contains_draw;
+
+   /**
+    * Number of times iris_batch_sync_region_start() has been called without a
+    * matching iris_batch_sync_region_end() on this batch.
+    */
+   uint32_t sync_region_depth;
+
+   uint32_t last_aux_map_state;
+};
+
+void iris_init_batch(struct iris_context *ice,
+                     enum iris_batch_name name,
+                     int priority);
+void iris_chain_to_new_batch(struct iris_batch *batch);
+void iris_batch_free(struct iris_batch *batch);
+void iris_batch_maybe_flush(struct iris_batch *batch, unsigned estimate);
+
+void _iris_batch_flush(struct iris_batch *batch, const char *file, int line);
+#define iris_batch_flush(batch) _iris_batch_flush((batch), __FILE__, __LINE__)
  
  bool iris_batch_references(struct iris_batch *batch, struct iris_bo *bo);
  
+bool iris_batch_prepare_noop(struct iris_batch *batch, bool noop_enable);
+
  #define RELOC_WRITE EXEC_OBJECT_WRITE
  
-void iris_use_pinned_bo(struct iris_batch *batch, struct iris_bo *bo);
+void iris_use_pinned_bo(struct iris_batch *batch, struct iris_bo *bo,
+                        bool writable, enum iris_domain access);
+
+enum pipe_reset_status iris_batch_check_for_reset(struct iris_batch *batch);
+/** Bytes written so far: distance from batch->map to batch->map_next. */
+static inline unsigned
+iris_batch_bytes_used(struct iris_batch *batch)
+{
+   return batch->map_next - batch->map;
+}
+
+/**
+ * Ensure the current command buffer has \p size bytes of space remaining.
+ * If the bytes already used plus \p size reach BATCH_SZ, this chains to a
+ * secondary batch buffer (iris_chain_to_new_batch()) and jumps to it.
+ *
+ * Most callers want iris_get_command_space() instead.
+ */
+static inline void
+iris_require_command_space(struct iris_batch *batch, unsigned size)
+{
+   const unsigned required_bytes = iris_batch_bytes_used(batch) + size;
+
+   if (required_bytes >= BATCH_SZ) {
+      iris_chain_to_new_batch(batch);
+   }
+}
+
+/**
+ * Reserve \p bytes in the current command buffer (chaining to a new batch
+ * first if needed) and return a pointer to the start of the reserved area.
+ *
+ * Advances batch->map_next; call this whenever emitting commands.
+ */
+static inline void *
+iris_get_command_space(struct iris_batch *batch, unsigned bytes)
+{
+   iris_require_command_space(batch, bytes);
+   void *map = batch->map_next;
+   batch->map_next += bytes;
+   return map;
+}
+
+/**
+ * Emit GPU commands: reserve \p size bytes and memcpy \p data into them.
+ */
+static inline void
+iris_batch_emit(struct iris_batch *batch, const void *data, unsigned size)
+{
+   void *map = iris_get_command_space(batch, size);
+   memcpy(map, data, size);
+}
+
+/**
+ * Return the batch's signalling syncobj without taking a reference to it.
+ */
+static inline struct iris_syncobj *
+iris_batch_get_signal_syncobj(struct iris_batch *batch)
+{
+   /* Entry 0 is the signalling syncobj (list assumed non-empty). */
+   struct iris_syncobj *syncobj =
+      ((struct iris_syncobj **) util_dynarray_begin(&batch->syncobjs))[0];
+   return syncobj;
+}
+
+
+/**
+ * Store a reference to the batch's signalling syncobj in \p out_syncobj.
+ *
+ * Callers can use this to wait for the current batch under construction
+ * to complete (after flushing it).
+ */
+static inline void
+iris_batch_reference_signal_syncobj(struct iris_batch *batch,
+                                   struct iris_syncobj **out_syncobj)
+{
+   struct iris_syncobj *syncobj = iris_batch_get_signal_syncobj(batch);
+   iris_syncobj_reference(batch->screen, out_syncobj, syncobj);
+}
+
+/**
+ * Record a state's size by offset for INTEL_DEBUG=bat; no-op if ht is NULL.
+ */
+static inline void
+iris_record_state_size(struct hash_table_u64 *ht,
+                       uint32_t offset_from_base,
+                       uint32_t size)
+{
+   if (ht) {
+      _mesa_hash_table_u64_insert(ht, offset_from_base,
+                                  (void *)(uintptr_t) size);
+   }
+}
+
+/**
+ * Mark the start of a region of the batch with a stable synchronization
+ * sequence number (increments sync_region_depth, so regions may nest).  A BO
+ * accessed in the region only needs to be marked once (e.g. via
+ * iris_bo_bump_seqno()) before the matching iris_batch_sync_region_end().
+ */
+static inline void
+iris_batch_sync_region_start(struct iris_batch *batch)
+{
+   batch->sync_region_depth++;
+}
+
+/**
+ * Mark the end of a region of the batch with a stable synchronization
+ * sequence number.  Call exactly once per iris_batch_sync_region_start();
+ * asserts that a region is actually open before decrementing the depth.
+ */
+static inline void
+iris_batch_sync_region_end(struct iris_batch *batch)
+{
+   assert(batch->sync_region_depth);
+   batch->sync_region_depth--;
+}
+
+/**
+ * Start a new synchronization section at the current point of the batch by
+ * taking a fresh screen-wide seqno, unless inside an open sync region.
+ */
+static inline void
+iris_batch_sync_boundary(struct iris_batch *batch)
+{
+   if (!batch->sync_region_depth) {
+      batch->next_seqno = p_atomic_inc_return(&batch->screen->last_seqno);
+      assert(batch->next_seqno > 0);
+   }
+}
  
  #endif