radeonsi/gfx10: update a tunable max_es_verts_base for NGG
[mesa.git] / src / gallium / drivers / panfrost / pan_job.h
index ed8b084246add58133b08c84e0c7d4bdc03968e8..c6ae2a4eb9f4039ed149d69fb6b64f2baadf4dff 100644 (file)
 #ifndef __PAN_JOB_H__
 #define __PAN_JOB_H__
 
+#include "util/u_dynarray.h"
+#include "pipe/p_state.h"
+#include "pan_allocate.h"
+#include "pan_resource.h"
+
 /* Used as a hash table key */
 
 struct panfrost_job_key {
@@ -46,8 +51,12 @@ struct panfrost_job {
         /* Buffers cleared (PIPE_CLEAR_* bitmask) */
         unsigned clear;
 
-        /* Packed clear values */
-        uint32_t clear_color;
+        /* Packed clear values, indexed by both render target as well as word.
+         * Essentially, a single pixel is packed, with some padding to bring it
+         * up to a 32-bit interval; that pixel is then duplicated over to fill
+         * all 16-bytes */
+
+        uint32_t clear_color[PIPE_MAX_COLOR_BUFS][4];
         float clear_depth;
         unsigned clear_stencil;
 
@@ -61,8 +70,48 @@ struct panfrost_job {
         unsigned minx, miny;
         unsigned maxx, maxy;
 
+        /* CPU pointers to the job descriptor headers. next_job is only
+         * set at submit time (since only then are all the dependencies
+         * known). The upshot is that this is append-only.
+         *
+         * These arrays contain the headers for the "primary batch", our jargon
+         * referring to the part of the panfrost_job that actually contains
+         * meaningful work. In an OpenGL ES setting, that means the
+         * SET_VALUE/VERTEX/TILER jobs. Excluded is specifically the FRAGMENT
+         * job, which is sent on as a secondary batch containing only a single
+         * hardware job. Since there's one and only one FRAGMENT job issued per
+         * panfrost_job, there is no need to do any scoreboarding / management;
+         * it's easy enough to open-code it and it's not like we can get any
+         * better anyway. */
+        struct util_dynarray headers;
+
+        /* (And the GPU versions; TODO maybe combine) */
+        struct util_dynarray gpu_headers;
+
+        /* The last job in the primary batch */
+        struct panfrost_transfer last_job;
+
+        /* The first/last tiler job */
+        struct panfrost_transfer first_tiler;
+        struct panfrost_transfer last_tiler;
+
+        /* The first vertex job used as the input to a tiler job */
+        struct panfrost_transfer first_vertex_for_tiler;
+
+        /* The first job. Notice we've created a linked list */
+        struct panfrost_transfer first_job;
+
+        /* The number of jobs in the primary batch, essentially */
+        unsigned job_index;
+
         /* BOs referenced -- will be used for flushing logic */
         struct set *bos;
+
+        /* Indices of transient BOs referenced */
+        struct util_dynarray transient_indices;
+
+        /* Within the topmost transient BO, how much has been used? */
+        unsigned transient_offset;
 };
 
 /* Functions for managing the above */
@@ -75,7 +124,7 @@ panfrost_free_job(struct panfrost_context *ctx, struct panfrost_job *job);
 
 struct panfrost_job *
 panfrost_get_job(struct panfrost_context *ctx,
-                struct pipe_surface **cbufs, struct pipe_surface *zsbuf);
+                 struct pipe_surface **cbufs, struct pipe_surface *zsbuf);
 
 struct panfrost_job *
 panfrost_get_job_for_fbo(struct panfrost_context *ctx);
@@ -88,29 +137,61 @@ panfrost_job_add_bo(struct panfrost_job *job, struct panfrost_bo *bo);
 
 void
 panfrost_flush_jobs_writing_resource(struct panfrost_context *panfrost,
-                                struct pipe_resource *prsc);
+                                     struct pipe_resource *prsc);
 
 void
 panfrost_flush_jobs_reading_resource(struct panfrost_context *panfrost,
-                                struct pipe_resource *prsc);
+                                     struct pipe_resource *prsc);
 
 void
 panfrost_job_submit(struct panfrost_context *ctx, struct panfrost_job *job);
 
 void
 panfrost_job_set_requirements(struct panfrost_context *ctx,
-                         struct panfrost_job *job);
+                              struct panfrost_job *job);
 
 void
 panfrost_job_clear(struct panfrost_context *ctx,
-                struct panfrost_job *job,
-                unsigned buffers,
-                const union pipe_color_union *color,
-                double depth, unsigned stencil);
+                   struct panfrost_job *job,
+                   unsigned buffers,
+                   const union pipe_color_union *color,
+                   double depth, unsigned stencil);
 
 void
 panfrost_job_union_scissor(struct panfrost_job *job,
-                unsigned minx, unsigned miny,
-                unsigned maxx, unsigned maxy);
+                           unsigned minx, unsigned miny,
+                           unsigned maxx, unsigned maxy);
+
+/* Scoreboarding */
+
+void
+panfrost_scoreboard_queue_compute_job(
+        struct panfrost_job *batch,
+        struct panfrost_transfer job);
+
+void
+panfrost_scoreboard_queue_vertex_job(
+        struct panfrost_job *batch,
+        struct panfrost_transfer vertex,
+        bool requires_tiling);
+
+void
+panfrost_scoreboard_queue_tiler_job(
+        struct panfrost_job *batch,
+        struct panfrost_transfer tiler);
+
+void
+panfrost_scoreboard_queue_fused_job(
+        struct panfrost_job *batch,
+        struct panfrost_transfer vertex,
+        struct panfrost_transfer tiler);
+void
+panfrost_scoreboard_queue_fused_job_prepend(
+        struct panfrost_job *batch,
+        struct panfrost_transfer vertex,
+        struct panfrost_transfer tiler);
+
+void
+panfrost_scoreboard_link_batch(struct panfrost_job *batch);
 
 #endif