#include <assert.h>
#include "pan_resource.h"
#include "pan_job.h"
+#include "pan_blend.h"
+#include "pan_encoder.h"
#include "pipe/p_compiler.h"
#include "pipe/p_config.h"
#include "util/hash_table.h"
#include "midgard/midgard_compile.h"
+#include "compiler/shader_enums.h"
/* Forward declare to avoid extra header dep */
struct prim_convert_context;
unsigned type;
unsigned index;
- /* Memory for the GPU to writeback the value of the query */
- struct panfrost_transfer transfer;
+ union {
+ /* For computed queries. 64-bit to prevent overflow */
+ struct {
+ uint64_t start;
+ uint64_t end;
+ };
+
+ /* Memory for the GPU to writeback the value of the query */
+ struct panfrost_transfer transfer;
+ };
};
struct panfrost_fence {
int fd;
};
-#define PANFROST_MAX_TRANSIENT_ENTRIES 64
-
-struct panfrost_transient_pool {
- /* Memory blocks in the pool */
- struct panfrost_memory_entry *entries[PANFROST_MAX_TRANSIENT_ENTRIES];
-
- /* Number of entries we own */
- unsigned entry_count;
-
- /* Current entry that we are writing to, zero-indexed, strictly less than entry_count */
- unsigned entry_index;
-
- /* Number of bytes into the current entry we are */
- off_t entry_offset;
-
- /* Entry size (all entries must be homogenous) */
- size_t entry_size;
+struct panfrost_streamout {
+ struct pipe_stream_output_target *targets[PIPE_MAX_SO_BUFFERS];
+ uint32_t offsets[PIPE_MAX_SO_BUFFERS];
+ unsigned num_targets;
};
struct panfrost_context {
/* Gallium context */
struct pipe_context base;
+ /* Compiler context */
+ struct midgard_screen compiler;
+
/* Bound job and map of panfrost_job_key to jobs */
struct panfrost_job *job;
struct hash_table *jobs;
/* panfrost_resource -> panfrost_job */
struct hash_table *write_jobs;
+ /* Within a launch_grid call.. */
+ const struct pipe_grid_info *compute_grid;
+
/* Bit mask for supported PIPE_DRAW for this hardware */
unsigned draw_modes;
struct pipe_framebuffer_state pipe_framebuffer;
-
- /* The number of concurrent FBOs allowed depends on the number of pools
- * used; pools are ringed for parallelism opportunities */
-
- struct panfrost_transient_pool transient_pools[2];
- int cmdstream_i;
+ struct panfrost_streamout streamout;
struct panfrost_memory cmdstream_persistent;
- struct panfrost_memory shaders;
struct panfrost_memory scratchpad;
struct panfrost_memory tiler_heap;
- struct panfrost_memory varying_mem;
- struct panfrost_memory tiler_polygon_list;
struct panfrost_memory tiler_dummy;
struct panfrost_memory depth_stencil_buffer;
+ bool active_queries;
+ uint64_t prims_generated;
+ uint64_t tf_prims_generated;
struct panfrost_query *occlusion_query;
/* Each draw has corresponding vertex and tiler payloads */
- struct midgard_payload_vertex_tiler payload_vertex;
- struct midgard_payload_vertex_tiler payload_tiler;
+ struct midgard_payload_vertex_tiler payloads[PIPE_SHADER_TYPES];
/* The fragment shader binary itself is pointed here (for the tripipe) but
* also everything else in the shader core, including blending, the
unsigned vertex_count;
unsigned instance_count;
+ enum pipe_prim_type active_prim;
/* If instancing is enabled, vertex count padded for instance; if
* it is disabled, just equal to plain vertex count */
union mali_attr attributes[PIPE_MAX_ATTRIBS];
- unsigned varying_height;
-
- struct mali_single_framebuffer vt_framebuffer_sfbd;
- struct bifrost_framebuffer vt_framebuffer_mfbd;
-
/* TODO: Multiple uniform buffers (index =/= 0), finer updates? */
struct panfrost_constant_buffer constant_buffer[PIPE_SHADER_TYPES];
- /* CSOs */
struct panfrost_rasterizer *rasterizer;
-
- struct panfrost_shader_variants *vs;
- struct panfrost_shader_variants *fs;
-
+ struct panfrost_shader_variants *shader[PIPE_SHADER_TYPES];
struct panfrost_vertex_state *vertex;
struct pipe_vertex_buffer vertex_buffers[PIPE_MAX_ATTRIBS];
uint32_t vb_mask;
+ struct pipe_shader_buffer ssbo[PIPE_SHADER_TYPES][PIPE_MAX_SHADER_BUFFERS];
+ uint32_t ssbo_mask[PIPE_SHADER_TYPES];
+
struct panfrost_sampler_state *samplers[PIPE_SHADER_TYPES][PIPE_MAX_SAMPLERS];
unsigned sampler_count[PIPE_SHADER_TYPES];
/* True for t6XX, false for t8xx. */
bool is_t6xx;
- /* If set, we'll require the use of single render-target framebuffer
- * descriptors (SFBD), for older hardware -- specifically, <T760 hardware, If
- * false, we'll use the MFBD no matter what. New hardware -does- retain support
- * for SFBD, and in theory we could flip between them on a per-RT basis, but
- * there's no real advantage to doing so */
- bool require_sfbd;
-
- uint32_t out_sync;
+ uint32_t out_sync;
};
/* Corresponds to the CSO */
unsigned tiler_gl_enables;
};
-struct panfrost_blend_state {
- struct pipe_blend_state base;
-
- /* Whether a blend shader is in use */
- bool has_blend_shader;
-
- /* Compiled fixed function command */
- struct mali_blend_equation equation;
- float constant;
-
- /* Compiled blend shader */
- mali_ptr blend_shader;
- int blend_work_count;
-};
-
/* Variants bundle together to form the backing CSO, bundling multiple
* shaders with varying emulated features baked in (alpha test
* parameters, etc) */
/* A shader state corresponds to the actual, current variant of the shader */
struct panfrost_shader_state {
- struct pipe_shader_state *base;
-
/* Compiled, mapped descriptor, ready for the hardware */
bool compiled;
struct mali_shader_meta *tripipe;
- mali_ptr tripipe_gpu;
/* Non-descript information */
int uniform_count;
bool can_discard;
bool writes_point_size;
bool reads_point_coord;
+ bool reads_face;
+ bool reads_frag_coord;
struct mali_attr_meta varyings[PIPE_MAX_ATTRIBS];
gl_varying_slot varyings_loc[PIPE_MAX_ATTRIBS];
+ struct pipe_stream_output_info stream_output;
+ uint64_t so_mask;
unsigned sysval_count;
unsigned sysval[MAX_SYSVAL_COUNT];
uint16_t point_sprite_mask;
unsigned point_sprite_upper_left : 1;
+
+ /* Should we enable helper invocations */
+ bool helper_invocations;
+
+ struct panfrost_bo *bo;
};
/* A collection of varyings (the CSO) */
struct panfrost_shader_variants {
- struct pipe_shader_state base;
+ /* A panfrost_shader_variants can represent a shader for
+ * either graphics or compute */
+
+ bool is_compute;
+
+ union {
+ struct pipe_shader_state base;
+ struct pipe_compute_state cbase;
+ };
struct panfrost_shader_state variants[MAX_SHADER_VARIANTS];
unsigned variant_count;
struct panfrost_sampler_view {
struct pipe_sampler_view base;
struct mali_texture_descriptor hw;
+ bool manual_stride;
};
static inline struct panfrost_context *
panfrost_fragment_job(struct panfrost_context *ctx, bool has_draws);
void
-panfrost_shader_compile(struct panfrost_context *ctx, struct mali_shader_meta *meta, const char *src, int type, struct panfrost_shader_state *state);
-
-void
-panfrost_pack_work_groups_compute(
- struct mali_vertex_tiler_prefix *out,
- unsigned num_x,
- unsigned num_y,
- unsigned num_z,
- unsigned size_x,
- unsigned size_y,
- unsigned size_z);
-
-void
-panfrost_pack_work_groups_fused(
- struct mali_vertex_tiler_prefix *vertex,
- struct mali_vertex_tiler_prefix *tiler,
- unsigned num_x,
- unsigned num_y,
- unsigned num_z,
- unsigned size_x,
- unsigned size_y,
- unsigned size_z);
+panfrost_shader_compile(
+ struct panfrost_context *ctx,
+ struct mali_shader_meta *meta,
+ enum pipe_shader_ir ir_type,
+ const void *ir,
+ gl_shader_stage stage,
+ struct panfrost_shader_state *state,
+ uint64_t *outputs_written);
/* Instancing */
struct pan_shift_odd
panfrost_padded_vertex_count(
- unsigned vertex_count,
- bool primitive_pot);
+ unsigned vertex_count,
+ bool primitive_pot);
unsigned
pan_expand_shift_odd(struct pan_shift_odd o);
+/* Compute */
+
+void
+panfrost_compute_context_init(struct pipe_context *pctx);
+
+/* Varyings */
+
+void
+panfrost_emit_varying_descriptor(
+ struct panfrost_context *ctx,
+ unsigned vertex_count);
#endif