pan/midgard: Implement nir_intrinsic_load_num_work_groups
[mesa.git] / src / gallium / drivers / panfrost / pan_context.h
1 /*
2 * © Copyright 2018 Alyssa Rosenzweig
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 * SOFTWARE.
22 *
23 */
24
25 #ifndef __BUILDER_H__
26 #define __BUILDER_H__
27
28 #define _LARGEFILE64_SOURCE 1
29 #define CACHE_LINE_SIZE 1024 /* TODO */
30 #include <sys/mman.h>
31 #include <assert.h>
32 #include "pan_resource.h"
33 #include "pan_job.h"
34 #include "pan_blend.h"
35
36 #include "pipe/p_compiler.h"
37 #include "pipe/p_config.h"
38 #include "pipe/p_context.h"
39 #include "pipe/p_defines.h"
40 #include "pipe/p_format.h"
41 #include "pipe/p_screen.h"
42 #include "pipe/p_state.h"
43 #include "util/u_blitter.h"
44 #include "util/hash_table.h"
45
46 #include "midgard/midgard_compile.h"
47 #include "compiler/shader_enums.h"
48
/* Forward declare to avoid an extra header dependency. The tag has to match
 * the one used by the `primconvert` member of struct panfrost_context. */
struct primconvert_context;
51
/* Driver-wide varying limit.
 * NOTE(review): the unit (count vs. bytes) is not evident from this header;
 * confirm against the users of this constant. */
#define MAX_VARYINGS 4096
53
/* Dirty-state bits, one bit per piece of state. Presumably these are OR'd
 * into panfrost_context::dirty -- confirm against the users. Bits 0 and 7
 * belonged to the CLEAR and VIEWPORT flags, which are kept commented out;
 * bit 1 is not assigned. */
//#define PAN_DIRTY_CLEAR       (1 << 0)
#define PAN_DIRTY_RASTERIZER    (1 << 2)
#define PAN_DIRTY_FS            (1 << 3)
#define PAN_DIRTY_FRAG_CORE     (PAN_DIRTY_FS) /* Dirty writes are tied */
#define PAN_DIRTY_VS            (1 << 4)
#define PAN_DIRTY_VERTEX        (1 << 5)
#define PAN_DIRTY_VERT_BUF      (1 << 6)
//#define PAN_DIRTY_VIEWPORT    (1 << 7)
#define PAN_DIRTY_SAMPLERS      (1 << 8)
#define PAN_DIRTY_TEXTURES      (1 << 9)
64
/* Set the bits of `bit` in `lval` when `cond` is true, clear them otherwise.
 *
 * The body is wrapped in do { } while (0) so that `SET_BIT(...);` expands to
 * exactly one statement. That keeps the macro usable as the body of an
 * unbraced if/else and prevents its internal `else` from pairing with a
 * caller's `if`. Invocations must be terminated with a semicolon.
 *
 * `lval` must be a modifiable lvalue; it is parenthesized so expressions such
 * as `*ptr` or `s->field` bind as intended. */
#define SET_BIT(lval, bit, cond) \
        do { \
                if (cond) \
                        (lval) |= (bit); \
                else \
                        (lval) &= ~(bit); \
        } while (0)
70
71 struct panfrost_constant_buffer {
72 struct pipe_constant_buffer cb[PIPE_MAX_CONSTANT_BUFFERS];
73 uint32_t enabled_mask;
74 uint32_t dirty_mask;
75 };
76
77 struct panfrost_query {
78 /* Passthrough from Gallium */
79 unsigned type;
80 unsigned index;
81
82 /* Memory for the GPU to writeback the value of the query */
83 struct panfrost_transfer transfer;
84 };
85
86 struct panfrost_fence {
87 struct pipe_reference reference;
88 int fd;
89 };
90
91 struct panfrost_streamout {
92 struct pipe_stream_output_target *targets[PIPE_MAX_SO_BUFFERS];
93 uint32_t offsets[PIPE_MAX_SO_BUFFERS];
94 unsigned num_targets;
95 };
96
97 struct panfrost_context {
98 /* Gallium context */
99 struct pipe_context base;
100
101 /* Compiler context */
102 struct midgard_screen compiler;
103
104 /* Bound job and map of panfrost_job_key to jobs */
105 struct panfrost_job *job;
106 struct hash_table *jobs;
107
108 /* panfrost_resource -> panfrost_job */
109 struct hash_table *write_jobs;
110
111 /* Within a launch_grid call.. */
112 const struct pipe_grid_info *compute_grid;
113
114 /* Bit mask for supported PIPE_DRAW for this hardware */
115 unsigned draw_modes;
116
117 struct pipe_framebuffer_state pipe_framebuffer;
118 struct panfrost_streamout streamout;
119
120 struct panfrost_memory cmdstream_persistent;
121 struct panfrost_memory scratchpad;
122 struct panfrost_memory tiler_heap;
123 struct panfrost_memory tiler_dummy;
124 struct panfrost_memory depth_stencil_buffer;
125
126 struct panfrost_query *occlusion_query;
127
128 /* Each draw has corresponding vertex and tiler payloads */
129 struct midgard_payload_vertex_tiler payloads[PIPE_SHADER_TYPES];
130
131 /* The fragment shader binary itself is pointed here (for the tripipe) but
132 * also everything else in the shader core, including blending, the
133 * stencil/depth tests, etc. Refer to the presentations. */
134
135 struct mali_shader_meta fragment_shader_core;
136
137 /* Per-draw Dirty flags are setup like any other driver */
138 int dirty;
139
140 unsigned vertex_count;
141 unsigned instance_count;
142
143 /* If instancing is enabled, vertex count padded for instance; if
144 * it is disabled, just equal to plain vertex count */
145 unsigned padded_count;
146
147 union mali_attr attributes[PIPE_MAX_ATTRIBS];
148
149 /* TODO: Multiple uniform buffers (index =/= 0), finer updates? */
150
151 struct panfrost_constant_buffer constant_buffer[PIPE_SHADER_TYPES];
152
153 struct panfrost_rasterizer *rasterizer;
154 struct panfrost_shader_variants *shader[PIPE_SHADER_TYPES];
155 struct panfrost_vertex_state *vertex;
156
157 struct pipe_vertex_buffer vertex_buffers[PIPE_MAX_ATTRIBS];
158 uint32_t vb_mask;
159
160 struct pipe_shader_buffer ssbo[PIPE_SHADER_TYPES][PIPE_MAX_SHADER_BUFFERS];
161 uint32_t ssbo_mask[PIPE_SHADER_TYPES];
162
163 struct panfrost_sampler_state *samplers[PIPE_SHADER_TYPES][PIPE_MAX_SAMPLERS];
164 unsigned sampler_count[PIPE_SHADER_TYPES];
165
166 struct panfrost_sampler_view *sampler_views[PIPE_SHADER_TYPES][PIPE_MAX_SHADER_SAMPLER_VIEWS];
167 unsigned sampler_view_count[PIPE_SHADER_TYPES];
168
169 struct primconvert_context *primconvert;
170 struct blitter_context *blitter;
171
172 /* Blitting the wallpaper (the old contents of the framebuffer back to
173 * itself) uses a dedicated u_blitter instance versus general blit()
174 * callbacks from Gallium, as the blit() callback can trigger
175 * wallpapering without Gallium realising, which in turns u_blitter
176 * errors due to unsupported reucrsion */
177
178 struct blitter_context *blitter_wallpaper;
179 struct panfrost_job *wallpaper_batch;
180
181 struct panfrost_blend_state *blend;
182
183 struct pipe_viewport_state pipe_viewport;
184 struct pipe_scissor_state scissor;
185 struct pipe_blend_color blend_color;
186 struct pipe_depth_stencil_alpha_state *depth_stencil;
187 struct pipe_stencil_ref stencil_ref;
188
189 /* True for t6XX, false for t8xx. */
190 bool is_t6xx;
191
192 uint32_t out_sync;
193 };
194
195 /* Corresponds to the CSO */
196
197 struct panfrost_rasterizer {
198 struct pipe_rasterizer_state base;
199
200 /* Bitmask of front face, etc */
201 unsigned tiler_gl_enables;
202 };
203
/* Variants are bundled together to form the backing CSO: several shaders
 * with different emulated features baked in (alpha test parameters, etc).
 * This is the capacity of that bundle. */
#define MAX_SHADER_VARIANTS 8
208
209 /* A shader state corresponds to the actual, current variant of the shader */
210 struct panfrost_shader_state {
211 /* Compiled, mapped descriptor, ready for the hardware */
212 bool compiled;
213 struct mali_shader_meta *tripipe;
214
215 /* Non-descript information */
216 int uniform_count;
217 bool can_discard;
218 bool writes_point_size;
219 bool reads_point_coord;
220 bool reads_face;
221
222 struct mali_attr_meta varyings[PIPE_MAX_ATTRIBS];
223 gl_varying_slot varyings_loc[PIPE_MAX_ATTRIBS];
224
225 unsigned sysval_count;
226 unsigned sysval[MAX_SYSVAL_COUNT];
227
228 /* Information on this particular shader variant */
229 struct pipe_alpha_state alpha_state;
230
231 uint16_t point_sprite_mask;
232 unsigned point_sprite_upper_left : 1;
233
234 /* Should we enable helper invocations */
235 bool helper_invocations;
236
237 struct panfrost_bo *bo;
238 };
239
240 /* A collection of varyings (the CSO) */
241 struct panfrost_shader_variants {
242 /* A panfrost_shader_variants can represent a shader for
243 * either graphics or compute */
244
245 bool is_compute;
246
247 union {
248 struct pipe_shader_state base;
249 struct pipe_compute_state cbase;
250 };
251
252 struct panfrost_shader_state variants[MAX_SHADER_VARIANTS];
253 unsigned variant_count;
254
255 /* The current active variant */
256 unsigned active_variant;
257 };
258
259 struct panfrost_vertex_state {
260 unsigned num_elements;
261
262 struct pipe_vertex_element pipe[PIPE_MAX_ATTRIBS];
263 struct mali_attr_meta hw[PIPE_MAX_ATTRIBS];
264 };
265
266 struct panfrost_sampler_state {
267 struct pipe_sampler_state base;
268 struct mali_sampler_descriptor hw;
269 };
270
271 /* Misnomer: Sampler view corresponds to textures, not samplers */
272
273 struct panfrost_sampler_view {
274 struct pipe_sampler_view base;
275 struct mali_texture_descriptor hw;
276 bool manual_stride;
277 };
278
/* Downcast a Gallium context pointer to the driver context pointer.
 * This is a plain pointer cast with no checking; it relies on `base` being
 * the first member of struct panfrost_context. */
static inline struct panfrost_context *
pan_context(struct pipe_context *pcontext)
{
        struct panfrost_context *ctx = (struct panfrost_context *) pcontext;

        return ctx;
}
284
/* Context creation and draw helpers. These are declarations only; the
 * definitions live outside this header. */

/* Returns a Gallium context for `screen`.
 * NOTE(review): meaning of `priv` and `flags` is not visible here. */
struct pipe_context *panfrost_create_context(struct pipe_screen *screen,
                                             void *priv,
                                             unsigned flags);

void panfrost_emit_for_draw(struct panfrost_context *ctx,
                            bool with_vertex_data);

/* `is_tiler` presumably selects a tiler job over a vertex job -- confirm
 * in the definition. */
struct panfrost_transfer panfrost_vertex_tiler_job(struct panfrost_context *ctx,
                                                   bool is_tiler);

unsigned panfrost_get_default_swizzle(unsigned components);
296
/* Declarations only; the definitions live outside this header. */

/* NOTE(review): `fence` is an out-pointer by its type; whether it may be
 * NULL and what `flags` accepts must be checked in the definition. */
void panfrost_flush(struct pipe_context *pipe,
                    struct pipe_fence_handle **fence,
                    unsigned flags);

bool panfrost_is_scanout(struct panfrost_context *ctx);
305
306 mali_ptr panfrost_sfbd_fragment(struct panfrost_context *ctx, bool has_draws);
307 mali_ptr panfrost_mfbd_fragment(struct panfrost_context *ctx, bool has_draws);
308
309 struct bifrost_framebuffer
310 panfrost_emit_mfbd(struct panfrost_context *ctx, unsigned vertex_count);
311
312 struct mali_single_framebuffer
313 panfrost_emit_sfbd(struct panfrost_context *ctx, unsigned vertex_count);
314
315 mali_ptr
316 panfrost_fragment_job(struct panfrost_context *ctx, bool has_draws);
317
318 void
319 panfrost_shader_compile(
320 struct panfrost_context *ctx,
321 struct mali_shader_meta *meta,
322 enum pipe_shader_ir ir_type,
323 const void *ir,
324 gl_shader_stage stage,
325 struct panfrost_shader_state *state);
326
/* Work group packing helpers. Both take a work group count (num_*) and a
 * work group size (size_*) per dimension. Declarations only; the definitions
 * live outside this header. */

/* Writes into a single prefix, `out`. */
void panfrost_pack_work_groups_compute(struct mali_vertex_tiler_prefix *out,
                                       unsigned num_x,
                                       unsigned num_y,
                                       unsigned num_z,
                                       unsigned size_x,
                                       unsigned size_y,
                                       unsigned size_z);

/* Takes two prefixes, `vertex` and `tiler`.
 * NOTE(review): presumably both are written with matching values -- confirm
 * in the definition. */
void panfrost_pack_work_groups_fused(struct mali_vertex_tiler_prefix *vertex,
                                     struct mali_vertex_tiler_prefix *tiler,
                                     unsigned num_x,
                                     unsigned num_y,
                                     unsigned num_z,
                                     unsigned size_x,
                                     unsigned size_y,
                                     unsigned size_z);
347
348 /* Instancing */
349
350 mali_ptr
351 panfrost_vertex_buffer_address(struct panfrost_context *ctx, unsigned i);
352
353 void
354 panfrost_emit_vertex_data(struct panfrost_job *batch);
355
/* A (shift, odd) pair of unsigned values; returned by
 * panfrost_padded_vertex_count() and consumed by pan_expand_shift_odd().
 * NOTE(review): the encoding is not visible in this header; see the
 * definitions of those two functions. */
struct pan_shift_odd {
        unsigned shift;
        unsigned odd;
};
360
/* Declarations only; the definitions live outside this header. */

/* Maps a vertex count to a pan_shift_odd pair.
 * NOTE(review): the role of `primitive_pot` is not visible here. */
struct pan_shift_odd panfrost_padded_vertex_count(unsigned vertex_count,
                                                  bool primitive_pot);

/* Turns a pan_shift_odd pair into a single unsigned value. */
unsigned pan_expand_shift_odd(struct pan_shift_odd o);
369
/* Compute. Declaration only; the definition lives outside this header.
 * NOTE(review): presumably installs the compute-related callbacks on
 * `pctx` -- confirm in the definition. */
void panfrost_compute_context_init(struct pipe_context *pctx);
374
/* Varyings. Declaration only; the definition lives outside this header. */
void panfrost_emit_varying_descriptor(struct panfrost_context *ctx,
                                      unsigned vertex_count);
381
382 #endif