2 * © Copyright 2018 Alyssa Rosenzweig
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
/* Feature-test macro: asks the C library to expose the explicit 64-bit file
 * interfaces. It only takes effect if defined before the first system header
 * is included. */
28 #define _LARGEFILE64_SOURCE 1
/* Placeholder value (still marked TODO) — NOTE(review): 1024 is not derived
 * from anything visible here; confirm before relying on it for alignment. */
29 #define CACHE_LINE_SIZE 1024 /* TODO */
32 #include "pan_resource.h"
34 #include "pan_blend.h"
36 #include "pipe/p_compiler.h"
37 #include "pipe/p_config.h"
38 #include "pipe/p_context.h"
39 #include "pipe/p_defines.h"
40 #include "pipe/p_format.h"
41 #include "pipe/p_screen.h"
42 #include "pipe/p_state.h"
43 #include "util/u_blitter.h"
44 #include "util/hash_table.h"
46 #include "midgard/midgard_compile.h"
47 #include "compiler/shader_enums.h"
/* Forward declaration so this header can hold a pointer to the primitive
 * conversion helper without pulling in its header. The tag has to match the
 * `struct primconvert_context *primconvert` member of panfrost_context; the
 * former spelling (prim_convert_context) declared an unrelated type that
 * nothing in this header refers to. */
struct primconvert_context;
/* Upper bound related to varyings — NOTE(review): whether this counts slots
 * or bytes is not visible from here; confirm against its users. */
52 #define MAX_VARYINGS 4096
/* Dirty-state flags, one bit each. Bits 0 (CLEAR) and 7 (VIEWPORT) are
 * currently commented out and bit 1 is unassigned, so the live flags are
 * bits 2-6 and 8-9. */
54 //#define PAN_DIRTY_CLEAR (1 << 0)
55 #define PAN_DIRTY_RASTERIZER (1 << 2)
56 #define PAN_DIRTY_FS (1 << 3)
/* Alias of PAN_DIRTY_FS: both names refer to the same bit. */
57 #define PAN_DIRTY_FRAG_CORE (PAN_DIRTY_FS) /* Dirty writes are tied */
58 #define PAN_DIRTY_VS (1 << 4)
59 #define PAN_DIRTY_VERTEX (1 << 5)
60 #define PAN_DIRTY_VERT_BUF (1 << 6)
61 //#define PAN_DIRTY_VIEWPORT (1 << 7)
62 #define PAN_DIRTY_SAMPLERS (1 << 8)
63 #define PAN_DIRTY_TEXTURES (1 << 9)
65 #define SET_BIT(lval, bit, cond) \
71 struct panfrost_constant_buffer
{
/* Constant-buffer state: one Gallium pipe_constant_buffer per slot,
 * PIPE_MAX_CONSTANT_BUFFERS slots in total. */
72 struct pipe_constant_buffer cb
[PIPE_MAX_CONSTANT_BUFFERS
];
/* NOTE(review): presumably bit i is set while cb[i] holds a bound buffer —
 * confirm against the code that writes this mask. */
73 uint32_t enabled_mask
;
/* Driver-side query object. It groups the values passed through from
 * Gallium, 64-bit counters for queries computed by the driver, and the memory
 * the GPU writes its result into. */
77 struct panfrost_query
{
78 /* Passthrough from Gallium */
83 /* For computed queries. 64-bit to prevent overflow */
89 /* Memory for the GPU to writeback the value of the query */
90 struct panfrost_transfer transfer
;
/* Fence object. `reference` is a Gallium pipe_reference —
 * NOTE(review): presumably the fence is reference-counted through it;
 * confirm against the fence reference/unreference helpers. */
94 struct panfrost_fence
{
95 struct pipe_reference reference
;
/* Stream-output state: up to PIPE_MAX_SO_BUFFERS targets with a parallel
 * array of offsets. */
99 struct panfrost_streamout
{
100 struct pipe_stream_output_target
*targets
[PIPE_MAX_SO_BUFFERS
];
/* offsets[i] pairs with targets[i] — NOTE(review): units are presumably
 * bytes; confirm. */
101 uint32_t offsets
[PIPE_MAX_SO_BUFFERS
];
/* NOTE(review): presumably the number of valid leading entries in
 * targets[] — confirm. */
102 unsigned num_targets
;
/* Per-context driver state: the embedded Gallium context plus the currently
 * bound state objects, per-stage resources, and the payloads built for each
 * draw. */
105 struct panfrost_context
{
106 /* Gallium context. Must remain the first member: pan_context() casts a
 * struct pipe_context * straight to a struct panfrost_context *. */
107 struct pipe_context base
;
109 /* Compiler context */
110 struct midgard_screen compiler
;
112 /* Bound job and map of panfrost_job_key to jobs */
113 struct panfrost_job
*job
;
114 struct hash_table
*jobs
;
116 /* Map: panfrost_resource -> panfrost_job */
117 struct hash_table
*write_jobs
;
119 /* Grid info, used within a launch_grid call.
 * NOTE(review): presumably unset outside of launch_grid — confirm. */
120 const struct pipe_grid_info
*compute_grid
;
122 /* Bit mask for supported PIPE_DRAW for this hardware */
125 struct pipe_framebuffer_state pipe_framebuffer
;
126 struct panfrost_streamout streamout
;
/* Context-owned memory regions, named after their use. */
128 struct panfrost_memory cmdstream_persistent
;
129 struct panfrost_memory scratchpad
;
130 struct panfrost_memory tiler_heap
;
131 struct panfrost_memory tiler_dummy
;
132 struct panfrost_memory depth_stencil_buffer
;
/* Primitive counters and the occlusion query —
 * NOTE(review): presumably the currently active query; confirm. */
135 uint64_t prims_generated
;
136 uint64_t tf_prims_generated
;
137 struct panfrost_query
*occlusion_query
;
139 /* Each draw has corresponding vertex and tiler payloads */
140 struct midgard_payload_vertex_tiler payloads
[PIPE_SHADER_TYPES
];
142 /* The fragment shader binary itself is pointed here (for the tripipe) but
143 * also everything else in the shader core, including blending, the
144 * stencil/depth tests, etc. Refer to the presentations. */
146 struct mali_shader_meta fragment_shader_core
;
148 /* Per-draw dirty flags are set up like in any other driver */
151 unsigned vertex_count
;
152 unsigned instance_count
;
154 /* If instancing is enabled, vertex count padded for instance; if
155 * it is disabled, just equal to plain vertex count */
156 unsigned padded_count
;
158 union mali_attr attributes
[PIPE_MAX_ATTRIBS
];
160 /* TODO: Multiple uniform buffers (index =/= 0), finer updates? */
162 struct panfrost_constant_buffer constant_buffer
[PIPE_SHADER_TYPES
];
/* Currently bound state objects; the per-stage arrays are indexed by shader
 * stage (PIPE_SHADER_TYPES entries). */
164 struct panfrost_rasterizer
*rasterizer
;
165 struct panfrost_shader_variants
*shader
[PIPE_SHADER_TYPES
];
166 struct panfrost_vertex_state
*vertex
;
168 struct pipe_vertex_buffer vertex_buffers
[PIPE_MAX_ATTRIBS
];
/* Shader buffers per stage. NOTE(review): ssbo_mask[stage] presumably has
 * bit i set when ssbo[stage][i] is bound — confirm. */
171 struct pipe_shader_buffer ssbo
[PIPE_SHADER_TYPES
][PIPE_MAX_SHADER_BUFFERS
];
172 uint32_t ssbo_mask
[PIPE_SHADER_TYPES
];
/* Samplers and sampler views per stage, each with a per-stage count. */
174 struct panfrost_sampler_state
*samplers
[PIPE_SHADER_TYPES
][PIPE_MAX_SAMPLERS
];
175 unsigned sampler_count
[PIPE_SHADER_TYPES
];
177 struct panfrost_sampler_view
*sampler_views
[PIPE_SHADER_TYPES
][PIPE_MAX_SHADER_SAMPLER_VIEWS
];
178 unsigned sampler_view_count
[PIPE_SHADER_TYPES
];
180 struct primconvert_context
*primconvert
;
181 struct blitter_context
*blitter
;
183 /* Blitting the wallpaper (the old contents of the framebuffer back to
184 * itself) uses a dedicated u_blitter instance, separate from the one
185 * used for general blit() callbacks from Gallium, as the blit() callback
186 * can trigger wallpapering without Gallium realising, which in turn makes
187 * u_blitter error out due to unsupported recursion */
189 struct blitter_context
*blitter_wallpaper
;
190 struct panfrost_job
*wallpaper_batch
;
192 struct panfrost_blend_state
*blend
;
/* Remaining fixed-function state, stored as the Gallium structures. */
194 struct pipe_viewport_state pipe_viewport
;
195 struct pipe_scissor_state scissor
;
196 struct pipe_blend_color blend_color
;
197 struct pipe_depth_stencil_alpha_state
*depth_stencil
;
198 struct pipe_stencil_ref stencil_ref
;
200 /* True for t6XX, false for t8xx. */
206 /* Rasterizer state object: corresponds to the Gallium CSO, stored in
 * `base`, plus a driver-side bitmask derived for the tiler. */
208 struct panfrost_rasterizer
{
209 struct pipe_rasterizer_state base
;
211 /* Bitmask of front face, etc */
212 unsigned tiler_gl_enables
;
215 /* Variants bundle together to form the backing CSO, bundling multiple
216 * shaders with varying emulated features baked in (alpha test
217 * parameters, etc). MAX_SHADER_VARIANTS is the capacity of the
 * variants[] array in struct panfrost_shader_variants. */
218 #define MAX_SHADER_VARIANTS 8
220 /* A shader state corresponds to the actual, current variant of the shader:
 * its hardware descriptor, information about the shader's inputs and
 * outputs, and the parameters this variant was built for. */
221 struct panfrost_shader_state
{
222 /* Compiled, mapped descriptor, ready for the hardware */
224 struct mali_shader_meta
*tripipe
;
226 /* Non-descript information */
229 bool writes_point_size
;
230 bool reads_point_coord
;
/* Varying descriptors and their GL slot locations; the two arrays are
 * parallel — NOTE(review): presumably indexed by the same varying index;
 * confirm. */
233 struct mali_attr_meta varyings
[PIPE_MAX_ATTRIBS
];
234 gl_varying_slot varyings_loc
[PIPE_MAX_ATTRIBS
];
/* System values used by the shader — NOTE(review): sysval_count is presumably
 * the number of valid entries in sysval[]; confirm. */
236 unsigned sysval_count
;
237 unsigned sysval
[MAX_SYSVAL_COUNT
];
239 /* Information on this particular shader variant */
240 struct pipe_alpha_state alpha_state
;
242 uint16_t point_sprite_mask
;
/* Single-bit flag. */
243 unsigned point_sprite_upper_left
: 1;
245 /* Should we enable helper invocations */
246 bool helper_invocations
;
/* NOTE(review): presumably the buffer object backing the compiled shader —
 * confirm. */
248 struct panfrost_bo
*bo
;
251 /* A collection of variants (the CSO): up to MAX_SHADER_VARIANTS compiled
 * shader states plus the index of the one currently in use. */
252 struct panfrost_shader_variants
{
253 /* A panfrost_shader_variants can represent a shader for
254 * either graphics or compute */
/* `base` is the Gallium state for graphics shaders and `cbase` the one for
 * compute — NOTE(review): whether the two overlap in storage is not visible
 * here; confirm. */
259 struct pipe_shader_state base
;
260 struct pipe_compute_state cbase
;
/* NOTE(review): variant_count is presumably the number of populated entries
 * in variants[] — confirm. */
263 struct panfrost_shader_state variants
[MAX_SHADER_VARIANTS
];
264 unsigned variant_count
;
266 /* The current active variant */
267 unsigned active_variant
;
/* Vertex element state: the Gallium vertex elements (`pipe`) alongside a
 * hardware attribute descriptor array of the same capacity (`hw`). */
270 struct panfrost_vertex_state
{
/* NOTE(review): presumably the number of valid entries in pipe[] and hw[] —
 * confirm. */
271 unsigned num_elements
;
273 struct pipe_vertex_element pipe
[PIPE_MAX_ATTRIBS
];
274 struct mali_attr_meta hw
[PIPE_MAX_ATTRIBS
];
/* Sampler state object: the Gallium sampler state (`base`) paired with a
 * hardware sampler descriptor (`hw`). */
277 struct panfrost_sampler_state
{
278 struct pipe_sampler_state base
;
279 struct mali_sampler_descriptor hw
;
282 /* Misnomer: a sampler view corresponds to a texture, not a sampler. It
 * pairs the Gallium sampler view (`base`) with a hardware texture
 * descriptor (`hw`). */
284 struct panfrost_sampler_view
{
285 struct pipe_sampler_view base
;
286 struct mali_texture_descriptor hw
;
/* Converts a Gallium context pointer into the driver's context pointer.
 * This is a plain pointer cast with no checking; it relies on `base` being
 * the first member of struct panfrost_context, so the caller must pass a
 * pipe_context that is embedded in a panfrost_context. */
290 static inline struct panfrost_context
*
291 pan_context(struct pipe_context
*pcontext
)
293 return (struct panfrost_context
*) pcontext
;
/* Context constructor: takes the screen, an opaque private pointer and a
 * flags word, and returns a struct pipe_context *.
 * NOTE(review): presumably returns the `base` member of a newly created
 * panfrost_context; failure behaviour is not visible here — confirm. */
296 struct pipe_context
*
297 panfrost_create_context(struct pipe_screen
*screen
, void *priv
, unsigned flags
);
300 panfrost_emit_for_draw(struct panfrost_context
*ctx
, bool with_vertex_data
);
/* Returns a struct panfrost_transfer by value.
 * NOTE(review): `is_tiler` presumably selects between building the tiler job
 * (true) and the vertex job (false) — confirm against the definition. */
302 struct panfrost_transfer
303 panfrost_vertex_tiler_job(struct panfrost_context
*ctx
, bool is_tiler
);
306 panfrost_get_default_swizzle(unsigned components
);
310 struct pipe_context
*pipe
,
311 struct pipe_fence_handle
**fence
,
315 panfrost_is_scanout(struct panfrost_context
*ctx
);
/* SFBD and MFBD counterparts with identical signatures; each returns a
 * mali_ptr.
 * NOTE(review): presumably the GPU address of the emitted fragment payload
 * for the single- and multi-framebuffer descriptor paths respectively;
 * `has_draws` semantics are not visible here — confirm. */
317 mali_ptr
panfrost_sfbd_fragment(struct panfrost_context
*ctx
, bool has_draws
);
318 mali_ptr
panfrost_mfbd_fragment(struct panfrost_context
*ctx
, bool has_draws
);
/* Framebuffer descriptor builders. Each returns its descriptor structure by
 * value: struct bifrost_framebuffer for the MFBD path and
 * struct mali_single_framebuffer for the SFBD path.
 * NOTE(review): how `vertex_count` influences the descriptor is not visible
 * here — confirm against the definitions. */
320 struct bifrost_framebuffer
321 panfrost_emit_mfbd(struct panfrost_context
*ctx
, unsigned vertex_count
);
323 struct mali_single_framebuffer
324 panfrost_emit_sfbd(struct panfrost_context
*ctx
, unsigned vertex_count
);
327 panfrost_fragment_job(struct panfrost_context
*ctx
, bool has_draws
);
330 panfrost_shader_compile(
331 struct panfrost_context
*ctx
,
332 struct mali_shader_meta
*meta
,
333 enum pipe_shader_ir ir_type
,
335 gl_shader_stage stage
,
336 struct panfrost_shader_state
*state
,
337 uint64_t *outputs_written
);
340 panfrost_pack_work_groups_compute(
341 struct mali_vertex_tiler_prefix
*out
,
350 panfrost_pack_work_groups_fused(
351 struct mali_vertex_tiler_prefix
*vertex
,
352 struct mali_vertex_tiler_prefix
*tiler
,
363 panfrost_vertex_buffer_address(struct panfrost_context
*ctx
, unsigned i
);
366 panfrost_emit_vertex_data(struct panfrost_job
*batch
);
368 struct pan_shift_odd
{
374 panfrost_padded_vertex_count(
375 unsigned vertex_count
,
380 pan_expand_shift_odd(struct pan_shift_odd o
);
385 panfrost_compute_context_init(struct pipe_context
*pctx
);
390 panfrost_emit_varying_descriptor(
391 struct panfrost_context
*ctx
,
392 unsigned vertex_count
);