2 * © Copyright 2018 Alyssa Rosenzweig
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
/* Feature-test macro, defined ahead of the #include lines that follow. */
30 #define _LARGEFILE64_SOURCE 1
/* Cache line size constant; the value is flagged as provisional by the TODO.
 * NOTE(review): the unit is not stated anywhere in the visible header. */
31 #define CACHE_LINE_SIZE 1024 /* TODO */
34 #include "pan_resource.h"
36 #include "pipe/p_compiler.h"
37 #include "pipe/p_config.h"
38 #include "pipe/p_context.h"
39 #include "pipe/p_defines.h"
40 #include "pipe/p_format.h"
41 #include "pipe/p_screen.h"
42 #include "pipe/p_state.h"
43 #include "util/u_blitter.h"
45 /* Forward declare to avoid extra header dep. The tag has to be spelled
 * exactly like the one used by the `primconvert` member of
 * struct panfrost_context (struct primconvert_context); a differently
 * spelled tag would only declare an unrelated, unused type. */
46 struct primconvert_context
;
48 /* TODO: Handle on newer hardware */
/* Selects the default framebuffer descriptor kind (PANFROST_DEFAULT_FBD) and
 * the matching descriptor struct type (PANFROST_FRAMEBUFFER, used for the
 * vt_framebuffer member of struct panfrost_context).
 * NOTE(review): both alternatives (MFBD / bifrost_framebuffer and SFBD /
 * mali_single_framebuffer) appear back to back with no visible preprocessor
 * conditional; presumably a conditional selecting one of the two pairs
 * belongs around them -- confirm against the upstream file. */
50 #define PANFROST_DEFAULT_FBD (MALI_MFBD)
51 #define PANFROST_FRAMEBUFFER struct bifrost_framebuffer
53 #define PANFROST_DEFAULT_FBD (MALI_SFBD)
54 #define PANFROST_FRAMEBUFFER struct mali_single_framebuffer
/* Capacity of the vertex_jobs / tiler_jobs / u_vertex_jobs / u_tiler_jobs
 * arrays in struct panfrost_context. */
57 #define MAX_DRAW_CALLS 4096
/* Capacity of the varyings_stride array in struct panfrost_varyings. */
58 #define MAX_VARYINGS 4096
/* Dirty-state bit flags, one bit per piece of state. Bits 0 (clear) and 7
 * (viewport) are commented out, and bit 1 has no definition in this list.
 * PAN_DIRTY_FRAG_CORE is an alias for PAN_DIRTY_FS, not a separate bit. */
60 //#define PAN_DIRTY_CLEAR (1 << 0)
61 #define PAN_DIRTY_RASTERIZER (1 << 2)
62 #define PAN_DIRTY_FS (1 << 3)
63 #define PAN_DIRTY_FRAG_CORE (PAN_DIRTY_FS) /* Dirty writes are tied */
64 #define PAN_DIRTY_VS (1 << 4)
65 #define PAN_DIRTY_VERTEX (1 << 5)
66 #define PAN_DIRTY_VERT_BUF (1 << 6)
67 //#define PAN_DIRTY_VIEWPORT (1 << 7)
68 #define PAN_DIRTY_SAMPLERS (1 << 8)
69 #define PAN_DIRTY_TEXTURES (1 << 9)
/* Constant buffer state; struct panfrost_context holds one of these per
 * PIPE_SHADER_TYPES entry in its constant_buffer array.
 * NOTE(review): no members and no closing brace are visible in this copy of
 * the header -- confirm the field list against the upstream file. */
71 struct panfrost_constant_buffer
{
/* Query object; struct panfrost_context keeps a pointer to one of these as
 * its occlusion_query member. */
77 struct panfrost_query
{
78 /* Passthrough from Gallium */
/* NOTE(review): the members introduced by the comment above are not visible
 * in this copy -- confirm against the upstream file. */
82 /* Memory for the GPU to writeback the value of the query */
83 struct panfrost_transfer transfer
;
/* Upper bound on the number of memory blocks one transient pool can
 * reference; sizes the entries array below. */
86 #define PANFROST_MAX_TRANSIENT_ENTRIES 64
/* A pool of memory entries. struct panfrost_context holds an array of two of
 * these (transient_pools). */
88 struct panfrost_transient_pool
{
89 /* Memory blocks in the pool */
90 struct panfrost_memory_entry
*entries
[PANFROST_MAX_TRANSIENT_ENTRIES
];
92 /* Number of entries we own */
95 /* Current entry that we are writing to, zero-indexed, strictly less than entry_count */
98 /* Number of bytes into the current entry we are */
101 /* Entry size (all entries must be homogeneous) */
/* NOTE(review): the four fields described by the comments above (and the
 * closing brace) are not visible in this copy -- confirm their names and
 * types against the upstream file. */
/* Driver context. Embeds the Gallium pipe_context as `base` (the first
 * visible member, which is what the pan_context() cast relies on) and carries
 * the memory pools, framebuffer descriptors, job lists and currently bound
 * state objects declared below. */
105 struct panfrost_context
{
106 /* Gallium context */
107 struct pipe_context base
;
109 /* Bit mask for supported PIPE_DRAW for this hardware */
/* NOTE(review): the member described by the comment above is not visible in
 * this copy -- confirm against the upstream file. */
112 struct pipe_framebuffer_state pipe_framebuffer
;
114 /* The number of concurrent FBOs allowed depends on the number of pools
115 * used; pools are ringed for parallelism opportunities */
117 struct panfrost_transient_pool transient_pools
[2];
/* Memory regions owned by the context, one struct panfrost_memory each. */
120 struct panfrost_memory cmdstream_persistent
;
121 struct panfrost_memory shaders
;
122 struct panfrost_memory scratchpad
;
123 struct panfrost_memory tiler_heap
;
124 struct panfrost_memory varying_mem
;
125 struct panfrost_memory misc_0
;
126 struct panfrost_memory misc_1
;
127 struct panfrost_memory depth_stencil_buffer
;
/* NOTE(review): presumably the pending clear colour -- confirm with users. */
131 const union pipe_color_union
*color
;
136 struct panfrost_query
*occlusion_query
;
138 /* Each render job has multiple framebuffer descriptors associated with
139 * it, used for various purposes with more or less the same format. The
140 * most obvious is the fragment framebuffer descriptor, which carries
141 * e.g. clearing information */
/* NOTE(review): fragment_fbd is declared twice below with different types and
 * no visible preprocessor conditional; presumably one declaration per
 * framebuffer-descriptor flavour (compare PANFROST_FRAMEBUFFER) -- confirm. */
144 struct mali_single_framebuffer fragment_fbd
;
146 struct bifrost_framebuffer fragment_fbd
;
148 struct bifrost_fb_extra fragment_extra
;
150 struct bifrost_render_target fragment_rts
[4];
153 /* Each draw has corresponding vertex and tiler payloads */
154 struct midgard_payload_vertex_tiler payload_vertex
;
155 struct midgard_payload_vertex_tiler payload_tiler
;
157 /* The fragment shader binary itself is pointed here (for the tripipe) but
158 * also everything else in the shader core, including blending, the
159 * stencil/depth tests, etc. Refer to the presentations. */
161 struct mali_shader_meta fragment_shader_core
;
163 /* A frame is composed of a starting set value job, a number of vertex
164 * and tiler jobs, linked to the fragment job at the end. See the
165 * presentations for more information how this works */
/* Job lists: the mali_ptr arrays and the u_* descriptor-header pointer arrays
 * have the same MAX_DRAW_CALLS capacity.
 * NOTE(review): presumably the mali_ptr values are GPU addresses and the u_*
 * pointers are the CPU mappings of the same jobs -- confirm. */
169 mali_ptr set_value_job
;
170 mali_ptr vertex_jobs
[MAX_DRAW_CALLS
];
171 mali_ptr tiler_jobs
[MAX_DRAW_CALLS
];
173 struct mali_job_descriptor_header
*u_set_value_job
;
174 struct mali_job_descriptor_header
*u_vertex_jobs
[MAX_DRAW_CALLS
];
175 struct mali_job_descriptor_header
*u_tiler_jobs
[MAX_DRAW_CALLS
];
177 unsigned vertex_job_count
;
178 unsigned tiler_job_count
;
180 /* Per-draw Dirty flags are setup like any other driver */
183 /* Per frame dirty flag - whether there was a clear. If not, we need to do a partial update, maybe */
/* NOTE(review): the members described by the two comments above are not
 * visible in this copy -- confirm against the upstream file. */
186 unsigned vertex_count
;
188 union mali_attr attributes
[PIPE_MAX_ATTRIBS
];
190 unsigned varying_height
;
192 struct mali_viewport
*viewport
;
193 PANFROST_FRAMEBUFFER vt_framebuffer
;
195 /* TODO: Multiple uniform buffers (index =/= 0), finer updates? */
197 struct panfrost_constant_buffer constant_buffer
[PIPE_SHADER_TYPES
];
/* Pointers to the state objects declared later in this header. */
200 struct panfrost_rasterizer
*rasterizer
;
202 struct panfrost_shader_variants
*vs
;
203 struct panfrost_shader_variants
*fs
;
205 struct panfrost_vertex_state
*vertex
;
207 struct pipe_vertex_buffer
*vertex_buffers
;
208 unsigned vertex_buffer_count
;
/* Sampler and sampler-view tables are indexed first by shader type, then by
 * slot; the *_count arrays hold one count per shader type. */
210 struct panfrost_sampler_state
*samplers
[PIPE_SHADER_TYPES
][PIPE_MAX_SAMPLERS
];
211 unsigned sampler_count
[PIPE_SHADER_TYPES
];
213 struct panfrost_sampler_view
*sampler_views
[PIPE_SHADER_TYPES
][PIPE_MAX_SHADER_SAMPLER_VIEWS
];
214 unsigned sampler_view_count
[PIPE_SHADER_TYPES
];
216 struct primconvert_context
*primconvert
;
217 struct blitter_context
*blitter
;
219 struct panfrost_blend_state
*blend
;
/* Gallium state kept by value (depth_stencil is kept by pointer). */
221 struct pipe_viewport_state pipe_viewport
;
222 struct pipe_scissor_state scissor
;
223 struct pipe_blend_color blend_color
;
224 struct pipe_depth_stencil_alpha_state
*depth_stencil
;
225 struct pipe_stencil_ref stencil_ref
;
228 /* Corresponds to the CSO */
/* Rasterizer state: the Gallium pipe_rasterizer_state plus a driver-side
 * bitmask. struct panfrost_context points at the current one via its
 * rasterizer member. */
230 struct panfrost_rasterizer
{
231 struct pipe_rasterizer_state base
;
233 /* Bitmask of front face, etc */
234 unsigned tiler_gl_enables
;
/* Blend state: the Gallium pipe_blend_state plus both compiled forms of it,
 * a fixed-function equation and a blend shader. has_blend_shader records
 * whether a blend shader is in use. */
237 struct panfrost_blend_state
{
238 struct pipe_blend_state base
;
240 /* Whether a blend shader is in use */
241 bool has_blend_shader
;
243 /* Compiled fixed function command */
244 struct mali_blend_equation equation
;
246 /* Compiled blend shader */
247 mali_ptr blend_shader
;
/* NOTE(review): presumably a count tied to the blend shader above (the name
 * suggests work registers) -- confirm against the code that fills it in. */
248 int blend_work_count
;
251 /* Internal varyings descriptor */
252 struct panfrost_varyings
{
253 /* Varyings information: stride of each chunk of memory used for
254 * varyings (similar structure with attributes). Count is just the
255 * number of vec4's. Buffer count is the number of varying chunks (<=
256 * count). Height is used to calculate gl_Position's position ("it's
257 * not a pun, Alyssa!"). Vertex-only varyings == descriptor for
258 * gl_Position and something else apparently occupying the same space.
259 * Varyings == main varyings descriptors following typical mali_attr
 * conventions.
 * NOTE(review): the tail of the sentence above was missing and has been
 * reconstructed -- confirm. The comment is terminated here so that the
 * three member declarations that follow are compiled instead of being
 * swallowed by an unterminated comment. */
262 unsigned varyings_stride
[MAX_VARYINGS
];
263 unsigned varying_count
;
264 unsigned varying_buffer_count
;
266 /* Map of the actual varyings buffer */
267 uint8_t *varyings_buffer_cpu
;
268 mali_ptr varyings_descriptor
;
269 mali_ptr varyings_descriptor_fragment
;
272 /* Variants bundle together to form the backing CSO, bundling multiple
273 * shaders with varying emulated features baked in (alpha test
274 * parameters, etc) */
/* Capacity of the variants array in struct panfrost_shader_variants. */
275 #define MAX_SHADER_VARIANTS 8
277 /* A shader state corresponds to the actual, current variant of the shader */
/* One compiled variant. struct panfrost_shader_variants stores up to
 * MAX_SHADER_VARIANTS of these by value. */
278 struct panfrost_shader_state
{
279 struct pipe_shader_state
*base
;
281 /* Compiled, mapped descriptor, ready for the hardware */
/* NOTE(review): presumably tripipe is the CPU-side pointer and tripipe_gpu
 * the GPU address of the same descriptor -- confirm. */
283 struct mali_shader_meta
*tripipe
;
284 mali_ptr tripipe_gpu
;
286 /* Non-descript information */
/* NOTE(review): further members may belong to this group; only
 * writes_point_size is visible in this copy. */
289 bool writes_point_size
;
291 /* Valid for vertex shaders only due to when this is calculated */
292 struct panfrost_varyings varyings
;
294 /* Information on this particular shader variant */
295 struct pipe_alpha_state alpha_state
;
298 /* A collection of variants (the CSO) */
/* Holds the Gallium pipe_shader_state by value together with a fixed-capacity
 * array of compiled variants. struct panfrost_context points at one of these
 * for each of its vs and fs members. */
299 struct panfrost_shader_variants
{
300 struct pipe_shader_state base
;
302 struct panfrost_shader_state variants
[MAX_SHADER_VARIANTS
];
/* NOTE(review): presumably the number of populated slots in variants --
 * confirm. */
303 unsigned variant_count
;
305 /* The current active variant */
/* NOTE(review): presumably an index into variants -- confirm. */
306 unsigned active_variant
;
/* Vertex element state: the Gallium vertex elements, a per-element component
 * count, and the hardware attribute metadata. The pipe and nr_components
 * arrays share the PIPE_MAX_ATTRIBS capacity. */
309 struct panfrost_vertex_state
{
/* NOTE(review): presumably the number of valid entries in the arrays below
 * -- confirm. */
310 unsigned num_elements
;
312 struct pipe_vertex_element pipe
[PIPE_MAX_ATTRIBS
];
313 int nr_components
[PIPE_MAX_ATTRIBS
];
315 /* The actual attribute meta, prebaked and GPU mapped. TODO: Free memory */
316 struct mali_attr_meta
*hw
;
317 mali_ptr descriptor_ptr
;
/* Sampler state: the Gallium pipe_sampler_state paired with the hardware
 * sampler descriptor, both stored by value. */
320 struct panfrost_sampler_state
{
321 struct pipe_sampler_state base
;
322 struct mali_sampler_descriptor hw
;
325 /* Misnomer: Sampler view corresponds to textures, not samplers */
/* Sampler view: the Gallium pipe_sampler_view paired with the hardware
 * texture descriptor, both stored by value. */
327 struct panfrost_sampler_view
{
328 struct pipe_sampler_view base
;
329 struct mali_texture_descriptor hw
;
/* Convert a Gallium pipe_context pointer to the driver's panfrost_context
 * pointer type with a plain, unchecked cast.
 * NOTE(review): presumably valid because `base` is the first member of
 * struct panfrost_context -- confirm callers only pass contexts created by
 * this driver. The braces of the function body are not visible in this
 * copy. */
332 static inline struct panfrost_context
*
333 pan_context(struct pipe_context
*pcontext
)
335 return (struct panfrost_context
*) pcontext
;
/* Convert a Gallium pipe_screen pointer to a struct panfrost_screen pointer
 * with a plain, unchecked cast. struct panfrost_screen is not defined in the
 * visible part of this header.
 * NOTE(review): the braces of the function body are not visible in this
 * copy. */
338 static inline struct panfrost_screen
*
339 pan_screen(struct pipe_screen
*p
)
341 return (struct panfrost_screen
*)p
;
/* Context constructor prototype: takes the screen, an opaque priv pointer and
 * a flags word, and returns a pipe_context pointer. Only the declaration is
 * present here. */
344 struct pipe_context
*
345 panfrost_create_context(struct pipe_screen
*screen
, void *priv
, unsigned flags
);
/* Prototype taking the context and a with_vertex_data flag.
 * NOTE(review): the return type line is not visible in this copy -- confirm
 * against the upstream file. */
348 panfrost_emit_for_draw(struct panfrost_context
*ctx
, bool with_vertex_data
);
/* Prototype returning a struct panfrost_transfer by value; takes the context
 * plus the is_tiler and is_elided_tiler flags.
 * NOTE(review): presumably is_tiler selects between the vertex and the tiler
 * job -- confirm against the definition. */
350 struct panfrost_transfer
351 panfrost_vertex_tiler_job(struct panfrost_context
*ctx
, bool is_tiler
, bool is_elided_tiler
);
/* Prototype taking a component count.
 * NOTE(review): the return type line is not visible in this copy -- confirm
 * against the upstream file. */
354 panfrost_get_default_swizzle(unsigned components
);
358 struct pipe_context
*pipe
,
359 struct pipe_fence_handle
**fence
,
/* Prototype taking only the context.
 * NOTE(review): the return type line is not visible in this copy -- confirm
 * against the upstream file. */
363 panfrost_fragment_job(struct panfrost_context
*ctx
);
/* Shader compile prototype: takes the context, a mali_shader_meta pointer,
 * the shader source as a const string, an integer type, and a
 * panfrost_shader_state pointer.
 * NOTE(review): the return type line is not visible in this copy, and the
 * meaning of `type` is not established here -- confirm both against the
 * definition. */
366 panfrost_shader_compile(struct panfrost_context
*ctx
, struct mali_shader_meta
*meta
, const char *src
, int type
, struct panfrost_shader_state
*state
);