2 * © Copyright 2018 Alyssa Rosenzweig
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
28 #define _LARGEFILE64_SOURCE 1
29 #define CACHE_LINE_SIZE 1024 /* TODO */
32 #include "pan_resource.h"
35 #include "pipe/p_compiler.h"
36 #include "pipe/p_config.h"
37 #include "pipe/p_context.h"
38 #include "pipe/p_defines.h"
39 #include "pipe/p_format.h"
40 #include "pipe/p_screen.h"
41 #include "pipe/p_state.h"
42 #include "util/u_blitter.h"
43 #include "util/hash_table.h"
45 #include "midgard/midgard_compile.h"
/* Forward declare to avoid an extra header dependency. The tag has to match
 * the `struct primconvert_context *primconvert` member of
 * struct panfrost_context; only a pointer is stored, so an incomplete type
 * is sufficient here. */
struct primconvert_context;
50 #define MAX_DRAW_CALLS 4096
51 #define MAX_VARYINGS 4096
53 //#define PAN_DIRTY_CLEAR (1 << 0)
54 #define PAN_DIRTY_RASTERIZER (1 << 2)
55 #define PAN_DIRTY_FS (1 << 3)
56 #define PAN_DIRTY_FRAG_CORE (PAN_DIRTY_FS) /* Dirty writes are tied */
57 #define PAN_DIRTY_VS (1 << 4)
58 #define PAN_DIRTY_VERTEX (1 << 5)
59 #define PAN_DIRTY_VERT_BUF (1 << 6)
60 //#define PAN_DIRTY_VIEWPORT (1 << 7)
61 #define PAN_DIRTY_SAMPLERS (1 << 8)
62 #define PAN_DIRTY_TEXTURES (1 << 9)
64 #define SET_BIT(lval, bit, cond) \
70 struct panfrost_constant_buffer
{
76 struct panfrost_query
{
77 /* Passthrough from Gallium */
81 /* Memory for the GPU to writeback the value of the query */
82 struct panfrost_transfer transfer
;
85 struct panfrost_fence
{
86 struct pipe_reference reference
;
90 #define PANFROST_MAX_TRANSIENT_ENTRIES 64
92 struct panfrost_transient_pool
{
93 /* Memory blocks in the pool */
94 struct panfrost_memory_entry
*entries
[PANFROST_MAX_TRANSIENT_ENTRIES
];
96 /* Number of entries we own */
99 /* Current entry that we are writing to, zero-indexed, strictly less than entry_count */
100 unsigned entry_index
;
102 /* Number of bytes into the current entry we are */
105 /* Entry size (all entries must be homogeneous) */
109 struct panfrost_context
{
110 /* Gallium context */
111 struct pipe_context base
;
113 /* Bound job and map of panfrost_job_key to jobs */
114 struct panfrost_job
*job
;
115 struct hash_table
*jobs
;
117 /* panfrost_resource -> panfrost_job */
118 struct hash_table
*write_jobs
;
120 /* Bit mask for supported PIPE_DRAW for this hardware */
123 struct pipe_framebuffer_state pipe_framebuffer
;
125 /* The number of concurrent FBOs allowed depends on the number of pools
126 * used; pools are ringed for parallelism opportunities */
128 struct panfrost_transient_pool transient_pools
[2];
131 struct panfrost_memory cmdstream_persistent
;
132 struct panfrost_memory shaders
;
133 struct panfrost_memory scratchpad
;
134 struct panfrost_memory tiler_heap
;
135 struct panfrost_memory varying_mem
;
136 struct panfrost_memory tiler_polygon_list
;
137 struct panfrost_memory tiler_dummy
;
138 struct panfrost_memory depth_stencil_buffer
;
140 struct panfrost_query
*occlusion_query
;
142 /* Each draw has corresponding vertex and tiler payloads */
143 struct midgard_payload_vertex_tiler payload_vertex
;
144 struct midgard_payload_vertex_tiler payload_tiler
;
146 /* The fragment shader binary itself is pointed here (for the tripipe) but
147 * also everything else in the shader core, including blending, the
148 * stencil/depth tests, etc. Refer to the presentations. */
150 struct mali_shader_meta fragment_shader_core
;
152 /* A frame is composed of a starting set value job, a number of vertex
153 * and tiler jobs, linked to the fragment job at the end. See the
154 * presentations for more information on how this works */
158 mali_ptr set_value_job
;
159 mali_ptr vertex_jobs
[MAX_DRAW_CALLS
];
160 mali_ptr tiler_jobs
[MAX_DRAW_CALLS
];
162 struct mali_job_descriptor_header
*u_set_value_job
;
163 struct mali_job_descriptor_header
*u_vertex_jobs
[MAX_DRAW_CALLS
];
164 struct mali_job_descriptor_header
*u_tiler_jobs
[MAX_DRAW_CALLS
];
166 unsigned vertex_job_count
;
167 unsigned tiler_job_count
;
169 /* Per-draw dirty flags are set up as in any other driver */
172 unsigned vertex_count
;
174 union mali_attr attributes
[PIPE_MAX_ATTRIBS
];
176 unsigned varying_height
;
178 struct mali_single_framebuffer vt_framebuffer_sfbd
;
179 struct bifrost_framebuffer vt_framebuffer_mfbd
;
181 /* TODO: Multiple uniform buffers (index =/= 0), finer updates? */
183 struct panfrost_constant_buffer constant_buffer
[PIPE_SHADER_TYPES
];
186 struct panfrost_rasterizer
*rasterizer
;
188 struct panfrost_shader_variants
*vs
;
189 struct panfrost_shader_variants
*fs
;
191 struct panfrost_vertex_state
*vertex
;
193 struct pipe_vertex_buffer vertex_buffers
[PIPE_MAX_ATTRIBS
];
196 struct panfrost_sampler_state
*samplers
[PIPE_SHADER_TYPES
][PIPE_MAX_SAMPLERS
];
197 unsigned sampler_count
[PIPE_SHADER_TYPES
];
199 struct panfrost_sampler_view
*sampler_views
[PIPE_SHADER_TYPES
][PIPE_MAX_SHADER_SAMPLER_VIEWS
];
200 unsigned sampler_view_count
[PIPE_SHADER_TYPES
];
202 struct primconvert_context
*primconvert
;
203 struct blitter_context
*blitter
;
206 struct panfrost_blend_state
*blend
;
208 struct pipe_viewport_state pipe_viewport
;
209 struct pipe_scissor_state scissor
;
210 struct pipe_blend_color blend_color
;
211 struct pipe_depth_stencil_alpha_state
*depth_stencil
;
212 struct pipe_stencil_ref stencil_ref
;
214 /* True for t6XX, false for t8xx. */
217 /* If set, we'll require the use of single render-target framebuffer
218 * descriptors (SFBD), for older hardware -- specifically, <T760 hardware. If
219 * false, we'll use the MFBD no matter what. New hardware -does- retain support
220 * for SFBD, and in theory we could flip between them on a per-RT basis, but
221 * there's no real advantage to doing so */
227 /* Corresponds to the CSO */
229 struct panfrost_rasterizer
{
230 struct pipe_rasterizer_state base
;
232 /* Bitmask of front face, etc */
233 unsigned tiler_gl_enables
;
236 struct panfrost_blend_state
{
237 struct pipe_blend_state base
;
239 /* Whether a blend shader is in use */
240 bool has_blend_shader
;
242 /* Compiled fixed function command */
243 struct mali_blend_equation equation
;
246 /* Compiled blend shader */
247 mali_ptr blend_shader
;
248 int blend_work_count
;
251 /* Variants bundle together to form the backing CSO, bundling multiple
252 * shaders with varying emulated features baked in (alpha test
253 * parameters, etc) */
254 #define MAX_SHADER_VARIANTS 8
256 /* A shader state corresponds to the actual, current variant of the shader */
257 struct panfrost_shader_state
{
258 struct pipe_shader_state
*base
;
260 /* Compiled, mapped descriptor, ready for the hardware */
262 struct mali_shader_meta
*tripipe
;
263 mali_ptr tripipe_gpu
;
265 /* Non-descript information */
268 bool writes_point_size
;
269 bool reads_point_coord
;
271 struct mali_attr_meta varyings
[PIPE_MAX_ATTRIBS
];
272 gl_varying_slot varyings_loc
[PIPE_MAX_ATTRIBS
];
274 unsigned sysval_count
;
275 unsigned sysval
[MAX_SYSVAL_COUNT
];
277 /* Information on this particular shader variant */
278 struct pipe_alpha_state alpha_state
;
281 /* A collection of variants (the CSO) */
282 struct panfrost_shader_variants
{
283 struct pipe_shader_state base
;
285 struct panfrost_shader_state variants
[MAX_SHADER_VARIANTS
];
286 unsigned variant_count
;
288 /* The current active variant */
289 unsigned active_variant
;
292 struct panfrost_vertex_state
{
293 unsigned num_elements
;
295 struct pipe_vertex_element pipe
[PIPE_MAX_ATTRIBS
];
296 struct mali_attr_meta hw
[PIPE_MAX_ATTRIBS
];
299 struct panfrost_sampler_state
{
300 struct pipe_sampler_state base
;
301 struct mali_sampler_descriptor hw
;
304 /* Misnomer: Sampler view corresponds to textures, not samplers */
306 struct panfrost_sampler_view
{
307 struct pipe_sampler_view base
;
308 struct mali_texture_descriptor hw
;
/* Downcast a Gallium pipe_context to the panfrost_context that wraps it.
 *
 * struct panfrost_context keeps its pipe_context (`base`) as its leading
 * member, so a pointer to one is also a pointer to the other. No checking is
 * performed: the caller must pass a context that really is embedded in a
 * panfrost_context. A NULL pointer is passed through unchanged. */
static inline struct panfrost_context *
pan_context(struct pipe_context *pcontext)
{
        return (struct panfrost_context *) pcontext;
}
/* Context constructor prototype: takes the pipe_screen, an opaque priv
 * pointer and a flags word, and returns a pipe_context pointer.
 * NOTE(review): presumably the returned pointer is the `base` member of a
 * newly created panfrost_context (see pan_context()) -- confirm against the
 * definition, which is not part of this header. */
317 struct pipe_context
*
318 panfrost_create_context(struct pipe_screen
*screen
, void *priv
, unsigned flags
);
321 panfrost_emit_for_draw(struct panfrost_context
*ctx
, bool with_vertex_data
);
/* Returns a panfrost_transfer by value for the given context.
 * NOTE(review): is_tiler presumably selects between the context's
 * payload_tiler and payload_vertex -- confirm against the definition. */
323 struct panfrost_transfer
324 panfrost_vertex_tiler_job(struct panfrost_context
*ctx
, bool is_tiler
);
327 panfrost_get_default_swizzle(unsigned components
);
331 struct pipe_context
*pipe
,
332 struct pipe_fence_handle
**fence
,
336 panfrost_is_scanout(struct panfrost_context
*ctx
);
/* Fragment entry points for the two framebuffer descriptor flavours: SFBD
 * (single render-target framebuffer descriptor) and MFBD. Each takes the
 * context and returns a mali_ptr.
 * NOTE(review): has_draws presumably tells the callee whether any draws were
 * queued for the frame -- confirm against the definitions. */
338 mali_ptr
panfrost_sfbd_fragment(struct panfrost_context
*ctx
, bool has_draws
);
339 mali_ptr
panfrost_mfbd_fragment(struct panfrost_context
*ctx
, bool has_draws
);
/* Framebuffer descriptor emitters. Each returns its descriptor struct by
 * value; the return types match the vt_framebuffer_mfbd and
 * vt_framebuffer_sfbd members of struct panfrost_context.
 * NOTE(review): how vertex_count feeds into the descriptor is not visible
 * from this header -- check the definitions. */
341 struct bifrost_framebuffer
342 panfrost_emit_mfbd(struct panfrost_context
*ctx
, unsigned vertex_count
);
344 struct mali_single_framebuffer
345 panfrost_emit_sfbd(struct panfrost_context
*ctx
, unsigned vertex_count
);
348 panfrost_fragment_job(struct panfrost_context
*ctx
, bool has_draws
);
351 panfrost_shader_compile(struct panfrost_context
*ctx
, struct mali_shader_meta
*meta
, const char *src
, int type
, struct panfrost_shader_state
*state
);