nvc0: add support for programmable sample locations
[mesa.git] / src / gallium / drivers / nouveau / nvc0 / nvc0_context.h
1 #ifndef __NVC0_CONTEXT_H__
2 #define __NVC0_CONTEXT_H__
3
4 #include "pipe/p_context.h"
5 #include "pipe/p_defines.h"
6 #include "pipe/p_state.h"
7
8 #include "util/list.h"
9 #include "util/u_memory.h"
10 #include "util/u_math.h"
11 #include "util/u_inlines.h"
12 #include "util/u_dynarray.h"
13
14 #include "nvc0/nvc0_winsys.h"
15 #include "nvc0/nvc0_stateobj.h"
16 #include "nvc0/nvc0_screen.h"
17 #include "nvc0/nvc0_program.h"
18 #include "nvc0/nvc0_resource.h"
19 #include "nvc0/nvc0_query.h"
20
21 #include "nv50/nv50_transfer.h"
22
23 #include "nouveau_context.h"
24 #include "nouveau_debug.h"
25
26 #include "nv50/nv50_3ddefs.xml.h"
27 #include "nvc0/nvc0_3d.xml.h"
28 #include "nv50/nv50_2d.xml.h"
29 #include "nvc0/nvc0_m2mf.xml.h"
30 #include "nvc0/nve4_p2mf.xml.h"
31 #include "nvc0/nvc0_compute.xml.h"
32 #include "nvc0/nvc0_macros.h"
33
/*
 * Dirty bits for the 3D state (one bit per state group).
 *
 * NOTE: must keep NVC0_NEW_3D_...PROG in consecutive bits in this order
 */
#define NVC0_NEW_3D_BLEND            (1 << 0)
#define NVC0_NEW_3D_RASTERIZER       (1 << 1)
#define NVC0_NEW_3D_ZSA              (1 << 2)
#define NVC0_NEW_3D_VERTPROG         (1 << 3)
#define NVC0_NEW_3D_TCTLPROG         (1 << 4)
#define NVC0_NEW_3D_TEVLPROG         (1 << 5)
#define NVC0_NEW_3D_GMTYPROG         (1 << 6)
#define NVC0_NEW_3D_FRAGPROG         (1 << 7)
#define NVC0_NEW_3D_BLEND_COLOUR     (1 << 8)
#define NVC0_NEW_3D_STENCIL_REF      (1 << 9)
#define NVC0_NEW_3D_CLIP             (1 << 10)
#define NVC0_NEW_3D_SAMPLE_MASK      (1 << 11)
#define NVC0_NEW_3D_FRAMEBUFFER      (1 << 12)
#define NVC0_NEW_3D_STIPPLE          (1 << 13)
#define NVC0_NEW_3D_SCISSOR          (1 << 14)
#define NVC0_NEW_3D_VIEWPORT         (1 << 15)
#define NVC0_NEW_3D_ARRAYS           (1 << 16)
#define NVC0_NEW_3D_VERTEX           (1 << 17)
#define NVC0_NEW_3D_CONSTBUF         (1 << 18)
#define NVC0_NEW_3D_TEXTURES         (1 << 19)
#define NVC0_NEW_3D_SAMPLERS         (1 << 20)
#define NVC0_NEW_3D_TFB_TARGETS      (1 << 21)
/* bit 22 has no flag assigned in this list */
#define NVC0_NEW_3D_SURFACES         (1 << 23)
#define NVC0_NEW_3D_MIN_SAMPLES      (1 << 24)
#define NVC0_NEW_3D_TESSFACTOR       (1 << 25)
#define NVC0_NEW_3D_BUFFERS          (1 << 26)
#define NVC0_NEW_3D_DRIVERCONST      (1 << 27)
#define NVC0_NEW_3D_WINDOW_RECTS     (1 << 28)

#define NVC0_NEW_3D_SAMPLE_LOCATIONS (1 << 29)
66
/* Dirty bits for the compute state (one bit per state group). */
#define NVC0_NEW_CP_PROGRAM     (1 << 0)
#define NVC0_NEW_CP_SURFACES    (1 << 1)
#define NVC0_NEW_CP_TEXTURES    (1 << 2)
#define NVC0_NEW_CP_SAMPLERS    (1 << 3)
#define NVC0_NEW_CP_CONSTBUF    (1 << 4)
#define NVC0_NEW_CP_GLOBALS     (1 << 5)
#define NVC0_NEW_CP_DRIVERCONST (1 << 6)
#define NVC0_NEW_CP_BUFFERS     (1 << 7)
75
/*
 * 3d bufctx (during draw_vbo, blit_3d)
 *
 * TEX(s, i) reserves 32 slots per stage starting at 4, CB(s, i) reserves
 * 16 slots per stage starting at 164; the fixed bins follow from 244 on.
 */
#define NVC0_BIND_3D_FB         0
#define NVC0_BIND_3D_VTX        1
#define NVC0_BIND_3D_VTX_TMP    2
#define NVC0_BIND_3D_IDX        3
#define NVC0_BIND_3D_TEX(s, i)  (  4 + 32 * (s) + (i))
#define NVC0_BIND_3D_CB(s, i)   (164 + 16 * (s) + (i))
#define NVC0_BIND_3D_TFB        244
#define NVC0_BIND_3D_SUF        245
#define NVC0_BIND_3D_BUF        246
#define NVC0_BIND_3D_SCREEN     247
#define NVC0_BIND_3D_BINDLESS   248
#define NVC0_BIND_3D_TLS        249
#define NVC0_BIND_3D_TEXT       250
#define NVC0_BIND_3D_COUNT      251
91
/*
 * compute bufctx (during launch_grid)
 *
 * CB(i) starts at 0 and TEX(i) at 16; the fixed bins follow from 48 on.
 */
#define NVC0_BIND_CP_CB(i)      (  0 + (i))
#define NVC0_BIND_CP_TEX(i)     ( 16 + (i))
#define NVC0_BIND_CP_SUF        48
#define NVC0_BIND_CP_GLOBAL     49
#define NVC0_BIND_CP_DESC       50
#define NVC0_BIND_CP_SCREEN     51
#define NVC0_BIND_CP_QUERY      52
#define NVC0_BIND_CP_BUF        53
#define NVC0_BIND_CP_TEXT       54
#define NVC0_BIND_CP_BINDLESS   55
#define NVC0_BIND_CP_COUNT      56
104
/* bufctx for other operations (note: 2D and M2MF use the same bin number) */
#define NVC0_BIND_2D    0
#define NVC0_BIND_M2MF  0
#define NVC0_BIND_FENCE 1
109
/*
 * Constant buffer layout: user uniform buffers first, then the driver
 * ("aux") constant buffers, then the vertex runout area.
 *
 * Every macro expands to a fully parenthesized expression and parenthesizes
 * its argument, so it can be combined with any operator at the use site.
 *
 * Some aux offsets below are listed twice with different stage tags
 * (CP / FP / VP); presumably those ranges are only used by the tagged
 * stage and therefore may overlap -- confirm before adding new entries.
 */

/* 6 user uniform buffers, at 64K each */
#define NVC0_CB_USR_INFO(s)          ((s) << 16)
#define NVC0_CB_USR_SIZE             (6 << 16)
/* 6 driver constbufs, at 64K each */
#define NVC0_CB_AUX_INFO(s)          (NVC0_CB_USR_SIZE + ((s) << 16))
#define NVC0_CB_AUX_SIZE             (1 << 16)
/* XXX: Figure out what this UNK data is. */
#define NVC0_CB_AUX_UNK_INFO         0x000
#define NVC0_CB_AUX_UNK_SIZE         (8 * 4)
/* 40 texture handles (8 for GM107+ images only), at one 32-bit integer each */
#define NVC0_CB_AUX_TEX_INFO(i)      (0x020 + (i) * 4)
#define NVC0_CB_AUX_TEX_SIZE         (40 * 4)
/* 8 sets of 32-bit coordinate offsets */
#define NVC0_CB_AUX_MS_INFO          0x0c0
#define NVC0_CB_AUX_MS_SIZE          (8 * 2 * 4)
/* block/grid size, at three 32-bit integers each, gridid and work_dim */
#define NVC0_CB_AUX_GRID_INFO(i)     (0x100 + (i) * 4) /* CP */
#define NVC0_CB_AUX_GRID_SIZE        (8 * 4)
/* FB texture handle */
#define NVC0_CB_AUX_FB_TEX_INFO      0x100 /* FP */
#define NVC0_CB_AUX_FB_TEX_SIZE      (4)
/* 8 user clip planes, at four 32-bit floats each */
#define NVC0_CB_AUX_UCP_INFO         0x120
#define NVC0_CB_AUX_UCP_SIZE         (PIPE_MAX_CLIP_PLANES * 4 * 4)
/* 13 ubos, at four 32-bit integers each */
#define NVC0_CB_AUX_UBO_INFO(i)      (0x120 + (i) * 4 * 4) /* CP */
#define NVC0_CB_AUX_UBO_SIZE         ((NVC0_MAX_PIPE_CONSTBUFS - 1) * 4 * 4)
/* 8 sets of 32-bit integer pairs of sample offsets */
#define NVC0_CB_AUX_SAMPLE_INFO      0x1a0 /* FP */
/* 256 bytes, though only 64 bytes used before GM200 */
#define NVC0_CB_AUX_SAMPLE_SIZE      (8 * 2 * 4 * 4)
/* draw parameters (index bias, base instance, drawid) */
#define NVC0_CB_AUX_DRAW_INFO        0x1a0 /* VP */
/* 32 user buffers, at four 32-bit integers each */
#define NVC0_CB_AUX_BUF_INFO(i)      (0x2a0 + (i) * 4 * 4)
#define NVC0_CB_AUX_BUF_SIZE         (NVC0_MAX_BUFFERS * 4 * 4)
/* 8 surfaces, at sixteen 32-bit integers each */
#define NVC0_CB_AUX_SU_INFO(i)       (0x4a0 + (i) * 16 * 4)
#define NVC0_CB_AUX_SU_SIZE          (NVC0_MAX_IMAGES * 16 * 4)
/* one 64-bit address and one 32-bit sequence */
#define NVC0_CB_AUX_MP_INFO          0x6a0
#define NVC0_CB_AUX_MP_SIZE          (3 * 4)
/* 512 64-byte blocks for bindless image handles */
#define NVC0_CB_AUX_BINDLESS_INFO(i) (0x6b0 + (i) * 16 * 4)
#define NVC0_CB_AUX_BINDLESS_SIZE    (NVE4_IMG_MAX_HANDLES * 16 * 4)
/* four 32-bit floats for the vertex runout, put at the end */
#define NVC0_CB_AUX_RUNOUT_INFO      (NVC0_CB_USR_SIZE + (NVC0_CB_AUX_SIZE * 6))
157
/*
 * Forward declarations; only pointers to these types are used below.
 * struct nvc0_context is declared here explicitly so the prototypes do not
 * depend on an earlier header having introduced the tag (otherwise the tag
 * would get prototype scope and be incompatible with the real type).
 */
struct nvc0_blitctx;
struct nvc0_context;

/* Creation/destruction of the blit context attached to an nvc0_context. */
bool nvc0_blitctx_create(struct nvc0_context *);
void nvc0_blitctx_destroy(struct nvc0_context *);
162
163 struct nvc0_resident {
164 struct list_head list;
165 uint64_t handle;
166 struct nv04_resource *buf;
167 uint32_t flags;
168 };
169
170 struct nvc0_context {
171 struct nouveau_context base;
172
173 struct nouveau_bufctx *bufctx_3d;
174 struct nouveau_bufctx *bufctx;
175 struct nouveau_bufctx *bufctx_cp;
176
177 struct nvc0_screen *screen;
178
179 void (*m2mf_copy_rect)(struct nvc0_context *,
180 const struct nv50_m2mf_rect *dst,
181 const struct nv50_m2mf_rect *src,
182 uint32_t nblocksx, uint32_t nblocksy);
183
184 uint32_t dirty_3d; /* dirty flags for 3d state */
185 uint32_t dirty_cp; /* dirty flags for compute state */
186
187 struct nvc0_graph_state state;
188
189 struct nvc0_blend_stateobj *blend;
190 struct nvc0_rasterizer_stateobj *rast;
191 struct nvc0_zsa_stateobj *zsa;
192 struct nvc0_vertex_stateobj *vertex;
193
194 struct nvc0_program *vertprog;
195 struct nvc0_program *tctlprog;
196 struct nvc0_program *tevlprog;
197 struct nvc0_program *gmtyprog;
198 struct nvc0_program *fragprog;
199 struct nvc0_program *compprog;
200
201 struct nvc0_program *tcp_empty;
202
203 struct nvc0_constbuf constbuf[6][NVC0_MAX_PIPE_CONSTBUFS];
204 uint16_t constbuf_dirty[6];
205 uint16_t constbuf_valid[6];
206 uint16_t constbuf_coherent[6];
207 bool cb_dirty;
208
209 struct pipe_vertex_buffer vtxbuf[PIPE_MAX_ATTRIBS];
210 unsigned num_vtxbufs;
211 uint32_t vtxbufs_coherent;
212 uint32_t constant_vbos;
213 uint32_t vbo_user; /* bitmask of vertex buffers pointing to user memory */
214 uint32_t vb_elt_first; /* from pipe_draw_info, for vertex upload */
215 uint32_t vb_elt_limit; /* max - min element (count - 1) */
216 uint32_t instance_off; /* current base vertex for instanced arrays */
217 uint32_t instance_max; /* last instance for current draw call */
218
219 struct pipe_sampler_view *textures[6][PIPE_MAX_SAMPLERS];
220 unsigned num_textures[6];
221 uint32_t textures_dirty[6];
222 uint32_t textures_coherent[6];
223 struct nv50_tsc_entry *samplers[6][PIPE_MAX_SAMPLERS];
224 unsigned num_samplers[6];
225 uint32_t samplers_dirty[6];
226 bool seamless_cube_map;
227 struct pipe_sampler_view *fbtexture;
228
229 uint32_t tex_handles[6][PIPE_MAX_SAMPLERS]; /* for nve4 */
230
231 struct list_head tex_head;
232 struct list_head img_head;
233
234 struct pipe_framebuffer_state framebuffer;
235 bool sample_locations_enabled;
236 uint8_t sample_locations[2 * 4 * 8];
237 struct pipe_blend_color blend_colour;
238 struct pipe_stencil_ref stencil_ref;
239 struct pipe_poly_stipple stipple;
240 struct pipe_scissor_state scissors[NVC0_MAX_VIEWPORTS];
241 unsigned scissors_dirty;
242 struct pipe_viewport_state viewports[NVC0_MAX_VIEWPORTS];
243 unsigned viewports_dirty;
244 struct pipe_clip_state clip;
245 struct nvc0_window_rect_stateobj window_rect;
246
247 unsigned sample_mask;
248 unsigned min_samples;
249
250 float default_tess_outer[4];
251 float default_tess_inner[2];
252
253 bool vbo_push_hint;
254
255 uint8_t tfbbuf_dirty;
256 struct pipe_stream_output_target *tfbbuf[4];
257 unsigned num_tfbbufs;
258
259 struct pipe_query *cond_query;
260 bool cond_cond; /* inverted rendering condition */
261 uint cond_mode;
262 uint32_t cond_condmode; /* the calculated condition */
263
264 struct nvc0_blitctx *blit;
265
266 /* NOTE: some of these surfaces may reference buffers */
267 struct pipe_surface *surfaces[2][NVC0_MAX_SURFACE_SLOTS];
268 uint16_t surfaces_dirty[2];
269 uint16_t surfaces_valid[2];
270
271 struct pipe_shader_buffer buffers[6][NVC0_MAX_BUFFERS];
272 uint32_t buffers_dirty[6];
273 uint32_t buffers_valid[6];
274
275 struct pipe_image_view images[6][NVC0_MAX_IMAGES];
276 struct pipe_sampler_view *images_tic[6][NVC0_MAX_IMAGES]; /* GM107+ */
277 uint16_t images_dirty[6];
278 uint16_t images_valid[6];
279
280 struct util_dynarray global_residents;
281 };
282
/* Reinterpret a pipe_context pointer as the driver's nvc0_context. */
static inline struct nvc0_context *
nvc0_context(struct pipe_context *pipe)
{
   struct nvc0_context *const nvc0 = (struct nvc0_context *)pipe;

   return nvc0;
}
288
289 static inline unsigned
290 nvc0_shader_stage(unsigned pipe)
291 {
292 switch (pipe) {
293 case PIPE_SHADER_VERTEX: return 0;
294 case PIPE_SHADER_TESS_CTRL: return 1;
295 case PIPE_SHADER_TESS_EVAL: return 2;
296 case PIPE_SHADER_GEOMETRY: return 3;
297 case PIPE_SHADER_FRAGMENT: return 4;
298 case PIPE_SHADER_COMPUTE: return 5;
299 default:
300 assert(!"invalid PIPE_SHADER type");
301 return 0;
302 }
303 }
304
305
/* nvc0_context.c */
struct pipe_context *
nvc0_create(struct pipe_screen *, void *, unsigned flags);

void
nvc0_bufctx_fence(struct nvc0_context *nvc0, struct nouveau_bufctx *bufctx,
                  bool on_flush);

void
nvc0_default_kick_notify(struct nouveau_pushbuf *push);

const void *
nvc0_get_sample_locations(unsigned);
312
/* nvc0_draw.c */
struct draw_stage *
nvc0_draw_render_stage(struct nvc0_context *nvc0);
315
/* nvc0_program.c */
bool
nvc0_program_translate(struct nvc0_program *prog, uint16_t chipset,
                       struct pipe_debug_callback *);

bool
nvc0_program_upload(struct nvc0_context *nvc0, struct nvc0_program *prog);

void
nvc0_program_destroy(struct nvc0_context *nvc0, struct nvc0_program *prog);

void
nvc0_program_library_upload(struct nvc0_context *nvc0);

uint32_t
nvc0_program_symbol_offset(const struct nvc0_program *prog, uint32_t label);

void
nvc0_program_init_tcp_empty(struct nvc0_context *nvc0);
325
/* nvc0_shader_state.c */

/* one validate entry point per program type */
void nvc0_vertprog_validate(struct nvc0_context *nvc0);
void nvc0_tctlprog_validate(struct nvc0_context *nvc0);
void nvc0_tevlprog_validate(struct nvc0_context *nvc0);
void nvc0_gmtyprog_validate(struct nvc0_context *nvc0);
void nvc0_fragprog_validate(struct nvc0_context *nvc0);
void nvc0_compprog_validate(struct nvc0_context *nvc0);

void nvc0_tfb_validate(struct nvc0_context *nvc0);
void nvc0_layer_validate(struct nvc0_context *nvc0);
336
/* nvc0_state.c */
void
nvc0_init_state_functions(struct nvc0_context *nvc0);
339
/* nvc0_state_validate.c */

/* Pairs a validation callback with a 32-bit state mask. */
struct nvc0_state_validate {
   void (*func)(struct nvc0_context *);
   uint32_t states;
};

bool
nvc0_state_validate(struct nvc0_context *nvc0, uint32_t,
                    struct nvc0_state_validate *, int, uint32_t *,
                    struct nouveau_bufctx *bufctx);

bool
nvc0_state_validate_3d(struct nvc0_context *nvc0, uint32_t);
350
/* nvc0_surface.c */
void
nvc0_clear(struct pipe_context *pipe, unsigned buffers,
           const union pipe_color_union *color,
           double depth, unsigned stencil);

void
nvc0_init_surface_functions(struct nvc0_context *nvc0);
356
/* nvc0_tex.c */
bool
nvc0_validate_tic(struct nvc0_context *nvc0, int s);

bool
nvc0_validate_tsc(struct nvc0_context *nvc0, int s);

bool
nve4_validate_tsc(struct nvc0_context *nvc0, int s);

void
nvc0_validate_suf(struct nvc0_context *nvc0, int s);

void
nvc0_validate_textures(struct nvc0_context *nvc0);

void
nvc0_validate_samplers(struct nvc0_context *nvc0);

void
nve4_set_tex_handles(struct nvc0_context *nvc0);

void
nvc0_validate_surfaces(struct nvc0_context *nvc0);

void
nve4_set_surface_info(struct nouveau_pushbuf *push,
                      const struct pipe_image_view *view,
                      struct nvc0_context *nvc0);

void
nvc0_mark_image_range_valid(const struct pipe_image_view *view);

bool
nvc0_update_tic(struct nvc0_context *nvc0, struct nv50_tic_entry *,
                struct nv04_resource *);

struct pipe_sampler_view *
nvc0_create_texture_view(struct pipe_context *pipe,
                         struct pipe_resource *,
                         const struct pipe_sampler_view *,
                         uint32_t flags,
                         enum pipe_texture_target);

struct pipe_sampler_view *
nvc0_create_sampler_view(struct pipe_context *pipe,
                         struct pipe_resource *,
                         const struct pipe_sampler_view *);

struct pipe_sampler_view *
gm107_create_texture_view_from_image(struct pipe_context *pipe,
                                     const struct pipe_image_view *view);

void
nvc0_init_bindless_functions(struct pipe_context *pipe);
388
/* nvc0_transfer.c */
void nvc0_init_transfer_functions(struct nvc0_context *nvc0);

/* nvc0_ and nve4_ variants share the same parameter list */
void nvc0_m2mf_push_linear(struct nouveau_context *nv,
                           struct nouveau_bo *dst, unsigned offset,
                           unsigned domain, unsigned size, const void *data);

void nve4_p2mf_push_linear(struct nouveau_context *nv,
                           struct nouveau_bo *dst, unsigned offset,
                           unsigned domain, unsigned size, const void *data);

void nvc0_cb_bo_push(struct nouveau_context *nv,
                     struct nouveau_bo *bo, unsigned domain,
                     unsigned base, unsigned size,
                     unsigned offset, unsigned words, const uint32_t *data);
406
/* nvc0_vbo.c */
void
nvc0_draw_vbo(struct pipe_context *pipe, const struct pipe_draw_info *info);

/* vertex state object: returned as an opaque pointer, released via _delete */
void *nvc0_vertex_state_create(struct pipe_context *pipe,
                               unsigned num_elements,
                               const struct pipe_vertex_element *elements);
void nvc0_vertex_state_delete(struct pipe_context *pipe, void *hwcso);

void
nvc0_vertex_arrays_validate(struct nvc0_context *nvc0);

void
nvc0_idxbuf_validate(struct nvc0_context *nvc0);
420
/* nvc0_video.c */
struct pipe_video_codec *nvc0_create_decoder(
   struct pipe_context *context,
   const struct pipe_video_codec *templ);

struct pipe_video_buffer *nvc0_video_buffer_create(
   struct pipe_context *pipe,
   const struct pipe_video_buffer *templat);
429
/* nvc0_push.c */
void
nvc0_push_vbo(struct nvc0_context *nvc0, const struct pipe_draw_info *info);
432
/* nve4_compute.c */
void
nve4_launch_grid(struct pipe_context *pipe, const struct pipe_grid_info *info);

/* nvc0_compute.c */
void
nvc0_launch_grid(struct pipe_context *pipe, const struct pipe_grid_info *info);

void
nvc0_compute_validate_globals(struct nvc0_context *nvc0);
438 void nvc0_compute_validate_globals(struct nvc0_context *);
439
440 #endif