d3d6bd2e5dd9f1da081b35c8bdc3b81b38f489f3
[mesa.git] / src / gallium / drivers / nouveau / nvc0 / nvc0_context.h
1 #ifndef __NVC0_CONTEXT_H__
2 #define __NVC0_CONTEXT_H__
3
4 #include "pipe/p_context.h"
5 #include "pipe/p_defines.h"
6 #include "pipe/p_state.h"
7
8 #include "util/list.h"
9 #include "util/u_memory.h"
10 #include "util/u_math.h"
11 #include "util/u_inlines.h"
12 #include "util/u_dynarray.h"
13
14 #include "nvc0/nvc0_winsys.h"
15 #include "nvc0/nvc0_stateobj.h"
16 #include "nvc0/nvc0_screen.h"
17 #include "nvc0/nvc0_program.h"
18 #include "nvc0/nvc0_resource.h"
19 #include "nvc0/nvc0_query.h"
20
21 #include "nv50/nv50_transfer.h"
22
23 #include "nouveau_context.h"
24 #include "nouveau_debug.h"
25
26 #include "nv50/nv50_3ddefs.xml.h"
27 #include "nvc0/nvc0_3d.xml.h"
28 #include "nv50/nv50_2d.xml.h"
29 #include "nvc0/nvc0_m2mf.xml.h"
30 #include "nvc0/nve4_copy.xml.h"
31 #include "nvc0/nve4_p2mf.xml.h"
32 #include "nvc0/nvc0_compute.xml.h"
33 #include "nvc0/nvc0_macros.h"
34
/*
 * Dirty-state bits for the 3D pipeline, one bit per state group.
 *
 * NOTE: the NVC0_NEW_3D_...PROG bits must stay in consecutive bits, in
 * exactly this order.  Bit 22 is not assigned to any flag here.
 */
#define NVC0_NEW_3D_BLEND            (1 << 0)
#define NVC0_NEW_3D_RASTERIZER       (1 << 1)
#define NVC0_NEW_3D_ZSA              (1 << 2)
#define NVC0_NEW_3D_VERTPROG         (1 << 3)
#define NVC0_NEW_3D_TCTLPROG         (1 << 4)
#define NVC0_NEW_3D_TEVLPROG         (1 << 5)
#define NVC0_NEW_3D_GMTYPROG         (1 << 6)
#define NVC0_NEW_3D_FRAGPROG         (1 << 7)
#define NVC0_NEW_3D_BLEND_COLOUR     (1 << 8)
#define NVC0_NEW_3D_STENCIL_REF      (1 << 9)
#define NVC0_NEW_3D_CLIP             (1 << 10)
#define NVC0_NEW_3D_SAMPLE_MASK      (1 << 11)
#define NVC0_NEW_3D_FRAMEBUFFER      (1 << 12)
#define NVC0_NEW_3D_STIPPLE          (1 << 13)
#define NVC0_NEW_3D_SCISSOR          (1 << 14)
#define NVC0_NEW_3D_VIEWPORT         (1 << 15)
#define NVC0_NEW_3D_ARRAYS           (1 << 16)
#define NVC0_NEW_3D_VERTEX           (1 << 17)
#define NVC0_NEW_3D_CONSTBUF         (1 << 18)
#define NVC0_NEW_3D_TEXTURES         (1 << 19)
#define NVC0_NEW_3D_SAMPLERS         (1 << 20)
#define NVC0_NEW_3D_TFB_TARGETS      (1 << 21)

#define NVC0_NEW_3D_SURFACES         (1 << 23)
#define NVC0_NEW_3D_MIN_SAMPLES      (1 << 24)
#define NVC0_NEW_3D_TESSFACTOR       (1 << 25)
#define NVC0_NEW_3D_BUFFERS          (1 << 26)
#define NVC0_NEW_3D_DRIVERCONST      (1 << 27)
#define NVC0_NEW_3D_WINDOW_RECTS     (1 << 28)

#define NVC0_NEW_3D_SAMPLE_LOCATIONS (1 << 29)
67
/* Dirty-state bits for the compute pipeline, one bit per state group. */
#define NVC0_NEW_CP_PROGRAM     (1 << 0)
#define NVC0_NEW_CP_SURFACES    (1 << 1)
#define NVC0_NEW_CP_TEXTURES    (1 << 2)
#define NVC0_NEW_CP_SAMPLERS    (1 << 3)
#define NVC0_NEW_CP_CONSTBUF    (1 << 4)
#define NVC0_NEW_CP_GLOBALS     (1 << 5)
#define NVC0_NEW_CP_DRIVERCONST (1 << 6)
#define NVC0_NEW_CP_BUFFERS     (1 << 7)
76
/*
 * Slot numbers in the 3d bufctx (used during draw_vbo, blit_3d).
 *
 * TEX and CB are per-stage ranges: 32 texture slots per stage starting at 4,
 * and 16 constbuf slots per stage starting at 164.
 */
#define NVC0_BIND_3D_FB          0
#define NVC0_BIND_3D_VTX         1
#define NVC0_BIND_3D_VTX_TMP     2
#define NVC0_BIND_3D_IDX         3
#define NVC0_BIND_3D_TEX(s, i)   (  4 + 32 * (s) + (i))
#define NVC0_BIND_3D_CB(s, i)    (164 + 16 * (s) + (i))
#define NVC0_BIND_3D_TFB         244
#define NVC0_BIND_3D_SUF         245
#define NVC0_BIND_3D_BUF         246
#define NVC0_BIND_3D_SCREEN      247
#define NVC0_BIND_3D_BINDLESS    248
#define NVC0_BIND_3D_TLS         249
#define NVC0_BIND_3D_TEXT        250
#define NVC0_BIND_3D_COUNT       251
92
/* Slot numbers in the compute bufctx (used during launch_grid). */
#define NVC0_BIND_CP_CB(i)      ( 0 + (i))
#define NVC0_BIND_CP_TEX(i)     (16 + (i))
#define NVC0_BIND_CP_SUF        48
#define NVC0_BIND_CP_GLOBAL     49
#define NVC0_BIND_CP_DESC       50
#define NVC0_BIND_CP_SCREEN     51
#define NVC0_BIND_CP_QUERY      52
#define NVC0_BIND_CP_BUF        53
#define NVC0_BIND_CP_TEXT       54
#define NVC0_BIND_CP_BINDLESS   55
#define NVC0_BIND_CP_COUNT      56
105
/* Slot numbers in the bufctx used for other operations (2D and M2MF share slot 0). */
#define NVC0_BIND_2D      0
#define NVC0_BIND_M2MF    0
#define NVC0_BIND_FENCE   1
110
/*
 * Constant-buffer layout.
 *
 * Every macro below is fully parenthesized (arguments and whole expansion)
 * so that it evaluates as a single value in any expression, e.g. when
 * multiplied, divided, shifted or compared.
 */

/* 6 user uniform buffers, at 64K each */
#define NVC0_CB_USR_INFO(s)          ((s) << 16)
#define NVC0_CB_USR_SIZE             (6 << 16)
/* 6 driver constbufs, at 64K each */
#define NVC0_CB_AUX_INFO(s)          (NVC0_CB_USR_SIZE + ((s) << 16))
#define NVC0_CB_AUX_SIZE             (1 << 16)
/* XXX: Figure out what this UNK data is. */
#define NVC0_CB_AUX_UNK_INFO         0x000
#define NVC0_CB_AUX_UNK_SIZE         (8 * 4)
/* 40 texture handles (8 for GM107+ images only), at one 32-bit integer each */
#define NVC0_CB_AUX_TEX_INFO(i)      (0x020 + (i) * 4)
#define NVC0_CB_AUX_TEX_SIZE         (40 * 4)
/* 8 sets of 32-bit coordinate offsets */
#define NVC0_CB_AUX_MS_INFO          0x0c0
#define NVC0_CB_AUX_MS_SIZE          (8 * 2 * 4)
/* block/grid size, at three 32-bit integers each, gridid and work_dim */
#define NVC0_CB_AUX_GRID_INFO(i)     (0x100 + (i) * 4) /* CP */
#define NVC0_CB_AUX_GRID_SIZE        (8 * 4)
/* FB texture handle */
#define NVC0_CB_AUX_FB_TEX_INFO      0x100 /* FP */
#define NVC0_CB_AUX_FB_TEX_SIZE      (4)
/* 8 user clip planes, at four 32-bit floats each */
#define NVC0_CB_AUX_UCP_INFO         0x120
#define NVC0_CB_AUX_UCP_SIZE         (PIPE_MAX_CLIP_PLANES * 4 * 4)
/* 13 ubos, at four 32-bit integers each */
#define NVC0_CB_AUX_UBO_INFO(i)      (0x120 + (i) * 4 * 4) /* CP */
#define NVC0_CB_AUX_UBO_SIZE         ((NVC0_MAX_PIPE_CONSTBUFS - 1) * 4 * 4)
/* 8 sets of 32-bit integer pairs sample offsets */
#define NVC0_CB_AUX_SAMPLE_INFO      0x1a0 /* FP */
/* 256 bytes, though only 64 bytes used before GM200 */
#define NVC0_CB_AUX_SAMPLE_SIZE      (8 * 2 * 4 * 4)
/* draw parameters (index bias, base instance, drawid)
 * be sure to update the indirect draw macros in com9097.mme when changing this
 */
#define NVC0_CB_AUX_DRAW_INFO        0x1a0 /* VP */
/* 32 user buffers, at four 32-bit integers each */
#define NVC0_CB_AUX_BUF_INFO(i)      (0x2a0 + (i) * 4 * 4)
#define NVC0_CB_AUX_BUF_SIZE         (NVC0_MAX_BUFFERS * 4 * 4)
/* 8 surfaces, at sixteen 32-bit integers each */
#define NVC0_CB_AUX_SU_INFO(i)       (0x4a0 + (i) * 16 * 4)
#define NVC0_CB_AUX_SU_SIZE          (NVC0_MAX_IMAGES * 16 * 4)
/* one 64-bit address and one 32-bit sequence
 * be sure to update the shaders in nvc0_query_hw_sm.c when changing this
 */
#define NVC0_CB_AUX_MP_INFO          0x6a0
#define NVC0_CB_AUX_MP_SIZE          (3 * 4)
/* 512 64-byte blocks for bindless image handles */
#define NVC0_CB_AUX_BINDLESS_INFO(i) (0x6b0 + (i) * 16 * 4)
#define NVC0_CB_AUX_BINDLESS_SIZE    (NVE4_IMG_MAX_HANDLES * 16 * 4)
/* four 32-bit floats for the vertex runout, put at the end */
#define NVC0_CB_AUX_RUNOUT_INFO      (NVC0_CB_USR_SIZE + (NVC0_CB_AUX_SIZE * 6))
162
/*
 * Opaque types: the prototypes in this block only need pointers to them.
 *
 * struct nvc0_context is forward-declared explicitly so that the parameter
 * lists refer to the file-scope type rather than a prototype-scoped one,
 * regardless of what the headers included before this point declare.
 * Repeating a forward declaration is harmless if one already exists.
 */
struct nvc0_blitctx;
struct nvc0_context;

/* Blit context setup/teardown for a context; create reports success as a bool. */
bool nvc0_blitctx_create(struct nvc0_context *);
void nvc0_blitctx_destroy(struct nvc0_context *);
167
168 struct nvc0_resident {
169 struct list_head list;
170 uint64_t handle;
171 struct nv04_resource *buf;
172 uint32_t flags;
173 };
174
175 struct nvc0_context {
176 struct nouveau_context base;
177
178 struct nouveau_bufctx *bufctx_3d;
179 struct nouveau_bufctx *bufctx;
180 struct nouveau_bufctx *bufctx_cp;
181
182 struct nvc0_screen *screen;
183
184 void (*m2mf_copy_rect)(struct nvc0_context *,
185 const struct nv50_m2mf_rect *dst,
186 const struct nv50_m2mf_rect *src,
187 uint32_t nblocksx, uint32_t nblocksy);
188
189 uint32_t dirty_3d; /* dirty flags for 3d state */
190 uint32_t dirty_cp; /* dirty flags for compute state */
191
192 struct nvc0_graph_state state;
193
194 struct nvc0_blend_stateobj *blend;
195 struct nvc0_rasterizer_stateobj *rast;
196 struct nvc0_zsa_stateobj *zsa;
197 struct nvc0_vertex_stateobj *vertex;
198
199 struct nvc0_program *vertprog;
200 struct nvc0_program *tctlprog;
201 struct nvc0_program *tevlprog;
202 struct nvc0_program *gmtyprog;
203 struct nvc0_program *fragprog;
204 struct nvc0_program *compprog;
205
206 struct nvc0_program *tcp_empty;
207
208 struct nvc0_constbuf constbuf[6][NVC0_MAX_PIPE_CONSTBUFS];
209 uint16_t constbuf_dirty[6];
210 uint16_t constbuf_valid[6];
211 uint16_t constbuf_coherent[6];
212 bool cb_dirty;
213
214 struct pipe_vertex_buffer vtxbuf[PIPE_MAX_ATTRIBS];
215 unsigned num_vtxbufs;
216 uint32_t vtxbufs_coherent;
217 uint32_t constant_vbos;
218 uint32_t vbo_user; /* bitmask of vertex buffers pointing to user memory */
219 uint32_t vb_elt_first; /* from pipe_draw_info, for vertex upload */
220 uint32_t vb_elt_limit; /* max - min element (count - 1) */
221 uint32_t instance_off; /* current base vertex for instanced arrays */
222 uint32_t instance_max; /* last instance for current draw call */
223
224 struct pipe_sampler_view *textures[6][PIPE_MAX_SAMPLERS];
225 unsigned num_textures[6];
226 uint32_t textures_dirty[6];
227 uint32_t textures_coherent[6];
228 struct nv50_tsc_entry *samplers[6][PIPE_MAX_SAMPLERS];
229 unsigned num_samplers[6];
230 uint32_t samplers_dirty[6];
231 bool seamless_cube_map;
232 struct pipe_sampler_view *fbtexture;
233
234 uint32_t tex_handles[6][PIPE_MAX_SAMPLERS]; /* for nve4 */
235
236 struct list_head tex_head;
237 struct list_head img_head;
238
239 struct pipe_framebuffer_state framebuffer;
240 bool sample_locations_enabled;
241 uint8_t sample_locations[2 * 4 * 8];
242 struct pipe_blend_color blend_colour;
243 struct pipe_stencil_ref stencil_ref;
244 struct pipe_poly_stipple stipple;
245 struct pipe_scissor_state scissors[NVC0_MAX_VIEWPORTS];
246 unsigned scissors_dirty;
247 struct pipe_viewport_state viewports[NVC0_MAX_VIEWPORTS];
248 unsigned viewports_dirty;
249 struct pipe_clip_state clip;
250 struct nvc0_window_rect_stateobj window_rect;
251
252 unsigned sample_mask;
253 unsigned min_samples;
254
255 float default_tess_outer[4];
256 float default_tess_inner[2];
257
258 bool vbo_push_hint;
259
260 uint8_t tfbbuf_dirty;
261 struct pipe_stream_output_target *tfbbuf[4];
262 unsigned num_tfbbufs;
263
264 struct pipe_query *cond_query;
265 bool cond_cond; /* inverted rendering condition */
266 uint cond_mode;
267 uint32_t cond_condmode; /* the calculated condition */
268
269 struct nvc0_blitctx *blit;
270
271 /* NOTE: some of these surfaces may reference buffers */
272 struct pipe_surface *surfaces[2][NVC0_MAX_SURFACE_SLOTS];
273 uint16_t surfaces_dirty[2];
274 uint16_t surfaces_valid[2];
275
276 struct pipe_shader_buffer buffers[6][NVC0_MAX_BUFFERS];
277 uint32_t buffers_dirty[6];
278 uint32_t buffers_valid[6];
279
280 struct pipe_image_view images[6][NVC0_MAX_IMAGES];
281 struct pipe_sampler_view *images_tic[6][NVC0_MAX_IMAGES]; /* GM107+ */
282 uint16_t images_dirty[6];
283 uint16_t images_valid[6];
284
285 struct util_dynarray global_residents;
286
287 uint64_t compute_invocations;
288 };
289
/*
 * Reinterpret a generic pipe_context pointer as the driver's nvc0_context.
 * This is a plain pointer cast: no checking is done and NULL maps to NULL.
 */
static inline struct nvc0_context *
nvc0_context(struct pipe_context *pipe)
{
   struct nvc0_context *const nvc0 = (struct nvc0_context *)pipe;

   return nvc0;
}
295
296 static inline unsigned
297 nvc0_shader_stage(unsigned pipe)
298 {
299 switch (pipe) {
300 case PIPE_SHADER_VERTEX: return 0;
301 case PIPE_SHADER_TESS_CTRL: return 1;
302 case PIPE_SHADER_TESS_EVAL: return 2;
303 case PIPE_SHADER_GEOMETRY: return 3;
304 case PIPE_SHADER_FRAGMENT: return 4;
305 case PIPE_SHADER_COMPUTE: return 5;
306 default:
307 assert(!"invalid PIPE_SHADER type");
308 return 0;
309 }
310 }
311
312
/* nvc0_context.c */
struct pipe_context *
nvc0_create(struct pipe_screen *screen, void *, unsigned flags);

void
nvc0_bufctx_fence(struct nvc0_context *nvc0, struct nouveau_bufctx *bufctx,
                  bool on_flush);

void
nvc0_default_kick_notify(struct nouveau_pushbuf *push);

const void *
nvc0_get_sample_locations(unsigned);
319
/* nvc0_draw.c */
struct draw_stage *
nvc0_draw_render_stage(struct nvc0_context *nvc0);
322
/* nvc0_program.c */
bool
nvc0_program_translate(struct nvc0_program *prog, uint16_t chipset,
                       struct pipe_debug_callback *debug);

bool
nvc0_program_upload(struct nvc0_context *nvc0, struct nvc0_program *prog);

void
nvc0_program_destroy(struct nvc0_context *nvc0, struct nvc0_program *prog);

void
nvc0_program_library_upload(struct nvc0_context *nvc0);

void
nvc0_program_init_tcp_empty(struct nvc0_context *nvc0);
330
/* nvc0_shader_state.c: one validate entry point per program stage */
void nvc0_vertprog_validate(struct nvc0_context *nvc0);
void nvc0_tctlprog_validate(struct nvc0_context *nvc0);
void nvc0_tevlprog_validate(struct nvc0_context *nvc0);
void nvc0_gmtyprog_validate(struct nvc0_context *nvc0);
void nvc0_fragprog_validate(struct nvc0_context *nvc0);
void nvc0_compprog_validate(struct nvc0_context *nvc0);

void nvc0_tfb_validate(struct nvc0_context *nvc0);
void nvc0_layer_validate(struct nvc0_context *nvc0);
341
/* nvc0_state.c */
void
nvc0_init_state_functions(struct nvc0_context *nvc0);
344
/* nvc0_state_validate.c */

/* Pairs a validation callback with a 32-bit state mask. */
struct nvc0_state_validate {
   /* callback taking the context */
   void (*func)(struct nvc0_context *);
   /* state bits associated with func */
   uint32_t states;
};

bool
nvc0_state_validate(struct nvc0_context *nvc0, uint32_t,
                    struct nvc0_state_validate *, int, uint32_t *,
                    struct nouveau_bufctx *bufctx);

bool
nvc0_state_validate_3d(struct nvc0_context *nvc0, uint32_t);
355
/* nvc0_surface.c */
void
nvc0_clear(struct pipe_context *pipe, unsigned buffers,
           const struct pipe_scissor_state *scissor_state,
           const union pipe_color_union *color,
           double depth, unsigned stencil);

void
nvc0_init_surface_functions(struct nvc0_context *nvc0);
362
/* nvc0_tex.c */
bool nvc0_validate_tic(struct nvc0_context *nvc0, int s);
bool nvc0_validate_tsc(struct nvc0_context *nvc0, int s);
bool nve4_validate_tsc(struct nvc0_context *nvc0, int s);
void nvc0_validate_suf(struct nvc0_context *nvc0, int s);
void nvc0_validate_textures(struct nvc0_context *nvc0);
void nvc0_validate_samplers(struct nvc0_context *nvc0);
void nvc0_upload_tsc0(struct nvc0_context *nvc0);
void nve4_set_tex_handles(struct nvc0_context *nvc0);
void nvc0_validate_surfaces(struct nvc0_context *nvc0);

void
nve4_set_surface_info(struct nouveau_pushbuf *push,
                      const struct pipe_image_view *view,
                      struct nvc0_context *nvc0);

void
nvc0_mark_image_range_valid(const struct pipe_image_view *view);

bool
nvc0_update_tic(struct nvc0_context *nvc0, struct nv50_tic_entry *tic,
                struct nv04_resource *res);

struct pipe_sampler_view *
nvc0_create_texture_view(struct pipe_context *pipe,
                         struct pipe_resource *resource,
                         const struct pipe_sampler_view *templ,
                         uint32_t flags,
                         enum pipe_texture_target target);

struct pipe_sampler_view *
nvc0_create_sampler_view(struct pipe_context *pipe,
                         struct pipe_resource *resource,
                         const struct pipe_sampler_view *templ);

struct pipe_sampler_view *
gm107_create_texture_view_from_image(struct pipe_context *pipe,
                                     const struct pipe_image_view *view);

void
nvc0_init_bindless_functions(struct pipe_context *pipe);
395
/* nvc0_transfer.c */
void nvc0_init_transfer_functions(struct nvc0_context *nvc0);

void nvc0_m2mf_push_linear(struct nouveau_context *nv,
                           struct nouveau_bo *dst, unsigned offset,
                           unsigned domain, unsigned size, const void *data);

void nve4_p2mf_push_linear(struct nouveau_context *nv,
                           struct nouveau_bo *dst, unsigned offset,
                           unsigned domain, unsigned size, const void *data);

void nvc0_cb_bo_push(struct nouveau_context *nv,
                     struct nouveau_bo *bo, unsigned domain,
                     unsigned base, unsigned size,
                     unsigned offset, unsigned words, const uint32_t *data);
413
/* nvc0_vbo.c */
void nvc0_draw_vbo(struct pipe_context *pipe,
                   const struct pipe_draw_info *info);

void *nvc0_vertex_state_create(struct pipe_context *pipe,
                               unsigned num_elements,
                               const struct pipe_vertex_element *elements);

void nvc0_vertex_state_delete(struct pipe_context *pipe, void *hwcso);

void nvc0_vertex_arrays_validate(struct nvc0_context *nvc0);

void nvc0_idxbuf_validate(struct nvc0_context *nvc0);
427
/* nvc0_video.c */
struct pipe_video_codec *nvc0_create_decoder(struct pipe_context *context,
                                             const struct pipe_video_codec *templ);

struct pipe_video_buffer *nvc0_video_buffer_create(struct pipe_context *pipe,
                                                   const struct pipe_video_buffer *templat);
436
/* nvc0_push.c */
void
nvc0_push_vbo(struct nvc0_context *nvc0, const struct pipe_draw_info *info);

void
nvc0_push_vbo_indirect(struct nvc0_context *nvc0,
                       const struct pipe_draw_info *info);
440
/* nve4_compute.c */
void
nve4_launch_grid(struct pipe_context *pipe, const struct pipe_grid_info *info);

/* nvc0_compute.c */
void
nvc0_launch_grid(struct pipe_context *pipe, const struct pipe_grid_info *info);

void
nvc0_compute_validate_globals(struct nvc0_context *nvc0);

void
nvc0_update_compute_invocations_counter(struct nvc0_context *nvc0,
                                        const struct pipe_grid_info *info);
449
450 #endif