intel: Pack dynamic draws together
[mesa.git] / src / mesa / drivers / dri / intel / intel_context.h
1 /**************************************************************************
2 *
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #ifndef INTELCONTEXT_INC
29 #define INTELCONTEXT_INC
30
31
32 #include <stdbool.h>
33 #include "main/mtypes.h"
34 #include "main/mm.h"
35
36 #ifdef __cplusplus
37 extern "C" {
38 /* Evil hack for using libdrm in a c++ compiler. */
39 #define virtual virt
40 #endif
41
42 #include "drm.h"
43 #include "intel_bufmgr.h"
44
45 #include "intel_screen.h"
46 #include "intel_tex_obj.h"
47 #include "i915_drm.h"
48
49 #ifdef __cplusplus
50 #undef virtual
51 }
52 #endif
53
54 #include "tnl/t_vertex.h"
55
56 #define TAG(x) intel##x
57 #include "tnl_dd/t_dd_vertex.h"
58 #undef TAG
59
/*
 * DV_PF_* selector codes.  Each value is a small code shifted into bits 8
 * and above.  NOTE(review): "PF" presumably stands for pixel format --
 * confirm against the users of these macros.
 */
#define DV_PF_555    (1 << 8)
#define DV_PF_565    (2 << 8)
#define DV_PF_8888   (3 << 8)
#define DV_PF_4444   (8 << 8)
#define DV_PF_1555   (9 << 8)
65
66 struct intel_region;
67 struct intel_context;
68
69 typedef void (*intel_tri_func) (struct intel_context *, intelVertex *,
70 intelVertex *, intelVertex *);
71 typedef void (*intel_line_func) (struct intel_context *, intelVertex *,
72 intelVertex *);
73 typedef void (*intel_point_func) (struct intel_context *, intelVertex *);
74
/**
 * Flag bits stored in the intel->Fallback mask.
 *
 * INTEL_FALLBACK_DRIVER is the first bit left for drivers.
 */
/*@{*/
#define INTEL_FALLBACK_DRAW_BUFFER     0x1
#define INTEL_FALLBACK_READ_BUFFER     0x2
#define INTEL_FALLBACK_DEPTH_BUFFER    0x4
#define INTEL_FALLBACK_STENCIL_BUFFER  0x8
#define INTEL_FALLBACK_USER            0x10
#define INTEL_FALLBACK_RENDERMODE      0x20
#define INTEL_FALLBACK_TEXTURE         0x40
#define INTEL_FALLBACK_DRIVER          0x1000  /**< first for drivers */
/*@}*/
88
89 extern void intelFallback(struct intel_context *intel, GLbitfield bit,
90 GLboolean mode);
91 #define FALLBACK( intel, bit, mode ) intelFallback( intel, bit, mode )
92
93
/* Access-type flag bits (distinct bits, so they can be OR-ed together). */
#define INTEL_WRITE_PART   0x1
#define INTEL_WRITE_FULL   0x2
#define INTEL_READ         0x4

/* NOTE(review): limit on "fixups"; its users are not visible in this header. */
#define INTEL_MAX_FIXUP    64
99
/**
 * Branch-prediction hints.
 *
 * likely(expr) / unlikely(expr) evaluate to 1 when expr is true and 0 when
 * it is false.  With GCC-compatible compilers they also tell the optimizer
 * which outcome to expect.
 *
 * The expression is normalised with `!!` before it reaches
 * __builtin_expect(): that builtin compares its first argument (a long)
 * against the expected value, so an un-normalised truthy value such as 2
 * would be hinted as the unexpected case, a pointer argument would be
 * implicitly converted to an integer, and a value wider than long could
 * be truncated.
 */
#ifndef likely
#ifdef __GNUC__
#define likely(expr)   (__builtin_expect(!!(expr), 1))
#define unlikely(expr) (__builtin_expect(!!(expr), 0))
#else
#define likely(expr)   (!!(expr))
#define unlikely(expr) (!!(expr))
#endif
#endif
109
110 struct intel_sync_object {
111 struct gl_sync_object Base;
112
113 /** Batch associated with this sync object */
114 drm_intel_bo *bo;
115 };
116
117 /**
118 * intel_context is derived from Mesa's context class: struct gl_context.
119 */
120 struct intel_context
121 {
122 struct gl_context ctx; /**< base class, must be first field */
123
124 struct
125 {
126 void (*destroy) (struct intel_context * intel);
127 void (*emit_state) (struct intel_context * intel);
128 void (*finish_batch) (struct intel_context * intel);
129 void (*new_batch) (struct intel_context * intel);
130 void (*emit_invarient_state) (struct intel_context * intel);
131 void (*update_texture_state) (struct intel_context * intel);
132
133 void (*render_start) (struct intel_context * intel);
134 void (*render_prevalidate) (struct intel_context * intel);
135 void (*set_draw_region) (struct intel_context * intel,
136 struct intel_region * draw_regions[],
137 struct intel_region * depth_region,
138 GLuint num_regions);
139
140 void (*reduced_primitive_state) (struct intel_context * intel,
141 GLenum rprim);
142
143 GLboolean (*check_vertex_size) (struct intel_context * intel,
144 GLuint expected);
145 void (*invalidate_state) (struct intel_context *intel,
146 GLuint new_state);
147
148 void (*assert_not_dirty) (struct intel_context *intel);
149
150 void (*debug_batch)(struct intel_context *intel);
151 bool (*render_target_supported)(gl_format format);
152 } vtbl;
153
154 GLbitfield Fallback; /**< mask of INTEL_FALLBACK_x bits */
155 GLuint NewGLState;
156
157 dri_bufmgr *bufmgr;
158 unsigned int maxBatchSize;
159
160 /**
161 * Generation number of the hardware: 2 is 8xx, 3 is 9xx pre-965, 4 is 965.
162 */
163 int gen;
164 GLboolean needs_ff_sync;
165 GLboolean is_g4x;
166 GLboolean is_945;
167 GLboolean has_luminance_srgb;
168 GLboolean has_xrgb_textures;
169
170 int urb_size;
171
172 struct intel_batchbuffer *batch;
173 drm_intel_bo *first_post_swapbuffers_batch;
174 GLboolean need_throttle;
175 GLboolean no_batch_wrap;
176
177 struct
178 {
179 GLuint id;
180 uint32_t primitive; /**< Current hardware primitive type */
181 void (*flush) (struct intel_context *);
182 GLubyte *start_ptr; /**< for i8xx */
183 drm_intel_bo *vb_bo;
184 uint8_t *vb;
185 unsigned int start_offset; /**< Byte offset of primitive sequence */
186 unsigned int current_offset; /**< Byte offset of next vertex */
187 unsigned int count; /**< Number of vertices in current primitive */
188 } prim;
189
190 struct {
191 drm_intel_bo *bo;
192 GLuint offset;
193 } upload;
194
195 GLuint stats_wm;
196
197 /* Offsets of fields within the current vertex:
198 */
199 GLuint coloroffset;
200 GLuint specoffset;
201 GLuint wpos_offset;
202 GLuint wpos_size;
203
204 struct tnl_attr_map vertex_attrs[VERT_ATTRIB_MAX];
205 GLuint vertex_attr_count;
206
207 GLfloat polygon_offset_scale; /* dependent on depth_scale, bpp */
208
209 GLboolean hw_stencil;
210 GLboolean hw_stipple;
211 GLboolean depth_buffer_is_float;
212 GLboolean no_rast;
213 GLboolean always_flush_batch;
214 GLboolean always_flush_cache;
215
216 /* 0 - nonconformant, best performance;
217 * 1 - fallback to sw for known conformance bugs
218 * 2 - always fallback to sw
219 */
220 GLuint conformance_mode;
221
222 /* State for intelvb.c and inteltris.c.
223 */
224 GLuint RenderIndex;
225 GLmatrix ViewportMatrix;
226 GLenum render_primitive;
227 GLenum reduced_primitive;
228 GLuint vertex_size;
229 GLubyte *verts; /* points to tnl->clipspace.vertex_buf */
230
231 /* Fallback rasterization functions
232 */
233 intel_point_func draw_point;
234 intel_line_func draw_line;
235 intel_tri_func draw_tri;
236
237 /**
238 * Set if rendering has occured to the drawable's front buffer.
239 *
240 * This is used in the DRI2 case to detect that glFlush should also copy
241 * the contents of the fake front buffer to the real front buffer.
242 */
243 GLboolean front_buffer_dirty;
244
245 /**
246 * Track whether front-buffer rendering is currently enabled
247 *
248 * A separate flag is used to track this in order to support MRT more
249 * easily.
250 */
251 GLboolean is_front_buffer_rendering;
252 /**
253 * Track whether front-buffer is the current read target.
254 *
255 * This is closely associated with is_front_buffer_rendering, but may
256 * be set separately. The DRI2 fake front buffer must be referenced
257 * either way.
258 */
259 GLboolean is_front_buffer_reading;
260
261 GLboolean use_texture_tiling;
262 GLboolean use_early_z;
263
264 int driFd;
265
266 __DRIcontext *driContext;
267 struct intel_screen *intelScreen;
268 void (*saved_viewport)(struct gl_context * ctx,
269 GLint x, GLint y, GLsizei width, GLsizei height);
270
271 /**
272 * Configuration cache
273 */
274 driOptionCache optionCache;
275 };
276
/* Declared here; the definition lives outside this header. */
extern char *__progname;


#define SUBPIXEL_X 0.125
#define SUBPIXEL_Y 0.125

/**
 * Number of elements in x.  x must be a real array, not a pointer.
 */
#define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0]))

/**
 * Rounds value up to the next multiple of alignment.
 * The mask arithmetic only works when alignment is a power of two.
 * Arguments are fully parenthesized so that expressions such as
 * ALIGN(n, 2 << 1) expand correctly; each argument may still be
 * evaluated more than once.
 */
#define ALIGN(value, alignment) \
   (((value) + (alignment) - 1) & ~((alignment) - 1))

/**
 * Rounds value down to a multiple of alignment (a power of two).
 * A value that is already aligned is returned unchanged.
 *
 * The previous definition went through ALIGN(value - alignment - 1, ...),
 * which reduces to (value - 2) & ~(alignment - 1) and therefore gave
 * 4 for ROUND_DOWN_TO(8, 4).
 */
#define ROUND_DOWN_TO(value, alignment) ((value) & ~((alignment) - 1))

/**
 * True when val has at most one bit set.  Note that 0 is reported as a
 * power of two as well.
 */
#define IS_POWER_OF_TWO(val) (((val) & ((val) - 1)) == 0)
288
/**
 * Converts a float to unsigned fixed point.
 *
 * \param value      number to convert
 * \param frac_bits  number of fractional bits in the result; must be
 *                   less than 32 for the shift to be defined
 * \return value * 2^frac_bits truncated toward zero, or 0 when the scaled
 *         value is negative.  The scaled value must fit in 32 bits.
 */
static INLINE uint32_t
U_FIXED(float value, uint32_t frac_bits)
{
   /* Shift an unsigned 1: a signed (1 << 31) overflows int, which made the
    * scale negative and clamped every 31-fractional-bit result to 0.
    */
   value *= (float) (1u << frac_bits);

   if (value < 0)
      return 0;

   return (uint32_t) value;
}
295
/**
 * Converts a float to signed fixed point, returned as its raw 32-bit
 * two's-complement bit pattern.
 *
 * \param value      number to convert (may be negative)
 * \param frac_bits  number of fractional bits in the result; must be
 *                   small enough that (1 << frac_bits) fits in an int
 * \return value * 2^frac_bits truncated toward zero, as a uint32_t.  The
 *         scaled value must fit in a signed 32-bit integer.
 */
static INLINE uint32_t
S_FIXED(float value, uint32_t frac_bits)
{
   /* Go through int32_t first: converting a negative float straight to an
    * unsigned type is undefined behaviour, whereas int32_t -> uint32_t is
    * a well-defined modulo-2^32 conversion.
    */
   const int32_t fixed = (int32_t) (value * (1 << frac_bits));

   return (uint32_t) fixed;
}
301
/**
 * Calls intel->prim.flush(intel) when a flush callback is installed and
 * does nothing otherwise.  The argument is evaluated more than once.
 */
#define INTEL_FIREVERTICES(intel)              \
   do {                                        \
      if ((intel)->prim.flush) {               \
         (intel)->prim.flush(intel);           \
      }                                        \
   } while (0)
307
/* ================================================================
 * Copy routine taken from the linux kernel i386 header files; it copes
 * with odd sizes better than COPY_DWORDS would.
 *
 * On i386 it copies n/4 dwords with "rep movsl", then one more 16-bit
 * word if bit 1 of n is set, then one more byte if bit 0 of n is set.
 * On every other architecture it is simply memcpy().
 *
 * XXX Put this in src/mesa/main/imports.h ???
 */
#if defined(i386) || defined(__i386__)
static INLINE void *
__memcpy(void *to, const void *from, size_t n)
{
   /* Dummy outputs: they tell the compiler the asm modifies the count,
    * destination and source registers.
    */
   int cnt_out, dst_out, src_out;

   __asm__ __volatile__(
      "rep ; movsl\n\t"
      "testb $2,%b4\n\t"
      "je 1f\n\t"
      "movsw\n"
      "1:\ttestb $1,%b4\n\t"
      "je 2f\n\t"
      "movsb\n"
      "2:"
      : "=&c" (cnt_out), "=&D" (dst_out), "=&S" (src_out)
      : "0" (n/4), "q" (n), "1" ((long) to), "2" ((long) from)
      : "memory");

   return to;
}
#else
#define __memcpy(a,b,c) memcpy(a,b,c)
#endif
334
335
/* ================================================================
 * Debugging.
 *
 * INTEL_DEBUG is a mask of the DEBUG_* bits below; the DBG() and
 * fallback_debug() macros in this header test it.
 */
extern int INTEL_DEBUG;

#define DEBUG_TEXTURE         0x00000001
#define DEBUG_STATE           0x00000002
#define DEBUG_IOCTL           0x00000004
#define DEBUG_BLIT            0x00000008
#define DEBUG_MIPTREE         0x00000010
#define DEBUG_FALLBACKS       0x00000020
#define DEBUG_VERBOSE         0x00000040
#define DEBUG_BATCH           0x00000080
#define DEBUG_PIXEL           0x00000100
#define DEBUG_BUFMGR          0x00000200
#define DEBUG_REGION          0x00000400
#define DEBUG_FBO             0x00000800
#define DEBUG_GS              0x00001000
#define DEBUG_SYNC            0x00002000
#define DEBUG_PRIMS           0x00004000
#define DEBUG_VERTS           0x00008000
#define DEBUG_DRI             0x00010000
#define DEBUG_SF              0x00020000
#define DEBUG_SANITY          0x00040000
#define DEBUG_SLEEP           0x00080000
#define DEBUG_STATS           0x00100000
#define DEBUG_TILE            0x00200000
#define DEBUG_SINGLE_THREAD   0x00400000
#define DEBUG_WM              0x00800000
#define DEBUG_URB             0x01000000
#define DEBUG_VS              0x02000000
/* 0x04000000 is not assigned. */
#define DEBUG_CLIP            0x08000000
367 #define DEBUG_CLIP 0x8000000
368
/**
 * printf()s its arguments when INTEL_DEBUG has the bit(s) named by
 * FILE_DEBUG_FLAG set.  FILE_DEBUG_FLAG is not defined in this header;
 * it has to be defined wherever DBG() is used.
 */
#define DBG(...)                                         \
   do {                                                  \
      if (unlikely(INTEL_DEBUG & FILE_DEBUG_FLAG)) {     \
         printf(__VA_ARGS__);                            \
      }                                                  \
   } while (0)

/** printf()s its arguments when the DEBUG_FALLBACKS bit of INTEL_DEBUG is set. */
#define fallback_debug(...)                              \
   do {                                                  \
      if (unlikely(INTEL_DEBUG & DEBUG_FALLBACKS)) {     \
         printf(__VA_ARGS__);                            \
      }                                                  \
   } while (0)
378
/* PCI device IDs, keyed by chip name. */
#define PCI_CHIP_845_G      0x2562
#define PCI_CHIP_I830_M     0x3577
#define PCI_CHIP_I855_GM    0x3582
#define PCI_CHIP_I865_G     0x2572
#define PCI_CHIP_I915_G     0x2582
#define PCI_CHIP_I915_GM    0x2592
#define PCI_CHIP_I945_G     0x2772
#define PCI_CHIP_I945_GM    0x27a2
#define PCI_CHIP_I945_GME   0x27ae
#define PCI_CHIP_G33_G      0x29c2
#define PCI_CHIP_Q35_G      0x29b2
#define PCI_CHIP_Q33_G      0x29d2
391
392
393 /* ================================================================
394 * intel_context.c:
395 */
396
397 extern GLboolean intelInitContext(struct intel_context *intel,
398 int api,
399 const struct gl_config * mesaVis,
400 __DRIcontext * driContextPriv,
401 void *sharedContextPrivate,
402 struct dd_function_table *functions);
403
404 extern void intelFinish(struct gl_context * ctx);
405 extern void intel_flush(struct gl_context * ctx);
406
407 extern void intelInitDriverFunctions(struct dd_function_table *functions);
408
409 void intel_init_syncobj_functions(struct dd_function_table *functions);
410
411
412 /* ================================================================
413 * intel_state.c:
414 */
415 extern void intelInitStateFuncs(struct dd_function_table *functions);
416
/*
 * Numeric codes for compare functions, stencil ops, logic ops and blend
 * factors.
 * NOTE(review): presumably the hardware encodings produced by the
 * intel_translate_*() helpers declared in this header -- confirm against
 * intel_state.c.
 */

/* Compare functions */
#define COMPAREFUNC_ALWAYS             0
#define COMPAREFUNC_NEVER              0x1
#define COMPAREFUNC_LESS               0x2
#define COMPAREFUNC_EQUAL              0x3
#define COMPAREFUNC_LEQUAL             0x4
#define COMPAREFUNC_GREATER            0x5
#define COMPAREFUNC_NOTEQUAL           0x6
#define COMPAREFUNC_GEQUAL             0x7

/* Stencil operations */
#define STENCILOP_KEEP                 0
#define STENCILOP_ZERO                 0x1
#define STENCILOP_REPLACE              0x2
#define STENCILOP_INCRSAT              0x3
#define STENCILOP_DECRSAT              0x4
#define STENCILOP_INCR                 0x5
#define STENCILOP_DECR                 0x6
#define STENCILOP_INVERT               0x7

/* Logic operations */
#define LOGICOP_CLEAR                  0
#define LOGICOP_NOR                    0x1
#define LOGICOP_AND_INV                0x2
#define LOGICOP_COPY_INV               0x3
#define LOGICOP_AND_RVRSE              0x4
#define LOGICOP_INV                    0x5
#define LOGICOP_XOR                    0x6
#define LOGICOP_NAND                   0x7
#define LOGICOP_AND                    0x8
#define LOGICOP_EQUIV                  0x9
#define LOGICOP_NOOP                   0xa
#define LOGICOP_OR_INV                 0xb
#define LOGICOP_COPY                   0xc
#define LOGICOP_OR_RVRSE               0xd
#define LOGICOP_OR                     0xe
#define LOGICOP_SET                    0xf

/* Blend factors; BLENDFACT_MASK covers every value above it. */
#define BLENDFACT_ZERO                 0x01
#define BLENDFACT_ONE                  0x02
#define BLENDFACT_SRC_COLR             0x03
#define BLENDFACT_INV_SRC_COLR         0x04
#define BLENDFACT_SRC_ALPHA            0x05
#define BLENDFACT_INV_SRC_ALPHA        0x06
#define BLENDFACT_DST_ALPHA            0x07
#define BLENDFACT_INV_DST_ALPHA        0x08
#define BLENDFACT_DST_COLR             0x09
#define BLENDFACT_INV_DST_COLR         0x0a
#define BLENDFACT_SRC_ALPHA_SATURATE   0x0b
#define BLENDFACT_CONST_COLOR          0x0c
#define BLENDFACT_INV_CONST_COLOR      0x0d
#define BLENDFACT_CONST_ALPHA          0x0e
#define BLENDFACT_INV_CONST_ALPHA      0x0f
#define BLENDFACT_MASK                 0x0f
468
/* Buffer-object reuse settings: DISABLED is 0, ALL is 1. */
enum
{
   DRI_CONF_BO_REUSE_DISABLED,
   DRI_CONF_BO_REUSE_ALL
};
473
474 extern int intel_translate_shadow_compare_func(GLenum func);
475 extern int intel_translate_compare_func(GLenum func);
476 extern int intel_translate_stencil_op(GLenum op);
477 extern int intel_translate_blend_factor(GLenum factor);
478 extern int intel_translate_logic_op(GLenum opcode);
479
480 void intel_update_renderbuffers(__DRIcontext *context,
481 __DRIdrawable *drawable);
482 void intel_prepare_render(struct intel_context *intel);
483
484 void i915_set_buf_info_for_region(uint32_t *state, struct intel_region *region,
485 uint32_t buffer_id);
486
487 /*======================================================================
488 * Inline conversion functions.
489 * These are better-typed than the macros used previously:
490 */
491 static INLINE struct intel_context *
492 intel_context(struct gl_context * ctx)
493 {
494 return (struct intel_context *) ctx;
495 }
496
497 static INLINE GLboolean
498 is_power_of_two(uint32_t value)
499 {
500 return (value & (value - 1)) == 0;
501 }
502
503 #endif