intel: Add always_flush_batch driconf option for making small batchbuffers.
[mesa.git] / src / mesa / drivers / dri / intel / intel_context.h
1 /**************************************************************************
2 *
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #ifndef INTELCONTEXT_INC
29 #define INTELCONTEXT_INC
30
31
32
33 #include "main/mtypes.h"
34 #include "main/mm.h"
35 #include "texmem.h"
36 #include "drm.h"
37 #include "intel_bufmgr.h"
38
39 #include "intel_screen.h"
40 #include "intel_tex_obj.h"
41 #include "i915_drm.h"
42 #include "tnl/t_vertex.h"
43
44 #define TAG(x) intel##x
45 #include "tnl_dd/t_dd_vertex.h"
46 #undef TAG
47
/* Pixel-format selectors compared against the `format` argument of
 * INTEL_PACKCOLOR(); the values occupy bits 8-9.
 */
#define DV_PF_555   0x100
#define DV_PF_565   0x200
#define DV_PF_8888  0x300
51
52 struct intel_region;
53 struct intel_context;
54
55 typedef void (*intel_tri_func) (struct intel_context *, intelVertex *,
56 intelVertex *, intelVertex *);
57 typedef void (*intel_line_func) (struct intel_context *, intelVertex *,
58 intelVertex *);
59 typedef void (*intel_point_func) (struct intel_context *, intelVertex *);
60
/* Bit values passed as the `bit` argument of intelFallback(); each one
 * is a distinct single bit.
 */
#define INTEL_FALLBACK_DRAW_BUFFER     (1 << 0)
#define INTEL_FALLBACK_READ_BUFFER     (1 << 1)
#define INTEL_FALLBACK_DEPTH_BUFFER    (1 << 2)
#define INTEL_FALLBACK_STENCIL_BUFFER  (1 << 3)
#define INTEL_FALLBACK_USER            (1 << 4)
#define INTEL_FALLBACK_RENDERMODE      (1 << 5)
#define INTEL_FALLBACK_TEXTURE         (1 << 6)
68
69 extern void intelFallback(struct intel_context *intel, GLuint bit,
70 GLboolean mode);
71 #define FALLBACK( intel, bit, mode ) intelFallback( intel, bit, mode )
72
73
/* Access-type flag bits. */
#define INTEL_WRITE_PART  (1 << 0)
#define INTEL_WRITE_FULL  (1 << 1)
#define INTEL_READ        (1 << 2)

#define INTEL_MAX_FIXUP   64
79
80 struct intel_context
81 {
82 GLcontext ctx; /* the parent class */
83
84 struct
85 {
86 void (*destroy) (struct intel_context * intel);
87 void (*emit_state) (struct intel_context * intel);
88 void (*finish_batch) (struct intel_context * intel);
89 void (*new_batch) (struct intel_context * intel);
90 void (*emit_invarient_state) (struct intel_context * intel);
91 void (*note_fence) (struct intel_context *intel, GLuint fence);
92 void (*note_unlock) (struct intel_context *intel);
93 void (*update_texture_state) (struct intel_context * intel);
94
95 void (*render_start) (struct intel_context * intel);
96 void (*render_prevalidate) (struct intel_context * intel);
97 void (*set_draw_region) (struct intel_context * intel,
98 struct intel_region * draw_regions[],
99 struct intel_region * depth_region,
100 GLuint num_regions);
101
102 GLuint (*flush_cmd) (void);
103
104 void (*reduced_primitive_state) (struct intel_context * intel,
105 GLenum rprim);
106
107 GLboolean (*check_vertex_size) (struct intel_context * intel,
108 GLuint expected);
109 void (*invalidate_state) (struct intel_context *intel,
110 GLuint new_state);
111
112
113 /* Metaops:
114 */
115 void (*install_meta_state) (struct intel_context * intel);
116 void (*leave_meta_state) (struct intel_context * intel);
117
118 void (*meta_draw_region) (struct intel_context * intel,
119 struct intel_region * draw_region,
120 struct intel_region * depth_region);
121
122 void (*meta_draw_quad)(struct intel_context *intel,
123 GLfloat x0, GLfloat x1,
124 GLfloat y0, GLfloat y1,
125 GLfloat z,
126 GLuint color, /* ARGB32 */
127 GLfloat s0, GLfloat s1,
128 GLfloat t0, GLfloat t1);
129
130 void (*meta_color_mask) (struct intel_context * intel, GLboolean);
131
132 void (*meta_stencil_replace) (struct intel_context * intel,
133 GLuint mask, GLuint clear);
134
135 void (*meta_depth_replace) (struct intel_context * intel);
136
137 void (*meta_texture_blend_replace) (struct intel_context * intel);
138
139 void (*meta_no_stencil_write) (struct intel_context * intel);
140 void (*meta_no_depth_write) (struct intel_context * intel);
141 void (*meta_no_texture) (struct intel_context * intel);
142
143 void (*meta_import_pixel_state) (struct intel_context * intel);
144 void (*meta_frame_buffer_texture) (struct intel_context *intel,
145 GLint xoff, GLint yoff);
146
147 GLboolean(*meta_tex_rect_source) (struct intel_context * intel,
148 dri_bo * buffer,
149 GLuint offset,
150 GLuint pitch,
151 GLuint height,
152 GLenum format, GLenum type);
153
154 void (*assert_not_dirty) (struct intel_context *intel);
155
156 void (*debug_batch)(struct intel_context *intel);
157 } vtbl;
158
159 struct {
160 struct gl_fragment_program *bitmap_fp;
161 struct gl_vertex_program *passthrough_vp;
162
163 struct gl_fragment_program *saved_fp;
164 GLboolean saved_fp_enable;
165 struct gl_vertex_program *saved_vp;
166 GLboolean saved_vp_enable;
167
168 GLint saved_vp_x, saved_vp_y;
169 GLsizei saved_vp_width, saved_vp_height;
170 GLenum saved_matrix_mode;
171 } meta;
172
173 GLint refcount;
174 GLuint Fallback;
175 GLuint NewGLState;
176
177 dri_bufmgr *bufmgr;
178 unsigned int maxBatchSize;
179
180 struct intel_region *front_region;
181 struct intel_region *back_region;
182 struct intel_region *depth_region;
183
184 /**
185 * This value indicates that the kernel memory manager is being used
186 * instead of the fake client-side memory manager.
187 */
188 GLboolean ttm;
189
190 struct intel_batchbuffer *batch;
191 GLboolean no_batch_wrap;
192 unsigned batch_id;
193
194 struct
195 {
196 GLuint id;
197 uint32_t primitive; /**< Current hardware primitive type */
198 void (*flush) (struct intel_context *);
199 GLubyte *start_ptr; /**< for i8xx */
200 dri_bo *vb_bo;
201 uint8_t *vb;
202 unsigned int start_offset; /**< Byte offset of primitive sequence */
203 unsigned int current_offset; /**< Byte offset of next vertex */
204 unsigned int count; /**< Number of vertices in current primitive */
205 } prim;
206
207 GLuint stats_wm;
208 GLboolean locked;
209 char *prevLockFile;
210 int prevLockLine;
211
212 GLuint ClearColor565;
213 GLuint ClearColor8888;
214
215 /* Offsets of fields within the current vertex:
216 */
217 GLuint coloroffset;
218 GLuint specoffset;
219 GLuint wpos_offset;
220 GLuint wpos_size;
221
222 struct tnl_attr_map vertex_attrs[VERT_ATTRIB_MAX];
223 GLuint vertex_attr_count;
224
225 GLfloat polygon_offset_scale; /* dependent on depth_scale, bpp */
226
227 GLboolean hw_stencil;
228 GLboolean hw_stipple;
229 GLboolean depth_buffer_is_float;
230 GLboolean no_rast;
231 GLboolean always_flush_batch;
232 GLboolean always_flush_cache;
233
234 /* 0 - nonconformant, best performance;
235 * 1 - fallback to sw for known conformance bugs
236 * 2 - always fallback to sw
237 */
238 GLuint conformance_mode;
239
240 /* State for intelvb.c and inteltris.c.
241 */
242 GLuint RenderIndex;
243 GLmatrix ViewportMatrix;
244 GLenum render_primitive;
245 GLenum reduced_primitive;
246 GLuint vertex_size;
247 GLubyte *verts; /* points to tnl->clipspace.vertex_buf */
248
249 /* Fallback rasterization functions
250 */
251 intel_point_func draw_point;
252 intel_line_func draw_line;
253 intel_tri_func draw_tri;
254
255 /* These refer to the current drawing buffer:
256 */
257 struct gl_texture_object *frame_buffer_texobj;
258 /**
259 * Set to true if a single constant cliprect should be used in the
260 * batchbuffer. Otherwise, cliprects must be calculated at batchbuffer
261 * flush time while the lock is held.
262 */
263 GLboolean constant_cliprect;
264 /**
265 * In !constant_cliprect mode, set to true if the front cliprects should be
266 * used instead of back.
267 */
268 GLboolean front_cliprects;
269 drm_clip_rect_t fboRect; /**< cliprect for FBO rendering */
270
271 int perf_boxes;
272
273 GLuint do_usleeps;
274 int do_irqs;
275 GLuint irqsEmitted;
276
277 GLboolean scissor;
278 drm_clip_rect_t draw_rect;
279 drm_clip_rect_t scissor_rect;
280
281 drm_context_t hHWContext;
282 drmLock *driHwLock;
283 int driFd;
284
285 __DRIcontextPrivate *driContext;
286 __DRIdrawablePrivate *driDrawable;
287 __DRIdrawablePrivate *driReadDrawable;
288 __DRIscreenPrivate *driScreen;
289 intelScreenPrivate *intelScreen;
290 volatile struct drm_i915_sarea *sarea;
291
292 GLuint lastStamp;
293
294 GLboolean no_hw;
295
296 /**
297 * Configuration cache
298 */
299 driOptionCache optionCache;
300
301 int64_t swap_ust;
302 int64_t swap_missed_ust;
303
304 GLuint swap_count;
305 GLuint swap_missed_count;
306 };
307
/* LOCK_HARDWARE / UNLOCK_HARDWARE keep their macro-style upper-case
 * names but are ordinary functions now, each taking the context.
 */
extern void LOCK_HARDWARE(struct intel_context *intel);
extern void UNLOCK_HARDWARE(struct intel_context *intel);

/* Declared here, defined elsewhere. */
extern char *__progname;
314
315
#define SUBPIXEL_X 0.125
#define SUBPIXEL_Y 0.125

/* Number of elements in a true array (not a pointer or an array
 * parameter, which has already decayed to a pointer).
 */
#define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0]))

/* Round `value` up to the next multiple of `alignment`.  The mask trick
 * is only correct when `alignment` is a power of two.  Both arguments
 * are fully parenthesized so expressions such as `1 << 2` or `a | b`
 * are not re-associated by operator precedence; `alignment` is still
 * evaluated twice, so avoid side effects in it.
 */
#define ALIGN(value, alignment) \
   (((value) + (alignment) - 1) & ~((alignment) - 1))
321
/* Call the context's prim.flush hook if one is installed, passing the
 * context itself.  `intel` is expanded more than once, so it must be
 * free of side effects.
 */
#define INTEL_FIREVERTICES(intel)          \
   do {                                    \
      if ((intel)->prim.flush) {           \
         (intel)->prim.flush(intel);       \
      }                                    \
   } while (0)
327
328 /* ================================================================
329 * Color packing:
330 */
331
/* Pack 8-bit-per-channel colour components into a single pixel value.
 * Every argument is parenthesized so arbitrary expressions can be
 * passed, and every channel is masked to the bits it contributes.
 */

/* 4 bits per channel, laid out as A:R:G:B from the top nibble down. */
#define INTEL_PACKCOLOR4444(r,g,b,a) \
   ((((a) & 0xf0) << 8) | (((r) & 0xf0) << 4) | ((g) & 0xf0) | \
    (((b) & 0xf0) >> 4))

/* 5 bits each of R, G, B; bit 15 is set when `a` is non-zero. */
#define INTEL_PACKCOLOR1555(r,g,b,a) \
   ((((r) & 0xf8) << 7) | (((g) & 0xf8) << 2) | (((b) & 0xf8) >> 3) | \
    ((a) ? 0x8000 : 0))

/* 5 bits red, 6 bits green, 5 bits blue. */
#define INTEL_PACKCOLOR565(r,g,b) \
   ((((r) & 0xf8) << 8) | (((g) & 0xfc) << 3) | (((b) & 0xf8) >> 3))

/* 8 bits per channel, A:R:G:B.  Alpha is converted to unsigned before
 * the shift: shifting a signed int value >= 0x80 left by 24 overflows,
 * which is undefined behaviour.
 */
#define INTEL_PACKCOLOR8888(r,g,b,a) \
   (((unsigned int)(a) << 24) | ((r) << 16) | ((g) << 8) | (b))

/* Select the packing by DV_PF_* format code; unknown formats yield 0. */
#define INTEL_PACKCOLOR(format, r, g, b, a) \
   ((format) == DV_PF_555 ? INTEL_PACKCOLOR1555(r,g,b,a) : \
    ((format) == DV_PF_565 ? INTEL_PACKCOLOR565(r,g,b) : \
     ((format) == DV_PF_8888 ? INTEL_PACKCOLOR8888(r,g,b,a) : \
      0)))
350
/* ================================================================
 * __memcpy: copy n bytes from `from` to `to` and return `to`.
 *
 * On 32-bit x86 this is the inline-assembly routine from the linux
 * kernel i386 header files: "rep movsl" moves n/4 dwords, then bits 1
 * and 0 of n decide whether a trailing word and/or byte is moved, so it
 * copes with odd sizes better than COPY_DWORDS would.  On every other
 * target it is simply memcpy().
 * XXX Put this in src/mesa/main/imports.h ???
 */
#if defined(i386) || defined(__i386__)
static INLINE void * __memcpy(void * to, const void * from, size_t n)
{
   /* Dummy outputs: tell the compiler that ECX, EDI and ESI are
    * modified by the string instructions.
    */
   int cnt, dst, src;

   __asm__ __volatile__(
      "rep ; movsl\n\t"
      "testb $2,%b4\n\t"
      "je 1f\n\t"
      "movsw\n"
      "1:\ttestb $1,%b4\n\t"
      "je 2f\n\t"
      "movsb\n"
      "2:"
      : "=&c" (cnt), "=&D" (dst), "=&S" (src)
      : "0" (n/4), "q" (n), "1" ((long) to), "2" ((long) from)
      : "memory");

   return to;
}
#else
#define __memcpy(a,b,c) memcpy(a,b,c)
#endif
377
378
379 /* ================================================================
380 * Debugging:
381 */
/* Bitmask of enabled DEBUG_* categories; defined outside this header. */
extern int INTEL_DEBUG;

/* One bit per debug category. */
#define DEBUG_TEXTURE        (1 << 0)
#define DEBUG_STATE          (1 << 1)
#define DEBUG_IOCTL          (1 << 2)
#define DEBUG_BLIT           (1 << 3)
#define DEBUG_MIPTREE        (1 << 4)
#define DEBUG_FALLBACKS      (1 << 5)
#define DEBUG_VERBOSE        (1 << 6)
#define DEBUG_BATCH          (1 << 7)
#define DEBUG_PIXEL          (1 << 8)
#define DEBUG_BUFMGR         (1 << 9)
#define DEBUG_REGION         (1 << 10)
#define DEBUG_FBO            (1 << 11)
#define DEBUG_LOCK           (1 << 12)
#define DEBUG_SYNC           (1 << 13)
#define DEBUG_PRIMS          (1 << 14)
#define DEBUG_VERTS          (1 << 15)
#define DEBUG_DRI            (1 << 16)
#define DEBUG_DMA            (1 << 17)
#define DEBUG_SANITY         (1 << 18)
#define DEBUG_SLEEP          (1 << 19)
#define DEBUG_STATS          (1 << 20)
#define DEBUG_TILE           (1 << 21)
#define DEBUG_SINGLE_THREAD  (1 << 22)
#define DEBUG_WM             (1 << 23)
#define DEBUG_URB            (1 << 24)
#define DEBUG_VS             (1 << 25)

/* printf-style debug output, emitted only when the including file's
 * FILE_DEBUG_FLAG bit is set in INTEL_DEBUG.  FILE_DEBUG_FLAG is not
 * defined in this header; the user of DBG() must supply it.
 */
#define DBG(...)                               \
   do {                                        \
      if (INTEL_DEBUG & FILE_DEBUG_FLAG) {     \
         _mesa_printf(__VA_ARGS__);            \
      }                                        \
   } while (0)
415
/* PCI chip identifiers, one per supported chip name. */
#define PCI_CHIP_845_G      0x2562
#define PCI_CHIP_I830_M     0x3577
#define PCI_CHIP_I855_GM    0x3582
#define PCI_CHIP_I865_G     0x2572

#define PCI_CHIP_I915_G     0x2582
#define PCI_CHIP_I915_GM    0x2592
#define PCI_CHIP_I945_G     0x2772
#define PCI_CHIP_I945_GM    0x27a2
#define PCI_CHIP_I945_GME   0x27ae

#define PCI_CHIP_G33_G      0x29c2
#define PCI_CHIP_Q35_G      0x29b2
#define PCI_CHIP_Q33_G      0x29d2
428
429
430 /* ================================================================
431 * intel_context.c:
432 */
433
434 extern GLboolean intelInitContext(struct intel_context *intel,
435 const __GLcontextModes * mesaVis,
436 __DRIcontextPrivate * driContextPriv,
437 void *sharedContextPrivate,
438 struct dd_function_table *functions);
439
440 extern void intelGetLock(struct intel_context *intel, GLuint flags);
441
442 extern void intelFinish(GLcontext * ctx);
443 extern void intelFlush(GLcontext * ctx);
444
445 extern void intelInitDriverFunctions(struct dd_function_table *functions);
446
447
448 /* ================================================================
449 * intel_state.c:
450 */
451 extern void intelInitStateFuncs(struct dd_function_table *functions);
452
/* Comparison function codes.
 * NOTE(review): presumably the values returned by
 * intel_translate_compare_func() -- confirm in intel_state.c.
 */
#define COMPAREFUNC_ALWAYS     0x0
#define COMPAREFUNC_NEVER      0x1
#define COMPAREFUNC_LESS       0x2
#define COMPAREFUNC_EQUAL      0x3
#define COMPAREFUNC_LEQUAL     0x4
#define COMPAREFUNC_GREATER    0x5
#define COMPAREFUNC_NOTEQUAL   0x6
#define COMPAREFUNC_GEQUAL     0x7

/* Stencil operation codes. */
#define STENCILOP_KEEP         0x0
#define STENCILOP_ZERO         0x1
#define STENCILOP_REPLACE      0x2
#define STENCILOP_INCRSAT      0x3
#define STENCILOP_DECRSAT      0x4
#define STENCILOP_INCR         0x5
#define STENCILOP_DECR         0x6
#define STENCILOP_INVERT       0x7

/* Logic operation codes. */
#define LOGICOP_CLEAR          0x0
#define LOGICOP_NOR            0x1
#define LOGICOP_AND_INV        0x2
#define LOGICOP_COPY_INV       0x3
#define LOGICOP_AND_RVRSE      0x4
#define LOGICOP_INV            0x5
#define LOGICOP_XOR            0x6
#define LOGICOP_NAND           0x7
#define LOGICOP_AND            0x8
#define LOGICOP_EQUIV          0x9
#define LOGICOP_NOOP           0xa
#define LOGICOP_OR_INV         0xb
#define LOGICOP_COPY           0xc
#define LOGICOP_OR_RVRSE       0xd
#define LOGICOP_OR             0xe
#define LOGICOP_SET            0xf

/* Blend factor codes; BLENDFACT_MASK covers the low four bits. */
#define BLENDFACT_ZERO                0x01
#define BLENDFACT_ONE                 0x02
#define BLENDFACT_SRC_COLR            0x03
#define BLENDFACT_INV_SRC_COLR        0x04
#define BLENDFACT_SRC_ALPHA           0x05
#define BLENDFACT_INV_SRC_ALPHA       0x06
#define BLENDFACT_DST_ALPHA           0x07
#define BLENDFACT_INV_DST_ALPHA       0x08
#define BLENDFACT_DST_COLR            0x09
#define BLENDFACT_INV_DST_COLR        0x0a
#define BLENDFACT_SRC_ALPHA_SATURATE  0x0b
#define BLENDFACT_CONST_COLOR         0x0c
#define BLENDFACT_INV_CONST_COLOR     0x0d
#define BLENDFACT_CONST_ALPHA         0x0e
#define BLENDFACT_INV_CONST_ALPHA     0x0f
#define BLENDFACT_MASK                0x0f
504
/* Buffer-object reuse settings. */
enum {
   DRI_CONF_BO_REUSE_DISABLED = 0,
   DRI_CONF_BO_REUSE_ALL = 1
};
509
510 extern int intel_translate_shadow_compare_func(GLenum func);
511 extern int intel_translate_compare_func(GLenum func);
512 extern int intel_translate_stencil_op(GLenum op);
513 extern int intel_translate_blend_factor(GLenum factor);
514 extern int intel_translate_logic_op(GLenum opcode);
515
516 void intel_viewport(GLcontext * ctx, GLint x, GLint y,
517 GLsizei width, GLsizei height);
518
519 void intel_update_renderbuffers(__DRIcontext *context,
520 __DRIdrawable *drawable);
521
522 /*======================================================================
523 * Inline conversion functions.
524 * These are better-typed than the macros used previously:
525 */
526 static INLINE struct intel_context *
527 intel_context(GLcontext * ctx)
528 {
529 return (struct intel_context *) ctx;
530 }
531
532 #endif