intel: Throttle after doing copyregion/swapbuffers round trip
[mesa.git] / src / mesa / drivers / dri / intel / intel_context.h
1 /**************************************************************************
2 *
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #ifndef INTELCONTEXT_INC
29 #define INTELCONTEXT_INC
30
31
32
33 #include "main/mtypes.h"
34 #include "main/mm.h"
35 #include "texmem.h"
36 #include "dri_metaops.h"
37 #include "drm.h"
38 #include "intel_bufmgr.h"
39
40 #include "intel_screen.h"
41 #include "intel_tex_obj.h"
42 #include "i915_drm.h"
43 #include "tnl/t_vertex.h"
44
45 #define TAG(x) intel##x
46 #include "tnl_dd/t_dd_vertex.h"
47 #undef TAG
48
49 #define DV_PF_555 (1<<8)
50 #define DV_PF_565 (2<<8)
51 #define DV_PF_8888 (3<<8)
52 #define DV_PF_4444 (8<<8)
53 #define DV_PF_1555 (9<<8)
54
55 struct intel_region;
56 struct intel_context;
57
58 typedef void (*intel_tri_func) (struct intel_context *, intelVertex *,
59 intelVertex *, intelVertex *);
60 typedef void (*intel_line_func) (struct intel_context *, intelVertex *,
61 intelVertex *);
62 typedef void (*intel_point_func) (struct intel_context *, intelVertex *);
63
64 /**
65 * Bits for intel->Fallback field
66 */
67 /*@{*/
68 #define INTEL_FALLBACK_DRAW_BUFFER 0x1
69 #define INTEL_FALLBACK_READ_BUFFER 0x2
70 #define INTEL_FALLBACK_DEPTH_BUFFER 0x4
71 #define INTEL_FALLBACK_STENCIL_BUFFER 0x8
72 #define INTEL_FALLBACK_USER 0x10
73 #define INTEL_FALLBACK_RENDERMODE 0x20
74 #define INTEL_FALLBACK_TEXTURE 0x40
75 #define INTEL_FALLBACK_DRIVER 0x1000 /**< first for drivers */
76 /*@}*/
77
78 extern void intelFallback(struct intel_context *intel, GLbitfield bit,
79 GLboolean mode);
80 #define FALLBACK( intel, bit, mode ) intelFallback( intel, bit, mode )
81
82
83 #define INTEL_WRITE_PART 0x1
84 #define INTEL_WRITE_FULL 0x2
85 #define INTEL_READ 0x4
86
87 #define INTEL_MAX_FIXUP 64
88
89 struct intel_sync_object { /* Driver-side sync object: a gl_sync_object plus the buffer object it tracks. */
90 struct gl_sync_object Base; /**< embedded Mesa sync object; NOTE(review): presumably kept as the first member so the two types can be cast to each other -- confirm against the sync-object code */
91
92 /** Batch associated with this sync object */
93 drm_intel_bo *bo;
94 };
95
96 /**
97 * intel_context is derived from Mesa's context class: GLcontext.
 *
 * The GLcontext is embedded as the first member, so a GLcontext pointer
 * can be cast to a struct intel_context pointer (see intel_context()).
 * The remaining members hold the driver hook table (vtbl), batch and
 * primitive bookkeeping, vertex layout, fallback/render state and the
 * DRI handles for this context.
98 */
99 struct intel_context
100 {
101 GLcontext ctx; /**< base class, must be first field */
102
103 struct
104 {
105 void (*destroy) (struct intel_context * intel);
106 void (*emit_state) (struct intel_context * intel);
107 void (*finish_batch) (struct intel_context * intel);
108 void (*new_batch) (struct intel_context * intel);
109 void (*emit_invarient_state) (struct intel_context * intel); /* sic: spelling is part of the identifier */
110 void (*update_texture_state) (struct intel_context * intel);
111
112 void (*render_start) (struct intel_context * intel);
113 void (*render_prevalidate) (struct intel_context * intel);
114 void (*set_draw_region) (struct intel_context * intel,
115 struct intel_region * draw_regions[],
116 struct intel_region * depth_region,
117 GLuint num_regions);
118
119 void (*reduced_primitive_state) (struct intel_context * intel,
120 GLenum rprim);
121
122 GLboolean (*check_vertex_size) (struct intel_context * intel,
123 GLuint expected);
124 void (*invalidate_state) (struct intel_context *intel,
125 GLuint new_state);
126
127 void (*assert_not_dirty) (struct intel_context *intel);
128
129 void (*debug_batch)(struct intel_context *intel);
130 } vtbl; /**< table of driver hooks, each taking the context; NOTE(review): presumably filled in by the chipset-specific backend -- confirm */
131
132 struct dri_metaops meta;
133
134 GLbitfield Fallback; /**< mask of INTEL_FALLBACK_x bits */
135 GLuint NewGLState;
136
137 dri_bufmgr *bufmgr;
138 unsigned int maxBatchSize;
139
140 /**
141 * Generation number of the hardware: 2 is 8xx, 3 is 9xx pre-965, 4 is 965.
142 */
143 int gen;
144 GLboolean needs_ff_sync;
145 GLboolean is_g4x;
146 GLboolean is_945;
147 GLboolean has_luminance_srgb;
148
149 int urb_size;
150
151 struct intel_batchbuffer *batch;
152 drm_intel_bo *first_post_swapbuffers_batch; /**< NOTE(review): presumably the first batch submitted after the most recent swapbuffers, kept for throttling -- confirm in intel_context.c */
153 GLboolean need_throttle; /**< NOTE(review): presumably requests that the driver throttle at its next opportunity -- confirm in intel_context.c */
154 GLboolean no_batch_wrap;
155
156 struct
157 {
158 GLuint id;
159 uint32_t primitive; /**< Current hardware primitive type */
160 void (*flush) (struct intel_context *); /**< called by INTEL_FIREVERTICES() when non-NULL */
161 GLubyte *start_ptr; /**< for i8xx */
162 dri_bo *vb_bo;
163 uint8_t *vb;
164 unsigned int start_offset; /**< Byte offset of primitive sequence */
165 unsigned int current_offset; /**< Byte offset of next vertex */
166 unsigned int count; /**< Number of vertices in current primitive */
167 } prim; /**< bookkeeping for the primitive currently being built (see the field comments) */
168
169 GLuint stats_wm;
170 GLboolean locked;
171 char *prevLockFile; /**< NOTE(review): presumably source file of the previous lock acquisition, for debugging -- confirm */
172 int prevLockLine; /**< NOTE(review): presumably source line matching prevLockFile -- confirm */
173
174 /* Offsets of fields within the current vertex:
175 */
176 GLuint coloroffset;
177 GLuint specoffset;
178 GLuint wpos_offset;
179 GLuint wpos_size;
180
181 struct tnl_attr_map vertex_attrs[VERT_ATTRIB_MAX];
182 GLuint vertex_attr_count;
183
184 GLfloat polygon_offset_scale; /* dependent on depth_scale, bpp */
185
186 GLboolean hw_stencil;
187 GLboolean hw_stipple;
188 GLboolean depth_buffer_is_float;
189 GLboolean no_rast;
190 GLboolean no_hw;
191 GLboolean always_flush_batch;
192 GLboolean always_flush_cache;
193
194 /* 0 - nonconformant, best performance;
195 * 1 - fallback to sw for known conformance bugs
196 * 2 - always fallback to sw
197 */
198 GLuint conformance_mode;
199
200 /* State for intelvb.c and inteltris.c.
201 */
202 GLuint RenderIndex;
203 GLmatrix ViewportMatrix;
204 GLenum render_primitive;
205 GLenum reduced_primitive;
206 GLuint vertex_size;
207 GLubyte *verts; /* points to tnl->clipspace.vertex_buf */
208
209 /* Fallback rasterization functions
210 */
211 intel_point_func draw_point;
212 intel_line_func draw_line;
213 intel_tri_func draw_tri;
214
215 /**
216 * Set if rendering has occurred to the drawable's front buffer.
217 *
218 * This is used in the DRI2 case to detect that glFlush should also copy
219 * the contents of the fake front buffer to the real front buffer.
220 */
221 GLboolean front_buffer_dirty;
222
223 /**
224 * Track whether front-buffer rendering is currently enabled
225 *
226 * A separate flag is used to track this in order to support MRT more
227 * easily.
228 */
229 GLboolean is_front_buffer_rendering;
230 /**
231 * Track whether front-buffer is the current read target.
232 *
233 * This is closely associated with is_front_buffer_rendering, but may
234 * be set separately. The DRI2 fake front buffer must be referenced
235 * either way.
236 */
237 GLboolean is_front_buffer_reading;
238
239 GLboolean use_texture_tiling;
240 GLboolean use_early_z;
241
242 int driFd;
243
244 __DRIcontext *driContext;
245 struct intel_screen *intelScreen;
246 void (*saved_viewport)(GLcontext * ctx,
247 GLint x, GLint y, GLsizei width, GLsizei height); /**< NOTE(review): presumably the viewport hook that was installed before the driver replaced it -- confirm */
248
249 /**
250 * Configuration cache
251 */
252 driOptionCache optionCache;
253 };
254
255 extern char *__progname;
256
257
258 #define SUBPIXEL_X 0.125
259 #define SUBPIXEL_Y 0.125
260
/**
 * Number of elements in a true array.
 *
 * Only valid for objects of array type; a pointer (including an array
 * function parameter, which decays to a pointer) gives a meaningless result.
 */
#define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0]))

/**
 * Round \c value up to the next multiple of \c alignment.
 *
 * \c alignment must be a power of two.  Both arguments are parenthesized
 * in the expansion so compound expressions such as ALIGN(n, 2 << 1) are
 * grouped as the caller wrote them.  \c alignment is evaluated twice, so
 * it must not have side effects.
 */
#define ALIGN(value, alignment) \
   (((value) + (alignment) - 1) & ~((alignment) - 1))

/**
 * True when \c val has at most one bit set.
 *
 * Note that 0 is reported as a power of two.  \c val is evaluated twice,
 * so it must not have side effects.
 */
#define IS_POWER_OF_TWO(val) (((val) & ((val) - 1)) == 0)
264
/**
 * Convert \c value to unsigned fixed point with \c frac_bits fractional bits.
 *
 * The input is scaled by 2^frac_bits; a negative product is clamped to 0,
 * anything else is converted to uint32_t (the fraction is discarded by the
 * float-to-integer conversion).
 */
static INLINE uint32_t
U_FIXED(float value, uint32_t frac_bits)
{
   const float scaled = value * (1 << frac_bits);

   if (scaled < 0)
      return 0;

   return scaled;
}
271
/**
 * Convert \c value to signed fixed point with \c frac_bits fractional bits.
 *
 * The input is scaled by 2^frac_bits and truncated toward zero.  The result
 * is returned in a uint32_t holding the two's-complement bit pattern, so a
 * negative input such as -1.0 with 4 fractional bits yields 0xFFFFFFF0.
 */
static INLINE uint32_t
S_FIXED(float value, uint32_t frac_bits)
{
   /* Converting a negative float directly to an unsigned type is undefined
    * behaviour in C.  Convert to int32_t first; the int32_t -> uint32_t
    * conversion on return is well defined (modulo 2^32).
    */
   return (int32_t)(value * (1 << frac_bits));
}
277
/**
 * Call intel->prim.flush(intel) when that hook is non-NULL; otherwise do
 * nothing.  Expands to a single statement.  \c intel is evaluated more
 * than once, so pass an expression without side effects.
 */
#define INTEL_FIREVERTICES(intel)               \
   do {                                         \
      if (!(intel)->prim.flush)                 \
         break;                                 \
      (intel)->prim.flush(intel);               \
   } while (0)
283
284 /* ================================================================
285 * From linux kernel i386 header files, copes with odd sizes better
286 * than COPY_DWORDS would:
287 * XXX Put this in src/mesa/main/imports.h ???
 *
 * Copies n bytes from `from` to `to` and returns `to`.  On i386 the bulk
 * is moved as n/4 32-bit words, then bit 1 and bit 0 of n select a
 * trailing 2-byte and 1-byte move.  On every other target __memcpy is
 * simply a macro for memcpy().
288 */
289 #if defined(i386) || defined(__i386__) /* hand-written string-move version, 32-bit x86 only */
290 static INLINE void * __memcpy(void * to, const void * from, size_t n)
291 {
292 int d0, d1, d2; /* dummy outputs: tell the compiler that ecx/edi/esi are modified by the asm */
293 __asm__ __volatile__(
294 "rep ; movsl\n\t" /* copy ecx (= n/4) dwords from [esi] to [edi] */
295 "testb $2,%b4\n\t" /* operand 4 is n: is bit 1 set (2 leftover bytes)? */
296 "je 1f\n\t"
297 "movsw\n" /* copy one 16-bit word */
298 "1:\ttestb $1,%b4\n\t" /* is bit 0 of n set (1 leftover byte)? */
299 "je 2f\n\t"
300 "movsb\n" /* copy the final byte */
301 "2:"
302 : "=&c" (d0), "=&D" (d1), "=&S" (d2) /* outputs: ecx, edi, esi (early-clobber) */
303 :"0" (n/4), "q" (n),"1" ((long) to),"2" ((long) from) /* inputs: ecx = n/4, n in a byte-addressable register, edi = to, esi = from */
304 : "memory"); /* the asm writes memory the compiler cannot see */
305 return (to);
306 }
307 #else /* not i386: defer to the C library */
308 #define __memcpy(a,b,c) memcpy(a,b,c)
309 #endif
310
311
312 /* ================================================================
313 * Debugging:
314 */
315 extern int INTEL_DEBUG;
316
317 #define DEBUG_TEXTURE 0x1
318 #define DEBUG_STATE 0x2
319 #define DEBUG_IOCTL 0x4
320 #define DEBUG_BLIT 0x8
321 #define DEBUG_MIPTREE 0x10
322 #define DEBUG_FALLBACKS 0x20
323 #define DEBUG_VERBOSE 0x40
324 #define DEBUG_BATCH 0x80
325 #define DEBUG_PIXEL 0x100
326 #define DEBUG_BUFMGR 0x200
327 #define DEBUG_REGION 0x400
328 #define DEBUG_FBO 0x800
329 #define DEBUG_GS 0x1000
330 #define DEBUG_SYNC 0x2000
331 #define DEBUG_PRIMS 0x4000
332 #define DEBUG_VERTS 0x8000
333 #define DEBUG_DRI 0x10000
334 #define DEBUG_SF 0x20000
335 #define DEBUG_SANITY 0x40000
336 #define DEBUG_SLEEP 0x80000
337 #define DEBUG_STATS 0x100000
338 #define DEBUG_TILE 0x200000
339 #define DEBUG_SINGLE_THREAD 0x400000
340 #define DEBUG_WM 0x800000
341 #define DEBUG_URB 0x1000000
342 #define DEBUG_VS 0x2000000
343 #define DEBUG_GLSL_FORCE 0x4000000
344 #define DEBUG_CLIP 0x8000000
345
346 #define DBG(...) do { \
347 if (INTEL_DEBUG & FILE_DEBUG_FLAG) \
348 printf(__VA_ARGS__); \
349 } while(0)
350
351 #define PCI_CHIP_845_G 0x2562
352 #define PCI_CHIP_I830_M 0x3577
353 #define PCI_CHIP_I855_GM 0x3582
354 #define PCI_CHIP_I865_G 0x2572
355 #define PCI_CHIP_I915_G 0x2582
356 #define PCI_CHIP_I915_GM 0x2592
357 #define PCI_CHIP_I945_G 0x2772
358 #define PCI_CHIP_I945_GM 0x27A2
359 #define PCI_CHIP_I945_GME 0x27AE
360 #define PCI_CHIP_G33_G 0x29C2
361 #define PCI_CHIP_Q35_G 0x29B2
362 #define PCI_CHIP_Q33_G 0x29D2
363
364
365 /* ================================================================
366 * intel_context.c:
367 */
368
369 extern GLboolean intelInitContext(struct intel_context *intel,
370 int api,
371 const __GLcontextModes * mesaVis,
372 __DRIcontext * driContextPriv,
373 void *sharedContextPrivate,
374 struct dd_function_table *functions);
375
376 extern void intelFinish(GLcontext * ctx);
377 extern void intel_flush(GLcontext * ctx);
378
379 extern void intelInitDriverFunctions(struct dd_function_table *functions);
380
381 void intel_init_syncobj_functions(struct dd_function_table *functions);
382
383
384 /* ================================================================
385 * intel_state.c:
386 */
387 extern void intelInitStateFuncs(struct dd_function_table *functions);
388
389 #define COMPAREFUNC_ALWAYS 0
390 #define COMPAREFUNC_NEVER 0x1
391 #define COMPAREFUNC_LESS 0x2
392 #define COMPAREFUNC_EQUAL 0x3
393 #define COMPAREFUNC_LEQUAL 0x4
394 #define COMPAREFUNC_GREATER 0x5
395 #define COMPAREFUNC_NOTEQUAL 0x6
396 #define COMPAREFUNC_GEQUAL 0x7
397
398 #define STENCILOP_KEEP 0
399 #define STENCILOP_ZERO 0x1
400 #define STENCILOP_REPLACE 0x2
401 #define STENCILOP_INCRSAT 0x3
402 #define STENCILOP_DECRSAT 0x4
403 #define STENCILOP_INCR 0x5
404 #define STENCILOP_DECR 0x6
405 #define STENCILOP_INVERT 0x7
406
407 #define LOGICOP_CLEAR 0
408 #define LOGICOP_NOR 0x1
409 #define LOGICOP_AND_INV 0x2
410 #define LOGICOP_COPY_INV 0x3
411 #define LOGICOP_AND_RVRSE 0x4
412 #define LOGICOP_INV 0x5
413 #define LOGICOP_XOR 0x6
414 #define LOGICOP_NAND 0x7
415 #define LOGICOP_AND 0x8
416 #define LOGICOP_EQUIV 0x9
417 #define LOGICOP_NOOP 0xa
418 #define LOGICOP_OR_INV 0xb
419 #define LOGICOP_COPY 0xc
420 #define LOGICOP_OR_RVRSE 0xd
421 #define LOGICOP_OR 0xe
422 #define LOGICOP_SET 0xf
423
424 #define BLENDFACT_ZERO 0x01
425 #define BLENDFACT_ONE 0x02
426 #define BLENDFACT_SRC_COLR 0x03
427 #define BLENDFACT_INV_SRC_COLR 0x04
428 #define BLENDFACT_SRC_ALPHA 0x05
429 #define BLENDFACT_INV_SRC_ALPHA 0x06
430 #define BLENDFACT_DST_ALPHA 0x07
431 #define BLENDFACT_INV_DST_ALPHA 0x08
432 #define BLENDFACT_DST_COLR 0x09
433 #define BLENDFACT_INV_DST_COLR 0x0a
434 #define BLENDFACT_SRC_ALPHA_SATURATE 0x0b
435 #define BLENDFACT_CONST_COLOR 0x0c
436 #define BLENDFACT_INV_CONST_COLOR 0x0d
437 #define BLENDFACT_CONST_ALPHA 0x0e
438 #define BLENDFACT_INV_CONST_ALPHA 0x0f
439 #define BLENDFACT_MASK 0x0f
440
441 enum {
442 DRI_CONF_BO_REUSE_DISABLED,
443 DRI_CONF_BO_REUSE_ALL
444 };
445
446 extern int intel_translate_shadow_compare_func(GLenum func);
447 extern int intel_translate_compare_func(GLenum func);
448 extern int intel_translate_stencil_op(GLenum op);
449 extern int intel_translate_blend_factor(GLenum factor);
450 extern int intel_translate_logic_op(GLenum opcode);
451
452 void intel_update_renderbuffers(__DRIcontext *context,
453 __DRIdrawable *drawable);
454 void intel_prepare_render(struct intel_context *intel);
455
456 void i915_set_buf_info_for_region(uint32_t *state, struct intel_region *region,
457 uint32_t buffer_id);
458
459 /*======================================================================
460 * Inline conversion functions.
461 * These are better-typed than the macros used previously:
462 */
463 static INLINE struct intel_context *
464 intel_context(GLcontext * ctx)
465 {
466 return (struct intel_context *) ctx;
467 }
468
/**
 * Report whether \c value has at most one bit set.
 *
 * Clearing the lowest set bit (value & (value - 1)) leaves zero exactly
 * when no other bit was set.  Note that 0 is therefore also reported as a
 * power of two.
 */
static INLINE GLboolean
is_power_of_two(uint32_t value)
{
   const uint32_t lowest_bit_cleared = value & (value - 1);

   return lowest_bit_cleared == 0;
}
474
475 #endif