i965: Enable ES 3.2 on Skylake.
[mesa.git] src/mesa/drivers/dri/i965/intel_screen.c
/*
 * Copyright 2003 VMware, Inc.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */

#include <errno.h>
#include <time.h>
#include <unistd.h>
#include "main/context.h"
#include "main/framebuffer.h"
#include "main/renderbuffer.h"
#include "main/texobj.h"
#include "main/hash.h"
#include "main/fbobject.h"
#include "main/version.h"
#include "swrast/s_renderbuffer.h"
#include "util/ralloc.h"
#include "brw_shader.h"
#include "compiler/nir/nir.h"

#include "utils.h"
#include "xmlpool.h"

static const __DRIconfigOptionsExtension brw_config_options = {
   .base = { __DRI_CONFIG_OPTIONS, 1 },
   .xml =
DRI_CONF_BEGIN
   DRI_CONF_SECTION_PERFORMANCE
      DRI_CONF_VBLANK_MODE(DRI_CONF_VBLANK_ALWAYS_SYNC)
      /* Options correspond to DRI_CONF_BO_REUSE_DISABLED,
       * DRI_CONF_BO_REUSE_ALL
       */
      DRI_CONF_OPT_BEGIN_V(bo_reuse, enum, 1, "0:1")
         DRI_CONF_DESC_BEGIN(en, "Buffer object reuse")
            DRI_CONF_ENUM(0, "Disable buffer object reuse")
            DRI_CONF_ENUM(1, "Enable reuse of all sizes of buffer objects")
         DRI_CONF_DESC_END
      DRI_CONF_OPT_END

      DRI_CONF_OPT_BEGIN_B(hiz, "true")
         DRI_CONF_DESC(en, "Enable Hierarchical Z on gen6+")
      DRI_CONF_OPT_END
   DRI_CONF_SECTION_END

   DRI_CONF_SECTION_QUALITY
      DRI_CONF_FORCE_S3TC_ENABLE("false")

      DRI_CONF_PRECISE_TRIG("false")

      DRI_CONF_OPT_BEGIN(clamp_max_samples, int, -1)
         DRI_CONF_DESC(en, "Clamp the value of GL_MAX_SAMPLES to the "
                       "given integer. If negative, then do not clamp.")
      DRI_CONF_OPT_END
   DRI_CONF_SECTION_END

   DRI_CONF_SECTION_DEBUG
      DRI_CONF_NO_RAST("false")
      DRI_CONF_ALWAYS_FLUSH_BATCH("false")
      DRI_CONF_ALWAYS_FLUSH_CACHE("false")
      DRI_CONF_DISABLE_THROTTLING("false")
      DRI_CONF_FORCE_GLSL_EXTENSIONS_WARN("false")
      DRI_CONF_DISABLE_GLSL_LINE_CONTINUATIONS("false")
      DRI_CONF_DISABLE_BLEND_FUNC_EXTENDED("false")
      DRI_CONF_DUAL_COLOR_BLEND_BY_LOCATION("false")
      DRI_CONF_ALLOW_GLSL_EXTENSION_DIRECTIVE_MIDSHADER("false")

      DRI_CONF_OPT_BEGIN_B(shader_precompile, "true")
         DRI_CONF_DESC(en, "Perform code generation at shader link time.")
      DRI_CONF_OPT_END
   DRI_CONF_SECTION_END

   DRI_CONF_SECTION_MISCELLANEOUS
      DRI_CONF_GLSL_ZERO_INIT("false")
   DRI_CONF_SECTION_END
DRI_CONF_END
};
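
/* Note: these option defaults can be overridden at run time per user or per
 * application through driconf (e.g. ~/.drirc).
 */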

#include "intel_batchbuffer.h"
#include "intel_buffers.h"
#include "intel_bufmgr.h"
#include "intel_fbo.h"
#include "intel_mipmap_tree.h"
#include "intel_screen.h"
#include "intel_tex.h"
#include "intel_image.h"

#include "brw_context.h"

#include "i915_drm.h"

/**
 * For debugging purposes, this returns a time in seconds.
 */
double
get_time(void)
{
   struct timespec tp;

   clock_gettime(CLOCK_MONOTONIC, &tp);

   return tp.tv_sec + tp.tv_nsec / 1000000000.0;
}

void
aub_dump_bmp(struct gl_context *ctx)
{
   struct gl_framebuffer *fb = ctx->DrawBuffer;

   for (unsigned i = 0; i < fb->_NumColorDrawBuffers; i++) {
      struct intel_renderbuffer *irb =
         intel_renderbuffer(fb->_ColorDrawBuffers[i]);

      if (irb && irb->mt) {
         enum aub_dump_bmp_format format;

         switch (irb->Base.Base.Format) {
         case MESA_FORMAT_B8G8R8A8_UNORM:
         case MESA_FORMAT_B8G8R8X8_UNORM:
            format = AUB_DUMP_BMP_FORMAT_ARGB_8888;
            break;
         default:
            continue;
         }

         drm_intel_gem_bo_aub_dump_bmp(irb->mt->bo,
                                       irb->draw_x,
                                       irb->draw_y,
                                       irb->Base.Base.Width,
                                       irb->Base.Base.Height,
                                       format,
                                       irb->mt->pitch,
                                       0);
      }
   }
}

static const __DRItexBufferExtension intelTexBufferExtension = {
   .base = { __DRI_TEX_BUFFER, 3 },

   .setTexBuffer = intelSetTexBuffer,
   .setTexBuffer2 = intelSetTexBuffer2,
   .releaseTexBuffer = NULL,
};

static void
intel_dri2_flush_with_flags(__DRIcontext *cPriv,
                            __DRIdrawable *dPriv,
                            unsigned flags,
                            enum __DRI2throttleReason reason)
{
   struct brw_context *brw = cPriv->driverPrivate;

   if (!brw)
      return;

   struct gl_context *ctx = &brw->ctx;

   FLUSH_VERTICES(ctx, 0);

   if (flags & __DRI2_FLUSH_DRAWABLE)
      intel_resolve_for_dri2_flush(brw, dPriv);

   if (reason == __DRI2_THROTTLE_SWAPBUFFER)
      brw->need_swap_throttle = true;
   if (reason == __DRI2_THROTTLE_FLUSHFRONT)
      brw->need_flush_throttle = true;

   intel_batchbuffer_flush(brw);

   if (INTEL_DEBUG & DEBUG_AUB) {
      aub_dump_bmp(ctx);
   }
}

/**
 * Provides compatibility with loaders that only support the older (version
 * 1-3) flush interface.
 *
 * That includes libGL up to Mesa 9.0, and the X Server at least up to 1.13.
 */
static void
intel_dri2_flush(__DRIdrawable *drawable)
{
   intel_dri2_flush_with_flags(drawable->driContextPriv, drawable,
                               __DRI2_FLUSH_DRAWABLE,
                               __DRI2_THROTTLE_SWAPBUFFER);
}

static const struct __DRI2flushExtensionRec intelFlushExtension = {
   .base = { __DRI2_FLUSH, 4 },

   .flush = intel_dri2_flush,
   .invalidate = dri2InvalidateDrawable,
   .flush_with_flags = intel_dri2_flush_with_flags,
};

static struct intel_image_format intel_image_formats[] = {
   { __DRI_IMAGE_FOURCC_ARGB8888, __DRI_IMAGE_COMPONENTS_RGBA, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_ARGB8888, 4 } } },

   { __DRI_IMAGE_FOURCC_ABGR8888, __DRI_IMAGE_COMPONENTS_RGBA, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_ABGR8888, 4 } } },

   { __DRI_IMAGE_FOURCC_SARGB8888, __DRI_IMAGE_COMPONENTS_RGBA, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_SARGB8, 4 } } },

   { __DRI_IMAGE_FOURCC_XRGB8888, __DRI_IMAGE_COMPONENTS_RGB, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_XRGB8888, 4 }, } },

   { __DRI_IMAGE_FOURCC_XBGR8888, __DRI_IMAGE_COMPONENTS_RGB, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_XBGR8888, 4 }, } },

   { __DRI_IMAGE_FOURCC_RGB565, __DRI_IMAGE_COMPONENTS_RGB, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_RGB565, 2 } } },

   { __DRI_IMAGE_FOURCC_R8, __DRI_IMAGE_COMPONENTS_R, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 }, } },

   { __DRI_IMAGE_FOURCC_GR88, __DRI_IMAGE_COMPONENTS_RG, 1,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_GR88, 2 }, } },

   { __DRI_IMAGE_FOURCC_YUV410, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 2, 2, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 2, 2, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YUV411, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 2, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 2, 0, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YUV420, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 1, 1, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 1, 1, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YUV422, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 1, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 1, 0, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YUV444, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YVU410, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 2, 2, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 2, 2, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YVU411, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 2, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 2, 0, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YVU420, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 1, 1, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 1, 1, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YVU422, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 1, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 1, 0, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_YVU444, __DRI_IMAGE_COMPONENTS_Y_U_V, 3,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 2, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 } } },

   { __DRI_IMAGE_FOURCC_NV12, __DRI_IMAGE_COMPONENTS_Y_UV, 2,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 1, 1, __DRI_IMAGE_FORMAT_GR88, 2 } } },

   { __DRI_IMAGE_FOURCC_NV16, __DRI_IMAGE_COMPONENTS_Y_UV, 2,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_R8, 1 },
       { 1, 1, 0, __DRI_IMAGE_FORMAT_GR88, 2 } } },

   /* For YUYV buffers, we set up two overlapping DRI images and treat
    * them as planar buffers in the compositors.  Plane 0 is GR88 and
    * samples YU or YV pairs and places Y into the R component, while
    * plane 1 is ARGB and samples YUYV clusters, placing U into the G
    * component and V into A.  This lets the texture sampler interpolate
    * the Y components correctly when sampling from plane 0, and
    * interpolate U and V correctly when sampling from plane 1. */
   { __DRI_IMAGE_FOURCC_YUYV, __DRI_IMAGE_COMPONENTS_Y_XUXV, 2,
     { { 0, 0, 0, __DRI_IMAGE_FORMAT_GR88, 2 },
       { 0, 1, 0, __DRI_IMAGE_FORMAT_ARGB8888, 4 } } }
};

static void
intel_image_warn_if_unaligned(__DRIimage *image, const char *func)
{
   uint32_t tiling, swizzle;
   drm_intel_bo_get_tiling(image->bo, &tiling, &swizzle);

   if (tiling != I915_TILING_NONE && (image->offset & 0xfff)) {
      _mesa_warning(NULL, "%s: offset 0x%08x not on tile boundary",
                    func, image->offset);
   }
}

static struct intel_image_format *
intel_image_format_lookup(int fourcc)
{
   struct intel_image_format *f = NULL;

   for (unsigned i = 0; i < ARRAY_SIZE(intel_image_formats); i++) {
      if (intel_image_formats[i].fourcc == fourcc) {
         f = &intel_image_formats[i];
         break;
      }
   }

   return f;
}

static boolean intel_lookup_fourcc(int dri_format, int *fourcc)
{
   for (unsigned i = 0; i < ARRAY_SIZE(intel_image_formats); i++) {
      if (intel_image_formats[i].planes[0].dri_format == dri_format) {
         *fourcc = intel_image_formats[i].fourcc;
         return true;
      }
   }
   return false;
}

static __DRIimage *
intel_allocate_image(int dri_format, void *loaderPrivate)
{
   __DRIimage *image;

   image = calloc(1, sizeof *image);
   if (image == NULL)
      return NULL;

   image->dri_format = dri_format;
   image->offset = 0;

   image->format = driImageFormatToGLFormat(dri_format);
   if (dri_format != __DRI_IMAGE_FORMAT_NONE &&
       image->format == MESA_FORMAT_NONE) {
      free(image);
      return NULL;
   }

   image->internal_format = _mesa_get_format_base_format(image->format);
   image->data = loaderPrivate;

   return image;
}

/**
 * Sets up a DRIImage structure to point to a slice out of a miptree.
 */
static void
intel_setup_image_from_mipmap_tree(struct brw_context *brw, __DRIimage *image,
                                   struct intel_mipmap_tree *mt, GLuint level,
                                   GLuint zoffset)
{
   intel_miptree_make_shareable(brw, mt);

   intel_miptree_check_level_layer(mt, level, zoffset);

   image->width = minify(mt->physical_width0, level - mt->first_level);
   image->height = minify(mt->physical_height0, level - mt->first_level);
   image->pitch = mt->pitch;

   image->offset = intel_miptree_get_tile_offsets(mt, level, zoffset,
                                                  &image->tile_x,
                                                  &image->tile_y);

   drm_intel_bo_unreference(image->bo);
   image->bo = mt->bo;
   drm_intel_bo_reference(mt->bo);
}

static __DRIimage *
intel_create_image_from_name(__DRIscreen *dri_screen,
                             int width, int height, int format,
                             int name, int pitch, void *loaderPrivate)
{
   struct intel_screen *screen = dri_screen->driverPrivate;
   __DRIimage *image;
   int cpp;

   image = intel_allocate_image(format, loaderPrivate);
   if (image == NULL)
      return NULL;

   if (image->format == MESA_FORMAT_NONE)
      cpp = 1;
   else
      cpp = _mesa_get_format_bytes(image->format);

   image->width = width;
   image->height = height;
   image->pitch = pitch * cpp;
   image->bo = drm_intel_bo_gem_create_from_name(screen->bufmgr, "image",
                                                 name);
   if (!image->bo) {
      free(image);
      return NULL;
   }

   return image;
}

static __DRIimage *
intel_create_image_from_renderbuffer(__DRIcontext *context,
                                     int renderbuffer, void *loaderPrivate)
{
   __DRIimage *image;
   struct brw_context *brw = context->driverPrivate;
   struct gl_context *ctx = &brw->ctx;
   struct gl_renderbuffer *rb;
   struct intel_renderbuffer *irb;

   rb = _mesa_lookup_renderbuffer(ctx, renderbuffer);
   if (!rb) {
      _mesa_error(ctx, GL_INVALID_OPERATION, "glRenderbufferExternalMESA");
      return NULL;
   }

   irb = intel_renderbuffer(rb);
   intel_miptree_make_shareable(brw, irb->mt);
   image = calloc(1, sizeof *image);
   if (image == NULL)
      return NULL;

   image->internal_format = rb->InternalFormat;
   image->format = rb->Format;
   image->offset = 0;
   image->data = loaderPrivate;
   drm_intel_bo_unreference(image->bo);
   image->bo = irb->mt->bo;
   drm_intel_bo_reference(irb->mt->bo);
   image->width = rb->Width;
   image->height = rb->Height;
   image->pitch = irb->mt->pitch;
   image->dri_format = driGLFormatToImageFormat(image->format);
   image->has_depthstencil = irb->mt->stencil_mt ? true : false;

   rb->NeedsFinishRenderTexture = true;
   return image;
}

static __DRIimage *
intel_create_image_from_texture(__DRIcontext *context, int target,
                                unsigned texture, int zoffset,
                                int level,
                                unsigned *error,
                                void *loaderPrivate)
{
   __DRIimage *image;
   struct brw_context *brw = context->driverPrivate;
   struct gl_texture_object *obj;
   struct intel_texture_object *iobj;
   GLuint face = 0;

   obj = _mesa_lookup_texture(&brw->ctx, texture);
   if (!obj || obj->Target != target) {
      *error = __DRI_IMAGE_ERROR_BAD_PARAMETER;
      return NULL;
   }

   if (target == GL_TEXTURE_CUBE_MAP)
      face = zoffset;

   _mesa_test_texobj_completeness(&brw->ctx, obj);
   iobj = intel_texture_object(obj);
   if (!obj->_BaseComplete || (level > 0 && !obj->_MipmapComplete)) {
      *error = __DRI_IMAGE_ERROR_BAD_PARAMETER;
      return NULL;
   }

   if (level < obj->BaseLevel || level > obj->_MaxLevel) {
      *error = __DRI_IMAGE_ERROR_BAD_MATCH;
      return NULL;
   }

   if (target == GL_TEXTURE_3D && obj->Image[face][level]->Depth < zoffset) {
      *error = __DRI_IMAGE_ERROR_BAD_MATCH;
      return NULL;
   }
   image = calloc(1, sizeof *image);
   if (image == NULL) {
      *error = __DRI_IMAGE_ERROR_BAD_ALLOC;
      return NULL;
   }

   image->internal_format = obj->Image[face][level]->InternalFormat;
   image->format = obj->Image[face][level]->TexFormat;
   image->data = loaderPrivate;
   intel_setup_image_from_mipmap_tree(brw, image, iobj->mt, level, zoffset);
   image->dri_format = driGLFormatToImageFormat(image->format);
   image->has_depthstencil = iobj->mt->stencil_mt ? true : false;
   /* driGLFormatToImageFormat() returns __DRI_IMAGE_FORMAT_NONE (not
    * MESA_FORMAT_NONE) for unsupported formats, so compare against that.
    */
   if (image->dri_format == __DRI_IMAGE_FORMAT_NONE) {
      *error = __DRI_IMAGE_ERROR_BAD_PARAMETER;
      free(image);
      return NULL;
   }

   *error = __DRI_IMAGE_ERROR_SUCCESS;
   return image;
}

static void
intel_destroy_image(__DRIimage *image)
{
   drm_intel_bo_unreference(image->bo);
   free(image);
}

static __DRIimage *
intel_create_image(__DRIscreen *dri_screen,
                   int width, int height, int format,
                   unsigned int use,
                   void *loaderPrivate)
{
   __DRIimage *image;
   struct intel_screen *screen = dri_screen->driverPrivate;
   uint32_t tiling;
   int cpp;
   unsigned long pitch;

   tiling = I915_TILING_X;
   if (use & __DRI_IMAGE_USE_CURSOR) {
      if (width != 64 || height != 64)
         return NULL;
      tiling = I915_TILING_NONE;
   }

   if (use & __DRI_IMAGE_USE_LINEAR)
      tiling = I915_TILING_NONE;

   image = intel_allocate_image(format, loaderPrivate);
   if (image == NULL)
      return NULL;

   cpp = _mesa_get_format_bytes(image->format);
   image->bo = drm_intel_bo_alloc_tiled(screen->bufmgr, "image",
                                        width, height, cpp, &tiling,
                                        &pitch, 0);
   if (image->bo == NULL) {
      free(image);
      return NULL;
   }
   image->width = width;
   image->height = height;
   image->pitch = pitch;

   return image;
}

static GLboolean
intel_query_image(__DRIimage *image, int attrib, int *value)
{
   switch (attrib) {
   case __DRI_IMAGE_ATTRIB_STRIDE:
      *value = image->pitch;
      return true;
   case __DRI_IMAGE_ATTRIB_HANDLE:
      *value = image->bo->handle;
      return true;
   case __DRI_IMAGE_ATTRIB_NAME:
      return !drm_intel_bo_flink(image->bo, (uint32_t *) value);
   case __DRI_IMAGE_ATTRIB_FORMAT:
      *value = image->dri_format;
      return true;
   case __DRI_IMAGE_ATTRIB_WIDTH:
      *value = image->width;
      return true;
   case __DRI_IMAGE_ATTRIB_HEIGHT:
      *value = image->height;
      return true;
   case __DRI_IMAGE_ATTRIB_COMPONENTS:
      if (image->planar_format == NULL)
         return false;
      *value = image->planar_format->components;
      return true;
   case __DRI_IMAGE_ATTRIB_FD:
      return !drm_intel_bo_gem_export_to_prime(image->bo, value);
   case __DRI_IMAGE_ATTRIB_FOURCC:
      return intel_lookup_fourcc(image->dri_format, value);
   case __DRI_IMAGE_ATTRIB_NUM_PLANES:
      *value = 1;
      return true;
   case __DRI_IMAGE_ATTRIB_OFFSET:
      *value = image->offset;
      return true;

   default:
      return false;
   }
}

static __DRIimage *
intel_dup_image(__DRIimage *orig_image, void *loaderPrivate)
{
   __DRIimage *image;

   image = calloc(1, sizeof *image);
   if (image == NULL)
      return NULL;

   drm_intel_bo_reference(orig_image->bo);
   image->bo = orig_image->bo;
   image->internal_format = orig_image->internal_format;
   image->planar_format = orig_image->planar_format;
   image->dri_format = orig_image->dri_format;
   image->format = orig_image->format;
   image->offset = orig_image->offset;
   image->width = orig_image->width;
   image->height = orig_image->height;
   image->pitch = orig_image->pitch;
   image->tile_x = orig_image->tile_x;
   image->tile_y = orig_image->tile_y;
   image->has_depthstencil = orig_image->has_depthstencil;
   image->data = loaderPrivate;

   memcpy(image->strides, orig_image->strides, sizeof(image->strides));
   memcpy(image->offsets, orig_image->offsets, sizeof(image->offsets));

   return image;
}

static GLboolean
intel_validate_usage(__DRIimage *image, unsigned int use)
{
   if (use & __DRI_IMAGE_USE_CURSOR) {
      if (image->width != 64 || image->height != 64)
         return GL_FALSE;
   }

   return GL_TRUE;
}

static __DRIimage *
intel_create_image_from_names(__DRIscreen *dri_screen,
                              int width, int height, int fourcc,
                              int *names, int num_names,
                              int *strides, int *offsets,
                              void *loaderPrivate)
{
   struct intel_image_format *f = NULL;
   __DRIimage *image;
   int i, index;

   if (dri_screen == NULL || names == NULL || num_names != 1)
      return NULL;

   f = intel_image_format_lookup(fourcc);
   if (f == NULL)
      return NULL;

   image = intel_create_image_from_name(dri_screen, width, height,
                                        __DRI_IMAGE_FORMAT_NONE,
                                        names[0], strides[0],
                                        loaderPrivate);

   if (image == NULL)
      return NULL;

   image->planar_format = f;
   for (i = 0; i < f->nplanes; i++) {
      index = f->planes[i].buffer_index;
      image->offsets[index] = offsets[index];
      image->strides[index] = strides[index];
   }

   return image;
}

static __DRIimage *
intel_create_image_from_fds(__DRIscreen *dri_screen,
                            int width, int height, int fourcc,
                            int *fds, int num_fds, int *strides, int *offsets,
                            void *loaderPrivate)
{
   struct intel_screen *screen = dri_screen->driverPrivate;
   struct intel_image_format *f;
   __DRIimage *image;
   int i, index;

   if (fds == NULL || num_fds < 1)
      return NULL;

   /* We only support all planes from the same bo */
   for (i = 0; i < num_fds; i++)
      if (fds[0] != fds[i])
         return NULL;

   f = intel_image_format_lookup(fourcc);
   if (f == NULL)
      return NULL;

   if (f->nplanes == 1)
      image = intel_allocate_image(f->planes[0].dri_format, loaderPrivate);
   else
      image = intel_allocate_image(__DRI_IMAGE_FORMAT_NONE, loaderPrivate);

   if (image == NULL)
      return NULL;

   image->width = width;
   image->height = height;
   image->pitch = strides[0];

   image->planar_format = f;
   int size = 0;
   for (i = 0; i < f->nplanes; i++) {
      index = f->planes[i].buffer_index;
      image->offsets[index] = offsets[index];
      image->strides[index] = strides[index];

      const int plane_height = height >> f->planes[i].height_shift;
      const int end = offsets[index] + plane_height * strides[index];
      if (size < end)
         size = end;
   }

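   /* Worked example (hypothetical numbers): importing a 256x256 NV12
    * buffer with strides {256, 256} and offsets {0, 65536} gives
    *    plane 0: end = 0 + 256 * 256     = 65536
    *    plane 1: end = 65536 + 128 * 256 = 98304   (UV height_shift == 1)
    * so the underlying bo must be at least 98304 bytes.
    */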
   image->bo = drm_intel_bo_gem_create_from_prime(screen->bufmgr,
                                                  fds[0], size);
   if (image->bo == NULL) {
      free(image);
      return NULL;
   }

   if (f->nplanes == 1) {
      image->offset = image->offsets[0];
      intel_image_warn_if_unaligned(image, __func__);
   }

   return image;
}

static __DRIimage *
intel_create_image_from_dma_bufs(__DRIscreen *dri_screen,
                                 int width, int height, int fourcc,
                                 int *fds, int num_fds,
                                 int *strides, int *offsets,
                                 enum __DRIYUVColorSpace yuv_color_space,
                                 enum __DRISampleRange sample_range,
                                 enum __DRIChromaSiting horizontal_siting,
                                 enum __DRIChromaSiting vertical_siting,
                                 unsigned *error,
                                 void *loaderPrivate)
{
   __DRIimage *image;
   struct intel_image_format *f = intel_image_format_lookup(fourcc);

   if (!f) {
      *error = __DRI_IMAGE_ERROR_BAD_MATCH;
      return NULL;
   }

   image = intel_create_image_from_fds(dri_screen, width, height, fourcc, fds,
                                       num_fds, strides, offsets,
                                       loaderPrivate);

   /*
    * Invalid parameters and any inconsistencies between them are assumed to
    * be checked by the caller. Therefore, apart from unsupported formats,
    * creation can only fail on allocation.
    */
   if (!image) {
      *error = __DRI_IMAGE_ERROR_BAD_ALLOC;
      return NULL;
   }

   image->dma_buf_imported = true;
   image->yuv_color_space = yuv_color_space;
   image->sample_range = sample_range;
   image->horizontal_siting = horizontal_siting;
   image->vertical_siting = vertical_siting;

   *error = __DRI_IMAGE_ERROR_SUCCESS;
   return image;
}

static __DRIimage *
intel_from_planar(__DRIimage *parent, int plane, void *loaderPrivate)
{
   int width, height, offset, stride, dri_format, index;
   struct intel_image_format *f;
   __DRIimage *image;

   if (parent == NULL || parent->planar_format == NULL)
      return NULL;

   f = parent->planar_format;

   if (plane >= f->nplanes)
      return NULL;

   width = parent->width >> f->planes[plane].width_shift;
   height = parent->height >> f->planes[plane].height_shift;
   dri_format = f->planes[plane].dri_format;
   index = f->planes[plane].buffer_index;
   offset = parent->offsets[index];
   stride = parent->strides[index];

   image = intel_allocate_image(dri_format, loaderPrivate);
   if (image == NULL)
      return NULL;

   if (offset + height * stride > parent->bo->size) {
      _mesa_warning(NULL, "intel_create_sub_image: subimage out of bounds");
      free(image);
      return NULL;
   }

   image->bo = parent->bo;
   drm_intel_bo_reference(parent->bo);

   image->width = width;
   image->height = height;
   image->pitch = stride;
   image->offset = offset;

   intel_image_warn_if_unaligned(image, __func__);

   return image;
}

static const __DRIimageExtension intelImageExtension = {
   .base = { __DRI_IMAGE, 13 },

   .createImageFromName = intel_create_image_from_name,
   .createImageFromRenderbuffer = intel_create_image_from_renderbuffer,
   .destroyImage = intel_destroy_image,
   .createImage = intel_create_image,
   .queryImage = intel_query_image,
   .dupImage = intel_dup_image,
   .validateUsage = intel_validate_usage,
   .createImageFromNames = intel_create_image_from_names,
   .fromPlanar = intel_from_planar,
   .createImageFromTexture = intel_create_image_from_texture,
   .createImageFromFds = intel_create_image_from_fds,
   .createImageFromDmaBufs = intel_create_image_from_dma_bufs,
   .blitImage = NULL,
   .getCapabilities = NULL,
   .mapImage = NULL,
   .unmapImage = NULL,
};

static int
brw_query_renderer_integer(__DRIscreen *dri_screen,
                           int param, unsigned int *value)
{
   const struct intel_screen *const screen =
      (struct intel_screen *) dri_screen->driverPrivate;

   switch (param) {
   case __DRI2_RENDERER_VENDOR_ID:
      value[0] = 0x8086;
      return 0;
   case __DRI2_RENDERER_DEVICE_ID:
      value[0] = screen->deviceID;
      return 0;
   case __DRI2_RENDERER_ACCELERATED:
      value[0] = 1;
      return 0;
   case __DRI2_RENDERER_VIDEO_MEMORY: {
      /* Once a batch uses more than 75% of the maximum mappable size, we
       * assume that there's some fragmentation, and we start doing extra
       * flushing, etc. That's the big cliff apps will care about.
       */
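      /* Worked example (hypothetical numbers): a 4 GiB aperture yields
       * gpu_mappable_megabytes = 4096 * 3 / 4 = 3072, so a machine with
       * 8 GiB of RAM reports MIN2(8192, 3072) = 3072 MB.
       */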
      size_t aper_size;
      size_t mappable_size;

      drm_intel_get_aperture_sizes(dri_screen->fd, &mappable_size, &aper_size);

      const unsigned gpu_mappable_megabytes =
         (aper_size / (1024 * 1024)) * 3 / 4;

      const long system_memory_pages = sysconf(_SC_PHYS_PAGES);
      const long system_page_size = sysconf(_SC_PAGE_SIZE);

      if (system_memory_pages <= 0 || system_page_size <= 0)
         return -1;

      const uint64_t system_memory_bytes = (uint64_t) system_memory_pages
         * (uint64_t) system_page_size;

      const unsigned system_memory_megabytes =
         (unsigned) (system_memory_bytes / (1024 * 1024));

      value[0] = MIN2(system_memory_megabytes, gpu_mappable_megabytes);
      return 0;
   }
   case __DRI2_RENDERER_UNIFIED_MEMORY_ARCHITECTURE:
      value[0] = 1;
      return 0;
   default:
      return driQueryRendererIntegerCommon(dri_screen, param, value);
   }

   return -1;
}

static int
brw_query_renderer_string(__DRIscreen *dri_screen,
                          int param, const char **value)
{
   const struct intel_screen *screen =
      (struct intel_screen *) dri_screen->driverPrivate;

   switch (param) {
   case __DRI2_RENDERER_VENDOR_ID:
      value[0] = brw_vendor_string;
      return 0;
   case __DRI2_RENDERER_DEVICE_ID:
      value[0] = brw_get_renderer_string(screen);
      return 0;
   default:
      break;
   }

   return -1;
}

static const __DRI2rendererQueryExtension intelRendererQueryExtension = {
   .base = { __DRI2_RENDERER_QUERY, 1 },

   .queryInteger = brw_query_renderer_integer,
   .queryString = brw_query_renderer_string
};

static const __DRIrobustnessExtension dri2Robustness = {
   .base = { __DRI2_ROBUSTNESS, 1 }
};

static const __DRIextension *screenExtensions[] = {
   &intelTexBufferExtension.base,
   &intelFenceExtension.base,
   &intelFlushExtension.base,
   &intelImageExtension.base,
   &intelRendererQueryExtension.base,
   &dri2ConfigQueryExtension.base,
   NULL
};

static const __DRIextension *intelRobustScreenExtensions[] = {
   &intelTexBufferExtension.base,
   &intelFenceExtension.base,
   &intelFlushExtension.base,
   &intelImageExtension.base,
   &intelRendererQueryExtension.base,
   &dri2ConfigQueryExtension.base,
   &dri2Robustness.base,
   NULL
};

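/**
 * Thin wrappers over DRM_IOCTL_I915_GETPARAM.  intel_get_param() returns 0
 * on success and -errno on failure (warning unless the parameter is simply
 * unknown to the kernel, i.e. -EINVAL); the _boolean/_integer variants fold
 * errors into false and -1 respectively.
 */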
static int
intel_get_param(struct intel_screen *screen, int param, int *value)
{
   int ret = 0;
   struct drm_i915_getparam gp;

   memset(&gp, 0, sizeof(gp));
   gp.param = param;
   gp.value = value;

   if (drmIoctl(screen->driScrnPriv->fd, DRM_IOCTL_I915_GETPARAM, &gp) == -1) {
      ret = -errno;
      if (ret != -EINVAL)
         _mesa_warning(NULL, "drm_i915_getparam: %d", ret);
   }

   return ret;
}

static bool
intel_get_boolean(struct intel_screen *screen, int param)
{
   int value = 0;
   return (intel_get_param(screen, param, &value) == 0) && value;
}

static int
intel_get_integer(struct intel_screen *screen, int param)
{
   int value = -1;

   if (intel_get_param(screen, param, &value) == 0)
      return value;

   return -1;
}

static void
intelDestroyScreen(__DRIscreen * sPriv)
{
   struct intel_screen *screen = sPriv->driverPrivate;

   dri_bufmgr_destroy(screen->bufmgr);
   driDestroyOptionInfo(&screen->optionCache);

   ralloc_free(screen);
   sPriv->driverPrivate = NULL;
}

/**
 * This is called when we need to set up GL rendering to a new X window.
 */
static GLboolean
intelCreateBuffer(__DRIscreen *dri_screen,
                  __DRIdrawable * driDrawPriv,
                  const struct gl_config * mesaVis, GLboolean isPixmap)
{
   struct intel_renderbuffer *rb;
   struct intel_screen *screen = (struct intel_screen *)
      dri_screen->driverPrivate;
   mesa_format rgbFormat;
   unsigned num_samples =
      intel_quantize_num_samples(screen, mesaVis->samples);
   struct gl_framebuffer *fb;

   if (isPixmap)
      return false;

   fb = CALLOC_STRUCT(gl_framebuffer);
   if (!fb)
      return false;

   _mesa_initialize_window_framebuffer(fb, mesaVis);

   if (screen->winsys_msaa_samples_override != -1) {
      num_samples = screen->winsys_msaa_samples_override;
      fb->Visual.samples = num_samples;
   }

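   /* A redMask of 0xff means red lives in the low byte, i.e. an R8G8B8A8
    * memory layout; anything else here is the B8G8R8A8 family.
    */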
   if (mesaVis->redBits == 5) {
      rgbFormat = mesaVis->redMask == 0x1f ? MESA_FORMAT_R5G6B5_UNORM
                                           : MESA_FORMAT_B5G6R5_UNORM;
   } else if (mesaVis->sRGBCapable) {
      rgbFormat = mesaVis->redMask == 0xff ? MESA_FORMAT_R8G8B8A8_SRGB
                                           : MESA_FORMAT_B8G8R8A8_SRGB;
   } else if (mesaVis->alphaBits == 0) {
      rgbFormat = mesaVis->redMask == 0xff ? MESA_FORMAT_R8G8B8X8_UNORM
                                           : MESA_FORMAT_B8G8R8X8_UNORM;
   } else {
      rgbFormat = mesaVis->redMask == 0xff ? MESA_FORMAT_R8G8B8A8_SRGB
                                           : MESA_FORMAT_B8G8R8A8_SRGB;
      fb->Visual.sRGBCapable = true;
   }

   /* setup the hardware-based renderbuffers */
   rb = intel_create_renderbuffer(rgbFormat, num_samples);
   _mesa_add_renderbuffer(fb, BUFFER_FRONT_LEFT, &rb->Base.Base);

   if (mesaVis->doubleBufferMode) {
      rb = intel_create_renderbuffer(rgbFormat, num_samples);
      _mesa_add_renderbuffer(fb, BUFFER_BACK_LEFT, &rb->Base.Base);
   }

   /*
    * Assert here that the gl_config has an expected depth/stencil bit
    * combination: one of d24/s8, d16/s0, d0/s0. (See intelInitScreen2(),
    * which constructs the advertised configs.)
    */
   if (mesaVis->depthBits == 24) {
      assert(mesaVis->stencilBits == 8);

      if (screen->devinfo->has_hiz_and_separate_stencil) {
         rb = intel_create_private_renderbuffer(MESA_FORMAT_Z24_UNORM_X8_UINT,
                                                num_samples);
         _mesa_add_renderbuffer(fb, BUFFER_DEPTH, &rb->Base.Base);
         rb = intel_create_private_renderbuffer(MESA_FORMAT_S_UINT8,
                                                num_samples);
         _mesa_add_renderbuffer(fb, BUFFER_STENCIL, &rb->Base.Base);
      } else {
         /*
          * Use combined depth/stencil. Note that the renderbuffer is
          * attached to two attachment points.
          */
         rb = intel_create_private_renderbuffer(MESA_FORMAT_Z24_UNORM_S8_UINT,
                                                num_samples);
         _mesa_add_renderbuffer(fb, BUFFER_DEPTH, &rb->Base.Base);
         _mesa_add_renderbuffer(fb, BUFFER_STENCIL, &rb->Base.Base);
      }
   }
   else if (mesaVis->depthBits == 16) {
      assert(mesaVis->stencilBits == 0);
      rb = intel_create_private_renderbuffer(MESA_FORMAT_Z_UNORM16,
                                             num_samples);
      _mesa_add_renderbuffer(fb, BUFFER_DEPTH, &rb->Base.Base);
   }
   else {
      assert(mesaVis->depthBits == 0);
      assert(mesaVis->stencilBits == 0);
   }

   /* now add any/all software-based renderbuffers we may need */
   _swrast_add_soft_renderbuffers(fb,
                                  false, /* never sw color */
                                  false, /* never sw depth */
                                  false, /* never sw stencil */
                                  mesaVis->accumRedBits > 0,
                                  false, /* never sw alpha */
                                  false  /* never sw aux */ );
   driDrawPriv->driverPrivate = fb;

   return true;
}

static void
intelDestroyBuffer(__DRIdrawable * driDrawPriv)
{
   struct gl_framebuffer *fb = driDrawPriv->driverPrivate;

   _mesa_reference_framebuffer(&fb, NULL);
}

static void
intel_detect_sseu(struct intel_screen *screen)
{
   assert(screen->devinfo->gen >= 8);
   int ret;

   screen->subslice_total = -1;
   screen->eu_total = -1;

   ret = intel_get_param(screen, I915_PARAM_SUBSLICE_TOTAL,
                         &screen->subslice_total);
   if (ret < 0 && ret != -EINVAL)
      goto err_out;

   ret = intel_get_param(screen,
                         I915_PARAM_EU_TOTAL, &screen->eu_total);
   if (ret < 0 && ret != -EINVAL)
      goto err_out;

   /* Without this information, we cannot get the right Braswell brand
    * strings, and we have to use conservative numbers for GPGPU on many
    * platforms, but otherwise, things will just work.
    */
   if (screen->subslice_total < 1 || screen->eu_total < 1)
      _mesa_warning(NULL,
                    "Kernel 4.1 required to properly query GPU properties.\n");

   return;

err_out:
   screen->subslice_total = -1;
   screen->eu_total = -1;
   _mesa_warning(NULL, "Failed to query GPU properties (%s).\n", strerror(-ret));
}

static bool
intel_init_bufmgr(struct intel_screen *screen)
{
   __DRIscreen *dri_screen = screen->driScrnPriv;

   screen->no_hw = getenv("INTEL_NO_HW") != NULL;

   screen->bufmgr = intel_bufmgr_gem_init(dri_screen->fd, BATCH_SZ);
   if (screen->bufmgr == NULL) {
      fprintf(stderr, "[%s:%u] Error initializing buffer manager.\n",
              __func__, __LINE__);
      return false;
   }

   drm_intel_bufmgr_gem_enable_fenced_relocs(screen->bufmgr);

   if (!intel_get_boolean(screen, I915_PARAM_HAS_RELAXED_DELTA)) {
      fprintf(stderr, "[%s: %u] Kernel 2.6.39 required.\n", __func__, __LINE__);
      return false;
   }

   return true;
}

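/**
 * Probe for bit-6 swizzling by allocating a small X-tiled buffer and asking
 * the kernel which swizzle mode it assigned; anything other than
 * I915_BIT_6_SWIZZLE_NONE means CPU access to tiled buffers must account
 * for address bit-6 swizzling.
 */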
static bool
intel_detect_swizzling(struct intel_screen *screen)
{
   drm_intel_bo *buffer;
   unsigned long flags = 0;
   unsigned long aligned_pitch;
   uint32_t tiling = I915_TILING_X;
   uint32_t swizzle_mode = 0;

   buffer = drm_intel_bo_alloc_tiled(screen->bufmgr, "swizzle test",
                                     64, 64, 4,
                                     &tiling, &aligned_pitch, flags);
   if (buffer == NULL)
      return false;

   drm_intel_bo_get_tiling(buffer, &tiling, &swizzle_mode);
   drm_intel_bo_unreference(buffer);

   if (swizzle_mode == I915_BIT_6_SWIZZLE_NONE)
      return false;
   else
      return true;
}

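/**
 * Classify how the hardware TIMESTAMP register can be read on this kernel:
 *   3: full 36-bit value readable via the (TIMESTAMP | 1) interface
 *   2: register reads shifted; the upper dword holds the low 32 bits
 *   1: register reads unshifted
 *   0: no usable timestamp
 */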
static int
intel_detect_timestamp(struct intel_screen *screen)
{
   uint64_t dummy = 0, last = 0;
   int upper, lower, loops;

   /* On 64bit systems, some old kernels trigger a hw bug resulting in the
    * TIMESTAMP register being shifted and the low 32bits always zero.
    *
    * More recent kernels offer an interface to read the full 36bits
    * everywhere.
    */
   if (drm_intel_reg_read(screen->bufmgr, TIMESTAMP | 1, &dummy) == 0)
      return 3;

   /* Determine if we have a 32bit or 64bit kernel by inspecting the
    * upper 32bits for a rapidly changing timestamp.
    */
   if (drm_intel_reg_read(screen->bufmgr, TIMESTAMP, &last))
      return 0;

   upper = lower = 0;
   for (loops = 0; loops < 10; loops++) {
      /* The TIMESTAMP should change every 80ns, so several round trips
       * through the kernel should be enough to advance it.
       */
      if (drm_intel_reg_read(screen->bufmgr, TIMESTAMP, &dummy))
         return 0;

      upper += (dummy >> 32) != (last >> 32);
      if (upper > 1) /* beware 32bit counter overflow */
         return 2; /* upper dword holds the low 32bits of the timestamp */

      lower += (dummy & 0xffffffff) != (last & 0xffffffff);
      if (lower > 1)
         return 1; /* timestamp is unshifted */

      last = dummy;
   }

   /* No advancement? No timestamp! */
   return 0;
}

/**
 * Return array of MSAA modes supported by the hardware. The array is
 * terminated by -1 and sorted in decreasing order.
 */
const int*
intel_supported_msaa_modes(const struct intel_screen *screen)
{
   static const int gen9_modes[] = {16, 8, 4, 2, 0, -1};
   static const int gen8_modes[] = {8, 4, 2, 0, -1};
   static const int gen7_modes[] = {8, 4, 0, -1};
   static const int gen6_modes[] = {4, 0, -1};
   static const int gen4_modes[] = {0, -1};

   if (screen->devinfo->gen >= 9) {
      return gen9_modes;
   } else if (screen->devinfo->gen >= 8) {
      return gen8_modes;
   } else if (screen->devinfo->gen >= 7) {
      return gen7_modes;
   } else if (screen->devinfo->gen == 6) {
      return gen6_modes;
   } else {
      return gen4_modes;
   }
}

static __DRIconfig**
intel_screen_make_configs(__DRIscreen *dri_screen)
{
   static const mesa_format formats[] = {
      MESA_FORMAT_B5G6R5_UNORM,
      MESA_FORMAT_B8G8R8A8_UNORM,
      MESA_FORMAT_B8G8R8X8_UNORM
   };

   /* GLX_SWAP_COPY_OML is not supported due to page flipping. */
   static const GLenum back_buffer_modes[] = {
      GLX_SWAP_UNDEFINED_OML, GLX_NONE,
   };

   static const uint8_t singlesample_samples[1] = {0};
   static const uint8_t multisample_samples[2] = {4, 8};

   struct intel_screen *screen = dri_screen->driverPrivate;
   const struct gen_device_info *devinfo = screen->devinfo;
   uint8_t depth_bits[4], stencil_bits[4];
   __DRIconfig **configs = NULL;

   /* Generate singlesample configs without accumulation buffer. */
   for (unsigned i = 0; i < ARRAY_SIZE(formats); i++) {
      __DRIconfig **new_configs;
      int num_depth_stencil_bits = 2;

      /* Starting with DRI2 protocol version 1.1 we can request a
       * depth/stencil buffer that has a different number of bits per pixel
       * than the color buffer; gen >= 6 supports this.
       */
      depth_bits[0] = 0;
      stencil_bits[0] = 0;

      if (formats[i] == MESA_FORMAT_B5G6R5_UNORM) {
         depth_bits[1] = 16;
         stencil_bits[1] = 0;
         if (devinfo->gen >= 6) {
            depth_bits[2] = 24;
            stencil_bits[2] = 8;
            num_depth_stencil_bits = 3;
         }
      } else {
         depth_bits[1] = 24;
         stencil_bits[1] = 8;
      }

      new_configs = driCreateConfigs(formats[i],
                                     depth_bits,
                                     stencil_bits,
                                     num_depth_stencil_bits,
                                     back_buffer_modes, 2,
                                     singlesample_samples, 1,
                                     false, false);
      configs = driConcatConfigs(configs, new_configs);
   }

   /* Generate the minimum possible set of configs that include an
    * accumulation buffer.
    */
   for (unsigned i = 0; i < ARRAY_SIZE(formats); i++) {
      __DRIconfig **new_configs;

      if (formats[i] == MESA_FORMAT_B5G6R5_UNORM) {
         depth_bits[0] = 16;
         stencil_bits[0] = 0;
      } else {
         depth_bits[0] = 24;
         stencil_bits[0] = 8;
      }

      new_configs = driCreateConfigs(formats[i],
                                     depth_bits, stencil_bits, 1,
                                     back_buffer_modes, 1,
                                     singlesample_samples, 1,
                                     true, false);
      configs = driConcatConfigs(configs, new_configs);
   }

   /* Generate multisample configs.
    *
    * This loop breaks early, and hence is a no-op, on gen < 6.
    *
    * Multisample configs must follow the singlesample configs in order to
    * work around an X server bug present in 1.12. The X server chooses to
    * associate the first listed RGBA888-Z24S8 config, regardless of its
    * sample count, with the 32-bit depth visual used for compositing.
    *
    * Only doublebuffer configs with GLX_SWAP_UNDEFINED_OML behavior are
    * supported. Singlebuffer configs are not supported because no one wants
    * them.
    */
   for (unsigned i = 0; i < ARRAY_SIZE(formats); i++) {
      if (devinfo->gen < 6)
         break;

      __DRIconfig **new_configs;
      const int num_depth_stencil_bits = 2;
      int num_msaa_modes = 0;

      depth_bits[0] = 0;
      stencil_bits[0] = 0;

      if (formats[i] == MESA_FORMAT_B5G6R5_UNORM) {
         depth_bits[1] = 16;
         stencil_bits[1] = 0;
      } else {
         depth_bits[1] = 24;
         stencil_bits[1] = 8;
      }

      if (devinfo->gen >= 7)
         num_msaa_modes = 2;
      else if (devinfo->gen == 6)
         num_msaa_modes = 1;

      new_configs = driCreateConfigs(formats[i],
                                     depth_bits,
                                     stencil_bits,
                                     num_depth_stencil_bits,
                                     back_buffer_modes, 1,
                                     multisample_samples,
                                     num_msaa_modes,
                                     false, false);
      configs = driConcatConfigs(configs, new_configs);
   }

   if (configs == NULL) {
      fprintf(stderr, "[%s:%u] Error creating FBConfig!\n", __func__,
              __LINE__);
      return NULL;
   }

   return configs;
}

static void
set_max_gl_versions(struct intel_screen *screen)
{
   __DRIscreen *dri_screen = screen->driScrnPriv;
   const bool has_astc = screen->devinfo->gen >= 9;

   switch (screen->devinfo->gen) {
   case 9:
   case 8:
      dri_screen->max_gl_core_version = 44;
      dri_screen->max_gl_compat_version = 30;
      dri_screen->max_gl_es1_version = 11;
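      /* OpenGL ES 3.2 requires ASTC LDR support
       * (GL_KHR_texture_compression_astc_ldr), which gen9 (Skylake) is the
       * first generation to provide; hence ES 3.2 on gen9 and ES 3.1 on
       * gen8.
       */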
      dri_screen->max_gl_es2_version = has_astc ? 32 : 31;
      break;
   case 7:
      dri_screen->max_gl_core_version = 33;
      dri_screen->max_gl_compat_version = 30;
      dri_screen->max_gl_es1_version = 11;
      dri_screen->max_gl_es2_version = screen->devinfo->is_haswell ? 31 : 30;
      break;
   case 6:
      dri_screen->max_gl_core_version = 33;
      dri_screen->max_gl_compat_version = 30;
      dri_screen->max_gl_es1_version = 11;
      dri_screen->max_gl_es2_version = 30;
      break;
   case 5:
   case 4:
      dri_screen->max_gl_core_version = 0;
      dri_screen->max_gl_compat_version = 21;
      dri_screen->max_gl_es1_version = 11;
      dri_screen->max_gl_es2_version = 20;
      break;
   default:
      unreachable("unrecognized intel_screen::gen");
   }
}

/**
 * Return the revision (generally the revid field of the PCI header) of the
 * graphics device.
 *
 * XXX: This function is useful to keep around even if it is not currently in
 * use. It is necessary for new platforms and revision specific workarounds or
 * features. Please don't remove it so that we know it at least continues to
 * build.
 */
static __attribute__((__unused__)) int
brw_get_revision(int fd)
{
   struct drm_i915_getparam gp;
   int revision;
   int ret;

   memset(&gp, 0, sizeof(gp));
   gp.param = I915_PARAM_REVISION;
   gp.value = &revision;

   ret = drmCommandWriteRead(fd, DRM_I915_GETPARAM, &gp, sizeof(gp));
   if (ret)
      revision = -1;

   return revision;
}

/* Drop when RS headers get pulled to libdrm */
#ifndef I915_PARAM_HAS_RESOURCE_STREAMER
#define I915_PARAM_HAS_RESOURCE_STREAMER 36
#endif

static void
shader_debug_log_mesa(void *data, const char *fmt, ...)
{
   struct brw_context *brw = (struct brw_context *)data;
   va_list args;

   va_start(args, fmt);
   GLuint msg_id = 0;
   _mesa_gl_vdebug(&brw->ctx, &msg_id,
                   MESA_DEBUG_SOURCE_SHADER_COMPILER,
                   MESA_DEBUG_TYPE_OTHER,
                   MESA_DEBUG_SEVERITY_NOTIFICATION, fmt, args);
   va_end(args);
}

static void
shader_perf_log_mesa(void *data, const char *fmt, ...)
{
   struct brw_context *brw = (struct brw_context *)data;

   va_list args;
   va_start(args, fmt);

   if (unlikely(INTEL_DEBUG & DEBUG_PERF)) {
      va_list args_copy;
      va_copy(args_copy, args);
      vfprintf(stderr, fmt, args_copy);
      va_end(args_copy);
   }

   if (brw->perf_debug) {
      GLuint msg_id = 0;
      _mesa_gl_vdebug(&brw->ctx, &msg_id,
                      MESA_DEBUG_SOURCE_SHADER_COMPILER,
                      MESA_DEBUG_TYPE_PERFORMANCE,
                      MESA_DEBUG_SEVERITY_MEDIUM, fmt, args);
   }
   va_end(args);
}

/**
 * This is the driver specific part of the createNewScreen entry point.
 * Called when using DRI2.
 *
 * \return the struct gl_config supported by this driver
 */
static const
__DRIconfig **intelInitScreen2(__DRIscreen *dri_screen)
{
   struct intel_screen *screen;

   if (dri_screen->image.loader) {
   } else if (dri_screen->dri2.loader->base.version <= 2 ||
              dri_screen->dri2.loader->getBuffersWithFormat == NULL) {
      fprintf(stderr,
              "\nERROR! DRI2 loader with getBuffersWithFormat() "
              "support required\n");
      return false;
   }

   /* Allocate the private area */
   screen = rzalloc(NULL, struct intel_screen);
   if (!screen) {
      fprintf(stderr, "\nERROR! Allocating private area failed\n");
      return false;
   }
   /* parse information in __driConfigOptions */
   driParseOptionInfo(&screen->optionCache, brw_config_options.xml);

   screen->driScrnPriv = dri_screen;
   dri_screen->driverPrivate = (void *) screen;

   if (!intel_init_bufmgr(screen))
      return false;

   screen->deviceID = drm_intel_bufmgr_gem_get_devid(screen->bufmgr);
   screen->devinfo = gen_get_device_info(screen->deviceID);
   if (!screen->devinfo)
      return false;

   brw_process_intel_debug_variable();

   if (INTEL_DEBUG & DEBUG_BUFMGR)
      dri_bufmgr_set_debug(screen->bufmgr, true);

   if ((INTEL_DEBUG & DEBUG_SHADER_TIME) && screen->devinfo->gen < 7) {
      fprintf(stderr,
              "shader_time debugging requires gen7 (Ivybridge) or better.\n");
      INTEL_DEBUG &= ~DEBUG_SHADER_TIME;
   }

   if (INTEL_DEBUG & DEBUG_AUB)
      drm_intel_bufmgr_gem_set_aub_dump(screen->bufmgr, true);

#ifndef I915_PARAM_MMAP_GTT_VERSION
#define I915_PARAM_MMAP_GTT_VERSION 40 /* XXX delete me with new libdrm */
#endif
   if (intel_get_integer(screen, I915_PARAM_MMAP_GTT_VERSION) >= 1) {
      /* Theoretically unlimited! At least for individual objects...
       *
       * Currently the entire (global) address space for all GTT maps is
       * limited to 64bits. That is, all objects on the system that are
       * set up for GTT mmapping must fit within 64bits. An attempt to use
       * one that exceeds the limit will fail in drm_intel_bo_map_gtt().
       *
       * Long before we hit that limit, we will be practically limited by
       * the fact that any single object must fit in physical memory (RAM).
       * The upper limit on the CPU's address space is currently 48bits
       * (Skylake), of which only 39bits can be physical memory. (The GPU
       * itself also has a 48bit addressable virtual space.) We can fit
       * over 32 million objects of the current maximum allocable size
       * before running out of mmap space.
       */
      screen->max_gtt_map_object_size = UINT64_MAX;
   } else {
      /* Estimate the size of the mappable aperture into the GTT. There's an
       * ioctl to get the whole GTT size, but not one to get the mappable
       * subset. It turns out it's basically always 256MB, though some
       * ancient hardware was smaller.
       */
      uint32_t gtt_size = 256 * 1024 * 1024;

      /* We don't want to map two objects such that a memcpy between them
       * would just fault one mapping in and then the other over and over
       * forever. So we would need to divide the GTT size by 2. Additionally,
       * some GTT is taken up by things like the framebuffer and the
       * ringbuffer and such, so be more conservative.
       */
      screen->max_gtt_map_object_size = gtt_size / 4;
   }

   screen->hw_has_swizzling = intel_detect_swizzling(screen);
   screen->hw_has_timestamp = intel_detect_timestamp(screen);

   /* GENs prior to 8 do not support EU/Subslice info */
   if (screen->devinfo->gen >= 8) {
      intel_detect_sseu(screen);
   } else if (screen->devinfo->gen == 7) {
      screen->subslice_total = 1 << (screen->devinfo->gt - 1);
   }

   const char *force_msaa = getenv("INTEL_FORCE_MSAA");
   if (force_msaa) {
      screen->winsys_msaa_samples_override =
         intel_quantize_num_samples(screen, atoi(force_msaa));
      printf("Forcing winsys sample count to %d\n",
             screen->winsys_msaa_samples_override);
   } else {
      screen->winsys_msaa_samples_override = -1;
   }

   set_max_gl_versions(screen);

   /* Notification of GPU resets requires hardware contexts and a kernel new
    * enough to support DRM_IOCTL_I915_GET_RESET_STATS. If the ioctl is
    * supported, calling it with a context of 0 will either generate EPERM
    * or no error. If the ioctl is not supported, it always generates
    * EINVAL. Use this to determine whether to advertise the
    * __DRI2_ROBUSTNESS extension to the loader.
    *
    * Don't even try on pre-Gen6, since we don't attempt to use contexts
    * there.
    */
   if (screen->devinfo->gen >= 6) {
      struct drm_i915_reset_stats stats;
      memset(&stats, 0, sizeof(stats));

      const int ret = drmIoctl(dri_screen->fd, DRM_IOCTL_I915_GET_RESET_STATS, &stats);

      screen->has_context_reset_notification =
         (ret != -1 || errno != EINVAL);
   }

   if (intel_get_param(screen, I915_PARAM_CMD_PARSER_VERSION,
                       &screen->cmd_parser_version) < 0) {
      screen->cmd_parser_version = 0;
   }

   /* Haswell requires command parser version 6 in order to write to the
    * MI_MATH GPR registers, and version 7 in order to use
    * MI_LOAD_REGISTER_REG (which all users of MI_MATH use).
    */
   screen->has_mi_math_and_lrr = screen->devinfo->gen >= 8 ||
                                 (screen->devinfo->is_haswell &&
                                  screen->cmd_parser_version >= 7);

   dri_screen->extensions = !screen->has_context_reset_notification
      ? screenExtensions : intelRobustScreenExtensions;

   screen->compiler = brw_compiler_create(screen,
                                          screen->devinfo);
   screen->compiler->shader_debug_log = shader_debug_log_mesa;
   screen->compiler->shader_perf_log = shader_perf_log_mesa;
   screen->program_id = 1;

   if (screen->devinfo->has_resource_streamer) {
      screen->has_resource_streamer =
         intel_get_boolean(screen, I915_PARAM_HAS_RESOURCE_STREAMER);
   }

   return (const __DRIconfig**) intel_screen_make_configs(dri_screen);
}

struct intel_buffer {
   __DRIbuffer base;
   drm_intel_bo *bo;
};

static __DRIbuffer *
intelAllocateBuffer(__DRIscreen *dri_screen,
                    unsigned attachment, unsigned format,
                    int width, int height)
{
   struct intel_buffer *intelBuffer;
   struct intel_screen *screen = dri_screen->driverPrivate;

   assert(attachment == __DRI_BUFFER_FRONT_LEFT ||
          attachment == __DRI_BUFFER_BACK_LEFT);

   intelBuffer = calloc(1, sizeof *intelBuffer);
   if (intelBuffer == NULL)
      return NULL;

   /* The front and back buffers are color buffers, which are X tiled. */
   uint32_t tiling = I915_TILING_X;
   unsigned long pitch;
   int cpp = format / 8;
   intelBuffer->bo = drm_intel_bo_alloc_tiled(screen->bufmgr,
                                              "intelAllocateBuffer",
                                              width,
                                              height,
                                              cpp,
                                              &tiling, &pitch,
                                              BO_ALLOC_FOR_RENDER);

   if (intelBuffer->bo == NULL) {
      free(intelBuffer);
      return NULL;
   }

   drm_intel_bo_flink(intelBuffer->bo, &intelBuffer->base.name);

   intelBuffer->base.attachment = attachment;
   intelBuffer->base.cpp = cpp;
   intelBuffer->base.pitch = pitch;

   return &intelBuffer->base;
}

static void
intelReleaseBuffer(__DRIscreen *dri_screen, __DRIbuffer *buffer)
{
   struct intel_buffer *intelBuffer = (struct intel_buffer *) buffer;

   drm_intel_bo_unreference(intelBuffer->bo);
   free(intelBuffer);
}

static const struct __DriverAPIRec brw_driver_api = {
   .InitScreen = intelInitScreen2,
   .DestroyScreen = intelDestroyScreen,
   .CreateContext = brwCreateContext,
   .DestroyContext = intelDestroyContext,
   .CreateBuffer = intelCreateBuffer,
   .DestroyBuffer = intelDestroyBuffer,
   .MakeCurrent = intelMakeCurrent,
   .UnbindContext = intelUnbindContext,
   .AllocateBuffer = intelAllocateBuffer,
   .ReleaseBuffer = intelReleaseBuffer
};

static const struct __DRIDriverVtableExtensionRec brw_vtable = {
   .base = { __DRI_DRIVER_VTABLE, 1 },
   .vtable = &brw_driver_api,
};

static const __DRIextension *brw_driver_extensions[] = {
   &driCoreExtension.base,
   &driImageDriverExtension.base,
   &driDRI2Extension.base,
   &brw_vtable.base,
   &brw_config_options.base,
   NULL
};

PUBLIC const __DRIextension **__driDriverGetExtensions_i965(void)
{
   globalDriverAPI = &brw_driver_api;

   return brw_driver_extensions;
}