c9577c8be4172b202a56c4f338b64ad7d0ee2e1b
[mesa.git] / src / gallium / drivers / ilo / ilo_screen.c
1 /*
2 * Mesa 3-D graphics library
3 *
4 * Copyright (C) 2012-2013 LunarG, Inc.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included
14 * in all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
23 *
24 * Authors:
25 * Chia-I Wu <olv@lunarg.com>
26 */
27
28 #include "pipe/p_state.h"
29 #include "os/os_misc.h"
30 #include "util/u_format_s3tc.h"
31 #include "vl/vl_decoder.h"
32 #include "vl/vl_video_buffer.h"
33 #include "genhw/genhw.h" /* for GEN6_REG_TIMESTAMP */
34 #include "intel_winsys.h"
35
36 #include "ilo_context.h"
37 #include "ilo_format.h"
38 #include "ilo_resource.h"
39 #include "ilo_transfer.h" /* for ILO_TRANSFER_MAP_BUFFER_ALIGNMENT */
40 #include "ilo_public.h"
41 #include "ilo_screen.h"
42
43 struct ilo_fence {
44 struct pipe_reference reference;
45 struct intel_bo *bo;
46 };
47
48 int ilo_debug;
49
50 static const struct debug_named_value ilo_debug_flags[] = {
51 { "batch", ILO_DEBUG_BATCH, "Dump batch/dynamic/surface/instruction buffers" },
52 { "vs", ILO_DEBUG_VS, "Dump vertex shaders" },
53 { "gs", ILO_DEBUG_GS, "Dump geometry shaders" },
54 { "fs", ILO_DEBUG_FS, "Dump fragment shaders" },
55 { "cs", ILO_DEBUG_CS, "Dump compute shaders" },
56 { "draw", ILO_DEBUG_DRAW, "Show draw information" },
57 { "submit", ILO_DEBUG_SUBMIT, "Show batch buffer submissions" },
58 { "hang", ILO_DEBUG_HANG, "Detect GPU hangs" },
59 { "nohw", ILO_DEBUG_NOHW, "Do not send commands to HW" },
60 { "nocache", ILO_DEBUG_NOCACHE, "Always invalidate HW caches" },
61 { "nohiz", ILO_DEBUG_NOHIZ, "Disable HiZ" },
62 DEBUG_NAMED_VALUE_END
63 };
64
65 static float
66 ilo_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
67 {
68 switch (param) {
69 case PIPE_CAPF_MAX_LINE_WIDTH:
70 /* in U3.7, defined in 3DSTATE_SF */
71 return 7.0f;
72 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
73 /* line width minus one, which is reserved for AA region */
74 return 6.0f;
75 case PIPE_CAPF_MAX_POINT_WIDTH:
76 /* in U8.3, defined in 3DSTATE_SF */
77 return 255.0f;
78 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
79 /* same as point width, as we ignore rasterizer->point_smooth */
80 return 255.0f;
81 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
82 /* [2.0, 16.0], defined in SAMPLER_STATE */
83 return 16.0f;
84 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
85 /* [-16.0, 16.0), defined in SAMPLER_STATE */
86 return 15.0f;
87 case PIPE_CAPF_GUARD_BAND_LEFT:
88 case PIPE_CAPF_GUARD_BAND_TOP:
89 case PIPE_CAPF_GUARD_BAND_RIGHT:
90 case PIPE_CAPF_GUARD_BAND_BOTTOM:
91 /* what are these for? */
92 return 0.0f;
93
94 default:
95 return 0.0f;
96 }
97 }
98
99 static int
100 ilo_get_shader_param(struct pipe_screen *screen, unsigned shader,
101 enum pipe_shader_cap param)
102 {
103 switch (shader) {
104 case PIPE_SHADER_FRAGMENT:
105 case PIPE_SHADER_VERTEX:
106 case PIPE_SHADER_GEOMETRY:
107 break;
108 default:
109 return 0;
110 }
111
112 switch (param) {
113 /* the limits are copied from the classic driver */
114 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
115 return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 16384;
116 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
117 return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 0;
118 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
119 return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 0;
120 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
121 return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 0;
122 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
123 return UINT_MAX;
124 case PIPE_SHADER_CAP_MAX_INPUTS:
125 case PIPE_SHADER_CAP_MAX_OUTPUTS:
126 /* this is limited by how many attributes SF can remap */
127 return 16;
128 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
129 return 1024 * sizeof(float[4]);
130 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
131 return ILO_MAX_CONST_BUFFERS;
132 case PIPE_SHADER_CAP_MAX_TEMPS:
133 return 256;
134 case PIPE_SHADER_CAP_MAX_PREDS:
135 return 0;
136 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
137 return 1;
138 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
139 return 0;
140 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
141 return 0;
142 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
143 return (shader == PIPE_SHADER_FRAGMENT) ? 0 : 1;
144 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
145 return 1;
146 case PIPE_SHADER_CAP_SUBROUTINES:
147 return 0;
148 case PIPE_SHADER_CAP_INTEGERS:
149 return 1;
150 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
151 return ILO_MAX_SAMPLERS;
152 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
153 return ILO_MAX_SAMPLER_VIEWS;
154 case PIPE_SHADER_CAP_PREFERRED_IR:
155 return PIPE_SHADER_IR_TGSI;
156 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
157 return 1;
158
159 default:
160 return 0;
161 }
162 }
163
164 static int
165 ilo_get_video_param(struct pipe_screen *screen,
166 enum pipe_video_profile profile,
167 enum pipe_video_entrypoint entrypoint,
168 enum pipe_video_cap param)
169 {
170 switch (param) {
171 case PIPE_VIDEO_CAP_SUPPORTED:
172 return vl_profile_supported(screen, profile, entrypoint);
173 case PIPE_VIDEO_CAP_NPOT_TEXTURES:
174 return 1;
175 case PIPE_VIDEO_CAP_MAX_WIDTH:
176 case PIPE_VIDEO_CAP_MAX_HEIGHT:
177 return vl_video_buffer_max_size(screen);
178 case PIPE_VIDEO_CAP_PREFERED_FORMAT:
179 return PIPE_FORMAT_NV12;
180 case PIPE_VIDEO_CAP_PREFERS_INTERLACED:
181 return 1;
182 case PIPE_VIDEO_CAP_SUPPORTS_PROGRESSIVE:
183 return 1;
184 case PIPE_VIDEO_CAP_SUPPORTS_INTERLACED:
185 return 0;
186 case PIPE_VIDEO_CAP_MAX_LEVEL:
187 return vl_level_supported(screen, profile);
188 default:
189 return 0;
190 }
191 }
192
193 static int
194 ilo_get_compute_param(struct pipe_screen *screen,
195 enum pipe_compute_cap param,
196 void *ret)
197 {
198 struct ilo_screen *is = ilo_screen(screen);
199 union {
200 const char *ir_target;
201 uint64_t grid_dimension;
202 uint64_t max_grid_size[3];
203 uint64_t max_block_size[3];
204 uint64_t max_threads_per_block;
205 uint64_t max_global_size;
206 uint64_t max_local_size;
207 uint64_t max_private_size;
208 uint64_t max_input_size;
209 uint64_t max_mem_alloc_size;
210 uint32_t max_clock_frequency;
211 uint32_t max_compute_units;
212 uint32_t images_supported;
213 } val;
214 const void *ptr;
215 int size;
216
217 switch (param) {
218 case PIPE_COMPUTE_CAP_IR_TARGET:
219 val.ir_target = "ilog";
220
221 ptr = val.ir_target;
222 size = strlen(val.ir_target) + 1;
223 break;
224 case PIPE_COMPUTE_CAP_GRID_DIMENSION:
225 val.grid_dimension = Elements(val.max_grid_size);
226
227 ptr = &val.grid_dimension;
228 size = sizeof(val.grid_dimension);
229 break;
230 case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
231 val.max_grid_size[0] = 0xffffffffu;
232 val.max_grid_size[1] = 0xffffffffu;
233 val.max_grid_size[2] = 0xffffffffu;
234
235 ptr = &val.max_grid_size;
236 size = sizeof(val.max_grid_size);
237 break;
238 case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
239 val.max_block_size[0] = 1024;
240 val.max_block_size[1] = 1024;
241 val.max_block_size[2] = 1024;
242
243 ptr = &val.max_block_size;
244 size = sizeof(val.max_block_size);
245 break;
246
247 case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
248 val.max_threads_per_block = 1024;
249
250 ptr = &val.max_threads_per_block;
251 size = sizeof(val.max_threads_per_block);
252 break;
253 case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
254 /* \see ilo_max_resource_size */
255 val.max_global_size = 1u << 31;
256
257 ptr = &val.max_global_size;
258 size = sizeof(val.max_global_size);
259 break;
260 case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
261 /* Shared Local Memory Size of INTERFACE_DESCRIPTOR_DATA */
262 val.max_local_size = 64 * 1024;
263
264 ptr = &val.max_local_size;
265 size = sizeof(val.max_local_size);
266 break;
267 case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
268 /* scratch size */
269 val.max_private_size = 12 * 1024;
270
271 ptr = &val.max_private_size;
272 size = sizeof(val.max_private_size);
273 break;
274 case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
275 val.max_input_size = 1024;
276
277 ptr = &val.max_input_size;
278 size = sizeof(val.max_input_size);
279 break;
280 case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:
281 val.max_mem_alloc_size = 1u << 31;
282
283 ptr = &val.max_mem_alloc_size;
284 size = sizeof(val.max_mem_alloc_size);
285 break;
286 case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
287 val.max_clock_frequency = 1000;
288
289 ptr = &val.max_clock_frequency;
290 size = sizeof(val.max_clock_frequency);
291 break;
292 case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
293 val.max_compute_units = is->dev.eu_count;
294
295 ptr = &val.max_compute_units;
296 size = sizeof(val.max_compute_units);
297 break;
298 case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
299 val.images_supported = 1;
300
301 ptr = &val.images_supported;
302 size = sizeof(val.images_supported);
303 break;
304 default:
305 ptr = NULL;
306 size = 0;
307 break;
308 }
309
310 if (ret)
311 memcpy(ret, ptr, size);
312
313 return size;
314 }
315
316 static int
317 ilo_get_param(struct pipe_screen *screen, enum pipe_cap param)
318 {
319 struct ilo_screen *is = ilo_screen(screen);
320
321 switch (param) {
322 case PIPE_CAP_NPOT_TEXTURES:
323 case PIPE_CAP_TWO_SIDED_STENCIL:
324 return true;
325 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
326 return 0; /* TODO */
327 case PIPE_CAP_ANISOTROPIC_FILTER:
328 case PIPE_CAP_POINT_SPRITE:
329 return true;
330 case PIPE_CAP_MAX_RENDER_TARGETS:
331 return ILO_MAX_DRAW_BUFFERS;
332 case PIPE_CAP_OCCLUSION_QUERY:
333 case PIPE_CAP_QUERY_TIME_ELAPSED:
334 case PIPE_CAP_TEXTURE_SHADOW_MAP:
335 case PIPE_CAP_TEXTURE_SWIZZLE: /* must be supported for shadow map */
336 return true;
337 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
338 /*
339 * As defined in SURFACE_STATE, we have
340 *
341 * Max WxHxD for 2D and CUBE Max WxHxD for 3D
342 * GEN6 8192x8192x512 2048x2048x2048
343 * GEN7 16384x16384x2048 2048x2048x2048
344 */
345 return (ilo_dev_gen(&is->dev) >= ILO_GEN(7)) ? 15 : 14;
346 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
347 return 12;
348 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
349 return (ilo_dev_gen(&is->dev) >= ILO_GEN(7)) ? 15 : 14;
350 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
351 return false;
352 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
353 case PIPE_CAP_SM3:
354 return true;
355 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
356 if (ilo_dev_gen(&is->dev) >= ILO_GEN(7) && !is->dev.has_gen7_sol_reset)
357 return 0;
358 return ILO_MAX_SO_BUFFERS;
359 case PIPE_CAP_PRIMITIVE_RESTART:
360 return true;
361 case PIPE_CAP_INDEP_BLEND_ENABLE:
362 case PIPE_CAP_INDEP_BLEND_FUNC:
363 return true;
364 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
365 return (ilo_dev_gen(&is->dev) >= ILO_GEN(7)) ? 2048 : 512;
366 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
367 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
368 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
369 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
370 case PIPE_CAP_DEPTH_CLIP_DISABLE:
371 return true;
372 case PIPE_CAP_SHADER_STENCIL_EXPORT:
373 return false;
374 case PIPE_CAP_TGSI_INSTANCEID:
375 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
376 return true;
377 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
378 return false;
379 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
380 return true;
381 case PIPE_CAP_SEAMLESS_CUBE_MAP:
382 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
383 return true;
384 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
385 case PIPE_CAP_MIN_TEXEL_OFFSET:
386 return -8;
387 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
388 case PIPE_CAP_MAX_TEXEL_OFFSET:
389 return 7;
390 case PIPE_CAP_CONDITIONAL_RENDER:
391 case PIPE_CAP_TEXTURE_BARRIER:
392 return true;
393 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
394 return ILO_MAX_SO_BINDINGS / ILO_MAX_SO_BUFFERS;
395 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
396 return ILO_MAX_SO_BINDINGS;
397 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
398 if (ilo_dev_gen(&is->dev) >= ILO_GEN(7))
399 return is->dev.has_gen7_sol_reset;
400 else
401 return false; /* TODO */
402 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
403 return false;
404 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
405 return true;
406 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
407 return false;
408 case PIPE_CAP_GLSL_FEATURE_LEVEL:
409 return 140;
410 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
411 case PIPE_CAP_USER_VERTEX_BUFFERS:
412 return false;
413 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
414 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
415 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
416 return false;
417 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
418 return 2048;
419 case PIPE_CAP_COMPUTE:
420 return false; /* TODO */
421 case PIPE_CAP_USER_INDEX_BUFFERS:
422 case PIPE_CAP_USER_CONSTANT_BUFFERS:
423 return true;
424 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
425 /* imposed by OWord (Dual) Block Read */
426 return 16;
427 case PIPE_CAP_START_INSTANCE:
428 return true;
429 case PIPE_CAP_QUERY_TIMESTAMP:
430 return is->dev.has_timestamp;
431 case PIPE_CAP_TEXTURE_MULTISAMPLE:
432 return false; /* TODO */
433 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
434 return ILO_TRANSFER_MAP_BUFFER_ALIGNMENT;
435 case PIPE_CAP_CUBE_MAP_ARRAY:
436 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
437 return true;
438 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
439 return 1;
440 case PIPE_CAP_TGSI_TEXCOORD:
441 return false;
442 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
443 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
444 return true;
445 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
446 return 0;
447 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
448 /* a GEN6_SURFTYPE_BUFFER can have up to 2^27 elements */
449 return 1 << 27;
450 case PIPE_CAP_MAX_VIEWPORTS:
451 return ILO_MAX_VIEWPORTS;
452 case PIPE_CAP_ENDIANNESS:
453 return PIPE_ENDIAN_LITTLE;
454 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
455 return true;
456 case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:
457 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
458 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
459 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
460 case PIPE_CAP_TEXTURE_GATHER_SM5:
461 return 0;
462 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
463 return true;
464 case PIPE_CAP_FAKE_SW_MSAA:
465 case PIPE_CAP_TEXTURE_QUERY_LOD:
466 case PIPE_CAP_SAMPLE_SHADING:
467 case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
468 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
469 case PIPE_CAP_MAX_VERTEX_STREAMS:
470 case PIPE_CAP_DRAW_INDIRECT:
471 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
472 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
473 case PIPE_CAP_SAMPLER_VIEW_TARGET:
474 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
475 case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
476 return 0;
477
478 case PIPE_CAP_VENDOR_ID:
479 return 0x8086;
480 case PIPE_CAP_DEVICE_ID:
481 return is->dev.devid;
482 case PIPE_CAP_ACCELERATED:
483 return true;
484 case PIPE_CAP_VIDEO_MEMORY: {
485 /* Once a batch uses more than 75% of the maximum mappable size, we
486 * assume that there's some fragmentation, and we start doing extra
487 * flushing, etc. That's the big cliff apps will care about.
488 */
489 const uint64_t gpu_memory = is->dev.aperture_total * 3 / 4;
490 uint64_t system_memory;
491
492 if (!os_get_total_physical_memory(&system_memory))
493 return 0;
494
495 return (int) (MIN2(gpu_memory, system_memory) >> 20);
496 }
497 case PIPE_CAP_UMA:
498 return true;
499 case PIPE_CAP_CLIP_HALFZ:
500 return true;
501 case PIPE_CAP_VERTEXID_NOBASE:
502 return false;
503 case PIPE_CAP_POLYGON_OFFSET_CLAMP:
504 return true;
505
506 default:
507 return 0;
508 }
509 }
510
511 static const char *
512 ilo_get_vendor(struct pipe_screen *screen)
513 {
514 return "LunarG, Inc.";
515 }
516
517 static const char *
518 ilo_get_name(struct pipe_screen *screen)
519 {
520 struct ilo_screen *is = ilo_screen(screen);
521 const char *chipset = NULL;
522
523 if (gen_is_chv(is->dev.devid)) {
524 chipset = "Intel(R) Cherryview";
525 } else if (gen_is_bdw(is->dev.devid)) {
526 /* this is likely wrong */
527 if (gen_is_desktop(is->dev.devid))
528 chipset = "Intel(R) Broadwell Desktop";
529 else if (gen_is_mobile(is->dev.devid))
530 chipset = "Intel(R) Broadwell Mobile";
531 else if (gen_is_server(is->dev.devid))
532 chipset = "Intel(R) Broadwell Server";
533 } else if (gen_is_vlv(is->dev.devid)) {
534 chipset = "Intel(R) Bay Trail";
535 } else if (gen_is_hsw(is->dev.devid)) {
536 if (gen_is_desktop(is->dev.devid))
537 chipset = "Intel(R) Haswell Desktop";
538 else if (gen_is_mobile(is->dev.devid))
539 chipset = "Intel(R) Haswell Mobile";
540 else if (gen_is_server(is->dev.devid))
541 chipset = "Intel(R) Haswell Server";
542 } else if (gen_is_ivb(is->dev.devid)) {
543 if (gen_is_desktop(is->dev.devid))
544 chipset = "Intel(R) Ivybridge Desktop";
545 else if (gen_is_mobile(is->dev.devid))
546 chipset = "Intel(R) Ivybridge Mobile";
547 else if (gen_is_server(is->dev.devid))
548 chipset = "Intel(R) Ivybridge Server";
549 } else if (gen_is_snb(is->dev.devid)) {
550 if (gen_is_desktop(is->dev.devid))
551 chipset = "Intel(R) Sandybridge Desktop";
552 else if (gen_is_mobile(is->dev.devid))
553 chipset = "Intel(R) Sandybridge Mobile";
554 else if (gen_is_server(is->dev.devid))
555 chipset = "Intel(R) Sandybridge Server";
556 }
557
558 if (!chipset)
559 chipset = "Unknown Intel Chipset";
560
561 return chipset;
562 }
563
564 static uint64_t
565 ilo_get_timestamp(struct pipe_screen *screen)
566 {
567 struct ilo_screen *is = ilo_screen(screen);
568 union {
569 uint64_t val;
570 uint32_t dw[2];
571 } timestamp;
572
573 intel_winsys_read_reg(is->winsys, GEN6_REG_TIMESTAMP, &timestamp.val);
574
575 /*
576 * From the Ivy Bridge PRM, volume 1 part 3, page 107:
577 *
578 * "Note: This timestamp register reflects the value of the PCU TSC.
579 * The PCU TSC counts 10ns increments; this timestamp reflects bits
580 * 38:3 of the TSC (i.e. 80ns granularity, rolling over every 1.5
581 * hours)."
582 *
583 * However, it seems dw[0] is garbage and dw[1] contains the lower 32 bits
584 * of the timestamp. We will have to live with a timestamp that rolls over
585 * every ~343 seconds.
586 *
587 * See also brw_get_timestamp().
588 */
589 return (uint64_t) timestamp.dw[1] * 80;
590 }
591
592 static void
593 ilo_fence_reference(struct pipe_screen *screen,
594 struct pipe_fence_handle **p,
595 struct pipe_fence_handle *f)
596 {
597 struct ilo_fence *fence = ilo_fence(f);
598 struct ilo_fence *old;
599
600 if (likely(p)) {
601 old = ilo_fence(*p);
602 *p = f;
603 }
604 else {
605 old = NULL;
606 }
607
608 STATIC_ASSERT(&((struct ilo_fence *) NULL)->reference == NULL);
609 if (pipe_reference(&old->reference, &fence->reference)) {
610 if (old->bo)
611 intel_bo_unreference(old->bo);
612 FREE(old);
613 }
614 }
615
616 static boolean
617 ilo_fence_signalled(struct pipe_screen *screen,
618 struct pipe_fence_handle *f)
619 {
620 struct ilo_fence *fence = ilo_fence(f);
621
622 /* mark signalled if the bo is idle */
623 if (fence->bo && !intel_bo_is_busy(fence->bo)) {
624 intel_bo_unreference(fence->bo);
625 fence->bo = NULL;
626 }
627
628 return (fence->bo == NULL);
629 }
630
631 static boolean
632 ilo_fence_finish(struct pipe_screen *screen,
633 struct pipe_fence_handle *f,
634 uint64_t timeout)
635 {
636 struct ilo_fence *fence = ilo_fence(f);
637 const int64_t wait_timeout = (timeout > INT64_MAX) ? -1 : timeout;
638
639 /* already signalled */
640 if (!fence->bo)
641 return true;
642
643 /* wait and see if it returns error */
644 if (intel_bo_wait(fence->bo, wait_timeout))
645 return false;
646
647 /* mark signalled */
648 intel_bo_unreference(fence->bo);
649 fence->bo = NULL;
650
651 return true;
652 }
653
654 /**
655 * Create a fence for \p bo. When \p bo is not NULL, it must be submitted
656 * before waited on or checked.
657 */
658 struct ilo_fence *
659 ilo_fence_create(struct pipe_screen *screen, struct intel_bo *bo)
660 {
661 struct ilo_fence *fence;
662
663 fence = CALLOC_STRUCT(ilo_fence);
664 if (!fence)
665 return NULL;
666
667 pipe_reference_init(&fence->reference, 1);
668
669 if (bo)
670 intel_bo_reference(bo);
671 fence->bo = bo;
672
673 return fence;
674 }
675
676 static void
677 ilo_screen_destroy(struct pipe_screen *screen)
678 {
679 struct ilo_screen *is = ilo_screen(screen);
680
681 /* as it seems, winsys is owned by the screen */
682 intel_winsys_destroy(is->winsys);
683
684 FREE(is);
685 }
686
687 static bool
688 init_dev(struct ilo_dev_info *dev, const struct intel_winsys_info *info)
689 {
690 dev->devid = info->devid;
691 dev->aperture_total = info->aperture_total;
692 dev->aperture_mappable = info->aperture_mappable;
693 dev->has_llc = info->has_llc;
694 dev->has_address_swizzling = info->has_address_swizzling;
695 dev->has_logical_context = info->has_logical_context;
696 dev->has_ppgtt = info->has_ppgtt;
697 dev->has_timestamp = info->has_timestamp;
698 dev->has_gen7_sol_reset = info->has_gen7_sol_reset;
699
700 if (!dev->has_logical_context) {
701 ilo_err("missing hardware logical context support\n");
702 return false;
703 }
704
705 /*
706 * PIPE_CONTROL and MI_* use PPGTT writes on GEN7+ and privileged GGTT
707 * writes on GEN6.
708 *
709 * From the Sandy Bridge PRM, volume 1 part 3, page 101:
710 *
711 * "[DevSNB] When Per-Process GTT Enable is set, it is assumed that all
712 * code is in a secure environment, independent of address space.
713 * Under this condition, this bit only specifies the address space
714 * (GGTT or PPGTT). All commands are executed "as-is""
715 *
716 * We need PPGTT to be enabled on GEN6 too.
717 */
718 if (!dev->has_ppgtt) {
719 /* experiments show that it does not really matter... */
720 ilo_warn("PPGTT disabled\n");
721 }
722
723 if (gen_is_bdw(info->devid) || gen_is_chv(info->devid)) {
724 dev->gen_opaque = ILO_GEN(8);
725 dev->gt = (gen_is_bdw(info->devid)) ? gen_get_bdw_gt(info->devid) : 1;
726 /* XXX random values */
727 if (dev->gt == 3) {
728 dev->eu_count = 48;
729 dev->thread_count = 336;
730 dev->urb_size = 384 * 1024;
731 } else if (dev->gt == 2) {
732 dev->eu_count = 24;
733 dev->thread_count = 168;
734 dev->urb_size = 384 * 1024;
735 } else {
736 dev->eu_count = 12;
737 dev->thread_count = 84;
738 dev->urb_size = 192 * 1024;
739 }
740 } else if (gen_is_hsw(info->devid)) {
741 /*
742 * From the Haswell PRM, volume 4, page 8:
743 *
744 * "Description GT3 GT2 GT1.5 GT1
745 * (...)
746 * EUs (Total) 40 20 12 10
747 * Threads (Total) 280 140 84 70
748 * (...)
749 * URB Size (max, within L3$) 512KB 256KB 256KB 128KB
750 */
751 dev->gen_opaque = ILO_GEN(7.5);
752 dev->gt = gen_get_hsw_gt(info->devid);
753 if (dev->gt == 3) {
754 dev->eu_count = 40;
755 dev->thread_count = 280;
756 dev->urb_size = 512 * 1024;
757 } else if (dev->gt == 2) {
758 dev->eu_count = 20;
759 dev->thread_count = 140;
760 dev->urb_size = 256 * 1024;
761 } else {
762 dev->eu_count = 10;
763 dev->thread_count = 70;
764 dev->urb_size = 128 * 1024;
765 }
766 } else if (gen_is_ivb(info->devid) || gen_is_vlv(info->devid)) {
767 /*
768 * From the Ivy Bridge PRM, volume 1 part 1, page 18:
769 *
770 * "Device # of EUs #Threads/EU
771 * Ivy Bridge (GT2) 16 8
772 * Ivy Bridge (GT1) 6 6"
773 *
774 * From the Ivy Bridge PRM, volume 4 part 2, page 17:
775 *
776 * "URB Size URB Rows URB Rows when SLM Enabled
777 * 128k 4096 2048
778 * 256k 8096 4096"
779 */
780 dev->gen_opaque = ILO_GEN(7);
781 dev->gt = (gen_is_ivb(info->devid)) ? gen_get_ivb_gt(info->devid) : 1;
782 if (dev->gt == 2) {
783 dev->eu_count = 16;
784 dev->thread_count = 128;
785 dev->urb_size = 256 * 1024;
786 } else {
787 dev->eu_count = 6;
788 dev->thread_count = 36;
789 dev->urb_size = 128 * 1024;
790 }
791 } else if (gen_is_snb(info->devid)) {
792 /*
793 * From the Sandy Bridge PRM, volume 1 part 1, page 22:
794 *
795 * "Device # of EUs #Threads/EU
796 * SNB GT2 12 5
797 * SNB GT1 6 4"
798 *
799 * From the Sandy Bridge PRM, volume 4 part 2, page 18:
800 *
801 * "[DevSNB]: The GT1 product's URB provides 32KB of storage,
802 * arranged as 1024 256-bit rows. The GT2 product's URB provides
803 * 64KB of storage, arranged as 2048 256-bit rows. A row
804 * corresponds in size to an EU GRF register. Read/write access to
805 * the URB is generally supported on a row-granular basis."
806 */
807 dev->gen_opaque = ILO_GEN(6);
808 dev->gt = gen_get_snb_gt(info->devid);
809 if (dev->gt == 2) {
810 dev->eu_count = 12;
811 dev->thread_count = 60;
812 dev->urb_size = 64 * 1024;
813 } else {
814 dev->eu_count = 6;
815 dev->thread_count = 24;
816 dev->urb_size = 32 * 1024;
817 }
818 } else {
819 ilo_err("unknown GPU generation\n");
820 return false;
821 }
822
823 return true;
824 }
825
826 struct pipe_screen *
827 ilo_screen_create(struct intel_winsys *ws)
828 {
829 struct ilo_screen *is;
830 const struct intel_winsys_info *info;
831
832 ilo_debug = debug_get_flags_option("ILO_DEBUG", ilo_debug_flags, 0);
833
834 is = CALLOC_STRUCT(ilo_screen);
835 if (!is)
836 return NULL;
837
838 is->winsys = ws;
839
840 info = intel_winsys_get_info(is->winsys);
841 if (!init_dev(&is->dev, info)) {
842 FREE(is);
843 return NULL;
844 }
845
846 util_format_s3tc_init();
847
848 is->base.destroy = ilo_screen_destroy;
849 is->base.get_name = ilo_get_name;
850 is->base.get_vendor = ilo_get_vendor;
851 is->base.get_param = ilo_get_param;
852 is->base.get_paramf = ilo_get_paramf;
853 is->base.get_shader_param = ilo_get_shader_param;
854 is->base.get_video_param = ilo_get_video_param;
855 is->base.get_compute_param = ilo_get_compute_param;
856
857 is->base.get_timestamp = ilo_get_timestamp;
858
859 is->base.flush_frontbuffer = NULL;
860
861 is->base.fence_reference = ilo_fence_reference;
862 is->base.fence_signalled = ilo_fence_signalled;
863 is->base.fence_finish = ilo_fence_finish;
864
865 is->base.get_driver_query_info = NULL;
866
867 ilo_init_format_functions(is);
868 ilo_init_context_functions(is);
869 ilo_init_resource_functions(is);
870
871 return &is->base;
872 }