etnaviv: check if MSAA is supported
[mesa.git] / src / gallium / drivers / etnaviv / etnaviv_screen.c
1 /*
2 * Copyright (c) 2012-2015 Etnaviv Project
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
13 * of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 *
23 * Authors:
24 * Wladimir J. van der Laan <laanwj@gmail.com>
25 * Christian Gmeiner <christian.gmeiner@gmail.com>
26 */
27
28 #include "etnaviv_screen.h"
29
30 #include "hw/common.xml.h"
31
32 #include "etnaviv_compiler.h"
33 #include "etnaviv_context.h"
34 #include "etnaviv_debug.h"
35 #include "etnaviv_fence.h"
36 #include "etnaviv_format.h"
37 #include "etnaviv_query.h"
38 #include "etnaviv_resource.h"
39 #include "etnaviv_translate.h"
40
41 #include "util/hash_table.h"
42 #include "util/os_time.h"
43 #include "util/u_math.h"
44 #include "util/u_memory.h"
45 #include "util/u_screen.h"
46 #include "util/u_string.h"
47
48 #include "state_tracker/drm_driver.h"
49
50 #include "drm-uapi/drm_fourcc.h"
51
52 #define ETNA_DRM_VERSION(major, minor) ((major) << 16 | (minor))
53 #define ETNA_DRM_VERSION_FENCE_FD ETNA_DRM_VERSION(1, 1)
54 #define ETNA_DRM_VERSION_PERFMON ETNA_DRM_VERSION(1, 2)
55
56 static const struct debug_named_value debug_options[] = {
57 {"dbg_msgs", ETNA_DBG_MSGS, "Print debug messages"},
58 {"frame_msgs", ETNA_DBG_FRAME_MSGS, "Print frame messages"},
59 {"resource_msgs", ETNA_DBG_RESOURCE_MSGS, "Print resource messages"},
60 {"compiler_msgs", ETNA_DBG_COMPILER_MSGS, "Print compiler messages"},
61 {"linker_msgs", ETNA_DBG_LINKER_MSGS, "Print linker messages"},
62 {"dump_shaders", ETNA_DBG_DUMP_SHADERS, "Dump shaders"},
63 {"no_ts", ETNA_DBG_NO_TS, "Disable TS"},
64 {"no_autodisable", ETNA_DBG_NO_AUTODISABLE, "Disable autodisable"},
65 {"no_supertile", ETNA_DBG_NO_SUPERTILE, "Disable supertiles"},
66 {"no_early_z", ETNA_DBG_NO_EARLY_Z, "Disable early z"},
67 {"cflush_all", ETNA_DBG_CFLUSH_ALL, "Flush every cache before state update"},
68 {"msaa2x", ETNA_DBG_MSAA_2X, "Force 2x msaa"},
69 {"msaa4x", ETNA_DBG_MSAA_4X, "Force 4x msaa"},
70 {"flush_all", ETNA_DBG_FLUSH_ALL, "Flush after every rendered primitive"},
71 {"zero", ETNA_DBG_ZERO, "Zero all resources after allocation"},
72 {"draw_stall", ETNA_DBG_DRAW_STALL, "Stall FE/PE after each rendered primitive"},
73 {"shaderdb", ETNA_DBG_SHADERDB, "Enable shaderdb output"},
74 {"no_singlebuffer",ETNA_DBG_NO_SINGLEBUF, "Disable single buffer feature"},
75 {"nir", ETNA_DBG_NIR, "use new NIR compiler"},
76 DEBUG_NAMED_VALUE_END
77 };
78
79 DEBUG_GET_ONCE_FLAGS_OPTION(etna_mesa_debug, "ETNA_MESA_DEBUG", debug_options, 0)
80 int etna_mesa_debug = 0;
81
82 static void
83 etna_screen_destroy(struct pipe_screen *pscreen)
84 {
85 struct etna_screen *screen = etna_screen(pscreen);
86
87 if (screen->perfmon)
88 etna_perfmon_del(screen->perfmon);
89
90 if (screen->pipe)
91 etna_pipe_del(screen->pipe);
92
93 if (screen->gpu)
94 etna_gpu_del(screen->gpu);
95
96 if (screen->ro)
97 FREE(screen->ro);
98
99 if (screen->dev)
100 etna_device_del(screen->dev);
101
102 FREE(screen);
103 }
104
105 static const char *
106 etna_screen_get_name(struct pipe_screen *pscreen)
107 {
108 struct etna_screen *priv = etna_screen(pscreen);
109 static char buffer[128];
110
111 snprintf(buffer, sizeof(buffer), "Vivante GC%x rev %04x", priv->model,
112 priv->revision);
113
114 return buffer;
115 }
116
117 static const char *
118 etna_screen_get_vendor(struct pipe_screen *pscreen)
119 {
120 return "etnaviv";
121 }
122
123 static const char *
124 etna_screen_get_device_vendor(struct pipe_screen *pscreen)
125 {
126 return "Vivante";
127 }
128
129 static int
130 etna_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
131 {
132 struct etna_screen *screen = etna_screen(pscreen);
133
134 switch (param) {
135 /* Supported features (boolean caps). */
136 case PIPE_CAP_ANISOTROPIC_FILTER:
137 case PIPE_CAP_POINT_SPRITE:
138 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
139 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
140 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
141 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
142 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
143 case PIPE_CAP_VERTEX_SHADER_SATURATE:
144 case PIPE_CAP_TEXTURE_BARRIER:
145 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
146 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
147 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
148 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
149 case PIPE_CAP_TGSI_TEXCOORD:
150 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
151 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
152 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
153 return 1;
154 case PIPE_CAP_NATIVE_FENCE_FD:
155 return screen->drm_version >= ETNA_DRM_VERSION_FENCE_FD;
156 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
157 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL: /* note: not integer */
158 return DBG_ENABLED(ETNA_DBG_NIR);
159 case PIPE_CAP_TGSI_FS_POINT_IS_SYSVAL:
160 return 0;
161
162 /* Memory */
163 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
164 return 256;
165 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
166 return 4; /* XXX could easily be supported */
167
168 case PIPE_CAP_NPOT_TEXTURES:
169 return true; /* VIV_FEATURE(priv->dev, chipMinorFeatures1,
170 NON_POWER_OF_TWO); */
171
172 case PIPE_CAP_TEXTURE_SWIZZLE:
173 case PIPE_CAP_PRIMITIVE_RESTART:
174 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
175
176 /* Unsupported features. */
177 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
178 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
179 case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:
180 return 0;
181
182 /* Stream output. */
183 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
184 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
185 return 0;
186
187 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
188 return 128;
189 case PIPE_CAP_MAX_VERTEX_ELEMENT_SRC_OFFSET:
190 return 255;
191 case PIPE_CAP_MAX_VERTEX_BUFFERS:
192 return screen->specs.stream_count;
193
194 /* Texturing. */
195 case PIPE_CAP_TEXTURE_SHADOW_MAP:
196 return DBG_ENABLED(ETNA_DBG_NIR) && screen->specs.halti >= 2;
197 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
198 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS: /* TODO: verify */
199 return screen->specs.max_texture_size;
200 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
201 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
202 {
203 int log2_max_tex_size = util_last_bit(screen->specs.max_texture_size);
204 assert(log2_max_tex_size > 0);
205 return log2_max_tex_size;
206 }
207
208 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
209 case PIPE_CAP_MIN_TEXEL_OFFSET:
210 return -8;
211 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
212 case PIPE_CAP_MAX_TEXEL_OFFSET:
213 return 7;
214 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
215 return VIV_FEATURE(screen, chipMinorFeatures2, SEAMLESS_CUBE_MAP);
216
217 /* Timer queries. */
218 case PIPE_CAP_OCCLUSION_QUERY:
219 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
220 case PIPE_CAP_QUERY_TIMESTAMP:
221 return 1;
222
223 /* Preferences */
224 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
225 return 0;
226
227 case PIPE_CAP_MAX_VARYINGS:
228 return screen->specs.max_varyings;
229
230 case PIPE_CAP_PCI_GROUP:
231 case PIPE_CAP_PCI_BUS:
232 case PIPE_CAP_PCI_DEVICE:
233 case PIPE_CAP_PCI_FUNCTION:
234 return 0;
235 case PIPE_CAP_ACCELERATED:
236 return 1;
237 case PIPE_CAP_VIDEO_MEMORY:
238 return 0;
239 case PIPE_CAP_UMA:
240 return 1;
241 default:
242 return u_pipe_screen_get_param_defaults(pscreen, param);
243 }
244 }
245
246 static float
247 etna_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
248 {
249 struct etna_screen *screen = etna_screen(pscreen);
250
251 switch (param) {
252 case PIPE_CAPF_MAX_LINE_WIDTH:
253 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
254 case PIPE_CAPF_MAX_POINT_WIDTH:
255 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
256 return 8192.0f;
257 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
258 return 16.0f;
259 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
260 return util_last_bit(screen->specs.max_texture_size);
261 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
262 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
263 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
264 return 0.0f;
265 }
266
267 debug_printf("unknown paramf %d", param);
268 return 0;
269 }
270
271 static int
272 etna_screen_get_shader_param(struct pipe_screen *pscreen,
273 enum pipe_shader_type shader,
274 enum pipe_shader_cap param)
275 {
276 struct etna_screen *screen = etna_screen(pscreen);
277
278 switch (shader) {
279 case PIPE_SHADER_FRAGMENT:
280 case PIPE_SHADER_VERTEX:
281 break;
282 case PIPE_SHADER_COMPUTE:
283 case PIPE_SHADER_GEOMETRY:
284 case PIPE_SHADER_TESS_CTRL:
285 case PIPE_SHADER_TESS_EVAL:
286 return 0;
287 default:
288 DBG("unknown shader type %d", shader);
289 return 0;
290 }
291
292 switch (param) {
293 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
294 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
295 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
296 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
297 return ETNA_MAX_TOKENS;
298 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
299 return ETNA_MAX_DEPTH; /* XXX */
300 case PIPE_SHADER_CAP_MAX_INPUTS:
301 /* Maximum number of inputs for the vertex shader is the number
302 * of vertex elements - each element defines one vertex shader
303 * input register. For the fragment shader, this is the number
304 * of varyings. */
305 return shader == PIPE_SHADER_FRAGMENT ? screen->specs.max_varyings
306 : screen->specs.vertex_max_elements;
307 case PIPE_SHADER_CAP_MAX_OUTPUTS:
308 return 16; /* see VIVS_VS_OUTPUT */
309 case PIPE_SHADER_CAP_MAX_TEMPS:
310 return 64; /* Max native temporaries. */
311 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
312 return 1;
313 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
314 return 1;
315 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
316 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
317 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
318 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
319 return 1;
320 case PIPE_SHADER_CAP_SUBROUTINES:
321 return 0;
322 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
323 return VIV_FEATURE(screen, chipMinorFeatures0, HAS_SQRT_TRIG);
324 case PIPE_SHADER_CAP_INT64_ATOMICS:
325 case PIPE_SHADER_CAP_FP16:
326 return 0;
327 case PIPE_SHADER_CAP_INTEGERS:
328 return DBG_ENABLED(ETNA_DBG_NIR) && screen->specs.halti >= 2;
329 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
330 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
331 return shader == PIPE_SHADER_FRAGMENT
332 ? screen->specs.fragment_sampler_count
333 : screen->specs.vertex_sampler_count;
334 case PIPE_SHADER_CAP_PREFERRED_IR:
335 return DBG_ENABLED(ETNA_DBG_NIR) ? PIPE_SHADER_IR_NIR : PIPE_SHADER_IR_TGSI;
336 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
337 return shader == PIPE_SHADER_FRAGMENT
338 ? screen->specs.max_ps_uniforms * sizeof(float[4])
339 : screen->specs.max_vs_uniforms * sizeof(float[4]);
340 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
341 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
342 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
343 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
344 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
345 return false;
346 case PIPE_SHADER_CAP_SUPPORTED_IRS:
347 return 0;
348 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
349 return 32;
350 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
351 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
352 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
353 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
354 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
355 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
356 return 0;
357 }
358
359 debug_printf("unknown shader param %d", param);
360 return 0;
361 }
362
363 static uint64_t
364 etna_screen_get_timestamp(struct pipe_screen *pscreen)
365 {
366 return os_time_get_nano();
367 }
368
369 static bool
370 gpu_supports_texture_target(struct etna_screen *screen,
371 enum pipe_texture_target target)
372 {
373 if (target == PIPE_TEXTURE_CUBE_ARRAY)
374 return false;
375
376 /* pre-halti has no array/3D */
377 if (screen->specs.halti < 0 &&
378 (target == PIPE_TEXTURE_1D_ARRAY ||
379 target == PIPE_TEXTURE_2D_ARRAY ||
380 target == PIPE_TEXTURE_3D))
381 return false;
382
383 return true;
384 }
385
386 static bool
387 gpu_supports_texture_format(struct etna_screen *screen, uint32_t fmt,
388 enum pipe_format format)
389 {
390 bool supported = true;
391
392 if (fmt == TEXTURE_FORMAT_ETC1)
393 supported = VIV_FEATURE(screen, chipFeatures, ETC1_TEXTURE_COMPRESSION);
394
395 if (fmt >= TEXTURE_FORMAT_DXT1 && fmt <= TEXTURE_FORMAT_DXT4_DXT5)
396 supported = VIV_FEATURE(screen, chipFeatures, DXT_TEXTURE_COMPRESSION);
397
398 if (util_format_is_srgb(format))
399 supported = VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
400
401 if (fmt & EXT_FORMAT)
402 supported = VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
403
404 if (fmt & ASTC_FORMAT) {
405 supported = screen->specs.tex_astc;
406 }
407
408 if (util_format_is_snorm(format))
409 supported = VIV_FEATURE(screen, chipMinorFeatures2, HALTI1);
410
411 if (format != PIPE_FORMAT_S8_UINT_Z24_UNORM &&
412 (util_format_is_pure_integer(format) || util_format_is_float(format)))
413 supported = VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
414
415
416 if (!supported)
417 return false;
418
419 if (texture_format_needs_swiz(format))
420 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
421
422 return true;
423 }
424
425 static bool
426 gpu_supports_render_format(struct etna_screen *screen, enum pipe_format format,
427 unsigned sample_count)
428 {
429 const uint32_t fmt = translate_pe_format(format);
430
431 if (fmt == ETNA_NO_MATCH)
432 return false;
433
434 /* Validate MSAA; number of samples must be allowed, and render target
435 * must have MSAA'able format. */
436 if (sample_count > 1) {
437 if (!VIV_FEATURE(screen, chipFeatures, MSAA))
438 return false;
439 if (!translate_samples_to_xyscale(sample_count, NULL, NULL))
440 return false;
441 if (translate_ts_format(format) == ETNA_NO_MATCH)
442 return false;
443 }
444
445 if (format == PIPE_FORMAT_R8_UNORM)
446 return VIV_FEATURE(screen, chipMinorFeatures5, HALTI5);
447
448 /* figure out 8bpp RS clear to enable these formats */
449 if (format == PIPE_FORMAT_R8_SINT || format == PIPE_FORMAT_R8_UINT)
450 return VIV_FEATURE(screen, chipMinorFeatures5, HALTI5);
451
452 if (util_format_is_srgb(format))
453 return VIV_FEATURE(screen, chipMinorFeatures5, HALTI3);
454
455 if (util_format_is_pure_integer(format) || util_format_is_float(format))
456 return VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
457
458 if (format == PIPE_FORMAT_R8G8_UNORM)
459 return VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
460
461 /* any other extended format is HALTI0 (only R10G10B10A2?) */
462 if (fmt >= PE_FORMAT_R16F)
463 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
464
465 return true;
466 }
467
468 static bool
469 gpu_supports_vertex_format(struct etna_screen *screen, enum pipe_format format)
470 {
471 if (translate_vertex_format_type(format) == ETNA_NO_MATCH)
472 return false;
473
474 if (util_format_is_pure_integer(format))
475 return VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
476
477 return true;
478 }
479
480 static bool
481 etna_screen_is_format_supported(struct pipe_screen *pscreen,
482 enum pipe_format format,
483 enum pipe_texture_target target,
484 unsigned sample_count,
485 unsigned storage_sample_count,
486 unsigned usage)
487 {
488 struct etna_screen *screen = etna_screen(pscreen);
489 unsigned allowed = 0;
490
491 if (!gpu_supports_texture_target(screen, target))
492 return false;
493
494 if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
495 return false;
496
497 if (usage & PIPE_BIND_RENDER_TARGET) {
498 if (gpu_supports_render_format(screen, format, sample_count))
499 allowed |= PIPE_BIND_RENDER_TARGET;
500 }
501
502 if (usage & PIPE_BIND_DEPTH_STENCIL) {
503 if (translate_depth_format(format) != ETNA_NO_MATCH)
504 allowed |= PIPE_BIND_DEPTH_STENCIL;
505 }
506
507 if (usage & PIPE_BIND_SAMPLER_VIEW) {
508 uint32_t fmt = translate_texture_format(format);
509
510 if (!gpu_supports_texture_format(screen, fmt, format))
511 fmt = ETNA_NO_MATCH;
512
513 if (sample_count < 2 && fmt != ETNA_NO_MATCH)
514 allowed |= PIPE_BIND_SAMPLER_VIEW;
515 }
516
517 if (usage & PIPE_BIND_VERTEX_BUFFER) {
518 if (gpu_supports_vertex_format(screen, format))
519 allowed |= PIPE_BIND_VERTEX_BUFFER;
520 }
521
522 if (usage & PIPE_BIND_INDEX_BUFFER) {
523 /* must be supported index format */
524 if (format == PIPE_FORMAT_I8_UINT || format == PIPE_FORMAT_I16_UINT ||
525 (format == PIPE_FORMAT_I32_UINT &&
526 VIV_FEATURE(screen, chipFeatures, 32_BIT_INDICES))) {
527 allowed |= PIPE_BIND_INDEX_BUFFER;
528 }
529 }
530
531 /* Always allowed */
532 allowed |=
533 usage & (PIPE_BIND_DISPLAY_TARGET | PIPE_BIND_SCANOUT | PIPE_BIND_SHARED);
534
535 if (usage != allowed) {
536 DBG("not supported: format=%s, target=%d, sample_count=%d, "
537 "usage=%x, allowed=%x",
538 util_format_name(format), target, sample_count, usage, allowed);
539 }
540
541 return usage == allowed;
542 }
543
544 const uint64_t supported_modifiers[] = {
545 DRM_FORMAT_MOD_LINEAR,
546 DRM_FORMAT_MOD_VIVANTE_TILED,
547 DRM_FORMAT_MOD_VIVANTE_SUPER_TILED,
548 DRM_FORMAT_MOD_VIVANTE_SPLIT_TILED,
549 DRM_FORMAT_MOD_VIVANTE_SPLIT_SUPER_TILED,
550 };
551
552 static void
553 etna_screen_query_dmabuf_modifiers(struct pipe_screen *pscreen,
554 enum pipe_format format, int max,
555 uint64_t *modifiers,
556 unsigned int *external_only, int *count)
557 {
558 struct etna_screen *screen = etna_screen(pscreen);
559 int i, num_modifiers = 0;
560
561 if (max > ARRAY_SIZE(supported_modifiers))
562 max = ARRAY_SIZE(supported_modifiers);
563
564 if (!max) {
565 modifiers = NULL;
566 max = ARRAY_SIZE(supported_modifiers);
567 }
568
569 for (i = 0; num_modifiers < max; i++) {
570 /* don't advertise split tiled formats on single pipe/buffer GPUs */
571 if ((screen->specs.pixel_pipes == 1 || screen->specs.single_buffer) &&
572 i >= 3)
573 break;
574
575 if (modifiers)
576 modifiers[num_modifiers] = supported_modifiers[i];
577 if (external_only)
578 external_only[num_modifiers] = util_format_is_yuv(format) ? 1 : 0;
579 num_modifiers++;
580 }
581
582 *count = num_modifiers;
583 }
584
585 static void
586 etna_determine_uniform_limits(struct etna_screen *screen)
587 {
588 /* values for the non unified case are taken from
589 * gcmCONFIGUREUNIFORMS in the Vivante kernel driver file
590 * drivers/mxc/gpu-viv/hal/kernel/inc/gc_hal_base.h.
591 */
592 if (screen->model == chipModel_GC2000 &&
593 (screen->revision == 0x5118 || screen->revision == 0x5140)) {
594 screen->specs.max_vs_uniforms = 256;
595 screen->specs.max_ps_uniforms = 64;
596 } else if (screen->specs.num_constants == 320) {
597 screen->specs.max_vs_uniforms = 256;
598 screen->specs.max_ps_uniforms = 64;
599 } else if (screen->specs.num_constants > 256 &&
600 screen->model == chipModel_GC1000) {
601 /* All GC1000 series chips can only support 64 uniforms for ps on non-unified const mode. */
602 screen->specs.max_vs_uniforms = 256;
603 screen->specs.max_ps_uniforms = 64;
604 } else if (screen->specs.num_constants > 256) {
605 screen->specs.max_vs_uniforms = 256;
606 screen->specs.max_ps_uniforms = 256;
607 } else if (screen->specs.num_constants == 256) {
608 screen->specs.max_vs_uniforms = 256;
609 screen->specs.max_ps_uniforms = 256;
610 } else {
611 screen->specs.max_vs_uniforms = 168;
612 screen->specs.max_ps_uniforms = 64;
613 }
614 }
615
616 static bool
617 etna_get_specs(struct etna_screen *screen)
618 {
619 uint64_t val;
620 uint32_t instruction_count;
621
622 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_INSTRUCTION_COUNT, &val)) {
623 DBG("could not get ETNA_GPU_INSTRUCTION_COUNT");
624 goto fail;
625 }
626 instruction_count = val;
627
628 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_VERTEX_OUTPUT_BUFFER_SIZE,
629 &val)) {
630 DBG("could not get ETNA_GPU_VERTEX_OUTPUT_BUFFER_SIZE");
631 goto fail;
632 }
633 screen->specs.vertex_output_buffer_size = val;
634
635 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_VERTEX_CACHE_SIZE, &val)) {
636 DBG("could not get ETNA_GPU_VERTEX_CACHE_SIZE");
637 goto fail;
638 }
639 screen->specs.vertex_cache_size = val;
640
641 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_SHADER_CORE_COUNT, &val)) {
642 DBG("could not get ETNA_GPU_SHADER_CORE_COUNT");
643 goto fail;
644 }
645 screen->specs.shader_core_count = val;
646
647 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_STREAM_COUNT, &val)) {
648 DBG("could not get ETNA_GPU_STREAM_COUNT");
649 goto fail;
650 }
651 screen->specs.stream_count = val;
652
653 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_REGISTER_MAX, &val)) {
654 DBG("could not get ETNA_GPU_REGISTER_MAX");
655 goto fail;
656 }
657 screen->specs.max_registers = val;
658
659 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_PIXEL_PIPES, &val)) {
660 DBG("could not get ETNA_GPU_PIXEL_PIPES");
661 goto fail;
662 }
663 screen->specs.pixel_pipes = val;
664
665 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_NUM_CONSTANTS, &val)) {
666 DBG("could not get %s", "ETNA_GPU_NUM_CONSTANTS");
667 goto fail;
668 }
669 if (val == 0) {
670 fprintf(stderr, "Warning: zero num constants (update kernel?)\n");
671 val = 168;
672 }
673 screen->specs.num_constants = val;
674
675 /* Figure out gross GPU architecture. See rnndb/common.xml for a specific
676 * description of the differences. */
677 if (VIV_FEATURE(screen, chipMinorFeatures5, HALTI5))
678 screen->specs.halti = 5; /* New GC7000/GC8x00 */
679 else if (VIV_FEATURE(screen, chipMinorFeatures5, HALTI4))
680 screen->specs.halti = 4; /* Old GC7000/GC7400 */
681 else if (VIV_FEATURE(screen, chipMinorFeatures5, HALTI3))
682 screen->specs.halti = 3; /* None? */
683 else if (VIV_FEATURE(screen, chipMinorFeatures4, HALTI2))
684 screen->specs.halti = 2; /* GC2500/GC3000/GC5000/GC6400 */
685 else if (VIV_FEATURE(screen, chipMinorFeatures2, HALTI1))
686 screen->specs.halti = 1; /* GC900/GC4000/GC7000UL */
687 else if (VIV_FEATURE(screen, chipMinorFeatures1, HALTI0))
688 screen->specs.halti = 0; /* GC880/GC2000/GC7000TM */
689 else
690 screen->specs.halti = -1; /* GC7000nanolite / pre-GC2000 except GC880 */
691 if (screen->specs.halti >= 0)
692 DBG("etnaviv: GPU arch: HALTI%d", screen->specs.halti);
693 else
694 DBG("etnaviv: GPU arch: pre-HALTI");
695
696 screen->specs.can_supertile =
697 VIV_FEATURE(screen, chipMinorFeatures0, SUPER_TILED);
698 screen->specs.bits_per_tile =
699 VIV_FEATURE(screen, chipMinorFeatures0, 2BITPERTILE) ? 2 : 4;
700 screen->specs.ts_clear_value =
701 VIV_FEATURE(screen, chipMinorFeatures5, BLT_ENGINE) ? 0xffffffff :
702 VIV_FEATURE(screen, chipMinorFeatures0, 2BITPERTILE) ? 0x55555555 :
703 0x11111111;
704
705
706 /* vertex and fragment samplers live in one address space */
707 screen->specs.vertex_sampler_offset = 8;
708 screen->specs.fragment_sampler_count = 8;
709 screen->specs.vertex_sampler_count = 4;
710 screen->specs.vs_need_z_div =
711 screen->model < 0x1000 && screen->model != 0x880;
712 screen->specs.has_sin_cos_sqrt =
713 VIV_FEATURE(screen, chipMinorFeatures0, HAS_SQRT_TRIG);
714 screen->specs.has_sign_floor_ceil =
715 VIV_FEATURE(screen, chipMinorFeatures0, HAS_SIGN_FLOOR_CEIL);
716 screen->specs.has_shader_range_registers =
717 screen->model >= 0x1000 || screen->model == 0x880;
718 screen->specs.npot_tex_any_wrap =
719 VIV_FEATURE(screen, chipMinorFeatures1, NON_POWER_OF_TWO);
720 screen->specs.has_new_transcendentals =
721 VIV_FEATURE(screen, chipMinorFeatures3, HAS_FAST_TRANSCENDENTALS);
722 screen->specs.has_halti2_instructions =
723 VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
724 screen->specs.v4_compression =
725 VIV_FEATURE(screen, chipMinorFeatures6, V4_COMPRESSION);
726
727 if (screen->specs.halti >= 5) {
728 /* GC7000 - this core must load shaders from memory. */
729 screen->specs.vs_offset = 0;
730 screen->specs.ps_offset = 0;
731 screen->specs.max_instructions = 0; /* Do not program shaders manually */
732 screen->specs.has_icache = true;
733 } else if (VIV_FEATURE(screen, chipMinorFeatures3, INSTRUCTION_CACHE)) {
734 /* GC3000 - this core is capable of loading shaders from
735 * memory. It can also run shaders from registers, as a fallback, but
736 * "max_instructions" does not have the correct value. It has place for
737 * 2*256 instructions just like GC2000, but the offsets are slightly
738 * different.
739 */
740 screen->specs.vs_offset = 0xC000;
741 /* State 08000-0C000 mirrors 0C000-0E000, and the Vivante driver uses
742 * this mirror for writing PS instructions, probably safest to do the
743 * same.
744 */
745 screen->specs.ps_offset = 0x8000 + 0x1000;
746 screen->specs.max_instructions = 256; /* maximum number instructions for non-icache use */
747 screen->specs.has_icache = true;
748 } else {
749 if (instruction_count > 256) { /* unified instruction memory? */
750 screen->specs.vs_offset = 0xC000;
751 screen->specs.ps_offset = 0xD000; /* like vivante driver */
752 screen->specs.max_instructions = 256;
753 } else {
754 screen->specs.vs_offset = 0x4000;
755 screen->specs.ps_offset = 0x6000;
756 screen->specs.max_instructions = instruction_count / 2;
757 }
758 screen->specs.has_icache = false;
759 }
760
761 if (VIV_FEATURE(screen, chipMinorFeatures1, HALTI0)) {
762 screen->specs.max_varyings = 12;
763 screen->specs.vertex_max_elements = 16;
764 } else {
765 screen->specs.max_varyings = 8;
766 /* Etna_viv documentation seems confused over the correct value
767 * here so choose the lower to be safe: HALTI0 says 16 i.s.o.
768 * 10, but VERTEX_ELEMENT_CONFIG register says 16 i.s.o. 12. */
769 screen->specs.vertex_max_elements = 10;
770 }
771
772 /* Etna_viv documentation does not indicate where varyings above 8 are
773 * stored. Moreover, if we are passed more than 8 varyings, we will
774 * walk off the end of some arrays. Limit the maximum number of varyings. */
775 if (screen->specs.max_varyings > ETNA_NUM_VARYINGS)
776 screen->specs.max_varyings = ETNA_NUM_VARYINGS;
777
778 etna_determine_uniform_limits(screen);
779
780 if (screen->specs.halti >= 5) {
781 screen->specs.has_unified_uniforms = true;
782 screen->specs.vs_uniforms_offset = VIVS_SH_HALTI5_UNIFORMS_MIRROR(0);
783 screen->specs.ps_uniforms_offset = VIVS_SH_HALTI5_UNIFORMS(screen->specs.max_vs_uniforms*4);
784 } else if (screen->specs.halti >= 1) {
785 /* unified uniform memory on GC3000 - HALTI1 feature bit is just a guess
786 */
787 screen->specs.has_unified_uniforms = true;
788 screen->specs.vs_uniforms_offset = VIVS_SH_UNIFORMS(0);
789 /* hardcode PS uniforms to start after end of VS uniforms -
790 * for more flexibility this offset could be variable based on the
791 * shader.
792 */
793 screen->specs.ps_uniforms_offset = VIVS_SH_UNIFORMS(screen->specs.max_vs_uniforms*4);
794 } else {
795 screen->specs.has_unified_uniforms = false;
796 screen->specs.vs_uniforms_offset = VIVS_VS_UNIFORMS(0);
797 screen->specs.ps_uniforms_offset = VIVS_PS_UNIFORMS(0);
798 }
799
800 screen->specs.max_texture_size =
801 VIV_FEATURE(screen, chipMinorFeatures0, TEXTURE_8K) ? 8192 : 2048;
802 screen->specs.max_rendertarget_size =
803 VIV_FEATURE(screen, chipMinorFeatures0, RENDERTARGET_8K) ? 8192 : 2048;
804
805 screen->specs.single_buffer = VIV_FEATURE(screen, chipMinorFeatures4, SINGLE_BUFFER);
806 if (screen->specs.single_buffer)
807 DBG("etnaviv: Single buffer mode enabled with %d pixel pipes", screen->specs.pixel_pipes);
808
809 screen->specs.tex_astc = VIV_FEATURE(screen, chipMinorFeatures4, TEXTURE_ASTC) &&
810 !VIV_FEATURE(screen, chipMinorFeatures6, NO_ASTC);
811
812 screen->specs.use_blt = VIV_FEATURE(screen, chipMinorFeatures5, BLT_ENGINE);
813
814 return true;
815
816 fail:
817 return false;
818 }
819
820 struct etna_bo *
821 etna_screen_bo_from_handle(struct pipe_screen *pscreen,
822 struct winsys_handle *whandle, unsigned *out_stride)
823 {
824 struct etna_screen *screen = etna_screen(pscreen);
825 struct etna_bo *bo;
826
827 if (whandle->type == WINSYS_HANDLE_TYPE_SHARED) {
828 bo = etna_bo_from_name(screen->dev, whandle->handle);
829 } else if (whandle->type == WINSYS_HANDLE_TYPE_FD) {
830 bo = etna_bo_from_dmabuf(screen->dev, whandle->handle);
831 } else {
832 DBG("Attempt to import unsupported handle type %d", whandle->type);
833 return NULL;
834 }
835
836 if (!bo) {
837 DBG("ref name 0x%08x failed", whandle->handle);
838 return NULL;
839 }
840
841 *out_stride = whandle->stride;
842
843 return bo;
844 }
845
846 static const void *
847 etna_get_compiler_options(struct pipe_screen *pscreen,
848 enum pipe_shader_ir ir, unsigned shader)
849 {
850 return &etna_screen(pscreen)->options;
851 }
852
853 struct pipe_screen *
854 etna_screen_create(struct etna_device *dev, struct etna_gpu *gpu,
855 struct renderonly *ro)
856 {
857 struct etna_screen *screen = CALLOC_STRUCT(etna_screen);
858 struct pipe_screen *pscreen;
859 drmVersionPtr version;
860 uint64_t val;
861
862 if (!screen)
863 return NULL;
864
865 pscreen = &screen->base;
866 screen->dev = dev;
867 screen->gpu = gpu;
868 screen->ro = renderonly_dup(ro);
869 screen->refcnt = 1;
870
871 if (!screen->ro) {
872 DBG("could not create renderonly object");
873 goto fail;
874 }
875
876 version = drmGetVersion(screen->ro->gpu_fd);
877 screen->drm_version = ETNA_DRM_VERSION(version->version_major,
878 version->version_minor);
879 drmFreeVersion(version);
880
881 etna_mesa_debug = debug_get_option_etna_mesa_debug();
882
883 /* Disable autodisable for correct rendering with TS */
884 etna_mesa_debug |= ETNA_DBG_NO_AUTODISABLE;
885
886 screen->pipe = etna_pipe_new(gpu, ETNA_PIPE_3D);
887 if (!screen->pipe) {
888 DBG("could not create 3d pipe");
889 goto fail;
890 }
891
892 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_MODEL, &val)) {
893 DBG("could not get ETNA_GPU_MODEL");
894 goto fail;
895 }
896 screen->model = val;
897
898 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_REVISION, &val)) {
899 DBG("could not get ETNA_GPU_REVISION");
900 goto fail;
901 }
902 screen->revision = val;
903
904 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_0, &val)) {
905 DBG("could not get ETNA_GPU_FEATURES_0");
906 goto fail;
907 }
908 screen->features[0] = val;
909
910 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_1, &val)) {
911 DBG("could not get ETNA_GPU_FEATURES_1");
912 goto fail;
913 }
914 screen->features[1] = val;
915
916 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_2, &val)) {
917 DBG("could not get ETNA_GPU_FEATURES_2");
918 goto fail;
919 }
920 screen->features[2] = val;
921
922 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_3, &val)) {
923 DBG("could not get ETNA_GPU_FEATURES_3");
924 goto fail;
925 }
926 screen->features[3] = val;
927
928 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_4, &val)) {
929 DBG("could not get ETNA_GPU_FEATURES_4");
930 goto fail;
931 }
932 screen->features[4] = val;
933
934 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_5, &val)) {
935 DBG("could not get ETNA_GPU_FEATURES_5");
936 goto fail;
937 }
938 screen->features[5] = val;
939
940 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_6, &val)) {
941 DBG("could not get ETNA_GPU_FEATURES_6");
942 goto fail;
943 }
944 screen->features[6] = val;
945
946 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_7, &val)) {
947 DBG("could not get ETNA_GPU_FEATURES_7");
948 goto fail;
949 }
950 screen->features[7] = val;
951
952 if (!etna_get_specs(screen))
953 goto fail;
954
955 if (screen->specs.halti >= 5 && !etnaviv_device_softpin_capable(dev)) {
956 DBG("halti5 requires softpin");
957 goto fail;
958 }
959
960 screen->options = (nir_shader_compiler_options) {
961 .lower_fpow = true,
962 .lower_sub = true,
963 .lower_ftrunc = true,
964 .fuse_ffma = true,
965 .lower_bitops = true,
966 .lower_all_io_to_temps = true,
967 .vertex_id_zero_based = true,
968 .lower_flrp32 = true,
969 .lower_fmod = true,
970 .lower_vector_cmp = true,
971 .lower_fdph = true,
972 .lower_fdiv = true, /* !screen->specs.has_new_transcendentals */
973 .lower_fsign = !screen->specs.has_sign_floor_ceil,
974 .lower_ffloor = !screen->specs.has_sign_floor_ceil,
975 .lower_fceil = !screen->specs.has_sign_floor_ceil,
976 .lower_fsqrt = !screen->specs.has_sin_cos_sqrt,
977 .lower_sincos = !screen->specs.has_sin_cos_sqrt,
978 };
979
980 /* apply debug options that disable individual features */
981 if (DBG_ENABLED(ETNA_DBG_NO_EARLY_Z))
982 screen->features[viv_chipFeatures] |= chipFeatures_NO_EARLY_Z;
983 if (DBG_ENABLED(ETNA_DBG_NO_TS))
984 screen->features[viv_chipFeatures] &= ~chipFeatures_FAST_CLEAR;
985 if (DBG_ENABLED(ETNA_DBG_NO_AUTODISABLE))
986 screen->features[viv_chipMinorFeatures1] &= ~chipMinorFeatures1_AUTO_DISABLE;
987 if (DBG_ENABLED(ETNA_DBG_NO_SUPERTILE))
988 screen->specs.can_supertile = 0;
989 if (DBG_ENABLED(ETNA_DBG_NO_SINGLEBUF))
990 screen->specs.single_buffer = 0;
991
992 pscreen->destroy = etna_screen_destroy;
993 pscreen->get_param = etna_screen_get_param;
994 pscreen->get_paramf = etna_screen_get_paramf;
995 pscreen->get_shader_param = etna_screen_get_shader_param;
996 pscreen->get_compiler_options = etna_get_compiler_options;
997
998 pscreen->get_name = etna_screen_get_name;
999 pscreen->get_vendor = etna_screen_get_vendor;
1000 pscreen->get_device_vendor = etna_screen_get_device_vendor;
1001
1002 pscreen->get_timestamp = etna_screen_get_timestamp;
1003 pscreen->context_create = etna_context_create;
1004 pscreen->is_format_supported = etna_screen_is_format_supported;
1005 pscreen->query_dmabuf_modifiers = etna_screen_query_dmabuf_modifiers;
1006
1007 etna_fence_screen_init(pscreen);
1008 etna_query_screen_init(pscreen);
1009 etna_resource_screen_init(pscreen);
1010
1011 util_dynarray_init(&screen->supported_pm_queries, NULL);
1012 slab_create_parent(&screen->transfer_pool, sizeof(struct etna_transfer), 16);
1013
1014 if (screen->drm_version >= ETNA_DRM_VERSION_PERFMON)
1015 etna_pm_query_setup(screen);
1016
1017 return pscreen;
1018
1019 fail:
1020 etna_screen_destroy(pscreen);
1021 return NULL;
1022 }