4dccdb4ccabe34c1d143476a0b864b8adec1aeb2
[mesa.git] / src / gallium / drivers / etnaviv / etnaviv_screen.c
1 /*
2 * Copyright (c) 2012-2015 Etnaviv Project
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
13 * of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 *
23 * Authors:
24 * Wladimir J. van der Laan <laanwj@gmail.com>
25 * Christian Gmeiner <christian.gmeiner@gmail.com>
26 */
27
28 #include "etnaviv_screen.h"
29
30 #include "hw/common.xml.h"
31
32 #include "etnaviv_compiler.h"
33 #include "etnaviv_context.h"
34 #include "etnaviv_debug.h"
35 #include "etnaviv_fence.h"
36 #include "etnaviv_format.h"
37 #include "etnaviv_query.h"
38 #include "etnaviv_resource.h"
39 #include "etnaviv_translate.h"
40
41 #include "util/hash_table.h"
42 #include "util/os_time.h"
43 #include "util/u_math.h"
44 #include "util/u_memory.h"
45 #include "util/u_screen.h"
46 #include "util/u_string.h"
47
48 #include "frontend/drm_driver.h"
49
50 #include "drm-uapi/drm_fourcc.h"
51
52 #define ETNA_DRM_VERSION(major, minor) ((major) << 16 | (minor))
53 #define ETNA_DRM_VERSION_FENCE_FD ETNA_DRM_VERSION(1, 1)
54 #define ETNA_DRM_VERSION_PERFMON ETNA_DRM_VERSION(1, 2)
55
56 static const struct debug_named_value debug_options[] = {
57 {"dbg_msgs", ETNA_DBG_MSGS, "Print debug messages"},
58 {"frame_msgs", ETNA_DBG_FRAME_MSGS, "Print frame messages"},
59 {"resource_msgs", ETNA_DBG_RESOURCE_MSGS, "Print resource messages"},
60 {"compiler_msgs", ETNA_DBG_COMPILER_MSGS, "Print compiler messages"},
61 {"linker_msgs", ETNA_DBG_LINKER_MSGS, "Print linker messages"},
62 {"dump_shaders", ETNA_DBG_DUMP_SHADERS, "Dump shaders"},
63 {"no_ts", ETNA_DBG_NO_TS, "Disable TS"},
64 {"no_autodisable", ETNA_DBG_NO_AUTODISABLE, "Disable autodisable"},
65 {"no_supertile", ETNA_DBG_NO_SUPERTILE, "Disable supertiles"},
66 {"no_early_z", ETNA_DBG_NO_EARLY_Z, "Disable early z"},
67 {"cflush_all", ETNA_DBG_CFLUSH_ALL, "Flush every cache before state update"},
68 {"msaa2x", ETNA_DBG_MSAA_2X, "Force 2x msaa"},
69 {"msaa4x", ETNA_DBG_MSAA_4X, "Force 4x msaa"},
70 {"flush_all", ETNA_DBG_FLUSH_ALL, "Flush after every rendered primitive"},
71 {"zero", ETNA_DBG_ZERO, "Zero all resources after allocation"},
72 {"draw_stall", ETNA_DBG_DRAW_STALL, "Stall FE/PE after each rendered primitive"},
73 {"shaderdb", ETNA_DBG_SHADERDB, "Enable shaderdb output"},
74 {"no_singlebuffer",ETNA_DBG_NO_SINGLEBUF, "Disable single buffer feature"},
75 {"nir", ETNA_DBG_NIR, "use new NIR compiler"},
76 {"deqp", ETNA_DBG_DEQP, "Hacks to run dEQP GLES3 tests"}, /* needs MESA_GLES_VERSION_OVERRIDE=3.0 */
77 DEBUG_NAMED_VALUE_END
78 };
79
80 DEBUG_GET_ONCE_FLAGS_OPTION(etna_mesa_debug, "ETNA_MESA_DEBUG", debug_options, 0)
81 int etna_mesa_debug = 0;
82
83 static void
84 etna_screen_destroy(struct pipe_screen *pscreen)
85 {
86 struct etna_screen *screen = etna_screen(pscreen);
87
88 if (screen->perfmon)
89 etna_perfmon_del(screen->perfmon);
90
91 if (screen->pipe)
92 etna_pipe_del(screen->pipe);
93
94 if (screen->gpu)
95 etna_gpu_del(screen->gpu);
96
97 if (screen->ro)
98 FREE(screen->ro);
99
100 if (screen->dev)
101 etna_device_del(screen->dev);
102
103 FREE(screen);
104 }
105
106 static const char *
107 etna_screen_get_name(struct pipe_screen *pscreen)
108 {
109 struct etna_screen *priv = etna_screen(pscreen);
110 static char buffer[128];
111
112 snprintf(buffer, sizeof(buffer), "Vivante GC%x rev %04x", priv->model,
113 priv->revision);
114
115 return buffer;
116 }
117
118 static const char *
119 etna_screen_get_vendor(struct pipe_screen *pscreen)
120 {
121 return "etnaviv";
122 }
123
124 static const char *
125 etna_screen_get_device_vendor(struct pipe_screen *pscreen)
126 {
127 return "Vivante";
128 }
129
130 static int
131 etna_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
132 {
133 struct etna_screen *screen = etna_screen(pscreen);
134
135 switch (param) {
136 /* Supported features (boolean caps). */
137 case PIPE_CAP_POINT_SPRITE:
138 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
139 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
140 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
141 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
142 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
143 case PIPE_CAP_VERTEX_SHADER_SATURATE:
144 case PIPE_CAP_TEXTURE_BARRIER:
145 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
146 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
147 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
148 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
149 case PIPE_CAP_TGSI_TEXCOORD:
150 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
151 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
152 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
153 case PIPE_CAP_STRING_MARKER:
154 case PIPE_CAP_SHAREABLE_SHADERS:
155 return 1;
156 case PIPE_CAP_NATIVE_FENCE_FD:
157 return screen->drm_version >= ETNA_DRM_VERSION_FENCE_FD;
158 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
159 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL: /* note: not integer */
160 return DBG_ENABLED(ETNA_DBG_NIR);
161 case PIPE_CAP_TGSI_FS_POINT_IS_SYSVAL:
162 return 0;
163
164 /* Memory */
165 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
166 return 256;
167 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
168 return 4; /* XXX could easily be supported */
169
170 case PIPE_CAP_NPOT_TEXTURES:
171 return true; /* VIV_FEATURE(priv->dev, chipMinorFeatures1,
172 NON_POWER_OF_TWO); */
173
174 case PIPE_CAP_ANISOTROPIC_FILTER:
175 case PIPE_CAP_TEXTURE_SWIZZLE:
176 case PIPE_CAP_PRIMITIVE_RESTART:
177 case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:
178 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
179
180 /* Unsupported features. */
181 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
182 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
183 case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:
184 return 0;
185
186 /* Stream output. */
187 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
188 return DBG_ENABLED(ETNA_DBG_DEQP) ? 4 : 0;
189 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
190 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
191 return 0;
192
193 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
194 return 128;
195 case PIPE_CAP_MAX_VERTEX_ELEMENT_SRC_OFFSET:
196 return 255;
197 case PIPE_CAP_MAX_VERTEX_BUFFERS:
198 return screen->specs.stream_count;
199 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
200 return VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
201
202
203 /* Texturing. */
204 case PIPE_CAP_TEXTURE_SHADOW_MAP:
205 return DBG_ENABLED(ETNA_DBG_NIR) && screen->specs.halti >= 2;
206 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
207 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS: /* TODO: verify */
208 return screen->specs.max_texture_size;
209 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
210 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
211 {
212 int log2_max_tex_size = util_last_bit(screen->specs.max_texture_size);
213 assert(log2_max_tex_size > 0);
214 return log2_max_tex_size;
215 }
216
217 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
218 case PIPE_CAP_MIN_TEXEL_OFFSET:
219 return -8;
220 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
221 case PIPE_CAP_MAX_TEXEL_OFFSET:
222 return 7;
223 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
224 return screen->specs.seamless_cube_map;
225
226 /* Queries. */
227 case PIPE_CAP_OCCLUSION_QUERY:
228 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
229
230 /* Preferences */
231 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
232 return 0;
233 case PIPE_CAP_MAX_TEXTURE_UPLOAD_MEMORY_BUDGET: {
234 /* etnaviv is being run on systems as small as 256MB total RAM so
235 * we need to provide a sane value for such a device. Limit the
236 * memory budget to min(~3% of pyhiscal memory, 64MB).
237 *
238 * a simple divison by 32 provides the numbers we want.
239 * 256MB / 32 = 8MB
240 * 2048MB / 32 = 64MB
241 */
242 uint64_t system_memory;
243
244 if (!os_get_total_physical_memory(&system_memory))
245 system_memory = (uint64_t)4096 << 20;
246
247 return MIN2(system_memory / 32, 64 * 1024 * 1024);
248 }
249
250 case PIPE_CAP_MAX_VARYINGS:
251 return screen->specs.max_varyings;
252
253 case PIPE_CAP_PCI_GROUP:
254 case PIPE_CAP_PCI_BUS:
255 case PIPE_CAP_PCI_DEVICE:
256 case PIPE_CAP_PCI_FUNCTION:
257 return 0;
258 case PIPE_CAP_ACCELERATED:
259 return 1;
260 case PIPE_CAP_VIDEO_MEMORY:
261 return 0;
262 case PIPE_CAP_UMA:
263 return 1;
264 default:
265 return u_pipe_screen_get_param_defaults(pscreen, param);
266 }
267 }
268
269 static float
270 etna_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
271 {
272 struct etna_screen *screen = etna_screen(pscreen);
273
274 switch (param) {
275 case PIPE_CAPF_MAX_LINE_WIDTH:
276 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
277 case PIPE_CAPF_MAX_POINT_WIDTH:
278 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
279 return 8192.0f;
280 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
281 return 16.0f;
282 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
283 return util_last_bit(screen->specs.max_texture_size);
284 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
285 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
286 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
287 return 0.0f;
288 }
289
290 debug_printf("unknown paramf %d", param);
291 return 0;
292 }
293
294 static int
295 etna_screen_get_shader_param(struct pipe_screen *pscreen,
296 enum pipe_shader_type shader,
297 enum pipe_shader_cap param)
298 {
299 struct etna_screen *screen = etna_screen(pscreen);
300 bool ubo_enable = screen->specs.halti >= 2 && DBG_ENABLED(ETNA_DBG_NIR);
301
302 if (DBG_ENABLED(ETNA_DBG_DEQP))
303 ubo_enable = true;
304
305 switch (shader) {
306 case PIPE_SHADER_FRAGMENT:
307 case PIPE_SHADER_VERTEX:
308 break;
309 case PIPE_SHADER_COMPUTE:
310 case PIPE_SHADER_GEOMETRY:
311 case PIPE_SHADER_TESS_CTRL:
312 case PIPE_SHADER_TESS_EVAL:
313 return 0;
314 default:
315 DBG("unknown shader type %d", shader);
316 return 0;
317 }
318
319 switch (param) {
320 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
321 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
322 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
323 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
324 return ETNA_MAX_TOKENS;
325 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
326 return ETNA_MAX_DEPTH; /* XXX */
327 case PIPE_SHADER_CAP_MAX_INPUTS:
328 /* Maximum number of inputs for the vertex shader is the number
329 * of vertex elements - each element defines one vertex shader
330 * input register. For the fragment shader, this is the number
331 * of varyings. */
332 return shader == PIPE_SHADER_FRAGMENT ? screen->specs.max_varyings
333 : screen->specs.vertex_max_elements;
334 case PIPE_SHADER_CAP_MAX_OUTPUTS:
335 return 16; /* see VIVS_VS_OUTPUT */
336 case PIPE_SHADER_CAP_MAX_TEMPS:
337 return 64; /* Max native temporaries. */
338 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
339 return ubo_enable ? ETNA_MAX_CONST_BUF : 1;
340 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
341 return 1;
342 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
343 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
344 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
345 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
346 return 1;
347 case PIPE_SHADER_CAP_SUBROUTINES:
348 return 0;
349 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
350 return VIV_FEATURE(screen, chipMinorFeatures0, HAS_SQRT_TRIG);
351 case PIPE_SHADER_CAP_INT64_ATOMICS:
352 case PIPE_SHADER_CAP_FP16:
353 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
354 case PIPE_SHADER_CAP_INT16:
355 return 0;
356 case PIPE_SHADER_CAP_INTEGERS:
357 return DBG_ENABLED(ETNA_DBG_NIR) && screen->specs.halti >= 2;
358 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
359 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
360 return shader == PIPE_SHADER_FRAGMENT
361 ? screen->specs.fragment_sampler_count
362 : screen->specs.vertex_sampler_count;
363 case PIPE_SHADER_CAP_PREFERRED_IR:
364 return DBG_ENABLED(ETNA_DBG_NIR) ? PIPE_SHADER_IR_NIR : PIPE_SHADER_IR_TGSI;
365 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
366 if (ubo_enable)
367 return 16384; /* 16384 so state tracker enables UBOs */
368 return shader == PIPE_SHADER_FRAGMENT
369 ? screen->specs.max_ps_uniforms * sizeof(float[4])
370 : screen->specs.max_vs_uniforms * sizeof(float[4]);
371 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
372 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
373 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
374 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
375 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
376 return false;
377 case PIPE_SHADER_CAP_SUPPORTED_IRS:
378 return 0;
379 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
380 return 32;
381 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
382 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
383 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
384 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
385 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
386 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
387 return 0;
388 }
389
390 debug_printf("unknown shader param %d", param);
391 return 0;
392 }
393
394 static uint64_t
395 etna_screen_get_timestamp(struct pipe_screen *pscreen)
396 {
397 return os_time_get_nano();
398 }
399
400 static bool
401 gpu_supports_texture_target(struct etna_screen *screen,
402 enum pipe_texture_target target)
403 {
404 if (target == PIPE_TEXTURE_CUBE_ARRAY)
405 return false;
406
407 /* pre-halti has no array/3D */
408 if (screen->specs.halti < 0 &&
409 (target == PIPE_TEXTURE_1D_ARRAY ||
410 target == PIPE_TEXTURE_2D_ARRAY ||
411 target == PIPE_TEXTURE_3D))
412 return false;
413
414 return true;
415 }
416
417 static bool
418 gpu_supports_texture_format(struct etna_screen *screen, uint32_t fmt,
419 enum pipe_format format)
420 {
421 bool supported = true;
422
423 if (fmt == TEXTURE_FORMAT_ETC1)
424 supported = VIV_FEATURE(screen, chipFeatures, ETC1_TEXTURE_COMPRESSION);
425
426 if (fmt >= TEXTURE_FORMAT_DXT1 && fmt <= TEXTURE_FORMAT_DXT4_DXT5)
427 supported = VIV_FEATURE(screen, chipFeatures, DXT_TEXTURE_COMPRESSION);
428
429 if (util_format_is_srgb(format))
430 supported = VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
431
432 if (fmt & EXT_FORMAT)
433 supported = VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
434
435 if (fmt & ASTC_FORMAT) {
436 supported = screen->specs.tex_astc;
437 }
438
439 if (util_format_is_snorm(format))
440 supported = VIV_FEATURE(screen, chipMinorFeatures2, HALTI1);
441
442 if (format != PIPE_FORMAT_S8_UINT_Z24_UNORM &&
443 (util_format_is_pure_integer(format) || util_format_is_float(format)))
444 supported = VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
445
446
447 if (!supported)
448 return false;
449
450 if (texture_format_needs_swiz(format))
451 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
452
453 return true;
454 }
455
456 static bool
457 gpu_supports_render_format(struct etna_screen *screen, enum pipe_format format,
458 unsigned sample_count)
459 {
460 const uint32_t fmt = translate_pe_format(format);
461
462 if (fmt == ETNA_NO_MATCH)
463 return false;
464
465 /* Validate MSAA; number of samples must be allowed, and render target
466 * must have MSAA'able format. */
467 if (sample_count > 1) {
468 if (!VIV_FEATURE(screen, chipFeatures, MSAA))
469 return false;
470 if (!translate_samples_to_xyscale(sample_count, NULL, NULL))
471 return false;
472 if (translate_ts_format(format) == ETNA_NO_MATCH)
473 return false;
474 }
475
476 if (format == PIPE_FORMAT_R8_UNORM)
477 return VIV_FEATURE(screen, chipMinorFeatures5, HALTI5);
478
479 /* figure out 8bpp RS clear to enable these formats */
480 if (format == PIPE_FORMAT_R8_SINT || format == PIPE_FORMAT_R8_UINT)
481 return VIV_FEATURE(screen, chipMinorFeatures5, HALTI5);
482
483 if (util_format_is_srgb(format))
484 return VIV_FEATURE(screen, chipMinorFeatures5, HALTI3);
485
486 if (util_format_is_pure_integer(format) || util_format_is_float(format))
487 return VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
488
489 if (format == PIPE_FORMAT_R8G8_UNORM)
490 return VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
491
492 /* any other extended format is HALTI0 (only R10G10B10A2?) */
493 if (fmt >= PE_FORMAT_R16F)
494 return VIV_FEATURE(screen, chipMinorFeatures1, HALTI0);
495
496 return true;
497 }
498
499 static bool
500 gpu_supports_vertex_format(struct etna_screen *screen, enum pipe_format format)
501 {
502 if (translate_vertex_format_type(format) == ETNA_NO_MATCH)
503 return false;
504
505 if (util_format_is_pure_integer(format))
506 return VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
507
508 return true;
509 }
510
511 static bool
512 etna_screen_is_format_supported(struct pipe_screen *pscreen,
513 enum pipe_format format,
514 enum pipe_texture_target target,
515 unsigned sample_count,
516 unsigned storage_sample_count,
517 unsigned usage)
518 {
519 struct etna_screen *screen = etna_screen(pscreen);
520 unsigned allowed = 0;
521
522 if (!gpu_supports_texture_target(screen, target))
523 return false;
524
525 if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
526 return false;
527
528 if (usage & PIPE_BIND_RENDER_TARGET) {
529 if (gpu_supports_render_format(screen, format, sample_count))
530 allowed |= PIPE_BIND_RENDER_TARGET;
531 }
532
533 if (usage & PIPE_BIND_DEPTH_STENCIL) {
534 if (translate_depth_format(format) != ETNA_NO_MATCH)
535 allowed |= PIPE_BIND_DEPTH_STENCIL;
536 }
537
538 if (usage & PIPE_BIND_SAMPLER_VIEW) {
539 uint32_t fmt = translate_texture_format(format);
540
541 if (!gpu_supports_texture_format(screen, fmt, format))
542 fmt = ETNA_NO_MATCH;
543
544 if (sample_count < 2 && fmt != ETNA_NO_MATCH)
545 allowed |= PIPE_BIND_SAMPLER_VIEW;
546 }
547
548 if (usage & PIPE_BIND_VERTEX_BUFFER) {
549 if (gpu_supports_vertex_format(screen, format))
550 allowed |= PIPE_BIND_VERTEX_BUFFER;
551 }
552
553 if (usage & PIPE_BIND_INDEX_BUFFER) {
554 /* must be supported index format */
555 if (format == PIPE_FORMAT_I8_UINT || format == PIPE_FORMAT_I16_UINT ||
556 (format == PIPE_FORMAT_I32_UINT &&
557 VIV_FEATURE(screen, chipFeatures, 32_BIT_INDICES))) {
558 allowed |= PIPE_BIND_INDEX_BUFFER;
559 }
560 }
561
562 /* Always allowed */
563 allowed |=
564 usage & (PIPE_BIND_DISPLAY_TARGET | PIPE_BIND_SCANOUT | PIPE_BIND_SHARED);
565
566 if (usage != allowed) {
567 DBG("not supported: format=%s, target=%d, sample_count=%d, "
568 "usage=%x, allowed=%x",
569 util_format_name(format), target, sample_count, usage, allowed);
570 }
571
572 return usage == allowed;
573 }
574
575 const uint64_t supported_modifiers[] = {
576 DRM_FORMAT_MOD_LINEAR,
577 DRM_FORMAT_MOD_VIVANTE_TILED,
578 DRM_FORMAT_MOD_VIVANTE_SUPER_TILED,
579 DRM_FORMAT_MOD_VIVANTE_SPLIT_TILED,
580 DRM_FORMAT_MOD_VIVANTE_SPLIT_SUPER_TILED,
581 };
582
583 static void
584 etna_screen_query_dmabuf_modifiers(struct pipe_screen *pscreen,
585 enum pipe_format format, int max,
586 uint64_t *modifiers,
587 unsigned int *external_only, int *count)
588 {
589 struct etna_screen *screen = etna_screen(pscreen);
590 int i, num_modifiers = 0;
591
592 if (max > ARRAY_SIZE(supported_modifiers))
593 max = ARRAY_SIZE(supported_modifiers);
594
595 if (!max) {
596 modifiers = NULL;
597 max = ARRAY_SIZE(supported_modifiers);
598 }
599
600 for (i = 0; num_modifiers < max; i++) {
601 /* don't advertise split tiled formats on single pipe/buffer GPUs */
602 if ((screen->specs.pixel_pipes == 1 || screen->specs.single_buffer) &&
603 i >= 3)
604 break;
605
606 if (modifiers)
607 modifiers[num_modifiers] = supported_modifiers[i];
608 if (external_only)
609 external_only[num_modifiers] = util_format_is_yuv(format) ? 1 : 0;
610 num_modifiers++;
611 }
612
613 *count = num_modifiers;
614 }
615
616 static void
617 etna_determine_uniform_limits(struct etna_screen *screen)
618 {
619 /* values for the non unified case are taken from
620 * gcmCONFIGUREUNIFORMS in the Vivante kernel driver file
621 * drivers/mxc/gpu-viv/hal/kernel/inc/gc_hal_base.h.
622 */
623 if (screen->model == chipModel_GC2000 &&
624 (screen->revision == 0x5118 || screen->revision == 0x5140)) {
625 screen->specs.max_vs_uniforms = 256;
626 screen->specs.max_ps_uniforms = 64;
627 } else if (screen->specs.num_constants == 320) {
628 screen->specs.max_vs_uniforms = 256;
629 screen->specs.max_ps_uniforms = 64;
630 } else if (screen->specs.num_constants > 256 &&
631 screen->model == chipModel_GC1000) {
632 /* All GC1000 series chips can only support 64 uniforms for ps on non-unified const mode. */
633 screen->specs.max_vs_uniforms = 256;
634 screen->specs.max_ps_uniforms = 64;
635 } else if (screen->specs.num_constants > 256) {
636 screen->specs.max_vs_uniforms = 256;
637 screen->specs.max_ps_uniforms = 256;
638 } else if (screen->specs.num_constants == 256) {
639 screen->specs.max_vs_uniforms = 256;
640 screen->specs.max_ps_uniforms = 256;
641 } else {
642 screen->specs.max_vs_uniforms = 168;
643 screen->specs.max_ps_uniforms = 64;
644 }
645 }
646
647 static bool
648 etna_get_specs(struct etna_screen *screen)
649 {
650 uint64_t val;
651 uint32_t instruction_count;
652
653 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_INSTRUCTION_COUNT, &val)) {
654 DBG("could not get ETNA_GPU_INSTRUCTION_COUNT");
655 goto fail;
656 }
657 instruction_count = val;
658
659 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_VERTEX_OUTPUT_BUFFER_SIZE,
660 &val)) {
661 DBG("could not get ETNA_GPU_VERTEX_OUTPUT_BUFFER_SIZE");
662 goto fail;
663 }
664 screen->specs.vertex_output_buffer_size = val;
665
666 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_VERTEX_CACHE_SIZE, &val)) {
667 DBG("could not get ETNA_GPU_VERTEX_CACHE_SIZE");
668 goto fail;
669 }
670 screen->specs.vertex_cache_size = val;
671
672 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_SHADER_CORE_COUNT, &val)) {
673 DBG("could not get ETNA_GPU_SHADER_CORE_COUNT");
674 goto fail;
675 }
676 screen->specs.shader_core_count = val;
677
678 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_STREAM_COUNT, &val)) {
679 DBG("could not get ETNA_GPU_STREAM_COUNT");
680 goto fail;
681 }
682 screen->specs.stream_count = val;
683
684 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_REGISTER_MAX, &val)) {
685 DBG("could not get ETNA_GPU_REGISTER_MAX");
686 goto fail;
687 }
688 screen->specs.max_registers = val;
689
690 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_PIXEL_PIPES, &val)) {
691 DBG("could not get ETNA_GPU_PIXEL_PIPES");
692 goto fail;
693 }
694 screen->specs.pixel_pipes = val;
695
696 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_NUM_CONSTANTS, &val)) {
697 DBG("could not get %s", "ETNA_GPU_NUM_CONSTANTS");
698 goto fail;
699 }
700 if (val == 0) {
701 fprintf(stderr, "Warning: zero num constants (update kernel?)\n");
702 val = 168;
703 }
704 screen->specs.num_constants = val;
705
706 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_NUM_VARYINGS, &val)) {
707 DBG("could not get ETNA_GPU_NUM_VARYINGS");
708 goto fail;
709 }
710 screen->specs.max_varyings = MAX2(val, ETNA_NUM_VARYINGS);
711
712 /* Figure out gross GPU architecture. See rnndb/common.xml for a specific
713 * description of the differences. */
714 if (VIV_FEATURE(screen, chipMinorFeatures5, HALTI5))
715 screen->specs.halti = 5; /* New GC7000/GC8x00 */
716 else if (VIV_FEATURE(screen, chipMinorFeatures5, HALTI4))
717 screen->specs.halti = 4; /* Old GC7000/GC7400 */
718 else if (VIV_FEATURE(screen, chipMinorFeatures5, HALTI3))
719 screen->specs.halti = 3; /* None? */
720 else if (VIV_FEATURE(screen, chipMinorFeatures4, HALTI2))
721 screen->specs.halti = 2; /* GC2500/GC3000/GC5000/GC6400 */
722 else if (VIV_FEATURE(screen, chipMinorFeatures2, HALTI1))
723 screen->specs.halti = 1; /* GC900/GC4000/GC7000UL */
724 else if (VIV_FEATURE(screen, chipMinorFeatures1, HALTI0))
725 screen->specs.halti = 0; /* GC880/GC2000/GC7000TM */
726 else
727 screen->specs.halti = -1; /* GC7000nanolite / pre-GC2000 except GC880 */
728 if (screen->specs.halti >= 0)
729 DBG("etnaviv: GPU arch: HALTI%d", screen->specs.halti);
730 else
731 DBG("etnaviv: GPU arch: pre-HALTI");
732
733 screen->specs.can_supertile =
734 VIV_FEATURE(screen, chipMinorFeatures0, SUPER_TILED);
735 screen->specs.bits_per_tile =
736 VIV_FEATURE(screen, chipMinorFeatures0, 2BITPERTILE) ? 2 : 4;
737 screen->specs.ts_clear_value =
738 VIV_FEATURE(screen, chipMinorFeatures5, BLT_ENGINE) ? 0xffffffff :
739 VIV_FEATURE(screen, chipMinorFeatures0, 2BITPERTILE) ? 0x55555555 :
740 0x11111111;
741
742
743 /* vertex and fragment samplers live in one address space */
744 screen->specs.vertex_sampler_offset = 8;
745 screen->specs.fragment_sampler_count = 8;
746 screen->specs.vertex_sampler_count = 4;
747
748 if (screen->model == 0x400)
749 screen->specs.vertex_sampler_count = 0;
750
751 screen->specs.vs_need_z_div =
752 screen->model < 0x1000 && screen->model != 0x880;
753 screen->specs.has_sin_cos_sqrt =
754 VIV_FEATURE(screen, chipMinorFeatures0, HAS_SQRT_TRIG);
755 screen->specs.has_sign_floor_ceil =
756 VIV_FEATURE(screen, chipMinorFeatures0, HAS_SIGN_FLOOR_CEIL);
757 screen->specs.has_shader_range_registers =
758 screen->model >= 0x1000 || screen->model == 0x880;
759 screen->specs.npot_tex_any_wrap =
760 VIV_FEATURE(screen, chipMinorFeatures1, NON_POWER_OF_TWO);
761 screen->specs.has_new_transcendentals =
762 VIV_FEATURE(screen, chipMinorFeatures3, HAS_FAST_TRANSCENDENTALS);
763 screen->specs.has_halti2_instructions =
764 VIV_FEATURE(screen, chipMinorFeatures4, HALTI2);
765 screen->specs.v4_compression =
766 VIV_FEATURE(screen, chipMinorFeatures6, V4_COMPRESSION);
767 screen->specs.seamless_cube_map =
768 (screen->model != 0x880) && /* Seamless cubemap is broken on GC880? */
769 VIV_FEATURE(screen, chipMinorFeatures2, SEAMLESS_CUBE_MAP);
770
771 if (screen->specs.halti >= 5) {
772 /* GC7000 - this core must load shaders from memory. */
773 screen->specs.vs_offset = 0;
774 screen->specs.ps_offset = 0;
775 screen->specs.max_instructions = 0; /* Do not program shaders manually */
776 screen->specs.has_icache = true;
777 } else if (VIV_FEATURE(screen, chipMinorFeatures3, INSTRUCTION_CACHE)) {
778 /* GC3000 - this core is capable of loading shaders from
779 * memory. It can also run shaders from registers, as a fallback, but
780 * "max_instructions" does not have the correct value. It has place for
781 * 2*256 instructions just like GC2000, but the offsets are slightly
782 * different.
783 */
784 screen->specs.vs_offset = 0xC000;
785 /* State 08000-0C000 mirrors 0C000-0E000, and the Vivante driver uses
786 * this mirror for writing PS instructions, probably safest to do the
787 * same.
788 */
789 screen->specs.ps_offset = 0x8000 + 0x1000;
790 screen->specs.max_instructions = 256; /* maximum number instructions for non-icache use */
791 screen->specs.has_icache = true;
792 } else {
793 if (instruction_count > 256) { /* unified instruction memory? */
794 screen->specs.vs_offset = 0xC000;
795 screen->specs.ps_offset = 0xD000; /* like vivante driver */
796 screen->specs.max_instructions = 256;
797 } else {
798 screen->specs.vs_offset = 0x4000;
799 screen->specs.ps_offset = 0x6000;
800 screen->specs.max_instructions = instruction_count / 2;
801 }
802 screen->specs.has_icache = false;
803 }
804
805 if (VIV_FEATURE(screen, chipMinorFeatures1, HALTI0)) {
806 screen->specs.vertex_max_elements = 16;
807 } else {
808 /* Etna_viv documentation seems confused over the correct value
809 * here so choose the lower to be safe: HALTI0 says 16 i.s.o.
810 * 10, but VERTEX_ELEMENT_CONFIG register says 16 i.s.o. 12. */
811 screen->specs.vertex_max_elements = 10;
812 }
813
814 etna_determine_uniform_limits(screen);
815
816 if (screen->specs.halti >= 5) {
817 screen->specs.has_unified_uniforms = true;
818 screen->specs.vs_uniforms_offset = VIVS_SH_HALTI5_UNIFORMS_MIRROR(0);
819 screen->specs.ps_uniforms_offset = VIVS_SH_HALTI5_UNIFORMS(screen->specs.max_vs_uniforms*4);
820 } else if (screen->specs.halti >= 1) {
821 /* unified uniform memory on GC3000 - HALTI1 feature bit is just a guess
822 */
823 screen->specs.has_unified_uniforms = true;
824 screen->specs.vs_uniforms_offset = VIVS_SH_UNIFORMS(0);
825 /* hardcode PS uniforms to start after end of VS uniforms -
826 * for more flexibility this offset could be variable based on the
827 * shader.
828 */
829 screen->specs.ps_uniforms_offset = VIVS_SH_UNIFORMS(screen->specs.max_vs_uniforms*4);
830 } else {
831 screen->specs.has_unified_uniforms = false;
832 screen->specs.vs_uniforms_offset = VIVS_VS_UNIFORMS(0);
833 screen->specs.ps_uniforms_offset = VIVS_PS_UNIFORMS(0);
834 }
835
836 screen->specs.max_texture_size =
837 VIV_FEATURE(screen, chipMinorFeatures0, TEXTURE_8K) ? 8192 : 2048;
838 screen->specs.max_rendertarget_size =
839 VIV_FEATURE(screen, chipMinorFeatures0, RENDERTARGET_8K) ? 8192 : 2048;
840
841 screen->specs.single_buffer = VIV_FEATURE(screen, chipMinorFeatures4, SINGLE_BUFFER);
842 if (screen->specs.single_buffer)
843 DBG("etnaviv: Single buffer mode enabled with %d pixel pipes", screen->specs.pixel_pipes);
844
845 screen->specs.tex_astc = VIV_FEATURE(screen, chipMinorFeatures4, TEXTURE_ASTC) &&
846 !VIV_FEATURE(screen, chipMinorFeatures6, NO_ASTC);
847
848 screen->specs.use_blt = VIV_FEATURE(screen, chipMinorFeatures5, BLT_ENGINE);
849
850 return true;
851
852 fail:
853 return false;
854 }
855
856 struct etna_bo *
857 etna_screen_bo_from_handle(struct pipe_screen *pscreen,
858 struct winsys_handle *whandle, unsigned *out_stride)
859 {
860 struct etna_screen *screen = etna_screen(pscreen);
861 struct etna_bo *bo;
862
863 if (whandle->type == WINSYS_HANDLE_TYPE_SHARED) {
864 bo = etna_bo_from_name(screen->dev, whandle->handle);
865 } else if (whandle->type == WINSYS_HANDLE_TYPE_FD) {
866 bo = etna_bo_from_dmabuf(screen->dev, whandle->handle);
867 } else {
868 DBG("Attempt to import unsupported handle type %d", whandle->type);
869 return NULL;
870 }
871
872 if (!bo) {
873 DBG("ref name 0x%08x failed", whandle->handle);
874 return NULL;
875 }
876
877 *out_stride = whandle->stride;
878
879 return bo;
880 }
881
882 static const void *
883 etna_get_compiler_options(struct pipe_screen *pscreen,
884 enum pipe_shader_ir ir, unsigned shader)
885 {
886 return &etna_screen(pscreen)->options;
887 }
888
889 struct pipe_screen *
890 etna_screen_create(struct etna_device *dev, struct etna_gpu *gpu,
891 struct renderonly *ro)
892 {
893 struct etna_screen *screen = CALLOC_STRUCT(etna_screen);
894 struct pipe_screen *pscreen;
895 drmVersionPtr version;
896 uint64_t val;
897
898 if (!screen)
899 return NULL;
900
901 pscreen = &screen->base;
902 screen->dev = dev;
903 screen->gpu = gpu;
904 screen->ro = renderonly_dup(ro);
905 screen->refcnt = 1;
906
907 if (!screen->ro) {
908 DBG("could not create renderonly object");
909 goto fail;
910 }
911
912 version = drmGetVersion(screen->ro->gpu_fd);
913 screen->drm_version = ETNA_DRM_VERSION(version->version_major,
914 version->version_minor);
915 drmFreeVersion(version);
916
917 etna_mesa_debug = debug_get_option_etna_mesa_debug();
918
919 /* Disable autodisable for correct rendering with TS */
920 etna_mesa_debug |= ETNA_DBG_NO_AUTODISABLE;
921
922 screen->pipe = etna_pipe_new(gpu, ETNA_PIPE_3D);
923 if (!screen->pipe) {
924 DBG("could not create 3d pipe");
925 goto fail;
926 }
927
928 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_MODEL, &val)) {
929 DBG("could not get ETNA_GPU_MODEL");
930 goto fail;
931 }
932 screen->model = val;
933
934 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_REVISION, &val)) {
935 DBG("could not get ETNA_GPU_REVISION");
936 goto fail;
937 }
938 screen->revision = val;
939
940 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_0, &val)) {
941 DBG("could not get ETNA_GPU_FEATURES_0");
942 goto fail;
943 }
944 screen->features[0] = val;
945
946 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_1, &val)) {
947 DBG("could not get ETNA_GPU_FEATURES_1");
948 goto fail;
949 }
950 screen->features[1] = val;
951
952 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_2, &val)) {
953 DBG("could not get ETNA_GPU_FEATURES_2");
954 goto fail;
955 }
956 screen->features[2] = val;
957
958 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_3, &val)) {
959 DBG("could not get ETNA_GPU_FEATURES_3");
960 goto fail;
961 }
962 screen->features[3] = val;
963
964 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_4, &val)) {
965 DBG("could not get ETNA_GPU_FEATURES_4");
966 goto fail;
967 }
968 screen->features[4] = val;
969
970 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_5, &val)) {
971 DBG("could not get ETNA_GPU_FEATURES_5");
972 goto fail;
973 }
974 screen->features[5] = val;
975
976 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_6, &val)) {
977 DBG("could not get ETNA_GPU_FEATURES_6");
978 goto fail;
979 }
980 screen->features[6] = val;
981
982 if (etna_gpu_get_param(screen->gpu, ETNA_GPU_FEATURES_7, &val)) {
983 DBG("could not get ETNA_GPU_FEATURES_7");
984 goto fail;
985 }
986 screen->features[7] = val;
987
988 if (!etna_get_specs(screen))
989 goto fail;
990
991 if (screen->specs.halti >= 5 && !etnaviv_device_softpin_capable(dev)) {
992 DBG("halti5 requires softpin");
993 goto fail;
994 }
995
996 screen->options = (nir_shader_compiler_options) {
997 .lower_fpow = true,
998 .lower_sub = true,
999 .lower_ftrunc = true,
1000 .fuse_ffma = true,
1001 .lower_bitops = true,
1002 .lower_all_io_to_temps = true,
1003 .vertex_id_zero_based = true,
1004 .lower_flrp32 = true,
1005 .lower_fmod = true,
1006 .lower_vector_cmp = true,
1007 .lower_fdph = true,
1008 .lower_fdiv = true, /* !screen->specs.has_new_transcendentals */
1009 .lower_fsign = !screen->specs.has_sign_floor_ceil,
1010 .lower_ffloor = !screen->specs.has_sign_floor_ceil,
1011 .lower_fceil = !screen->specs.has_sign_floor_ceil,
1012 .lower_fsqrt = !screen->specs.has_sin_cos_sqrt,
1013 .lower_sincos = !screen->specs.has_sin_cos_sqrt,
1014 };
1015
1016 /* apply debug options that disable individual features */
1017 if (DBG_ENABLED(ETNA_DBG_NO_EARLY_Z))
1018 screen->features[viv_chipFeatures] |= chipFeatures_NO_EARLY_Z;
1019 if (DBG_ENABLED(ETNA_DBG_NO_TS))
1020 screen->features[viv_chipFeatures] &= ~chipFeatures_FAST_CLEAR;
1021 if (DBG_ENABLED(ETNA_DBG_NO_AUTODISABLE))
1022 screen->features[viv_chipMinorFeatures1] &= ~chipMinorFeatures1_AUTO_DISABLE;
1023 if (DBG_ENABLED(ETNA_DBG_NO_SUPERTILE))
1024 screen->specs.can_supertile = 0;
1025 if (DBG_ENABLED(ETNA_DBG_NO_SINGLEBUF))
1026 screen->specs.single_buffer = 0;
1027
1028 pscreen->destroy = etna_screen_destroy;
1029 pscreen->get_param = etna_screen_get_param;
1030 pscreen->get_paramf = etna_screen_get_paramf;
1031 pscreen->get_shader_param = etna_screen_get_shader_param;
1032 pscreen->get_compiler_options = etna_get_compiler_options;
1033
1034 pscreen->get_name = etna_screen_get_name;
1035 pscreen->get_vendor = etna_screen_get_vendor;
1036 pscreen->get_device_vendor = etna_screen_get_device_vendor;
1037
1038 pscreen->get_timestamp = etna_screen_get_timestamp;
1039 pscreen->context_create = etna_context_create;
1040 pscreen->is_format_supported = etna_screen_is_format_supported;
1041 pscreen->query_dmabuf_modifiers = etna_screen_query_dmabuf_modifiers;
1042
1043 etna_fence_screen_init(pscreen);
1044 etna_query_screen_init(pscreen);
1045 etna_resource_screen_init(pscreen);
1046
1047 util_dynarray_init(&screen->supported_pm_queries, NULL);
1048 slab_create_parent(&screen->transfer_pool, sizeof(struct etna_transfer), 16);
1049
1050 if (screen->drm_version >= ETNA_DRM_VERSION_PERFMON)
1051 etna_pm_query_setup(screen);
1052
1053 return pscreen;
1054
1055 fail:
1056 etna_screen_destroy(pscreen);
1057 return NULL;
1058 }