v3d: Add support for draw indirect for GLES3.1.
[mesa.git] / src / gallium / drivers / v3d / v3d_screen.c
1 /*
2 * Copyright © 2014-2017 Broadcom
3 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22 * IN THE SOFTWARE.
23 */
24
25 #include "util/os_misc.h"
26 #include "pipe/p_defines.h"
27 #include "pipe/p_screen.h"
28 #include "pipe/p_state.h"
29
30 #include "util/u_debug.h"
31 #include "util/u_memory.h"
32 #include "util/u_format.h"
33 #include "util/u_hash_table.h"
34 #include "util/u_screen.h"
35 #include "util/u_transfer_helper.h"
36 #include "util/ralloc.h"
37
38 #include <xf86drm.h>
39 #include "v3d_screen.h"
40 #include "v3d_context.h"
41 #include "v3d_resource.h"
42 #include "compiler/v3d_compiler.h"
43
44 static const char *
45 v3d_screen_get_name(struct pipe_screen *pscreen)
46 {
47 struct v3d_screen *screen = v3d_screen(pscreen);
48
49 if (!screen->name) {
50 screen->name = ralloc_asprintf(screen,
51 "V3D %d.%d",
52 screen->devinfo.ver / 10,
53 screen->devinfo.ver % 10);
54 }
55
56 return screen->name;
57 }
58
/**
 * Returns the constant vendor string.  The screen argument is not consulted.
 */
static const char *
v3d_screen_get_vendor(struct pipe_screen *pscreen)
{
        static const char vendor[] = "Broadcom";

        return vendor;
}
64
65 static void
66 v3d_screen_destroy(struct pipe_screen *pscreen)
67 {
68 struct v3d_screen *screen = v3d_screen(pscreen);
69
70 util_hash_table_destroy(screen->bo_handles);
71 v3d_bufmgr_destroy(pscreen);
72 slab_destroy_parent(&screen->transfer_pool);
73
74 if (using_v3d_simulator)
75 v3d_simulator_destroy(screen);
76
77 v3d_compiler_free(screen->compiler);
78 u_transfer_helper_destroy(pscreen->transfer_helper);
79
80 close(screen->fd);
81 ralloc_free(pscreen);
82 }
83
84 static bool
85 v3d_has_feature(struct v3d_screen *screen, enum drm_v3d_param feature)
86 {
87 struct drm_v3d_get_param p = {
88 .param = feature,
89 };
90 int ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &p);
91
92 if (ret != 0)
93 return false;
94
95 return p.value;
96 }
97
98 static int
99 v3d_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
100 {
101 struct v3d_screen *screen = v3d_screen(pscreen);
102
103 switch (param) {
104 /* Supported features (boolean caps). */
105 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
106 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
107 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
108 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
109 case PIPE_CAP_NPOT_TEXTURES:
110 case PIPE_CAP_SHAREABLE_SHADERS:
111 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
112 case PIPE_CAP_TEXTURE_MULTISAMPLE:
113 case PIPE_CAP_TEXTURE_SWIZZLE:
114 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
115 case PIPE_CAP_START_INSTANCE:
116 case PIPE_CAP_TGSI_INSTANCEID:
117 case PIPE_CAP_SM3:
118 case PIPE_CAP_TEXTURE_QUERY_LOD:
119 case PIPE_CAP_PRIMITIVE_RESTART:
120 case PIPE_CAP_OCCLUSION_QUERY:
121 case PIPE_CAP_POINT_SPRITE:
122 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
123 case PIPE_CAP_COMPUTE:
124 case PIPE_CAP_DRAW_INDIRECT:
125 case PIPE_CAP_MULTI_DRAW_INDIRECT:
126 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
127 case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
128 case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:
129 case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
130 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
131 return 1;
132
133 case PIPE_CAP_GENERATE_MIPMAP:
134 return v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_TFU);
135
136 case PIPE_CAP_INDEP_BLEND_ENABLE:
137 return screen->devinfo.ver >= 40;
138
139 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
140 return 256;
141
142 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
143 return 4;
144
145 case PIPE_CAP_GLSL_FEATURE_LEVEL:
146 return 400;
147
148 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
149 return 140;
150
151 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
152 return 1;
153 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
154 return 0;
155 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
156 if (screen->devinfo.ver >= 40)
157 return 0;
158 else
159 return 1;
160 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
161 if (screen->devinfo.ver >= 40)
162 return 1;
163 else
164 return 0;
165
166 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
167 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
168 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
169 return 1;
170
171 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
172 return 4;
173
174 /* Texturing. */
175 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
176 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
177 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
178 return VC5_MAX_MIP_LEVELS;
179 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
180 return 2048;
181
182 /* Render targets. */
183 case PIPE_CAP_MAX_RENDER_TARGETS:
184 return 4;
185
186 case PIPE_CAP_VENDOR_ID:
187 return 0x14E4;
188 case PIPE_CAP_ACCELERATED:
189 return 1;
190 case PIPE_CAP_VIDEO_MEMORY: {
191 uint64_t system_memory;
192
193 if (!os_get_total_physical_memory(&system_memory))
194 return 0;
195
196 return (int)(system_memory >> 20);
197 }
198 case PIPE_CAP_UMA:
199 return 1;
200
201 default:
202 return u_pipe_screen_get_param_defaults(pscreen, param);
203 }
204 }
205
206 static float
207 v3d_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
208 {
209 switch (param) {
210 case PIPE_CAPF_MAX_LINE_WIDTH:
211 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
212 return 32;
213
214 case PIPE_CAPF_MAX_POINT_WIDTH:
215 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
216 return 512.0f;
217
218 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
219 return 0.0f;
220 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
221 return 16.0f;
222
223 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
224 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
225 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
226 return 0.0f;
227 default:
228 fprintf(stderr, "unknown paramf %d\n", param);
229 return 0;
230 }
231 }
232
233 static int
234 v3d_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
235 enum pipe_shader_cap param)
236 {
237 if (shader != PIPE_SHADER_VERTEX &&
238 shader != PIPE_SHADER_FRAGMENT) {
239 return 0;
240 }
241
242 /* this is probably not totally correct.. but it's a start: */
243 switch (param) {
244 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
245 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
246 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
247 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
248 return 16384;
249
250 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
251 return UINT_MAX;
252
253 case PIPE_SHADER_CAP_MAX_INPUTS:
254 if (shader == PIPE_SHADER_FRAGMENT)
255 return VC5_MAX_FS_INPUTS / 4;
256 else
257 return VC5_MAX_ATTRIBUTES;
258 case PIPE_SHADER_CAP_MAX_OUTPUTS:
259 if (shader == PIPE_SHADER_FRAGMENT)
260 return 4;
261 else
262 return VC5_MAX_FS_INPUTS / 4;
263 case PIPE_SHADER_CAP_MAX_TEMPS:
264 return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */
265 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
266 return 16 * 1024 * sizeof(float);
267 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
268 return 16;
269 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
270 return 0;
271 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
272 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
273 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
274 return 0;
275 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
276 return 1;
277 case PIPE_SHADER_CAP_SUBROUTINES:
278 return 0;
279 case PIPE_SHADER_CAP_INTEGERS:
280 return 1;
281 case PIPE_SHADER_CAP_FP16:
282 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
283 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
284 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
285 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
286 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
287 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
288 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
289 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
290 return 0;
291 case PIPE_SHADER_CAP_SCALAR_ISA:
292 return 1;
293 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
294 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
295 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
296 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
297 return VC5_MAX_TEXTURE_SAMPLERS;
298 case PIPE_SHADER_CAP_PREFERRED_IR:
299 return PIPE_SHADER_IR_NIR;
300 case PIPE_SHADER_CAP_SUPPORTED_IRS:
301 return 0;
302 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
303 return 32;
304 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
305 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
306 return 0;
307 default:
308 fprintf(stderr, "unknown shader param %d\n", param);
309 return 0;
310 }
311 return 0;
312 }
313
314 static boolean
315 v3d_screen_is_format_supported(struct pipe_screen *pscreen,
316 enum pipe_format format,
317 enum pipe_texture_target target,
318 unsigned sample_count,
319 unsigned storage_sample_count,
320 unsigned usage)
321 {
322 struct v3d_screen *screen = v3d_screen(pscreen);
323
324 if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
325 return false;
326
327 if (sample_count > 1 && sample_count != VC5_MAX_SAMPLES)
328 return FALSE;
329
330 if (target >= PIPE_MAX_TEXTURE_TYPES) {
331 return FALSE;
332 }
333
334 if (usage & PIPE_BIND_VERTEX_BUFFER) {
335 switch (format) {
336 case PIPE_FORMAT_R32G32B32A32_FLOAT:
337 case PIPE_FORMAT_R32G32B32_FLOAT:
338 case PIPE_FORMAT_R32G32_FLOAT:
339 case PIPE_FORMAT_R32_FLOAT:
340 case PIPE_FORMAT_R32G32B32A32_SNORM:
341 case PIPE_FORMAT_R32G32B32_SNORM:
342 case PIPE_FORMAT_R32G32_SNORM:
343 case PIPE_FORMAT_R32_SNORM:
344 case PIPE_FORMAT_R32G32B32A32_SSCALED:
345 case PIPE_FORMAT_R32G32B32_SSCALED:
346 case PIPE_FORMAT_R32G32_SSCALED:
347 case PIPE_FORMAT_R32_SSCALED:
348 case PIPE_FORMAT_R16G16B16A16_UNORM:
349 case PIPE_FORMAT_R16G16B16_UNORM:
350 case PIPE_FORMAT_R16G16_UNORM:
351 case PIPE_FORMAT_R16_UNORM:
352 case PIPE_FORMAT_R16G16B16A16_SNORM:
353 case PIPE_FORMAT_R16G16B16_SNORM:
354 case PIPE_FORMAT_R16G16_SNORM:
355 case PIPE_FORMAT_R16_SNORM:
356 case PIPE_FORMAT_R16G16B16A16_USCALED:
357 case PIPE_FORMAT_R16G16B16_USCALED:
358 case PIPE_FORMAT_R16G16_USCALED:
359 case PIPE_FORMAT_R16_USCALED:
360 case PIPE_FORMAT_R16G16B16A16_SSCALED:
361 case PIPE_FORMAT_R16G16B16_SSCALED:
362 case PIPE_FORMAT_R16G16_SSCALED:
363 case PIPE_FORMAT_R16_SSCALED:
364 case PIPE_FORMAT_R8G8B8A8_UNORM:
365 case PIPE_FORMAT_R8G8B8_UNORM:
366 case PIPE_FORMAT_R8G8_UNORM:
367 case PIPE_FORMAT_R8_UNORM:
368 case PIPE_FORMAT_R8G8B8A8_SNORM:
369 case PIPE_FORMAT_R8G8B8_SNORM:
370 case PIPE_FORMAT_R8G8_SNORM:
371 case PIPE_FORMAT_R8_SNORM:
372 case PIPE_FORMAT_R8G8B8A8_USCALED:
373 case PIPE_FORMAT_R8G8B8_USCALED:
374 case PIPE_FORMAT_R8G8_USCALED:
375 case PIPE_FORMAT_R8_USCALED:
376 case PIPE_FORMAT_R8G8B8A8_SSCALED:
377 case PIPE_FORMAT_R8G8B8_SSCALED:
378 case PIPE_FORMAT_R8G8_SSCALED:
379 case PIPE_FORMAT_R8_SSCALED:
380 case PIPE_FORMAT_R10G10B10A2_UNORM:
381 case PIPE_FORMAT_B10G10R10A2_UNORM:
382 case PIPE_FORMAT_R10G10B10A2_SNORM:
383 case PIPE_FORMAT_B10G10R10A2_SNORM:
384 case PIPE_FORMAT_R10G10B10A2_USCALED:
385 case PIPE_FORMAT_B10G10R10A2_USCALED:
386 case PIPE_FORMAT_R10G10B10A2_SSCALED:
387 case PIPE_FORMAT_B10G10R10A2_SSCALED:
388 break;
389 default:
390 return FALSE;
391 }
392 }
393
394 if ((usage & PIPE_BIND_RENDER_TARGET) &&
395 !v3d_rt_format_supported(&screen->devinfo, format)) {
396 return FALSE;
397 }
398
399 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
400 !v3d_tex_format_supported(&screen->devinfo, format)) {
401 return FALSE;
402 }
403
404 if ((usage & PIPE_BIND_DEPTH_STENCIL) &&
405 !(format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
406 format == PIPE_FORMAT_X8Z24_UNORM ||
407 format == PIPE_FORMAT_Z16_UNORM ||
408 format == PIPE_FORMAT_Z32_FLOAT ||
409 format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT)) {
410 return FALSE;
411 }
412
413 if ((usage & PIPE_BIND_INDEX_BUFFER) &&
414 !(format == PIPE_FORMAT_I8_UINT ||
415 format == PIPE_FORMAT_I16_UINT ||
416 format == PIPE_FORMAT_I32_UINT)) {
417 return FALSE;
418 }
419
420 return TRUE;
421 }
422
/* Reinterprets a pointer-sized key as an unsigned integer. */
#define PTR_TO_UINT(x) ((unsigned)((intptr_t)(x)))

/**
 * Hash callback for the bo_handles table: the integer value carried in the
 * key pointer is used directly as the hash.
 */
static unsigned handle_hash(void *key)
{
        const unsigned value = PTR_TO_UINT(key);

        return value;
}

/**
 * Compare callback for the bo_handles table.
 *
 * @return 0 when both keys carry the same integer value, 1 otherwise.
 */
static int handle_compare(void *key1, void *key2)
{
        const unsigned lhs = PTR_TO_UINT(key1);
        const unsigned rhs = PTR_TO_UINT(key2);

        return (lhs == rhs) ? 0 : 1;
}
434
435 static bool
436 v3d_get_device_info(struct v3d_screen *screen)
437 {
438 struct drm_v3d_get_param ident0 = {
439 .param = DRM_V3D_PARAM_V3D_CORE0_IDENT0,
440 };
441 struct drm_v3d_get_param ident1 = {
442 .param = DRM_V3D_PARAM_V3D_CORE0_IDENT1,
443 };
444 int ret;
445
446 ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &ident0);
447 if (ret != 0) {
448 fprintf(stderr, "Couldn't get V3D core IDENT0: %s\n",
449 strerror(errno));
450 return false;
451 }
452 ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &ident1);
453 if (ret != 0) {
454 fprintf(stderr, "Couldn't get V3D core IDENT1: %s\n",
455 strerror(errno));
456 return false;
457 }
458
459 uint32_t major = (ident0.value >> 24) & 0xff;
460 uint32_t minor = (ident1.value >> 0) & 0xf;
461 screen->devinfo.ver = major * 10 + minor;
462
463 screen->devinfo.vpm_size = (ident1.value >> 28 & 0xf) * 8192;
464
465 switch (screen->devinfo.ver) {
466 case 33:
467 case 41:
468 case 42:
469 break;
470 default:
471 fprintf(stderr,
472 "V3D %d.%d not supported by this version of Mesa.\n",
473 screen->devinfo.ver / 10,
474 screen->devinfo.ver % 10);
475 return false;
476 }
477
478 return true;
479 }
480
481 static const void *
482 v3d_screen_get_compiler_options(struct pipe_screen *pscreen,
483 enum pipe_shader_ir ir, unsigned shader)
484 {
485 return &v3d_nir_options;
486 }
487
488 struct pipe_screen *
489 v3d_screen_create(int fd, struct renderonly *ro)
490 {
491 struct v3d_screen *screen = rzalloc(NULL, struct v3d_screen);
492 struct pipe_screen *pscreen;
493
494 pscreen = &screen->base;
495
496 pscreen->destroy = v3d_screen_destroy;
497 pscreen->get_param = v3d_screen_get_param;
498 pscreen->get_paramf = v3d_screen_get_paramf;
499 pscreen->get_shader_param = v3d_screen_get_shader_param;
500 pscreen->context_create = v3d_context_create;
501 pscreen->is_format_supported = v3d_screen_is_format_supported;
502
503 screen->fd = fd;
504 if (ro) {
505 screen->ro = renderonly_dup(ro);
506 if (!screen->ro) {
507 fprintf(stderr, "Failed to dup renderonly object\n");
508 ralloc_free(screen);
509 return NULL;
510 }
511 }
512 list_inithead(&screen->bo_cache.time_list);
513 (void)mtx_init(&screen->bo_handles_mutex, mtx_plain);
514 screen->bo_handles = util_hash_table_create(handle_hash, handle_compare);
515
516 #if defined(USE_V3D_SIMULATOR)
517 v3d_simulator_init(screen);
518 #endif
519
520 if (!v3d_get_device_info(screen))
521 goto fail;
522
523 slab_create_parent(&screen->transfer_pool, sizeof(struct v3d_transfer), 16);
524
525 v3d_fence_init(screen);
526
527 v3d_process_debug_variable();
528
529 v3d_resource_screen_init(pscreen);
530
531 screen->compiler = v3d_compiler_init(&screen->devinfo);
532
533 pscreen->get_name = v3d_screen_get_name;
534 pscreen->get_vendor = v3d_screen_get_vendor;
535 pscreen->get_device_vendor = v3d_screen_get_vendor;
536 pscreen->get_compiler_options = v3d_screen_get_compiler_options;
537
538 return pscreen;
539
540 fail:
541 close(fd);
542 ralloc_free(pscreen);
543 return NULL;
544 }