v3d: Add SSBO/atomic counters support.
[mesa.git] / src / gallium / drivers / v3d / v3d_screen.c
1 /*
2 * Copyright © 2014-2017 Broadcom
3 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22 * IN THE SOFTWARE.
23 */
24
25 #include "util/os_misc.h"
26 #include "pipe/p_defines.h"
27 #include "pipe/p_screen.h"
28 #include "pipe/p_state.h"
29
30 #include "util/u_debug.h"
31 #include "util/u_memory.h"
32 #include "util/u_format.h"
33 #include "util/u_hash_table.h"
34 #include "util/u_screen.h"
35 #include "util/u_transfer_helper.h"
36 #include "util/ralloc.h"
37
38 #include <xf86drm.h>
39 #include "v3d_screen.h"
40 #include "v3d_context.h"
41 #include "v3d_resource.h"
42 #include "compiler/v3d_compiler.h"
43
44 static const char *
45 v3d_screen_get_name(struct pipe_screen *pscreen)
46 {
47 struct v3d_screen *screen = v3d_screen(pscreen);
48
49 if (!screen->name) {
50 screen->name = ralloc_asprintf(screen,
51 "V3D %d.%d",
52 screen->devinfo.ver / 10,
53 screen->devinfo.ver % 10);
54 }
55
56 return screen->name;
57 }
58
/**
 * Returns the vendor string for this driver.  The screen argument is not
 * consulted; the answer is a constant.
 */
static const char *
v3d_screen_get_vendor(struct pipe_screen *pscreen)
{
        static const char vendor_name[] = "Broadcom";

        (void)pscreen;

        return vendor_name;
}
64
65 static void
66 v3d_screen_destroy(struct pipe_screen *pscreen)
67 {
68 struct v3d_screen *screen = v3d_screen(pscreen);
69
70 util_hash_table_destroy(screen->bo_handles);
71 v3d_bufmgr_destroy(pscreen);
72 slab_destroy_parent(&screen->transfer_pool);
73
74 if (using_v3d_simulator)
75 v3d_simulator_destroy(screen);
76
77 v3d_compiler_free(screen->compiler);
78 u_transfer_helper_destroy(pscreen->transfer_helper);
79
80 close(screen->fd);
81 ralloc_free(pscreen);
82 }
83
84 static bool
85 v3d_has_feature(struct v3d_screen *screen, enum drm_v3d_param feature)
86 {
87 struct drm_v3d_get_param p = {
88 .param = feature,
89 };
90 int ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &p);
91
92 if (ret != 0)
93 return false;
94
95 return p.value;
96 }
97
98 static int
99 v3d_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
100 {
101 struct v3d_screen *screen = v3d_screen(pscreen);
102
103 switch (param) {
104 /* Supported features (boolean caps). */
105 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
106 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
107 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
108 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
109 case PIPE_CAP_NPOT_TEXTURES:
110 case PIPE_CAP_SHAREABLE_SHADERS:
111 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
112 case PIPE_CAP_TEXTURE_MULTISAMPLE:
113 case PIPE_CAP_TEXTURE_SWIZZLE:
114 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
115 case PIPE_CAP_START_INSTANCE:
116 case PIPE_CAP_TGSI_INSTANCEID:
117 case PIPE_CAP_SM3:
118 case PIPE_CAP_TEXTURE_QUERY_LOD:
119 case PIPE_CAP_PRIMITIVE_RESTART:
120 case PIPE_CAP_OCCLUSION_QUERY:
121 case PIPE_CAP_POINT_SPRITE:
122 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
123 case PIPE_CAP_COMPUTE:
124 case PIPE_CAP_DRAW_INDIRECT:
125 case PIPE_CAP_MULTI_DRAW_INDIRECT:
126 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
127 case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
128 case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:
129 case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
130 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
131 case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
132 return 1;
133
134 case PIPE_CAP_GENERATE_MIPMAP:
135 return v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_TFU);
136
137 case PIPE_CAP_INDEP_BLEND_ENABLE:
138 return screen->devinfo.ver >= 40;
139
140 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
141 return 256;
142
143 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
144 if (screen->devinfo.ver < 40)
145 return 0;
146 return 4;
147
148 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
149 return 4;
150
151 case PIPE_CAP_GLSL_FEATURE_LEVEL:
152 return 330;
153
154 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
155 return 140;
156
157 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
158 return 1;
159 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
160 return 0;
161 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
162 if (screen->devinfo.ver >= 40)
163 return 0;
164 else
165 return 1;
166 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
167 if (screen->devinfo.ver >= 40)
168 return 1;
169 else
170 return 0;
171
172 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
173 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
174 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
175 return 1;
176
177 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
178 return 4;
179
180 /* Texturing. */
181 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
182 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
183 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
184 return VC5_MAX_MIP_LEVELS;
185 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
186 return 2048;
187
188 /* Render targets. */
189 case PIPE_CAP_MAX_RENDER_TARGETS:
190 return 4;
191
192 case PIPE_CAP_VENDOR_ID:
193 return 0x14E4;
194 case PIPE_CAP_ACCELERATED:
195 return 1;
196 case PIPE_CAP_VIDEO_MEMORY: {
197 uint64_t system_memory;
198
199 if (!os_get_total_physical_memory(&system_memory))
200 return 0;
201
202 return (int)(system_memory >> 20);
203 }
204 case PIPE_CAP_UMA:
205 return 1;
206
207 default:
208 return u_pipe_screen_get_param_defaults(pscreen, param);
209 }
210 }
211
212 static float
213 v3d_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
214 {
215 switch (param) {
216 case PIPE_CAPF_MAX_LINE_WIDTH:
217 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
218 return 32;
219
220 case PIPE_CAPF_MAX_POINT_WIDTH:
221 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
222 return 512.0f;
223
224 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
225 return 0.0f;
226 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
227 return 16.0f;
228
229 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
230 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
231 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
232 return 0.0f;
233 default:
234 fprintf(stderr, "unknown paramf %d\n", param);
235 return 0;
236 }
237 }
238
239 static int
240 v3d_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
241 enum pipe_shader_cap param)
242 {
243 if (shader != PIPE_SHADER_VERTEX &&
244 shader != PIPE_SHADER_FRAGMENT) {
245 return 0;
246 }
247
248 /* this is probably not totally correct.. but it's a start: */
249 switch (param) {
250 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
251 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
252 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
253 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
254 return 16384;
255
256 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
257 return UINT_MAX;
258
259 case PIPE_SHADER_CAP_MAX_INPUTS:
260 if (shader == PIPE_SHADER_FRAGMENT)
261 return VC5_MAX_FS_INPUTS / 4;
262 else
263 return VC5_MAX_ATTRIBUTES;
264 case PIPE_SHADER_CAP_MAX_OUTPUTS:
265 if (shader == PIPE_SHADER_FRAGMENT)
266 return 4;
267 else
268 return VC5_MAX_FS_INPUTS / 4;
269 case PIPE_SHADER_CAP_MAX_TEMPS:
270 return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */
271 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
272 return 16 * 1024 * sizeof(float);
273 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
274 return 16;
275 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
276 return 0;
277 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
278 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
279 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
280 return 0;
281 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
282 return 1;
283 case PIPE_SHADER_CAP_SUBROUTINES:
284 return 0;
285 case PIPE_SHADER_CAP_INTEGERS:
286 return 1;
287 case PIPE_SHADER_CAP_FP16:
288 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
289 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
290 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
291 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
292 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
293 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
294 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
295 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
296 return 0;
297 case PIPE_SHADER_CAP_SCALAR_ISA:
298 return 1;
299 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
300 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
301 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
302 return VC5_MAX_TEXTURE_SAMPLERS;
303
304 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
305 return PIPE_MAX_SHADER_BUFFERS;
306
307 case PIPE_SHADER_CAP_PREFERRED_IR:
308 return PIPE_SHADER_IR_NIR;
309 case PIPE_SHADER_CAP_SUPPORTED_IRS:
310 return 0;
311 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
312 return 32;
313 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
314 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
315 return 0;
316 default:
317 fprintf(stderr, "unknown shader param %d\n", param);
318 return 0;
319 }
320 return 0;
321 }
322
323 static boolean
324 v3d_screen_is_format_supported(struct pipe_screen *pscreen,
325 enum pipe_format format,
326 enum pipe_texture_target target,
327 unsigned sample_count,
328 unsigned storage_sample_count,
329 unsigned usage)
330 {
331 struct v3d_screen *screen = v3d_screen(pscreen);
332
333 if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
334 return false;
335
336 if (sample_count > 1 && sample_count != VC5_MAX_SAMPLES)
337 return FALSE;
338
339 if (target >= PIPE_MAX_TEXTURE_TYPES) {
340 return FALSE;
341 }
342
343 if (usage & PIPE_BIND_VERTEX_BUFFER) {
344 switch (format) {
345 case PIPE_FORMAT_R32G32B32A32_FLOAT:
346 case PIPE_FORMAT_R32G32B32_FLOAT:
347 case PIPE_FORMAT_R32G32_FLOAT:
348 case PIPE_FORMAT_R32_FLOAT:
349 case PIPE_FORMAT_R32G32B32A32_SNORM:
350 case PIPE_FORMAT_R32G32B32_SNORM:
351 case PIPE_FORMAT_R32G32_SNORM:
352 case PIPE_FORMAT_R32_SNORM:
353 case PIPE_FORMAT_R32G32B32A32_SSCALED:
354 case PIPE_FORMAT_R32G32B32_SSCALED:
355 case PIPE_FORMAT_R32G32_SSCALED:
356 case PIPE_FORMAT_R32_SSCALED:
357 case PIPE_FORMAT_R16G16B16A16_UNORM:
358 case PIPE_FORMAT_R16G16B16_UNORM:
359 case PIPE_FORMAT_R16G16_UNORM:
360 case PIPE_FORMAT_R16_UNORM:
361 case PIPE_FORMAT_R16G16B16A16_SNORM:
362 case PIPE_FORMAT_R16G16B16_SNORM:
363 case PIPE_FORMAT_R16G16_SNORM:
364 case PIPE_FORMAT_R16_SNORM:
365 case PIPE_FORMAT_R16G16B16A16_USCALED:
366 case PIPE_FORMAT_R16G16B16_USCALED:
367 case PIPE_FORMAT_R16G16_USCALED:
368 case PIPE_FORMAT_R16_USCALED:
369 case PIPE_FORMAT_R16G16B16A16_SSCALED:
370 case PIPE_FORMAT_R16G16B16_SSCALED:
371 case PIPE_FORMAT_R16G16_SSCALED:
372 case PIPE_FORMAT_R16_SSCALED:
373 case PIPE_FORMAT_R8G8B8A8_UNORM:
374 case PIPE_FORMAT_R8G8B8_UNORM:
375 case PIPE_FORMAT_R8G8_UNORM:
376 case PIPE_FORMAT_R8_UNORM:
377 case PIPE_FORMAT_R8G8B8A8_SNORM:
378 case PIPE_FORMAT_R8G8B8_SNORM:
379 case PIPE_FORMAT_R8G8_SNORM:
380 case PIPE_FORMAT_R8_SNORM:
381 case PIPE_FORMAT_R8G8B8A8_USCALED:
382 case PIPE_FORMAT_R8G8B8_USCALED:
383 case PIPE_FORMAT_R8G8_USCALED:
384 case PIPE_FORMAT_R8_USCALED:
385 case PIPE_FORMAT_R8G8B8A8_SSCALED:
386 case PIPE_FORMAT_R8G8B8_SSCALED:
387 case PIPE_FORMAT_R8G8_SSCALED:
388 case PIPE_FORMAT_R8_SSCALED:
389 case PIPE_FORMAT_R10G10B10A2_UNORM:
390 case PIPE_FORMAT_B10G10R10A2_UNORM:
391 case PIPE_FORMAT_R10G10B10A2_SNORM:
392 case PIPE_FORMAT_B10G10R10A2_SNORM:
393 case PIPE_FORMAT_R10G10B10A2_USCALED:
394 case PIPE_FORMAT_B10G10R10A2_USCALED:
395 case PIPE_FORMAT_R10G10B10A2_SSCALED:
396 case PIPE_FORMAT_B10G10R10A2_SSCALED:
397 break;
398 default:
399 return FALSE;
400 }
401 }
402
403 /* FORMAT_NONE gets allowed for ARB_framebuffer_no_attachments's probe
404 * of FRAMEBUFFER_MAX_SAMPLES
405 */
406 if ((usage & PIPE_BIND_RENDER_TARGET) &&
407 format != PIPE_FORMAT_NONE &&
408 !v3d_rt_format_supported(&screen->devinfo, format)) {
409 return FALSE;
410 }
411
412 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
413 !v3d_tex_format_supported(&screen->devinfo, format)) {
414 return FALSE;
415 }
416
417 if ((usage & PIPE_BIND_DEPTH_STENCIL) &&
418 !(format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
419 format == PIPE_FORMAT_X8Z24_UNORM ||
420 format == PIPE_FORMAT_Z16_UNORM ||
421 format == PIPE_FORMAT_Z32_FLOAT ||
422 format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT)) {
423 return FALSE;
424 }
425
426 if ((usage & PIPE_BIND_INDEX_BUFFER) &&
427 !(format == PIPE_FORMAT_I8_UINT ||
428 format == PIPE_FORMAT_I16_UINT ||
429 format == PIPE_FORMAT_I32_UINT)) {
430 return FALSE;
431 }
432
433 return TRUE;
434 }
435
/* Converts a pointer-sized hash-table key to an unsigned value by going
 * through intptr_t.
 */
#define PTR_TO_UINT(ptr) ((unsigned)((intptr_t)(ptr)))

/** Hash callback: the key's integer value is used directly as the hash. */
static unsigned handle_hash(void *key)
{
        const unsigned hash = PTR_TO_UINT(key);

        return hash;
}

/**
 * Compare callback: returns 0 when both keys convert to the same unsigned
 * value and 1 otherwise.
 */
static int handle_compare(void *key1, void *key2)
{
        const unsigned lhs = PTR_TO_UINT(key1);
        const unsigned rhs = PTR_TO_UINT(key2);

        return lhs != rhs;
}
447
448 static bool
449 v3d_get_device_info(struct v3d_screen *screen)
450 {
451 struct drm_v3d_get_param ident0 = {
452 .param = DRM_V3D_PARAM_V3D_CORE0_IDENT0,
453 };
454 struct drm_v3d_get_param ident1 = {
455 .param = DRM_V3D_PARAM_V3D_CORE0_IDENT1,
456 };
457 int ret;
458
459 ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &ident0);
460 if (ret != 0) {
461 fprintf(stderr, "Couldn't get V3D core IDENT0: %s\n",
462 strerror(errno));
463 return false;
464 }
465 ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &ident1);
466 if (ret != 0) {
467 fprintf(stderr, "Couldn't get V3D core IDENT1: %s\n",
468 strerror(errno));
469 return false;
470 }
471
472 uint32_t major = (ident0.value >> 24) & 0xff;
473 uint32_t minor = (ident1.value >> 0) & 0xf;
474 screen->devinfo.ver = major * 10 + minor;
475
476 screen->devinfo.vpm_size = (ident1.value >> 28 & 0xf) * 8192;
477
478 switch (screen->devinfo.ver) {
479 case 33:
480 case 41:
481 case 42:
482 break;
483 default:
484 fprintf(stderr,
485 "V3D %d.%d not supported by this version of Mesa.\n",
486 screen->devinfo.ver / 10,
487 screen->devinfo.ver % 10);
488 return false;
489 }
490
491 return true;
492 }
493
494 static const void *
495 v3d_screen_get_compiler_options(struct pipe_screen *pscreen,
496 enum pipe_shader_ir ir, unsigned shader)
497 {
498 return &v3d_nir_options;
499 }
500
501 struct pipe_screen *
502 v3d_screen_create(int fd, struct renderonly *ro)
503 {
504 struct v3d_screen *screen = rzalloc(NULL, struct v3d_screen);
505 struct pipe_screen *pscreen;
506
507 pscreen = &screen->base;
508
509 pscreen->destroy = v3d_screen_destroy;
510 pscreen->get_param = v3d_screen_get_param;
511 pscreen->get_paramf = v3d_screen_get_paramf;
512 pscreen->get_shader_param = v3d_screen_get_shader_param;
513 pscreen->context_create = v3d_context_create;
514 pscreen->is_format_supported = v3d_screen_is_format_supported;
515
516 screen->fd = fd;
517 if (ro) {
518 screen->ro = renderonly_dup(ro);
519 if (!screen->ro) {
520 fprintf(stderr, "Failed to dup renderonly object\n");
521 ralloc_free(screen);
522 return NULL;
523 }
524 }
525 list_inithead(&screen->bo_cache.time_list);
526 (void)mtx_init(&screen->bo_handles_mutex, mtx_plain);
527 screen->bo_handles = util_hash_table_create(handle_hash, handle_compare);
528
529 #if defined(USE_V3D_SIMULATOR)
530 v3d_simulator_init(screen);
531 #endif
532
533 if (!v3d_get_device_info(screen))
534 goto fail;
535
536 slab_create_parent(&screen->transfer_pool, sizeof(struct v3d_transfer), 16);
537
538 v3d_fence_init(screen);
539
540 v3d_process_debug_variable();
541
542 v3d_resource_screen_init(pscreen);
543
544 screen->compiler = v3d_compiler_init(&screen->devinfo);
545
546 pscreen->get_name = v3d_screen_get_name;
547 pscreen->get_vendor = v3d_screen_get_vendor;
548 pscreen->get_device_vendor = v3d_screen_get_vendor;
549 pscreen->get_compiler_options = v3d_screen_get_compiler_options;
550
551 return pscreen;
552
553 fail:
554 close(fd);
555 ralloc_free(pscreen);
556 return NULL;
557 }