v3d: Enable GL_ARB_texture_gather on V3D 4.x.
[mesa.git] / src / gallium / drivers / v3d / v3d_screen.c
1 /*
2 * Copyright © 2014-2017 Broadcom
3 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22 * IN THE SOFTWARE.
23 */
24
#include "util/os_misc.h"
#include "pipe/p_defines.h"
#include "pipe/p_screen.h"
#include "pipe/p_state.h"

#include "util/u_debug.h"
#include "util/u_memory.h"
#include "util/u_format.h"
#include "util/u_hash_table.h"
#include "util/u_screen.h"
#include "util/u_transfer_helper.h"
#include "util/ralloc.h"

#include <stdlib.h>
#include <xf86drm.h>
#include "v3d_screen.h"
#include "v3d_context.h"
#include "v3d_resource.h"
#include "compiler/v3d_compiler.h"
43
44 static const char *
45 v3d_screen_get_name(struct pipe_screen *pscreen)
46 {
47 struct v3d_screen *screen = v3d_screen(pscreen);
48
49 if (!screen->name) {
50 screen->name = ralloc_asprintf(screen,
51 "V3D %d.%d",
52 screen->devinfo.ver / 10,
53 screen->devinfo.ver % 10);
54 }
55
56 return screen->name;
57 }
58
59 static const char *
60 v3d_screen_get_vendor(struct pipe_screen *pscreen)
61 {
62 return "Broadcom";
63 }
64
65 static void
66 v3d_screen_destroy(struct pipe_screen *pscreen)
67 {
68 struct v3d_screen *screen = v3d_screen(pscreen);
69
70 util_hash_table_destroy(screen->bo_handles);
71 v3d_bufmgr_destroy(pscreen);
72 slab_destroy_parent(&screen->transfer_pool);
73
74 if (using_v3d_simulator)
75 v3d_simulator_destroy(screen);
76
77 v3d_compiler_free(screen->compiler);
78 u_transfer_helper_destroy(pscreen->transfer_helper);
79
80 close(screen->fd);
81 ralloc_free(pscreen);
82 }
83
84 static bool
85 v3d_has_feature(struct v3d_screen *screen, enum drm_v3d_param feature)
86 {
87 struct drm_v3d_get_param p = {
88 .param = feature,
89 };
90 int ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &p);
91
92 if (ret != 0)
93 return false;
94
95 return p.value;
96 }
97
98 static int
99 v3d_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
100 {
101 struct v3d_screen *screen = v3d_screen(pscreen);
102
103 switch (param) {
104 /* Supported features (boolean caps). */
105 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
106 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
107 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
108 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
109 case PIPE_CAP_NPOT_TEXTURES:
110 case PIPE_CAP_SHAREABLE_SHADERS:
111 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
112 case PIPE_CAP_TEXTURE_MULTISAMPLE:
113 case PIPE_CAP_TEXTURE_SWIZZLE:
114 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
115 case PIPE_CAP_START_INSTANCE:
116 case PIPE_CAP_TGSI_INSTANCEID:
117 case PIPE_CAP_SM3:
118 case PIPE_CAP_TEXTURE_QUERY_LOD:
119 case PIPE_CAP_PRIMITIVE_RESTART:
120 case PIPE_CAP_OCCLUSION_QUERY:
121 case PIPE_CAP_POINT_SPRITE:
122 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
123 case PIPE_CAP_COMPUTE:
124 case PIPE_CAP_DRAW_INDIRECT:
125 case PIPE_CAP_MULTI_DRAW_INDIRECT:
126 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
127 case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
128 case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:
129 case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
130 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
131 return 1;
132
133 case PIPE_CAP_GENERATE_MIPMAP:
134 return v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_TFU);
135
136 case PIPE_CAP_INDEP_BLEND_ENABLE:
137 return screen->devinfo.ver >= 40;
138
139 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
140 return 256;
141
142 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
143 if (screen->devinfo.ver < 40)
144 return 0;
145 return 4;
146
147 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
148 return 4;
149
150 case PIPE_CAP_GLSL_FEATURE_LEVEL:
151 return 400;
152
153 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
154 return 140;
155
156 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
157 return 1;
158 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
159 return 0;
160 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
161 if (screen->devinfo.ver >= 40)
162 return 0;
163 else
164 return 1;
165 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
166 if (screen->devinfo.ver >= 40)
167 return 1;
168 else
169 return 0;
170
171 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
172 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
173 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
174 return 1;
175
176 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
177 return 4;
178
179 /* Texturing. */
180 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
181 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
182 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
183 return VC5_MAX_MIP_LEVELS;
184 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
185 return 2048;
186
187 /* Render targets. */
188 case PIPE_CAP_MAX_RENDER_TARGETS:
189 return 4;
190
191 case PIPE_CAP_VENDOR_ID:
192 return 0x14E4;
193 case PIPE_CAP_ACCELERATED:
194 return 1;
195 case PIPE_CAP_VIDEO_MEMORY: {
196 uint64_t system_memory;
197
198 if (!os_get_total_physical_memory(&system_memory))
199 return 0;
200
201 return (int)(system_memory >> 20);
202 }
203 case PIPE_CAP_UMA:
204 return 1;
205
206 default:
207 return u_pipe_screen_get_param_defaults(pscreen, param);
208 }
209 }
210
211 static float
212 v3d_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
213 {
214 switch (param) {
215 case PIPE_CAPF_MAX_LINE_WIDTH:
216 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
217 return 32;
218
219 case PIPE_CAPF_MAX_POINT_WIDTH:
220 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
221 return 512.0f;
222
223 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
224 return 0.0f;
225 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
226 return 16.0f;
227
228 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
229 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
230 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
231 return 0.0f;
232 default:
233 fprintf(stderr, "unknown paramf %d\n", param);
234 return 0;
235 }
236 }
237
238 static int
239 v3d_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
240 enum pipe_shader_cap param)
241 {
242 if (shader != PIPE_SHADER_VERTEX &&
243 shader != PIPE_SHADER_FRAGMENT) {
244 return 0;
245 }
246
247 /* this is probably not totally correct.. but it's a start: */
248 switch (param) {
249 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
250 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
251 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
252 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
253 return 16384;
254
255 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
256 return UINT_MAX;
257
258 case PIPE_SHADER_CAP_MAX_INPUTS:
259 if (shader == PIPE_SHADER_FRAGMENT)
260 return VC5_MAX_FS_INPUTS / 4;
261 else
262 return VC5_MAX_ATTRIBUTES;
263 case PIPE_SHADER_CAP_MAX_OUTPUTS:
264 if (shader == PIPE_SHADER_FRAGMENT)
265 return 4;
266 else
267 return VC5_MAX_FS_INPUTS / 4;
268 case PIPE_SHADER_CAP_MAX_TEMPS:
269 return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */
270 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
271 return 16 * 1024 * sizeof(float);
272 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
273 return 16;
274 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
275 return 0;
276 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
277 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
278 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
279 return 0;
280 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
281 return 1;
282 case PIPE_SHADER_CAP_SUBROUTINES:
283 return 0;
284 case PIPE_SHADER_CAP_INTEGERS:
285 return 1;
286 case PIPE_SHADER_CAP_FP16:
287 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
288 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
289 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
290 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
291 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
292 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
293 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
294 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
295 return 0;
296 case PIPE_SHADER_CAP_SCALAR_ISA:
297 return 1;
298 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
299 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
300 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
301 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
302 return VC5_MAX_TEXTURE_SAMPLERS;
303 case PIPE_SHADER_CAP_PREFERRED_IR:
304 return PIPE_SHADER_IR_NIR;
305 case PIPE_SHADER_CAP_SUPPORTED_IRS:
306 return 0;
307 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
308 return 32;
309 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
310 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
311 return 0;
312 default:
313 fprintf(stderr, "unknown shader param %d\n", param);
314 return 0;
315 }
316 return 0;
317 }
318
319 static boolean
320 v3d_screen_is_format_supported(struct pipe_screen *pscreen,
321 enum pipe_format format,
322 enum pipe_texture_target target,
323 unsigned sample_count,
324 unsigned storage_sample_count,
325 unsigned usage)
326 {
327 struct v3d_screen *screen = v3d_screen(pscreen);
328
329 if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
330 return false;
331
332 if (sample_count > 1 && sample_count != VC5_MAX_SAMPLES)
333 return FALSE;
334
335 if (target >= PIPE_MAX_TEXTURE_TYPES) {
336 return FALSE;
337 }
338
339 if (usage & PIPE_BIND_VERTEX_BUFFER) {
340 switch (format) {
341 case PIPE_FORMAT_R32G32B32A32_FLOAT:
342 case PIPE_FORMAT_R32G32B32_FLOAT:
343 case PIPE_FORMAT_R32G32_FLOAT:
344 case PIPE_FORMAT_R32_FLOAT:
345 case PIPE_FORMAT_R32G32B32A32_SNORM:
346 case PIPE_FORMAT_R32G32B32_SNORM:
347 case PIPE_FORMAT_R32G32_SNORM:
348 case PIPE_FORMAT_R32_SNORM:
349 case PIPE_FORMAT_R32G32B32A32_SSCALED:
350 case PIPE_FORMAT_R32G32B32_SSCALED:
351 case PIPE_FORMAT_R32G32_SSCALED:
352 case PIPE_FORMAT_R32_SSCALED:
353 case PIPE_FORMAT_R16G16B16A16_UNORM:
354 case PIPE_FORMAT_R16G16B16_UNORM:
355 case PIPE_FORMAT_R16G16_UNORM:
356 case PIPE_FORMAT_R16_UNORM:
357 case PIPE_FORMAT_R16G16B16A16_SNORM:
358 case PIPE_FORMAT_R16G16B16_SNORM:
359 case PIPE_FORMAT_R16G16_SNORM:
360 case PIPE_FORMAT_R16_SNORM:
361 case PIPE_FORMAT_R16G16B16A16_USCALED:
362 case PIPE_FORMAT_R16G16B16_USCALED:
363 case PIPE_FORMAT_R16G16_USCALED:
364 case PIPE_FORMAT_R16_USCALED:
365 case PIPE_FORMAT_R16G16B16A16_SSCALED:
366 case PIPE_FORMAT_R16G16B16_SSCALED:
367 case PIPE_FORMAT_R16G16_SSCALED:
368 case PIPE_FORMAT_R16_SSCALED:
369 case PIPE_FORMAT_R8G8B8A8_UNORM:
370 case PIPE_FORMAT_R8G8B8_UNORM:
371 case PIPE_FORMAT_R8G8_UNORM:
372 case PIPE_FORMAT_R8_UNORM:
373 case PIPE_FORMAT_R8G8B8A8_SNORM:
374 case PIPE_FORMAT_R8G8B8_SNORM:
375 case PIPE_FORMAT_R8G8_SNORM:
376 case PIPE_FORMAT_R8_SNORM:
377 case PIPE_FORMAT_R8G8B8A8_USCALED:
378 case PIPE_FORMAT_R8G8B8_USCALED:
379 case PIPE_FORMAT_R8G8_USCALED:
380 case PIPE_FORMAT_R8_USCALED:
381 case PIPE_FORMAT_R8G8B8A8_SSCALED:
382 case PIPE_FORMAT_R8G8B8_SSCALED:
383 case PIPE_FORMAT_R8G8_SSCALED:
384 case PIPE_FORMAT_R8_SSCALED:
385 case PIPE_FORMAT_R10G10B10A2_UNORM:
386 case PIPE_FORMAT_B10G10R10A2_UNORM:
387 case PIPE_FORMAT_R10G10B10A2_SNORM:
388 case PIPE_FORMAT_B10G10R10A2_SNORM:
389 case PIPE_FORMAT_R10G10B10A2_USCALED:
390 case PIPE_FORMAT_B10G10R10A2_USCALED:
391 case PIPE_FORMAT_R10G10B10A2_SSCALED:
392 case PIPE_FORMAT_B10G10R10A2_SSCALED:
393 break;
394 default:
395 return FALSE;
396 }
397 }
398
399 if ((usage & PIPE_BIND_RENDER_TARGET) &&
400 !v3d_rt_format_supported(&screen->devinfo, format)) {
401 return FALSE;
402 }
403
404 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
405 !v3d_tex_format_supported(&screen->devinfo, format)) {
406 return FALSE;
407 }
408
409 if ((usage & PIPE_BIND_DEPTH_STENCIL) &&
410 !(format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
411 format == PIPE_FORMAT_X8Z24_UNORM ||
412 format == PIPE_FORMAT_Z16_UNORM ||
413 format == PIPE_FORMAT_Z32_FLOAT ||
414 format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT)) {
415 return FALSE;
416 }
417
418 if ((usage & PIPE_BIND_INDEX_BUFFER) &&
419 !(format == PIPE_FORMAT_I8_UINT ||
420 format == PIPE_FORMAT_I16_UINT ||
421 format == PIPE_FORMAT_I32_UINT)) {
422 return FALSE;
423 }
424
425 return TRUE;
426 }
427
428 #define PTR_TO_UINT(x) ((unsigned)((intptr_t)(x)))
429
430 static unsigned handle_hash(void *key)
431 {
432 return PTR_TO_UINT(key);
433 }
434
435 static int handle_compare(void *key1, void *key2)
436 {
437 return PTR_TO_UINT(key1) != PTR_TO_UINT(key2);
438 }
439
440 static bool
441 v3d_get_device_info(struct v3d_screen *screen)
442 {
443 struct drm_v3d_get_param ident0 = {
444 .param = DRM_V3D_PARAM_V3D_CORE0_IDENT0,
445 };
446 struct drm_v3d_get_param ident1 = {
447 .param = DRM_V3D_PARAM_V3D_CORE0_IDENT1,
448 };
449 int ret;
450
451 ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &ident0);
452 if (ret != 0) {
453 fprintf(stderr, "Couldn't get V3D core IDENT0: %s\n",
454 strerror(errno));
455 return false;
456 }
457 ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &ident1);
458 if (ret != 0) {
459 fprintf(stderr, "Couldn't get V3D core IDENT1: %s\n",
460 strerror(errno));
461 return false;
462 }
463
464 uint32_t major = (ident0.value >> 24) & 0xff;
465 uint32_t minor = (ident1.value >> 0) & 0xf;
466 screen->devinfo.ver = major * 10 + minor;
467
468 screen->devinfo.vpm_size = (ident1.value >> 28 & 0xf) * 8192;
469
470 switch (screen->devinfo.ver) {
471 case 33:
472 case 41:
473 case 42:
474 break;
475 default:
476 fprintf(stderr,
477 "V3D %d.%d not supported by this version of Mesa.\n",
478 screen->devinfo.ver / 10,
479 screen->devinfo.ver % 10);
480 return false;
481 }
482
483 return true;
484 }
485
486 static const void *
487 v3d_screen_get_compiler_options(struct pipe_screen *pscreen,
488 enum pipe_shader_ir ir, unsigned shader)
489 {
490 return &v3d_nir_options;
491 }
492
493 struct pipe_screen *
494 v3d_screen_create(int fd, struct renderonly *ro)
495 {
496 struct v3d_screen *screen = rzalloc(NULL, struct v3d_screen);
497 struct pipe_screen *pscreen;
498
499 pscreen = &screen->base;
500
501 pscreen->destroy = v3d_screen_destroy;
502 pscreen->get_param = v3d_screen_get_param;
503 pscreen->get_paramf = v3d_screen_get_paramf;
504 pscreen->get_shader_param = v3d_screen_get_shader_param;
505 pscreen->context_create = v3d_context_create;
506 pscreen->is_format_supported = v3d_screen_is_format_supported;
507
508 screen->fd = fd;
509 if (ro) {
510 screen->ro = renderonly_dup(ro);
511 if (!screen->ro) {
512 fprintf(stderr, "Failed to dup renderonly object\n");
513 ralloc_free(screen);
514 return NULL;
515 }
516 }
517 list_inithead(&screen->bo_cache.time_list);
518 (void)mtx_init(&screen->bo_handles_mutex, mtx_plain);
519 screen->bo_handles = util_hash_table_create(handle_hash, handle_compare);
520
521 #if defined(USE_V3D_SIMULATOR)
522 v3d_simulator_init(screen);
523 #endif
524
525 if (!v3d_get_device_info(screen))
526 goto fail;
527
528 slab_create_parent(&screen->transfer_pool, sizeof(struct v3d_transfer), 16);
529
530 v3d_fence_init(screen);
531
532 v3d_process_debug_variable();
533
534 v3d_resource_screen_init(pscreen);
535
536 screen->compiler = v3d_compiler_init(&screen->devinfo);
537
538 pscreen->get_name = v3d_screen_get_name;
539 pscreen->get_vendor = v3d_screen_get_vendor;
540 pscreen->get_device_vendor = v3d_screen_get_vendor;
541 pscreen->get_compiler_options = v3d_screen_get_compiler_options;
542
543 return pscreen;
544
545 fail:
546 close(fd);
547 ralloc_free(pscreen);
548 return NULL;
549 }