2 * Copyright (c) 2017-2019 Lima Project
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
27 #include "util/ralloc.h"
28 #include "util/u_debug.h"
29 #include "util/u_screen.h"
30 #include "renderonly/renderonly.h"
32 #include "drm-uapi/drm_fourcc.h"
33 #include "drm-uapi/lima_drm.h"
35 #include "lima_screen.h"
36 #include "lima_context.h"
37 #include "lima_resource.h"
38 #include "lima_program.h"
40 #include "lima_fence.h"
41 #include "lima_format.h"
42 #include "ir/lima_ir.h"
/* Global tunables. Both are assigned from environment options in
 * lima_screen_parse_env(). A non-zero lima_plb_max_blk is copied into
 * screen->plb_max_blk by lima_screen_set_plb_max_blk(). */
46 int lima_plb_max_blk
= 0;
/* Zero means "not set by the user": lima_screen_create() then derives a
 * value from the total physical memory and applies a lower limit. */
47 int lima_plb_pp_stream_cache_size
= 0;
/* Installed as screen->base.destroy in lima_screen_create().
 * The visible statements destroy the transfer slab parent pool, drop the
 * reference on pp_buffer when one exists, and shut down the BO cache and
 * the BO table. */
50 lima_screen_destroy(struct pipe_screen
*pscreen
)
52 struct lima_screen
*screen
= lima_screen(pscreen
);
54 slab_destroy_parent(&screen
->transfer_pool
);
/* pp_buffer may be unset, hence the guard before unreferencing it. */
59 if (screen
->pp_buffer
)
60 lima_bo_unreference(screen
->pp_buffer
);
62 lima_bo_cache_fini(screen
);
63 lima_bo_table_fini(screen
);
/* Installed as screen->base.get_name in lima_screen_create().
 * Selects on screen->gpu_type, with cases for the Mali400 and Mali450
 * GPU IDs (the same two IDs lima_screen_query_info() stores). */
68 lima_screen_get_name(struct pipe_screen
*pscreen
)
70 struct lima_screen
*screen
= lima_screen(pscreen
);
72 switch (screen
->gpu_type
) {
73 case DRM_LIMA_PARAM_GPU_ID_MALI400
:
75 case DRM_LIMA_PARAM_GPU_ID_MALI450
:
/* Installed as screen->base.get_vendor in lima_screen_create(). */
83 lima_screen_get_vendor(struct pipe_screen
*pscreen
)
/* Installed as screen->base.get_device_vendor in lima_screen_create(). */
89 lima_screen_get_device_vendor(struct pipe_screen
*pscreen
)
/* Installed as screen->base.get_param in lima_screen_create().
 * Answers integer capability queries for the caps listed below.
 * Texture limits are derived from LIMA_MAX_MIP_LEVELS: the 2D size cap is
 * 1 << (LIMA_MAX_MIP_LEVELS - 1), and the 3D/cube level caps are
 * LIMA_MAX_MIP_LEVELS itself. The final return defers to
 * u_pipe_screen_get_param_defaults(). */
95 lima_screen_get_param(struct pipe_screen
*pscreen
, enum pipe_cap param
)
98 case PIPE_CAP_NPOT_TEXTURES
:
99 case PIPE_CAP_BLEND_EQUATION_SEPARATE
:
100 case PIPE_CAP_ACCELERATED
:
102 case PIPE_CAP_NATIVE_FENCE_FD
:
103 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD
:
106 /* Unimplemented, but for exporting OpenGL 2.0 */
107 case PIPE_CAP_OCCLUSION_QUERY
:
108 case PIPE_CAP_POINT_SPRITE
:
111 /* not clear supported */
112 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT
:
113 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT
:
114 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER
:
115 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER
:
118 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL
:
119 case PIPE_CAP_TGSI_FS_POINT_IS_SYSVAL
:
120 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL
:
123 case PIPE_CAP_MAX_TEXTURE_2D_SIZE
:
124 return 1 << (LIMA_MAX_MIP_LEVELS
- 1);
125 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS
:
126 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS
:
127 return LIMA_MAX_MIP_LEVELS
;
129 case PIPE_CAP_VENDOR_ID
:
132 case PIPE_CAP_VIDEO_MEMORY
:
135 case PIPE_CAP_PCI_GROUP
:
136 case PIPE_CAP_PCI_BUS
:
137 case PIPE_CAP_PCI_DEVICE
:
138 case PIPE_CAP_PCI_FUNCTION
:
141 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER
:
144 case PIPE_CAP_ALPHA_TEST
:
145 case PIPE_CAP_FLATSHADE
:
146 case PIPE_CAP_TWO_SIDED_COLOR
:
147 case PIPE_CAP_CLIP_PLANES
:
150 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES
:
154 return u_pipe_screen_get_param_defaults(pscreen
, param
);
/* Installed as screen->base.get_paramf in lima_screen_create().
 * Handles the float capability queries for line width, point width,
 * texture anisotropy and texture LOD bias. */
159 lima_screen_get_paramf(struct pipe_screen
*pscreen
, enum pipe_capf param
)
162 case PIPE_CAPF_MAX_LINE_WIDTH
:
163 case PIPE_CAPF_MAX_LINE_WIDTH_AA
:
164 case PIPE_CAPF_MAX_POINT_WIDTH
:
165 case PIPE_CAPF_MAX_POINT_WIDTH_AA
:
167 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY
:
169 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS
:
/* Shader capability values for the vertex stage; called from
 * lima_screen_get_shader_param() for PIPE_SHADER_VERTEX.
 * Visible answers: 16384 for the four instruction-count caps, 16 inputs
 * (attributes), LIMA_MAX_VARYING_NUM outputs, a constant buffer of
 * 16 * 1024 floats (returned in bytes), NIR as the preferred IR and
 * 256 temps. Several values carry "need investigate" markers, i.e. they
 * are placeholders rather than verified hardware limits. */
178 get_vertex_shader_param(struct lima_screen
*screen
,
179 enum pipe_shader_cap param
)
182 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
183 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
184 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
185 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
186 return 16384; /* need investigate */
188 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
191 case PIPE_SHADER_CAP_MAX_INPUTS
:
192 return 16; /* attributes */
194 case PIPE_SHADER_CAP_MAX_OUTPUTS
:
195 return LIMA_MAX_VARYING_NUM
; /* varying */
197 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE
:
198 return 16 * 1024 * sizeof(float);
200 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
203 case PIPE_SHADER_CAP_PREFERRED_IR
:
204 return PIPE_SHADER_IR_NIR
;
206 case PIPE_SHADER_CAP_MAX_TEMPS
:
207 return 256; /* need investigate */
209 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT
:
/* Shader capability values for the fragment stage; called from
 * lima_screen_get_shader_param() for PIPE_SHADER_FRAGMENT.
 * Visible answers: 16384 for the four instruction-count caps,
 * LIMA_MAX_VARYING_NUM - 1 inputs (one varying slot is taken by
 * gl_Position), a constant buffer of 16 * 1024 floats (returned in
 * bytes), 16 texture samplers, NIR as the preferred IR and 256 temps.
 * Values marked "need investigate" are placeholders. */
218 get_fragment_shader_param(struct lima_screen
*screen
,
219 enum pipe_shader_cap param
)
222 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
223 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
224 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
225 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
226 return 16384; /* need investigate */
228 case PIPE_SHADER_CAP_MAX_INPUTS
:
229 return LIMA_MAX_VARYING_NUM
- 1; /* varying, minus gl_Position */
231 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
234 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE
:
235 return 16 * 1024 * sizeof(float);
237 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
240 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
241 return 16; /* need investigate */
243 case PIPE_SHADER_CAP_PREFERRED_IR
:
244 return PIPE_SHADER_IR_NIR
;
246 case PIPE_SHADER_CAP_MAX_TEMPS
:
247 return 256; /* need investigate */
249 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
250 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
253 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
254 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
257 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT
:
/* Installed as screen->base.get_shader_param in lima_screen_create().
 * Dispatches on the shader stage: fragment queries go to
 * get_fragment_shader_param(), vertex queries to
 * get_vertex_shader_param(). */
266 lima_screen_get_shader_param(struct pipe_screen
*pscreen
,
267 enum pipe_shader_type shader
,
268 enum pipe_shader_cap param
)
270 struct lima_screen
*screen
= lima_screen(pscreen
);
273 case PIPE_SHADER_FRAGMENT
:
274 return get_fragment_shader_param(screen
, param
);
275 case PIPE_SHADER_VERTEX
:
276 return get_vertex_shader_param(screen
, param
);
/* Installed as screen->base.is_format_supported in lima_screen_create().
 * Checks visible in this function, in order:
 *  - the texture target (1D, 2D, RECT and CUBE are listed);
 *  - sample_count and storage_sample_count must agree once both are
 *    clamped to at least 1;
 *  - multisampling is only accepted with exactly 4 samples;
 *  - per bind flag in `usage`: render targets go through
 *    lima_format_pixel_supported(), depth/stencil, vertex-buffer and
 *    index-buffer bindings are matched against fixed format lists, and
 *    sampler views return lima_format_texel_supported(). */
284 lima_screen_is_format_supported(struct pipe_screen
*pscreen
,
285 enum pipe_format format
,
286 enum pipe_texture_target target
,
287 unsigned sample_count
,
288 unsigned storage_sample_count
,
293 case PIPE_TEXTURE_1D
:
294 case PIPE_TEXTURE_2D
:
295 case PIPE_TEXTURE_RECT
:
296 case PIPE_TEXTURE_CUBE
:
302 if (MAX2(1, sample_count
) != MAX2(1, storage_sample_count
))
305 /* be able to support 16, now limit to 4 */
306 if (sample_count
> 1 && sample_count
!= 4)
309 if (usage
& PIPE_BIND_RENDER_TARGET
&&
310 !lima_format_pixel_supported(format
))
313 if (usage
& PIPE_BIND_DEPTH_STENCIL
) {
315 case PIPE_FORMAT_Z24_UNORM_S8_UINT
:
316 case PIPE_FORMAT_Z24X8_UNORM
:
323 if (usage
& PIPE_BIND_VERTEX_BUFFER
) {
325 case PIPE_FORMAT_R32G32B32_FLOAT
:
332 if (usage
& PIPE_BIND_INDEX_BUFFER
) {
334 case PIPE_FORMAT_I8_UINT
:
335 case PIPE_FORMAT_I16_UINT
:
336 case PIPE_FORMAT_I32_UINT
:
343 if (usage
& PIPE_BIND_SAMPLER_VIEW
)
344 return lima_format_texel_supported(format
);
/* Installed as screen->base.get_compiler_options in lima_screen_create().
 * Forwards to lima_program_get_compiler_options() keyed only on the
 * shader stage; pscreen and ir are not used by the visible statement. */
350 lima_screen_get_compiler_options(struct pipe_screen
*pscreen
,
351 enum pipe_shader_ir ir
,
352 enum pipe_shader_type shader
)
354 return lima_program_get_compiler_options(shader
);
/* Chooses screen->plb_max_blk; called at the end of
 * lima_screen_query_info(), after gpu_type has been filled in.
 *
 * Sources, in the order they appear:
 *  - a non-zero lima_plb_max_blk (LIMA_PLB_MAX_BLK environment option);
 *  - a per-GPU value: 4096 follows the Mali450 test, and the 512
 *    assignment after it is presumably the else-branch for other GPUs
 *    (TODO confirm, the branch keyword is not visible here);
 *  - 2048 when the DRM device is a platform device whose compatible
 *    string is "allwinner,sun50i-h5-mali".
 */
358 lima_screen_set_plb_max_blk(struct lima_screen
*screen
)
360 if (lima_plb_max_blk
) {
361 screen
->plb_max_blk
= lima_plb_max_blk
;
365 if (screen
->gpu_type
== DRM_LIMA_PARAM_GPU_ID_MALI450
)
366 screen
->plb_max_blk
= 4096;
368 screen
->plb_max_blk
= 512;
370 drmDevicePtr devinfo
;
/* drmGetDevice2() returns non-zero on failure. */
372 if (drmGetDevice2(screen
->fd
, 0, &devinfo
))
375 if (devinfo
->bustype
== DRM_BUS_PLATFORM
&& devinfo
->deviceinfo
.platform
) {
376 char **compatible
= devinfo
->deviceinfo
.platform
->compatible
;
/* Only the first entry of the compatible list is compared. */
378 if (compatible
&& *compatible
)
379 if (!strcmp("allwinner,sun50i-h5-mali", *compatible
))
380 screen
->plb_max_blk
= 2048;
/* Releases the device info obtained from drmGetDevice2(). */
383 drmFreeDevice(&devinfo
);
/* Queries the kernel driver through screen->fd and fills in the screen.
 * lima_screen_create() treats a zero/false result as failure.
 *
 * Visible steps:
 *  - read the DRM driver version; any version above 1.0 enables
 *    has_growable_heap_buffer, which LIMA_DEBUG_NO_GROW_HEAP then
 *    forces back off;
 *  - DRM_LIMA_PARAM_GPU_ID: only the Mali400 and Mali450 IDs are stored
 *    into screen->gpu_type;
 *  - DRM_LIMA_PARAM_NUM_PP: stored into screen->num_pp;
 *  - finally lima_screen_set_plb_max_blk() picks plb_max_blk.
 *
 * NOTE(review): the token "¶m" below looks like a mis-decoded "&param"
 * (address of the local drm_lima_get_param) -- confirm against the
 * pristine file before building.
 */
389 lima_screen_query_info(struct lima_screen
*screen
)
391 drmVersionPtr version
= drmGetVersion(screen
->fd
);
395 if (version
->version_major
> 1 || version
->version_minor
> 0)
396 screen
->has_growable_heap_buffer
= true;
398 drmFreeVersion(version
);
400 if (lima_debug
& LIMA_DEBUG_NO_GROW_HEAP
)
401 screen
->has_growable_heap_buffer
= false;
403 struct drm_lima_get_param param
;
/* The request struct is zeroed before each ioctl. */
405 memset(¶m
, 0, sizeof(param
));
406 param
.param
= DRM_LIMA_PARAM_GPU_ID
;
407 if (drmIoctl(screen
->fd
, DRM_IOCTL_LIMA_GET_PARAM
, ¶m
))
410 switch (param
.value
) {
411 case DRM_LIMA_PARAM_GPU_ID_MALI400
:
412 case DRM_LIMA_PARAM_GPU_ID_MALI450
:
413 screen
->gpu_type
= param
.value
;
419 memset(¶m
, 0, sizeof(param
));
420 param
.param
= DRM_LIMA_PARAM_NUM_PP
;
421 if (drmIoctl(screen
->fd
, DRM_IOCTL_LIMA_GET_PARAM
, ¶m
))
424 screen
->num_pp
= param
.value
;
426 lima_screen_set_plb_max_blk(screen
);
/* Installed as screen->base.query_dmabuf_modifiers in
 * lima_screen_create(). Reports the two supported modifiers, the ARM
 * 16x16 block U-interleaved layout and linear: it stores the table size
 * in *count and copies the table entries into modifiers[].
 * `format` and `max` are not referenced by any visible statement. */
432 lima_screen_query_dmabuf_modifiers(struct pipe_screen
*pscreen
,
433 enum pipe_format format
, int max
,
435 unsigned int *external_only
,
438 uint64_t available_modifiers
[] = {
439 DRM_FORMAT_MOD_ARM_16X16_BLOCK_U_INTERLEAVED
,
440 DRM_FORMAT_MOD_LINEAR
,
444 *count
= ARRAY_SIZE(available_modifiers
);
/* NOTE(review): the loop is bounded only by *count. No clamp to `max` or
 * to ARRAY_SIZE(available_modifiers) is visible, so a caller-supplied
 * *count above 2 would read past available_modifiers -- TODO confirm
 * how *count is set on this path. */
448 for (int i
= 0; i
< *count
; i
++) {
449 modifiers
[i
] = available_modifiers
[i
];
/* NOTE(review): this assigns the pointer parameter itself, which has no
 * effect for the caller; external_only[i] = false was probably
 * intended -- TODO confirm against the pristine file. */
451 external_only
= false;
/* Flag names accepted in the LIMA_DEBUG environment variable. Each entry
 * holds the user-visible name, the LIMA_DEBUG_* bit it sets and a help
 * string. */
455 static const struct debug_named_value debug_options
[] = {
456 { "gp", LIMA_DEBUG_GP
,
457 "print GP shader compiler result of each stage" },
458 { "pp", LIMA_DEBUG_PP
,
459 "print PP shader compiler result of each stage" },
460 { "dump", LIMA_DEBUG_DUMP
,
461 "dump GPU command stream to $PWD/lima.dump" },
462 { "shaderdb", LIMA_DEBUG_SHADERDB
,
463 "print shader information for shaderdb" },
464 { "nobocache", LIMA_DEBUG_NO_BO_CACHE
,
465 "disable BO cache" },
466 { "bocache", LIMA_DEBUG_BO_CACHE
,
467 "print debug info for BO cache" },
468 { "notiling", LIMA_DEBUG_NO_TILING
,
469 "don't use tiled buffers" },
470 { "nogrowheap", LIMA_DEBUG_NO_GROW_HEAP
,
471 "disable growable heap buffer" },
472 { "singlejob", LIMA_DEBUG_SINGLE_JOB
,
473 "disable multi job optimization" },
/* Ties the table above to LIMA_DEBUG with a default of 0; the result is
 * read through debug_get_option_lima_debug() in lima_screen_parse_env(). */
477 DEBUG_GET_ONCE_FLAGS_OPTION(lima_debug
, "LIMA_DEBUG", debug_options
, 0)
/* Reads the driver's environment overrides into globals; called once
 * from lima_screen_create().
 *
 *   LIMA_DEBUG                     -> lima_debug (flag set)
 *   LIMA_CTX_NUM_PLB               -> lima_ctx_num_plb, valid range
 *                                     [LIMA_CTX_PLB_MIN_NUM,
 *                                      LIMA_CTX_PLB_MAX_NUM]
 *   LIMA_PLB_MAX_BLK               -> lima_plb_max_blk, valid [0, 65536]
 *   LIMA_PPIR_FORCE_SPILLING       -> lima_ppir_force_spilling, >= 0
 *   LIMA_PLB_PP_STREAM_CACHE_SIZE  -> lima_plb_pp_stream_cache_size, >= 0
 *
 * An out-of-range value is reported on stderr and replaced by the
 * default (LIMA_CTX_PLB_DEF_NUM for the PLB count, 0 for the others).
 */
481 lima_screen_parse_env(void)
483 lima_debug
= debug_get_option_lima_debug();
485 lima_ctx_num_plb
= debug_get_num_option("LIMA_CTX_NUM_PLB", LIMA_CTX_PLB_DEF_NUM
);
486 if (lima_ctx_num_plb
> LIMA_CTX_PLB_MAX_NUM
||
487 lima_ctx_num_plb
< LIMA_CTX_PLB_MIN_NUM
) {
488 fprintf(stderr
, "lima: LIMA_CTX_NUM_PLB %d out of range [%d %d], "
489 "reset to default %d\n", lima_ctx_num_plb
, LIMA_CTX_PLB_MIN_NUM
,
490 LIMA_CTX_PLB_MAX_NUM
, LIMA_CTX_PLB_DEF_NUM
);
491 lima_ctx_num_plb
= LIMA_CTX_PLB_DEF_NUM
;
/* 0 means "no override"; see lima_screen_set_plb_max_blk(). */
494 lima_plb_max_blk
= debug_get_num_option("LIMA_PLB_MAX_BLK", 0);
495 if (lima_plb_max_blk
< 0 || lima_plb_max_blk
> 65536) {
496 fprintf(stderr
, "lima: LIMA_PLB_MAX_BLK %d out of range [%d %d], "
497 "reset to default %d\n", lima_plb_max_blk
, 0, 65536, 0);
498 lima_plb_max_blk
= 0;
501 lima_ppir_force_spilling
= debug_get_num_option("LIMA_PPIR_FORCE_SPILLING", 0);
502 if (lima_ppir_force_spilling
< 0) {
503 fprintf(stderr
, "lima: LIMA_PPIR_FORCE_SPILLING %d less than 0, "
504 "reset to default 0\n", lima_ppir_force_spilling
);
505 lima_ppir_force_spilling
= 0;
/* 0 lets lima_screen_create() size the cache from system memory. */
508 lima_plb_pp_stream_cache_size
= debug_get_num_option("LIMA_PLB_PP_STREAM_CACHE_SIZE", 0);
509 if (lima_plb_pp_stream_cache_size
< 0) {
510 fprintf(stderr
, "lima: LIMA_PLB_PP_STREAM_CACHE_SIZE %d less than 0, "
511 "reset to default 0\n", lima_plb_pp_stream_cache_size
);
512 lima_plb_pp_stream_cache_size
= 0;
/* Builds a lima screen and returns its embedded base screen object
 * (&screen->base).
 *
 * Visible sequence:
 *  1. allocate a zeroed struct lima_screen with rzalloc();
 *  2. read the environment overrides (lima_screen_parse_env());
 *  3. size the PP PLB stream cache: if the user gave no value and the
 *     total physical memory is known, use system_memory >> 10, then
 *     enforce a floor of 128 KiB per PLB (lima_ctx_num_plb);
 *  4. query the kernel driver, then set up the BO cache, the BO table
 *     and the PP register allocator;
 *  5. create pp_buffer, mark it non-cacheable and fill it with the
 *     built-in clear and reload fragment programs, the shared 0/1/2
 *     index list, the clear gl_Position data and a zeroed frame render
 *     state whose word 9 points at the clear program;
 *  6. duplicate the renderonly object (a failure message is printed to
 *     stderr);
 *  7. install the pipe_screen callbacks, initialise the resource and
 *     fence sub-modules and create the transfer slab pool.
 *
 * NOTE(review): system_memory is uint64_t but
 * lima_plb_pp_stream_cache_size is int, so system_memory >> 10 is
 * narrowed on assignment; this only matters for very large memory
 * sizes (2 TiB and up) -- TODO confirm whether a clamp is wanted.
 * NOTE(review): every lima_bo_map() result is used directly in pointer
 * arithmetic with no visible NULL check -- TODO confirm that mapping
 * cannot fail here.
 */
517 lima_screen_create(int fd
, struct renderonly
*ro
)
519 uint64_t system_memory
;
520 struct lima_screen
*screen
;
522 screen
= rzalloc(NULL
, struct lima_screen
);
528 lima_screen_parse_env();
530 /* Limit PP PLB stream cache size to 0.1% of system memory */
531 if (!lima_plb_pp_stream_cache_size
&&
532 os_get_total_physical_memory(&system_memory
))
533 lima_plb_pp_stream_cache_size
= system_memory
>> 10;
535 /* Set lower limit on PP PLB cache size */
536 lima_plb_pp_stream_cache_size
= MAX2(128 * 1024 * lima_ctx_num_plb
,
537 lima_plb_pp_stream_cache_size
);
539 if (!lima_screen_query_info(screen
))
542 if (!lima_bo_cache_init(screen
))
545 if (!lima_bo_table_init(screen
))
548 screen
->pp_ra
= ppir_regalloc_init(screen
);
552 screen
->pp_buffer
= lima_bo_create(screen
, pp_buffer_size
, 0);
553 if (!screen
->pp_buffer
)
555 screen
->pp_buffer
->cacheable
= false;
557 /* fs program for clear buffer?
558 * const0 1 0 0 -1.67773, mov.v0 $0 ^const0.xxxx, stop
560 static const uint32_t pp_clear_program
[] = {
561 0x00020425, 0x0000000c, 0x01e007cf, 0xb0000000,
562 0x000005f5, 0x00000000, 0x00000000, 0x00000000,
564 memcpy(lima_bo_map(screen
->pp_buffer
) + pp_clear_program_offset
,
565 pp_clear_program
, sizeof(pp_clear_program
));
567 /* copy texture to framebuffer, used to reload gpu tile buffer
568 * load.v $1 0.xy, texld_2d 0, mov.v0 $0 ^tex_sampler, sync, stop
570 static const uint32_t pp_reload_program
[] = {
571 0x000005e6, 0xf1003c20, 0x00000000, 0x39001000,
572 0x00000e4e, 0x000007cf, 0x00000000, 0x00000000,
574 memcpy(lima_bo_map(screen
->pp_buffer
) + pp_reload_program_offset
,
575 pp_reload_program
, sizeof(pp_reload_program
));
577 /* 0/1/2 vertex index for reload/clear draw */
578 static const uint8_t pp_shared_index
[] = { 0, 1, 2 };
579 memcpy(lima_bo_map(screen
->pp_buffer
) + pp_shared_index_offset
,
580 pp_shared_index
, sizeof(pp_shared_index
));
582 /* 4096x4096 gl pos used for partial clear */
583 static const float pp_clear_gl_pos
[] = {
588 memcpy(lima_bo_map(screen
->pp_buffer
) + pp_clear_gl_pos_offset
,
589 pp_clear_gl_pos
, sizeof(pp_clear_gl_pos
));
591 /* is pp frame render state static? */
592 uint32_t *pp_frame_rsw
= lima_bo_map(screen
->pp_buffer
) + pp_frame_rsw_offset
;
/* 0x40 bytes = 16 32-bit words of render state, zeroed before patching. */
593 memset(pp_frame_rsw
, 0, 0x40);
594 pp_frame_rsw
[8] = 0x0000f008;
/* Word 9 holds the GPU address of the clear program uploaded above. */
595 pp_frame_rsw
[9] = screen
->pp_buffer
->va
+ pp_clear_program_offset
;
596 pp_frame_rsw
[13] = 0x00000100;
599 screen
->ro
= renderonly_dup(ro
);
601 fprintf(stderr
, "Failed to dup renderonly object\n");
/* Callback table exposed through screen->base. */
606 screen
->base
.destroy
= lima_screen_destroy
;
607 screen
->base
.get_name
= lima_screen_get_name
;
608 screen
->base
.get_vendor
= lima_screen_get_vendor
;
609 screen
->base
.get_device_vendor
= lima_screen_get_device_vendor
;
610 screen
->base
.get_param
= lima_screen_get_param
;
611 screen
->base
.get_paramf
= lima_screen_get_paramf
;
612 screen
->base
.get_shader_param
= lima_screen_get_shader_param
;
613 screen
->base
.context_create
= lima_context_create
;
614 screen
->base
.is_format_supported
= lima_screen_is_format_supported
;
615 screen
->base
.get_compiler_options
= lima_screen_get_compiler_options
;
616 screen
->base
.query_dmabuf_modifiers
= lima_screen_query_dmabuf_modifiers
;
618 lima_resource_screen_init(screen
);
619 lima_fence_screen_init(screen
);
621 slab_create_parent(&screen
->transfer_pool
, sizeof(struct lima_transfer
), 16);
625 return &screen
->base
;
/* Teardown calls in the reverse order of the setup above; presumably the
 * error-unwind path taken when a setup step fails -- TODO confirm, the
 * labels are not visible here. */
628 lima_bo_unreference(screen
->pp_buffer
);
630 lima_bo_table_fini(screen
);
632 lima_bo_cache_fini(screen
);