vbo,gallium: make glBegin/End buffer size configurable by drivers
[mesa.git] / src / gallium / drivers / radeonsi / si_get.c
index 59d07523fbe384ef2b01ec9a2b47e3b8aca60167..d3fa08f91f2e4e24981eb6e42ead388bd19f862d 100644 (file)
@@ -26,7 +26,6 @@
 #include "radeon/radeon_video.h"
 #include "radeon/radeon_vce.h"
 #include "radeon/radeon_uvd_enc.h"
-#include "ac_llvm_util.h"
 #include "vl/vl_decoder.h"
 #include "vl/vl_video_buffer.h"
 #include "util/u_screen.h"
@@ -60,6 +59,7 @@ static int si_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
        case PIPE_CAP_POINT_SPRITE:
        case PIPE_CAP_OCCLUSION_QUERY:
        case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
+       case PIPE_CAP_TEXTURE_SHADOW_LOD:
        case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:
        case PIPE_CAP_BLEND_EQUATION_SEPARATE:
        case PIPE_CAP_TEXTURE_SWIZZLE:
@@ -71,7 +71,9 @@ static int si_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
-       case PIPE_CAP_SM3:
+       case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
+       case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
+       case PIPE_CAP_VERTEX_SHADER_SATURATE:
        case PIPE_CAP_SEAMLESS_CUBE_MAP:
        case PIPE_CAP_PRIMITIVE_RESTART:
        case PIPE_CAP_CONDITIONAL_RENDER:
@@ -140,7 +142,6 @@ static int si_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
        case PIPE_CAP_QUERY_TIMESTAMP:
        case PIPE_CAP_QUERY_TIME_ELAPSED:
        case PIPE_CAP_NIR_SAMPLERS_AS_DEREF:
-       case PIPE_CAP_QUERY_SO_OVERFLOW:
        case PIPE_CAP_MEMOBJ:
        case PIPE_CAP_LOAD_CONSTBUF:
        case PIPE_CAP_INT64:
@@ -148,17 +149,29 @@ static int si_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
        case PIPE_CAP_TGSI_CLOCK:
        case PIPE_CAP_CAN_BIND_CONST_BUFFER_AS_VERTEX:
        case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:
-       case PIPE_CAP_TGSI_ANY_REG_AS_ADDRESS:
        case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
        case PIPE_CAP_TGSI_BALLOT:
        case PIPE_CAP_TGSI_VOTE:
        case PIPE_CAP_FBFETCH:
        case PIPE_CAP_COMPUTE_GRID_INFO_LAST_BLOCK:
        case PIPE_CAP_IMAGE_LOAD_FORMATTED:
-       case PIPE_CAP_PREFER_COMPUTE_BLIT_FOR_MULTIMEDIA:
-        case PIPE_CAP_TGSI_DIV:
+       case PIPE_CAP_PREFER_COMPUTE_FOR_MULTIMEDIA:
+       case PIPE_CAP_TGSI_DIV:
+       case PIPE_CAP_PACKED_UNIFORMS:
+       case PIPE_CAP_SHADER_SAMPLES_IDENTICAL:
+       case PIPE_CAP_GL_SPIRV:
+       case PIPE_CAP_DRAW_INFO_START_WITH_USER_INDICES:
                return 1;
 
+       case PIPE_CAP_QUERY_SO_OVERFLOW:
+               return !sscreen->use_ngg_streamout;
+
+       case PIPE_CAP_POST_DEPTH_COVERAGE:
+               return sscreen->info.chip_class >= GFX10;
+
+       case PIPE_CAP_GRAPHICS:
+               return sscreen->info.has_graphics;
+
        case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
                return !SI_BIG_ENDIAN && sscreen->info.has_userptr;
 
@@ -182,14 +195,17 @@ static int si_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
 
        case PIPE_CAP_GLSL_FEATURE_LEVEL:
        case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
-               if (sscreen->info.has_indirect_compute_dispatch)
-                               return 450;
-               return 420;
+               if (!sscreen->info.has_indirect_compute_dispatch)
+                       return 420;
+               return 460;
 
        case PIPE_CAP_MAX_TEXTURE_UPLOAD_MEMORY_BUDGET:
                /* Optimal number for good TexSubImage performance on Polaris10. */
                return 64 * 1024 * 1024;
 
+       case PIPE_CAP_GL_BEGIN_END_BUFFER_SIZE:
+               return 4096 * 1024;
+
        case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
        case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
                return MIN2(sscreen->info.max_alloc_size, INT_MAX);
@@ -197,40 +213,14 @@ static int si_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
        case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
        case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
        case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
-               return HAVE_LLVM < 0x0900 && !sscreen->info.has_unaligned_shader_loads;
+               return LLVM_VERSION_MAJOR < 9 && !sscreen->info.has_unaligned_shader_loads;
 
        case PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE:
                return sscreen->info.has_sparse_vm_mappings ?
                                RADEON_SPARSE_PAGE_SIZE : 0;
 
-       case PIPE_CAP_PACKED_UNIFORMS:
-               if (sscreen->options.enable_nir)
-                       return 1;
-               return 0;
 
-       /* Unsupported features. */
-       case PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY:
-       case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
-       case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
-       case PIPE_CAP_USER_VERTEX_BUFFERS:
-       case PIPE_CAP_FAKE_SW_MSAA:
-       case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
-       case PIPE_CAP_VERTEXID_NOBASE:
-       case PIPE_CAP_PRIMITIVE_RESTART_FOR_PATCHES:
-       case PIPE_CAP_TGSI_MUL_ZERO_WINS:
        case PIPE_CAP_UMA:
-       case PIPE_CAP_POLYGON_MODE_FILL_RECTANGLE:
-       case PIPE_CAP_POST_DEPTH_COVERAGE:
-       case PIPE_CAP_TILE_RASTER_ORDER:
-       case PIPE_CAP_MAX_COMBINED_SHADER_OUTPUT_RESOURCES:
-       case PIPE_CAP_CONTEXT_PRIORITY_MASK:
-       case PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_TRIANGLES:
-       case PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_POINTS_LINES:
-       case PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_TRIANGLES:
-       case PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_POINTS_LINES:
-       case PIPE_CAP_CONSERVATIVE_RASTER_POST_DEPTH_COVERAGE:
-       case PIPE_CAP_MAX_CONSERVATIVE_RASTER_SUBPIXEL_PRECISION_BIAS:
-       case PIPE_CAP_PROGRAMMABLE_SAMPLE_LOCATIONS:
                return 0;
 
        case PIPE_CAP_FENCE_SIGNAL:
@@ -329,6 +319,8 @@ static int si_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
                return sscreen->info.pci_dev;
        case PIPE_CAP_PCI_FUNCTION:
                return sscreen->info.pci_func;
+       case PIPE_CAP_TGSI_ATOMINC_WRAP:
+               return LLVM_VERSION_MAJOR >= 10;
 
        default:
                return u_pipe_screen_get_param_defaults(pscreen, param);
@@ -378,14 +370,14 @@ static int si_get_shader_param(struct pipe_screen* pscreen,
                        int ir = 1 << PIPE_SHADER_IR_NATIVE;
 
                        if (sscreen->info.has_indirect_compute_dispatch)
-                               ir |= 1 << PIPE_SHADER_IR_TGSI;
+                               ir |= 1 << PIPE_SHADER_IR_NIR;
 
                        return ir;
                }
 
                case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE: {
                        uint64_t max_const_buffer_size;
-                       pscreen->get_compute_param(pscreen, PIPE_SHADER_IR_TGSI,
+                       pscreen->get_compute_param(pscreen, PIPE_SHADER_IR_NIR,
                                PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE,
                                &max_const_buffer_size);
                        return MIN2(max_const_buffer_size, INT_MAX);
@@ -427,13 +419,9 @@ static int si_get_shader_param(struct pipe_screen* pscreen,
        case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
                return SI_NUM_IMAGES;
        case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
-               if (sscreen->options.enable_nir)
-                       return 0;
-               return 32;
+               return 0;
        case PIPE_SHADER_CAP_PREFERRED_IR:
-               if (sscreen->options.enable_nir)
-                       return PIPE_SHADER_IR_NIR;
-               return PIPE_SHADER_IR_TGSI;
+               return PIPE_SHADER_IR_NIR;
        case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
                return 4;
 
@@ -480,8 +468,6 @@ static int si_get_shader_param(struct pipe_screen* pscreen,
        case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
        case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
                return 0;
-       case PIPE_SHADER_CAP_SCALAR_ISA:
-               return 1;
        }
        return 0;
 }
@@ -495,11 +481,9 @@ static const struct nir_shader_compiler_options nir_options = {
        .lower_bitfield_insert_to_bitfield_select = true,
        .lower_bitfield_extract = true,
        .lower_sub = true,
-       .lower_ffma = true,
+       .fuse_ffma = true,
        .lower_fmod = true,
-       .lower_pack_snorm_2x16 = true,
        .lower_pack_snorm_4x8 = true,
-       .lower_pack_unorm_2x16 = true,
        .lower_pack_unorm_4x8 = true,
        .lower_unpack_snorm_2x16 = true,
        .lower_unpack_snorm_4x8 = true,
@@ -508,8 +492,10 @@ static const struct nir_shader_compiler_options nir_options = {
        .lower_extract_byte = true,
        .lower_extract_word = true,
        .lower_rotate = true,
+       .lower_to_scalar = true,
        .optimize_sample_mask_in = true,
        .max_unroll_iterations = 32,
+       .use_interpolated_input_intrinsics = true,
 };
 
 static const void *
@@ -579,12 +565,14 @@ static int si_get_video_param(struct pipe_screen *screen,
        if (entrypoint == PIPE_VIDEO_ENTRYPOINT_ENCODE) {
                switch (param) {
                case PIPE_VIDEO_CAP_SUPPORTED:
-                       return (codec == PIPE_VIDEO_FORMAT_MPEG4_AVC &&
-                               (si_vce_is_fw_version_supported(sscreen) ||
-                               sscreen->info.family >= CHIP_RAVEN)) ||
+                       return ((codec == PIPE_VIDEO_FORMAT_MPEG4_AVC &&
+                               (sscreen->info.family >= CHIP_RAVEN ||
+                                si_vce_is_fw_version_supported(sscreen))) ||
                                (profile == PIPE_VIDEO_PROFILE_HEVC_MAIN &&
                                (sscreen->info.family >= CHIP_RAVEN ||
-                               si_radeon_uvd_enc_supported(sscreen)));
+                                si_radeon_uvd_enc_supported(sscreen))) ||
+                               (profile == PIPE_VIDEO_PROFILE_HEVC_MAIN_10 &&
+                                sscreen->info.family >= CHIP_RENOIR));
                case PIPE_VIDEO_CAP_NPOT_TEXTURES:
                        return 1;
                case PIPE_VIDEO_CAP_MAX_WIDTH:
@@ -632,9 +620,7 @@ static int si_get_video_param(struct pipe_screen *screen,
                                return profile == PIPE_VIDEO_PROFILE_HEVC_MAIN;
                        return false;
                case PIPE_VIDEO_FORMAT_JPEG:
-                       if (sscreen->info.family == CHIP_RAVEN ||
-                           sscreen->info.family == CHIP_RAVEN2 ||
-                           sscreen->info.family == CHIP_NAVI10)
+                       if (sscreen->info.family >= CHIP_RAVEN)
                                return true;
                        if (sscreen->info.family < CHIP_CARRIZO || sscreen->info.family >= CHIP_VEGA10)
                                return false;
@@ -653,12 +639,29 @@ static int si_get_video_param(struct pipe_screen *screen,
        case PIPE_VIDEO_CAP_NPOT_TEXTURES:
                return 1;
        case PIPE_VIDEO_CAP_MAX_WIDTH:
-               return (sscreen->info.family < CHIP_TONGA) ? 2048 : 4096;
+               switch (codec) {
+               case PIPE_VIDEO_FORMAT_HEVC:
+               case PIPE_VIDEO_FORMAT_VP9:
+                       return (sscreen->info.family < CHIP_RENOIR) ?
+                              ((sscreen->info.family < CHIP_TONGA) ? 2048 : 4096) :
+                              8192;
+               default:
+                       return (sscreen->info.family < CHIP_TONGA) ? 2048 : 4096;
+               }
        case PIPE_VIDEO_CAP_MAX_HEIGHT:
-               return (sscreen->info.family < CHIP_TONGA) ? 1152 : 4096;
+               switch (codec) {
+               case PIPE_VIDEO_FORMAT_HEVC:
+               case PIPE_VIDEO_FORMAT_VP9:
+                       return (sscreen->info.family < CHIP_RENOIR) ?
+                              ((sscreen->info.family < CHIP_TONGA) ? 1152 : 4096) :
+                              4352;
+               default:
+                       return (sscreen->info.family < CHIP_TONGA) ? 1152 : 4096;
+               }
        case PIPE_VIDEO_CAP_PREFERED_FORMAT:
-               if (profile == PIPE_VIDEO_PROFILE_HEVC_MAIN_10 ||
-                   profile == PIPE_VIDEO_PROFILE_VP9_PROFILE2)
+               if (profile == PIPE_VIDEO_PROFILE_HEVC_MAIN_10)
+                       return PIPE_FORMAT_P010;
+               else if (profile == PIPE_VIDEO_PROFILE_VP9_PROFILE2)
                        return PIPE_FORMAT_P016;
                else
                        return PIPE_FORMAT_NV12;
@@ -709,15 +712,21 @@ static int si_get_video_param(struct pipe_screen *screen,
        }
 }
 
-static boolean si_vid_is_format_supported(struct pipe_screen *screen,
-                                         enum pipe_format format,
-                                         enum pipe_video_profile profile,
-                                         enum pipe_video_entrypoint entrypoint)
+static bool si_vid_is_format_supported(struct pipe_screen *screen,
+                                      enum pipe_format format,
+                                      enum pipe_video_profile profile,
+                                      enum pipe_video_entrypoint entrypoint)
 {
-       /* HEVC 10 bit decoding should use P016 instead of NV12 if possible */
+       /* HEVC 10 bit decoding should use P010 instead of NV12 if possible */
        if (profile == PIPE_VIDEO_PROFILE_HEVC_MAIN_10)
                return (format == PIPE_FORMAT_NV12) ||
-                       (format == PIPE_FORMAT_P016);
+                      (format == PIPE_FORMAT_P010) ||
+                      (format == PIPE_FORMAT_P016);
+
+       /* Vp9 profile 2 supports 10 bit decoding using P016 */
+       if (profile == PIPE_VIDEO_PROFILE_VP9_PROFILE2)
+               return format == PIPE_FORMAT_P016;
+
 
        /* we can only handle this one with UVD */
        if (profile != PIPE_VIDEO_PROFILE_UNKNOWN)
@@ -732,14 +741,8 @@ static unsigned get_max_threads_per_block(struct si_screen *screen,
        if (ir_type == PIPE_SHADER_IR_NATIVE)
                return 256;
 
-       /* Only 16 waves per thread-group on gfx9. */
-       if (screen->info.chip_class >= GFX9)
-               return 1024;
-
-       /* Up to 40 waves per thread-group on GCN < gfx9. Expose a nice
-        * round number.
-        */
-       return 2048;
+        /* LLVM 10 only supports 1024 threads per block. */
+       return 1024;
 }
 
 static int si_get_compute_param(struct pipe_screen *screen,
@@ -871,7 +874,7 @@ static int si_get_compute_param(struct pipe_screen *screen,
        case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
                if (ret) {
                        uint32_t *subgroup_size = ret;
-                       *subgroup_size = 64;
+                       *subgroup_size = sscreen->compute_wave_size;
                }
                return sizeof(uint32_t);
        case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK: