radv: start conditionalising vertex inputs. (v2)
authorDave Airlie <airlied@redhat.com>
Mon, 17 Apr 2017 19:15:46 +0000 (05:15 +1000)
committerDave Airlie <airlied@redhat.com>
Tue, 18 Apr 2017 23:00:42 +0000 (09:00 +1000)
In practice this will probably just drop draw id in a few places.

v2: just do draw_id for now. (Bas)
it might be possible to do something more if we need it in the
future. (nha)

Reviewed-by: Bas Nieuwenhuizen <bas@basnieuwenhuizen.nl>
Signed-off-by: Dave Airlie <airlied@redhat.com>
src/amd/common/ac_nir_to_llvm.c
src/amd/common/ac_shader_info.c
src/amd/common/ac_shader_info.h
src/amd/vulkan/radv_cmd_buffer.c

index dbb3b67b511f92e713c7a8afdac1ab1722818e97..31b772f56691672fc4317c0f99aa8e7cdfd14a5b 100644 (file)
@@ -614,10 +614,12 @@ static void create_function(struct nir_to_llvm_context *ctx)
                break;
        case MESA_SHADER_VERTEX:
                if (!ctx->is_gs_copy_shader) {
-                       arg_types[arg_idx++] = const_array(ctx->v16i8, 16); /* vertex buffers */
+                       if (ctx->shader_info->info.vs.has_vertex_buffers)
+                               arg_types[arg_idx++] = const_array(ctx->v16i8, 16); /* vertex buffers */
                        arg_types[arg_idx++] = ctx->i32; // base vertex
                        arg_types[arg_idx++] = ctx->i32; // start instance
-                       arg_types[arg_idx++] = ctx->i32; // draw index
+                       if (ctx->shader_info->info.vs.needs_draw_id)
+                                       arg_types[arg_idx++] = ctx->i32; // draw index
                }
                user_sgpr_count = arg_idx;
                if (ctx->options->key.vs.as_es)
@@ -773,14 +775,22 @@ static void create_function(struct nir_to_llvm_context *ctx)
                break;
        case MESA_SHADER_VERTEX:
                if (!ctx->is_gs_copy_shader) {
-                       set_userdata_location_shader(ctx, AC_UD_VS_VERTEX_BUFFERS, user_sgpr_idx, 2);
-                       user_sgpr_idx += 2;
-                       ctx->vertex_buffers = LLVMGetParam(ctx->main_function, arg_idx++);
-                       set_userdata_location_shader(ctx, AC_UD_VS_BASE_VERTEX_START_INSTANCE, user_sgpr_idx, 3);
-                       user_sgpr_idx += 3;
+                       if (ctx->shader_info->info.vs.has_vertex_buffers) {
+                               set_userdata_location_shader(ctx, AC_UD_VS_VERTEX_BUFFERS, user_sgpr_idx, 2);
+                               user_sgpr_idx += 2;
+                               ctx->vertex_buffers = LLVMGetParam(ctx->main_function, arg_idx++);
+                       }
+                       unsigned vs_num = 2;
+                       if (ctx->shader_info->info.vs.needs_draw_id)
+                               vs_num++;
+
+                       set_userdata_location_shader(ctx, AC_UD_VS_BASE_VERTEX_START_INSTANCE, user_sgpr_idx, vs_num);
+                       user_sgpr_idx += vs_num;
+
                        ctx->base_vertex = LLVMGetParam(ctx->main_function, arg_idx++);
                        ctx->start_instance = LLVMGetParam(ctx->main_function, arg_idx++);
-                       ctx->draw_index = LLVMGetParam(ctx->main_function, arg_idx++);
+                       if (ctx->shader_info->info.vs.needs_draw_id)
+                               ctx->draw_index = LLVMGetParam(ctx->main_function, arg_idx++);
                }
                if (ctx->options->key.vs.as_es)
                        ctx->es2gs_offset = LLVMGetParam(ctx->main_function, arg_idx++);
index 85252fea14607139c88775b3952530802ec2dd17..6ad562505cf2e2510801000ad207a00021fc9ef8 100644 (file)
@@ -30,6 +30,9 @@ gather_intrinsic_info(nir_intrinsic_instr *instr, struct ac_shader_info *info)
        case nir_intrinsic_interp_var_at_sample:
                info->ps.needs_sample_positions = true;
                break;
+       case nir_intrinsic_load_draw_id:
+               info->vs.needs_draw_id = true;
+               break;
        default:
                break;
        }
@@ -49,12 +52,30 @@ gather_info_block(nir_block *block, struct ac_shader_info *info)
        }
 }
 
+static void
+gather_info_input_decl(nir_shader *nir,
+                      const struct ac_nir_compiler_options *options,
+                      nir_variable *var,
+                      struct ac_shader_info *info)
+{
+       switch (nir->stage) {
+       case MESA_SHADER_VERTEX:
+               info->vs.has_vertex_buffers = true;
+               break;
+       default:
+               break;
+       }
+}
+
 void
 ac_nir_shader_info_pass(struct nir_shader *nir,
                        const struct ac_nir_compiler_options *options,
                        struct ac_shader_info *info)
 {
        struct nir_function *func = (struct nir_function *)exec_list_get_head(&nir->functions);
+       nir_foreach_variable(variable, &nir->inputs)
+               gather_info_input_decl(nir, options, variable, info);
+
        nir_foreach_block(block, func->impl) {
                gather_info_block(block, info);
        }
index 5576c3b4bacdef4069d803d5c1180e08edd3dc08..7e2b6c885a6d51807fd88a64b1abae7e5afd9a2d 100644 (file)
@@ -28,6 +28,10 @@ struct ac_nir_compiler_options;
 /* a NIR pass to gather all the info needed to optimise the alloction patterns for the RADV user sgprs */
 
 struct ac_shader_info {
+       struct {
+               bool has_vertex_buffers; /* needs vertex buffers and base/start */
+               bool needs_draw_id;
+       } vs;
        struct {
                bool needs_sample_positions;
        } ps;
index f3e5f8292411fdd67b4dec17f02ee2ae2cae23ce..52b74539068f424009aa971d7ce776254f68770d 100644 (file)
@@ -1427,7 +1427,8 @@ radv_cmd_buffer_flush_state(struct radv_cmd_buffer *cmd_buffer,
                                                           cmd_buffer->cs, 4096);
 
        if ((cmd_buffer->state.vertex_descriptors_dirty || cmd_buffer->state.vb_dirty) &&
-           cmd_buffer->state.pipeline->num_vertex_attribs) {
+           cmd_buffer->state.pipeline->num_vertex_attribs &&
+           cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.has_vertex_buffers) {
                unsigned vb_offset;
                void *vb_ptr;
                uint32_t i = 0;
@@ -2512,10 +2513,16 @@ void radv_CmdDraw(
        if (loc->sgpr_idx != -1) {
                uint32_t base_reg = shader_stage_to_user_data_0(MESA_SHADER_VERTEX, radv_pipeline_has_gs(cmd_buffer->state.pipeline),
                                                                radv_pipeline_has_tess(cmd_buffer->state.pipeline));
-               radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, 3);
+               int vs_num = 2;
+               if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
+                       vs_num = 3;
+
+               assert (loc->num_sgprs == vs_num);
+               radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, vs_num);
                radeon_emit(cmd_buffer->cs, firstVertex);
                radeon_emit(cmd_buffer->cs, firstInstance);
-               radeon_emit(cmd_buffer->cs, 0);
+               if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
+                       radeon_emit(cmd_buffer->cs, 0);
        }
        radeon_emit(cmd_buffer->cs, PKT3(PKT3_NUM_INSTANCES, 0, 0));
        radeon_emit(cmd_buffer->cs, instanceCount);
@@ -2555,10 +2562,16 @@ void radv_CmdDrawIndexed(
        if (loc->sgpr_idx != -1) {
                uint32_t base_reg = shader_stage_to_user_data_0(MESA_SHADER_VERTEX, radv_pipeline_has_gs(cmd_buffer->state.pipeline),
                                                                radv_pipeline_has_tess(cmd_buffer->state.pipeline));
-               radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, 3);
+               int vs_num = 2;
+               if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
+                       vs_num = 3;
+
+               assert (loc->num_sgprs == vs_num);
+               radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, vs_num);
                radeon_emit(cmd_buffer->cs, vertexOffset);
                radeon_emit(cmd_buffer->cs, firstInstance);
-               radeon_emit(cmd_buffer->cs, 0);
+               if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
+                       radeon_emit(cmd_buffer->cs, 0);
        }
        radeon_emit(cmd_buffer->cs, PKT3(PKT3_NUM_INSTANCES, 0, 0));
        radeon_emit(cmd_buffer->cs, instanceCount);
@@ -2609,6 +2622,7 @@ radv_emit_indirect_draw(struct radv_cmd_buffer *cmd_buffer,
                                                             AC_UD_VS_BASE_VERTEX_START_INSTANCE);
        uint32_t base_reg = shader_stage_to_user_data_0(MESA_SHADER_VERTEX, radv_pipeline_has_gs(cmd_buffer->state.pipeline),
                                                        radv_pipeline_has_tess(cmd_buffer->state.pipeline));
+       bool draw_id_enable = cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id;
        assert(loc->sgpr_idx != -1);
        radeon_emit(cs, PKT3(PKT3_SET_BASE, 2, 0));
        radeon_emit(cs, 1);
@@ -2622,7 +2636,7 @@ radv_emit_indirect_draw(struct radv_cmd_buffer *cmd_buffer,
        radeon_emit(cs, ((base_reg + loc->sgpr_idx * 4) - SI_SH_REG_OFFSET) >> 2);
        radeon_emit(cs, ((base_reg + (loc->sgpr_idx + 1) * 4) - SI_SH_REG_OFFSET) >> 2);
        radeon_emit(cs, (((base_reg + (loc->sgpr_idx + 2) * 4) - SI_SH_REG_OFFSET) >> 2) |
-                       S_2C3_DRAW_INDEX_ENABLE(1) |
+                       S_2C3_DRAW_INDEX_ENABLE(draw_id_enable) |
                        S_2C3_COUNT_INDIRECT_ENABLE(!!count_va));
        radeon_emit(cs, draw_count); /* count */
        radeon_emit(cs, count_va); /* count_addr */