radeonsi: remove redundant GS variables in si_shader_selector

[mesa.git] / src / gallium / drivers / radeonsi / gfx10_shader_ngg.c
diff --git a/src/gallium/drivers/radeonsi/gfx10_shader_ngg.c b/src/gallium/drivers/radeonsi/gfx10_shader_ngg.c

index f9415bde27948b7cc79f71a1ef812cb49dc348c8..9679508e5dfb4d30d49836499155884bcc42fbbb 100644 (file)
--- a/src/gallium/drivers/radeonsi/gfx10_shader_ngg.c
+++ b/src/gallium/drivers/radeonsi/gfx10_shader_ngg.c
@@ -90,7 +90,7 @@ static LLVMValueRef ngg_get_vertices_per_prim(struct si_shader_context *ctx, uns
     const struct si_shader_info *info = &ctx->shader->selector->info;
  
     if (ctx->stage == MESA_SHADER_VERTEX) {
-      if (info->properties[TGSI_PROPERTY_VS_BLIT_SGPRS_AMD]) {
+      if (info->base.vs.blit_sgprs_amd) {
           /* Blits always use axis-aligned rectangles with 3 vertices. */
           *num_vertices = 3;
           return LLVMConstInt(ctx->ac.i32, 3, 0);
@@ -109,9 +109,9 @@ static LLVMValueRef ngg_get_vertices_per_prim(struct si_shader_context *ctx, uns
     } else {
        assert(ctx->stage == MESA_SHADER_TESS_EVAL);
  
-      if (info->properties[TGSI_PROPERTY_TES_POINT_MODE])
+      if (info->base.tess.point_mode)
           *num_vertices = 1;
-      else if (info->properties[TGSI_PROPERTY_TES_PRIM_MODE] == PIPE_PRIM_LINES)
+      else if (info->base.tess.primitive_mode == GL_LINES)
           *num_vertices = 2;
        else
           *num_vertices = 3;
@@ -232,8 +232,7 @@ static void build_streamout_vertex(struct si_shader_context *ctx, LLVMValueRef *
  
        unsigned reg = so->output[i].register_index;
        struct si_shader_output_values out;
-      out.semantic_name = info->output_semantic_name[reg];
-      out.semantic_index = info->output_semantic_index[reg];
+      out.semantic = info->output_semantic[reg];
  
        for (unsigned comp = 0; comp < 4; comp++) {
           tmp = ac_build_gep0(&ctx->ac, vertexptr, LLVMConstInt(ctx->ac.i32, 4 * reg + comp, false));
@@ -737,8 +736,8 @@ void gfx10_emit_ngg_culling_epilogue(struct ac_shader_abi *abi, unsigned max_out
  
     LLVMValueRef position[4] = {};
     for (unsigned i = 0; i < info->num_outputs; i++) {
-      switch (info->output_semantic_name[i]) {
-      case TGSI_SEMANTIC_POSITION:
+      switch (info->output_semantic[i]) {
+      case VARYING_SLOT_POS:
           for (unsigned j = 0; j < 4; j++) {
              position[j] = LLVMBuildLoad(ctx->ac.builder, addrs[4 * i + j], "");
           }
@@ -1201,8 +1200,7 @@ void gfx10_emit_ngg_epilogue(struct ac_shader_abi *abi, unsigned max_outputs, LL
        vertex_ptr = ngg_nogs_vertex_ptr(ctx, get_thread_id_in_tg(ctx));
  
     for (unsigned i = 0; i < info->num_outputs; i++) {
-      outputs[i].semantic_name = info->output_semantic_name[i];
-      outputs[i].semantic_index = info->output_semantic_index[i];
+      outputs[i].semantic = info->output_semantic[i];
  
        for (unsigned j = 0; j < 4; j++) {
           outputs[i].vertex_stream[j] = (info->output_streams[i] >> (2 * j)) & 3;
@@ -1219,7 +1217,7 @@ void gfx10_emit_ngg_epilogue(struct ac_shader_abi *abi, unsigned max_outputs, LL
        }
  
        /* Store the edgeflag at the end (if streamout is enabled) */
-      if (info->output_semantic_name[i] == TGSI_SEMANTIC_EDGEFLAG && sel->info.writes_edgeflag) {
+      if (info->output_semantic[i] == VARYING_SLOT_EDGE && sel->info.writes_edgeflag) {
           LLVMValueRef edgeflag = LLVMBuildLoad(builder, addrs[4 * i], "");
           /* The output is a float, but the hw expects a 1-bit integer. */
           edgeflag = LLVMBuildFPToUI(ctx->ac.builder, edgeflag, ctx->ac.i32, "");
@@ -1324,7 +1322,7 @@ void gfx10_emit_ngg_epilogue(struct ac_shader_abi *abi, unsigned max_outputs, LL
     }
  
     /* Update query buffer */
-   if (ctx->screen->use_ngg_streamout && !info->properties[TGSI_PROPERTY_VS_BLIT_SGPRS_AMD]) {
+   if (ctx->screen->use_ngg_streamout && !info->base.vs.blit_sgprs_amd) {
        assert(!unterminated_es_if_block);
  
        tmp = si_unpack_param(ctx, ctx->vs_state_bits, 6, 1);
@@ -1377,7 +1375,7 @@ void gfx10_emit_ngg_epilogue(struct ac_shader_abi *abi, unsigned max_outputs, LL
            * use the position from the current shader part. Instead,
            * load it from LDS.
            */
-         if (info->output_semantic_name[i] == TGSI_SEMANTIC_POSITION &&
+         if (info->output_semantic[i] == VARYING_SLOT_POS &&
               ctx->shader->key.opt.ngg_culling) {
              vertex_ptr = ngg_nogs_vertex_ptr(ctx, ac_get_arg(&ctx->ac, ctx->ngg_old_thread_id));
  
@@ -1395,8 +1393,7 @@ void gfx10_emit_ngg_epilogue(struct ac_shader_abi *abi, unsigned max_outputs, LL
        }
  
        if (ctx->shader->key.mono.u.vs_export_prim_id) {
-         outputs[i].semantic_name = TGSI_SEMANTIC_PRIMID;
-         outputs[i].semantic_index = 0;
+         outputs[i].semantic = VARYING_SLOT_PRIMITIVE_ID;
  
           if (ctx->stage == MESA_SHADER_VERTEX) {
              /* Wait for GS stores to finish. */
@@ -1442,7 +1439,7 @@ static LLVMValueRef ngg_gs_get_vertex_storage(struct si_shader_context *ctx)
   * is in emit order; that is:
   * - during the epilogue, N is the threadidx (relative to the entire threadgroup)
   * - during vertex emit, i.e. while the API GS shader invocation is running,
- *   N = threadidx * gs_max_out_vertices + emitidx
+ *   N = threadidx * gs.vertices_out + emitidx
   *
   * Goals of the LDS memory layout:
   * 1. Eliminate bank conflicts on write for geometry shaders that have all emits
@@ -1461,7 +1458,7 @@ static LLVMValueRef ngg_gs_get_vertex_storage(struct si_shader_context *ctx)
   *
   * Swizzling is required to satisfy points 1 and 2 simultaneously.
   *
- * Vertices are stored in export order (gsthread * gs_max_out_vertices + emitidx).
+ * Vertices are stored in export order (gsthread * gs.vertices_out + emitidx).
   * Indices are swizzled in groups of 32, which ensures point 1 without
   * disturbing point 2.
   *
@@ -1473,8 +1470,8 @@ static LLVMValueRef ngg_gs_vertex_ptr(struct si_shader_context *ctx, LLVMValueRe
     LLVMBuilderRef builder = ctx->ac.builder;
     LLVMValueRef storage = ngg_gs_get_vertex_storage(ctx);
  
-   /* gs_max_out_vertices = 2^(write_stride_2exp) * some odd number */
-   unsigned write_stride_2exp = ffs(sel->gs_max_out_vertices) - 1;
+   /* gs.vertices_out = 2^(write_stride_2exp) * some odd number */
+   unsigned write_stride_2exp = ffs(sel->info.base.gs.vertices_out) - 1;
     if (write_stride_2exp) {
        LLVMValueRef row = LLVMBuildLShr(builder, vertexidx, LLVMConstInt(ctx->ac.i32, 5, false), "");
        LLVMValueRef swizzle = LLVMBuildAnd(
@@ -1492,7 +1489,7 @@ static LLVMValueRef ngg_gs_emit_vertex_ptr(struct si_shader_context *ctx, LLVMVa
     LLVMBuilderRef builder = ctx->ac.builder;
     LLVMValueRef tmp;
  
-   tmp = LLVMConstInt(ctx->ac.i32, sel->gs_max_out_vertices, false);
+   tmp = LLVMConstInt(ctx->ac.i32, sel->info.base.gs.vertices_out, false);
     tmp = LLVMBuildMul(builder, tmp, gsthread, "");
     const LLVMValueRef vertexidx = LLVMBuildAdd(builder, tmp, emitidx, "");
     return ngg_gs_vertex_ptr(ctx, vertexidx);
@@ -1534,7 +1531,7 @@ void gfx10_ngg_gs_emit_vertex(struct si_shader_context *ctx, unsigned stream, LL
      */
     const LLVMValueRef can_emit =
        LLVMBuildICmp(builder, LLVMIntULT, vertexidx,
-                    LLVMConstInt(ctx->ac.i32, sel->gs_max_out_vertices, false), "");
+                    LLVMConstInt(ctx->ac.i32, sel->info.base.gs.vertices_out, false), "");
  
     tmp = LLVMBuildAdd(builder, vertexidx, ctx->ac.i32_1, "");
     tmp = LLVMBuildSelect(builder, can_emit, tmp, vertexidx, "");
@@ -1560,7 +1557,7 @@ void gfx10_ngg_gs_emit_vertex(struct si_shader_context *ctx, unsigned stream, LL
     /* Determine and store whether this vertex completed a primitive. */
     const LLVMValueRef curverts = LLVMBuildLoad(builder, ctx->gs_curprim_verts[stream], "");
  
-   tmp = LLVMConstInt(ctx->ac.i32, u_vertices_per_prim(sel->gs_output_prim) - 1, false);
+   tmp = LLVMConstInt(ctx->ac.i32, u_vertices_per_prim(sel->info.base.gs.output_primitive) - 1, false);
     const LLVMValueRef iscompleteprim = LLVMBuildICmp(builder, LLVMIntUGE, curverts, tmp, "");
  
     /* Since the geometry shader emits triangle strips, we need to
@@ -1568,7 +1565,7 @@ void gfx10_ngg_gs_emit_vertex(struct si_shader_context *ctx, unsigned stream, LL
      * the correct vertex order.
      */
     LLVMValueRef is_odd = ctx->ac.i1false;
-   if (stream == 0 && u_vertices_per_prim(sel->gs_output_prim) == 3) {
+   if (stream == 0 && u_vertices_per_prim(sel->info.base.gs.output_primitive) == 3) {
        tmp = LLVMBuildAnd(builder, curverts, ctx->ac.i32_1, "");
        is_odd = LLVMBuildICmp(builder, LLVMIntEQ, tmp, ctx->ac.i32_1, "");
     }
@@ -1618,7 +1615,7 @@ void gfx10_ngg_gs_emit_epilogue(struct si_shader_context *ctx)
  {
     const struct si_shader_selector *sel = ctx->shader->selector;
     const struct si_shader_info *info = &sel->info;
-   const unsigned verts_per_prim = u_vertices_per_prim(sel->gs_output_prim);
+   const unsigned verts_per_prim = u_vertices_per_prim(sel->info.base.gs.output_primitive);
     LLVMBuilderRef builder = ctx->ac.builder;
     LLVMValueRef i8_0 = LLVMConstInt(ctx->ac.i8, 0, false);
     LLVMValueRef tmp, tmp2;
@@ -1640,7 +1637,7 @@ void gfx10_ngg_gs_emit_epilogue(struct si_shader_context *ctx)
  
        const LLVMValueRef vertexidx = LLVMBuildLoad(builder, ctx->gs_next_vertex[stream], "");
        tmp = LLVMBuildICmp(builder, LLVMIntUGE, vertexidx,
-                          LLVMConstInt(ctx->ac.i32, sel->gs_max_out_vertices, false), "");
+                          LLVMConstInt(ctx->ac.i32, sel->info.base.gs.vertices_out, false), "");
        ac_build_ifcc(&ctx->ac, tmp, 5101);
        ac_build_break(&ctx->ac);
        ac_build_endif(&ctx->ac, 5101);
@@ -1862,8 +1859,7 @@ void gfx10_ngg_gs_emit_epilogue(struct si_shader_context *ctx)
  
        unsigned out_idx = 0;
        for (unsigned i = 0; i < info->num_outputs; i++) {
-         outputs[i].semantic_name = info->output_semantic_name[i];
-         outputs[i].semantic_index = info->output_semantic_index[i];
+         outputs[i].semantic = info->output_semantic[i];
  
           for (unsigned j = 0; j < 4; j++, out_idx++) {
              tmp = ngg_gs_get_emit_output_ptr(ctx, vertexptr, out_idx);
@@ -1909,7 +1905,7 @@ bool gfx10_ngg_calculate_subgroup_info(struct si_shader *shader)
     const struct si_shader_selector *es_sel =
        shader->previous_stage_sel ? shader->previous_stage_sel : gs_sel;
     const gl_shader_stage gs_stage = gs_sel->info.stage;
-   const unsigned gs_num_invocations = MAX2(gs_sel->gs_num_invocations, 1);
+   const unsigned gs_num_invocations = MAX2(gs_sel->info.base.gs.invocations, 1);
     const unsigned input_prim = si_get_input_prim(gs_sel);
     const bool use_adjacency =
        input_prim >= PIPE_PRIM_LINES_ADJACENCY && input_prim <= PIPE_PRIM_TRIANGLE_STRIP_ADJACENCY;
@@ -1950,7 +1946,7 @@ bool gfx10_ngg_calculate_subgroup_info(struct si_shader *shader)
  
     if (gs_stage == MESA_SHADER_GEOMETRY) {
        bool force_multi_cycling = false;
-      unsigned max_out_verts_per_gsprim = gs_sel->gs_max_out_vertices * gs_num_invocations;
+      unsigned max_out_verts_per_gsprim = gs_sel->info.base.gs.vertices_out * gs_num_invocations;
  
  retry_select_mode:
        if (max_out_verts_per_gsprim <= 256 && !force_multi_cycling) {
@@ -1963,7 +1959,7 @@ retry_select_mode:
            * tessellation. */
           max_vert_out_per_gs_instance = true;
           max_gsprims_base = 1;
-         max_out_verts_per_gsprim = gs_sel->gs_max_out_vertices;
+         max_out_verts_per_gsprim = gs_sel->info.base.gs.vertices_out;
        }
  
        esvert_lds_size = es_sel->esgs_itemsize / 4;
@@ -2054,9 +2050,9 @@ retry_select_mode:
  
     unsigned max_out_vertices =
        max_vert_out_per_gs_instance
-         ? gs_sel->gs_max_out_vertices
+         ? gs_sel->info.base.gs.vertices_out
           : gs_stage == MESA_SHADER_GEOMETRY
-              ? max_gsprims * gs_num_invocations * gs_sel->gs_max_out_vertices
+              ? max_gsprims * gs_num_invocations * gs_sel->info.base.gs.vertices_out
                : max_esverts;
     assert(max_out_vertices <= 256);
  
@@ -2064,7 +2060,7 @@ retry_select_mode:
     if (gs_stage == MESA_SHADER_GEOMETRY) {
        /* Number of output primitives per GS input primitive after
         * GS instancing. */
-      prim_amp_factor = gs_sel->gs_max_out_vertices;
+      prim_amp_factor = gs_sel->info.base.gs.vertices_out;
     }
  
     /* The GE only checks against the maximum number of ES verts after