if (sctx->ngg) {
                if (sctx->tes_shader.cso) {
                        ge_cntl = S_03096C_PRIM_GRP_SIZE(num_patches) |
-                                 S_03096C_VERT_GRP_SIZE(0) |
+                                 S_03096C_VERT_GRP_SIZE(256) | /* 256 = disable vertex grouping */
                                  S_03096C_BREAK_WAVE_AT_EOI(key.u.tess_uses_prim_id);
                } else {
                        ge_cntl = si_get_vs_state(sctx)->ge_cntl;
                }
        } else {
                unsigned primgroup_size;
-               unsigned vertgroup_size;
+               unsigned vertgroup_size = 256; /* 256 = disable vertex grouping */;
 
                if (sctx->tes_shader.cso) {
                        primgroup_size = num_patches; /* must be a multiple of NUM_PATCHES */
-                       vertgroup_size = 0;
                } else if (sctx->gs_shader.cso) {
                        unsigned vgt_gs_onchip_cntl = sctx->gs_shader.current->ctx_reg.gs.vgt_gs_onchip_cntl;
                        primgroup_size = G_028A44_GS_PRIMS_PER_SUBGRP(vgt_gs_onchip_cntl);
-                       vertgroup_size = G_028A44_ES_VERTS_PER_SUBGRP(vgt_gs_onchip_cntl);
                } else {
                        primgroup_size = 128; /* recommended without a GS and tess */
-                       vertgroup_size = 0;
                }
 
                ge_cntl = S_03096C_PRIM_GRP_SIZE(primgroup_size) |
 
 
        shader->ge_cntl =
                S_03096C_PRIM_GRP_SIZE(shader->ngg.max_gsprims) |
-               S_03096C_VERT_GRP_SIZE(shader->ngg.hw_max_esverts) |
+               S_03096C_VERT_GRP_SIZE(256) | /* 256 = disable vertex grouping */
                S_03096C_BREAK_WAVE_AT_EOI(break_wave_at_eoi);
 
        /* Bug workaround for a possible hang with non-tessellation cases.