From: José Fonseca Date: Fri, 29 Jun 2012 20:18:24 +0000 (+0100) Subject: gallium/tgsi: Don't declare temps individually when they are all similar. X-Git-Url: https://git.libre-soc.org/?a=commitdiff_plain;h=f5c41e16d7b09e7c342bff8ec5888db88c071be3;p=mesa.git gallium/tgsi: Don't declare temps individually when they are all similar. tgsi_ureg was recently enhanced to support local temporaries, and as result temps are declared individually. This change avoids many TEMP register declarations on common shaders. (And fixes performance regression due to mismatches against performance sensitive shaders.) Reviewed-by: Brian Paul --- diff --git a/src/gallium/auxiliary/tgsi/tgsi_ureg.c b/src/gallium/auxiliary/tgsi/tgsi_ureg.c index e427585db19..3fe78e0b7f0 100644 --- a/src/gallium/auxiliary/tgsi/tgsi_ureg.c +++ b/src/gallium/auxiliary/tgsi/tgsi_ureg.c @@ -1534,9 +1534,18 @@ static void emit_decls( struct ureg_program *ureg ) } } - for (i = 0; i < ureg->nr_temps; i++) { - emit_decl( ureg, TGSI_FILE_TEMPORARY, i, - util_bitmask_get(ureg->local_temps, i) ); + if (ureg->nr_temps) { + if (util_bitmask_get_first_index(ureg->local_temps) == UTIL_BITMASK_INVALID_INDEX) { + emit_decl_range( ureg, + TGSI_FILE_TEMPORARY, + 0, ureg->nr_temps ); + + } else { + for (i = 0; i < ureg->nr_temps; i++) { + emit_decl( ureg, TGSI_FILE_TEMPORARY, i, + util_bitmask_get(ureg->local_temps, i) ); + } + } } if (ureg->nr_addrs) { @@ -1687,7 +1696,7 @@ struct ureg_program *ureg_create( unsigned processor ) { struct ureg_program *ureg = CALLOC_STRUCT( ureg_program ); if (ureg == NULL) - return NULL; + goto no_ureg; ureg->processor = processor; ureg->property_gs_input_prim = ~0; @@ -1696,17 +1705,19 @@ struct ureg_program *ureg_create( unsigned processor ) ureg->free_temps = util_bitmask_create(); if (ureg->free_temps == NULL) - goto fail; + goto no_free_temps; ureg->local_temps = util_bitmask_create(); if (ureg->local_temps == NULL) - goto fail; + goto no_local_temps; return ureg; -fail: - FREE(ureg->free_temps); +no_local_temps: + util_bitmask_destroy(ureg->free_temps); +no_free_temps: FREE(ureg); +no_ureg: return NULL; }