pan/midgard: Add uniform/work heuristic

author Alyssa Rosenzweig <alyssa.rosenzweig@collabora.com>

Wed, 18 Dec 2019 00:05:35 +0000 (19:05 -0500)

committer Marge Bot <eric+marge@anholt.net>

Thu, 19 Dec 2019 15:22:39 +0000 (15:22 +0000)
author Alyssa Rosenzweig <alyssa.rosenzweig@collabora.com>
Wed, 18 Dec 2019 00:05:35 +0000 (19:05 -0500)
committer Marge Bot <eric+marge@anholt.net>
Thu, 19 Dec 2019 15:22:39 +0000 (15:22 +0000)
diff --git a/src/panfrost/midgard/compiler.h b/src/panfrost/midgard/compiler.h

index 45a0617a84069d25cb2b1a429d55c5f1035a8cfd..acc1a22a866df241c7de869b3798c191ab19403f 100644 (file)
--- a/src/panfrost/midgard/compiler.h
+++ b/src/panfrost/midgard/compiler.h
@@ -655,9 +655,7 @@ void mir_invalidate_liveness(compiler_context *ctx);
  bool mir_is_live_after(compiler_context *ctx, midgard_block *block, midgard_instruction *start, int src);
  
  void mir_create_pipeline_registers(compiler_context *ctx);
-
-void
-midgard_promote_uniforms(compiler_context *ctx, unsigned promoted_count);
+void midgard_promote_uniforms(compiler_context *ctx);
  
  midgard_instruction *
  emit_ubo_read(
diff --git a/src/panfrost/midgard/midgard_schedule.c b/src/panfrost/midgard/midgard_schedule.c

index 157595db501d513aa9039fd486ceda22345196e1..9ee1f3b77c8618cbac931ce55d02eea9f4d7e473 100644 (file)
--- a/src/panfrost/midgard/midgard_schedule.c
+++ b/src/panfrost/midgard/midgard_schedule.c
@@ -1141,7 +1141,7 @@ schedule_block(compiler_context *ctx, midgard_block *block)
  void
  schedule_program(compiler_context *ctx)
  {
-        midgard_promote_uniforms(ctx, 16);
+        midgard_promote_uniforms(ctx);
  
          /* Must be lowered right before scheduling */
          mir_squeeze_index(ctx);
diff --git a/src/panfrost/midgard/mir_promote_uniforms.c b/src/panfrost/midgard/mir_promote_uniforms.c

index d7b3cce36d2a9d002f8698716e140f100d8ff053..12f860787c1daa8f14deb1145a701971b9d90d90 100644 (file)
--- a/src/panfrost/midgard/mir_promote_uniforms.c
+++ b/src/panfrost/midgard/mir_promote_uniforms.c
@@ -26,35 +26,118 @@
  
  #include "compiler.h"
  #include "util/u_math.h"
+#include "util/u_memory.h"
  
  /* This pass promotes reads from uniforms from load/store ops to uniform
   * registers if it is beneficial to do so. Normally, this saves both
   * instructions and total register pressure, but it does take a toll on the
   * number of work registers that are available, so this is a balance.
   *
- * To cope, we take as an argument the maximum work register pressure in the
- * program so we allow that many registers through at minimum, to prevent
- * spilling. If we spill anyway, I mean, it's a lose-lose at that point. */
+ * We use a heuristic to determine the ideal split, implemented by
+ * mir_work_heuristic, which returns the ideal number of work registers.
+ * Whatever remains of the 24 registers is used for promoted uniforms.
+ */
+
+/* Returns true when ins is a UBO read that this pass is able to promote to a
+ * uniform register. Every check below has to pass; the first one that fails
+ * rejects the instruction. */
+
+static bool
+mir_is_promoteable_ubo(midgard_instruction *ins)
+{
+        /* Only load/store instructions that read a UBO are candidates */
+        if (ins->type != TAG_LOAD_STORE_4)
+                return false;
+
+        if (!OP_IS_UBO_READ(ins->load_store.op))
+                return false;
+
+        /* The offset must be a multiple of 16.
+         * TODO: promote unaligned access via swizzle? */
+        if (ins->constants[0] & 0xF)
+                return false;
+
+        /* Check this is UBO 0 */
+        if (ins->load_store.arg_1)
+                return false;
+
+        /* Check we're accessing directly */
+        if (ins->load_store.arg_2 != 0x1E)
+                return false;
+
+        /* Only slot indices (offset / 16) below 16 are in promotable range */
+        return (ins->constants[0] / 16) < 16;
+}
+
+/* Returns the number of uniform slots spanned by the promotable UBO reads in
+ * the program: one more than the highest slot index (offset / 16) that any
+ * promotable read touches, or zero when there is no promotable read at all.
+ *
+ * Slot indices are zero-based, so reporting the highest index itself would
+ * under-count by one: a program reading slots 0..8 uses nine uniforms, not
+ * eight. */
+
+static unsigned
+mir_promoteable_uniform_count(compiler_context *ctx)
+{
+        unsigned count = 0;
+
+        mir_foreach_instr_global(ctx, ins) {
+                if (mir_is_promoteable_ubo(ins)) {
+                        /* Touching slot N implies at least N + 1 slots */
+                        unsigned slots = (ins->constants[0] / 16) + 1;
+
+                        count = MAX2(count, slots);
+                }
+        }
+
+        return count;
+}
+
+/* Sums the number of set bits across the first temp_count 16-bit masks in
+ * live and returns the total. A temp_count of zero yields zero without
+ * touching the array. */
+
+static unsigned
+mir_count_live(uint16_t *live, unsigned temp_count)
+{
+        unsigned total = 0;
+        unsigned idx = 0;
+
+        while (idx < temp_count) {
+                total += util_bitcount(live[idx]);
+                idx++;
+        }
+
+        return total;
+}
+
+/* Estimates the peak register pressure of the program. Liveness is
+ * invalidated and recomputed, then each block is walked backwards starting
+ * from a copy of its live_out masks. The largest live-bit total seen across
+ * all blocks is returned divided by 16, rounded up. */
+
+static unsigned
+mir_estimate_pressure(compiler_context *ctx)
+{
+        /* Recompute liveness before reading block->live_out */
+        mir_invalidate_liveness(ctx);
+        mir_compute_liveness(ctx);
+
+        unsigned peak = 0;
+
+        mir_foreach_block(ctx, block) {
+                /* Walk on a private copy so block->live_out itself is left
+                 * alone (presumably the per-instruction update writes the
+                 * masks in place).
+                 * NOTE(review): the mem_dup result is used unchecked */
+                uint16_t *scratch = mem_dup(block->live_out, ctx->temp_count * sizeof(uint16_t));
+
+                mir_foreach_instr_in_block_rev(block, ins) {
+                        /* Sample the current total first, then step the
+                         * masks across this instruction */
+                        unsigned now = mir_count_live(scratch, ctx->temp_count);
+
+                        if (now > peak)
+                                peak = now;
+
+                        mir_liveness_ins_update(scratch, ins, ctx->temp_count);
+                }
+
+                free(scratch);
+        }
+
+        return DIV_ROUND_UP(peak, 16);
+}
+
+/* Chooses how many work registers to allow, returning either 16 or 8.
+ * midgard_promote_uniforms subtracts the result from 24 to get the number of
+ * uniforms it may promote. */
+
+static unsigned
+mir_work_heuristic(compiler_context *ctx)
+{
+        /* If there are 8 or fewer uniforms, it doesn't matter what we do, so
+         * allow as many work registers as needed. The pressure estimate is
+         * skipped entirely on this path. */
+
+        if (mir_promoteable_uniform_count(ctx) <= 8)
+                return 16;
+
+        /* Otherwise, estimate the register pressure and prioritize not
+         * spilling above all else. The relation between the pressure
+         * estimate and the actual register pressure is a little murkier than
+         * we might like (due to scheduling, pipeline registers, failure to
+         * pack vector registers, load/store registers, texture
+         * registers...), hence why the threshold is a heuristic parameter */
+
+        bool may_spill = mir_estimate_pressure(ctx) > 6;
+
+        /* If there's no chance of spilling, prioritize UBOs and thread
+         * count by handing back the smaller work register budget */
+
+        return may_spill ? 16 : 8;
+}
  
  void
-midgard_promote_uniforms(compiler_context *ctx, unsigned promoted_count)
+midgard_promote_uniforms(compiler_context *ctx)
  {
+        unsigned work_count = mir_work_heuristic(ctx);
+        unsigned promoted_count = 24 - work_count;
+
          mir_foreach_instr_global_safe(ctx, ins) {
-                if (ins->type != TAG_LOAD_STORE_4) continue;
-                if (!OP_IS_UBO_READ(ins->load_store.op)) continue;
+                if (!mir_is_promoteable_ubo(ins)) continue;
  
-                /* TODO: promote unaligned access via swizzle? */
                  unsigned off = ins->constants[0];
-                if (off & 0xF) continue;
-
                  unsigned address = off / 16;
  
-                /* Check this is UBO 0 */
-                if (ins->load_store.arg_1) continue;
-
-                /* Check we're accessing directly */
-                if (ins->load_store.arg_2 != 0x1E) continue;
-
                  /* Check if it's a promotable range */
                  unsigned uniform_reg = 23 - address;
author	Alyssa Rosenzweig <alyssa.rosenzweig@collabora.com>
	Wed, 18 Dec 2019 00:05:35 +0000 (19:05 -0500)
committer	Marge Bot <eric+marge@anholt.net>
	Thu, 19 Dec 2019 15:22:39 +0000 (15:22 +0000)
src/panfrost/midgard/compiler.h		patch \| blob \| history
src/panfrost/midgard/midgard_schedule.c		patch \| blob \| history
src/panfrost/midgard/mir_promote_uniforms.c		patch \| blob \| history