i965/fs: Refactor compute_to_mrf() to split search and rewrite into separate loops.
authorFrancisco Jerez <currojerez@riseup.net>
Fri, 27 May 2016 20:15:55 +0000 (13:15 -0700)
committerFrancisco Jerez <currojerez@riseup.net>
Tue, 31 May 2016 22:57:40 +0000 (15:57 -0700)
This will allow compute_to_mrf to handle cases where the source of the
VGRF-to-MRF copy is initialized by more than one instruction.  In such
cases we cannot rewrite the destination of any of the generating
instructions until it's known whether the whole VGRF source region can
be coalesced into the destination MRF, which will imply continuing the
search until all generating instructions have been found or it has
been determined that the VGRF and MRF registers cannot be coalesced.

Cc: "12.0" <mesa-stable@lists.freedesktop.org>
Reviewed-by: Jason Ekstrand <jason@jlekstrand.net>
src/mesa/drivers/dri/i965/brw_fs.cpp

index b521f905e1c73739f374cd3443a9383de6c90d98..bb36a8ef76da576e27019d4c2db4744efa1b36dd 100644 (file)
@@ -2801,6 +2801,8 @@ fs_visitor::compute_to_mrf()
       /* Found a move of a GRF to a MRF.  Let's see if we can go
        * rewrite the thing that made this GRF to write into the MRF.
        */
+      bool found = false;
+
       foreach_inst_in_block_reverse_starting_from(fs_inst, scan_inst, inst) {
          if (regions_overlap(scan_inst->dst, scan_inst->regs_written * REG_SIZE,
                              inst->src[0], inst->regs_read(0) * REG_SIZE)) {
@@ -2811,7 +2813,7 @@ fs_visitor::compute_to_mrf()
            /* If this one instruction didn't populate all the
             * channels, bail.  We might be able to rewrite everything
             * that writes that reg, but it would require smarter
-            * tracking to delay the rewriting until complete success.
+            * tracking.
             */
            if (scan_inst->is_partial_write())
               break;
@@ -2838,15 +2840,9 @@ fs_visitor::compute_to_mrf()
               }
            }
 
-           if (scan_inst->dst.reg_offset == inst->src[0].reg_offset) {
-              /* Found the creator of our MRF's source value. */
-              scan_inst->dst.file = MRF;
-               scan_inst->dst.nr = inst->dst.nr;
-               scan_inst->dst.reg_offset = 0;
-              scan_inst->saturate |= inst->saturate;
-              inst->remove(block);
-              progress = true;
-           }
+           if (scan_inst->dst.reg_offset == inst->src[0].reg_offset)
+               found = true;
+
            break;
         }
 
@@ -2889,6 +2885,25 @@ fs_visitor::compute_to_mrf()
             break;
          }
       }
+
+      if (!found)
+         continue;
+
+      /* Found all generating instructions of our MRF's source value.
+       */
+      foreach_inst_in_block_reverse_starting_from(fs_inst, scan_inst, inst) {
+         if (regions_overlap(scan_inst->dst, scan_inst->regs_written * REG_SIZE,
+                             inst->src[0], inst->regs_read(0) * REG_SIZE)) {
+            scan_inst->dst.file = MRF;
+            scan_inst->dst.nr = inst->dst.nr;
+            scan_inst->dst.reg_offset = 0;
+            scan_inst->saturate |= inst->saturate;
+            break;
+         }
+      }
+
+      inst->remove(block);
+      progress = true;
    }
 
    if (progress)