r600g: optimize away CF ALU instructions even if type doesn't match
author Christian König <deathsimple@vodafone.de>
Fri, 17 Dec 2010 23:45:59 +0000 (00:45 +0100)
committer Christian König <deathsimple@vodafone.de>
Thu, 13 Jan 2011 18:41:07 +0000 (19:41 +0100)
src/gallium/drivers/r600/r600_asm.c

index 57acb87240de4ca788e30f2fc7c4dca67b412288..53122e54b7dae67e61a0b6b506fcfde92919dd43 100644 (file)
@@ -539,16 +539,29 @@ int r600_bc_add_alu_type(struct r600_bc *bc, const struct r600_bc_alu *alu, int
        memcpy(nalu, alu, sizeof(struct r600_bc_alu));
        nalu->nliteral = 0;
 
+       if (bc->cf_last != NULL && bc->cf_last->inst != (type << 3)) {
+               /* check if we could add it anyway */
+               if (bc->cf_last->inst == (V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU << 3) &&
+                       type == V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU_PUSH_BEFORE) {
+                       LIST_FOR_EACH_ENTRY(lalu, &bc->cf_last->alu, list) {
+                               if (lalu->predicate) {
+                                       bc->force_add_cf = 1;
+                                       break;
+                               }
+                       }
+               } else
+                       bc->force_add_cf = 1;
+       }
+
        /* cf can contains only alu or only vtx or only tex */
-       if (bc->cf_last == NULL || bc->cf_last->inst != (type << 3) ||
-               bc->force_add_cf) {
+       if (bc->cf_last == NULL || bc->force_add_cf) {
                r = r600_bc_add_cf(bc);
                if (r) {
                        free(nalu);
                        return r;
                }
-               bc->cf_last->inst = (type << 3);
        }
+       bc->cf_last->inst = (type << 3);
 
        /* Setup the kcache for this ALU instruction. This will start a new
         * ALU clause if needed. */