intel/fs: Add a generic SEND opcode

[mesa.git] / src / intel / compiler / brw_schedule_instructions.cpp
diff --git a/src/intel/compiler/brw_schedule_instructions.cpp b/src/intel/compiler/brw_schedule_instructions.cpp

index f817142a8b56453cf39f0da84f61aab0fe94249e..bc4c2dc5cdbda9b9f7fad6c5f8b2019d00d1e618 100644 (file)
--- a/src/intel/compiler/brw_schedule_instructions.cpp
+++ b/src/intel/compiler/brw_schedule_instructions.cpp
@@ -369,6 +369,7 @@ schedule_node::set_latency_gen7(bool is_haswell)
        break;
  
     case SHADER_OPCODE_UNTYPED_ATOMIC:
+   case SHADER_OPCODE_UNTYPED_ATOMIC_FLOAT:
     case SHADER_OPCODE_TYPED_ATOMIC:
        /* Test code:
         *   mov(8)    g112<1>ud       0x00000000ud       { align1 WE_all 1Q };
@@ -413,6 +414,13 @@ schedule_node::set_latency_gen7(bool is_haswell)
        latency = is_haswell ? 300 : 600;
        break;
  
+   case SHADER_OPCODE_SEND:
+      switch (inst->sfid) {
+      default:
+         unreachable("Unknown SFID");
+      }
+      break;
+
     default:
        /* 2 cycles:
         * mul(8) g4<1>F g2<0,1,0>F      0.5F            { align1 WE_normal 1Q };
@@ -429,7 +437,7 @@ schedule_node::set_latency_gen7(bool is_haswell)
  class instruction_scheduler {
  public:
     instruction_scheduler(backend_shader *s, int grf_count,
-                         int hw_reg_count, int block_count,
+                         unsigned hw_reg_count, int block_count,
                           instruction_scheduler_mode mode)
     {
        this->bs = s;
@@ -510,7 +518,7 @@ public:
     bool post_reg_alloc;
     int instructions_to_schedule;
     int grf_count;
-   int hw_reg_count;
+   unsigned hw_reg_count;
     int reg_pressure;
     int block_idx;
     exec_list instructions;
@@ -664,7 +672,7 @@ fs_instruction_scheduler::setup_liveness(cfg_t *cfg)
     int payload_last_use_ip[hw_reg_count];
     v->calculate_payload_ranges(hw_reg_count, payload_last_use_ip);
  
-   for (int i = 0; i < hw_reg_count; i++) {
+   for (unsigned i = 0; i < hw_reg_count; i++) {
        if (payload_last_use_ip[i] == -1)
           continue;
  
@@ -972,7 +980,7 @@ fs_instruction_scheduler::calculate_deps()
      * After register allocation, reg_offsets are gone and we track individual
      * GRF registers.
      */
-   schedule_node *last_grf_write[grf_count * 16];
+   schedule_node **last_grf_write;
     schedule_node *last_mrf_write[BRW_MAX_MRF(v->devinfo->gen)];
     schedule_node *last_conditional_mod[8] = {};
     schedule_node *last_accumulator_write = NULL;
@@ -983,7 +991,7 @@ fs_instruction_scheduler::calculate_deps()
      */
     schedule_node *last_fixed_grf_write = NULL;
  
-   memset(last_grf_write, 0, sizeof(last_grf_write));
+   last_grf_write = (schedule_node **)calloc(sizeof(schedule_node *), grf_count * 16);
     memset(last_mrf_write, 0, sizeof(last_mrf_write));
  
     /* top-to-bottom dependencies: RAW and WAW. */
@@ -1110,7 +1118,7 @@ fs_instruction_scheduler::calculate_deps()
     }
  
     /* bottom-to-top dependencies: WAR */
-   memset(last_grf_write, 0, sizeof(last_grf_write));
+   memset(last_grf_write, 0, sizeof(schedule_node *) * grf_count * 16);
     memset(last_mrf_write, 0, sizeof(last_mrf_write));
     memset(last_conditional_mod, 0, sizeof(last_conditional_mod));
     last_accumulator_write = NULL;
@@ -1226,6 +1234,8 @@ fs_instruction_scheduler::calculate_deps()
           last_accumulator_write = n;
        }
     }
+
+   free(last_grf_write);
  }
  
  void