nir/lower_subgroups: add lower_shuffle_to_swizzle_amd

[mesa.git] / src / compiler / nir / nir.h
diff --git a/src/compiler/nir/nir.h b/src/compiler/nir/nir.h

index a673a2a8f31260d251b41879e76744276ef2bcd6..e0caedaf5f491a74ee3160672e8c8069bcd74fc8 100644 (file)
--- a/src/compiler/nir/nir.h
+++ b/src/compiler/nir/nir.h
@@ -2699,6 +2699,15 @@ typedef enum {
      * determine.  Most passes shouldn't preserve this metadata type.
      */
     nir_metadata_loop_analysis = 0x10,
+
+   /** All metadata
+    *
+    * This includes all nir_metadata flags except not_properly_reset.  Passes
+    * which do not change the shader in any way should call
+    *
+    *    nir_metadata_preserve(impl, nir_metadata_all);
+    */
+   nir_metadata_all = ~nir_metadata_not_properly_reset,
  } nir_metadata;
  
  typedef struct {
@@ -3285,6 +3294,8 @@ nir_function_impl *nir_cf_node_get_function(nir_cf_node *node);
  void nir_metadata_require(nir_function_impl *impl, nir_metadata required, ...);
  /** dirties all but the preserved metadata */
  void nir_metadata_preserve(nir_function_impl *impl, nir_metadata preserved);
+/** Preserves all metadata for the given shader */
+void nir_shader_preserve_all_metadata(nir_shader *shader);
  
  /** creates an instruction with default swizzle/writemask/etc. with NULL registers */
  nir_alu_instr *nir_alu_instr_create(nir_shader *shader, nir_op op);
@@ -4006,6 +4017,12 @@ typedef enum {
      */
     nir_address_format_32bit_index_offset,
  
+   /**
+    * An address format which is comprised of a vec3 where the first two
+    * components specify the buffer and the third is an offset.
+    */
+   nir_address_format_vec2_index_32bit_offset,
+
     /**
      * An address format which is a simple 32-bit offset.
      */
@@ -4025,12 +4042,13 @@ static inline unsigned
  nir_address_format_bit_size(nir_address_format addr_format)
  {
     switch (addr_format) {
-   case nir_address_format_32bit_global:           return 32;
-   case nir_address_format_64bit_global:           return 64;
-   case nir_address_format_64bit_bounded_global:   return 32;
-   case nir_address_format_32bit_index_offset:     return 32;
-   case nir_address_format_32bit_offset:           return 32;
-   case nir_address_format_logical:                return 32;
+   case nir_address_format_32bit_global:              return 32;
+   case nir_address_format_64bit_global:              return 64;
+   case nir_address_format_64bit_bounded_global:      return 32;
+   case nir_address_format_32bit_index_offset:        return 32;
+   case nir_address_format_vec2_index_32bit_offset:   return 32;
+   case nir_address_format_32bit_offset:              return 32;
+   case nir_address_format_logical:                   return 32;
     }
     unreachable("Invalid address format");
  }
@@ -4039,12 +4057,13 @@ static inline unsigned
  nir_address_format_num_components(nir_address_format addr_format)
  {
     switch (addr_format) {
-   case nir_address_format_32bit_global:           return 1;
-   case nir_address_format_64bit_global:           return 1;
-   case nir_address_format_64bit_bounded_global:   return 4;
-   case nir_address_format_32bit_index_offset:     return 2;
-   case nir_address_format_32bit_offset:           return 1;
-   case nir_address_format_logical:                return 1;
+   case nir_address_format_32bit_global:              return 1;
+   case nir_address_format_64bit_global:              return 1;
+   case nir_address_format_64bit_bounded_global:      return 4;
+   case nir_address_format_32bit_index_offset:        return 2;
+   case nir_address_format_vec2_index_32bit_offset:   return 3;
+   case nir_address_format_32bit_offset:              return 1;
+   case nir_address_format_logical:                   return 1;
     }
     unreachable("Invalid address format");
  }
@@ -4120,6 +4139,7 @@ void nir_lower_io_to_scalar(nir_shader *shader, nir_variable_mode mask);
  void nir_lower_io_to_scalar_early(nir_shader *shader, nir_variable_mode mask);
  bool nir_lower_io_to_vector(nir_shader *shader, nir_variable_mode mask);
  
+bool nir_lower_fragcolor(nir_shader *shader);
  void nir_lower_fragcoord_wtrans(nir_shader *shader);
  void nir_lower_viewport_transform(nir_shader *shader);
  bool nir_lower_uniforms_to_ubo(nir_shader *shader, int multiplier);
@@ -4133,6 +4153,7 @@ typedef struct nir_lower_subgroups_options {
     bool lower_subgroup_masks:1;
     bool lower_shuffle:1;
     bool lower_shuffle_to_32bit:1;
+   bool lower_shuffle_to_swizzle_amd:1;
     bool lower_quad:1;
     bool lower_quad_broadcast_dynamic:1;
     bool lower_quad_broadcast_dynamic_to_const:1;
@@ -4346,6 +4367,7 @@ bool nir_lower_clip_gs(nir_shader *shader, unsigned ucp_enables,
  bool nir_lower_clip_fs(nir_shader *shader, unsigned ucp_enables,
                         bool use_clipdist_array);
  bool nir_lower_clip_cull_distance_arrays(nir_shader *nir);
+bool nir_lower_clip_disable(nir_shader *shader, unsigned clip_plane_enable);
  
  void nir_lower_point_size_mov(nir_shader *shader,
                                const gl_state_index16 *pointsize_state_tokens);
@@ -4568,7 +4590,20 @@ bool nir_opt_load_store_vectorize(nir_shader *shader, nir_variable_mode modes,
                                    nir_should_vectorize_mem_func callback,
                                    nir_variable_mode robust_modes);
  
-void nir_schedule(nir_shader *shader, int threshold);
+typedef struct nir_schedule_options {
+   /* On some hardware with some stages the inputs and outputs to the shader
+    * share the same memory. In that case the scheduler needs to ensure that
+    * all output writes are scheduled after all of the input reads to avoid
+    * overwriting them. This is a bitmask of stages that need that.
+    */
+   unsigned stages_with_shared_io_memory;
+   /* The approximate amount of register pressure at which point the scheduler
+    * will try to reduce register usage.
+    */
+   int threshold;
+} nir_schedule_options;
+
+void nir_schedule(nir_shader *shader, const nir_schedule_options *options);
  
  void nir_strip(nir_shader *shader);