Merge remote-tracking branch 'mesa-public/master' into vulkan

[mesa.git] / src / mesa / drivers / dri / i965 / brw_shader.cpp
diff --git a/src/mesa/drivers/dri/i965/brw_shader.cpp b/src/mesa/drivers/dri/i965/brw_shader.cpp

index ebfb49acf8d70747f230baf9dfcd933fc87cd07f..06393c8ff2bb61343bcb56e77dfb3d8259fabec9 100644 (file)
--- a/src/mesa/drivers/dri/i965/brw_shader.cpp
+++ b/src/mesa/drivers/dri/i965/brw_shader.cpp
@@ -32,16 +32,106 @@
  #include "glsl/glsl_parser_extras.h"
  #include "main/shaderapi.h"
  
+static void
+shader_debug_log_mesa(void *data, const char *fmt, ...)
+{
+   struct brw_context *brw = (struct brw_context *)data; /* data is used as a brw_context */
+   va_list args;
+   /* Hand the printf-style message to _mesa_gl_vdebug as a shader-compiler notification. */
+   va_start(args, fmt);
+   GLuint msg_id = 0; /* non-static local: starts at 0 on every call */
+   _mesa_gl_vdebug(&brw->ctx, &msg_id,
+                   MESA_DEBUG_SOURCE_SHADER_COMPILER,
+                   MESA_DEBUG_TYPE_OTHER,
+                   MESA_DEBUG_SEVERITY_NOTIFICATION, fmt, args);
+   va_end(args);
+}
+
+static void
+shader_perf_log_mesa(void *data, const char *fmt, ...)
+{
+   struct brw_context *brw = (struct brw_context *)data;
+   /* Performance message sink: may print to stderr, report via _mesa_gl_vdebug, or both. */
+   va_list args;
+   va_start(args, fmt);
+   /* If DEBUG_PERF is set, print to stderr from a copy so `args` stays usable below. */
+   if (unlikely(INTEL_DEBUG & DEBUG_PERF)) {
+      va_list args_copy;
+      va_copy(args_copy, args);
+      vfprintf(stderr, fmt, args_copy);
+      va_end(args_copy);
+   }
+   /* If brw->perf_debug is set, report via _mesa_gl_vdebug (PERFORMANCE, MEDIUM). */
+   if (brw->perf_debug) {
+      GLuint msg_id = 0; /* non-static local: starts at 0 on every call */
+      _mesa_gl_vdebug(&brw->ctx, &msg_id,
+                      MESA_DEBUG_SOURCE_SHADER_COMPILER,
+                      MESA_DEBUG_TYPE_PERFORMANCE,
+                      MESA_DEBUG_SEVERITY_MEDIUM, fmt, args);
+   }
+   va_end(args);
+}
+
  struct brw_compiler *
  brw_compiler_create(void *mem_ctx, const struct brw_device_info *devinfo)
  {
     struct brw_compiler *compiler = rzalloc(mem_ctx, struct brw_compiler);
  
     compiler->devinfo = devinfo;
+   compiler->shader_debug_log = shader_debug_log_mesa; /* logging callbacks defined earlier in this file */
+   compiler->shader_perf_log = shader_perf_log_mesa;
  
     brw_fs_alloc_reg_sets(compiler);
     brw_vec4_alloc_reg_set(compiler);
  
+   if (devinfo->gen >= 8 && !(INTEL_DEBUG & DEBUG_VEC4VS))
+      compiler->scalar_vs = true; /* gen8+ only, and only when DEBUG_VEC4VS is not set */
+   /* One NIR options struct, allocated with `compiler` as the rzalloc context, is shared below. */
+   nir_shader_compiler_options *nir_options =
+      rzalloc(compiler, nir_shader_compiler_options);
+   nir_options->native_integers = true;
+   /* In order to help allow for better CSE at the NIR level we tell NIR
+    * to split all ffma instructions during opt_algebraic and we then
+    * re-combine them as a later step.
+    */
+   nir_options->lower_ffma = true;
+   nir_options->lower_sub = true;
+
+   /* For every stage: we want the GLSL compiler to emit code that uses condition codes */
+   for (int i = 0; i < MESA_SHADER_STAGES; i++) {
+      compiler->glsl_compiler_options[i].MaxUnrollIterations = 32;
+      compiler->glsl_compiler_options[i].MaxIfDepth =
+         devinfo->gen < 6 ? 16 : UINT_MAX;
+
+      compiler->glsl_compiler_options[i].EmitCondCodes = true;
+      compiler->glsl_compiler_options[i].EmitNoNoise = true;
+      compiler->glsl_compiler_options[i].EmitNoMainReturn = true;
+      compiler->glsl_compiler_options[i].EmitNoIndirectInput = true;
+      compiler->glsl_compiler_options[i].EmitNoIndirectOutput =
+        (i == MESA_SHADER_FRAGMENT); /* fragment only here; vertex may be overridden below */
+      compiler->glsl_compiler_options[i].EmitNoIndirectTemp =
+        (i == MESA_SHADER_FRAGMENT); /* fragment only here; vertex may be overridden below */
+      compiler->glsl_compiler_options[i].EmitNoIndirectUniform = false;
+      compiler->glsl_compiler_options[i].LowerClipDistance = true;
+   }
+   /* OptimizeForAOS is set for vertex and geometry; the scalar VS case below clears it. */
+   compiler->glsl_compiler_options[MESA_SHADER_VERTEX].OptimizeForAOS = true;
+   compiler->glsl_compiler_options[MESA_SHADER_GEOMETRY].OptimizeForAOS = true;
+
+   if (compiler->scalar_vs) {
+      /* If we're using the scalar backend for vertex shaders, set
+       * EmitNoIndirectOutput/Temp, clear OptimizeForAOS, and attach NIR options.
+       */
+      compiler->glsl_compiler_options[MESA_SHADER_VERTEX].EmitNoIndirectOutput = true;
+      compiler->glsl_compiler_options[MESA_SHADER_VERTEX].EmitNoIndirectTemp = true;
+      compiler->glsl_compiler_options[MESA_SHADER_VERTEX].OptimizeForAOS = false;
+
+      compiler->glsl_compiler_options[MESA_SHADER_VERTEX].NirOptions = nir_options;
+   }
+   /* Fragment and compute receive the NIR options regardless of scalar_vs. */
+   compiler->glsl_compiler_options[MESA_SHADER_FRAGMENT].NirOptions = nir_options;
+   compiler->glsl_compiler_options[MESA_SHADER_COMPUTE].NirOptions = nir_options;
+
     return compiler;
  }
  
@@ -97,7 +187,7 @@ is_scalar_shader_stage(struct brw_context *brw, int stage)
     case MESA_SHADER_FRAGMENT:
        return true;
     case MESA_SHADER_VERTEX:
-      return brw->scalar_vs;
+      return brw->intelScreen->compiler->scalar_vs;
     default:
        return false;
     }
@@ -632,6 +722,8 @@ brw_instruction_name(enum opcode op)
        return "gs_ff_sync_set_primitives";
     case CS_OPCODE_CS_TERMINATE:
        return "cs_terminate";
+   case SHADER_OPCODE_BARRIER:
+      return "barrier";
     }
  
     unreachable("not reached");
@@ -755,19 +847,22 @@ brw_abs_immediate(enum brw_reg_type type, struct brw_reg *reg)
     return false;
  }
  
-backend_visitor::backend_visitor(struct brw_context *brw,
-                                 struct gl_shader_program *shader_prog,
-                                 struct gl_program *prog,
-                                 struct brw_stage_prog_data *stage_prog_data,
-                                 gl_shader_stage stage)
-   : brw(brw),
-     devinfo(brw->intelScreen->devinfo),
-     ctx(&brw->ctx),
+backend_shader::backend_shader(const struct brw_compiler *compiler,
+                               void *log_data,
+                               void *mem_ctx,
+                               struct gl_shader_program *shader_prog,
+                               struct gl_program *prog,
+                               struct brw_stage_prog_data *stage_prog_data,
+                               gl_shader_stage stage)
+   : compiler(compiler),
+     log_data(log_data),
+     devinfo(compiler->devinfo),
       shader(shader_prog ?
          (struct brw_shader *)shader_prog->_LinkedShaders[stage] : NULL),
       shader_prog(shader_prog),
       prog(prog),
       stage_prog_data(stage_prog_data),
+     mem_ctx(mem_ctx),
       cfg(NULL),
       stage(stage)
  {
@@ -950,7 +1045,6 @@ backend_instruction::can_do_saturate() const
     case BRW_OPCODE_LINE:
     case BRW_OPCODE_LRP:
     case BRW_OPCODE_MAC:
-   case BRW_OPCODE_MACH:
     case BRW_OPCODE_MAD:
     case BRW_OPCODE_MATH:
     case BRW_OPCODE_MOV:
@@ -1060,6 +1154,7 @@ backend_instruction::has_side_effects() const
     case SHADER_OPCODE_MEMORY_FENCE:
     case SHADER_OPCODE_URB_WRITE_SIMD8:
     case FS_OPCODE_FB_WRITE:
+   case SHADER_OPCODE_BARRIER:
        return true;
     default:
        return false;
@@ -1148,13 +1243,13 @@ backend_instruction::remove(bblock_t *block)
  }
  
  void
-backend_visitor::dump_instructions()
+backend_shader::dump_instructions() /* no-argument form: forwards NULL to dump_instructions(name) */
  {
     dump_instructions(NULL);
  }
  
  void
-backend_visitor::dump_instructions(const char *name)
+backend_shader::dump_instructions(const char *name)
  {
     FILE *file = stderr;
     if (name && geteuid() != 0) {
@@ -1183,7 +1278,7 @@ backend_visitor::dump_instructions(const char *name)
  }
  
  void
-backend_visitor::calculate_cfg()
+backend_shader::calculate_cfg()
  {
     if (this->cfg)
        return;
@@ -1191,7 +1286,7 @@ backend_visitor::calculate_cfg()
  }
  
  void
-backend_visitor::invalidate_cfg()
+backend_shader::invalidate_cfg()
  {
     ralloc_free(this->cfg);
     this->cfg = NULL;
@@ -1206,7 +1301,7 @@ backend_visitor::invalidate_cfg()
   * trigger some of our asserts that surface indices are < BRW_MAX_SURFACES.
   */
  void
-backend_visitor::assign_common_binding_table_offsets(uint32_t next_binding_table_offset)
+backend_shader::assign_common_binding_table_offsets(uint32_t next_binding_table_offset)
  {
     int num_textures = _mesa_fls(prog->SamplersUsed);