freedreno/ir3: move per-generation compiler config

author Rob Clark <robdclark@gmail.com>

Fri, 10 Aug 2018 12:48:25 +0000 (08:48 -0400)

committer Rob Clark <robdclark@gmail.com>

Tue, 14 Aug 2018 21:59:02 +0000 (17:59 -0400)
author Rob Clark <robdclark@gmail.com>
Fri, 10 Aug 2018 12:48:25 +0000 (08:48 -0400)
committer Rob Clark <robdclark@gmail.com>
Tue, 14 Aug 2018 21:59:02 +0000 (17:59 -0400)
diff --git a/src/gallium/drivers/freedreno/ir3/ir3_compiler.c b/src/gallium/drivers/freedreno/ir3/ir3_compiler.c

index ff4d1b09ea8bcfd41920233f6e849076c5ad9179..c8bf0d2229adfd42ba1eba399a4092ae7af8c417 100644 (file)
--- a/src/gallium/drivers/freedreno/ir3/ir3_compiler.c
+++ b/src/gallium/drivers/freedreno/ir3/ir3_compiler.c
@@ -33,8 +33,26 @@
  struct ir3_compiler * ir3_compiler_create(struct fd_device *dev, uint32_t gpu_id)
  {
         struct ir3_compiler *compiler = rzalloc(NULL, struct ir3_compiler);
+
         compiler->dev = dev;
         compiler->gpu_id = gpu_id;
         compiler->set = ir3_ra_alloc_reg_set(compiler);
+
+       if (compiler->gpu_id >= 400) {
+               /* gpu_id >= 400: "flat" needs special handling (flat_bypass only) */
+               compiler->flat_bypass = true;
+               compiler->levels_add_one = false;
+               compiler->unminify_coords = false;
+               compiler->txf_ms_with_isaml = false;
+               compiler->array_index_add_half = true;
+       } else {
+               /* gpu_id < 400: no special handling for "flat" (flat_bypass only) */
+               compiler->flat_bypass = false;
+               compiler->levels_add_one = true;
+               compiler->unminify_coords = true;
+               compiler->txf_ms_with_isaml = true;
+               compiler->array_index_add_half = false;
+       }
+
         return compiler;
  }
diff --git a/src/gallium/drivers/freedreno/ir3/ir3_compiler.h b/src/gallium/drivers/freedreno/ir3/ir3_compiler.h

index 671332e816d5f1a4a123524e70b69b348bc4bd29..c19ab1d7b02dcf921ae32c6c8a1b3c8402f51a3f 100644 (file)
--- a/src/gallium/drivers/freedreno/ir3/ir3_compiler.h
+++ b/src/gallium/drivers/freedreno/ir3/ir3_compiler.h
@@ -38,6 +38,33 @@ struct ir3_compiler {
         uint32_t gpu_id;
         struct ir3_ra_reg_set *set;
         uint32_t shader_count;
+
+       /*
+        * Configuration options for things that are handled differently on
+        * different generations:
+        */
+
+       /* a4xx (and later) drops SP_FS_FLAT_SHAD_MODE_REG_* for flat-interpolate
+        * so we need to use ldlv.u32 to load the varying directly:
+        */
+       bool flat_bypass;
+
+       /* on a3xx, we need to add one to # of array levels:
+        */
+       bool levels_add_one;
+
+       /* on a3xx, we need to scale up integer coords for isaml based
+        * on LoD:
+        */
+       bool unminify_coords;
+
+       /* on a3xx do txf_ms w/ isaml and scaled coords: */
+       bool txf_ms_with_isaml;
+
+       /* on a4xx, for array textures we need to add 0.5 to the array
+        * index coordinate:
+        */
+       bool array_index_add_half;
  };
  
  struct ir3_compiler * ir3_compiler_create(struct fd_device *dev, uint32_t gpu_id);
diff --git a/src/gallium/drivers/freedreno/ir3/ir3_compiler_nir.c b/src/gallium/drivers/freedreno/ir3/ir3_compiler_nir.c

index 6eb1e03e025f7353d84200a02af94480df322231..cffb8238b7039e0d96fd1614e5bc6a194d6e644f 100644 (file)
--- a/src/gallium/drivers/freedreno/ir3/ir3_compiler_nir.c
+++ b/src/gallium/drivers/freedreno/ir3/ir3_compiler_nir.c
@@ -104,28 +104,6 @@ struct ir3_context {
          */
         struct hash_table *block_ht;
  
-       /* a4xx (at least patchlevel 0) cannot seem to flat-interpolate
-        * so we need to use ldlv.u32 to load the varying directly:
-        */
-       bool flat_bypass;
-
-       /* on a3xx, we need to add one to # of array levels:
-        */
-       bool levels_add_one;
-
-       /* on a3xx, we need to scale up integer coords for isaml based
-        * on LoD:
-        */
-       bool unminify_coords;
-
-       /* on a3xx do txf_ms w/ isaml and scaled coords: */
-       bool txf_ms_with_isaml;
-
-       /* on a4xx, for array textures we need to add 0.5 to the array
-        * index coordinate:
-        */
-       bool array_index_add_half;
-
         /* on a4xx, bitmask of samplers which need astc+srgb workaround: */
         unsigned astc_srgb;
  
@@ -156,13 +134,6 @@ compile_init(struct ir3_compiler *compiler,
         struct ir3_context *ctx = rzalloc(NULL, struct ir3_context);
  
         if (compiler->gpu_id >= 400) {
-               /* need special handling for "flat" */
-               ctx->flat_bypass = true;
-               ctx->levels_add_one = false;
-               ctx->unminify_coords = false;
-               ctx->txf_ms_with_isaml = false;
-               ctx->array_index_add_half = true;
-
                 if (so->type == SHADER_VERTEX) {
                         ctx->astc_srgb = so->key.vastc_srgb;
                 } else if (so->type == SHADER_FRAGMENT) {
@@ -170,13 +141,6 @@ compile_init(struct ir3_compiler *compiler,
                 }
  
         } else {
-               /* no special handling for "flat" */
-               ctx->flat_bypass = false;
-               ctx->levels_add_one = true;
-               ctx->unminify_coords = true;
-               ctx->txf_ms_with_isaml = true;
-               ctx->array_index_add_half = false;
-
                 if (so->type == SHADER_VERTEX) {
                         ctx->samples = so->key.vsamples;
                 } else if (so->type == SHADER_FRAGMENT) {
@@ -2098,7 +2062,7 @@ emit_intrinsic_image_size(struct ir3_context *ctx, nir_intrinsic_instr *intr,
                 dst[i] = tmp[i];
  
         if (flags & IR3_INSTR_A) {
-               if (ctx->levels_add_one) {
+               if (ctx->compiler->levels_add_one) {
                         dst[ncoords-1] = ir3_ADD_U(b, tmp[3], 0, create_immed(b, 1), 0);
                 } else {
                         dst[ncoords-1] = ir3_MOV(b, tmp[3], TYPE_U32);
@@ -2731,7 +2695,7 @@ emit_tex(struct ir3_context *ctx, nir_tex_instr *tex)
          * with scaled x coord according to requested sample:
          */
         if (tex->op == nir_texop_txf_ms) {
-               if (ctx->txf_ms_with_isaml) {
+               if (ctx->compiler->txf_ms_with_isaml) {
                         /* the samples are laid out in x dimension as
                          *     0 1 2 3
                          * x_ms = (x << ms) + sample_index;
@@ -2749,7 +2713,7 @@ emit_tex(struct ir3_context *ctx, nir_tex_instr *tex)
         }
  
         /* scale up integer coords for TXF based on the LOD */
-       if (ctx->unminify_coords && (opc == OPC_ISAML)) {
+       if (ctx->compiler->unminify_coords && (opc == OPC_ISAML)) {
                 assert(has_lod);
                 for (i = 0; i < coords; i++)
                         src0[i] = ir3_SHL_B(b, src0[i], 0, lod, 0);
@@ -2770,7 +2734,7 @@ emit_tex(struct ir3_context *ctx, nir_tex_instr *tex)
                 struct ir3_instruction *idx = coord[coords];
  
                 /* the array coord for cube arrays needs 0.5 added to it */
-               if (ctx->array_index_add_half && (opc != OPC_ISAML))
+               if (ctx->compiler->array_index_add_half && (opc != OPC_ISAML))
                         idx = ir3_ADD_F(b, idx, 0, create_immed(b, fui(0.5)), 0);
  
                 src0[nsrc0++] = idx;
@@ -2899,7 +2863,7 @@ emit_tex_query_levels(struct ir3_context *ctx, nir_tex_instr *tex)
         /* The # of levels comes from getinfo.z. We need to add 1 to it, since
          * the value in TEX_CONST_0 is zero-based.
          */
-       if (ctx->levels_add_one)
+       if (ctx->compiler->levels_add_one)
                 dst[0] = ir3_ADD_U(b, dst[0], 0, create_immed(b, 1), 0);
  
         put_dst(ctx, &tex->dest);
@@ -2939,7 +2903,7 @@ emit_tex_txs(struct ir3_context *ctx, nir_tex_instr *tex)
          * returned, which means that we have to add 1 to it for arrays.
          */
         if (tex->is_array) {
-               if (ctx->levels_add_one) {
+               if (ctx->compiler->levels_add_one) {
                         dst[coords] = ir3_ADD_U(b, dst[3], 0, create_immed(b, 1), 0);
                 } else {
                         dst[coords] = ir3_MOV(b, dst[3], TYPE_U32);
@@ -3322,7 +3286,7 @@ setup_input(struct ir3_context *ctx, nir_variable *in)
                                         }
                                 }
  
-                               if (ctx->flat_bypass) {
+                               if (ctx->compiler->flat_bypass) {
                                         if ((so->inputs[n].interpolate == INTERP_MODE_FLAT) ||
                                                         (so->inputs[n].rasterflat && ctx->so->key.rasterflat))
                                                 use_ldlv = true;
author	Rob Clark <robdclark@gmail.com>
	Fri, 10 Aug 2018 12:48:25 +0000 (08:48 -0400)
committer	Rob Clark <robdclark@gmail.com>
	Tue, 14 Aug 2018 21:59:02 +0000 (17:59 -0400)
src/gallium/drivers/freedreno/ir3/ir3_compiler.c		patch | blob | history
src/gallium/drivers/freedreno/ir3/ir3_compiler.h		patch | blob | history
src/gallium/drivers/freedreno/ir3/ir3_compiler_nir.c		patch | blob | history