nv50/ir/nir: rework input output handling

author Karol Herbst <kherbst@redhat.com>

Mon, 15 Jun 2020 21:50:43 +0000 (23:50 +0200)

committer Marge Bot <eric+marge@anholt.net>

Mon, 22 Jun 2020 11:41:31 +0000 (11:41 +0000)
author Karol Herbst <kherbst@redhat.com>
Mon, 15 Jun 2020 21:50:43 +0000 (23:50 +0200)
committer Marge Bot <eric+marge@anholt.net>
Mon, 22 Jun 2020 11:41:31 +0000 (11:41 +0000)
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp

index 2eba4b888d1c5d925162728c8cc7bbcd87364944..e74828e0eae21ae202e3671cf4babfff4e48e027 100644 (file)
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp
@@ -894,7 +894,7 @@ calcSlots(const glsl_type *type, Program::Type stage, const shader_info &info,
     uint16_t slots;
     switch (stage) {
     case Program::TYPE_GEOMETRY:
-      slots = type->uniform_locations();
+      slots = type->count_attribute_slots(false);
        if (input)
           slots /= info.gs.vertices_in;
        break;
@@ -902,9 +902,9 @@ calcSlots(const glsl_type *type, Program::Type stage, const shader_info &info,
     case Program::TYPE_TESSELLATION_EVAL:
        // remove first dimension
        if (var->data.patch || (!input && stage == Program::TYPE_TESSELLATION_EVAL))
-         slots = type->uniform_locations();
+         slots = type->count_attribute_slots(false);
        else
-         slots = type->fields.array->uniform_locations();
+         slots = type->fields.array->count_attribute_slots(false);
        break;
     default:
        slots = type->count_attribute_slots(false);
@@ -914,6 +914,24 @@ calcSlots(const glsl_type *type, Program::Type stage, const shader_info &info,
     return slots;
  }
  
+static uint8_t
+getMaskForType(const glsl_type *type, uint8_t slot) {
+   uint16_t comp = type->without_array()->components();
+   comp = comp ? comp : 4;
+
+   if (glsl_base_type_is_64bit(type->without_array()->base_type)) {
+      comp *= 2;
+      if (comp > 4) {
+         if (slot % 2)
+            comp -= 4;
+         else
+            comp = 4;
+      }
+   }
+
+   return (1 << comp) - 1;
+}
+
  bool Converter::assignSlots() {
     unsigned name;
     unsigned index;
@@ -956,16 +974,8 @@ bool Converter::assignSlots() {
        const glsl_type *type = var->type;
        int slot = var->data.location;
        uint16_t slots = calcSlots(type, prog->getType(), nir->info, true, var);
-      uint32_t comp = type->is_array() ? type->without_array()->component_slots()
-                                       : type->component_slots();
-      uint32_t frac = var->data.location_frac;
        uint32_t vary = var->data.driver_location;
  
-      if (glsl_base_type_is_64bit(type->without_array()->base_type)) {
-         if (comp > 2)
-            slots *= 2;
-      }
-
        assert(vary + slots <= PIPE_MAX_SHADER_INPUTS);
  
        switch(prog->getType()) {
@@ -1006,17 +1016,12 @@ bool Converter::assignSlots() {
        }
  
        for (uint16_t i = 0u; i < slots; ++i, ++vary) {
-         info->in[vary].id = vary;
-         info->in[vary].patch = var->data.patch;
-         info->in[vary].sn = name;
-         info->in[vary].si = index + i;
-         if (glsl_base_type_is_64bit(type->without_array()->base_type))
-            if (i & 0x1)
-               info->in[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) >> 0x4);
-            else
-               info->in[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) & 0xf);
-         else
-            info->in[vary].mask |= ((1 << comp) - 1) << frac;
+         nv50_ir_varying *v = &info->in[vary];
+
+         v->patch = var->data.patch;
+         v->sn = name;
+         v->si = index + i;
+         v->mask |= getMaskForType(type, i) << var->data.location_frac;
        }
        info->numInputs = std::max<uint8_t>(info->numInputs, vary);
     }
@@ -1025,16 +1030,8 @@ bool Converter::assignSlots() {
        const glsl_type *type = var->type;
        int slot = var->data.location;
        uint16_t slots = calcSlots(type, prog->getType(), nir->info, false, var);
-      uint32_t comp = type->is_array() ? type->without_array()->component_slots()
-                                       : type->component_slots();
-      uint32_t frac = var->data.location_frac;
        uint32_t vary = var->data.driver_location;
  
-      if (glsl_base_type_is_64bit(type->without_array()->base_type)) {
-         if (comp > 2)
-            slots *= 2;
-      }
-
        assert(vary < PIPE_MAX_SHADER_OUTPUTS);
  
        switch(prog->getType()) {
@@ -1099,20 +1096,14 @@ bool Converter::assignSlots() {
        }
  
        for (uint16_t i = 0u; i < slots; ++i, ++vary) {
-         info->out[vary].id = vary;
-         info->out[vary].patch = var->data.patch;
-         info->out[vary].sn = name;
-         info->out[vary].si = index + i;
-         if (glsl_base_type_is_64bit(type->without_array()->base_type))
-            if (i & 0x1)
-               info->out[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) >> 0x4);
-            else
-               info->out[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) & 0xf);
-         else
-            info->out[vary].mask |= ((1 << comp) - 1) << frac;
+         nv50_ir_varying *v = &info->out[vary];
+         v->patch = var->data.patch;
+         v->sn = name;
+         v->si = index + i;
+         v->mask |= getMaskForType(type, i) << var->data.location_frac;
  
           if (nir->info.outputs_read & 1ull << slot)
-            info->out[vary].oread = 1;
+            v->oread = 1;
        }
        info->numOutputs = std::max<uint8_t>(info->numOutputs, vary);
     }
@@ -3280,7 +3271,7 @@ nvir_nir_shader_compiler_options(int chipset)
     op.lower_hadd = true; // TODO
     op.lower_add_sat = true; // TODO
     op.vectorize_io = false;
-   op.lower_to_scalar = true;
+   op.lower_to_scalar = false;
     op.unify_interfaces = false;
     op.use_interpolated_input_intrinsics = true;
     op.lower_mul_2x32_64 = true; // TODO
author	Karol Herbst <kherbst@redhat.com>
	Mon, 15 Jun 2020 21:50:43 +0000 (23:50 +0200)
committer	Marge Bot <eric+marge@anholt.net>
	Mon, 22 Jun 2020 11:41:31 +0000 (11:41 +0000)