tgsi: clarify the semantics of DFRACEXP

author Nicolai Hähnle <nicolai.haehnle@amd.com>

Fri, 15 Sep 2017 16:34:48 +0000 (18:34 +0200)

committer Nicolai Hähnle <nicolai.haehnle@amd.com>

Fri, 29 Sep 2017 10:07:50 +0000 (12:07 +0200)
author Nicolai Hähnle <nicolai.haehnle@amd.com>
Fri, 15 Sep 2017 16:34:48 +0000 (18:34 +0200)
committer Nicolai Hähnle <nicolai.haehnle@amd.com>
Fri, 29 Sep 2017 10:07:50 +0000 (12:07 +0200)
diff --git a/src/gallium/auxiliary/tgsi/tgsi_exec.c b/src/gallium/auxiliary/tgsi/tgsi_exec.c

index 1264df0c622067dbe5a0ffc4cd8f011940598699..2a47f5dfaef1d4674bf4ba4be0e4eb04d4eca6d5 100644 (file)
--- a/src/gallium/auxiliary/tgsi/tgsi_exec.c
+++ b/src/gallium/auxiliary/tgsi/tgsi_exec.c
@@ -3688,17 +3688,15 @@ exec_dfracexp(struct tgsi_exec_machine *mach,
     union tgsi_double_channel dst;
     union tgsi_exec_channel dst_exp;
  
-   if (((inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_XY) == TGSI_WRITEMASK_XY)) {
-      fetch_double_channel(mach, &src, &inst->Src[0], TGSI_CHAN_X, TGSI_CHAN_Y);
-      micro_dfracexp(&dst, &dst_exp, &src);
+   fetch_double_channel(mach, &src, &inst->Src[0], TGSI_CHAN_X, TGSI_CHAN_Y);
+   micro_dfracexp(&dst, &dst_exp, &src);
+   if ((inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_XY) == TGSI_WRITEMASK_XY)
        store_double_channel(mach, &dst, &inst->Dst[0], inst, TGSI_CHAN_X, TGSI_CHAN_Y);
-      store_dest(mach, &dst_exp, &inst->Dst[1], inst, ffs(inst->Dst[1].Register.WriteMask) - 1, TGSI_EXEC_DATA_INT);
-   }
-   if (((inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_ZW) == TGSI_WRITEMASK_ZW)) {
-      fetch_double_channel(mach, &src, &inst->Src[0], TGSI_CHAN_Z, TGSI_CHAN_W);
-      micro_dfracexp(&dst, &dst_exp, &src);
+   if ((inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_ZW) == TGSI_WRITEMASK_ZW)
        store_double_channel(mach, &dst, &inst->Dst[0], inst, TGSI_CHAN_Z, TGSI_CHAN_W);
-      store_dest(mach, &dst_exp, &inst->Dst[1], inst, ffs(inst->Dst[1].Register.WriteMask) - 1, TGSI_EXEC_DATA_INT);
+   for (unsigned chan = 0; chan < TGSI_NUM_CHANNELS; chan++) {
+      if (inst->Dst[1].Register.WriteMask & (1 << chan))
+         store_dest(mach, &dst_exp, &inst->Dst[1], inst, chan, TGSI_EXEC_DATA_INT);
     }
  }
  
diff --git a/src/gallium/auxiliary/tgsi/tgsi_info_opcodes.h b/src/gallium/auxiliary/tgsi/tgsi_info_opcodes.h

index a4a97711750ccf267f4064376e45725b6ff21b5b..3f39afe21964630e0e62193138d881154ce0fc28 100644 (file)
--- a/src/gallium/auxiliary/tgsi/tgsi_info_opcodes.h
+++ b/src/gallium/auxiliary/tgsi/tgsi_info_opcodes.h
@@ -212,7 +212,7 @@ OPCODE(1, 1, COMP, DSQRT)
  OPCODE(1, 3, COMP, DMAD)
  OPCODE(1, 1, COMP, DFRAC)
  OPCODE(1, 2, COMP, DLDEXP)
-OPCODE(2, 1, COMP, DFRACEXP)
+OPCODE(2, 1, REPL, DFRACEXP)
  OPCODE(1, 1, COMP, D2I)
  OPCODE(1, 1, COMP, I2D)
  OPCODE(1, 1, COMP, D2U)
diff --git a/src/gallium/docs/source/tgsi.rst b/src/gallium/docs/source/tgsi.rst

index 8633c929b9f737e4935eb697aa01e9ed2150733c..fd78c40ba3cec388cd606506c040243d1f3b79be 100644 (file)
--- a/src/gallium/docs/source/tgsi.rst
+++ b/src/gallium/docs/source/tgsi.rst
@@ -1838,17 +1838,15 @@ two-component vectors with doubled precision in each component.
  
  Like the ``frexp()`` routine in many math libraries, this opcode stores the
  exponent of its source to ``dst0``, and the significand to ``dst1``, such that
-:math:`dst1 \times 2^{dst0} = src` .
+:math:`dst1 \times 2^{dst0} = src` . The results are replicated across
+channels.
  
  .. math::
  
-  dst0.xy = exp(src.xy)
+  dst0.xy = dst.zw = frac(src.xy)
  
-  dst1.xy = frac(src.xy)
+  dst1 = frac(src.xy)
  
-  dst0.zw = exp(src.zw)
-
-  dst1.zw = frac(src.zw)
  
  .. opcode:: DLDEXP - Multiply Number by Integral Power of 2
  
diff --git a/src/gallium/drivers/r600/r600_shader.c b/src/gallium/drivers/r600/r600_shader.c

index c9c922fc02b06ff5187e4f8c387825d2c5b6f4c7..188fbc9d47d66ec5bebcc1373431083f9a5b2287 100644 (file)
--- a/src/gallium/drivers/r600/r600_shader.c
+++ b/src/gallium/drivers/r600/r600_shader.c
@@ -4045,7 +4045,6 @@ static int tgsi_dfracexp(struct r600_shader_ctx *ctx)
         struct r600_bytecode_alu alu;
         unsigned write_mask = inst->Dst[0].Register.WriteMask;
         int i, j, r;
-       int firsti = write_mask == 0xc ? 2 : 0;
  
         for (i = 0; i <= 3; i++) {
                 memset(&alu, 0, sizeof(struct r600_bytecode_alu));
@@ -4066,15 +4065,18 @@ static int tgsi_dfracexp(struct r600_shader_ctx *ctx)
                         return r;
         }
  
-       /* MOV first two channels to writemask dst0 */
-       for (i = 0; i <= 1; i++) {
+       /* Replicate significand result across channels. */
+       for (i = 0; i <= 3; i++) {
+               if (!(write_mask & (1 << i)))
+                       continue;
+
                 memset(&alu, 0, sizeof(struct r600_bytecode_alu));
                 alu.op = ALU_OP1_MOV;
-               alu.src[0].chan = i + 2;
+               alu.src[0].chan = (i & 1) + 2;
                 alu.src[0].sel = ctx->temp_reg;
  
-               tgsi_dst(ctx, &inst->Dst[0], firsti + i, &alu.dst);
-               alu.dst.write = (inst->Dst[0].Register.WriteMask >> (firsti + i)) & 1;
+               tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst);
+               alu.dst.write = 1;
                 alu.last = 1;
                 r = r600_bytecode_add_alu(ctx->bc, &alu);
                 if (r)
author	Nicolai Hähnle <nicolai.haehnle@amd.com>
	Fri, 15 Sep 2017 16:34:48 +0000 (18:34 +0200)
committer	Nicolai Hähnle <nicolai.haehnle@amd.com>
	Fri, 29 Sep 2017 10:07:50 +0000 (12:07 +0200)
src/gallium/auxiliary/tgsi/tgsi_exec.c		patch \| blob \| history
src/gallium/auxiliary/tgsi/tgsi_info_opcodes.h		patch \| blob \| history
src/gallium/docs/source/tgsi.rst		patch \| blob \| history
src/gallium/drivers/r600/r600_shader.c		patch \| blob \| history