draw,llvmpipe: use exponent manipulation instead of exp2 for polygon offset

author Roland Scheidegger <sroland@vmware.com>

Mon, 11 Nov 2013 15:11:59 +0000 (15:11 +0000)

committer Roland Scheidegger <sroland@vmware.com>

Tue, 12 Nov 2013 19:08:58 +0000 (19:08 +0000)
author Roland Scheidegger <sroland@vmware.com>
Mon, 11 Nov 2013 15:11:59 +0000 (15:11 +0000)
committer Roland Scheidegger <sroland@vmware.com>
Tue, 12 Nov 2013 19:08:58 +0000 (19:08 +0000)
diff --git a/src/gallium/auxiliary/draw/draw_pipe_offset.c b/src/gallium/auxiliary/draw/draw_pipe_offset.c

index 8071bc77b80f76f1cfc2dacbbc12b2c4487e93a1..34114035ac88b1717ff93ba3c97369fdd04f191e 100644 (file)
--- a/src/gallium/auxiliary/draw/draw_pipe_offset.c
+++ b/src/gallium/auxiliary/draw/draw_pipe_offset.c
@@ -90,18 +90,23 @@ static void do_offset_tri( struct draw_stage *stage,
     float dzdx = fabsf(a * inv_det);
     float dzdy = fabsf(b * inv_det);
  
-   float zoffset, maxz, bias, mult;
+   float zoffset, mult;
  
     mult = MAX2(dzdx, dzdy) * offset->scale;
  
     if (stage->draw->floating_point_depth) {
-      maxz = MAX3(v0[2], v1[2], v2[2]);
-
-      /**
-       * XXX: TODO optimize this to quickly resolve a pow2 number through
-       *      an exponent only operation.
-       */
-      bias = offset->units * util_fast_exp2(util_get_float32_exponent(maxz) - 23);
+      float bias;
+      union fi maxz;
+      maxz.f = MAX3(v0[2], v1[2], v2[2]);
+      /* just do the math directly on shifted number */
+      maxz.ui &= 0xff << 23;
+      maxz.i -= 23 << 23;
+      /* Clamping to zero means mrd will be zero for very small numbers,
+       * but specs do not indicate this should be prevented by clamping
+       * mrd to smallest normal number instead. */
+      maxz.i = MAX2(maxz.i, 0);
+
+      bias = offset->units * maxz.f;
        zoffset = bias + mult;
     } else {
        zoffset = offset->units + mult;
diff --git a/src/gallium/drivers/llvmpipe/lp_state_setup.c b/src/gallium/drivers/llvmpipe/lp_state_setup.c

index ccc9fb902f33ef6030d2e69d944de546c4d4b62d..1685ddce5ab9de2276aa25aec0ac5b0748660c61 100644 (file)
--- a/src/gallium/drivers/llvmpipe/lp_state_setup.c
+++ b/src/gallium/drivers/llvmpipe/lp_state_setup.c
@@ -31,6 +31,7 @@
  #include "util/u_simple_list.h"
  #include "os/os_time.h"
  #include "gallivm/lp_bld_arit.h"
+#include "gallivm/lp_bld_bitarit.h"
  #include "gallivm/lp_bld_const.h"
  #include "gallivm/lp_bld_debug.h"
  #include "gallivm/lp_bld_init.h"
@@ -268,8 +269,6 @@ lp_do_offset_tri(struct gallivm_state *gallivm,
     LLVMValueRef zeroi = lp_build_const_int32(gallivm, 0);
     LLVMValueRef twoi = lp_build_const_int32(gallivm, 2);
     LLVMValueRef threei  = lp_build_const_int32(gallivm, 3);
-   LLVMValueRef mantissa_bits, exp, bias;
-   LLVMValueRef maxz_value, maxz0z1_value;
  
     /* (res12) = cross(e,f).xy */
     shuffles[0] = twoi;
@@ -319,9 +318,13 @@ lp_do_offset_tri(struct gallivm_state *gallivm,
         *
         * NOTE: Assumes IEEE float32.
         */
+      LLVMValueRef c23_shifted, exp_mask, bias, exp;
+      LLVMValueRef maxz_value, maxz0z1_value;
+
        lp_build_context_init(&int_scalar_bld, gallivm, lp_type_int_vec(32, 32));
  
-      mantissa_bits = lp_build_const_int32(gallivm, 23);
+      c23_shifted = lp_build_const_int32(gallivm, 23 << 23);
+      exp_mask = lp_build_const_int32(gallivm, 0xff << 23);
  
        maxz0z1_value = lp_build_max(&flt_scalar_bld,
                           LLVMBuildExtractElement(b, attribv[0], twoi, ""),
@@ -331,15 +334,16 @@ lp_do_offset_tri(struct gallivm_state *gallivm,
                        LLVMBuildExtractElement(b, attribv[2], twoi, ""),
                        maxz0z1_value);
  
-      /**
-       * XXX: TODO optimize this to quickly resolve a pow2 number through
-       *      an exponent only operation.
-       */
-      exp = lp_build_extract_exponent(&flt_scalar_bld, maxz_value, 0);
-      exp = lp_build_sub(&int_scalar_bld, exp, mantissa_bits);
-      exp = lp_build_int_to_float(&flt_scalar_bld, exp);
+      exp = LLVMBuildBitCast(b, maxz_value, int_scalar_bld.vec_type, "");
+      exp = lp_build_and(&int_scalar_bld, exp, exp_mask);
+      exp = lp_build_sub(&int_scalar_bld, exp, c23_shifted);
+      /* Clamping to zero means mrd will be zero for very small numbers,
+       * but specs do not indicate this should be prevented by clamping
+       * mrd to smallest normal number instead. */
+      exp = lp_build_max(&int_scalar_bld, exp, int_scalar_bld.zero);
+      exp = LLVMBuildBitCast(b, exp, flt_scalar_bld.vec_type, "");
  
-      bias = LLVMBuildFMul(b, lp_build_exp2(&flt_scalar_bld, exp),
+      bias = LLVMBuildFMul(b, exp,
                             lp_build_const_float(gallivm, key->pgon_offset_units),
                             "bias");
author	Roland Scheidegger <sroland@vmware.com>
	Mon, 11 Nov 2013 15:11:59 +0000 (15:11 +0000)
committer	Roland Scheidegger <sroland@vmware.com>
	Tue, 12 Nov 2013 19:08:58 +0000 (19:08 +0000)
src/gallium/auxiliary/draw/draw_pipe_offset.c		patch | blob | history
src/gallium/drivers/llvmpipe/lp_state_setup.c		patch | blob | history