util: don't include p_defines.h and u_pointer.h from gallium

[mesa.git] / src / gallium / auxiliary / gallivm / lp_bld_arit.h
diff --git a/src/gallium/auxiliary/gallivm/lp_bld_arit.h b/src/gallium/auxiliary/gallivm/lp_bld_arit.h

index aeb987ff3524a5a6ef973277428969affdabce5d..862f8f6acda73497c29b473a539bb795c02dcbb2 100644 (file)
--- a/src/gallium/auxiliary/gallivm/lp_bld_arit.h
+++ b/src/gallium/auxiliary/gallivm/lp_bld_arit.h
@@ -38,10 +38,12 @@
  
  
  #include "gallivm/lp_bld.h"
+#include "pipe/p_compiler.h"
  
  
  struct lp_type;
  struct lp_build_context;
+struct gallivm_state;
  
  
  /**
@@ -57,19 +59,43 @@ lp_build_add(struct lp_build_context *bld,
               LLVMValueRef b);
  
  LLVMValueRef
-lp_build_sum_vector(struct lp_build_context *bld,
-                    LLVMValueRef a);
+lp_build_horizontal_add(struct lp_build_context *bld,
+                        LLVMValueRef a);
+
+LLVMValueRef
+lp_build_hadd_partial4(struct lp_build_context *bld,
+                       LLVMValueRef vectors[],
+                       unsigned num_vecs);
  
  LLVMValueRef
  lp_build_sub(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+
+LLVMValueRef
+lp_build_mul_norm(struct gallivm_state *gallivm,
+                  struct lp_type wide_type,
+                  LLVMValueRef a,
+                  LLVMValueRef b);
+
  LLVMValueRef
  lp_build_mul(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+LLVMValueRef
+lp_build_mul_32_lohi_cpu(struct lp_build_context *bld,
+                         LLVMValueRef a,
+                         LLVMValueRef b,
+                         LLVMValueRef *res_hi);
+
+LLVMValueRef
+lp_build_mul_32_lohi(struct lp_build_context *bld,
+                     LLVMValueRef a,
+                     LLVMValueRef b,
+                     LLVMValueRef *res_hi);
+
  LLVMValueRef
  lp_build_mul_imm(struct lp_build_context *bld,
                   LLVMValueRef a,
@@ -80,17 +106,42 @@ lp_build_div(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+
+/* llvm.fmuladd.* intrinsic */
  LLVMValueRef
-lp_build_lerp(struct lp_build_context *bld,
-              LLVMValueRef x,
-              LLVMValueRef v0,
-              LLVMValueRef v1);
+lp_build_fmuladd(LLVMBuilderRef builder,
+                 LLVMValueRef a,
+                 LLVMValueRef b,
+                 LLVMValueRef c);
+
+/* a * b + c */
+LLVMValueRef
+lp_build_mad(struct lp_build_context *bld,
+             LLVMValueRef a,
+             LLVMValueRef b,
+             LLVMValueRef c);
+
  
  /**
- * Bilinear interpolation.
+ * Set when the weights for normalized are prescaled, that is, in range
+ * 0..2**n, as opposed to range 0..2**(n-1).
+ */
+#define LP_BLD_LERP_PRESCALED_WEIGHTS (1 << 0)
+
+/**
+ * Used internally when using wide intermediates for normalized lerps.
   *
- * Values indices are in v_{yx}.
+ * Do not use.
   */
+#define LP_BLD_LERP_WIDE_NORMALIZED (1 << 1)
+
+LLVMValueRef
+lp_build_lerp(struct lp_build_context *bld,
+              LLVMValueRef x,
+              LLVMValueRef v0,
+              LLVMValueRef v1,
+              unsigned flags);
+
  LLVMValueRef
  lp_build_lerp_2d(struct lp_build_context *bld,
                   LLVMValueRef x,
@@ -98,24 +149,79 @@ lp_build_lerp_2d(struct lp_build_context *bld,
                   LLVMValueRef v00,
                   LLVMValueRef v01,
                   LLVMValueRef v10,
-                 LLVMValueRef v11);
+                 LLVMValueRef v11,
+                 unsigned flags);
+
+LLVMValueRef
+lp_build_lerp_3d(struct lp_build_context *bld,
+                 LLVMValueRef x,
+                 LLVMValueRef y,
+                 LLVMValueRef z,
+                 LLVMValueRef v000,
+                 LLVMValueRef v001,
+                 LLVMValueRef v010,
+                 LLVMValueRef v011,
+                 LLVMValueRef v100,
+                 LLVMValueRef v101,
+                 LLVMValueRef v110,
+                 LLVMValueRef v111,
+                 unsigned flags);
+
+/**
+ * Specifies floating point NaN behavior.
+ */
+enum gallivm_nan_behavior {
+   /* Results are undefined with NaN. Results in fastest code */
+   GALLIVM_NAN_BEHAVIOR_UNDEFINED,
+   /* If one of the inputs is NaN, NaN is returned */
+   GALLIVM_NAN_RETURN_NAN,
+   /* If one of the inputs is NaN, the other operand is returned */
+   GALLIVM_NAN_RETURN_OTHER,
+   /* If one of the inputs is NaN, the other operand is returned,
+    * but we guarantee the second operand is not a NaN.
+    * In min/max it will be as fast as undefined with sse opcodes,
+    * and archs having native return_other can benefit too. */
+   GALLIVM_NAN_RETURN_OTHER_SECOND_NONNAN,
+   /* If one of the inputs is NaN, NaN is returned,
+    * but we guarantee the first operand is not a NaN.
+    * In min/max it will be as fast as undefined with sse opcodes,
+    * and archs having native return_nan can benefit too. */
+   GALLIVM_NAN_RETURN_NAN_FIRST_NONNAN,
+
+};
  
  LLVMValueRef
  lp_build_min(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+LLVMValueRef
+lp_build_min_ext(struct lp_build_context *bld,
+                 LLVMValueRef a,
+                 LLVMValueRef b,
+                 enum gallivm_nan_behavior nan_behavior);
+
  LLVMValueRef
  lp_build_max(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+LLVMValueRef
+lp_build_max_ext(struct lp_build_context *bld,
+                 LLVMValueRef a,
+                 LLVMValueRef b,
+                 enum gallivm_nan_behavior nan_behavior);
+
  LLVMValueRef
  lp_build_clamp(struct lp_build_context *bld,
                 LLVMValueRef a,
                 LLVMValueRef min,
                 LLVMValueRef max);
  
+LLVMValueRef
+lp_build_clamp_zero_one_nanzero(struct lp_build_context *bld,
+                                LLVMValueRef a);
+
  LLVMValueRef
  lp_build_abs(struct lp_build_context *bld,
               LLVMValueRef a);
@@ -156,6 +262,10 @@ LLVMValueRef
  lp_build_fract(struct lp_build_context *bld,
                 LLVMValueRef a);
  
+LLVMValueRef
+lp_build_fract_safe(struct lp_build_context *bld,
+                    LLVMValueRef a);
+
  LLVMValueRef
  lp_build_ifloor(struct lp_build_context *bld,
                  LLVMValueRef a);
@@ -177,6 +287,12 @@ lp_build_ifloor_fract(struct lp_build_context *bld,
                        LLVMValueRef *out_ipart,
                        LLVMValueRef *out_fpart);
  
+void
+lp_build_ifloor_fract_safe(struct lp_build_context *bld,
+                           LLVMValueRef a,
+                           LLVMValueRef *out_ipart,
+                           LLVMValueRef *out_fpart);
+
  LLVMValueRef
  lp_build_sqrt(struct lp_build_context *bld,
                LLVMValueRef a);
@@ -189,6 +305,19 @@ LLVMValueRef
  lp_build_rsqrt(struct lp_build_context *bld,
                 LLVMValueRef a);
  
+boolean
+lp_build_fast_rsqrt_available(struct lp_type type);
+
+LLVMValueRef
+lp_build_fast_rsqrt(struct lp_build_context *bld,
+                    LLVMValueRef a);
+
+LLVMValueRef
+lp_build_polynomial(struct lp_build_context *bld,
+                    LLVMValueRef x,
+                    const double *coeffs,
+                    unsigned num_coeffs);
+
  LLVMValueRef
  lp_build_cos(struct lp_build_context *bld,
               LLVMValueRef a);
@@ -210,6 +339,10 @@ LLVMValueRef
  lp_build_log(struct lp_build_context *bld,
               LLVMValueRef a);
  
+LLVMValueRef
+lp_build_log_safe(struct lp_build_context *bld,
+                  LLVMValueRef a);
+
  LLVMValueRef
  lp_build_exp2(struct lp_build_context *bld,
                LLVMValueRef a);
@@ -227,6 +360,10 @@ LLVMValueRef
  lp_build_log2(struct lp_build_context *bld,
                LLVMValueRef a);
  
+LLVMValueRef
+lp_build_log2_safe(struct lp_build_context *bld,
+                   LLVMValueRef a);
+
  LLVMValueRef
  lp_build_fast_log2(struct lp_build_context *bld,
                     LLVMValueRef a);
@@ -235,23 +372,42 @@ LLVMValueRef
  lp_build_ilog2(struct lp_build_context *bld,
                 LLVMValueRef x);
  
-void
-lp_build_exp2_approx(struct lp_build_context *bld,
-                     LLVMValueRef x,
-                     LLVMValueRef *p_exp2_int_part,
-                     LLVMValueRef *p_frac_part,
-                     LLVMValueRef *p_exp2);
-
  void
  lp_build_log2_approx(struct lp_build_context *bld,
                       LLVMValueRef x,
                       LLVMValueRef *p_exp,
                       LLVMValueRef *p_floor_log2,
-                     LLVMValueRef *p_log2);
+                     LLVMValueRef *p_log2,
+                     boolean handle_nans);
  
  LLVMValueRef
  lp_build_mod(struct lp_build_context *bld,
               LLVMValueRef x,
               LLVMValueRef y);
  
+LLVMValueRef
+lp_build_isnan(struct lp_build_context *bld,
+               LLVMValueRef x);
+
+LLVMValueRef
+lp_build_isfinite(struct lp_build_context *bld,
+                  LLVMValueRef x);
+
+
+LLVMValueRef
+lp_build_is_inf_or_nan(struct gallivm_state *gallivm,
+                       const struct lp_type type,
+                       LLVMValueRef x);
+
+
+LLVMValueRef
+lp_build_fpstate_get(struct gallivm_state *gallivm);
+
+void
+lp_build_fpstate_set_denorms_zero(struct gallivm_state *gallivm,
+                                  boolean zero);
+void
+lp_build_fpstate_set(struct gallivm_state *gallivm,
+                     LLVMValueRef mxcsr);
+
  #endif /* !LP_BLD_ARIT_H */