util: Move gallium's PIPE_FORMAT utils to /util/format/

[mesa.git] / src / gallium / auxiliary / gallivm / lp_bld_arit.h
diff --git a/src/gallium/auxiliary/gallivm/lp_bld_arit.h b/src/gallium/auxiliary/gallivm/lp_bld_arit.h

index 31efa9921ce61739397bc9db585485006ea2ab5b..f5b2800a2cf2118546ad9368b254852db804927e 100644 (file)
--- a/src/gallium/auxiliary/gallivm/lp_bld_arit.h
+++ b/src/gallium/auxiliary/gallivm/lp_bld_arit.h
@@ -42,6 +42,7 @@
  
  struct lp_type;
  struct lp_build_context;
+struct gallivm_state;
  
  
  /**
@@ -57,19 +58,43 @@ lp_build_add(struct lp_build_context *bld,
               LLVMValueRef b);
  
  LLVMValueRef
-lp_build_sum_vector(struct lp_build_context *bld,
-                    LLVMValueRef a);
+lp_build_horizontal_add(struct lp_build_context *bld,
+                        LLVMValueRef a);
+
+LLVMValueRef
+lp_build_hadd_partial4(struct lp_build_context *bld,
+                       LLVMValueRef vectors[],
+                       unsigned num_vecs);
  
  LLVMValueRef
  lp_build_sub(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+
+LLVMValueRef
+lp_build_mul_norm(struct gallivm_state *gallivm,
+                  struct lp_type wide_type,
+                  LLVMValueRef a,
+                  LLVMValueRef b);
+
  LLVMValueRef
  lp_build_mul(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+LLVMValueRef
+lp_build_mul_32_lohi_cpu(struct lp_build_context *bld,
+                         LLVMValueRef a,
+                         LLVMValueRef b,
+                         LLVMValueRef *res_hi);
+
+LLVMValueRef
+lp_build_mul_32_lohi(struct lp_build_context *bld,
+                     LLVMValueRef a,
+                     LLVMValueRef b,
+                     LLVMValueRef *res_hi);
+
  LLVMValueRef
  lp_build_mul_imm(struct lp_build_context *bld,
                   LLVMValueRef a,
@@ -80,17 +105,42 @@ lp_build_div(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+
+/* llvm.fmuladd.* intrinsic */
  LLVMValueRef
-lp_build_lerp(struct lp_build_context *bld,
-              LLVMValueRef x,
-              LLVMValueRef v0,
-              LLVMValueRef v1);
+lp_build_fmuladd(LLVMBuilderRef builder,
+                 LLVMValueRef a,
+                 LLVMValueRef b,
+                 LLVMValueRef c);
+
+/* a * b + c */
+LLVMValueRef
+lp_build_mad(struct lp_build_context *bld,
+             LLVMValueRef a,
+             LLVMValueRef b,
+             LLVMValueRef c);
+
+
+/**
+ * Set when the weights for normalized lerps are prescaled, that is, in
+ * range 0..2**n, as opposed to range 0..(2**n)-1.
+ */
+#define LP_BLD_LERP_PRESCALED_WEIGHTS (1 << 0)
  
  /**
- * Bilinear interpolation.
+ * Used internally when using wide intermediates for normalized lerps.
   *
- * Values indices are in v_{yx}.
+ * Do not use.
   */
+#define LP_BLD_LERP_WIDE_NORMALIZED (1 << 1)
+
+LLVMValueRef
+lp_build_lerp(struct lp_build_context *bld,
+              LLVMValueRef x,
+              LLVMValueRef v0,
+              LLVMValueRef v1,
+              unsigned flags);
+
  LLVMValueRef
  lp_build_lerp_2d(struct lp_build_context *bld,
                   LLVMValueRef x,
@@ -98,24 +148,79 @@ lp_build_lerp_2d(struct lp_build_context *bld,
                   LLVMValueRef v00,
                   LLVMValueRef v01,
                   LLVMValueRef v10,
-                 LLVMValueRef v11);
+                 LLVMValueRef v11,
+                 unsigned flags);
+
+LLVMValueRef
+lp_build_lerp_3d(struct lp_build_context *bld,
+                 LLVMValueRef x,
+                 LLVMValueRef y,
+                 LLVMValueRef z,
+                 LLVMValueRef v000,
+                 LLVMValueRef v001,
+                 LLVMValueRef v010,
+                 LLVMValueRef v011,
+                 LLVMValueRef v100,
+                 LLVMValueRef v101,
+                 LLVMValueRef v110,
+                 LLVMValueRef v111,
+                 unsigned flags);
+
+/**
+ * Specifies how a floating point operation behaves when an input is NaN.
+ */
+enum gallivm_nan_behavior {
+   /* The result is undefined if an input is NaN. Yields the fastest code. */
+   GALLIVM_NAN_BEHAVIOR_UNDEFINED,
+   /* If one of the inputs is NaN, NaN is returned. */
+   GALLIVM_NAN_RETURN_NAN,
+   /* If one of the inputs is NaN, the other operand is returned. */
+   GALLIVM_NAN_RETURN_OTHER,
+   /* If one of the inputs is NaN, the other operand is returned,
+    * with the guarantee that the second operand is not a NaN.
+    * In min/max this is as fast as undefined with SSE opcodes,
+    * and archs with a native return_other can benefit too. */
+   GALLIVM_NAN_RETURN_OTHER_SECOND_NONNAN,
+   /* If one of the inputs is NaN, NaN is returned,
+    * with the guarantee that the first operand is not a NaN.
+    * In min/max this is as fast as undefined with SSE opcodes,
+    * and archs with a native return_nan can benefit too. */
+   GALLIVM_NAN_RETURN_NAN_FIRST_NONNAN,
+
+};
  
  LLVMValueRef
  lp_build_min(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+LLVMValueRef
+lp_build_min_ext(struct lp_build_context *bld,
+                 LLVMValueRef a,
+                 LLVMValueRef b,
+                 enum gallivm_nan_behavior nan_behavior);
+
  LLVMValueRef
  lp_build_max(struct lp_build_context *bld,
               LLVMValueRef a,
               LLVMValueRef b);
  
+LLVMValueRef
+lp_build_max_ext(struct lp_build_context *bld,
+                 LLVMValueRef a,
+                 LLVMValueRef b,
+                 enum gallivm_nan_behavior nan_behavior);
+
  LLVMValueRef
  lp_build_clamp(struct lp_build_context *bld,
                 LLVMValueRef a,
                 LLVMValueRef min,
                 LLVMValueRef max);
  
+LLVMValueRef
+lp_build_clamp_zero_one_nanzero(struct lp_build_context *bld,
+                                LLVMValueRef a);
+
  LLVMValueRef
  lp_build_abs(struct lp_build_context *bld,
               LLVMValueRef a);
@@ -156,6 +261,10 @@ LLVMValueRef
  lp_build_fract(struct lp_build_context *bld,
                 LLVMValueRef a);
  
+LLVMValueRef
+lp_build_fract_safe(struct lp_build_context *bld,
+                    LLVMValueRef a);
+
  LLVMValueRef
  lp_build_ifloor(struct lp_build_context *bld,
                  LLVMValueRef a);
@@ -171,6 +280,18 @@ LLVMValueRef
  lp_build_itrunc(struct lp_build_context *bld,
                  LLVMValueRef a);
  
+void
+lp_build_ifloor_fract(struct lp_build_context *bld,
+                      LLVMValueRef a,
+                      LLVMValueRef *out_ipart,
+                      LLVMValueRef *out_fpart);
+
+void
+lp_build_ifloor_fract_safe(struct lp_build_context *bld,
+                           LLVMValueRef a,
+                           LLVMValueRef *out_ipart,
+                           LLVMValueRef *out_fpart);
+
  LLVMValueRef
  lp_build_sqrt(struct lp_build_context *bld,
                LLVMValueRef a);
@@ -183,6 +304,19 @@ LLVMValueRef
  lp_build_rsqrt(struct lp_build_context *bld,
                 LLVMValueRef a);
  
+boolean
+lp_build_fast_rsqrt_available(struct lp_type type);
+
+LLVMValueRef
+lp_build_fast_rsqrt(struct lp_build_context *bld,
+                    LLVMValueRef a);
+
+LLVMValueRef
+lp_build_polynomial(struct lp_build_context *bld,
+                    LLVMValueRef x,
+                    const double *coeffs,
+                    unsigned num_coeffs);
+
  LLVMValueRef
  lp_build_cos(struct lp_build_context *bld,
               LLVMValueRef a);
@@ -204,26 +338,75 @@ LLVMValueRef
  lp_build_log(struct lp_build_context *bld,
               LLVMValueRef a);
  
+LLVMValueRef
+lp_build_log_safe(struct lp_build_context *bld,
+                  LLVMValueRef a);
+
  LLVMValueRef
  lp_build_exp2(struct lp_build_context *bld,
                LLVMValueRef a);
  
+LLVMValueRef
+lp_build_extract_exponent(struct lp_build_context *bld,
+                          LLVMValueRef x,
+                          int bias);
+
+LLVMValueRef
+lp_build_extract_mantissa(struct lp_build_context *bld,
+                          LLVMValueRef x);
+
  LLVMValueRef
  lp_build_log2(struct lp_build_context *bld,
                LLVMValueRef a);
  
-void
-lp_build_exp2_approx(struct lp_build_context *bld,
-                     LLVMValueRef x,
-                     LLVMValueRef *p_exp2_int_part,
-                     LLVMValueRef *p_frac_part,
-                     LLVMValueRef *p_exp2);
+LLVMValueRef
+lp_build_log2_safe(struct lp_build_context *bld,
+                   LLVMValueRef a);
+
+LLVMValueRef
+lp_build_fast_log2(struct lp_build_context *bld,
+                   LLVMValueRef a);
+
+LLVMValueRef
+lp_build_ilog2(struct lp_build_context *bld,
+               LLVMValueRef x);
  
  void
  lp_build_log2_approx(struct lp_build_context *bld,
                       LLVMValueRef x,
                       LLVMValueRef *p_exp,
                       LLVMValueRef *p_floor_log2,
-                     LLVMValueRef *p_log2);
+                     LLVMValueRef *p_log2,
+                     boolean handle_nans);
+
+LLVMValueRef
+lp_build_mod(struct lp_build_context *bld,
+             LLVMValueRef x,
+             LLVMValueRef y);
+
+LLVMValueRef
+lp_build_isnan(struct lp_build_context *bld,
+               LLVMValueRef x);
+
+LLVMValueRef
+lp_build_isfinite(struct lp_build_context *bld,
+                  LLVMValueRef x);
+
+
+LLVMValueRef
+lp_build_is_inf_or_nan(struct gallivm_state *gallivm,
+                       const struct lp_type type,
+                       LLVMValueRef x);
+
+
+LLVMValueRef
+lp_build_fpstate_get(struct gallivm_state *gallivm);
+
+void
+lp_build_fpstate_set_denorms_zero(struct gallivm_state *gallivm,
+                                  boolean zero);
+void
+lp_build_fpstate_set(struct gallivm_state *gallivm,
+                     LLVMValueRef mxcsr);
  
  #endif /* !LP_BLD_ARIT_H */