ac/nir: use llvm.amdgcn.rcp in ac_build_fdiv()

author Samuel Pitoiset <samuel.pitoiset@gmail.com>

Thu, 26 Mar 2020 10:40:35 +0000 (11:40 +0100)

committer Samuel Pitoiset <samuel.pitoiset@gmail.com>

Fri, 27 Mar 2020 07:05:43 +0000 (08:05 +0100)
author Samuel Pitoiset <samuel.pitoiset@gmail.com>
Thu, 26 Mar 2020 10:40:35 +0000 (11:40 +0100)
committer Samuel Pitoiset <samuel.pitoiset@gmail.com>
Fri, 27 Mar 2020 07:05:43 +0000 (08:05 +0100)
diff --git a/src/amd/llvm/ac_llvm_build.c b/src/amd/llvm/ac_llvm_build.c

index f13baf792fc27597cfe379370520222171ccb278..c2b5667f9964d845a95c07c08cd863165df5ee6e 100644 (file)
--- a/src/amd/llvm/ac_llvm_build.c
+++ b/src/amd/llvm/ac_llvm_build.c
@@ -65,8 +65,6 @@ ac_llvm_context_init(struct ac_llvm_context *ctx,
                      enum ac_float_mode float_mode, unsigned wave_size,
                      unsigned ballot_mask_bits)
  {
-       LLVMValueRef args[1];
-
         ctx->context = LLVMContextCreate();
  
         ctx->chip_class = chip_class;
@@ -127,11 +125,6 @@ ac_llvm_context_init(struct ac_llvm_context *ctx,
         ctx->invariant_load_md_kind = LLVMGetMDKindIDInContext(ctx->context,
                                                                "invariant.load", 14);
  
-       ctx->fpmath_md_kind = LLVMGetMDKindIDInContext(ctx->context, "fpmath", 6);
-
-       args[0] = LLVMConstReal(ctx->f32, 2.5);
-       ctx->fpmath_md_2p5_ulp = LLVMMDNodeInContext(ctx->context, args, 1);
-
         ctx->uniform_md_kind = LLVMGetMDKindIDInContext(ctx->context,
                                                         "amdgpu.uniform", 14);
  
@@ -707,17 +700,18 @@ ac_build_fdiv(struct ac_llvm_context *ctx,
               LLVMValueRef num,
               LLVMValueRef den)
  {
-       /* If we do (num / den), LLVM >= 7.0 does:
-        *    return num * v_rcp_f32(den * (fabs(den) > 0x1.0p+96f ? 0x1.0p-32f : 1.0f));
-        *
-        * If we do (num * (1 / den)), LLVM does:
-        *    return num * v_rcp_f32(den);
-        */
-       LLVMValueRef one = LLVMConstReal(LLVMTypeOf(num), 1.0);
-       LLVMValueRef rcp = LLVMBuildFDiv(ctx->builder, one, den, "");
-       /* Use v_rcp_f32 instead of precise division. */
-       if (!LLVMIsConstant(rcp))
-               LLVMSetMetadata(rcp, ctx->fpmath_md_kind, ctx->fpmath_md_2p5_ulp);
+       unsigned type_size = ac_get_type_size(LLVMTypeOf(den));
+       const char *name;
+
+       if (type_size == 2)
+               name = "llvm.amdgcn.rcp.f16";
+       else if (type_size == 4)
+               name = "llvm.amdgcn.rcp.f32";
+       else
+               name = "llvm.amdgcn.rcp.f64";
+
+        LLVMValueRef rcp = ac_build_intrinsic(ctx, name, LLVMTypeOf(den),
+                                              &den, 1, AC_FUNC_ATTR_READNONE);
  
         return LLVMBuildFMul(ctx->builder, num, rcp, "");
  }
diff --git a/src/amd/llvm/ac_llvm_build.h b/src/amd/llvm/ac_llvm_build.h

index 2e60cf0ada1d58acff91fc15d25adedd91fffcee..ff90092754e0d2cfb5a91fd9a94851f65efe1648 100644 (file)
--- a/src/amd/llvm/ac_llvm_build.h
+++ b/src/amd/llvm/ac_llvm_build.h
@@ -123,8 +123,6 @@ struct ac_llvm_context {
         unsigned range_md_kind;
         unsigned invariant_load_md_kind;
         unsigned uniform_md_kind;
-       unsigned fpmath_md_kind;
-       LLVMValueRef fpmath_md_2p5_ulp;
         LLVMValueRef empty_md;
  
         enum chip_class chip_class;
author	Samuel Pitoiset <samuel.pitoiset@gmail.com>
	Thu, 26 Mar 2020 10:40:35 +0000 (11:40 +0100)
committer	Samuel Pitoiset <samuel.pitoiset@gmail.com>
	Fri, 27 Mar 2020 07:05:43 +0000 (08:05 +0100)
src/amd/llvm/ac_llvm_build.c		patch \| blob \| history
src/amd/llvm/ac_llvm_build.h		patch \| blob \| history