radv: lower 64-bit dfloor on GFX6 for fixing precision issues

author Samuel Pitoiset <samuel.pitoiset@gmail.com>

Wed, 24 Jun 2020 07:15:47 +0000 (09:15 +0200)

committer Marge Bot <eric+marge@anholt.net>

Thu, 25 Jun 2020 12:09:08 +0000 (12:09 +0000)
author Samuel Pitoiset <samuel.pitoiset@gmail.com>
Wed, 24 Jun 2020 07:15:47 +0000 (09:15 +0200)
committer Marge Bot <eric+marge@anholt.net>
Thu, 25 Jun 2020 12:09:08 +0000 (12:09 +0000)
diff --git a/.gitlab-ci/deqp-radv-pitcairn-aco-fails.txt b/.gitlab-ci/deqp-radv-pitcairn-aco-fails.txt

index 72549cb804cf3f4fa6f439231dabbdbc7cfe23b9..c330ba885eec10a94cb09c499fca80c2a8209a6b 100644 (file)
--- a/.gitlab-ci/deqp-radv-pitcairn-aco-fails.txt
+++ b/.gitlab-ci/deqp-radv-pitcairn-aco-fails.txt
@@ -1,7 +1,3 @@
-dEQP-VK.glsl.builtin.precision_double.floor.compute.scalar
-dEQP-VK.glsl.builtin.precision_double.floor.compute.vec2
-dEQP-VK.glsl.builtin.precision_double.floor.compute.vec3
-dEQP-VK.glsl.builtin.precision_double.floor.compute.vec4
  dEQP-VK.memory_model.message_passing.core11.u32.coherent.fence_fence.atomicwrite.device.payload_local.image.guard_nonlocal.workgroup.comp
  dEQP-VK.memory_model.message_passing.core11.u32.coherent.fence_fence.atomicwrite.device.payload_nonlocal.image.guard_nonlocal.workgroup.comp
  dEQP-VK.pipeline.depth.format.d16_unorm.compare_ops.never_zerodepthbounds_depthdisabled_stencilenabled
diff --git a/src/amd/compiler/aco_instruction_selection.cpp b/src/amd/compiler/aco_instruction_selection.cpp

index 7f4da8770680bc747a9507c02dc34fbc11c504bf..de435ff78343b60e772c2ca13b2256c7250d8f33 100644 (file)
--- a/src/amd/compiler/aco_instruction_selection.cpp
+++ b/src/amd/compiler/aco_instruction_selection.cpp
@@ -979,7 +979,8 @@ Temp emit_floor_f64(isel_context *ctx, Builder& bld, Definition dst, Temp val)
     if (ctx->options->chip_class >= GFX7)
        return bld.vop1(aco_opcode::v_floor_f64, Definition(dst), val);
  
-   /* GFX6 doesn't support V_FLOOR_F64, lower it. */
+   /* GFX6 doesn't support V_FLOOR_F64, lower it (note that it's actually
+    * lowered at NIR level for precision reasons). */
     Temp src0 = as_vgpr(ctx, val);
  
     Temp mask = bld.copy(bld.def(s1), Operand(3u)); /* isnan */
diff --git a/src/amd/vulkan/radv_shader.c b/src/amd/vulkan/radv_shader.c

index a53100fd48bd6685a30788895f2543d675a64a48..1d653e786c553baea3a2a9ac005cde5328997c32 100644 (file)
--- a/src/amd/vulkan/radv_shader.c
+++ b/src/amd/vulkan/radv_shader.c
@@ -478,6 +478,14 @@ radv_shader_compile_to_nir(struct radv_device *device,
                 nir_lower_doubles_options lower_doubles =
                         nir->options->lower_doubles_options;
  
+               if (device->physical_device->rad_info.chip_class == GFX6) {
+                       /* GFX6 doesn't support v_floor_f64 and the precision
+                        * of v_fract_f64 which is used to implement 64-bit
+                        * floor is less than what Vulkan requires.
+                        */
+                       lower_doubles |= nir_lower_dfloor;
+               }
+
                 NIR_PASS_V(nir, nir_lower_doubles, NULL, lower_doubles);
         }
author	Samuel Pitoiset <samuel.pitoiset@gmail.com>
	Wed, 24 Jun 2020 07:15:47 +0000 (09:15 +0200)
committer	Marge Bot <eric+marge@anholt.net>
	Thu, 25 Jun 2020 12:09:08 +0000 (12:09 +0000)
.gitlab-ci/deqp-radv-pitcairn-aco-fails.txt		patch | blob | history
src/amd/compiler/aco_instruction_selection.cpp		patch | blob | history
src/amd/vulkan/radv_shader.c		patch | blob | history