radv: lower 64-bit dfloor on GFX6 for fixing precision issues
author Samuel Pitoiset <samuel.pitoiset@gmail.com>
Wed, 24 Jun 2020 07:15:47 +0000 (09:15 +0200)
committer Marge Bot <eric+marge@anholt.net>
Thu, 25 Jun 2020 12:09:08 +0000 (12:09 +0000)
GFX6 doesn't support v_floor_f64, and the precision of v_fract_f64,
which is used to implement 64-bit floor, is lower than what Vulkan
requires.

Signed-off-by: Samuel Pitoiset <samuel.pitoiset@gmail.com>
Reviewed-by: Daniel Schürmann <daniel@schuermann.dev>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/5609>

.gitlab-ci/deqp-radv-pitcairn-aco-fails.txt
src/amd/compiler/aco_instruction_selection.cpp
src/amd/vulkan/radv_shader.c

index 72549cb804cf3f4fa6f439231dabbdbc7cfe23b9..c330ba885eec10a94cb09c499fca80c2a8209a6b 100644 (file)
@@ -1,7 +1,3 @@
-dEQP-VK.glsl.builtin.precision_double.floor.compute.scalar
-dEQP-VK.glsl.builtin.precision_double.floor.compute.vec2
-dEQP-VK.glsl.builtin.precision_double.floor.compute.vec3
-dEQP-VK.glsl.builtin.precision_double.floor.compute.vec4
 dEQP-VK.memory_model.message_passing.core11.u32.coherent.fence_fence.atomicwrite.device.payload_local.image.guard_nonlocal.workgroup.comp
 dEQP-VK.memory_model.message_passing.core11.u32.coherent.fence_fence.atomicwrite.device.payload_nonlocal.image.guard_nonlocal.workgroup.comp
 dEQP-VK.pipeline.depth.format.d16_unorm.compare_ops.never_zerodepthbounds_depthdisabled_stencilenabled
index 7f4da8770680bc747a9507c02dc34fbc11c504bf..de435ff78343b60e772c2ca13b2256c7250d8f33 100644 (file)
@@ -979,7 +979,8 @@ Temp emit_floor_f64(isel_context *ctx, Builder& bld, Definition dst, Temp val)
    if (ctx->options->chip_class >= GFX7)
       return bld.vop1(aco_opcode::v_floor_f64, Definition(dst), val);
 
-   /* GFX6 doesn't support V_FLOOR_F64, lower it. */
+   /* GFX6 doesn't support V_FLOOR_F64, lower it (note that it's actually
+    * lowered at NIR level for precision reasons). */
    Temp src0 = as_vgpr(ctx, val);
 
    Temp mask = bld.copy(bld.def(s1), Operand(3u)); /* isnan */
index a53100fd48bd6685a30788895f2543d675a64a48..1d653e786c553baea3a2a9ac005cde5328997c32 100644 (file)
@@ -478,6 +478,14 @@ radv_shader_compile_to_nir(struct radv_device *device,
                nir_lower_doubles_options lower_doubles =
                        nir->options->lower_doubles_options;
 
+               if (device->physical_device->rad_info.chip_class == GFX6) {
+                       /* GFX6 doesn't support v_floor_f64 and the precision
+                        * of v_fract_f64 which is used to implement 64-bit
+                        * floor is less than what Vulkan requires.
+                        */
+                       lower_doubles |= nir_lower_dfloor;
+               }
+
                NIR_PASS_V(nir, nir_lower_doubles, NULL, lower_doubles);
        }