ac/nir: adjust an assertion for D16 on GFX6-GFX7

[mesa.git] / src / amd / llvm / ac_llvm_build.c
diff --git a/src/amd/llvm/ac_llvm_build.c b/src/amd/llvm/ac_llvm_build.c

index 5483b3146c01c284eb7153f4cb67e5f1720a319b..69b1deaa8b275597ded358c78b076e43c29bb343 100644 (file)
--- a/src/amd/llvm/ac_llvm_build.c
+++ b/src/amd/llvm/ac_llvm_build.c
@@ -1314,6 +1314,11 @@ ac_build_buffer_load_common(struct ac_llvm_context *ctx,
         const char *indexing_kind = structurized ? "struct" : "raw";
         char name[256], type_name[8];
  
+       /* D16 is only supported on gfx8+ */
+       assert(!use_format ||
+              (channel_type != ctx->f16 && channel_type != ctx->i16) ||
+              ctx->chip_class >= GFX8);
+
         LLVMTypeRef type = func > 1 ? LLVMVectorType(channel_type, func) : channel_type;
         ac_build_type_name_for_intr(type, type_name, sizeof(type_name));
  
@@ -1389,10 +1394,12 @@ LLVMValueRef ac_build_buffer_load_format(struct ac_llvm_context *ctx,
                                          LLVMValueRef voffset,
                                          unsigned num_channels,
                                          unsigned cache_policy,
-                                        bool can_speculate)
+                                        bool can_speculate,
+                                        bool d16)
  {
         return ac_build_buffer_load_common(ctx, rsrc, vindex, voffset,
-                                          ctx->i32_0, num_channels, ctx->f32,
+                                          ctx->i32_0, num_channels,
+                                          d16 ? ctx->f16 : ctx->f32,
                                            cache_policy, can_speculate,
                                            true, true);
  }
@@ -2049,6 +2056,8 @@ ac_build_ddxy(struct ac_llvm_context *ctx,
  
         if (result_type == ctx->f16)
                 val = LLVMBuildZExt(ctx->builder, val, ctx->i32, "");
+       else if (result_type == ctx->v2f16)
+               val = LLVMBuildBitCast(ctx->builder, val, ctx->i32, "");
  
         for (unsigned i = 0; i < 4; ++i) {
                 tl_lanes[i] = i & mask;
@@ -2369,6 +2378,11 @@ LLVMValueRef ac_build_image_opcode(struct ac_llvm_context *ctx,
         assert((a->min_lod ? 1 : 0) +
                (a->lod ? 1 : 0) +
                (a->level_zero ? 1 : 0) <= 1);
+       assert(!a->d16 || (ctx->chip_class >= GFX8 &&
+                          a->opcode != ac_image_atomic &&
+                          a->opcode != ac_image_atomic_cmpswap &&
+                          a->opcode != ac_image_get_lod &&
+                          a->opcode != ac_image_get_resinfo));
  
         if (a->opcode == ac_image_get_lod) {
                 switch (dim) {
@@ -2491,7 +2505,7 @@ LLVMValueRef ac_build_image_opcode(struct ac_llvm_context *ctx,
                  a->min_lod ? ".cl" : "",
                  a->offset ? ".o" : "",
                  dimname,
-                atomic ? "i32" : "v4f32",
+                atomic ? "i32" : (a->d16 ? "v4f16" : "v4f32"),
                  overload[0], overload[1], overload[2]);
  
         LLVMTypeRef retty;
@@ -2500,15 +2514,14 @@ LLVMValueRef ac_build_image_opcode(struct ac_llvm_context *ctx,
         else if (a->opcode == ac_image_store || a->opcode == ac_image_store_mip)
                 retty = ctx->voidt;
         else
-               retty = ctx->v4f32;
+               retty = a->d16 ? ctx->v4f16 : ctx->v4f32;
  
         LLVMValueRef result =
                 ac_build_intrinsic(ctx, intr_name, retty, args, num_args,
                                    a->attributes);
-       if (!sample && retty == ctx->v4f32) {
-               result = LLVMBuildBitCast(ctx->builder, result,
-                                         ctx->v4i32, "");
-       }
+       if (!sample && !atomic && retty != ctx->voidt)
+               result = ac_to_integer(ctx, result);
+
         return result;
  }