radeonsi: only support at most 1024 threads per block
author Marek Olšák <marek.olsak@amd.com>
Tue, 27 Aug 2019 21:39:02 +0000 (17:39 -0400)
committer Marek Olšák <marek.olsak@amd.com>
Tue, 10 Sep 2019 03:43:03 +0000 (23:43 -0400)
LLVM 10 won't support 2048 threads per block.

Reviewed-by: Pierre-Eric Pelloux-Prayer <pierre-eric.pelloux-prayer@amd.com>
src/gallium/drivers/radeonsi/si_get.c

index 118301fbf4b98b682e9afca53a911220210d4455..111279674e6318edc832f4bab88e72b49b9bfcde 100644 (file)
@@ -752,14 +752,8 @@ static unsigned get_max_threads_per_block(struct si_screen *screen,
        if (ir_type == PIPE_SHADER_IR_NATIVE)
                return 256;
 
-       /* Only 16 waves per thread-group on gfx9. */
-       if (screen->info.chip_class >= GFX9)
-               return 1024;
-
-       /* Up to 40 waves per thread-group on GCN < gfx9. Expose a nice
-        * round number.
-        */
-       return 2048;
+        /* LLVM 10 only supports 1024 threads per block. */
+       return 1024;
 }
 
 static int si_get_compute_param(struct pipe_screen *screen,