summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author: Marek Olšák <marek.olsak@amd.com> 2019-08-27 17:39:02 -0400
committer: Marek Olšák <marek.olsak@amd.com> 2019-09-09 23:43:03 -0400
commit: 42ea0b7b52d78fc923e50a0825859fe079fd8c35 (patch)
tree: 9471925cde7cad22f279f787d18247740272a6e8
parent: c1e08cb6d50cd7ee41478f47d92413a3ba089261 (diff)
radeonsi: only support at most 1024 threads per block
LLVM 10 won't support 2048 threads per block.

Reviewed-by: Pierre-Eric Pelloux-Prayer <pierre-eric.pelloux-prayer@amd.com>
-rw-r--r-- src/gallium/drivers/radeonsi/si_get.c | 10
1 file changed, 2 insertions, 8 deletions
diff --git a/src/gallium/drivers/radeonsi/si_get.c b/src/gallium/drivers/radeonsi/si_get.c
index 118301fbf4b..111279674e6 100644
--- a/src/gallium/drivers/radeonsi/si_get.c
+++ b/src/gallium/drivers/radeonsi/si_get.c
@@ -752,14 +752,8 @@ static unsigned get_max_threads_per_block(struct si_screen *screen,
if (ir_type == PIPE_SHADER_IR_NATIVE)
return 256;
- /* Only 16 waves per thread-group on gfx9. */
- if (screen->info.chip_class >= GFX9)
- return 1024;
-
- /* Up to 40 waves per thread-group on GCN < gfx9. Expose a nice
- * round number.
- */
- return 2048;
+ /* LLVM 10 only supports 1024 threads per block. */
+ return 1024;
}
static int si_get_compute_param(struct pipe_screen *screen,