From c77bcf00a36c0c6f2bc42a052de5152589f0a372 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Marek=20Ol=C5=A1=C3=A1k?= Date: Fri, 24 Nov 2023 19:26:14 -0500 Subject: [PATCH] radeonsi/gfx11: prefer Wave64 for VS/TCS/TES/GS because it's slightly faster Reviewed-by: Pierre-Eric Pelloux-Prayer Part-of: --- src/gallium/drivers/radeonsi/si_state_shaders.cpp | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/src/gallium/drivers/radeonsi/si_state_shaders.cpp b/src/gallium/drivers/radeonsi/si_state_shaders.cpp index 18646a5f00c..95ee06b3313 100644 --- a/src/gallium/drivers/radeonsi/si_state_shaders.cpp +++ b/src/gallium/drivers/radeonsi/si_state_shaders.cpp @@ -75,12 +75,16 @@ unsigned si_determine_wave_size(struct si_screen *sscreen, struct si_shader *sha if (sscreen->info.gfx_level < GFX11 && stage == MESA_SHADER_FRAGMENT && !info->num_inputs) return 32; - /* There are a few very rare cases where VS is better with Wave32, and there are no known - * cases where Wave64 is better. + /* Gfx10: There are a few very rare cases where VS is better with Wave32, and there are no + * known cases where Wave64 is better. + * * Wave32 is disabled for GFX10 when culling is active as a workaround for #6457. I don't * know why this helps. + * + * Gfx11: Prefer Wave64 because it's slightly better than Wave32. */ if (stage <= MESA_SHADER_GEOMETRY && + (sscreen->info.gfx_level == GFX10 || sscreen->info.gfx_level == GFX10_3) && !(sscreen->info.gfx_level == GFX10 && shader && shader->key.ge.opt.ngg_culling)) return 32;