From aa5b2c4165b894f0d01c2921dc03c1c193b56152 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jos=C3=A9=20Roberto=20de=20Souza?= Date: Thu, 22 Aug 2024 09:32:04 -0700 Subject: [PATCH] anv: Set recommended values for gfx20 async compute registers in STATE_COMPUTE_MODE MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit These recommended values should improve the performance of async compute in gfx20; we may want to tweak them for Linux, but at least these values should give us a better baseline than the default values. Reviewed-by: Paulo Zanoni Signed-off-by: José Roberto de Souza Part-of: --- src/intel/vulkan/genX_init_state.c | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/src/intel/vulkan/genX_init_state.c b/src/intel/vulkan/genX_init_state.c index 251ab0aed1a..ea97b324cdd 100644 --- a/src/intel/vulkan/genX_init_state.c +++ b/src/intel/vulkan/genX_init_state.c @@ -751,7 +751,14 @@ init_compute_queue_state(struct anv_queue *queue) } anv_batch_emit(batch, GENX(STATE_COMPUTE_MODE), cm) { -#if GFX_VER < 20 +#if GFX_VER >= 20 + cm.AsyncComputeThreadLimit = ACTL_Max8; + cm.ZPassAsyncComputeThreadLimit = ZPACTL_Max60; + cm.ZAsyncThrottlesettings = ZATS_DefertoAsyncComputeThreadLimit; + cm.AsyncComputeThreadLimitMask = 0x7; + cm.ZPassAsyncComputeThreadLimitMask = 0x7; + cm.ZAsyncThrottlesettingsMask = 0x3; +#else cm.PixelAsyncComputeThreadLimit = PACTL_Max24; cm.ZPassAsyncComputeThreadLimit = ZPACTL_Max60; cm.PixelAsyncComputeThreadLimitMask = 0x7;