From 8c4f0b13530f0bc2afe1e9815801c3b85502503c Mon Sep 17 00:00:00 2001
From: nihui
Date: Thu, 26 Jun 2025 11:49:55 +0800
Subject: [PATCH] aco: gfx940 has no mad f32 instruction
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Reviewed-by: Daniel Schürmann
Part-of:
---
 src/amd/compiler/aco_optimizer.cpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/amd/compiler/aco_optimizer.cpp b/src/amd/compiler/aco_optimizer.cpp
index 4ac8821464d..c50eba30237 100644
--- a/src/amd/compiler/aco_optimizer.cpp
+++ b/src/amd/compiler/aco_optimizer.cpp
@@ -3910,7 +3910,8 @@ combine_instruction(opt_ctx& ctx, aco_ptr& instr)
                         (mad32 && !legacy && !mad_mix && ctx.program->dev.has_fast_fma32) ||
                         (mad_mix && ctx.program->dev.fused_mad_mix);
          bool has_mad = mad_mix ? !ctx.program->dev.fused_mad_mix
-                                : ((mad32 && ctx.program->gfx_level < GFX10_3) ||
+                                : ((mad32 && ctx.program->gfx_level < GFX10_3 &&
+                                    ctx.program->family != CHIP_GFX940) ||
                                    (mad16 && ctx.program->gfx_level <= GFX9));
          bool can_use_fma = has_fma && (!(info.parent_instr->definitions[0].isPrecise() ||
                                           instr->definitions[0].isPrecise()) ||