From ad5be681bd1dd4f0ab1928c6b6f6364df1857184 Mon Sep 17 00:00:00 2001
From: Rhys Perry
Date: Wed, 8 Apr 2026 11:51:59 +0100
Subject: [PATCH] aco/gfx11.7: don't use v_pack_b32_f16 in do_pack_2x16
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Signed-off-by: Rhys Perry
Reviewed-by: Georg Lehmann
Reviewed-by: Marek Olšák
Part-of:
---
 src/amd/compiler/aco_lower_to_hw_instr.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/amd/compiler/aco_lower_to_hw_instr.cpp b/src/amd/compiler/aco_lower_to_hw_instr.cpp
index 09a8a6ee02e..de9e2085eb1 100644
--- a/src/amd/compiler/aco_lower_to_hw_instr.cpp
+++ b/src/amd/compiler/aco_lower_to_hw_instr.cpp
@@ -1627,11 +1627,11 @@ do_pack_2x16(lower_context* ctx, Builder& bld, Definition def, Operand lo, Opera
    /* v_pack_b32_f16 can be used for bit exact copies if:
     * - fp16 input denorms are enabled, otherwise they get flushed to zero
     * - signalling input NaNs are kept, which is the case with IEEE_MODE=0
-    *   GFX12+ always quiets signalling NaNs, IEEE_MODE was removed
+    *   GFX11.7+ always quiets signalling NaNs, IEEE_MODE was removed
     */
    bool can_use_pack = (ctx->block->fp_mode.denorm16_64 & fp_denorm_keep_in) &&
                        ctx->program->gfx_level >= GFX9 && can_use_vop3 &&
-                       ctx->program->gfx_level < GFX12;
+                       ctx->program->gfx_level < GFX11_7;
 
    if (can_use_pack) {
       Instruction* instr = bld.vop3(aco_opcode::v_pack_b32_f16, def, lo, hi);