mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2026-02-12 15:50:31 +01:00
ac/nir,radv: remove ac_nir_opt_pack_half
Foz-DB Navi21: Totals from 2937 (3.01% of 97591) affected shaders: Instrs: 1908695 -> 1908291 (-0.02%); split: -0.02%, +0.00% CodeSize: 10232148 -> 10229224 (-0.03%); split: -0.03%, +0.01% VGPRs: 142168 -> 142080 (-0.06%) Latency: 8052895 -> 8052622 (-0.00%); split: -0.01%, +0.01% InvThroughput: 2550330 -> 2549602 (-0.03%); split: -0.03%, +0.01% VClause: 32601 -> 32603 (+0.01%); split: -0.01%, +0.02% Copies: 118570 -> 118587 (+0.01%); split: -0.04%, +0.05% PreVGPRs: 110090 -> 110082 (-0.01%) VALU: 1468422 -> 1468043 (-0.03%); split: -0.03%, +0.00% SALU: 173858 -> 173828 (-0.02%) Foz-DB Navi48: Totals from 4196 (4.30% of 97637) affected shaders: MaxWaves: 118678 -> 118680 (+0.00%); split: +0.01%, -0.01% Instrs: 3627604 -> 3624093 (-0.10%); split: -0.10%, +0.00% CodeSize: 18956684 -> 18939824 (-0.09%); split: -0.09%, +0.01% VGPRs: 225624 -> 225060 (-0.25%); split: -0.26%, +0.01% Latency: 11856204 -> 11857280 (+0.01%); split: -0.01%, +0.02% InvThroughput: 2388584 -> 2389178 (+0.02%); split: -0.01%, +0.03% VClause: 50409 -> 50410 (+0.00%) SClause: 64701 -> 64699 (-0.00%) Copies: 208353 -> 207522 (-0.40%); split: -0.43%, +0.03% PreVGPRs: 161314 -> 161306 (-0.00%) VALU: 2345604 -> 2345172 (-0.02%); split: -0.02%, +0.00% SALU: 391466 -> 388723 (-0.70%) VOPD: 1788 -> 1806 (+1.01%) Reviewed-by: Daniel Schürmann <daniel@schuermann.dev> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/38815>
This commit is contained in:
parent
939b4a6476
commit
711598982a
4 changed files with 0 additions and 144 deletions
|
|
@ -130,7 +130,6 @@ amd_common_files = files(
|
|||
'nir/ac_nir_meta_cs_blit.c',
|
||||
'nir/ac_nir_meta_cs_clear_copy_buffer.c',
|
||||
'nir/ac_nir_meta_ps_resolve.c',
|
||||
'nir/ac_nir_opt_pack_half.c',
|
||||
'nir/ac_nir_opt_shared_append.c',
|
||||
'nir/ac_nir_prerast_utils.c',
|
||||
'nir/ac_nir_surface.c',
|
||||
|
|
|
|||
|
|
@ -402,9 +402,6 @@ ac_nir_lower_tex(nir_shader *nir, const ac_nir_lower_tex_options *options);
|
|||
void
|
||||
ac_nir_store_debug_log_amd(nir_builder *b, nir_def *uvec4);
|
||||
|
||||
bool
|
||||
ac_nir_opt_pack_half(nir_shader *shader, enum amd_gfx_level gfx_level);
|
||||
|
||||
unsigned
|
||||
ac_nir_varying_expression_max_cost(nir_shader *producer, nir_shader *consumer);
|
||||
|
||||
|
|
|
|||
|
|
@ -1,133 +0,0 @@
|
|||
/*
|
||||
* Copyright © 2021 Valve Corporation
|
||||
*
|
||||
* SPDX-License-Identifier: MIT
|
||||
*/
|
||||
|
||||
#include "ac_nir.h"
|
||||
#include "ac_nir_helpers.h"
|
||||
|
||||
#include "nir_builder.h"
|
||||
|
||||
static bool
|
||||
needs_rounding_mode_16_64(nir_instr *instr)
|
||||
{
|
||||
if (instr->type != nir_instr_type_alu)
|
||||
return false;
|
||||
nir_alu_instr *alu = nir_instr_as_alu(instr);
|
||||
if (alu->op == nir_op_fquantize2f16)
|
||||
return true;
|
||||
if (alu->def.bit_size != 16 && alu->def.bit_size != 64)
|
||||
return false;
|
||||
if (nir_alu_type_get_base_type(nir_op_infos[alu->op].output_type) != nir_type_float)
|
||||
return false;
|
||||
|
||||
switch (alu->op) {
|
||||
case nir_op_f2f64:
|
||||
case nir_op_b2f64:
|
||||
case nir_op_f2f16_rtz:
|
||||
case nir_op_b2f16:
|
||||
case nir_op_fsat:
|
||||
case nir_op_fabs:
|
||||
case nir_op_fneg:
|
||||
case nir_op_fsign:
|
||||
case nir_op_ftrunc:
|
||||
case nir_op_fceil:
|
||||
case nir_op_ffloor:
|
||||
case nir_op_ffract:
|
||||
case nir_op_fround_even:
|
||||
case nir_op_fmin:
|
||||
case nir_op_fmax:
|
||||
return false;
|
||||
default:
|
||||
return true;
|
||||
}
|
||||
}
|
||||
|
||||
static bool
|
||||
can_use_fmamix(nir_scalar s, enum amd_gfx_level gfx_level)
|
||||
{
|
||||
s = nir_scalar_chase_movs(s);
|
||||
if (!list_is_singular(&s.def->uses))
|
||||
return false;
|
||||
|
||||
if (nir_scalar_is_intrinsic(s) &&
|
||||
nir_scalar_intrinsic_op(s) == nir_intrinsic_load_interpolated_input)
|
||||
return gfx_level >= GFX11;
|
||||
|
||||
if (!nir_scalar_is_alu(s))
|
||||
return false;
|
||||
|
||||
switch (nir_scalar_alu_op(s)) {
|
||||
case nir_op_fmul:
|
||||
case nir_op_ffma:
|
||||
case nir_op_fadd:
|
||||
case nir_op_fsub:
|
||||
return true;
|
||||
case nir_op_fsat:
|
||||
return can_use_fmamix(nir_scalar_chase_alu_src(s, 0), gfx_level);
|
||||
default:
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
static bool
|
||||
split_pack_half(nir_builder *b, nir_instr *instr, void *param)
|
||||
{
|
||||
enum amd_gfx_level gfx_level = *(enum amd_gfx_level *)param;
|
||||
|
||||
if (instr->type != nir_instr_type_alu)
|
||||
return false;
|
||||
nir_alu_instr *alu = nir_instr_as_alu(instr);
|
||||
if (alu->op != nir_op_pack_half_2x16_rtz_split && alu->op != nir_op_pack_half_2x16_split)
|
||||
return false;
|
||||
|
||||
nir_scalar s = nir_get_scalar(&alu->def, 0);
|
||||
|
||||
if (!can_use_fmamix(nir_scalar_chase_alu_src(s, 0), gfx_level) ||
|
||||
!can_use_fmamix(nir_scalar_chase_alu_src(s, 1), gfx_level))
|
||||
return false;
|
||||
|
||||
b->cursor = nir_before_instr(instr);
|
||||
b->fp_math_ctrl = alu->fp_math_ctrl;
|
||||
|
||||
/* Split pack_half into two f2f16 to create v_fma_mix{lo,hi}_f16
|
||||
* in the backend.
|
||||
*/
|
||||
nir_def *lo = nir_f2f16(b, nir_ssa_for_alu_src(b, alu, 0));
|
||||
nir_def *hi = nir_f2f16(b, nir_ssa_for_alu_src(b, alu, 1));
|
||||
nir_def_replace(&alu->def, nir_pack_32_2x16_split(b, lo, hi));
|
||||
return true;
|
||||
}
|
||||
|
||||
bool
|
||||
ac_nir_opt_pack_half(nir_shader *shader, enum amd_gfx_level gfx_level)
|
||||
{
|
||||
if (gfx_level < GFX10)
|
||||
return false;
|
||||
|
||||
unsigned exec_mode = shader->info.float_controls_execution_mode;
|
||||
bool set_mode = false;
|
||||
if (!nir_is_rounding_mode_rtz(exec_mode, 16)) {
|
||||
nir_foreach_function_impl(impl, shader) {
|
||||
nir_foreach_block(block, impl) {
|
||||
nir_foreach_instr(instr, block) {
|
||||
if (needs_rounding_mode_16_64(instr))
|
||||
return false;
|
||||
}
|
||||
}
|
||||
}
|
||||
set_mode = true;
|
||||
}
|
||||
|
||||
bool progress = nir_shader_instructions_pass(shader, split_pack_half,
|
||||
nir_metadata_control_flow,
|
||||
&gfx_level);
|
||||
|
||||
if (set_mode && progress) {
|
||||
exec_mode &= ~(FLOAT_CONTROLS_ROUNDING_MODE_RTE_FP16 | FLOAT_CONTROLS_ROUNDING_MODE_RTE_FP64);
|
||||
exec_mode |= FLOAT_CONTROLS_ROUNDING_MODE_RTZ_FP16 | FLOAT_CONTROLS_ROUNDING_MODE_RTZ_FP64;
|
||||
shader->info.float_controls_execution_mode = exec_mode;
|
||||
}
|
||||
return progress;
|
||||
}
|
||||
|
|
@ -583,13 +583,6 @@ radv_postprocess_nir(struct radv_device *device, const struct radv_graphics_stat
|
|||
/* cleanup passes */
|
||||
NIR_PASS(_, stage->nir, nir_lower_alu_width, ac_nir_opt_vectorize_cb, &gfx_level);
|
||||
|
||||
/* This pass changes the global float control mode to RTZ, so can't be used
|
||||
* with LLVM, which only supports RTNE, or RT, where the mode needs to match
|
||||
* across separately compiled stages.
|
||||
*/
|
||||
if (!radv_use_llvm_for_stage(pdev, stage->stage) && !mesa_shader_stage_is_rt(stage->stage))
|
||||
NIR_PASS(_, stage->nir, ac_nir_opt_pack_half, gfx_level);
|
||||
|
||||
NIR_PASS(_, stage->nir, nir_lower_load_const_to_scalar);
|
||||
NIR_PASS(_, stage->nir, nir_opt_copy_prop);
|
||||
NIR_PASS(_, stage->nir, nir_opt_dce);
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue