mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2026-05-06 05:08:08 +02:00
radv: enable .lower_ineg
We already emit ineg as isub most of the time.
The results are a bit mixed, but shouldn't really make a difference.
A couple of additional copies are needed as isub writes scc.

Totals from 5975 (4.29% of 139391) affected shaders:
CodeSize: 31508648 -> 31509264 (+0.00%); split: -0.00%, +0.00%
Instrs: 6073379 -> 6073531 (+0.00%); split: -0.00%, +0.00%
Cycles: 47186280 -> 47187116 (+0.00%); split: -0.00%, +0.00%
VMEM: 2528515 -> 2529139 (+0.02%); split: +0.03%, -0.01%
SMEM: 596842 -> 596924 (+0.01%); split: +0.02%, -0.00%
SClause: 280596 -> 280594 (-0.00%)
Copies: 288554 -> 288669 (+0.04%); split: -0.00%, +0.04%
PreSGPRs: 240390 -> 240397 (+0.00%)
PreVGPRs: 349630 -> 349749 (+0.03%)

Reviewed-by: Rhys Perry <pendingchaos02@gmail.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/8425>
This commit is contained in:
parent
e92bd57008
commit
d495a5c183
2 changed files with 1 addition and 27 deletions
|
|
@ -1316,33 +1316,6 @@ void visit_alu_instr(isel_context *ctx, nir_alu_instr *instr)
|
|||
}
|
||||
break;
|
||||
}
|
||||
case nir_op_ineg: {
|
||||
Temp src = get_alu_src(ctx, instr->src[0]);
|
||||
if (dst.regClass() == v1) {
|
||||
bld.vsub32(Definition(dst), Operand(0u), Operand(src));
|
||||
} else if (dst.regClass() == s1) {
|
||||
bld.sop2(aco_opcode::s_mul_i32, Definition(dst), Operand((uint32_t) -1), src);
|
||||
} else if (dst.size() == 2) {
|
||||
Temp src0 = bld.tmp(dst.type(), 1);
|
||||
Temp src1 = bld.tmp(dst.type(), 1);
|
||||
bld.pseudo(aco_opcode::p_split_vector, Definition(src0), Definition(src1), src);
|
||||
|
||||
if (dst.regClass() == s2) {
|
||||
Temp borrow = bld.tmp(s1);
|
||||
Temp dst0 = bld.sop2(aco_opcode::s_sub_u32, bld.def(s1), bld.scc(Definition(borrow)), Operand(0u), src0);
|
||||
Temp dst1 = bld.sop2(aco_opcode::s_subb_u32, bld.def(s1), bld.def(s1, scc), Operand(0u), src1, bld.scc(borrow));
|
||||
bld.pseudo(aco_opcode::p_create_vector, Definition(dst), dst0, dst1);
|
||||
} else {
|
||||
Temp lower = bld.tmp(v1);
|
||||
Temp borrow = bld.vsub32(Definition(lower), Operand(0u), src0, true).def(1).getTemp();
|
||||
Temp upper = bld.vsub32(bld.def(v1), Operand(0u), src1, false, borrow);
|
||||
bld.pseudo(aco_opcode::p_create_vector, Definition(dst), lower, upper);
|
||||
}
|
||||
} else {
|
||||
isel_err(&instr->instr, "Unimplemented NIR instr bit size");
|
||||
}
|
||||
break;
|
||||
}
|
||||
case nir_op_iabs: {
|
||||
Temp src = get_alu_src(ctx, instr->src[0]);
|
||||
if (dst.regClass() == s1) {
|
||||
|
|
|
|||
|
|
@ -55,6 +55,7 @@ static const struct nir_shader_compiler_options nir_options = {
|
|||
.lower_device_index_to_zero = true,
|
||||
.lower_fdiv = true,
|
||||
.lower_fmod = true,
|
||||
.lower_ineg = true,
|
||||
.lower_bitfield_insert_to_bitfield_select = true,
|
||||
.lower_bitfield_extract = true,
|
||||
.lower_pack_snorm_2x16 = true,
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue