mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2026-05-05 03:08:05 +02:00
aco: fix combining max(-min(a, b), c) if a or b uses the neg modifier
No fossils-db changes.

Cc: 20.2, 20.3
Signed-off-by: Samuel Pitoiset <samuel.pitoiset@gmail.com>
Reviewed-by: Rhys Perry <pendingchaos02@gmail.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/7657>
This commit is contained in:
parent
ff22fcf450
commit
0fcd379184
2 changed files with 27 additions and 4 deletions
|
|
@@ -2106,8 +2106,8 @@ bool combine_minmax(opt_ctx& ctx, aco_ptr<Instruction>& instr, aco_opcode opposi
|
|||
if (combine_three_valu_op(ctx, instr, instr->opcode, minmax3, "012", 1 | 2))
|
||||
return true;
|
||||
|
||||
/* min(-max(a, b), c) -> min3(-a, -b, c) *
|
||||
* max(-min(a, b), c) -> max3(-a, -b, c) */
|
||||
/* min(-max(a, b), c) -> min3(c, -a, -b) *
|
||||
* max(-min(a, b), c) -> max3(c, -a, -b) */
|
||||
for (unsigned swap = 0; swap < 2; swap++) {
|
||||
Operand operands[3];
|
||||
bool neg[3], abs[3], clamp, precise;
|
||||
|
|
@@ -2119,8 +2119,8 @@ bool combine_minmax(opt_ctx& ctx, aco_ptr<Instruction>& instr, aco_opcode opposi
|
|||
&clamp, &omod, &inbetween_neg, NULL, NULL, &precise) &&
|
||||
inbetween_neg) {
|
||||
ctx.uses[instr->operands[swap].tempId()]--;
|
||||
neg[1] = true;
|
||||
neg[2] = true;
|
||||
neg[1] = !neg[1];
|
||||
neg[2] = !neg[2];
|
||||
create_vop3_for_op3(ctx, minmax3, instr, operands, neg, abs, opsel, clamp, omod);
|
||||
return true;
|
||||
}
|
||||
|
|
|
|||
|
|
@@ -700,3 +700,26 @@ BEGIN_TEST(optimize.add3)
|
|||
|
||||
finish_opt_test();
|
||||
END_TEST
|
||||
|
||||
BEGIN_TEST(optimize.minmax)
|
||||
for (unsigned i = GFX8; i <= GFX10; i++) {
|
||||
//>> v1: %a, s2: %_:exec = p_startpgm
|
||||
if (!setup_cs("v1", (chip_class)i))
|
||||
continue;
|
||||
|
||||
//! v1: %res0 = v_max3_f32 0, -0, %a
|
||||
//! p_unit_test 0, %res0
|
||||
Temp xor0 = bld.vop2(aco_opcode::v_xor_b32, bld.def(v1), Operand(0x80000000u), Operand(inputs[0]));
|
||||
Temp min = bld.vop2(aco_opcode::v_min_f32, bld.def(v1), Operand(0u), xor0);
|
||||
Temp xor1 = bld.vop2(aco_opcode::v_xor_b32, bld.def(v1), Operand(0x80000000u), min);
|
||||
writeout(0, bld.vop2(aco_opcode::v_max_f32, bld.def(v1), Operand(0u), xor1));
|
||||
|
||||
//! v1: %res1 = v_max3_f32 0, -0, -%a
|
||||
//! p_unit_test 1, %res1
|
||||
min = bld.vop2(aco_opcode::v_min_f32, bld.def(v1), Operand(0u), Operand(inputs[0]));
|
||||
xor1 = bld.vop2(aco_opcode::v_xor_b32, bld.def(v1), Operand(0x80000000u), min);
|
||||
writeout(1, bld.vop2(aco_opcode::v_max_f32, bld.def(v1), Operand(0u), xor1));
|
||||
|
||||
finish_opt_test();
|
||||
}
|
||||
END_TEST
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue