lima/ppir: simplify select op lowering and scheduling

The select operation relies on the select condition coming from the
result of the the alu scalar mult slot, in the same instruction.
The current implementation creates a mov node to be the predecessor of
select, and then relies on an exception during scheduling to ensure that
both ops are inserted in the same instruction.

Now that the ppir scheduler supports pipeline register dependencies,
this can be simplified by making the mov explicitly output to the fmul
pipeline register, and the scheduler can place it without an exception.

Since the select condition can only be placed in the scalar mult slot,
differently than a regular mov, define a separate op for it.

Signed-off-by: Erico Nunes <nunes.erico@gmail.com>
Reviewed-by: Vasily Khoruzhick <anarsoul@gmail.com>
Reviewed-by: Qiang Yu <yuq825@gmail.com>
This commit is contained in:
Erico Nunes 2019-07-21 15:07:50 +02:00
parent eb82637c2f
commit fd29c4d6c5
5 changed files with 15 additions and 11 deletions

View file

@ -243,6 +243,9 @@ static void ppir_codegen_encode_scl_mul(ppir_node *node, void *code)
case ppir_op_mov:
f->op = ppir_codegen_float_mul_op_mov;
break;
case ppir_op_sel_cond:
f->op = ppir_codegen_float_mul_op_mov;
break;
case ppir_op_max:
f->op = ppir_codegen_float_mul_op_max;
break;

View file

@ -201,7 +201,7 @@ static bool ppir_lower_select(ppir_block *block, ppir_node *node)
{
ppir_alu_node *alu = ppir_node_to_alu(node);
ppir_node *move = ppir_node_create(block, ppir_op_mov, -1, 0);
ppir_node *move = ppir_node_create(block, ppir_op_sel_cond, -1, 0);
if (!move)
return false;
list_addtail(&move->list, &node->list);
@ -214,10 +214,8 @@ static bool ppir_lower_select(ppir_block *block, ppir_node *node)
move_alu->num_src = 1;
ppir_dest *move_dest = &move_alu->dest;
move_dest->type = ppir_target_ssa;
move_dest->ssa.num_components = 1;
move_dest->ssa.live_in = INT_MAX;
move_dest->ssa.live_out = 0;
move_dest->type = ppir_target_pipeline;
move_dest->pipeline = ppir_pipeline_reg_fmul;
move_dest->write_mask = 1;
ppir_node_foreach_pred(node, dep) {

View file

@ -211,6 +211,14 @@ const ppir_op_info ppir_op_infos[] = {
PPIR_INSTR_SLOT_END
},
},
[ppir_op_sel_cond] = {
/* effectively mov, but must be scheduled only to
* PPIR_INSTR_SLOT_ALU_SCL_MUL */
.name = "sel_cond",
.slots = (int []) {
PPIR_INSTR_SLOT_ALU_SCL_MUL, PPIR_INSTR_SLOT_END
},
},
[ppir_op_select] = {
.name = "select",
.slots = (int []) {

View file

@ -174,12 +174,6 @@ static bool ppir_do_one_node_to_instr(ppir_block *block, ppir_node *node, ppir_n
ppir_node *succ = ppir_node_first_succ(node);
if (succ->instr_pos == PPIR_INSTR_SLOT_ALU_VEC_ADD) {
node->instr_pos = PPIR_INSTR_SLOT_ALU_VEC_MUL;
/* select instr's condition must be inserted to fmul slot */
if (succ->op == ppir_op_select &&
ppir_node_first_pred(succ) == node) {
assert(alu->dest.ssa.num_components == 1);
node->instr_pos = PPIR_INSTR_SLOT_ALU_SCL_MUL;
}
ppir_instr_insert_mul_node(succ, node);
}
else if (succ->instr_pos == PPIR_INSTR_SLOT_ALU_SCL_ADD &&

View file

@ -53,6 +53,7 @@ typedef enum {
ppir_op_normalize3,
ppir_op_normalize4,
ppir_op_sel_cond,
ppir_op_select,
ppir_op_sin,