vc4: Add a thread switch QIR instruction.

This will eventually be generated at the QIR level, so that
vc4_qir_schedule.c can arrange the separation of tex_strb from tex_result
correctly.  It will also be important so that register allocation set the
register classes appropriately for values that are live across the switch.
This commit is contained in:
Eric Anholt 2016-11-10 15:23:19 -08:00
parent 93cdae44de
commit 4f527f1260
3 changed files with 18 additions and 0 deletions

View file

@ -82,6 +82,8 @@ static const struct qir_op_info qir_op_info[] = {
[QOP_TEX_DIRECT] = { "tex_direct", 0, 2, true },
[QOP_TEX_RESULT] = { "tex_result", 1, 0, true },
[QOP_THRSW] = { "thrsw", 0, 0, true },
[QOP_LOAD_IMM] = { "load_imm", 0, 1 },
[QOP_LOAD_IMM_U2] = { "load_imm_u2", 0, 1 },
[QOP_LOAD_IMM_I2] = { "load_imm_i2", 0, 1 },

View file

@ -156,6 +156,16 @@ enum qop {
*/
QOP_TEX_RESULT,
/**
* Insert the signal for switching threads in a threaded fragment
* shader. No value can be live in an accumulator across a thrsw.
*
* At the QPU level, this will have several delay slots before the
* switch happens. Those slots are the responsibility of the
* scheduler.
*/
QOP_THRSW,
/* 32-bit immediate loaded to each SIMD channel */
QOP_LOAD_IMM,

View file

@ -500,6 +500,12 @@ vc4_generate_code_block(struct vc4_compile *c,
handle_r4_qpu_write(block, qinst, dst);
break;
case QOP_THRSW:
queue(block, qpu_NOP());
*last_inst(block) = qpu_set_sig(*last_inst(block),
QPU_SIG_THREAD_SWITCH);
break;
case QOP_BRANCH:
/* The branch target will be updated at QPU scheduling
* time.