mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2025-12-27 12:40:09 +01:00
radv: start conditionalising vertex inputs. (v2)
In practice this will probably just drop draw id in a few places. v2: just do draw_id for now. (Bas) it might be possible to do something more if we need it in the future. (nha) Reviewed-by: Bas Nieuwenhuizen <bas@basnieuwenhuizen.nl> Signed-off-by: Dave Airlie <airlied@redhat.com>
This commit is contained in:
parent
224cf2906a
commit
31174069d2
4 changed files with 63 additions and 14 deletions
|
|
@ -614,10 +614,12 @@ static void create_function(struct nir_to_llvm_context *ctx)
|
|||
break;
|
||||
case MESA_SHADER_VERTEX:
|
||||
if (!ctx->is_gs_copy_shader) {
|
||||
arg_types[arg_idx++] = const_array(ctx->v16i8, 16); /* vertex buffers */
|
||||
if (ctx->shader_info->info.vs.has_vertex_buffers)
|
||||
arg_types[arg_idx++] = const_array(ctx->v16i8, 16); /* vertex buffers */
|
||||
arg_types[arg_idx++] = ctx->i32; // base vertex
|
||||
arg_types[arg_idx++] = ctx->i32; // start instance
|
||||
arg_types[arg_idx++] = ctx->i32; // draw index
|
||||
if (ctx->shader_info->info.vs.needs_draw_id)
|
||||
arg_types[arg_idx++] = ctx->i32; // draw index
|
||||
}
|
||||
user_sgpr_count = arg_idx;
|
||||
if (ctx->options->key.vs.as_es)
|
||||
|
|
@ -773,14 +775,22 @@ static void create_function(struct nir_to_llvm_context *ctx)
|
|||
break;
|
||||
case MESA_SHADER_VERTEX:
|
||||
if (!ctx->is_gs_copy_shader) {
|
||||
set_userdata_location_shader(ctx, AC_UD_VS_VERTEX_BUFFERS, user_sgpr_idx, 2);
|
||||
user_sgpr_idx += 2;
|
||||
ctx->vertex_buffers = LLVMGetParam(ctx->main_function, arg_idx++);
|
||||
set_userdata_location_shader(ctx, AC_UD_VS_BASE_VERTEX_START_INSTANCE, user_sgpr_idx, 3);
|
||||
user_sgpr_idx += 3;
|
||||
if (ctx->shader_info->info.vs.has_vertex_buffers) {
|
||||
set_userdata_location_shader(ctx, AC_UD_VS_VERTEX_BUFFERS, user_sgpr_idx, 2);
|
||||
user_sgpr_idx += 2;
|
||||
ctx->vertex_buffers = LLVMGetParam(ctx->main_function, arg_idx++);
|
||||
}
|
||||
unsigned vs_num = 2;
|
||||
if (ctx->shader_info->info.vs.needs_draw_id)
|
||||
vs_num++;
|
||||
|
||||
set_userdata_location_shader(ctx, AC_UD_VS_BASE_VERTEX_START_INSTANCE, user_sgpr_idx, vs_num);
|
||||
user_sgpr_idx += vs_num;
|
||||
|
||||
ctx->base_vertex = LLVMGetParam(ctx->main_function, arg_idx++);
|
||||
ctx->start_instance = LLVMGetParam(ctx->main_function, arg_idx++);
|
||||
ctx->draw_index = LLVMGetParam(ctx->main_function, arg_idx++);
|
||||
if (ctx->shader_info->info.vs.needs_draw_id)
|
||||
ctx->draw_index = LLVMGetParam(ctx->main_function, arg_idx++);
|
||||
}
|
||||
if (ctx->options->key.vs.as_es)
|
||||
ctx->es2gs_offset = LLVMGetParam(ctx->main_function, arg_idx++);
|
||||
|
|
|
|||
|
|
@ -30,6 +30,9 @@ gather_intrinsic_info(nir_intrinsic_instr *instr, struct ac_shader_info *info)
|
|||
case nir_intrinsic_interp_var_at_sample:
|
||||
info->ps.needs_sample_positions = true;
|
||||
break;
|
||||
case nir_intrinsic_load_draw_id:
|
||||
info->vs.needs_draw_id = true;
|
||||
break;
|
||||
default:
|
||||
break;
|
||||
}
|
||||
|
|
@ -49,12 +52,30 @@ gather_info_block(nir_block *block, struct ac_shader_info *info)
|
|||
}
|
||||
}
|
||||
|
||||
static void
|
||||
gather_info_input_decl(nir_shader *nir,
|
||||
const struct ac_nir_compiler_options *options,
|
||||
nir_variable *var,
|
||||
struct ac_shader_info *info)
|
||||
{
|
||||
switch (nir->stage) {
|
||||
case MESA_SHADER_VERTEX:
|
||||
info->vs.has_vertex_buffers = true;
|
||||
break;
|
||||
default:
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
void
|
||||
ac_nir_shader_info_pass(struct nir_shader *nir,
|
||||
const struct ac_nir_compiler_options *options,
|
||||
struct ac_shader_info *info)
|
||||
{
|
||||
struct nir_function *func = (struct nir_function *)exec_list_get_head(&nir->functions);
|
||||
nir_foreach_variable(variable, &nir->inputs)
|
||||
gather_info_input_decl(nir, options, variable, info);
|
||||
|
||||
nir_foreach_block(block, func->impl) {
|
||||
gather_info_block(block, info);
|
||||
}
|
||||
|
|
|
|||
|
|
@ -28,6 +28,10 @@ struct ac_nir_compiler_options;
|
|||
/* a NIR pass to gather all the info needed to optimise the alloction patterns for the RADV user sgprs */
|
||||
|
||||
struct ac_shader_info {
|
||||
struct {
|
||||
bool has_vertex_buffers; /* needs vertex buffers and base/start */
|
||||
bool needs_draw_id;
|
||||
} vs;
|
||||
struct {
|
||||
bool needs_sample_positions;
|
||||
} ps;
|
||||
|
|
|
|||
|
|
@ -1427,7 +1427,8 @@ radv_cmd_buffer_flush_state(struct radv_cmd_buffer *cmd_buffer,
|
|||
cmd_buffer->cs, 4096);
|
||||
|
||||
if ((cmd_buffer->state.vertex_descriptors_dirty || cmd_buffer->state.vb_dirty) &&
|
||||
cmd_buffer->state.pipeline->num_vertex_attribs) {
|
||||
cmd_buffer->state.pipeline->num_vertex_attribs &&
|
||||
cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.has_vertex_buffers) {
|
||||
unsigned vb_offset;
|
||||
void *vb_ptr;
|
||||
uint32_t i = 0;
|
||||
|
|
@ -2512,10 +2513,16 @@ void radv_CmdDraw(
|
|||
if (loc->sgpr_idx != -1) {
|
||||
uint32_t base_reg = shader_stage_to_user_data_0(MESA_SHADER_VERTEX, radv_pipeline_has_gs(cmd_buffer->state.pipeline),
|
||||
radv_pipeline_has_tess(cmd_buffer->state.pipeline));
|
||||
radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, 3);
|
||||
int vs_num = 2;
|
||||
if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
|
||||
vs_num = 3;
|
||||
|
||||
assert (loc->num_sgprs == vs_num);
|
||||
radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, vs_num);
|
||||
radeon_emit(cmd_buffer->cs, firstVertex);
|
||||
radeon_emit(cmd_buffer->cs, firstInstance);
|
||||
radeon_emit(cmd_buffer->cs, 0);
|
||||
if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
|
||||
radeon_emit(cmd_buffer->cs, 0);
|
||||
}
|
||||
radeon_emit(cmd_buffer->cs, PKT3(PKT3_NUM_INSTANCES, 0, 0));
|
||||
radeon_emit(cmd_buffer->cs, instanceCount);
|
||||
|
|
@ -2555,10 +2562,16 @@ void radv_CmdDrawIndexed(
|
|||
if (loc->sgpr_idx != -1) {
|
||||
uint32_t base_reg = shader_stage_to_user_data_0(MESA_SHADER_VERTEX, radv_pipeline_has_gs(cmd_buffer->state.pipeline),
|
||||
radv_pipeline_has_tess(cmd_buffer->state.pipeline));
|
||||
radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, 3);
|
||||
int vs_num = 2;
|
||||
if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
|
||||
vs_num = 3;
|
||||
|
||||
assert (loc->num_sgprs == vs_num);
|
||||
radeon_set_sh_reg_seq(cmd_buffer->cs, base_reg + loc->sgpr_idx * 4, vs_num);
|
||||
radeon_emit(cmd_buffer->cs, vertexOffset);
|
||||
radeon_emit(cmd_buffer->cs, firstInstance);
|
||||
radeon_emit(cmd_buffer->cs, 0);
|
||||
if (cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id)
|
||||
radeon_emit(cmd_buffer->cs, 0);
|
||||
}
|
||||
radeon_emit(cmd_buffer->cs, PKT3(PKT3_NUM_INSTANCES, 0, 0));
|
||||
radeon_emit(cmd_buffer->cs, instanceCount);
|
||||
|
|
@ -2609,6 +2622,7 @@ radv_emit_indirect_draw(struct radv_cmd_buffer *cmd_buffer,
|
|||
AC_UD_VS_BASE_VERTEX_START_INSTANCE);
|
||||
uint32_t base_reg = shader_stage_to_user_data_0(MESA_SHADER_VERTEX, radv_pipeline_has_gs(cmd_buffer->state.pipeline),
|
||||
radv_pipeline_has_tess(cmd_buffer->state.pipeline));
|
||||
bool draw_id_enable = cmd_buffer->state.pipeline->shaders[MESA_SHADER_VERTEX]->info.info.vs.needs_draw_id;
|
||||
assert(loc->sgpr_idx != -1);
|
||||
radeon_emit(cs, PKT3(PKT3_SET_BASE, 2, 0));
|
||||
radeon_emit(cs, 1);
|
||||
|
|
@ -2622,7 +2636,7 @@ radv_emit_indirect_draw(struct radv_cmd_buffer *cmd_buffer,
|
|||
radeon_emit(cs, ((base_reg + loc->sgpr_idx * 4) - SI_SH_REG_OFFSET) >> 2);
|
||||
radeon_emit(cs, ((base_reg + (loc->sgpr_idx + 1) * 4) - SI_SH_REG_OFFSET) >> 2);
|
||||
radeon_emit(cs, (((base_reg + (loc->sgpr_idx + 2) * 4) - SI_SH_REG_OFFSET) >> 2) |
|
||||
S_2C3_DRAW_INDEX_ENABLE(1) |
|
||||
S_2C3_DRAW_INDEX_ENABLE(draw_id_enable) |
|
||||
S_2C3_COUNT_INDIRECT_ENABLE(!!count_va));
|
||||
radeon_emit(cs, draw_count); /* count */
|
||||
radeon_emit(cs, count_va); /* count_addr */
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue