mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2026-05-05 18:18:06 +02:00
glsl: remove opt_structure_splitting.
nir_lower_vars_to_ssa will split temp structs up anyway. This fixes a bug where mediump wouldn't be propagated to the split vars. The effect is tiny, I think just shuffling some code scheduling from optimizing at different places. Affects Natural Selection 2, Serious Sam 3, 3dmark slingshot, and Lego Legacy. freedreno shader-db: total instructions in shared programs: 11315637 -> 11315993 (<.01%) instructions in affected programs: 24861 -> 25217 (1.43%) Reviewed-by: Adam Jackson <ajax@redhat.com> Reviewed-by: Timothy Arceri <tarceri@itsqueeze.com> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/18466>
This commit is contained in:
parent
a19c0ce9b2
commit
a2a6995352
5 changed files with 0 additions and 379 deletions
|
|
@ -2386,7 +2386,6 @@ do_common_optimization(exec_list *ir, bool linked,
|
|||
if (linked) {
|
||||
OPT(do_function_inlining, ir);
|
||||
OPT(do_dead_functions, ir);
|
||||
OPT(do_structure_splitting, ir);
|
||||
}
|
||||
OPT(propagate_invariance, ir);
|
||||
OPT(do_if_simplification, ir);
|
||||
|
|
|
|||
|
|
@ -103,7 +103,6 @@ bool do_if_simplification(exec_list *instructions);
|
|||
bool opt_flatten_nested_if_blocks(exec_list *instructions);
|
||||
bool do_mat_op_to_vec(exec_list *instructions);
|
||||
bool do_minmax_prune(exec_list *instructions);
|
||||
bool do_structure_splitting(exec_list *instructions);
|
||||
bool do_tree_grafting(exec_list *instructions);
|
||||
bool do_vec_index_to_cond_assign(exec_list *instructions);
|
||||
bool do_vec_index_to_swizzle(exec_list *instructions);
|
||||
|
|
|
|||
|
|
@ -186,7 +186,6 @@ files_libglsl = files(
|
|||
'opt_if_simplification.cpp',
|
||||
'opt_minmax.cpp',
|
||||
'opt_rebalance_tree.cpp',
|
||||
'opt_structure_splitting.cpp',
|
||||
'opt_tree_grafting.cpp',
|
||||
'program.h',
|
||||
'propagate_invariance.cpp',
|
||||
|
|
|
|||
|
|
@ -1,374 +0,0 @@
|
|||
/*
|
||||
* Copyright © 2010 Intel Corporation
|
||||
*
|
||||
* Permission is hereby granted, free of charge, to any person obtaining a
|
||||
* copy of this software and associated documentation files (the "Software"),
|
||||
* to deal in the Software without restriction, including without limitation
|
||||
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
||||
* and/or sell copies of the Software, and to permit persons to whom the
|
||||
* Software is furnished to do so, subject to the following conditions:
|
||||
*
|
||||
* The above copyright notice and this permission notice (including the next
|
||||
* paragraph) shall be included in all copies or substantial portions of the
|
||||
* Software.
|
||||
*
|
||||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
||||
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
||||
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
||||
* DEALINGS IN THE SOFTWARE.
|
||||
*/
|
||||
|
||||
/**
|
||||
* \file opt_structure_splitting.cpp
|
||||
*
|
||||
* If a structure is only ever referenced by its components, then
|
||||
* split those components out to individual variables so they can be
|
||||
* handled normally by other optimization passes.
|
||||
*
|
||||
* This skips structures like uniforms, which need to be accessible as
|
||||
* structures for their access by the GL.
|
||||
*/
|
||||
|
||||
#include "ir.h"
|
||||
#include "ir_visitor.h"
|
||||
#include "ir_rvalue_visitor.h"
|
||||
#include "compiler/glsl_types.h"
|
||||
|
||||
namespace {
|
||||
|
||||
static bool debug = false;
|
||||
|
||||
class variable_entry : public exec_node
|
||||
{
|
||||
public:
|
||||
variable_entry(ir_variable *var)
|
||||
{
|
||||
this->var = var;
|
||||
this->whole_structure_access = 0;
|
||||
this->declaration = false;
|
||||
this->components = NULL;
|
||||
this->mem_ctx = NULL;
|
||||
}
|
||||
|
||||
ir_variable *var; /* The key: the variable's pointer. */
|
||||
|
||||
/** Number of times the variable is referenced, including assignments. */
|
||||
unsigned whole_structure_access;
|
||||
|
||||
/* If the variable had a decl we can work with in the instruction
|
||||
* stream. We can't do splitting on function arguments, which
|
||||
* don't get this variable set.
|
||||
*/
|
||||
bool declaration;
|
||||
|
||||
ir_variable **components;
|
||||
|
||||
/** ralloc_parent(this->var) -- the shader's ralloc context. */
|
||||
void *mem_ctx;
|
||||
};
|
||||
|
||||
|
||||
class ir_structure_reference_visitor : public ir_hierarchical_visitor {
|
||||
public:
|
||||
ir_structure_reference_visitor(void)
|
||||
{
|
||||
this->mem_ctx = ralloc_context(NULL);
|
||||
this->variable_list.make_empty();
|
||||
}
|
||||
|
||||
~ir_structure_reference_visitor(void)
|
||||
{
|
||||
ralloc_free(mem_ctx);
|
||||
}
|
||||
|
||||
virtual ir_visitor_status visit(ir_variable *);
|
||||
virtual ir_visitor_status visit(ir_dereference_variable *);
|
||||
virtual ir_visitor_status visit_enter(ir_dereference_record *);
|
||||
virtual ir_visitor_status visit_enter(ir_assignment *);
|
||||
virtual ir_visitor_status visit_enter(ir_function_signature *);
|
||||
|
||||
variable_entry *get_variable_entry(ir_variable *var);
|
||||
|
||||
/* List of variable_entry */
|
||||
exec_list variable_list;
|
||||
|
||||
void *mem_ctx;
|
||||
};
|
||||
|
||||
variable_entry *
|
||||
ir_structure_reference_visitor::get_variable_entry(ir_variable *var)
|
||||
{
|
||||
assert(var);
|
||||
|
||||
if (!var->type->is_struct() ||
|
||||
var->data.mode == ir_var_uniform || var->data.mode == ir_var_shader_storage ||
|
||||
var->data.mode == ir_var_shader_in || var->data.mode == ir_var_shader_out)
|
||||
return NULL;
|
||||
|
||||
foreach_in_list(variable_entry, entry, &this->variable_list) {
|
||||
if (entry->var == var)
|
||||
return entry;
|
||||
}
|
||||
|
||||
variable_entry *entry = new(mem_ctx) variable_entry(var);
|
||||
this->variable_list.push_tail(entry);
|
||||
return entry;
|
||||
}
|
||||
|
||||
|
||||
ir_visitor_status
|
||||
ir_structure_reference_visitor::visit(ir_variable *ir)
|
||||
{
|
||||
variable_entry *entry = this->get_variable_entry(ir);
|
||||
|
||||
if (entry)
|
||||
entry->declaration = true;
|
||||
|
||||
return visit_continue;
|
||||
}
|
||||
|
||||
ir_visitor_status
|
||||
ir_structure_reference_visitor::visit(ir_dereference_variable *ir)
|
||||
{
|
||||
ir_variable *const var = ir->variable_referenced();
|
||||
variable_entry *entry = this->get_variable_entry(var);
|
||||
|
||||
if (entry)
|
||||
entry->whole_structure_access++;
|
||||
|
||||
return visit_continue;
|
||||
}
|
||||
|
||||
ir_visitor_status
|
||||
ir_structure_reference_visitor::visit_enter(ir_dereference_record *ir)
|
||||
{
|
||||
(void) ir;
|
||||
/* Don't descend into the ir_dereference_variable below. */
|
||||
return visit_continue_with_parent;
|
||||
}
|
||||
|
||||
ir_visitor_status
|
||||
ir_structure_reference_visitor::visit_enter(ir_assignment *ir)
|
||||
{
|
||||
/* If there are no structure references yet, no need to bother with
|
||||
* processing the expression tree.
|
||||
*/
|
||||
if (this->variable_list.is_empty())
|
||||
return visit_continue_with_parent;
|
||||
|
||||
if (ir->lhs->as_dereference_variable() &&
|
||||
ir->rhs->as_dereference_variable()) {
|
||||
/* We'll split copies of a structure to copies of components, so don't
|
||||
* descend to the ir_dereference_variables.
|
||||
*/
|
||||
return visit_continue_with_parent;
|
||||
}
|
||||
return visit_continue;
|
||||
}
|
||||
|
||||
ir_visitor_status
|
||||
ir_structure_reference_visitor::visit_enter(ir_function_signature *ir)
|
||||
{
|
||||
/* We don't have logic for structure-splitting function arguments,
|
||||
* so just look at the body instructions and not the parameter
|
||||
* declarations.
|
||||
*/
|
||||
visit_list_elements(this, &ir->body);
|
||||
return visit_continue_with_parent;
|
||||
}
|
||||
|
||||
class ir_structure_splitting_visitor : public ir_rvalue_visitor {
|
||||
public:
|
||||
ir_structure_splitting_visitor(exec_list *vars)
|
||||
{
|
||||
this->variable_list = vars;
|
||||
}
|
||||
|
||||
virtual ~ir_structure_splitting_visitor()
|
||||
{
|
||||
}
|
||||
|
||||
virtual ir_visitor_status visit_leave(ir_assignment *);
|
||||
|
||||
void split_deref(ir_dereference **deref);
|
||||
void handle_rvalue(ir_rvalue **rvalue);
|
||||
variable_entry *get_splitting_entry(ir_variable *var);
|
||||
|
||||
exec_list *variable_list;
|
||||
};
|
||||
|
||||
variable_entry *
|
||||
ir_structure_splitting_visitor::get_splitting_entry(ir_variable *var)
|
||||
{
|
||||
assert(var);
|
||||
|
||||
if (!var->type->is_struct())
|
||||
return NULL;
|
||||
|
||||
foreach_in_list(variable_entry, entry, this->variable_list) {
|
||||
if (entry->var == var) {
|
||||
return entry;
|
||||
}
|
||||
}
|
||||
|
||||
return NULL;
|
||||
}
|
||||
|
||||
void
|
||||
ir_structure_splitting_visitor::split_deref(ir_dereference **deref)
|
||||
{
|
||||
if ((*deref)->ir_type != ir_type_dereference_record)
|
||||
return;
|
||||
|
||||
ir_dereference_record *deref_record = (ir_dereference_record *)*deref;
|
||||
ir_dereference_variable *deref_var = deref_record->record->as_dereference_variable();
|
||||
if (!deref_var)
|
||||
return;
|
||||
|
||||
variable_entry *entry = get_splitting_entry(deref_var->var);
|
||||
if (!entry)
|
||||
return;
|
||||
|
||||
int i = deref_record->field_idx;
|
||||
assert(i >= 0);
|
||||
assert((unsigned) i < entry->var->type->length);
|
||||
|
||||
*deref = new(entry->mem_ctx) ir_dereference_variable(entry->components[i]);
|
||||
}
|
||||
|
||||
void
|
||||
ir_structure_splitting_visitor::handle_rvalue(ir_rvalue **rvalue)
|
||||
{
|
||||
if (!*rvalue)
|
||||
return;
|
||||
|
||||
ir_dereference *deref = (*rvalue)->as_dereference();
|
||||
|
||||
if (!deref)
|
||||
return;
|
||||
|
||||
split_deref(&deref);
|
||||
*rvalue = deref;
|
||||
}
|
||||
|
||||
ir_visitor_status
|
||||
ir_structure_splitting_visitor::visit_leave(ir_assignment *ir)
|
||||
{
|
||||
ir_dereference_variable *lhs_deref = ir->lhs->as_dereference_variable();
|
||||
ir_dereference_variable *rhs_deref = ir->rhs->as_dereference_variable();
|
||||
variable_entry *lhs_entry = lhs_deref ? get_splitting_entry(lhs_deref->var) : NULL;
|
||||
variable_entry *rhs_entry = rhs_deref ? get_splitting_entry(rhs_deref->var) : NULL;
|
||||
const glsl_type *type = ir->rhs->type;
|
||||
|
||||
if (lhs_entry || rhs_entry) {
|
||||
for (unsigned int i = 0; i < type->length; i++) {
|
||||
ir_dereference *new_lhs, *new_rhs;
|
||||
void *mem_ctx = lhs_entry ? lhs_entry->mem_ctx : rhs_entry->mem_ctx;
|
||||
|
||||
if (lhs_entry) {
|
||||
new_lhs = new(mem_ctx) ir_dereference_variable(lhs_entry->components[i]);
|
||||
} else {
|
||||
new_lhs = new(mem_ctx)
|
||||
ir_dereference_record(ir->lhs->clone(mem_ctx, NULL),
|
||||
type->fields.structure[i].name);
|
||||
}
|
||||
|
||||
if (rhs_entry) {
|
||||
new_rhs = new(mem_ctx) ir_dereference_variable(rhs_entry->components[i]);
|
||||
} else {
|
||||
new_rhs = new(mem_ctx)
|
||||
ir_dereference_record(ir->rhs->clone(mem_ctx, NULL),
|
||||
type->fields.structure[i].name);
|
||||
}
|
||||
|
||||
ir->insert_before(new(mem_ctx) ir_assignment(new_lhs, new_rhs));
|
||||
}
|
||||
ir->remove();
|
||||
} else {
|
||||
handle_rvalue(&ir->rhs);
|
||||
split_deref(&ir->lhs);
|
||||
}
|
||||
|
||||
return visit_continue;
|
||||
}
|
||||
|
||||
} /* unnamed namespace */
|
||||
|
||||
bool
|
||||
do_structure_splitting(exec_list *instructions)
|
||||
{
|
||||
ir_structure_reference_visitor refs;
|
||||
|
||||
visit_list_elements(&refs, instructions);
|
||||
|
||||
/* Trim out variables we can't split. */
|
||||
foreach_in_list_safe(variable_entry, entry, &refs.variable_list) {
|
||||
if (debug) {
|
||||
printf("structure %s@%p: decl %d, whole_access %d\n",
|
||||
entry->var->name, (void *) entry->var, entry->declaration,
|
||||
entry->whole_structure_access);
|
||||
}
|
||||
|
||||
if (!entry->declaration || entry->whole_structure_access) {
|
||||
entry->remove();
|
||||
}
|
||||
}
|
||||
|
||||
if (refs.variable_list.is_empty())
|
||||
return false;
|
||||
|
||||
void *mem_ctx = ralloc_context(NULL);
|
||||
|
||||
/* Replace the decls of the structures to be split with their split
|
||||
* components.
|
||||
*/
|
||||
foreach_in_list_safe(variable_entry, entry, &refs.variable_list) {
|
||||
const struct glsl_type *type = entry->var->type;
|
||||
|
||||
entry->mem_ctx = ralloc_parent(entry->var);
|
||||
|
||||
entry->components = ralloc_array(mem_ctx, ir_variable *, type->length);
|
||||
|
||||
for (unsigned int i = 0; i < entry->var->type->length; i++) {
|
||||
const char *name = ralloc_asprintf(mem_ctx, "%s_%s", entry->var->name,
|
||||
type->fields.structure[i].name);
|
||||
ir_variable *new_var =
|
||||
new(entry->mem_ctx) ir_variable(type->fields.structure[i].type,
|
||||
name,
|
||||
(ir_variable_mode) entry->var->data.mode);
|
||||
|
||||
if (type->fields.structure[i].type->without_array()->is_image()) {
|
||||
/* Do not lose memory/format qualifiers for images declared inside
|
||||
* structures as allowed by ARB_bindless_texture.
|
||||
*/
|
||||
new_var->data.memory_read_only =
|
||||
type->fields.structure[i].memory_read_only;
|
||||
new_var->data.memory_write_only =
|
||||
type->fields.structure[i].memory_write_only;
|
||||
new_var->data.memory_coherent =
|
||||
type->fields.structure[i].memory_coherent;
|
||||
new_var->data.memory_volatile =
|
||||
type->fields.structure[i].memory_volatile;
|
||||
new_var->data.memory_restrict =
|
||||
type->fields.structure[i].memory_restrict;
|
||||
new_var->data.image_format =
|
||||
type->fields.structure[i].image_format;
|
||||
}
|
||||
|
||||
entry->components[i] = new_var;
|
||||
entry->var->insert_before(entry->components[i]);
|
||||
}
|
||||
|
||||
entry->var->remove();
|
||||
}
|
||||
|
||||
ir_structure_splitting_visitor split(&refs.variable_list);
|
||||
visit_list_elements(&split, instructions);
|
||||
|
||||
ralloc_free(mem_ctx);
|
||||
|
||||
return true;
|
||||
}
|
||||
|
|
@ -95,8 +95,6 @@ do_optimization(struct exec_list *ir, const char *optimization,
|
|||
return do_if_simplification(ir);
|
||||
} else if (strcmp(optimization, "do_mat_op_to_vec") == 0) {
|
||||
return do_mat_op_to_vec(ir);
|
||||
} else if (strcmp(optimization, "do_structure_splitting") == 0) {
|
||||
return do_structure_splitting(ir);
|
||||
} else if (strcmp(optimization, "do_tree_grafting") == 0) {
|
||||
return do_tree_grafting(ir);
|
||||
} else if (strcmp(optimization, "do_vec_index_to_cond_assign") == 0) {
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue