mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2025-12-23 04:40:09 +01:00
i965: Make the userclip flag for the VUE map come from VS prog data.
This reduces recomputation of state based on non-clipping-related transform changes, and is a step toward removing VUE map recomputation.

Reviewed-by: Kenneth Graunke <kenneth@whitecape.org>
This commit is contained in:
parent
b5c409363c
commit
9f3d3216cf
10 changed files with 29 additions and 39 deletions
|
|
@ -69,7 +69,7 @@ static void compile_clip_prog( struct brw_context *brw,
|
||||||
c.func.single_program_flow = 1;
|
c.func.single_program_flow = 1;
|
||||||
|
|
||||||
c.key = *key;
|
c.key = *key;
|
||||||
brw_compute_vue_map(&c.vue_map, intel, c.key.nr_userclip > 0, c.key.attrs);
|
brw_compute_vue_map(&c.vue_map, intel, brw->vs.prog_data);
|
||||||
|
|
||||||
/* nr_regs is the number of registers filled by reading data from the VUE.
|
/* nr_regs is the number of registers filled by reading data from the VUE.
|
||||||
* This program accesses the entire VUE, so nr_regs needs to be the size of
|
* This program accesses the entire VUE, so nr_regs needs to be the size of
|
||||||
|
|
@ -145,12 +145,12 @@ brw_upload_clip_prog(struct brw_context *brw)
|
||||||
*/
|
*/
|
||||||
/* BRW_NEW_REDUCED_PRIMITIVE */
|
/* BRW_NEW_REDUCED_PRIMITIVE */
|
||||||
key.primitive = brw->intel.reduced_primitive;
|
key.primitive = brw->intel.reduced_primitive;
|
||||||
/* CACHE_NEW_VS_PROG */
|
/* CACHE_NEW_VS_PROG (also part of VUE map) */
|
||||||
key.attrs = brw->vs.prog_data->outputs_written;
|
key.attrs = brw->vs.prog_data->outputs_written;
|
||||||
/* _NEW_LIGHT */
|
/* _NEW_LIGHT */
|
||||||
key.do_flat_shading = (ctx->Light.ShadeModel == GL_FLAT);
|
key.do_flat_shading = (ctx->Light.ShadeModel == GL_FLAT);
|
||||||
key.pv_first = (ctx->Light.ProvokingVertex == GL_FIRST_VERTEX_CONVENTION);
|
key.pv_first = (ctx->Light.ProvokingVertex == GL_FIRST_VERTEX_CONVENTION);
|
||||||
/* _NEW_TRANSFORM */
|
/* _NEW_TRANSFORM (also part of VUE map)*/
|
||||||
key.nr_userclip = _mesa_bitcount_64(ctx->Transform.ClipPlanesEnabled);
|
key.nr_userclip = _mesa_bitcount_64(ctx->Transform.ClipPlanesEnabled);
|
||||||
|
|
||||||
if (intel->gen == 5)
|
if (intel->gen == 5)
|
||||||
|
|
|
||||||
|
|
@ -400,6 +400,7 @@ struct brw_vs_prog_data {
|
||||||
|
|
||||||
bool uses_new_param_layout;
|
bool uses_new_param_layout;
|
||||||
bool uses_vertexid;
|
bool uses_vertexid;
|
||||||
|
bool userclip;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
|
|
@ -1046,8 +1047,7 @@ int brw_disasm (FILE *file, struct brw_instruction *inst, int gen);
|
||||||
/* brw_vs.c */
|
/* brw_vs.c */
|
||||||
void brw_compute_vue_map(struct brw_vue_map *vue_map,
|
void brw_compute_vue_map(struct brw_vue_map *vue_map,
|
||||||
const struct intel_context *intel,
|
const struct intel_context *intel,
|
||||||
bool userclip_active,
|
const struct brw_vs_prog_data *prog_data);
|
||||||
GLbitfield64 outputs_written);
|
|
||||||
gl_clip_plane *brw_select_clip_planes(struct gl_context *ctx);
|
gl_clip_plane *brw_select_clip_planes(struct gl_context *ctx);
|
||||||
|
|
||||||
/* brw_wm.c */
|
/* brw_wm.c */
|
||||||
|
|
|
||||||
|
|
@ -56,8 +56,7 @@ static void compile_gs_prog( struct brw_context *brw,
|
||||||
memset(&c, 0, sizeof(c));
|
memset(&c, 0, sizeof(c));
|
||||||
|
|
||||||
c.key = *key;
|
c.key = *key;
|
||||||
/* The geometry shader needs to access the entire VUE. */
|
brw_compute_vue_map(&c.vue_map, intel, brw->vs.prog_data);
|
||||||
brw_compute_vue_map(&c.vue_map, intel, c.key.userclip_active, c.key.attrs);
|
|
||||||
c.nr_regs = (c.vue_map.num_slots + 1)/2;
|
c.nr_regs = (c.vue_map.num_slots + 1)/2;
|
||||||
|
|
||||||
mem_ctx = NULL;
|
mem_ctx = NULL;
|
||||||
|
|
@ -166,7 +165,7 @@ static void populate_key( struct brw_context *brw,
|
||||||
|
|
||||||
memset(key, 0, sizeof(*key));
|
memset(key, 0, sizeof(*key));
|
||||||
|
|
||||||
/* CACHE_NEW_VS_PROG */
|
/* CACHE_NEW_VS_PROG (part of VUE map) */
|
||||||
key->attrs = brw->vs.prog_data->outputs_written;
|
key->attrs = brw->vs.prog_data->outputs_written;
|
||||||
|
|
||||||
/* BRW_NEW_PRIMITIVE */
|
/* BRW_NEW_PRIMITIVE */
|
||||||
|
|
@ -181,8 +180,8 @@ static void populate_key( struct brw_context *brw,
|
||||||
key->pv_first = true;
|
key->pv_first = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* _NEW_TRANSFORM */
|
/* CACHE_NEW_VS_PROG (part of VUE map)*/
|
||||||
key->userclip_active = (ctx->Transform.ClipPlanesEnabled != 0);
|
key->userclip_active = brw->vs.prog_data->userclip;
|
||||||
|
|
||||||
if (intel->gen >= 7) {
|
if (intel->gen >= 7) {
|
||||||
/* On Gen7 and later, we don't use GS (yet). */
|
/* On Gen7 and later, we don't use GS (yet). */
|
||||||
|
|
@ -267,7 +266,6 @@ brw_upload_gs_prog(struct brw_context *brw)
|
||||||
const struct brw_tracked_state brw_gs_prog = {
|
const struct brw_tracked_state brw_gs_prog = {
|
||||||
.dirty = {
|
.dirty = {
|
||||||
.mesa = (_NEW_LIGHT |
|
.mesa = (_NEW_LIGHT |
|
||||||
_NEW_TRANSFORM |
|
|
||||||
_NEW_TRANSFORM_FEEDBACK |
|
_NEW_TRANSFORM_FEEDBACK |
|
||||||
_NEW_RASTERIZER_DISCARD),
|
_NEW_RASTERIZER_DISCARD),
|
||||||
.brw = BRW_NEW_PRIMITIVE,
|
.brw = BRW_NEW_PRIMITIVE,
|
||||||
|
|
|
||||||
|
|
@ -63,7 +63,7 @@ static void compile_sf_prog( struct brw_context *brw,
|
||||||
brw_init_compile(brw, &c.func, mem_ctx);
|
brw_init_compile(brw, &c.func, mem_ctx);
|
||||||
|
|
||||||
c.key = *key;
|
c.key = *key;
|
||||||
brw_compute_vue_map(&c.vue_map, intel, c.key.userclip_active, c.key.attrs);
|
brw_compute_vue_map(&c.vue_map, intel, brw->vs.prog_data);
|
||||||
c.urb_entry_read_offset = brw_sf_compute_urb_entry_read_offset(intel);
|
c.urb_entry_read_offset = brw_sf_compute_urb_entry_read_offset(intel);
|
||||||
c.nr_attr_regs = (c.vue_map.num_slots + 1)/2 - c.urb_entry_read_offset;
|
c.nr_attr_regs = (c.vue_map.num_slots + 1)/2 - c.urb_entry_read_offset;
|
||||||
c.nr_setup_regs = c.nr_attr_regs;
|
c.nr_setup_regs = c.nr_attr_regs;
|
||||||
|
|
|
||||||
|
|
@ -2252,8 +2252,7 @@ vec4_visitor::emit_urb_writes()
|
||||||
|
|
||||||
/* FINISHME: edgeflag */
|
/* FINISHME: edgeflag */
|
||||||
|
|
||||||
brw_compute_vue_map(&c->vue_map, intel, c->key.userclip_active,
|
brw_compute_vue_map(&c->vue_map, intel, &c->prog_data);
|
||||||
c->prog_data.outputs_written);
|
|
||||||
|
|
||||||
/* First mrf is the g0-based message header containing URB handles and such,
|
/* First mrf is the g0-based message header containing URB handles and such,
|
||||||
* which is implied in VS_OPCODE_URB_WRITE.
|
* which is implied in VS_OPCODE_URB_WRITE.
|
||||||
|
|
|
||||||
|
|
@ -52,13 +52,18 @@ static inline void assign_vue_slot(struct brw_vue_map *vue_map,
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Compute the VUE map for vertex shader program.
|
* Compute the VUE map for vertex shader program.
|
||||||
|
*
|
||||||
|
* Note that consumers of this map using cache keys must include
|
||||||
|
* prog_data->userclip and prog_data->outputs_written in their key
|
||||||
|
* (generated by CACHE_NEW_VS_PROG).
|
||||||
*/
|
*/
|
||||||
void
|
void
|
||||||
brw_compute_vue_map(struct brw_vue_map *vue_map,
|
brw_compute_vue_map(struct brw_vue_map *vue_map,
|
||||||
const struct intel_context *intel,
|
const struct intel_context *intel,
|
||||||
bool userclip_active,
|
const struct brw_vs_prog_data *prog_data)
|
||||||
GLbitfield64 outputs_written)
|
|
||||||
{
|
{
|
||||||
|
bool userclip_active = prog_data->userclip;
|
||||||
|
GLbitfield64 outputs_written = prog_data->outputs_written;
|
||||||
int i;
|
int i;
|
||||||
|
|
||||||
vue_map->num_slots = 0;
|
vue_map->num_slots = 0;
|
||||||
|
|
|
||||||
|
|
@ -173,6 +173,7 @@ static inline bool can_use_direct_mrf(int vert_result,
|
||||||
*/
|
*/
|
||||||
static void brw_vs_alloc_regs( struct brw_vs_compile *c )
|
static void brw_vs_alloc_regs( struct brw_vs_compile *c )
|
||||||
{
|
{
|
||||||
|
struct brw_context *brw = c->func.brw;
|
||||||
struct intel_context *intel = &c->func.brw->intel;
|
struct intel_context *intel = &c->func.brw->intel;
|
||||||
GLuint i, reg = 0, slot;
|
GLuint i, reg = 0, slot;
|
||||||
int attributes_in_vue;
|
int attributes_in_vue;
|
||||||
|
|
@ -325,8 +326,7 @@ static void brw_vs_alloc_regs( struct brw_vs_compile *c )
|
||||||
|
|
||||||
/* Allocate outputs. The non-position outputs go straight into message regs.
|
/* Allocate outputs. The non-position outputs go straight into message regs.
|
||||||
*/
|
*/
|
||||||
brw_compute_vue_map(&c->vue_map, intel, c->key.userclip_active,
|
brw_compute_vue_map(&c->vue_map, intel, &c->prog_data);
|
||||||
c->prog_data.outputs_written);
|
|
||||||
c->first_output = reg;
|
c->first_output = reg;
|
||||||
|
|
||||||
first_reladdr_output = get_first_reladdr_output(&c->vp->program);
|
first_reladdr_output = get_first_reladdr_output(&c->vp->program);
|
||||||
|
|
|
||||||
|
|
@ -114,8 +114,6 @@ upload_sf_state(struct brw_context *brw)
|
||||||
struct gl_context *ctx = &intel->ctx;
|
struct gl_context *ctx = &intel->ctx;
|
||||||
struct brw_vue_map vue_map;
|
struct brw_vue_map vue_map;
|
||||||
uint32_t urb_entry_read_length;
|
uint32_t urb_entry_read_length;
|
||||||
/* CACHE_NEW_VS_PROG */
|
|
||||||
GLbitfield64 vs_outputs_written = brw->vs.prog_data->outputs_written;
|
|
||||||
/* BRW_NEW_FRAGMENT_PROGRAM */
|
/* BRW_NEW_FRAGMENT_PROGRAM */
|
||||||
uint32_t num_outputs = _mesa_bitcount_64(brw->fragment_program->Base.InputsRead);
|
uint32_t num_outputs = _mesa_bitcount_64(brw->fragment_program->Base.InputsRead);
|
||||||
/* _NEW_LIGHT */
|
/* _NEW_LIGHT */
|
||||||
|
|
@ -128,13 +126,10 @@ upload_sf_state(struct brw_context *brw)
|
||||||
int urb_entry_read_offset = 1;
|
int urb_entry_read_offset = 1;
|
||||||
float point_size;
|
float point_size;
|
||||||
uint16_t attr_overrides[FRAG_ATTRIB_MAX];
|
uint16_t attr_overrides[FRAG_ATTRIB_MAX];
|
||||||
bool userclip_active;
|
|
||||||
uint32_t point_sprite_origin;
|
uint32_t point_sprite_origin;
|
||||||
|
|
||||||
/* _NEW_TRANSFORM */
|
/* CACHE_NEW_VS_PROG */
|
||||||
userclip_active = (ctx->Transform.ClipPlanesEnabled != 0);
|
brw_compute_vue_map(&vue_map, intel, brw->vs.prog_data);
|
||||||
|
|
||||||
brw_compute_vue_map(&vue_map, intel, userclip_active, vs_outputs_written);
|
|
||||||
urb_entry_read_length = (vue_map.num_slots + 1)/2 - urb_entry_read_offset;
|
urb_entry_read_length = (vue_map.num_slots + 1)/2 - urb_entry_read_offset;
|
||||||
if (urb_entry_read_length == 0) {
|
if (urb_entry_read_length == 0) {
|
||||||
/* Setting the URB entry read length to 0 causes undefined behavior, so
|
/* Setting the URB entry read length to 0 causes undefined behavior, so
|
||||||
|
|
@ -342,8 +337,7 @@ const struct brw_tracked_state gen6_sf_state = {
|
||||||
_NEW_LINE |
|
_NEW_LINE |
|
||||||
_NEW_SCISSOR |
|
_NEW_SCISSOR |
|
||||||
_NEW_BUFFERS |
|
_NEW_BUFFERS |
|
||||||
_NEW_POINT |
|
_NEW_POINT),
|
||||||
_NEW_TRANSFORM),
|
|
||||||
.brw = (BRW_NEW_CONTEXT |
|
.brw = (BRW_NEW_CONTEXT |
|
||||||
BRW_NEW_FRAGMENT_PROGRAM),
|
BRW_NEW_FRAGMENT_PROGRAM),
|
||||||
.cache = CACHE_NEW_VS_PROG
|
.cache = CACHE_NEW_VS_PROG
|
||||||
|
|
|
||||||
|
|
@ -35,8 +35,6 @@ upload_sbe_state(struct brw_context *brw)
|
||||||
struct gl_context *ctx = &intel->ctx;
|
struct gl_context *ctx = &intel->ctx;
|
||||||
struct brw_vue_map vue_map;
|
struct brw_vue_map vue_map;
|
||||||
uint32_t urb_entry_read_length;
|
uint32_t urb_entry_read_length;
|
||||||
/* CACHE_NEW_VS_PROG */
|
|
||||||
GLbitfield64 vs_outputs_written = brw->vs.prog_data->outputs_written;
|
|
||||||
/* BRW_NEW_FRAGMENT_PROGRAM */
|
/* BRW_NEW_FRAGMENT_PROGRAM */
|
||||||
uint32_t num_outputs = _mesa_bitcount_64(brw->fragment_program->Base.InputsRead);
|
uint32_t num_outputs = _mesa_bitcount_64(brw->fragment_program->Base.InputsRead);
|
||||||
/* _NEW_LIGHT */
|
/* _NEW_LIGHT */
|
||||||
|
|
@ -44,15 +42,14 @@ upload_sbe_state(struct brw_context *brw)
|
||||||
uint32_t dw1, dw10, dw11;
|
uint32_t dw1, dw10, dw11;
|
||||||
int i;
|
int i;
|
||||||
int attr = 0, input_index = 0;
|
int attr = 0, input_index = 0;
|
||||||
/* _NEW_TRANSFORM */
|
|
||||||
int urb_entry_read_offset = 1;
|
int urb_entry_read_offset = 1;
|
||||||
bool userclip_active = (ctx->Transform.ClipPlanesEnabled != 0);
|
|
||||||
uint16_t attr_overrides[FRAG_ATTRIB_MAX];
|
uint16_t attr_overrides[FRAG_ATTRIB_MAX];
|
||||||
/* _NEW_BUFFERS */
|
/* _NEW_BUFFERS */
|
||||||
bool render_to_fbo = ctx->DrawBuffer->Name != 0;
|
bool render_to_fbo = ctx->DrawBuffer->Name != 0;
|
||||||
uint32_t point_sprite_origin;
|
uint32_t point_sprite_origin;
|
||||||
|
|
||||||
brw_compute_vue_map(&vue_map, intel, userclip_active, vs_outputs_written);
|
/* CACHE_NEW_VS_PROG */
|
||||||
|
brw_compute_vue_map(&vue_map, intel, brw->vs.prog_data);
|
||||||
urb_entry_read_length = (vue_map.num_slots + 1)/2 - urb_entry_read_offset;
|
urb_entry_read_length = (vue_map.num_slots + 1)/2 - urb_entry_read_offset;
|
||||||
if (urb_entry_read_length == 0) {
|
if (urb_entry_read_length == 0) {
|
||||||
/* Setting the URB entry read length to 0 causes undefined behavior, so
|
/* Setting the URB entry read length to 0 causes undefined behavior, so
|
||||||
|
|
@ -146,8 +143,7 @@ const struct brw_tracked_state gen7_sbe_state = {
|
||||||
.dirty = {
|
.dirty = {
|
||||||
.mesa = (_NEW_LIGHT |
|
.mesa = (_NEW_LIGHT |
|
||||||
_NEW_POINT |
|
_NEW_POINT |
|
||||||
_NEW_PROGRAM |
|
_NEW_PROGRAM),
|
||||||
_NEW_TRANSFORM),
|
|
||||||
.brw = (BRW_NEW_CONTEXT |
|
.brw = (BRW_NEW_CONTEXT |
|
||||||
BRW_NEW_FRAGMENT_PROGRAM),
|
BRW_NEW_FRAGMENT_PROGRAM),
|
||||||
.cache = CACHE_NEW_VS_PROG
|
.cache = CACHE_NEW_VS_PROG
|
||||||
|
|
|
||||||
|
|
@ -241,9 +241,8 @@ upload_sol_state(struct brw_context *brw)
|
||||||
bool active = xfb_obj->Active && !xfb_obj->Paused;
|
bool active = xfb_obj->Active && !xfb_obj->Paused;
|
||||||
struct brw_vue_map vue_map;
|
struct brw_vue_map vue_map;
|
||||||
|
|
||||||
/* _NEW_TRANSFORM, CACHE_NEW_VS_PROG */
|
/* CACHE_NEW_VS_PROG */
|
||||||
brw_compute_vue_map(&vue_map, intel, ctx->Transform.ClipPlanesEnabled != 0,
|
brw_compute_vue_map(&vue_map, intel, brw->vs.prog_data);
|
||||||
brw->vs.prog_data->outputs_written);
|
|
||||||
|
|
||||||
if (active) {
|
if (active) {
|
||||||
upload_3dstate_so_buffers(brw);
|
upload_3dstate_so_buffers(brw);
|
||||||
|
|
@ -264,8 +263,7 @@ const struct brw_tracked_state gen7_sol_state = {
|
||||||
.dirty = {
|
.dirty = {
|
||||||
.mesa = (_NEW_RASTERIZER_DISCARD |
|
.mesa = (_NEW_RASTERIZER_DISCARD |
|
||||||
_NEW_LIGHT |
|
_NEW_LIGHT |
|
||||||
_NEW_TRANSFORM_FEEDBACK |
|
_NEW_TRANSFORM_FEEDBACK),
|
||||||
_NEW_TRANSFORM),
|
|
||||||
.brw = (BRW_NEW_BATCH |
|
.brw = (BRW_NEW_BATCH |
|
||||||
BRW_NEW_VERTEX_PROGRAM),
|
BRW_NEW_VERTEX_PROGRAM),
|
||||||
.cache = CACHE_NEW_VS_PROG,
|
.cache = CACHE_NEW_VS_PROG,
|
||||||
|
|
|
||||||
Loading…
Add table
Reference in a new issue