freedreno/a6xx: Switch to relying on fd6_view for our texture descriptors.

Having checked the deltas between fdl6_view and what we did before, switch
over to fdl6_view now.

No statistically significant difference on no-hw drawoverhead 8-texture
change (n=50) with the texture cache disabled from this and the previous
commit.

Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/13443>
This commit is contained in:
Emma Anholt 2021-10-18 14:24:40 -07:00 committed by Marge Bot
parent 84377785a4
commit 533e486923
3 changed files with 20 additions and 157 deletions

View file

@ -393,35 +393,35 @@ fd6_emit_textures(struct fd_context *ctx, struct fd_ringbuffer *ring,
view = &dummy_view;
}
OUT_RING(state, view->texconst0);
OUT_RING(state, view->texconst1);
OUT_RING(state, view->texconst2);
OUT_RING(state, view->texconst3);
OUT_RING(state, view->descriptor[0]);
OUT_RING(state, view->descriptor[1]);
OUT_RING(state, view->descriptor[2]);
OUT_RING(state, view->descriptor[3]);
if (view->ptr1) {
OUT_RELOC(state, view->ptr1->bo, view->offset1,
(uint64_t)view->texconst5 << 32, 0);
OUT_RELOC(state, view->ptr1->bo, view->descriptor[4],
(uint64_t)view->descriptor[5] << 32, 0);
} else {
OUT_RING(state, 0x00000000);
OUT_RING(state, view->texconst5);
OUT_RING(state, view->descriptor[4]);
OUT_RING(state, view->descriptor[5]);
}
OUT_RING(state, view->texconst6);
OUT_RING(state, view->descriptor[6]);
if (view->ptr2) {
OUT_RELOC(state, view->ptr2->bo, view->offset2, 0, 0);
OUT_RELOC(state, view->ptr2->bo, view->descriptor[7], 0, 0);
} else {
OUT_RING(state, 0);
OUT_RING(state, 0);
OUT_RING(state, view->descriptor[7]);
OUT_RING(state, view->descriptor[8]);
}
OUT_RING(state, view->texconst9);
OUT_RING(state, view->texconst10);
OUT_RING(state, view->texconst11);
OUT_RING(state, 0);
OUT_RING(state, 0);
OUT_RING(state, 0);
OUT_RING(state, 0);
OUT_RING(state, view->descriptor[9]);
OUT_RING(state, view->descriptor[10]);
OUT_RING(state, view->descriptor[11]);
OUT_RING(state, view->descriptor[12]);
OUT_RING(state, view->descriptor[13]);
OUT_RING(state, view->descriptor[14]);
OUT_RING(state, view->descriptor[15]);
}
if (v) {

View file

@ -213,8 +213,6 @@ fd6_sampler_view_update(struct fd_context *ctx,
struct pipe_resource *prsc = cso->texture;
struct fd_resource *rsc = fd_resource(prsc);
enum pipe_format format = cso->format;
bool ubwc_enabled = false;
unsigned lvl, layers = 0;
fd6_validate_format(ctx, rsc, cso->format);
@ -236,14 +234,6 @@ fd6_sampler_view_update(struct fd_context *ctx,
fdl6_buffer_view_init(so->descriptor, cso->format, swiz, iova,
cso->u.buf.size);
unsigned elements = cso->u.buf.size / util_format_get_blocksize(format);
lvl = 0;
so->texconst1 = A6XX_TEX_CONST_1_WIDTH(elements & MASK(15)) |
A6XX_TEX_CONST_1_HEIGHT(elements >> 15);
so->texconst2 = A6XX_TEX_CONST_2_UNK4 | A6XX_TEX_CONST_2_UNK31;
so->offset1 = cso->u.buf.offset;
} else {
struct fdl_view_args args = {
/* Using relocs for addresses still */
@ -278,141 +268,17 @@ fd6_sampler_view_update(struct fd_context *ctx,
ctx->screen->info->a6xx.has_z24uint_s8uint);
memcpy(so->descriptor, view.descriptor, sizeof(so->descriptor));
unsigned miplevels;
lvl = fd_sampler_first_level(cso);
miplevels = fd_sampler_last_level(cso) - lvl;
layers = cso->u.tex.last_layer - cso->u.tex.first_layer + 1;
so->texconst0 |= A6XX_TEX_CONST_0_MIPLVLS(miplevels);
so->texconst1 = A6XX_TEX_CONST_1_WIDTH(u_minify(prsc->width0, lvl)) |
A6XX_TEX_CONST_1_HEIGHT(u_minify(prsc->height0, lvl));
so->texconst2 = A6XX_TEX_CONST_2_PITCHALIGN(rsc->layout.pitchalign - 6) |
A6XX_TEX_CONST_2_PITCH(fd_resource_pitch(rsc, lvl));
ubwc_enabled = fd_resource_ubwc_enabled(rsc, lvl);
if (rsc->b.b.format == PIPE_FORMAT_R8_G8B8_420_UNORM) {
/* In case of biplanar R8_G8B8, the UBWC metadata address in
* dwords 7 and 8, is instead the pointer to the second plane.
*/
so->ptr2 = plane1;
so->texconst6 =
A6XX_TEX_CONST_6_PLANE_PITCH(fd_resource_pitch(plane1, lvl));
if (ubwc_enabled) {
/* Further, if using UBWC with R8_G8B8, we only point to the
* UBWC header and the color data is expected to follow immediately.
*/
so->offset1 =
fd_resource_ubwc_offset(rsc, lvl, cso->u.tex.first_layer);
so->offset2 =
fd_resource_ubwc_offset(plane1, lvl, cso->u.tex.first_layer);
} else {
so->offset1 = fd_resource_offset(rsc, lvl, cso->u.tex.first_layer);
so->offset2 =
fd_resource_offset(plane1, lvl, cso->u.tex.first_layer);
}
} else {
so->offset1 = fd_resource_offset(rsc, lvl, cso->u.tex.first_layer);
if (ubwc_enabled) {
if (fd_resource_ubwc_enabled(rsc, fd_sampler_first_level(cso))) {
so->ptr2 = rsc;
so->offset2 =
fd_resource_ubwc_offset(rsc, lvl, cso->u.tex.first_layer);
}
}
}
so->texconst0 |=
fd6_tex_const_0(prsc, lvl, cso->format, cso->swizzle_r, cso->swizzle_g,
cso->swizzle_b, cso->swizzle_a);
so->texconst2 |= A6XX_TEX_CONST_2_TYPE(fd6_tex_type(cso->target));
switch (cso->target) {
case PIPE_TEXTURE_RECT:
case PIPE_TEXTURE_1D:
case PIPE_TEXTURE_2D:
so->texconst3 = A6XX_TEX_CONST_3_ARRAY_PITCH(rsc->layout.layer_size);
so->texconst5 = A6XX_TEX_CONST_5_DEPTH(1);
break;
case PIPE_TEXTURE_1D_ARRAY:
case PIPE_TEXTURE_2D_ARRAY:
so->texconst3 = A6XX_TEX_CONST_3_ARRAY_PITCH(rsc->layout.layer_size);
so->texconst5 = A6XX_TEX_CONST_5_DEPTH(layers);
break;
case PIPE_TEXTURE_CUBE:
case PIPE_TEXTURE_CUBE_ARRAY:
so->texconst3 = A6XX_TEX_CONST_3_ARRAY_PITCH(rsc->layout.layer_size);
so->texconst5 = A6XX_TEX_CONST_5_DEPTH(layers / 6);
break;
case PIPE_TEXTURE_3D:
so->texconst3 =
A6XX_TEX_CONST_3_MIN_LAYERSZ(
fd_resource_slice(rsc, prsc->last_level)->size0) |
A6XX_TEX_CONST_3_ARRAY_PITCH(fd_resource_slice(rsc, lvl)->size0);
so->texconst5 = A6XX_TEX_CONST_5_DEPTH(u_minify(prsc->depth0, lvl));
break;
default:
break;
}
if (rsc->layout.tile_all)
so->texconst3 |= A6XX_TEX_CONST_3_TILE_ALL;
if (ubwc_enabled) {
uint32_t block_width, block_height;
fdl6_get_ubwc_blockwidth(&rsc->layout, &block_width, &block_height);
so->texconst3 |= A6XX_TEX_CONST_3_FLAG;
so->texconst9 |= A6XX_TEX_CONST_9_FLAG_BUFFER_ARRAY_PITCH(
rsc->layout.ubwc_layer_size >> 2);
so->texconst10 |=
A6XX_TEX_CONST_10_FLAG_BUFFER_PITCH(
fdl_ubwc_pitch(&rsc->layout, lvl)) |
A6XX_TEX_CONST_10_FLAG_BUFFER_LOGW(util_logbase2_ceil(
DIV_ROUND_UP(u_minify(prsc->width0, lvl), block_width))) |
A6XX_TEX_CONST_10_FLAG_BUFFER_LOGH(util_logbase2_ceil(
DIV_ROUND_UP(u_minify(prsc->height0, lvl), block_height)));
}
const uint32_t swiz_mask =
(A6XX_TEX_CONST_0_SWIZ_X__MASK | A6XX_TEX_CONST_0_SWIZ_Y__MASK |
A6XX_TEX_CONST_0_SWIZ_Z__MASK | A6XX_TEX_CONST_0_SWIZ_W__MASK);
/* Sanity check that fdl6_view_init matched previous behavior. */
uint32_t so_descriptor[16] = {
/* fd6_view applies format swizzles more, and that's fine. */
so->texconst0 & ~swiz_mask,
so->texconst1,
so->texconst2,
so->texconst3,
so->offset1,
so->texconst5,
so->texconst6,
so->offset2,
0,
so->texconst9,
so->texconst10,
so->texconst11,
};
bool diff = false;
for (int i = 0; i < ARRAY_SIZE(so_descriptor); i++) {
int view_desc = so->descriptor[i];
if (i == 0)
view_desc &= ~swiz_mask;
if (so_descriptor[i] != view_desc) {
if (!diff) {
char view_desc[500] = {0};
debug_describe_sampler_view(view_desc, cso);
mesa_loge("view mismatch for %s:", view_desc);
diff = true;
}
mesa_loge("TEXCONST[%d] = 0x%08x vs 0x%08x", i, so_descriptor[i],
view_desc);
}
}
assert(!diff);
}
/* NOTE this can be called in either driver thread or frontend thread

View file

@ -51,9 +51,6 @@ fd6_sampler_stateobj(struct pipe_sampler_state *samp)
struct fd6_pipe_sampler_view {
struct pipe_sampler_view base;
uint32_t texconst0, texconst1, texconst2, texconst3, texconst5;
uint32_t texconst6, texconst7, texconst8, texconst9, texconst10, texconst11;
uint32_t offset1, offset2;
struct fd_resource *ptr1, *ptr2;
uint16_t seqno;