intel: Add ISL_AUX_USAGE_GEN12_CCS_E

Add a new aux usage which more accurately describes the behavior of
CCS_E on gen12. On this platform, writes using the 3D engine are either
compressed or substituted with fast-cleared blocks.

Reviewed-by: Kenneth Graunke <kenneth@whitecape.org>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/5363>
This commit is contained in:
Nanley Chery 2020-03-27 17:15:51 -07:00 committed by Marge Bot
parent d9f7fce83c
commit db5d98cde8
6 changed files with 55 additions and 10 deletions

View file

@ -569,6 +569,8 @@ iris_resource_configure_aux(struct iris_screen *screen,
*/ */
initial_state = ISL_AUX_STATE_CLEAR; initial_state = ISL_AUX_STATE_CLEAR;
break; break;
case ISL_AUX_USAGE_GEN12_CCS_E:
unreachable("Driver unprepared to handle this aux_usage.");
case ISL_AUX_USAGE_CCS_D: case ISL_AUX_USAGE_CCS_D:
case ISL_AUX_USAGE_CCS_E: case ISL_AUX_USAGE_CCS_E:
case ISL_AUX_USAGE_STC_CCS: case ISL_AUX_USAGE_STC_CCS:

View file

@ -2664,6 +2664,7 @@ blorp_copy(struct blorp_batch *batch,
params.src.aux_usage == ISL_AUX_USAGE_MCS || params.src.aux_usage == ISL_AUX_USAGE_MCS ||
params.src.aux_usage == ISL_AUX_USAGE_MCS_CCS || params.src.aux_usage == ISL_AUX_USAGE_MCS_CCS ||
params.src.aux_usage == ISL_AUX_USAGE_CCS_E || params.src.aux_usage == ISL_AUX_USAGE_CCS_E ||
params.src.aux_usage == ISL_AUX_USAGE_GEN12_CCS_E ||
params.src.aux_usage == ISL_AUX_USAGE_STC_CCS); params.src.aux_usage == ISL_AUX_USAGE_STC_CCS);
if (isl_aux_usage_has_hiz(params.src.aux_usage)) { if (isl_aux_usage_has_hiz(params.src.aux_usage)) {
@ -2679,9 +2680,11 @@ blorp_copy(struct blorp_batch *batch,
*/ */
params.src.view.format = params.dst.surf.format; params.src.view.format = params.dst.surf.format;
params.dst.view.format = params.dst.surf.format; params.dst.view.format = params.dst.surf.format;
} else if (params.dst.aux_usage == ISL_AUX_USAGE_CCS_E) { } else if (params.dst.aux_usage == ISL_AUX_USAGE_CCS_E ||
params.dst.aux_usage == ISL_AUX_USAGE_GEN12_CCS_E) {
params.dst.view.format = get_ccs_compatible_copy_format(dst_fmtl); params.dst.view.format = get_ccs_compatible_copy_format(dst_fmtl);
if (params.src.aux_usage == ISL_AUX_USAGE_CCS_E) { if (params.src.aux_usage == ISL_AUX_USAGE_CCS_E ||
params.src.aux_usage == ISL_AUX_USAGE_GEN12_CCS_E) {
params.src.view.format = get_ccs_compatible_copy_format(src_fmtl); params.src.view.format = get_ccs_compatible_copy_format(src_fmtl);
} else if (src_fmtl->bpb == dst_fmtl->bpb) { } else if (src_fmtl->bpb == dst_fmtl->bpb) {
params.src.view.format = params.dst.view.format; params.src.view.format = params.dst.view.format;
@ -2689,7 +2692,8 @@ blorp_copy(struct blorp_batch *batch,
params.src.view.format = params.src.view.format =
get_copy_format_for_bpb(isl_dev, src_fmtl->bpb); get_copy_format_for_bpb(isl_dev, src_fmtl->bpb);
} }
} else if (params.src.aux_usage == ISL_AUX_USAGE_CCS_E) { } else if (params.src.aux_usage == ISL_AUX_USAGE_CCS_E ||
params.src.aux_usage == ISL_AUX_USAGE_GEN12_CCS_E) {
params.src.view.format = get_ccs_compatible_copy_format(src_fmtl); params.src.view.format = get_ccs_compatible_copy_format(src_fmtl);
if (src_fmtl->bpb == dst_fmtl->bpb) { if (src_fmtl->bpb == dst_fmtl->bpb) {
params.dst.view.format = params.src.view.format; params.dst.view.format = params.src.view.format;

View file

@ -611,6 +611,13 @@ enum isl_aux_usage {
*/ */
ISL_AUX_USAGE_CCS_E, ISL_AUX_USAGE_CCS_E,
/** The auxiliary surface provides full lossless color compression on
* Gen12.
*
* @invariant isl_surf::samples == 1
*/
ISL_AUX_USAGE_GEN12_CCS_E,
/** The auxiliary surface provides full lossless media color compression /** The auxiliary surface provides full lossless media color compression
* *
* @invariant isl_surf::samples == 1 * @invariant isl_surf::samples == 1
@ -1803,6 +1810,7 @@ isl_aux_usage_has_ccs(enum isl_aux_usage usage)
{ {
return usage == ISL_AUX_USAGE_CCS_D || return usage == ISL_AUX_USAGE_CCS_D ||
usage == ISL_AUX_USAGE_CCS_E || usage == ISL_AUX_USAGE_CCS_E ||
usage == ISL_AUX_USAGE_GEN12_CCS_E ||
usage == ISL_AUX_USAGE_MC || usage == ISL_AUX_USAGE_MC ||
usage == ISL_AUX_USAGE_HIZ_CCS_WT || usage == ISL_AUX_USAGE_HIZ_CCS_WT ||
usage == ISL_AUX_USAGE_HIZ_CCS || usage == ISL_AUX_USAGE_HIZ_CCS ||
@ -1864,7 +1872,8 @@ isl_drm_modifier_get_default_aux_state(uint64_t modifier)
if (!mod_info || mod_info->aux_usage == ISL_AUX_USAGE_NONE) if (!mod_info || mod_info->aux_usage == ISL_AUX_USAGE_NONE)
return ISL_AUX_STATE_AUX_INVALID; return ISL_AUX_STATE_AUX_INVALID;
assert(mod_info->aux_usage == ISL_AUX_USAGE_CCS_E); assert(mod_info->aux_usage == ISL_AUX_USAGE_CCS_E ||
mod_info->aux_usage == ISL_AUX_USAGE_GEN12_CCS_E);
return mod_info->supports_clear_color ? ISL_AUX_STATE_COMPRESSED_CLEAR : return mod_info->supports_clear_color ? ISL_AUX_STATE_COMPRESSED_CLEAR :
ISL_AUX_STATE_COMPRESSED_NO_CLEAR; ISL_AUX_STATE_COMPRESSED_NO_CLEAR;
} }

View file

@ -49,6 +49,11 @@ enum write_behavior {
/* Writes using the 3D engine are compressed. */ /* Writes using the 3D engine are compressed. */
WRITES_COMPRESS, WRITES_COMPRESS,
/* Writes using the 3D engine are either compressed or substituted with
* fast-cleared blocks.
*/
WRITES_COMPRESS_CLEAR,
/* Writes implicitly fully resolve the compression block and write the data /* Writes implicitly fully resolve the compression block and write the data
* uncompressed into the main surface. The resolved aux blocks are * uncompressed into the main surface. The resolved aux blocks are
* ambiguated and left in the pass-through state. * ambiguated and left in the pass-through state.
@ -87,6 +92,7 @@ static const struct aux_usage_info info[] = {
AUX( COMPRESS, Y, Y, Y, x, MCS) AUX( COMPRESS, Y, Y, Y, x, MCS)
AUX( COMPRESS, Y, Y, Y, x, MCS_CCS) AUX( COMPRESS, Y, Y, Y, x, MCS_CCS)
AUX( COMPRESS, Y, Y, Y, Y, CCS_E) AUX( COMPRESS, Y, Y, Y, Y, CCS_E)
AUX( COMPRESS_CLEAR, Y, Y, Y, Y, GEN12_CCS_E)
AUX(RESOLVE_AMBIGUATE, x, Y, x, Y, CCS_D) AUX(RESOLVE_AMBIGUATE, x, Y, x, Y, CCS_D)
AUX(RESOLVE_AMBIGUATE, Y, x, x, Y, MC) AUX(RESOLVE_AMBIGUATE, Y, x, x, Y, MC)
AUX( COMPRESS, Y, x, x, Y, STC_CCS) AUX( COMPRESS, Y, x, x, Y, STC_CCS)
@ -213,24 +219,29 @@ isl_aux_state_transition_write(enum isl_aux_state initial_state,
assert(isl_aux_state_has_valid_aux(initial_state)); assert(isl_aux_state_has_valid_aux(initial_state));
assert(aux_state_possible(initial_state, usage)); assert(aux_state_possible(initial_state, usage));
assert(info[usage].write_behavior == WRITES_COMPRESS || assert(info[usage].write_behavior == WRITES_COMPRESS ||
info[usage].write_behavior == WRITES_COMPRESS_CLEAR ||
info[usage].write_behavior == WRITES_RESOLVE_AMBIGUATE); info[usage].write_behavior == WRITES_RESOLVE_AMBIGUATE);
if (full_surface) { if (full_surface) {
return info[usage].write_behavior == WRITES_COMPRESS ? return info[usage].write_behavior == WRITES_COMPRESS ?
ISL_AUX_STATE_COMPRESSED_NO_CLEAR : ISL_AUX_STATE_PASS_THROUGH; ISL_AUX_STATE_COMPRESSED_NO_CLEAR :
info[usage].write_behavior == WRITES_COMPRESS_CLEAR ?
ISL_AUX_STATE_COMPRESSED_CLEAR : ISL_AUX_STATE_PASS_THROUGH;
} }
switch (initial_state) { switch (initial_state) {
case ISL_AUX_STATE_CLEAR: case ISL_AUX_STATE_CLEAR:
case ISL_AUX_STATE_PARTIAL_CLEAR: case ISL_AUX_STATE_PARTIAL_CLEAR:
return info[usage].write_behavior == WRITES_COMPRESS ? return info[usage].write_behavior == WRITES_RESOLVE_AMBIGUATE ?
ISL_AUX_STATE_COMPRESSED_CLEAR : ISL_AUX_STATE_PARTIAL_CLEAR; ISL_AUX_STATE_PARTIAL_CLEAR : ISL_AUX_STATE_COMPRESSED_CLEAR;
case ISL_AUX_STATE_RESOLVED: case ISL_AUX_STATE_RESOLVED:
case ISL_AUX_STATE_PASS_THROUGH: case ISL_AUX_STATE_PASS_THROUGH:
return info[usage].write_behavior == WRITES_COMPRESS ?
ISL_AUX_STATE_COMPRESSED_NO_CLEAR : initial_state;
case ISL_AUX_STATE_COMPRESSED_CLEAR:
case ISL_AUX_STATE_COMPRESSED_NO_CLEAR: case ISL_AUX_STATE_COMPRESSED_NO_CLEAR:
return info[usage].write_behavior == WRITES_COMPRESS ?
ISL_AUX_STATE_COMPRESSED_NO_CLEAR :
info[usage].write_behavior == WRITES_COMPRESS_CLEAR ?
ISL_AUX_STATE_COMPRESSED_CLEAR : initial_state;
case ISL_AUX_STATE_COMPRESSED_CLEAR:
case ISL_AUX_STATE_AUX_INVALID: case ISL_AUX_STATE_AUX_INVALID:
return initial_state; return initial_state;
#ifdef IN_UNIT_TEST #ifdef IN_UNIT_TEST

View file

@ -90,6 +90,7 @@ static const uint32_t isl_to_gen_multisample_layout[] = {
static const uint32_t isl_to_gen_aux_mode[] = { static const uint32_t isl_to_gen_aux_mode[] = {
[ISL_AUX_USAGE_NONE] = AUX_NONE, [ISL_AUX_USAGE_NONE] = AUX_NONE,
[ISL_AUX_USAGE_MCS] = AUX_CCS_E, [ISL_AUX_USAGE_MCS] = AUX_CCS_E,
[ISL_AUX_USAGE_GEN12_CCS_E] = AUX_CCS_E,
[ISL_AUX_USAGE_CCS_E] = AUX_CCS_E, [ISL_AUX_USAGE_CCS_E] = AUX_CCS_E,
[ISL_AUX_USAGE_HIZ_CCS_WT] = AUX_CCS_E, [ISL_AUX_USAGE_HIZ_CCS_WT] = AUX_CCS_E,
[ISL_AUX_USAGE_MCS_CCS] = AUX_MCS_LCE, [ISL_AUX_USAGE_MCS_CCS] = AUX_MCS_LCE,
@ -589,6 +590,7 @@ isl_genX(surf_fill_state_s)(const struct isl_device *dev, void *state,
if (GEN_GEN >= 12) { if (GEN_GEN >= 12) {
assert(info->aux_usage == ISL_AUX_USAGE_MCS || assert(info->aux_usage == ISL_AUX_USAGE_MCS ||
info->aux_usage == ISL_AUX_USAGE_CCS_E || info->aux_usage == ISL_AUX_USAGE_CCS_E ||
info->aux_usage == ISL_AUX_USAGE_GEN12_CCS_E ||
info->aux_usage == ISL_AUX_USAGE_HIZ_CCS_WT || info->aux_usage == ISL_AUX_USAGE_HIZ_CCS_WT ||
info->aux_usage == ISL_AUX_USAGE_MCS_CCS || info->aux_usage == ISL_AUX_USAGE_MCS_CCS ||
info->aux_usage == ISL_AUX_USAGE_STC_CCS); info->aux_usage == ISL_AUX_USAGE_STC_CCS);

View file

@ -376,6 +376,23 @@ TEST(StateTransitionWrite, WritesCompress) {
E(AUX_INVALID, STC_CCS, true, ASSERT); E(AUX_INVALID, STC_CCS, true, ASSERT);
} }
TEST(StateTransitionWrite, WritesCompressClear) {
E(CLEAR, GEN12_CCS_E, false, COMPRESSED_CLEAR);
E(CLEAR, GEN12_CCS_E, true, COMPRESSED_CLEAR);
E(PARTIAL_CLEAR, GEN12_CCS_E, false, COMPRESSED_CLEAR);
E(PARTIAL_CLEAR, GEN12_CCS_E, true, COMPRESSED_CLEAR);
E(COMPRESSED_CLEAR, GEN12_CCS_E, false, COMPRESSED_CLEAR);
E(COMPRESSED_CLEAR, GEN12_CCS_E, true, COMPRESSED_CLEAR);
E(COMPRESSED_NO_CLEAR, GEN12_CCS_E, false, COMPRESSED_CLEAR);
E(COMPRESSED_NO_CLEAR, GEN12_CCS_E, true, COMPRESSED_CLEAR);
E(RESOLVED, GEN12_CCS_E, false, COMPRESSED_CLEAR);
E(RESOLVED, GEN12_CCS_E, true, COMPRESSED_CLEAR);
E(PASS_THROUGH, GEN12_CCS_E, false, COMPRESSED_CLEAR);
E(PASS_THROUGH, GEN12_CCS_E, true, COMPRESSED_CLEAR);
E(AUX_INVALID, GEN12_CCS_E, false, ASSERT);
E(AUX_INVALID, GEN12_CCS_E, true, ASSERT);
}
TEST(StateTransitionWrite, WritesResolveAmbiguate) { TEST(StateTransitionWrite, WritesResolveAmbiguate) {
E(CLEAR, CCS_D, false, PARTIAL_CLEAR); E(CLEAR, CCS_D, false, PARTIAL_CLEAR);
E(CLEAR, CCS_D, true, PASS_THROUGH); E(CLEAR, CCS_D, true, PASS_THROUGH);