diff --git a/src/intel/vulkan/anv_instance.c b/src/intel/vulkan/anv_instance.c
index 68397ebc83d..8ccfe176efc 100644
--- a/src/intel/vulkan/anv_instance.c
+++ b/src/intel/vulkan/anv_instance.c
@@ -17,6 +17,8 @@ static const driOptionDescription anv_dri_options[] = {
DRI_CONF_ANV_ASSUME_FULL_SUBGROUPS(0)
DRI_CONF_ANV_ASSUME_FULL_SUBGROUPS_WITH_BARRIER(false)
DRI_CONF_ANV_ASSUME_FULL_SUBGROUPS_WITH_SHARED_MEMORY(false)
+ DRI_CONF_ANV_BARRIER_POST_TYPED_CLEAR_SHADER(false)
+ DRI_CONF_ANV_BARRIER_POST_UNTYPED_CLEAR_SHADER(false)
DRI_CONF_ANV_DISABLE_FCV(false)
DRI_CONF_ANV_ENABLE_BUFFER_COMP(false)
DRI_CONF_ANV_DISABLE_DRM_AUX_MODIFIERS(false)
@@ -240,6 +242,10 @@ anv_init_dri_options(struct anv_instance *instance)
driQueryOptionb(&instance->dri_options, "anv_disable_drm_ccs_modifiers");
instance->binding_table_block_size = util_next_power_of_two(
driQueryOptioni(&instance->dri_options, "intel_binding_table_block_size"));
+ instance->barrier_post_typed_clear_shader =
+ driQueryOptionb(&instance->dri_options, "anv_barrier_post_typed_clear_shader");
+ instance->barrier_post_untyped_clear_shader =
+ driQueryOptionb(&instance->dri_options, "anv_barrier_post_untyped_clear_shader");
if (instance->vk.app_info.engine_name &&
!strcmp(instance->vk.app_info.engine_name, "DXVK")) {
diff --git a/src/intel/vulkan/anv_private.h b/src/intel/vulkan/anv_private.h
index d8052dc959e..f79e9e8a8af 100644
--- a/src/intel/vulkan/anv_private.h
+++ b/src/intel/vulkan/anv_private.h
@@ -1828,6 +1828,8 @@ struct anv_instance {
bool force_sampler_prefetch;
bool force_compute_surface_prefetch;
unsigned binding_table_block_size;
+ bool barrier_post_typed_clear_shader;
+ bool barrier_post_untyped_clear_shader;
/* HW workarounds */
bool no_16bit;
diff --git a/src/intel/vulkan/genX_cmd_compute.c b/src/intel/vulkan/genX_cmd_compute.c
index bf25b9cb02e..5d726cb3328 100644
--- a/src/intel/vulkan/genX_cmd_compute.c
+++ b/src/intel/vulkan/genX_cmd_compute.c
@@ -477,6 +477,36 @@ fill_inline_params(struct GENX(COMPUTE_WALKER_BODY) *body,
}
}
+static inline void
+cmd_buffer_post_dispatch_wa(struct anv_cmd_buffer *cmd_buffer)
+{
+ genX(cmd_buffer_post_dispatch_wa)(cmd_buffer);
+
+ struct anv_cmd_compute_state *comp_state = &cmd_buffer->state.compute;
+
+ /* Workaround WaW hazards in applications that clear a buffer and start
+ * writing to it immediately without a barrier between the clear & write
+ * operations.
+ */
+ if (cmd_buffer->device->physical->instance->barrier_post_typed_clear_shader &&
+ (comp_state->shader->bind_map.inferred_behavior & ANV_PIPELINE_BEHAVIOR_CLEAR_TYPED)) {
+ anv_add_pending_pipe_bits(cmd_buffer,
+ VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
+ VK_PIPELINE_STAGE_2_TOP_OF_PIPE_BIT,
+ ANV_PIPE_HDC_PIPELINE_FLUSH_BIT,
+ "clear shader typed L1 flush app wa");
+ }
+ if (cmd_buffer->device->physical->instance->barrier_post_untyped_clear_shader &&
+ (comp_state->shader->bind_map.inferred_behavior & ANV_PIPELINE_BEHAVIOR_CLEAR_UNTYPED)) {
+ anv_add_pending_pipe_bits(cmd_buffer,
+ VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
+ VK_PIPELINE_STAGE_2_TOP_OF_PIPE_BIT,
+ ANV_PIPE_UNTYPED_DATAPORT_CACHE_FLUSH_BIT |
+ ANV_PIPE_HDC_PIPELINE_FLUSH_BIT,
+ "clear shader untyped L1 flush app wa");
+ }
+}
+
static inline void
emit_indirect_compute_walker(struct anv_cmd_buffer *cmd_buffer,
const struct brw_cs_prog_data *prog_data,
@@ -531,11 +561,9 @@ emit_indirect_compute_walker(struct anv_cmd_buffer *cmd_buffer,
indirect_addr.bo, 0),
);
- genX(cmd_buffer_post_dispatch_wa)(cmd_buffer);
+ cmd_buffer_post_dispatch_wa(cmd_buffer);
}
-
-
static inline void
emit_compute_walker(struct anv_cmd_buffer *cmd_buffer,
struct anv_address indirect_addr,
@@ -595,7 +623,7 @@ emit_compute_walker(struct anv_cmd_buffer *cmd_buffer,
#endif
);
- genX(cmd_buffer_post_dispatch_wa)(cmd_buffer);
+ cmd_buffer_post_dispatch_wa(cmd_buffer);
}
#else /* #if GFX_VERx10 >= 125 */
diff --git a/src/util/00-mesa-defaults.conf b/src/util/00-mesa-defaults.conf
index 9c1b6624f7a..9e05e8cf2d3 100644
--- a/src/util/00-mesa-defaults.conf
+++ b/src/util/00-mesa-defaults.conf
@@ -1124,6 +1124,12 @@ TODO: document the other workarounds.
+
+
+
+