intel/brw: Simplify tracking of dispatch_width_limit in brw_compile_fs

Keep it in a variable, that way don't need to check which shader to look for the limit. Reviewed-by: Kenneth Graunke <kenneth@whitecape.org> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/33541>
2025-12-29 18:50:10 +01:00 · 2025-02-13 22:46:19 -08:00 · 2025-02-13 22:46:19 -08:00 · 834e30d244
commit 834e30d244
parent 9d53e27579
1 changed files with 26 additions and 19 deletions
--- a/src/intel/compiler/brw_compile_fs.cpp
+++ b/src/intel/compiler/brw_compile_fs.cpp
@ -1581,6 +1581,11 @@ brw_compile_fs(const struct brw_compiler *compiler,
   assert(reqd_dispatch_width == SUBGROUP_SIZE_VARYING ||
          reqd_dispatch_width == SUBGROUP_SIZE_REQUIRE_16);

+   /* Limit identified when first variant is compiled, see
+    * brw_shader::limit_dispatch_width().
+    */
+   unsigned dispatch_width_limit = UINT_MAX;
+
   std::unique_ptr<brw_shader> v8, v16, v32, vmulti;
   cfg_t *simd8_cfg = NULL, *simd16_cfg = NULL, *simd32_cfg = NULL,
      *multi_cfg = NULL;
@ -1609,7 +1614,20 @@ brw_compile_fs(const struct brw_compiler *compiler,
         params->base.error_str = ralloc_strdup(params->base.mem_ctx,
                                                v8->fail_msg);
         return NULL;
-      } else if (INTEL_SIMD(FS, 8)) {
+      }
+
+      if (key->coarse_pixel) {
+         if (prog_data->dual_src_blend) {
+            v8->limit_dispatch_width(8, "SIMD16 coarse pixel shading cannot"
+                                     " use SIMD8 messages.\n");
+         }
+         v8->limit_dispatch_width(16, "SIMD32 not supported with coarse"
+                                  " pixel shading.\n");
+      }
+
+      dispatch_width_limit = MIN2(dispatch_width_limit, v8->max_dispatch_width);
+
+      if (INTEL_SIMD(FS, 8)) {
         simd8_cfg = v8->cfg;

         assert(v8->payload().num_regs % reg_unit(devinfo) == 0);
@ -1622,15 +1640,6 @@ brw_compile_fs(const struct brw_compiler *compiler,
         has_spilled = v8->spilled_any_registers;
         allow_spilling = false;
      }
-
-      if (key->coarse_pixel) {
-         if (prog_data->dual_src_blend) {
-            v8->limit_dispatch_width(8, "SIMD16 coarse pixel shading cannot"
-                                     " use SIMD8 messages.\n");
-         }
-         v8->limit_dispatch_width(16, "SIMD32 not supported with coarse"
-                                  " pixel shading.\n");
-      }
   }

   if (devinfo->ver >= 30) {
@ -1752,8 +1761,7 @@ brw_compile_fs(const struct brw_compiler *compiler,
      }

   } else {
-      if ((!has_spilled && (!v8 || v8->max_dispatch_width >= 16) &&
-           INTEL_SIMD(FS, 16)) ||
+      if ((!has_spilled && dispatch_width_limit >= 16 && INTEL_SIMD(FS, 16)) ||
          reqd_dispatch_width == SUBGROUP_SIZE_REQUIRE_16) {
         /* Try a SIMD16 compile */
         brw_shader_params shader_params = base_shader_params;
@ -1767,6 +1775,7 @@ brw_compile_fs(const struct brw_compiler *compiler,
                                "SIMD16 shader failed to compile: %s\n",
                                v16->fail_msg);
         } else {
+            dispatch_width_limit = MIN2(dispatch_width_limit, v16->max_dispatch_width);
            simd16_cfg = v16->cfg;

            assert(v16->payload().num_regs % reg_unit(devinfo) == 0);
@ -1785,8 +1794,7 @@ brw_compile_fs(const struct brw_compiler *compiler,

      /* Currently, the compiler only supports SIMD32 on SNB+ */
      if (!has_spilled &&
-          (!v8 || v8->max_dispatch_width >= 32) &&
-          (!v16 || v16->max_dispatch_width >= 32) &&
+          dispatch_width_limit >= 32 &&
          reqd_dispatch_width == SUBGROUP_SIZE_VARYING &&
          !simd16_failed && INTEL_SIMD(FS, 32)) {
         /* Try a SIMD32 compile */
@ -1822,11 +1830,10 @@ brw_compile_fs(const struct brw_compiler *compiler,
      if (devinfo->ver >= 12 && !has_spilled &&
          max_polygons >= 2 && !key->coarse_pixel &&
          reqd_dispatch_width == SUBGROUP_SIZE_VARYING) {
-         brw_shader *vbase = v8 ? v8.get() : v16 ? v16.get() : v32.get();
-         assert(vbase);
+         assert(v8 || v16 || v32);

         if (devinfo->ver >= 20 && max_polygons >= 4 &&
-             vbase->max_dispatch_width >= 32 &&
+             dispatch_width_limit >= 32 &&
             4 * prog_data->num_varying_inputs <= MAX_VARYING &&
             INTEL_SIMD(FS, 4X8)) {
            /* Try a quad-SIMD8 compile */
@ -1846,7 +1853,7 @@ brw_compile_fs(const struct brw_compiler *compiler,
         }

         if (!multi_cfg && devinfo->ver >= 20 &&
-             vbase->max_dispatch_width >= 32 &&
+             dispatch_width_limit >= 32 &&
             2 * prog_data->num_varying_inputs <= MAX_VARYING &&
             INTEL_SIMD(FS, 2X16)) {
            /* Try a dual-SIMD16 compile */
@ -1865,7 +1872,7 @@ brw_compile_fs(const struct brw_compiler *compiler,
            }
         }

-         if (!multi_cfg && vbase->max_dispatch_width >= 16 &&
+         if (!multi_cfg && dispatch_width_limit >= 16 &&
             2 * prog_data->num_varying_inputs <= MAX_VARYING &&
             INTEL_SIMD(FS, 2X8)) {
            /* Try a dual-SIMD8 compile */