intel/brw: account for sources when determining if an operation uses half floats

Signed-off-by: Rohan Garg <rohan.garg@intel.com> Reviewed-by: Ian Romanick <ian.d.romanick@intel.com> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/27235>
2026-05-05 13:58:04 +02:00 · 2024-03-04 02:23:23 -08:00 · 2024-03-04 02:23:23 -08:00 · c4b38c717d
commit c4b38c717d
parent 07f0825c03
1 changed files with 26 additions and 4 deletions
--- a/src/intel/compiler/brw_fs_lower_simd_width.cpp
+++ b/src/intel/compiler/brw_fs_lower_simd_width.cpp
@@ -200,6 +200,20 @@ get_sampler_lowered_simd_width(const struct intel_device_info *devinfo,
   return MIN2(inst->exec_size, simd_limit);
 }

+static bool /* true if the destination or any source of inst has type HF */
+is_half_float_src_dst(const fs_inst *inst)
+{
+   if (inst->dst.type == BRW_REGISTER_TYPE_HF) /* half-float destination */
+      return true;
+
+   for (int i = 0; i < inst->sources; i++) { /* scan every source operand */
+      if (inst->src[i].type == BRW_REGISTER_TYPE_HF) /* one HF source suffices */
+         return true;
+   }
+
+   return false; /* neither the destination nor any source is HF */
+}
+
 /**
 * Get the closest native SIMD width supported by the hardware for instruction
 * \p inst.  The instruction will be left untouched by
@@ -265,8 +279,16 @@ brw_fs_get_lowered_simd_width(const fs_visitor *shader, const fs_inst *inst)
   case SHADER_OPCODE_LOG2:
   case SHADER_OPCODE_SIN:
   case SHADER_OPCODE_COS: {
-      if (inst->dst.type == BRW_REGISTER_TYPE_HF)
-         return MIN2(8, inst->exec_size);
+      /* Xe2+: BSpec 56797
+       *
+       * Math operation rules when half-floats are used on both source and
+       * destination operands and both source and destinations are packed.
+       *
+       * The execution size must be 16.
+       */
+      if (is_half_float_src_dst(inst))
+         return MIN2(8,  inst->exec_size);
+
      return MIN2(16, inst->exec_size);
   }

@@ -274,8 +296,8 @@ brw_fs_get_lowered_simd_width(const fs_visitor *shader, const fs_inst *inst)
      /* SIMD16 is only allowed on Gfx7+. Extended Math Function is limited
       * to SIMD8 with half-float
       */
-      if (inst->dst.type == BRW_REGISTER_TYPE_HF)
-         return MIN2(8, inst->exec_size);
+      if (is_half_float_src_dst(inst))
+        return MIN2(8,  inst->exec_size);
      return MIN2(16, inst->exec_size);
   }