nak: simplify SM80 HMMA latency categorization

Reviewed-by: Faith Ekstrand <faith.ekstrand@collabora.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/37941>
This commit is contained in:
Karol Herbst 2025-10-21 10:59:01 +02:00 committed by Marge Bot
parent 3bbf3f7826
commit 85480200f8

View file

@ -145,18 +145,14 @@ impl RegLatencySM80 {
Op::HSet2(_) | Op::HSetP2(_) | Op::HMnMx2(_) => FP16_Alu,
// left in for documentation purposes
Op::Hmma(h) => match (h.mat_size, h.dst_type, h.src_type) {
(HmmaSize::M16N8K16, FloatType::F32, FloatType::F16) => {
MMA_2x_collect
}
// (HmmaSize::M16N8K16, FloatType::F32, FloatType::BF16) => MMA_2x_collect,
// (HmmaSize::M16N8K8, FloatType::F32, FloatType::TF32) => MMA_2x_collect,
(HmmaSize::M16N8K8, FloatType::F32, FloatType::F16) => {
MMA_1x_collect
}
// (HmmaSize::M16N8K8, FloatType::F32, FloatType::BF16) => MMA_1x_collect,
// (HmmaSize::M16N8K4, FloatType::F32, FloatType::TF32) => MMA_1x_collect,
(HmmaSize::M16N8K16, FloatType::F16, _) => MMA_2x_collect,
(HmmaSize::M16N8K8, FloatType::F16, _) => MMA_1x_collect,
(HmmaSize::M16N8K16, _, _) => MMA_2x_collect,
_ => panic!("Illegal HMMA in reg category {}", h),
},
Op::Ipa(_) => DecoupledAgu,