compiler/rust: Fix the DFS loop detection algorithm

The previous algorithm just looked at the dominator's loop header. However, if you have multiple consecutive loops like: function_impl { loop { // Stuff } loop { // Other stuff } } then it will look like the second loop is contained in the first loop because the first loop's header dominates the second loop. This isn't actually what we want. Instead, we want a node N to be considered part of a loop with header H if H dominates N and H is reachable from N. Fixes: 741f7067f1 ("nak: Add loop detection to the CFG") Reviewed-by: Mel Henning <mhenning@darkrefraction.com> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/36524> (cherry picked from commit a1d5e8bfdb)
2025-12-20 11:40:10 +01:00 · 2025-08-01 10:27:50 -04:00 · 2025-08-01 10:27:50 -04:00 · d583833971
commit d583833971
parent 953a791b53
2 changed files with 350 additions and 22 deletions
--- a/.pick_status.json
+++ b/.pick_status.json
@ -74,7 +74,7 @@
        "description": "compiler/rust: Fix the DFS loop detection algorithm",
        "nominated": true,
        "nomination_type": 2,
-        "resolution": 0,
+        "resolution": 1,
        "main_sha": null,
        "because_sha": "741f7067f1fb5953e84bac0fcb5c6c7df588df48",
        "notes": null
--- a/src/compiler/rust/cfg.rs
+++ b/src/compiler/rust/cfg.rs
@ -181,46 +181,100 @@ fn loop_detect_dfs<N>(
    id: usize,
    pre: &mut BitSet,
    post: &mut BitSet,
-    loops: &mut BitSet,
+    back_edges: &mut Vec<(usize, usize)>,
 ) {
    if pre.get(id) {
-        if !post.get(id) {
-            loops.insert(id);
-        }
        return;
    }

    pre.insert(id);

-    for s in nodes[id].succ.iter() {
-        loop_detect_dfs(nodes, *s, pre, post, loops);
+    for &s in nodes[id].succ.iter() {
+        if pre.get(s) && !post.get(s) {
+            back_edges.push((id, s));
+        }
+        loop_detect_dfs(nodes, s, pre, post, back_edges);
    }

    post.insert(id);
 }

+/// Computes the set of nodes that reach the given node without going through
+/// stop
+fn reaches_dfs<N>(
+    nodes: &Vec<CFGNode<N>>,
+    id: usize,
+    stop: usize,
+    reaches: &mut BitSet,
+) {
+    if id == stop || reaches.get(id) {
+        return;
+    }
+
+    reaches.insert(id);
+
+    // Since we're trying to find the set of things that reach the start node,
+    // not the set of things reachable from the start node, walk predecessors.
+    for &s in nodes[id].pred.iter() {
+        reaches_dfs(nodes, s, stop, reaches);
+    }
+}
+
 fn detect_loops<N>(nodes: &mut Vec<CFGNode<N>>) -> bool {
    let mut dfs_pre = BitSet::new();
    let mut dfs_post = BitSet::new();
-    let mut loops = BitSet::new();
-    loop_detect_dfs(nodes, 0, &mut dfs_pre, &mut dfs_post, &mut loops);
+    let mut back_edges = Vec::new();
+    loop_detect_dfs(nodes, 0, &mut dfs_pre, &mut dfs_post, &mut back_edges);
+
+    if back_edges.is_empty() {
+        return false;
+    }
+
+    // Construct a map from nodes N to loop headers H where there is some
+    // back-edge (C, H) such that C is reachable from N without going through H.
+    // By running the DFS backwards, we can do this in O(B * E) time where B is
+    // the number of back-edges and E is the total number of edges.
+    let mut loops = BitSet::new();
+    let mut node_loops: Vec<BitSet> = Default::default();
+    node_loops.resize_with(nodes.len(), Default::default);
+    for (c, h) in back_edges {
+        // Stash the loop headers while we're here
+        loops.insert(h);
+
+        // re-use dfs_pre for our reaches set
+        dfs_pre.clear();
+        let reaches = &mut dfs_pre;
+        reaches_dfs(nodes, c, h, reaches);
+
+        for n in reaches.iter() {
+            node_loops[n].insert(h);
+        }
+    }
+
+    for i in 0..nodes.len() {
+        debug_assert!(nodes[i].lph == usize::MAX);

-    let mut has_loop = false;
-    nodes[0].lph = usize::MAX;
-    for i in 1..nodes.len() {
        if loops.get(i) {
            // This is a loop header
            nodes[i].lph = i;
-            has_loop = true;
-        } else {
-            // Otherwise, we have the same loop header as our dominator
-            let dom = nodes[i].dom;
-            let dom_lph = nodes[dom].lph;
-            nodes[i].lph = dom_lph;
+            continue;
+        }
+
+        let mut n = i;
+        while n != 0 {
+            let dom = nodes[n].dom;
+            debug_assert!(dom < n);
+
+            if node_loops[i].get(dom) {
+                nodes[i].lph = dom;
+                break;
+            };
+
+            n = dom;
        }
    }

-    has_loop
+    true
 }

 pub struct CFG<N> {
@ -306,10 +360,27 @@ impl<N> CFG<N> {
        self.has_loop
    }

+    /// Returns true if the given node is a loop header.
+    ///
+    /// A node H is a loop header if there is a back-edge terminating at H.
    pub fn is_loop_header(&self, idx: usize) -> bool {
        self.nodes[idx].lph == idx
    }

+    /// Returns the index of the loop header of the innermost loop containing
+    /// this node, if any. If this node is not contained in any loops, `None`
+    /// is returned.
+    ///
+    /// A node N is considered to be contained to be contained in the loop with
+    /// header H if both of the following are true:
+    ///
+    ///  1. H dominates N
+    ///
+    ///  2. There is a back-edge (C, H) in the CFG such that C is reachable
+    ///     from N without going through H.
+    ///
+    /// This matches the definitions given in
+    /// https://www.cs.cornell.edu/courses/cs4120/2023sp/notes.html?id=cflow
    pub fn loop_header_index(&self, idx: usize) -> Option<usize> {
        let lph = self.nodes[idx].lph;
        if lph == usize::MAX {
@ -407,3 +478,260 @@ impl<K, N> Default for CFGBuilder<K, N> {
        CFGBuilder::new()
    }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    fn test_loop_nesting(edges: &[(usize, usize)], expected: &[Option<usize>]) {
+        let mut builder = CFGBuilder::new();
+        for i in 0..expected.len() {
+            builder.add_node(i, i);
+        }
+        for &(a, b) in edges {
+            builder.add_edge(a, b);
+        }
+        let cfg = builder.as_cfg();
+
+        let mut lphs = Vec::new();
+        lphs.resize(expected.len(), None);
+        for (i, idx) in cfg.iter().enumerate() {
+            let lph = cfg.loop_header_index(i);
+            lphs[*idx.deref()] = lph.map(|h| cfg[h]);
+        }
+
+        assert_eq!(&lphs, expected);
+    }
+
+    #[test]
+    fn test_loop_simple() {
+        // block 0
+        // loop {
+        //     block 1
+        //     if ... {
+        //         block 2
+        //         break;
+        //     }
+        //     block 3
+        // }
+        // block 4
+        test_loop_nesting(
+            &[(0, 1), (1, 2), (1, 3), (2, 4), (3, 1)],
+            &[None, Some(1), None, Some(1), None, None],
+        );
+    }
+
+    #[test]
+    fn test_loop_simple_nested() {
+        // loop {
+        //     block 0
+        //     loop {
+        //         block 1
+        //         if ... {
+        //             block 2
+        //             break;
+        //         }
+        //         block 3
+        //     }
+        //     block 4
+        //     if ... {
+        //         block 5
+        //         break;
+        //     }
+        //     block 6
+        // }
+        // block 7
+        test_loop_nesting(
+            &[
+                (0, 1),
+                (1, 2),
+                (1, 3),
+                (2, 4),
+                (3, 1),
+                (4, 5),
+                (4, 6),
+                (5, 7),
+                (6, 0),
+            ],
+            &[
+                Some(0),
+                Some(1),
+                Some(0),
+                Some(1),
+                Some(0),
+                None,
+                Some(0),
+                None,
+            ],
+        );
+    }
+
+    #[test]
+    fn test_loop_two_continues() {
+        // loop {
+        //     block 0
+        //     if ... {
+        //         block 1
+        //         continue;
+        //     }
+        //     block 2
+        //     if ... {
+        //         block 3
+        //         break;
+        //     }
+        //     block 4
+        // }
+        // block 5
+        test_loop_nesting(
+            &[(0, 1), (0, 2), (1, 0), (2, 3), (2, 4), (3, 5), (4, 0)],
+            &[Some(0), Some(0), Some(0), None, Some(0), None],
+        );
+    }
+
+    #[test]
+    fn test_loop_two_breaks() {
+        // loop {
+        //     block 0
+        //     if ... {
+        //         block 1
+        //         break;
+        //     }
+        //     block 2
+        //     if ... {
+        //         block 3
+        //         break;
+        //     }
+        //     block 4
+        // }
+        // block 5
+        test_loop_nesting(
+            &[(0, 1), (0, 2), (1, 5), (2, 3), (2, 4), (3, 5), (4, 0)],
+            &[Some(0), None, Some(0), None, Some(0), None],
+        );
+    }
+
+    #[test]
+    fn test_loop_predicated_continue() {
+        // loop {
+        //     block 0
+        //     continue_if(...);
+        //     block 1
+        //     if ... {
+        //         block 2
+        //         break;
+        //     }
+        //     block 3
+        // }
+        // block 4
+        test_loop_nesting(
+            &[(0, 0), (0, 1), (1, 2), (1, 3), (2, 4), (3, 0)],
+            &[Some(0), Some(0), None, Some(0), None],
+        );
+    }
+
+    #[test]
+    fn test_loop_predicated_break() {
+        // block 0
+        // loop {
+        //     block 1
+        //     break_if(...);
+        //     block 2
+        //     if ... {
+        //         block 3
+        //         break;
+        //     }
+        //     block 4
+        // }
+        // block 5
+        test_loop_nesting(
+            &[(0, 1), (1, 2), (1, 5), (2, 3), (2, 4), (3, 5), (4, 1)],
+            &[None, Some(1), Some(1), None, Some(1), None],
+        );
+    }
+
+    #[test]
+    fn test_loop_complex() {
+        // loop {
+        //     block 0
+        //     loop {
+        //         block 1
+        //         if ... {
+        //             block 2
+        //             break;
+        //         }
+        //         block 3
+        //     }
+        //     loop {
+        //         block 4
+        //         break_if(..);
+        //     }
+        //     block 5
+        //     if ... {
+        //         block 6
+        //         break;
+        //     }
+        //     block 7
+        // }
+        // block 8
+        test_loop_nesting(
+            &[
+                (0, 1),
+                (1, 2),
+                (1, 3),
+                (2, 4),
+                (3, 1),
+                (4, 5),
+                (4, 4),
+                (5, 6),
+                (5, 7),
+                (6, 8),
+                (7, 0),
+            ],
+            &[
+                Some(0),
+                Some(1),
+                Some(0),
+                Some(1),
+                Some(4),
+                Some(0),
+                None,
+                Some(0),
+                None,
+            ],
+        );
+    }
+
+    #[test]
+    fn test_simple_irreducible() {
+        // block 0
+        // if ... {
+        //     block 1
+        // }
+        // block 2
+        // if ... {
+        //     block 3
+        // }
+        // block 4
+        test_loop_nesting(
+            &[(0, 1), (0, 2), (1, 2), (2, 3), (2, 4), (3, 4)],
+            &[None, None, None, None, None, None],
+        );
+    }
+
+    #[test]
+    fn test_loop_irreducible() {
+        // block 0
+        // goto_if(...) label;
+        // loop {
+        //     block 1
+        //     break_if(...);
+        // label:
+        //     block 2
+        // }
+        // block 3
+        test_loop_nesting(
+            &[(0, 1), (0, 2), (1, 3), (1, 2), (2, 1)],
+            &[None, Some(1), None, None, None, None],
+        );
+    }
+}