author     Daniel Baumann <daniel.baumann@progress-linux.org>  2024-04-28 14:29:10 +0000
committer  Daniel Baumann <daniel.baumann@progress-linux.org>  2024-04-28 14:29:10 +0000
commit     2aa4a82499d4becd2284cdb482213d541b8804dd
tree       b80bf8bf13c3766139fbacc530efd0dd9d54394c
parent     Initial commit.
Adding upstream version 86.0.1.
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'third_party/rust/regalloc/src/analysis_control_flow.rs')
-rw-r--r--  third_party/rust/regalloc/src/analysis_control_flow.rs | 742
1 file changed, 742 insertions(+), 0 deletions(-)
diff --git a/third_party/rust/regalloc/src/analysis_control_flow.rs b/third_party/rust/regalloc/src/analysis_control_flow.rs
new file mode 100644
index 0000000000..e28f630aa0
--- /dev/null
+++ b/third_party/rust/regalloc/src/analysis_control_flow.rs
@@ -0,0 +1,742 @@
+//! Performs control flow analysis.
+
+use log::{debug, info};
+use std::cmp::Ordering;
+
+use crate::analysis_main::AnalysisError;
+use crate::data_structures::{BlockIx, InstIx, Range, Set, TypedIxVec};
+use crate::sparse_set::{SparseSetU, SparseSetUIter};
+use crate::Function;
+
+use smallvec::SmallVec;
+
+//=============================================================================
+// Debugging config. Set this to `false` for normal operation.
+
+// DEBUGGING: set to true to cross-check the dominator-tree computation.
+const CROSSCHECK_DOMS: bool = false;
+
+//===========================================================================//
+// //
+// CONTROL FLOW ANALYSIS //
+// //
+//===========================================================================//
+
+//=============================================================================
+// Control flow analysis: create the InstIx-to-BlockIx mapping
+
+// This is trivial, but it's sometimes useful to have.
+// Note: confusingly, the `Range` here is data_structures::Range, not
+// std::ops::Range.
+pub struct InstIxToBlockIxMap {
+ vek: TypedIxVec<BlockIx, Range<InstIx>>,
+}
+
+impl InstIxToBlockIxMap {
+ #[inline(never)]
+ pub fn new<F: Function>(func: &F) -> Self {
+ let mut vek = TypedIxVec::<BlockIx, Range<InstIx>>::new();
+ for bix in func.blocks() {
+ let r: Range<InstIx> = func.block_insns(bix);
+ assert!(r.start() <= r.last_plus1());
+ vek.push(r);
+ }
+
+ fn cmp_ranges(r1: &Range<InstIx>, r2: &Range<InstIx>) -> Ordering {
+ if r1.last_plus1() <= r2.first() {
+ return Ordering::Less;
+ }
+ if r2.last_plus1() <= r1.first() {
+ return Ordering::Greater;
+ }
+ if r1.first() == r2.first() && r1.last_plus1() == r2.last_plus1() {
+ return Ordering::Equal;
+ }
+ // If this happens, F::block_insns is telling us something that isn't right.
+ panic!("InstIxToBlockIxMap::cmp_ranges: overlapping InstIx ranges!");
+ }
+
+ vek.sort_unstable_by(|r1, r2| cmp_ranges(r1, r2));
+ // Sanity check: ascending, non-overlapping, no gaps. We need this in
+ // order to ensure that binary searching in `map` works properly.
+ for i in 1..vek.len() {
+ let r_m1 = &vek[BlockIx::new(i - 1)];
+ let r_m0 = &vek[BlockIx::new(i)];
+ assert!(r_m1.last_plus1() == r_m0.first());
+ }
+
+ Self { vek }
+ }
+
+ #[inline(never)]
+ pub fn map(&self, iix: InstIx) -> BlockIx {
+ if self.vek.len() > 0 {
+ let mut lo = 0isize;
+ let mut hi = self.vek.len() as isize - 1;
+ loop {
+ if lo > hi {
+ break;
+ }
+ let mid = (lo + hi) / 2;
+ let midv = &self.vek[BlockIx::new(mid as u32)];
+ if iix < midv.start() {
+ hi = mid - 1;
+ continue;
+ }
+ if iix >= midv.last_plus1() {
+ lo = mid + 1;
+ continue;
+ }
+ assert!(midv.start() <= iix && iix < midv.last_plus1());
+ return BlockIx::new(mid as u32);
+ }
+ }
+ panic!("InstIxToBlockIxMap::map: can't map {:?}", iix);
+ }
+}
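+
+// Illustrative sketch, not used by the allocator: the same range binary
+// search as `InstIxToBlockIxMap::map`, but over plain `(start, end)` pairs.
+// It assumes half-open, ascending, gap-free ranges, which is exactly what
+// the constructor above checks for.
+#[cfg(test)]
+mod sketch_inst_to_block_map {
+    // Returns the index of the range containing `iix`, if any.
+    fn map(ranges: &[(u32, u32)], iix: u32) -> Option<usize> {
+        let mut lo = 0isize;
+        let mut hi = ranges.len() as isize - 1;
+        while lo <= hi {
+            let mid = (lo + hi) / 2;
+            let (start, end) = ranges[mid as usize];
+            if iix < start {
+                hi = mid - 1;
+            } else if iix >= end {
+                lo = mid + 1;
+            } else {
+                return Some(mid as usize);
+            }
+        }
+        None
+    }
+
+    #[test]
+    fn finds_blocks() {
+        // Three "blocks" covering insns 0..3, 3..5 and 5..9.
+        let ranges = [(0, 3), (3, 5), (5, 9)];
+        assert_eq!(map(&ranges, 0), Some(0));
+        assert_eq!(map(&ranges, 4), Some(1));
+        assert_eq!(map(&ranges, 8), Some(2));
+        assert_eq!(map(&ranges, 9), None); // past the last block
+    }
+}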
+
+//=============================================================================
+// Control flow analysis: calculation of block successor and predecessor maps
+
+// Returned TypedIxVecs contain one element per block
+#[inline(never)]
+fn calc_preds_and_succs<F: Function>(
+ func: &F,
+ num_blocks: u32,
+) -> (
+ TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+ TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+) {
+ info!(" calc_preds_and_succs: begin");
+
+ assert!(func.blocks().len() == num_blocks as usize);
+
+ // First calculate the succ map, since we can do that directly from the
+ // Func.
+ //
+ // Func::finish() ensures that all blocks are non-empty, and that only the
+ // last instruction is a control flow transfer. Hence the following won't
+ // miss any edges.
+ let mut succ_map = TypedIxVec::<BlockIx, SparseSetU<[BlockIx; 4]>>::new();
+ for b in func.blocks() {
+ let mut bix_set = SparseSetU::<[BlockIx; 4]>::empty();
+ for bix in func.block_succs(b).iter() {
+ bix_set.insert(*bix);
+ }
+ succ_map.push(bix_set);
+ }
+
+ // Now invert the mapping
+ let mut pred_map = TypedIxVec::<BlockIx, SparseSetU<[BlockIx; 4]>>::new();
+ pred_map.resize(num_blocks, SparseSetU::<[BlockIx; 4]>::empty());
+ for (src, dst_set) in (0..).zip(succ_map.iter()) {
+ for dst in dst_set.iter() {
+ pred_map[*dst].insert(BlockIx::new(src));
+ }
+ }
+
+ // Stay sane ..
+ assert!(pred_map.len() == num_blocks);
+ assert!(succ_map.len() == num_blocks);
+
+ let mut n = 0;
+ debug!("");
+ for (preds, succs) in pred_map.iter().zip(succ_map.iter()) {
+ debug!(
+ "{:<3?} preds {:<16?} succs {:?}",
+ BlockIx::new(n),
+ preds,
+ succs
+ );
+ n += 1;
+ }
+
+ info!(" calc_preds_and_succs: end");
+ (pred_map, succ_map)
+}
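+
+// Illustrative sketch, not used by the allocator: inverting a successor map
+// into a predecessor map, as `calc_preds_and_succs` does above, with plain
+// `Vec`s of `u32` block numbers standing in for `TypedIxVec`/`SparseSetU`.
+#[cfg(test)]
+mod sketch_pred_succ_inversion {
+    #[test]
+    fn inverts_edges() {
+        // succ_map[b] lists the successors of block b (a diamond CFG).
+        let succ_map: Vec<Vec<u32>> = vec![vec![1, 2], vec![3], vec![3], vec![]];
+        let mut pred_map: Vec<Vec<u32>> = vec![Vec::new(); succ_map.len()];
+        for (src, dsts) in succ_map.iter().enumerate() {
+            for &dst in dsts {
+                pred_map[dst as usize].push(src as u32);
+            }
+        }
+        assert_eq!(pred_map, vec![vec![], vec![0], vec![0], vec![1, 2]]);
+    }
+}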
+
+//=============================================================================
+// Control flow analysis: calculation of block preorder and postorder sequences
+
+// Returned Vecs contain one element per block. `None` is returned if the
+// sequences do not contain `num_blocks` elements, in which case the input
+// contains blocks not reachable from the entry point, and is invalid.
+#[inline(never)]
+fn calc_preord_and_postord<F: Function>(
+ func: &F,
+ num_blocks: u32,
+ succ_map: &TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+) -> Option<(Vec<BlockIx>, Vec<BlockIx>)> {
+ info!(" calc_preord_and_postord: begin");
+
+ let mut pre_ord = Vec::<BlockIx>::new();
+ let mut post_ord = Vec::<BlockIx>::new();
+
+ let mut visited = TypedIxVec::<BlockIx, bool>::new();
+ visited.resize(num_blocks, false);
+
+ // Set up initial state: entry block on the stack, marked as visited, and placed at the
+ // start of the pre-ord sequence.
+ let mut stack = SmallVec::<[(BlockIx, SparseSetUIter<[BlockIx; 4]>); 64]>::new();
+ let bix_entry = func.entry_block();
+ visited[bix_entry] = true;
+ pre_ord.push(bix_entry);
+ stack.push((bix_entry, succ_map[bix_entry].iter()));
+
+ 'outer: while let Some((bix, bix_succ_iter)) = stack.last_mut() {
+ // Consider the block on the top of the stack. Does it have any successors we
+ // haven't yet visited?
+ while let Some(bix_next_succ) = bix_succ_iter.next() {
+ if !visited[*bix_next_succ] {
+ // Yes. Push just one of them on the stack, along with a newly initialised
+ // iterator for it, and continue by considering the new stack top. Because
+ // blocks are only ever pushed onto the stack once, we must also add the
+ // block to the pre-ord sequence at this point.
+ visited[*bix_next_succ] = true;
+ pre_ord.push(*bix_next_succ);
+ stack.push((*bix_next_succ, succ_map[*bix_next_succ].iter()));
+ continue 'outer;
+ }
+ }
+ // No. This is the last time we'll ever hear of it. So add it to the post-ord
+ // sequence, remove the now-defunct stack-top item, and move on.
+ post_ord.push(*bix);
+ stack.pop();
+ }
+
+ assert!(pre_ord.len() == post_ord.len());
+ assert!(pre_ord.len() <= num_blocks as usize);
+ if pre_ord.len() < num_blocks as usize {
+ info!(
+ " calc_preord_and_postord: invalid: {} blocks, {} reachable",
+ num_blocks,
+ pre_ord.len()
+ );
+ return None;
+ }
+
+ assert!(pre_ord.len() == num_blocks as usize);
+ assert!(post_ord.len() == num_blocks as usize);
+ #[cfg(debug_assertions)]
+ {
+ let mut pre_ord_sorted: Vec<BlockIx> = pre_ord.clone();
+ let mut post_ord_sorted: Vec<BlockIx> = post_ord.clone();
+ pre_ord_sorted.sort_by(|bix1, bix2| bix1.get().partial_cmp(&bix2.get()).unwrap());
+ post_ord_sorted.sort_by(|bix1, bix2| bix1.get().partial_cmp(&bix2.get()).unwrap());
+ let expected: Vec<BlockIx> = (0..num_blocks).map(|u| BlockIx::new(u)).collect();
+ debug_assert!(pre_ord_sorted == expected);
+ debug_assert!(post_ord_sorted == expected);
+ }
+
+ info!(" calc_preord_and_postord: end. {} blocks", num_blocks);
+ Some((pre_ord, post_ord))
+}
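+
+// Illustrative sketch, not used by the allocator: the same explicit-stack
+// DFS on a diamond CFG (0 -> {1,2}, 1 -> 3, 2 -> 3). Each stack entry keeps
+// an index into its successor list instead of a live iterator, which avoids
+// the borrow gymnastics of the real code but visits blocks identically.
+#[cfg(test)]
+mod sketch_pre_post_order {
+    #[test]
+    fn diamond_orders() {
+        let succs: Vec<Vec<usize>> = vec![vec![1, 2], vec![3], vec![3], vec![]];
+        let mut visited = vec![false; succs.len()];
+        let mut pre_ord = Vec::new();
+        let mut post_ord = Vec::new();
+        // Stack entries: (block, index of the next successor to examine).
+        let mut stack = vec![(0usize, 0usize)];
+        visited[0] = true;
+        pre_ord.push(0);
+        while let Some(&(bix, next)) = stack.last() {
+            if next < succs[bix].len() {
+                let succ = succs[bix][next];
+                stack.last_mut().unwrap().1 = next + 1;
+                if !visited[succ] {
+                    visited[succ] = true;
+                    pre_ord.push(succ);
+                    stack.push((succ, 0));
+                }
+            } else {
+                // All successors seen: this block's postorder slot is now.
+                post_ord.push(bix);
+                stack.pop();
+            }
+        }
+        assert_eq!(pre_ord, vec![0, 1, 3, 2]);
+        assert_eq!(post_ord, vec![3, 1, 2, 0]);
+    }
+}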
+
+//=============================================================================
+// Computation of per-block dominator sets. Note, this is slow, and will be
+// removed at some point.
+
+// Calculate the dominance relationship, given `pred_map` and a start node
+// `start`. The resulting vector maps each block to the set of blocks that
+// dominate it. This algorithm is from Fig 7.14 of Muchnick 1997. The
+// algorithm is described as simple but not as performant as some others.
+#[inline(never)]
+fn calc_dom_sets_slow(
+ num_blocks: u32,
+ pred_map: &TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+ post_ord: &Vec<BlockIx>,
+ start: BlockIx,
+) -> TypedIxVec<BlockIx, Set<BlockIx>> {
+ info!(" calc_dom_sets_slow: begin");
+
+ let mut dom_map = TypedIxVec::<BlockIx, Set<BlockIx>>::new();
+
+ // FIXME find better names for n/d/t sets.
+ {
+ let root: BlockIx = start;
+ let n_set: Set<BlockIx> =
+ Set::from_vec((0..num_blocks).map(|bix| BlockIx::new(bix)).collect());
+ let mut d_set: Set<BlockIx>;
+ let mut t_set: Set<BlockIx>;
+
+ dom_map.resize(num_blocks, Set::<BlockIx>::empty());
+ dom_map[root] = Set::unit(root);
+ for block_i in 0..num_blocks {
+ let block_ix = BlockIx::new(block_i);
+ if block_ix != root {
+ dom_map[block_ix] = n_set.clone();
+ }
+ }
+
+ let mut num_iter = 0;
+ loop {
+ num_iter += 1;
+ info!(" calc_dom_sets_slow: outer loop {}", num_iter);
+ let mut change = false;
+ for i in 0..num_blocks {
+ // block_ix travels in "reverse postorder"
+ let block_ix = post_ord[(num_blocks - 1 - i) as usize];
+ if block_ix == root {
+ continue;
+ }
+ t_set = n_set.clone();
+ for pred_ix in pred_map[block_ix].iter() {
+ t_set.intersect(&dom_map[*pred_ix]);
+ }
+ d_set = t_set.clone();
+ d_set.insert(block_ix);
+ if !d_set.equals(&dom_map[block_ix]) {
+ change = true;
+ dom_map[block_ix] = d_set;
+ }
+ }
+ if !change {
+ break;
+ }
+ }
+ }
+
+ debug!("");
+ let mut block_ix = 0;
+ for dom_set in dom_map.iter() {
+ debug!("{:<3?} dom_set {:<16?}", BlockIx::new(block_ix), dom_set);
+ block_ix += 1;
+ }
+ info!(" calc_dom_sets_slow: end");
+ dom_map
+}
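+
+// Illustrative sketch, not used by the allocator: the same iterative
+// dominator-set computation (Muchnick Fig 7.14) with `HashSet<usize>` in
+// place of the crate's `Set<BlockIx>`, on the diamond CFG 0 -> {1,2} -> 3.
+// The real code visits blocks in reverse postorder so that it converges in
+// fewer passes; plain 0..n order, as here, also converges.
+#[cfg(test)]
+mod sketch_dom_sets_slow {
+    use std::collections::HashSet;
+
+    #[test]
+    fn diamond_dominators() {
+        let preds: Vec<Vec<usize>> = vec![vec![], vec![0], vec![0], vec![1, 2]];
+        let n = preds.len();
+        let all: HashSet<usize> = (0..n).collect();
+        // Root dominates only itself; everything else starts with the full
+        // set, to be whittled down by intersection over predecessors.
+        let mut dom: Vec<HashSet<usize>> = vec![all.clone(); n];
+        dom[0] = std::iter::once(0).collect();
+        let mut changed = true;
+        while changed {
+            changed = false;
+            for b in 1..n {
+                let mut t = all.clone();
+                for &p in &preds[b] {
+                    t = t.intersection(&dom[p]).copied().collect();
+                }
+                t.insert(b);
+                if t != dom[b] {
+                    dom[b] = t;
+                    changed = true;
+                }
+            }
+        }
+        // The join point is dominated only by the entry and itself.
+        assert_eq!(dom[3], vec![0, 3].into_iter().collect::<HashSet<_>>());
+    }
+}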
+
+//=============================================================================
+// Computation of per-block dominator sets by first computing trees.
+//
+// This is an implementation of the algorithm described in
+//
+// A Simple, Fast Dominance Algorithm
+// Keith D. Cooper, Timothy J. Harvey, and Ken Kennedy
+// Department of Computer Science, Rice University, Houston, Texas, USA
+// TR-06-33870
+// https://www.cs.rice.edu/~keith/EMBED/dom.pdf
+//
+// which appears to be the de-facto standard scheme for computing dominance
+// quickly nowadays.
+
+// Marker values for "invalid". These live at module scope so that both
+// `dt_merge_sets` and `calc_dom_tree` below can refer to them.
+const DT_INVALID_POSTORD: u32 = 0xFFFF_FFFF;
+const DT_INVALID_BLOCKIX: BlockIx = BlockIx::BlockIx(0xFFFF_FFFF);
+
+// Helper
+fn dt_merge_sets(
+ idom: &TypedIxVec<BlockIx, BlockIx>,
+ bix2rpostord: &TypedIxVec<BlockIx, u32>,
+ mut node1: BlockIx,
+ mut node2: BlockIx,
+) -> BlockIx {
+ while node1 != node2 {
+ if node1 == DT_INVALID_BLOCKIX || node2 == DT_INVALID_BLOCKIX {
+ return DT_INVALID_BLOCKIX;
+ }
+ let rpo1 = bix2rpostord[node1];
+ let rpo2 = bix2rpostord[node2];
+ if rpo1 > rpo2 {
+ node1 = idom[node1];
+ } else if rpo2 > rpo1 {
+ node2 = idom[node2];
+ }
+ }
+ assert!(node1 == node2);
+ node1
+}
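+
+// Illustrative sketch, not used by the allocator: the Cooper/Harvey/Kennedy
+// "two-finger" intersection that `dt_merge_sets` implements, on plain
+// arrays. Repeatedly advancing whichever finger has the larger
+// reverse-postorder number walks both nodes up the current idom tree until
+// they meet at their nearest common ancestor. The real code additionally
+// propagates an "invalid" marker for nodes whose idom is not yet known.
+#[cfg(test)]
+mod sketch_two_finger_intersect {
+    fn intersect(idom: &[usize], rpostord: &[usize], mut a: usize, mut b: usize) -> usize {
+        while a != b {
+            if rpostord[a] > rpostord[b] {
+                a = idom[a];
+            } else {
+                b = idom[b];
+            }
+        }
+        a
+    }
+
+    #[test]
+    fn diamond_merge() {
+        // Diamond 0 -> {1,2} -> 3 with its solved idom tree: all point at 0.
+        // Blocks happen to be numbered in reverse postorder already.
+        let idom = [0, 0, 0, 0];
+        let rpostord = [0, 1, 2, 3];
+        assert_eq!(intersect(&idom, &rpostord, 1, 2), 0);
+        assert_eq!(intersect(&idom, &rpostord, 3, 1), 0);
+    }
+}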
+
+#[inline(never)]
+fn calc_dom_tree(
+ num_blocks: u32,
+ pred_map: &TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+ post_ord: &Vec<BlockIx>,
+ start: BlockIx,
+) -> TypedIxVec<BlockIx, BlockIx> {
+ info!(" calc_dom_tree: begin");
+
+ // We use 2^32-1 as a marker for an invalid BlockIx or postorder number.
+ // Hence we need this:
+ assert!(num_blocks < DT_INVALID_POSTORD);
+
+ // We have post_ord, which is the postorder sequence.
+
+ // Compute bix2rpostord, which maps a BlockIx to its reverse postorder
+ // number. And rpostord2bix, which maps a reverse postorder number to its
+ // BlockIx.
+ let mut bix2rpostord = TypedIxVec::<BlockIx, u32>::new();
+ let mut rpostord2bix = Vec::<BlockIx>::new();
+ bix2rpostord.resize(num_blocks, DT_INVALID_POSTORD);
+ rpostord2bix.resize(num_blocks as usize, DT_INVALID_BLOCKIX);
+ for n in 0..num_blocks {
+ // bix visits the blocks in reverse postorder
+ let bix = post_ord[(num_blocks - 1 - n) as usize];
+ // Hence:
+ bix2rpostord[bix] = n;
+ // and
+ rpostord2bix[n as usize] = bix;
+ }
+ for n in 0..num_blocks {
+ debug_assert!(bix2rpostord[BlockIx::new(n)] < num_blocks);
+ }
+
+ let mut idom = TypedIxVec::<BlockIx, BlockIx>::new();
+ idom.resize(num_blocks, DT_INVALID_BLOCKIX);
+
+ // The start node must have itself as a parent.
+ idom[start] = start;
+
+ for i in 0..num_blocks {
+ let block_ix = BlockIx::new(i);
+ let preds_of_i = &pred_map[block_ix];
+ // All nodes must be reachable from the root. That means that all nodes
+ // that aren't `start` must have at least one predecessor. However, we
+ // can't assert the inverse case -- that the start node has no
+ // predecessors -- because the start node might be a self-loop, in which
+ // case it will have itself as a pred. See tests/domtree_fuzz1.rat.
+ if block_ix != start {
+ assert!(!preds_of_i.is_empty());
+ }
+ }
+
+ let mut changed = true;
+ while changed {
+ changed = false;
+ for n in 0..num_blocks {
+ // Consider blocks in reverse postorder.
+ let node = rpostord2bix[n as usize];
+ assert!(node != DT_INVALID_BLOCKIX);
+ let node_preds = &pred_map[node];
+ let rponum = bix2rpostord[node];
+
+ let mut parent = DT_INVALID_BLOCKIX;
+ if node_preds.is_empty() {
+ // No preds, `parent` remains invalid.
+ } else {
+ for pred in node_preds.iter() {
+ let pred_rpo = bix2rpostord[*pred];
+ if pred_rpo < rponum {
+ parent = *pred;
+ break;
+ }
+ }
+ }
+
+ if parent != DT_INVALID_BLOCKIX {
+ for pred in node_preds.iter() {
+ if *pred == parent {
+ continue;
+ }
+ if idom[*pred] == DT_INVALID_BLOCKIX {
+ continue;
+ }
+ parent = dt_merge_sets(&idom, &bix2rpostord, parent, *pred);
+ }
+ }
+
+ if parent != DT_INVALID_BLOCKIX && parent != idom[node] {
+ idom[node] = parent;
+ changed = true;
+ }
+ }
+ }
+
+ // Check what we can. The start node should be its own parent. All other
+ // nodes should not be their own parent, since we are assured that there are
+ // no dead blocks in the graph, and hence that there is a single dominator
+ // tree covering the whole graph.
+ assert!(idom[start] == start);
+ for i in 0..num_blocks {
+ let block_ix = BlockIx::new(i);
+ // All "parent pointers" are valid.
+ assert!(idom[block_ix] != DT_INVALID_BLOCKIX);
+ // The only node whose parent pointer points to itself is the start node.
+ assert!((idom[block_ix] == block_ix) == (block_ix == start));
+ }
+
+ if CROSSCHECK_DOMS {
+ // Crosscheck the dom tree, by computing dom sets using the simple
+ // iterative algorithm. Then, for each block, construct the dominator set
+ // by walking up the tree to the root, and check that it's the same as
+ // what the simple algorithm produced.
+
+ info!(" calc_dom_tree crosscheck: begin");
+ let slow_sets = calc_dom_sets_slow(num_blocks, pred_map, post_ord, start);
+ assert!(slow_sets.len() == idom.len());
+
+ for i in 0..num_blocks {
+ let mut block_ix = BlockIx::new(i);
+ let mut set = Set::<BlockIx>::empty();
+ loop {
+ set.insert(block_ix);
+ let other_block_ix = idom[block_ix];
+ if other_block_ix == block_ix {
+ break;
+ }
+ block_ix = other_block_ix;
+ }
+ assert!(set.to_vec() == slow_sets[BlockIx::new(i)].to_vec());
+ }
+ info!(" calc_dom_tree crosscheck: end");
+ }
+
+ info!(" calc_dom_tree: end");
+ idom
+}
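+
+// Illustrative sketch, not used by the allocator: recovering a block's full
+// dominator set from the idom tree by following parent pointers up to the
+// root, which is exactly what the CROSSCHECK_DOMS code above does when
+// comparing against `calc_dom_sets_slow`.
+#[cfg(test)]
+mod sketch_dom_set_from_tree {
+    #[test]
+    fn walk_to_root() {
+        // Solved idom tree for the diamond 0 -> {1,2} -> 3; the root is its
+        // own parent, so that is the loop's stopping condition.
+        let idom = [0usize, 0, 0, 0];
+        let mut dominators_of_3 = Vec::new();
+        let mut b = 3;
+        loop {
+            dominators_of_3.push(b);
+            if idom[b] == b {
+                break;
+            }
+            b = idom[b];
+        }
+        assert_eq!(dominators_of_3, vec![3, 0]);
+    }
+}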
+
+//=============================================================================
+// Computation of per-block loop-depths
+
+#[inline(never)]
+fn calc_loop_depths(
+ num_blocks: u32,
+ pred_map: &TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+ succ_map: &TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+ post_ord: &Vec<BlockIx>,
+ start: BlockIx,
+) -> TypedIxVec<BlockIx, u32> {
+ info!(" calc_loop_depths: begin");
+ let idom = calc_dom_tree(num_blocks, pred_map, post_ord, start);
+
+ // Find the loops. First, find the "loop header nodes", and from those,
+ // derive the loops.
+ //
+ // Loop headers:
+ // A "back edge" m->n is an edge m->n where n dominates m. `n` is
+ // the loop header node.
+ //
+ // `back_edges` is a set rather than a vector so as to avoid complications
+ // that might later arise if the same loop is enumerated more than once.
+ //
+ // Iterate over all edges (m->n)
+ let mut back_edges = Set::<(BlockIx, BlockIx)>::empty();
+ for block_m_ix in BlockIx::new(0).dotdot(BlockIx::new(num_blocks)) {
+ for block_n_ix in succ_map[block_m_ix].iter() {
+ // Figure out if N dominates M. Do this by walking the dom tree from M
+ // back up to the root, and seeing if we encounter N on the way.
+ let mut n_dominates_m = false;
+ let mut block_ix = block_m_ix;
+ loop {
+ if block_ix == *block_n_ix {
+ n_dominates_m = true;
+ break;
+ }
+ let other_block_ix = idom[block_ix];
+ if other_block_ix == block_ix {
+ break;
+ }
+ block_ix = other_block_ix;
+ }
+ if n_dominates_m {
+ //println!("QQQQ back edge {} -> {}",
+ // block_m_ix.show(), block_n_ix.show());
+ back_edges.insert((block_m_ix, *block_n_ix));
+ }
+ }
+ }
+
+ // Now collect the sets of Blocks for each loop. For each back edge,
+ // collect up all the blocks in the natural loop defined by the back edge
+ // M->N. This algorithm is from Fig 7.21 of Muchnick 1997 (an excellent
+ // book). Order in `natural_loops` has no particular meaning.
+ let mut natural_loops = Vec::<Set<BlockIx>>::new();
+ for (block_m_ix, block_n_ix) in back_edges.iter() {
+ let mut loop_set: Set<BlockIx>;
+ let mut stack: Vec<BlockIx>;
+ stack = Vec::<BlockIx>::new();
+ loop_set = Set::<BlockIx>::two(*block_m_ix, *block_n_ix);
+ if block_m_ix != block_n_ix {
+ // The next line is missing in the Muchnick description. Without it the
+ // algorithm doesn't make any sense, though.
+ stack.push(*block_m_ix);
+ while let Some(block_p_ix) = stack.pop() {
+ for block_q_ix in pred_map[block_p_ix].iter() {
+ if !loop_set.contains(*block_q_ix) {
+ loop_set.insert(*block_q_ix);
+ stack.push(*block_q_ix);
+ }
+ }
+ }
+ }
+ natural_loops.push(loop_set);
+ }
+
+ // Here is a kludgey way to compute the depth of each loop. First, order
+ // `natural_loops` by increasing size, so the largest loops are at the end.
+ // Then, repeatedly scan forwards through the vector, in "upper triangular
+ // matrix" style. For each scan, remember the "current loop". Initially
+ // the "current loop" is the start point of each scan. If, during the scan,
+ // we encounter a loop which is a superset of the "current loop", change the
+ // "current loop" to this new loop, and increment a counter associated with
+ // the start point of the scan. The effect is that the counter records the
+ // nesting depth of the loop at the start of the scan. For this to be
+ // completely accurate, I _think_ this requires the property that loops are
+ // either disjoint or nested, and never partially overlapping.
+
+ natural_loops.sort_by(|left_block_set, right_block_set| {
+ left_block_set
+ .card()
+ .partial_cmp(&right_block_set.card())
+ .unwrap()
+ });
+
+ let num_loops = natural_loops.len();
+ let mut loop_depths = Vec::<u32>::new();
+ loop_depths.resize(num_loops, 0);
+
+ for i in 0..num_loops {
+ let mut curr = i;
+ let mut depth = 1;
+ for j in i + 1..num_loops {
+ debug_assert!(curr < j);
+ if natural_loops[curr].is_subset_of(&natural_loops[j]) {
+ depth += 1;
+ curr = j;
+ }
+ }
+ loop_depths[i] = depth;
+ }
+
+ // Now that we have a depth for each loop, we can finally compute the depth
+ // for each block.
+ let mut depth_map = TypedIxVec::<BlockIx, u32>::new();
+ depth_map.resize(num_blocks, 0);
+ for (loop_block_indexes, depth) in natural_loops.iter().zip(loop_depths) {
+ for loop_block_ix in loop_block_indexes.iter() {
+ if depth_map[*loop_block_ix] < depth {
+ depth_map[*loop_block_ix] = depth;
+ }
+ }
+ }
+
+ debug_assert!(depth_map.len() == num_blocks);
+
+ let mut n = 0;
+ debug!("");
+ for (depth, idom_by) in depth_map.iter().zip(idom.iter()) {
+ debug!(
+ "{:<3?} depth {} idom {:?}",
+ BlockIx::new(n),
+ depth,
+ idom_by
+ );
+ n += 1;
+ }
+
+ info!(" calc_loop_depths: end");
+ depth_map
+}
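+
+// Illustrative sketch, not used by the allocator: collecting the natural
+// loop of a back edge m->n (Muchnick Fig 7.21) and then deriving nesting
+// depths by the smallest-to-largest subset scan described above. The CFG is
+// a two-level loop nest, and the two back edges (3 -> 2 inner, 4 -> 1
+// outer) are taken as given rather than rediscovered from a dominator tree.
+#[cfg(test)]
+mod sketch_natural_loops {
+    use std::collections::HashSet;
+
+    // The natural loop of back edge m->n: n, m, and every block reachable
+    // backwards from m without passing through n.
+    fn natural_loop(preds: &[Vec<usize>], m: usize, n: usize) -> HashSet<usize> {
+        let mut loop_set: HashSet<usize> = vec![m, n].into_iter().collect();
+        let mut stack = if m != n { vec![m] } else { vec![] };
+        while let Some(p) = stack.pop() {
+            for &q in &preds[p] {
+                if loop_set.insert(q) {
+                    stack.push(q);
+                }
+            }
+        }
+        loop_set
+    }
+
+    #[test]
+    fn nested_loops() {
+        // CFG: 0->1, 1->2, 2->3, 3->{2,4}, 4->{1,5}, as a predecessor map.
+        let preds: Vec<Vec<usize>> =
+            vec![vec![], vec![0, 4], vec![1, 3], vec![2], vec![3], vec![4]];
+        let inner = natural_loop(&preds, 3, 2);
+        let outer = natural_loop(&preds, 4, 1);
+        assert_eq!(inner, vec![2, 3].into_iter().collect::<HashSet<_>>());
+        assert_eq!(outer, vec![1, 2, 3, 4].into_iter().collect::<HashSet<_>>());
+        // Size-ordered subset scan: each superset met bumps the depth.
+        let loops = [&inner, &outer]; // already sorted by increasing size
+        let mut depth = 1;
+        let mut curr = 0;
+        for j in 1..loops.len() {
+            if loops[curr].is_subset(loops[j]) {
+                depth += 1;
+                curr = j;
+            }
+        }
+        assert_eq!(depth, 2); // the inner loop sits at nesting depth 2
+    }
+}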
+
+//=============================================================================
+// Control-flow analysis top level: For a Func: predecessors, successors,
+// preord and postord sequences, and loop depths.
+
+// CFGInfo contains CFG-related info computed from a Func.
+pub struct CFGInfo {
+ // All these TypedIxVecs and plain Vecs contain one element per Block in the
+ // Func.
+
+ // Predecessor and successor maps.
+ pub pred_map: TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+ pub succ_map: TypedIxVec<BlockIx, SparseSetU<[BlockIx; 4]>>,
+
+ // Pre- and post-order sequences. Iterating forwards through these
+ // vectors enumerates the blocks in preorder and postorder respectively.
+ pub pre_ord: Vec<BlockIx>,
+ pub _post_ord: Vec<BlockIx>,
+
+ // Maps each Block to the loop depth it sits at.
+ pub depth_map: TypedIxVec<BlockIx, u32>,
+}
+
+impl CFGInfo {
+ #[inline(never)]
+ pub fn create<F: Function>(func: &F) -> Result<Self, AnalysisError> {
+ info!(" CFGInfo::create: begin");
+
+ // Throw out insanely large inputs. They'll probably cause failure later
+ // on.
+ let num_blocks_usize = func.blocks().len();
+ if num_blocks_usize >= 1 * 1024 * 1024 {
+ // 1 million blocks should be enough for anyone. That will soak up 20
+ // index bits, leaving a "safety margin" of 12 bits for indices for
+ // induced structures (RangeFragIx, InstIx, VirtualRangeIx, RealRangeIx,
+ // etc).
+ return Err(AnalysisError::ImplementationLimitsExceeded);
+ }
+
+ // Similarly, limit the number of instructions to 16 million. This allows
+ // 16 insns per block with the worst-case number of blocks. Because each
+ // insn typically generates somewhat less than one new value, this check
+ // also has the effect of limiting the number of virtual registers to
+ // roughly the same amount (16 million).
+ if func.insns().len() >= 16 * 1024 * 1024 {
+ return Err(AnalysisError::ImplementationLimitsExceeded);
+ }
+
+ // Now we know we're safe to narrow it to u32.
+ let num_blocks = num_blocks_usize as u32;
+
+ // === BEGIN compute successor and predecessor maps ===
+ //
+ let (pred_map, succ_map) = calc_preds_and_succs(func, num_blocks);
+ assert!(pred_map.len() == num_blocks);
+ assert!(succ_map.len() == num_blocks);
+ //
+ // === END compute successor and predecessor maps ===
+
+ // === BEGIN check that critical edges have been split ===
+ //
+ for (src, dst_set) in (0..).zip(succ_map.iter()) {
+ if dst_set.card() < 2 {
+ continue;
+ }
+ for dst in dst_set.iter() {
+ if pred_map[*dst].card() >= 2 {
+ return Err(AnalysisError::CriticalEdge {
+ from: BlockIx::new(src),
+ to: *dst,
+ });
+ }
+ }
+ }
+ //
+ // === END check that critical edges have been split ===
+
+ // === BEGIN compute preord/postord sequences ===
+ //
+ let mb_pre_ord_and_post_ord = calc_preord_and_postord(func, num_blocks, &succ_map);
+ if mb_pre_ord_and_post_ord.is_none() {
+ return Err(AnalysisError::UnreachableBlocks);
+ }
+
+ let (pre_ord, post_ord) = mb_pre_ord_and_post_ord.unwrap();
+ assert!(pre_ord.len() == num_blocks as usize);
+ assert!(post_ord.len() == num_blocks as usize);
+ //
+ // === END compute preord/postord sequences ===
+
+ // === BEGIN compute loop depth of all Blocks
+ //
+ let depth_map = calc_loop_depths(
+ num_blocks,
+ &pred_map,
+ &succ_map,
+ &post_ord,
+ func.entry_block(),
+ );
+ debug_assert!(depth_map.len() == num_blocks);
+ //
+ // === END compute loop depth of all Blocks
+
+ info!(" CFGInfo::create: end");
+ Ok(CFGInfo {
+ pred_map,
+ succ_map,
+ pre_ord,
+ _post_ord: post_ord,
+ depth_map,
+ })
+ }
+}
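+
+// Illustrative sketch, not used by the allocator: the critical-edge test
+// from `CFGInfo::create` above. An edge is critical when its source has two
+// or more successors and its destination has two or more predecessors; the
+// allocator requires all such edges to have been split beforehand.
+#[cfg(test)]
+mod sketch_critical_edge {
+    #[test]
+    fn detects_critical_edge() {
+        // 0 -> {1, 2} and 1 -> 2: the edge 0 -> 2 is critical, since block 0
+        // has two successors and block 2 has two predecessors.
+        let succs: Vec<Vec<usize>> = vec![vec![1, 2], vec![2], vec![]];
+        let preds: Vec<Vec<usize>> = vec![vec![], vec![0], vec![0, 1]];
+        let mut critical = Vec::new();
+        for (src, dsts) in succs.iter().enumerate() {
+            if dsts.len() < 2 {
+                continue;
+            }
+            for &dst in dsts {
+                if preds[dst].len() >= 2 {
+                    critical.push((src, dst));
+                }
+            }
+        }
+        assert_eq!(critical, vec![(0, 2)]);
+    }
+}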