From 0d0a5367772aacd4c0baf954f601952a3a2017aa Mon Sep 17 00:00:00 2001
From: Camille GILLOT <gillot.camille@gmail.com>
Date: Thu, 20 Apr 2023 17:07:16 +0000
Subject: [PATCH] Do not thread through loop headers.

---
 .../rustc_mir_transform/src/jump_threading.rs | 45 +++++++++++++++++--
 ...reading.dfa.JumpThreading.panic-abort.diff | 19 ++------
 ...eading.dfa.JumpThreading.panic-unwind.diff | 19 ++------
 3 files changed, 48 insertions(+), 35 deletions(-)
diff --git a/compiler/rustc_mir_transform/src/jump_threading.rs b/compiler/rustc_mir_transform/src/jump_threading.rs
index 1831184aeda..0046d6d6941 100644
--- a/compiler/rustc_mir_transform/src/jump_threading.rs
+++ b/compiler/rustc_mir_transform/src/jump_threading.rs
@@ -26,11 +26,14 @@
 //! - bound the maximum depth by a constant `MAX_BACKTRACK`;
 //! - we only traverse `Goto` terminators.
 //!
+//! We try to avoid creating irreducible control-flow by not threading through a loop header.
+//!
 //! Likewise, applying the optimisation can create a lot of new MIR, so we bound the instruction
 //! cost by `MAX_COST`.
 
 use rustc_arena::DroplessArena;
 use rustc_data_structures::fx::FxHashSet;
+use rustc_index::bit_set::BitSet;
 use rustc_index::IndexVec;
 use rustc_middle::mir::visit::Visitor;
 use rustc_middle::mir::*;
@@ -58,14 +61,22 @@ fn run_pass(&self, tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
 
         let param_env = tcx.param_env_reveal_all_normalized(def_id);
         let map = Map::new(tcx, body, Some(MAX_PLACES));
+        let loop_headers = loop_headers(body);
 
         let arena = DroplessArena::default();
-        let mut finder =
-            TOFinder { tcx, param_env, body, arena: &arena, map: &map, opportunities: Vec::new() };
+        let mut finder = TOFinder {
+            tcx,
+            param_env,
+            body,
+            arena: &arena,
+            map: &map,
+            loop_headers: &loop_headers,
+            opportunities: Vec::new(),
+        };
 
         for (bb, bbdata) in body.basic_blocks.iter_enumerated() {
             debug!(?bb, term = ?bbdata.terminator());
-            if bbdata.is_cleanup {
+            if bbdata.is_cleanup || loop_headers.contains(bb) {
                 continue;
             }
             let Some((discr, targets)) = bbdata.terminator().kind.as_switch() else { continue };
@@ -108,6 +119,10 @@ fn run_pass(&self, tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
             return;
         }
 
+        // Verify that we do not thread through a loop header.
+        for to in opportunities.iter() {
+            assert!(to.chain.iter().all(|&block| !loop_headers.contains(block)));
+        }
         OpportunitySet::new(body, opportunities).apply(body);
     }
 }
@@ -125,6 +140,7 @@ struct TOFinder<'tcx, 'a> {
     param_env: ty::ParamEnv<'tcx>,
     body: &'a Body<'tcx>,
     map: &'a Map,
+    loop_headers: &'a BitSet<BasicBlock>,
     /// We use an arena to avoid cloning the slices when cloning `state`.
     arena: &'a DroplessArena,
     opportunities: Vec<ThreadingOpportunity>,
@@ -180,6 +196,11 @@ fn find_opportunity(
         mut cost: CostChecker<'_, 'tcx>,
         depth: usize,
     ) {
+        // Do not thread through loop headers.
+        if self.loop_headers.contains(bb) {
+            return;
+        }
+
         debug!(cost = ?cost.cost());
         for (statement_index, stmt) in
             self.body.basic_blocks[bb].statements.iter().enumerate().rev()
@@ -636,3 +657,21 @@ enum Update {
     Incr,
     Decr,
 }
+
+/// Compute the set of loop headers in the given body. We define a loop header as a block which has
+/// at least a predecessor which it dominates. This definition is only correct for reducible CFGs.
+/// But if the CFG is already irreducible, there is no point in trying much harder.
+/// is already irreducibl
+fn loop_headers(body: &Body<'_>) -> BitSet<BasicBlock> {
+    let mut loop_headers = BitSet::new_empty(body.basic_blocks.len());
+    let dominators = body.basic_blocks.dominators();
+    // Only visit reachable blocks.
+    for (bb, bbdata) in traversal::preorder(body) {
+        for succ in bbdata.terminator().successors() {
+            if dominators.dominates(succ, bb) {
+                loop_headers.insert(bb);
+            }
+        }
+    }
+    loop_headers
+}
diff --git a/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-abort.diff b/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-abort.diff
index bad733268a3..01bddc9a173 100644
--- a/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-abort.diff
+++ b/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-abort.diff
@@ -25,8 +25,7 @@
   
       bb1: {
           _4 = discriminant(_1);
--         switchInt(move _4) -> [0: bb4, 1: bb5, 2: bb6, 3: bb2, otherwise: bb3];
-+         goto -> bb2;
+          switchInt(move _4) -> [0: bb4, 1: bb5, 2: bb6, 3: bb2, otherwise: bb3];
       }
   
       bb2: {
@@ -46,8 +45,7 @@
           _1 = move _5;
           _3 = const ();
           StorageDead(_5);
--         goto -> bb1;
-+         goto -> bb8;
+          goto -> bb1;
       }
   
       bb5: {
@@ -56,8 +54,7 @@
           _1 = move _6;
           _3 = const ();
           StorageDead(_6);
--         goto -> bb1;
-+         goto -> bb9;
+          goto -> bb1;
       }
   
       bb6: {
@@ -72,16 +69,6 @@
 +     bb7: {
 +         _4 = discriminant(_1);
 +         goto -> bb4;
-+     }
-+ 
-+     bb8: {
-+         _4 = discriminant(_1);
-+         goto -> bb5;
-+     }
-+ 
-+     bb9: {
-+         _4 = discriminant(_1);
-+         goto -> bb6;
       }
   }
   
diff --git a/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-unwind.diff b/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-unwind.diff
index bad733268a3..01bddc9a173 100644
--- a/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-unwind.diff
+++ b/tests/mir-opt/jump_threading.dfa.JumpThreading.panic-unwind.diff
@@ -25,8 +25,7 @@
   
       bb1: {
           _4 = discriminant(_1);
--         switchInt(move _4) -> [0: bb4, 1: bb5, 2: bb6, 3: bb2, otherwise: bb3];
-+         goto -> bb2;
+          switchInt(move _4) -> [0: bb4, 1: bb5, 2: bb6, 3: bb2, otherwise: bb3];
       }
   
       bb2: {
@@ -46,8 +45,7 @@
           _1 = move _5;
           _3 = const ();
           StorageDead(_5);
--         goto -> bb1;
-+         goto -> bb8;
+          goto -> bb1;
       }
   
       bb5: {
@@ -56,8 +54,7 @@
           _1 = move _6;
           _3 = const ();
           StorageDead(_6);
--         goto -> bb1;
-+         goto -> bb9;
+          goto -> bb1;
       }
   
       bb6: {
@@ -72,16 +69,6 @@
 +     bb7: {
 +         _4 = discriminant(_1);
 +         goto -> bb4;
-+     }
-+ 
-+     bb8: {
-+         _4 = discriminant(_1);
-+         goto -> bb5;
-+     }
-+ 
-+     bb9: {
-+         _4 = discriminant(_1);
-+         goto -> bb6;
       }
   }