2020-10-04 15:52:14 +02:00
|
|
|
//! This pass finds basic blocks that are completely equal,
|
|
|
|
//! and replaces all uses with just one of them.
|
|
|
|
|
2021-03-08 15:32:41 -08:00
|
|
|
use std::{collections::hash_map::Entry, hash::Hash, hash::Hasher, iter};
|
2020-10-04 15:52:14 +02:00
|
|
|
|
2021-01-01 01:53:25 +01:00
|
|
|
use crate::MirPass;
|
2020-10-04 15:52:14 +02:00
|
|
|
|
|
|
|
use rustc_data_structures::fx::FxHashMap;
|
|
|
|
use rustc_middle::mir::visit::MutVisitor;
|
|
|
|
use rustc_middle::mir::*;
|
|
|
|
use rustc_middle::ty::TyCtxt;
|
|
|
|
|
|
|
|
use super::simplify::simplify_cfg;
|
|
|
|
|
|
|
|
/// MIR pass that looks for basic blocks which are equal to one another and
/// redirects every jump to a duplicate towards a single representative block.
pub struct DeduplicateBlocks;
|
|
|
|
|
|
|
|
impl<'tcx> MirPass<'tcx> for DeduplicateBlocks {
|
2021-12-02 09:17:32 -08:00
|
|
|
fn is_enabled(&self, sess: &rustc_session::Session) -> bool {
|
|
|
|
sess.mir_opt_level() >= 4
|
|
|
|
}
|
|
|
|
|
2020-10-04 15:52:14 +02:00
|
|
|
fn run_pass(&self, tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
|
|
|
|
debug!("Running DeduplicateBlocks on `{:?}`", body.source);
|
|
|
|
let duplicates = find_duplicates(body);
|
|
|
|
let has_opts_to_apply = !duplicates.is_empty();
|
|
|
|
|
|
|
|
if has_opts_to_apply {
|
|
|
|
let mut opt_applier = OptApplier { tcx, duplicates };
|
|
|
|
opt_applier.visit_body(body);
|
2021-05-01 14:56:48 -07:00
|
|
|
simplify_cfg(tcx, body);
|
2020-10-04 15:52:14 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
struct OptApplier<'tcx> {
|
|
|
|
tcx: TyCtxt<'tcx>,
|
|
|
|
duplicates: FxHashMap<BasicBlock, BasicBlock>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<'tcx> MutVisitor<'tcx> for OptApplier<'tcx> {
|
|
|
|
fn tcx(&self) -> TyCtxt<'tcx> {
|
|
|
|
self.tcx
|
|
|
|
}
|
|
|
|
|
|
|
|
fn visit_terminator(&mut self, terminator: &mut Terminator<'tcx>, location: Location) {
|
|
|
|
for target in terminator.successors_mut() {
|
|
|
|
if let Some(replacement) = self.duplicates.get(target) {
|
|
|
|
debug!("SUCCESS: Replacing: `{:?}` with `{:?}`", target, replacement);
|
|
|
|
*target = *replacement;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
self.super_terminator(terminator, location);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
fn find_duplicates(body: &Body<'_>) -> FxHashMap<BasicBlock, BasicBlock> {
|
2020-10-04 15:52:14 +02:00
|
|
|
let mut duplicates = FxHashMap::default();
|
|
|
|
|
|
|
|
let bbs_to_go_through =
|
2022-07-05 00:00:00 +00:00
|
|
|
body.basic_blocks.iter_enumerated().filter(|(_, bbd)| !bbd.is_cleanup).count();
|
2020-10-04 15:52:14 +02:00
|
|
|
|
|
|
|
let mut same_hashes =
|
|
|
|
FxHashMap::with_capacity_and_hasher(bbs_to_go_through, Default::default());
|
|
|
|
|
|
|
|
// Go through the basic blocks backwards. This means that in case of duplicates,
|
|
|
|
// we can use the basic block with the highest index as the replacement for all lower ones.
|
|
|
|
// For example, if bb1, bb2 and bb3 are duplicates, we will first insert bb3 in same_hashes.
|
|
|
|
// Then we will see that bb2 is a duplicate of bb3,
|
|
|
|
// and insert bb2 with the replacement bb3 in the duplicates list.
|
|
|
|
// When we see bb1, we see that it is a duplicate of bb3, and therefore insert it in the duplicates list
|
|
|
|
// with replacement bb3.
|
|
|
|
// When the duplicates are removed, we will end up with only bb3.
|
2022-07-05 00:00:00 +00:00
|
|
|
for (bb, bbd) in body.basic_blocks.iter_enumerated().rev().filter(|(_, bbd)| !bbd.is_cleanup) {
|
2020-10-04 15:52:14 +02:00
|
|
|
// Basic blocks can get really big, so to avoid checking for duplicates in basic blocks
|
|
|
|
// that are unlikely to have duplicates, we stop early. The early bail number has been
|
|
|
|
// found experimentally by eprintln while compiling the crates in the rustc-perf suite.
|
|
|
|
if bbd.statements.len() > 10 {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
let to_hash = BasicBlockHashable { basic_block_data: bbd };
|
|
|
|
let entry = same_hashes.entry(to_hash);
|
|
|
|
match entry {
|
|
|
|
Entry::Occupied(occupied) => {
|
|
|
|
// The basic block was already in the hashmap, which means we have a duplicate
|
|
|
|
let value = *occupied.get();
|
|
|
|
debug!("Inserting {:?} -> {:?}", bb, value);
|
2021-03-04 13:06:01 +01:00
|
|
|
duplicates.try_insert(bb, value).expect("key was already inserted");
|
2020-10-04 15:52:14 +02:00
|
|
|
}
|
|
|
|
Entry::Vacant(vacant) => {
|
|
|
|
vacant.insert(bb);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
duplicates
|
|
|
|
}
|
|
|
|
|
|
|
|
struct BasicBlockHashable<'tcx, 'a> {
|
|
|
|
basic_block_data: &'a BasicBlockData<'tcx>,
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
impl Hash for BasicBlockHashable<'_, '_> {
|
2020-10-04 15:52:14 +02:00
|
|
|
fn hash<H: Hasher>(&self, state: &mut H) {
|
|
|
|
hash_statements(state, self.basic_block_data.statements.iter());
|
|
|
|
// Note that since we only hash the kind, we lose span information if we deduplicate the blocks
|
|
|
|
self.basic_block_data.terminator().kind.hash(state);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
impl Eq for BasicBlockHashable<'_, '_> {}
|
2020-10-04 15:52:14 +02:00
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
impl PartialEq for BasicBlockHashable<'_, '_> {
|
2020-10-04 15:52:14 +02:00
|
|
|
fn eq(&self, other: &Self) -> bool {
|
|
|
|
self.basic_block_data.statements.len() == other.basic_block_data.statements.len()
|
|
|
|
&& &self.basic_block_data.terminator().kind == &other.basic_block_data.terminator().kind
|
2021-03-08 15:32:41 -08:00
|
|
|
&& iter::zip(&self.basic_block_data.statements, &other.basic_block_data.statements)
|
2020-10-04 15:52:14 +02:00
|
|
|
.all(|(x, y)| statement_eq(&x.kind, &y.kind))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn hash_statements<'a, 'tcx, H: Hasher>(
|
|
|
|
hasher: &mut H,
|
|
|
|
iter: impl Iterator<Item = &'a Statement<'tcx>>,
|
|
|
|
) where
|
|
|
|
'tcx: 'a,
|
|
|
|
{
|
|
|
|
for stmt in iter {
|
|
|
|
statement_hash(hasher, &stmt.kind);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
fn statement_hash<H: Hasher>(hasher: &mut H, stmt: &StatementKind<'_>) {
|
2020-10-04 15:52:14 +02:00
|
|
|
match stmt {
|
|
|
|
StatementKind::Assign(box (place, rvalue)) => {
|
|
|
|
place.hash(hasher);
|
|
|
|
rvalue_hash(hasher, rvalue)
|
|
|
|
}
|
|
|
|
x => x.hash(hasher),
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
fn rvalue_hash<H: Hasher>(hasher: &mut H, rvalue: &Rvalue<'_>) {
|
2020-10-04 15:52:14 +02:00
|
|
|
match rvalue {
|
|
|
|
Rvalue::Use(op) => operand_hash(hasher, op),
|
|
|
|
x => x.hash(hasher),
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
fn operand_hash<H: Hasher>(hasher: &mut H, operand: &Operand<'_>) {
|
2020-10-04 15:52:14 +02:00
|
|
|
match operand {
|
|
|
|
Operand::Constant(box Constant { user_ty: _, literal, span: _ }) => literal.hash(hasher),
|
|
|
|
x => x.hash(hasher),
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
|
|
|
fn statement_eq<'tcx>(lhs: &StatementKind<'tcx>, rhs: &StatementKind<'tcx>) -> bool {
|
|
|
|
let res = match (lhs, rhs) {
|
|
|
|
(
|
|
|
|
StatementKind::Assign(box (place, rvalue)),
|
|
|
|
StatementKind::Assign(box (place2, rvalue2)),
|
|
|
|
) => place == place2 && rvalue_eq(rvalue, rvalue2),
|
|
|
|
(x, y) => x == y,
|
|
|
|
};
|
|
|
|
debug!("statement_eq lhs: `{:?}` rhs: `{:?}` result: {:?}", lhs, rhs, res);
|
|
|
|
res
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
fn rvalue_eq<'tcx>(lhs: &Rvalue<'tcx>, rhs: &Rvalue<'tcx>) -> bool {
|
2020-10-04 15:52:14 +02:00
|
|
|
let res = match (lhs, rhs) {
|
|
|
|
(Rvalue::Use(op1), Rvalue::Use(op2)) => operand_eq(op1, op2),
|
|
|
|
(x, y) => x == y,
|
|
|
|
};
|
|
|
|
debug!("rvalue_eq lhs: `{:?}` rhs: `{:?}` result: {:?}", lhs, rhs, res);
|
|
|
|
res
|
|
|
|
}
|
|
|
|
|
2021-12-06 00:48:37 -08:00
|
|
|
fn operand_eq<'tcx>(lhs: &Operand<'tcx>, rhs: &Operand<'tcx>) -> bool {
|
2020-10-04 15:52:14 +02:00
|
|
|
let res = match (lhs, rhs) {
|
|
|
|
(
|
|
|
|
Operand::Constant(box Constant { user_ty: _, literal, span: _ }),
|
|
|
|
Operand::Constant(box Constant { user_ty: _, literal: literal2, span: _ }),
|
|
|
|
) => literal == literal2,
|
|
|
|
(x, y) => x == y,
|
|
|
|
};
|
|
|
|
debug!("operand_eq lhs: `{:?}` rhs: `{:?}` result: {:?}", lhs, rhs, res);
|
|
|
|
res
|
|
|
|
}
|