2018-04-25 19:30:39 +03:00
|
|
|
use rustc_target::spec::abi::{Abi};
|
2016-05-11 22:03:57 +02:00
|
|
|
use syntax::ast;
|
2019-05-08 13:21:18 +10:00
|
|
|
use syntax::symbol::sym;
|
2016-06-21 18:08:13 -04:00
|
|
|
use syntax_pos::Span;
|
2016-05-11 22:03:57 +02:00
|
|
|
|
|
|
|
use rustc::ty::{self, TyCtxt};
|
2019-03-17 10:36:10 +00:00
|
|
|
use rustc::hir::def_id::DefId;
|
2019-05-17 23:55:04 +02:00
|
|
|
use rustc::mir::{self, Body, Location};
|
Merge indexed_set.rs into bitvec.rs, and rename it bit_set.rs.
Currently we have two files implementing bitsets (and 2D bit matrices).
This commit combines them into one, taking the best features from each.
This involves renaming a lot of things. The high level changes are as
follows.
- bitvec.rs --> bit_set.rs
- indexed_set.rs --> (removed)
- BitArray + IdxSet --> BitSet (merged, see below)
- BitVector --> GrowableBitSet
- {,Sparse,Hybrid}IdxSet --> {,Sparse,Hybrid}BitSet
- BitMatrix --> BitMatrix
- SparseBitMatrix --> SparseBitMatrix
The changes within the bitset types themselves are as follows.
```
OLD OLD NEW
BitArray<C> IdxSet<T> BitSet<T>
-------- ------ ------
grow - grow
new - (remove)
new_empty new_empty new_empty
new_filled new_filled new_filled
- to_hybrid to_hybrid
clear clear clear
set_up_to set_up_to set_up_to
clear_above - clear_above
count - count
contains(T) contains(&T) contains(T)
contains_all - superset
is_empty - is_empty
insert(T) add(&T) insert(T)
insert_all - insert_all()
remove(T) remove(&T) remove(T)
words words words
words_mut words_mut words_mut
- overwrite overwrite
merge union union
- subtract subtract
- intersect intersect
iter iter iter
```
In general, when choosing names I went with:
- names that are more obvious (e.g. `BitSet` over `IdxSet`).
- names that are more like the Rust libraries (e.g. `T` over `C`,
`insert` over `add`);
- names that are more set-like (e.g. `union` over `merge`, `superset`
over `contains_all`, `domain_size` over `num_bits`).
Also, using `T` for index arguments seems more sensible than `&T` --
even though the latter is standard in Rust collection types -- because
indices are always copyable. It also results in fewer `&` and `*`
sigils in practice.
2018-09-14 15:07:25 +10:00
|
|
|
use rustc_data_structures::bit_set::BitSet;
|
2019-02-08 06:28:15 +09:00
|
|
|
use crate::transform::{MirPass, MirSource};
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2019-02-08 06:28:15 +09:00
|
|
|
use crate::dataflow::{do_dataflow, DebugFormatted};
|
|
|
|
use crate::dataflow::MoveDataParamEnv;
|
|
|
|
use crate::dataflow::BitDenotation;
|
|
|
|
use crate::dataflow::DataflowResults;
|
|
|
|
use crate::dataflow::{
|
|
|
|
DefinitelyInitializedPlaces, MaybeInitializedPlaces, MaybeUninitializedPlaces
|
|
|
|
};
|
|
|
|
use crate::dataflow::move_paths::{MovePathIndex, LookupResult};
|
|
|
|
use crate::dataflow::move_paths::{HasMoveData, MoveData};
|
|
|
|
use crate::dataflow;
|
2017-06-26 14:57:26 +02:00
|
|
|
|
2019-02-08 06:28:15 +09:00
|
|
|
use crate::dataflow::has_rustc_mir_with;
|
2017-06-26 14:57:26 +02:00
|
|
|
|
|
|
|
/// MIR pass that drives the `rustc_peek` dataflow sanity checks; all of its
/// behavior lives in its `MirPass` implementation.
pub struct SanityCheck;
|
|
|
|
|
|
|
|
impl MirPass for SanityCheck {
|
2019-06-12 00:11:55 +03:00
|
|
|
fn run_pass<'tcx>(&self, tcx: TyCtxt<'tcx, 'tcx>, src: MirSource<'tcx>, body: &mut Body<'tcx>) {
|
2019-02-03 11:51:07 +01:00
|
|
|
let def_id = src.def_id();
|
2019-05-08 13:21:18 +10:00
|
|
|
if !tcx.has_attr(def_id, sym::rustc_mir) {
|
2018-12-19 12:31:35 +02:00
|
|
|
debug!("skipping rustc_peek::SanityCheck on {}", tcx.def_path_str(def_id));
|
2017-06-26 14:57:26 +02:00
|
|
|
return;
|
|
|
|
} else {
|
2018-12-19 12:31:35 +02:00
|
|
|
debug!("running rustc_peek::SanityCheck on {}", tcx.def_path_str(def_id));
|
2017-06-26 14:57:26 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
let attributes = tcx.get_attrs(def_id);
|
|
|
|
let param_env = tcx.param_env(def_id);
|
2019-06-03 18:26:48 -04:00
|
|
|
let move_data = MoveData::gather_moves(body, tcx).unwrap();
|
2017-06-26 14:57:26 +02:00
|
|
|
let mdpe = MoveDataParamEnv { move_data: move_data, param_env: param_env };
|
2019-06-03 18:26:48 -04:00
|
|
|
let dead_unwinds = BitSet::new_empty(body.basic_blocks().len());
|
2017-06-26 14:57:26 +02:00
|
|
|
let flow_inits =
|
2019-06-03 18:26:48 -04:00
|
|
|
do_dataflow(tcx, body, def_id, &attributes, &dead_unwinds,
|
|
|
|
MaybeInitializedPlaces::new(tcx, body, &mdpe),
|
2017-11-24 13:00:09 +01:00
|
|
|
|bd, i| DebugFormatted::new(&bd.move_data().move_paths[i]));
|
2017-06-26 14:57:26 +02:00
|
|
|
let flow_uninits =
|
2019-06-03 18:26:48 -04:00
|
|
|
do_dataflow(tcx, body, def_id, &attributes, &dead_unwinds,
|
|
|
|
MaybeUninitializedPlaces::new(tcx, body, &mdpe),
|
2017-11-24 13:00:09 +01:00
|
|
|
|bd, i| DebugFormatted::new(&bd.move_data().move_paths[i]));
|
2017-06-26 14:57:26 +02:00
|
|
|
let flow_def_inits =
|
2019-06-03 18:26:48 -04:00
|
|
|
do_dataflow(tcx, body, def_id, &attributes, &dead_unwinds,
|
|
|
|
DefinitelyInitializedPlaces::new(tcx, body, &mdpe),
|
2017-11-24 13:00:09 +01:00
|
|
|
|bd, i| DebugFormatted::new(&bd.move_data().move_paths[i]));
|
2017-06-26 14:57:26 +02:00
|
|
|
|
2019-05-08 13:21:18 +10:00
|
|
|
if has_rustc_mir_with(&attributes, sym::rustc_peek_maybe_init).is_some() {
|
2019-06-03 18:26:48 -04:00
|
|
|
sanity_check_via_rustc_peek(tcx, body, def_id, &attributes, &flow_inits);
|
2017-06-26 14:57:26 +02:00
|
|
|
}
|
2019-05-08 13:21:18 +10:00
|
|
|
if has_rustc_mir_with(&attributes, sym::rustc_peek_maybe_uninit).is_some() {
|
2019-06-03 18:26:48 -04:00
|
|
|
sanity_check_via_rustc_peek(tcx, body, def_id, &attributes, &flow_uninits);
|
2017-06-26 14:57:26 +02:00
|
|
|
}
|
2019-05-08 13:21:18 +10:00
|
|
|
if has_rustc_mir_with(&attributes, sym::rustc_peek_definite_init).is_some() {
|
2019-06-03 18:26:48 -04:00
|
|
|
sanity_check_via_rustc_peek(tcx, body, def_id, &attributes, &flow_def_inits);
|
2017-06-26 14:57:26 +02:00
|
|
|
}
|
2019-05-08 13:21:18 +10:00
|
|
|
if has_rustc_mir_with(&attributes, sym::stop_after_dataflow).is_some() {
|
2017-06-26 14:57:26 +02:00
|
|
|
tcx.sess.fatal("stop_after_dataflow ended compilation");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2016-05-17 08:37:36 +02:00
|
|
|
/// This function scans `mir` for all calls to the intrinsic
|
|
|
|
/// `rustc_peek` that have the expression form `rustc_peek(&expr)`.
|
|
|
|
///
|
|
|
|
/// For each such call, determines what the dataflow bit-state is for
|
|
|
|
/// the L-value corresponding to `expr`; if the bit-state is a 1, then
|
|
|
|
/// that call to `rustc_peek` is ignored by the sanity check. If the
|
|
|
|
/// bit-state is a 0, then this pass emits a error message saying
|
|
|
|
/// "rustc_peek: bit not set".
|
|
|
|
///
|
|
|
|
/// The intention is that one can write unit tests for dataflow by
|
|
|
|
/// putting code into a compile-fail test and using `rustc_peek` to
|
|
|
|
/// make observations about the results of dataflow static analyses.
|
|
|
|
///
|
|
|
|
/// (If there are any calls to `rustc_peek` that do not match the
|
|
|
|
/// expression form above, then that emits an error as well, but those
|
|
|
|
/// errors are not intended to be used for unit tests.)
|
2019-06-12 00:11:55 +03:00
|
|
|
pub fn sanity_check_via_rustc_peek<'tcx, O>(
|
|
|
|
tcx: TyCtxt<'tcx, 'tcx>,
|
|
|
|
body: &Body<'tcx>,
|
|
|
|
def_id: DefId,
|
|
|
|
_attributes: &[ast::Attribute],
|
|
|
|
results: &DataflowResults<'tcx, O>,
|
|
|
|
) where
|
|
|
|
O: BitDenotation<'tcx, Idx = MovePathIndex> + HasMoveData<'tcx>,
|
2016-05-11 22:03:57 +02:00
|
|
|
{
|
2019-03-17 10:36:10 +00:00
|
|
|
debug!("sanity_check_via_rustc_peek def_id: {:?}", def_id);
|
2016-05-11 22:03:57 +02:00
|
|
|
// FIXME: this is not DRY. Figure out way to abstract this and
|
2016-05-17 08:37:36 +02:00
|
|
|
// `dataflow::build_sets`. (But note it is doing non-standard
|
|
|
|
// stuff, so such generalization may not be realistic.)
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2019-06-03 18:26:48 -04:00
|
|
|
for bb in body.basic_blocks().indices() {
|
|
|
|
each_block(tcx, body, results, bb);
|
2016-05-24 12:56:02 +02:00
|
|
|
}
|
|
|
|
}
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2019-06-12 00:11:55 +03:00
|
|
|
fn each_block<'tcx, O>(
|
|
|
|
tcx: TyCtxt<'tcx, 'tcx>,
|
|
|
|
body: &Body<'tcx>,
|
|
|
|
results: &DataflowResults<'tcx, O>,
|
|
|
|
bb: mir::BasicBlock,
|
|
|
|
) where
|
|
|
|
O: BitDenotation<'tcx, Idx = MovePathIndex> + HasMoveData<'tcx>,
|
2016-05-24 12:56:02 +02:00
|
|
|
{
|
2016-12-26 09:40:15 -05:00
|
|
|
let move_data = results.0.operator.move_data();
|
2019-06-03 18:26:48 -04:00
|
|
|
let mir::BasicBlockData { ref statements, ref terminator, is_cleanup: _ } = body[bb];
|
2016-05-24 12:56:02 +02:00
|
|
|
|
|
|
|
let (args, span) = match is_rustc_peek(tcx, terminator) {
|
|
|
|
Some(args_and_span) => args_and_span,
|
|
|
|
None => return,
|
|
|
|
};
|
|
|
|
assert!(args.len() == 1);
|
2017-12-01 14:39:51 +02:00
|
|
|
let peek_arg_place = match args[0] {
|
2019-02-22 05:24:03 +01:00
|
|
|
mir::Operand::Copy(ref place @ mir::Place::Base(mir::PlaceBase::Local(_))) |
|
|
|
|
mir::Operand::Move(ref place @ mir::Place::Base(mir::PlaceBase::Local(_))) => Some(place),
|
2016-09-27 00:24:49 +02:00
|
|
|
_ => None,
|
2016-09-25 01:38:27 +02:00
|
|
|
};
|
|
|
|
|
2017-12-01 14:39:51 +02:00
|
|
|
let peek_arg_place = match peek_arg_place {
|
2016-09-25 01:38:27 +02:00
|
|
|
Some(arg) => arg,
|
|
|
|
None => {
|
2016-05-24 12:56:02 +02:00
|
|
|
tcx.sess.diagnostic().span_err(
|
|
|
|
span, "dataflow::sanity_check cannot feed a non-temp to rustc_peek.");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
};
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2018-08-14 10:21:24 +10:00
|
|
|
let mut on_entry = results.0.sets.on_entry_set_for(bb.index()).to_owned();
|
|
|
|
let mut gen_set = results.0.sets.gen_set_for(bb.index()).clone();
|
|
|
|
let mut kill_set = results.0.sets.kill_set_for(bb.index()).clone();
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2016-05-24 12:56:02 +02:00
|
|
|
// Emulate effect of all statements in the block up to (but not
|
2017-12-01 14:39:51 +02:00
|
|
|
// including) the borrow within `peek_arg_place`. Do *not* include
|
|
|
|
// call to `peek_arg_place` itself (since we are peeking the state
|
2016-05-24 12:56:02 +02:00
|
|
|
// of the argument at time immediate preceding Call to
|
|
|
|
// `rustc_peek`).
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2018-08-14 10:21:24 +10:00
|
|
|
let mut sets = dataflow::BlockSets { on_entry: &mut on_entry,
|
|
|
|
gen_set: &mut gen_set,
|
|
|
|
kill_set: &mut kill_set };
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2016-05-24 12:56:02 +02:00
|
|
|
for (j, stmt) in statements.iter().enumerate() {
|
|
|
|
debug!("rustc_peek: ({:?},{}) {:?}", bb, j, stmt);
|
2017-12-01 14:39:51 +02:00
|
|
|
let (place, rvalue) = match stmt.kind {
|
|
|
|
mir::StatementKind::Assign(ref place, ref rvalue) => {
|
|
|
|
(place, rvalue)
|
2016-05-24 12:56:02 +02:00
|
|
|
}
|
2018-09-14 21:05:31 +02:00
|
|
|
mir::StatementKind::FakeRead(..) |
|
2016-09-19 23:50:00 +03:00
|
|
|
mir::StatementKind::StorageLive(_) |
|
|
|
|
mir::StatementKind::StorageDead(_) |
|
2017-02-15 21:21:36 +02:00
|
|
|
mir::StatementKind::InlineAsm { .. } |
|
2018-10-24 11:47:17 +02:00
|
|
|
mir::StatementKind::Retag { .. } |
|
2018-08-31 18:59:35 -04:00
|
|
|
mir::StatementKind::AscribeUserType(..) |
|
2016-09-19 23:50:00 +03:00
|
|
|
mir::StatementKind::Nop => continue,
|
|
|
|
mir::StatementKind::SetDiscriminant{ .. } =>
|
2016-08-04 16:14:33 -07:00
|
|
|
span_bug!(stmt.source_info.span,
|
|
|
|
"sanity_check should run before Deaggregator inserts SetDiscriminant"),
|
2016-05-24 12:56:02 +02:00
|
|
|
};
|
2016-05-11 22:03:57 +02:00
|
|
|
|
2017-12-01 14:39:51 +02:00
|
|
|
if place == peek_arg_place {
|
2018-09-24 11:32:31 +10:00
|
|
|
if let mir::Rvalue::Ref(_, mir::BorrowKind::Shared, ref peeking_at_place) = **rvalue {
|
2016-05-24 12:56:02 +02:00
|
|
|
// Okay, our search is over.
|
2017-12-01 14:39:51 +02:00
|
|
|
match move_data.rev_lookup.find(peeking_at_place) {
|
2016-06-11 23:47:28 +03:00
|
|
|
LookupResult::Exact(peek_mpi) => {
|
Merge indexed_set.rs into bitvec.rs, and rename it bit_set.rs.
Currently we have two files implementing bitsets (and 2D bit matrices).
This commit combines them into one, taking the best features from each.
This involves renaming a lot of things. The high level changes are as
follows.
- bitvec.rs --> bit_set.rs
- indexed_set.rs --> (removed)
- BitArray + IdxSet --> BitSet (merged, see below)
- BitVector --> GrowableBitSet
- {,Sparse,Hybrid}IdxSet --> {,Sparse,Hybrid}BitSet
- BitMatrix --> BitMatrix
- SparseBitMatrix --> SparseBitMatrix
The changes within the bitset types themselves are as follows.
```
OLD OLD NEW
BitArray<C> IdxSet<T> BitSet<T>
-------- ------ ------
grow - grow
new - (remove)
new_empty new_empty new_empty
new_filled new_filled new_filled
- to_hybrid to_hybrid
clear clear clear
set_up_to set_up_to set_up_to
clear_above - clear_above
count - count
contains(T) contains(&T) contains(T)
contains_all - superset
is_empty - is_empty
insert(T) add(&T) insert(T)
insert_all - insert_all()
remove(T) remove(&T) remove(T)
words words words
words_mut words_mut words_mut
- overwrite overwrite
merge union union
- subtract subtract
- intersect intersect
iter iter iter
```
In general, when choosing names I went with:
- names that are more obvious (e.g. `BitSet` over `IdxSet`).
- names that are more like the Rust libraries (e.g. `T` over `C`,
`insert` over `add`);
- names that are more set-like (e.g. `union` over `merge`, `superset`
over `contains_all`, `domain_size` over `num_bits`).
Also, using `T` for index arguments seems more sensible than `&T` --
even though the latter is standard in Rust collection types -- because
indices are always copyable. It also results in fewer `&` and `*`
sigils in practice.
2018-09-14 15:07:25 +10:00
|
|
|
let bit_state = sets.on_entry.contains(peek_mpi);
|
2016-06-11 23:47:28 +03:00
|
|
|
debug!("rustc_peek({:?} = &{:?}) bit_state: {}",
|
2017-12-01 14:39:51 +02:00
|
|
|
place, peeking_at_place, bit_state);
|
2016-06-11 23:47:28 +03:00
|
|
|
if !bit_state {
|
|
|
|
tcx.sess.span_err(span, "rustc_peek: bit not set");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
LookupResult::Parent(..) => {
|
|
|
|
tcx.sess.span_err(span, "rustc_peek: argument untracked");
|
|
|
|
}
|
2016-05-24 12:56:02 +02:00
|
|
|
}
|
|
|
|
return;
|
|
|
|
} else {
|
|
|
|
// Our search should have been over, but the input
|
|
|
|
// does not match expectations of `rustc_peek` for
|
|
|
|
// this sanity_check.
|
2016-06-11 23:47:28 +03:00
|
|
|
let msg = "rustc_peek: argument expression \
|
|
|
|
must be immediate borrow of form `&expr`";
|
2016-05-24 12:56:02 +02:00
|
|
|
tcx.sess.span_err(span, msg);
|
|
|
|
}
|
2016-05-11 22:03:57 +02:00
|
|
|
}
|
2016-05-24 23:03:52 +02:00
|
|
|
|
2017-12-01 14:39:51 +02:00
|
|
|
let lhs_mpi = move_data.rev_lookup.find(place);
|
2016-05-24 12:56:02 +02:00
|
|
|
|
2017-12-01 14:39:51 +02:00
|
|
|
debug!("rustc_peek: computing effect on place: {:?} ({:?}) in stmt: {:?}",
|
|
|
|
place, lhs_mpi, stmt);
|
2016-05-24 12:56:02 +02:00
|
|
|
// reset GEN and KILL sets before emulating their effect.
|
2018-08-14 10:21:24 +10:00
|
|
|
sets.gen_set.clear();
|
|
|
|
sets.kill_set.clear();
|
2017-12-24 00:45:53 +02:00
|
|
|
results.0.operator.before_statement_effect(
|
|
|
|
&mut sets, Location { block: bb, statement_index: j });
|
|
|
|
results.0.operator.statement_effect(
|
|
|
|
&mut sets, Location { block: bb, statement_index: j });
|
2018-08-20 15:34:08 +10:00
|
|
|
sets.on_entry.union(sets.gen_set);
|
|
|
|
sets.on_entry.subtract(sets.kill_set);
|
2016-05-11 22:03:57 +02:00
|
|
|
}
|
2016-05-20 13:18:03 +02:00
|
|
|
|
2017-12-24 00:45:53 +02:00
|
|
|
results.0.operator.before_terminator_effect(
|
|
|
|
&mut sets,
|
|
|
|
Location { block: bb, statement_index: statements.len() });
|
|
|
|
|
2016-05-24 12:56:02 +02:00
|
|
|
tcx.sess.span_err(span, &format!("rustc_peek: MIR did not match \
|
|
|
|
anticipated pattern; note that \
|
|
|
|
rustc_peek expects input of \
|
|
|
|
form `&expr`"));
|
2016-05-20 13:18:03 +02:00
|
|
|
}
|
|
|
|
|
2019-06-12 00:11:55 +03:00
|
|
|
fn is_rustc_peek<'a, 'tcx>(
|
|
|
|
tcx: TyCtxt<'tcx, 'tcx>,
|
|
|
|
terminator: &'a Option<mir::Terminator<'tcx>>,
|
|
|
|
) -> Option<(&'a [mir::Operand<'tcx>], Span)> {
|
2016-09-19 23:50:00 +03:00
|
|
|
if let Some(mir::Terminator { ref kind, source_info, .. }) = *terminator {
|
2017-05-13 17:11:52 +03:00
|
|
|
if let mir::TerminatorKind::Call { func: ref oper, ref args, .. } = *kind {
|
|
|
|
if let mir::Operand::Constant(ref func) = *oper {
|
2018-08-22 01:35:02 +01:00
|
|
|
if let ty::FnDef(def_id, _) = func.ty.sty {
|
2017-05-13 17:11:52 +03:00
|
|
|
let abi = tcx.fn_sig(def_id).abi();
|
2016-05-20 13:18:03 +02:00
|
|
|
let name = tcx.item_name(def_id);
|
2019-05-15 06:32:44 +10:00
|
|
|
if abi == Abi::RustIntrinsic && name == sym::rustc_peek {
|
2017-05-13 17:11:52 +03:00
|
|
|
return Some((args, source_info.span));
|
2016-05-20 13:18:03 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return None;
|
2016-05-11 22:03:57 +02:00
|
|
|
}
|