rust/src/machine.rs

438 lines
14 KiB
Rust
Raw Normal View History

2019-06-29 07:15:05 -05:00
//! Global machine state as well as implementation of the interpreter engine
//! `Machine` trait.
use std::borrow::Cow;
use std::cell::RefCell;
2019-10-07 08:39:59 -05:00
use std::rc::Rc;
use rand::rngs::StdRng;
2020-01-06 13:53:41 -06:00
use rustc_hir::def_id::DefId;
use rustc::mir;
2019-12-23 05:56:23 -06:00
use rustc::ty::{
self,
layout::{LayoutOf, Size},
Ty, TyCtxt,
};
2020-01-05 02:53:45 -06:00
use rustc_span::{source_map::Span, symbol::sym};
use syntax::attr;
use crate::*;
2019-06-29 07:37:41 -05:00
// Some global facts about the emulated machine.

/// Page size of the emulated machine (4 KiB).
pub const PAGE_SIZE: u64 = 4 * 1024; // FIXME: adjust to target architecture
/// Not really about the "stack", but where we start assigning integer addresses to allocations.
pub const STACK_ADDR: u64 = 32 * PAGE_SIZE;
/// Stack size of the emulated machine; the exact value is arbitrary.
pub const STACK_SIZE: u64 = 16 * PAGE_SIZE;
/// Number of CPUs of the emulated machine.
pub const NUM_CPUS: u64 = 1;
/// Extra data stored with each stack frame
#[derive(Debug)]
pub struct FrameData<'tcx> {
/// Extra data for Stacked Borrows.
pub call_id: stacked_borrows::CallId,
2019-11-19 07:51:08 -06:00
/// If this is Some(), then this is a special "catch unwind" frame (the frame of the closure
/// called by `__rustc_maybe_catch_panic`). When this frame is popped during unwinding a panic,
/// we stop unwinding, use the `CatchUnwindData` to
/// store the panic payload, and continue execution in the parent frame.
pub catch_panic: Option<CatchUnwindData<'tcx>>,
}
/// Extra memory kinds.
///
/// These are the Miri-specific kinds of memory; they are wrapped into the interpreter's
/// `MemoryKind::Machine` variant when handed to the engine.
#[derive(Debug, Copy, Clone, PartialEq, Eq)]
pub enum MiriMemoryKind {
    /// `__rust_alloc` memory.
    Rust,
    /// `malloc` memory.
    C,
    /// Windows `HeapAlloc` memory.
    WinHeap,
    /// Memory for env vars and args, errno and other parts of the machine-managed environment.
    Env,
    /// Rust statics.
    Static,
}
/// Wraps a Miri memory kind into the interpreter's generic `MemoryKind`.
///
/// Implemented as `From` rather than `Into`: the standard library's blanket impl then provides
/// the matching `Into`, so existing `kind.into()` call sites keep working unchanged.
impl From<MiriMemoryKind> for MemoryKind<MiriMemoryKind> {
    #[inline(always)]
    fn from(kind: MiriMemoryKind) -> MemoryKind<MiriMemoryKind> {
        MemoryKind::Machine(kind)
    }
}
/// Extra per-allocation data.
#[derive(Clone, Debug)]
pub struct AllocExtra {
    /// Stacked Borrows state for this allocation.
    /// This is only present (`Some`) if validation is enabled.
    pub stacked_borrows: Option<stacked_borrows::AllocExtra>,
}
/// Extra global memory data
#[derive(Clone, Debug)]
pub struct MemoryExtra {
pub stacked_borrows: stacked_borrows::MemoryExtra,
pub intptrcast: intptrcast::MemoryExtra,
2019-07-23 14:38:53 -05:00
/// The random number generator used for resolving non-determinism.
pub(crate) rng: RefCell<StdRng>,
/// Whether to enforce the validity invariant.
pub(crate) validate: bool,
}
impl MemoryExtra {
2019-11-30 17:02:58 -06:00
pub fn new(rng: StdRng, validate: bool, tracked_pointer_tag: Option<PtrId>) -> Self {
MemoryExtra {
2019-11-30 17:02:58 -06:00
stacked_borrows: Rc::new(RefCell::new(GlobalState::new(tracked_pointer_tag))),
intptrcast: Default::default(),
2019-07-23 14:38:53 -05:00
rng: RefCell::new(rng),
validate,
}
}
}
/// The machine itself.
pub struct Evaluator<'tcx> {
/// Environment variables set by `setenv`.
/// Miri does not expose env vars from the host to the emulated program.
2019-08-14 10:24:35 -05:00
pub(crate) env_vars: EnvVars,
/// Program arguments (`Option` because we can only initialize them after creating the ecx).
/// These are *pointers* to argc/argv because macOS.
/// We also need the full command line as one string because of Windows.
2019-11-02 05:50:21 -05:00
pub(crate) argc: Option<Scalar<Tag>>,
pub(crate) argv: Option<Scalar<Tag>>,
pub(crate) cmd_line: Option<Scalar<Tag>>,
/// Last OS error location in memory. It is a 32-bit integer.
2019-10-12 20:58:02 -05:00
pub(crate) last_error: Option<MPlaceTy<'tcx, Tag>>,
/// TLS state.
pub(crate) tls: TlsData<'tcx>,
/// If enabled, the `env_vars` field is populated with the host env vars during initialization
/// and random number generation is delegated to the host.
pub(crate) communicate: bool,
2019-09-24 17:28:00 -05:00
pub(crate) file_handler: FileHandler,
/// The temporary used for storing the argument of
/// the call to `miri_start_panic` (the panic payload) when unwinding.
2019-12-23 05:56:23 -06:00
pub(crate) panic_payload: Option<ImmTy<'tcx, Tag>>,
}
impl<'tcx> Evaluator<'tcx> {
pub(crate) fn new(communicate: bool) -> Self {
Evaluator {
2019-08-13 16:17:41 -05:00
// `env_vars` could be initialized properly here if `Memory` were available before
// calling this method.
2019-08-14 10:24:35 -05:00
env_vars: EnvVars::default(),
argc: None,
argv: None,
cmd_line: None,
2019-10-03 10:21:55 -05:00
last_error: None,
tls: TlsData::default(),
communicate,
2019-09-24 17:28:00 -05:00
file_handler: Default::default(),
2019-12-23 05:56:23 -06:00
panic_payload: None,
}
}
}
2019-07-05 16:47:10 -05:00
/// A rustc `InterpCx` for Miri, i.e. the interpreter context instantiated with
/// Miri's `Evaluator` as its machine.
pub type MiriEvalContext<'mir, 'tcx> = InterpCx<'mir, 'tcx, Evaluator<'tcx>>;
/// A little trait that's useful to be inherited by extension traits.
pub trait MiriEvalContextExt<'mir, 'tcx> {
    /// Gives shared access to the Miri evaluation context.
    fn eval_context_ref(&self) -> &MiriEvalContext<'mir, 'tcx>;

    /// Gives exclusive access to the Miri evaluation context.
    fn eval_context_mut(&mut self) -> &mut MiriEvalContext<'mir, 'tcx>;
}
/// The evaluation context trivially provides access to itself.
impl<'mir, 'tcx> MiriEvalContextExt<'mir, 'tcx> for MiriEvalContext<'mir, 'tcx> {
    /// Returns `self` unchanged.
    #[inline(always)]
    fn eval_context_ref(&self) -> &MiriEvalContext<'mir, 'tcx> {
        self
    }

    /// Returns `self` unchanged.
    #[inline(always)]
    fn eval_context_mut(&mut self) -> &mut MiriEvalContext<'mir, 'tcx> {
        self
    }
}
/// Machine hook implementations.
impl<'mir, 'tcx> Machine<'mir, 'tcx> for Evaluator<'tcx> {
type MemoryKinds = MiriMemoryKind;
type FrameExtra = FrameData<'tcx>;
type MemoryExtra = MemoryExtra;
type AllocExtra = AllocExtra;
type PointerTag = Tag;
type ExtraFnVal = Dlsym;
2019-12-23 05:56:23 -06:00
type MemoryMap =
MonoHashMap<AllocId, (MemoryKind<MiriMemoryKind>, Allocation<Tag, Self::AllocExtra>)>;
const STATIC_KIND: Option<MiriMemoryKind> = Some(MiriMemoryKind::Static);
2019-08-05 08:49:19 -05:00
const CHECK_ALIGN: bool = true;
#[inline(always)]
2019-07-05 16:47:10 -05:00
fn enforce_validity(ecx: &InterpCx<'mir, 'tcx, Self>) -> bool {
2019-10-17 21:11:50 -05:00
ecx.memory.extra.validate
}
#[inline(always)]
2019-12-04 16:31:39 -06:00
fn find_mir_or_eval_fn(
2019-07-05 16:47:10 -05:00
ecx: &mut InterpCx<'mir, 'tcx, Self>,
_span: Span,
instance: ty::Instance<'tcx>,
args: &[OpTy<'tcx, Tag>],
2019-11-25 15:48:31 -06:00
ret: Option<(PlaceTy<'tcx, Tag>, mir::BasicBlock)>,
unwind: Option<mir::BasicBlock>,
) -> InterpResult<'tcx, Option<&'mir mir::Body<'tcx>>> {
2019-12-04 16:31:39 -06:00
ecx.find_mir_or_eval_fn(instance, args, ret, unwind)
}
#[inline(always)]
fn call_extra_fn(
ecx: &mut InterpCx<'mir, 'tcx, Self>,
fn_val: Dlsym,
args: &[OpTy<'tcx, Tag>],
2019-11-25 15:48:31 -06:00
ret: Option<(PlaceTy<'tcx, Tag>, mir::BasicBlock)>,
_unwind: Option<mir::BasicBlock>,
) -> InterpResult<'tcx> {
2019-11-25 15:48:31 -06:00
ecx.call_dlsym(fn_val, args, ret)
}
#[inline(always)]
fn call_intrinsic(
2019-07-05 16:47:10 -05:00
ecx: &mut rustc_mir::interpret::InterpCx<'mir, 'tcx, Self>,
2019-10-30 04:16:58 -05:00
span: Span,
instance: ty::Instance<'tcx>,
args: &[OpTy<'tcx, Tag>],
2019-11-25 15:48:31 -06:00
ret: Option<(PlaceTy<'tcx, Tag>, mir::BasicBlock)>,
unwind: Option<mir::BasicBlock>,
) -> InterpResult<'tcx> {
2019-11-25 15:48:31 -06:00
ecx.call_intrinsic(span, instance, args, ret, unwind)
}
#[inline(always)]
fn assert_panic(
ecx: &mut InterpCx<'mir, 'tcx, Self>,
span: Span,
2020-02-13 07:01:35 -06:00
msg: &mir::AssertMessage<'tcx>,
unwind: Option<mir::BasicBlock>,
) -> InterpResult<'tcx> {
ecx.assert_panic(span, msg, unwind)
}
#[inline(always)]
fn binary_ptr_op(
2019-07-05 16:47:10 -05:00
ecx: &rustc_mir::interpret::InterpCx<'mir, 'tcx, Self>,
bin_op: mir::BinOp,
left: ImmTy<'tcx, Tag>,
right: ImmTy<'tcx, Tag>,
2019-08-10 14:19:25 -05:00
) -> InterpResult<'tcx, (Scalar<Tag>, bool, Ty<'tcx>)> {
ecx.binary_ptr_op(bin_op, left, right)
}
fn box_alloc(
2019-07-05 16:47:10 -05:00
ecx: &mut InterpCx<'mir, 'tcx, Self>,
dest: PlaceTy<'tcx, Tag>,
) -> InterpResult<'tcx> {
trace!("box_alloc for {:?}", dest.layout.ty);
let layout = ecx.layout_of(dest.layout.ty.builtin_deref(false).unwrap().ty)?;
// First argument: `size`.
// (`0` is allowed here -- this is expected to be handled by the lang item).
let size = Scalar::from_uint(layout.size.bytes(), ecx.pointer_size());
// Second argument: `align`.
let align = Scalar::from_uint(layout.align.abi.bytes(), ecx.pointer_size());
// Call the `exchange_malloc` lang item.
let malloc = ecx.tcx.lang_items().exchange_malloc_fn().unwrap();
let malloc = ty::Instance::mono(ecx.tcx.tcx, malloc);
ecx.call_function(
malloc,
&[size.into(), align.into()],
Some(dest),
// Don't do anything when we are done. The `statement()` function will increment
// the old stack frame's stmt counter to the next statement, which means that when
// `exchange_malloc` returns, we go on evaluating exactly where we want to be.
StackPopCleanup::None { cleanup: true },
)?;
Ok(())
}
fn find_foreign_static(
tcx: TyCtxt<'tcx>,
def_id: DefId,
) -> InterpResult<'tcx, Cow<'tcx, Allocation>> {
let attrs = tcx.get_attrs(def_id);
let link_name = match attr::first_attr_value_str_by_name(&attrs, sym::link_name) {
Some(name) => name.as_str(),
None => tcx.item_name(def_id).as_str(),
};
2019-09-05 11:17:58 -05:00
let alloc = match &*link_name {
"__cxa_thread_atexit_impl" => {
// This should be all-zero, pointer-sized.
let size = tcx.data_layout.pointer_size;
let data = vec![0; size.bytes() as usize];
Allocation::from_bytes(&data, tcx.data_layout.pointer_align.abi)
}
2019-08-03 13:31:33 -05:00
_ => throw_unsup_format!("can't access foreign static: {}", link_name),
};
Ok(Cow::Owned(alloc))
}
#[inline(always)]
2019-10-07 08:39:59 -05:00
fn before_terminator(_ecx: &mut InterpCx<'mir, 'tcx, Self>) -> InterpResult<'tcx> {
// We are not interested in detecting loops.
Ok(())
}
2019-11-29 12:50:37 -06:00
fn init_allocation_extra<'b>(
memory_extra: &MemoryExtra,
id: AllocId,
alloc: Cow<'b, Allocation>,
kind: Option<MemoryKind<Self::MemoryKinds>>,
2019-12-01 03:18:41 -06:00
) -> (Cow<'b, Allocation<Self::PointerTag, Self::AllocExtra>>, Self::PointerTag) {
let kind = kind.expect("we set our STATIC_KIND so this cannot be None");
let alloc = alloc.into_owned();
2019-12-01 03:18:41 -06:00
let (stacks, base_tag) = if memory_extra.validate {
let (stacks, base_tag) = Stacks::new_allocation(
id,
2019-09-05 11:17:58 -05:00
alloc.size,
Rc::clone(&memory_extra.stacked_borrows),
kind,
2019-12-01 03:18:41 -06:00
);
(Some(stacks), base_tag)
2019-11-29 12:50:37 -06:00
} else {
2019-12-01 03:18:41 -06:00
// No stacks, no tag.
(None, Tag::Untagged)
};
let mut stacked_borrows = memory_extra.stacked_borrows.borrow_mut();
2019-09-17 05:30:14 -05:00
let alloc: Allocation<Tag, Self::AllocExtra> = alloc.with_tags_and_extra(
2019-10-07 08:39:59 -05:00
|alloc| {
if !memory_extra.validate {
Tag::Untagged
} else {
// Only statics may already contain pointers at this point
assert_eq!(kind, MiriMemoryKind::Static.into());
stacked_borrows.static_base_ptr(alloc)
}
2019-09-05 11:17:58 -05:00
},
2019-12-23 05:56:23 -06:00
AllocExtra { stacked_borrows: stacks },
2019-09-05 11:17:58 -05:00
);
2019-12-01 03:18:41 -06:00
(Cow::Owned(alloc), base_tag)
}
#[inline(always)]
2019-10-07 08:39:59 -05:00
fn tag_static_base_pointer(memory_extra: &MemoryExtra, id: AllocId) -> Self::PointerTag {
if !memory_extra.validate {
Tag::Untagged
} else {
2019-12-23 05:56:23 -06:00
memory_extra.stacked_borrows.borrow_mut().static_base_ptr(id)
}
}
#[inline(always)]
fn retag(
2019-07-05 16:47:10 -05:00
ecx: &mut InterpCx<'mir, 'tcx, Self>,
kind: mir::RetagKind,
place: PlaceTy<'tcx, Tag>,
) -> InterpResult<'tcx> {
if !Self::enforce_validity(ecx) {
// No tracking.
2019-10-07 08:39:59 -05:00
Ok(())
} else {
ecx.retag(kind, place)
}
}
#[inline(always)]
2019-12-23 05:56:23 -06:00
fn stack_push(ecx: &mut InterpCx<'mir, 'tcx, Self>) -> InterpResult<'tcx, FrameData<'tcx>> {
Ok(FrameData {
call_id: ecx.memory.extra.stacked_borrows.borrow_mut().new_call(),
catch_panic: None,
})
}
#[inline(always)]
fn stack_pop(
2019-07-05 16:47:10 -05:00
ecx: &mut InterpCx<'mir, 'tcx, Self>,
extra: FrameData<'tcx>,
2019-12-23 05:56:23 -06:00
unwinding: bool,
) -> InterpResult<'tcx, StackPopInfo> {
ecx.handle_stack_pop(extra, unwinding)
}
2019-07-23 14:38:53 -05:00
#[inline(always)]
fn int_to_ptr(
memory: &Memory<'mir, 'tcx, Self>,
int: u64,
) -> InterpResult<'tcx, Pointer<Self::PointerTag>> {
2019-07-23 14:38:53 -05:00
intptrcast::GlobalState::int_to_ptr(int, memory)
}
2019-07-23 14:38:53 -05:00
#[inline(always)]
fn ptr_to_int(
memory: &Memory<'mir, 'tcx, Self>,
ptr: Pointer<Self::PointerTag>,
) -> InterpResult<'tcx, u64> {
2019-07-23 14:38:53 -05:00
intptrcast::GlobalState::ptr_to_int(ptr, memory)
}
}
/// Memory access hooks: each access is reported to the allocation's Stacked Borrows state
/// if there is one, and is a no-op otherwise.
impl AllocationExtra<Tag> for AllocExtra {
    /// Hook for reads of `size` bytes starting at `ptr`.
    #[inline(always)]
    fn memory_read<'tcx>(
        alloc: &Allocation<Tag, AllocExtra>,
        ptr: Pointer<Tag>,
        size: Size,
    ) -> InterpResult<'tcx> {
        match &alloc.extra.stacked_borrows {
            Some(stacks) => stacks.memory_read(ptr, size),
            None => Ok(()),
        }
    }

    /// Hook for writes of `size` bytes starting at `ptr`.
    #[inline(always)]
    fn memory_written<'tcx>(
        alloc: &mut Allocation<Tag, AllocExtra>,
        ptr: Pointer<Tag>,
        size: Size,
    ) -> InterpResult<'tcx> {
        match &mut alloc.extra.stacked_borrows {
            Some(stacks) => stacks.memory_written(ptr, size),
            None => Ok(()),
        }
    }

    /// Hook for deallocation of `size` bytes starting at `ptr`.
    #[inline(always)]
    fn memory_deallocated<'tcx>(
        alloc: &mut Allocation<Tag, AllocExtra>,
        ptr: Pointer<Tag>,
        size: Size,
    ) -> InterpResult<'tcx> {
        match &mut alloc.extra.stacked_borrows {
            Some(stacks) => stacks.memory_deallocated(ptr, size),
            None => Ok(()),
        }
    }
}
impl MayLeak for MiriMemoryKind {
#[inline(always)]
fn may_leak(self) -> bool {
use self::MiriMemoryKind::*;
match self {
Rust | C | WinHeap => false,
Env | Static => true,
}
}
}