Rollup merge of #125633 - RalfJung:miri-no-copy, r=saethlin

miri: avoid making a full copy of all new allocations

Hopefully fixes https://github.com/rust-lang/miri/issues/3637

r? ``@saethlin``
This commit is contained in:
许杰友 Jieyou Xu (Joe) 2024-05-29 03:25:09 +01:00 committed by GitHub
commit 305137de18
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
8 changed files with 92 additions and 85 deletions

View File

@ -174,7 +174,7 @@ fn expose_ptr(
unimplemented!() unimplemented!()
} }
fn init_frame_extra( fn init_frame(
_ecx: &mut InterpCx<'tcx, Self>, _ecx: &mut InterpCx<'tcx, Self>,
_frame: interpret::Frame<'tcx, Self::Provenance>, _frame: interpret::Frame<'tcx, Self::Provenance>,
) -> interpret::InterpResult<'tcx, interpret::Frame<'tcx, Self::Provenance, Self::FrameExtra>> ) -> interpret::InterpResult<'tcx, interpret::Frame<'tcx, Self::Provenance, Self::FrameExtra>>

View File

@ -643,7 +643,7 @@ fn expose_ptr(_ecx: &mut InterpCx<'tcx, Self>, _ptr: Pointer) -> InterpResult<'t
} }
#[inline(always)] #[inline(always)]
fn init_frame_extra( fn init_frame(
ecx: &mut InterpCx<'tcx, Self>, ecx: &mut InterpCx<'tcx, Self>,
frame: Frame<'tcx>, frame: Frame<'tcx>,
) -> InterpResult<'tcx, Frame<'tcx>> { ) -> InterpResult<'tcx, Frame<'tcx>> {

View File

@ -819,7 +819,7 @@ pub fn push_stack_frame(
tracing_span: SpanGuard::new(), tracing_span: SpanGuard::new(),
extra: (), extra: (),
}; };
let frame = M::init_frame_extra(self, pre_frame)?; let frame = M::init_frame(self, pre_frame)?;
self.stack_mut().push(frame); self.stack_mut().push(frame);
// Make sure all the constants required by this frame evaluate successfully (post-monomorphization check). // Make sure all the constants required by this frame evaluate successfully (post-monomorphization check).

View File

@ -329,27 +329,41 @@ fn ptr_get_alloc(
ptr: Pointer<Self::Provenance>, ptr: Pointer<Self::Provenance>,
) -> Option<(AllocId, Size, Self::ProvenanceExtra)>; ) -> Option<(AllocId, Size, Self::ProvenanceExtra)>;
/// Called to adjust allocations to the Provenance and AllocExtra of this machine. /// Called to adjust global allocations to the Provenance and AllocExtra of this machine.
/// ///
/// If `alloc` contains pointers, then they are all pointing to globals. /// If `alloc` contains pointers, then they are all pointing to globals.
/// ///
/// The way we construct allocations is to always first construct it without extra and then add
/// the extra. This keeps uniform code paths for handling both allocations created by CTFE for
/// globals, and allocations created by Miri during evaluation.
///
/// `kind` is the kind of the allocation being adjusted; it can be `None` when
/// it's a global and `GLOBAL_KIND` is `None`.
///
/// This should avoid copying if no work has to be done! If this returns an owned /// This should avoid copying if no work has to be done! If this returns an owned
/// allocation (because a copy had to be done to adjust things), machine memory will /// allocation (because a copy had to be done to adjust things), machine memory will
/// cache the result. (This relies on `AllocMap::get_or` being able to add the /// cache the result. (This relies on `AllocMap::get_or` being able to add the
/// owned allocation to the map even when the map is shared.) /// owned allocation to the map even when the map is shared.)
fn adjust_allocation<'b>( fn adjust_global_allocation<'b>(
ecx: &InterpCx<'tcx, Self>, ecx: &InterpCx<'tcx, Self>,
id: AllocId, id: AllocId,
alloc: Cow<'b, Allocation>, alloc: &'b Allocation,
kind: Option<MemoryKind<Self::MemoryKind>>, ) -> InterpResult<'tcx, Cow<'b, Allocation<Self::Provenance, Self::AllocExtra, Self::Bytes>>>
) -> InterpResult<'tcx, Cow<'b, Allocation<Self::Provenance, Self::AllocExtra, Self::Bytes>>>; {
// The default implementation does a copy; CTFE machines have a more efficient implementation
// based on their particular choice for `Provenance`, `AllocExtra`, and `Bytes`.
let kind = Self::GLOBAL_KIND
.expect("if GLOBAL_KIND is None, adjust_global_allocation must be overwritten");
let alloc = alloc.adjust_from_tcx(&ecx.tcx, |ptr| ecx.global_root_pointer(ptr))?;
let extra =
Self::init_alloc_extra(ecx, id, MemoryKind::Machine(kind), alloc.size(), alloc.align)?;
Ok(Cow::Owned(alloc.with_extra(extra)))
}
/// Initialize the extra state of an allocation.
///
/// This is guaranteed to be called exactly once on all allocations that are accessed by the
/// program.
fn init_alloc_extra(
ecx: &InterpCx<'tcx, Self>,
id: AllocId,
kind: MemoryKind<Self::MemoryKind>,
size: Size,
align: Align,
) -> InterpResult<'tcx, Self::AllocExtra>;
/// Return a "root" pointer for the given allocation: the one that is used for direct /// Return a "root" pointer for the given allocation: the one that is used for direct
/// accesses to this static/const/fn allocation, or the one returned from the heap allocator. /// accesses to this static/const/fn allocation, or the one returned from the heap allocator.
@ -473,7 +487,7 @@ fn protect_in_place_function_argument(
} }
/// Called immediately before a new stack frame gets pushed. /// Called immediately before a new stack frame gets pushed.
fn init_frame_extra( fn init_frame(
ecx: &mut InterpCx<'tcx, Self>, ecx: &mut InterpCx<'tcx, Self>,
frame: Frame<'tcx, Self::Provenance>, frame: Frame<'tcx, Self::Provenance>,
) -> InterpResult<'tcx, Frame<'tcx, Self::Provenance, Self::FrameExtra>>; ) -> InterpResult<'tcx, Frame<'tcx, Self::Provenance, Self::FrameExtra>>;
@ -590,13 +604,23 @@ fn call_extra_fn(
} }
#[inline(always)] #[inline(always)]
fn adjust_allocation<'b>( fn adjust_global_allocation<'b>(
_ecx: &InterpCx<$tcx, Self>, _ecx: &InterpCx<$tcx, Self>,
_id: AllocId, _id: AllocId,
alloc: Cow<'b, Allocation>, alloc: &'b Allocation,
_kind: Option<MemoryKind<Self::MemoryKind>>,
) -> InterpResult<$tcx, Cow<'b, Allocation<Self::Provenance>>> { ) -> InterpResult<$tcx, Cow<'b, Allocation<Self::Provenance>>> {
Ok(alloc) // Overwrite default implementation: no need to adjust anything.
Ok(Cow::Borrowed(alloc))
}
fn init_alloc_extra(
_ecx: &InterpCx<$tcx, Self>,
_id: AllocId,
_kind: MemoryKind<Self::MemoryKind>,
_size: Size,
_align: Align,
) -> InterpResult<$tcx, Self::AllocExtra> {
Ok(())
} }
fn extern_static_pointer( fn extern_static_pointer(

View File

@ -239,7 +239,7 @@ pub fn allocate_bytes_ptr(
pub fn allocate_raw_ptr( pub fn allocate_raw_ptr(
&mut self, &mut self,
alloc: Allocation, alloc: Allocation<M::Provenance, (), M::Bytes>,
kind: MemoryKind<M::MemoryKind>, kind: MemoryKind<M::MemoryKind>,
) -> InterpResult<'tcx, Pointer<M::Provenance>> { ) -> InterpResult<'tcx, Pointer<M::Provenance>> {
let id = self.tcx.reserve_alloc_id(); let id = self.tcx.reserve_alloc_id();
@ -248,8 +248,11 @@ pub fn allocate_raw_ptr(
M::GLOBAL_KIND.map(MemoryKind::Machine), M::GLOBAL_KIND.map(MemoryKind::Machine),
"dynamically allocating global memory" "dynamically allocating global memory"
); );
let alloc = M::adjust_allocation(self, id, Cow::Owned(alloc), Some(kind))?; // We have set things up so we don't need to call `adjust_from_tcx` here,
self.memory.alloc_map.insert(id, (kind, alloc.into_owned())); // so we avoid copying the entire allocation contents.
let extra = M::init_alloc_extra(self, id, kind, alloc.size(), alloc.align)?;
let alloc = alloc.with_extra(extra);
self.memory.alloc_map.insert(id, (kind, alloc));
M::adjust_alloc_root_pointer(self, Pointer::from(id), Some(kind)) M::adjust_alloc_root_pointer(self, Pointer::from(id), Some(kind))
} }
@ -583,11 +586,10 @@ fn get_global_alloc(
}; };
M::before_access_global(self.tcx, &self.machine, id, alloc, def_id, is_write)?; M::before_access_global(self.tcx, &self.machine, id, alloc, def_id, is_write)?;
// We got tcx memory. Let the machine initialize its "extra" stuff. // We got tcx memory. Let the machine initialize its "extra" stuff.
M::adjust_allocation( M::adjust_global_allocation(
self, self,
id, // always use the ID we got as input, not the "hidden" one. id, // always use the ID we got as input, not the "hidden" one.
Cow::Borrowed(alloc.inner()), alloc.inner(),
M::GLOBAL_KIND.map(MemoryKind::Machine),
) )
} }

View File

@ -266,19 +266,6 @@ pub fn subrange(self, subrange: AllocRange) -> AllocRange {
// The constructors are all without extra; the extra gets added by a machine hook later. // The constructors are all without extra; the extra gets added by a machine hook later.
impl<Prov: Provenance, Bytes: AllocBytes> Allocation<Prov, (), Bytes> { impl<Prov: Provenance, Bytes: AllocBytes> Allocation<Prov, (), Bytes> {
/// Creates an allocation from an existing `Bytes` value - this is needed for miri FFI support
pub fn from_raw_bytes(bytes: Bytes, align: Align, mutability: Mutability) -> Self {
let size = Size::from_bytes(bytes.len());
Self {
bytes,
provenance: ProvenanceMap::new(),
init_mask: InitMask::new(size, true),
align,
mutability,
extra: (),
}
}
/// Creates an allocation initialized by the given bytes /// Creates an allocation initialized by the given bytes
pub fn from_bytes<'a>( pub fn from_bytes<'a>(
slice: impl Into<Cow<'a, [u8]>>, slice: impl Into<Cow<'a, [u8]>>,
@ -342,18 +329,30 @@ pub fn uninit(size: Size, align: Align) -> Self {
Err(x) => x, Err(x) => x,
} }
} }
/// Add the extra.
pub fn with_extra<Extra>(self, extra: Extra) -> Allocation<Prov, Extra, Bytes> {
Allocation {
bytes: self.bytes,
provenance: self.provenance,
init_mask: self.init_mask,
align: self.align,
mutability: self.mutability,
extra,
}
}
} }
impl Allocation { impl Allocation {
/// Adjust allocation from the ones in `tcx` to a custom Machine instance /// Adjust allocation from the ones in `tcx` to a custom Machine instance
/// with a different `Provenance`, `Extra` and `Byte` type. /// with a different `Provenance` and `Byte` type.
pub fn adjust_from_tcx<Prov: Provenance, Extra, Bytes: AllocBytes, Err>( pub fn adjust_from_tcx<Prov: Provenance, Bytes: AllocBytes, Err>(
self, &self,
cx: &impl HasDataLayout, cx: &impl HasDataLayout,
extra: Extra,
mut adjust_ptr: impl FnMut(Pointer<CtfeProvenance>) -> Result<Pointer<Prov>, Err>, mut adjust_ptr: impl FnMut(Pointer<CtfeProvenance>) -> Result<Pointer<Prov>, Err>,
) -> Result<Allocation<Prov, Extra, Bytes>, Err> { ) -> Result<Allocation<Prov, (), Bytes>, Err> {
let mut bytes = self.bytes; // Copy the data.
let mut bytes = Bytes::from_bytes(Cow::Borrowed(&*self.bytes), self.align);
// Adjust provenance of pointers stored in this allocation. // Adjust provenance of pointers stored in this allocation.
let mut new_provenance = Vec::with_capacity(self.provenance.ptrs().len()); let mut new_provenance = Vec::with_capacity(self.provenance.ptrs().len());
let ptr_size = cx.data_layout().pointer_size.bytes_usize(); let ptr_size = cx.data_layout().pointer_size.bytes_usize();
@ -369,12 +368,12 @@ pub fn adjust_from_tcx<Prov: Provenance, Extra, Bytes: AllocBytes, Err>(
} }
// Create allocation. // Create allocation.
Ok(Allocation { Ok(Allocation {
bytes: AllocBytes::from_bytes(Cow::Owned(Vec::from(bytes)), self.align), bytes,
provenance: ProvenanceMap::from_presorted_ptrs(new_provenance), provenance: ProvenanceMap::from_presorted_ptrs(new_provenance),
init_mask: self.init_mask, init_mask: self.init_mask.clone(),
align: self.align, align: self.align,
mutability: self.mutability, mutability: self.mutability,
extra, extra: self.extra,
}) })
} }
} }

View File

@ -862,14 +862,15 @@ fn get_or_create_thread_local_alloc(
if tcx.is_foreign_item(def_id) { if tcx.is_foreign_item(def_id) {
throw_unsup_format!("foreign thread-local statics are not supported"); throw_unsup_format!("foreign thread-local statics are not supported");
} }
let allocation = this.ctfe_query(|tcx| tcx.eval_static_initializer(def_id))?; let alloc = this.ctfe_query(|tcx| tcx.eval_static_initializer(def_id))?;
let mut allocation = allocation.inner().clone(); // We make a full copy of this allocation.
let mut alloc = alloc.inner().adjust_from_tcx(&this.tcx, |ptr| this.global_root_pointer(ptr))?;
// This allocation will be deallocated when the thread dies, so it is not in read-only memory. // This allocation will be deallocated when the thread dies, so it is not in read-only memory.
allocation.mutability = Mutability::Mut; alloc.mutability = Mutability::Mut;
// Create a fresh allocation with this content. // Create a fresh allocation with this content.
let new_alloc = this.allocate_raw_ptr(allocation, MiriMemoryKind::Tls.into())?; let ptr = this.allocate_raw_ptr(alloc, MiriMemoryKind::Tls.into())?;
this.machine.threads.set_thread_local_alloc(def_id, new_alloc); this.machine.threads.set_thread_local_alloc(def_id, ptr);
Ok(new_alloc) Ok(ptr)
} }
} }

View File

@ -1,7 +1,6 @@
//! Global machine state as well as implementation of the interpreter engine //! Global machine state as well as implementation of the interpreter engine
//! `Machine` trait. //! `Machine` trait.
use std::borrow::Cow;
use std::cell::RefCell; use std::cell::RefCell;
use std::collections::hash_map::Entry; use std::collections::hash_map::Entry;
use std::fmt; use std::fmt;
@ -1086,40 +1085,33 @@ fn extern_static_pointer(
} }
} }
fn adjust_allocation<'b>( fn init_alloc_extra(
ecx: &MiriInterpCx<'tcx>, ecx: &MiriInterpCx<'tcx>,
id: AllocId, id: AllocId,
alloc: Cow<'b, Allocation>, kind: MemoryKind,
kind: Option<MemoryKind>, size: Size,
) -> InterpResult<'tcx, Cow<'b, Allocation<Self::Provenance, Self::AllocExtra, Self::Bytes>>> align: Align,
{ ) -> InterpResult<'tcx, Self::AllocExtra> {
let kind = kind.expect("we set our STATIC_KIND so this cannot be None");
if ecx.machine.tracked_alloc_ids.contains(&id) { if ecx.machine.tracked_alloc_ids.contains(&id) {
ecx.emit_diagnostic(NonHaltingDiagnostic::CreatedAlloc( ecx.emit_diagnostic(NonHaltingDiagnostic::CreatedAlloc(id, size, align, kind));
id,
alloc.size(),
alloc.align,
kind,
));
} }
let alloc = alloc.into_owned();
let borrow_tracker = ecx let borrow_tracker = ecx
.machine .machine
.borrow_tracker .borrow_tracker
.as_ref() .as_ref()
.map(|bt| bt.borrow_mut().new_allocation(id, alloc.size(), kind, &ecx.machine)); .map(|bt| bt.borrow_mut().new_allocation(id, size, kind, &ecx.machine));
let race_alloc = ecx.machine.data_race.as_ref().map(|data_race| { let data_race = ecx.machine.data_race.as_ref().map(|data_race| {
data_race::AllocState::new_allocation( data_race::AllocState::new_allocation(
data_race, data_race,
&ecx.machine.threads, &ecx.machine.threads,
alloc.size(), size,
kind, kind,
ecx.machine.current_span(), ecx.machine.current_span(),
) )
}); });
let buffer_alloc = ecx.machine.weak_memory.then(weak_memory::AllocState::new_allocation); let weak_memory = ecx.machine.weak_memory.then(weak_memory::AllocState::new_allocation);
// If an allocation is leaked, we want to report a backtrace to indicate where it was // If an allocation is leaked, we want to report a backtrace to indicate where it was
// allocated. We don't need to record a backtrace for allocations which are allowed to // allocated. We don't need to record a backtrace for allocations which are allowed to
@ -1130,17 +1122,6 @@ fn adjust_allocation<'b>(
Some(ecx.generate_stacktrace()) Some(ecx.generate_stacktrace())
}; };
let alloc: Allocation<Provenance, Self::AllocExtra, Self::Bytes> = alloc.adjust_from_tcx(
&ecx.tcx,
AllocExtra {
borrow_tracker,
data_race: race_alloc,
weak_memory: buffer_alloc,
backtrace,
},
|ptr| ecx.global_root_pointer(ptr),
)?;
if matches!(kind, MemoryKind::Machine(kind) if kind.should_save_allocation_span()) { if matches!(kind, MemoryKind::Machine(kind) if kind.should_save_allocation_span()) {
ecx.machine ecx.machine
.allocation_spans .allocation_spans
@ -1148,7 +1129,7 @@ fn adjust_allocation<'b>(
.insert(id, (ecx.machine.current_span(), None)); .insert(id, (ecx.machine.current_span(), None));
} }
Ok(Cow::Owned(alloc)) Ok(AllocExtra { borrow_tracker, data_race, weak_memory, backtrace })
} }
fn adjust_alloc_root_pointer( fn adjust_alloc_root_pointer(
@ -1357,7 +1338,7 @@ fn protect_in_place_function_argument(
} }
#[inline(always)] #[inline(always)]
fn init_frame_extra( fn init_frame(
ecx: &mut InterpCx<'tcx, Self>, ecx: &mut InterpCx<'tcx, Self>,
frame: Frame<'tcx, Provenance>, frame: Frame<'tcx, Provenance>,
) -> InterpResult<'tcx, Frame<'tcx, Provenance, FrameExtra<'tcx>>> { ) -> InterpResult<'tcx, Frame<'tcx, Provenance, FrameExtra<'tcx>>> {