339 lines
12 KiB
Rust
339 lines
12 KiB
Rust
/*! Precise Garbage Collector
|
|
|
|
The precise GC exposes two functions, gc and
|
|
cleanup_stack_for_failure. The gc function is the entry point to the
|
|
garbage collector itself. The cleanup_stack_for_failure is the entry
|
|
point for GC-based cleanup.
|
|
|
|
Precise GC depends on changes to LLVM's GC which add support for
|
|
automatic rooting and addrspace-based metadata marking. Rather than
|
|
explicitly rooting pointers with LLVM's gcroot intrinsic, the GC
|
|
merely creates allocas for pointers, and allows an LLVM pass to
|
|
automatically infer roots based on the allocas present in a function
|
|
(and live at a given location). The compiler communicates the type of
|
|
the pointer to LLVM by setting the addrspace of the pointer type. The
|
|
compiler then emits a map from addrspace to tydesc, which LLVM then
|
|
uses to match pointers with their tydesc. The GC reads the metadata
|
|
table produced by LLVM, and uses it to determine which glue functions
|
|
to call to free objects on their respective heaps.
|
|
|
|
GC-based cleanup is a replacement for landing pads which relies on the
|
|
GC infrastructure to find pointers on the stack to cleanup. Whereas
|
|
the normal GC needs to walk task-local heap allocations, the cleanup
|
|
code needs to walk exchange heap allocations and stack-allocations
|
|
with destructors.
|
|
|
|
*/
|
|
|
|
use stackwalk::Word;
|
|
use libc::size_t;
|
|
use libc::uintptr_t;
|
|
use send_map::linear::LinearMap;
|
|
|
|
export Word;
|
|
export gc;
|
|
export cleanup_stack_for_failure;
|
|
|
|
// Mirrors rust_stack.h stk_seg
|
|
struct StackSegment {
|
|
prev: *StackSegment,
|
|
next: *StackSegment,
|
|
end: uintptr_t,
|
|
// And other fields which we don't care about...
|
|
}
|
|
|
|
extern mod rustrt {
|
|
fn rust_annihilate_box(ptr: *Word);
|
|
|
|
#[rust_stack]
|
|
fn rust_call_tydesc_glue(root: *Word, tydesc: *Word, field: size_t);
|
|
|
|
#[rust_stack]
|
|
fn rust_gc_metadata() -> *Word;
|
|
|
|
fn rust_get_stack_segment() -> *StackSegment;
|
|
}
|
|
|
|
unsafe fn bump<T, U>(ptr: *T, count: uint) -> *U {
|
|
return cast::reinterpret_cast(&ptr::offset(ptr, count));
|
|
}
|
|
|
|
unsafe fn align_to_pointer<T>(ptr: *T) -> *T {
|
|
let align = sys::min_align_of::<*T>();
|
|
let ptr: uint = cast::reinterpret_cast(&ptr);
|
|
let ptr = (ptr + (align - 1)) & -align;
|
|
return cast::reinterpret_cast(&ptr);
|
|
}
|
|
|
|
unsafe fn get_safe_point_count() -> uint {
|
|
let module_meta = rustrt::rust_gc_metadata();
|
|
return *module_meta;
|
|
}
|
|
|
|
type SafePoint = { sp_meta: *Word, fn_meta: *Word };
|
|
|
|
// Returns the safe point metadata for the given program counter, if
|
|
// any.
|
|
unsafe fn is_safe_point(pc: *Word) -> Option<SafePoint> {
|
|
let module_meta = rustrt::rust_gc_metadata();
|
|
let num_safe_points = *module_meta;
|
|
let safe_points: *Word = bump(module_meta, 1);
|
|
|
|
if ptr::is_null(pc) {
|
|
return None;
|
|
}
|
|
|
|
// FIXME (#2997): Use binary rather than linear search.
|
|
let mut spi = 0;
|
|
while spi < num_safe_points {
|
|
let sp: **Word = bump(safe_points, spi*3);
|
|
let sp_loc = *sp;
|
|
if sp_loc == pc {
|
|
return Some({sp_meta: *bump(sp, 1), fn_meta: *bump(sp, 2)});
|
|
}
|
|
spi += 1;
|
|
}
|
|
return None;
|
|
}
|
|
|
|
type Visitor = fn(root: **Word, tydesc: *Word) -> bool;
|
|
|
|
// Walks the list of roots for the given safe point, and calls visitor
|
|
// on each root.
|
|
unsafe fn walk_safe_point(fp: *Word, sp: SafePoint, visitor: Visitor) {
|
|
let fp_bytes: *u8 = cast::reinterpret_cast(&fp);
|
|
let sp_meta: *u32 = cast::reinterpret_cast(&sp.sp_meta);
|
|
|
|
let num_stack_roots = *sp_meta as uint;
|
|
let num_reg_roots = *ptr::offset(sp_meta, 1) as uint;
|
|
|
|
let stack_roots: *u32 = bump(sp_meta, 2);
|
|
let reg_roots: *u8 = bump(stack_roots, num_stack_roots);
|
|
let addrspaces: *Word = align_to_pointer(bump(reg_roots, num_reg_roots));
|
|
let tydescs: ***Word = bump(addrspaces, num_stack_roots);
|
|
|
|
// Stack roots
|
|
let mut sri = 0;
|
|
while sri < num_stack_roots {
|
|
if *ptr::offset(addrspaces, sri) >= 1 {
|
|
let root =
|
|
ptr::offset(fp_bytes, *ptr::offset(stack_roots, sri) as Word)
|
|
as **Word;
|
|
let tydescpp = ptr::offset(tydescs, sri);
|
|
let tydesc = if ptr::is_not_null(tydescpp) &&
|
|
ptr::is_not_null(*tydescpp) {
|
|
**tydescpp
|
|
} else {
|
|
ptr::null()
|
|
};
|
|
if !visitor(root, tydesc) { return; }
|
|
}
|
|
sri += 1;
|
|
}
|
|
|
|
// Register roots
|
|
let mut rri = 0;
|
|
while rri < num_reg_roots {
|
|
if *ptr::offset(addrspaces, num_stack_roots + rri) == 1 {
|
|
// FIXME(#2997): Need to find callee saved registers on the stack.
|
|
}
|
|
rri += 1;
|
|
}
|
|
}
|
|
|
|
// Is fp contained in segment?
|
|
unsafe fn is_frame_in_segment(fp: *Word, segment: *StackSegment) -> bool {
|
|
let begin: Word = cast::reinterpret_cast(&segment);
|
|
let end: Word = cast::reinterpret_cast(&(*segment).end);
|
|
let frame: Word = cast::reinterpret_cast(&fp);
|
|
|
|
return begin <= frame && frame <= end;
|
|
}
|
|
|
|
// Find and return the segment containing the given frame pointer. At
|
|
// stack segment boundaries, returns true for boundary, so that the
|
|
// caller can do any special handling to identify where the correct
|
|
// return address is in the stack frame.
|
|
unsafe fn find_segment_for_frame(fp: *Word, segment: *StackSegment)
|
|
-> {segment: *StackSegment, boundary: bool} {
|
|
// Check if frame is in either current frame or previous frame.
|
|
let in_segment = is_frame_in_segment(fp, segment);
|
|
let in_prev_segment = ptr::is_not_null((*segment).prev) &&
|
|
is_frame_in_segment(fp, (*segment).prev);
|
|
|
|
// If frame is not in either segment, walk down segment list until
|
|
// we find the segment containing this frame.
|
|
if !in_segment && !in_prev_segment {
|
|
let mut segment = segment;
|
|
while ptr::is_not_null((*segment).next) &&
|
|
is_frame_in_segment(fp, (*segment).next) {
|
|
segment = (*segment).next;
|
|
}
|
|
return {segment: segment, boundary: false};
|
|
}
|
|
|
|
// If frame is in previous frame, then we're at a boundary.
|
|
if !in_segment && in_prev_segment {
|
|
return {segment: (*segment).prev, boundary: true};
|
|
}
|
|
|
|
// Otherwise, we're somewhere on the inside of the frame.
|
|
return {segment: segment, boundary: false};
|
|
}
|
|
|
|
type Memory = uint;
|
|
|
|
const task_local_heap: Memory = 1;
|
|
const exchange_heap: Memory = 2;
|
|
const stack: Memory = 4;
|
|
|
|
const need_cleanup: Memory = exchange_heap | stack;
|
|
|
|
// Walks stack, searching for roots of the requested type, and passes
|
|
// each root to the visitor.
|
|
unsafe fn walk_gc_roots(mem: Memory, sentinel: **Word, visitor: Visitor) {
|
|
let mut segment = rustrt::rust_get_stack_segment();
|
|
let mut last_ret: *Word = ptr::null();
|
|
// To avoid collecting memory used by the GC itself, skip stack
|
|
// frames until past the root GC stack frame. The root GC stack
|
|
// frame is marked by a sentinel, which is a box pointer stored on
|
|
// the stack.
|
|
let mut reached_sentinel = ptr::is_null(sentinel);
|
|
for stackwalk::walk_stack |frame| {
|
|
unsafe {
|
|
let pc = last_ret;
|
|
let {segment: next_segment, boundary: boundary} =
|
|
find_segment_for_frame(frame.fp, segment);
|
|
segment = next_segment;
|
|
// Each stack segment is bounded by a morestack frame. The
|
|
// morestack frame includes two return addresses, one for
|
|
// morestack itself, at the normal offset from the frame
|
|
// pointer, and then a second return address for the
|
|
// function prologue (which called morestack after
|
|
// determining that it had hit the end of the stack).
|
|
// Since morestack itself takes two parameters, the offset
|
|
// for this second return address is 3 greater than the
|
|
// return address for morestack.
|
|
let ret_offset = if boundary { 4 } else { 1 };
|
|
last_ret = *ptr::offset(frame.fp, ret_offset) as *Word;
|
|
|
|
if ptr::is_null(pc) {
|
|
loop;
|
|
}
|
|
|
|
let mut delay_reached_sentinel = reached_sentinel;
|
|
let sp = is_safe_point(pc);
|
|
match sp {
|
|
Some(sp_info) => {
|
|
for walk_safe_point(frame.fp, sp_info) |root, tydesc| {
|
|
// Skip roots until we see the sentinel.
|
|
if !reached_sentinel {
|
|
if root == sentinel {
|
|
delay_reached_sentinel = true;
|
|
}
|
|
loop;
|
|
}
|
|
|
|
// Skip null pointers, which can occur when a
|
|
// unique pointer has already been freed.
|
|
if ptr::is_null(*root) {
|
|
loop;
|
|
}
|
|
|
|
if ptr::is_null(tydesc) {
|
|
// Root is a generic box.
|
|
let refcount = **root;
|
|
if mem | task_local_heap != 0 && refcount != -1 {
|
|
if !visitor(root, tydesc) { return; }
|
|
} else if mem | exchange_heap != 0 && refcount == -1 {
|
|
if !visitor(root, tydesc) { return; }
|
|
}
|
|
} else {
|
|
// Root is a non-immediate.
|
|
if mem | stack != 0 {
|
|
if !visitor(root, tydesc) { return; }
|
|
}
|
|
}
|
|
}
|
|
}
|
|
None => ()
|
|
}
|
|
reached_sentinel = delay_reached_sentinel;
|
|
}
|
|
}
|
|
}
|
|
|
|
fn gc() {
|
|
unsafe {
|
|
// Abort when GC is disabled.
|
|
if get_safe_point_count() == 0 {
|
|
return;
|
|
}
|
|
|
|
for walk_gc_roots(task_local_heap, ptr::null()) |_root, _tydesc| {
|
|
// FIXME(#2997): Walk roots and mark them.
|
|
io::stdout().write([46]); // .
|
|
}
|
|
}
|
|
}
|
|
|
|
type RootSet = LinearMap<*Word,()>;
|
|
|
|
fn RootSet() -> RootSet {
|
|
LinearMap()
|
|
}
|
|
|
|
#[cfg(gc)]
|
|
fn expect_sentinel() -> bool { true }
|
|
|
|
#[cfg(nogc)]
|
|
fn expect_sentinel() -> bool { false }
|
|
|
|
// Entry point for GC-based cleanup. Walks stack looking for exchange
|
|
// heap and stack allocations requiring drop, and runs all
|
|
// destructors.
|
|
//
|
|
// This should only be called from fail, as it will drop the roots
|
|
// which are *live* on the stack, rather than dropping those that are
|
|
// dead.
|
|
fn cleanup_stack_for_failure() {
|
|
unsafe {
|
|
// Abort when GC is disabled.
|
|
if get_safe_point_count() == 0 {
|
|
return;
|
|
}
|
|
|
|
// Leave a sentinel on the stack to mark the current frame. The
|
|
// stack walker will ignore any frames above the sentinel, thus
|
|
// avoiding collecting any memory being used by the stack walker
|
|
// itself.
|
|
//
|
|
// However, when core itself is not compiled with GC, then none of
|
|
// the functions in core will have GC metadata, which means we
|
|
// won't be able to find the sentinel root on the stack. In this
|
|
// case, we can safely skip the sentinel since we won't find our
|
|
// own stack roots on the stack anyway.
|
|
let sentinel_box = ~0;
|
|
let sentinel: **Word = if expect_sentinel() {
|
|
cast::reinterpret_cast(&ptr::addr_of(sentinel_box))
|
|
} else {
|
|
ptr::null()
|
|
};
|
|
|
|
let mut roots = ~RootSet();
|
|
for walk_gc_roots(need_cleanup, sentinel) |root, tydesc| {
|
|
// Track roots to avoid double frees.
|
|
if option::is_some(roots.find(&*root)) {
|
|
loop;
|
|
}
|
|
roots.insert(*root, ());
|
|
|
|
if ptr::is_null(tydesc) {
|
|
rustrt::rust_annihilate_box(*root);
|
|
} else {
|
|
rustrt::rust_call_tydesc_glue(*root, tydesc, 3 as size_t);
|
|
}
|
|
}
|
|
}
|
|
}
|