address review comments

This commit is contained in:
Lukas Markeffsky 2024-02-11 17:13:23 +01:00
parent 8f259ade66
commit 5d989770f2

View File

@ -95,6 +95,22 @@ impl<T, A: Allocator> Drop for Drain<'_, T, A> {
fn drop(&mut self) { fn drop(&mut self) {
struct DropGuard<'r, 'a, T, A: Allocator>(&'r mut Drain<'a, T, A>); struct DropGuard<'r, 'a, T, A: Allocator>(&'r mut Drain<'a, T, A>);
let guard = DropGuard(self);
if mem::needs_drop::<T>() && guard.0.remaining != 0 {
unsafe {
// SAFETY: We just checked that `self.remaining != 0`.
let (front, back) = guard.0.as_slices();
// since idx is a logical index, we don't need to worry about wrapping.
guard.0.idx += front.len();
guard.0.remaining -= front.len();
ptr::drop_in_place(front);
guard.0.remaining = 0;
ptr::drop_in_place(back);
}
}
// Dropping `guard` handles moving the remaining elements into place.
impl<'r, 'a, T, A: Allocator> Drop for DropGuard<'r, 'a, T, A> { impl<'r, 'a, T, A: Allocator> Drop for DropGuard<'r, 'a, T, A> {
#[inline] #[inline]
fn drop(&mut self) { fn drop(&mut self) {
@ -118,30 +134,74 @@ fn drop(&mut self) {
return; return;
} }
let head_len = source_deque.len(); let head_len = source_deque.len; // #elements in front of the drain
let tail_len = new_len - head_len; let tail_len = new_len - head_len; // #elements behind the drain
// Next, we will fill the hole left by the drain with as few writes as possible.
// The code below handles the following control flow and reduces the amount of
// branches under the assumption that `head_len == 0 || tail_len == 0`, i.e.
// draining at the front or at the back of the dequeue is especially common.
//
// H = "head index" = `deque.head`
// h = elements in front of the drain
// d = elements in the drain
// t = elements behind the drain
//
// Note that the buffer may wrap at any point and the wrapping is handled by
// `wrap_copy` and `to_physical_idx`.
//
// Case 1: if `head_len == 0 && tail_len == 0`
// Everything was drained, reset the head index back to 0.
// H
// [ . . . . . d d d d . . . . . ]
// H
// [ . . . . . . . . . . . . . . ]
//
// Case 2: else if `tail_len == 0`
// Don't move data or the head index.
// H
// [ . . . h h h h d d d d . . . ]
// H
// [ . . . h h h h . . . . . . . ]
//
// Case 3: else if `head_len == 0`
// Don't move data, but move the head index.
// H
// [ . . . d d d d t t t t . . . ]
// H
// [ . . . . . . . t t t t . . . ]
//
// Case 4: else if `tail_len <= head_len`
// Move data, but not the head index.
// H
// [ . . h h h h d d d d t t . . ]
// H
// [ . . h h h h t t . . . . . . ]
//
// Case 5: else
// Move data and the head index.
// H
// [ . . h h d d d d t t t t . . ]
// H
// [ . . . . . . h h t t t t . . ]
// When draining at the front (`.drain(..n)`) or at the back (`.drain(n..)`), // When draining at the front (`.drain(..n)`) or at the back (`.drain(n..)`),
// we don't need to copy any data. // we don't need to copy any data. The number of elements copied would be 0.
// Outlining this function helps LLVM to eliminate the copies in these cases.
if head_len != 0 && tail_len != 0 { if head_len != 0 && tail_len != 0 {
copy_data(source_deque, drain_len, head_len, tail_len); join_head_and_tail_wrapping(source_deque, drain_len, head_len, tail_len);
} // Marking this function as cold helps LLVM to eliminate it entirely if
// this branch is never taken.
if new_len == 0 { // We use `#[cold]` instead of `#[inline(never)]`, because inlining this
source_deque.head = 0; // function into the general case (`.drain(n..m)`) is fine.
} else if head_len < tail_len { // See `tests/codegen/vecdeque-drain.rs` for a test.
source_deque.head = source_deque.to_physical_idx(drain_len);
}
source_deque.len = new_len;
#[cold] #[cold]
fn copy_data<T, A: Allocator>( fn join_head_and_tail_wrapping<T, A: Allocator>(
source_deque: &mut VecDeque<T, A>, source_deque: &mut VecDeque<T, A>,
drain_len: usize, drain_len: usize,
head_len: usize, head_len: usize,
tail_len: usize, tail_len: usize,
) { ) {
// Pick whether to move the head or the tail here.
let (src, dst, len); let (src, dst, len);
if head_len < tail_len { if head_len < tail_len {
src = source_deque.head; src = source_deque.head;
@ -158,23 +218,18 @@ fn copy_data<T, A: Allocator>(
} }
} }
} }
}
let guard = DropGuard(self); if new_len == 0 {
if mem::needs_drop::<T>() && guard.0.remaining != 0 { // Special case: If the entire dequeue was drained, reset the head back to 0,
unsafe { // like `.clear()` does.
// SAFETY: We just checked that `self.remaining != 0`. source_deque.head = 0;
let (front, back) = guard.0.as_slices(); } else if head_len < tail_len {
// since idx is a logical index, we don't need to worry about wrapping. // If we moved the head above, then we need to adjust the head index here.
guard.0.idx += front.len(); source_deque.head = source_deque.to_physical_idx(drain_len);
guard.0.remaining -= front.len(); }
ptr::drop_in_place(front); source_deque.len = new_len;
guard.0.remaining = 0;
ptr::drop_in_place(back);
} }
} }
// Dropping `guard` handles moving the remaining elements into place.
} }
} }