Add timsort to std/sort

This commit is contained in:
Simon BD 2012-09-25 17:53:24 -05:00
parent 349ef79ce7
commit cef7763649

View File

@ -4,6 +4,7 @@
use vec::{len, push};
use core::cmp::{Eq, Ord};
use dvec::DVec;
export le;
export merge_sort;
@ -168,6 +169,599 @@ impl<T: Copy Ord Eq> &[mut T] : Sort {
fn qsort(self) { quick_sort3(self); }
}
const MIN_MERGE: uint = 64;
const MIN_GALLOP: uint = 7;
const INITIAL_TMP_STORAGE: uint = 128;
fn timsort<T: Ord>(array: &[mut T]) {
let size = array.len();
if size < 2 {
return;
}
if size < MIN_MERGE {
let initRunLen = countRunAndMakeAscending(array);
binarysort(array, initRunLen);
return;
}
let ms = &MergeState();
let minRun = minRunLength(size);
let mut idx = 0;
let mut remaining = size;
loop {
let arr = vec::mut_view(array, idx, size);
let mut runLen: uint = countRunAndMakeAscending(arr);
if runLen < minRun {
let force = if remaining <= minRun {remaining} else {minRun};
let slice = vec::mut_view(arr, 0, force);
binarysort(slice, runLen);
runLen = force;
}
ms.pushRun(idx, runLen);
ms.mergeCollapse(array);
idx += runLen;
remaining -= runLen;
if remaining == 0 { break; }
}
ms.mergeForceCollapse(array);
}
fn binarysort<T: Ord>(array: &[mut T], start: uint) {
let size = array.len();
let mut start = start;
assert start <= size;
if start == 0 { start += 1; }
let mut pivot = ~[mut];
vec::reserve(pivot, 1);
unsafe { vec::raw::set_len(pivot, 1); };
while start < size {
unsafe {
let tmpView = vec::mut_view(array, start, start+1);
vec::raw::memmove(pivot, tmpView, 1);
}
let mut left = 0;
let mut right = start;
assert left <= right;
while left < right {
let mid = (left + right) >> 1;
if pivot[0] < array[mid] {
right = mid;
} else {
left = mid+1;
}
}
assert left == right;
let mut n = start-left;
unsafe {
moveVec(array, left+1, array, left, n);
}
array[left] <-> pivot[0];
start += 1;
}
unsafe { vec::raw::set_len(pivot, 0); } // Forget the boxed element
}
/// Reverse the order of elements in a slice, in place
fn reverseSlice<T>(v: &[mut T], start: uint, end:uint) {
let mut i = start;
while i < end / 2 {
v[i] <-> v[end - i - 1];
i += 1;
}
}
pure fn minRunLength(n: uint) -> uint {
let mut n = n;
let mut r = 0; // becomes 1 if any 1 bits are shifted off
while n >= MIN_MERGE {
r |= n & 1;
n >>= 1;
}
return n + r;
}
fn countRunAndMakeAscending<T: Ord>(array: &[mut T]) -> uint {
let size = array.len();
assert size > 0;
if size == 1 { return 1; }
let mut run = 2;
if array[1] < array[0] {
while run < size && array[run] < array[run-1] {
run += 1;
}
reverseSlice(array, 0, run);
} else {
while run < size && array[run] >= array[run-1] {
run += 1;
}
}
return run;
}
pure fn gallopLeft<T: Ord>(key: &const T, array: &[const T], hint: uint) -> uint {
let size = array.len();
assert size != 0 && hint < size;
let mut lastOfs = 0;
let mut ofs = 1;
if *key > array[hint] {
// Gallop right until array[hint+lastOfs] < key <= array[hint+ofs]
let maxOfs = size - hint;
while ofs < maxOfs && *key > array[hint+ofs] {
lastOfs = ofs;
ofs = (ofs << 1) + 1;
if ofs < lastOfs { ofs = maxOfs; } // uint overflow guard
}
if ofs > maxOfs { ofs = maxOfs; }
lastOfs += hint;
ofs += hint;
} else {
let maxOfs = hint + 1;
while ofs < maxOfs && *key <= array[hint-ofs] {
lastOfs = ofs;
ofs = (ofs << 1) + 1;
if ofs < lastOfs { ofs = maxOfs; } // uint overflow guard
}
if ofs > maxOfs { ofs = maxOfs; }
let tmp = lastOfs;
lastOfs = hint - ofs;
ofs = hint - tmp;
}
assert (lastOfs < ofs || lastOfs+1 < ofs+1) && ofs <= size;
lastOfs += 1;
while lastOfs < ofs {
let m = lastOfs + ((ofs - lastOfs) >> 1);
if *key > array[m] {
lastOfs = m+1;
} else {
ofs = m;
}
}
assert lastOfs == ofs;
return ofs;
}
pure fn gallopRight<T: Ord>(key: &const T, array: &[const T], hint: uint) -> uint {
let size = array.len();
assert size != 0 && hint < size;
let mut lastOfs = 0;
let mut ofs = 1;
if *key >= array[hint] {
// Gallop right until array[hint+lastOfs] <= key < array[hint+ofs]
let maxOfs = size - hint;
while ofs < maxOfs && *key >= array[hint+ofs] {
lastOfs = ofs;
ofs = (ofs << 1) + 1;
if ofs < lastOfs { ofs = maxOfs; }
}
if ofs > maxOfs { ofs = maxOfs; }
lastOfs += hint;
ofs += hint;
} else {
// Gallop left until array[hint-ofs] <= key < array[hint-lastOfs]
let maxOfs = hint + 1;
while ofs < maxOfs && *key < array[hint-ofs] {
lastOfs = ofs;
ofs = (ofs << 1) + 1;
if ofs < lastOfs { ofs = maxOfs; }
}
if ofs > maxOfs { ofs = maxOfs; }
let tmp = lastOfs;
lastOfs = hint - ofs;
ofs = hint - tmp;
}
assert (lastOfs < ofs || lastOfs+1 < ofs+1) && ofs <= size;
lastOfs += 1;
while lastOfs < ofs {
let m = lastOfs + ((ofs - lastOfs) >> 1);
if *key >= array[m] {
lastOfs = m + 1;
} else {
ofs = m;
}
}
assert lastOfs == ofs;
return ofs;
}
struct RunState {
base: uint,
len: uint,
}
struct MergeState<T> {
mut minGallop: uint,
mut tmp: ~[T],
runs: DVec<RunState>,
drop {
unsafe {
vec::raw::set_len(self.tmp, 0);
}
}
}
fn MergeState<T>() -> MergeState<T> {
let mut tmp = ~[];
vec::reserve(tmp, INITIAL_TMP_STORAGE);
MergeState {
minGallop: MIN_GALLOP,
tmp: tmp,
runs: DVec(),
}
}
impl<T: Ord> &MergeState<T> {
fn pushRun(runBase: uint, runLen: uint) {
let tmp = RunState{base: runBase, len: runLen};
self.runs.push(tmp);
}
fn mergeAt(n: uint, array: &[mut T]) {
let mut size = self.runs.len();
assert size >= 2;
assert n == size-2 || n == size-3;
do self.runs.borrow_mut |arr| {
let mut b1 = arr[n].base;
let mut l1 = arr[n].len;
let b2 = arr[n+1].base;
let l2 = arr[n+1].len;
assert l1 > 0 && l2 > 0;
assert b1 + l1 == b2;
arr[n].len = l1 + l2;
if n == size-3 {
arr[n+1].base = arr[n+2].base;
arr[n+1].len = arr[n+2].len;
}
let slice = vec::mut_view(array, b1, b1+l1);
let k = gallopRight(&const array[b2], slice, 0);
b1 += k;
l1 -= k;
if l1 != 0 {
let slice = vec::mut_view(array, b2, b2+l2);
let l2 = gallopLeft(
&const array[b1+l1-1],slice,l2-1);
if l2 > 0 {
if l1 <= l2 {
self.mergeLo(array, b1, l1, b2, l2);
} else {
self.mergeHi(array, b1, l1, b2, l2);
}
}
}
}
self.runs.pop();
}
fn mergeLo(array: &[mut T], base1: uint, len1: uint, base2: uint, len2: uint) {
assert len1 != 0 && len2 != 0 && base1+len1 == base2;
vec::reserve(self.tmp, len1);
unsafe {
vec::raw::set_len(self.tmp, len1);
moveVec(self.tmp, 0, array, base1, len1);
}
let mut c1 = 0;
let mut c2 = base2;
let mut dest = base1;
let mut len1 = len1;
let mut len2 = len2;
array[dest] <-> array[c2];
dest += 1; c2 += 1; len2 -= 1;
if len2 == 0 {
unsafe {
moveVec(array, dest, self.tmp, 0, len1);
vec::raw::set_len(self.tmp, 0); // Forget the elements
}
return;
}
if len1 == 1 {
unsafe {
moveVec(array, dest, array, c2, len2);
array[dest+len2] <-> self.tmp[c1];
vec::raw::set_len(self.tmp, 0); // Forget the element
}
return;
}
let mut minGallop = self.minGallop;
loop {
let mut count1 = 0;
let mut count2 = 0;
let mut breakOuter = false;
loop {
assert len1 > 1 && len2 != 0;
if array[c2] < self.tmp[c1] {
array[dest] <-> array[c2];
dest += 1; c2 += 1; len2 -= 1;
count2 += 1; count1 = 0;
if len2 == 0 {
breakOuter = true;
}
} else {
array[dest] <-> self.tmp[c1];
dest += 1; c1 += 1; len1 -= 1;
count1 += 1; count2 = 0;
if len1 == 1 {
breakOuter = true;
}
}
if breakOuter || ((count1 | count2) >= minGallop) {
break;
}
}
if breakOuter { break; }
// Start to gallop
loop {
assert len1 > 1 && len2 != 0;
let tmpView = vec::mut_view(self.tmp, c1, c1+len1);
count1 = gallopRight(&const array[c2], tmpView, 0);
if count1 != 0 {
unsafe {
moveVec(array, dest, self.tmp, c1, count1);
}
dest += count1; c1 += count1; len1 -= count1;
if len1 <= 1 { breakOuter = true; break; }
}
array[dest] <-> array[c2];
dest += 1; c2 += 1; len2 -= 1;
if len2 == 0 { breakOuter = true; break; }
let tmpView = vec::mut_view(array, c2, c2+len2);
count2 = gallopLeft(&const self.tmp[c1], tmpView, 0);
if count2 != 0 {
unsafe {
moveVec(array, dest, array, c2, count2);
}
dest += count2; c2 += count2; len2 -= count2;
if len2 == 0 { breakOuter = true; break; }
}
array[dest] <-> self.tmp[c1];
dest += 1; c1 += 1; len1 -= 1;
if len1 == 1 { breakOuter = true; break; }
minGallop -= 1;
if !(count1 >= MIN_GALLOP || count2 >= MIN_GALLOP) { break; }
}
if breakOuter { break; }
if minGallop < 0 { minGallop = 0; }
minGallop += 2; // Penalize for leaving gallop
}
self.minGallop = if minGallop < 1 { 1 } else { minGallop };
if len1 == 1 {
assert len2 > 0;
unsafe {
moveVec(array, dest, array, c2, len2);
}
array[dest+len2] <-> self.tmp[c1];
} else if len1 == 0 {
fail fmt!("Method mergeLo violates its contract! %?", len1);
} else {
assert len2 == 0;
assert len1 > 1;
unsafe {
moveVec(array, dest, self.tmp, c1, len1);
}
}
unsafe { vec::raw::set_len(self.tmp, 0); }
}
fn mergeHi(array: &[mut T], base1: uint, len1: uint, base2: uint, len2: uint) {
assert len1 != 1 && len2 != 0 && base1 + len1 == base2;
vec::reserve(self.tmp, len2);
unsafe {
vec::raw::set_len(self.tmp, len2);
moveVec(self.tmp, 0, array, base2, len2);
}
let mut c1 = base1 + len1 - 1;
let mut c2 = len2 - 1;
let mut dest = base2 + len2 - 1;
let mut len1 = len1;
let mut len2 = len2;
array[dest] <-> array[c1];
dest -= 1; c1 -= 1; len1 -= 1;
if len1 == 0 {
unsafe {
moveVec(array, dest-(len2-1), self.tmp, 0, len2);
vec::raw::set_len(self.tmp, 0); // Forget the elements
}
return;
}
if len2 == 1 {
dest -= len1;
c1 -= len1;
unsafe {
moveVec(array, dest+1, array, c1+1, len1);
array[dest] <-> self.tmp[c2];
vec::raw::set_len(self.tmp, 0); // Forget the element
}
return;
}
let mut minGallop = self.minGallop;
loop {
let mut count1 = 0;
let mut count2 = 0;
let mut breakOuter = false;
loop {
assert len1 != 0 && len2 > 1;
if self.tmp[c2] < array[c1] {
array[dest] <-> array[c1];
dest -= 1; c1 -= 1; len1 -= 1;
count1 += 1; count2 = 0;
if len1 == 0 {
breakOuter = true;
}
} else {
array[dest] <-> self.tmp[c2];
dest -= 1; c2 -= 1; len2 -= 1;
count2 += 1; count1 = 0;
if len2 == 1 {
breakOuter = true;
}
}
if breakOuter || ((count1 | count2) >= minGallop) {
break;
}
}
if breakOuter { break; }
// Start to gallop
loop {
assert len2 > 1 && len1 != 0;
let tmpView = vec::mut_view(array, base1, base1+len1);
count1 = len1-gallopRight(&const self.tmp[c2], tmpView, len1-1);
if count1 != 0 {
dest -= count1; c1 -= count1; len1 -= count1;
unsafe {
moveVec(array, dest+1, array, c1+1, count1);
}
if len1 == 0 { breakOuter = true; break; }
}
array[dest] <-> self.tmp[c2];
dest -= 1; c2 -= 1; len2 -= 1;
if len2 == 1 { breakOuter = true; break; }
let tmpView = vec::mut_view(self.tmp, 0, len2);
let gL = gallopLeft(&const array[c1], tmpView, len2-1);
count2 = len2 - gL;
if count2 != 0 {
dest -= count2; c2 -= count2; len2 -= count2;
unsafe {
moveVec(array, dest+1, self.tmp, c2+1, count2);
}
if len2 <= 1 { breakOuter = true; break; }
}
array[dest] <-> array[c1];
dest -= 1; c1 -= 1; len1 -= 1;
if len1 == 0 { breakOuter = true; break; }
minGallop -= 1;
if !(count1 >= MIN_GALLOP || count2 >= MIN_GALLOP) { break; }
}
if breakOuter { break; }
if minGallop < 0 { minGallop = 0; }
minGallop += 2; // Penalize for leaving gallop
}
self.minGallop = if minGallop < 1 { 1 } else { minGallop };
if len2 == 1 {
assert len1 > 0;
dest -= len1;
c1 -= len1;
unsafe {
moveVec(array, dest+1, array, c1+1, len1);
}
array[dest] <-> self.tmp[c2];
} else if len2 == 0 {
fail fmt!("Method mergeHi violates its contract! %?", len2);
} else {
assert len1 == 0;
assert len2 != 0;
unsafe {
moveVec(array, dest-(len2-1), self.tmp, 0, len2);
}
}
unsafe { vec::raw::set_len(self.tmp, 0); }
}
fn mergeCollapse(array: &[mut T]) {
while self.runs.len() > 1 {
let mut n = self.runs.len()-2;
let chk = do self.runs.borrow |arr| {
if n > 0 && arr[n-1].len <= arr[n].len + arr[n+1].len {
if arr[n-1].len < arr[n+1].len { n -= 1; }
true
} else if arr[n].len <= arr[n+1].len {
true
} else {
false
}
};
if !chk { break; }
self.mergeAt(n, array);
}
}
fn mergeForceCollapse(array: &[mut T]) {
while self.runs.len() > 1 {
let mut n = self.runs.len()-2;
if n > 0 {
do self.runs.borrow |arr| {
if arr[n-1].len < arr[n+1].len {
n -= 1;
}
}
}
self.mergeAt(n, array);
}
}
}
// Moves elements to from dest to from
// Unsafe as it makes the from parameter invalid between s2 and s2+len
#[inline(always)]
unsafe fn moveVec<T>(dest: &[mut T], s1: uint, from: &[const T], s2: uint, len: uint) {
assert s1+len <= dest.len() && s2+len <= from.len();
do vec::as_mut_buf(dest) |p, _len| {
let destPtr = ptr::mut_offset(p, s1);
do vec::as_const_buf(from) |p, _len| {
let fromPtr = ptr::const_offset(p, s2);
ptr::memmove(destPtr, fromPtr, len);
}
}
}
#[cfg(test)]
mod test_qsort3 {
#[legacy_exports];