rust/src/libstd/sort.rs

1294 lines
36 KiB
Rust
Raw Normal View History

//! Sorting methods
2012-08-31 18:41:15 -05:00
#[forbid(deprecated_mode)];
2012-09-04 13:23:53 -05:00
use vec::{len, push};
use core::cmp::{Eq, Ord};
2012-09-25 17:53:24 -05:00
use dvec::DVec;
2011-08-12 00:48:08 -05:00
2012-09-04 16:37:47 -05:00
type Le<T> = pure fn(v1: &T, v2: &T) -> bool;
2010-12-21 02:44:06 -06:00
/**
* Merge sort. Returns a new vector containing the sorted list.
*
* Has worst case O(n log n) performance, best case O(n), but
* is not space efficient. This is a stable sort.
*/
pub fn merge_sort<T: Copy>(v: &[const T], le: Le<T>) -> ~[T] {
2012-09-04 16:37:47 -05:00
type Slice = (uint, uint);
2012-02-27 20:32:45 -06:00
return merge_sort_(v, (0u, len(v)), le);
2012-02-27 20:32:45 -06:00
fn merge_sort_<T: Copy>(v: &[const T], slice: Slice, le: Le<T>)
-> ~[T] {
let begin = slice.first();
let end = slice.second();
2012-02-27 20:32:45 -06:00
let v_len = end - begin;
2012-08-01 19:30:05 -05:00
if v_len == 0u { return ~[]; }
if v_len == 1u { return ~[v[begin]]; }
2012-02-27 20:32:45 -06:00
let mid = v_len / 2u + begin;
let a = (begin, mid);
let b = (mid, end);
return merge(le, merge_sort_(v, a, le), merge_sort_(v, b, le));
2012-02-27 20:32:45 -06:00
}
fn merge<T: Copy>(le: Le<T>, a: &[T], b: &[T]) -> ~[T] {
let mut rs = vec::with_capacity(len(a) + len(b));
2012-02-27 20:32:45 -06:00
let a_len = len(a);
let mut a_ix = 0u;
2012-02-27 20:32:45 -06:00
let b_len = len(b);
let mut b_ix = 0u;
2011-07-27 07:19:39 -05:00
while a_ix < a_len && b_ix < b_len {
if le(&a[a_ix], &b[b_ix]) {
rs.push(a[a_ix]);
a_ix += 1u;
} else { rs.push(b[b_ix]); b_ix += 1u; }
}
rs = vec::append(rs, vec::slice(a, a_ix, a_len));
rs = vec::append(rs, vec::slice(b, b_ix, b_len));
2012-08-01 19:30:05 -05:00
return rs;
2010-12-21 02:44:06 -06:00
}
}
fn part<T: Copy>(arr: &[mut T], left: uint,
right: uint, pivot: uint, compare_func: Le<T>) -> uint {
let pivot_value = arr[pivot];
arr[pivot] <-> arr[right];
let mut storage_index: uint = left;
let mut i: uint = left;
2011-07-27 07:19:39 -05:00
while i < right {
if compare_func(&arr[i], &pivot_value) {
arr[i] <-> arr[storage_index];
storage_index += 1u;
}
i += 1u;
}
arr[storage_index] <-> arr[right];
2012-08-01 19:30:05 -05:00
return storage_index;
}
fn qsort<T: Copy>(arr: &[mut T], left: uint,
right: uint, compare_func: Le<T>) {
2011-07-27 07:19:39 -05:00
if right > left {
let pivot = (left + right) / 2u;
let new_pivot = part::<T>(arr, left, right, pivot, compare_func);
2011-07-27 07:19:39 -05:00
if new_pivot != 0u {
// Need to do this check before recursing due to overflow
qsort::<T>(arr, left, new_pivot - 1u, compare_func);
}
qsort::<T>(arr, new_pivot + 1u, right, compare_func);
}
}
/**
* Quicksort. Sorts a mut vector in place.
*
* Has worst case O(n^2) performance, average case O(n log n).
* This is an unstable sort.
*/
pub fn quick_sort<T: Copy>(arr: &[mut T], compare_func: Le<T>) {
2012-08-01 19:30:05 -05:00
if len::<T>(arr) == 0u { return; }
qsort::<T>(arr, 0u, len::<T>(arr) - 1u, compare_func);
}
fn qsort3<T: Copy Ord Eq>(arr: &[mut T], left: int, right: int) {
2012-08-01 19:30:05 -05:00
if right <= left { return; }
let v: T = arr[right];
let mut i: int = left - 1;
let mut j: int = right;
let mut p: int = i;
let mut q: int = j;
loop {
i += 1;
while arr[i] < v { i += 1; }
j -= 1;
while v < arr[j] {
2011-07-27 07:19:39 -05:00
if j == left { break; }
j -= 1;
}
2011-07-27 07:19:39 -05:00
if i >= j { break; }
arr[i] <-> arr[j];
if arr[i] == v {
p += 1;
arr[p] <-> arr[i];
}
if v == arr[j] {
q -= 1;
arr[j] <-> arr[q];
}
}
arr[i] <-> arr[right];
j = i - 1;
i += 1;
let mut k: int = left;
2011-07-27 07:19:39 -05:00
while k < p {
arr[k] <-> arr[j];
k += 1;
j -= 1;
if k == len::<T>(arr) as int { break; }
}
k = right - 1;
2011-07-27 07:19:39 -05:00
while k > q {
arr[i] <-> arr[k];
k -= 1;
i += 1;
2011-07-27 07:19:39 -05:00
if k == 0 { break; }
}
qsort3::<T>(arr, left, j);
qsort3::<T>(arr, i, right);
}
/**
* Fancy quicksort. Sorts a mut vector in place.
*
* Based on algorithm presented by ~[Sedgewick and Bentley]
* (http://www.cs.princeton.edu/~rs/talks/QuicksortIsOptimal.pdf).
* According to these slides this is the algorithm of choice for
* 'randomly ordered keys, abstract compare' & 'small number of key values'.
*
* This is an unstable sort.
*/
pub fn quick_sort3<T: Copy Ord Eq>(arr: &[mut T]) {
if arr.len() <= 1 { return; }
qsort3(arr, 0, (arr.len() - 1) as int);
}
pub trait Sort {
fn qsort(self);
}
impl<T: Copy Ord Eq> &[mut T] : Sort {
fn qsort(self) { quick_sort3(self); }
}
2012-09-25 17:53:24 -05:00
const MIN_MERGE: uint = 64;
const MIN_GALLOP: uint = 7;
const INITIAL_TMP_STORAGE: uint = 128;
2012-10-22 18:33:28 -05:00
pub fn tim_sort<T: Ord>(array: &[mut T]) {
2012-09-25 17:53:24 -05:00
let size = array.len();
if size < 2 {
return;
}
let ms = &MergeState();
ms.array = array;
let min_run = min_run_length(size);
2012-09-25 17:53:24 -05:00
if size < MIN_MERGE {
let init_run_len = count_run_ascending(array);
ms.binarysort(array, init_run_len);
2012-09-25 17:53:24 -05:00
return;
}
let mut idx = 0;
let mut remaining = size;
loop {
let arr = vec::mut_view(array, idx, size);
let mut run_len: uint = count_run_ascending(arr);
2012-09-25 17:53:24 -05:00
if run_len < min_run {
let force = if remaining <= min_run {remaining} else {min_run};
2012-09-25 17:53:24 -05:00
let slice = vec::mut_view(arr, 0, force);
ms.binarysort(slice, run_len);
run_len = force;
2012-09-25 17:53:24 -05:00
}
ms.push_run(idx, run_len);
ms.merge_collapse(array);
2012-09-25 17:53:24 -05:00
idx += run_len;
remaining -= run_len;
2012-09-27 20:44:14 -05:00
if remaining == 0 { break; }
2012-09-25 17:53:24 -05:00
}
2012-09-27 20:44:14 -05:00
ms.merge_force_collapse(array);
2012-09-25 17:53:24 -05:00
}
// Reverse the order of elements in a slice, in place
fn reverse_slice<T>(v: &[mut T], start: uint, end:uint) {
2012-09-25 17:53:24 -05:00
let mut i = start;
while i < end / 2 {
v[i] <-> v[end - i - 1];
i += 1;
}
}
pure fn min_run_length(n: uint) -> uint {
2012-09-25 17:53:24 -05:00
let mut n = n;
let mut r = 0; // becomes 1 if any 1 bits are shifted off
while n >= MIN_MERGE {
r |= n & 1;
n >>= 1;
}
return n + r;
}
fn count_run_ascending<T: Ord>(array: &[mut T]) -> uint {
2012-09-25 17:53:24 -05:00
let size = array.len();
assert size > 0;
if size == 1 { return 1; }
let mut run = 2;
if array[1] < array[0] {
while run < size && array[run] < array[run-1] {
run += 1;
}
reverse_slice(array, 0, run);
2012-09-25 17:53:24 -05:00
} else {
while run < size && array[run] >= array[run-1] {
run += 1;
}
}
2012-09-27 20:44:14 -05:00
2012-09-25 17:53:24 -05:00
return run;
}
pure fn gallop_left<T: Ord>(key: &const T, array: &[const T],
2012-09-27 20:44:14 -05:00
hint: uint) -> uint {
2012-09-25 17:53:24 -05:00
let size = array.len();
assert size != 0 && hint < size;
let mut last_ofs = 0;
2012-09-25 17:53:24 -05:00
let mut ofs = 1;
2012-09-27 20:44:14 -05:00
2012-09-25 17:53:24 -05:00
if *key > array[hint] {
// Gallop right until array[hint+last_ofs] < key <= array[hint+ofs]
let max_ofs = size - hint;
while ofs < max_ofs && *key > array[hint+ofs] {
last_ofs = ofs;
2012-09-25 17:53:24 -05:00
ofs = (ofs << 1) + 1;
if ofs < last_ofs { ofs = max_ofs; } // uint overflow guard
2012-09-25 17:53:24 -05:00
}
if ofs > max_ofs { ofs = max_ofs; }
2012-09-25 17:53:24 -05:00
last_ofs += hint;
2012-09-25 17:53:24 -05:00
ofs += hint;
} else {
let max_ofs = hint + 1;
while ofs < max_ofs && *key <= array[hint-ofs] {
last_ofs = ofs;
2012-09-25 17:53:24 -05:00
ofs = (ofs << 1) + 1;
if ofs < last_ofs { ofs = max_ofs; } // uint overflow guard
2012-09-25 17:53:24 -05:00
}
2012-09-27 20:44:14 -05:00
if ofs > max_ofs { ofs = max_ofs; }
2012-09-25 17:53:24 -05:00
let tmp = last_ofs;
last_ofs = hint - ofs;
2012-09-25 17:53:24 -05:00
ofs = hint - tmp;
}
assert (last_ofs < ofs || last_ofs+1 < ofs+1) && ofs <= size;
2012-09-25 17:53:24 -05:00
last_ofs += 1;
while last_ofs < ofs {
let m = last_ofs + ((ofs - last_ofs) >> 1);
2012-09-25 17:53:24 -05:00
if *key > array[m] {
last_ofs = m+1;
2012-09-25 17:53:24 -05:00
} else {
ofs = m;
}
}
assert last_ofs == ofs;
2012-09-25 17:53:24 -05:00
return ofs;
}
pure fn gallop_right<T: Ord>(key: &const T, array: &[const T],
hint: uint) -> uint {
2012-09-25 17:53:24 -05:00
let size = array.len();
assert size != 0 && hint < size;
let mut last_ofs = 0;
2012-09-25 17:53:24 -05:00
let mut ofs = 1;
2012-09-27 20:44:14 -05:00
2012-09-25 17:53:24 -05:00
if *key >= array[hint] {
// Gallop right until array[hint+last_ofs] <= key < array[hint+ofs]
let max_ofs = size - hint;
while ofs < max_ofs && *key >= array[hint+ofs] {
last_ofs = ofs;
2012-09-25 17:53:24 -05:00
ofs = (ofs << 1) + 1;
if ofs < last_ofs { ofs = max_ofs; }
2012-09-25 17:53:24 -05:00
}
if ofs > max_ofs { ofs = max_ofs; }
2012-09-25 17:53:24 -05:00
last_ofs += hint;
2012-09-27 20:44:14 -05:00
ofs += hint;
2012-09-25 17:53:24 -05:00
} else {
// Gallop left until array[hint-ofs] <= key < array[hint-last_ofs]
let max_ofs = hint + 1;
while ofs < max_ofs && *key < array[hint-ofs] {
last_ofs = ofs;
2012-09-25 17:53:24 -05:00
ofs = (ofs << 1) + 1;
if ofs < last_ofs { ofs = max_ofs; }
2012-09-25 17:53:24 -05:00
}
if ofs > max_ofs { ofs = max_ofs; }
2012-09-25 17:53:24 -05:00
let tmp = last_ofs;
last_ofs = hint - ofs;
2012-09-25 17:53:24 -05:00
ofs = hint - tmp;
}
assert (last_ofs < ofs || last_ofs+1 < ofs+1) && ofs <= size;
2012-09-25 17:53:24 -05:00
last_ofs += 1;
while last_ofs < ofs {
let m = last_ofs + ((ofs - last_ofs) >> 1);
2012-09-25 17:53:24 -05:00
if *key >= array[m] {
last_ofs = m + 1;
2012-09-25 17:53:24 -05:00
} else {
ofs = m;
}
}
assert last_ofs == ofs;
2012-09-25 17:53:24 -05:00
return ofs;
}
struct RunState {
base: uint,
len: uint,
}
struct MergeState<T> {
mut min_gallop: uint,
2012-09-25 17:53:24 -05:00
mut tmp: ~[T],
mut last_hi: bool,
mut last_bsort: bool,
mut mergePt: uint,
mut tmpPt: uint,
mut array: &[mut T],
2012-09-25 17:53:24 -05:00
runs: DVec<RunState>,
drop {
unsafe {
let size = self.tmp.len();
// Move tmp back into invalid part of array
if self.last_bsort {
} else if self.last_hi && size > 0 {
self.mergePt -= self.tmpPt;
move_vec(self.array, self.mergePt, self.tmp, 0, self.tmpPt);
} else if !self.last_hi && size-self.tmpPt > 0 {
move_vec(self.array, self.mergePt,
self.tmp, self.tmpPt, size-self.tmpPt);
}
vec::raw::set_len(&mut self.tmp, 0);
2012-09-25 17:53:24 -05:00
}
}
}
fn MergeState<T>() -> MergeState<T> {
let mut tmp = ~[];
2012-09-27 20:44:14 -05:00
vec::reserve(&mut tmp, INITIAL_TMP_STORAGE);
2012-09-25 17:53:24 -05:00
MergeState {
min_gallop: MIN_GALLOP,
tmp: move tmp,
last_hi: false,
last_bsort: false,
mergePt: 0,
tmpPt: 0,
array: &[mut],
2012-09-25 17:53:24 -05:00
runs: DVec(),
}
}
2012-10-22 21:44:43 -05:00
impl<T: Ord> MergeState<T> {
fn binarysort(&self, array: &[mut T], start: uint) {
let size = array.len();
let mut start = start;
assert start <= size;
if start == 0 { start += 1; }
self.last_bsort = true;
unsafe { vec::raw::set_len(&mut self.tmp, 1); };
while start < size {
unsafe {
move_vec(self.tmp, 0, array, start, 1);
}
let mut left = 0;
let mut right = start;
assert left <= right;
while left < right {
let mid = (left + right) >> 1;
if self.tmp[0] < array[mid] {
right = mid;
} else {
left = mid+1;
}
}
assert left == right;
let mut n = start-left;
unsafe {
move_vec(array, left+1, array, left, n);
}
array[left] <-> self.tmp[0];
start += 1;
}
unsafe { vec::raw::set_len(&mut self.tmp, 0); } // Forget the boxed element
self.last_bsort = false;
}
2012-10-22 21:44:43 -05:00
fn push_run(&self, run_base: uint, run_len: uint) {
let tmp = RunState{base: run_base, len: run_len};
2012-09-25 17:53:24 -05:00
self.runs.push(tmp);
}
2012-10-22 21:44:43 -05:00
fn merge_at(&self, n: uint, array: &[mut T]) {
2012-09-25 17:53:24 -05:00
let mut size = self.runs.len();
assert size >= 2;
assert n == size-2 || n == size-3;
do self.runs.borrow_mut |arr| {
let mut b1 = arr[n].base;
let mut l1 = arr[n].len;
let b2 = arr[n+1].base;
let l2 = arr[n+1].len;
assert l1 > 0 && l2 > 0;
assert b1 + l1 == b2;
arr[n].len = l1 + l2;
if n == size-3 {
arr[n+1].base = arr[n+2].base;
arr[n+1].len = arr[n+2].len;
}
let slice = vec::mut_view(array, b1, b1+l1);
self.mergePt = b1;
let k = gallop_right(&const array[b2], slice, 0);
2012-09-25 17:53:24 -05:00
b1 += k;
l1 -= k;
if l1 != 0 {
let slice = vec::mut_view(array, b2, b2+l2);
self.mergePt = b2;
let l2 = gallop_left(
2012-09-25 17:53:24 -05:00
&const array[b1+l1-1],slice,l2-1);
if l2 > 0 {
if l1 <= l2 {
self.merge_lo(array, b1, l1, b2, l2);
2012-09-25 17:53:24 -05:00
} else {
self.merge_hi(array, b1, l1, b2, l2);
2012-09-25 17:53:24 -05:00
}
}
}
}
self.runs.pop();
self.mergePt = 0;
2012-09-25 17:53:24 -05:00
}
2012-10-22 21:44:43 -05:00
fn merge_lo(&self, array: &[mut T], base1: uint, len1: uint,
base2: uint, len2: uint) {
2012-09-25 17:53:24 -05:00
assert len1 != 0 && len2 != 0 && base1+len1 == base2;
2012-09-27 20:44:14 -05:00
vec::reserve(&mut self.tmp, len1);
self.last_hi = false;
2012-09-25 17:53:24 -05:00
unsafe {
vec::raw::set_len(&mut self.tmp, len1);
move_vec(self.tmp, 0, array, base1, len1);
2012-09-25 17:53:24 -05:00
}
self.tmpPt = 0;
self.mergePt = base1;
2012-09-25 17:53:24 -05:00
let mut c1 = 0;
let mut c2 = base2;
let mut dest = base1;
let mut len1 = len1;
let mut len2 = len2;
array[dest] <-> array[c2];
dest += 1; c2 += 1; len2 -= 1;
self.mergePt += 1;
2012-09-25 17:53:24 -05:00
if len2 == 0 {
unsafe {
move_vec(array, dest, self.tmp, 0, len1);
vec::raw::set_len(&mut self.tmp, 0); // Forget the elements
2012-09-25 17:53:24 -05:00
}
return;
}
if len1 == 1 {
unsafe {
move_vec(array, dest, array, c2, len2);
2012-09-25 17:53:24 -05:00
array[dest+len2] <-> self.tmp[c1];
vec::raw::set_len(&mut self.tmp, 0); // Forget the element
2012-09-25 17:53:24 -05:00
}
return;
}
let mut min_gallop = self.min_gallop;
2012-09-25 17:53:24 -05:00
loop {
let mut count1 = 0;
let mut count2 = 0;
let mut break_outer = false;
2012-09-25 17:53:24 -05:00
loop {
assert len1 > 1 && len2 != 0;
if array[c2] < self.tmp[c1] {
array[dest] <-> array[c2];
dest += 1; c2 += 1; len2 -= 1;
self.mergePt += 1;
2012-09-25 17:53:24 -05:00
count2 += 1; count1 = 0;
if len2 == 0 {
break_outer = true;
2012-09-25 17:53:24 -05:00
}
} else {
array[dest] <-> self.tmp[c1];
dest += 1; c1 += 1; len1 -= 1;
self.mergePt += 1;
self.tmpPt += 1;
2012-09-25 17:53:24 -05:00
count1 += 1; count2 = 0;
if len1 == 1 {
break_outer = true;
2012-09-25 17:53:24 -05:00
}
}
if break_outer || ((count1 | count2) >= min_gallop) {
2012-09-25 17:53:24 -05:00
break;
}
}
if break_outer { break; }
2012-09-25 17:53:24 -05:00
// Start to gallop
loop {
assert len1 > 1 && len2 != 0;
//let tmp_view = vec::const_view(self.tmp, c1, c1+len1);
count1 = gallop_right(&const array[c2],
vec::const_view(self.tmp, c1, c1+len1), 0);
2012-09-25 17:53:24 -05:00
if count1 != 0 {
unsafe {
move_vec(array, dest, self.tmp, c1, count1);
2012-09-25 17:53:24 -05:00
}
dest += count1; c1 += count1; len1 -= count1;
self.mergePt += count1; self.tmpPt += count1;
if len1 <= 1 { break_outer = true; break; }
2012-09-25 17:53:24 -05:00
}
array[dest] <-> array[c2];
dest += 1; c2 += 1; len2 -= 1;
self.mergePt += 1;
if len2 == 0 { break_outer = true; break; }
2012-09-25 17:53:24 -05:00
let tmp_view = vec::const_view(array, c2, c2+len2);
count2 = gallop_left(&const self.tmp[c1], tmp_view, 0);
2012-09-25 17:53:24 -05:00
if count2 != 0 {
unsafe {
move_vec(array, dest, array, c2, count2);
2012-09-25 17:53:24 -05:00
}
dest += count2; c2 += count2; len2 -= count2;
self.mergePt += count2;
if len2 == 0 { break_outer = true; break; }
2012-09-25 17:53:24 -05:00
}
array[dest] <-> self.tmp[c1];
dest += 1; c1 += 1; len1 -= 1;
self.mergePt += 1; self.tmpPt += 1;
if len1 == 1 { break_outer = true; break; }
min_gallop -= 1;
if !(count1 >= MIN_GALLOP || count2 >= MIN_GALLOP) {
break;
2012-09-27 20:44:14 -05:00
}
2012-09-25 17:53:24 -05:00
}
if break_outer { break; }
if min_gallop < 0 { min_gallop = 0; }
min_gallop += 2; // Penalize for leaving gallop
2012-09-25 17:53:24 -05:00
}
self.min_gallop = if min_gallop < 1 { 1 } else { min_gallop };
2012-09-25 17:53:24 -05:00
if len1 == 1 {
assert len2 > 0;
unsafe {
move_vec(array, dest, array, c2, len2);
2012-09-25 17:53:24 -05:00
}
array[dest+len2] <-> self.tmp[c1];
} else if len1 == 0 {
2012-10-06 12:44:56 -05:00
fail ~"Comparison violates its contract!";
2012-09-25 17:53:24 -05:00
} else {
assert len2 == 0;
assert len1 > 1;
unsafe {
move_vec(array, dest, self.tmp, c1, len1);
2012-09-25 17:53:24 -05:00
}
}
self.tmpPt = 0;
unsafe { vec::raw::set_len(&mut self.tmp, 0); }
2012-09-25 17:53:24 -05:00
}
2012-10-22 21:44:43 -05:00
fn merge_hi(&self, array: &[mut T], base1: uint, len1: uint,
base2: uint, len2: uint) {
2012-09-25 17:53:24 -05:00
assert len1 != 1 && len2 != 0 && base1 + len1 == base2;
vec::reserve(&mut self.tmp, len2);
self.last_hi = true;
2012-09-25 17:53:24 -05:00
unsafe {
vec::raw::set_len(&mut self.tmp, len2);
move_vec(self.tmp, 0, array, base2, len2);
2012-09-25 17:53:24 -05:00
}
let mut c1 = base1 + len1 - 1;
let mut c2 = len2 - 1;
let mut dest = base2 + len2 - 1;
let mut len1 = len1;
let mut len2 = len2;
self.mergePt = dest;
self.tmpPt = len2 - 1;
2012-09-25 17:53:24 -05:00
array[dest] <-> array[c1];
dest -= 1; c1 -= 1; len1 -= 1;
if len1 == 0 {
unsafe {
move_vec(array, dest-(len2-1), self.tmp, 0, len2);
vec::raw::set_len(&mut self.tmp, 0); // Forget the elements
2012-09-25 17:53:24 -05:00
}
return;
}
if len2 == 1 {
dest -= len1;
c1 -= len1;
unsafe {
move_vec(array, dest+1, array, c1+1, len1);
2012-09-25 17:53:24 -05:00
array[dest] <-> self.tmp[c2];
vec::raw::set_len(&mut self.tmp, 0); // Forget the element
2012-09-25 17:53:24 -05:00
}
return;
}
let mut min_gallop = self.min_gallop;
2012-09-25 17:53:24 -05:00
loop {
let mut count1 = 0;
let mut count2 = 0;
let mut break_outer = false;
2012-09-25 17:53:24 -05:00
loop {
assert len1 != 0 && len2 > 1;
if self.tmp[c2] < array[c1] {
array[dest] <-> array[c1];
dest -= 1; c1 -= 1; len1 -= 1;
self.mergePt -= 1;
2012-09-25 17:53:24 -05:00
count1 += 1; count2 = 0;
if len1 == 0 {
break_outer = true;
2012-09-25 17:53:24 -05:00
}
} else {
array[dest] <-> self.tmp[c2];
dest -= 1; c2 -= 1; len2 -= 1;
self.mergePt -= 1; self.tmpPt -= 1;
2012-09-25 17:53:24 -05:00
count2 += 1; count1 = 0;
if len2 == 1 {
break_outer = true;
2012-09-25 17:53:24 -05:00
}
}
if break_outer || ((count1 | count2) >= min_gallop) {
2012-09-25 17:53:24 -05:00
break;
}
}
if break_outer { break; }
2012-09-27 20:44:14 -05:00
2012-09-25 17:53:24 -05:00
// Start to gallop
loop {
assert len2 > 1 && len1 != 0;
let tmp_view = vec::mut_view(array, base1, base1+len1);
count1 = len1 - gallop_right(
&const self.tmp[c2], tmp_view, len1-1);
2012-09-25 17:53:24 -05:00
if count1 != 0 {
dest -= count1; c1 -= count1; len1 -= count1;
self.mergePt -= count1;
2012-09-25 17:53:24 -05:00
unsafe {
move_vec(array, dest+1, array, c1+1, count1);
2012-09-25 17:53:24 -05:00
}
if len1 == 0 { break_outer = true; break; }
2012-09-25 17:53:24 -05:00
}
array[dest] <-> self.tmp[c2];
dest -= 1; c2 -= 1; len2 -= 1;
self.mergePt -= 1; self.tmpPt -= 1;
if len2 == 1 { break_outer = true; break; }
2012-09-25 17:53:24 -05:00
//let tmp_view = vec::mut_view(self.tmp, 0, len2);
let count2 = len2 - gallop_left(&const array[c1],
vec::mut_view(self.tmp, 0, len2), len2-1);
2012-09-25 17:53:24 -05:00
if count2 != 0 {
dest -= count2; c2 -= count2; len2 -= count2;
self.mergePt -= count2; self.tmpPt -= count2;
2012-09-25 17:53:24 -05:00
unsafe {
move_vec(array, dest+1, self.tmp, c2+1, count2);
2012-09-25 17:53:24 -05:00
}
if len2 <= 1 { break_outer = true; break; }
2012-09-25 17:53:24 -05:00
}
array[dest] <-> array[c1];
dest -= 1; c1 -= 1; len1 -= 1;
self.mergePt -= 1;
if len1 == 0 { break_outer = true; break; }
min_gallop -= 1;
if !(count1 >= MIN_GALLOP || count2 >= MIN_GALLOP) {
break;
2012-09-27 20:44:14 -05:00
}
2012-09-25 17:53:24 -05:00
}
2012-09-27 20:44:14 -05:00
if break_outer { break; }
if min_gallop < 0 { min_gallop = 0; }
min_gallop += 2; // Penalize for leaving gallop
2012-09-25 17:53:24 -05:00
}
self.min_gallop = if min_gallop < 1 { 1 } else { min_gallop };
2012-09-27 20:44:14 -05:00
2012-09-25 17:53:24 -05:00
if len2 == 1 {
assert len1 > 0;
dest -= len1;
c1 -= len1;
unsafe {
move_vec(array, dest+1, array, c1+1, len1);
2012-09-25 17:53:24 -05:00
}
array[dest] <-> self.tmp[c2];
} else if len2 == 0 {
2012-10-06 12:44:56 -05:00
fail ~"Coparison violates its contract!";
2012-09-25 17:53:24 -05:00
} else {
assert len1 == 0;
assert len2 != 0;
unsafe {
move_vec(array, dest-(len2-1), self.tmp, 0, len2);
2012-09-25 17:53:24 -05:00
}
}
self.tmpPt = 0;
unsafe { vec::raw::set_len(&mut self.tmp, 0); }
2012-09-25 17:53:24 -05:00
}
2012-10-22 21:44:43 -05:00
fn merge_collapse(&self, array: &[mut T]) {
2012-09-25 17:53:24 -05:00
while self.runs.len() > 1 {
let mut n = self.runs.len()-2;
let chk = do self.runs.borrow |arr| {
if n > 0 && arr[n-1].len <= arr[n].len + arr[n+1].len {
if arr[n-1].len < arr[n+1].len { n -= 1; }
true
} else if arr[n].len <= arr[n+1].len {
true
} else {
false
}
};
if !chk { break; }
self.merge_at(n, array);
2012-09-25 17:53:24 -05:00
}
}
2012-10-22 21:44:43 -05:00
fn merge_force_collapse(&self, array: &[mut T]) {
2012-09-25 17:53:24 -05:00
while self.runs.len() > 1 {
let mut n = self.runs.len()-2;
if n > 0 {
do self.runs.borrow |arr| {
if arr[n-1].len < arr[n+1].len {
n -= 1;
}
}
}
self.merge_at(n, array);
2012-09-25 17:53:24 -05:00
}
}
}
// Moves elements to from dest to from
// Unsafe as it makes the from parameter invalid between s2 and s2+len
#[inline(always)]
unsafe fn move_vec<T>(dest: &[mut T], s1: uint,
2012-09-27 20:44:14 -05:00
from: &[const T], s2: uint, len: uint) {
2012-09-25 17:53:24 -05:00
assert s1+len <= dest.len() && s2+len <= from.len();
do vec::as_mut_buf(dest) |p, _len| {
let destPtr = ptr::mut_offset(p, s1);
do vec::as_const_buf(from) |p, _len| {
let fromPtr = ptr::const_offset(p, s2);
ptr::memmove(destPtr, fromPtr, len);
}
}
}
2012-01-17 21:05:07 -06:00
#[cfg(test)]
mod test_qsort3 {
#[legacy_exports];
2012-08-31 18:41:15 -05:00
fn check_sort(v1: &[mut int], v2: &[mut int]) {
2012-01-17 21:05:07 -06:00
let len = vec::len::<int>(v1);
quick_sort3::<int>(v1);
let mut i = 0u;
2012-01-17 21:05:07 -06:00
while i < len {
log(debug, v2[i]);
assert (v2[i] == v1[i]);
i += 1u;
}
}
#[test]
fn test() {
{
let v1 = ~[mut 3, 7, 4, 5, 2, 9, 5, 8];
let v2 = ~[mut 2, 3, 4, 5, 5, 7, 8, 9];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
{
let v1 = ~[mut 1, 1, 1];
let v2 = ~[mut 1, 1, 1];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
{
let v1: ~[mut int] = ~[mut];
let v2: ~[mut int] = ~[mut];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
{ let v1 = ~[mut 9]; let v2 = ~[mut 9]; check_sort(v1, v2); }
2012-01-17 21:05:07 -06:00
{
let v1 = ~[mut 9, 3, 3, 3, 9];
let v2 = ~[mut 3, 3, 3, 9, 9];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
}
}
#[cfg(test)]
mod test_qsort {
#[legacy_exports];
2012-08-31 18:41:15 -05:00
fn check_sort(v1: &[mut int], v2: &[mut int]) {
2012-01-17 21:05:07 -06:00
let len = vec::len::<int>(v1);
pure fn leual(a: &int, b: &int) -> bool { *a <= *b }
2012-09-27 20:44:14 -05:00
quick_sort::<int>(v1, leual);
let mut i = 0u;
2012-01-17 21:05:07 -06:00
while i < len {
log(debug, v2[i]);
assert (v2[i] == v1[i]);
i += 1u;
}
}
#[test]
fn test() {
{
let v1 = ~[mut 3, 7, 4, 5, 2, 9, 5, 8];
let v2 = ~[mut 2, 3, 4, 5, 5, 7, 8, 9];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
{
let v1 = ~[mut 1, 1, 1];
let v2 = ~[mut 1, 1, 1];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
{
let v1: ~[mut int] = ~[mut];
let v2: ~[mut int] = ~[mut];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
{ let v1 = ~[mut 9]; let v2 = ~[mut 9]; check_sort(v1, v2); }
2012-01-17 21:05:07 -06:00
{
let v1 = ~[mut 9, 3, 3, 3, 9];
let v2 = ~[mut 3, 3, 3, 9, 9];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
}
// Regression test for #750
#[test]
fn test_simple() {
let names = ~[mut 2, 1, 3];
2012-01-17 21:05:07 -06:00
let expected = ~[1, 2, 3];
2012-01-17 21:05:07 -06:00
2012-09-27 20:44:14 -05:00
do sort::quick_sort(names) |x, y| { int::le(*x, *y) };
2012-01-17 21:05:07 -06:00
2012-09-19 00:35:42 -05:00
let immut_names = vec::from_mut(move names);
2012-01-17 21:05:07 -06:00
let pairs = vec::zip(expected, immut_names);
for vec::each(pairs) |p| {
let (a, b) = *p;
2012-08-22 19:24:52 -05:00
debug!("%d %d", a, b);
assert (a == b);
}
2012-01-17 21:05:07 -06:00
}
}
#[cfg(test)]
mod tests {
#[legacy_exports];
2012-01-17 21:05:07 -06:00
2012-08-31 18:41:15 -05:00
fn check_sort(v1: &[int], v2: &[int]) {
2012-01-17 21:05:07 -06:00
let len = vec::len::<int>(v1);
pub pure fn le(a: &int, b: &int) -> bool { *a <= *b }
2012-02-03 04:53:00 -06:00
let f = le;
2012-09-27 20:44:14 -05:00
let v3 = merge_sort::<int>(v1, f);
let mut i = 0u;
2012-01-17 21:05:07 -06:00
while i < len {
log(debug, v3[i]);
assert (v3[i] == v2[i]);
i += 1u;
}
}
#[test]
fn test() {
{
let v1 = ~[3, 7, 4, 5, 2, 9, 5, 8];
let v2 = ~[2, 3, 4, 5, 5, 7, 8, 9];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
{ let v1 = ~[1, 1, 1]; let v2 = ~[1, 1, 1]; check_sort(v1, v2); }
{ let v1:~[int] = ~[]; let v2:~[int] = ~[]; check_sort(v1, v2); }
{ let v1 = ~[9]; let v2 = ~[9]; check_sort(v1, v2); }
2012-01-17 21:05:07 -06:00
{
let v1 = ~[9, 3, 3, 3, 9];
let v2 = ~[3, 3, 3, 9, 9];
2012-01-17 21:05:07 -06:00
check_sort(v1, v2);
}
}
#[test]
fn test_merge_sort_mutable() {
pub pure fn le(a: &int, b: &int) -> bool { *a <= *b }
let v1 = ~[mut 3, 2, 1];
2012-09-27 20:44:14 -05:00
let v2 = merge_sort(v1, le);
assert v2 == ~[1, 2, 3];
2012-01-17 21:05:07 -06:00
}
#[test]
fn test_merge_sort_stability()
{
// tjc: funny that we have to use parens
pure fn ile(x: &(&static/str), y: &(&static/str)) -> bool
{
unsafe // to_lower is not pure...
{
let x = x.to_lower();
let y = y.to_lower();
x <= y
}
}
let names1 = ~["joe bob", "Joe Bob", "Jack Brown", "JOE Bob",
"Sally Mae", "JOE BOB", "Alex Andy"];
let names2 = ~["Alex Andy", "Jack Brown", "joe bob", "Joe Bob",
"JOE Bob", "JOE BOB", "Sally Mae"];
2012-09-27 20:44:14 -05:00
let names3 = merge_sort(names1, ile);
assert names3 == names2;
}
2012-01-17 21:05:07 -06:00
}
#[cfg(test)]
mod test_tim_sort {
struct CVal {
val: ~float,
}
impl CVal: Ord {
pure fn lt(other: &CVal) -> bool {
unsafe {
let rng = rand::Rng();
if rng.gen_float() > 0.995 { fail ~"It's happening!!!"; }
}
self.val < other.val
}
pure fn le(other: &CVal) -> bool { self.val <= other.val }
pure fn gt(other: &CVal) -> bool { self.val > other.val }
pure fn ge(other: &CVal) -> bool { self.val >= other.val }
}
2012-09-27 21:01:43 -05:00
fn check_sort(v1: &[mut int], v2: &[mut int]) {
let len = vec::len::<int>(v1);
tim_sort::<int>(v1);
2012-09-27 21:01:43 -05:00
let mut i = 0u;
while i < len {
log(debug, v2[i]);
assert (v2[i] == v1[i]);
i += 1u;
}
}
#[test]
fn test() {
{
let v1 = ~[mut 3, 7, 4, 5, 2, 9, 5, 8];
let v2 = ~[mut 2, 3, 4, 5, 5, 7, 8, 9];
check_sort(v1, v2);
}
{
let v1 = ~[mut 1, 1, 1];
let v2 = ~[mut 1, 1, 1];
check_sort(v1, v2);
}
{
let v1: ~[mut int] = ~[mut];
let v2: ~[mut int] = ~[mut];
check_sort(v1, v2);
}
{ let v1 = ~[mut 9]; let v2 = ~[mut 9]; check_sort(v1, v2); }
{
let v1 = ~[mut 9, 3, 3, 3, 9];
let v2 = ~[mut 3, 3, 3, 9, 9];
check_sort(v1, v2);
}
}
#[test]
#[should_fail]
fn crash_test() {
let rng = rand::Rng();
let mut arr = do vec::from_fn(1000) |_i| {
let randVal = rng.gen_float();
CVal { val: ~randVal }
};
tim_sort(arr);
fail ~"Guarantee the fail";
}
}
2012-10-22 18:33:28 -05:00
#[cfg(test)]
mod big_tests {
2012-10-22 18:33:28 -05:00
#[test]
fn test_unique() {
let low = 5;
let high = 10;
2012-10-22 18:33:28 -05:00
tabulate_unique(low, high);
}
#[test]
fn test_managed() {
let low = 5;
let high = 10;
2012-10-22 18:33:28 -05:00
tabulate_managed(low, high);
}
#[test]
fn test_linear() {
2012-10-22 18:33:28 -05:00
tabulate_linear();
}
fn multiplyVec<T: Copy>(arr: &[const T], num: uint) -> ~[mut T] {
let size = arr.len();
let res = do vec::from_fn(num) |i| {
arr[i % size]
};
vec::to_mut(move res)
}
fn makeRange(n: uint) -> ~[uint] {
let one = do vec::from_fn(n) |i| { i };
let mut two = copy one;
vec::reverse(two);
vec::append(move two, one)
}
2012-10-22 18:33:28 -05:00
fn tabulate_unique(lo: uint, hi: uint) {
fn isSorted<T: Ord>(arr: &[const T]) {
for uint::range(0, arr.len()-1) |i| {
if arr[i] > arr[i+1] {
fail ~"Array not sorted";
}
}
}
let rng = rand::Rng();
for uint::range(lo, hi) |i| {
let n = 1 << i;
let arr = do vec::from_fn(n) |_i| {
~rng.gen_float()
};
let arr = vec::to_mut(move arr);
tim_sort(arr); // *sort
isSorted(arr);
vec::reverse(arr);
tim_sort(arr); // \sort
isSorted(arr);
tim_sort(arr); // /sort
isSorted(arr);
for 3.times {
let i1 = rng.gen_uint_range(0, n);
let i2 = rng.gen_uint_range(0, n);
arr[i1] <-> arr[i2];
}
tim_sort(arr); // 3sort
isSorted(arr);
if n >= 10 {
let size = arr.len();
let mut idx = 1;
while idx <= 10 {
arr[size-idx] = ~rng.gen_float();
idx += 1;
}
}
tim_sort(arr); // +sort
isSorted(arr);
for (n/100).times {
let idx = rng.gen_uint_range(0, n);
arr[idx] = ~rng.gen_float();
}
tim_sort(arr);
isSorted(arr);
let arr = if n > 4 {
let part = vec::view(arr, 0, 4);
multiplyVec(part, n)
} else { move arr };
tim_sort(arr); // ~sort
isSorted(arr);
let mut arr = vec::from_elem(n, ~(-0.5));
tim_sort(arr); // =sort
isSorted(arr);
let half = n / 2;
let mut arr = makeRange(half).map(|i| ~(*i as float));
tim_sort(arr); // !sort
isSorted(arr);
}
2012-10-22 18:33:28 -05:00
}
2012-10-22 18:33:28 -05:00
fn tabulate_managed(lo: uint, hi: uint) {
fn isSorted<T: Ord>(arr: &[const @T], expected_refcount: uint) {
for uint::range(0, arr.len()-1) |i| {
if arr[i] > arr[i+1] {
fail ~"Array not sorted";
}
assert sys::refcount(arr[i]) == expected_refcount;
}
}
let rng = rand::Rng();
for uint::range(lo, hi) |i| {
let n = 1 << i;
let arr = do vec::from_fn(n) |_i| {
@rng.gen_float()
};
let arr = vec::to_mut(move arr);
tim_sort(arr); // *sort
isSorted(arr, 1);
vec::reverse(arr);
tim_sort(arr); // \sort
isSorted(arr, 1);
tim_sort(arr); // /sort
isSorted(arr, 1);
for 3.times {
let i1 = rng.gen_uint_range(0, n);
let i2 = rng.gen_uint_range(0, n);
arr[i1] <-> arr[i2];
}
tim_sort(arr); // 3sort
isSorted(arr, 1);
if n >= 10 {
let size = arr.len();
let mut idx = 1;
while idx <= 10 {
arr[size-idx] = @rng.gen_float();
idx += 1;
}
}
tim_sort(arr); // +sort
isSorted(arr, 1);
for (n/100).times {
let idx = rng.gen_uint_range(0, n);
arr[idx] = @rng.gen_float();
}
tim_sort(arr);
isSorted(arr, 1);
let arr = if n > 4 {
let part = vec::view(arr, 0, 4);
multiplyVec(part, n)
} else { move arr };
tim_sort(arr); // ~sort
isSorted(arr, n/4+1);
let mut arr = vec::from_elem(n, @(-0.5));
tim_sort(arr); // =sort
isSorted(arr, n);
let half = n / 2;
let mut arr = makeRange(half).map(|i| @(*i as float));
tim_sort(arr); // !sort
isSorted(arr, 1);
}
}
2012-10-22 18:33:28 -05:00
struct LVal {
val: uint,
key: fn(@uint),
drop {
let x = unsafe { task::local_data::local_data_get(self.key) };
match x {
Some(@y) => {
unsafe {
task::local_data::local_data_set(self.key, @(y+1));
}
}
_ => fail ~"Expected key to work",
}
}
}
impl LVal: Ord {
pure fn lt(other: &LVal) -> bool { self.val < other.val }
pure fn le(other: &LVal) -> bool { self.val <= other.val }
pure fn gt(other: &LVal) -> bool { self.val > other.val }
pure fn ge(other: &LVal) -> bool { self.val >= other.val }
}
2012-10-22 18:33:28 -05:00
fn tabulate_linear() {
fn key(_x: @uint) { }
fn isSorted<T: Ord>(arr: &[const T]) {
for uint::range(0, arr.len()-1) |i| {
if arr[i] > arr[i+1] {
fail ~"Array not sorted";
}
}
}
let n = 1000;
unsafe {
task::local_data::local_data_set(key, @0u);
}
{
let mut arr = do vec::from_fn(n) |i| {
LVal { val: i, key: key }
};
tim_sort(arr);
isSorted(arr);
}
let @dropped = unsafe {
task::local_data::local_data_get(key).get()
};
assert n == dropped;
}
}
2012-09-27 21:01:43 -05:00
2010-12-21 02:44:06 -06:00
// Local Variables:
// mode: rust;
// fill-column: 78;
// indent-tabs-mode: nil
// c-basic-offset: 4
// buffer-file-coding-system: utf-8-unix
// End: