rust/src/libstd/treemap.rs

735 lines
22 KiB
Rust
Raw Normal View History

2013-01-14 09:27:26 -06:00
// Copyright 2013 The Rust Project Developers. See the COPYRIGHT
// file at the top-level directory of this distribution and at
// http://rust-lang.org/COPYRIGHT.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
2013-01-14 09:27:26 -06:00
//! An ordered map and set implemented as self-balancing binary search
//! trees. The only requirement for the types is that the key implements
//! `Ord`, and that the `lt` method provides a total ordering.
#[forbid(deprecated_mode)];
2012-09-04 13:23:53 -05:00
use core::cmp::{Eq, Ord};
use core::option::{Option, Some, None};
use core::prelude::*;
2013-01-14 09:27:26 -06:00
// This is implemented as an AA tree, which is a simplified variation of
// a red-black tree where red (horizontal) nodes can only be added
// as a right child. The time complexity is the same, and re-balancing
// operations are more frequent but also cheaper.
2012-05-23 19:18:31 -05:00
2013-01-14 09:27:26 -06:00
// TODO: lazy iteration, for O(n) Eq and set operations instead of O(n*log(m))
2013-01-14 09:27:26 -06:00
// TODO: implement Ord for TreeSet
// could be superset/subset-based or in-order lexicographic comparison... but
// there are methods for is_superset/is_subset so lexicographic is more useful
// TODO: (possibly) implement the overloads Python does for sets:
// * union: |
// * intersection: &
// * difference: -
// * symmetric difference: ^
// These would be convenient since the methods will work like `each`
/// An ordered map from keys of type `K` to values of type `V`, stored as a
/// tree of owned `TreeNode`s. Keys only need to implement `Ord`.
pub struct TreeMap<K: Ord, V> {
// Root of the tree; `None` when the map holds no entries.
priv root: Option<~TreeNode<K, V>>,
// Number of key-value pairs; adjusted by `insert` and `remove`.
priv length: uint
}
// FIXME: this is a naive O(n*log(m)) implementation, could be O(n)
impl <K: Ord, V: Eq> TreeMap<K, V>: Eq {
    /// Return true if both maps hold the same number of entries and every
    /// key of `self` is present in `other` with an equal value.
    pure fn eq(&self, other: &TreeMap<K, V>) -> bool {
        // Maps of different sizes can never be equal; once the sizes match,
        // checking containment in one direction is sufficient.
        if self.len() != other.len() {
            return false
        }

        for self.each |x, y| {
            match other.find(x) {
                Some(z) => if z != y { return false },
                None => return false
            }
        }
        true
    }

    /// Return true if the maps differ; the exact negation of `eq`.
    pure fn ne(&self, other: &TreeMap<K, V>) -> bool {
        !self.eq(other)
    }
}
2013-01-14 09:27:26 -06:00
impl <K: Ord, V> TreeMap<K, V> {
    /// Create an empty TreeMap
    static pure fn new() -> TreeMap<K, V> { TreeMap{root: None, length: 0} }

    /// Return the number of elements in the map
    pure fn len(&self) -> uint { self.length }

    /// Return true if the map contains no elements
    pure fn is_empty(&self) -> bool { self.root.is_none() }

    /// Return true if the map contains some elements
    pure fn is_not_empty(&self) -> bool { self.root.is_some() }

    /// Visit all key-value pairs in order
    pure fn each(&self, f: fn(&K, &V) -> bool) { each(&self.root, f) }

    /// Visit all keys in order
    pure fn each_key(&self, f: fn(&K) -> bool) { self.each(|k, _| f(k)) }

    /// Visit all values in order
    pure fn each_value(&self, f: fn(&V) -> bool) { self.each(|_, v| f(v)) }

    /// Visit all key-value pairs in reverse order
    pure fn each_reverse(&self, f: fn(&K, &V) -> bool) {
        each_reverse(&self.root, f);
    }

    /// Visit all keys in reverse order
    pure fn each_key_reverse(&self, f: fn(&K) -> bool) {
        self.each_reverse(|k, _| f(k))
    }

    /// Visit all values in reverse order
    pure fn each_value_reverse(&self, f: fn(&V) -> bool) {
        self.each_reverse(|_, v| f(v))
    }

    /// Return true if the map contains a value for the specified key
    pure fn contains_key(&self, key: &K) -> bool {
        self.find(key).is_some()
    }

    /// Return the value corresponding to the key in the map, or `None`
    /// when the key is absent.
    ///
    /// The search walks down from the root without recursion. Keys are
    /// compared with `<` only: a node matches when neither key is less
    /// than the other.
    pure fn find(&self, key: &K) -> Option<&self/V> {
        let mut current: &self/Option<~TreeNode<K, V>> = &self.root;
        loop {
            match *current {
                Some(ref r) => {
                    let r: &self/~TreeNode<K, V> = r; // FIXME: #3148
                    if *key < r.key {
                        current = &r.left;
                    } else if r.key < *key {
                        current = &r.right;
                    } else {
                        return Some(&r.value);
                    }
                }
                None => return None
            }
        }
    }

    /// Insert a key-value pair into the map. An existing value for a
    /// key is replaced by the new value. Return true if the key did
    /// not already exist in the map.
    fn insert(&mut self, key: K, value: V) -> bool {
        let ret = insert(&mut self.root, key, value);
        // Only a genuinely new key grows the map; a replacement does not.
        if ret { self.length += 1 }
        ret
    }

    /// Remove a key-value pair from the map. Return true if the key
    /// was present in the map, otherwise false.
    fn remove(&mut self, key: &K) -> bool {
        let ret = remove(&mut self.root, key);
        if ret { self.length -= 1 }
        ret
    }
}
2013-01-14 09:27:26 -06:00
/// An ordered set of `T` values, implemented as a thin wrapper around a
/// `TreeMap` whose values are the unit type.
pub struct TreeSet<T: Ord> {
// The set's elements are the keys of this map; the `()` values carry no data.
priv map: TreeMap<T, ()>
}
impl <T: Ord> TreeSet<T>: iter::BaseIter<T> {
    /// Visit all values in order
    pure fn each(&self, f: fn(&T) -> bool) {
        // The set's values are the keys of the backing map.
        self.map.each(|k, _| f(k))
    }

    /// Report the number of stored values as the size hint.
    pure fn size_hint(&self) -> Option<uint> {
        let count = self.map.len();
        Some(count)
    }
}
impl <T: Ord> TreeSet<T>: Eq {
    /// Two sets are equal exactly when their backing maps are equal.
    pure fn eq(&self, other: &TreeSet<T>) -> bool {
        self.map.eq(&other.map)
    }

    /// Two sets differ exactly when their backing maps differ.
    pure fn ne(&self, other: &TreeSet<T>) -> bool {
        self.map.ne(&other.map)
    }
}
impl <T: Ord> TreeSet<T> {
    /// Create an empty TreeSet
    static pure fn new() -> TreeSet<T> { TreeSet{map: TreeMap::new()} }

    /// Return the number of elements in the set
    pure fn len(&self) -> uint { self.map.len() }

    /// Return true if the set contains no elements
    pure fn is_empty(&self) -> bool { self.map.is_empty() }

    /// Return true if the set contains some elements
    pure fn is_not_empty(&self) -> bool { self.map.is_not_empty() }

    /// Visit all values in reverse order
    pure fn each_reverse(&self, f: fn(&T) -> bool) {
        self.map.each_key_reverse(f)
    }

    /// Return true if the set contains a value
    pure fn contains(&self, value: &T) -> bool { self.map.contains_key(value) }

    /// Add a value to the set. Return true if the value was not
    /// already present in the set.
    fn insert(&mut self, value: T) -> bool { self.map.insert(value, ()) }

    /// Remove a value from the set. Return true if the value was
    /// present in the set.
    fn remove(&mut self, value: &T) -> bool { self.map.remove(value) }

    /// Return true if the set has no elements in common with `other`.
    /// This is equivalent to checking for an empty intersection.
    pure fn is_disjoint(&self, other: &TreeSet<T>) -> bool {
        // FIXME: this is a naive O(n*log(m)) implementation, could be O(n)
        !iter::any(self, |x| other.contains(x))
    }

    /// Check if the set is a subset of another
    pure fn is_subset(&self, other: &TreeSet<T>) -> bool {
        // FIXME: this is a naive O(n*log(m)) implementation, could be O(n)
        // A subset has no element that is missing from `other`.
        !iter::any(self, |x| !other.contains(x))
    }

    /// Check if the set is a superset of another
    pure fn is_superset(&self, other: &TreeSet<T>) -> bool {
        other.is_subset(self)
    }

    /// Visit the values (in-order) representing the difference, i.e. the
    /// values of `self` that are not contained in `other`. Iteration ends
    /// when `f` returns false.
    pure fn difference(&self, other: &TreeSet<T>,
                       f: fn(&T) -> bool) {
        // FIXME: this is a naive O(n*log(m)) implementation, could be O(n)
        for self.each |x| {
            if !other.contains(x) {
                if !f(x) { break }
            }
        }
    }

    /// Visit the values (in-order) representing the symmetric difference
    ///
    /// Not implemented yet: calling this always fails.
    pure fn symmetric_difference(&self, _other: &TreeSet<T>,
                                 _f: fn(&T) -> bool) {
        fail ~"not yet implemented" // TODO
    }

    /// Visit the values (in-order) representing the intersection, i.e. the
    /// values of `self` that are also contained in `other`. Iteration ends
    /// when `f` returns false.
    pure fn intersection(&self, other: &TreeSet<T>,
                         f: fn(&T) -> bool) {
        // FIXME: this is a naive O(n*log(m)) implementation, could be O(n)
        for self.each |x| {
            if other.contains(x) {
                if !f(x) { break }
            }
        }
    }

    /// Visit the values (in-order) representing the union
    ///
    /// Not implemented yet: calling this always fails.
    // NOTE(review): unlike the sibling visitor methods this signature declares
    // a `TreeSet<T>` return value - confirm which shape is intended before
    // implementing.
    pure fn union(&self, _other: &TreeSet<T>, _f: fn(&T) -> bool) -> TreeSet<T> {
        fail ~"not yet implemented" // TODO
    }
}
2012-01-17 21:05:07 -06:00
2013-01-14 09:27:26 -06:00
// Nodes keep track of their level in the tree, starting at 1 in the
// leaves and with a red child sharing the level of the parent.
struct TreeNode<K: Ord, V> {
// Key this node is ordered by.
key: K,
// Value associated with `key`.
value: V,
// Subtree of keys that compare less than `key`; `None` when absent.
left: Option<~TreeNode<K, V>>,
// Subtree of keys that compare greater than `key`; `None` when absent.
right: Option<~TreeNode<K, V>>,
// AA-tree level; `TreeNode::new` creates nodes at level 1.
level: uint
}
2013-01-14 09:27:26 -06:00
impl <K: Ord, V> TreeNode<K, V> {
    /// Build a childless node holding `key` and `value` at level 1.
    #[inline(always)]
    static pure fn new(key: K, value: V) -> TreeNode<K, V> {
        TreeNode{
            level: 1,
            left: None,
            right: None,
            key: key,
            value: value
        }
    }
}
2013-01-14 09:27:26 -06:00
/// Visit every key-value pair of the subtree rooted at `node` in ascending
/// key order, calling `f` on each one.
///
/// The traversal ends as soon as `f` returns false: no further pairs are
/// visited, including those in enclosing subtrees. Previously a stop request
/// raised inside the left subtree was ignored and `f` kept being called.
pure fn each<K: Ord, V>(node: &Option<~TreeNode<K, V>>,
                        f: fn(&K, &V) -> bool) {
    // Returns false once `f` has asked to stop, so that every enclosing
    // level of the recursion can unwind without calling `f` again.
    pure fn visit<K: Ord, V>(node: &Option<~TreeNode<K, V>>,
                             f: fn(&K, &V) -> bool) -> bool {
        match *node {
            Some(ref x) => {
                // `&&` short-circuits: left subtree, then this node, then
                // the right subtree, stopping at the first `false`.
                visit(&x.left, f) && f(&x.key, &x.value) && visit(&x.right, f)
            }
            None => true
        }
    }
    visit(node, f);
}
/// Visit every key-value pair of the subtree rooted at `node` in descending
/// key order, calling `f` on each one.
///
/// The traversal ends as soon as `f` returns false: no further pairs are
/// visited, including those in enclosing subtrees. Previously a stop request
/// raised inside the right subtree was ignored and `f` kept being called.
pure fn each_reverse<K: Ord, V>(node: &Option<~TreeNode<K, V>>,
                                f: fn(&K, &V) -> bool) {
    // Returns false once `f` has asked to stop, so that every enclosing
    // level of the recursion can unwind without calling `f` again.
    pure fn visit<K: Ord, V>(node: &Option<~TreeNode<K, V>>,
                             f: fn(&K, &V) -> bool) -> bool {
        match *node {
            Some(ref x) => {
                // `&&` short-circuits: right subtree, then this node, then
                // the left subtree, stopping at the first `false`.
                visit(&x.right, f) && f(&x.key, &x.value) && visit(&x.left, f)
            }
            None => true
        }
    }
    visit(node, f);
}
// Remove left horizontal link by rotating right
//
// When the left child sits on the same level as `node`, that child becomes
// the root of the subtree and `node` becomes its right child. Otherwise the
// node is handed back untouched. Takes ownership of the subtree and returns
// its (possibly new) root.
fn skew<K: Ord, V>(node: ~TreeNode<K, V>) -> ~TreeNode<K, V> {
if node.left.map_default(false, |x| x.level == node.level) {
let mut node = node;
// Detach the left child; it will become the new subtree root.
let mut save = node.left.swap_unwrap();
node.left <-> save.right; // save.right now None
save.right = Some(node);
save
} else {
node // nothing to do
}
}
// Remove dual horizontal link by rotating left and increasing level of
// the parent
//
// When both the right child and the right child's right child exist and the
// grandchild sits on the same level as `node`, the right child becomes the
// root of the subtree with its level raised by one, and `node` becomes its
// left child. Otherwise the node is handed back untouched. Takes ownership of
// the subtree and returns its (possibly new) root.
fn split<K: Ord, V>(node: ~TreeNode<K, V>) -> ~TreeNode<K, V> {
if node.right.map_default(false, |x| x.right.map_default(false, |y| y.level == node.level)) {
let mut node = node;
// Detach the right child; it will become the new subtree root.
let mut save = node.right.swap_unwrap();
node.right <-> save.left; // save.left now None
save.left = Some(node);
save.level += 1;
save
} else {
node // nothing to do
}
}
/// Insert `key`/`value` into the subtree stored in `node`.
///
/// Returns true when a new node was created and false when the key was
/// already present, in which case both the stored key and value are
/// overwritten. Every subtree on the path down to a newly added node is
/// re-balanced with `skew` followed by `split` on the way back up.
fn insert<K: Ord, V>(node: &mut Option<~TreeNode<K, V>>, key: K,
                     value: V) -> bool {
    // Empty slot: this is where the new node belongs.
    if node.is_none() {
        *node = Some(~TreeNode::new(key, value));
        return true;
    }

    // Take the subtree out of the slot so it can be rotated and put back.
    let mut current = node.swap_unwrap();

    if key < current.key {
        let added = insert(&mut current.left, key, value);
        *node = Some(split(skew(current))); // re-balance, if necessary
        return added;
    }

    if current.key < key {
        let added = insert(&mut current.right, key, value);
        *node = Some(split(skew(current))); // re-balance, if necessary
        return added;
    }

    // Neither key is less than the other: replace the entry in place.
    current.key = key;
    current.value = value;
    *node = Some(current);
    false
}
/// Remove `key` from the subtree stored in `node`.
///
/// Returns true when the key was found and removed, false when the search
/// reached the bottom of the tree without finding it. After the removal the
/// levels along the search path are lowered where needed and the subtree is
/// re-balanced with `skew` and `split`.
fn remove<K: Ord, V>(node: &mut Option<~TreeNode<K, V>>, key: &K) -> bool {
    // Walk down the right spine of `child` and swap the key and value of the
    // last node on it with those of `node`.
    fn heir_swap<K: Ord, V>(node: &mut TreeNode<K, V>,
                            child: &mut Option<~TreeNode<K, V>>) {
        // *could* be done without recursion, but it won't borrow check
        do child.mutate |child| {
            let mut child = child;
            if child.right.is_some() {
                heir_swap(node, &mut child.right);
            } else {
                node.key <-> child.key;
                node.value <-> child.value;
            }
            child
        }
    }

    if node.is_none() {
        return false // bottom of tree
    } else {
        // Take the subtree out of the slot; it is put back at the end unless
        // this node turns out to be the leaf being deleted.
        let mut save = node.swap_unwrap();

        let removed = if save.key < *key {
            remove(&mut save.right, key)
        } else if *key < save.key {
            remove(&mut save.left, key)
        } else {
            if save.left.is_some() {
                if save.right.is_some() {
                    // Two children: move the entry to delete into the
                    // rightmost node of the left subtree, then remove it
                    // from that subtree.
                    let mut left = save.left.swap_unwrap();
                    if left.right.is_some() {
                        heir_swap(save, &mut left.right);
                        save.left = Some(left);
                        remove(&mut save.left, key);
                    } else {
                        save.key <-> left.key;
                        save.value <-> left.value;
                        save.left = Some(left);
                        remove(&mut save.left, key);
                    }
                } else {
                    // Only a left child: the child's contents take over this
                    // node and the detached child is dropped.
                    let mut rm = save.left.swap_unwrap();
                    save.key <-> rm.key;
                    save.value <-> rm.value;
                    save.level <-> rm.level; // FIXME: may not be needed
                    save.left <-> rm.left; // FIXME: may not be needed
                    save.right <-> rm.right; // FIXME: may not be needed
                }
            } else if save.right.is_some() {
                // Only a right child: same replacement, mirrored.
                let mut rm = save.right.swap_unwrap();
                save.key <-> rm.key;
                save.value <-> rm.value;
                save.level <-> rm.level; // FIXME: may not be needed
                save.left <-> rm.left; // FIXME: may not be needed
                save.right <-> rm.right; // FIXME: may not be needed
            } else {
                // `*node` was emptied by `swap_unwrap` above, so returning
                // here drops the leaf and leaves the slot empty.
                return true // leaf
            }
            true
        };

        let left_level = save.left.map_default(0, |x| x.level);
        let right_level = save.right.map_default(0, |x| x.level);

        // re-balance, if necessary
        if left_level < save.level - 1 || right_level < save.level - 1 {
            save.level -= 1;

            // A right child may not sit above its parent's new level.
            if right_level > save.level {
                do save.right.mutate |x| {
                    let mut x = x; x.level = save.level; x
                }
            }

            // Skew this node, its right child and that child's right child,
            // then split this node and its right child.
            save = skew(save);

            do save.right.mutate |right| {
                let mut right = skew(right);
                right.right.mutate(skew);
                right
            }
            save = split(save);
            save.right.mutate(split);
        }

        *node = Some(save);
        removed
    }
}
2013-01-14 09:27:26 -06:00
#[cfg(test)]
mod test_treemap {
use super::*;
use core::str;
2012-01-17 21:05:07 -06:00
#[test]
2013-01-14 09:27:26 -06:00
fn find_empty() {
let m = TreeMap::new::<int, int>(); assert m.find(&5) == None;
}
2012-01-17 21:05:07 -06:00
#[test]
2013-01-14 09:27:26 -06:00
fn find_not_found() {
let mut m = TreeMap::new();
assert m.insert(1, 2);
assert m.insert(5, 3);
assert m.insert(9, 3);
assert m.find(&2) == None;
}
2012-01-17 21:05:07 -06:00
#[test]
2013-01-14 09:27:26 -06:00
fn insert_replace() {
let mut m = TreeMap::new();
assert m.insert(5, 2);
assert m.insert(2, 9);
assert !m.insert(2, 11);
assert m.find(&2).unwrap() == &11;
}
2012-01-17 21:05:07 -06:00
#[test]
2013-01-14 09:27:26 -06:00
fn u8_map() {
let mut m = TreeMap::new();
let k1 = str::to_bytes(~"foo");
let k2 = str::to_bytes(~"bar");
let v1 = str::to_bytes(~"baz");
let v2 = str::to_bytes(~"foobar");
m.insert(k1, v1);
m.insert(k2, v2);
assert m.find(&k2) == Some(&v2);
assert m.find(&k1) == Some(&v1);
}
fn check_equal<K: Eq Ord, V: Eq>(ctrl: &[(K, V)], map: &TreeMap<K, V>) {
assert ctrl.is_empty() == map.is_empty();
assert ctrl.is_not_empty() == map.is_not_empty();
for ctrl.each |x| {
let &(k, v) = x;
assert map.find(&k).unwrap() == &v
}
for map.each |map_k, map_v| {
let mut found = false;
for ctrl.each |x| {
let &(ctrl_k, ctrl_v) = x;
if *map_k == ctrl_k {
assert *map_v == ctrl_v;
found = true;
break;
}
}
assert found;
}
}
fn check_left<K: Ord, V>(node: &Option<~TreeNode<K, V>>, parent: &~TreeNode<K, V>) {
match *node {
Some(ref r) => {
assert r.key < parent.key;
assert r.level == parent.level - 1; // left is black
check_left(&r.left, r);
check_right(&r.right, r, false);
}
None => assert parent.level == 1 // parent is leaf
}
}
fn check_right<K: Ord, V>(node: &Option<~TreeNode<K, V>>,
parent: &~TreeNode<K, V>, parent_red: bool) {
match *node {
Some(ref r) => {
assert r.key > parent.key;
let red = r.level == parent.level;
if parent_red { assert !red } // no dual horizontal links
assert red || r.level == parent.level - 1; // right is red or black
check_left(&r.left, r);
check_right(&r.right, r, red);
}
None => assert parent.level == 1 // parent is leaf
}
}
fn check_structure<K: Ord, V>(map: &TreeMap<K, V>) {
match map.root {
Some(ref r) => {
check_left(&r.left, r);
check_right(&r.right, r, false);
}
None => ()
}
2012-01-17 21:05:07 -06:00
}
#[test]
2013-01-14 09:27:26 -06:00
fn test_rand_int() {
let mut map = TreeMap::new::<int, int>();
let mut ctrl = ~[];
check_equal(ctrl, &map);
assert map.find(&5).is_none();
let rng = rand::seeded_rng(&~[42]);
for 3.times {
for 90.times {
let k = rng.gen_int();
let v = rng.gen_int();
if !ctrl.contains(&(k, v)) {
assert map.insert(k, v);
ctrl.push((k, v));
check_structure(&map);
check_equal(ctrl, &map);
}
}
for 30.times {
let r = rng.gen_uint_range(0, ctrl.len());
let (key, _) = vec::remove(&mut ctrl, r);
assert map.remove(&key);
check_structure(&map);
check_equal(ctrl, &map);
}
}
2012-01-17 21:05:07 -06:00
}
#[test]
2013-01-14 09:27:26 -06:00
fn test_len() {
let mut m = TreeMap::new();
assert m.insert(3, 6);
assert m.len() == 1;
assert m.insert(0, 0);
assert m.len() == 2;
assert m.insert(4, 8);
assert m.len() == 3;
assert m.remove(&3);
assert m.len() == 2;
assert !m.remove(&5);
assert m.len() == 2;
assert m.insert(2, 4);
assert m.len() == 3;
assert m.insert(1, 2);
assert m.len() == 4;
}
#[test]
fn test_each() {
let mut m = TreeMap::new();
assert m.insert(3, 6);
assert m.insert(0, 0);
assert m.insert(4, 8);
assert m.insert(2, 4);
assert m.insert(1, 2);
let mut n = 0;
for m.each |k, v| {
assert *k == n;
assert *v == n * 2;
n += 1;
}
2012-01-17 21:05:07 -06:00
}
#[test]
2013-01-14 09:27:26 -06:00
fn test_each_reverse() {
let mut m = TreeMap::new();
assert m.insert(3, 6);
assert m.insert(0, 0);
assert m.insert(4, 8);
assert m.insert(2, 4);
assert m.insert(1, 2);
2012-01-17 21:05:07 -06:00
2013-01-14 09:27:26 -06:00
let mut n = 4;
for m.each_reverse |k, v| {
assert *k == n;
assert *v == n * 2;
n -= 1;
2012-01-17 21:05:07 -06:00
}
}
#[test]
2013-01-14 09:27:26 -06:00
fn test_eq() {
let mut a = TreeMap::new();
let mut b = TreeMap::new();
2013-01-14 09:27:26 -06:00
assert a == b;
assert a.insert(0, 5);
assert a != b;
assert b.insert(0, 4);
assert a != b;
assert a.insert(5, 19);
assert a != b;
assert !b.insert(0, 5);
assert a != b;
assert b.insert(5, 19);
assert a == b;
}
}
2013-01-14 09:27:26 -06:00
#[cfg(test)]
mod test_set {
use super::*;
2013-01-14 09:27:26 -06:00
#[test]
fn test_disjoint() {
let mut xs = TreeSet::new();
let mut ys = TreeSet::new();
assert xs.is_disjoint(&ys);
assert ys.is_disjoint(&xs);
assert xs.insert(5);
assert ys.insert(11);
assert xs.is_disjoint(&ys);
assert ys.is_disjoint(&xs);
assert xs.insert(7);
assert xs.insert(19);
assert xs.insert(4);
assert ys.insert(2);
assert ys.insert(-11);
assert xs.is_disjoint(&ys);
assert ys.is_disjoint(&xs);
assert ys.insert(7);
assert !xs.is_disjoint(&ys);
assert !ys.is_disjoint(&xs);
}
2012-01-17 21:05:07 -06:00
#[test]
2013-01-14 09:27:26 -06:00
fn test_subset_and_superset() {
let mut a = TreeSet::new();
assert a.insert(0);
assert a.insert(5);
assert a.insert(11);
assert a.insert(7);
2012-01-17 21:05:07 -06:00
2013-01-14 09:27:26 -06:00
let mut b = TreeSet::new();
assert b.insert(0);
assert b.insert(7);
assert b.insert(19);
assert b.insert(250);
assert b.insert(11);
assert b.insert(200);
assert !a.is_subset(&b);
assert !a.is_superset(&b);
assert !b.is_subset(&a);
assert !b.is_superset(&a);
2012-01-17 21:05:07 -06:00
2013-01-14 09:27:26 -06:00
assert b.insert(5);
2012-01-17 21:05:07 -06:00
2013-01-14 09:27:26 -06:00
assert a.is_subset(&b);
assert !a.is_superset(&b);
assert !b.is_subset(&a);
assert b.is_superset(&a);
}
#[test]
fn test_each() {
let mut m = TreeSet::new();
assert m.insert(3);
assert m.insert(0);
assert m.insert(4);
assert m.insert(2);
assert m.insert(1);
let mut n = 0;
for m.each |x| {
assert *x == n;
n += 1
}
}
#[test]
fn test_each_reverse() {
let mut m = TreeSet::new();
assert m.insert(3);
assert m.insert(0);
assert m.insert(4);
assert m.insert(2);
assert m.insert(1);
let mut n = 4;
for m.each_reverse |x| {
assert *x == n;
n -= 1
}
}
#[test]
fn test_intersection() {
let mut a = TreeSet::new();
let mut b = TreeSet::new();
a.insert(11);
a.insert(1);
a.insert(3);
a.insert(77);
a.insert(103);
a.insert(5);
a.insert(-5);
b.insert(2);
b.insert(11);
b.insert(77);
b.insert(-9);
b.insert(-42);
b.insert(5);
b.insert(3);
let mut i = 0;
let expected = [3, 5, 11, 77];
for a.intersection(&b) |x| {
assert *x == expected[i];
i += 1
}
assert i == expected.len();
2012-01-17 21:05:07 -06:00
}
2012-05-23 19:18:31 -05:00
}