// Copyright 2013 The Rust Project Developers. See the COPYRIGHT // file at the top-level directory of this distribution and at // http://rust-lang.org/COPYRIGHT. // // Licensed under the Apache License, Version 2.0 or the MIT license // , at your // option. This file may not be copied, modified, or distributed // except according to those terms. //! A radix trie for storing integers in sorted order use prelude::*; // FIXME: #5244: need to manually update the TrieNode constructor const SHIFT: uint = 4; const SIZE: uint = 1 << SHIFT; const MASK: uint = SIZE - 1; enum Child { Internal(~TrieNode), External(uint, T), Nothing } pub struct TrieMap { priv root: TrieNode, priv length: uint } impl BaseIter<(uint, &'self T)> for TrieMap { /// Visit all key-value pairs in order #[inline(always)] fn each(&self, f: &fn(&(uint, &'self T)) -> bool) { self.root.each(f); } #[inline(always)] fn size_hint(&self) -> Option { Some(self.len()) } } impl ReverseIter<(uint, &'self T)> for TrieMap { /// Visit all key-value pairs in reverse order #[inline(always)] fn each_reverse(&self, f: &fn(&(uint, &'self T)) -> bool) { self.root.each_reverse(f); } } impl Container for TrieMap { /// Return the number of elements in the map #[inline(always)] fn len(&const self) -> uint { self.length } /// Return true if the map contains no elements #[inline(always)] fn is_empty(&const self) -> bool { self.len() == 0 } } impl Mutable for TrieMap { /// Clear the map, removing all values. #[inline(always)] fn clear(&mut self) { self.root = TrieNode::new(); self.length = 0; } } impl Map for TrieMap { /// Return true if the map contains a value for the specified key #[inline(always)] fn contains_key(&self, key: &uint) -> bool { self.find(key).is_some() } /// Visit all keys in order #[inline(always)] fn each_key(&self, f: &fn(&uint) -> bool) { self.each(|&(k, _)| f(&k)) } /// Visit all values in order #[inline(always)] fn each_value(&self, f: &fn(&T) -> bool) { self.each(|&(_, v)| f(v)) } /// Iterate over the map and mutate the contained values #[inline(always)] fn mutate_values(&mut self, f: &fn(&uint, &mut T) -> bool) { self.root.mutate_values(f); } /// Return the value corresponding to the key in the map #[inline(hint)] fn find(&self, key: &uint) -> Option<&'self T> { let mut node: &'self TrieNode = &self.root; let mut idx = 0; loop { match node.children[chunk(*key, idx)] { Internal(ref x) => node = &**x, External(stored, ref value) => { if stored == *key { return Some(value) } else { return None } } Nothing => return None } idx += 1; } } /// Insert a key-value pair into the map. An existing value for a /// key is replaced by the new value. Return true if the key did /// not already exist in the map. #[inline(always)] fn insert(&mut self, key: uint, value: T) -> bool { let ret = insert(&mut self.root.count, &mut self.root.children[chunk(key, 0)], key, value, 1); if ret { self.length += 1 } ret } /// Remove a key-value pair from the map. Return true if the key /// was present in the map, otherwise false. #[inline(always)] fn remove(&mut self, key: &uint) -> bool { let ret = remove(&mut self.root.count, &mut self.root.children[chunk(*key, 0)], *key, 1); if ret { self.length -= 1 } ret } } pub impl TrieMap { /// Create an empty TrieMap #[inline(always)] fn new() -> TrieMap { TrieMap{root: TrieNode::new(), length: 0} } /// Visit all keys in reverse order #[inline(always)] fn each_key_reverse(&self, f: &fn(&uint) -> bool) { self.each_reverse(|&(k, _)| f(&k)) } /// Visit all values in reverse order #[inline(always)] fn each_value_reverse(&self, f: &fn(&T) -> bool) { self.each_reverse(|&(_, v)| f(v)) } } pub struct TrieSet { priv map: TrieMap<()> } impl BaseIter for TrieSet { /// Visit all values in order fn each(&self, f: &fn(&uint) -> bool) { self.map.each_key(f) } fn size_hint(&self) -> Option { Some(self.len()) } } impl ReverseIter for TrieSet { /// Visit all values in reverse order fn each_reverse(&self, f: &fn(&uint) -> bool) { self.map.each_key_reverse(f) } } impl Container for TrieSet { /// Return the number of elements in the set #[inline(always)] fn len(&const self) -> uint { self.map.len() } /// Return true if the set contains no elements #[inline(always)] fn is_empty(&const self) -> bool { self.map.is_empty() } } impl Mutable for TrieSet { /// Clear the set, removing all values. #[inline(always)] fn clear(&mut self) { self.map.clear() } } impl TrieSet { /// Create an empty TrieSet #[inline(always)] fn new() -> TrieSet { TrieSet{map: TrieMap::new()} } /// Return true if the set contains a value #[inline(always)] fn contains(&self, value: &uint) -> bool { self.map.contains_key(value) } /// Add a value to the set. Return true if the value was not already /// present in the set. #[inline(always)] fn insert(&mut self, value: uint) -> bool { self.map.insert(value, ()) } /// Remove a value from the set. Return true if the value was /// present in the set. #[inline(always)] fn remove(&mut self, value: &uint) -> bool { self.map.remove(value) } } struct TrieNode { count: uint, children: [Child * SIZE] } impl TrieNode { #[inline(always)] fn new() -> TrieNode { // FIXME: #5244: [Nothing, ..SIZE] should be possible without Copy TrieNode{count: 0, children: [Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing, Nothing]} } } impl TrieNode { fn each(&self, f: &fn(&(uint, &'self T)) -> bool) -> bool { for uint::range(0, self.children.len()) |idx| { match self.children[idx] { Internal(ref x) => if !x.each(f) { return false }, External(k, ref v) => if !f(&(k, v)) { return false }, Nothing => () } } true } fn each_reverse(&self, f: &fn(&(uint, &'self T)) -> bool) -> bool { for uint::range_rev(self.children.len(), 0) |idx| { match self.children[idx - 1] { Internal(ref x) => if !x.each_reverse(f) { return false }, External(k, ref v) => if !f(&(k, v)) { return false }, Nothing => () } } true } fn mutate_values(&mut self, f: &fn(&uint, &mut T) -> bool) -> bool { for vec::each_mut(self.children) |child| { match *child { Internal(ref mut x) => if !x.mutate_values(f) { return false }, External(k, ref mut v) => if !f(&k, v) { return false }, Nothing => () } } true } } // if this was done via a trait, the key could be generic #[inline(always)] fn chunk(n: uint, idx: uint) -> uint { let sh = uint::bits - (SHIFT * (idx + 1)); (n >> sh) & MASK } fn insert(count: &mut uint, child: &mut Child, key: uint, value: T, idx: uint) -> bool { let mut tmp = Nothing; tmp <-> *child; let mut added = false; *child = match tmp { External(stored_key, stored_value) => { if stored_key == key { External(stored_key, value) } else { // conflict - split the node let mut new = ~TrieNode::new(); insert(&mut new.count, &mut new.children[chunk(stored_key, idx)], stored_key, stored_value, idx + 1); insert(&mut new.count, &mut new.children[chunk(key, idx)], key, value, idx + 1); added = true; Internal(new) } } Internal(x) => { let mut x = x; added = insert(&mut x.count, &mut x.children[chunk(key, idx)], key, value, idx + 1); Internal(x) } Nothing => { *count += 1; added = true; External(key, value) } }; added } fn remove(count: &mut uint, child: &mut Child, key: uint, idx: uint) -> bool { let (ret, this) = match *child { External(stored, _) => { if stored == key { (true, true) } else { (false, false) } } Internal(ref mut x) => { let ret = remove(&mut x.count, &mut x.children[chunk(key, idx)], key, idx + 1); (ret, x.count == 0) } Nothing => (false, false) }; if this { *child = Nothing; *count -= 1; } ret } #[cfg(test)] pub fn check_integrity(trie: &TrieNode) { fail_unless!(trie.count != 0); let mut sum = 0; for trie.children.each |x| { match *x { Nothing => (), Internal(ref y) => { check_integrity(&**y); sum += 1 } External(_, _) => { sum += 1 } } } fail_unless!(sum == trie.count); } #[cfg(test)] mod tests { use super::*; use uint; #[test] fn test_step() { let mut trie = TrieMap::new(); let n = 300; for uint::range_step(1, n, 2) |x| { fail_unless!(trie.insert(x, x + 1)); fail_unless!(trie.contains_key(&x)); check_integrity(&trie.root); } for uint::range_step(0, n, 2) |x| { fail_unless!(!trie.contains_key(&x)); fail_unless!(trie.insert(x, x + 1)); check_integrity(&trie.root); } for uint::range(0, n) |x| { fail_unless!(trie.contains_key(&x)); fail_unless!(!trie.insert(x, x + 1)); check_integrity(&trie.root); } for uint::range_step(1, n, 2) |x| { fail_unless!(trie.remove(&x)); fail_unless!(!trie.contains_key(&x)); check_integrity(&trie.root); } for uint::range_step(0, n, 2) |x| { fail_unless!(trie.contains_key(&x)); fail_unless!(!trie.insert(x, x + 1)); check_integrity(&trie.root); } } #[test] fn test_each() { let mut m = TrieMap::new(); fail_unless!(m.insert(3, 6)); fail_unless!(m.insert(0, 0)); fail_unless!(m.insert(4, 8)); fail_unless!(m.insert(2, 4)); fail_unless!(m.insert(1, 2)); let mut n = 0; for m.each |&(k, v)| { fail_unless!(k == n); fail_unless!(*v == n * 2); n += 1; } } #[test] fn test_each_break() { let mut m = TrieMap::new(); for uint::range_rev(uint::max_value, uint::max_value - 10000) |x| { m.insert(x, x / 2); } let mut n = uint::max_value - 9999; for m.each |&(k, v)| { if n == uint::max_value - 5000 { break } fail_unless!(n < uint::max_value - 5000); fail_unless!(k == n); fail_unless!(*v == n / 2); n += 1; } } #[test] fn test_each_reverse() { let mut m = TrieMap::new(); fail_unless!(m.insert(3, 6)); fail_unless!(m.insert(0, 0)); fail_unless!(m.insert(4, 8)); fail_unless!(m.insert(2, 4)); fail_unless!(m.insert(1, 2)); let mut n = 4; for m.each_reverse |&(k, v)| { fail_unless!(k == n); fail_unless!(*v == n * 2); n -= 1; } } #[test] fn test_each_reverse_break() { let mut m = TrieMap::new(); for uint::range_rev(uint::max_value, uint::max_value - 10000) |x| { m.insert(x, x / 2); } let mut n = uint::max_value; for m.each_reverse |&(k, v)| { if n == uint::max_value - 5000 { break } fail_unless!(n > uint::max_value - 5000); fail_unless!(k == n); fail_unless!(*v == n / 2); n -= 1; } } #[test] fn test_sane_chunk() { let x = 1; let y = 1 << (uint::bits - 1); let mut trie = TrieSet::new(); fail_unless!(trie.insert(x)); fail_unless!(trie.insert(y)); fail_unless!(trie.len() == 2); let expected = [x, y]; let mut i = 0; for trie.each |x| { fail_unless!(expected[i] == *x); i += 1; } } }