2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Module: map
|
|
|
|
|
|
|
|
A hashmap
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* Section: Types */
|
|
|
|
|
|
|
|
/*
|
|
|
|
Type: hashfn
|
|
|
|
|
2011-12-07 10:14:57 -06:00
|
|
|
A function that returns a hash of a value.
|
|
|
|
The hash should concentrate entropy in the
|
|
|
|
lower bits.
|
2011-10-26 13:28:23 -05:00
|
|
|
*/
|
2011-10-25 10:57:26 -05:00
|
|
|
// Takes a key by value and yields a uint. The chained table reduces this
// value modulo its current chain count to pick a bucket.
type hashfn<K> = fn(K) -> uint;
|
2011-06-15 13:19:50 -05:00
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Type: eqfn
|
|
|
|
|
|
|
|
A function that returns true if two keys are equal.
|
|
|
|
*/
|
2011-10-25 10:57:26 -05:00
|
|
|
// Takes two keys and reports whether they are equal. The chained table only
// calls it for entries whose stored hash already matches the probe hash.
type eqfn<K> = fn(K, K) -> bool;
|
2011-06-15 13:19:50 -05:00
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Type: hashset
|
|
|
|
|
|
|
|
A convenience type to treat a hashmap as a set
|
|
|
|
*/
|
2011-08-12 08:37:10 -05:00
|
|
|
// The value type is nil (), so only the presence of a key carries
// information.
type hashset<K> = hashmap<K, ()>;
|
2011-07-21 20:14:39 -05:00
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Obj: hashmap
|
|
|
|
*/
|
|
|
|
type hashmap<K, V> = obj {
    // The object interface shared by all hashmap implementations; instances
    // are obtained through mk_hashmap and the new_*_hash constructors.

    /*
    Method: size

    Return the number of elements in the map
    */
    fn size() -> uint;

    /*
    Method: insert

    Add a value to the map. If the map already contains a value for
    the specified key then the original value is replaced.

    Returns:

    True if the key did not already exist in the map
    */
    fn insert(K, V) -> bool;

    /*
    Method: contains_key

    Returns true if the map contains a value for the specified key
    */
    fn contains_key(K) -> bool;

    /*
    Method: get

    Get the value for the specified key

    Failure:

    If the key does not exist in the map
    */
    fn get(K) -> V;

    /*
    Method: find

    Get the value for the specified key. If the key does not exist
    in the map then returns none.
    */
    fn find(K) -> option::t<V>;

    /*
    Method: remove

    Remove and return a value from the map. If the key does not exist
    in the map then returns none.
    */
    fn remove(K) -> option::t<V>;

    /*
    Method: rehash

    Force map growth and rehashing
    */
    fn rehash();

    /*
    Method: items

    Iterate over all the key/value pairs in the map
    */
    fn items(block(K, V));

    /*
    Method: keys

    Iterate over all the keys in the map
    */
    fn keys(block(K));

    /*
    Method: values

    Iterate over all the values in the map
    */
    fn values(block(V));
};
|
|
|
|
|
|
|
|
/* Section: Operations */
|
|
|
|
|
2011-12-06 21:56:47 -06:00
|
|
|
mod chained {
|
|
|
|
// One link in a bucket chain.
//
//   hash  - the hasher's result for `key`, stored at insertion time so that
//           lookups and rehashing never have to call the hasher again
//   key   - the key this entry was inserted under
//   value - the current value; overwritten in place on re-insert
//   next  - the rest of the chain; rewritten when entries are unlinked or
//           moved to a new bucket
type entry<copy K, copy V> = {
    hash: uint,
    key: K,
    mutable value: V,
    mutable next: chain<K, V>
};
|
|
|
|
|
|
|
|
// A bucket chain: either a boxed entry (which itself holds the rest of the
// chain in its `next` field) or the end-of-chain marker.
tag chain<copy K, copy V> {
    present(@entry<K, V>);
    absent;
}
|
|
|
|
|
|
|
|
// The state of a chained hash table.
//
//   size   - number of entries currently stored
//   chains - the bucket vector; an entry lives in bucket (hash % length)
//   hasher - user-supplied hash function for keys
//   eqer   - user-supplied equality function for keys
type t<copy K, copy V> = {
    mutable size: uint,
    mutable chains: [mutable chain<K,V>],
    hasher: hashfn<K>,
    eqer: eqfn<K>
};
|
|
|
|
|
|
|
|
// Outcome of looking a key up in the table.
//
//   not_found                 - no entry matches the key
//   found_first(idx, entry)   - `entry` matches and is the head of bucket
//                               `idx`
//   found_after(prev, entry)  - `entry` matches and directly follows `prev`
//                               in its chain
//
// The extra position information lets remove unlink the entry without
// searching again.
tag search_result<copy K, copy V> {
    not_found;
    found_first(uint, @entry<K,V>);
    found_after(@entry<K,V>, @entry<K,V>);
}
|
|
|
|
|
|
|
|
// Search the part of a bucket chain that follows `e_root` for key `k`.
//
// `e_root` itself has already been compared (and rejected) by the caller,
// which is why the comparison counter starts at one. `h` is the hash of `k`;
// an entry matches when its stored hash equals `h` and `tbl.eqer` accepts its
// key. `idx` is the bucket index and is only used for logging.
//
// Returns found_after(predecessor, match) on success, not_found when the end
// of the chain is reached.
fn search_rem<copy K, copy V>(tbl: t<K,V>, k: K, h: uint, idx: uint,
                              e_root: @entry<K,V>) -> search_result<K,V> {
    let prev = e_root;
    let ncompared = 1u; // for logging
    while true {
        alt prev.next {
          present(cur) {
            ncompared += 1u;
            let cur_key = cur.key; // Satisfy alias checker.
            if cur.hash != h || !tbl.eqer(cur_key, k) {
                // No match: step one link further down the chain.
                prev = cur;
            } else {
                log("search_tbl", "present", "comparisons", ncompared,
                    "hash", h, "idx", idx);
                ret found_after(prev, cur);
            }
          }
          absent. {
            log("search_tbl", "absent", "comparisons", ncompared,
                "hash", h, "idx", idx);
            ret not_found;
          }
        }
    }
    // Every path through the loop body returns or iterates again.
    util::unreachable();
}
|
|
|
|
|
|
|
|
// Look up key `k`, whose hash is `h`, in the table.
//
// Picks the bucket `h % number-of-chains`, checks the head entry directly and
// hands the rest of the chain to search_rem. Returns not_found for an empty
// bucket, found_first(bucket, entry) when the head matches, and otherwise
// whatever search_rem reports.
fn search_tbl<copy K, copy V>(tbl: t<K,V>, k: K, h: uint)
    -> search_result<K,V> {
    let slot = h % vec::len(tbl.chains);
    alt tbl.chains[slot] {
      present(head) {
        let head_key = head.key; // Satisfy alias checker.
        if head.hash != h || !tbl.eqer(head_key, k) {
            // Head does not match; continue with the entries behind it.
            ret search_rem(tbl, k, h, slot, head);
        }
        log("search_tbl", "present", "comparisons", 1u,
            "hash", h, "idx", slot);
        ret found_first(slot, head);
      }
      absent. {
        log("search_tbl", "absent", "comparisons", 0u,
            "hash", h, "idx", slot);
        ret not_found;
      }
    }
}
|
|
|
|
|
2011-12-06 22:22:12 -06:00
|
|
|
// Store `v` under key `k`.
//
// If the key is already present its entry's value is overwritten in place
// and false is returned. Otherwise a new entry is linked in at the head of
// the key's bucket, the size is bumped, and true is returned. This function
// never grows the table; that is the caller's decision.
fn insert<copy K, copy V>(tbl: t<K,V>, k: K, v: V) -> bool {
    let h = tbl.hasher(k);
    alt search_tbl(tbl, k, h) {
      found_first(_, existing) {
        existing.value = v;
        ret false;
      }
      found_after(_, existing) {
        existing.value = v;
        ret false
      }
      not_found. {
        tbl.size += 1u;
        let slot = h % vec::len(tbl.chains);
        // The previous contents of the bucket become the tail of the new
        // entry.
        let tail = tbl.chains[slot];
        let fresh = @{hash: h,
                      key: k,
                      mutable value: v,
                      mutable next: tail};
        tbl.chains[slot] = present(fresh);
        ret true;
      }
    }
}
|
|
|
|
|
|
|
|
// Look up the value stored under `k`.
//
// Returns some(value) when an entry for the key exists and none otherwise;
// the table is not modified.
fn get<copy K, copy V>(tbl: t<K,V>, k: K) -> option::t<V> {
    let h = tbl.hasher(k);
    alt search_tbl(tbl, k, h) {
      found_first(_, hit) {
        ret option::some(hit.value);
      }
      found_after(_, hit) {
        ret option::some(hit.value);
      }
      not_found. {
        ret option::none;
      }
    }
}
|
|
|
|
|
|
|
|
// Remove the entry stored under `k`, if any.
//
// On a hit the entry is unlinked from its chain (either by replacing the
// bucket head or by patching the predecessor's `next`), the size is
// decremented, and some(value) is returned. Returns none when the key is
// not in the table.
fn remove<copy K, copy V>(tbl: t<K,V>, k: K) -> option::t<V> {
    let h = tbl.hasher(k);
    alt search_tbl(tbl, k, h) {
      found_first(slot, hit) {
        tbl.size -= 1u;
        // The entry was the bucket head: its successor takes its place.
        tbl.chains[slot] = hit.next;
        ret option::some(hit.value);
      }
      found_after(before, hit) {
        tbl.size -= 1u;
        // Bypass the entry in the middle of the chain.
        before.next = hit.next;
        ret option::some(hit.value);
      }
      not_found. {
        ret option::none;
      }
    }
}
|
|
|
|
|
|
|
|
// Build a bucket vector of `nchains` slots, every one of them an empty
// chain.
fn chains<copy K, copy V>(nchains: uint) -> [mutable chain<K,V>] {
    let empty: chain<K,V> = absent;
    ret vec::init_elt_mut(empty, nchains);
}
|
|
|
|
|
|
|
|
// Call `blk` on every entry of the chain starting at `chain0`, head first.
//
// The successor of each entry is read *before* the callback runs, so the
// callback is free to rewrite the entry's `next` field (rehash does exactly
// that) without disturbing the traversal.
fn foreach_entry<copy K, copy V>(chain0: chain<K,V>,
                                 blk: block(@entry<K,V>)) {
    let cursor = chain0;
    while true {
        alt cursor {
          present(e) {
            let following = e.next;
            blk(e); // may modify e.next!
            cursor = following;
          }
          absent. { ret; }
        }
    }
}
|
|
|
|
|
|
|
|
// Call `blk` on every entry of every chain in `chains`, visiting the buckets
// in index order. The vector length is read once, before the walk starts.
fn foreach_chain<copy K, copy V>(chains: [const chain<K,V>],
                                 blk: block(@entry<K,V>)) {
    let total = vec::len(chains);
    let pos = 0u;
    while pos < total {
        foreach_entry(chains[pos], blk);
        pos += 1u;
    }
}
|
|
|
|
|
|
|
|
// Grow the table and redistribute its entries.
//
// The new bucket count is uint::next_power_of_two(old count + 1). Existing
// entry boxes are reused: each one is pushed onto the head of its new bucket,
// chosen from the hash stored in the entry, so the hasher is not called.
fn rehash<copy K, copy V>(tbl: t<K,V>) {
    let stale = tbl.chains;
    let n_fresh: uint = uint::next_power_of_two(vec::len(stale) + 1u);
    tbl.chains = chains(n_fresh);
    foreach_chain(stale) { |e|
        let slot = e.hash % n_fresh;
        e.next = tbl.chains[slot];
        tbl.chains[slot] = present(e);
    }
}
|
|
|
|
|
|
|
|
// Call `blk(key, value)` for every entry in the table, in bucket order.
// Key and value are read into locals before the callback is invoked.
fn items<copy K, copy V>(tbl: t<K,V>, blk: block(K,V)) {
    let bucket_vec = tbl.chains; // Satisfy alias checker.
    foreach_chain(bucket_vec) { |e|
        let k = e.key;
        let v = e.value;
        blk(k, v);
    }
}
|
|
|
|
|
|
|
|
// Object wrapper that exposes a chained table through the hashmap
// interface. Every method forwards to the free function of the same name in
// this module.
//
//   tbl - the shared table state
//   lf  - load-factor bound consulted by insert
obj o<copy K, copy V>(tbl: @t<K,V>,
                      lf: util::rational) {
    // Number of entries currently stored.
    fn size() -> uint {
        ret tbl.size;
    }

    // Insert or overwrite. Before touching the table, the load it would have
    // with one more entry is compared against `lf`; the table is rehashed
    // first unless util::rational_leq(load, lf) holds.
    fn insert(k: K, v: V) -> bool {
        let nchains = vec::len(tbl.chains);
        let load = {num:tbl.size + 1u as int, den:nchains as int};
        let within_bound = util::rational_leq(load, lf);
        if !within_bound {
            rehash(*tbl);
        }
        ret insert(*tbl, k, v);
    }

    // True when a lookup of `k` yields a value.
    fn contains_key(k: K) -> bool {
        let looked_up = get(*tbl, k);
        ret option::is_some(looked_up);
    }

    // Value for `k`, unwrapped with option::get.
    fn get(k: K) -> V {
        let looked_up = get(*tbl, k);
        ret option::get(looked_up);
    }

    // Value for `k` as an option; none when the key is missing.
    fn find(k: K) -> option::t<V> {
        let looked_up = get(*tbl, k);
        ret looked_up;
    }

    // Remove `k`, returning its value if it was present.
    fn remove(k: K) -> option::t<V> {
        let removed = remove(*tbl, k);
        ret removed;
    }

    // Unconditionally grow and rehash the table.
    fn rehash() {
        rehash(*tbl);
    }

    // Visit every key/value pair.
    fn items(blk: block(K, V)) {
        items(*tbl, blk);
    }

    // Visit every key.
    fn keys(blk: block(K)) {
        items(*tbl) { |key, _value| blk(key) }
    }

    // Visit every value.
    fn values(blk: block(V)) {
        items(*tbl) { |_key, value| blk(value) }
    }
}
|
|
|
|
|
|
|
|
// Create an empty chained hashmap using the given hash and equality
// functions. The table starts with 32 buckets and is wrapped in an `o`
// object with a load-factor bound of 3/4.
fn mk<copy K, copy V>(hasher: hashfn<K>, eqer: eqfn<K>) -> hashmap<K,V> {
    let initial_capacity: uint = 32u; // 2^5
    let buckets: [mutable chain<K,V>] = chains(initial_capacity);
    let table = @{mutable size: 0u,
                  mutable chains: buckets,
                  hasher: hasher,
                  eqer: eqer};
    let bound = {num:3, den:4};
    ret o(table, bound);
}
|
|
|
|
}
|
|
|
|
|
2011-12-07 10:14:57 -06:00
|
|
|
/*
|
|
|
|
Function: mk_hashmap
|
|
|
|
|
|
|
|
Construct a hashmap.
|
|
|
|
|
|
|
|
Parameters:
|
|
|
|
|
|
|
|
hasher - The hash function for key type K
|
|
|
|
eqer - The equality function for key type K
|
|
|
|
*/
|
2011-12-06 21:56:47 -06:00
|
|
|
// Public constructor: builds a hashmap backed by the chained implementation.
fn mk_hashmap<copy K, copy V>(hasher: hashfn<K>, eqer: eqfn<K>)
    -> hashmap<K, V> {
    let made: hashmap<K, V> = chained::mk(hasher, eqer);
    ret made;
}
|
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Function: new_str_hash
|
2011-07-05 04:48:19 -05:00
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
Construct a hashmap for string keys
|
|
|
|
*/
|
2011-11-18 05:39:20 -06:00
|
|
|
// Hashmap keyed by strings, using str::hash and str::eq.
fn new_str_hash<copy V>() -> hashmap<str, V> {
    let table: hashmap<str, V> = mk_hashmap(str::hash, str::eq);
    ret table;
}
|
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Function: new_int_hash
|
|
|
|
|
|
|
|
Construct a hashmap for int keys
|
|
|
|
*/
|
2011-11-18 05:39:20 -06:00
|
|
|
// Hashmap keyed by ints. The hash of a key is the key itself cast to uint,
// and keys are compared with ==.
fn new_int_hash<copy V>() -> hashmap<int, V> {
    fn eq_int(&&lhs: int, &&rhs: int) -> bool { ret lhs == rhs; }
    fn hash_int(&&key: int) -> uint { ret key as uint; }
    ret mk_hashmap(hash_int, eq_int);
}
|
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Function: new_uint_hash
|
|
|
|
|
|
|
|
Construct a hashmap for uint keys
|
|
|
|
*/
|
2011-11-18 05:39:20 -06:00
|
|
|
// Hashmap keyed by uints. The hash of a key is the key itself, and keys are
// compared with ==.
fn new_uint_hash<copy V>() -> hashmap<uint, V> {
    fn eq_uint(&&lhs: uint, &&rhs: uint) -> bool { ret lhs == rhs; }
    fn hash_uint(&&key: uint) -> uint { ret key; }
    ret mk_hashmap(hash_uint, eq_uint);
}
|
|
|
|
|
2011-10-26 13:28:23 -05:00
|
|
|
/*
|
|
|
|
Function: set_add
|
|
|
|
|
|
|
|
Convenience function for adding keys to a hashmap with nil type values
|
|
|
|
*/
|
|
|
|
fn set_add<K>(set: hashset<K>, key: K) -> bool { ret set.insert(key, ()); }
|
|
|
|
|
2010-09-22 17:44:13 -05:00
|
|
|
// Local Variables:
|
|
|
|
// mode: rust;
|
|
|
|
// fill-column: 78;
|
|
|
|
// indent-tabs-mode: nil
|
|
|
|
// c-basic-offset: 4
|
|
|
|
// buffer-file-coding-system: utf-8-unix
|
|
|
|
// End:
|