rust/src/libsyntax/util/interner.rs

63 lines
1.8 KiB
Rust
Raw Normal View History

// An "interner" is a data structure that associates values with uint tags and
// allows bidirectional lookup; i.e. given a value, one can easily find its
// tag, and vice versa.
2012-09-04 13:37:29 -05:00
use std::map;
2012-09-10 17:38:28 -05:00
use std::map::HashMap;
2012-09-04 13:37:29 -05:00
use dvec::DVec;
use cmp::Eq;
use hash::Hash;
use to_bytes::IterBytes;
type hash_interner<T: Const> =
2012-09-10 17:38:28 -05:00
{map: HashMap<T, uint>,
vect: DVec<T>};
// Creates an empty interner: a `hash_interner` record with a fresh hash map
// and an empty vector, handed back as an `interner<T>`.
fn mk<T:Eq IterBytes Hash Const Copy>() -> interner<T> {
    let m = map::HashMap::<T, uint>();
    let hi: hash_interner<T> =
        {map: m, vect: DVec()};
    // the record is moved (not copied) into the returned trait value
    move (hi as interner::<T>)
}
2011-08-04 12:46:10 -05:00
// Creates an interner and interns every element of `init`, in order, before
// handing it back.
fn mk_prefill<T:Eq IterBytes Hash Const Copy>(init: ~[T]) -> interner<T> {
    let prefilled = mk();
    for init.each() |elt| {
        prefilled.intern(*elt);
    }
    prefilled
}
2012-07-17 13:22:11 -05:00
/* when traits can extend traits, we should extend index<uint,T> to get [] */
// Interface of an interner over values of type T: values go in, uint tags
// come out, and a tag can be turned back into its value.
trait interner<T:Eq IterBytes Hash Const Copy> {
    // Takes a value and returns a uint tag for it.
    fn intern(T) -> uint;
    // Takes a value and returns a uint tag for it; see the implementation
    // for how this differs from `intern`.
    fn gensym(T) -> uint;
    // Takes a tag and returns the value associated with it.
    pure fn get(uint) -> T;
    // Returns a count as a uint (in the hash_interner implementation, the
    // length of the value vector).
    fn len() -> uint;
}
2011-08-04 12:46:10 -05:00
// Hash-table-backed implementation of `interner`: `map` goes from value to
// tag, `vect` goes from tag (used as an index) back to value.
impl <T:Eq IterBytes Hash Const Copy> hash_interner<T>: interner<T> {
    // Returns the tag already recorded for `val` in the map; otherwise
    // appends `val` to the vector, records its position in the map, and
    // returns that position as the new tag.
    fn intern(val: T) -> uint {
        match self.map.find(val) {
          Some(idx) => return idx,
          None => {
            // the current vector length is the index the value will occupy
            let new_idx = self.vect.len();
            self.map.insert(val, new_idx);
            self.vect.push(val);
            return new_idx;
          }
        }
    }

    // Always appends `val` to the vector and returns its position as a new
    // tag, without consulting or updating the map.
    fn gensym(val: T) -> uint {
        let new_idx = self.vect.len();
        // leave out of .map to avoid colliding
        self.vect.push(val);
        return new_idx;
    }

    // this isn't "pure" in the traditional sense, because it can go from
    // failing to returning a value as items are interned. But for typestate,
    // where we first check a pred and then rely on it, ceasing to fail is ok.
    pure fn get(idx: uint) -> T { self.vect.get_elt(idx) }

    // Returns the length of the value vector, which grows on every new
    // `intern` entry and every `gensym` call.
    fn len() -> uint { return self.vect.len(); }
}