rust/src/libsyntax/util/interner.rs

109 lines
3.2 KiB
Rust
Raw Normal View History

// Copyright 2012 The Rust Project Developers. See the COPYRIGHT
// file at the top-level directory of this distribution and at
// http://rust-lang.org/COPYRIGHT.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
// An "interner" is a data structure that associates values with uint tags and
// allows bidirectional lookup; i.e. given a value, one can easily find the
// type, and vice versa.
use core::prelude::*;
use core::hashmap::HashMap;
pub struct Interner<T> {
priv map: @mut HashMap<T, uint>,
2013-03-07 17:37:22 -06:00
priv vect: @mut ~[T],
}
// when traits can extend traits, we should extend index<uint,T> to get []
pub impl<T:Eq + IterBytes + Hash + Const + Copy> Interner<T> {
fn new() -> Interner<T> {
Interner {
map: @mut HashMap::new(),
2013-03-07 17:37:22 -06:00
vect: @mut ~[],
}
}
fn prefill(init: &[T]) -> Interner<T> {
let rv = Interner::new();
for init.each() |v| { rv.intern(*v); }
rv
}
2011-08-04 12:46:10 -05:00
fn intern(&self, val: T) -> uint {
match self.map.find(&val) {
Some(&idx) => return idx,
None => (),
2012-07-17 13:22:11 -05:00
}
let vect = &*self.vect;
let new_idx = vect.len();
self.map.insert(val, new_idx);
self.vect.push(val);
new_idx
}
fn gensym(&self, val: T) -> uint {
let new_idx = {
let vect = &*self.vect;
vect.len()
};
2012-07-18 18:18:02 -05:00
// leave out of .map to avoid colliding
self.vect.push(val);
new_idx
2012-07-18 18:18:02 -05:00
}
2011-08-04 12:46:10 -05:00
2012-07-17 13:22:11 -05:00
// this isn't "pure" in the traditional sense, because it can go from
// failing to returning a value as items are interned. But for typestate,
// where we first check a pred and then rely on it, ceasing to fail is ok.
fn get(&self, idx: uint) -> T { self.vect[idx] }
fn len(&self) -> uint { let vect = &*self.vect; vect.len() }
2012-09-19 11:41:06 -05:00
}
2013-01-23 19:29:08 -06:00
#[test]
#[should_fail]
pub fn i1 () {
let i : Interner<@~str> = Interner::new();
2013-01-23 19:29:08 -06:00
i.get(13);
2013-01-23 19:41:54 -06:00
}
2013-01-23 19:29:08 -06:00
#[test]
pub fn i2 () {
let i : Interner<@~str> = Interner::new();
2013-01-23 19:29:08 -06:00
// first one is zero:
assert_eq!(i.intern (@~"dog"), 0);
2013-01-23 19:29:08 -06:00
// re-use gets the same entry:
assert_eq!(i.intern (@~"dog"), 0);
2013-01-23 19:29:08 -06:00
// different string gets a different #:
assert_eq!(i.intern (@~"cat"), 1);
assert_eq!(i.intern (@~"cat"), 1);
2013-01-23 19:29:08 -06:00
// dog is still at zero
assert_eq!(i.intern (@~"dog"), 0);
2013-01-23 19:29:08 -06:00
// gensym gets 3
assert_eq!(i.gensym (@~"zebra" ), 2);
2013-01-23 19:29:08 -06:00
// gensym of same string gets new number :
assert_eq!(i.gensym (@~"zebra" ), 3);
2013-01-23 19:29:08 -06:00
// gensym of *existing* string gets new number:
assert_eq!(i.gensym (@~"dog"), 4);
assert_eq!(i.get(0), @~"dog");
assert_eq!(i.get(1), @~"cat");
assert_eq!(i.get(2), @~"zebra");
assert_eq!(i.get(3), @~"zebra");
assert_eq!(i.get(4), @~"dog");
2013-01-23 19:41:54 -06:00
}
2013-01-23 19:29:08 -06:00
#[test]
pub fn i3 () {
let i : Interner<@~str> = Interner::prefill([@~"Alan",@~"Bob",@~"Carol"]);
assert_eq!(i.get(0), @~"Alan");
assert_eq!(i.get(1), @~"Bob");
assert_eq!(i.get(2), @~"Carol");
assert_eq!(i.intern(@~"Bob"), 1);
2013-01-23 19:29:08 -06:00
}