rust/src/libsyntax/ext/tt/transcribe.rs

220 lines
7.6 KiB
Rust
Raw Normal View History

import util::interner::interner;
import diagnostic::span_handler;
import ast::{token_tree,tt_delim,tt_flat,tt_dotdotdot,tt_interpolate,ident};
import earley_parser::{arb_depth,seq,leaf};
import codemap::span;
import parse::token::{EOF,ACTUALLY,IDENT,token,w_ident};
import std::map::{hashmap,box_str_hash};
export tt_reader, new_tt_reader, dup_tt_reader, tt_next_token;
enum tt_frame_up { /* to break a circularity */
tt_frame_up(option<tt_frame>)
}
/* TODO: figure out how to have a uniquely linked stack, and change to `~` */
///an unzipping of `token_tree`s
type tt_frame = @{
readme: ~[ast::token_tree],
mut idx: uint,
dotdotdoted: bool,
up: tt_frame_up
};
type tt_reader = @{
span_diagnostic: span_handler,
interner: @interner<@str>,
mut cur: tt_frame,
/* for MBE-style macro transcription */
interpolations: std::map::hashmap<ident, @arb_depth>,
mut repeat_idx: ~[mut uint],
mut repeat_len: ~[uint],
/* cached: */
mut cur_tok: token,
mut cur_span: span
};
/** This can do Macro-By-Example transcription. On the other hand, if
* `doc` contains no `tt_dotdotdot`s and `tt_interpolate`s, `interp` can (and
* should) be none. */
fn new_tt_reader(span_diagnostic: span_handler, itr: @interner<@str>,
interp: option<std::map::hashmap<ident,@arb_depth>>,
src: ~[ast::token_tree])
-> tt_reader {
let r = @{span_diagnostic: span_diagnostic, interner: itr,
mut cur: @{readme: src, mut idx: 0u, dotdotdoted: false,
up: tt_frame_up(option::none)},
interpolations: alt interp { /* just a convienience */
none { std::map::box_str_hash::<@arb_depth>() }
some(x) { x }
},
mut repeat_idx: ~[mut], mut repeat_len: ~[],
/* dummy values, never read: */
mut cur_tok: EOF,
mut cur_span: ast_util::mk_sp(0u,0u)
};
tt_next_token(r); /* get cur_tok and cur_span set up */
ret r;
}
pure fn dup_tt_frame(&&f: tt_frame) -> tt_frame {
@{readme: f.readme, mut idx: f.idx, dotdotdoted: f.dotdotdoted,
up: alt f.up {
tt_frame_up(some(up_frame)) {
tt_frame_up(some(dup_tt_frame(up_frame)))
}
tt_frame_up(none) { tt_frame_up(none) }
}
}
}
pure fn dup_tt_reader(&&r: tt_reader) -> tt_reader {
@{span_diagnostic: r.span_diagnostic, interner: r.interner,
mut cur: dup_tt_frame(r.cur),
interpolations: r.interpolations,
mut repeat_idx: copy r.repeat_idx, mut repeat_len: copy r.repeat_len,
mut cur_tok: r.cur_tok, mut cur_span: r.cur_span}
}
pure fn lookup_cur_ad_by_ad(r: tt_reader, start: @arb_depth) -> @arb_depth {
pure fn red(&&ad: @arb_depth, &&idx: uint) -> @arb_depth {
alt *ad {
leaf(_) { ad /* end of the line; duplicate henceforth */ }
seq(ads, _) { ads[idx] }
}
}
vec::foldl(start, r.repeat_idx, red)
}
fn lookup_cur_ad(r: tt_reader, name: ident) -> @arb_depth {
lookup_cur_ad_by_ad(r, r.interpolations.get(name))
}
enum lis {
lis_unconstrained, lis_constraint(uint, ident), lis_contradiction(str)
}
fn lockstep_iter_size(&&t: token_tree, &&r: tt_reader) -> lis {
fn lis_merge(lhs: lis, rhs: lis) -> lis {
alt lhs {
lis_unconstrained { rhs }
lis_contradiction(_) { lhs }
lis_constraint(l_len, l_id) {
alt rhs {
lis_unconstrained { lhs }
lis_contradiction(_) { rhs }
lis_constraint(r_len, _) if l_len == r_len { lhs }
lis_constraint(r_len, r_id) {
lis_contradiction(#fmt["Inconsistent lockstep iteration: \
'%s' has %u items, but '%s' has %u",
*l_id, l_len, *r_id, r_len])
}
}
}
}
}
alt t {
tt_delim(tts) | tt_dotdotdot(_, tts) {
vec::foldl(lis_unconstrained, tts, {|lis, tt|
lis_merge(lis, lockstep_iter_size(tt, r)) })
}
tt_flat(*) { lis_unconstrained }
tt_interpolate(_, name) {
alt *lookup_cur_ad(r, name) {
leaf(_) { lis_unconstrained }
seq(ads, _) { lis_constraint(ads.len(), name) }
}
}
}
}
fn tt_next_token(&&r: tt_reader) -> {tok: token, sp: span} {
let ret_val = { tok: r.cur_tok, sp: r.cur_span };
if r.cur.idx >= vec::len(r.cur.readme) {
/* done with this set; pop or repeat? */
if ! r.cur.dotdotdoted
|| r.repeat_idx.last() == r.repeat_len.last() - 1 {
if r.cur.dotdotdoted {
vec::pop(r.repeat_idx); vec::pop(r.repeat_len);
}
alt r.cur.up {
tt_frame_up(none) {
r.cur_tok = EOF;
ret ret_val;
}
tt_frame_up(some(tt_f)) {
r.cur = tt_f;
/* the outermost `if` would need to be a `while` if we
didn't know that the last thing in a `tt_delim` is always
a `tt_flat`, and that a `tt_dotdotdot` is never empty */
r.cur.idx += 1u;
}
}
} else {
r.cur.idx = 0u;
r.repeat_idx[r.repeat_idx.len() - 1u] += 1u;
}
}
/* if `tt_delim`s could be 0-length, we'd need to be able to switch
between popping and pushing until we got to an actual `tt_flat` */
loop { /* because it's easiest, this handles `tt_delim` not starting
with a `tt_flat`, even though it won't happen */
alt r.cur.readme[r.cur.idx] {
tt_delim(tts) {
r.cur = @{readme: tts, mut idx: 0u, dotdotdoted: false,
up: tt_frame_up(option::some(r.cur)) };
}
tt_flat(sp, tok) {
r.cur_span = sp; r.cur_tok = tok;
r.cur.idx += 1u;
ret ret_val;
}
tt_dotdotdot(sp, tts) {
alt lockstep_iter_size(tt_dotdotdot(sp, tts), r) {
lis_unconstrained {
r.span_diagnostic.span_fatal(
copy r.cur_span, /* blame macro writer */
"attempted to repeat an expression containing no syntax \
variables matched as repeating at this depth");
}
lis_contradiction(msg) { /* blame macro invoker */
r.span_diagnostic.span_fatal(sp, msg);
}
lis_constraint(len, _) {
vec::push(r.repeat_len, len);
vec::push(r.repeat_idx, 0u);
r.cur = @{readme: tts, mut idx: 0u, dotdotdoted: true,
up: tt_frame_up(option::some(r.cur)) };
}
}
}
// TODO: think about span stuff here
tt_interpolate(sp, ident) {
alt *lookup_cur_ad(r, ident) {
/* sidestep the interpolation tricks for ident because
(a) idents can be in lots of places, so it'd be a pain
(b) we actually can, since it's a token. */
leaf(w_ident(sn,b)) {
r.cur_span = sp; r.cur_tok = IDENT(sn,b);
r.cur.idx += 1u;
ret ret_val;
}
leaf(w_nt) {
r.cur_span = sp; r.cur_tok = ACTUALLY(w_nt);
r.cur.idx += 1u;
ret ret_val;
}
seq(*) {
r.span_diagnostic.span_fatal(
copy r.cur_span, /* blame the macro writer */
#fmt["variable '%s' is still repeating at this depth",
*ident]);
}
}
}
}
}
}