rust/src/libsyntax/parse/common.rs

379 lines
11 KiB
Rust
Raw Normal View History

// Copyright 2012 The Rust Project Developers. See the COPYRIGHT
// file at the top-level directory of this distribution and at
// http://rust-lang.org/COPYRIGHT.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
use ast;
2013-01-30 09:56:33 -08:00
use codemap::{BytePos, spanned};
use parse::lexer::reader;
use parse::parser::Parser;
use parse::token;
use opt_vec;
use opt_vec::OptVec;
// SeqSep : a sequence separator (token)
2013-02-04 13:15:17 -08:00
// and whether a trailing separator is allowed.
pub struct SeqSep {
sep: Option<token::Token>,
trailing_sep_allowed: bool
}
2012-05-24 12:38:45 -07:00
pub fn seq_sep_trailing_disallowed(t: token::Token) -> SeqSep {
SeqSep {
2013-02-24 15:41:54 -08:00
sep: Some(t),
trailing_sep_allowed: false,
}
2012-05-24 12:38:45 -07:00
}
pub fn seq_sep_trailing_allowed(t: token::Token) -> SeqSep {
SeqSep {
2013-02-24 15:41:54 -08:00
sep: Some(t),
trailing_sep_allowed: true,
}
2012-05-24 12:38:45 -07:00
}
pub fn seq_sep_none() -> SeqSep {
SeqSep {
2013-02-24 15:41:54 -08:00
sep: None,
trailing_sep_allowed: false,
}
2012-05-24 12:38:45 -07:00
}
// maps any token back to a string. not necessary if you know it's
// an identifier....
pub fn token_to_str(reader: @reader, token: &token::Token) -> ~str {
token::to_str(reader.interner(), token)
}
pub impl Parser {
// convert a token to a string using self's reader
fn token_to_str(&self, token: &token::Token) -> ~str {
token::to_str(self.reader.interner(), token)
}
// convert the current token to a string using self's reader
fn this_token_to_str(&self) -> ~str {
self.token_to_str(self.token)
}
2013-03-02 13:02:27 -08:00
fn unexpected_last(&self, t: &token::Token) -> ! {
self.span_fatal(
*self.last_span,
2013-02-24 15:41:54 -08:00
fmt!(
"unexpected token: `%s`",
self.token_to_str(t)
2013-02-24 15:41:54 -08:00
)
);
}
2013-03-02 13:02:27 -08:00
fn unexpected(&self) -> ! {
2013-02-24 15:41:54 -08:00
self.fatal(
fmt!(
"unexpected token: `%s`",
self.this_token_to_str()
2013-02-24 15:41:54 -08:00
)
);
}
2013-02-04 13:15:17 -08:00
// expect and consume the token t. Signal an error if
// the next token is not t.
2013-03-02 13:02:27 -08:00
fn expect(&self, t: &token::Token) {
if *self.token == *t {
2012-05-24 12:38:45 -07:00
self.bump();
} else {
self.fatal(
fmt!(
"expected `%s` but found `%s`",
self.token_to_str(t),
self.this_token_to_str()
)
)
2012-05-24 12:38:45 -07:00
}
}
2013-03-02 13:02:27 -08:00
fn parse_ident(&self) -> ast::ident {
self.check_strict_keywords();
2012-09-11 19:26:48 -07:00
self.check_reserved_keywords();
match *self.token {
2013-02-24 15:41:54 -08:00
token::IDENT(i, _) => {
self.bump();
i
}
token::INTERPOLATED(token::nt_ident(*)) => {
self.bug(
~"ident interpolation not converted to real token"
);
}
_ => {
self.fatal(
fmt!(
"expected ident, found `%s`",
self.this_token_to_str()
2013-02-24 15:41:54 -08:00
)
);
}
2012-05-24 12:38:45 -07:00
}
}
2013-03-02 13:02:27 -08:00
fn parse_path_list_ident(&self) -> ast::path_list_ident {
2012-05-24 12:38:45 -07:00
let lo = self.span.lo;
let ident = self.parse_ident();
let hi = self.span.hi;
spanned(lo, hi, ast::path_list_ident_ { name: ident,
id: self.get_id() })
}
2013-02-04 13:15:17 -08:00
// consume token 'tok' if it exists. Returns true if the given
// token was present, false otherwise.
2013-03-02 13:02:27 -08:00
fn eat(&self, tok: &token::Token) -> bool {
2013-02-24 09:54:41 -08:00
return if *self.token == *tok { self.bump(); true } else { false };
2012-05-24 12:38:45 -07:00
}
2012-07-18 16:18:02 -07:00
// Storing keywords as interned idents instead of strings would be nifty.
2012-05-24 12:38:45 -07:00
// A sanity check that the word we are asking for is a known keyword
// NOTE: this could be done statically....
2013-03-02 13:02:27 -08:00
fn require_keyword(&self, word: &~str) {
2013-03-21 15:41:37 -04:00
if !self.keywords.contains(word) {
self.bug(fmt!("unknown keyword: %s", *word));
2012-05-24 12:38:45 -07:00
}
}
// return true when this token represents the given string, and is not
// followed immediately by :: .
fn token_is_word(&self, word: &~str, tok: &token::Token) -> bool {
match *tok {
2013-02-24 20:51:56 -08:00
token::IDENT(sid, false) => { *self.id_to_str(sid) == *word }
_ => { false }
2012-05-24 12:38:45 -07:00
}
}
2013-03-02 13:02:27 -08:00
fn token_is_keyword(&self, word: &~str, tok: &token::Token) -> bool {
2012-07-30 16:33:02 -07:00
self.require_keyword(word);
self.token_is_word(word, tok)
}
2013-03-02 13:02:27 -08:00
fn is_keyword(&self, word: &~str) -> bool {
self.token_is_keyword(word, &copy *self.token)
2012-05-24 12:38:45 -07:00
}
fn id_is_any_keyword(&self, id: ast::ident) -> bool {
self.keywords.contains(self.id_to_str(id))
}
2013-03-02 13:02:27 -08:00
fn is_any_keyword(&self, tok: &token::Token) -> bool {
match *tok {
2012-08-03 19:59:04 -07:00
token::IDENT(sid, false) => {
2013-03-21 15:41:37 -04:00
self.keywords.contains(self.id_to_str(sid))
}
2012-08-03 19:59:04 -07:00
_ => false
}
}
2013-03-08 10:19:19 -08:00
// if the given word is not a keyword, signal an error.
// if the next token is the given keyword, eat it and return
// true. Otherwise, return false.
2013-03-02 13:02:27 -08:00
fn eat_keyword(&self, word: &~str) -> bool {
2012-05-24 12:38:45 -07:00
self.require_keyword(word);
let is_kw = match *self.token {
2013-02-24 20:51:56 -08:00
token::IDENT(sid, false) => *word == *self.id_to_str(sid),
_ => false
2012-07-25 19:13:58 -07:00
};
if is_kw { self.bump() }
is_kw
}
2013-03-08 10:19:19 -08:00
// if the given word is not a keyword, signal an error.
// if the next token is not the given word, signal an error.
// otherwise, eat it.
2013-03-02 13:02:27 -08:00
fn expect_keyword(&self, word: &~str) {
2012-05-24 12:38:45 -07:00
self.require_keyword(word);
if !self.eat_keyword(word) {
2013-02-24 15:41:54 -08:00
self.fatal(
fmt!(
"expected `%s`, found `%s`",
*word,
self.this_token_to_str()
2013-02-24 15:41:54 -08:00
)
);
2012-06-12 10:59:50 -07:00
}
}
2013-03-08 10:19:19 -08:00
// return true if the given string is a strict keyword
2013-03-02 13:02:27 -08:00
fn is_strict_keyword(&self, word: &~str) -> bool {
2013-03-21 15:41:37 -04:00
self.strict_keywords.contains(word)
}
2013-03-08 10:19:19 -08:00
// signal an error if the current token is a strict keyword
2013-03-02 13:02:27 -08:00
fn check_strict_keywords(&self) {
match *self.token {
token::IDENT(_, false) => {
let w = token_to_str(self.reader, &copy *self.token);
self.check_strict_keywords_(&w);
}
_ => ()
}
}
2013-03-08 10:19:19 -08:00
// signal an error if the given string is a strict keyword
2013-03-02 13:02:27 -08:00
fn check_strict_keywords_(&self, w: &~str) {
if self.is_strict_keyword(w) {
2013-02-24 15:41:54 -08:00
self.fatal(fmt!("found `%s` in ident position", *w));
}
}
2013-03-08 10:19:19 -08:00
// return true if this is a reserved keyword
2013-03-02 13:02:27 -08:00
fn is_reserved_keyword(&self, word: &~str) -> bool {
2013-03-21 15:41:37 -04:00
self.reserved_keywords.contains(word)
2012-09-11 19:26:48 -07:00
}
2013-03-08 10:19:19 -08:00
// signal an error if the current token is a reserved keyword
2013-03-02 13:02:27 -08:00
fn check_reserved_keywords(&self) {
match *self.token {
token::IDENT(_, false) => {
let w = token_to_str(self.reader, &copy *self.token);
self.check_reserved_keywords_(&w);
}
_ => ()
2012-09-11 19:26:48 -07:00
}
}
2013-03-08 10:19:19 -08:00
// signal an error if the given string is a reserved keyword
2013-03-02 13:02:27 -08:00
fn check_reserved_keywords_(&self, w: &~str) {
2012-09-11 19:26:48 -07:00
if self.is_reserved_keyword(w) {
2013-02-24 15:41:54 -08:00
self.fatal(fmt!("`%s` is a reserved keyword", *w));
2012-09-11 19:26:48 -07:00
}
}
2013-02-04 13:15:17 -08:00
// expect and consume a GT. if a >> is seen, replace it
2013-03-08 10:19:19 -08:00
// with a single > and continue. If a GT is not seen,
// signal an error.
2013-03-02 13:02:27 -08:00
fn expect_gt(&self) {
if *self.token == token::GT {
2012-05-24 12:38:45 -07:00
self.bump();
} else if *self.token == token::BINOP(token::SHR) {
2013-02-24 15:41:54 -08:00
self.replace_token(
token::GT,
self.span.lo + BytePos(1u),
self.span.hi
);
2012-05-24 12:38:45 -07:00
} else {
let mut s: ~str = ~"expected `";
s += self.token_to_str(&token::GT);
s += ~"`, found `";
s += self.this_token_to_str();
s += ~"`";
2012-05-24 12:38:45 -07:00
self.fatal(s);
}
}
2013-02-04 13:15:17 -08:00
// parse a sequence bracketed by '<' and '>', stopping
// before the '>'.
2013-02-24 15:41:54 -08:00
fn parse_seq_to_before_gt<T: Copy>(
2013-03-02 13:02:27 -08:00
&self,
2013-02-24 15:41:54 -08:00
sep: Option<token::Token>,
f: &fn(&Parser) -> T
) -> OptVec<T> {
2012-05-24 12:38:45 -07:00
let mut first = true;
let mut v = opt_vec::Empty;
while *self.token != token::GT
&& *self.token != token::BINOP(token::SHR) {
2012-08-06 12:34:08 -07:00
match sep {
Some(ref t) => {
2012-08-03 19:59:04 -07:00
if first { first = false; }
else { self.expect(t); }
2012-08-03 19:59:04 -07:00
}
_ => ()
2012-05-24 12:38:45 -07:00
}
2013-03-02 13:02:27 -08:00
v.push(f(self));
2012-05-24 12:38:45 -07:00
}
2012-08-01 17:30:05 -07:00
return v;
2012-05-24 12:38:45 -07:00
}
2013-02-24 15:41:54 -08:00
fn parse_seq_to_gt<T: Copy>(
2013-03-02 13:02:27 -08:00
&self,
2013-02-24 15:41:54 -08:00
sep: Option<token::Token>,
f: &fn(&Parser) -> T
) -> OptVec<T> {
2012-05-24 12:38:45 -07:00
let v = self.parse_seq_to_before_gt(sep, f);
self.expect_gt();
2012-08-01 17:30:05 -07:00
return v;
2012-05-24 12:38:45 -07:00
}
2013-02-04 13:15:17 -08:00
// parse a sequence, including the closing delimiter. The function
// f must consume tokens until reaching the next separator or
// closing bracket.
2013-02-24 15:41:54 -08:00
fn parse_seq_to_end<T: Copy>(
2013-03-02 13:02:27 -08:00
&self,
ket: &token::Token,
2013-02-24 15:41:54 -08:00
sep: SeqSep,
f: &fn(&Parser) -> T
2013-02-24 15:41:54 -08:00
) -> ~[T] {
2012-05-24 12:38:45 -07:00
let val = self.parse_seq_to_before_end(ket, sep, f);
self.bump();
2013-02-24 15:41:54 -08:00
val
2012-05-24 12:38:45 -07:00
}
2013-02-04 13:15:17 -08:00
// parse a sequence, not including the closing delimiter. The function
// f must consume tokens until reaching the next separator or
// closing bracket.
2013-02-24 15:41:54 -08:00
fn parse_seq_to_before_end<T: Copy>(
2013-03-02 13:02:27 -08:00
&self,
ket: &token::Token,
2013-02-24 15:41:54 -08:00
sep: SeqSep,
f: &fn(&Parser) -> T
2013-02-24 15:41:54 -08:00
) -> ~[T] {
2012-05-24 12:38:45 -07:00
let mut first: bool = true;
let mut v: ~[T] = ~[];
while *self.token != *ket {
2012-08-06 12:34:08 -07:00
match sep.sep {
Some(ref t) => {
2012-08-03 19:59:04 -07:00
if first { first = false; }
else { self.expect(t); }
2012-08-03 19:59:04 -07:00
}
_ => ()
2012-05-24 12:38:45 -07:00
}
if sep.trailing_sep_allowed && *self.token == *ket { break; }
2013-03-02 13:02:27 -08:00
v.push(f(self));
}
return v;
}
2013-02-04 13:15:17 -08:00
// parse a sequence, including the closing delimiter. The function
// f must consume tokens until reaching the next separator or
// closing bracket.
2013-02-24 15:41:54 -08:00
fn parse_unspanned_seq<T: Copy>(
2013-03-02 13:02:27 -08:00
&self,
bra: &token::Token,
ket: &token::Token,
2013-02-24 15:41:54 -08:00
sep: SeqSep,
f: &fn(&Parser) -> T
2013-02-24 15:41:54 -08:00
) -> ~[T] {
self.expect(bra);
2013-02-24 15:41:54 -08:00
let result = self.parse_seq_to_before_end(ket, sep, f);
self.bump();
2013-02-24 15:41:54 -08:00
result
}
// NB: Do not use this function unless you actually plan to place the
// spanned list in the AST.
2013-02-24 15:41:54 -08:00
fn parse_seq<T: Copy>(
2013-03-02 13:02:27 -08:00
&self,
bra: &token::Token,
ket: &token::Token,
2013-02-24 15:41:54 -08:00
sep: SeqSep,
f: &fn(&Parser) -> T
2013-02-24 15:41:54 -08:00
) -> spanned<~[T]> {
2012-05-24 12:38:45 -07:00
let lo = self.span.lo;
self.expect(bra);
2013-02-24 15:41:54 -08:00
let result = self.parse_seq_to_before_end(ket, sep, f);
2012-05-24 12:38:45 -07:00
let hi = self.span.hi;
self.bump();
2013-02-24 15:41:54 -08:00
spanned(lo, hi, result)
2012-05-24 12:38:45 -07:00
}
2012-06-07 21:53:47 -07:00
}