rust/crates/ra_syntax/src/parsing/text_tree_sink.rs

170 lines
5.1 KiB
Rust
Raw Normal View History

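//! Implements `TreeSink` for `TextTreeSink`, which forwards parser events and
//! the matching token text to a `SyntaxTreeBuilder` and decides which trivia
//! tokens get attached to which node.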
2019-02-21 15:24:42 +03:00
use std::mem;
use ra_parser::{ParseError, TreeSink};
2019-02-21 13:37:32 +03:00
2018-10-15 19:55:32 +03:00
use crate::{
2019-02-21 13:37:32 +03:00
parsing::Token,
2019-02-23 16:55:01 +03:00
syntax_node::GreenNode,
SmolStr, SyntaxError,
SyntaxKind::{self, *},
SyntaxTreeBuilder, TextRange, TextUnit,
2018-07-29 13:51:55 +03:00
};
2019-02-20 16:16:14 +03:00
2019-02-21 15:24:42 +03:00
/// Bridges the parser with our specific syntax tree representation.
///
2019-02-23 16:07:29 +03:00
/// `TextTreeSink` also handles attachment of trivia (whitespace) to nodes.
pub(crate) struct TextTreeSink<'a> {
text: &'a str,
tokens: &'a [Token],
2019-02-20 23:17:07 +03:00
text_pos: TextUnit,
token_pos: usize,
2019-02-21 15:24:42 +03:00
state: State,
2019-02-23 16:55:01 +03:00
inner: SyntaxTreeBuilder,
2018-07-29 13:51:55 +03:00
}
2019-02-21 15:24:42 +03:00
/// Bookkeeping for events whose effect on the builder is postponed.
enum State {
    /// Initial state: no node has been started yet. The first `start_node`
    /// call opens the node directly, without any trivia handling.
    PendingStart,
    /// Nothing is postponed.
    Normal,
    /// `finish_node` was requested but has not been forwarded to the builder
    /// yet; it is forwarded when the next event arrives.
    PendingFinish,
}
2019-02-23 16:07:29 +03:00
impl<'a> TreeSink for TextTreeSink<'a> {
2019-03-30 13:25:53 +03:00
fn token(&mut self, kind: SyntaxKind, n_tokens: u8) {
2019-02-21 15:24:42 +03:00
match mem::replace(&mut self.state, State::Normal) {
State::PendingStart => unreachable!(),
2019-03-30 13:25:53 +03:00
State::PendingFinish => self.inner.finish_node(),
2019-02-21 15:24:42 +03:00
State::Normal => (),
}
self.eat_trivias();
let n_tokens = n_tokens as usize;
let len = self.tokens[self.token_pos..self.token_pos + n_tokens]
.iter()
.map(|it| it.len)
.sum::<TextUnit>();
2019-03-30 13:25:53 +03:00
self.do_token(kind, len, n_tokens);
2018-07-29 13:51:55 +03:00
}
2019-03-30 13:25:53 +03:00
fn start_node(&mut self, kind: SyntaxKind) {
2019-02-21 15:24:42 +03:00
match mem::replace(&mut self.state, State::Normal) {
State::PendingStart => {
2019-03-30 13:25:53 +03:00
self.inner.start_node(kind);
2019-02-21 15:24:42 +03:00
// No need to attach trivias to previous node: there is no
// previous node.
return;
}
2019-03-30 13:25:53 +03:00
State::PendingFinish => self.inner.finish_node(),
2019-02-21 15:24:42 +03:00
State::Normal => (),
}
2019-02-21 15:24:42 +03:00
let n_trivias =
self.tokens[self.token_pos..].iter().take_while(|it| it.kind.is_trivia()).count();
let leading_trivias = &self.tokens[self.token_pos..self.token_pos + n_trivias];
let mut trivia_end =
self.text_pos + leading_trivias.iter().map(|it| it.len).sum::<TextUnit>();
let n_attached_trivias = {
let leading_trivias = leading_trivias.iter().rev().map(|it| {
let next_end = trivia_end - it.len;
let range = TextRange::from_to(next_end, trivia_end);
trivia_end = next_end;
(it.kind, &self.text[range])
});
n_attached_trivias(kind, leading_trivias)
};
self.eat_n_trivias(n_trivias - n_attached_trivias);
2019-03-30 13:25:53 +03:00
self.inner.start_node(kind);
self.eat_n_trivias(n_attached_trivias);
2018-07-29 13:51:55 +03:00
}
2019-03-30 13:25:53 +03:00
fn finish_node(&mut self) {
2019-02-21 15:24:42 +03:00
match mem::replace(&mut self.state, State::PendingFinish) {
State::PendingStart => unreachable!(),
2019-03-30 13:25:53 +03:00
State::PendingFinish => self.inner.finish_node(),
2019-02-21 15:24:42 +03:00
State::Normal => (),
}
2018-07-29 13:51:55 +03:00
}
2019-02-20 23:17:07 +03:00
fn error(&mut self, error: ParseError) {
2019-02-23 16:55:01 +03:00
self.inner.error(error, self.text_pos)
2018-07-29 13:51:55 +03:00
}
}
2019-02-23 16:07:29 +03:00
impl<'a> TextTreeSink<'a> {
pub(super) fn new(text: &'a str, tokens: &'a [Token]) -> TextTreeSink<'a> {
TextTreeSink {
text,
tokens,
text_pos: 0.into(),
token_pos: 0,
2019-02-21 15:24:42 +03:00
state: State::PendingStart,
2019-02-23 16:55:01 +03:00
inner: SyntaxTreeBuilder::default(),
}
}
2019-02-21 13:37:32 +03:00
2019-02-21 15:24:42 +03:00
pub(super) fn finish(mut self) -> (GreenNode, Vec<SyntaxError>) {
match mem::replace(&mut self.state, State::Normal) {
State::PendingFinish => {
self.eat_trivias();
2019-03-30 13:25:53 +03:00
self.inner.finish_node()
2019-02-21 15:24:42 +03:00
}
State::PendingStart | State::Normal => unreachable!(),
}
2019-02-23 16:55:01 +03:00
self.inner.finish_raw()
2019-02-21 13:37:32 +03:00
}
fn eat_trivias(&mut self) {
while let Some(&token) = self.tokens.get(self.token_pos) {
if !token.kind.is_trivia() {
break;
}
2019-03-30 13:25:53 +03:00
self.do_token(token.kind, token.len, 1);
}
}
fn eat_n_trivias(&mut self, n: usize) {
for _ in 0..n {
let token = self.tokens[self.token_pos];
assert!(token.kind.is_trivia());
2019-03-30 13:25:53 +03:00
self.do_token(token.kind, token.len, 1);
}
}
2019-03-30 13:25:53 +03:00
fn do_token(&mut self, kind: SyntaxKind, len: TextUnit, n_tokens: usize) {
let range = TextRange::offset_len(self.text_pos, len);
let text: SmolStr = self.text[range].into();
self.text_pos += len;
self.token_pos += n_tokens;
2019-03-30 13:25:53 +03:00
self.inner.token(kind, text);
}
}
/// Computes how many of the trivia preceding a node of `kind` should be
/// attached to that node.
///
/// `trivias` yields `(kind, text)` pairs; `start_node` passes them starting
/// with the trivia closest to the node. Only the item-like kinds listed below
/// attach anything. For those, the result reaches up to and including the last
/// comment seen before a whitespace token containing a blank line (`"\n\n"`),
/// or before the trivia run ends.
fn n_attached_trivias<'a>(
    kind: SyntaxKind,
    trivias: impl Iterator<Item = (SyntaxKind, &'a str)>,
) -> usize {
    match kind {
        MACRO_CALL | CONST_DEF | TYPE_ALIAS_DEF | STRUCT_DEF | ENUM_DEF | ENUM_VARIANT | FN_DEF
        | TRAIT_DEF | MODULE | RECORD_FIELD_DEF => {}
        // Every other kind of node never takes leading trivia with it.
        _ => return 0,
    }

    let mut attached = 0;
    for (idx, (trivia_kind, trivia_text)) in trivias.enumerate() {
        match trivia_kind {
            // A blank line separates the node from anything further away.
            WHITESPACE if trivia_text.contains("\n\n") => break,
            // Attach everything up to and including this comment.
            COMMENT => attached = idx + 1,
            _ => {}
        }
    }
    attached
}