2019-09-30 03:58:53 -05:00
|
|
|
//! See [`TextTokenSource`]: an implementation of [`ra_parser::TokenSource`]
//! backed by a text string and its lexed tokens.
|
|
|
|
|
2019-05-25 07:31:53 -05:00
|
|
|
use ra_parser::Token as PToken;
|
2019-07-04 15:05:17 -05:00
|
|
|
use ra_parser::TokenSource;
|
2019-02-21 04:37:32 -06:00
|
|
|
|
2019-07-04 15:05:17 -05:00
|
|
|
use crate::{parsing::lexer::Token, SyntaxKind::EOF, TextRange, TextUnit};
|
2018-02-04 05:35:59 -06:00
|
|
|
|
2019-02-23 07:07:29 -06:00
|
|
|
/// A `TokenSource` over a borrowed text and its lexed tokens.
///
/// Trivia (whitespace and comments) is filtered out at construction time, so
/// `start_offsets` and `tokens` are parallel vectors over the *significant*
/// tokens only, and `curr.1` indexes into both.
pub(crate) struct TextTokenSource<'t> {
    /// The full source text; sliced via `start_offsets`/token lengths to
    /// recover a token's text (e.g. for keyword checks).
    text: &'t str,
    /// start position of each token (except whitespace and comment)
    /// ```non-rust
    /// struct Foo;
    /// ^------^---
    /// |      |  ^-
    /// 0      7  10
    /// ```
    /// (token, start_offset): `[(struct, 0), (Foo, 7), (;, 10)]`
    start_offsets: Vec<TextUnit>,
    /// non-whitespace/comment tokens
    /// ```non-rust
    /// struct Foo {}
    /// ^^^^^^ ^^^ ^^
    /// ```
    /// tokens: `[struct, Foo, {, }]`
    tokens: Vec<Token>,
    /// Current token and position (index into `tokens`/`start_offsets`)
    curr: (PToken, usize),
}
|
|
|
|
|
2019-02-23 07:07:29 -06:00
|
|
|
impl<'t> TokenSource for TextTokenSource<'t> {
|
2019-05-25 07:31:53 -05:00
|
|
|
fn current(&self) -> PToken {
|
2019-07-04 12:26:44 -05:00
|
|
|
self.curr.0
|
2019-02-20 12:50:07 -06:00
|
|
|
}
|
2019-05-25 07:31:53 -05:00
|
|
|
|
|
|
|
fn lookahead_nth(&self, n: usize) -> PToken {
|
|
|
|
mk_token(self.curr.1 + n, &self.start_offsets, &self.tokens)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn bump(&mut self) {
|
|
|
|
if self.curr.0.kind == EOF {
|
|
|
|
return;
|
2019-02-20 12:50:07 -06:00
|
|
|
}
|
2019-05-25 07:31:53 -05:00
|
|
|
|
|
|
|
let pos = self.curr.1 + 1;
|
|
|
|
self.curr = (mk_token(pos, &self.start_offsets, &self.tokens), pos);
|
2019-02-20 12:50:07 -06:00
|
|
|
}
|
2019-05-25 07:31:53 -05:00
|
|
|
|
|
|
|
fn is_keyword(&self, kw: &str) -> bool {
|
|
|
|
let pos = self.curr.1;
|
2020-02-18 06:53:02 -06:00
|
|
|
if pos >= self.tokens.len() {
|
2019-02-20 12:50:07 -06:00
|
|
|
return false;
|
|
|
|
}
|
2019-02-20 13:58:56 -06:00
|
|
|
let range = TextRange::offset_len(self.start_offsets[pos], self.tokens[pos].len);
|
2019-02-20 12:50:07 -06:00
|
|
|
self.text[range] == *kw
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-05-25 07:31:53 -05:00
|
|
|
fn mk_token(pos: usize, start_offsets: &[TextUnit], tokens: &[Token]) -> PToken {
|
|
|
|
let kind = tokens.get(pos).map(|t| t.kind).unwrap_or(EOF);
|
|
|
|
let is_jointed_to_next = if pos + 1 < start_offsets.len() {
|
|
|
|
start_offsets[pos] + tokens[pos].len == start_offsets[pos + 1]
|
|
|
|
} else {
|
|
|
|
false
|
|
|
|
};
|
|
|
|
|
|
|
|
PToken { kind, is_jointed_to_next }
|
|
|
|
}
|
|
|
|
|
2019-02-23 07:07:29 -06:00
|
|
|
impl<'t> TextTokenSource<'t> {
|
2018-12-31 07:30:37 -06:00
|
|
|
/// Generate input from tokens(expect comment and whitespace).
|
2019-02-23 07:07:29 -06:00
|
|
|
pub fn new(text: &'t str, raw_tokens: &'t [Token]) -> TextTokenSource<'t> {
|
2018-02-04 05:35:59 -06:00
|
|
|
let mut tokens = Vec::new();
|
|
|
|
let mut start_offsets = Vec::new();
|
2018-07-28 05:07:10 -05:00
|
|
|
let mut len = 0.into();
|
2018-02-04 05:35:59 -06:00
|
|
|
for &token in raw_tokens.iter() {
|
2018-07-29 07:16:07 -05:00
|
|
|
if !token.kind.is_trivia() {
|
2018-02-04 05:35:59 -06:00
|
|
|
tokens.push(token);
|
|
|
|
start_offsets.push(len);
|
|
|
|
}
|
|
|
|
len += token.len;
|
|
|
|
}
|
|
|
|
|
2019-05-25 07:31:53 -05:00
|
|
|
let first = mk_token(0, &start_offsets, &tokens);
|
|
|
|
TextTokenSource { text, start_offsets, tokens, curr: (first, 0) }
|
2018-02-04 05:35:59 -06:00
|
|
|
}
|
|
|
|
}
|