rust/crates/mbe/src/lib.rs

351 lines
11 KiB
Rust
Raw Normal View History

//! `mbe` (short for Macro By Example) crate contains code for handling
2020-08-12 09:46:20 -05:00
//! `macro_rules` macros. It uses `TokenTree` (from `tt` package) as the
//! interface, although it contains some code to bridge `SyntaxNode`s and
//! `TokenTree`s as well!
2021-10-09 06:48:38 -05:00
//!
2023-10-13 22:28:23 -05:00
//! The tests for this functionality live in another crate:
2021-10-09 06:48:38 -05:00
//! `hir_def::macro_expansion_tests::mbe`.
2019-01-31 12:29:04 -06:00
#![warn(rust_2018_idioms, unused_lifetimes)]
mod parser;
2021-01-29 06:23:38 -06:00
mod expander;
2019-01-31 12:29:04 -06:00
mod syntax_bridge;
mod tt_iter;
2021-12-25 12:59:02 -06:00
mod to_parser_input;
2019-01-30 14:17:32 -06:00
2021-02-05 05:57:32 -06:00
#[cfg(test)]
mod benchmark;
use stdx::impl_from;
use tt::Span;
2023-01-31 04:49:49 -06:00
use std::fmt;
use crate::{
parser::{MetaTemplate, MetaVarKind, Op},
tt_iter::TtIter,
};
// FIXME: we probably should re-think `token_tree_to_syntax_node` interfaces
2021-12-27 08:54:51 -06:00
pub use ::parser::TopEntryPoint;
2023-12-18 06:30:41 -06:00
pub use tt::{Delimiter, DelimiterKind, Punct};
2023-12-18 06:30:41 -06:00
pub use crate::syntax_bridge::{
parse_exprs_with_sep, parse_to_token_tree, parse_to_token_tree_static_span,
syntax_node_to_token_tree, syntax_node_to_token_tree_modified, token_tree_to_syntax_node,
SpanMapper,
2022-01-01 19:39:14 -06:00
};
2023-11-25 08:10:31 -06:00
pub use crate::syntax_bridge::dummy_test_span_utils::*;
#[derive(Debug, PartialEq, Eq, Clone)]
2019-03-03 03:40:03 -06:00
pub enum ParseError {
UnexpectedToken(Box<str>),
Expected(Box<str>),
InvalidRepeat,
2021-01-08 08:42:40 -06:00
RepetitionEmptyTokenTree,
2019-03-03 03:40:03 -06:00
}
impl ParseError {
fn expected(e: &str) -> ParseError {
ParseError::Expected(e.into())
}
fn unexpected(e: &str) -> ParseError {
ParseError::UnexpectedToken(e.into())
}
}
impl fmt::Display for ParseError {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
ParseError::UnexpectedToken(it) => f.write_str(it),
ParseError::Expected(it) => f.write_str(it),
ParseError::InvalidRepeat => f.write_str("invalid repeat"),
ParseError::RepetitionEmptyTokenTree => f.write_str("empty token tree in repetition"),
}
}
}
#[derive(Debug, PartialEq, Eq, Clone, Hash)]
2019-03-03 03:40:03 -06:00
pub enum ExpandError {
BindingError(Box<Box<str>>),
2023-11-17 12:07:31 -06:00
UnresolvedBinding(Box<Box<str>>),
LeftoverTokens,
ConversionError,
LimitExceeded,
2019-03-02 13:20:26 -06:00
NoMatchingRule,
UnexpectedToken,
CountError(CountError),
}
impl_from!(CountError for ExpandError);
impl ExpandError {
fn binding_error(e: impl Into<Box<str>>) -> ExpandError {
ExpandError::BindingError(Box::new(e.into()))
}
2020-03-26 11:41:44 -05:00
}
impl fmt::Display for ExpandError {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
ExpandError::NoMatchingRule => f.write_str("no rule matches input tokens"),
ExpandError::UnexpectedToken => f.write_str("unexpected token in input"),
ExpandError::BindingError(e) => f.write_str(e),
2023-11-17 12:07:31 -06:00
ExpandError::UnresolvedBinding(binding) => {
f.write_str("could not find binding ")?;
f.write_str(binding)
}
ExpandError::ConversionError => f.write_str("could not convert tokens"),
ExpandError::LimitExceeded => f.write_str("Expand exceed limit"),
ExpandError::LeftoverTokens => f.write_str("leftover tokens"),
ExpandError::CountError(e) => e.fmt(f),
}
}
}
// FIXME: Showing these errors could be nicer.
#[derive(Debug, PartialEq, Eq, Clone, Hash)]
pub enum CountError {
OutOfBounds,
Misplaced,
}
impl fmt::Display for CountError {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
CountError::OutOfBounds => f.write_str("${count} out of bounds"),
CountError::Misplaced => f.write_str("${count} misplaced"),
}
}
}
2019-02-11 10:07:49 -06:00
/// This struct contains AST for a single `macro_rules` definition. What might
2019-01-31 13:14:28 -06:00
/// be very confusing is that AST has almost exactly the same shape as
/// `tt::TokenTree`, but there's a crucial difference: in macro rules, `$ident`
/// and `$()*` have special meaning (see `Var` and `Repeat` data structures)
#[derive(Clone, Debug, PartialEq, Eq)]
pub struct DeclarativeMacro<S> {
rules: Box<[Rule<S>]>,
// This is used for correctly determining the behavior of the pat fragment
// FIXME: This should be tracked by hygiene of the fragment identifier!
is_2021: bool,
2023-07-10 09:23:29 -05:00
err: Option<Box<ParseError>>,
2021-01-25 15:15:47 -06:00
}
#[derive(Clone, Debug, PartialEq, Eq)]
struct Rule<S> {
lhs: MetaTemplate<S>,
rhs: MetaTemplate<S>,
2020-12-29 12:35:21 -06:00
}
impl<S: Span> DeclarativeMacro<S> {
pub fn from_err(err: ParseError, is_2021: bool) -> DeclarativeMacro<S> {
DeclarativeMacro { rules: Box::default(), is_2021, err: Some(Box::new(err)) }
2023-07-10 09:23:29 -05:00
}
2021-10-10 13:07:43 -05:00
/// The old, `macro_rules! m {}` flavor.
pub fn parse_macro_rules(
tt: &tt::Subtree<S>,
is_2021: bool,
// FIXME: Remove this once we drop support for rust 1.76 (defaults to true then)
new_meta_vars: bool,
) -> DeclarativeMacro<S> {
2019-09-22 15:39:29 -05:00
// Note: this parsing can be implemented using mbe machinery itself, by
// matching against `$($lhs:tt => $rhs:tt);*` pattern, but implementing
// manually seems easier.
let mut src = TtIter::new(tt);
let mut rules = Vec::new();
2023-07-10 09:23:29 -05:00
let mut err = None;
while src.len() > 0 {
let rule = match Rule::parse(&mut src, true, new_meta_vars) {
2023-07-10 09:23:29 -05:00
Ok(it) => it,
Err(e) => {
err = Some(Box::new(e));
break;
}
};
rules.push(rule);
if let Err(()) = src.expect_char(';') {
if src.len() > 0 {
2023-07-10 09:23:29 -05:00
err = Some(Box::new(ParseError::expected("expected `;`")));
}
break;
}
}
2019-09-22 15:39:29 -05:00
2022-01-01 19:39:14 -06:00
for Rule { lhs, .. } in &rules {
2023-07-10 09:23:29 -05:00
if let Err(e) = validate(lhs) {
err = Some(Box::new(e));
break;
}
2019-09-22 15:39:29 -05:00
}
DeclarativeMacro { rules: rules.into_boxed_slice(), is_2021, err }
2021-01-25 15:15:47 -06:00
}
2021-10-10 13:07:43 -05:00
/// The new, unstable `macro m {}` flavor.
pub fn parse_macro2(
tt: &tt::Subtree<S>,
is_2021: bool,
// FIXME: Remove this once we drop support for rust 1.76 (defaults to true then)
new_meta_vars: bool,
) -> DeclarativeMacro<S> {
2021-01-25 15:15:47 -06:00
let mut src = TtIter::new(tt);
let mut rules = Vec::new();
2023-07-10 09:23:29 -05:00
let mut err = None;
2021-01-25 15:15:47 -06:00
2023-01-31 04:49:49 -06:00
if tt::DelimiterKind::Brace == tt.delimiter.kind {
2021-03-08 14:19:44 -06:00
cov_mark::hit!(parse_macro_def_rules);
2021-01-25 15:15:47 -06:00
while src.len() > 0 {
let rule = match Rule::parse(&mut src, true, new_meta_vars) {
2023-07-10 09:23:29 -05:00
Ok(it) => it,
Err(e) => {
err = Some(Box::new(e));
break;
}
};
2021-01-25 15:15:47 -06:00
rules.push(rule);
2021-04-02 20:08:31 -05:00
if let Err(()) = src.expect_any_char(&[';', ',']) {
2021-01-25 15:15:47 -06:00
if src.len() > 0 {
2023-07-10 09:23:29 -05:00
err = Some(Box::new(ParseError::expected(
"expected `;` or `,` to delimit rules",
)));
2021-01-25 15:15:47 -06:00
}
break;
}
}
} else {
2021-03-08 14:19:44 -06:00
cov_mark::hit!(parse_macro_def_simple);
match Rule::parse(&mut src, false, new_meta_vars) {
2023-07-10 09:23:29 -05:00
Ok(rule) => {
if src.len() != 0 {
err = Some(Box::new(ParseError::expected("remaining tokens in macro def")));
}
rules.push(rule);
}
Err(e) => {
err = Some(Box::new(e));
}
2021-01-25 15:15:47 -06:00
}
}
2022-01-01 19:39:14 -06:00
for Rule { lhs, .. } in &rules {
2023-07-10 09:23:29 -05:00
if let Err(e) = validate(lhs) {
err = Some(Box::new(e));
break;
}
2021-01-25 15:15:47 -06:00
}
DeclarativeMacro { rules: rules.into_boxed_slice(), is_2021, err }
2019-01-31 13:14:28 -06:00
}
2023-07-10 09:23:29 -05:00
pub fn err(&self) -> Option<&ParseError> {
self.err.as_deref()
}
2023-11-17 12:07:31 -06:00
pub fn expand(
&self,
tt: &tt::Subtree<S>,
marker: impl Fn(&mut S) + Copy,
new_meta_vars: bool,
2023-11-17 12:07:31 -06:00
) -> ExpandResult<tt::Subtree<S>> {
expander::expand_rules(&self.rules, &tt, marker, self.is_2021, new_meta_vars)
}
2019-01-31 13:14:28 -06:00
}
impl<S: Span> Rule<S> {
fn parse(
src: &mut TtIter<'_, S>,
expect_arrow: bool,
new_meta_vars: bool,
) -> Result<Self, ParseError> {
let lhs = src.expect_subtree().map_err(|()| ParseError::expected("expected subtree"))?;
2021-01-25 15:15:47 -06:00
if expect_arrow {
src.expect_char('=').map_err(|()| ParseError::expected("expected `=`"))?;
src.expect_char('>').map_err(|()| ParseError::expected("expected `>`"))?;
2021-01-25 15:15:47 -06:00
}
let rhs = src.expect_subtree().map_err(|()| ParseError::expected("expected subtree"))?;
2020-12-29 12:35:21 -06:00
2021-10-02 12:21:23 -05:00
let lhs = MetaTemplate::parse_pattern(lhs)?;
let rhs = MetaTemplate::parse_template(rhs, new_meta_vars)?;
2020-12-29 12:35:21 -06:00
Ok(crate::Rule { lhs, rhs })
}
2019-04-24 10:01:32 -05:00
}
fn validate<S: Span>(pattern: &MetaTemplate<S>) -> Result<(), ParseError> {
2020-12-29 12:35:21 -06:00
for op in pattern.iter() {
match op {
2021-06-12 22:54:16 -05:00
Op::Subtree { tokens, .. } => validate(tokens)?,
2021-01-30 02:12:30 -06:00
Op::Repeat { tokens: subtree, separator, .. } => {
// Checks that no repetition which could match an empty token
// https://github.com/rust-lang/rust/blob/a58b1ed44f5e06976de2bdc4d7dc81c36a96934f/src/librustc_expand/mbe/macro_rules.rs#L558
2022-01-01 19:39:14 -06:00
let lsh_is_empty_seq = separator.is_none() && subtree.iter().all(|child_op| {
match *child_op {
2022-01-01 19:39:14 -06:00
// vis is optional
Op::Var { kind: Some(kind), .. } => kind == MetaVarKind::Vis,
2022-01-01 19:39:14 -06:00
Op::Repeat {
kind: parser::RepeatKind::ZeroOrMore | parser::RepeatKind::ZeroOrOne,
..
} => true,
_ => false,
}
});
if lsh_is_empty_seq {
return Err(ParseError::RepetitionEmptyTokenTree);
}
validate(subtree)?
}
_ => (),
}
}
Ok(())
2019-01-30 14:25:02 -06:00
}
2019-01-31 13:14:28 -06:00
pub type ExpandResult<T> = ValueResult<T, ExpandError>;
2020-11-26 09:04:23 -06:00
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct ValueResult<T, E> {
2020-11-26 09:04:23 -06:00
pub value: T,
pub err: Option<E>,
2020-11-26 09:04:23 -06:00
}
2020-03-16 06:22:10 -05:00
impl<T, E> ValueResult<T, E> {
2023-04-16 12:20:48 -05:00
pub fn new(value: T, err: E) -> Self {
Self { value, err: Some(err) }
2020-03-16 06:22:10 -05:00
}
2023-04-16 12:20:48 -05:00
pub fn ok(value: T) -> Self {
Self { value, err: None }
2023-01-31 04:49:49 -06:00
}
pub fn only_err(err: E) -> Self
2020-03-16 06:22:10 -05:00
where
T: Default,
{
2020-11-26 09:04:23 -06:00
Self { value: Default::default(), err: Some(err) }
2020-03-16 06:22:10 -05:00
}
pub fn map<U>(self, f: impl FnOnce(T) -> U) -> ValueResult<U, E> {
ValueResult { value: f(self.value), err: self.err }
}
pub fn map_err<E2>(self, f: impl FnOnce(E) -> E2) -> ValueResult<T, E2> {
ValueResult { value: self.value, err: self.err.map(f) }
2020-03-16 06:22:10 -05:00
}
pub fn result(self) -> Result<T, E> {
2021-06-07 06:59:01 -05:00
self.err.map_or(Ok(self.value), Err)
2020-03-16 06:22:10 -05:00
}
}
impl<T: Default, E> From<Result<T, E>> for ValueResult<T, E> {
fn from(result: Result<T, E>) -> Self {
2021-03-21 09:33:18 -05:00
result.map_or_else(Self::only_err, Self::ok)
2020-03-16 06:22:10 -05:00
}
}