rust-analyzer/crates/ra_mbe/src/lib.rs

//! `mbe` (short for Macro By Example) crate contains code for handling
//! `macro_rules` macros. It uses `TokenTree` (from `ra_tt` package) as the
//! interface, although it contains some code to bridge `SyntaxNode`s and
//! `TokenTree`s as well!

mod parser;
mod mbe_expander;
mod syntax_bridge;
mod tt_iter;
mod subtree_source;

pub use tt::{Delimiter, Punct};

use crate::{
    parser::{parse_pattern, Op},
    tt_iter::TtIter,
};

/// Error produced when a `macro_rules` definition cannot be parsed
/// (returned by `MacroRules::parse`).
#[derive(Debug, PartialEq, Eq)]
pub enum ParseError {
    /// Carries a human-readable message describing what went wrong, e.g.
    /// "expected subtree" or "invalid repeat".
    Expected(String),
}

/// Error produced while expanding a macro call (returned by
/// `MacroRules::expand`).
#[derive(Debug, PartialEq, Eq)]
pub enum ExpandError {
    NoMatchingRule,
    UnexpectedToken,
    BindingError(String),
    ConversionError,
    /// Also surfaced while validating a definition: `validate` reports it as
    /// the "invalid repeat" parse error.
    InvalidRepeat,
}

pub use crate::syntax_bridge::{
    ast_to_token_tree, syntax_node_to_token_tree, token_tree_to_syntax_node, TokenMap,
};

/// This struct contains AST for a single `macro_rules` definition. What might
/// be very confusing is that AST has almost exactly the same shape as
/// `tt::TokenTree`, but there's a crucial difference: in macro rules, `$ident`
/// and `$()*` have special meaning (see `Var` and `Repeat` data structures).
#[derive(Clone, Debug, PartialEq, Eq)]
pub struct MacroRules {
    /// The `lhs => rhs` rules, in the order they were parsed.
    rules: Vec<Rule>,
    /// Offset added to the token ids of a macro call before expansion. It is
    /// one more than the highest identifier token id found in the definition
    /// (or zero if there is none), so call-site ids never collide with
    /// definition ids.
    shift: Shift,
}

/// A single `lhs => rhs` rule of a `macro_rules` definition.
///
/// `Rule::parse` stores both sides with their outer delimiter set to `None`.
#[derive(Clone, Debug, PartialEq, Eq)]
struct Rule {
    /// The pattern side of the rule (left of `=>`).
    lhs: tt::Subtree,
    /// The template side of the rule (right of `=>`).
    rhs: tt::Subtree,
}

/// Offset that is added to token ids (see `Shift::shift`) and subtracted
/// again (see `Shift::unshift`).
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
struct Shift(u32);

impl Shift {
    /// Builds the shift for the given token tree: one past the largest
    /// identifier token id it contains, or zero when it contains none.
    fn new(tt: &tt::Subtree) -> Shift {
        /// Largest specified identifier token id in `subtree`, searching
        /// nested subtrees recursively. `None` if there is no such id.
        fn max_id(subtree: &tt::Subtree) -> Option<u32> {
            let mut highest = None;
            for child in subtree.token_trees.iter() {
                let candidate = match child {
                    tt::TokenTree::Subtree(nested) => max_id(nested),
                    tt::TokenTree::Leaf(tt::Leaf::Ident(ident))
                        if ident.id != tt::TokenId::unspecified() =>
                    {
                        Some(ident.id.0)
                    }
                    _ => None,
                };
                // `None` orders below every `Some`, so children without an
                // id never lower the running maximum.
                highest = highest.max(candidate);
            }
            highest
        }

        // Token ids start at zero, so the first free id is `max + 1`.
        match max_id(tt) {
            Some(max) => Shift(max + 1),
            None => Shift(0),
        }
    }

    /// Shifts the id of every identifier in `tt`, including those inside
    /// nested subtrees. Other leaves are left as they are.
    fn shift_all(self, tt: &mut tt::Subtree) {
        for child in tt.token_trees.iter_mut() {
            match child {
                tt::TokenTree::Leaf(tt::Leaf::Ident(ident)) => ident.id = self.shift(ident.id),
                tt::TokenTree::Leaf(_) => {}
                tt::TokenTree::Subtree(nested) => self.shift_all(nested),
            }
        }
    }

    /// Adds this shift to `id`. An unspecified id is returned unchanged.
    fn shift(self, id: tt::TokenId) -> tt::TokenId {
        if id == tt::TokenId::unspecified() {
            id
        } else {
            tt::TokenId(id.0 + self.0)
        }
    }

    /// Subtracts this shift from `id`, or returns `None` when `id` is smaller
    /// than the shift.
    fn unshift(self, id: tt::TokenId) -> Option<tt::TokenId> {
        let raw = id.0.checked_sub(self.0)?;
        Some(tt::TokenId(raw))
    }
}

/// Tells which side a token id passed to `MacroRules::map_id_up` belongs to.
#[derive(Debug, Eq, PartialEq)]
pub enum Origin {
    /// The id is below the macro's shift, so it could not be un-shifted; it
    /// is reported as is.
    Def,
    /// The id is at or above the macro's shift; it is reported with the shift
    /// removed.
    Call,
}

impl MacroRules {
    /// Parses the body of a `macro_rules` definition: a sequence of
    /// `lhs => rhs` rules separated by `;` (a trailing `;` is allowed).
    ///
    /// Returns a `ParseError` if a rule is malformed, if two rules are not
    /// separated by `;`, or if the pattern side of a rule does not validate.
    pub fn parse(tt: &tt::Subtree) -> Result<MacroRules, ParseError> {
        // Note: this parsing can be implemented using mbe machinery itself, by
        // matching against `$($lhs:tt => $rhs:tt);*` pattern, but implementing
        // manually seems easier.
        let mut src = TtIter::new(tt);
        let mut rules = Vec::new();
        while src.len() > 0 {
            let rule = Rule::parse(&mut src)?;
            rules.push(rule);
            if let Err(()) = src.expect_char(';') {
                // No separator: fine at the end of input, an error if more
                // tokens follow the rule.
                if src.len() > 0 {
                    return Err(ParseError::Expected("expected `;`".to_string()));
                }
                break;
            }
        }

        for rule in rules.iter() {
            validate(&rule.lhs)?;
        }

        Ok(MacroRules { rules, shift: Shift::new(tt) })
    }

    /// Expands a macro call with the given argument token tree.
    ///
    /// The argument is cloned and its identifier token ids are shifted before
    /// expansion; the caller's tree is not modified.
    pub fn expand(&self, tt: &tt::Subtree) -> Result<tt::Subtree, ExpandError> {
        // apply shift
        let mut tt = tt.clone();
        self.shift.shift_all(&mut tt);
        mbe_expander::expand(self, &tt)
    }

    /// Maps a call-site token id to the id it has after the shift applied by
    /// `expand`. An unspecified id is returned unchanged.
    pub fn map_id_down(&self, id: tt::TokenId) -> tt::TokenId {
        self.shift.shift(id)
    }

    /// Maps a token id back across the shift. Ids at or above the shift are
    /// un-shifted and tagged `Origin::Call`; smaller ids are returned as is
    /// and tagged `Origin::Def`.
    pub fn map_id_up(&self, id: tt::TokenId) -> (tt::TokenId, Origin) {
        match self.shift.unshift(id) {
            Some(id) => (id, Origin::Call),
            None => (id, Origin::Def),
        }
    }
}

impl Rule {
    fn parse(src: &mut TtIter) -> Result<Rule, ParseError> {
        let mut lhs = src
            .expect_subtree()
            .map_err(|()| ParseError::Expected("expected subtree".to_string()))?
            .clone();
        lhs.delimiter = None;
        src.expect_char('=').map_err(|()| ParseError::Expected("expected `=`".to_string()))?;
        src.expect_char('>').map_err(|()| ParseError::Expected("expected `>`".to_string()))?;
        let mut rhs = src
            .expect_subtree()
            .map_err(|()| ParseError::Expected("expected subtree".to_string()))?
            .clone();
        rhs.delimiter = None;
        Ok(crate::Rule { lhs, rhs })
    }
}

/// Checks that `pattern` parses as a macro pattern, descending into nested
/// subtrees and repetitions.
///
/// Any parsing failure is converted into `ParseError::Expected`, with the
/// message "invalid repeat" for `ExpandError::InvalidRepeat` and
/// "invalid macro definition" for everything else.
fn validate(pattern: &tt::Subtree) -> Result<(), ParseError> {
    for parsed in parse_pattern(pattern) {
        let op = parsed.map_err(|err| {
            let msg = match err {
                ExpandError::InvalidRepeat => "invalid repeat",
                _ => "invalid macro definition",
            };
            ParseError::Expected(msg.to_string())
        })?;

        // Only ops that contain a nested subtree need further checking.
        if let Op::TokenTree(tt::TokenTree::Subtree(subtree)) | Op::Repeat { subtree, .. } = op {
            validate(subtree)?;
        }
    }
    Ok(())
}

#[cfg(test)]
mod tests;
Added test for check doc strings in crates. #1856 2019-09-30 08:58:53 +00:00			//! `mbe` (short for Macro By Example) crate contains code for handling
			//! `macro_rules` macros. It uses `TokenTree` (from `ra_tt` package) as the
			//! interface, although it contains some code to bridge `SyntaxNode`s and
			//! `TokenTree`s as well!
move test 2019-01-31 18:29:04 +00:00
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`mod parser;`
split macros across crates 2019-01-31 18:09:43 +00:00			`mod mbe_expander;`
move test 2019-01-31 18:29:04 +00:00			`mod syntax_bridge;`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`mod tt_iter;`
Refactoring subtree_source 2019-04-07 13:42:53 +00:00			`mod subtree_source;`
add macro by example ide 2019-01-30 20:17:32 +00:00
split macros across crates 2019-01-31 18:09:43 +00:00			`pub use tt::{Delimiter, Punct};`
add conversion boilerplate 2019-01-30 20:25:02 +00:00
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`use crate::{`
			`parser::{parse_pattern, Op},`
			`tt_iter::TtIter,`
			`};`

Replace option with result in mbe 2019-03-02 19:20:26 +00:00			`#[derive(Debug, PartialEq, Eq)]`
Split parse and expand errors 2019-03-03 09:40:03 +00:00			`pub enum ParseError {`
Add parser unit tests 2019-03-03 11:45:30 +00:00			`Expected(String),`
Split parse and expand errors 2019-03-03 09:40:03 +00:00			`}`

			`#[derive(Debug, PartialEq, Eq)]`
			`pub enum ExpandError {`
Replace option with result in mbe 2019-03-02 19:20:26 +00:00			`NoMatchingRule,`
			`UnexpectedToken,`
			`BindingError(String),`
Add MacroItems and MacroStmts in grammer.ron 2019-04-18 18:47:29 +00:00			`ConversionError,`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`InvalidRepeat,`
Replace option with result in mbe 2019-03-02 19:20:26 +00:00			`}`

Add MacroItems and MacroStmts in grammer.ron 2019-04-18 18:47:29 +00:00			`pub use crate::syntax_bridge::{`
Collapse TokenMap and RevTokenMap 2019-11-18 13:08:41 +00:00			`ast_to_token_tree, syntax_node_to_token_tree, token_tree_to_syntax_node, TokenMap,`
Add MacroItems and MacroStmts in grammer.ron 2019-04-18 18:47:29 +00:00			`};`
reshuffle 2019-01-31 10:46:40 +00:00
typo 2019-02-11 16:07:49 +00:00			/// This struct contains AST for a single `macro_rules` definition. What might
cleanup the api 2019-01-31 19:14:28 +00:00			`/// be very confusing is that AST has almost exactly the same shape as`
			/// `tt::TokenTree`, but there's a crucial difference: in macro rules, `$ident`
			/// and `$()*` have special meaning (see `Var` and `Repeat` data structures)
add name resolution from the old impl unlike the old impl, this also handles macro imports across crates 2019-03-13 13:04:28 +00:00			`#[derive(Clone, Debug, PartialEq, Eq)]`
move macros to a separate crate 2019-01-31 10:40:05 +00:00			`pub struct MacroRules {`
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`rules: Vec<Rule>,`
Add TokenId Shif in macro_rules 2019-11-04 15:22:18 +00:00			`/// Highest id of the token we have in TokenMap`
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`shift: Shift,`
add macro by example ide 2019-01-30 20:17:32 +00:00			`}`

use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`#[derive(Clone, Debug, PartialEq, Eq)]`
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`struct Rule {`
			`lhs: tt::Subtree,`
			`rhs: tt::Subtree,`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`}`

Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`#[derive(Clone, Copy, Debug, PartialEq, Eq)]`
			`struct Shift(u32);`

			`impl Shift {`
			`fn new(tt: &tt::Subtree) -> Shift {`
			`// Note that TokenId is started from zero,`
			`// We have to add 1 to prevent duplication.`
			`let value = max_id(tt).map_or(0, \|it\| it + 1);`
			`return Shift(value);`

			`// Find the max token id inside a subtree`
			`fn max_id(subtree: &tt::Subtree) -> Option<u32> {`
			`subtree`
			`.token_trees`
			`.iter()`
			`.filter_map(\|tt\| match tt {`
			`tt::TokenTree::Subtree(subtree) => max_id(subtree),`
			`tt::TokenTree::Leaf(tt::Leaf::Ident(ident))`
			`if ident.id != tt::TokenId::unspecified() =>`
			`{`
			`Some(ident.id.0)`
			`}`
			`_ => None,`
			`})`
			`.max()`
			`}`
			`}`

			`/// Shift given TokenTree token id`
			`fn shift_all(self, tt: &mut tt::Subtree) {`
			`for t in tt.token_trees.iter_mut() {`
			`match t {`
			`tt::TokenTree::Leaf(leaf) => match leaf {`
			`tt::Leaf::Ident(ident) => ident.id = self.shift(ident.id),`
			`_ => (),`
			`},`
			`tt::TokenTree::Subtree(tt) => self.shift_all(tt),`
Refactor and rename 2019-11-04 17:01:05 +00:00			`}`
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`}`
			`}`
Add TokenId Shif in macro_rules 2019-11-04 15:22:18 +00:00
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`fn shift(self, id: tt::TokenId) -> tt::TokenId {`
			`if id == tt::TokenId::unspecified() {`
			`return id;`
Add TokenId Shif in macro_rules 2019-11-04 15:22:18 +00:00			`}`
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`tt::TokenId(id.0 + self.0)`
			`}`

			`fn unshift(self, id: tt::TokenId) -> Option<tt::TokenId> {`
			`id.0.checked_sub(self.0).map(tt::TokenId)`
Add TokenId Shif in macro_rules 2019-11-04 15:22:18 +00:00			`}`
			`}`

Re-export Origin to replace ExpansionOrigin 2019-12-14 17:46:39 +00:00			`#[derive(Debug, Eq, PartialEq)]`
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`pub enum Origin {`
			`Def,`
			`Call,`
			`}`

cleanup the api 2019-01-31 19:14:28 +00:00			`impl MacroRules {`
Split parse and expand errors 2019-03-03 09:40:03 +00:00			`pub fn parse(tt: &tt::Subtree) -> Result<MacroRules, ParseError> {`
minor cleanup 2019-09-22 20:39:29 +00:00			`// Note: this parsing can be implemented using mbe machinery itself, by`
			// matching against `$($lhs:tt => $rhs:tt);*` pattern, but implementing
			`// manually seems easier.`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`let mut src = TtIter::new(tt);`
			`let mut rules = Vec::new();`
			`while src.len() > 0 {`
			`let rule = Rule::parse(&mut src)?;`
			`rules.push(rule);`
			`if let Err(()) = src.expect_char(';') {`
			`if src.len() > 0 {`
			return Err(ParseError::Expected("expected `:`".to_string()));
			`}`
			`break;`
			`}`
			`}`
minor cleanup 2019-09-22 20:39:29 +00:00
			`for rule in rules.iter() {`
			`validate(&rule.lhs)?;`
			`}`

Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`Ok(MacroRules { rules, shift: Shift::new(tt) })`
cleanup the api 2019-01-31 19:14:28 +00:00			`}`
Add TokenId Shif in macro_rules 2019-11-04 15:22:18 +00:00
Split parse and expand errors 2019-03-03 09:40:03 +00:00			`pub fn expand(&self, tt: &tt::Subtree) -> Result<tt::Subtree, ExpandError> {`
Add TokenId Shif in macro_rules 2019-11-04 15:22:18 +00:00			`// apply shift`
			`let mut tt = tt.clone();`
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`self.shift.shift_all(&mut tt);`
Add TokenId Shif in macro_rules 2019-11-04 15:22:18 +00:00			`mbe_expander::expand(self, &tt)`
cleanup the api 2019-01-31 19:14:28 +00:00			`}`
Use macro_rules shift to map text ranges 2019-11-04 18:09:16 +00:00
Make shift an implementation detail of mbe 2019-11-17 16:11:43 +00:00			`pub fn map_id_down(&self, id: tt::TokenId) -> tt::TokenId {`
			`self.shift.shift(id)`
			`}`

			`pub fn map_id_up(&self, id: tt::TokenId) -> (tt::TokenId, Origin) {`
			`match self.shift.unshift(id) {`
			`Some(id) => (id, Origin::Call),`
			`None => (id, Origin::Def),`
			`}`
Use macro_rules shift to map text ranges 2019-11-04 18:09:16 +00:00			`}`
cleanup the api 2019-01-31 19:14:28 +00:00			`}`

use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`impl Rule {`
			`fn parse(src: &mut TtIter) -> Result<Rule, ParseError> {`
			`let mut lhs = src`
			`.expect_subtree()`
			`.map_err(\|()\| ParseError::Expected("expected subtree".to_string()))?`
			`.clone();`
Refactor tt::Delimiter 2019-12-13 13:53:34 +00:00			`lhs.delimiter = None;`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			src.expect_char('=').map_err(\|()\| ParseError::Expected("expected `=`".to_string()))?;
			src.expect_char('>').map_err(\|()\| ParseError::Expected("expected `>`".to_string()))?;
			`let mut rhs = src`
			`.expect_subtree()`
			`.map_err(\|()\| ParseError::Expected("expected subtree".to_string()))?`
			`.clone();`
Refactor tt::Delimiter 2019-12-13 13:53:34 +00:00			`rhs.delimiter = None;`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`Ok(crate::Rule { lhs, rhs })`
			`}`
Add handling `token` seperator in mbe 2019-04-24 15:01:32 +00:00			`}`
Add empty bindings and some refactoring 2019-05-02 15:23:14 +00:00
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`fn validate(pattern: &tt::Subtree) -> Result<(), ParseError> {`
			`for op in parse_pattern(pattern) {`
			`let op = match op {`
			`Ok(it) => it,`
			`Err(e) => {`
			`let msg = match e {`
			`ExpandError::InvalidRepeat => "invalid repeat".to_string(),`
			`_ => "invalid macro definition".to_string(),`
			`};`
			`return Err(ParseError::Expected(msg));`
			`}`
			`};`
			`match op {`
			`Op::TokenTree(tt::TokenTree::Subtree(subtree)) \| Op::Repeat { subtree, .. } => {`
			`validate(subtree)?`
Add empty bindings and some refactoring 2019-05-02 15:23:14 +00:00			`}`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`_ => (),`
Add empty bindings and some refactoring 2019-05-02 15:23:14 +00:00			`}`
			`}`
use usual token tree for macro expansion 2019-09-16 23:54:22 +00:00			`Ok(())`
add conversion boilerplate 2019-01-30 20:25:02 +00:00			`}`
cleanup the api 2019-01-31 19:14:28 +00:00
			`#[cfg(test)]`
By pass unbind $var while mbe expanding 2019-05-03 15:23:21 +00:00			`mod tests;`