rust-analyzer/crates/ra_mbe/src/lib.rs

214 lines
6.4 KiB
Rust
Raw Normal View History

//! `mbe` (short for Macro By Example) crate contains code for handling
//! `macro_rules` macros. It uses `TokenTree` (from `ra_tt` package) as the
//! interface, although it contains some code to bridge `SyntaxNode`s and
//! `TokenTree`s as well!
2019-01-31 18:29:04 +00:00
mod parser;
2019-01-31 18:09:43 +00:00
mod mbe_expander;
2019-01-31 18:29:04 +00:00
mod syntax_bridge;
mod tt_iter;
2019-04-07 13:42:53 +00:00
mod subtree_source;
2019-01-30 20:17:32 +00:00
2019-01-31 18:09:43 +00:00
pub use tt::{Delimiter, Punct};
2019-01-30 20:25:02 +00:00
use crate::{
parser::{parse_pattern, Op},
tt_iter::TtIter,
};
2019-03-02 19:20:26 +00:00
#[derive(Debug, PartialEq, Eq)]
2019-03-03 09:40:03 +00:00
pub enum ParseError {
2019-03-03 11:45:30 +00:00
Expected(String),
2019-03-03 09:40:03 +00:00
}
#[derive(Debug, PartialEq, Eq)]
pub enum ExpandError {
2019-03-02 19:20:26 +00:00
NoMatchingRule,
UnexpectedToken,
BindingError(String),
ConversionError,
InvalidRepeat,
2019-03-02 19:20:26 +00:00
}
pub use crate::syntax_bridge::{
2020-03-08 16:13:04 +00:00
ast_to_token_tree, parse_to_token_tree, syntax_node_to_token_tree, token_tree_to_syntax_node,
TokenMap,
};
2019-01-31 10:46:40 +00:00
2019-02-11 16:07:49 +00:00
/// This struct contains AST for a single `macro_rules` definition. What might
2019-01-31 19:14:28 +00:00
/// be very confusing is that AST has almost exactly the same shape as
/// `tt::TokenTree`, but there's a crucial difference: in macro rules, `$ident`
/// and `$()*` have special meaning (see `Var` and `Repeat` data structures)
#[derive(Clone, Debug, PartialEq, Eq)]
2019-01-31 10:40:05 +00:00
pub struct MacroRules {
rules: Vec<Rule>,
2019-11-04 15:22:18 +00:00
/// Highest id of the token we have in TokenMap
shift: Shift,
2019-01-30 20:17:32 +00:00
}
#[derive(Clone, Debug, PartialEq, Eq)]
struct Rule {
lhs: tt::Subtree,
rhs: tt::Subtree,
}
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
struct Shift(u32);
impl Shift {
fn new(tt: &tt::Subtree) -> Shift {
// Note that TokenId is started from zero,
// We have to add 1 to prevent duplication.
let value = max_id(tt).map_or(0, |it| it + 1);
return Shift(value);
// Find the max token id inside a subtree
fn max_id(subtree: &tt::Subtree) -> Option<u32> {
subtree
.token_trees
.iter()
.filter_map(|tt| match tt {
tt::TokenTree::Subtree(subtree) => {
let tree_id = max_id(subtree);
match subtree.delimiter {
Some(it) if it.id != tt::TokenId::unspecified() => {
Some(tree_id.map_or(it.id.0, |t| t.max(it.id.0)))
}
_ => tree_id,
}
}
tt::TokenTree::Leaf(tt::Leaf::Ident(ident))
if ident.id != tt::TokenId::unspecified() =>
{
Some(ident.id.0)
}
_ => None,
})
.max()
}
}
/// Shift given TokenTree token id
fn shift_all(self, tt: &mut tt::Subtree) {
for t in tt.token_trees.iter_mut() {
match t {
tt::TokenTree::Leaf(leaf) => match leaf {
tt::Leaf::Ident(ident) => ident.id = self.shift(ident.id),
tt::Leaf::Punct(punct) => punct.id = self.shift(punct.id),
tt::Leaf::Literal(lit) => lit.id = self.shift(lit.id),
},
tt::TokenTree::Subtree(tt) => {
2019-12-20 20:14:30 +00:00
if let Some(it) = tt.delimiter.as_mut() {
it.id = self.shift(it.id);
};
self.shift_all(tt)
}
2019-11-04 17:01:05 +00:00
}
}
}
2019-11-04 15:22:18 +00:00
fn shift(self, id: tt::TokenId) -> tt::TokenId {
if id == tt::TokenId::unspecified() {
return id;
2019-11-04 15:22:18 +00:00
}
tt::TokenId(id.0 + self.0)
}
fn unshift(self, id: tt::TokenId) -> Option<tt::TokenId> {
id.0.checked_sub(self.0).map(tt::TokenId)
2019-11-04 15:22:18 +00:00
}
}
#[derive(Debug, Eq, PartialEq)]
pub enum Origin {
Def,
Call,
}
2019-01-31 19:14:28 +00:00
impl MacroRules {
2019-03-03 09:40:03 +00:00
pub fn parse(tt: &tt::Subtree) -> Result<MacroRules, ParseError> {
2019-09-22 20:39:29 +00:00
// Note: this parsing can be implemented using mbe machinery itself, by
// matching against `$($lhs:tt => $rhs:tt);*` pattern, but implementing
// manually seems easier.
let mut src = TtIter::new(tt);
let mut rules = Vec::new();
while src.len() > 0 {
let rule = Rule::parse(&mut src)?;
rules.push(rule);
if let Err(()) = src.expect_char(';') {
if src.len() > 0 {
return Err(ParseError::Expected("expected `:`".to_string()));
}
break;
}
}
2019-09-22 20:39:29 +00:00
for rule in rules.iter() {
validate(&rule.lhs)?;
}
Ok(MacroRules { rules, shift: Shift::new(tt) })
2019-01-31 19:14:28 +00:00
}
2019-11-04 15:22:18 +00:00
2019-03-03 09:40:03 +00:00
pub fn expand(&self, tt: &tt::Subtree) -> Result<tt::Subtree, ExpandError> {
2019-11-04 15:22:18 +00:00
// apply shift
let mut tt = tt.clone();
self.shift.shift_all(&mut tt);
2019-11-04 15:22:18 +00:00
mbe_expander::expand(self, &tt)
2019-01-31 19:14:28 +00:00
}
pub fn map_id_down(&self, id: tt::TokenId) -> tt::TokenId {
self.shift.shift(id)
}
pub fn map_id_up(&self, id: tt::TokenId) -> (tt::TokenId, Origin) {
match self.shift.unshift(id) {
Some(id) => (id, Origin::Call),
None => (id, Origin::Def),
}
}
2019-01-31 19:14:28 +00:00
}
impl Rule {
fn parse(src: &mut TtIter) -> Result<Rule, ParseError> {
let mut lhs = src
.expect_subtree()
.map_err(|()| ParseError::Expected("expected subtree".to_string()))?
.clone();
2019-12-13 13:53:34 +00:00
lhs.delimiter = None;
src.expect_char('=').map_err(|()| ParseError::Expected("expected `=`".to_string()))?;
src.expect_char('>').map_err(|()| ParseError::Expected("expected `>`".to_string()))?;
let mut rhs = src
.expect_subtree()
.map_err(|()| ParseError::Expected("expected subtree".to_string()))?
.clone();
2019-12-13 13:53:34 +00:00
rhs.delimiter = None;
Ok(crate::Rule { lhs, rhs })
}
2019-04-24 15:01:32 +00:00
}
fn validate(pattern: &tt::Subtree) -> Result<(), ParseError> {
for op in parse_pattern(pattern) {
let op = match op {
Ok(it) => it,
Err(e) => {
let msg = match e {
ExpandError::InvalidRepeat => "invalid repeat".to_string(),
_ => "invalid macro definition".to_string(),
};
return Err(ParseError::Expected(msg));
}
};
match op {
Op::TokenTree(tt::TokenTree::Subtree(subtree)) | Op::Repeat { subtree, .. } => {
validate(subtree)?
}
_ => (),
}
}
Ok(())
2019-01-30 20:25:02 +00:00
}
2019-01-31 19:14:28 +00:00
#[cfg(test)]
mod tests;