mirror of
https://github.com/rust-lang/rust-analyzer
synced 2025-01-19 16:44:21 +00:00
334 lines
11 KiB
Rust
334 lines
11 KiB
Rust
//! Parser recognizes special macro syntax, `$var` and `$(repeat)*`, in token
|
|
//! trees.
|
|
|
|
use smallvec::{smallvec, SmallVec};
|
|
use syntax::SmolStr;
|
|
|
|
use crate::{tt, tt_iter::TtIter, ParseError};
|
|
|
|
/// Consider
|
|
///
|
|
/// ```
|
|
/// macro_rules! an_macro {
|
|
/// ($x:expr + $y:expr) => ($y * $x)
|
|
/// }
|
|
/// ```
|
|
///
|
|
/// Stuff to the left of `=>` is a [`MetaTemplate`] pattern (which is matched
|
|
/// with input).
|
|
///
|
|
/// Stuff to the right is a [`MetaTemplate`] template which is used to produce
|
|
/// output.
|
|
#[derive(Clone, Debug, PartialEq, Eq)]
|
|
pub(crate) struct MetaTemplate(pub(crate) Box<[Op]>);
|
|
|
|
impl MetaTemplate {
|
|
pub(crate) fn parse_pattern(pattern: &tt::Subtree) -> Result<MetaTemplate, ParseError> {
|
|
MetaTemplate::parse(pattern, Mode::Pattern)
|
|
}
|
|
|
|
pub(crate) fn parse_template(template: &tt::Subtree) -> Result<MetaTemplate, ParseError> {
|
|
MetaTemplate::parse(template, Mode::Template)
|
|
}
|
|
|
|
pub(crate) fn iter(&self) -> impl Iterator<Item = &Op> {
|
|
self.0.iter()
|
|
}
|
|
|
|
fn parse(tt: &tt::Subtree, mode: Mode) -> Result<MetaTemplate, ParseError> {
|
|
let mut src = TtIter::new(tt);
|
|
|
|
let mut res = Vec::new();
|
|
while let Some(first) = src.peek_n(0) {
|
|
let op = next_op(first, &mut src, mode)?;
|
|
res.push(op);
|
|
}
|
|
|
|
Ok(MetaTemplate(res.into_boxed_slice()))
|
|
}
|
|
}
|
|
|
|
#[derive(Clone, Debug, PartialEq, Eq)]
|
|
pub(crate) enum Op {
|
|
Var { name: SmolStr, kind: Option<MetaVarKind>, id: tt::TokenId },
|
|
Ignore { name: SmolStr, id: tt::TokenId },
|
|
Index { depth: usize },
|
|
Count { name: SmolStr, depth: Option<usize> },
|
|
Repeat { tokens: MetaTemplate, kind: RepeatKind, separator: Option<Separator> },
|
|
Subtree { tokens: MetaTemplate, delimiter: tt::Delimiter },
|
|
Literal(tt::Literal),
|
|
Punct(SmallVec<[tt::Punct; 3]>),
|
|
Ident(tt::Ident),
|
|
}
|
|
|
|
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
|
|
pub(crate) enum RepeatKind {
|
|
ZeroOrMore,
|
|
OneOrMore,
|
|
ZeroOrOne,
|
|
}
|
|
|
|
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
|
|
pub(crate) enum MetaVarKind {
|
|
Path,
|
|
Ty,
|
|
Pat,
|
|
PatParam,
|
|
Stmt,
|
|
Block,
|
|
Meta,
|
|
Item,
|
|
Vis,
|
|
Expr,
|
|
Ident,
|
|
Tt,
|
|
Lifetime,
|
|
Literal,
|
|
}
|
|
|
|
#[derive(Clone, Debug, Eq)]
|
|
pub(crate) enum Separator {
|
|
Literal(tt::Literal),
|
|
Ident(tt::Ident),
|
|
Puncts(SmallVec<[tt::Punct; 3]>),
|
|
}
|
|
|
|
// Note that when we compare a Separator, we just care about its textual value.
|
|
impl PartialEq for Separator {
|
|
fn eq(&self, other: &Separator) -> bool {
|
|
use Separator::*;
|
|
|
|
match (self, other) {
|
|
(Ident(a), Ident(b)) => a.text == b.text,
|
|
(Literal(a), Literal(b)) => a.text == b.text,
|
|
(Puncts(a), Puncts(b)) if a.len() == b.len() => {
|
|
let a_iter = a.iter().map(|a| a.char);
|
|
let b_iter = b.iter().map(|b| b.char);
|
|
a_iter.eq(b_iter)
|
|
}
|
|
_ => false,
|
|
}
|
|
}
|
|
}
|
|
|
|
#[derive(Clone, Copy)]
|
|
enum Mode {
|
|
Pattern,
|
|
Template,
|
|
}
|
|
|
|
fn next_op(
|
|
first_peeked: &tt::TokenTree,
|
|
src: &mut TtIter<'_>,
|
|
mode: Mode,
|
|
) -> Result<Op, ParseError> {
|
|
let res = match first_peeked {
|
|
tt::TokenTree::Leaf(tt::Leaf::Punct(p @ tt::Punct { char: '$', .. })) => {
|
|
src.next().expect("first token already peeked");
|
|
// Note that the '$' itself is a valid token inside macro_rules.
|
|
let second = match src.next() {
|
|
None => return Ok(Op::Punct(smallvec![*p])),
|
|
Some(it) => it,
|
|
};
|
|
match second {
|
|
tt::TokenTree::Subtree(subtree) => match subtree.delimiter.kind {
|
|
tt::DelimiterKind::Parenthesis => {
|
|
let (separator, kind) = parse_repeat(src)?;
|
|
let tokens = MetaTemplate::parse(subtree, mode)?;
|
|
Op::Repeat { tokens, separator, kind }
|
|
}
|
|
tt::DelimiterKind::Brace => match mode {
|
|
Mode::Template => {
|
|
parse_metavar_expr(&mut TtIter::new(subtree)).map_err(|()| {
|
|
ParseError::unexpected("invalid metavariable expression")
|
|
})?
|
|
}
|
|
Mode::Pattern => {
|
|
return Err(ParseError::unexpected(
|
|
"`${}` metavariable expressions are not allowed in matchers",
|
|
))
|
|
}
|
|
},
|
|
_ => {
|
|
return Err(ParseError::expected(
|
|
"expected `$()` repetition or `${}` expression",
|
|
))
|
|
}
|
|
},
|
|
tt::TokenTree::Leaf(leaf) => match leaf {
|
|
tt::Leaf::Ident(ident) if ident.text == "crate" => {
|
|
// We simply produce identifier `$crate` here. And it will be resolved when lowering ast to Path.
|
|
Op::Ident(tt::Ident { text: "$crate".into(), span: ident.span })
|
|
}
|
|
tt::Leaf::Ident(ident) => {
|
|
let kind = eat_fragment_kind(src, mode)?;
|
|
let name = ident.text.clone();
|
|
let id = ident.span;
|
|
Op::Var { name, kind, id }
|
|
}
|
|
tt::Leaf::Literal(lit) if is_boolean_literal(lit) => {
|
|
let kind = eat_fragment_kind(src, mode)?;
|
|
let name = lit.text.clone();
|
|
let id = lit.span;
|
|
Op::Var { name, kind, id }
|
|
}
|
|
tt::Leaf::Punct(punct @ tt::Punct { char: '$', .. }) => match mode {
|
|
Mode::Pattern => {
|
|
return Err(ParseError::unexpected(
|
|
"`$$` is not allowed on the pattern side",
|
|
))
|
|
}
|
|
Mode::Template => Op::Punct(smallvec![*punct]),
|
|
},
|
|
tt::Leaf::Punct(_) | tt::Leaf::Literal(_) => {
|
|
return Err(ParseError::expected("expected ident"))
|
|
}
|
|
},
|
|
}
|
|
}
|
|
|
|
tt::TokenTree::Leaf(tt::Leaf::Literal(it)) => {
|
|
src.next().expect("first token already peeked");
|
|
Op::Literal(it.clone())
|
|
}
|
|
|
|
tt::TokenTree::Leaf(tt::Leaf::Ident(it)) => {
|
|
src.next().expect("first token already peeked");
|
|
Op::Ident(it.clone())
|
|
}
|
|
|
|
tt::TokenTree::Leaf(tt::Leaf::Punct(_)) => {
|
|
// There's at least one punct so this shouldn't fail.
|
|
let puncts = src.expect_glued_punct().unwrap();
|
|
Op::Punct(puncts)
|
|
}
|
|
|
|
tt::TokenTree::Subtree(subtree) => {
|
|
src.next().expect("first token already peeked");
|
|
let tokens = MetaTemplate::parse(subtree, mode)?;
|
|
Op::Subtree { tokens, delimiter: subtree.delimiter }
|
|
}
|
|
};
|
|
Ok(res)
|
|
}
|
|
|
|
fn eat_fragment_kind(src: &mut TtIter<'_>, mode: Mode) -> Result<Option<MetaVarKind>, ParseError> {
|
|
if let Mode::Pattern = mode {
|
|
src.expect_char(':').map_err(|()| ParseError::unexpected("missing fragment specifier"))?;
|
|
let ident = src
|
|
.expect_ident()
|
|
.map_err(|()| ParseError::unexpected("missing fragment specifier"))?;
|
|
let kind = match ident.text.as_str() {
|
|
"path" => MetaVarKind::Path,
|
|
"ty" => MetaVarKind::Ty,
|
|
"pat" => MetaVarKind::Pat,
|
|
"pat_param" => MetaVarKind::PatParam,
|
|
"stmt" => MetaVarKind::Stmt,
|
|
"block" => MetaVarKind::Block,
|
|
"meta" => MetaVarKind::Meta,
|
|
"item" => MetaVarKind::Item,
|
|
"vis" => MetaVarKind::Vis,
|
|
"expr" => MetaVarKind::Expr,
|
|
"ident" => MetaVarKind::Ident,
|
|
"tt" => MetaVarKind::Tt,
|
|
"lifetime" => MetaVarKind::Lifetime,
|
|
"literal" => MetaVarKind::Literal,
|
|
_ => return Ok(None),
|
|
};
|
|
return Ok(Some(kind));
|
|
};
|
|
Ok(None)
|
|
}
|
|
|
|
fn is_boolean_literal(lit: &tt::Literal) -> bool {
|
|
matches!(lit.text.as_str(), "true" | "false")
|
|
}
|
|
|
|
fn parse_repeat(src: &mut TtIter<'_>) -> Result<(Option<Separator>, RepeatKind), ParseError> {
|
|
let mut separator = Separator::Puncts(SmallVec::new());
|
|
for tt in src {
|
|
let tt = match tt {
|
|
tt::TokenTree::Leaf(leaf) => leaf,
|
|
tt::TokenTree::Subtree(_) => return Err(ParseError::InvalidRepeat),
|
|
};
|
|
let has_sep = match &separator {
|
|
Separator::Puncts(puncts) => !puncts.is_empty(),
|
|
_ => true,
|
|
};
|
|
match tt {
|
|
tt::Leaf::Ident(_) | tt::Leaf::Literal(_) if has_sep => {
|
|
return Err(ParseError::InvalidRepeat)
|
|
}
|
|
tt::Leaf::Ident(ident) => separator = Separator::Ident(ident.clone()),
|
|
tt::Leaf::Literal(lit) => separator = Separator::Literal(lit.clone()),
|
|
tt::Leaf::Punct(punct) => {
|
|
let repeat_kind = match punct.char {
|
|
'*' => RepeatKind::ZeroOrMore,
|
|
'+' => RepeatKind::OneOrMore,
|
|
'?' => RepeatKind::ZeroOrOne,
|
|
_ => match &mut separator {
|
|
Separator::Puncts(puncts) if puncts.len() != 3 => {
|
|
puncts.push(*punct);
|
|
continue;
|
|
}
|
|
_ => return Err(ParseError::InvalidRepeat),
|
|
},
|
|
};
|
|
return Ok((has_sep.then_some(separator), repeat_kind));
|
|
}
|
|
}
|
|
}
|
|
Err(ParseError::InvalidRepeat)
|
|
}
|
|
|
|
fn parse_metavar_expr(src: &mut TtIter<'_>) -> Result<Op, ()> {
|
|
let func = src.expect_ident()?;
|
|
let args = src.expect_subtree()?;
|
|
|
|
if args.delimiter.kind != tt::DelimiterKind::Parenthesis {
|
|
return Err(());
|
|
}
|
|
|
|
let mut args = TtIter::new(args);
|
|
|
|
let op = match &*func.text {
|
|
"ignore" => {
|
|
let ident = args.expect_ident()?;
|
|
Op::Ignore { name: ident.text.clone(), id: ident.span }
|
|
}
|
|
"index" => Op::Index { depth: parse_depth(&mut args)? },
|
|
"count" => {
|
|
let ident = args.expect_ident()?;
|
|
// `${count(t)}` and `${count(t,)}` have different meanings. Not sure if this is a bug
|
|
// but that's how it's implemented in rustc as of this writing. See rust-lang/rust#111904.
|
|
let depth = if try_eat_comma(&mut args) { Some(parse_depth(&mut args)?) } else { None };
|
|
Op::Count { name: ident.text.clone(), depth }
|
|
}
|
|
_ => return Err(()),
|
|
};
|
|
|
|
if args.next().is_some() {
|
|
return Err(());
|
|
}
|
|
|
|
Ok(op)
|
|
}
|
|
|
|
fn parse_depth(src: &mut TtIter<'_>) -> Result<usize, ()> {
|
|
if src.len() == 0 {
|
|
Ok(0)
|
|
} else if let tt::Leaf::Literal(lit) = src.expect_literal()? {
|
|
// Suffixes are not allowed.
|
|
lit.text.parse().map_err(|_| ())
|
|
} else {
|
|
Err(())
|
|
}
|
|
}
|
|
|
|
fn try_eat_comma(src: &mut TtIter<'_>) -> bool {
|
|
if let Some(tt::TokenTree::Leaf(tt::Leaf::Punct(tt::Punct { char: ',', .. }))) = src.peek_n(0) {
|
|
let _ = src.next();
|
|
return true;
|
|
}
|
|
false
|
|
}
|