2019-09-16 23:54:22 +00:00
|
|
|
//! Parser recognizes special macro syntax, `$var` and `$(repeat)*`, in token
|
|
|
|
//! trees.
|
|
|
|
|
|
|
|
use smallvec::SmallVec;
|
2020-08-12 16:26:51 +00:00
|
|
|
use syntax::SmolStr;
|
2019-09-16 23:54:22 +00:00
|
|
|
|
2021-02-01 20:42:37 +00:00
|
|
|
use crate::{tt_iter::TtIter, ParseError};
|
|
|
|
|
2021-10-02 17:21:23 +00:00
|
|
|
/// Consider
|
|
|
|
///
|
|
|
|
/// ```
|
|
|
|
/// macro_rules! an_macro {
|
|
|
|
/// ($x:expr + $y:expr) => ($y * $x)
|
|
|
|
/// }
|
|
|
|
/// ```
|
|
|
|
///
|
|
|
|
/// Stuff to the left of `=>` is a [`MetaTemplate`] pattern (which is matched
|
|
|
|
/// with input).
|
|
|
|
///
|
|
|
|
/// Stuff to the right is a [`MetaTemplate`] template which is used to produce
|
|
|
|
/// output.
|
|
|
|
#[derive(Clone, Debug, PartialEq, Eq)]
|
|
|
|
pub(crate) struct MetaTemplate(pub(crate) Vec<Op>);
|
|
|
|
|
|
|
|
impl MetaTemplate {
|
|
|
|
pub(crate) fn parse_pattern(pattern: &tt::Subtree) -> Result<MetaTemplate, ParseError> {
|
|
|
|
let ops =
|
|
|
|
parse_inner(pattern, Mode::Pattern).into_iter().collect::<Result<_, ParseError>>()?;
|
|
|
|
Ok(MetaTemplate(ops))
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn parse_template(template: &tt::Subtree) -> Result<MetaTemplate, ParseError> {
|
|
|
|
let ops =
|
|
|
|
parse_inner(template, Mode::Template).into_iter().collect::<Result<_, ParseError>>()?;
|
|
|
|
Ok(MetaTemplate(ops))
|
|
|
|
}
|
2021-02-01 20:42:37 +00:00
|
|
|
|
2021-10-02 17:21:23 +00:00
|
|
|
pub(crate) fn iter(&self) -> impl Iterator<Item = &Op> {
|
|
|
|
self.0.iter()
|
|
|
|
}
|
2021-02-01 20:42:37 +00:00
|
|
|
}
|
2019-09-16 23:54:22 +00:00
|
|
|
|
2020-12-29 18:35:21 +00:00
|
|
|
#[derive(Clone, Debug, PartialEq, Eq)]
|
|
|
|
pub(crate) enum Op {
|
2021-01-04 02:53:31 +00:00
|
|
|
Var { name: SmolStr, kind: Option<SmolStr>, id: tt::TokenId },
|
2021-01-30 08:12:30 +00:00
|
|
|
Repeat { tokens: MetaTemplate, kind: RepeatKind, separator: Option<Separator> },
|
2020-12-29 18:35:21 +00:00
|
|
|
Leaf(tt::Leaf),
|
2021-10-02 17:11:08 +00:00
|
|
|
Subtree { tokens: MetaTemplate, delimiter: Option<tt::Delimiter> },
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
|
2020-12-29 18:35:21 +00:00
|
|
|
/// The repetition operator that terminates a `$( ... )` group.
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
pub(crate) enum RepeatKind {
    /// `*`
    ZeroOrMore,
    /// `+`
    OneOrMore,
    /// `?`
    ZeroOrOne,
}
|
|
|
|
|
|
|
|
#[derive(Clone, Debug, Eq)]
|
|
|
|
pub(crate) enum Separator {
|
|
|
|
Literal(tt::Literal),
|
|
|
|
Ident(tt::Ident),
|
|
|
|
Puncts(SmallVec<[tt::Punct; 3]>),
|
|
|
|
}
|
|
|
|
|
|
|
|
// Note that when we compare a Separator, we just care about its textual value.
|
|
|
|
impl PartialEq for Separator {
|
|
|
|
fn eq(&self, other: &Separator) -> bool {
|
|
|
|
use Separator::*;
|
|
|
|
|
|
|
|
match (self, other) {
|
|
|
|
(Ident(ref a), Ident(ref b)) => a.text == b.text,
|
|
|
|
(Literal(ref a), Literal(ref b)) => a.text == b.text,
|
|
|
|
(Puncts(ref a), Puncts(ref b)) if a.len() == b.len() => {
|
|
|
|
let a_iter = a.iter().map(|a| a.char);
|
|
|
|
let b_iter = b.iter().map(|b| b.char);
|
|
|
|
a_iter.eq(b_iter)
|
|
|
|
}
|
|
|
|
_ => false,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-01 20:42:37 +00:00
|
|
|
impl Separator {
|
|
|
|
pub(crate) fn tt_count(&self) -> usize {
|
|
|
|
match self {
|
|
|
|
Separator::Literal(_) => 1,
|
|
|
|
Separator::Ident(_) => 1,
|
|
|
|
Separator::Puncts(it) => it.len(),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-09-16 23:54:22 +00:00
|
|
|
/// Which side of a macro rule is being parsed.
#[derive(Clone, Copy)]
enum Mode {
    /// The matcher side; variables must carry a `:fragment` specifier.
    Pattern,
    /// The transcriber side; variables carry no fragment specifier.
    Template,
}
|
|
|
|
|
2021-01-29 16:21:43 +00:00
|
|
|
fn parse_inner(tt: &tt::Subtree, mode: Mode) -> Vec<Result<Op, ParseError>> {
|
2021-06-13 03:54:16 +00:00
|
|
|
let mut src = TtIter::new(tt);
|
2019-09-16 23:54:22 +00:00
|
|
|
std::iter::from_fn(move || {
|
|
|
|
let first = src.next()?;
|
|
|
|
Some(next_op(first, &mut src, mode))
|
|
|
|
})
|
2020-12-29 18:35:21 +00:00
|
|
|
.collect()
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Builds a `ParseError::UnexpectedToken` whose message is the given
/// expression converted with `to_string()`.
macro_rules! err {
    ($($msg:tt)*) => {
        ParseError::UnexpectedToken(($($msg)*).to_string())
    };
}
|
|
|
|
|
|
|
|
/// Returns early from the enclosing function with `Err(err!(...))`.
macro_rules! bail {
    ($($msg:tt)*) => {
        return Err(err!($($msg)*))
    };
}
|
|
|
|
|
2021-01-29 16:21:43 +00:00
|
|
|
fn next_op<'a>(first: &tt::TokenTree, src: &mut TtIter<'a>, mode: Mode) -> Result<Op, ParseError> {
|
2019-09-16 23:54:22 +00:00
|
|
|
let res = match first {
|
2020-12-29 18:35:21 +00:00
|
|
|
tt::TokenTree::Leaf(leaf @ tt::Leaf::Punct(tt::Punct { char: '$', .. })) => {
|
2020-03-03 17:03:44 +00:00
|
|
|
// Note that the '$' itself is a valid token inside macro_rules.
|
|
|
|
let second = match src.next() {
|
2020-12-29 18:35:21 +00:00
|
|
|
None => return Ok(Op::Leaf(leaf.clone())),
|
2020-03-03 17:03:44 +00:00
|
|
|
Some(it) => it,
|
|
|
|
};
|
2019-09-16 23:54:22 +00:00
|
|
|
match second {
|
|
|
|
tt::TokenTree::Subtree(subtree) => {
|
|
|
|
let (separator, kind) = parse_repeat(src)?;
|
2021-06-13 03:54:16 +00:00
|
|
|
let tokens = parse_inner(subtree, mode)
|
2021-01-29 16:21:43 +00:00
|
|
|
.into_iter()
|
|
|
|
.collect::<Result<Vec<Op>, ParseError>>()?;
|
2021-01-30 08:12:30 +00:00
|
|
|
Op::Repeat { tokens: MetaTemplate(tokens), separator, kind }
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
tt::TokenTree::Leaf(leaf) => match leaf {
|
2021-03-20 18:18:57 +00:00
|
|
|
tt::Leaf::Punct(_) => {
|
|
|
|
return Err(ParseError::Expected("ident".to_string()));
|
2020-12-18 15:47:48 +00:00
|
|
|
}
|
2021-01-08 06:00:16 +00:00
|
|
|
tt::Leaf::Ident(ident) if ident.text == "crate" => {
|
|
|
|
// We simply produce identifier `$crate` here. And it will be resolved when lowering ast to Path.
|
|
|
|
Op::Leaf(tt::Leaf::from(tt::Ident { text: "$crate".into(), id: ident.id }))
|
|
|
|
}
|
2019-09-16 23:54:22 +00:00
|
|
|
tt::Leaf::Ident(ident) => {
|
2020-12-29 18:35:21 +00:00
|
|
|
let name = ident.text.clone();
|
2019-09-16 23:54:22 +00:00
|
|
|
let kind = eat_fragment_kind(src, mode)?;
|
2021-01-04 02:53:31 +00:00
|
|
|
let id = ident.id;
|
|
|
|
Op::Var { name, kind, id }
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
tt::Leaf::Literal(lit) => {
|
2021-06-13 03:54:16 +00:00
|
|
|
if is_boolean_literal(lit) {
|
2020-12-29 18:35:21 +00:00
|
|
|
let name = lit.text.clone();
|
2019-09-16 23:54:22 +00:00
|
|
|
let kind = eat_fragment_kind(src, mode)?;
|
2021-01-04 02:53:31 +00:00
|
|
|
let id = lit.id;
|
|
|
|
Op::Var { name, kind, id }
|
2019-09-16 23:54:22 +00:00
|
|
|
} else {
|
|
|
|
bail!("bad var 2");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
},
|
|
|
|
}
|
|
|
|
}
|
2020-12-29 18:35:21 +00:00
|
|
|
tt::TokenTree::Leaf(tt) => Op::Leaf(tt.clone()),
|
|
|
|
tt::TokenTree::Subtree(subtree) => {
|
2021-01-29 16:21:43 +00:00
|
|
|
let tokens =
|
2021-06-13 03:54:16 +00:00
|
|
|
parse_inner(subtree, mode).into_iter().collect::<Result<Vec<Op>, ParseError>>()?;
|
2021-01-30 08:12:30 +00:00
|
|
|
Op::Subtree { tokens: MetaTemplate(tokens), delimiter: subtree.delimiter }
|
2020-12-29 18:35:21 +00:00
|
|
|
}
|
2019-09-16 23:54:22 +00:00
|
|
|
};
|
|
|
|
Ok(res)
|
|
|
|
}
|
|
|
|
|
2021-06-03 10:46:56 +00:00
|
|
|
fn eat_fragment_kind(src: &mut TtIter<'_>, mode: Mode) -> Result<Option<SmolStr>, ParseError> {
|
2019-09-16 23:54:22 +00:00
|
|
|
if let Mode::Pattern = mode {
|
|
|
|
src.expect_char(':').map_err(|()| err!("bad fragment specifier 1"))?;
|
|
|
|
let ident = src.expect_ident().map_err(|()| err!("bad fragment specifier 1"))?;
|
2020-12-29 18:35:21 +00:00
|
|
|
return Ok(Some(ident.text.clone()));
|
2019-09-16 23:54:22 +00:00
|
|
|
};
|
|
|
|
Ok(None)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn is_boolean_literal(lit: &tt::Literal) -> bool {
|
2020-06-28 01:02:03 +00:00
|
|
|
matches!(lit.text.as_str(), "true" | "false")
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
|
2021-01-29 16:21:43 +00:00
|
|
|
fn parse_repeat(src: &mut TtIter) -> Result<(Option<Separator>, RepeatKind), ParseError> {
|
2019-09-16 23:54:22 +00:00
|
|
|
let mut separator = Separator::Puncts(SmallVec::new());
|
|
|
|
for tt in src {
|
|
|
|
let tt = match tt {
|
|
|
|
tt::TokenTree::Leaf(leaf) => leaf,
|
2021-01-29 16:21:43 +00:00
|
|
|
tt::TokenTree::Subtree(_) => return Err(ParseError::InvalidRepeat),
|
2019-09-16 23:54:22 +00:00
|
|
|
};
|
|
|
|
let has_sep = match &separator {
|
2020-02-18 12:53:02 +00:00
|
|
|
Separator::Puncts(puncts) => !puncts.is_empty(),
|
2019-09-16 23:54:22 +00:00
|
|
|
_ => true,
|
|
|
|
};
|
|
|
|
match tt {
|
|
|
|
tt::Leaf::Ident(_) | tt::Leaf::Literal(_) if has_sep => {
|
2021-01-29 16:21:43 +00:00
|
|
|
return Err(ParseError::InvalidRepeat)
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
tt::Leaf::Ident(ident) => separator = Separator::Ident(ident.clone()),
|
|
|
|
tt::Leaf::Literal(lit) => separator = Separator::Literal(lit.clone()),
|
|
|
|
tt::Leaf::Punct(punct) => {
|
|
|
|
let repeat_kind = match punct.char {
|
|
|
|
'*' => RepeatKind::ZeroOrMore,
|
|
|
|
'+' => RepeatKind::OneOrMore,
|
|
|
|
'?' => RepeatKind::ZeroOrOne,
|
|
|
|
_ => {
|
|
|
|
match &mut separator {
|
|
|
|
Separator::Puncts(puncts) => {
|
|
|
|
if puncts.len() == 3 {
|
2021-01-29 16:21:43 +00:00
|
|
|
return Err(ParseError::InvalidRepeat);
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
2021-03-17 00:56:31 +00:00
|
|
|
puncts.push(*punct)
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
2021-01-29 16:21:43 +00:00
|
|
|
_ => return Err(ParseError::InvalidRepeat),
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
let separator = if has_sep { Some(separator) } else { None };
|
|
|
|
return Ok((separator, repeat_kind));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2021-01-29 16:21:43 +00:00
|
|
|
Err(ParseError::InvalidRepeat)
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|