2021-05-22 14:20:22 +00:00
|
|
|
//! A "Parser" structure for token trees. We use this when parsing a declarative
//! macro definition into a list of patterns and templates.
|
2019-09-30 08:58:53 +00:00
|
|
|
|
2022-12-24 08:57:50 +00:00
|
|
|
use smallvec::{smallvec, SmallVec};
|
2021-02-28 05:06:17 +00:00
|
|
|
use syntax::SyntaxKind;
|
|
|
|
|
2023-01-31 10:49:49 +00:00
|
|
|
use crate::{to_parser_input::to_parser_input, tt, ExpandError, ExpandResult};
|
2022-01-02 01:39:14 +00:00
|
|
|
|
2019-09-16 23:54:22 +00:00
|
|
|
#[derive(Debug, Clone)]
|
|
|
|
pub(crate) struct TtIter<'a> {
|
|
|
|
pub(crate) inner: std::slice::Iter<'a, tt::TokenTree>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a> TtIter<'a> {
|
|
|
|
pub(crate) fn new(subtree: &'a tt::Subtree) -> TtIter<'a> {
|
|
|
|
TtIter { inner: subtree.token_trees.iter() }
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn expect_char(&mut self, char: char) -> Result<(), ()> {
|
|
|
|
match self.next() {
|
2022-01-02 01:39:14 +00:00
|
|
|
Some(&tt::TokenTree::Leaf(tt::Leaf::Punct(tt::Punct { char: c, .. }))) if c == char => {
|
2019-09-16 23:54:22 +00:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
_ => Err(()),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-04-03 01:08:31 +00:00
|
|
|
pub(crate) fn expect_any_char(&mut self, chars: &[char]) -> Result<(), ()> {
|
|
|
|
match self.next() {
|
|
|
|
Some(tt::TokenTree::Leaf(tt::Leaf::Punct(tt::Punct { char: c, .. })))
|
|
|
|
if chars.contains(c) =>
|
|
|
|
{
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
_ => Err(()),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-09-16 23:54:22 +00:00
|
|
|
/// Consumes the next token tree and returns it if it is a subtree.
///
/// Returns `Err(())` when the iterator is exhausted or the token tree is a leaf.
pub(crate) fn expect_subtree(&mut self) -> Result<&'a tt::Subtree, ()> {
    let Some(tt::TokenTree::Subtree(subtree)) = self.next() else {
        return Err(());
    };
    Ok(subtree)
}
|
|
|
|
|
|
|
|
/// Consumes the next token tree and returns it if it is a leaf.
///
/// Returns `Err(())` when the iterator is exhausted or the token tree is a
/// subtree.
pub(crate) fn expect_leaf(&mut self) -> Result<&'a tt::Leaf, ()> {
    let Some(tt::TokenTree::Leaf(leaf)) = self.next() else {
        return Err(());
    };
    Ok(leaf)
}
|
|
|
|
|
|
|
|
/// Consumes the next leaf and returns it if it is an identifier other than `_`.
///
/// Returns `Err(())` when there is no leaf, the leaf is not an identifier, or
/// the identifier text is exactly `_`.
pub(crate) fn expect_ident(&mut self) -> Result<&'a tt::Ident, ()> {
    let tt::Leaf::Ident(ident) = self.expect_leaf()? else {
        return Err(());
    };
    // A lone underscore is rejected here; `expect_ident_or_underscore` accepts it.
    if ident.text != "_" {
        Ok(ident)
    } else {
        Err(())
    }
}
|
|
|
|
|
|
|
|
/// Consumes the next leaf and returns it if it is an identifier, including `_`.
///
/// Returns `Err(())` when there is no leaf or the leaf is not an identifier.
pub(crate) fn expect_ident_or_underscore(&mut self) -> Result<&'a tt::Ident, ()> {
    let tt::Leaf::Ident(ident) = self.expect_leaf()? else {
        return Err(());
    };
    Ok(ident)
}
|
|
|
|
|
2020-04-18 19:24:17 +00:00
|
|
|
/// Consumes the next leaf and returns it if it is a literal.
///
/// Besides `Leaf::Literal`, the identifiers `true` and `false` are accepted,
/// which is why the whole leaf is returned rather than a literal.
/// Returns `Err(())` for any other leaf or when no leaf is available.
pub(crate) fn expect_literal(&mut self) -> Result<&'a tt::Leaf, ()> {
    let leaf = self.expect_leaf()?;
    let is_literal_like = match leaf {
        tt::Leaf::Literal(_) => true,
        tt::Leaf::Ident(ident) => ident.text == "true" || ident.text == "false",
        _ => false,
    };
    if is_literal_like {
        Ok(leaf)
    } else {
        Err(())
    }
}
|
|
|
|
|
2022-07-11 16:31:42 +00:00
|
|
|
pub(crate) fn expect_u32_literal(&mut self) -> Result<u32, ()> {
|
|
|
|
match self.expect_literal()? {
|
|
|
|
tt::Leaf::Literal(lit) => lit.text.parse().map_err(drop),
|
|
|
|
_ => Err(()),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-12-24 08:57:50 +00:00
|
|
|
/// Consumes the next leaf and returns it if it is a punct.
///
/// Returns `Err(())` when there is no leaf or the leaf is not a punct.
pub(crate) fn expect_single_punct(&mut self) -> Result<&'a tt::Punct, ()> {
    let tt::Leaf::Punct(punct) = self.expect_leaf()? else {
        return Err(());
    };
    Ok(punct)
}
|
2020-03-04 14:29:55 +00:00
|
|
|
|
2022-12-27 09:18:18 +00:00
|
|
|
/// Returns consecutive `Punct`s that can be glued together.
|
|
|
|
///
|
|
|
|
/// This method currently may return a single quotation, which is part of lifetime ident and
|
|
|
|
/// conceptually not a punct in the context of mbe. Callers should handle this.
|
2022-12-24 08:57:50 +00:00
|
|
|
pub(crate) fn expect_glued_punct(&mut self) -> Result<SmallVec<[tt::Punct; 3]>, ()> {
|
|
|
|
let tt::TokenTree::Leaf(tt::Leaf::Punct(first)) = self.next().ok_or(())?.clone() else {
|
|
|
|
return Err(());
|
|
|
|
};
|
|
|
|
|
|
|
|
if first.spacing == tt::Spacing::Alone {
|
|
|
|
return Ok(smallvec![first]);
|
|
|
|
}
|
|
|
|
|
|
|
|
let (second, third) = match (self.peek_n(0), self.peek_n(1)) {
|
|
|
|
(
|
|
|
|
Some(tt::TokenTree::Leaf(tt::Leaf::Punct(p2))),
|
|
|
|
Some(tt::TokenTree::Leaf(tt::Leaf::Punct(p3))),
|
|
|
|
) if p2.spacing == tt::Spacing::Joint => (p2, Some(p3)),
|
|
|
|
(Some(tt::TokenTree::Leaf(tt::Leaf::Punct(p2))), _) => (p2, None),
|
|
|
|
_ => return Ok(smallvec![first]),
|
|
|
|
};
|
|
|
|
|
|
|
|
match (first.char, second.char, third.map(|it| it.char)) {
|
|
|
|
('.', '.', Some('.' | '=')) | ('<', '<', Some('=')) | ('>', '>', Some('=')) => {
|
|
|
|
let _ = self.next().unwrap();
|
|
|
|
let _ = self.next().unwrap();
|
2023-01-10 18:20:12 +00:00
|
|
|
Ok(smallvec![first, *second, *third.unwrap()])
|
2022-12-24 08:57:50 +00:00
|
|
|
}
|
|
|
|
('-' | '!' | '*' | '/' | '&' | '%' | '^' | '+' | '<' | '=' | '>' | '|', '=', _)
|
|
|
|
| ('-' | '=' | '>', '>', _)
|
2022-12-27 09:33:21 +00:00
|
|
|
| ('<', '-', _)
|
2022-12-24 08:57:50 +00:00
|
|
|
| (':', ':', _)
|
|
|
|
| ('.', '.', _)
|
|
|
|
| ('&', '&', _)
|
|
|
|
| ('<', '<', _)
|
|
|
|
| ('|', '|', _) => {
|
|
|
|
let _ = self.next().unwrap();
|
2023-01-10 18:20:12 +00:00
|
|
|
Ok(smallvec![first, *second])
|
2022-12-24 08:57:50 +00:00
|
|
|
}
|
|
|
|
_ => Ok(smallvec![first]),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-28 05:06:17 +00:00
|
|
|
pub(crate) fn expect_fragment(
|
2021-12-27 12:22:44 +00:00
|
|
|
&mut self,
|
|
|
|
entry_point: parser::PrefixEntryPoint,
|
|
|
|
) -> ExpandResult<Option<tt::TokenTree>> {
|
2023-01-31 10:49:49 +00:00
|
|
|
let buffer = tt::buffer::TokenBuffer::from_tokens(self.inner.as_slice());
|
2021-12-27 12:22:44 +00:00
|
|
|
let parser_input = to_parser_input(&buffer);
|
|
|
|
let tree_traversal = entry_point.parse(&parser_input);
|
|
|
|
|
|
|
|
let mut cursor = buffer.begin();
|
|
|
|
let mut error = false;
|
|
|
|
for step in tree_traversal.iter() {
|
|
|
|
match step {
|
|
|
|
parser::Step::Token { kind, mut n_input_tokens } => {
|
|
|
|
if kind == SyntaxKind::LIFETIME_IDENT {
|
|
|
|
n_input_tokens = 2;
|
|
|
|
}
|
|
|
|
for _ in 0..n_input_tokens {
|
|
|
|
cursor = cursor.bump_subtree();
|
|
|
|
}
|
|
|
|
}
|
2023-02-03 20:39:24 +00:00
|
|
|
parser::Step::FloatSplit { .. } => {
|
2023-02-07 16:12:24 +00:00
|
|
|
// FIXME: We need to split the tree properly here, but mutating the token trees
|
|
|
|
// in the buffer is somewhat tricky to pull off.
|
2023-02-03 20:39:24 +00:00
|
|
|
cursor = cursor.bump_subtree();
|
|
|
|
}
|
2021-12-27 12:22:44 +00:00
|
|
|
parser::Step::Enter { .. } | parser::Step::Exit => (),
|
|
|
|
parser::Step::Error { .. } => error = true,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-01-03 13:22:41 +00:00
|
|
|
let err = if error || !cursor.is_root() {
|
2022-02-21 18:14:06 +00:00
|
|
|
Some(ExpandError::binding_error(format!("expected {entry_point:?}")))
|
2021-12-27 12:22:44 +00:00
|
|
|
} else {
|
|
|
|
None
|
|
|
|
};
|
|
|
|
|
|
|
|
let mut curr = buffer.begin();
|
|
|
|
let mut res = vec![];
|
|
|
|
|
internal: replace TreeSink with a data structure
The general theme of this is to make parser a better independent
library.
The specific thing we do here is replacing callback based TreeSink with
a data structure. That is, rather than calling user-provided tree
construction methods, the parser now spits out a very bare-bones tree,
effectively a log of a DFS traversal.
This makes the parser usable without any *specifc* tree sink, and allows
us to, eg, move tests into this crate.
Now, it's also true that this is a distinction without a difference, as
the old and the new interface are equivalent in expressiveness. Still,
this new thing seems somewhat simpler. But yeah, I admit I don't have a
suuper strong motivation here, just a hunch that this is better.
2021-12-19 14:36:23 +00:00
|
|
|
if cursor.is_root() {
|
2023-02-07 16:12:24 +00:00
|
|
|
while curr != cursor {
|
|
|
|
let Some(token) = curr.token_tree() else { break };
|
|
|
|
res.push(token.cloned());
|
|
|
|
curr = curr.bump();
|
2021-02-28 05:06:17 +00:00
|
|
|
}
|
|
|
|
}
|
2023-02-07 16:12:24 +00:00
|
|
|
|
2021-02-28 05:06:17 +00:00
|
|
|
self.inner = self.inner.as_slice()[res.len()..].iter();
|
|
|
|
let res = match res.len() {
|
2023-02-03 20:39:24 +00:00
|
|
|
0 | 1 => res.pop(),
|
2021-02-28 05:06:17 +00:00
|
|
|
_ => Some(tt::TokenTree::Subtree(tt::Subtree {
|
2023-01-31 10:49:49 +00:00
|
|
|
delimiter: tt::Delimiter::unspecified(),
|
2023-02-03 20:39:24 +00:00
|
|
|
token_trees: res,
|
2021-02-28 05:06:17 +00:00
|
|
|
})),
|
|
|
|
};
|
|
|
|
ExpandResult { value: res, err }
|
|
|
|
}
|
|
|
|
|
2022-12-27 09:18:18 +00:00
|
|
|
/// Returns the token tree `n` positions ahead without consuming anything.
///
/// `peek_n(0)` is the token tree the next call to `next` would return.
/// Returns `None` when fewer than `n + 1` token trees remain.
pub(crate) fn peek_n(&self, n: usize) -> Option<&'a tt::TokenTree> {
    let remaining = self.inner.as_slice();
    remaining.get(n)
}
|
2019-09-16 23:54:22 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a> Iterator for TtIter<'a> {
|
|
|
|
type Item = &'a tt::TokenTree;
|
|
|
|
fn next(&mut self) -> Option<Self::Item> {
|
|
|
|
self.inner.next()
|
|
|
|
}
|
|
|
|
|
|
|
|
fn size_hint(&self) -> (usize, Option<usize>) {
|
|
|
|
self.inner.size_hint()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// `size_hint` forwards to the wrapped slice iterator, whose length is exact.
impl ExactSizeIterator for TtIter<'_> {}
|