// rust-analyzer/crates/parser/src/lib.rs
//! The Rust parser.
//!
//! NOTE: The crate is undergoing refactors; don't believe everything the docs
//! say :-)
//!
//! The parser doesn't know about the concrete representation of tokens and
//! syntax trees. Abstract [`TokenSource`] and [`TreeSink`] traits are used
//! instead. As a consequence, this crate does not contain a lexer.
//!
//! The [`Parser`] struct from the [`parser`] module is a cursor into the
//! sequence of tokens. Parsing routines use [`Parser`] to inspect the current
//! state and advance the parsing.
//!
//! The actual parsing happens in the [`grammar`] module.
//!
//! Tests for this crate live in the `syntax` crate.
//!
//! [`Parser`]: crate::parser::Parser
#![allow(rustdoc::private_intra_doc_links)]
2021-09-06 15:42:07 +00:00
2021-12-18 12:31:50 +00:00
mod lexed_str;
2019-02-21 10:27:45 +00:00
mod token_set;
mod syntax_kind;
mod event;
mod parser;
mod grammar;
2021-12-25 18:59:02 +00:00
mod input;
mod output;
mod shortcuts;
2019-02-21 10:27:45 +00:00
2021-12-12 18:32:58 +00:00
#[cfg(test)]
mod tests;
2019-02-21 10:27:45 +00:00
pub(crate) use token_set::TokenSet;
pub use crate::{
2021-12-25 18:59:02 +00:00
input::Input,
lexed_str::LexedStr,
2021-12-25 18:59:02 +00:00
output::{Output, Step},
shortcuts::StrStep,
syntax_kind::SyntaxKind,
};
2019-02-21 10:27:45 +00:00
2021-12-27 14:54:51 +00:00
/// Parse a prefix of the input as a given syntactic construct.
///
/// This is used by the macro-by-example parser to implement things like
/// `$i:item`, and the naming of variants follows the naming of macro fragments.
///
/// Note that this is generally non-optional -- the result is intentionally not
/// `Option<Output>`. The way MBE works, by the time we *try* to parse `$e:expr`
/// we have already committed to an expression. In other words, this API by
/// design can't be used to implement "rollback and try another alternative"
/// logic.
#[derive(Debug)]
pub enum PrefixEntryPoint {
    /// A visibility, as matched by the `vis` fragment.
    Vis,
    /// A block, as matched by the `block` fragment.
    Block,
    /// A statement, as matched by the `stmt` fragment.
    Stmt,
    /// A pattern, as matched by the `pat` fragment.
    Pat,
    /// A type, as matched by the `ty` fragment.
    Ty,
    /// An expression, as matched by the `expr` fragment.
    Expr,
    /// A path, as matched by the `path` fragment.
    Path,
    /// An item, as matched by the `item` fragment.
    Item,
    /// An attribute meta item, as matched by the `meta` fragment.
    MetaItem,
}
impl PrefixEntryPoint {
pub fn parse(&self, input: &Input) -> Output {
2021-12-27 12:17:48 +00:00
let entry_point: fn(&'_ mut parser::Parser) = match self {
PrefixEntryPoint::Vis => grammar::entry::prefix::vis,
PrefixEntryPoint::Block => grammar::entry::prefix::block,
2021-12-27 12:54:00 +00:00
PrefixEntryPoint::Stmt => grammar::entry::prefix::stmt,
2021-12-27 13:06:02 +00:00
PrefixEntryPoint::Pat => grammar::entry::prefix::pat,
2021-12-27 13:08:35 +00:00
PrefixEntryPoint::Ty => grammar::entry::prefix::ty,
2021-12-27 13:17:29 +00:00
PrefixEntryPoint::Expr => grammar::entry::prefix::expr,
2021-12-27 13:23:07 +00:00
PrefixEntryPoint::Path => grammar::entry::prefix::path,
2021-12-27 13:28:54 +00:00
PrefixEntryPoint::Item => grammar::entry::prefix::item,
PrefixEntryPoint::MetaItem => grammar::entry::prefix::meta_item,
2021-12-27 12:17:48 +00:00
};
let mut p = parser::Parser::new(input);
entry_point(&mut p);
let events = p.finish();
event::process(events)
}
}
2021-12-27 14:54:51 +00:00
/// Parse the whole of the input as a given syntactic construct.
///
/// This covers two main use-cases:
///
///   * Parsing a Rust file.
///   * Parsing a result of macro expansion.
///
/// That is, for something like
///
/// ```
/// quick_check! {
///    fn prop() {}
/// }
/// ```
///
/// the input to the macro will be parsed with [`PrefixEntryPoint::Item`], and
/// the result will be [`TopEntryPoint::MacroItems`].
///
/// This *should* (but currently doesn't) guarantee that all input is consumed.
#[derive(Debug)]
pub enum TopEntryPoint {
    /// A Rust source file.
    SourceFile,
    /// Statements, e.g. the result of a macro expansion.
    MacroStmts,
    /// Items, e.g. the result of a macro expansion.
    MacroItems,
    /// A pattern.
    Pattern,
    /// A type.
    Type,
    /// An expression.
    Expr,
    /// An attribute meta item.
    MetaItem,
}
impl TopEntryPoint {
pub fn parse(&self, input: &Input) -> Output {
let entry_point: fn(&'_ mut parser::Parser) = match self {
TopEntryPoint::SourceFile => grammar::entry::top::source_file,
TopEntryPoint::MacroStmts => grammar::entry::top::macro_stmts,
TopEntryPoint::MacroItems => grammar::entry::top::macro_items,
2022-01-02 14:32:15 +00:00
TopEntryPoint::Pattern => grammar::entry::top::pattern,
2021-12-27 14:54:51 +00:00
// FIXME
TopEntryPoint::Type => grammar::entry::prefix::ty,
TopEntryPoint::Expr => grammar::entry::prefix::expr,
TopEntryPoint::MetaItem => grammar::entry::prefix::meta_item,
};
let mut p = parser::Parser::new(input);
entry_point(&mut p);
let events = p.finish();
event::process(events)
}
}
2019-02-21 12:24:42 +00:00
/// A parsing function for a specific braced-block.
2019-02-21 10:27:45 +00:00
pub struct Reparser(fn(&mut parser::Parser));
impl Reparser {
2019-02-21 12:24:42 +00:00
/// If the node is a braced block, return the corresponding `Reparser`.
2019-02-21 10:27:45 +00:00
pub fn for_node(
node: SyntaxKind,
first_child: Option<SyntaxKind>,
parent: Option<SyntaxKind>,
) -> Option<Reparser> {
grammar::reparser(node, first_child, parent).map(Reparser)
}
2019-02-21 12:24:42 +00:00
/// Re-parse given tokens using this `Reparser`.
///
/// Tokens must start with `{`, end with `}` and form a valid brace
/// sequence.
2021-12-25 18:59:02 +00:00
pub fn parse(self, tokens: &Input) -> Output {
2019-02-21 10:37:32 +00:00
let Reparser(r) = self;
2021-11-14 19:13:44 +00:00
let mut p = parser::Parser::new(tokens);
2019-02-21 10:37:32 +00:00
r(&mut p);
let events = p.finish();
event::process(events)
2019-02-21 10:37:32 +00:00
}
2019-02-21 10:27:45 +00:00
}