rust-analyzer/crates/syntax/src/parsing.rs

83 lines
2.6 KiB
Rust
Raw Normal View History

2020-08-12 15:06:49 +00:00
//! Lexing, bridging to parser (which does the actual parsing) and
2019-02-21 12:24:42 +00:00
//! incremental reparsing.
pub(crate) mod lexer;
2019-02-23 13:07:29 +00:00
mod text_tree_sink;
mod reparsing;
2021-05-13 10:44:47 +00:00
use parser::SyntaxKind;
use text_tree_sink::TextTreeSink;
2021-05-13 10:44:47 +00:00
use crate::{syntax_node::GreenNode, AstNode, SyntaxError, SyntaxNode};
2021-05-13 10:44:47 +00:00
pub(crate) use crate::parsing::{lexer::*, reparsing::incremental_reparse};
pub(crate) fn parse_text(text: &str) -> (GreenNode, Vec<SyntaxError>) {
2021-12-12 14:58:45 +00:00
let (lexer_tokens, lexer_errors) = tokenize(text);
let parser_tokens = to_parser_tokens(text, &lexer_tokens);
2021-12-12 14:58:45 +00:00
let mut tree_sink = TextTreeSink::new(text, &lexer_tokens);
2021-12-12 14:58:45 +00:00
parser::parse_source_file(&parser_tokens, &mut tree_sink);
let (tree, mut parser_errors) = tree_sink.finish();
parser_errors.extend(lexer_errors);
(tree, parser_errors)
}
/// Returns `text` parsed as a `T` provided there are no parse errors.
pub(crate) fn parse_text_as<T: AstNode>(
text: &str,
entry_point: parser::ParserEntryPoint,
) -> Result<T, ()> {
2021-12-12 14:58:45 +00:00
let (lexer_tokens, lexer_errors) = tokenize(text);
if !lexer_errors.is_empty() {
return Err(());
}
2021-12-12 14:58:45 +00:00
let parser_tokens = to_parser_tokens(text, &lexer_tokens);
let mut tree_sink = TextTreeSink::new(text, &lexer_tokens);
// TextTreeSink assumes that there's at least some root node to which it can attach errors and
// tokens. We arbitrarily give it a SourceFile.
2020-08-12 15:06:49 +00:00
use parser::TreeSink;
tree_sink.start_node(SyntaxKind::SOURCE_FILE);
2021-12-12 14:58:45 +00:00
parser::parse(&parser_tokens, &mut tree_sink, entry_point);
tree_sink.finish_node();
2021-12-12 14:58:45 +00:00
let (tree, parser_errors, eof) = tree_sink.finish_eof();
if !parser_errors.is_empty() || !eof {
return Err(());
}
SyntaxNode::new_root(tree).first_child().and_then(T::cast).ok_or(())
}
2021-12-12 14:58:45 +00:00
pub(crate) fn to_parser_tokens(text: &str, lexer_tokens: &[lexer::Token]) -> ::parser::Tokens {
let mut off = 0;
let mut res = parser::Tokens::default();
2021-12-12 16:22:37 +00:00
let mut was_joint = false;
2021-12-12 14:58:45 +00:00
for t in lexer_tokens {
if t.kind.is_trivia() {
was_joint = false;
} else {
2021-12-12 16:22:37 +00:00
if t.kind == SyntaxKind::IDENT {
let token_text = &text[off..][..usize::from(t.len)];
let contextual_kw =
SyntaxKind::from_contextual_keyword(token_text).unwrap_or(SyntaxKind::IDENT);
res.push_ident(contextual_kw);
} else {
if was_joint {
res.was_joint();
}
res.push(t.kind);
}
2021-12-12 14:58:45 +00:00
was_joint = true;
}
off += usize::from(t.len);
}
res
}