rust-analyzer/crates/parser/src/grammar.rs

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

429 lines
12 KiB
Rust
Raw Normal View History

2018-02-11 14:58:22 +00:00
//! This is the actual "grammar" of the Rust language.
//!
//! Each function in this module and its children corresponds
//! to a production of the formal grammar. Submodules roughly
2018-02-11 14:58:22 +00:00
//! correspond to different *areas* of the grammar. By convention,
//! each submodule starts with `use super::*` import and exports
//! "public" productions via `pub(super)`.
//!
//! See docs for [`Parser`](super::parser::Parser) to learn about the API
//! available to the grammar, and see docs for [`Event`](super::event::Event)
//! to learn how this actually manages to produce parse trees.
2018-02-11 14:58:22 +00:00
//!
//! Code in this module also contains inline tests, which start with
//! `// test name-of-the-test` comment and look like this:
//!
//! ```
2018-08-09 14:44:40 +00:00
//! // test function_with_zero_parameters
2018-02-11 14:58:22 +00:00
//! // fn foo() {}
//! ```
//!
//! After adding a new inline-test, run `cargo test -p xtask` to
//! extract it as a standalone text-fixture into
2020-08-12 16:26:51 +00:00
//! `crates/syntax/test_data/parser/`, and run `cargo test` once to
//! create the "gold" value.
//!
//! Coding convention: rules like `where_clause` always produce either a
//! node or an error, rules like `opt_where_clause` may produce nothing.
//! Non-opt rules typically start with `assert!(p.at(FIRST_TOKEN))`, the
//! caller is responsible for branching on the first token.
2021-05-22 14:20:22 +00:00
2018-01-07 18:46:10 +00:00
mod attributes;
mod expressions;
2024-01-26 19:08:10 +00:00
mod generic_args;
mod generic_params;
2018-07-30 11:08:06 +00:00
mod items;
2018-07-31 20:38:19 +00:00
mod params;
2018-01-09 20:32:18 +00:00
mod paths;
2018-07-30 11:08:06 +00:00
mod patterns;
mod types;
2018-01-01 15:58:46 +00:00
use crate::{
parser::{CompletedMarker, Marker, Parser},
SyntaxKind::{self, *},
2021-09-06 15:42:07 +00:00
TokenSet, T,
};
2018-07-29 12:16:07 +00:00
2021-12-27 12:17:48 +00:00
pub(crate) mod entry {
use super::*;
pub(crate) mod prefix {
use super::*;
2022-07-20 13:02:08 +00:00
pub(crate) fn vis(p: &mut Parser<'_>) {
opt_visibility(p, false);
2021-12-27 12:17:48 +00:00
}
2022-07-20 13:02:08 +00:00
pub(crate) fn block(p: &mut Parser<'_>) {
expressions::block_expr(p);
}
2021-12-27 12:54:00 +00:00
2022-07-20 13:02:08 +00:00
pub(crate) fn stmt(p: &mut Parser<'_>) {
2021-12-29 16:18:34 +00:00
expressions::stmt(p, expressions::Semicolon::Forbidden);
2021-12-27 12:54:00 +00:00
}
2021-12-27 13:06:02 +00:00
2022-07-20 13:02:08 +00:00
pub(crate) fn pat(p: &mut Parser<'_>) {
2021-12-27 13:06:02 +00:00
patterns::pattern_single(p);
}
2021-12-27 13:08:35 +00:00
pub(crate) fn pat_top(p: &mut Parser<'_>) {
patterns::pattern_top(p);
}
2022-07-20 13:02:08 +00:00
pub(crate) fn ty(p: &mut Parser<'_>) {
2021-12-27 13:08:35 +00:00
types::type_(p);
}
2022-07-20 13:02:08 +00:00
pub(crate) fn expr(p: &mut Parser<'_>) {
expressions::expr(p);
2021-12-27 13:17:29 +00:00
}
2022-07-20 13:02:08 +00:00
pub(crate) fn path(p: &mut Parser<'_>) {
paths::type_path(p);
2021-12-27 13:23:07 +00:00
}
2022-07-20 13:02:08 +00:00
pub(crate) fn item(p: &mut Parser<'_>) {
2021-12-27 13:28:54 +00:00
items::item_or_macro(p, true);
}
// Parse a meta item , which excluded [], e.g : #[ MetaItem ]
2022-07-20 13:02:08 +00:00
pub(crate) fn meta_item(p: &mut Parser<'_>) {
2021-12-27 13:28:54 +00:00
attributes::meta(p);
}
2021-12-27 12:17:48 +00:00
}
2021-12-27 14:54:51 +00:00
pub(crate) mod top {
use super::*;
2022-07-20 13:02:08 +00:00
pub(crate) fn source_file(p: &mut Parser<'_>) {
2021-12-27 14:54:51 +00:00
let m = p.start();
p.eat(SHEBANG);
items::mod_contents(p, false);
m.complete(p, SOURCE_FILE);
}
2022-07-20 13:02:08 +00:00
pub(crate) fn macro_stmts(p: &mut Parser<'_>) {
2021-12-27 14:54:51 +00:00
let m = p.start();
2019-04-19 11:33:29 +00:00
2021-12-27 14:54:51 +00:00
while !p.at(EOF) {
2021-12-29 16:18:34 +00:00
expressions::stmt(p, expressions::Semicolon::Optional);
2019-04-25 15:12:57 +00:00
}
2019-09-02 14:37:48 +00:00
2021-12-27 14:54:51 +00:00
m.complete(p, MACRO_STMTS);
}
2022-07-20 13:02:08 +00:00
pub(crate) fn macro_items(p: &mut Parser<'_>) {
2021-12-27 14:54:51 +00:00
let m = p.start();
items::mod_contents(p, false);
m.complete(p, MACRO_ITEMS);
2019-04-19 11:33:29 +00:00
}
2022-01-02 14:32:15 +00:00
2022-07-20 13:02:08 +00:00
pub(crate) fn pattern(p: &mut Parser<'_>) {
2022-01-02 14:32:15 +00:00
let m = p.start();
2022-01-17 15:52:53 +00:00
patterns::pattern_top(p);
2022-01-02 14:32:15 +00:00
if p.at(EOF) {
m.abandon(p);
return;
}
while !p.at(EOF) {
p.bump_any();
}
m.complete(p, ERROR);
}
2022-01-02 14:45:18 +00:00
2022-07-20 13:02:08 +00:00
pub(crate) fn type_(p: &mut Parser<'_>) {
2022-01-02 14:45:18 +00:00
let m = p.start();
types::type_(p);
if p.at(EOF) {
m.abandon(p);
return;
}
while !p.at(EOF) {
p.bump_any();
}
m.complete(p, ERROR);
}
2022-01-02 14:52:05 +00:00
2022-07-20 13:02:08 +00:00
pub(crate) fn expr(p: &mut Parser<'_>) {
2022-01-02 14:52:05 +00:00
let m = p.start();
expressions::expr(p);
if p.at(EOF) {
m.abandon(p);
return;
}
while !p.at(EOF) {
p.bump_any();
}
m.complete(p, ERROR);
}
2022-01-02 15:41:32 +00:00
2022-07-20 13:02:08 +00:00
pub(crate) fn meta_item(p: &mut Parser<'_>) {
2022-01-02 15:41:32 +00:00
let m = p.start();
attributes::meta(p);
if p.at(EOF) {
m.abandon(p);
return;
}
while !p.at(EOF) {
p.bump_any();
}
m.complete(p, ERROR);
}
pub(crate) fn eager_macro_input(p: &mut Parser<'_>) {
let m = p.start();
let closing_paren_kind = match p.current() {
T!['{'] => T!['}'],
T!['('] => T![')'],
T!['['] => T![']'],
_ => {
p.error("expected `{`, `[`, `(`");
while !p.at(EOF) {
p.bump_any();
}
m.complete(p, ERROR);
return;
}
};
p.bump_any();
while !p.at(EOF) && !p.at(closing_paren_kind) {
if expressions::expr(p).is_none() {
break;
}
if !p.at(EOF) && !p.at(closing_paren_kind) {
p.expect(T![,]);
}
}
p.expect(closing_paren_kind);
if p.at(EOF) {
m.complete(p, MACRO_EAGER_INPUT);
return;
}
while !p.at(EOF) {
p.bump_any();
}
m.complete(p, ERROR);
}
2021-12-27 14:54:51 +00:00
}
}
2019-04-19 11:33:29 +00:00
2019-02-21 10:27:45 +00:00
pub(crate) fn reparser(
node: SyntaxKind,
first_child: Option<SyntaxKind>,
parent: Option<SyntaxKind>,
2022-07-20 13:02:08 +00:00
) -> Option<fn(&mut Parser<'_>)> {
let res = match node {
2020-05-02 12:34:39 +00:00
BLOCK_EXPR => expressions::block_expr,
2020-08-13 15:58:35 +00:00
RECORD_FIELD_LIST => items::record_field_list,
RECORD_EXPR_FIELD_LIST => items::record_expr_field_list,
VARIANT_LIST => items::variant_list,
2019-02-20 13:02:06 +00:00
MATCH_ARM_LIST => items::match_arm_list,
USE_TREE_LIST => items::use_tree_list,
EXTERN_ITEM_LIST => items::extern_item_list,
2019-05-15 12:35:47 +00:00
TOKEN_TREE if first_child? == T!['{'] => items::token_tree,
2020-07-30 09:48:19 +00:00
ASSOC_ITEM_LIST => match parent? {
2021-10-03 12:45:08 +00:00
IMPL | TRAIT => items::assoc_item_list,
_ => return None,
},
2020-08-13 15:58:35 +00:00
ITEM_LIST => items::item_list,
2019-02-20 13:02:06 +00:00
_ => return None,
};
Some(res)
}
2018-08-07 13:32:09 +00:00
/// Two-state flag distinguishing block-like constructs from everything else.
#[derive(Clone, Copy, PartialEq, Eq)]
enum BlockLike {
    /// The construct is block-like.
    Block,
    /// The construct is not block-like.
    NotBlock,
}
2018-08-07 13:32:09 +00:00
impl BlockLike {
fn is_block(self) -> bool {
self == BlockLike::Block
}
2023-03-07 00:24:05 +00:00
fn is_blocklike(kind: SyntaxKind) -> bool {
matches!(kind, BLOCK_EXPR | IF_EXPR | WHILE_EXPR | FOR_EXPR | LOOP_EXPR | MATCH_EXPR)
}
2018-08-07 13:32:09 +00:00
}
/// Token set containing only `pub`, the token a visibility starts with.
const VISIBILITY_FIRST: TokenSet = TokenSet::new(&[T![pub]]);
2022-07-20 13:02:08 +00:00
fn opt_visibility(p: &mut Parser<'_>, in_tuple_field: bool) -> bool {
2023-07-15 14:55:57 +00:00
if !p.at(T![pub]) {
return false;
}
let m = p.start();
p.bump(T![pub]);
if p.at(T!['(']) {
match p.nth(1) {
// test crate_visibility
// pub(crate) struct S;
// pub(self) struct S;
// pub(super) struct S;
// test_err crate_visibility_empty_recover
// pub() struct S;
// test pub_parens_typepath
// struct B(pub (super::A));
// struct B(pub (crate::A,));
T![crate] | T![self] | T![super] | T![ident] | T![')'] if p.nth(2) != T![:] => {
// If we are in a tuple struct, then the parens following `pub`
// might be an tuple field, not part of the visibility. So in that
// case we don't want to consume an identifier.
// test pub_tuple_field
// struct MyStruct(pub (u32, u32));
// struct MyStruct(pub (u32));
// struct MyStruct(pub ());
if !(in_tuple_field && matches!(p.nth(1), T![ident] | T![')'])) {
p.bump(T!['(']);
paths::use_path(p);
p.expect(T![')']);
2018-01-20 14:21:13 +00:00
}
2018-01-12 19:05:46 +00:00
}
2023-07-15 14:55:57 +00:00
// test crate_visibility_in
// pub(in super::A) struct S;
// pub(in crate) struct S;
T![in] => {
p.bump(T!['(']);
p.bump(T![in]);
paths::use_path(p);
p.expect(T![')']);
}
2023-07-15 14:55:57 +00:00
_ => {}
2018-08-08 19:09:47 +00:00
}
2018-01-20 14:21:13 +00:00
}
2023-07-15 14:55:57 +00:00
m.complete(p, VISIBILITY);
true
2018-01-01 15:58:46 +00:00
}
2018-08-23 22:19:38 +00:00
2022-07-20 13:02:08 +00:00
fn opt_rename(p: &mut Parser<'_>) {
2019-05-15 12:35:47 +00:00
if p.at(T![as]) {
2018-08-23 22:19:38 +00:00
let m = p.start();
2019-09-19 19:51:46 +00:00
p.bump(T![as]);
2019-05-15 12:35:47 +00:00
if !p.eat(T![_]) {
name(p);
}
2020-07-30 09:58:41 +00:00
m.complete(p, RENAME);
2018-01-20 14:21:13 +00:00
}
2018-01-08 21:06:42 +00:00
}
2022-07-20 13:02:08 +00:00
fn abi(p: &mut Parser<'_>) {
2019-05-15 12:35:47 +00:00
assert!(p.at(T![extern]));
2018-02-11 09:51:09 +00:00
let abi = p.start();
2019-09-19 19:51:46 +00:00
p.bump(T![extern]);
p.eat(STRING);
2018-02-11 09:51:09 +00:00
abi.complete(p, ABI);
}
2022-07-20 13:02:08 +00:00
fn opt_ret_type(p: &mut Parser<'_>) -> bool {
2019-05-15 12:35:47 +00:00
if p.at(T![->]) {
2018-08-28 18:11:17 +00:00
let m = p.start();
p.bump(T![->]);
types::type_no_bounds(p);
2018-08-28 18:11:17 +00:00
m.complete(p, RET_TYPE);
2018-07-31 20:13:08 +00:00
true
} else {
false
2018-02-11 09:51:09 +00:00
}
}
2022-07-20 13:02:08 +00:00
fn name_r(p: &mut Parser<'_>, recovery: TokenSet) {
2018-02-10 11:00:23 +00:00
if p.at(IDENT) {
let m = p.start();
2019-09-19 19:51:46 +00:00
p.bump(IDENT);
2018-02-10 11:00:23 +00:00
m.complete(p, NAME);
} else {
2018-08-31 10:35:48 +00:00
p.err_recover("expected a name", recovery);
2018-02-10 11:00:23 +00:00
}
}
2022-07-20 13:02:08 +00:00
/// Parses a `NAME`; shorthand for [`name_r`] with an empty recovery set.
fn name(p: &mut Parser<'_>) {
    name_r(p, TokenSet::EMPTY);
}
2022-07-20 13:02:08 +00:00
fn name_ref(p: &mut Parser<'_>) {
2019-08-09 10:16:47 +00:00
if p.at(IDENT) {
2018-02-10 11:17:38 +00:00
let m = p.start();
2019-09-19 19:51:46 +00:00
p.bump(IDENT);
2018-02-10 11:17:38 +00:00
m.complete(p, NAME_REF);
} else {
2018-08-13 15:30:56 +00:00
p.err_and_bump("expected identifier");
2018-02-10 11:17:38 +00:00
}
}
2022-07-20 13:02:08 +00:00
fn name_ref_or_index(p: &mut Parser<'_>) {
assert!(p.at(IDENT) || p.at(INT_NUMBER));
2020-04-11 21:08:05 +00:00
let m = p.start();
p.bump_any();
2020-04-11 21:08:05 +00:00
m.complete(p, NAME_REF);
2019-08-09 10:16:47 +00:00
}
2022-07-20 13:02:08 +00:00
fn lifetime(p: &mut Parser<'_>) {
2020-12-15 18:23:51 +00:00
assert!(p.at(LIFETIME_IDENT));
let m = p.start();
p.bump(LIFETIME_IDENT);
m.complete(p, LIFETIME);
}
2022-07-20 13:02:08 +00:00
fn error_block(p: &mut Parser<'_>, message: &str) {
2019-05-15 12:35:47 +00:00
assert!(p.at(T!['{']));
let m = p.start();
p.error(message);
2019-09-19 19:51:46 +00:00
p.bump(T!['{']);
expressions::expr_block_contents(p);
2019-05-15 12:35:47 +00:00
p.eat(T!['}']);
m.complete(p, ERROR);
2018-01-28 17:48:37 +00:00
}
// test_err top_level_let
// let ref foo: fn() = 1 + 3;
fn error_let_stmt(p: &mut Parser<'_>, message: &str) {
assert!(p.at(T![let]));
let m = p.start();
p.error(message);
expressions::let_stmt(p, expressions::Semicolon::Optional);
m.complete(p, ERROR);
}
/// Parses a `delim`-separated list enclosed between `bra` and `ket`.
///
/// The `parser` passed to this function is required to consume at least one
/// token if it returns `true`. If the `parser` returns `false`, parsing of the
/// list stops.
///
/// * `unexpected_delim_message` builds the error reported when a delimiter
///   appears where an element was expected.
/// * `first_set` is the set of tokens that may start an element. If an element
///   is not followed by `delim` but the next token is in this set, a missing
///   delimiter is reported and parsing continues; otherwise the loop ends.
///
/// The opening `bra` is bumped without a prior check, so the caller is
/// expected to be positioned at it. The closing `ket` is required via
/// `expect`.
fn delimited(
    p: &mut Parser<'_>,
    bra: SyntaxKind,
    ket: SyntaxKind,
    delim: SyntaxKind,
    unexpected_delim_message: impl Fn() -> String,
    first_set: TokenSet,
    mut parser: impl FnMut(&mut Parser<'_>) -> bool,
) {
    p.bump(bra);
    while !p.at(ket) && !p.at(EOF) {
        if p.at(delim) {
            // Recover if an argument is missing and only got a delimiter,
            // e.g. `(a, , b)`.
            // Wrap the erroneous delimiter in an error node so that fixup logic gets rid of it.
            // FIXME: Ideally this should be handled in fixup in a structured way, but our list
            // nodes currently have no concept of a missing node between two delimiters.
            // So doing it this way is easier.
            let m = p.start();
            p.error(unexpected_delim_message());
            p.bump(delim);
            m.complete(p, ERROR);
            continue;
        }
        if !parser(p) {
            break;
        }
        if !p.eat(delim) {
            if p.at_ts(first_set) {
                p.error(format!("expected {delim:?}"));
            } else {
                break;
            }
        }
    }
    p.expect(ket);
}