rust-analyzer/crates/ide/src/syntax_highlighting.rs

385 lines
14 KiB
Rust
Raw Normal View History

2021-01-09 11:45:47 +00:00
pub(crate) mod tags;
mod highlights;
mod injector;
2021-01-09 20:07:32 +00:00
mod highlight;
2020-10-13 22:56:41 +00:00
mod format;
mod macro_;
2021-01-09 20:07:32 +00:00
mod inject;
2021-01-09 11:45:47 +00:00
mod html;
2020-02-27 13:15:32 +00:00
#[cfg(test)]
mod tests;
2020-02-26 16:08:15 +00:00
use hir::{InFile, Name, Semantics};
2021-01-20 14:25:34 +00:00
use ide_db::{RootDatabase, SymbolKind};
2020-08-12 16:26:51 +00:00
use rustc_hash::FxHashMap;
use syntax::{
ast::{self, HasFormatSpecifier},
2021-07-15 19:28:30 +00:00
match_ast, AstNode, AstToken, Direction, NodeOrToken,
2021-01-09 20:07:32 +00:00
SyntaxKind::*,
SyntaxNode, TextRange, WalkEvent, T,
};
2019-01-08 19:33:36 +00:00
2020-10-14 17:23:59 +00:00
use crate::{
2020-11-02 15:31:38 +00:00
syntax_highlighting::{
format::highlight_format_string, highlights::Highlights, macro_::MacroHighlighter,
tags::Highlight,
2020-11-02 15:31:38 +00:00
},
2021-01-20 14:25:34 +00:00
FileId, HlMod, HlTag,
2020-10-14 17:23:59 +00:00
};
2019-03-23 16:34:49 +00:00
pub(crate) use html::highlight_as_html;
2021-01-09 12:54:38 +00:00
#[derive(Debug, Clone, Copy)]
2021-01-09 11:48:15 +00:00
pub struct HlRange {
2019-03-23 16:34:49 +00:00
pub range: TextRange,
2020-02-26 18:39:32 +00:00
pub highlight: Highlight,
pub binding_hash: Option<u64>,
2019-03-23 16:34:49 +00:00
}
2019-01-08 19:33:36 +00:00
// Feature: Semantic Syntax Highlighting
//
// rust-analyzer highlights the code semantically.
2021-05-26 13:23:05 +00:00
// For example, `Bar` in `foo::Bar` might be colored differently depending on whether `Bar` is an enum or a trait.
// rust-analyzer does not specify colors directly, instead it assigns a tag (like `struct`) and a set of modifiers (like `declaration`) to each token.
// It's up to the client to map those to specific colors.
//
// The general rule is that a reference to an entity gets colored the same way as the entity itself.
// We also give a special modifier to `mut` and `&mut` local variables.
//
2021-05-26 13:23:05 +00:00
//
// .Token Tags
//
// Rust-analyzer currently emits the following token tags:
//
// - For items:
// +
// [horizontal]
// enum:: Emitted for enums.
// function:: Emitted for free-standing functions.
// macro:: Emitted for macros.
// method:: Emitted for associated functions, also known as methods.
// namespace:: Emitted for modules.
// struct:: Emitted for structs.
// trait:: Emitted for traits.
// typeAlias:: Emitted for type aliases and `Self` in `impl`s.
// union:: Emitted for unions.
//
// - For literals:
// +
// [horizontal]
// boolean:: Emitted for the boolean literals `true` and `false`.
// character:: Emitted for character literals.
// number:: Emitted for numeric literals.
// string:: Emitted for string literals.
// escapeSequence:: Emitted for escaped sequences inside strings like `\n`.
// formatSpecifier:: Emitted for format specifiers `{:?}` in `format!`-like macros.
//
// - For operators:
// +
// [horizontal]
// operator:: Emitted for general operators.
// arithmetic:: Emitted for the arithmetic operators `+`, `-`, `*`, `/`, `+=`, `-=`, `*=`, `/=`.
// bitwise:: Emitted for the bitwise operators `|`, `&`, `!`, `^`, `|=`, `&=`, `^=`.
// comparison:: Emitted for the comparison operators `>`, `<`, `==`, `>=`, `<=`, `!=`.
// logical:: Emitted for the logical operators `||`, `&&`, `!`.
//
// - For punctuation:
// +
// [horizontal]
// punctuation:: Emitted for general punctuation.
// angle:: Emitted for `<>` angle brackets.
// brace:: Emitted for `{}` braces.
// bracket:: Emitted for `[]` brackets.
// parenthesis:: Emitted for `()` parentheses.
// colon:: Emitted for the `:` token.
// comma:: Emitted for the `,` token.
// dot:: Emitted for the `.` token.
// semi:: Emitted for the `;` token.
//
// //-
//
// [horizontal]
// attribute:: Emitted for the `#[` `]` tokens.
// builtinAttribute:: Emitted for names to builtin attributes in attribute path, the `repr` in `#[repr(u8)]` for example.
2021-05-26 13:23:05 +00:00
// builtinType:: Emitted for builtin types like `u32`, `str` and `f32`.
// comment:: Emitted for comments.
// constParameter:: Emitted for const parameters.
// enumMember:: Emitted for enum variants.
// generic:: Emitted for generic tokens that have no mapping.
// keyword:: Emitted for keywords.
// label:: Emitted for labels.
// lifetime:: Emitted for lifetimes.
// parameter:: Emitted for non-self function parameters.
// property:: Emitted for struct and union fields.
// selfKeyword:: Emitted for the self function parameter and self path-specifier.
// typeParameter:: Emitted for type parameters.
// unresolvedReference:: Emitted for unresolved references, names that rust-analyzer can't find the definition of.
// variable:: Emitted for locals, constants and statics.
//
//
2021-05-26 11:29:00 +00:00
// .Token Modifiers
//
// Token modifiers allow styling some elements in the source code more precisely.
//
// Rust-analyzer currently emits the following token modifiers:
//
// [horizontal]
// async:: Emitted for async functions and the `async` and `await` keywords.
// attribute:: Emitted for tokens inside attributes.
// callable:: Emitted for locals whose types implement one of the `Fn*` traits.
2021-05-26 13:23:05 +00:00
// constant:: Emitted for consts.
2021-05-26 11:29:00 +00:00
// consuming:: Emitted for locals that are being consumed when used in a function call.
// controlFlow:: Emitted for control-flow related tokens, this includes the `?` operator.
// declaration:: Emitted for names of definitions, like `foo` in `fn foo() {}`.
// documentation:: Emitted for documentation comments.
// injected:: Emitted for doc-string injected highlighting like rust source blocks in documentation.
// intraDocLink:: Emitted for intra doc links in doc-strings.
// library:: Emitted for items that are defined outside of the current crate.
// public:: Emitted for items that are from the current crate and are `pub`.
2021-05-26 11:29:00 +00:00
// mutable:: Emitted for mutable locals and statics.
2021-05-26 13:23:05 +00:00
// static:: Emitted for "static" functions, also known as functions that do not take a `self` param, as well as statics and consts.
2021-05-26 11:29:00 +00:00
// trait:: Emitted for associated trait items.
// unsafe:: Emitted for unsafe operations, like unsafe function calls, as well as the `unsafe` token.
//
//
// image::https://user-images.githubusercontent.com/48062697/113164457-06cfb980-9239-11eb-819b-0f93e646acf8.png[]
// image::https://user-images.githubusercontent.com/48062697/113187625-f7f50100-9250-11eb-825e-91c58f236071.png[]
pub(crate) fn highlight(
2020-02-25 13:38:50 +00:00
db: &RootDatabase,
file_id: FileId,
2020-02-27 10:37:21 +00:00
range_to_highlight: Option<TextRange>,
syntactic_name_ref_highlighting: bool,
2021-01-09 11:48:15 +00:00
) -> Vec<HlRange> {
2020-08-12 14:32:36 +00:00
let _p = profile::span("highlight");
let sema = Semantics::new(db);
2020-02-27 10:37:21 +00:00
// Determine the root based on the given range.
let (root, range_to_highlight) = {
let source_file = sema.parse(file_id);
2021-07-15 19:28:30 +00:00
let source_file = source_file.syntax();
2020-02-27 10:37:21 +00:00
match range_to_highlight {
Some(range) => {
2021-07-15 19:28:30 +00:00
let node = match source_file.covering_element(range) {
2020-02-27 10:37:21 +00:00
NodeOrToken::Node(it) => it,
2021-07-15 19:28:30 +00:00
NodeOrToken::Token(it) => it.parent().unwrap_or_else(|| source_file.clone()),
2020-02-27 10:37:21 +00:00
};
(node, range)
}
2021-07-15 19:28:30 +00:00
None => (source_file.clone(), source_file.text_range()),
2020-02-27 10:37:21 +00:00
}
};
2020-02-25 13:38:50 +00:00
let mut hl = highlights::Highlights::new(root.text_range());
traverse(
&mut hl,
&sema,
InFile::new(file_id.into(), &root),
sema.scope(&root).krate(),
range_to_highlight,
syntactic_name_ref_highlighting,
);
2021-01-09 20:07:32 +00:00
hl.to_vec()
}
fn traverse(
hl: &mut Highlights,
sema: &Semantics<RootDatabase>,
root: InFile<&SyntaxNode>,
krate: Option<hir::Crate>,
2021-01-09 20:07:32 +00:00
range_to_highlight: TextRange,
syntactic_name_ref_highlighting: bool,
) {
let mut bindings_shadow_count: FxHashMap<Name, u32> = FxHashMap::default();
2020-10-14 17:23:59 +00:00
let mut current_macro_call: Option<ast::MacroCall> = None;
let mut current_attr_macro_call = None;
let mut current_macro: Option<ast::Macro> = None;
let mut macro_highlighter = MacroHighlighter::default();
let mut inside_attribute = false;
2020-02-27 13:00:51 +00:00
// Walk all nodes, keeping track of whether we are inside a macro or not.
// If in macro, expand it first and highlight the expanded code.
for event in root.value.preorder_with_tokens() {
2020-02-27 10:39:54 +00:00
let event_range = match &event {
WalkEvent::Enter(it) | WalkEvent::Leave(it) => it.text_range(),
2020-02-27 10:39:54 +00:00
};
2020-02-27 13:00:51 +00:00
// Element outside of the viewport, no need to highlight
2020-04-24 21:40:41 +00:00
if range_to_highlight.intersect(event_range).is_none() {
2020-02-27 10:39:54 +00:00
continue;
}
2021-07-15 19:28:30 +00:00
match event.clone() {
WalkEvent::Enter(NodeOrToken::Node(node)) => {
match_ast! {
match node {
ast::MacroCall(mcall) => {
if let Some(range) = macro_call_range(&mcall) {
hl.add(HlRange {
range,
highlight: HlTag::Symbol(SymbolKind::Macro).into(),
binding_hash: None,
});
}
current_macro_call = Some(mcall);
continue;
},
ast::Macro(mac) => {
macro_highlighter.init();
current_macro = Some(mac);
continue;
},
ast::Item(item) => {
if sema.is_attr_macro_call(&item) {
current_attr_macro_call = Some(item);
}
},
ast::Attr(__) => inside_attribute = true,
_ => ()
}
2020-02-27 10:39:54 +00:00
}
2020-02-27 10:56:42 +00:00
}
2021-07-15 19:28:30 +00:00
WalkEvent::Leave(NodeOrToken::Node(node)) => {
match_ast! {
match node {
ast::MacroCall(mcall) => {
assert_eq!(current_macro_call, Some(mcall));
current_macro_call = None;
},
ast::Macro(mac) => {
assert_eq!(current_macro, Some(mac));
current_macro = None;
macro_highlighter = MacroHighlighter::default();
},
ast::Item(item) => {
if current_attr_macro_call == Some(item) {
current_attr_macro_call = None;
}
},
ast::Attr(__) => inside_attribute = false,
_ => ()
}
}
}
_ => (),
}
2020-02-27 13:00:51 +00:00
let element = match event {
2020-02-27 10:56:42 +00:00
WalkEvent::Enter(it) => it,
2021-01-09 20:07:32 +00:00
WalkEvent::Leave(it) => {
if let Some(node) = it.as_node() {
inject::doc_comment(hl, sema, root.with_value(node));
2021-01-09 20:07:32 +00:00
}
continue;
}
2020-02-27 10:56:42 +00:00
};
2020-02-27 15:05:35 +00:00
2020-02-27 13:00:51 +00:00
let range = element.text_range();
2020-02-27 10:56:42 +00:00
if current_macro.is_some() {
2020-12-15 14:37:37 +00:00
if let Some(tok) = element.as_token() {
macro_highlighter.advance(tok);
2020-12-15 14:37:37 +00:00
}
}
let element_to_highlight = if current_macro_call.is_some() && element.kind() != COMMENT {
2020-02-27 13:00:51 +00:00
// Inside a macro -- expand it first
2020-02-27 15:05:35 +00:00
let token = match element.clone().into_token() {
Some(it) if it.parent().map_or(false, |it| it.kind() == TOKEN_TREE) => it,
2020-02-27 13:00:51 +00:00
_ => continue,
};
let token = sema.descend_into_macros(token.clone());
match token.parent() {
Some(parent) => {
// We only care Name and Name_ref
match (token.kind(), parent.kind()) {
2021-06-17 15:37:14 +00:00
(IDENT, NAME | NAME_REF) => parent.into(),
_ => token.into(),
}
}
None => token.into(),
}
} else if current_attr_macro_call.is_some() {
let token = match element.clone().into_token() {
Some(it) => it,
_ => continue,
};
let token = sema.descend_into_macros(token.clone());
match token.parent() {
Some(parent) => {
// We only care Name and Name_ref
match (token.kind(), parent.kind()) {
2021-06-17 15:37:14 +00:00
(IDENT, NAME | NAME_REF) => parent.into(),
_ => token.into(),
}
}
None => token.into(),
}
2020-02-27 13:00:51 +00:00
} else {
2020-02-27 15:05:35 +00:00
element.clone()
2020-02-27 13:00:51 +00:00
};
2020-02-27 10:56:42 +00:00
if let Some(token) = element.as_token().cloned().and_then(ast::String::cast) {
if token.is_raw() {
let expanded = element_to_highlight.as_token().unwrap().clone();
2021-06-13 03:54:16 +00:00
if inject::ra_fixture(hl, sema, token, expanded).is_some() {
continue;
}
2020-02-27 15:05:35 +00:00
}
}
if let Some(_) = macro_highlighter.highlight(element_to_highlight.clone()) {
2021-01-10 08:57:17 +00:00
continue;
}
2021-01-09 20:07:32 +00:00
if let Some((mut highlight, binding_hash)) = highlight::element(
2021-06-13 03:54:16 +00:00
sema,
krate,
&mut bindings_shadow_count,
syntactic_name_ref_highlighting,
element_to_highlight.clone(),
) {
if inside_attribute {
2021-01-09 11:44:01 +00:00
highlight = highlight | HlMod::Attribute;
}
2021-01-10 08:57:17 +00:00
hl.add(HlRange { range, highlight, binding_hash });
}
2020-10-14 17:23:59 +00:00
2021-01-10 08:57:17 +00:00
if let Some(string) = element_to_highlight.as_token().cloned().and_then(ast::String::cast) {
highlight_format_string(hl, &string, range);
// Highlight escape sequences
if let Some(char_ranges) = string.char_ranges() {
for (piece_range, _) in char_ranges.iter().filter(|(_, char)| char.is_ok()) {
if string.text()[piece_range.start().into()..].starts_with('\\') {
hl.add(HlRange {
range: piece_range + range.start(),
highlight: HlTag::EscapeSequence.into(),
binding_hash: None,
});
}
}
}
}
}
}
2020-02-27 13:00:51 +00:00
fn macro_call_range(macro_call: &ast::MacroCall) -> Option<TextRange> {
let path = macro_call.path()?;
let name_ref = path.segment()?.name_ref()?;
let range_start = name_ref.syntax().text_range().start();
let mut range_end = name_ref.syntax().text_range().end();
for sibling in path.syntax().siblings_with_tokens(Direction::Next) {
match sibling.kind() {
T![!] | IDENT => range_end = sibling.text_range().end(),
_ => (),
}
}
2020-04-24 21:40:41 +00:00
Some(TextRange::new(range_start, range_end))
}