2020-06-17 06:53:51 +00:00
|
|
|
//! Structural Search Replace
|
|
|
|
//!
|
|
|
|
//! Allows searching the AST for code that matches one or more patterns and then replacing that code
|
|
|
|
//! based on a template.
|
|
|
|
|
|
|
|
mod matching;
|
|
|
|
mod parsing;
|
|
|
|
mod replacing;
|
2020-06-23 12:03:39 +00:00
|
|
|
#[macro_use]
|
|
|
|
mod errors;
|
2020-06-17 06:53:51 +00:00
|
|
|
#[cfg(test)]
|
|
|
|
mod tests;
|
|
|
|
|
2020-06-23 12:03:39 +00:00
|
|
|
pub use crate::errors::SsrError;
|
2020-06-30 05:55:20 +00:00
|
|
|
pub use crate::matching::Match;
|
2020-07-03 02:57:17 +00:00
|
|
|
use crate::matching::MatchFailureReason;
|
2020-06-17 06:53:51 +00:00
|
|
|
use hir::Semantics;
|
|
|
|
use ra_db::{FileId, FileRange};
|
2020-07-03 02:57:17 +00:00
|
|
|
use ra_syntax::{ast, AstNode, SyntaxNode, TextRange};
|
2020-06-17 06:53:51 +00:00
|
|
|
use ra_text_edit::TextEdit;
|
|
|
|
|
|
|
|
// A structured search replace rule. Create by calling `parse` on a str.
|
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct SsrRule {
|
|
|
|
/// A structured pattern that we're searching for.
|
2020-07-03 02:57:17 +00:00
|
|
|
pattern: parsing::RawPattern,
|
2020-06-17 06:53:51 +00:00
|
|
|
/// What we'll replace it with.
|
2020-07-22 09:15:19 +00:00
|
|
|
template: parsing::RawPattern,
|
2020-07-03 02:57:17 +00:00
|
|
|
parsed_rules: Vec<parsing::ParsedRule>,
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Debug)]
|
2020-06-30 05:55:20 +00:00
|
|
|
pub struct SsrPattern {
|
2020-07-03 02:57:17 +00:00
|
|
|
raw: parsing::RawPattern,
|
|
|
|
parsed_rules: Vec<parsing::ParsedRule>,
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Debug, Default)]
|
|
|
|
pub struct SsrMatches {
|
2020-06-30 05:55:20 +00:00
|
|
|
pub matches: Vec<Match>,
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Searches a crate for pattern matches and possibly replaces them with something else.
|
|
|
|
pub struct MatchFinder<'db> {
|
|
|
|
/// Our source of information about the user's code.
|
|
|
|
sema: Semantics<'db, ra_ide_db::RootDatabase>,
|
2020-07-03 02:57:17 +00:00
|
|
|
rules: Vec<parsing::ParsedRule>,
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
impl<'db> MatchFinder<'db> {
|
|
|
|
pub fn new(db: &'db ra_ide_db::RootDatabase) -> MatchFinder<'db> {
|
|
|
|
MatchFinder { sema: Semantics::new(db), rules: Vec::new() }
|
|
|
|
}
|
|
|
|
|
2020-07-03 02:57:17 +00:00
|
|
|
/// Adds a rule to be applied. The order in which rules are added matters. Earlier rules take
|
|
|
|
/// precedence. If a node is matched by an earlier rule, then later rules won't be permitted to
|
|
|
|
/// match to it.
|
2020-06-17 06:53:51 +00:00
|
|
|
pub fn add_rule(&mut self, rule: SsrRule) {
|
2020-07-03 02:57:17 +00:00
|
|
|
self.add_parsed_rules(rule.parsed_rules);
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
|
2020-06-30 05:55:20 +00:00
|
|
|
/// Adds a search pattern. For use if you intend to only call `find_matches_in_file`. If you
|
|
|
|
/// intend to do replacement, use `add_rule` instead.
|
|
|
|
pub fn add_search_pattern(&mut self, pattern: SsrPattern) {
|
2020-07-03 02:57:17 +00:00
|
|
|
self.add_parsed_rules(pattern.parsed_rules);
|
2020-06-30 05:55:20 +00:00
|
|
|
}
|
|
|
|
|
2020-06-17 06:53:51 +00:00
|
|
|
pub fn edits_for_file(&self, file_id: FileId) -> Option<TextEdit> {
|
|
|
|
let matches = self.find_matches_in_file(file_id);
|
|
|
|
if matches.matches.is_empty() {
|
|
|
|
None
|
|
|
|
} else {
|
2020-06-27 10:34:21 +00:00
|
|
|
use ra_db::SourceDatabaseExt;
|
2020-07-22 09:15:19 +00:00
|
|
|
Some(replacing::matches_to_edit(
|
|
|
|
&matches,
|
|
|
|
&self.sema.db.file_text(file_id),
|
|
|
|
&self.rules,
|
|
|
|
))
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-30 05:55:20 +00:00
|
|
|
pub fn find_matches_in_file(&self, file_id: FileId) -> SsrMatches {
|
2020-06-17 06:53:51 +00:00
|
|
|
let file = self.sema.parse(file_id);
|
|
|
|
let code = file.syntax();
|
|
|
|
let mut matches = SsrMatches::default();
|
|
|
|
self.find_matches(code, &None, &mut matches);
|
|
|
|
matches
|
|
|
|
}
|
|
|
|
|
2020-06-30 05:55:20 +00:00
|
|
|
/// Finds all nodes in `file_id` whose text is exactly equal to `snippet` and attempts to match
|
|
|
|
/// them, while recording reasons why they don't match. This API is useful for command
|
|
|
|
/// line-based debugging where providing a range is difficult.
|
|
|
|
pub fn debug_where_text_equal(&self, file_id: FileId, snippet: &str) -> Vec<MatchDebugInfo> {
|
|
|
|
use ra_db::SourceDatabaseExt;
|
|
|
|
let file = self.sema.parse(file_id);
|
|
|
|
let mut res = Vec::new();
|
|
|
|
let file_text = self.sema.db.file_text(file_id);
|
|
|
|
let mut remaining_text = file_text.as_str();
|
|
|
|
let mut base = 0;
|
|
|
|
let len = snippet.len() as u32;
|
|
|
|
while let Some(offset) = remaining_text.find(snippet) {
|
|
|
|
let start = base + offset as u32;
|
|
|
|
let end = start + len;
|
|
|
|
self.output_debug_for_nodes_at_range(
|
|
|
|
file.syntax(),
|
|
|
|
FileRange { file_id, range: TextRange::new(start.into(), end.into()) },
|
|
|
|
&None,
|
|
|
|
&mut res,
|
|
|
|
);
|
|
|
|
remaining_text = &remaining_text[offset + snippet.len()..];
|
|
|
|
base = end;
|
|
|
|
}
|
|
|
|
res
|
|
|
|
}
|
|
|
|
|
2020-07-03 02:57:17 +00:00
|
|
|
fn add_parsed_rules(&mut self, parsed_rules: Vec<parsing::ParsedRule>) {
|
2020-07-22 09:15:19 +00:00
|
|
|
for mut parsed_rule in parsed_rules {
|
|
|
|
parsed_rule.index = self.rules.len();
|
2020-07-03 02:57:17 +00:00
|
|
|
self.rules.push(parsed_rule);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-17 06:53:51 +00:00
|
|
|
fn find_matches(
|
|
|
|
&self,
|
|
|
|
code: &SyntaxNode,
|
|
|
|
restrict_range: &Option<FileRange>,
|
|
|
|
matches_out: &mut SsrMatches,
|
|
|
|
) {
|
|
|
|
for rule in &self.rules {
|
|
|
|
if let Ok(mut m) = matching::get_match(false, rule, &code, restrict_range, &self.sema) {
|
|
|
|
// Continue searching in each of our placeholders.
|
|
|
|
for placeholder_value in m.placeholder_values.values_mut() {
|
2020-06-22 08:15:51 +00:00
|
|
|
if let Some(placeholder_node) = &placeholder_value.node {
|
|
|
|
// Don't search our placeholder if it's the entire matched node, otherwise we'd
|
|
|
|
// find the same match over and over until we got a stack overflow.
|
|
|
|
if placeholder_node != code {
|
|
|
|
self.find_matches(
|
|
|
|
placeholder_node,
|
|
|
|
restrict_range,
|
|
|
|
&mut placeholder_value.inner_matches,
|
|
|
|
);
|
|
|
|
}
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
matches_out.matches.push(m);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2020-06-23 08:59:18 +00:00
|
|
|
// If we've got a macro call, we already tried matching it pre-expansion, which is the only
|
|
|
|
// way to match the whole macro, now try expanding it and matching the expansion.
|
|
|
|
if let Some(macro_call) = ast::MacroCall::cast(code.clone()) {
|
|
|
|
if let Some(expanded) = self.sema.expand(¯o_call) {
|
|
|
|
if let Some(tt) = macro_call.token_tree() {
|
|
|
|
// When matching within a macro expansion, we only want to allow matches of
|
|
|
|
// nodes that originated entirely from within the token tree of the macro call.
|
|
|
|
// i.e. we don't want to match something that came from the macro itself.
|
|
|
|
self.find_matches(
|
|
|
|
&expanded,
|
|
|
|
&Some(self.sema.original_range(tt.syntax())),
|
|
|
|
matches_out,
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2020-06-17 06:53:51 +00:00
|
|
|
for child in code.children() {
|
|
|
|
self.find_matches(&child, restrict_range, matches_out);
|
|
|
|
}
|
|
|
|
}
|
2020-06-30 05:55:20 +00:00
|
|
|
|
|
|
|
fn output_debug_for_nodes_at_range(
|
|
|
|
&self,
|
|
|
|
node: &SyntaxNode,
|
|
|
|
range: FileRange,
|
|
|
|
restrict_range: &Option<FileRange>,
|
|
|
|
out: &mut Vec<MatchDebugInfo>,
|
|
|
|
) {
|
|
|
|
for node in node.children() {
|
|
|
|
let node_range = self.sema.original_range(&node);
|
|
|
|
if node_range.file_id != range.file_id || !node_range.range.contains_range(range.range)
|
|
|
|
{
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if node_range.range == range.range {
|
|
|
|
for rule in &self.rules {
|
2020-07-03 02:57:17 +00:00
|
|
|
// For now we ignore rules that have a different kind than our node, otherwise
|
|
|
|
// we get lots of noise. If at some point we add support for restricting rules
|
|
|
|
// to a particular kind of thing (e.g. only match type references), then we can
|
|
|
|
// relax this.
|
|
|
|
if rule.pattern.kind() != node.kind() {
|
|
|
|
continue;
|
|
|
|
}
|
2020-06-30 05:55:20 +00:00
|
|
|
out.push(MatchDebugInfo {
|
|
|
|
matched: matching::get_match(true, rule, &node, restrict_range, &self.sema)
|
|
|
|
.map_err(|e| MatchFailureReason {
|
|
|
|
reason: e.reason.unwrap_or_else(|| {
|
|
|
|
"Match failed, but no reason was given".to_owned()
|
|
|
|
}),
|
|
|
|
}),
|
2020-07-03 02:57:17 +00:00
|
|
|
pattern: rule.pattern.clone(),
|
2020-06-30 05:55:20 +00:00
|
|
|
node: node.clone(),
|
|
|
|
});
|
|
|
|
}
|
|
|
|
} else if let Some(macro_call) = ast::MacroCall::cast(node.clone()) {
|
|
|
|
if let Some(expanded) = self.sema.expand(¯o_call) {
|
|
|
|
if let Some(tt) = macro_call.token_tree() {
|
|
|
|
self.output_debug_for_nodes_at_range(
|
|
|
|
&expanded,
|
|
|
|
range,
|
|
|
|
&Some(self.sema.original_range(tt.syntax())),
|
|
|
|
out,
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2020-07-03 03:15:00 +00:00
|
|
|
self.output_debug_for_nodes_at_range(&node, range, restrict_range, out);
|
2020-06-30 05:55:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub struct MatchDebugInfo {
|
|
|
|
node: SyntaxNode,
|
2020-07-03 02:57:17 +00:00
|
|
|
/// Our search pattern parsed as an expression or item, etc
|
|
|
|
pattern: SyntaxNode,
|
2020-06-30 05:55:20 +00:00
|
|
|
matched: Result<Match, MatchFailureReason>,
|
2020-06-17 06:53:51 +00:00
|
|
|
}
|
|
|
|
|
2020-06-30 05:55:20 +00:00
|
|
|
impl std::fmt::Debug for MatchDebugInfo {
|
|
|
|
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
2020-07-03 03:15:00 +00:00
|
|
|
match &self.matched {
|
|
|
|
Ok(_) => writeln!(f, "Node matched")?,
|
|
|
|
Err(reason) => writeln!(f, "Node failed to match because: {}", reason.reason)?,
|
|
|
|
}
|
|
|
|
writeln!(
|
|
|
|
f,
|
|
|
|
"============ AST ===========\n\
|
|
|
|
{:#?}",
|
|
|
|
self.node
|
|
|
|
)?;
|
|
|
|
writeln!(f, "========= PATTERN ==========")?;
|
2020-07-03 02:57:17 +00:00
|
|
|
writeln!(f, "{:#?}", self.pattern)?;
|
2020-07-03 03:15:00 +00:00
|
|
|
writeln!(f, "============================")?;
|
2020-06-30 05:55:20 +00:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl SsrMatches {
|
|
|
|
/// Returns `self` with any nested matches removed and made into top-level matches.
|
|
|
|
pub fn flattened(self) -> SsrMatches {
|
|
|
|
let mut out = SsrMatches::default();
|
|
|
|
self.flatten_into(&mut out);
|
|
|
|
out
|
|
|
|
}
|
|
|
|
|
|
|
|
fn flatten_into(self, out: &mut SsrMatches) {
|
|
|
|
for mut m in self.matches {
|
|
|
|
for p in m.placeholder_values.values_mut() {
|
|
|
|
std::mem::replace(&mut p.inner_matches, SsrMatches::default()).flatten_into(out);
|
|
|
|
}
|
|
|
|
out.matches.push(m);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Match {
|
|
|
|
pub fn matched_text(&self) -> String {
|
|
|
|
self.matched_node.text().to_string()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-17 06:53:51 +00:00
|
|
|
// Marks `SsrError` as a standard error type; no trait methods are overridden.
impl std::error::Error for SsrError {}
|
2020-06-30 05:55:20 +00:00
|
|
|
|
|
|
|
#[cfg(test)]
impl MatchDebugInfo {
    /// Returns why the node failed to match, or `None` if it matched. Test-only helper.
    pub(crate) fn match_failure_reason(&self) -> Option<&str> {
        match &self.matched {
            Ok(_) => None,
            Err(failure) => Some(failure.reason.as_str()),
        }
    }
}
|