use clippy_utils::{ can_move_expr_to_closure_no_visit, diagnostics::span_lint_and_sugg, is_expr_final_block_expr, is_expr_used_or_unified, match_def_path, paths, peel_hir_expr_while, source::{reindent_multiline, snippet_indent, snippet_with_applicability, snippet_with_context}, SpanlessEq, }; use rustc_errors::Applicability; use rustc_hir::{ intravisit::{walk_expr, ErasedMap, NestedVisitorMap, Visitor}, Block, Expr, ExprKind, Guard, HirId, Local, Stmt, StmtKind, UnOp, }; use rustc_lint::{LateContext, LateLintPass}; use rustc_session::{declare_lint_pass, declare_tool_lint}; use rustc_span::{Span, SyntaxContext, DUMMY_SP}; use std::fmt::Write; declare_clippy_lint! { /// **What it does:** Checks for uses of `contains_key` + `insert` on `HashMap` /// or `BTreeMap`. /// /// **Why is this bad?** Using `entry` is more efficient. /// /// **Known problems:** The suggestion may have type inference errors in some cases. e.g. /// ```rust /// let mut map = std::collections::HashMap::new(); /// let _ = if !map.contains_key(&0) { /// map.insert(0, 0) /// } else { /// None /// }; /// ``` /// /// **Example:** /// ```rust /// # use std::collections::HashMap; /// # let mut map = HashMap::new(); /// # let k = 1; /// # let v = 1; /// if !map.contains_key(&k) { /// map.insert(k, v); /// } /// ``` /// can both be rewritten as: /// ```rust /// # use std::collections::HashMap; /// # let mut map = HashMap::new(); /// # let k = 1; /// # let v = 1; /// map.entry(k).or_insert(v); /// ``` pub MAP_ENTRY, perf, "use of `contains_key` followed by `insert` on a `HashMap` or `BTreeMap`" } declare_lint_pass!(HashMapPass => [MAP_ENTRY]); impl<'tcx> LateLintPass<'tcx> for HashMapPass { #[allow(clippy::too_many_lines)] fn check_expr(&mut self, cx: &LateContext<'tcx>, expr: &'tcx Expr<'_>) { let (cond_expr, then_expr, else_expr) = match expr.kind { ExprKind::If(c, t, e) => (c, t, e), _ => return, }; let (map_ty, contains_expr) = match try_parse_contains(cx, cond_expr) { Some(x) => x, None => return, }; let then_search = match find_insert_calls(cx, &contains_expr, then_expr) { Some(x) => x, None => return, }; let mut app = Applicability::MachineApplicable; let map_str = snippet_with_context(cx, contains_expr.map.span, contains_expr.call_ctxt, "..", &mut app).0; let key_str = snippet_with_context(cx, contains_expr.key.span, contains_expr.call_ctxt, "..", &mut app).0; let sugg = if let Some(else_expr) = else_expr { // if .. { .. } else { .. } let else_search = match find_insert_calls(cx, &contains_expr, else_expr) { Some(search) if !(then_search.edits.is_empty() && search.edits.is_empty()) => search, _ => return, }; if then_search.edits.is_empty() || else_search.edits.is_empty() { // if .. { insert } else { .. } or if .. { .. } else { then } of let (then_str, else_str, entry_kind) = if else_search.edits.is_empty() { if contains_expr.negated { ( then_search.snippet_vacant(cx, then_expr.span, &mut app), snippet_with_applicability(cx, else_expr.span, "{ .. }", &mut app), "Vacant(e)", ) } else { ( then_search.snippet_occupied(cx, then_expr.span, &mut app), snippet_with_applicability(cx, else_expr.span, "{ .. }", &mut app), "Occupied(mut e)", ) } } else if contains_expr.negated { ( else_search.snippet_occupied(cx, else_expr.span, &mut app), snippet_with_applicability(cx, then_expr.span, "{ .. }", &mut app), "Occupied(mut e)", ) } else { ( else_search.snippet_vacant(cx, else_expr.span, &mut app), snippet_with_applicability(cx, then_expr.span, "{ .. }", &mut app), "Vacant(e)", ) }; format!( "if let {}::{} = {}.entry({}) {} else {}", map_ty.entry_path(), entry_kind, map_str, key_str, then_str, else_str, ) } else { // if .. { insert } else { insert } let (then_str, else_str, then_entry, else_entry) = if contains_expr.negated { ( then_search.snippet_vacant(cx, then_expr.span, &mut app), else_search.snippet_occupied(cx, else_expr.span, &mut app), "Vacant(e)", "Occupied(mut e)", ) } else { ( then_search.snippet_occupied(cx, then_expr.span, &mut app), else_search.snippet_vacant(cx, else_expr.span, &mut app), "Occupied(mut e)", "Vacant(e)", ) }; let indent_str = snippet_indent(cx, expr.span); let indent_str = indent_str.as_deref().unwrap_or(""); format!( "match {}.entry({}) {{\n{indent} {entry}::{} => {}\n\ {indent} {entry}::{} => {}\n{indent}}}", map_str, key_str, then_entry, reindent_multiline(then_str.into(), true, Some(4 + indent_str.len())), else_entry, reindent_multiline(else_str.into(), true, Some(4 + indent_str.len())), entry = map_ty.entry_path(), indent = indent_str, ) } } else if then_search.edits.is_empty() { // no insertions return; } else { // if .. { insert } if !then_search.allow_insert_closure { let (body_str, entry_kind) = if contains_expr.negated { (then_search.snippet_vacant(cx, then_expr.span, &mut app), "Vacant(e)") } else { ( then_search.snippet_occupied(cx, then_expr.span, &mut app), "Occupied(mut e)", ) }; format!( "if let {}::{} = {}.entry({}) {}", map_ty.entry_path(), entry_kind, map_str, key_str, body_str, ) } else if let Some(insertion) = then_search.as_single_insertion() { let value_str = snippet_with_context(cx, insertion.value.span, then_expr.span.ctxt(), "..", &mut app).0; if contains_expr.negated { if insertion.value.can_have_side_effects() { format!("{}.entry({}).or_insert_with(|| {});", map_str, key_str, value_str) } else { format!("{}.entry({}).or_insert({});", map_str, key_str, value_str) } } else { // Todo: if let Some(v) = map.get_mut(k) return; } } else { let block_str = then_search.snippet_closure(cx, then_expr.span, &mut app); if contains_expr.negated { format!("{}.entry({}).or_insert_with(|| {});", map_str, key_str, block_str) } else { // Todo: if let Some(v) = map.get_mut(k) return; } } }; span_lint_and_sugg( cx, MAP_ENTRY, expr.span, &format!("usage of `contains_key` followed by `insert` on a `{}`", map_ty.name()), "try this", sugg, app, ); } } #[derive(Clone, Copy)] enum MapType { Hash, BTree, } impl MapType { fn name(self) -> &'static str { match self { Self::Hash => "HashMap", Self::BTree => "BTreeMap", } } fn entry_path(self) -> &'staic str { match self { Self::Hash => "std::collections::hash_map::Entry", Self::BTree => "std::collections::btree_map::Entry", } } } struct ContainsExpr<'tcx> { negated: bool, map: &'tcx Expr<'tcx>, key: &'tcx Expr<'tcx>, call_ctxt: SyntaxContext, } fn try_parse_contains(cx: &LateContext<'_>, expr: &'tcx Expr<'_>) -> Option<(MapType, ContainsExpr<'tcx>)> { let mut negated = false; let expr = peel_hir_expr_while(expr, |e| match e.kind { ExprKind::Unary(UnOp::Not, e) => { negated = !negated; Some(e) }, _ => None, }); match expr.kind { ExprKind::MethodCall( _, _, [map, Expr { kind: ExprKind::AddrOf(_, _, key), span: key_span, .. }], _, ) if key_span.ctxt() == expr.span.ctxt() => { let id = cx.typeck_results().type_dependent_def_id(expr.hir_id)?; let expr = ContainsExpr { negated, map, key, call_ctxt: expr.span.ctxt(), }; if match_def_path(cx, id, &paths::BTREEMAP_CONTAINS_KEY) { Some((MapType::BTree, expr)) } else if match_def_path(cx, id, &paths::HASHMAP_CONTAINS_KEY) { Some((MapType::Hash, expr)) } else { None } }, _ => None, } } struct InsertExpr<'tcx> { map: &'tcx Expr<'tcx>, key: &'tcx Expr<'tcx>, value: &'tcx Expr<'tcx>, } fn try_parse_insert(cx: &LateContext<'tcx>, expr: &'tcx Expr<'_>) -> Option> { if let ExprKind::MethodCall(_, _, [map, key, value], _) = expr.kind { let id = cx.typeck_results().type_dependent_def_id(expr.hir_id)?; if match_def_path(cx, id, &paths::BTREEMAP_INSERT) || match_def_path(cx, id, &paths::HASHMAP_INSERT) { Some(InsertExpr { map, key, value }) } else { None } } else { None } } /// An edit that will need to be made to move the expression to use the entry api #[derive(Clone, Copy)] enum Edit<'tcx> { /// A semicolon that needs to be removed. Used to create a closure for `insert_with`. RemoveSemi(Span), /// An insertion into the map. Insertion(Insertion<'tcx>), } impl Edit<'tcx> { fn as_insertion(self) -> Option> { if let Self::Insertion(i) = self { Some(i) } else { None } } } #[derive(Clone, Copy)] struct Insertion<'tcx> { call: &'tcx Expr<'tcx>, value: &'tcx Expr<'tcx>, } // This visitor needs to do a multiple things: // * Find all usages of the map. Only insertions into the map which share the same key are // permitted. All others will prevent the lint. // * Determine if the final statement executed is an insertion. This is needed to use `insert_with`. // * Determine if there's any sub-expression that can't be placed in a closure. // * Determine if there's only a single insert statement. This is needed to give better suggestions. #[allow(clippy::struct_excessive_bools)] struct InsertSearcher<'cx, 'i, 'tcx> { cx: &'cx LateContext<'tcx>, /// The map expression used in the contains call. map: &'tcx Expr<'tcx>, /// The key expression used in the contains call. key: &'tcx Expr<'tcx>, /// The context of the top level block. All insert calls must be in the same context. ctxt: SyntaxContext, /// Whether this expression can be safely moved into a closure. allow_insert_closure: bool, /// Whether this expression can use the entry api. can_use_entry: bool, /// Whether this expression is the final expression in this code path. This may be a statement. in_tail_pos: bool, // A single insert expression has a slightly different suggestion. is_single_insert: bool, is_map_used: bool, edits: &'i mut Vec>, loops: Vec, } impl<'tcx> InsertSearcher<'_, '_, 'tcx> { /// Visit the expression as a branch in control flow. Multiple insert calls can be used, but /// only if they are on separate code paths. This will return whether the map was used in the /// given expression. fn visit_cond_arm(&mut self, e: &'tcx Expr<'_>) -> bool { let is_map_used = self.is_map_used; let in_tail_pos = self.in_tail_pos; self.visit_expr(e); let res = self.is_map_used; self.is_map_used = is_map_used; self.in_tail_pos = in_tail_pos; res } /// Visits an expression which is not itself in a tail position, but other sibling expressions /// may be. e.g. if conditions fn visit_non_tail_expr(&mut self, e: &'tcx Expr<'_>) { let in_tail_pos = self.in_tail_pos; self.in_tail_pos = false; self.visit_expr(e); self.in_tail_pos = in_tail_pos; } } impl<'tcx> Visitor<'tcx> for InsertSearcher<'_, '_, 'tcx> { type Map = ErasedMap<'tcx>; fn nested_visit_map(&mut self) -> NestedVisitorMap { NestedVisitorMap::None } fn visit_stmt(&mut self, stmt: &'tcx Stmt<'_>) { match stmt.kind { StmtKind::Semi(e) => { self.visit_expr(e); if self.in_tail_pos && self.allow_insert_closure { // The spans are used to slice the top level expression into multiple parts. This requires that // they all come from the same part of the source code. if stmt.span.ctxt() == self.ctxt && e.span.ctxt() == self.ctxt { self.edits .push(Edit::RemoveSemi(stmt.span.trim_start(e.span).unwrap_or(DUMMY_SP))); } else { self.allow_insert_closure = false; } } }, StmtKind::Expr(e) => self.visit_expr(e), StmtKind::Local(Local { init: Some(e), .. }) => { self.allow_insert_closure &= !self.in_tail_pos; self.in_tail_pos = false; self.is_single_insert = false; self.visit_expr(e); }, _ => { self.allow_insert_closure &= !self.in_tail_pos; self.is_single_insert = false; }, } } fn visit_block(&mut self, block: &'tcx Block<'_>) { // If the block is in a tail position, then the last expression (possibly a statement) is in the // tail position. The rest, however, are not. match (block.stmts, block.expr) { ([], None) => { self.allow_insert_closure &= !self.in_tail_pos; }, ([], Some(expr)) => self.visit_expr(expr), (stmts, Some(expr)) => { let in_tail_pos = self.in_tail_pos; self.in_tail_pos = false; for stmt in stmts { self.visit_stmt(stmt); } self.in_tail_pos = in_tail_pos; self.visit_expr(expr); }, ([stmts @ .., stmt], None) => { let in_tail_pos = self.in_tail_pos; self.in_tail_pos = false; for stmt in stmts { self.visit_stmt(stmt); } self.in_tail_pos = in_tail_pos; self.visit_stmt(stmt); }, } } fn visit_expr(&mut self, expr: &'tcx Expr<'_>) { if !self.can_use_entry { return; } match try_parse_insert(self.cx, expr) { Some(insert_expr) if SpanlessEq::new(self.cx).eq_expr(self.map, insert_expr.map) => { // Multiple inserts, inserts with a different key, and inserts from a macro can't use the entry api. if self.is_map_used || !SpanlessEq::new(self.cx).eq_expr(self.key, insert_expr.key) || expr.span.ctxt() != self.ctxt { self.can_use_entry = false; return; } self.edits.push(Edit::Insertion(Insertion { call: expr, value: insert_expr.value, })); self.is_map_used = true; self.allow_insert_closure &= self.in_tail_pos; // The value doesn't affect whether there is only a single insert expression. let is_single_insert = self.is_single_insert; self.visit_non_tail_expr(insert_expr.value); self.is_single_insert = is_single_insert; }, _ if SpanlessEq::new(self.cx).eq_expr(self.map, expr) => { self.is_map_used = true; }, _ => match expr.kind { ExprKind::If(cond_expr, then_expr, Some(else_expr)) => { self.is_single_insert = false; self.visit_non_tail_expr(cond_expr); // Each branch may contain it's own insert expression. let mut is_map_used = self.visit_cond_arm(then_expr); is_map_used |= self.visit_cond_arm(else_expr); self.is_map_used = is_map_used; }, ExprKind::Match(scrutinee_expr, arms, _) => { self.is_single_insert = false; self.visit_non_tail_expr(scrutinee_expr); // Each branch may contain it's own insert expression. let mut is_map_used = self.is_map_used; for arm in arms { if let Some(Guard::If(guard) | Guard::IfLet(_, guard)) = arm.guard { self.visit_non_tail_expr(guard) } is_map_used |= self.visit_cond_arm(arm.body); } self.is_map_used = is_map_used; }, ExprKind::Loop(block, ..) => { self.loops.push(expr.hir_id); self.allow_insert_closure &= !self.in_tail_pos; // Don't allow insertions inside of a loop. let edit_len = self.edits.len(); self.visit_block(block); if self.edits.len() != edit_len { self.can_use_entry = false; } self.loops.pop(); }, ExprKind::Block(block, _) => self.visit_block(block), ExprKind::InlineAsm(_) | ExprKind::LlvmInlineAsm(_) => { self.can_use_entry = false; }, _ => { self.allow_insert_closure &= !self.in_tail_pos; self.allow_insert_closure &= can_move_expr_to_closure_no_visit(self.cx, expr, &self.loops); // Sub expressions are no longer in the tail position. self.is_single_insert = false; self.in_tail_pos = false; walk_expr(self, expr); }, }, } } } struct InsertSearchResults<'tcx> { edits: Vec>, allow_insert_closure: bool, is_single_insert: bool, } impl InsertSearchResults<'tcx> { fn as_single_insertion(&self) -> Option> { self.is_single_insert.then(|| self.edits[0].as_insertion().unwrap()) } fn snippet_occupied(&self, cx: &LateContext<'_>, mut span: Span, app: &mut Applicability) -> String { let ctxt = span.ctxt(); let mut res = String::new(); for insertion in self.edits.iter().filter_map(|e| e.as_insertion()) { res.push_str(&snippet_with_applicability( cx, span.until(insertion.call.span), "..", app, )); if is_expr_used_or_unified(cx.tcx, insertion.call) { res.push_str("Some(e.insert("); res.push_str(&snippet_with_context(cx, insertion.value.span, ctxt, "..", app).0); res.push_str("))"); } else { res.push_str("e.insert("); res.push_str(&snippet_with_context(cx, insertion.value.span, ctxt, "..", app).0); res.push(')'); } span = span.trim_start(insertion.call.span).unwrap_or(DUMMY_SP); } res.push_str(&snippet_with_applicability(cx, span, "..", app)); res } fn snippet_vacant(&self, cx: &LateContext<'_>, mut span: Span, app: &mut Applicability) -> String { let ctxt = span.ctxt(); let mut res = String::new(); for insertion in self.edits.iter().filter_map(|e| e.as_insertion()) { res.push_str(&snippet_with_applicability( cx, span.until(insertion.call.span), "..", app, )); if is_expr_used_or_unified(cx.tcx, insertion.call) { if is_expr_final_block_expr(cx.tcx, insertion.call) { let _ = write!( res, "e.insert({});\n{}None", snippet_with_context(cx, insertion.value.span, ctxt, "..", app).0, snippet_indent(cx, insertion.call.span).as_deref().unwrap_or(""), ); } else { let _ = write!( res, "{{ e.insert({}); None }}", snippet_with_context(cx, insertion.value.span, ctxt, "..", app).0, ); } } else { let _ = write!( res, "e.insert({})", snippet_with_context(cx, insertion.value.span, ctxt, "..", app).0, ); } span = span.trim_start(insertion.call.span).unwrap_or(DUMMY_SP); } res.push_str(&snippet_with_applicability(cx, span, "..", app)); res } fn snippet_closure(&self, cx: &LateContext<'_>, mut span: Span, app: &mut Applicability) -> String { let ctxt = span.ctxt(); let mut res = String::new(); for edit in &self.edits { match *edit { Edit::Insertion(insertion) => { res.push_str(&snippet_with_applicability( cx, span.until(insertion.call.span), "..", app, )); res.push_str(&snippet_with_context(cx, insertion.value.span, ctxt, "..", app).0); span = span.trim_start(insertion.call.span).unwrap_or(DUMMY_SP); }, Edit::RemoveSemi(semi_span) => { res.push_str(&snippet_with_applicability(cx, span.until(semi_span), "..", app)); span = span.trim_start(semi_span).unwrap_or(DUMMY_SP); }, } } res.push_str(&snippet_with_applicability(cx, span, "..", app)); res } } fn find_insert_calls( cx: &LateContext<'tcx>, contains_expr: &ContainsExpr<'tcx>, expr: &'tcx Expr<'_>, ) -> Option> { let mut edits = Vec::new(); let mut s = InsertSearcher { cx, map: contains_expr.map, key: contains_expr.key, ctxt: expr.span.ctxt(), edits: &mut edits, is_map_used: false, allow_insert_closure: true, can_use_entry: true, in_tail_pos: true, is_single_insert: true, loops: Vec::new(), }; s.visit_expr(expr); let allow_insert_closure = s.allow_insert_closure; let is_single_insert = s.is_single_insert; s.can_use_entry.then(|| InsertSearchResults { edits, allow_insert_closure, is_single_insert, }) }