2022-02-06 18:53:51 +00:00
|
|
|
|
use clippy_utils::diagnostics::span_lint_and_then;
|
|
|
|
|
use clippy_utils::source::snippet;
|
|
|
|
|
use clippy_utils::{path_to_local, search_same, SpanlessEq, SpanlessHash};
|
2022-01-06 07:54:35 +00:00
|
|
|
|
use rustc_ast::ast::LitKind;
|
|
|
|
|
use rustc_hir::def_id::DefId;
|
|
|
|
|
use rustc_hir::{Arm, Expr, ExprKind, HirId, HirIdMap, HirIdSet, Pat, PatKind, RangeEnd};
|
2022-02-06 18:53:51 +00:00
|
|
|
|
use rustc_lint::LateContext;
|
2022-01-06 07:54:35 +00:00
|
|
|
|
use rustc_span::Symbol;
|
2022-02-06 18:53:51 +00:00
|
|
|
|
use std::collections::hash_map::Entry;
|
|
|
|
|
|
|
|
|
|
use super::MATCH_SAME_ARMS;
|
|
|
|
|
|
2022-01-06 07:54:35 +00:00
|
|
|
|
pub(super) fn check<'tcx>(cx: &LateContext<'tcx>, arms: &'tcx [Arm<'_>]) {
|
2022-02-17 15:48:24 +00:00
|
|
|
|
let hash = |&(_, arm): &(usize, &Arm<'_>)| -> u64 {
|
|
|
|
|
let mut h = SpanlessHash::new(cx);
|
|
|
|
|
h.hash_expr(arm.body);
|
|
|
|
|
h.finish()
|
|
|
|
|
};
|
2022-02-06 18:53:51 +00:00
|
|
|
|
|
2022-01-06 07:54:35 +00:00
|
|
|
|
let resolved_pats: Vec<_> = arms.iter().map(|a| ResolvedPat::from_pat(cx, a.pat)).collect();
|
|
|
|
|
|
|
|
|
|
// The furthast forwards a pattern can move without semantic changes
|
|
|
|
|
let forwards_blocking_idxs: Vec<_> = resolved_pats
|
|
|
|
|
.iter()
|
|
|
|
|
.enumerate()
|
|
|
|
|
.map(|(i, pat)| {
|
|
|
|
|
resolved_pats[i + 1..]
|
|
|
|
|
.iter()
|
|
|
|
|
.enumerate()
|
|
|
|
|
.find_map(|(j, other)| pat.can_also_match(other).then(|| i + 1 + j))
|
|
|
|
|
.unwrap_or(resolved_pats.len())
|
|
|
|
|
})
|
|
|
|
|
.collect();
|
|
|
|
|
|
|
|
|
|
// The furthast backwards a pattern can move without semantic changes
|
|
|
|
|
let backwards_blocking_idxs: Vec<_> = resolved_pats
|
|
|
|
|
.iter()
|
|
|
|
|
.enumerate()
|
|
|
|
|
.map(|(i, pat)| {
|
|
|
|
|
resolved_pats[..i]
|
|
|
|
|
.iter()
|
|
|
|
|
.enumerate()
|
|
|
|
|
.rev()
|
|
|
|
|
.zip(forwards_blocking_idxs[..i].iter().copied().rev())
|
|
|
|
|
.skip_while(|&(_, forward_block)| forward_block > i)
|
|
|
|
|
.find_map(|((j, other), forward_block)| (forward_block == i || pat.can_also_match(other)).then(|| j))
|
|
|
|
|
.unwrap_or(0)
|
|
|
|
|
})
|
|
|
|
|
.collect();
|
|
|
|
|
|
2022-02-17 15:48:24 +00:00
|
|
|
|
let eq = |&(lindex, lhs): &(usize, &Arm<'_>), &(rindex, rhs): &(usize, &Arm<'_>)| -> bool {
|
|
|
|
|
let min_index = usize::min(lindex, rindex);
|
|
|
|
|
let max_index = usize::max(lindex, rindex);
|
2022-02-06 18:53:51 +00:00
|
|
|
|
|
2022-02-17 15:48:24 +00:00
|
|
|
|
let mut local_map: HirIdMap<HirId> = HirIdMap::default();
|
|
|
|
|
let eq_fallback = |a: &Expr<'_>, b: &Expr<'_>| {
|
|
|
|
|
if_chain! {
|
|
|
|
|
if let Some(a_id) = path_to_local(a);
|
|
|
|
|
if let Some(b_id) = path_to_local(b);
|
|
|
|
|
let entry = match local_map.entry(a_id) {
|
|
|
|
|
Entry::Vacant(entry) => entry,
|
|
|
|
|
// check if using the same bindings as before
|
|
|
|
|
Entry::Occupied(entry) => return *entry.get() == b_id,
|
|
|
|
|
};
|
|
|
|
|
// the names technically don't have to match; this makes the lint more conservative
|
|
|
|
|
if cx.tcx.hir().name(a_id) == cx.tcx.hir().name(b_id);
|
|
|
|
|
if cx.typeck_results().expr_ty(a) == cx.typeck_results().expr_ty(b);
|
|
|
|
|
if pat_contains_local(lhs.pat, a_id);
|
|
|
|
|
if pat_contains_local(rhs.pat, b_id);
|
|
|
|
|
then {
|
|
|
|
|
entry.insert(b_id);
|
|
|
|
|
true
|
|
|
|
|
} else {
|
|
|
|
|
false
|
2022-02-06 18:53:51 +00:00
|
|
|
|
}
|
2022-02-17 15:48:24 +00:00
|
|
|
|
}
|
2022-02-06 18:53:51 +00:00
|
|
|
|
};
|
2022-02-17 15:48:24 +00:00
|
|
|
|
// Arms with a guard are ignored, those can’t always be merged together
|
2022-01-06 07:54:35 +00:00
|
|
|
|
// If both arms overlap with an arm in between then these can't be merged either.
|
|
|
|
|
!(backwards_blocking_idxs[max_index] > min_index && forwards_blocking_idxs[min_index] < max_index)
|
|
|
|
|
&& lhs.guard.is_none()
|
|
|
|
|
&& rhs.guard.is_none()
|
|
|
|
|
&& SpanlessEq::new(cx)
|
|
|
|
|
.expr_fallback(eq_fallback)
|
|
|
|
|
.eq_expr(lhs.body, rhs.body)
|
|
|
|
|
// these checks could be removed to allow unused bindings
|
|
|
|
|
&& bindings_eq(lhs.pat, local_map.keys().copied().collect())
|
|
|
|
|
&& bindings_eq(rhs.pat, local_map.values().copied().collect())
|
2022-02-17 15:48:24 +00:00
|
|
|
|
};
|
2022-02-06 18:53:51 +00:00
|
|
|
|
|
2022-02-17 15:48:24 +00:00
|
|
|
|
let indexed_arms: Vec<(usize, &Arm<'_>)> = arms.iter().enumerate().collect();
|
|
|
|
|
for (&(_, i), &(_, j)) in search_same(&indexed_arms, hash, eq) {
|
|
|
|
|
span_lint_and_then(
|
|
|
|
|
cx,
|
|
|
|
|
MATCH_SAME_ARMS,
|
|
|
|
|
j.body.span,
|
|
|
|
|
"this `match` has identical arm bodies",
|
|
|
|
|
|diag| {
|
|
|
|
|
diag.span_note(i.body.span, "same as this");
|
2022-02-06 18:53:51 +00:00
|
|
|
|
|
2022-02-17 15:48:24 +00:00
|
|
|
|
// Note: this does not use `span_suggestion` on purpose:
|
|
|
|
|
// there is no clean way
|
|
|
|
|
// to remove the other arm. Building a span and suggest to replace it to ""
|
|
|
|
|
// makes an even more confusing error message. Also in order not to make up a
|
|
|
|
|
// span for the whole pattern, the suggestion is only shown when there is only
|
|
|
|
|
// one pattern. The user should know about `|` if they are already using it…
|
2022-02-06 18:53:51 +00:00
|
|
|
|
|
2022-02-17 15:48:24 +00:00
|
|
|
|
let lhs = snippet(cx, i.pat.span, "<pat1>");
|
|
|
|
|
let rhs = snippet(cx, j.pat.span, "<pat2>");
|
2022-02-06 18:53:51 +00:00
|
|
|
|
|
2022-02-17 15:48:24 +00:00
|
|
|
|
if let PatKind::Wild = j.pat.kind {
|
|
|
|
|
// if the last arm is _, then i could be integrated into _
|
|
|
|
|
// note that i.pat cannot be _, because that would mean that we're
|
|
|
|
|
// hiding all the subsequent arms, and rust won't compile
|
|
|
|
|
diag.span_note(
|
|
|
|
|
i.body.span,
|
|
|
|
|
&format!(
|
|
|
|
|
"`{}` has the same arm body as the `_` wildcard, consider removing it",
|
|
|
|
|
lhs
|
|
|
|
|
),
|
|
|
|
|
);
|
|
|
|
|
} else {
|
|
|
|
|
diag.span_help(i.pat.span, &format!("consider refactoring into `{} | {}`", lhs, rhs,))
|
|
|
|
|
.help("...or consider changing the match arm bodies");
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
);
|
2022-02-06 18:53:51 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2022-01-06 07:54:35 +00:00
|
|
|
|
#[derive(Debug)]
|
|
|
|
|
enum ResolvedPat<'hir> {
|
|
|
|
|
Wild,
|
|
|
|
|
Struct(Option<DefId>, Vec<(Symbol, ResolvedPat<'hir>)>),
|
|
|
|
|
Sequence(Option<DefId>, Vec<ResolvedPat<'hir>>, Option<usize>),
|
|
|
|
|
Or(Vec<ResolvedPat<'hir>>),
|
|
|
|
|
Path(Option<DefId>),
|
|
|
|
|
LitStr(Symbol),
|
|
|
|
|
LitBytes(&'hir [u8]),
|
|
|
|
|
LitInt(u128),
|
|
|
|
|
LitBool(bool),
|
|
|
|
|
Range(PatRange),
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[derive(Debug)]
|
|
|
|
|
struct PatRange {
|
|
|
|
|
start: u128,
|
|
|
|
|
end: u128,
|
|
|
|
|
bounds: RangeEnd,
|
|
|
|
|
}
|
|
|
|
|
impl PatRange {
|
|
|
|
|
fn contains(&self, x: u128) -> bool {
|
|
|
|
|
x >= self.start
|
|
|
|
|
&& match self.bounds {
|
|
|
|
|
RangeEnd::Included => x <= self.end,
|
|
|
|
|
RangeEnd::Excluded => x < self.end,
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
fn overlaps(&self, other: &Self) -> bool {
|
|
|
|
|
!(self.is_empty() || other.is_empty())
|
|
|
|
|
&& match self.bounds {
|
|
|
|
|
RangeEnd::Included => self.end >= other.start,
|
|
|
|
|
RangeEnd::Excluded => self.end > other.start,
|
|
|
|
|
}
|
|
|
|
|
&& match other.bounds {
|
|
|
|
|
RangeEnd::Included => self.start <= other.end,
|
|
|
|
|
RangeEnd::Excluded => self.start < other.end,
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
fn is_empty(&self) -> bool {
|
|
|
|
|
match self.bounds {
|
|
|
|
|
RangeEnd::Included => false,
|
|
|
|
|
RangeEnd::Excluded => self.start == self.end,
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
impl<'hir> ResolvedPat<'hir> {
|
|
|
|
|
fn from_pat(cx: &LateContext<'_>, pat: &'hir Pat<'_>) -> Self {
|
|
|
|
|
match pat.kind {
|
|
|
|
|
PatKind::Wild | PatKind::Binding(.., None) => Self::Wild,
|
|
|
|
|
PatKind::Binding(.., Some(pat)) | PatKind::Box(pat) | PatKind::Ref(pat, _) => Self::from_pat(cx, pat),
|
|
|
|
|
PatKind::Struct(ref path, fields, _) => {
|
|
|
|
|
let mut fields: Vec<_> = fields
|
|
|
|
|
.iter()
|
|
|
|
|
.map(|f| (f.ident.name, Self::from_pat(cx, f.pat)))
|
|
|
|
|
.collect();
|
|
|
|
|
fields.sort_by_key(|&(name, _)| name);
|
|
|
|
|
Self::Struct(cx.qpath_res(path, pat.hir_id).opt_def_id(), fields)
|
|
|
|
|
},
|
|
|
|
|
PatKind::TupleStruct(ref path, pats, wild_idx) => Self::Sequence(
|
|
|
|
|
cx.qpath_res(path, pat.hir_id).opt_def_id(),
|
|
|
|
|
pats.iter().map(|pat| Self::from_pat(cx, pat)).collect(),
|
|
|
|
|
wild_idx,
|
|
|
|
|
),
|
|
|
|
|
PatKind::Or(pats) => Self::Or(pats.iter().map(|pat| Self::from_pat(cx, pat)).collect()),
|
|
|
|
|
PatKind::Path(ref path) => Self::Path(cx.qpath_res(path, pat.hir_id).opt_def_id()),
|
|
|
|
|
PatKind::Tuple(pats, wild_idx) => {
|
|
|
|
|
Self::Sequence(None, pats.iter().map(|pat| Self::from_pat(cx, pat)).collect(), wild_idx)
|
|
|
|
|
},
|
|
|
|
|
PatKind::Lit(e) => match &e.kind {
|
|
|
|
|
ExprKind::Lit(lit) => match lit.node {
|
|
|
|
|
LitKind::Str(sym, _) => Self::LitStr(sym),
|
|
|
|
|
LitKind::ByteStr(ref bytes) => Self::LitBytes(&**bytes),
|
|
|
|
|
LitKind::Byte(val) => Self::LitInt(val.into()),
|
|
|
|
|
LitKind::Char(val) => Self::LitInt(val.into()),
|
|
|
|
|
LitKind::Int(val, _) => Self::LitInt(val),
|
|
|
|
|
LitKind::Bool(val) => Self::LitBool(val),
|
|
|
|
|
LitKind::Float(..) | LitKind::Err(_) => Self::Wild,
|
|
|
|
|
},
|
|
|
|
|
_ => Self::Wild,
|
|
|
|
|
},
|
|
|
|
|
PatKind::Range(start, end, bounds) => {
|
|
|
|
|
let start = match start {
|
|
|
|
|
None => 0,
|
|
|
|
|
Some(e) => match &e.kind {
|
|
|
|
|
ExprKind::Lit(lit) => match lit.node {
|
|
|
|
|
LitKind::Int(val, _) => val,
|
|
|
|
|
LitKind::Char(val) => val.into(),
|
|
|
|
|
LitKind::Byte(val) => val.into(),
|
|
|
|
|
_ => return Self::Wild,
|
|
|
|
|
},
|
|
|
|
|
_ => return Self::Wild,
|
|
|
|
|
},
|
|
|
|
|
};
|
|
|
|
|
let (end, bounds) = match end {
|
|
|
|
|
None => (u128::MAX, RangeEnd::Included),
|
|
|
|
|
Some(e) => match &e.kind {
|
|
|
|
|
ExprKind::Lit(lit) => match lit.node {
|
|
|
|
|
LitKind::Int(val, _) => (val, bounds),
|
|
|
|
|
LitKind::Char(val) => (val.into(), bounds),
|
|
|
|
|
LitKind::Byte(val) => (val.into(), bounds),
|
|
|
|
|
_ => return Self::Wild,
|
|
|
|
|
},
|
|
|
|
|
_ => return Self::Wild,
|
|
|
|
|
},
|
|
|
|
|
};
|
|
|
|
|
Self::Range(PatRange { start, end, bounds })
|
|
|
|
|
},
|
|
|
|
|
PatKind::Slice(pats, wild, pats2) => Self::Sequence(
|
|
|
|
|
None,
|
|
|
|
|
pats.iter()
|
|
|
|
|
.chain(pats2.iter())
|
|
|
|
|
.map(|pat| Self::from_pat(cx, pat))
|
|
|
|
|
.collect(),
|
|
|
|
|
wild.map(|_| pats.len()),
|
|
|
|
|
),
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Checks if two patterns overlap in the values they can match assuming they are for the same
|
|
|
|
|
/// type.
|
|
|
|
|
fn can_also_match(&self, other: &Self) -> bool {
|
|
|
|
|
match (self, other) {
|
|
|
|
|
(Self::Wild, _) | (_, Self::Wild) => true,
|
|
|
|
|
(Self::Or(pats), other) | (other, Self::Or(pats)) => pats.iter().any(|pat| pat.can_also_match(other)),
|
|
|
|
|
(Self::Struct(lpath, lfields), Self::Struct(rpath, rfields)) => {
|
|
|
|
|
if lpath != rpath {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
let mut rfields = rfields.iter();
|
|
|
|
|
let mut rfield = match rfields.next() {
|
|
|
|
|
Some(x) => x,
|
|
|
|
|
None => return true,
|
|
|
|
|
};
|
|
|
|
|
'outer: for lfield in lfields {
|
|
|
|
|
loop {
|
|
|
|
|
if lfield.0 < rfield.0 {
|
|
|
|
|
continue 'outer;
|
|
|
|
|
} else if lfield.0 > rfield.0 {
|
|
|
|
|
rfield = match rfields.next() {
|
|
|
|
|
Some(x) => x,
|
|
|
|
|
None => return true,
|
|
|
|
|
};
|
|
|
|
|
} else if !lfield.1.can_also_match(&rfield.1) {
|
|
|
|
|
return false;
|
|
|
|
|
} else {
|
|
|
|
|
rfield = match rfields.next() {
|
|
|
|
|
Some(x) => x,
|
|
|
|
|
None => return true,
|
|
|
|
|
};
|
|
|
|
|
continue 'outer;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
true
|
|
|
|
|
},
|
|
|
|
|
(Self::Sequence(lpath, lpats, lwild_idx), Self::Sequence(rpath, rpats, rwild_idx)) => {
|
|
|
|
|
if lpath != rpath {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
let (lpats_start, lpats_end) = lwild_idx
|
|
|
|
|
.or(*rwild_idx)
|
|
|
|
|
.map_or((&**lpats, [].as_slice()), |idx| lpats.split_at(idx));
|
|
|
|
|
let (rpats_start, rpats_end) = rwild_idx
|
|
|
|
|
.or(*lwild_idx)
|
|
|
|
|
.map_or((&**rpats, [].as_slice()), |idx| rpats.split_at(idx));
|
|
|
|
|
|
|
|
|
|
lpats_start
|
|
|
|
|
.iter()
|
|
|
|
|
.zip(rpats_start.iter())
|
|
|
|
|
.all(|(lpat, rpat)| lpat.can_also_match(rpat))
|
|
|
|
|
// `lpats_end` and `rpats_end` lengths may be disjointed, so start from the end and ignore any
|
|
|
|
|
// extras.
|
|
|
|
|
&& lpats_end
|
|
|
|
|
.iter()
|
|
|
|
|
.rev()
|
|
|
|
|
.zip(rpats_end.iter().rev())
|
|
|
|
|
.all(|(lpat, rpat)| lpat.can_also_match(rpat))
|
|
|
|
|
},
|
|
|
|
|
(Self::Path(x), Self::Path(y)) => x == y,
|
|
|
|
|
(Self::LitStr(x), Self::LitStr(y)) => x == y,
|
|
|
|
|
(Self::LitBytes(x), Self::LitBytes(y)) => x == y,
|
|
|
|
|
(Self::LitInt(x), Self::LitInt(y)) => x == y,
|
|
|
|
|
(Self::LitBool(x), Self::LitBool(y)) => x == y,
|
|
|
|
|
(Self::Range(x), Self::Range(y)) => x.overlaps(y),
|
|
|
|
|
(Self::Range(range), Self::LitInt(x)) | (Self::LitInt(x), Self::Range(range)) => range.contains(*x),
|
|
|
|
|
|
|
|
|
|
// Todo: Lit* with Path, Range with Path, LitBytes with Sequence
|
|
|
|
|
_ => true,
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2022-02-06 18:53:51 +00:00
|
|
|
|
fn pat_contains_local(pat: &Pat<'_>, id: HirId) -> bool {
|
|
|
|
|
let mut result = false;
|
|
|
|
|
pat.walk_short(|p| {
|
|
|
|
|
result |= matches!(p.kind, PatKind::Binding(_, binding_id, ..) if binding_id == id);
|
|
|
|
|
!result
|
|
|
|
|
});
|
|
|
|
|
result
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Returns true if all the bindings in the `Pat` are in `ids` and vice versa
|
|
|
|
|
fn bindings_eq(pat: &Pat<'_>, mut ids: HirIdSet) -> bool {
|
|
|
|
|
let mut result = true;
|
|
|
|
|
pat.each_binding_or_first(&mut |_, id, _, _| result &= ids.remove(&id));
|
|
|
|
|
result && ids.is_empty()
|
|
|
|
|
}
|