Handle repeated str::replace calls with single char kind to str

This commit is contained in:
Nahua Kang 2022-08-07 14:08:09 +02:00
parent 6e86687529
commit a9bd0bd321
3 changed files with 264 additions and 97 deletions

View File

@ -1,17 +1,16 @@
use clippy_utils::diagnostics::span_lint_and_sugg;
// use clippy_utils::source::snippet_with_context;
use clippy_utils::get_parent_expr;
use clippy_utils::visitors::for_each_expr;
use core::ops::ControlFlow;
use if_chain::if_chain;
use rustc_ast::ast::LitKind;
use rustc_data_structures::fx::FxHashSet;
use rustc_errors::Applicability;
use rustc_hir as hir;
use rustc_hir::*;
use rustc_lint::LateContext;
use rustc_middle::ty;
use rustc_span::source_map::Spanned;
use std::unreachable;
// use rustc_span::Span;
use super::method_call;
use super::COLLAPSIBLE_STR_REPLACE;
@ -25,28 +24,46 @@ pub(super) fn check<'tcx>(
) {
match (name, args) {
("replace", [from, to]) => {
// Check for `str::replace` calls with char slice for linting
// The receiver of the method call must be `str` type to lint `collapsible_str_replace`
let original_recv = find_original_recv(recv);
let original_recv_ty = cx.typeck_results().expr_ty(original_recv).peel_refs();
let original_recv_ty_kind = cx.typeck_results().expr_ty(original_recv).peel_refs().kind();
let original_recv_is_str_kind = matches!(original_recv_ty_kind, ty::Str);
if_chain! {
// Check the receiver of the method call is `str` type
if matches!(original_recv_ty.kind(), ty::Str);
let from_ty = cx.typeck_results().expr_ty(from).peel_refs();
if let ty::Array(array_ty, _) = from_ty.kind();
// Check for `str::replace` calls with char slice for linting
if original_recv_is_str_kind;
let from_ty_kind = cx.typeck_results().expr_ty(from).peel_refs().kind();
if let ty::Array(array_ty, _) = from_ty_kind;
if matches!(array_ty.kind(), ty::Char);
then {
check_replace_call_with_char_slice(cx, from, to);
return;
}
}
if_chain! {
if original_recv_is_str_kind;
if let Some(parent) = get_parent_expr(cx, expr);
if let Some((name, [..], _)) = method_call(parent);
then {
match name {
"replace" => return,
_ => {
check_consecutive_replace_calls(cx, expr);
return;
},
}
}
}
match method_call(recv) {
// Check if there's an earlier `str::replace` call
Some(("replace", [prev_recv, prev_from, prev_to], prev_span)) => {
println!("Consecutive replace calls");
// Check that the original receiver is of `ty::Str` type
// Check that all the `from` args are char literals
// Check that all the `to` args are the same variable or has the same &str value
// If so, then lint
Some(("replace", [_, _, _], _)) => {
if original_recv_is_str_kind {
check_consecutive_replace_calls(cx, expr);
return;
}
},
_ => {},
}
@ -55,6 +72,230 @@ pub(super) fn check<'tcx>(
}
}
/// Check a `str::replace` call that contains a char slice as `from` argument for
/// `collapsible_str_replace` lint.
fn check_replace_call_with_char_slice<'tcx>(
cx: &LateContext<'tcx>,
from_arg: &'tcx hir::Expr<'tcx>,
to_arg: &'tcx hir::Expr<'tcx>,
) {
let mut char_slice_has_no_variables = true;
let mut chars: Vec<String> = Vec::new();
// Go through the `from_arg` to collect all char literals
let _: Option<()> = for_each_expr(from_arg, |e| {
if let ExprKind::Lit(Spanned {
node: LitKind::Char(_), ..
}) = e.kind
{
chars.push(get_replace_call_char_arg_repr(e).unwrap());
ControlFlow::Continue(())
} else if let ExprKind::Path(..) = e.kind {
// If a variable is found in the char slice, no lint for first version of this lint
char_slice_has_no_variables = false;
ControlFlow::BREAK
} else {
ControlFlow::Continue(())
}
});
if char_slice_has_no_variables {
if let Some(to_arg_repr) = get_replace_call_char_arg_repr(to_arg) {
let app = Applicability::MachineApplicable;
span_lint_and_sugg(
cx,
COLLAPSIBLE_STR_REPLACE,
from_arg.span,
"used slice of chars in `str::replace` call",
"replace with",
format!("replace(|c| matches!(c, {}), {})", chars.join(" | "), to_arg_repr,),
app,
);
}
}
}
/// Check a chain of `str::replace` calls for `collapsible_str_replace` lint.
fn check_consecutive_replace_calls<'tcx>(cx: &LateContext<'tcx>, expr: &'tcx hir::Expr<'tcx>) {
if_chain! {
if let Some(from_args) = get_replace_call_from_args_if_all_char_ty(cx, expr);
if let Some(to_arg) = get_replace_call_unique_to_arg_repr(expr);
then {
if replace_call_from_args_are_only_lit_chars(&from_args) {
let from_arg_reprs: Vec<String> = from_args.iter().map(|from_arg| {
get_replace_call_char_arg_repr(from_arg).unwrap()
}).collect();
let app = Applicability::MachineApplicable;
span_lint_and_sugg(
cx,
COLLAPSIBLE_STR_REPLACE,
expr.span,
"used consecutive `str::replace` call",
"replace with",
format!(
"replace(|c| matches!(c, {}), {})",
from_arg_reprs.join(" | "),
to_arg,
),
app,
);
} else {
// Use fallback lint
let from_arg_reprs: Vec<String> = from_args.iter().map(|from_arg| {
get_replace_call_char_arg_repr(from_arg).unwrap()
}).collect();
let app = Applicability::MachineApplicable;
span_lint_and_sugg(
cx,
COLLAPSIBLE_STR_REPLACE,
expr.span,
"used consecutive `str::replace` call",
"replace with",
format!(
"replace(&[{}], {})",
from_arg_reprs.join(" , "),
to_arg,
),
app,
);
}
}
}
}
/// Check if all the `from` arguments of a chain of consecutive calls to `str::replace`
/// are all of `ExprKind::Lit` types. If any is not, return false.
fn replace_call_from_args_are_only_lit_chars<'tcx>(from_args: &Vec<&'tcx hir::Expr<'tcx>>) -> bool {
let mut only_lit_chars = true;
for from_arg in from_args.iter() {
match from_arg.kind {
ExprKind::Lit(..) => {},
_ => only_lit_chars = false,
}
}
only_lit_chars
}
/// Collect and return all of the `from` arguments of a chain of consecutive `str::replace` calls
/// if these `from` arguments's expressions are of the `ty::Char` kind. Otherwise return `None`.
fn get_replace_call_from_args_if_all_char_ty<'tcx>(
cx: &LateContext<'tcx>,
expr: &'tcx hir::Expr<'tcx>,
) -> Option<Vec<&'tcx hir::Expr<'tcx>>> {
let mut all_from_args_are_chars = true;
let mut from_args = Vec::new();
let _: Option<()> = for_each_expr(expr, |e| {
if let Some((name, [_, args @ ..], _)) = method_call(e) {
match (name, args) {
("replace", [from, _]) => {
let from_ty_kind = cx.typeck_results().expr_ty(from).peel_refs().kind();
if matches!(from_ty_kind, ty::Char) {
from_args.push(from);
} else {
all_from_args_are_chars = false;
}
ControlFlow::Continue(())
},
_ => ControlFlow::BREAK,
}
} else {
ControlFlow::Continue(())
}
});
if all_from_args_are_chars {
return Some(from_args);
} else {
return None;
}
}
/// Return a unique String representation of the `to` argument used in a chain of `str::replace`
/// calls if each `str::replace` call's `to` argument is identical to the other `to` arguments in
/// the chain. Otherwise, return `None`.
fn get_replace_call_unique_to_arg_repr<'tcx>(expr: &'tcx hir::Expr<'tcx>) -> Option<String> {
let mut to_args = Vec::new();
let _: Option<()> = for_each_expr(expr, |e| {
if let Some((name, [_, args @ ..], _)) = method_call(e) {
match (name, args) {
("replace", [_, to]) => {
to_args.push(to);
ControlFlow::Continue(())
},
_ => ControlFlow::BREAK,
}
} else {
ControlFlow::Continue(())
}
});
// let mut to_arg_repr_set = FxHashSet::default();
let mut to_arg_reprs = Vec::new();
for &to_arg in to_args.iter() {
if let Some(to_arg_repr) = get_replace_call_char_arg_repr(to_arg) {
to_arg_reprs.push(to_arg_repr);
}
}
let to_arg_repr_set = FxHashSet::from_iter(to_arg_reprs.iter().cloned());
// Check if the set of `to` argument representations has more than one unique value
if to_arg_repr_set.len() != 1 {
return None;
}
// Return the single representation value
to_arg_reprs.pop()
}
/// Get the representation of an argument of a `str::replace` call either of the literal char value
/// or variable name, i.e. the resolved path segments `ident`.
/// Return:
/// - the str literal with double quotes, e.g. "\"l\""
/// - the char literal with single quotes, e.g. "'l'"
/// - the variable as a String, e.g. "l"
fn get_replace_call_char_arg_repr<'tcx>(arg: &'tcx hir::Expr<'tcx>) -> Option<String> {
match arg.kind {
ExprKind::Lit(Spanned {
node: LitKind::Str(to_arg_val, _),
..
}) => {
let repr = to_arg_val.as_str();
let double_quote = "\"";
Some(double_quote.to_owned() + repr + double_quote)
},
ExprKind::Lit(Spanned {
node: LitKind::Char(to_arg_val),
..
}) => {
let repr = to_arg_val.to_string();
let double_quote = "\'";
Some(double_quote.to_owned() + &repr + double_quote)
},
ExprKind::Path(QPath::Resolved(
_,
Path {
segments: path_segments,
..
},
)) => {
// join the path_segments values by "::"
let path_segment_ident_names: Vec<&str> = path_segments
.iter()
.map(|path_seg| path_seg.ident.name.as_str())
.collect();
Some(path_segment_ident_names.join("::"))
},
_ => None,
}
}
/// Find the original receiver of a chain of `str::replace` method calls.
fn find_original_recv<'tcx>(recv: &'tcx hir::Expr<'tcx>) -> &'tcx hir::Expr<'tcx> {
let mut original_recv = recv;
@ -74,81 +315,3 @@ fn find_original_recv<'tcx>(recv: &'tcx hir::Expr<'tcx>) -> &'tcx hir::Expr<'tcx
original_recv
}
fn check_replace_call_with_char_slice<'tcx>(
cx: &LateContext<'tcx>,
from_arg: &'tcx hir::Expr<'tcx>,
to_arg: &'tcx hir::Expr<'tcx>,
) {
let mut has_no_var = true;
let mut char_list: Vec<char> = Vec::new();
// Go through the `from_arg` to collect all char literals
let _: Option<()> = for_each_expr(from_arg, |e| {
if let ExprKind::Lit(Spanned {
node: LitKind::Char(val),
..
}) = e.kind
{
char_list.push(val);
ControlFlow::Continue(())
} else if let ExprKind::Path(..) = e.kind {
// If a variable is found in the char slice, no lint for first version of this lint
has_no_var = false;
ControlFlow::BREAK
} else {
ControlFlow::Continue(())
}
});
if has_no_var {
let to_arg_repr = match to_arg.kind {
ExprKind::Lit(Spanned {
node: LitKind::Str(to_arg_val, _),
..
}) => {
let repr = to_arg_val.as_str();
let double_quote = "\"";
double_quote.to_owned() + repr + double_quote
},
ExprKind::Path(QPath::Resolved(
_,
Path {
segments: path_segments,
..
},
)) => {
// join the path_segments values by "::"
let path_segment_ident_names: Vec<&str> = path_segments
.iter()
.map(|path_seg| path_seg.ident.name.as_str())
.collect();
path_segment_ident_names.join("::")
},
_ => unreachable!(),
};
let app = Applicability::MachineApplicable;
span_lint_and_sugg(
cx,
COLLAPSIBLE_STR_REPLACE,
from_arg.span,
"used slice of chars in `str::replace` call",
"replace with",
format!(
"replace(|c| matches!(c, {}), {})",
format_slice_of_chars_for_sugg(&char_list),
to_arg_repr,
),
app,
);
}
}
fn format_slice_of_chars_for_sugg(chars: &Vec<char>) -> String {
let single_quoted_chars: Vec<String> = chars
.iter()
.map(|c| "'".to_owned() + &c.to_string() + &"'".to_owned())
.collect();
single_quoted_chars.join(" | ")
}

View File

@ -3519,7 +3519,10 @@ impl Methods {
("sort_unstable_by", [arg]) => {
unnecessary_sort_by::check(cx, expr, recv, arg, true);
},
("replace", [_, _]) => collapsible_str_replace::check(cx, expr, name, recv, args),
("replace" | "replacen", [arg1, arg2] | [arg1, arg2, _]) => {
no_effect_replace::check(cx, expr, arg1, arg2);
collapsible_str_replace::check(cx, expr, name, recv, args);
},
("splitn" | "rsplitn", [count_arg, pat_arg]) => {
if let Some((Constant::Int(count), _)) = constant(cx, cx.typeck_results(), count_arg) {
suspicious_splitn::check(cx, name, expr, recv, count);
@ -3585,9 +3588,6 @@ impl Methods {
unnecessary_lazy_eval::check(cx, expr, recv, u_arg, "unwrap_or");
},
},
("replace" | "replacen", [arg1, arg2] | [arg1, arg2, _]) => {
no_effect_replace::check(cx, expr, arg1, arg2);
},
("zip", [arg]) => {
if let ExprKind::MethodCall(name, [iter_recv], _) = recv.kind
&& name.ident.name == sym::iter

View File

@ -49,6 +49,10 @@ fn main() {
let replacement = misspelled.replace(s, "l");
println!("{replacement}");
// If the consecutive `str::replace` calls have different `to` arguments, do not lint
let replacement = misspelled.replace('s', "l").replace('u', "p");
println!("{replacement}");
// If the `from` argument is of kind other than a slice or a char, do not lint
let replacement = misspelled.replace(&get_filter(), "l");