rust/clippy_lints/src/literal_representation.rs

614 lines
20 KiB
Rust
Raw Normal View History

2017-07-19 18:56:32 -05:00
//! Lints concerned with the grouping of digits with underscores in integral or
//! floating-point literal expressions.
use crate::utils::{in_macro, snippet_opt, span_lint_and_sugg};
use if_chain::if_chain;
use rustc::lint::{in_external_macro, EarlyContext, EarlyLintPass, LintArray, LintContext, LintPass};
2019-04-08 15:43:55 -05:00
use rustc::{declare_lint_pass, declare_tool_lint, impl_lint_pass};
use rustc_errors::Applicability;
use syntax::ast::*;
use syntax_pos;
2017-07-19 18:56:32 -05:00
2018-03-28 08:24:26 -05:00
declare_clippy_lint! {
/// **What it does:** Warns if a long integral or floating-point constant does
/// not contain underscores.
///
/// **Why is this bad?** Reading long numbers is difficult without separators.
///
/// **Known problems:** None.
///
/// **Example:**
///
/// ```rust
2019-03-05 16:23:50 -06:00
/// let x: u64 = 61864918973511;
/// ```
2017-07-19 18:56:32 -05:00
pub UNREADABLE_LITERAL,
2018-03-28 08:24:26 -05:00
style,
2017-07-19 18:56:32 -05:00
"long integer literal without underscores"
}
2018-09-02 16:07:55 -05:00
declare_clippy_lint! {
/// **What it does:** Warns for mistyped suffix in literals
///
/// **Why is this bad?** This is most probably a typo
///
/// **Known problems:**
/// - Recommends a signed suffix, even though the number might be too big and an unsigned
/// suffix is required
/// - Does not match on `_128` since that is a valid grouping for decimal and octal numbers
///
/// **Example:**
///
/// ```rust
2019-03-05 16:23:50 -06:00
/// 2_32;
/// ```
2018-09-02 16:07:55 -05:00
pub MISTYPED_LITERAL_SUFFIXES,
correctness,
"mistyped literal suffix"
}
2018-03-28 08:24:26 -05:00
declare_clippy_lint! {
/// **What it does:** Warns if an integral or floating-point constant is
/// grouped inconsistently with underscores.
///
/// **Why is this bad?** Readers may incorrectly interpret inconsistently
/// grouped digits.
///
/// **Known problems:** None.
///
/// **Example:**
///
/// ```rust
2019-03-05 16:23:50 -06:00
/// let x: u64 = 618_64_9189_73_511;
/// ```
2017-07-19 18:56:32 -05:00
pub INCONSISTENT_DIGIT_GROUPING,
2018-03-28 08:24:26 -05:00
style,
2017-07-19 18:56:32 -05:00
"integer literals with digits grouped inconsistently"
}
2018-03-28 08:24:26 -05:00
declare_clippy_lint! {
/// **What it does:** Warns if the digits of an integral or floating-point
/// constant are grouped into groups that
/// are too large.
///
/// **Why is this bad?** Negatively impacts readability.
///
/// **Known problems:** None.
///
/// **Example:**
///
/// ```rust
2019-03-05 16:23:50 -06:00
/// let x: u64 = 6186491_8973511;
/// ```
2017-07-19 18:56:32 -05:00
pub LARGE_DIGIT_GROUPS,
pedantic,
2017-07-19 18:56:32 -05:00
"grouping digits into groups that are too large"
}
2018-03-28 08:24:26 -05:00
declare_clippy_lint! {
/// **What it does:** Warns if there is a better representation for a numeric literal.
///
/// **Why is this bad?** Especially for big powers of 2 a hexadecimal representation is more
/// readable than a decimal representation.
///
/// **Known problems:** None.
///
/// **Example:**
///
/// `255` => `0xFF`
/// `65_535` => `0xFFFF`
/// `4_042_322_160` => `0xF0F0_F0F0`
2018-01-23 08:29:31 -06:00
pub DECIMAL_LITERAL_REPRESENTATION,
2018-03-28 08:24:26 -05:00
restriction,
"using decimal representation when hexadecimal would be better"
}
#[derive(Debug, PartialEq)]
pub(super) enum Radix {
Binary,
Octal,
Decimal,
Hexadecimal,
}
impl Radix {
2019-01-30 19:15:29 -06:00
/// Returns a reasonable digit group size for this radix.
#[must_use]
2018-06-25 13:50:20 -05:00
crate fn suggest_grouping(&self) -> usize {
match *self {
Self::Binary | Self::Hexadecimal => 4,
Self::Octal | Self::Decimal => 3,
}
}
}
#[derive(Debug)]
pub(super) struct DigitInfo<'a> {
/// Characters of a literal between the radix prefix and type suffix.
2018-06-25 13:50:20 -05:00
crate digits: &'a str,
/// Which radix the literal was represented in.
2018-06-25 13:50:20 -05:00
crate radix: Radix,
/// The radix prefix, if present.
2018-06-25 13:50:20 -05:00
crate prefix: Option<&'a str>,
/// The type suffix, including preceding underscore if present.
2018-06-25 13:50:20 -05:00
crate suffix: Option<&'a str>,
/// True for floating-point literals.
2018-06-25 13:50:20 -05:00
crate float: bool,
}
impl<'a> DigitInfo<'a> {
#[must_use]
2018-06-25 13:50:20 -05:00
crate fn new(lit: &'a str, float: bool) -> Self {
// Determine delimiter for radix prefix, if present, and radix.
let radix = if lit.starts_with("0x") {
Radix::Hexadecimal
} else if lit.starts_with("0b") {
Radix::Binary
} else if lit.starts_with("0o") {
Radix::Octal
} else {
Radix::Decimal
};
// Grab part of the literal after prefix, if present.
let (prefix, sans_prefix) = if let Radix::Decimal = radix {
(None, lit)
} else {
let (p, s) = lit.split_at(2);
(Some(p), s)
};
2018-09-06 09:26:17 -05:00
let len = sans_prefix.len();
let mut last_d = '\0';
for (d_idx, d) in sans_prefix.char_indices() {
let suffix_start = if last_d == '_' { d_idx - 1 } else { d_idx };
if float
&& (d == 'f'
|| is_possible_float_suffix_index(&sans_prefix, suffix_start, len)
|| ((d == 'E' || d == 'e') && !has_possible_float_suffix(&sans_prefix)))
|| !float && (d == 'i' || d == 'u' || is_possible_suffix_index(&sans_prefix, suffix_start, len))
{
let (digits, suffix) = sans_prefix.split_at(suffix_start);
return Self {
digits,
radix,
prefix,
suffix: Some(suffix),
float,
};
}
last_d = d
}
// No suffix found
2017-08-21 06:32:12 -05:00
Self {
digits: sans_prefix,
radix,
prefix,
suffix: None,
float,
}
}
fn split_digit_parts(&self) -> (&str, Option<&str>, Option<(char, &str)>) {
let digits = self.digits;
let mut integer = digits;
let mut fraction = None;
let mut exponent = None;
if self.float {
for (i, c) in digits.char_indices() {
match c {
'.' => {
integer = &digits[..i];
fraction = Some(&digits[i + 1..]);
},
'e' | 'E' => {
if integer.len() > i {
integer = &digits[..i];
} else {
fraction = Some(&digits[integer.len() + 1..i]);
};
exponent = Some((c, &digits[i + 1..]));
break;
},
_ => {},
}
}
}
(integer, fraction, exponent)
}
2018-09-02 16:07:55 -05:00
/// Returns literal formatted in a sensible way.
2018-06-25 13:50:20 -05:00
crate fn grouping_hint(&self) -> String {
let mut output = String::new();
if let Some(prefix) = self.prefix {
output.push_str(prefix);
}
let group_size = self.radix.suggest_grouping();
let (integer, fraction, exponent) = &self.split_digit_parts();
let int_digits: Vec<_> = integer.chars().rev().filter(|&c| c != '_').collect();
let int_part_hint = int_digits
.chunks(group_size)
.map(|chunk| chunk.iter().rev().collect())
.rev()
.collect::<Vec<String>>()
.join("_");
// Pad leading hexidecimal group with zeros
if self.radix == Radix::Hexadecimal {
debug_assert!(group_size > 0);
let first_group_size = (int_digits.len() + group_size - 1) % group_size + 1;
for _ in 0..group_size - first_group_size {
output.push('0');
}
}
output.push_str(&int_part_hint);
if let Some(fraction) = fraction {
let frac_part_hint = fraction
.chars()
.filter(|&c| c != '_')
.collect::<Vec<_>>()
.chunks(group_size)
.map(|chunk| chunk.iter().collect())
.collect::<Vec<String>>()
.join("_");
output.push('.');
output.push_str(&frac_part_hint);
}
if let Some((separator, exponent)) = exponent {
let after_e_hint = exponent
.chars()
.rev()
.filter(|&c| c != '_')
.collect::<Vec<_>>()
.chunks(group_size)
.map(|chunk| chunk.iter().rev().collect())
.rev()
.collect::<Vec<String>>()
.join("_");
output.push(*separator);
output.push_str(&after_e_hint);
}
if let Some(suffix) = self.suffix {
if self.float && is_mistyped_float_suffix(suffix) {
output.push_str("_f");
output.push_str(&suffix[1..]);
} else if is_mistyped_suffix(suffix) {
output.push_str("_i");
output.push_str(&suffix[1..]);
} else {
output.push_str(suffix);
}
}
output
}
}
enum WarningType {
UnreadableLiteral,
InconsistentDigitGrouping,
LargeDigitGroups,
2018-01-23 08:29:31 -06:00
DecimalRepresentation,
MistypedLiteralSuffix,
}
impl WarningType {
2018-07-23 06:01:12 -05:00
crate fn display(&self, grouping_hint: &str, cx: &EarlyContext<'_>, span: syntax_pos::Span) {
match self {
Self::MistypedLiteralSuffix => span_lint_and_sugg(
cx,
MISTYPED_LITERAL_SUFFIXES,
span,
"mistyped literal suffix",
"did you mean to write",
grouping_hint.to_string(),
Applicability::MaybeIncorrect,
),
Self::UnreadableLiteral => span_lint_and_sugg(
2017-09-05 04:33:04 -05:00
cx,
UNREADABLE_LITERAL,
span,
2017-09-05 04:33:04 -05:00
"long literal lacking separators",
"consider",
grouping_hint.to_owned(),
Applicability::MachineApplicable,
2017-09-05 04:33:04 -05:00
),
Self::LargeDigitGroups => span_lint_and_sugg(
2017-09-05 04:33:04 -05:00
cx,
LARGE_DIGIT_GROUPS,
span,
2017-09-05 04:33:04 -05:00
"digit groups should be smaller",
"consider",
grouping_hint.to_owned(),
Applicability::MachineApplicable,
2017-09-05 04:33:04 -05:00
),
Self::InconsistentDigitGrouping => span_lint_and_sugg(
2017-09-05 04:33:04 -05:00
cx,
INCONSISTENT_DIGIT_GROUPING,
span,
2017-09-05 04:33:04 -05:00
"digits grouped inconsistently by underscores",
"consider",
grouping_hint.to_owned(),
Applicability::MachineApplicable,
2017-09-05 04:33:04 -05:00
),
Self::DecimalRepresentation => span_lint_and_sugg(
cx,
2018-01-23 08:29:31 -06:00
DECIMAL_LITERAL_REPRESENTATION,
span,
2018-01-23 08:29:31 -06:00
"integer literal has a better hexadecimal representation",
"consider",
grouping_hint.to_owned(),
Applicability::MachineApplicable,
),
};
}
}
2019-04-08 15:43:55 -05:00
declare_lint_pass!(LiteralDigitGrouping => [
UNREADABLE_LITERAL,
INCONSISTENT_DIGIT_GROUPING,
LARGE_DIGIT_GROUPS,
MISTYPED_LITERAL_SUFFIXES,
]);
2017-07-19 18:56:32 -05:00
impl EarlyLintPass for LiteralDigitGrouping {
2018-07-23 06:01:12 -05:00
fn check_expr(&mut self, cx: &EarlyContext<'_>, expr: &Expr) {
2018-07-24 01:55:38 -05:00
if in_external_macro(cx.sess(), expr.span) {
2017-07-19 18:56:32 -05:00
return;
}
2019-09-27 10:16:06 -05:00
if let ExprKind::Lit(ref lit) = expr.kind {
2019-10-03 14:09:32 -05:00
Self::check_lit(cx, lit)
2017-07-19 18:56:32 -05:00
}
}
}
impl LiteralDigitGrouping {
2019-10-03 14:09:32 -05:00
fn check_lit(cx: &EarlyContext<'_>, lit: &Lit) {
let in_macro = in_macro(lit.span);
if_chain! {
if let Some(src) = snippet_opt(cx, lit.span);
if let Some(firstch) = src.chars().next();
if char::is_digit(firstch, 10);
then {
let digit_info = match lit.kind {
LitKind::Int(..) => DigitInfo::new(&src, false),
LitKind::Float(..) => DigitInfo::new(&src, true),
_ => return,
};
let result = (|| {
if let Some(suffix) = digit_info.suffix {
if is_mistyped_suffix(suffix) {
return Err(WarningType::MistypedLiteralSuffix);
}
}
match lit.kind {
LitKind::Int(..) => {
Self::do_lint(digit_info.digits, in_macro)?;
},
LitKind::Float(..) => {
// Separate digits into integral and fractional parts.
let parts: Vec<&str> = digit_info
.digits
.split_terminator('.')
.collect();
2017-07-19 18:56:32 -05:00
// Lint integral and fractional parts separately, and then check consistency of digit
// groups if both pass.
let integral_group_size = Self::do_lint(parts[0], in_macro)?;
if parts.len() > 1 {
// Lint the fractional part of literal just like integral part, but reversed.
let fractional_part = &parts[1].chars().rev().collect::<String>();
let fractional_group_size = Self::do_lint(fractional_part, in_macro)?;
let consistent = Self::parts_consistent(integral_group_size,
fractional_group_size,
parts[0].len(),
parts[1].len());
if !consistent {
return Err(WarningType::InconsistentDigitGrouping);
};
};
},
_ => (),
}
Ok(())
})();
if let Err(warning_type) = result {
warning_type.display(&digit_info.grouping_hint(), cx, lit.span)
}
}
}
2017-07-19 18:56:32 -05:00
}
/// Given the sizes of the digit groups of both integral and fractional
/// parts, and the length
/// of both parts, determine if the digits have been grouped consistently.
#[must_use]
fn parts_consistent(int_group_size: usize, frac_group_size: usize, int_size: usize, frac_size: usize) -> bool {
match (int_group_size, frac_group_size) {
// No groups on either side of decimal point - trivially consistent.
(0, 0) => true,
// Integral part has grouped digits, fractional part does not.
(_, 0) => frac_size <= int_group_size,
// Fractional part has grouped digits, integral part does not.
(0, _) => int_size <= frac_group_size,
// Both parts have grouped digits. Groups should be the same size.
(_, _) => int_group_size == frac_group_size,
2017-07-19 18:56:32 -05:00
}
}
2017-07-30 17:46:41 -05:00
/// Performs lint on `digits` (no decimal point) and returns the group
/// size on success or `WarningType` when emitting a warning.
fn do_lint(digits: &str, in_macro: bool) -> Result<usize, WarningType> {
2017-07-19 18:56:32 -05:00
// Grab underscore indices with respect to the units digit.
2017-08-09 02:30:56 -05:00
let underscore_positions: Vec<usize> = digits
.chars()
2017-07-30 17:46:41 -05:00
.rev()
.enumerate()
.filter_map(|(idx, digit)| if digit == '_' { Some(idx) } else { None })
2017-07-19 18:56:32 -05:00
.collect();
if underscore_positions.is_empty() {
// Check if literal needs underscores.
if !in_macro && digits.len() > 5 {
2017-08-01 02:45:36 -05:00
Err(WarningType::UnreadableLiteral)
2017-07-19 18:56:32 -05:00
} else {
2017-08-01 02:45:36 -05:00
Ok(0)
2017-07-19 18:56:32 -05:00
}
} else {
// Check consistency and the sizes of the groups.
let group_size = underscore_positions[0];
let consistent = underscore_positions
.windows(2)
.all(|ps| ps[1] - ps[0] == group_size + 1)
// number of digits to the left of the last group cannot be bigger than group size.
&& (digits.len() - underscore_positions.last()
.expect("there's at least one element") <= group_size + 1);
2017-07-19 18:56:32 -05:00
if !consistent {
2017-07-30 17:46:41 -05:00
return Err(WarningType::InconsistentDigitGrouping);
2017-07-19 18:56:32 -05:00
} else if group_size > 4 {
2017-07-30 17:46:41 -05:00
return Err(WarningType::LargeDigitGroups);
2017-07-19 18:56:32 -05:00
}
2017-08-01 02:45:36 -05:00
Ok(group_size)
2017-07-19 18:56:32 -05:00
}
}
}
2019-04-08 15:43:55 -05:00
#[allow(clippy::module_name_repetitions)]
#[derive(Copy, Clone)]
2019-04-08 15:43:55 -05:00
pub struct DecimalLiteralRepresentation {
threshold: u64,
}
2019-04-08 15:43:55 -05:00
impl_lint_pass!(DecimalLiteralRepresentation => [DECIMAL_LITERAL_REPRESENTATION]);
2019-04-08 15:43:55 -05:00
impl EarlyLintPass for DecimalLiteralRepresentation {
2018-07-23 06:01:12 -05:00
fn check_expr(&mut self, cx: &EarlyContext<'_>, expr: &Expr) {
2018-07-24 01:55:38 -05:00
if in_external_macro(cx.sess(), expr.span) {
return;
}
2019-09-27 10:16:06 -05:00
if let ExprKind::Lit(ref lit) = expr.kind {
self.check_lit(cx, lit)
}
}
}
2019-04-08 15:43:55 -05:00
impl DecimalLiteralRepresentation {
#[must_use]
pub fn new(threshold: u64) -> Self {
Self { threshold }
}
2018-07-23 06:01:12 -05:00
fn check_lit(self, cx: &EarlyContext<'_>, lit: &Lit) {
// Lint integral literals.
if_chain! {
if let LitKind::Int(val, _) = lit.kind;
if let Some(src) = snippet_opt(cx, lit.span);
if let Some(firstch) = src.chars().next();
2019-11-10 07:14:26 -06:00
if char::is_digit(firstch, 10);
2019-04-10 14:05:56 -05:00
let digit_info = DigitInfo::new(&src, false);
if digit_info.radix == Radix::Decimal;
if val >= u128::from(self.threshold);
then {
2019-04-10 14:05:56 -05:00
let hex = format!("{:#X}", val);
let digit_info = DigitInfo::new(&hex, false);
let _ = Self::do_lint(digit_info.digits).map_err(|warning_type| {
warning_type.display(&digit_info.grouping_hint(), cx, lit.span)
});
}
}
}
fn do_lint(digits: &str) -> Result<(), WarningType> {
if digits.len() == 1 {
// Lint for 1 digit literals, if someone really sets the threshold that low
if digits == "1"
|| digits == "2"
|| digits == "4"
|| digits == "8"
|| digits == "3"
|| digits == "7"
|| digits == "F"
{
2018-01-23 08:29:31 -06:00
return Err(WarningType::DecimalRepresentation);
}
} else if digits.len() < 4 {
// Lint for Literals with a hex-representation of 2 or 3 digits
let f = &digits[0..1]; // first digit
let s = &digits[1..]; // suffix
2018-11-01 16:43:40 -05:00
// Powers of 2
if ((f.eq("1") || f.eq("2") || f.eq("4") || f.eq("8")) && s.chars().all(|c| c == '0'))
// Powers of 2 minus 1
|| ((f.eq("1") || f.eq("3") || f.eq("7") || f.eq("F")) && s.chars().all(|c| c == 'F'))
{
2018-01-23 08:29:31 -06:00
return Err(WarningType::DecimalRepresentation);
}
} else {
// Lint for Literals with a hex-representation of 4 digits or more
let f = &digits[0..1]; // first digit
let m = &digits[1..digits.len() - 1]; // middle digits, except last
let s = &digits[1..]; // suffix
2018-11-01 16:43:40 -05:00
// Powers of 2 with a margin of +15/-16
if ((f.eq("1") || f.eq("2") || f.eq("4") || f.eq("8")) && m.chars().all(|c| c == '0'))
|| ((f.eq("1") || f.eq("3") || f.eq("7") || f.eq("F")) && m.chars().all(|c| c == 'F'))
// Lint for representations with only 0s and Fs, while allowing 7 as the first
// digit
|| ((f.eq("7") || f.eq("F")) && s.chars().all(|c| c == '0' || c == 'F'))
{
2018-01-23 08:29:31 -06:00
return Err(WarningType::DecimalRepresentation);
}
}
Ok(())
}
}
2018-09-02 16:07:55 -05:00
#[must_use]
2018-09-02 16:07:55 -05:00
fn is_mistyped_suffix(suffix: &str) -> bool {
["_8", "_16", "_32", "_64"].contains(&suffix)
}
2018-09-06 09:26:17 -05:00
#[must_use]
2018-09-06 09:26:17 -05:00
fn is_possible_suffix_index(lit: &str, idx: usize, len: usize) -> bool {
((len > 3 && idx == len - 3) || (len > 2 && idx == len - 2)) && is_mistyped_suffix(lit.split_at(idx).1)
2018-09-06 09:26:17 -05:00
}
2018-10-11 23:15:01 -05:00
#[must_use]
2018-10-11 23:15:01 -05:00
fn is_mistyped_float_suffix(suffix: &str) -> bool {
["_32", "_64"].contains(&suffix)
}
#[must_use]
2018-10-11 23:15:01 -05:00
fn is_possible_float_suffix_index(lit: &str, idx: usize, len: usize) -> bool {
(len > 3 && idx == len - 3) && is_mistyped_float_suffix(lit.split_at(idx).1)
}
#[must_use]
fn has_possible_float_suffix(lit: &str) -> bool {
lit.ends_with("_32") || lit.ends_with("_64")
2018-09-06 09:26:17 -05:00
}