2016-02-04 17:36:06 -06:00
use regex_syntax ;
2016-04-07 10:46:48 -05:00
use rustc ::hir ::* ;
2016-02-24 10:38:57 -06:00
use rustc ::lint ::* ;
2016-03-31 10:05:43 -05:00
use rustc ::middle ::const_val ::ConstVal ;
use rustc_const_eval ::EvalHint ::ExprTypeChecked ;
use rustc_const_eval ::eval_const_expr_partial ;
2016-02-08 16:48:04 -06:00
use std ::collections ::HashSet ;
2016-02-24 10:38:57 -06:00
use std ::error ::Error ;
2016-02-14 09:55:02 -06:00
use syntax ::ast ::{ LitKind , NodeId } ;
2016-02-05 09:48:35 -06:00
use syntax ::codemap ::{ Span , BytePos } ;
use syntax ::parse ::token ::InternedString ;
2016-04-14 11:13:15 -05:00
use utils ::paths ;
use utils ::{ is_expn_of , match_path , match_type , span_lint , span_help_and_lint } ;
2016-02-04 17:36:06 -06:00
2016-02-05 17:41:54 -06:00
/// **What it does:** This lint checks `Regex::new(_)` invocations for correct regex syntax.
2016-02-04 17:36:06 -06:00
///
/// **Why is this bad?** This will lead to a runtime panic.
///
/// **Known problems:** None.
///
/// **Example:** `Regex::new("|")`
declare_lint! {
pub INVALID_REGEX ,
Deny ,
" finds invalid regular expressions in `Regex::new(_)` invocations "
}
2016-02-05 16:10:48 -06:00
/// **What it does:** This lint checks for `Regex::new(_)` invocations with trivial regex.
///
/// **Why is this bad?** This can likely be replaced by `==` or `str::starts_with`,
/// `str::ends_with` or `std::contains` or other `str` methods.
///
/// **Known problems:** None.
///
/// **Example:** `Regex::new("^foobar")`
declare_lint! {
pub TRIVIAL_REGEX ,
Warn ,
" finds trivial regular expressions in `Regex::new(_)` invocations "
}
2016-02-07 15:50:54 -06:00
/// **What it does:** This lint checks for usage of `regex!(_)` which as of now is usually slower than `Regex::new(_)` unless called in a loop (which is a bad idea anyway).
///
/// **Why is this bad?** Performance, at least for now. The macro version is likely to catch up long-term, but for now the dynamic version is faster.
///
/// **Known problems:** None
///
/// **Example:** `regex!("foo|bar")`
declare_lint! {
pub REGEX_MACRO ,
2016-02-08 16:48:04 -06:00
Warn ,
2016-02-07 15:50:54 -06:00
" finds use of `regex!(_)`, suggests `Regex::new(_)` instead "
}
2016-02-14 09:55:02 -06:00
#[ derive(Clone, Default) ]
pub struct RegexPass {
spans : HashSet < Span > ,
2016-02-24 10:38:57 -06:00
last : Option < NodeId > ,
2016-02-14 09:55:02 -06:00
}
2016-02-04 17:36:06 -06:00
impl LintPass for RegexPass {
fn get_lints ( & self ) -> LintArray {
2016-02-07 15:50:54 -06:00
lint_array! ( INVALID_REGEX , REGEX_MACRO , TRIVIAL_REGEX )
2016-02-04 17:36:06 -06:00
}
}
impl LateLintPass for RegexPass {
2016-02-14 09:55:02 -06:00
fn check_crate ( & mut self , _ : & LateContext , _ : & Crate ) {
self . spans . clear ( ) ;
2016-02-07 15:50:54 -06:00
}
2016-02-14 09:55:02 -06:00
fn check_block ( & mut self , cx : & LateContext , block : & Block ) {
if_let_chain! { [
self . last . is_none ( ) ,
let Some ( ref expr ) = block . expr ,
match_type ( cx , cx . tcx . expr_ty ( expr ) , & [ " regex " , " re " , " Regex " ] ) ,
let Some ( span ) = is_expn_of ( cx , expr . span , " regex " )
] , {
if ! self . spans . contains ( & span ) {
span_lint ( cx ,
REGEX_MACRO ,
span ,
" `regex!(_)` found. \
Please use ` Regex ::new ( _ ) ` , which is faster for now . " );
self . spans . insert ( span ) ;
}
self . last = Some ( block . id ) ;
} }
}
2016-02-24 10:38:57 -06:00
2016-02-14 09:55:02 -06:00
fn check_block_post ( & mut self , _ : & LateContext , block : & Block ) {
if self . last . map_or ( false , | id | block . id = = id ) {
2016-02-24 10:38:57 -06:00
self . last = None ;
2016-02-14 09:55:02 -06:00
}
}
2016-02-07 15:50:54 -06:00
2016-02-04 17:36:06 -06:00
fn check_expr ( & mut self , cx : & LateContext , expr : & Expr ) {
if_let_chain! { [
let ExprCall ( ref fun , ref args ) = expr . node ,
let ExprPath ( _ , ref path ) = fun . node ,
2016-04-14 11:13:15 -05:00
match_path ( path , & paths ::REGEX_NEW ) & & args . len ( ) = = 1
2016-02-04 17:36:06 -06:00
] , {
2016-02-05 09:48:35 -06:00
if let ExprLit ( ref lit ) = args [ 0 ] . node {
2016-02-12 11:35:44 -06:00
if let LitKind ::Str ( ref r , _ ) = lit . node {
2016-02-06 11:06:39 -06:00
match regex_syntax ::Expr ::parse ( r ) {
Ok ( r ) = > {
if let Some ( repl ) = is_trivial_regex ( & r ) {
span_help_and_lint ( cx , TRIVIAL_REGEX , args [ 0 ] . span ,
2016-02-20 14:20:56 -06:00
" trivial regex " ,
2016-02-06 11:06:39 -06:00
& format! ( " consider using {} " , repl ) ) ;
}
}
Err ( e ) = > {
span_lint ( cx ,
INVALID_REGEX ,
str_span ( args [ 0 ] . span , & r , e . position ( ) ) ,
& format! ( " regex syntax error: {} " ,
e . description ( ) ) ) ;
}
}
}
} else if let Some ( r ) = const_str ( cx , & * args [ 0 ] ) {
match regex_syntax ::Expr ::parse ( & r ) {
Ok ( r ) = > {
if let Some ( repl ) = is_trivial_regex ( & r ) {
span_help_and_lint ( cx , TRIVIAL_REGEX , args [ 0 ] . span ,
2016-02-20 14:20:56 -06:00
" trivial regex " ,
2016-02-06 11:06:39 -06:00
& format! ( " consider using {} " , repl ) ) ;
}
}
Err ( e ) = > {
2016-02-05 09:48:35 -06:00
span_lint ( cx ,
INVALID_REGEX ,
2016-02-06 11:06:39 -06:00
args [ 0 ] . span ,
& format! ( " regex syntax error on position {} : {} " ,
e . position ( ) ,
2016-02-05 09:48:35 -06:00
e . description ( ) ) ) ;
}
2016-02-05 16:10:48 -06:00
}
2016-02-05 09:48:35 -06:00
}
2016-02-04 17:36:06 -06:00
} }
}
}
2016-02-05 09:48:35 -06:00
#[ allow(cast_possible_truncation) ]
fn str_span ( base : Span , s : & str , c : usize ) -> Span {
let lo = match s . char_indices ( ) . nth ( c ) {
Some ( ( b , _ ) ) = > base . lo + BytePos ( b as u32 ) ,
2016-02-24 10:38:57 -06:00
_ = > base . hi ,
2016-02-05 09:48:35 -06:00
} ;
2016-02-29 05:19:32 -06:00
Span {
lo : lo ,
hi : lo ,
.. base
}
2016-02-05 09:48:35 -06:00
}
fn const_str ( cx : & LateContext , e : & Expr ) -> Option < InternedString > {
match eval_const_expr_partial ( cx . tcx , e , ExprTypeChecked , None ) {
Ok ( ConstVal ::Str ( r ) ) = > Some ( r ) ,
2016-02-24 10:38:57 -06:00
_ = > None ,
2016-02-05 09:48:35 -06:00
}
}
2016-02-05 16:10:48 -06:00
2016-02-06 11:06:39 -06:00
fn is_trivial_regex ( s : & regex_syntax ::Expr ) -> Option < & 'static str > {
use regex_syntax ::Expr ;
2016-02-05 16:10:48 -06:00
2016-02-06 11:06:39 -06:00
match * s {
Expr ::Empty | Expr ::StartText | Expr ::EndText = > Some ( " the regex is unlikely to be useful as it is " ) ,
Expr ::Literal { .. } = > Some ( " consider using `str::contains` " ) ,
Expr ::Concat ( ref exprs ) = > {
match exprs . len ( ) {
2016-02-24 10:38:57 -06:00
2 = > {
match ( & exprs [ 0 ] , & exprs [ 1 ] ) {
( & Expr ::StartText , & Expr ::EndText ) = > Some ( " consider using `str::is_empty` " ) ,
( & Expr ::StartText , & Expr ::Literal { .. } ) = > Some ( " consider using `str::starts_with` " ) ,
( & Expr ::Literal { .. } , & Expr ::EndText ) = > Some ( " consider using `str::ends_with` " ) ,
_ = > None ,
}
}
2016-02-06 11:06:39 -06:00
3 = > {
if let ( & Expr ::StartText , & Expr ::Literal { .. } , & Expr ::EndText ) = ( & exprs [ 0 ] , & exprs [ 1 ] , & exprs [ 2 ] ) {
Some ( " consider using `==` on `str`s " )
2016-02-24 10:38:57 -06:00
} else {
2016-02-06 11:06:39 -06:00
None
}
2016-02-24 10:38:57 -06:00
}
2016-02-06 11:06:39 -06:00
_ = > None ,
}
}
_ = > None ,
2016-02-05 16:10:48 -06:00
}
}