2016-02-05 00:36:06 +01:00
|
|
|
use regex_syntax;
|
|
|
|
|
use std::error::Error;
|
2016-02-05 16:48:35 +01:00
|
|
|
use syntax::ast::Lit_::LitStr;
|
|
|
|
|
use syntax::codemap::{Span, BytePos};
|
|
|
|
|
use syntax::parse::token::InternedString;
|
2016-02-05 00:36:06 +01:00
|
|
|
use rustc_front::hir::*;
|
|
|
|
|
use rustc::middle::const_eval::{eval_const_expr_partial, ConstVal};
|
|
|
|
|
use rustc::middle::const_eval::EvalHint::ExprTypeChecked;
|
|
|
|
|
use rustc::lint::*;
|
|
|
|
|
|
2016-02-05 23:10:48 +01:00
|
|
|
use utils::{match_path, REGEX_NEW_PATH, span_lint, span_help_and_lint};
|
2016-02-05 00:36:06 +01:00
|
|
|
|
2016-02-06 00:41:54 +01:00
|
|
|
/// **What it does:** This lint checks `Regex::new(_)` invocations for correct regex syntax.
|
2016-02-05 00:36:06 +01:00
|
|
|
///
|
|
|
|
|
/// **Why is this bad?** This will lead to a runtime panic.
|
|
|
|
|
///
|
|
|
|
|
/// **Known problems:** None.
|
|
|
|
|
///
|
|
|
|
|
/// **Example:** `Regex::new("|")`
|
|
|
|
|
declare_lint! {
|
|
|
|
|
pub INVALID_REGEX,
|
|
|
|
|
Deny,
|
|
|
|
|
"finds invalid regular expressions in `Regex::new(_)` invocations"
|
|
|
|
|
}
|
|
|
|
|
|
2016-02-05 23:10:48 +01:00
|
|
|
/// **What it does:** This lint checks for `Regex::new(_)` invocations with trivial regex.
|
|
|
|
|
///
|
|
|
|
|
/// **Why is this bad?** This can likely be replaced by `==` or `str::starts_with`,
|
|
|
|
|
/// `str::ends_with` or `std::contains` or other `str` methods.
|
|
|
|
|
///
|
|
|
|
|
/// **Known problems:** None.
|
|
|
|
|
///
|
|
|
|
|
/// **Example:** `Regex::new("^foobar")`
|
|
|
|
|
declare_lint! {
|
|
|
|
|
pub TRIVIAL_REGEX,
|
|
|
|
|
Warn,
|
|
|
|
|
"finds trivial regular expressions in `Regex::new(_)` invocations"
|
|
|
|
|
}
|
|
|
|
|
|
2016-02-05 00:36:06 +01:00
|
|
|
#[derive(Copy,Clone)]
|
|
|
|
|
pub struct RegexPass;
|
|
|
|
|
|
|
|
|
|
impl LintPass for RegexPass {
|
|
|
|
|
fn get_lints(&self) -> LintArray {
|
2016-02-05 23:10:48 +01:00
|
|
|
lint_array!(INVALID_REGEX, TRIVIAL_REGEX)
|
2016-02-05 00:36:06 +01:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
impl LateLintPass for RegexPass {
|
|
|
|
|
fn check_expr(&mut self, cx: &LateContext, expr: &Expr) {
|
|
|
|
|
if_let_chain!{[
|
|
|
|
|
let ExprCall(ref fun, ref args) = expr.node,
|
|
|
|
|
let ExprPath(_, ref path) = fun.node,
|
2016-02-05 16:48:35 +01:00
|
|
|
match_path(path, ®EX_NEW_PATH) && args.len() == 1
|
2016-02-05 00:36:06 +01:00
|
|
|
], {
|
2016-02-05 16:48:35 +01:00
|
|
|
if let ExprLit(ref lit) = args[0].node {
|
|
|
|
|
if let LitStr(ref r, _) = lit.node {
|
|
|
|
|
if let Err(e) = regex_syntax::Expr::parse(r) {
|
|
|
|
|
span_lint(cx,
|
|
|
|
|
INVALID_REGEX,
|
|
|
|
|
str_span(args[0].span, &r, e.position()),
|
2016-02-05 21:54:29 +01:00
|
|
|
&format!("regex syntax error: {}",
|
2016-02-05 16:48:35 +01:00
|
|
|
e.description()));
|
|
|
|
|
}
|
2016-02-05 23:10:48 +01:00
|
|
|
else if let Some(repl) = is_trivial_regex(r) {
|
|
|
|
|
span_help_and_lint(cx, TRIVIAL_REGEX, args[0].span,
|
|
|
|
|
&"trivial regex",
|
|
|
|
|
&format!("consider using {}", repl));
|
|
|
|
|
}
|
2016-02-05 16:48:35 +01:00
|
|
|
}
|
2016-02-05 23:10:48 +01:00
|
|
|
} else if let Some(r) = const_str(cx, &*args[0]) {
|
|
|
|
|
if let Err(e) = regex_syntax::Expr::parse(&r) {
|
2016-02-05 16:48:35 +01:00
|
|
|
span_lint(cx,
|
|
|
|
|
INVALID_REGEX,
|
|
|
|
|
args[0].span,
|
2016-02-05 21:54:29 +01:00
|
|
|
&format!("regex syntax error on position {}: {}",
|
2016-02-05 16:48:35 +01:00
|
|
|
e.position(),
|
|
|
|
|
e.description()));
|
2016-02-05 23:10:48 +01:00
|
|
|
}
|
|
|
|
|
else if let Some(repl) = is_trivial_regex(&r) {
|
|
|
|
|
span_help_and_lint(cx, TRIVIAL_REGEX, args[0].span,
|
|
|
|
|
&"trivial regex",
|
|
|
|
|
&format!("{}", repl));
|
|
|
|
|
}
|
2016-02-05 16:48:35 +01:00
|
|
|
}
|
2016-02-05 00:36:06 +01:00
|
|
|
}}
|
|
|
|
|
}
|
|
|
|
|
}
|
2016-02-05 16:48:35 +01:00
|
|
|
|
|
|
|
|
#[allow(cast_possible_truncation)]
|
|
|
|
|
fn str_span(base: Span, s: &str, c: usize) -> Span {
|
|
|
|
|
let lo = match s.char_indices().nth(c) {
|
|
|
|
|
Some((b, _)) => base.lo + BytePos(b as u32),
|
|
|
|
|
_ => base.hi
|
|
|
|
|
};
|
|
|
|
|
Span{ lo: lo, hi: lo, ..base }
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
fn const_str(cx: &LateContext, e: &Expr) -> Option<InternedString> {
|
|
|
|
|
match eval_const_expr_partial(cx.tcx, e, ExprTypeChecked, None) {
|
|
|
|
|
Ok(ConstVal::Str(r)) => Some(r),
|
|
|
|
|
_ => None
|
|
|
|
|
}
|
|
|
|
|
}
|
2016-02-05 23:10:48 +01:00
|
|
|
|
|
|
|
|
fn is_trivial_regex(s: &str) -> Option<&'static str> {
|
|
|
|
|
// some unlikely but valid corner cases
|
|
|
|
|
match s {
|
|
|
|
|
"" | "^" | "$" => return Some("the regex is unlikely to be useful as it is"),
|
|
|
|
|
"^$" => return Some("consider using `str::is_empty`"),
|
|
|
|
|
_ => (),
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
let (start, end, repl) = match (s.starts_with('^'), s.ends_with('$')) {
|
|
|
|
|
(true, true) => (1, s.len()-1, "consider using `==` on `str`s"),
|
|
|
|
|
(false, true) => (0, s.len()-1, "consider using `str::ends_with`"),
|
|
|
|
|
(true, false) => (1, s.len(), "consider using `str::starts_with`"),
|
|
|
|
|
(false, false) => (0, s.len(), "consider using `str::contains`"),
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
if !s.chars().take(end).skip(start).any(regex_syntax::is_punct) {
|
|
|
|
|
Some(repl)
|
|
|
|
|
}
|
|
|
|
|
else {
|
|
|
|
|
None
|
|
|
|
|
}
|
|
|
|
|
}
|