From 66efbad871620fe2dbe675438fdc8d9922e72826 Mon Sep 17 00:00:00 2001 From: Marc Tiehuis Date: Sun, 2 Apr 2017 09:55:58 +1200 Subject: Add dfa-size-limit and regex-size-limit arguments Fixes #362. --- src/args.rs | 96 +++++++++++++++++++++++++++++++++++++++++++++++++------------ 1 file changed, 78 insertions(+), 18 deletions(-) (limited to 'src/args.rs') diff --git a/src/args.rs b/src/args.rs index 34f38792..48c4ad56 100644 --- a/src/args.rs +++ b/src/args.rs @@ -771,12 +771,18 @@ impl<'a> ArgMatches<'a> { let casei = self.is_present("ignore-case") && !self.is_present("case-sensitive"); - GrepBuilder::new(&try!(self.pattern())) + let mut gb = GrepBuilder::new(&try!(self.pattern())) .case_smart(smart) .case_insensitive(casei) - .line_terminator(b'\n') - .build() - .map_err(From::from) + .line_terminator(b'\n'); + + if let Some(limit) = try!(self.dfa_size_limit()) { + gb = gb.dfa_size_limit(limit); + } + if let Some(limit) = try!(self.regex_size_limit()) { + gb = gb.size_limit(limit); + } + gb.build().map_err(From::from) } /// Builds the set of glob overrides from the command line flags. @@ -807,31 +813,64 @@ impl<'a> ArgMatches<'a> { btypes.build().map_err(From::from) } - /// Parses the max-filesize argument option into a byte count. - fn max_filesize(&self) -> Result> { - use regex::Regex; - - let max_filesize = match self.value_of_lossy("max-filesize") { + /// Parses an argument of the form `[0-9]+(KMG)?`. + /// + /// This always returns the result as a type `u64`. This must be converted + /// to the appropriate type by the caller. + fn parse_human_readable_size_arg( + &self, + arg_name: &str, + ) -> Result> { + let arg_value = match self.value_of_lossy(arg_name) { Some(x) => x, None => return Ok(None) }; + let re = regex::Regex::new("^([0-9]+)([KMG])?$").unwrap(); + let caps = try!( + re.captures(&arg_value).ok_or_else(|| { + format!("invalid format for {}", arg_name) + })); - let re = Regex::new("^([0-9]+)([KMG])?$").unwrap(); - let caps = try!(re.captures(&max_filesize) - .ok_or("invalid format for max-filesize argument")); - - let value = try!(caps[1].parse::().map_err(|err|err.to_string())); + let value = try!(caps[1].parse::()); let suffix = caps.get(2).map(|x| x.as_str()); + let v_10 = value.checked_mul(1024); + let v_20 = v_10.and_then(|x| x.checked_mul(1024)); + let v_30 = v_20.and_then(|x| x.checked_mul(1024)); + + let try_suffix = |x: Option| { + if x.is_some() { + Ok(x) + } else { + Err(From::from(format!("number too large for {}", arg_name))) + } + }; match suffix { None => Ok(Some(value)), - Some("K") => Ok(Some(value * 1024)), - Some("M") => Ok(Some(value * 1024 * 1024)), - Some("G") => Ok(Some(value * 1024 * 1024 * 1024)), - _ => Err(From::from("invalid suffix for max-filesize argument")) + Some("K") => try_suffix(v_10), + Some("M") => try_suffix(v_20), + Some("G") => try_suffix(v_30), + _ => Err(From::from(format!("invalid suffix for {}", arg_name))) } } + /// Parse the dfa-size-limit argument option into a byte count. + fn dfa_size_limit(&self) -> Result> { + let r = try!(self.parse_human_readable_size_arg("dfa-size-limit")); + human_readable_to_usize("dfa-size-limit", r) + } + + /// Parse the regex-size-limit argument option into a byte count. + fn regex_size_limit(&self) -> Result> { + let r = try!(self.parse_human_readable_size_arg("regex-size-limit")); + human_readable_to_usize("regex-size-limit", r) + } + + /// Parses the max-filesize argument option into a byte count. + fn max_filesize(&self) -> Result> { + self.parse_human_readable_size_arg("max-filesize") + } + /// Returns true if ignore files should be ignored. fn no_ignore(&self) -> bool { self.is_present("no-ignore") @@ -926,6 +965,27 @@ impl QuietMatched { } } +/// Convert the result of a `parse_human_readable_size_arg` call into +/// a `usize`, failing if the type does not fit. +fn human_readable_to_usize( + arg_name: &str, + value: Option, +) -> Result> { + use std::usize; + + match value { + None => Ok(None), + Some(v) => { + if v <= usize::MAX as u64 { + Ok(Some(v as usize)) + } else { + let msg = format!("number too large for {}", arg_name); + Err(From::from(msg)) + } + } + } +} + /// Returns true if and only if stdin is deemed searchable. #[cfg(unix)] fn stdin_is_readable() -> bool { -- cgit v1.2.3