1
Fork 0
mirror of https://github.com/RGBCube/uutils-coreutils synced 2025-07-28 11:37:44 +00:00

tail: simplify obsolete parsing

This commit is contained in:
Benjamin Bara 2023-02-19 15:16:58 +01:00
parent 9b49f368c7
commit 26a945f3b5
3 changed files with 140 additions and 102 deletions

View file

@ -348,39 +348,33 @@ impl Settings {
VerificationResult::Ok VerificationResult::Ok
} }
pub fn is_default(&self) -> bool {
let default = Self::default();
self.max_unchanged_stats == default.max_unchanged_stats
&& self.sleep_sec == default.sleep_sec
&& self.follow == default.follow
&& self.mode == default.mode
&& self.pid == default.pid
&& self.retry == default.retry
&& self.use_polling == default.use_polling
&& (self.verbose == default.verbose || self.inputs.len() > 1)
&& self.presume_input_pipe == default.presume_input_pipe
}
} }
pub fn parse_obsolete(args: &str) -> UResult<Option<parse::ObsoleteArgs>> { pub fn parse_obsolete(arg: &OsString, input: Option<&OsString>) -> UResult<Option<Settings>> {
match parse::parse_obsolete(args) { match parse::parse_obsolete(arg) {
Some(Ok(args)) => Ok(Some(args)), Some(Ok(args)) => Ok(Some(Settings::from_obsolete_args(&args, input))),
None => Ok(None), None => Ok(None),
Some(Err(e)) => Err(USimpleError::new( Some(Err(e)) => {
1, let arg_str = arg.to_string_lossy();
match e { Err(USimpleError::new(
parse::ParseError::OutOfRange => format!( 1,
"invalid number: {}: Numerical result out of range", match e {
args.quote() parse::ParseError::OutOfRange => format!(
), "invalid number: {}: Numerical result out of range",
parse::ParseError::Overflow => format!("invalid number: {}", args.quote()), arg_str.quote()
parse::ParseError::Context => format!( ),
"option used in invalid context -- {}", parse::ParseError::Overflow => format!("invalid number: {}", arg_str.quote()),
args.chars().nth(1).unwrap_or_default() // this ensures compatibility to GNU's error message (as tested in misc/tail)
), parse::ParseError::Context => format!(
}, "option used in invalid context -- {}",
)), arg_str.chars().nth(1).unwrap_or_default()
),
parse::ParseError::InvalidEncoding => {
format!("bad argument encoding: '{arg_str}'")
}
},
))
}
} }
} }
@ -410,39 +404,41 @@ fn parse_num(src: &str) -> Result<Signum, ParseSizeError> {
pub fn parse_args(args: impl uucore::Args) -> UResult<Settings> { pub fn parse_args(args: impl uucore::Args) -> UResult<Settings> {
let args_vec: Vec<OsString> = args.collect(); let args_vec: Vec<OsString> = args.collect();
let clap_result = match uu_app().try_get_matches_from(args_vec.clone()) { let clap_args = uu_app().try_get_matches_from(args_vec.clone());
Ok(matches) => { let clap_result = match clap_args {
let settings = Settings::from(&matches)?; Ok(matches) => Ok(Settings::from(&matches)?),
if !settings.is_default() {
// non-default settings can't have obsolete arguments
return Ok(settings);
}
Ok(settings)
}
Err(err) => Err(err.into()), Err(err) => Err(err.into()),
}; };
// clap parsing failed or resulted to default -> check for obsolete/deprecated args // clap isn't able to handle obsolete syntax.
// argv[0] is always present // therefore, we want to check further for obsolete arguments.
let second = match args_vec.get(1) { // argv[0] is always present, argv[1] might be obsolete arguments
Some(second) => second, // argv[2] might contain an input file, argv[3] isn't allowed in obsolete mode
None => return clap_result, if args_vec.len() != 2 && args_vec.len() != 3 {
}; return clap_result;
let second_str = match second.to_str() { }
Some(second_str) => second_str,
None => { // At this point, there are a few possible cases:
let invalid_string = second.to_string_lossy(); //
return Err(USimpleError::new( // 1. clap has succeeded and the arguments would be invalid for the obsolete syntax.
1, // 2. The case of `tail -c 5` is ambiguous. clap parses this as `tail -c5`,
format!("bad argument encoding: '{invalid_string}'"), // but it could also be interpreted as valid obsolete syntax (tail -c on file '5').
)); // GNU chooses to interpret this as `tail -c5`, like clap.
} // 3. `tail -f foo` is also ambiguous, but has the same effect in both cases. We can safely
}; // use the clap result here.
match parse_obsolete(second_str)? { // 4. clap succeeded for obsolete arguments starting with '+', but misinterprets them as
Some(obsolete_args) => Ok(Settings::from_obsolete_args( // input files (e.g. 'tail +f').
&obsolete_args, // 5. clap failed because of unknown flags, but possibly valid obsolete arguments
args_vec.get(2), // (e.g. tail -l; tail -10c).
)), //
// In cases 4 & 5, we want to try parsing the obsolete arguments, which corresponds to
// checking whether clap succeeded or the first argument starts with '+'.
let possible_obsolete_args = &args_vec[1];
if clap_result.is_ok() && !possible_obsolete_args.to_string_lossy().starts_with('+') {
return clap_result;
}
match parse_obsolete(possible_obsolete_args, args_vec.get(2))? {
Some(settings) => Ok(settings),
None => clap_result, None => clap_result,
} }
} }
@ -477,6 +473,7 @@ pub fn uu_app() -> Command {
.num_args(0..=1) .num_args(0..=1)
.require_equals(true) .require_equals(true)
.value_parser(["descriptor", "name"]) .value_parser(["descriptor", "name"])
.overrides_with(options::FOLLOW)
.help("Print the file as it grows"), .help("Print the file as it grows"),
) )
.arg( .arg(

View file

@ -3,6 +3,8 @@
// * For the full copyright and license information, please view the LICENSE // * For the full copyright and license information, please view the LICENSE
// * file that was distributed with this source code. // * file that was distributed with this source code.
use std::ffi::OsString;
#[derive(PartialEq, Eq, Debug, Copy, Clone)] #[derive(PartialEq, Eq, Debug, Copy, Clone)]
pub struct ObsoleteArgs { pub struct ObsoleteArgs {
pub num: u64, pub num: u64,
@ -27,20 +29,31 @@ pub enum ParseError {
OutOfRange, OutOfRange,
Overflow, Overflow,
Context, Context,
InvalidEncoding,
} }
/// Parses obsolete syntax /// Parses obsolete syntax
/// tail -\[NUM\]\[bl\]\[f\] and tail +\[NUM\]\[bcl\]\[f\] // spell-checker:disable-line /// tail -\[NUM\]\[bcl\]\[f\] and tail +\[NUM\]\[bcl\]\[f\] // spell-checker:disable-line
pub fn parse_obsolete(src: &str) -> Option<Result<ObsoleteArgs, ParseError>> { pub fn parse_obsolete(src: &OsString) -> Option<Result<ObsoleteArgs, ParseError>> {
let mut chars = src.chars(); let mut rest = match src.to_str() {
let sign = chars.next()?; Some(src) => src,
if sign != '+' && sign != '-' { None => return Some(Err(ParseError::InvalidEncoding)),
};
let sign = if let Some(r) = rest.strip_prefix('-') {
rest = r;
'-'
} else if let Some(r) = rest.strip_prefix('+') {
rest = r;
'+'
} else {
return None; return None;
} };
let numbers: String = chars.clone().take_while(|&c| c.is_ascii_digit()).collect(); let end_num = rest
let has_num = !numbers.is_empty(); .find(|c: char| !c.is_ascii_digit())
.unwrap_or(rest.len());
let has_num = !rest[..end_num].is_empty();
let num: u64 = if has_num { let num: u64 = if has_num {
if let Ok(num) = numbers.parse() { if let Ok(num) = rest[..end_num].parse() {
num num
} else { } else {
return Some(Err(ParseError::OutOfRange)); return Some(Err(ParseError::OutOfRange));
@ -48,25 +61,30 @@ pub fn parse_obsolete(src: &str) -> Option<Result<ObsoleteArgs, ParseError>> {
} else { } else {
10 10
}; };
rest = &rest[end_num..];
let mut follow = false; let mode = if let Some(r) = rest.strip_prefix('l') {
let mut mode = 'l'; rest = r;
let mut first_char = true; 'l'
for char in chars.skip_while(|&c| c.is_ascii_digit()) { } else if let Some(r) = rest.strip_prefix('c') {
if !has_num && first_char && sign == '-' && (char == 'c' || char == 'f') { rest = r;
// special cases: -c, -f should be handled by clap (are ambiguous) 'c'
return None; } else if let Some(r) = rest.strip_prefix('b') {
} else if char == 'f' { rest = r;
follow = true; 'b'
} else if first_char && (char == 'b' || char == 'c' || char == 'l') { } else {
mode = char; 'l'
} else if has_num && sign == '-' { };
let follow = rest.contains('f');
if !rest.chars().all(|f| f == 'f') {
// GNU allows an arbitrary amount of following fs, but nothing else
if sign == '-' && has_num {
return Some(Err(ParseError::Context)); return Some(Err(ParseError::Context));
} else {
return None;
} }
first_char = false; return None;
} }
let multiplier = if mode == 'b' { 512 } else { 1 }; let multiplier = if mode == 'b' { 512 } else { 1 };
let num = match num.checked_mul(multiplier) { let num = match num.checked_mul(multiplier) {
Some(n) => n, Some(n) => n,
@ -87,7 +105,7 @@ mod tests {
#[test] #[test]
fn test_parse_numbers_obsolete() { fn test_parse_numbers_obsolete() {
assert_eq!( assert_eq!(
parse_obsolete("+2c"), parse_obsolete(&OsString::from("+2c")),
Some(Ok(ObsoleteArgs { Some(Ok(ObsoleteArgs {
num: 2, num: 2,
plus: true, plus: true,
@ -96,7 +114,7 @@ mod tests {
})) }))
); );
assert_eq!( assert_eq!(
parse_obsolete("-5"), parse_obsolete(&OsString::from("-5")),
Some(Ok(ObsoleteArgs { Some(Ok(ObsoleteArgs {
num: 5, num: 5,
plus: false, plus: false,
@ -105,7 +123,7 @@ mod tests {
})) }))
); );
assert_eq!( assert_eq!(
parse_obsolete("+100f"), parse_obsolete(&OsString::from("+100f")),
Some(Ok(ObsoleteArgs { Some(Ok(ObsoleteArgs {
num: 100, num: 100,
plus: true, plus: true,
@ -114,7 +132,7 @@ mod tests {
})) }))
); );
assert_eq!( assert_eq!(
parse_obsolete("-2b"), parse_obsolete(&OsString::from("-2b")),
Some(Ok(ObsoleteArgs { Some(Ok(ObsoleteArgs {
num: 1024, num: 1024,
plus: false, plus: false,
@ -125,23 +143,47 @@ mod tests {
} }
#[test] #[test]
fn test_parse_errors_obsolete() { fn test_parse_errors_obsolete() {
assert_eq!(parse_obsolete("-5n"), Some(Err(ParseError::Context)));
assert_eq!(parse_obsolete("-5c5"), Some(Err(ParseError::Context)));
assert_eq!(parse_obsolete("-1vzc"), Some(Err(ParseError::Context)));
assert_eq!(parse_obsolete("-5m"), Some(Err(ParseError::Context)));
assert_eq!(parse_obsolete("-1k"), Some(Err(ParseError::Context)));
assert_eq!(parse_obsolete("-1mmk"), Some(Err(ParseError::Context)));
assert_eq!(parse_obsolete("-105kzm"), Some(Err(ParseError::Context)));
assert_eq!(parse_obsolete("-1vz"), Some(Err(ParseError::Context)));
assert_eq!( assert_eq!(
parse_obsolete("-1vzqvq"), // spell-checker:disable-line parse_obsolete(&OsString::from("-5n")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-5c5")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-1vzc")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-5m")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-1k")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-1mmk")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-105kzm")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-1vz")),
Some(Err(ParseError::Context))
);
assert_eq!(
parse_obsolete(&OsString::from("-1vzqvq")), // spell-checker:disable-line
Some(Err(ParseError::Context)) Some(Err(ParseError::Context))
); );
} }
#[test] #[test]
fn test_parse_obsolete_no_match() { fn test_parse_obsolete_no_match() {
assert_eq!(parse_obsolete("-k"), None); assert_eq!(parse_obsolete(&OsString::from("-k")), None);
assert_eq!(parse_obsolete("asd"), None); assert_eq!(parse_obsolete(&OsString::from("asd")), None);
assert_eq!(parse_obsolete("-cc"), None); assert_eq!(parse_obsolete(&OsString::from("-cc")), None);
} }
} }

View file

@ -28,8 +28,7 @@ pub struct Input {
impl Input { impl Input {
pub fn from<T: AsRef<OsStr>>(string: &T) -> Self { pub fn from<T: AsRef<OsStr>>(string: &T) -> Self {
let valid_string = string.as_ref().to_str(); let kind = if string.as_ref() == Path::new(text::DASH) {
let kind = if valid_string.is_some() && valid_string.unwrap() == text::DASH {
InputKind::Stdin InputKind::Stdin
} else { } else {
InputKind::File(PathBuf::from(string.as_ref())) InputKind::File(PathBuf::from(string.as_ref()))