mirror of
https://github.com/RGBCube/uutils-coreutils
synced 2025-07-28 19:47:45 +00:00
uucore(lib): add u8/OsString conversion utils
This commit is contained in:
parent
5bc7d67274
commit
3031874d22
1 changed files with 71 additions and 1 deletions
|
@ -100,10 +100,14 @@ pub use crate::features::fsxattr;
|
|||
|
||||
//## core functions
|
||||
|
||||
use std::borrow::Cow;
|
||||
use std::ffi::OsStr;
|
||||
use std::ffi::OsString;
|
||||
use std::io::{BufRead, BufReader};
|
||||
use std::iter;
|
||||
#[cfg(unix)]
|
||||
use std::os::unix::ffi::OsStrExt;
|
||||
use std::os::unix::ffi::{OsStrExt, OsStringExt};
|
||||
use std::str;
|
||||
use std::sync::atomic::Ordering;
|
||||
|
||||
use once_cell::sync::Lazy;
|
||||
|
@ -240,6 +244,72 @@ pub fn os_str_as_bytes(os_string: &OsStr) -> mods::error::UResult<&[u8]> {
|
|||
Ok(bytes)
|
||||
}
|
||||
|
||||
/// Helper function for converting a slice of bytes into an &OsStr
|
||||
/// or OsString in non-unix targets.
|
||||
///
|
||||
/// It converts `&[u8]` to `Cow<OsStr>` for unix targets only.
|
||||
/// On non-unix (i.e. Windows), the conversion goes through the String type
|
||||
/// and thus undergo UTF-8 validation, making it fail if the stream contains
|
||||
/// non-UTF-8 characters.
|
||||
pub fn os_str_from_bytes(bytes: &[u8]) -> mods::error::UResult<Cow<'_, OsStr>> {
|
||||
#[cfg(unix)]
|
||||
let os_str = Cow::Borrowed(OsStr::from_bytes(bytes));
|
||||
#[cfg(not(unix))]
|
||||
let os_str = Cow::Owned(OsString::from(str::from_utf8(bytes).map_err(|_| {
|
||||
mods::error::UUsageError::new(1, "Unable to transform bytes into OsStr")
|
||||
})?));
|
||||
|
||||
Ok(os_str)
|
||||
}
|
||||
|
||||
/// Helper function for making an `OsString` from a byte field
|
||||
/// It converts `Vec<u8>` to `OsString` for unix targets only.
|
||||
/// On non-unix (i.e. Windows) it may fail if the bytes are not valid UTF-8
|
||||
pub fn os_string_from_vec(vec: Vec<u8>) -> mods::error::UResult<OsString> {
|
||||
#[cfg(unix)]
|
||||
let s = OsString::from_vec(vec);
|
||||
#[cfg(not(unix))]
|
||||
let s = OsString::from(String::from_utf8(vec).map_err(|_| {
|
||||
mods::error::UUsageError::new(1, "invalid UTF-8 was detected in one or more arguments")
|
||||
})?);
|
||||
|
||||
Ok(s)
|
||||
}
|
||||
|
||||
/// Equivalent to `std::BufRead::lines` which outputs each line as a `Vec<u8>`,
|
||||
/// which avoids panicking on non UTF-8 input.
|
||||
pub fn read_byte_lines<R: std::io::Read>(
|
||||
mut buf_reader: BufReader<R>,
|
||||
) -> impl Iterator<Item = Vec<u8>> {
|
||||
iter::from_fn(move || {
|
||||
let mut buf = Vec::with_capacity(256);
|
||||
let size = buf_reader.read_until(b'\n', &mut buf).ok()?;
|
||||
|
||||
if size == 0 {
|
||||
return None;
|
||||
}
|
||||
|
||||
// Trim (\r)\n
|
||||
if buf.ends_with(b"\n") {
|
||||
buf.pop();
|
||||
if buf.ends_with(b"\r") {
|
||||
buf.pop();
|
||||
}
|
||||
}
|
||||
|
||||
Some(buf)
|
||||
})
|
||||
}
|
||||
|
||||
/// Equivalent to `std::BufRead::lines` which outputs each line as an `OsString`
|
||||
/// This won't panic on non UTF-8 characters on Unix,
|
||||
/// but it still will on Windows.
|
||||
pub fn read_os_string_lines<R: std::io::Read>(
|
||||
buf_reader: BufReader<R>,
|
||||
) -> impl Iterator<Item = OsString> {
|
||||
read_byte_lines(buf_reader).map(|byte_line| os_string_from_vec(byte_line).expect("UTF-8 error"))
|
||||
}
|
||||
|
||||
/// Prompt the user with a formatted string and returns `true` if they reply `'y'` or `'Y'`
|
||||
///
|
||||
/// This macro functions accepts the same syntax as `format!`. The prompt is written to
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue