mirror of
https://github.com/fish-shell/fish-shell
synced 2025-01-28 12:45:13 +00:00
Port the rest of wutil
This commit is contained in:
parent
d3a7e3ffd9
commit
f53aa6f2e3
2 changed files with 680 additions and 41 deletions
|
@ -58,6 +58,14 @@ fn wcs2string_bad_char(c: char) {
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Split a string by a separator character.
|
||||||
|
pub fn split_string(val: &wstr, sep: char) -> Vec<WString> {
|
||||||
|
val.as_char_slice()
|
||||||
|
.split(|c| *c == sep)
|
||||||
|
.map(WString::from_chars)
|
||||||
|
.collect()
|
||||||
|
}
|
||||||
|
|
||||||
/// Joins strings with a separator.
|
/// Joins strings with a separator.
|
||||||
pub fn join_strings<S: AsRef<wstr>>(strs: &[S], sep: char) -> WString {
|
pub fn join_strings<S: AsRef<wstr>>(strs: &[S], sep: char) -> WString {
|
||||||
if strs.is_empty() {
|
if strs.is_empty() {
|
||||||
|
|
|
@ -5,19 +5,68 @@ pub mod printf;
|
||||||
pub mod wcstod;
|
pub mod wcstod;
|
||||||
pub mod wcstoi;
|
pub mod wcstoi;
|
||||||
|
|
||||||
use crate::common::fish_reserved_codepoint;
|
use crate::common::{
|
||||||
use crate::common::{str2wcstring, wcs2zstring};
|
cstr2wcstring, fish_reserved_codepoint, str2wcstring, wcs2osstring, wcs2string, wcs2zstring,
|
||||||
|
};
|
||||||
|
use crate::fallback;
|
||||||
|
use crate::fds::AutoCloseFd;
|
||||||
|
use crate::flog::FLOGF;
|
||||||
use crate::wchar::{wstr, WString, L};
|
use crate::wchar::{wstr, WString, L};
|
||||||
use crate::wcstringutil::join_strings;
|
use crate::wcstringutil::{join_strings, split_string, wcs2string_callback};
|
||||||
pub(crate) use gettext::{wgettext, wgettext_fmt};
|
pub(crate) use gettext::{wgettext, wgettext_fmt};
|
||||||
|
use libc::{
|
||||||
|
DT_BLK, DT_CHR, DT_DIR, DT_FIFO, DT_LNK, DT_REG, DT_SOCK, EACCES, EIO, ELOOP, ENAMETOOLONG,
|
||||||
|
ENODEV, ENOENT, ENOTDIR, S_IFBLK, S_IFCHR, S_IFDIR, S_IFIFO, S_IFLNK, S_IFMT, S_IFREG,
|
||||||
|
S_IFSOCK,
|
||||||
|
};
|
||||||
pub(crate) use printf::sprintf;
|
pub(crate) use printf::sprintf;
|
||||||
use std::ffi::OsStr;
|
use std::ffi::OsStr;
|
||||||
|
use std::fs;
|
||||||
use std::fs::canonicalize;
|
use std::fs::canonicalize;
|
||||||
|
use std::io::Write;
|
||||||
|
use std::os::fd::RawFd;
|
||||||
|
use std::os::fd::{FromRawFd, IntoRawFd};
|
||||||
use std::os::unix::prelude::{OsStrExt, OsStringExt};
|
use std::os::unix::prelude::{OsStrExt, OsStringExt};
|
||||||
pub use wcstoi::*;
|
pub use wcstoi::*;
|
||||||
|
use widestring_suffix::widestrs;
|
||||||
|
|
||||||
|
/// Wide character version of opendir(). Note that opendir() is guaranteed to set close-on-exec by
|
||||||
|
/// POSIX (hooray).
|
||||||
|
pub fn wopendir(name: &wstr) -> *mut libc::DIR {
|
||||||
|
let tmp = wcs2zstring(name);
|
||||||
|
unsafe { libc::opendir(tmp.as_ptr()) }
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of stat().
|
||||||
|
pub fn wstat(file_name: &wstr) -> Option<fs::Metadata> {
|
||||||
|
let tmp = wcs2osstring(file_name);
|
||||||
|
fs::metadata(tmp).ok()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of lstat().
|
||||||
|
pub fn lwstat(file_name: &wstr) -> Option<fs::Metadata> {
|
||||||
|
let tmp = wcs2osstring(file_name);
|
||||||
|
fs::symlink_metadata(tmp).ok()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of access().
|
||||||
|
pub fn waccess(file_name: &wstr, mode: libc::c_int) -> libc::c_int {
|
||||||
|
let tmp = wcs2zstring(file_name);
|
||||||
|
unsafe { libc::access(tmp.as_ptr(), mode) }
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of unlink().
|
||||||
|
pub fn wunlink(file_name: &wstr) -> libc::c_int {
|
||||||
|
let tmp = wcs2zstring(file_name);
|
||||||
|
unsafe { libc::unlink(tmp.as_ptr()) }
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn wperror(s: &wstr) {
|
||||||
|
// TODO This should not crash on invalid UTF-8
|
||||||
|
perror(std::str::from_utf8(&wcs2string(s)).unwrap())
|
||||||
|
}
|
||||||
|
|
||||||
/// Port of the wide-string wperror from `src/wutil.cpp` but for rust `&str`.
|
/// Port of the wide-string wperror from `src/wutil.cpp` but for rust `&str`.
|
||||||
use std::io::Write;
|
|
||||||
pub fn perror(s: &str) {
|
pub fn perror(s: &str) {
|
||||||
let e = errno::errno().0;
|
let e = errno::errno().0;
|
||||||
let mut stderr = std::io::stderr().lock();
|
let mut stderr = std::io::stderr().lock();
|
||||||
|
@ -33,6 +82,55 @@ pub fn perror(s: &str) {
|
||||||
let _ = stderr.write_all(b"\n");
|
let _ = stderr.write_all(b"\n");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Wide character version of getcwd().
|
||||||
|
pub fn wgetcwd() -> WString {
|
||||||
|
let mut cwd = [b'\0'; libc::PATH_MAX as usize];
|
||||||
|
let res = unsafe {
|
||||||
|
libc::getcwd(
|
||||||
|
std::ptr::addr_of_mut!(cwd).cast(),
|
||||||
|
std::mem::size_of_val(&cwd),
|
||||||
|
)
|
||||||
|
};
|
||||||
|
if !res.is_null() {
|
||||||
|
return cstr2wcstring(&cwd);
|
||||||
|
}
|
||||||
|
|
||||||
|
FLOGF!(
|
||||||
|
error,
|
||||||
|
"getcwd() failed with errno %d/%s",
|
||||||
|
errno::errno().0,
|
||||||
|
"errno::errno"
|
||||||
|
);
|
||||||
|
WString::new()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of readlink().
|
||||||
|
pub fn wreadlink(file_name: &wstr) -> Option<WString> {
|
||||||
|
let md = lwstat(file_name)?;
|
||||||
|
let bufsize = usize::try_from(md.len()).unwrap() + 1;
|
||||||
|
let mut target_buf = vec![b'\0'; bufsize];
|
||||||
|
let tmp = wcs2zstring(file_name);
|
||||||
|
let nbytes = unsafe {
|
||||||
|
libc::readlink(
|
||||||
|
tmp.as_ptr(),
|
||||||
|
std::ptr::addr_of_mut!(target_buf[0]).cast(),
|
||||||
|
bufsize,
|
||||||
|
)
|
||||||
|
};
|
||||||
|
if nbytes == -1 {
|
||||||
|
perror("readlink");
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
// The link might have been modified after our call to lstat. If the link now points to a path
|
||||||
|
// that's longer than the original one, we can't read everything in our buffer. Simply give
|
||||||
|
// up. We don't need to report an error since our only caller will already fall back to ENOENT.
|
||||||
|
let nbytes = usize::try_from(nbytes).unwrap();
|
||||||
|
if nbytes == bufsize {
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
Some(str2wcstring(&target_buf[0..nbytes]))
|
||||||
|
}
|
||||||
|
|
||||||
/// Wide character realpath. The last path component does not need to be valid. If an error occurs,
|
/// Wide character realpath. The last path component does not need to be valid. If an error occurs,
|
||||||
/// `wrealpath()` returns `None`
|
/// `wrealpath()` returns `None`
|
||||||
pub fn wrealpath(pathname: &wstr) -> Option<WString> {
|
pub fn wrealpath(pathname: &wstr) -> Option<WString> {
|
||||||
|
@ -141,43 +239,6 @@ pub fn normalize_path(path: &wstr, allow_leading_double_slashes: bool) -> WStrin
|
||||||
result
|
result
|
||||||
}
|
}
|
||||||
|
|
||||||
const PUA1_START: char = '\u{E000}';
|
|
||||||
const PUA1_END: char = '\u{F900}';
|
|
||||||
const PUA2_START: char = '\u{F0000}';
|
|
||||||
const PUA2_END: char = '\u{FFFFE}';
|
|
||||||
const PUA3_START: char = '\u{100000}';
|
|
||||||
const PUA3_END: char = '\u{10FFFE}';
|
|
||||||
|
|
||||||
/// Return one if the code point is in a Unicode private use area.
|
|
||||||
fn fish_is_pua(c: char) -> bool {
|
|
||||||
PUA1_START <= c && c < PUA1_END
|
|
||||||
}
|
|
||||||
|
|
||||||
/// We need this because there are too many implementations that don't return the proper answer for
|
|
||||||
/// some code points. See issue #3050.
|
|
||||||
pub fn fish_iswalnum(c: char) -> bool {
|
|
||||||
!fish_reserved_codepoint(c) && !fish_is_pua(c) && c.is_alphanumeric()
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Given that \p cursor is a pointer into \p base, return the offset in characters.
|
|
||||||
/// This emulates C pointer arithmetic:
|
|
||||||
/// `wstr_offset_in(cursor, base)` is equivalent to C++ `cursor - base`.
|
|
||||||
pub fn wstr_offset_in(cursor: &wstr, base: &wstr) -> usize {
|
|
||||||
let cursor = cursor.as_slice();
|
|
||||||
let base = base.as_slice();
|
|
||||||
// cursor may be a zero-length slice at the end of base,
|
|
||||||
// which base.as_ptr_range().contains(cursor.as_ptr()) will reject.
|
|
||||||
let base_range = base.as_ptr_range();
|
|
||||||
let curs_range = cursor.as_ptr_range();
|
|
||||||
assert!(
|
|
||||||
base_range.start <= curs_range.start && curs_range.end <= base_range.end,
|
|
||||||
"cursor should be a subslice of base"
|
|
||||||
);
|
|
||||||
let offset = unsafe { cursor.as_ptr().offset_from(base.as_ptr()) };
|
|
||||||
assert!(offset >= 0, "offset should be non-negative");
|
|
||||||
offset as usize
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_normalize_path() {
|
fn test_normalize_path() {
|
||||||
fn norm_path(path: &wstr) -> WString {
|
fn norm_path(path: &wstr) -> WString {
|
||||||
|
@ -208,6 +269,576 @@ fn test_normalize_path() {
|
||||||
assert_eq!(norm_path(L!("foo/././bar/.././baz")), "foo/baz");
|
assert_eq!(norm_path(L!("foo/././bar/.././baz")), "foo/baz");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Given an input path \p path and a working directory \p wd, do a "normalizing join" in a way
|
||||||
|
/// appropriate for cd. That is, return effectively wd + path while resolving leading ../s from
|
||||||
|
/// path. The intent here is to allow 'cd' out of a directory which may no longer exist, without
|
||||||
|
/// allowing 'cd' into a directory that may not exist; see #5341.
|
||||||
|
#[widestrs]
|
||||||
|
pub fn path_normalize_for_cd(wd: &wstr, path: &wstr) -> WString {
|
||||||
|
// Fast paths.
|
||||||
|
const sep: char = '/';
|
||||||
|
assert!(
|
||||||
|
wd.as_char_slice().first() == Some(&'/') && wd.as_char_slice().last() == Some(&'/'),
|
||||||
|
"Invalid working directory, it must start and end with /"
|
||||||
|
);
|
||||||
|
if path.is_empty() {
|
||||||
|
return wd.to_owned();
|
||||||
|
} else if path.as_char_slice().first() == Some(&sep) {
|
||||||
|
return path.to_owned();
|
||||||
|
} else if path.as_char_slice().first() != Some(&'.') {
|
||||||
|
return wd.to_owned() + path;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Split our strings by the sep.
|
||||||
|
let mut wd_comps = split_string(wd, sep);
|
||||||
|
let path_comps = split_string(path, sep);
|
||||||
|
|
||||||
|
// Remove empty segments from wd_comps.
|
||||||
|
// In particular this removes the leading and trailing empties.
|
||||||
|
wd_comps.retain(|comp| !comp.is_empty());
|
||||||
|
|
||||||
|
// Erase leading . and .. components from path_comps, popping from wd_comps as we go.
|
||||||
|
let mut erase_count = 0;
|
||||||
|
for comp in &path_comps {
|
||||||
|
let mut erase_it = false;
|
||||||
|
if comp.is_empty() || comp == "."L {
|
||||||
|
erase_it = true;
|
||||||
|
} else if comp == ".."L && !wd_comps.is_empty() {
|
||||||
|
erase_it = true;
|
||||||
|
wd_comps.pop();
|
||||||
|
}
|
||||||
|
if erase_it {
|
||||||
|
erase_count += 1;
|
||||||
|
} else {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// Append un-erased elements to wd_comps and join them, then prepend the leading /.
|
||||||
|
wd_comps.extend(path_comps.into_iter().skip(erase_count));
|
||||||
|
|
||||||
|
let mut result = join_strings(&wd_comps, sep);
|
||||||
|
result.insert(0, '/');
|
||||||
|
result
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of dirname().
|
||||||
|
#[widestrs]
|
||||||
|
pub fn wdirname(mut path: WString) -> WString {
|
||||||
|
// Do not use system-provided dirname (#7837).
|
||||||
|
// On Mac it's not thread safe, and will error for paths exceeding PATH_MAX.
|
||||||
|
// This follows OpenGroup dirname recipe.
|
||||||
|
|
||||||
|
// 1: Double-slash stays.
|
||||||
|
if path == "//"L {
|
||||||
|
return path;
|
||||||
|
}
|
||||||
|
|
||||||
|
// 2: All slashes => return slash.
|
||||||
|
if !path.is_empty() && path.chars().find(|c| *c == '/').is_none() {
|
||||||
|
return "/"L.to_owned();
|
||||||
|
}
|
||||||
|
|
||||||
|
// 3: Trim trailing slashes.
|
||||||
|
while path.as_char_slice().last() == Some(&'/') {
|
||||||
|
path.pop();
|
||||||
|
}
|
||||||
|
|
||||||
|
// 4: No slashes left => return period.
|
||||||
|
let Some(last_slash) = path.chars().rev().position(|c| c == '/') else {
|
||||||
|
return "."L.to_owned()
|
||||||
|
};
|
||||||
|
|
||||||
|
// 5: Remove trailing non-slashes.
|
||||||
|
path.truncate(last_slash + 1);
|
||||||
|
|
||||||
|
// 6: Skip as permitted.
|
||||||
|
// 7: Remove trailing slashes again.
|
||||||
|
while path.as_char_slice().last() == Some(&'/') {
|
||||||
|
path.pop();
|
||||||
|
}
|
||||||
|
|
||||||
|
// 8: Empty => return slash.
|
||||||
|
if path.is_empty() {
|
||||||
|
path = "/"L.to_owned();
|
||||||
|
}
|
||||||
|
path
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of basename().
|
||||||
|
#[widestrs]
|
||||||
|
pub fn wbasename(mut path: WString) -> WString {
|
||||||
|
// This follows OpenGroup basename recipe.
|
||||||
|
// 1: empty => allowed to return ".". This is what system impls do.
|
||||||
|
if path.is_empty() {
|
||||||
|
return "."L.to_owned();
|
||||||
|
}
|
||||||
|
|
||||||
|
// 2: Skip as permitted.
|
||||||
|
// 3: All slashes => return slash.
|
||||||
|
if !path.is_empty() && path.chars().find(|c| *c == '/').is_none() {
|
||||||
|
return "/"L.to_owned();
|
||||||
|
}
|
||||||
|
|
||||||
|
// 4: Remove trailing slashes.
|
||||||
|
// while (!path.is_empty() && path.back() == '/') path.pop_back();
|
||||||
|
while path.as_char_slice().last() == Some(&'/') {
|
||||||
|
path.pop();
|
||||||
|
}
|
||||||
|
|
||||||
|
// 5: Remove up to and including last slash.
|
||||||
|
if let Some(last_slash) = path.chars().rev().position(|c| c == '/') {
|
||||||
|
path.truncate(last_slash + 1);
|
||||||
|
};
|
||||||
|
path
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of mkdir.
|
||||||
|
pub fn wmkdir(name: &wstr, mode: libc::mode_t) -> libc::c_int {
|
||||||
|
let name_narrow = wcs2zstring(name);
|
||||||
|
unsafe { libc::mkdir(name_narrow.as_ptr(), mode) }
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Wide character version of rename.
|
||||||
|
pub fn wrename(old_name: &wstr, new_name: &wstr) -> libc::c_int {
|
||||||
|
let old_narrow = wcs2zstring(old_name);
|
||||||
|
let new_narrow = wcs2zstring(new_name);
|
||||||
|
unsafe { libc::rename(old_narrow.as_ptr(), new_narrow.as_ptr()) }
|
||||||
|
}
|
||||||
|
|
||||||
|
fn write_to_fd(input: &[u8], fd: RawFd) -> std::io::Result<usize> {
|
||||||
|
let mut file = unsafe { std::fs::File::from_raw_fd(fd) };
|
||||||
|
let amt = file.write(input);
|
||||||
|
// Ensure the file is not closed.
|
||||||
|
file.into_raw_fd();
|
||||||
|
amt
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Write a wide string to a file descriptor. This avoids doing any additional allocation.
|
||||||
|
/// This does NOT retry on EINTR or EAGAIN, it simply returns.
|
||||||
|
/// \return -1 on error in which case errno will have been set. In this event, the number of bytes
|
||||||
|
/// actually written cannot be obtained.
|
||||||
|
pub fn wwrite_to_fd(input: &wstr, fd: RawFd) -> Option<usize> {
|
||||||
|
// Accumulate data in a local buffer.
|
||||||
|
let mut accum = [b'\0'; 512];
|
||||||
|
let mut accumlen = 0;
|
||||||
|
let maxaccum: usize = std::mem::size_of_val(&accum);
|
||||||
|
|
||||||
|
// Helper to perform a write to 'fd', looping as necessary.
|
||||||
|
// \return true on success, false on error.
|
||||||
|
let mut total_written = 0;
|
||||||
|
|
||||||
|
fn do_write(fd: RawFd, total_written: &mut usize, mut buf: &[u8]) -> bool {
|
||||||
|
while !buf.is_empty() {
|
||||||
|
let Ok(amt) = write_to_fd(buf, fd) else {
|
||||||
|
return false;
|
||||||
|
};
|
||||||
|
*total_written += amt;
|
||||||
|
assert!(amt <= buf.len(), "Wrote more than requested");
|
||||||
|
buf = &buf[amt..];
|
||||||
|
}
|
||||||
|
true
|
||||||
|
}
|
||||||
|
|
||||||
|
// Helper to flush the accumulation buffer.
|
||||||
|
let flush_accum = |total_written: &mut usize, accum: &[u8], accumlen: &mut usize| {
|
||||||
|
if !do_write(fd, total_written, &accum[..*accumlen]) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
*accumlen = 0;
|
||||||
|
true
|
||||||
|
};
|
||||||
|
|
||||||
|
let mut success = wcs2string_callback(input, |buff: &[u8]| {
|
||||||
|
if buff.len() + accumlen > maxaccum {
|
||||||
|
// We have to flush.
|
||||||
|
if !flush_accum(&mut total_written, &accum, &mut accumlen) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if buff.len() + accumlen <= maxaccum {
|
||||||
|
// Accumulate more.
|
||||||
|
unsafe {
|
||||||
|
std::ptr::copy(&buff[0], &mut accum[accumlen], buff.len());
|
||||||
|
}
|
||||||
|
true
|
||||||
|
} else {
|
||||||
|
// Too much data to even fit, just write it immediately.
|
||||||
|
do_write(fd, &mut total_written, buff)
|
||||||
|
}
|
||||||
|
});
|
||||||
|
// Flush any remaining.
|
||||||
|
if success {
|
||||||
|
success = flush_accum(&mut total_written, &accum, &mut accumlen);
|
||||||
|
}
|
||||||
|
if success {
|
||||||
|
Some(total_written)
|
||||||
|
} else {
|
||||||
|
None
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
const PUA1_START: char = '\u{E000}';
|
||||||
|
const PUA1_END: char = '\u{F900}';
|
||||||
|
const PUA2_START: char = '\u{F0000}';
|
||||||
|
const PUA2_END: char = '\u{FFFFE}';
|
||||||
|
const PUA3_START: char = '\u{100000}';
|
||||||
|
const PUA3_END: char = '\u{10FFFE}';
|
||||||
|
|
||||||
|
/// Return one if the code point is in a Unicode private use area.
|
||||||
|
fn fish_is_pua(c: char) -> bool {
|
||||||
|
PUA1_START <= c && c < PUA1_END
|
||||||
|
}
|
||||||
|
|
||||||
|
/// We need this because there are too many implementations that don't return the proper answer for
|
||||||
|
/// some code points. See issue #3050.
|
||||||
|
pub fn fish_iswalnum(c: char) -> bool {
|
||||||
|
!fish_reserved_codepoint(c) && !fish_is_pua(c) && c.is_alphanumeric()
|
||||||
|
}
|
||||||
|
|
||||||
|
extern "C" {
|
||||||
|
fn iswgraph(wc: libc::wchar_t) -> libc::c_int; // Technically it's wint_t
|
||||||
|
}
|
||||||
|
|
||||||
|
/// We need this because there are too many implementations that don't return the proper answer for
|
||||||
|
/// some code points. See issue #3050.
|
||||||
|
pub fn fish_iswgraph(c: char) -> bool {
|
||||||
|
!fish_reserved_codepoint(c) && (fish_is_pua(c) || unsafe { iswgraph(c as libc::wchar_t) } != 0)
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn fish_wcswidth(s: &wstr) -> libc::c_int {
|
||||||
|
fallback::fish_wcswidth(s)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Class for representing a file's inode. We use this to detect and avoid symlink loops, among
|
||||||
|
/// other things. While an inode / dev pair is sufficient to distinguish co-existing files, Linux
|
||||||
|
/// seems to aggressively re-use inodes, so it cannot determine if a file has been deleted (ABA
|
||||||
|
/// problem). Therefore we include richer information.
|
||||||
|
#[derive(Clone, Eq, Hash, Ord, PartialEq, PartialOrd)]
|
||||||
|
pub struct FileId {
|
||||||
|
device: libc::dev_t,
|
||||||
|
inode: libc::ino_t,
|
||||||
|
size: u64,
|
||||||
|
change_seconds: libc::time_t,
|
||||||
|
change_nanoseconds: i64,
|
||||||
|
mod_seconds: libc::time_t,
|
||||||
|
mod_nanoseconds: i64,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl FileId {
|
||||||
|
pub const fn new() -> Self {
|
||||||
|
FileId {
|
||||||
|
device: -1 as _,
|
||||||
|
inode: -1 as _,
|
||||||
|
size: -1 as _,
|
||||||
|
change_seconds: libc::time_t::MIN,
|
||||||
|
change_nanoseconds: i64::MIN,
|
||||||
|
mod_seconds: libc::time_t::MIN,
|
||||||
|
mod_nanoseconds: -1 as _,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
pub fn from_stat(buf: &libc::stat) -> FileId {
|
||||||
|
let mut result = FileId::new();
|
||||||
|
result.device = buf.st_dev;
|
||||||
|
result.inode = buf.st_ino;
|
||||||
|
result.size = buf.st_size as u64;
|
||||||
|
result.change_seconds = buf.st_ctime;
|
||||||
|
result.mod_seconds = buf.st_mtime;
|
||||||
|
#[allow(clippy::unnecessary_cast)] // platform-dependent
|
||||||
|
{
|
||||||
|
result.change_nanoseconds = buf.st_ctime_nsec as _;
|
||||||
|
result.mod_nanoseconds = buf.st_mtime_nsec as _;
|
||||||
|
}
|
||||||
|
result
|
||||||
|
}
|
||||||
|
|
||||||
|
/// \return true if \param rhs has higher mtime seconds than this file_id_t.
|
||||||
|
/// If identical, nanoseconds are compared.
|
||||||
|
pub fn older_than(&self, rhs: &FileId) -> bool {
|
||||||
|
let lhs = (self.mod_seconds, self.mod_nanoseconds);
|
||||||
|
let rhs = (rhs.mod_seconds, rhs.mod_nanoseconds);
|
||||||
|
lhs.cmp(&rhs).is_lt()
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn dump(&self) -> WString {
|
||||||
|
let mut result = WString::new();
|
||||||
|
result += &sprintf!(" device: %lld\n", self.device)[..];
|
||||||
|
result += &sprintf!(" inode: %lld\n", self.inode)[..];
|
||||||
|
result += &sprintf!(" size: %lld\n", self.size)[..];
|
||||||
|
result += &sprintf!(" change: %lld\n", self.change_seconds)[..];
|
||||||
|
result += &sprintf!("change_nano: %lld\n", self.change_nanoseconds)[..];
|
||||||
|
result += &sprintf!(" mod: %lld\n", self.mod_seconds)[..];
|
||||||
|
result += &sprintf!(" mod_nano: %lld", self.mod_nanoseconds)[..];
|
||||||
|
result
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub const INVALID_FILE_ID: FileId = FileId::new();
|
||||||
|
|
||||||
|
pub fn file_id_for_fd(fd: RawFd) -> FileId {
|
||||||
|
let mut result = INVALID_FILE_ID;
|
||||||
|
let mut buf: libc::stat = unsafe { std::mem::zeroed() };
|
||||||
|
if fd >= 0 && unsafe { libc::fstat(fd, &mut buf) } == 0 {
|
||||||
|
result = FileId::from_stat(&buf);
|
||||||
|
}
|
||||||
|
result
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn file_id_for_autoclose_fd(fd: &AutoCloseFd) -> FileId {
|
||||||
|
file_id_for_fd(fd.fd())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn file_id_for_path(path: &wstr) -> FileId {
|
||||||
|
let mut result = INVALID_FILE_ID;
|
||||||
|
let path = wcs2zstring(path);
|
||||||
|
let mut buf: libc::stat = unsafe { std::mem::zeroed() };
|
||||||
|
if unsafe { libc::stat(path.as_ptr(), &mut buf) } == 0 {
|
||||||
|
result = FileId::from_stat(&buf);
|
||||||
|
}
|
||||||
|
result
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Types of files that may be in a directory.
|
||||||
|
#[derive(Clone, Copy, Eq, PartialEq)]
|
||||||
|
pub enum DirEntryType {
|
||||||
|
fifo = 1, // FIFO file
|
||||||
|
chr, // character device
|
||||||
|
dir, // directory
|
||||||
|
blk, // block device
|
||||||
|
reg, // regular file
|
||||||
|
lnk, // symlink
|
||||||
|
sock, // socket
|
||||||
|
whiteout, // whiteout (from BSD)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// An entry returned by dir_iter_t.
|
||||||
|
#[derive(Default)]
|
||||||
|
pub struct DirEntry {
|
||||||
|
/// File name of this entry.
|
||||||
|
pub name: WString,
|
||||||
|
|
||||||
|
/// inode of this entry.
|
||||||
|
pub inode: libc::ino_t,
|
||||||
|
|
||||||
|
// Stat buff for this entry, or none if not yet computed.
|
||||||
|
stat: Option<libc::stat>,
|
||||||
|
|
||||||
|
// The type of the entry. This is initially none; it may be populated eagerly via readdir()
|
||||||
|
// on some filesystems, or later via stat(). If stat() fails, the error is silently ignored
|
||||||
|
// and the type is left as none(). Note this is an unavoidable race.
|
||||||
|
typ: Option<DirEntryType>,
|
||||||
|
|
||||||
|
// fd of the DIR*, used for fstatat().
|
||||||
|
dirfd: RawFd,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl DirEntry {
|
||||||
|
/// \return the type of this entry if it is already available, otherwise none().
|
||||||
|
pub fn fast_type(&self) -> Option<DirEntryType> {
|
||||||
|
self.typ
|
||||||
|
}
|
||||||
|
|
||||||
|
/// \return the type of this entry, falling back to stat() if necessary.
|
||||||
|
/// If stat() fails because the file has disappeared, this will return none().
|
||||||
|
/// If stat() fails because of a broken symlink, this will return type lnk.
|
||||||
|
pub fn check_type(&mut self) -> Option<DirEntryType> {
|
||||||
|
// Call stat if needed to populate our type, swallowing errors.
|
||||||
|
if self.typ.is_none() {
|
||||||
|
self.do_stat()
|
||||||
|
}
|
||||||
|
self.typ
|
||||||
|
}
|
||||||
|
|
||||||
|
/// \return whether this is a directory. This may call stat().
|
||||||
|
pub fn is_dir(&mut self) -> bool {
|
||||||
|
self.check_type() == Some(DirEntryType::dir)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// \return the stat buff for this entry, invoking stat() if necessary.
|
||||||
|
pub fn stat(&mut self) -> Option<libc::stat> {
|
||||||
|
if self.stat.is_none() {
|
||||||
|
self.do_stat();
|
||||||
|
}
|
||||||
|
self.stat
|
||||||
|
}
|
||||||
|
|
||||||
|
// Reset our fields.
|
||||||
|
fn reset(&mut self) {
|
||||||
|
self.name.clear();
|
||||||
|
self.inode = unsafe { std::mem::zeroed() };
|
||||||
|
self.typ = None;
|
||||||
|
self.stat = None;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Populate our stat buffer, and type. Errors are silently ignored.
|
||||||
|
fn do_stat(&mut self) {
|
||||||
|
// We want to set both our type and our stat buffer.
|
||||||
|
// If we follow symlinks and stat() errors with a bad symlink, set the type to link, but do not
|
||||||
|
// populate the stat buffer.
|
||||||
|
if self.dirfd < 0 {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
let narrow = wcs2zstring(&self.name);
|
||||||
|
let mut s: libc::stat = unsafe { std::mem::zeroed() };
|
||||||
|
if unsafe { libc::fstatat(self.dirfd, narrow.as_ptr(), &mut s, 0) } == 0 {
|
||||||
|
self.stat = Some(s);
|
||||||
|
self.typ = stat_mode_to_entry_type(s.st_mode);
|
||||||
|
} else {
|
||||||
|
match errno::errno().0 {
|
||||||
|
ELOOP => {
|
||||||
|
self.typ = Some(DirEntryType::lnk);
|
||||||
|
}
|
||||||
|
EACCES | EIO | ENOENT | ENOTDIR | ENAMETOOLONG | ENODEV => {
|
||||||
|
// These are "expected" errors.
|
||||||
|
self.typ = None;
|
||||||
|
}
|
||||||
|
_ => {
|
||||||
|
self.typ = None;
|
||||||
|
// This used to print an error, but given that we have seen
|
||||||
|
// both ENODEV (above) and ENOTCONN,
|
||||||
|
// and that the error isn't actionable and shows up while typing,
|
||||||
|
// let's not do that.
|
||||||
|
// perror("fstatat");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn dirent_type_to_entry_type(dt: u8) -> Option<DirEntryType> {
|
||||||
|
match dt {
|
||||||
|
DT_FIFO => Some(DirEntryType::fifo),
|
||||||
|
DT_CHR => Some(DirEntryType::chr),
|
||||||
|
DT_DIR => Some(DirEntryType::dir),
|
||||||
|
DT_BLK => Some(DirEntryType::blk),
|
||||||
|
DT_REG => Some(DirEntryType::reg),
|
||||||
|
DT_LNK => Some(DirEntryType::lnk),
|
||||||
|
DT_SOCK => Some(DirEntryType::sock),
|
||||||
|
// todo! whiteout
|
||||||
|
_ => None,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn stat_mode_to_entry_type(m: libc::mode_t) -> Option<DirEntryType> {
|
||||||
|
match m & S_IFMT {
|
||||||
|
S_IFIFO => Some(DirEntryType::fifo),
|
||||||
|
S_IFCHR => Some(DirEntryType::chr),
|
||||||
|
S_IFDIR => Some(DirEntryType::dir),
|
||||||
|
S_IFBLK => Some(DirEntryType::blk),
|
||||||
|
S_IFREG => Some(DirEntryType::reg),
|
||||||
|
S_IFLNK => Some(DirEntryType::lnk),
|
||||||
|
S_IFSOCK => Some(DirEntryType::sock),
|
||||||
|
_ => {
|
||||||
|
// todo! whiteout
|
||||||
|
None
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Class for iterating over a directory, wrapping readdir().
|
||||||
|
/// This allows enumerating the contents of a directory, exposing the file type if the filesystem
|
||||||
|
/// itself exposes that from readdir(). stat() is incurred only if necessary: if the entry is a
|
||||||
|
/// symlink, or if the caller asks for the stat buffer.
|
||||||
|
/// Symlinks are followed.
|
||||||
|
pub struct DirIter {
|
||||||
|
/// Whether this dir_iter considers the "." and ".." filesystem entries.
|
||||||
|
withdot: bool,
|
||||||
|
|
||||||
|
dir: *mut libc::DIR,
|
||||||
|
error: libc::c_int,
|
||||||
|
entry: DirEntry,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl DirIter {
|
||||||
|
/// Open a directory at a given path. On failure, \p error() will return the error code.
|
||||||
|
/// Note opendir is guaranteed to set close-on-exec by POSIX (hooray).
|
||||||
|
pub fn new(path: &wstr, withdot: bool) -> Self {
|
||||||
|
let mut error = 0;
|
||||||
|
let dir = wopendir(path);
|
||||||
|
if dir.is_null() {
|
||||||
|
error = errno::errno().0;
|
||||||
|
}
|
||||||
|
let entry = DirEntry {
|
||||||
|
dirfd: unsafe { libc::dirfd(dir) },
|
||||||
|
..Default::default()
|
||||||
|
};
|
||||||
|
DirIter {
|
||||||
|
withdot,
|
||||||
|
dir,
|
||||||
|
error,
|
||||||
|
entry,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Rewind the directory to the beginning.
|
||||||
|
pub fn rewind(&mut self) {
|
||||||
|
if self.dir.is_null() {
|
||||||
|
unsafe { libc::rewinddir(self.dir) };
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn next(&mut self) -> Option<&DirEntry> {
|
||||||
|
if self.dir.is_null() {
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
errno::set_errno(errno::Errno(0));
|
||||||
|
let dent = unsafe { libc::readdir(self.dir) };
|
||||||
|
if dent.is_null() {
|
||||||
|
self.error = errno::errno().0;
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
let dent = unsafe { &*dent };
|
||||||
|
// Skip . and ..,
|
||||||
|
// unless we've been told not to.
|
||||||
|
if !self.withdot
|
||||||
|
&& [
|
||||||
|
&[b'.' as i8, b'\0' as i8, b'\0' as i8][..],
|
||||||
|
&[b'.' as i8, b'.' as i8, b'\0' as i8][..],
|
||||||
|
]
|
||||||
|
.contains(&&dent.d_name[..3])
|
||||||
|
{
|
||||||
|
return self.next();
|
||||||
|
}
|
||||||
|
|
||||||
|
self.entry.reset();
|
||||||
|
let d_name: Vec<u8> = dent.d_name.iter().map(|b| *b as u8).collect();
|
||||||
|
self.entry.name = cstr2wcstring(&d_name);
|
||||||
|
#[cfg(any(target_os = "freebsd", target_os = "netbsd", target_os = "openbsd"))]
|
||||||
|
{
|
||||||
|
self.entry.inode = dent.d_fileno;
|
||||||
|
}
|
||||||
|
#[cfg(not(any(target_os = "freebsd", target_os = "netbsd", target_os = "openbsd")))]
|
||||||
|
{
|
||||||
|
self.entry.inode = dent.d_ino;
|
||||||
|
}
|
||||||
|
let typ = dirent_type_to_entry_type(dent.d_type);
|
||||||
|
// Do not store symlinks as we will need to resolve them.
|
||||||
|
if typ != Some(DirEntryType::lnk) {
|
||||||
|
self.entry.typ = typ;
|
||||||
|
}
|
||||||
|
|
||||||
|
Some(&self.entry)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Given that \p cursor is a pointer into \p base, return the offset in characters.
|
||||||
|
/// This emulates C pointer arithmetic:
|
||||||
|
/// `wstr_offset_in(cursor, base)` is equivalent to C++ `cursor - base`.
|
||||||
|
pub fn wstr_offset_in(cursor: &wstr, base: &wstr) -> usize {
|
||||||
|
let cursor = cursor.as_slice();
|
||||||
|
let base = base.as_slice();
|
||||||
|
// cursor may be a zero-length slice at the end of base,
|
||||||
|
// which base.as_ptr_range().contains(cursor.as_ptr()) will reject.
|
||||||
|
let base_range = base.as_ptr_range();
|
||||||
|
let curs_range = cursor.as_ptr_range();
|
||||||
|
assert!(
|
||||||
|
base_range.start <= curs_range.start && curs_range.end <= base_range.end,
|
||||||
|
"cursor should be a subslice of base"
|
||||||
|
);
|
||||||
|
let offset = unsafe { cursor.as_ptr().offset_from(base.as_ptr()) };
|
||||||
|
assert!(offset >= 0, "offset should be non-negative");
|
||||||
|
offset as usize
|
||||||
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_wstr_offset_in() {
|
fn test_wstr_offset_in() {
|
||||||
use crate::wchar::L;
|
use crate::wchar::L;
|
||||||
|
|
Loading…
Reference in a new issue