Clean up fish-printf in preparation for publishing

Make fish-printf no longer depend on the widestring crate, as other clients
won't use it; instead this is an optional feature.

Make format strings a generic type, so that both narrow and wide strings can
serve. This removes a lot of the complexity around converting from narrow to
wide.

Add a README.md to this crate.
This commit is contained in:
Peter Ammon 2024-09-19 15:34:40 -07:00
parent cdcf460edf
commit 974ad882fa
No known key found for this signature in database
20 changed files with 419 additions and 227 deletions

2
Cargo.lock generated
View file

@ -104,7 +104,7 @@ dependencies = [
[[package]] [[package]]
name = "fish-printf" name = "fish-printf"
version = "0.1.0" version = "0.2.0"
dependencies = [ dependencies = [
"libc", "libc",
"widestring", "widestring",

View file

@ -44,14 +44,16 @@ nix = { version = "0.29.0", default-features = false, features = [
] } ] }
num-traits = "0.2.19" num-traits = "0.2.19"
once_cell = "1.19.0" once_cell = "1.19.0"
fish-printf = { path = "./printf" } fish-printf = { path = "./printf", features = ["widestring"] }
rand = { version = "0.8.5", features = ["small_rng"] } rand = { version = "0.8.5", features = ["small_rng"] }
widestring = "1.1.0" widestring = "1.1.0"
# We need 0.9.0 specifically for some crash fixes. # We need 0.9.0 specifically for some crash fixes.
terminfo = "0.9.0" terminfo = "0.9.0"
[target.'cfg(not(target_has_atomic = "64"))'.dependencies] [target.'cfg(not(target_has_atomic = "64"))'.dependencies]
portable-atomic = { version = "1", default-features = false, features = ["fallback"] } portable-atomic = { version = "1", default-features = false, features = [
"fallback",
] }
[dev-dependencies] [dev-dependencies]
rand_pcg = "0.3.1" rand_pcg = "0.3.1"

View file

@ -1,10 +1,10 @@
[package] [package]
name = "fish-printf" name = "fish-printf"
edition = "2021" edition = "2021"
version = "0.1.0" version = "0.2.0"
description = "printf implementation, based on musl" description = "printf implementation, based on musl"
license = "MIT" license = "MIT"
[dependencies] [dependencies]
libc = "0.2.155" libc = "0.2.155"
widestring = "1.0.2" widestring = { version = "1.0.2", optional = true }

43
printf/README.md Normal file
View file

@ -0,0 +1,43 @@
# fish-printf
The printf implementation used in [fish-shell](https://fishshell.com), based on musl printf.
[![crates.io](https://img.shields.io/crates/v/fish-printf.svg)](https://crates.io/crates/fish-printf)
Licensed under the MIT license.
### Usage
Run `cargo add fish-printf` to add this crate to your `Cargo.toml` file.
Also run `cargo add widestring` to add the widestring crate.
### Notes
fish-printf attempts to match the C standard for printf. It supports the following features:
- Locale-specific formatting (decimal point, thousands separator, etc.)
- Honors the current rounding mode.
- Supports the `%n` modifier for counting characters written.
fish-printf does not support positional arguments, such as `printf("%2$d", 1, 2)`.
Prefixes like `l` or `ll` are recognized, but only used for validating the format string.
The size of integer values is taken from the argument type.
fish-printf can output to an `std::fmt::Write` object, or return a string.
For reasons related to fish-shell, fish-printf has a feature "widestring" which uses the [widestring](https://crates.io/crates/widestring) crate. This is off by default.
### Examples
```rust
use fish_printf::sprintf;
// Create a `String` from a format string.
let s = sprintf!("%0.5g", 123456.0) // 1.2346e+05
// Append to an existing string.
let s = String::new();
sprintf!(=> &mut s, "%0.5g", 123456.0) // 1.2346e+05
```

View file

@ -1,15 +1,18 @@
use super::printf_impl::Error; use super::printf_impl::Error;
use std::result::Result; use std::result::Result;
#[cfg(feature = "widestring")]
use widestring::{Utf32Str as wstr, Utf32String as WString}; use widestring::{Utf32Str as wstr, Utf32String as WString};
/// Printf argument types. /// Printf argument types.
/// Note no implementation of ToArg constructs the owned variants (String and WString); /// Note no implementation of `ToArg` constructs the owned variants (String and WString);
/// callers can do so explicitly. /// callers can do so explicitly.
#[derive(Debug, PartialEq)] #[derive(Debug, PartialEq)]
pub enum Arg<'a> { pub enum Arg<'a> {
Str(&'a str), Str(&'a str),
#[cfg(feature = "widestring")]
WStr(&'a wstr), WStr(&'a wstr),
String(String), String(String),
#[cfg(feature = "widestring")]
WString(WString), WString(WString),
UInt(u64), UInt(u64),
SInt(i64, u8), // signed integers track their width as the number of bits SInt(i64, u8), // signed integers track their width as the number of bits
@ -27,6 +30,8 @@ impl<'a> Arg<'a> {
} }
// Convert this to a narrow string, using the provided storage if necessary. // Convert this to a narrow string, using the provided storage if necessary.
// In practice 'storage' is only used if the widestring feature is enabled.
#[allow(unused_variables, clippy::ptr_arg)]
pub fn as_str<'s>(&'s self, storage: &'s mut String) -> Result<&'s str, Error> pub fn as_str<'s>(&'s self, storage: &'s mut String) -> Result<&'s str, Error>
where where
'a: 's, 'a: 's,
@ -34,11 +39,13 @@ impl<'a> Arg<'a> {
match self { match self {
Arg::Str(s) => Ok(s), Arg::Str(s) => Ok(s),
Arg::String(s) => Ok(s), Arg::String(s) => Ok(s),
#[cfg(feature = "widestring")]
Arg::WStr(s) => { Arg::WStr(s) => {
storage.clear(); storage.clear();
storage.extend(s.chars()); storage.extend(s.chars());
Ok(storage) Ok(storage)
} }
#[cfg(feature = "widestring")]
Arg::WString(s) => { Arg::WString(s) => {
storage.clear(); storage.clear();
storage.extend(s.chars()); storage.extend(s.chars());
@ -118,12 +125,14 @@ impl<'a> ToArg<'a> for &'a String {
} }
} }
#[cfg(feature = "widestring")]
impl<'a> ToArg<'a> for &'a wstr { impl<'a> ToArg<'a> for &'a wstr {
fn to_arg(self) -> Arg<'a> { fn to_arg(self) -> Arg<'a> {
Arg::WStr(self) Arg::WStr(self)
} }
} }
#[cfg(feature = "widestring")]
impl<'a> ToArg<'a> for &'a WString { impl<'a> ToArg<'a> for &'a WString {
fn to_arg(self) -> Arg<'a> { fn to_arg(self) -> Arg<'a> {
Arg::WStr(self) Arg::WStr(self)
@ -191,6 +200,7 @@ impl_to_arg_u!(u8, u16, u32, u64, usize);
#[cfg(test)] #[cfg(test)]
mod tests { mod tests {
use super::*; use super::*;
#[cfg(feature = "widestring")]
use widestring::utf32str; use widestring::utf32str;
#[test] #[test]
@ -199,7 +209,9 @@ mod tests {
assert!(matches!("test".to_arg(), Arg::Str("test"))); assert!(matches!("test".to_arg(), Arg::Str("test")));
assert!(matches!(String::from("test").to_arg(), Arg::Str(_))); assert!(matches!(String::from("test").to_arg(), Arg::Str(_)));
#[cfg(feature = "widestring")]
assert!(matches!(utf32str!("test").to_arg(), Arg::WStr(_))); assert!(matches!(utf32str!("test").to_arg(), Arg::WStr(_)));
#[cfg(feature = "widestring")]
assert!(matches!(WString::from("test").to_arg(), Arg::WStr(_))); assert!(matches!(WString::from("test").to_arg(), Arg::WStr(_)));
assert!(matches!(42f32.to_arg(), Arg::Float(_))); assert!(matches!(42f32.to_arg(), Arg::Float(_)));
assert!(matches!(42f64.to_arg(), Arg::Float(_))); assert!(matches!(42f64.to_arg(), Arg::Float(_)));

View file

@ -4,41 +4,50 @@ pub use arg::{Arg, ToArg};
mod fmt_fp; mod fmt_fp;
mod printf_impl; mod printf_impl;
pub use printf_impl::{sprintf_locale, Error}; pub use printf_impl::{sprintf_locale, Error, FormatString};
pub mod locale; pub mod locale;
pub use locale::{Locale, C_LOCALE, EN_US_LOCALE}; pub use locale::{Locale, C_LOCALE, EN_US_LOCALE};
#[cfg(test)] #[cfg(test)]
mod tests; mod tests;
/// A macro to format a string using `fish_printf` with C-locale formatting rules.
///
/// # Examples
///
/// ```
/// use fish_printf::sprintf;
///
/// // Create a `String` from a format string.
/// let s = sprintf!("%0.5g", 123456.0);
/// assert_eq!(s, "1.2346e+05");
///
/// // Append to an existing string.
/// let mut s = String::new();
/// sprintf!(=> &mut s, "%0.5g", 123456.0);
/// assert_eq!(s, "1.2346e+05");
/// ```
#[macro_export] #[macro_export]
macro_rules! sprintf { macro_rules! sprintf {
// Variant which allows a string literal and returns a `Utf32String`. // Write to a newly allocated String, and return it.
($fmt:literal, $($arg:expr),* $(,)?) => { // This panics if the format string or arguments are invalid.
{
let mut target = widestring::Utf32String::new();
$crate::sprintf!(=> &mut target, widestring::utf32str!($fmt), $($arg),*);
target
}
};
// Variant which allows a string literal and writes to a target.
// The target should implement std::fmt::Write.
( (
=> $target:expr, // target string $fmt:expr, // Format string, which should implement FormatString.
$fmt:literal, // format string
$($arg:expr),* // arguments $($arg:expr),* // arguments
$(,)? // optional trailing comma $(,)? // optional trailing comma
) => { ) => {
{ {
$crate::sprintf!(=> $target, widestring::utf32str!($fmt), $($arg),*); let mut target = String::new();
$crate::sprintf!(=> &mut target, $fmt, $($arg),*);
target
} }
}; };
// Variant which allows a `Utf32String` as a format, and writes to a target. // Variant which writes to a target.
// The target should implement std::fmt::Write.
( (
=> $target:expr, // target string => $target:expr, // target string
$fmt:expr, // format string as UTF32String $fmt:expr, // format string
$($arg:expr),* // arguments $($arg:expr),* // arguments
$(,)? // optional trailing comma $(,)? // optional trailing comma
) => { ) => {
@ -46,22 +55,13 @@ macro_rules! sprintf {
// May be no args! // May be no args!
#[allow(unused_imports)] #[allow(unused_imports)]
use $crate::ToArg; use $crate::ToArg;
$crate::sprintf_c_locale( $crate::printf_c_locale(
$target, $target,
$fmt.as_char_slice(), $fmt,
&mut [$($arg.to_arg()),*], &mut [$($arg.to_arg()),*],
).unwrap() ).unwrap()
} }
}; };
// Variant which allows a `Utf32String` as a format, and returns a `Utf32String`.
($fmt:expr, $($arg:expr),* $(,)?) => {
{
let mut target = widestring::Utf32String::new();
$crate::sprintf!(=> &mut target, $fmt, $($arg),*);
target
}
};
} }
/// Formats a string using the provided format specifiers and arguments, using the C locale, /// Formats a string using the provided format specifiers and arguments, using the C locale,
@ -70,14 +70,29 @@ macro_rules! sprintf {
/// # Parameters /// # Parameters
/// - `f`: The receiver of formatted output. /// - `f`: The receiver of formatted output.
/// - `fmt`: The format string being parsed. /// - `fmt`: The format string being parsed.
/// - `locale`: The locale to use for number formatting.
/// - `args`: Iterator over the arguments to format. /// - `args`: Iterator over the arguments to format.
/// ///
/// # Returns /// # Returns
/// A `Result` which is `Ok` containing the number of bytes written on success, or an `Error`. /// A `Result` which is `Ok` containing the number of characters written on success, or an `Error`.
pub fn sprintf_c_locale( ///
/// # Example
///
/// ```
/// use fish_printf::{printf_c_locale, ToArg, FormatString};
/// use std::fmt::Write;
///
/// let mut output = String::new();
/// let fmt: &str = "%0.5g"; // Example format string
/// let mut args = [123456.0.to_arg()];
///
/// let result = printf_c_locale(&mut output, fmt, &mut args);
///
/// assert!(result == Ok(10));
/// assert_eq!(output, "1.2346e+05");
/// ```
pub fn printf_c_locale(
f: &mut impl std::fmt::Write, f: &mut impl std::fmt::Write,
fmt: &[char], fmt: impl FormatString,
args: &mut [Arg], args: &mut [Arg],
) -> Result<usize, Error> { ) -> Result<usize, Error> {
sprintf_locale(f, fmt, &locale::C_LOCALE, args) sprintf_locale(f, fmt, &locale::C_LOCALE, args)

View file

@ -4,9 +4,11 @@ use super::fmt_fp::format_float;
use super::locale::Locale; use super::locale::Locale;
use std::fmt::{self, Write}; use std::fmt::{self, Write};
use std::mem; use std::mem;
use std::ops::{AddAssign, Index};
use std::result::Result; use std::result::Result;
#[cfg(feature = "widestring")]
use widestring::Utf32Str as wstr;
/// Possible errors from printf. /// Possible errors from printf.
#[derive(Debug, PartialEq, Eq)] #[derive(Debug, PartialEq, Eq)]
pub enum Error { pub enum Error {
@ -151,107 +153,143 @@ impl ConversionSpec {
} }
} }
// A helper type that holds a format string slice and points into it. // A helper type with convenience functions for format strings.
// As a convenience, this returns '\0' for one-past-the-end. pub trait FormatString {
#[derive(Debug)]
struct FormatString<'a>(&'a [char]);
impl<'a> FormatString<'a> {
// Return the underlying slice.
fn as_slice(&self) -> &'a [char] {
self.0
}
// Return true if we are empty. // Return true if we are empty.
fn is_empty(&self) -> bool { fn is_empty(&self) -> bool;
self.0.is_empty()
}
// Read an int from our cursor, stopping at the first non-digit. // Return the character at a given index, or None if out of bounds.
// Negative values are not supported. // Note the index is a count of characters, not bytes.
// If there are no digits, return 0. fn at(&self, index: usize) -> Option<char>;
// Adjust the cursor to point to the char after the int.
fn get_int(&mut self) -> Result<usize, Error> {
use Error::Overflow;
let mut i: usize = 0;
while let Some(digit) = self[0].to_digit(10) {
i = i.checked_mul(10).ok_or(Overflow)?;
i = i.checked_add(digit as usize).ok_or(Overflow)?;
*self += 1;
}
Ok(i)
}
// Read a conversion prefix from our cursor, advancing it. // Advance by the given number of characters.
fn get_prefix(&mut self) -> ConversionPrefix { fn advance_by(&mut self, n: usize);
use ConversionPrefix as CP;
let prefix = match self[0] {
'h' if self[1] == 'h' => CP::hh,
'h' => CP::h,
'l' if self[1] == 'l' => CP::ll,
'l' => CP::l,
'j' => CP::j,
't' => CP::t,
'z' => CP::z,
'L' => CP::L,
_ => CP::Empty,
};
*self += match prefix {
CP::Empty => 0,
CP::hh | CP::ll => 2,
_ => 1,
};
prefix
}
// Read an (optionally prefixed) format specifier, such as d, Lf, etc.
// Adjust the cursor to point to the char after the specifier.
fn get_specifier(&mut self) -> Result<ConversionSpec, Error> {
let prefix = self.get_prefix();
// Awkwardly placed hack to disallow %lC and %lS, since we otherwise treat
// them as the same.
if prefix != ConversionPrefix::Empty && matches!(self[0], 'C' | 'S') {
return Err(Error::BadFormatString);
}
let spec = ConversionSpec::from_char(self[0]).ok_or(Error::BadFormatString)?;
if !spec.supports_prefix(prefix) {
return Err(Error::BadFormatString);
}
*self += 1;
Ok(spec)
}
// Read a sequence of characters to be output literally, advancing the cursor. // Read a sequence of characters to be output literally, advancing the cursor.
// The characters may optionally be stored in the given buffer.
// This handles a tail of %%. // This handles a tail of %%.
fn get_lit(&mut self) -> &'a [char] { fn take_literal<'a: 'b, 'b>(&'a mut self, buffer: &'b mut String) -> &'b str;
let s = self.0; }
impl FormatString for &str {
fn is_empty(&self) -> bool {
(*self).is_empty()
}
fn at(&self, index: usize) -> Option<char> {
self.chars().nth(index)
}
fn advance_by(&mut self, n: usize) {
let mut chars = self.chars();
for _ in 0..n {
let c = chars.next();
assert!(c.is_some(), "FormatString::advance(): index out of bounds");
}
*self = chars.as_str();
}
fn take_literal<'a: 'b, 'b>(&'a mut self, _buffer: &'b mut String) -> &'b str {
// Count length of non-percent characters.
let non_percents: usize = self
.chars()
.take_while(|&c| c != '%')
.map(|c| c.len_utf8())
.sum();
// Take only an even number of percents. Note we know these have byte length 1.
let percent_pairs = self[non_percents..]
.chars()
.take_while(|&c| c == '%')
.count()
/ 2;
let (prefix, rest) = self.split_at(non_percents + percent_pairs * 2);
*self = rest;
// Trim half of the trailing percent characters from the prefix.
&prefix[..prefix.len() - percent_pairs]
}
}
#[cfg(feature = "widestring")]
impl FormatString for &wstr {
fn is_empty(&self) -> bool {
(*self).is_empty()
}
fn at(&self, index: usize) -> Option<char> {
self.as_char_slice().get(index).copied()
}
fn advance_by(&mut self, n: usize) {
*self = &self[n..];
}
fn take_literal<'a: 'b, 'b>(&'a mut self, buffer: &'b mut String) -> &'b str {
let s = self.as_char_slice();
let non_percents = s.iter().take_while(|&&c| c != '%').count(); let non_percents = s.iter().take_while(|&&c| c != '%').count();
// Take only an even number of percents. // Take only an even number of percents.
let percent_pairs: usize = s[non_percents..].iter().take_while(|&&c| c == '%').count() / 2; let percent_pairs: usize = s[non_percents..].iter().take_while(|&&c| c == '%').count() / 2;
*self += non_percents + percent_pairs * 2; *self = &self[non_percents + percent_pairs * 2..];
&s[..non_percents + percent_pairs] buffer.clear();
buffer.extend(s[..non_percents + percent_pairs].iter());
buffer.as_str()
} }
} }
// Advance this format string by a number of chars. // Read an int from a format string, stopping at the first non-digit.
impl AddAssign<usize> for FormatString<'_> { // Negative values are not supported.
fn add_assign(&mut self, rhs: usize) { // If there are no digits, return 0.
self.0 = &self.0[rhs..]; // Adjust the format string to point to the char after the int.
fn get_int(fmt: &mut impl FormatString) -> Result<usize, Error> {
use Error::Overflow;
let mut i: usize = 0;
while let Some(digit) = fmt.at(0).and_then(|c| c.to_digit(10)) {
i = i.checked_mul(10).ok_or(Overflow)?;
i = i.checked_add(digit as usize).ok_or(Overflow)?;
fmt.advance_by(1);
} }
Ok(i)
} }
// Index into FormatString, returning \0 for one-past-the-end. // Read a conversion prefix from a format string, advancing it.
impl Index<usize> for FormatString<'_> { fn get_prefix(fmt: &mut impl FormatString) -> ConversionPrefix {
type Output = char; use ConversionPrefix as CP;
let prefix = match fmt.at(0).unwrap_or('\0') {
'h' if fmt.at(1) == Some('h') => CP::hh,
'h' => CP::h,
'l' if fmt.at(1) == Some('l') => CP::ll,
'l' => CP::l,
'j' => CP::j,
't' => CP::t,
'z' => CP::z,
'L' => CP::L,
_ => CP::Empty,
};
fmt.advance_by(match prefix {
CP::Empty => 0,
CP::hh | CP::ll => 2,
_ => 1,
});
prefix
}
fn index(&self, idx: usize) -> &char { // Read an (optionally prefixed) format specifier, such as d, Lf, etc.
let s = self.as_slice(); // Adjust the cursor to point to the char after the specifier.
if idx == s.len() { fn get_specifier(fmt: &mut impl FormatString) -> Result<ConversionSpec, Error> {
&'\0' let prefix = get_prefix(fmt);
} else { // Awkwardly placed hack to disallow %lC and %lS, since we otherwise treat
&s[idx] // them as the same.
} if prefix != ConversionPrefix::Empty && matches!(fmt.at(0), Some('C' | 'S')) {
return Err(Error::BadFormatString);
} }
let spec = fmt
.at(0)
.and_then(ConversionSpec::from_char)
.ok_or(Error::BadFormatString)?;
if !spec.supports_prefix(prefix) {
return Err(Error::BadFormatString);
}
fmt.advance_by(1);
Ok(spec)
} }
// Pad output by emitting `c` until `min_width` is reached. // Pad output by emitting `c` until `min_width` is reached.
@ -288,14 +326,30 @@ pub(super) fn pad(
/// ///
/// # Returns /// # Returns
/// A `Result` which is `Ok` containing the number of bytes written on success, or an `Error`. /// A `Result` which is `Ok` containing the number of bytes written on success, or an `Error`.
///
/// # Example
///
/// ```
/// use fish_printf::{sprintf_locale, ToArg, FormatString, locale};
/// use std::fmt::Write;
///
/// let mut output = String::new();
/// let fmt: &str = "%'0.2f";
/// let mut args = [1234567.89.to_arg()];
///
/// let result = sprintf_locale(&mut output, fmt, &locale::EN_US_LOCALE, &mut args);
///
/// assert!(result == Ok(12));
/// assert_eq!(output, "1,234,567.89");
/// ```
pub fn sprintf_locale( pub fn sprintf_locale(
f: &mut impl Write, f: &mut impl Write,
fmt: &[char], fmt: impl FormatString,
locale: &Locale, locale: &Locale,
args: &mut [Arg], args: &mut [Arg],
) -> Result<usize, Error> { ) -> Result<usize, Error> {
use ConversionSpec as CS; use ConversionSpec as CS;
let mut s = FormatString(fmt); let mut s = fmt;
let mut args = args.iter_mut(); let mut args = args.iter_mut();
let mut out_len: usize = 0; let mut out_len: usize = 0;
@ -305,31 +359,32 @@ pub fn sprintf_locale(
buf.clear(); buf.clear();
// Handle literal text and %% format specifiers. // Handle literal text and %% format specifiers.
let lit = s.get_lit(); let lit = s.take_literal(buf);
if !lit.is_empty() { if !lit.is_empty() {
buf.extend(lit.iter()); f.write_str(lit)?;
f.write_str(buf)?; out_len = out_len
out_len = out_len.checked_add(lit.len()).ok_or(Error::Overflow)?; .checked_add(lit.chars().count())
.ok_or(Error::Overflow)?;
continue 'main; continue 'main;
} }
// Consume the % at the start of the format specifier. // Consume the % at the start of the format specifier.
debug_assert!(s[0] == '%'); debug_assert!(s.at(0) == Some('%'));
s += 1; s.advance_by(1);
// Read modifier flags. '-' and '0' flags are mutually exclusive. // Read modifier flags. '-' and '0' flags are mutually exclusive.
let mut flags = ModifierFlags::default(); let mut flags = ModifierFlags::default();
while flags.try_set(s[0]) { while flags.try_set(s.at(0).unwrap_or('\0')) {
s += 1; s.advance_by(1);
} }
if flags.left_adj { if flags.left_adj {
flags.zero_pad = false; flags.zero_pad = false;
} }
// Read field width. We do not support $. // Read field width. We do not support $.
let width = if s[0] == '*' { let width = if s.at(0) == Some('*') {
let arg_width = args.next().ok_or(Error::MissingArg)?.as_sint()?; let arg_width = args.next().ok_or(Error::MissingArg)?.as_sint()?;
s += 1; s.advance_by(1);
if arg_width < 0 { if arg_width < 0 {
flags.left_adj = true; flags.left_adj = true;
} }
@ -338,19 +393,19 @@ pub fn sprintf_locale(
.try_into() .try_into()
.map_err(|_| Error::Overflow)? .map_err(|_| Error::Overflow)?
} else { } else {
s.get_int()? get_int(&mut s)?
}; };
// Optionally read precision. We do not support $. // Optionally read precision. We do not support $.
let mut prec: Option<usize> = if s[0] == '.' && s[1] == '*' { let mut prec: Option<usize> = if s.at(0) == Some('.') && s.at(1) == Some('*') {
// "A negative precision is treated as though it were missing." // "A negative precision is treated as though it were missing."
// Here we assume the precision is always signed. // Here we assume the precision is always signed.
s += 2; s.advance_by(2);
let p = args.next().ok_or(Error::MissingArg)?.as_sint()?; let p = args.next().ok_or(Error::MissingArg)?.as_sint()?;
p.try_into().ok() p.try_into().ok()
} else if s[0] == '.' { } else if s.at(0) == Some('.') {
s += 1; s.advance_by(1);
Some(s.get_int()?) Some(get_int(&mut s)?)
} else { } else {
None None
}; };
@ -360,7 +415,7 @@ pub fn sprintf_locale(
} }
// Read out the format specifier and arg. // Read out the format specifier and arg.
let conv_spec = s.get_specifier()?; let conv_spec = get_specifier(&mut s)?;
let arg = args.next().ok_or(Error::MissingArg)?; let arg = args.next().ok_or(Error::MissingArg)?;
let mut prefix = ""; let mut prefix = "";

View file

@ -1,10 +1,9 @@
use crate::arg::ToArg; use crate::arg::ToArg;
use crate::locale::{Locale, C_LOCALE, EN_US_LOCALE}; use crate::locale::{Locale, C_LOCALE, EN_US_LOCALE};
use crate::{sprintf_locale, Error}; use crate::{sprintf_locale, Error, FormatString};
use libc::c_char; use libc::c_char;
use std::f64::consts::{E, PI, TAU}; use std::f64::consts::{E, PI, TAU};
use std::fmt; use std::fmt;
use widestring::{utf32str, Utf32Str};
// sprintf, checking length // sprintf, checking length
macro_rules! sprintf_check { macro_rules! sprintf_check {
@ -15,11 +14,11 @@ macro_rules! sprintf_check {
) => { ) => {
{ {
let mut target = String::new(); let mut target = String::new();
let chars: Vec<char> = $fmt.chars().collect(); let mut args = [$($arg.to_arg()),*];
let len = $crate::sprintf_c_locale( let len = $crate::printf_c_locale(
&mut target, &mut target,
&chars, $fmt.as_ref() as &str,
&mut [$($arg.to_arg()),*] &mut args,
).expect("printf failed"); ).expect("printf failed");
assert!(len == target.len(), "Wrong length returned: {} vs {}", len, target.len()); assert!(len == target.len(), "Wrong length returned: {} vs {}", len, target.len());
target target
@ -43,10 +42,9 @@ macro_rules! assert_fmt1 {
macro_rules! sprintf_err { macro_rules! sprintf_err {
($fmt:expr, $($arg:expr),* => $expected:expr) => { ($fmt:expr, $($arg:expr),* => $expected:expr) => {
{ {
let chars: Vec<char> = $fmt.chars().collect(); let err = $crate::printf_c_locale(
let err = $crate::sprintf_c_locale(
&mut NullOutput, &mut NullOutput,
&chars, $fmt.as_ref() as &str,
&mut [$($arg.to_arg()),*], &mut [$($arg.to_arg()),*],
).unwrap_err(); ).unwrap_err();
assert_eq!(err, $expected, "Wrong error returned: {:?}", err); assert_eq!(err, $expected, "Wrong error returned: {:?}", err);
@ -58,10 +56,9 @@ macro_rules! sprintf_err {
macro_rules! sprintf_count { macro_rules! sprintf_count {
($fmt:expr $(, $arg:expr)*) => { ($fmt:expr $(, $arg:expr)*) => {
{ {
let chars: Vec<char> = $fmt.chars().collect(); $crate::printf_c_locale(
$crate::sprintf_c_locale(
&mut NullOutput, &mut NullOutput,
&chars, $fmt,
&mut [$($arg.to_arg()),*], &mut [$($arg.to_arg()),*],
).expect("printf failed") ).expect("printf failed")
} }
@ -84,6 +81,69 @@ fn smoke() {
assert_fmt!("" => ""); assert_fmt!("" => "");
} }
#[test]
fn test_format_string_str() {
let mut s: &str = "hello%world%%%%%";
assert_eq!(s.is_empty(), false);
for (idx, c) in s.char_indices() {
assert_eq!(s.at(idx), Some(c));
}
assert_eq!(s.at(s.chars().count()), None);
let mut buffer = String::new();
assert_eq!(s.take_literal(&mut buffer), "hello");
s.advance_by(1); // skip '%'
assert_eq!(s.at(0), Some('w'));
assert_eq!(s.take_literal(&mut buffer), "world%%");
s.advance_by(1); // advancing over one more %
assert_eq!(s.is_empty(), true); // remaining content is empty
}
#[cfg(feature = "widestring")]
#[test]
fn test_format_string_wstr() {
use widestring::Utf32String;
let utf32: Utf32String = Utf32String::from_str("hello%world%%%%%");
let mut s = utf32.as_utfstr();
for (idx, c) in s.char_indices() {
assert_eq!(s.at(idx), Some(c));
}
assert_eq!(s.at(s.chars().count()), None);
let mut buffer = String::new();
assert_eq!(s.take_literal(&mut buffer), "hello");
s.advance_by(1); // skip '%'
assert_eq!(s.at(0), Some('w'));
assert_eq!(s.take_literal(&mut buffer), "world%%");
s.advance_by(1); // advancing over one more %
assert_eq!(s.is_empty(), true); // remaining content is empty
}
#[test]
fn test_char_counts() {
// printf returns the number of characters, not the number of bytes.
assert_eq!(sprintf_count!("%d", 123), 3);
assert_eq!(sprintf_count!("%d", -123), 4);
assert_eq!(sprintf_count!("\u{1F680}"), 1);
}
#[cfg(feature = "widestring")]
#[test]
fn test_wide_char_counts() {
use widestring::utf32str;
// printf returns the number of characters, not the number of bytes.
assert_eq!(sprintf_count!(utf32str!("%d"), 123), 3);
assert_eq!(sprintf_count!(utf32str!("%d"), -123), 4);
assert_eq!(sprintf_count!(utf32str!("\u{1F680}")), 1);
}
#[test] #[test]
fn test1() { fn test1() {
// A convenient place to isolate a single test, e.g. cargo test -- test1 // A convenient place to isolate a single test, e.g. cargo test -- test1
@ -591,6 +651,16 @@ fn test_prefixes() {
assert_eq!(sprintf_check!("%ls", "cs"), "cs"); assert_eq!(sprintf_check!("%ls", "cs"), "cs");
} }
#[test]
fn test_crate_macros() {
let mut target = String::new();
crate::sprintf!(=> &mut target, "%d ok %d", 1, 2);
assert_eq!(target, "1 ok 2");
target = crate::sprintf!("%d ok %d", 3, 4);
assert_eq!(target, "3 ok 4");
}
#[test] #[test]
#[cfg_attr( #[cfg_attr(
all(target_arch = "x86", not(target_feature = "sse2")), all(target_arch = "x86", not(target_feature = "sse2")),
@ -711,8 +781,7 @@ fn test_errors() {
fn test_locale() { fn test_locale() {
fn test_printf_loc<'a>(expected: &str, locale: &Locale, format: &str, arg: impl ToArg<'a>) { fn test_printf_loc<'a>(expected: &str, locale: &Locale, format: &str, arg: impl ToArg<'a>) {
let mut target = String::new(); let mut target = String::new();
let format_chars: Vec<char> = format.chars().collect(); let len = sprintf_locale(&mut target, format, locale, &mut [arg.to_arg()])
let len = sprintf_locale(&mut target, &format_chars, locale, &mut [arg.to_arg()])
.expect("printf failed"); .expect("printf failed");
assert_eq!(len, target.len()); assert_eq!(len, target.len());
assert_eq!(target, expected); assert_eq!(target, expected);
@ -769,7 +838,7 @@ fn test_float_hex_prec() {
v *= sign; v *= sign;
for preci in 1..=200_i32 { for preci in 1..=200_i32 {
rust_str.clear(); rust_str.clear();
crate::sprintf!(=> &mut rust_str, utf32str!("%.*a"), preci, v); crate::sprintf!(=> &mut rust_str, "%.*a", preci, v);
let printf_str = unsafe { let printf_str = unsafe {
let len = libc::snprintf(c_storage_ptr, c_storage.len(), c_fmt, preci, v); let len = libc::snprintf(c_storage_ptr, c_storage.len(), c_fmt, preci, v);
@ -792,7 +861,7 @@ fn test_float_hex_prec() {
assert!(!failed); assert!(!failed);
} }
fn test_exhaustive(rust_fmt: &Utf32Str, c_fmt: *const c_char) { fn test_exhaustive(rust_fmt: &str, c_fmt: *const c_char) {
// "There's only 4 billion floats so test them all." // "There's only 4 billion floats so test them all."
// This tests a format string expected to be of the form "%.*g" or "%.*e". // This tests a format string expected to be of the form "%.*g" or "%.*e".
// That is, it takes a precision and a double. // That is, it takes a precision and a double.
@ -835,28 +904,19 @@ fn test_exhaustive(rust_fmt: &Utf32Str, c_fmt: *const c_char) {
#[ignore] #[ignore]
fn test_float_g_exhaustive() { fn test_float_g_exhaustive() {
// To run: cargo test test_float_g_exhaustive --release -- --ignored --nocapture // To run: cargo test test_float_g_exhaustive --release -- --ignored --nocapture
test_exhaustive( test_exhaustive("%.*g", b"%.*g\0".as_ptr() as *const c_char);
widestring::utf32str!("%.*g"),
b"%.*g\0".as_ptr() as *const c_char,
);
} }
#[test] #[test]
#[ignore] #[ignore]
fn test_float_e_exhaustive() { fn test_float_e_exhaustive() {
// To run: cargo test test_float_e_exhaustive --release -- --ignored --nocapture // To run: cargo test test_float_e_exhaustive --release -- --ignored --nocapture
test_exhaustive( test_exhaustive("%.*e", b"%.*e\0".as_ptr() as *const c_char);
widestring::utf32str!("%.*e"),
b"%.*e\0".as_ptr() as *const c_char,
);
} }
#[test] #[test]
#[ignore] #[ignore]
fn test_float_f_exhaustive() { fn test_float_f_exhaustive() {
// To run: cargo test test_float_f_exhaustive --release -- --ignored --nocapture // To run: cargo test test_float_f_exhaustive --release -- --ignored --nocapture
test_exhaustive( test_exhaustive("%.*f", b"%.*f\0".as_ptr() as *const c_char);
widestring::utf32str!("%.*f"),
b"%.*f\0".as_ptr() as *const c_char,
);
} }

View file

@ -15,9 +15,8 @@ use crate::wutil::wgettext;
use crate::{ use crate::{
builtins::shared::STATUS_CMD_OK, builtins::shared::STATUS_CMD_OK,
wchar::{wstr, WString, L}, wchar::{wstr, WString, L},
wutil::{fish_wcstoi, wgettext_fmt}, wutil::{fish_wcstoi, sprintf, wgettext_fmt},
}; };
use fish_printf::sprintf;
use libc::c_int; use libc::c_int;
use std::num::NonZeroU32; use std::num::NonZeroU32;
use std::sync::atomic::Ordering; use std::sync::atomic::Ordering;

View file

@ -265,7 +265,7 @@ impl<'a, 'b> builtin_printf_state_t<'a, 'b> {
if !self.early_exit { if !self.early_exit {
sprintf_locale( sprintf_locale(
&mut self.buff, &mut self.buff,
$fmt.as_char_slice(), $fmt,
&self.locale, &self.locale,
&mut [$($arg.to_arg()),*] &mut [$($arg.to_arg()),*]
).expect("sprintf failed"); ).expect("sprintf failed");

View file

@ -1,4 +1,3 @@
use fish_printf::sprintf;
use pcre2::utf32::{Captures, Regex, RegexBuilder}; use pcre2::utf32::{Captures, Regex, RegexBuilder};
use std::collections::HashMap; use std::collections::HashMap;
use std::num::NonZeroUsize; use std::num::NonZeroUsize;

View file

@ -2006,44 +2006,3 @@ impl ToCString for &[u8] {
CString::new(self).unwrap() CString::new(self).unwrap()
} }
} }
#[allow(unused_macros)]
#[deprecated = "use printf!, eprintf! or fprintf"]
macro_rules! fwprintf {
($args:tt) => {
panic!()
};
}
// test-only
#[allow(unused_macros)]
#[deprecated = "use printf!"]
macro_rules! err {
($format:expr $(, $args:expr)* $(,)? ) => {
printf!($format $(, $args )*);
}
}
#[macro_export]
macro_rules! fprintf {
($fd:expr, $format:expr $(, $arg:expr)* $(,)?) => {
{
let wide = $crate::wutil::sprintf!($format, $( $arg ),*);
$crate::wutil::wwrite_to_fd(&wide, $fd);
}
}
}
#[macro_export]
macro_rules! printf {
($format:expr $(, $arg:expr)* $(,)?) => {
fprintf!(libc::STDOUT_FILENO, $format $(, $arg)*)
}
}
#[macro_export]
macro_rules! eprintf {
($format:expr $(, $arg:expr)* $(,)?) => {
fprintf!(libc::STDERR_FILENO, $format $(, $arg)*)
}
}

View file

@ -13,9 +13,9 @@ use crate::{
common::{charptr2wcstring, escape_string, EscapeFlags, EscapeStringStyle}, common::{charptr2wcstring, escape_string, EscapeFlags, EscapeStringStyle},
reader::{get_quote, is_backslashed}, reader::{get_quote, is_backslashed},
util::wcsfilecmp, util::wcsfilecmp,
wutil::sprintf,
}; };
use bitflags::bitflags; use bitflags::bitflags;
use fish_printf::sprintf;
use once_cell::sync::Lazy; use once_cell::sync::Lazy;
use crate::{ use crate::{

View file

@ -25,6 +25,9 @@ pub const BUILD_VERSION: &str = env!("FISH_BUILD_VERSION");
#[macro_use] #[macro_use]
pub mod common; pub mod common;
#[macro_use]
pub mod wutil;
pub mod abbrs; pub mod abbrs;
pub mod ast; pub mod ast;
pub mod autoload; pub mod autoload;
@ -97,7 +100,6 @@ pub mod wcstringutil;
pub mod wgetopt; pub mod wgetopt;
pub mod widecharwidth; pub mod widecharwidth;
pub mod wildcard; pub mod wildcard;
pub mod wutil;
#[cfg(test)] #[cfg(test)]
mod tests; mod tests;

View file

@ -31,7 +31,6 @@ use crate::wait_handle::WaitHandleStore;
use crate::wchar::{wstr, WString, L}; use crate::wchar::{wstr, WString, L};
use crate::wutil::{perror, wgettext, wgettext_fmt}; use crate::wutil::{perror, wgettext, wgettext_fmt};
use crate::{function, FLOG}; use crate::{function, FLOG};
use fish_printf::sprintf;
use libc::c_int; use libc::c_int;
#[cfg(not(target_has_atomic = "64"))] #[cfg(not(target_has_atomic = "64"))]
use portable_atomic::AtomicU64; use portable_atomic::AtomicU64;

View file

@ -24,8 +24,7 @@ use crate::topic_monitor::{topic_monitor_principal, GenerationsList, Topic};
use crate::wait_handle::{InternalJobId, WaitHandle, WaitHandleRef, WaitHandleStore}; use crate::wait_handle::{InternalJobId, WaitHandle, WaitHandleRef, WaitHandleStore};
use crate::wchar::{wstr, WString, L}; use crate::wchar::{wstr, WString, L};
use crate::wchar_ext::ToWString; use crate::wchar_ext::ToWString;
use crate::wutil::{perror, wbasename, wgettext, wperror}; use crate::wutil::{perror, sprintf, wbasename, wgettext, wperror};
use fish_printf::sprintf;
use libc::{ use libc::{
EBADF, EINVAL, ENOTTY, EPERM, EXIT_SUCCESS, SIGABRT, SIGBUS, SIGCONT, SIGFPE, SIGHUP, SIGILL, EBADF, EINVAL, ENOTTY, EPERM, EXIT_SUCCESS, SIGABRT, SIGBUS, SIGCONT, SIGFPE, SIGHUP, SIGILL,
SIGINT, SIGKILL, SIGPIPE, SIGQUIT, SIGSEGV, SIGSYS, SIGTTOU, SIG_DFL, SIG_IGN, STDIN_FILENO, SIGINT, SIGKILL, SIGPIPE, SIGQUIT, SIGSEGV, SIGSYS, SIGTTOU, SIG_DFL, SIG_IGN, STDIN_FILENO,

View file

@ -14,7 +14,7 @@ pub mod prelude {
pub use crate::{ pub use crate::{
wchar::{wstr, IntoCharIter, WString, L}, wchar::{wstr, IntoCharIter, WString, L},
wchar_ext::{ToWString, WExt}, wchar_ext::{ToWString, WExt},
wutil::{sprintf, wgettext, wgettext_fmt, wgettext_maybe_fmt, wgettext_str}, wutil::{eprintf, sprintf, wgettext, wgettext_fmt, wgettext_maybe_fmt, wgettext_str},
}; };
} }

View file

@ -146,7 +146,7 @@ macro_rules! wgettext_fmt {
$($args:expr),+ // list of expressions $($args:expr),+ // list of expressions
$(,)? // optional trailing comma $(,)? // optional trailing comma
) => { ) => {
$crate::wutil::sprintf!(&$crate::wutil::wgettext!($string), $($args),+) $crate::wutil::sprintf!($crate::wutil::wgettext!($string), $($args),+)
}; };
} }
pub use wgettext_fmt; pub use wgettext_fmt;
@ -160,7 +160,7 @@ macro_rules! wgettext_maybe_fmt {
$(, $args:expr)* // list of expressions $(, $args:expr)* // list of expressions
$(,)? // optional trailing comma $(,)? // optional trailing comma
) => { ) => {
$crate::wutil::sprintf!(&$crate::wutil::wgettext!($string), $($args),*) $crate::wutil::sprintf!($crate::wutil::wgettext!($string), $($args),*)
}; };
} }
pub use wgettext_maybe_fmt; pub use wgettext_maybe_fmt;

View file

@ -4,6 +4,7 @@ pub mod errors;
pub mod fileid; pub mod fileid;
pub mod gettext; pub mod gettext;
mod hex_float; mod hex_float;
#[macro_use]
pub mod printf; pub mod printf;
#[cfg(test)] #[cfg(test)]
mod tests; mod tests;
@ -25,8 +26,7 @@ use std::fs::{self, canonicalize};
use std::io::{self, Write}; use std::io::{self, Write};
use std::os::unix::prelude::*; use std::os::unix::prelude::*;
extern crate fish_printf; pub use crate::wutil::printf::{eprintf, fprintf, printf, sprintf};
pub use fish_printf::sprintf;
pub use fileid::{ pub use fileid::{
file_id_for_fd, file_id_for_path, file_id_for_path_narrow, DevInode, FileId, INVALID_FILE_ID, file_id_for_fd, file_id_for_path, file_id_for_path_narrow, DevInode, FileId, INVALID_FILE_ID,

View file

@ -1,5 +1,53 @@
// Re-export sprintf macro. // Support for printf-style formatting.
pub use fish_printf::sprintf; #[macro_export]
macro_rules! sprintf {
// Allow a `&str` or `&Utf32Str` as a format, and return a `Utf32String`.
($fmt:expr $(, $arg:expr)* $(,)?) => {
{
let mut target = widestring::Utf32String::new();
$crate::sprintf!(=> &mut target, $fmt, $($arg),*);
target
}
};
// Allow a `&str` or `&Utf32Str` as a format, and write to a target,
// which should be a `&mut String` or `&mut Utf32String`.
//
(=> $target:expr, $fmt:expr $(, $arg:expr)* $(,)?) => {
{
let _ = fish_printf::sprintf!(=> $target, $fmt, $($arg),*);
}
};
}
#[macro_export]
macro_rules! fprintf {
// Allow a `&str` or `&Utf32Str` as a format, and write to an fd.
($fd:expr, $fmt:expr $(, $arg:expr)* $(,)?) => {
{
let wide = $crate::wutil::sprintf!($fmt, $( $arg ),*);
$crate::wutil::wwrite_to_fd(&wide, $fd);
}
}
}
#[macro_export]
macro_rules! printf {
// Allow a `&str` or `&Utf32Str` as a format, and write to stdout.
($fmt:expr $(, $arg:expr)* $(,)?) => {
$crate::fprintf!(libc::STDOUT_FILENO, $fmt $(, $arg)*)
}
}
#[macro_export]
macro_rules! eprintf {
// Allow a `&str` or `&Utf32Str` as a format, and write to stderr.
($fmt:expr $(, $arg:expr)* $(,)?) => {
fprintf!(libc::STDERR_FILENO, $fmt $(, $arg)*)
}
}
pub use {eprintf, fprintf, printf, sprintf};
#[cfg(test)] #[cfg(test)]
mod tests { mod tests {