2023-03-06 03:52:11 +00:00
|
|
|
pub use super::errors::Error;
|
2023-03-06 03:52:12 +00:00
|
|
|
use crate::wchar::IntoCharIter;
|
2023-01-15 00:34:49 +00:00
|
|
|
use num_traits::{NumCast, PrimInt};
|
2023-03-06 03:52:12 +00:00
|
|
|
use std::iter::{Fuse, Peekable};
|
2023-03-06 03:52:11 +00:00
|
|
|
use std::result::Result;
|
2023-01-15 00:34:49 +00:00
|
|
|
|
|
|
|
/// The outcome of parsing an integer out of a stream of chars.
struct ParseResult {
    /// Magnitude of the parsed number; the sign is carried separately in `negative`.
    result: u64,
    /// Whether the number was written with a leading `-` (never set when the magnitude is 0).
    negative: bool,
    /// Whether no characters were left in the input once parsing stopped.
    consumed_all: bool,
    /// How many characters of the input the parse consumed, counted from its very start.
    consumed: usize,
}
|
|
|
|
|
2023-03-06 03:52:12 +00:00
|
|
|
/// A peekable view over a char iterator which counts how many chars have been taken from it.
struct CharsIterator<Iter: Iterator<Item = char>> {
    /// The wrapped chars; fused so that it keeps returning None once it is exhausted.
    chars: Peekable<Fuse<Iter>>,
    /// The number of chars handed out by `next` so far.
    consumed: usize,
}

impl<Iter: Iterator<Item = char>> CharsIterator<Iter> {
    /// Look at the upcoming char without consuming it, yielding \0 at the end of input.
    fn current(&mut self) -> char {
        match self.chars.peek() {
            Some(&upcoming) => upcoming,
            None => '\0',
        }
    }

    /// Look at the upcoming char without consuming it, yielding None at the end of input.
    fn peek(&mut self) -> Option<char> {
        let upcoming = *self.chars.peek()?;
        Some(upcoming)
    }

    /// Take the upcoming char. self.consumed only grows when a char was actually produced.
    fn next(&mut self) -> Option<char> {
        let taken = self.chars.next()?;
        self.consumed += 1;
        Some(taken)
    }
}
|
|
|
|
|
|
|
|
/// Parse the given \p src as an integer.
|
|
|
|
/// If mradix is not None, it is used as the radix; otherwise the radix is inferred:
|
|
|
|
/// - Leading 0x or 0X means 16.
|
|
|
|
/// - Leading 0 means 8.
|
|
|
|
/// - Otherwise 10.
|
|
|
|
/// The parse result contains the number as a u64, and whether it was negative.
|
2023-03-06 03:52:12 +00:00
|
|
|
fn fish_parse_radix<Iter: Iterator<Item = char>>(
|
|
|
|
iter: Iter,
|
|
|
|
mradix: Option<u32>,
|
|
|
|
) -> Result<ParseResult, Error> {
|
2023-01-15 00:34:49 +00:00
|
|
|
if let Some(r) = mradix {
|
2023-02-04 23:45:25 +00:00
|
|
|
assert!((2..=36).contains(&r), "fish_parse_radix: invalid radix {r}");
|
2023-01-15 00:34:49 +00:00
|
|
|
}
|
2023-03-06 03:52:12 +00:00
|
|
|
|
|
|
|
// Construct a CharsIterator to keep track of how many we consume.
|
|
|
|
let mut chars = CharsIterator {
|
|
|
|
chars: iter.fuse().peekable(),
|
|
|
|
consumed: 0,
|
|
|
|
};
|
2023-01-15 00:34:49 +00:00
|
|
|
|
|
|
|
// Skip leading whitespace.
|
2023-03-06 03:52:12 +00:00
|
|
|
while chars.current().is_whitespace() {
|
2023-01-15 00:34:49 +00:00
|
|
|
chars.next();
|
|
|
|
}
|
|
|
|
|
|
|
|
if chars.peek().is_none() {
|
|
|
|
return Err(Error::Empty);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Consume leading +/-.
|
|
|
|
let mut negative;
|
2023-03-06 03:52:12 +00:00
|
|
|
match chars.current() {
|
2023-01-15 00:34:49 +00:00
|
|
|
'-' | '+' => {
|
2023-03-06 03:52:12 +00:00
|
|
|
negative = chars.current() == '-';
|
2023-01-15 00:34:49 +00:00
|
|
|
chars.next();
|
|
|
|
}
|
|
|
|
_ => negative = false,
|
|
|
|
}
|
|
|
|
|
|
|
|
// Determine the radix.
|
2023-02-04 23:45:25 +00:00
|
|
|
let radix = if let Some(radix) = mradix {
|
|
|
|
radix
|
2023-03-06 03:52:12 +00:00
|
|
|
} else if chars.current() == '0' {
|
2023-01-15 00:34:49 +00:00
|
|
|
chars.next();
|
2023-03-06 03:52:12 +00:00
|
|
|
match chars.current() {
|
2023-01-15 00:34:49 +00:00
|
|
|
'x' | 'X' => {
|
|
|
|
chars.next();
|
2023-02-04 23:45:25 +00:00
|
|
|
16
|
2023-01-15 00:34:49 +00:00
|
|
|
}
|
2023-02-04 23:45:25 +00:00
|
|
|
c if ('0'..='9').contains(&c) => 8,
|
2023-01-15 00:34:49 +00:00
|
|
|
_ => {
|
|
|
|
// Just a 0.
|
|
|
|
return Ok(ParseResult {
|
|
|
|
result: 0,
|
|
|
|
negative: false,
|
2023-02-25 11:10:31 +00:00
|
|
|
consumed_all: chars.peek().is_none(),
|
2023-03-06 03:52:12 +00:00
|
|
|
consumed: chars.consumed,
|
2023-01-15 00:34:49 +00:00
|
|
|
});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
2023-02-04 23:45:25 +00:00
|
|
|
10
|
|
|
|
};
|
2023-01-15 00:34:49 +00:00
|
|
|
|
|
|
|
// Compute as u64.
|
2023-03-06 03:52:12 +00:00
|
|
|
let start_consumed = chars.consumed;
|
2023-01-15 00:34:49 +00:00
|
|
|
let mut result: u64 = 0;
|
2023-03-06 03:52:12 +00:00
|
|
|
while let Some(digit) = chars.current().to_digit(radix) {
|
2023-01-15 00:34:49 +00:00
|
|
|
result = result
|
|
|
|
.checked_mul(radix as u64)
|
|
|
|
.and_then(|r| r.checked_add(digit as u64))
|
|
|
|
.ok_or(Error::Overflow)?;
|
|
|
|
chars.next();
|
|
|
|
}
|
|
|
|
|
2023-03-06 03:52:12 +00:00
|
|
|
// Did we consume at least one char after the prefix?
|
|
|
|
let consumed = chars.consumed;
|
|
|
|
if consumed == start_consumed {
|
2023-03-06 03:52:11 +00:00
|
|
|
return Err(Error::InvalidChar);
|
2023-01-15 00:34:49 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Do not return -0.
|
|
|
|
if result == 0 {
|
|
|
|
negative = false;
|
|
|
|
}
|
2023-02-25 11:10:31 +00:00
|
|
|
let consumed_all = chars.peek().is_none();
|
2023-02-18 21:06:05 +00:00
|
|
|
Ok(ParseResult {
|
|
|
|
result,
|
|
|
|
negative,
|
|
|
|
consumed_all,
|
2023-03-06 03:52:12 +00:00
|
|
|
consumed,
|
2023-02-18 21:06:05 +00:00
|
|
|
})
|
2023-01-15 00:34:49 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Parse some iterator over Chars into some Integer type, optionally with a radix.
|
2023-02-18 21:06:05 +00:00
|
|
|
fn fish_wcstoi_impl<Int, Chars>(
|
|
|
|
src: Chars,
|
|
|
|
mradix: Option<u32>,
|
|
|
|
consume_all: bool,
|
2023-03-06 03:52:12 +00:00
|
|
|
out_consumed: &mut usize,
|
2023-02-18 21:06:05 +00:00
|
|
|
) -> Result<Int, Error>
|
2023-01-15 00:34:49 +00:00
|
|
|
where
|
|
|
|
Chars: Iterator<Item = char>,
|
|
|
|
Int: PrimInt,
|
|
|
|
{
|
|
|
|
let bits = Int::zero().count_zeros();
|
|
|
|
assert!(bits <= 64, "fish_wcstoi: Int must be <= 64 bits");
|
|
|
|
let signed = Int::min_value() < Int::zero();
|
|
|
|
|
|
|
|
let ParseResult {
|
2023-02-18 21:06:05 +00:00
|
|
|
result,
|
|
|
|
negative,
|
|
|
|
consumed_all,
|
2023-03-06 03:52:12 +00:00
|
|
|
consumed,
|
2023-01-15 00:34:49 +00:00
|
|
|
} = fish_parse_radix(src, mradix)?;
|
2023-03-06 03:52:12 +00:00
|
|
|
*out_consumed = consumed;
|
2023-01-15 00:34:49 +00:00
|
|
|
|
|
|
|
if !signed && negative {
|
2023-03-06 03:52:11 +00:00
|
|
|
Err(Error::InvalidChar)
|
2023-02-02 17:33:49 +00:00
|
|
|
} else if consume_all && !consumed_all {
|
|
|
|
Err(Error::CharsLeft)
|
2023-01-15 00:34:49 +00:00
|
|
|
} else if !signed || !negative {
|
|
|
|
match Int::from(result) {
|
|
|
|
Some(r) => Ok(r),
|
|
|
|
None => Err(Error::Overflow),
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
assert!(signed && negative);
|
|
|
|
// Signed type, so convert to s64.
|
|
|
|
// Careful of the most negative value.
|
|
|
|
if bits == 64 && result == 1 << 63 {
|
|
|
|
return Ok(Int::min_value());
|
|
|
|
}
|
|
|
|
<i64 as NumCast>::from(result)
|
|
|
|
.and_then(|r| r.checked_neg())
|
|
|
|
.and_then(|r| Int::from(r))
|
|
|
|
.ok_or(Error::Overflow)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Convert the given wide string to an integer.
|
|
|
|
/// The semantics here match wcstol():
|
|
|
|
/// - Leading whitespace is skipped.
|
|
|
|
/// - 0 means octal, 0x means hex
|
|
|
|
/// - Leading + is supported.
|
|
|
|
pub fn fish_wcstoi<Int, Chars>(src: Chars) -> Result<Int, Error>
|
|
|
|
where
|
2023-03-06 03:52:12 +00:00
|
|
|
Chars: IntoCharIter,
|
2023-01-15 00:34:49 +00:00
|
|
|
Int: PrimInt,
|
|
|
|
{
|
2023-03-06 03:52:12 +00:00
|
|
|
fish_wcstoi_impl(src.chars(), None, false, &mut 0)
|
2023-01-15 00:34:49 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Convert the given wide string to an integer using the given radix.
|
|
|
|
/// Leading whitespace is skipped.
|
|
|
|
pub fn fish_wcstoi_radix<Int, Chars>(src: Chars, radix: u32) -> Result<Int, Error>
|
|
|
|
where
|
2023-03-06 03:52:12 +00:00
|
|
|
Chars: IntoCharIter,
|
2023-01-15 00:34:49 +00:00
|
|
|
Int: PrimInt,
|
|
|
|
{
|
2023-03-06 03:52:12 +00:00
|
|
|
fish_wcstoi_impl(src.chars(), Some(radix), false, &mut 0)
|
2023-02-02 17:33:49 +00:00
|
|
|
}
|
|
|
|
|
2023-02-18 21:06:05 +00:00
|
|
|
pub fn fish_wcstoi_radix_all<Int, Chars>(
|
|
|
|
src: Chars,
|
|
|
|
radix: Option<u32>,
|
|
|
|
consume_all: bool,
|
|
|
|
) -> Result<Int, Error>
|
2023-02-02 17:33:49 +00:00
|
|
|
where
|
2023-03-06 03:52:12 +00:00
|
|
|
Chars: IntoCharIter,
|
|
|
|
Int: PrimInt,
|
|
|
|
{
|
|
|
|
fish_wcstoi_impl(src.chars(), radix, consume_all, &mut 0)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Convert the given wide string to an integer.
|
|
|
|
/// The semantics here match wcstol():
|
|
|
|
/// - Leading whitespace is skipped.
|
|
|
|
/// - 0 means octal, 0x means hex
|
|
|
|
/// - Leading + is supported.
|
|
|
|
/// The number of consumed characters is returned in out_consumed.
|
|
|
|
pub fn fish_wcstoi_partial<Int, Chars>(src: Chars, out_consumed: &mut usize) -> Result<Int, Error>
|
|
|
|
where
|
|
|
|
Chars: IntoCharIter,
|
2023-02-02 17:33:49 +00:00
|
|
|
Int: PrimInt,
|
|
|
|
{
|
2023-03-06 03:52:12 +00:00
|
|
|
fish_wcstoi_impl(src.chars(), None, false, out_consumed)
|
2023-01-15 00:34:49 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
mod tests {
    use super::*;

    /// Check that the decimal text of both extremes of an integer type parses back to the very
    /// same value.
    fn test_min_max<Int: PrimInt + std::fmt::Display + std::fmt::Debug>(min: Int, max: Int) {
        for bound in [min, max] {
            assert_eq!(fish_wcstoi(bound.to_string().chars()), Ok(bound));
        }
    }

    #[test]
    fn tests() {
        let parse = |text: &str| -> Result<i32, Error> { fish_wcstoi(text.chars()) };
        let parse_radix = |text: &str, radix: u32| -> Result<i32, Error> {
            fish_wcstoi_radix(text.chars(), radix)
        };

        // Inputs which must parse, along with the value they must produce.
        let accepted: &[(&str, i32)] = &[
            ("0", 0),
            ("-0", 0),
            ("+0", 0),
            ("+00", 0),
            ("-00", 0),
            ("+0x00", 0),
            ("-0x00", 0),
            ("5", 5),
            ("-5", -5),
            ("123", 123),
            ("+123", 123),
            ("-123", -123),
            ("+0x123", 291),
            ("-0x123", -291),
            ("+0X123", 291),
            ("-0X123", -291),
            ("+0123", 83),
            ("-0123", -83),
            (" 345 ", 345),
            (" -345 ", -345),
            // Trailing garbage is tolerated: parsing simply stops at it.
            ("456x", 456),
            ("456 x", 456),
        ];
        for &(text, expected) in accepted {
            assert_eq!(parse(text), Ok(expected), "input: {text:?}");
        }

        // Inputs which must be rejected, along with the error they must produce.
        let rejected = [
            ("", Error::Empty),
            (" \n ", Error::Empty),
            ("+-0", Error::InvalidChar),
            ("-+0", Error::InvalidChar),
            (" x345", Error::InvalidChar),
            ("99999999999999999999999", Error::Overflow),
            ("-99999999999999999999999", Error::Overflow),
        ];
        for (text, expected) in rejected {
            assert_eq!(parse(text), Err(expected), "input: {text:?}");
        }

        // This is subtle. "567" in base 8 is "375" in base 10. The final "8" is not converted.
        assert_eq!(parse_radix("5678", 8), Ok(375));

        test_min_max(i8::MIN, i8::MAX);
        test_min_max(i16::MIN, i16::MAX);
        test_min_max(i32::MIN, i32::MAX);
        test_min_max(i64::MIN, i64::MAX);
        test_min_max(u8::MIN, u8::MAX);
        test_min_max(u16::MIN, u16::MAX);
        test_min_max(u32::MIN, u32::MAX);
        test_min_max(u64::MIN, u64::MAX);
    }

    #[test]
    fn test_partial() {
        let parse = |text: &str| -> (i32, usize) {
            let mut consumed = 0;
            let value = fish_wcstoi_partial(text.chars(), &mut consumed)
                .expect("Should have parsed an int");
            (value, consumed)
        };

        // (input, expected value, expected number of consumed chars).
        // The consumed count covers leading whitespace, the sign, any radix prefix and the
        // digits, but not what follows the number. Some inputs deliberately start with two
        // spaces so that skipping more than one whitespace char is exercised.
        let cases: &[(&str, i32, usize)] = &[
            ("0", 0, 1),
            ("-0", 0, 2),
            (" -1 ", -1, 3),
            (" +1 ", 1, 3),
            ("  345 ", 345, 5),
            (" -345 ", -345, 5),
            ("  0345 ", 229, 6),
            ("  +0345 ", 229, 7),
            ("  -0345 ", -229, 7),
            (" 0x345 ", 0x345, 6),
            (" -0x345 ", -0x345, 7),
        ];
        for &(text, value, consumed) in cases {
            assert_eq!(parse(text), (value, consumed), "input: {text:?}");
        }
    }
}
|