use core::{
marker::PhantomData,
ops::{Add, Shl},
};
use crate::{
branch::alt,
character::{char, digit1},
combinator::{cut, map, opt, recognize},
error::{make_error, ErrorKind, ParseError},
sequence::pair,
AsBytes, AsChar, Compare, Either, Emit, Err, Input, IsStreaming, Mode, Needed, Offset, OutputM,
Parser,
};
pub mod complete;
pub mod streaming;
#[derive(Debug, PartialEq, Eq, Clone, Copy)]
pub enum Endianness {
Big,
Little,
Native,
}
#[inline]
fn be_uint<I, Uint, E: ParseError<I>>(bound: usize) -> impl Parser<I, Output = Uint, Error = E>
where
I: Input<Item = u8>,
Uint: Default + Shl<u8, Output = Uint> + Add<Uint, Output = Uint> + From<u8>,
{
BeUint {
bound,
e: PhantomData,
u: PhantomData,
}
}
struct BeUint<Uint, E> {
bound: usize,
e: PhantomData<E>,
u: PhantomData<Uint>,
}
impl<I, Uint, E: ParseError<I>> Parser<I> for BeUint<Uint, E>
where
I: Input<Item = u8>,
Uint: Default + Shl<u8, Output = Uint> + Add<Uint, Output = Uint> + From<u8>,
{
type Output = Uint;
type Error = E;
#[inline(always)]
fn process<OM: crate::OutputMode>(
&mut self,
input: I,
) -> crate::PResult<OM, I, Self::Output, Self::Error> {
if input.input_len() < self.bound {
if OM::Incomplete::is_streaming() {
Err(Err::Incomplete(Needed::new(self.bound - input.input_len())))
} else {
Err(Err::Error(OM::Error::bind(|| {
make_error(input, ErrorKind::Eof)
})))
}
} else {
let res = OM::Output::bind(|| {
let mut res = Uint::default();
if self.bound > 1 {
for byte in input.iter_elements().take(self.bound) {
res = (res << 8) + byte.into();
}
} else {
for byte in input.iter_elements().take(self.bound) {
res = byte.into();
}
}
res
});
Ok((input.take_from(self.bound), res))
}
}
}
#[inline]
pub fn be_u8<I, E: ParseError<I>>() -> impl Parser<I, Output = u8, Error = E>
where
I: Input<Item = u8>,
{
be_uint(1)
}
#[inline]
pub fn be_u16<I, E: ParseError<I>>() -> impl Parser<I, Output = u16, Error = E>
where
I: Input<Item = u8>,
{
be_uint(2)
}
#[inline]
pub fn be_u24<I, E: ParseError<I>>() -> impl Parser<I, Output = u32, Error = E>
where
I: Input<Item = u8>,
{
be_uint(3)
}
#[inline]
pub fn be_u32<I, E: ParseError<I>>() -> impl Parser<I, Output = u32, Error = E>
where
I: Input<Item = u8>,
{
be_uint(4)
}
#[inline]
pub fn be_u64<I, E: ParseError<I>>() -> impl Parser<I, Output = u64, Error = E>
where
I: Input<Item = u8>,
{
be_uint(8)
}
#[inline]
pub fn be_u128<I, E: ParseError<I>>() -> impl Parser<I, Output = u128, Error = E>
where
I: Input<Item = u8>,
{
be_uint(16)
}
#[inline]
pub fn be_i8<I, E: ParseError<I>>() -> impl Parser<I, Output = i8, Error = E>
where
I: Input<Item = u8>,
{
be_u8().map(|x| x as i8)
}
#[inline]
pub fn be_i16<I, E: ParseError<I>>() -> impl Parser<I, Output = i16, Error = E>
where
I: Input<Item = u8>,
{
be_u16().map(|x| x as i16)
}
#[inline]
pub fn be_i24<I, E: ParseError<I>>() -> impl Parser<I, Output = i32, Error = E>
where
I: Input<Item = u8>,
{
be_u24().map(|x| {
if x & 0x80_00_00 != 0 {
(x | 0xff_00_00_00) as i32
} else {
x as i32
}
})
}
#[inline]
pub fn be_i32<I, E: ParseError<I>>() -> impl Parser<I, Output = i32, Error = E>
where
I: Input<Item = u8>,
{
be_u32().map(|x| x as i32)
}
#[inline]
pub fn be_i64<I, E: ParseError<I>>() -> impl Parser<I, Output = i64, Error = E>
where
I: Input<Item = u8>,
{
be_u64().map(|x| x as i64)
}
#[inline]
pub fn be_i128<I, E: ParseError<I>>() -> impl Parser<I, Output = i128, Error = E>
where
I: Input<Item = u8>,
{
be_u128().map(|x| x as i128)
}
#[inline]
fn le_uint<I, Uint, E: ParseError<I>>(bound: usize) -> impl Parser<I, Output = Uint, Error = E>
where
I: Input<Item = u8>,
Uint: Default + Shl<u8, Output = Uint> + Add<Uint, Output = Uint> + From<u8>,
{
LeUint {
bound,
e: PhantomData,
u: PhantomData,
}
}
struct LeUint<Uint, E> {
bound: usize,
e: PhantomData<E>,
u: PhantomData<Uint>,
}
impl<I, Uint, E: ParseError<I>> Parser<I> for LeUint<Uint, E>
where
I: Input<Item = u8>,
Uint: Default + Shl<u8, Output = Uint> + Add<Uint, Output = Uint> + From<u8>,
{
type Output = Uint;
type Error = E;
#[inline(always)]
fn process<OM: crate::OutputMode>(
&mut self,
input: I,
) -> crate::PResult<OM, I, Self::Output, Self::Error> {
if input.input_len() < self.bound {
if OM::Incomplete::is_streaming() {
Err(Err::Incomplete(Needed::new(self.bound - input.input_len())))
} else {
Err(Err::Error(OM::Error::bind(|| {
make_error(input, ErrorKind::Eof)
})))
}
} else {
let res = OM::Output::bind(|| {
let mut res = Uint::default();
for (index, byte) in input.iter_elements().take(self.bound).enumerate() {
res = res + (Uint::from(byte) << (8 * index as u8));
}
res
});
Ok((input.take_from(self.bound), res))
}
}
}
#[inline]
pub fn le_u8<I, E: ParseError<I>>() -> impl Parser<I, Output = u8, Error = E>
where
I: Input<Item = u8>,
{
le_uint(1)
}
#[inline]
pub fn le_u16<I, E: ParseError<I>>() -> impl Parser<I, Output = u16, Error = E>
where
I: Input<Item = u8>,
{
le_uint(2)
}
#[inline]
pub fn le_u24<I, E: ParseError<I>>() -> impl Parser<I, Output = u32, Error = E>
where
I: Input<Item = u8>,
{
le_uint(3)
}
#[inline]
pub fn le_u32<I, E: ParseError<I>>() -> impl Parser<I, Output = u32, Error = E>
where
I: Input<Item = u8>,
{
le_uint(4)
}
#[inline]
pub fn le_u64<I, E: ParseError<I>>() -> impl Parser<I, Output = u64, Error = E>
where
I: Input<Item = u8>,
{
le_uint(8)
}
#[inline]
pub fn le_u128<I, E: ParseError<I>>() -> impl Parser<I, Output = u128, Error = E>
where
I: Input<Item = u8>,
{
le_uint(16)
}
#[inline]
pub fn le_i8<I, E: ParseError<I>>() -> impl Parser<I, Output = i8, Error = E>
where
I: Input<Item = u8>,
{
le_u8().map(|x| x as i8)
}
#[inline]
pub fn le_i16<I, E: ParseError<I>>() -> impl Parser<I, Output = i16, Error = E>
where
I: Input<Item = u8>,
{
le_u16().map(|x| x as i16)
}
#[inline]
pub fn le_i24<I, E: ParseError<I>>() -> impl Parser<I, Output = i32, Error = E>
where
I: Input<Item = u8>,
{
le_u24().map(|x| {
if x & 0x80_00_00 != 0 {
(x | 0xff_00_00_00) as i32
} else {
x as i32
}
})
}
#[inline]
pub fn le_i32<I, E: ParseError<I>>() -> impl Parser<I, Output = i32, Error = E>
where
I: Input<Item = u8>,
{
le_u32().map(|x| x as i32)
}
#[inline]
pub fn le_i64<I, E: ParseError<I>>() -> impl Parser<I, Output = i64, Error = E>
where
I: Input<Item = u8>,
{
le_u64().map(|x| x as i64)
}
#[inline]
pub fn le_i128<I, E: ParseError<I>>() -> impl Parser<I, Output = i128, Error = E>
where
I: Input<Item = u8>,
{
le_u128().map(|x| x as i128)
}
#[inline]
pub fn u8<I, E: ParseError<I>>() -> impl Parser<I, Output = u8, Error = E>
where
I: Input<Item = u8>,
{
be_u8()
}
#[inline]
pub fn u16<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = u16, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_u16()),
crate::number::Endianness::Little => Either::Right(le_u16()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_u16()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_u16()),
}
}
#[inline]
pub fn u24<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = u32, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_u24()),
crate::number::Endianness::Little => Either::Right(le_u24()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_u24()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_u24()),
}
}
#[inline]
pub fn u32<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = u32, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_u32()),
crate::number::Endianness::Little => Either::Right(le_u32()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_u32()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_u32()),
}
}
#[inline]
pub fn u64<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = u64, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_u64()),
crate::number::Endianness::Little => Either::Right(le_u64()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_u64()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_u64()),
}
}
#[inline]
pub fn u128<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = u128, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_u128()),
crate::number::Endianness::Little => Either::Right(le_u128()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_u128()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_u128()),
}
}
#[inline]
pub fn i8<I, E: ParseError<I>>() -> impl Parser<I, Output = i8, Error = E>
where
I: Input<Item = u8>,
{
u8().map(|x| x as i8)
}
#[inline]
pub fn i16<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = i16, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_i16()),
crate::number::Endianness::Little => Either::Right(le_i16()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_i16()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_i16()),
}
}
#[inline]
pub fn i24<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = i32, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_i24()),
crate::number::Endianness::Little => Either::Right(le_i24()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_i24()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_i24()),
}
}
#[inline]
pub fn i32<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = i32, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_i32()),
crate::number::Endianness::Little => Either::Right(le_i32()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_i32()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_i32()),
}
}
#[inline]
pub fn i64<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = i64, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_i64()),
crate::number::Endianness::Little => Either::Right(le_i64()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_i64()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_i64()),
}
}
#[inline]
pub fn i128<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = i128, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_i128()),
crate::number::Endianness::Little => Either::Right(le_i128()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_i128()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_i128()),
}
}
#[inline]
pub fn be_f32<I, E: ParseError<I>>() -> impl Parser<I, Output = f32, Error = E>
where
I: Input<Item = u8>,
{
be_u32().map(f32::from_bits)
}
#[inline]
pub fn be_f64<I, E: ParseError<I>>() -> impl Parser<I, Output = f64, Error = E>
where
I: Input<Item = u8>,
{
be_u64().map(f64::from_bits)
}
#[inline]
pub fn le_f32<I, E: ParseError<I>>() -> impl Parser<I, Output = f32, Error = E>
where
I: Input<Item = u8>,
{
le_u32().map(f32::from_bits)
}
#[inline]
pub fn le_f64<I, E: ParseError<I>>() -> impl Parser<I, Output = f64, Error = E>
where
I: Input<Item = u8>,
{
le_u64().map(f64::from_bits)
}
#[inline]
pub fn f32<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = f32, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_f32()),
crate::number::Endianness::Little => Either::Right(le_f32()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_f32()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_f32()),
}
}
#[inline]
pub fn f64<I, E: ParseError<I>>(
endian: crate::number::Endianness,
) -> impl Parser<I, Output = f64, Error = E>
where
I: Input<Item = u8>,
{
match endian {
crate::number::Endianness::Big => Either::Left(be_f64()),
crate::number::Endianness::Little => Either::Right(le_f64()),
#[cfg(target_endian = "big")]
crate::number::Endianness::Native => Either::Left(be_f64()),
#[cfg(target_endian = "little")]
crate::number::Endianness::Native => Either::Right(le_f64()),
}
}
#[rustfmt::skip]
pub fn recognize_float<T, E:ParseError<T>>() -> impl Parser<T, Output=T,Error= E>
where
T: Clone + Offset,
T: Input,
<T as Input>::Item: AsChar,
{
recognize((
opt(alt((char('+'), char('-')))),
alt((
map((digit1(), opt(pair(char('.'), opt(digit1())))), |_| ()),
map((char('.'), digit1()), |_| ())
)),
opt((
alt((char('e'), char('E'))),
opt(alt((char('+'), char('-')))),
cut(digit1())
))
))
}
pub fn recognize_float_or_exceptions<T, E: ParseError<T>>() -> impl Parser<T, Output = T, Error = E>
where
T: Clone + Offset,
T: Input + Compare<&'static str>,
<T as Input>::Item: AsChar,
{
alt((
recognize_float::<_, E>(),
|i: T| {
crate::bytes::streaming::tag_no_case::<_, _, E>("nan")(i.clone())
.map_err(|_| crate::Err::Error(E::from_error_kind(i, ErrorKind::Float)))
},
|i: T| {
crate::bytes::streaming::tag_no_case::<_, _, E>("infinity")(i.clone())
.map_err(|_| crate::Err::Error(E::from_error_kind(i, ErrorKind::Float)))
},
|i: T| {
crate::bytes::streaming::tag_no_case::<_, _, E>("inf")(i.clone())
.map_err(|_| crate::Err::Error(E::from_error_kind(i, ErrorKind::Float)))
},
))
}
pub fn float<T, E: ParseError<T>>() -> impl Parser<T, Output = f32, Error = E>
where
T: Clone + Offset,
T: Input + crate::traits::ParseTo<f32> + Compare<&'static str>,
<T as Input>::Item: AsChar + Clone,
T: AsBytes,
T: for<'a> Compare<&'a [u8]>,
{
Float {
o: PhantomData,
e: PhantomData,
}
}
pub fn double<T, E: ParseError<T>>() -> impl Parser<T, Output = f64, Error = E>
where
T: Clone + Offset,
T: Input + crate::traits::ParseTo<f64> + Compare<&'static str>,
<T as Input>::Item: AsChar + Clone,
T: AsBytes,
T: for<'a> Compare<&'a [u8]>,
{
Float {
o: PhantomData,
e: PhantomData,
}
}
struct Float<O, E> {
o: PhantomData<O>,
e: PhantomData<E>,
}
impl<I, O, E: ParseError<I>> Parser<I> for Float<O, E>
where
I: Clone + Offset,
I: Input + crate::traits::ParseTo<O> + Compare<&'static str>,
<I as Input>::Item: AsChar + Clone,
I: AsBytes,
I: for<'a> Compare<&'a [u8]>,
{
type Output = O;
type Error = E;
fn process<OM: crate::OutputMode>(
&mut self,
input: I,
) -> crate::PResult<OM, I, Self::Output, Self::Error> {
let (i, s) =
recognize_float_or_exceptions().process::<OutputM<Emit, OM::Error, OM::Incomplete>>(input)?;
match s.parse_to() {
Some(f) => Ok((i, OM::Output::bind(|| f))),
None => Err(crate::Err::Error(OM::Error::bind(|| {
E::from_error_kind(i, crate::error::ErrorKind::Float)
}))),
}
}
}
#[cfg(test)]
#[cfg(feature = "std")]
mod tests {
use super::*;
use crate::error::ErrorKind;
use crate::internal::Err;
macro_rules! assert_parse(
($left: expr, $right: expr) => {
let res: $crate::IResult<_, _, (_, ErrorKind)> = $left;
assert_eq!(res, $right);
};
);
#[test]
fn float_test() {
let mut test_cases = vec![
"+3.14",
"3.14",
"-3.14",
"0",
"0.0",
"1.",
".789",
"-.5",
"1e7",
"-1E-7",
".3e-2",
"1.e4",
"1.2e4",
"12.34",
"-1.234E-12",
"-1.234e-12",
"0.00000000000000000087",
];
for test in test_cases.drain(..) {
let expected32 = str::parse::<f32>(test).unwrap();
let expected64 = str::parse::<f64>(test).unwrap();
println!("now parsing: {} -> {}", test, expected32);
assert_parse!(recognize_float().parse_complete(test), Ok(("", test)));
assert_parse!(
double().parse_complete(test.as_bytes()),
Ok((&b""[..], expected64))
);
assert_parse!(double().parse_complete(test), Ok(("", expected64)));
}
let remaining_exponent = "-1.234E-";
assert_parse!(
recognize_float().parse_complete(remaining_exponent),
Err(Err::Failure(("", ErrorKind::Digit)))
);
}
}