// Copyright (c) 2023 Joining7943 <joining@posteo.de>
//
// This software is released under the MIT License.
// https://opensource.org/licenses/MIT
use crate::time::{Multiplier, DEFAULT_TIME_UNIT};
use crate::TimeUnit;
/// A predicate deciding whether an ascii byte counts as a delimiter.
///
/// The [`Delimiter`] is currently a type alias for a function pointer taking a `u8` byte and
/// returning a `bool`. Plain functions and closures which don't capture their environment coerce
/// to this type, so a delimiter can be written inline as a closure (see the examples below).
/// Most likely, the [`Delimiter`] is used to define some whitespace but whitespace definitions
/// differ, so a freely definable predicate provides the most flexible definition of a delimiter.
/// For example the definition of whitespace from rust [`u8::is_ascii_whitespace`]:
///
/// ```text
/// Checks if the value is an ASCII whitespace character: U+0020 SPACE, U+0009 HORIZONTAL TAB,
/// U+000A LINE FEED, U+000C FORM FEED, or U+000D CARRIAGE RETURN.
///
/// Rust uses the WhatWG Infra Standard’s definition of ASCII whitespace. There are several other
/// definitions in wide use. For instance, the POSIX locale includes U+000B VERTICAL TAB as well
/// as all the above characters, but—from the very same specification—the default rule for “field
/// splitting” in the Bourne shell considers only SPACE, HORIZONTAL TAB, and LINE FEED as
/// whitespace.
/// ```
///
/// # Problems
///
/// The delimiter takes a `u8` as input, but matching any non-ascii byte (`0x80 - 0xff`) may lead
/// to serious problems if the input string contains multi-byte utf-8 characters. It's always a
/// good idea to consider this, especially if the input for the parser comes from an untrusted
/// source. So, as a general rule of thumb, don't match any byte within the `0x80 - 0xff` range.
///
/// # Examples
///
/// ```rust
/// use fundu::Delimiter;
///
/// fn is_delimiter(delimiter: Delimiter, byte: u8) -> bool {
///     delimiter(byte)
/// }
///
/// assert!(is_delimiter(
///     |byte| matches!(byte, b' ' | b'\n' | b'\t'),
///     b' '
/// ));
/// assert!(!is_delimiter(
///     |byte| matches!(byte, b' ' | b'\n' | b'\t'),
///     b'\r'
/// ));
/// assert!(is_delimiter(|byte| byte.is_ascii_whitespace(), b'\r'));
/// ```
pub type Delimiter = fn(u8) -> bool;
/// Crate-internal bundle of configuration options.
///
/// The defaults of all fields are defined in [`Config::new`], which [`Config::default`]
/// delegates to.
// NOTE(review): the per-field meanings below are derived from the field names and types only;
// confirm them against the code which consumes this `Config`.
#[derive(Clone, Debug, Eq, PartialEq)]
pub(crate) struct Config {
    /// An optional [`Delimiter`] predicate. `None` by default.
    // NOTE(review): presumably the delimiter allowed between a number and its time unit.
    pub(crate) allow_delimiter: Option<Delimiter>,

    /// The default [`TimeUnit`]. Defaults to `DEFAULT_TIME_UNIT`.
    // NOTE(review): presumably applied when the input carries no time unit.
    pub(crate) default_unit: TimeUnit,

    /// The default [`Multiplier`]. Defaults to `Multiplier(1, 0)`.
    pub(crate) default_multiplier: Multiplier,

    /// Flag for disabling the exponent. `false` by default.
    pub(crate) disable_exponent: bool,

    /// Flag for disabling the fraction. `false` by default.
    pub(crate) disable_fraction: bool,

    /// Flag for disabling infinity. `false` by default.
    pub(crate) disable_infinity: bool,

    /// Flag marking the number as optional. `false` by default.
    pub(crate) number_is_optional: bool,

    /// The upper bound for the exponent. Defaults to `i16::MAX`.
    pub(crate) max_exponent: i16,

    /// The lower bound for the exponent. Defaults to `i16::MIN`.
    pub(crate) min_exponent: i16,

    /// An optional [`Delimiter`] predicate. `None` by default.
    // NOTE(review): presumably enables parsing multiple durations separated by this delimiter.
    pub(crate) parse_multiple: Option<Delimiter>,
}
impl Default for Config {
fn default() -> Self {
Self::new()
}
}
impl Config {
pub(crate) const fn new() -> Self {
Self {
allow_delimiter: None,
default_unit: DEFAULT_TIME_UNIT,
default_multiplier: Multiplier(1, 0),
disable_exponent: false,
disable_fraction: false,
number_is_optional: false,
max_exponent: i16::MAX,
min_exponent: i16::MIN,
disable_infinity: false,
parse_multiple: None,
}
}
}
#[cfg(test)]
mod tests {
    use super::*;

    /// `Config::default()` and `Config::new()` must produce equal configurations.
    #[test]
    fn test_default_for_config() {
        let from_default = Config::default();
        let from_new = Config::new();
        assert_eq!(from_default, from_new);
    }
}