Struct rustlr::lexer_interface::StrTokenizer
pub struct StrTokenizer<'t> {
pub keep_whitespace: bool,
pub keep_newline: bool,
pub keep_comment: bool,
pub line_positions: Vec<usize>,
pub specialeof: &'static str,
pub tab_spaces: usize,
pub allow_newline_in_string: bool,
pub priority_symbols: BTreeMap<&'static str, u32>,
/* private fields */
}
General-purpose, zero-copy lexical analyzer that produces RawTokens from a &str. This tokenizer uses regex for most token categories, but not for everything: for example, to allow string literals that contain escaped quotation marks, a direct loop is implemented. The tokenizer gives the option of returning newlines, whitespaces (with count) and comments as special tokens. It recognizes multi-line string literals, multi-line as well as single-line comments, and returns the starting line and column positions of each token.
Example:
let mut scanner = StrTokenizer::from_str("while (1) fork();//run at your own risk");
scanner.set_line_comment("//");
scanner.keep_comment=true;
scanner.add_single(';'); // separates ; from following symbols
while let Some(token) = scanner.next() {
println!("Token,line,column: {:?}",&token);
}
This code produces the following output:
Token,line,column: (Alphanum("while"), 1, 1)
Token,line,column: (Symbol("("), 1, 7)
Token,line,column: (Num(1), 1, 8)
Token,line,column: (Symbol(")"), 1, 9)
Token,line,column: (Alphanum("fork"), 1, 11)
Token,line,column: (Symbol("("), 1, 15)
Token,line,column: (Symbol(")"), 1, 16)
Token,line,column: (Symbol(";"), 1, 17)
Token,line,column: (Verbatim("//run at your own risk"), 1, 18)
Fields
keep_whitespace: bool
flag to toggle whether whitespaces should be returned as Whitespace tokens, default is false.
keep_newline: bool
flag to toggle whether newline characters (‘\n’) are returned as Newline
tokens. Default is false. Note that if this flag is set to true then
newline characters are treated differently from other whitespaces.
For example, when parsing languages like Python, both keep_whitespace
and keep_newline should be set to true. Change this option in a grammar
with lexattribute keep_newline=true.
keep_comment: bool
flag to determine if comments are kept and returned as Verbatim tokens, default is false.
line_positions: Vec<usize>
vector of the starting byte position of each line; position 0 is not used.
specialeof: &'static str
tab_spaces: usize
number of whitespaces to count for each tab (default 6). This can be
changed with a declaration such as lexattribute tab_spaces=8. Do not
set this value to zero.
allow_newline_in_string: bool
allows string literals to contain non-escaped newline characters. Warning: changing the default (false) may reduce the accuracy of error reporting.
priority_symbols: BTreeMap<&'static str, u32>
Multiset of verbatim symbols that have priority over other categories; sorted by string order. The multiset is implemented as a map from strings to counts.
Implementations
impl<'t> StrTokenizer<'t>
pub fn new() -> StrTokenizer<'t>
creates a new tokenizer with defaults; does not set input.
pub fn map<G, FM: FnOnce(&mut StrTokenizer<'t>) -> G>(&mut self, f: FM) -> G
applies a closure to self; can be used together with lexconditional to invoke custom actions
pub fn current_text(&self) -> &'t str
returns the text of the current token, untrimmed
pub fn add_double(&mut self, s: &'t str)
adds a symbol of exactly length two. If the length is not two, the function has no effect. Note that these symbols override all other types except for leading whitespaces and comment markers; e.g. “//” will have precedence over “/” and “==” will have precedence over “=”.
pub fn add_single(&mut self, c: char)
adds a single-character symbol. This symbol type overrides other types except for whitespaces, comments and double-character symbols.
pub fn add_triple(&mut self, s: &'t str)
adds a symbol of exactly length three
pub fn add_priority_symbol(&mut self, s: &'static str)
multiset-adds a verbatim string as a priority symbol: it will be returned as Symbol(s)
pub fn del_priority_symbol(&mut self, s: &'static str)
multiset-removes a verbatim string as a priority symbol
pub fn skip_to(&mut self, target: &'static str)
skips to the last occurrence of the target string, or to the end of input, and returns a RawToken::Skipto token.
pub fn skip_reset(&mut self)
cancels recognition of skip_to (called internally)
pub fn skip_match(&mut self, lbr: &'static str, rbr: &'static str, offset: i32, delimit: &'static str)
StrTokenizer can do a little more than recognize regular expressions. It can detect matching brackets and return the bracket-enclosed text as a RawToken::Skipmatched token. An offset of 1 is recommended, as this call is usually made after an instance of the opening left bracket has been seen as lookahead. The operation maintains a counter, starting at the offset, that increases every time a left bracket is seen and decreases with every right bracket; when the counter reaches 0, the skipped text is returned in a RawToken::Skipmatched token. Searching stops when the delimit string is reached. If delimit is the empty string, the search continues to the end of input.
pub fn add_custom(&mut self, tkind: &'static str, reg_expr: &str)
adds a custom-defined regex, which will correspond to the RawToken::Custom variant. Custom regular expressions should not start with whitespaces and will override all other types. Multiple Custom types are matched in the order in which they were declared in the grammar file.
pub fn set_input(&mut self, inp: &'t str)
sets the input str to be parsed and resets position information. Note: trailing whitespaces are always trimmed from the input.
pub fn set_line_comment(&mut self, cm: &'t str)
sets the symbol that begins a single-line comment. The default is “//”. If this is set to the empty string then no line-comments are recognized.
pub fn set_multiline_comments(&mut self, cm: &'t str)
sets the symbols used to delineate multi-line comments using a whitespace separated string such as “/* */”. These symbols are also the default. Set this to the empty string to disable multi-line comments.
pub fn current_position(&self) -> usize
returns the current absolute byte position of the tokenizer
pub fn previous_position(&self) -> usize
returns the previous absolute byte position of the tokenizer
pub fn get_source(&self) -> &str
returns the source of the tokenizer, such as a URL or filename
pub fn set_source<'u: 't>(&mut self, s: &'u str)
pub fn current_line(&self) -> &str
gets the current line of the source input
pub fn get_line(&self, i: usize) -> Option<&str>
Retrieves the ith line of the raw input, if line index i is valid. This function is intended to be called once the tokenizer has completed its task of scanning and tokenizing the entire input. Otherwise, it may return None if the tokenizer has not yet scanned up to the line indicated. That is, it is intended for error message generation when evaluating the AST post-parsing.
pub fn get_slice(&self, start: usize, end: usize) -> &str
Retrieves the source string slice at the indicated indices; returns the empty string if indices are invalid. The default implementation returns the empty string.
pub fn backtrack(&mut self, offset: usize)
impl<'t> StrTokenizer<'t>
pub fn from_source(ls: &'t LexSource<'t>) -> StrTokenizer<'t>
creates a StrTokenizer from a LexSource structure that contains a string with the contents of the source, and calls StrTokenizer::set_input to reference that string. For example, to create a tokenizer that reads from a file:
let source = LexSource::new(source_path).unwrap();
let mut tokenizer = StrTokenizer::from_source(&source);
pub fn from_str(s: &'t str) -> StrTokenizer<'t>
creates a string tokenizer and sets the input to the given str.
Trait Implementations
impl<'t> Iterator for StrTokenizer<'t>
fn next(&mut self) -> Option<(RawToken<'t>, usize, usize)>