Struct serde_gff::parser::Parser

source ·

pub struct Parser<R: Read + Seek> { /* private fields */ }

Expand description

Реализует потоковый (наподобие SAX) парсер GFF файла. Парсер реализует интерфейс итератора по токенам. Каждый вызов метода next_token возвращает следующий токен из потока, который сразу же может быть использован для анализа или сохранен для дальнейшего использования.

События разбора

Парсер представляет собой pull-парсер, т.е. для получения данных его нужно опрашивать внешним циклом (в противоположность push-парсеру, который сам испускает события при разборе очередного элемента).

Так как GFF файл может быть представлен в XML виде, и эта структура проще для представления в тексте, то ниже показан пример файла, в котором отмечены места, после которых парсер генерирует токены при разборе. В виде кода Rust описанная структура данных может быть представлена таким образом:

/// Empty structure; shown as the `<STRUCT tag='1'>` element nested in the `struc` field
/// of the XML representation below.
struct Struct;
/// List element; shown as the `<STRUCT tag='2'>` element inside the `list` field
/// of the XML representation below.
struct Item {
  /// Field labelled `double` with type `DOUBLE` in the XML representation.
  double: f64,
}
/// Root structure; shown as the outermost `<STRUCT tag='4294967295'>` element
/// of the XML representation below.
struct Root {
  /// Field labelled `int` with type `INT` in the XML representation.
  int: i32,
  /// Field labelled `struc` with type `STRUCT` in the XML representation.
  struc: Struct,
  /// Field labelled `list` with type `LIST` in the XML representation.
  list: Vec<Item>,
}

XML представление:

<STRUCT tag='4294967295'>[1]
  <FIELD label='int'[2] type='INT'>8</FIELD>[3]
  <FIELD label='struc'[4] type='STRUCT'>
    <STRUCT tag='1'>[5]
    </STRUCT>[6]
  </FIELD>
  <FIELD label='list'[7] type='LIST'>[8]
    <STRUCT tag='2'>[9]
      <FIELD label='double'[10] type='DOUBLE'>0.000000</FIELD>[11]
    </STRUCT>[12]
  </FIELD>[13]
</STRUCT>[14]

Токены, получаемые последовательным вызовом next_token:

1. RootBegin. Прочитано описание корневой структуры – в этом состоянии уже известен тег типа структуры и количество полей в ней.
2. Label. Прочитан индекс метки, по этому индексу может быть прочитано значение метки.
3. Value. Прочитано примитивное значение.
4. Label. Прочитан индекс метки, по этому индексу может быть прочитано значение метки.
5. StructBegin. Прочитано количество полей структуры и ее тег.
6. StructEnd. Структура прочитана.
7. Label. Прочитан индекс метки, по этому индексу может быть прочитано значение метки.
8. ListBegin. Прочитано количество элементов списка.
9. ItemBegin. Прочитано количество полей структуры, ее тег, а также предоставляется информация о порядковом индексе элемента.
10. Label. Прочитан индекс метки, по этому индексу может быть прочитано значение метки.
11. Value. Прочитан индекс большого значения (больше 4-х байт), по этому индексу само значение может быть прочитано отдельным вызовом.
12. ItemEnd. Элемент списка прочитан.
13. ListEnd. Весь список прочитан.
14. RootEnd. Файл прочитан.

Пример

В данном примере читается файл с диска, и в потоковом режиме выводится на экран, формируя что-то, напоминающее JSON.

use std::fs::File;
use serde_gff::parser::Parser;
use serde_gff::parser::Token::*;

// Open the file and create the parser. On construction the parser immediately reads a small
// portion of the data -- the header -- which it needs in order to resolve references correctly
let file = File::open("test-data/all.gff").expect("test file not exist");
let mut parser = Parser::new(file).expect("reading GFF header failed");
let mut indent = 0;
// Here the `Iterator` implementation is used to walk the file, on the assumption that no
// errors occur while reading. If errors matter, use the `next_token` method instead.
//
// `while let` (rather than `for`) is deliberate: `parser` must stay available inside the
// loop body for the `read_label` / `read_value` calls. The loop stops as soon as the
// iterator returns `None`, i.e. the file has ended or an error occurred.
while let Some(token) = parser.next() {
  match token {
    RootBegin {..} | RootEnd => {},
    // Wrap structures in `{ ... }`
    StructBegin {..} => { indent += 1; println!("{{"); },
    StructEnd        => { indent -= 1; println!("{:indent$}}}", "", indent=indent*2); },
    // Wrap lists in `[ ... ]`
    ListBegin {..}   => { indent += 1; println!("["); },
    ListEnd          => { indent -= 1; println!("{:indent$}]", "", indent=indent*2); },
    // Wrap list items in `[index]: { ... }`
    ItemBegin { index, .. } => {
      println!("{:indent$}[{}]: {{", "", index, indent=indent*2);
      indent += 1;
    },
    ItemEnd => {
      indent -= 1;
      println!("{:indent$}}}", "", indent=indent*2);
    },

    Label(index) => {
      // Label values are physically stored elsewhere in the file. Since they may be of no
      // interest while iterating, the token carries only the index of the label (field name)
      // in use. Here we do want them, so perform the full read.
      // The panic message is built lazily, only if the read actually fails.
      let label = parser
        .read_label(index)
        .unwrap_or_else(|err| panic!("can't read label {:?}: {:?}", index, err));
      print!("{:indent$}{}: ", "", label, indent=indent*2);
    },

    // The same goes for values. Some values are available immediately (those no larger than
    // 4 bytes); others are stored in other parts of the file and must be read explicitly.
    // If only one particular kind of value is of interest, one of the parser's `read_*`
    // methods can be used instead.
    Value(value) => println!("{:?}", parser.read_value(value).expect("can't read value")),
  }
}

Struct serde_gff::parser::Parser

Implementations

impl<R: Read + Seek> Parser<R>

pub fn new(reader: R) -> Result<Self>

pub fn with_encoding( reader: R, encoding: EncodingRef, trap: DecoderTrap) -> Result<Self>

pub fn next_token(&mut self) -> Result<Token>

pub fn skip_next(&mut self, token: Token)

pub fn read_label(&mut self, index: LabelIndex) -> Result<Label>

pub fn read_u64(&mut self, index: U64Index) -> Result<u64>

pub fn read_i64(&mut self, index: I64Index) -> Result<i64>

pub fn read_f64(&mut self, index: F64Index) -> Result<f64>

pub fn read_string(&mut self, index: StringIndex) -> Result<String>

pub fn read_resref(&mut self, index: ResRefIndex) -> Result<ResRef>

pub fn read_loc_string(&mut self, index: LocStringIndex) -> Result<LocString>

pub fn read_byte_buf(&mut self, index: BinaryIndex) -> Result<Vec<u8>>

pub fn read_value(&mut self, value: SimpleValueRef) -> Result<SimpleValue>

Trait Implementations

impl<R: Read + Seek> Iterator for Parser<R>

type Item = Token

fn next(&mut self) -> Option<Token>

fn size_hint(&self) -> (usize, Option<usize>)

fn next_chunk<const N: usize>(&mut self) -> Result<[Self::Item; N], IntoIter<Self::Item, N>> where Self: Sized,

fn count(self) -> usize where Self: Sized,

fn last(self) -> Option<Self::Item> where Self: Sized,

fn advance_by(&mut self, n: usize) -> Result<(), usize>

fn nth(&mut self, n: usize) -> Option<Self::Item>

fn step_by(self, step: usize) -> StepBy<Self> where Self: Sized,

fn chain<U>(self, other: U) -> Chain<Self, <U as IntoIterator>::IntoIter> where Self: Sized, U: IntoIterator<Item = Self::Item>,

fn zip<U>(self, other: U) -> Zip<Self, <U as IntoIterator>::IntoIter> where Self: Sized, U: IntoIterator,

fn intersperse_with<G>(self, separator: G) -> IntersperseWith<Self, G> where Self: Sized, G: FnMut() -> Self::Item,

fn map<B, F>(self, f: F) -> Map<Self, F> where Self: Sized, F: FnMut(Self::Item) -> B,

fn for_each<F>(self, f: F) where Self: Sized, F: FnMut(Self::Item),

fn filter<P>(self, predicate: P) -> Filter<Self, P> where Self: Sized, P: FnMut(&Self::Item) -> bool,

fn filter_map<B, F>(self, f: F) -> FilterMap<Self, F> where Self: Sized, F: FnMut(Self::Item) -> Option<B>,

fn enumerate(self) -> Enumerate<Self> where Self: Sized,

fn peekable(self) -> Peekable<Self> where Self: Sized,

fn skip_while<P>(self, predicate: P) -> SkipWhile<Self, P> where Self: Sized, P: FnMut(&Self::Item) -> bool,

fn take_while<P>(self, predicate: P) -> TakeWhile<Self, P> where Self: Sized, P: FnMut(&Self::Item) -> bool,

fn map_while<B, P>(self, predicate: P) -> MapWhile<Self, P> where Self: Sized, P: FnMut(Self::Item) -> Option<B>,

fn skip(self, n: usize) -> Skip<Self> where Self: Sized,

fn take(self, n: usize) -> Take<Self> where Self: Sized,

fn scan<St, B, F>(self, initial_state: St, f: F) -> Scan<Self, St, F> where Self: Sized, F: FnMut(&mut St, Self::Item) -> Option<B>,

fn flat_map<U, F>(self, f: F) -> FlatMap<Self, U, F> where Self: Sized, U: IntoIterator, F: FnMut(Self::Item) -> U,

fn fuse(self) -> Fuse<Self> where Self: Sized,

fn inspect<F>(self, f: F) -> Inspect<Self, F> where Self: Sized, F: FnMut(&Self::Item),

fn by_ref(&mut self) -> &mut Self where Self: Sized,

fn collect<B>(self) -> B where B: FromIterator<Self::Item>, Self: Sized,

fn collect_into<E>(self, collection: &mut E) -> &mut E where E: Extend<Self::Item>, Self: Sized,

fn partition<B, F>(self, f: F) -> (B, B) where Self: Sized, B: Default + Extend<Self::Item>, F: FnMut(&Self::Item) -> bool,

fn is_partitioned<P>(self, predicate: P) -> bool where Self: Sized, P: FnMut(Self::Item) -> bool,

fn try_fold<B, F, R>(&mut self, init: B, f: F) -> R where Self: Sized, F: FnMut(B, Self::Item) -> R, R: Try<Output = B>,

fn try_for_each<F, R>(&mut self, f: F) -> R where Self: Sized, F: FnMut(Self::Item) -> R, R: Try<Output = ()>,

fn fold<B, F>(self, init: B, f: F) -> B where Self: Sized, F: FnMut(B, Self::Item) -> B,

fn reduce<F>(self, f: F) -> Option<Self::Item> where Self: Sized, F: FnMut(Self::Item, Self::Item) -> Self::Item,

fn try_reduce<F, R>(&mut self, f: F) -> <<R as Try>::Residual as Residual<Option<<R as Try>::Output>>>::TryType where Self: Sized, F: FnMut(Self::Item, Self::Item) -> R, R: Try<Output = Self::Item>, <R as Try>::Residual: Residual<Option<Self::Item>>,

fn all<F>(&mut self, f: F) -> bool where Self: Sized, F: FnMut(Self::Item) -> bool,

fn any<F>(&mut self, f: F) -> bool where Self: Sized, F: FnMut(Self::Item) -> bool,

fn find<P>(&mut self, predicate: P) -> Option<Self::Item> where Self: Sized, P: FnMut(&Self::Item) -> bool,

fn find_map<B, F>(&mut self, f: F) -> Option<B> where Self: Sized, F: FnMut(Self::Item) -> Option<B>,

fn try_find<F, R>(&mut self, f: F) -> <<R as Try>::Residual as Residual<Option<Self::Item>>>::TryType where Self: Sized, F: FnMut(&Self::Item) -> R, R: Try<Output = bool>, <R as Try>::Residual: Residual<Option<Self::Item>>,

fn position<P>(&mut self, predicate: P) -> Option<usize> where Self: Sized, P: FnMut(Self::Item) -> bool,

fn max_by_key<B, F>(self, f: F) -> Option<Self::Item> where B: Ord, Self: Sized, F: FnMut(&Self::Item) -> B,

fn max_by<F>(self, compare: F) -> Option<Self::Item> where Self: Sized, F: FnMut(&Self::Item, &Self::Item) -> Ordering,

fn min_by_key<B, F>(self, f: F) -> Option<Self::Item> where B: Ord, Self: Sized, F: FnMut(&Self::Item) -> B,

fn min_by<F>(self, compare: F) -> Option<Self::Item> where Self: Sized, F: FnMut(&Self::Item, &Self::Item) -> Ordering,

fn unzip<A, B, FromA, FromB>(self) -> (FromA, FromB) where FromA: Default + Extend<A>, FromB: Default + Extend<B>, Self: Sized + Iterator<Item = (A, B)>,

fn copied<'a, T>(self) -> Copied<Self> where T: 'a + Copy, Self: Sized + Iterator<Item = &'a T>,

fn cloned<'a, T>(self) -> Cloned<Self> where T: 'a + Clone, Self: Sized + Iterator<Item = &'a T>,

fn array_chunks<const N: usize>(self) -> ArrayChunks<Self, N> where Self: Sized,

fn sum<S>(self) -> S where Self: Sized, S: Sum<Self::Item>,

fn product<P>(self) -> P where Self: Sized, P: Product<Self::Item>,

fn cmp_by<I, F>(self, other: I, cmp: F) -> Ordering where Self: Sized, I: IntoIterator, F: FnMut(Self::Item, <I as IntoIterator>::Item) -> Ordering,

fn partial_cmp<I>(self, other: I) -> Option<Ordering> where I: IntoIterator, Self::Item: PartialOrd<<I as IntoIterator>::Item>, Self: Sized,

fn partial_cmp_by<I, F>(self, other: I, partial_cmp: F) -> Option<Ordering> where Self: Sized, I: IntoIterator, F: FnMut(Self::Item, <I as IntoIterator>::Item) -> Option<Ordering>,

fn eq<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<<I as IntoIterator>::Item>, Self: Sized,

fn eq_by<I, F>(self, other: I, eq: F) -> bool where Self: Sized, I: IntoIterator, F: FnMut(Self::Item, <I as IntoIterator>::Item) -> bool,

fn ne<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<<I as IntoIterator>::Item>, Self: Sized,

fn lt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<<I as IntoIterator>::Item>, Self: Sized,

fn le<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<<I as IntoIterator>::Item>, Self: Sized,

fn gt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<<I as IntoIterator>::Item>, Self: Sized,

pub fn with_encoding(
reader: R,
encoding: EncodingRef,
trap: DecoderTrap
) -> Result<Self>

fn next_chunk<const N: usize>(
&mut self
) -> Result<[Self::Item; N], IntoIter<Self::Item, N>>where
Self: Sized,

fn count(self) -> usizewhere
Self: Sized,

fn last(self) -> Option<Self::Item>where
Self: Sized,

fn step_by(self, step: usize) -> StepBy<Self>where
Self: Sized,

fn chain<U>(self, other: U) -> Chain<Self, <U as IntoIterator>::IntoIter>where
Self: Sized,
U: IntoIterator<Item = Self::Item>,

fn zip<U>(self, other: U) -> Zip<Self, <U as IntoIterator>::IntoIter>where
Self: Sized,
U: IntoIterator,

fn intersperse_with<G>(self, separator: G) -> IntersperseWith<Self, G>where
Self: Sized,
G: FnMut() -> Self::Item,

fn map<B, F>(self, f: F) -> Map<Self, F>where
Self: Sized,
F: FnMut(Self::Item) -> B,

fn for_each<F>(self, f: F)where
Self: Sized,
F: FnMut(Self::Item),

fn filter<P>(self, predicate: P) -> Filter<Self, P>where
Self: Sized,
P: FnMut(&Self::Item) -> bool,

fn filter_map<B, F>(self, f: F) -> FilterMap<Self, F>where
Self: Sized,
F: FnMut(Self::Item) -> Option<B>,

fn enumerate(self) -> Enumerate<Self>where
Self: Sized,

fn peekable(self) -> Peekable<Self>where
Self: Sized,

fn skip_while<P>(self, predicate: P) -> SkipWhile<Self, P>where
Self: Sized,
P: FnMut(&Self::Item) -> bool,

fn take_while<P>(self, predicate: P) -> TakeWhile<Self, P>where
Self: Sized,
P: FnMut(&Self::Item) -> bool,

fn map_while<B, P>(self, predicate: P) -> MapWhile<Self, P>where
Self: Sized,
P: FnMut(Self::Item) -> Option<B>,

fn skip(self, n: usize) -> Skip<Self>where
Self: Sized,

fn take(self, n: usize) -> Take<Self>where
Self: Sized,

fn scan<St, B, F>(self, initial_state: St, f: F) -> Scan<Self, St, F>where
Self: Sized,
F: FnMut(&mut St, Self::Item) -> Option<B>,

fn flat_map<U, F>(self, f: F) -> FlatMap<Self, U, F>where
Self: Sized,
U: IntoIterator,
F: FnMut(Self::Item) -> U,

fn fuse(self) -> Fuse<Self>where
Self: Sized,

fn inspect<F>(self, f: F) -> Inspect<Self, F>where
Self: Sized,
F: FnMut(&Self::Item),

fn by_ref(&mut self) -> &mut Selfwhere
Self: Sized,

fn collect<B>(self) -> Bwhere
B: FromIterator<Self::Item>,
Self: Sized,

fn collect_into<E>(self, collection: &mut E) -> &mut Ewhere
E: Extend<Self::Item>,
Self: Sized,

fn partition<B, F>(self, f: F) -> (B, B)where
Self: Sized,
B: Default + Extend<Self::Item>,
F: FnMut(&Self::Item) -> bool,

fn is_partitioned<P>(self, predicate: P) -> boolwhere
Self: Sized,
P: FnMut(Self::Item) -> bool,

fn try_fold<B, F, R>(&mut self, init: B, f: F) -> Rwhere
Self: Sized,
F: FnMut(B, Self::Item) -> R,
R: Try<Output = B>,

fn try_for_each<F, R>(&mut self, f: F) -> Rwhere
Self: Sized,
F: FnMut(Self::Item) -> R,
R: Try<Output = ()>,

fn fold<B, F>(self, init: B, f: F) -> Bwhere
Self: Sized,
F: FnMut(B, Self::Item) -> B,

fn reduce<F>(self, f: F) -> Option<Self::Item>where
Self: Sized,
F: FnMut(Self::Item, Self::Item) -> Self::Item,

fn try_reduce<F, R>(
&mut self,
f: F
) -> <<R as Try>::Residual as Residual<Option<<R as Try>::Output>>>::TryTypewhere
Self: Sized,
F: FnMut(Self::Item, Self::Item) -> R,
R: Try<Output = Self::Item>,
<R as Try>::Residual: Residual<Option<Self::Item>>,

fn all<F>(&mut self, f: F) -> boolwhere
Self: Sized,
F: FnMut(Self::Item) -> bool,

fn any<F>(&mut self, f: F) -> boolwhere
Self: Sized,
F: FnMut(Self::Item) -> bool,

fn find<P>(&mut self, predicate: P) -> Option<Self::Item>where
Self: Sized,
P: FnMut(&Self::Item) -> bool,

fn find_map<B, F>(&mut self, f: F) -> Option<B>where
Self: Sized,
F: FnMut(Self::Item) -> Option<B>,

fn try_find<F, R>(
&mut self,
f: F
) -> <<R as Try>::Residual as Residual<Option<Self::Item>>>::TryTypewhere
Self: Sized,
F: FnMut(&Self::Item) -> R,
R: Try<Output = bool>,
<R as Try>::Residual: Residual<Option<Self::Item>>,

fn position<P>(&mut self, predicate: P) -> Option<usize>where
Self: Sized,
P: FnMut(Self::Item) -> bool,

fn max_by_key<B, F>(self, f: F) -> Option<Self::Item>where
B: Ord,
Self: Sized,
F: FnMut(&Self::Item) -> B,

fn max_by<F>(self, compare: F) -> Option<Self::Item>where
Self: Sized,
F: FnMut(&Self::Item, &Self::Item) -> Ordering,

fn min_by_key<B, F>(self, f: F) -> Option<Self::Item>where
B: Ord,
Self: Sized,
F: FnMut(&Self::Item) -> B,

fn min_by<F>(self, compare: F) -> Option<Self::Item>where
Self: Sized,
F: FnMut(&Self::Item, &Self::Item) -> Ordering,

fn unzip<A, B, FromA, FromB>(self) -> (FromA, FromB)where
FromA: Default + Extend<A>,
FromB: Default + Extend<B>,
Self: Sized + Iterator<Item = (A, B)>,

fn copied<'a, T>(self) -> Copied<Self>where
T: 'a + Copy,
Self: Sized + Iterator<Item = &'a T>,

fn cloned<'a, T>(self) -> Cloned<Self>where
T: 'a + Clone,
Self: Sized + Iterator<Item = &'a T>,

fn array_chunks<const N: usize>(self) -> ArrayChunks<Self, N>where
Self: Sized,

fn sum<S>(self) -> Swhere
Self: Sized,
S: Sum<Self::Item>,

fn product<P>(self) -> Pwhere
Self: Sized,
P: Product<Self::Item>,

fn cmp_by<I, F>(self, other: I, cmp: F) -> Orderingwhere
Self: Sized,
I: IntoIterator,
F: FnMut(Self::Item, <I as IntoIterator>::Item) -> Ordering,

fn partial_cmp<I>(self, other: I) -> Option<Ordering>where
I: IntoIterator,
Self::Item: PartialOrd<<I as IntoIterator>::Item>,
Self: Sized,

fn partial_cmp_by<I, F>(self, other: I, partial_cmp: F) -> Option<Ordering>where
Self: Sized,
I: IntoIterator,
F: FnMut(Self::Item, <I as IntoIterator>::Item) -> Option<Ordering>,

fn eq<I>(self, other: I) -> boolwhere
I: IntoIterator,
Self::Item: PartialEq<<I as IntoIterator>::Item>,
Self: Sized,

fn eq_by<I, F>(self, other: I, eq: F) -> boolwhere
Self: Sized,
I: IntoIterator,
F: FnMut(Self::Item, <I as IntoIterator>::Item) -> bool,

fn ne<I>(self, other: I) -> boolwhere
I: IntoIterator,
Self::Item: PartialEq<<I as IntoIterator>::Item>,
Self: Sized,

fn lt<I>(self, other: I) -> boolwhere
I: IntoIterator,
Self::Item: PartialOrd<<I as IntoIterator>::Item>,
Self: Sized,

fn le<I>(self, other: I) -> boolwhere
I: IntoIterator,
Self::Item: PartialOrd<<I as IntoIterator>::Item>,
Self: Sized,

fn gt<I>(self, other: I) -> boolwhere
I: IntoIterator,
Self::Item: PartialOrd<<I as IntoIterator>::Item>,
Self: Sized,

fn ge<I>(self, other: I) -> boolwhere
I: IntoIterator,
Self::Item: PartialOrd<<I as IntoIterator>::Item>,
Self: Sized,

fn is_sorted_by<F>(self, compare: F) -> boolwhere
Self: Sized,
F: FnMut(&Self::Item, &Self::Item) -> Option<Ordering>,

fn is_sorted_by_key<F, K>(self, f: F) -> boolwhere
Self: Sized,
F: FnMut(Self::Item) -> K,
K: PartialOrd<K>,

impl<R> Send for Parser<R> where
R: Send,

impl<R> Sync for Parser<R> where
R: Sync,

impl<R> Unpin for Parser<R> where
R: Unpin,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<I> IntoIterator for I where
I: Iterator,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,