pub struct StreamingParser<R: Read> { /* private fields */ }
Expand description
Streaming HEDL parser.
Processes HEDL documents incrementally, yielding NodeEvent items as they
are parsed without loading the entire document into memory.
Implementations§
Source§impl<R: Read> StreamingParser<R>
impl<R: Read> StreamingParser<R>
Sourcepub fn new(reader: R) -> StreamResult<Self>
pub fn new(reader: R) -> StreamResult<Self>
Create a new streaming parser with default configuration.
The parser immediately reads and validates the HEDL header (version and schema directives). If the header is invalid, this function returns an error.
§Parameters
reader: Any type implementing Read (files, network streams, buffers, etc.)
§Returns
Ok(parser): Parser ready to yield events
Err(e): Header parsing failed (missing version, invalid schema, etc.)
§Examples
§From a File
use hedl_stream::StreamingParser;
use std::fs::File;
use std::io::BufReader;
let file = File::open("data.hedl")?;
let reader = BufReader::new(file);
let parser = StreamingParser::new(reader)?;
§From a String
use hedl_stream::StreamingParser;
use std::io::Cursor;
let data = r#"
%VERSION: 1.0
%STRUCT: User: [id, name]
---
users:@User
| alice, Alice
"#;
let parser = StreamingParser::new(Cursor::new(data))?;
§From Stdin
use hedl_stream::StreamingParser;
use std::io::stdin;
let parser = StreamingParser::new(stdin().lock())?;
§Errors
StreamError::MissingVersion: No %VERSION directive found
StreamError::InvalidVersion: Invalid version format
StreamError::Syntax: Malformed header directive
StreamError::Io: I/O error reading input
Sourcepub fn with_config(
reader: R,
config: StreamingParserConfig,
) -> StreamResult<Self>
pub fn with_config( reader: R, config: StreamingParserConfig, ) -> StreamResult<Self>
Create a streaming parser with custom configuration.
Use this when you need to control memory limits, buffer sizes, or enable timeout protection for untrusted input.
§Parameters
reader: Any type implementing Read
config: Parser configuration options
§Returns
Ok(parser): Parser ready to yield events
Err(e): Configuration invalid or header parsing failed
§Examples
§With Timeout Protection
use hedl_stream::{StreamingParser, StreamingParserConfig};
use std::time::Duration;
use std::io::Cursor;
let config = StreamingParserConfig {
timeout: Some(Duration::from_secs(30)),
..Default::default()
};
let untrusted_input = "...";
let parser = StreamingParser::with_config(
Cursor::new(untrusted_input),
config
)?;
§For Large Files
use hedl_stream::{StreamingParser, StreamingParserConfig};
use std::io::Cursor;
let config = StreamingParserConfig {
buffer_size: 256 * 1024, // 256KB read buffer
max_line_length: 10_000_000, // 10MB max line
max_indent_depth: 1000, // Deep nesting allowed
timeout: None,
..Default::default()
};
let parser = StreamingParser::with_config(
Cursor::new("..."),
config
)?;
§For Constrained Environments
use hedl_stream::{StreamingParser, StreamingParserConfig};
use std::time::Duration;
use std::io::Cursor;
let config = StreamingParserConfig {
buffer_size: 8 * 1024, // Small 8KB buffer
max_line_length: 100_000, // 100KB max line
max_indent_depth: 50, // Limited nesting
timeout: Some(Duration::from_secs(10)),
..Default::default()
};
let parser = StreamingParser::with_config(
Cursor::new("..."),
config
)?;
§Errors
Same as new(), plus:
StreamError::Timeout: Header parsing exceeded configured timeout
Sourcepub fn header(&self) -> Option<&HeaderInfo>
pub fn header(&self) -> Option<&HeaderInfo>
Get the parsed header information.
Returns header metadata including version, schema definitions, aliases, and nesting rules. This is available immediately after parser creation.
§Returns
Some(&HeaderInfo): Header was successfully parsed
None: Should never happen after successful parser creation
§Examples
§Inspecting Schema Definitions
use hedl_stream::StreamingParser;
use std::io::Cursor;
let input = r#"
%VERSION: 1.0
%STRUCT: User: [id, name, email]
%STRUCT: Order: [id, user_id, amount]
%ALIAS: active = "Active"
%NEST: User > Order
---
"#;
let parser = StreamingParser::new(Cursor::new(input))?;
let header = parser.header().unwrap();
// Check version
assert_eq!(header.version, (1, 0));
// Get schema
let user_schema = header.get_schema("User").unwrap();
assert_eq!(user_schema, &vec!["id", "name", "email"]);
// Check aliases
assert_eq!(header.aliases.get("active"), Some(&"Active".to_string()));
// Check nesting rules
assert!(header.get_child_types("User").map_or(false, |v| v.contains(&"Order".to_string())));
§Validating Before Processing
use hedl_stream::StreamingParser;
use std::io::Cursor;
let input = r#"
%VERSION: 1.0
%STRUCT: User: [id, name]
---
users:@User
| alice, Alice
"#;
let parser = StreamingParser::new(Cursor::new(input))?;
// Validate we have the expected schema before processing
if let Some(header) = parser.header() {
if header.version.0 != 1 {
eprintln!("Warning: Unexpected major version");
}
if !header.structs.contains_key("User") {
return Err("Missing User schema".into());
}
}
// Proceed with parsing...
Source§impl StreamingParser<CompressionReader<File>>
impl StreamingParser<CompressionReader<File>>
Sourcepub fn open<P: AsRef<Path>>(path: P) -> StreamResult<Self>
pub fn open<P: AsRef<Path>>(path: P) -> StreamResult<Self>
Open a file with automatic compression detection.
Detects compression format from the file extension (.gz, .zst, .lz4)
and automatically decompresses the content.
§Examples
use hedl_stream::StreamingParser;
// Open a GZIP-compressed HEDL file
let parser = StreamingParser::open("data.hedl.gz")?;
for event in parser {
println!("{:?}", event?);
}
§Errors
StreamError::Io: File not found or cannot be opened
StreamError::Compression: Decompression initialization failed
StreamError::MissingVersion: Invalid HEDL header
Sourcepub fn open_with_config<P: AsRef<Path>>(
path: P,
config: StreamingParserConfig,
) -> StreamResult<Self>
pub fn open_with_config<P: AsRef<Path>>( path: P, config: StreamingParserConfig, ) -> StreamResult<Self>
Open a file with automatic compression detection and custom configuration.
Combines automatic compression detection with custom parser settings.
§Examples
use hedl_stream::{StreamingParser, StreamingParserConfig};
use std::time::Duration;
let config = StreamingParserConfig {
timeout: Some(Duration::from_secs(30)),
..Default::default()
};
let parser = StreamingParser::open_with_config("data.hedl.zst", config)?;
Sourcepub fn open_with_compression<P: AsRef<Path>>(
path: P,
format: CompressionFormat,
) -> StreamResult<Self>
pub fn open_with_compression<P: AsRef<Path>>( path: P, format: CompressionFormat, ) -> StreamResult<Self>
Open a file with explicit compression format.
Use this when the file extension doesn’t match the actual compression format, or when you want to force a specific decompression algorithm.
§Examples
use hedl_stream::StreamingParser;
use hedl_stream::compression::CompressionFormat;
// File has no extension but is GZIP compressed
let parser = StreamingParser::open_with_compression(
"data.hedl",
CompressionFormat::Gzip,
)?;
Trait Implementations§
Source§impl<R: Read> Iterator for StreamingParser<R>
impl<R: Read> Iterator for StreamingParser<R>
Source§fn next(&mut self) -> Option<Self::Item>
fn next(&mut self) -> Option<Self::Item>
Source§fn next_chunk<const N: usize>(
&mut self,
) -> Result<[Self::Item; N], IntoIter<Self::Item, N>>where
Self: Sized,
fn next_chunk<const N: usize>(
&mut self,
) -> Result<[Self::Item; N], IntoIter<Self::Item, N>>where
Self: Sized,
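This is a nightly-only experimental API. (iter_next_chunk)
Advances the iterator and returns an array containing the next N values. Read more
1.0.0 · Source§fn size_hint(&self) -> (usize, Option<usize>)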
fn size_hint(&self) -> (usize, Option<usize>)
1.0.0 · Source§fn count(self) -> usizewhere
Self: Sized,
fn count(self) -> usizewhere
Self: Sized,
1.0.0 · Source§fn last(self) -> Option<Self::Item>where
Self: Sized,
fn last(self) -> Option<Self::Item>where
Self: Sized,
Source§fn advance_by(&mut self, n: usize) -> Result<(), NonZero<usize>>
fn advance_by(&mut self, n: usize) -> Result<(), NonZero<usize>>
This is a nightly-only experimental API. (iter_advance_by)
Advances the iterator by n elements. Read more
1.0.0 · Source§fn nth(&mut self, n: usize) -> Option<Self::Item>
fn nth(&mut self, n: usize) -> Option<Self::Item>
Returns the nth element of the iterator. Read more
1.28.0 · Source§fn step_by(self, step: usize) -> StepBy<Self> where
Self: Sized,
fn step_by(self, step: usize) -> StepBy<Self>where
Self: Sized,
1.0.0 · Source§fn chain<U>(self, other: U) -> Chain<Self, <U as IntoIterator>::IntoIter>
fn chain<U>(self, other: U) -> Chain<Self, <U as IntoIterator>::IntoIter>
1.0.0 · Source§fn zip<U>(self, other: U) -> Zip<Self, <U as IntoIterator>::IntoIter>where
Self: Sized,
U: IntoIterator,
fn zip<U>(self, other: U) -> Zip<Self, <U as IntoIterator>::IntoIter>where
Self: Sized,
U: IntoIterator,
Source§fn intersperse(self, separator: Self::Item) -> Intersperse<Self>
fn intersperse(self, separator: Self::Item) -> Intersperse<Self>
This is a nightly-only experimental API. (iter_intersperse)
Creates a new iterator which places a copy of separator between adjacent
items of the original iterator. Read more
Source§fn intersperse_with<G>(self, separator: G) -> IntersperseWith<Self, G>
fn intersperse_with<G>(self, separator: G) -> IntersperseWith<Self, G>
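This is a nightly-only experimental API. (iter_intersperse)
Creates a new iterator which places an item generated by separator
between adjacent items of the original iterator. Read more
1.0.0 · Source§fn map<B, F>(self, f: F) -> Map<Self, F>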
fn map<B, F>(self, f: F) -> Map<Self, F>
1.0.0 · Source§fn filter<P>(self, predicate: P) -> Filter<Self, P>
fn filter<P>(self, predicate: P) -> Filter<Self, P>
1.0.0 · Source§fn filter_map<B, F>(self, f: F) -> FilterMap<Self, F>
fn filter_map<B, F>(self, f: F) -> FilterMap<Self, F>
1.0.0 · Source§fn enumerate(self) -> Enumerate<Self>where
Self: Sized,
fn enumerate(self) -> Enumerate<Self>where
Self: Sized,
1.0.0 · Source§fn skip_while<P>(self, predicate: P) -> SkipWhile<Self, P>
fn skip_while<P>(self, predicate: P) -> SkipWhile<Self, P>
1.0.0 · Source§fn take_while<P>(self, predicate: P) -> TakeWhile<Self, P>
fn take_while<P>(self, predicate: P) -> TakeWhile<Self, P>
1.57.0 · Source§fn map_while<B, P>(self, predicate: P) -> MapWhile<Self, P>
fn map_while<B, P>(self, predicate: P) -> MapWhile<Self, P>
1.0.0 · Source§fn skip(self, n: usize) -> Skip<Self>where
Self: Sized,
fn skip(self, n: usize) -> Skip<Self>where
Self: Sized,
Creates an iterator that skips the first n elements. Read more
1.0.0 · Source§fn take(self, n: usize) -> Take<Self> where
Self: Sized,
fn take(self, n: usize) -> Take<Self>where
Self: Sized,
Creates an iterator that yields the first n elements, or fewer
if the underlying iterator ends sooner. Read more
1.0.0 · Source§fn flat_map<U, F>(self, f: F) -> FlatMap<Self, U, F>
fn flat_map<U, F>(self, f: F) -> FlatMap<Self, U, F>
1.29.0 · Source§fn flatten(self) -> Flatten<Self>
fn flatten(self) -> Flatten<Self>
Source§fn map_windows<F, R, const N: usize>(self, f: F) -> MapWindows<Self, F, N>
fn map_windows<F, R, const N: usize>(self, f: F) -> MapWindows<Self, F, N>
This is a nightly-only experimental API. (iter_map_windows)
Calls the given function f for each contiguous window of size N over
self and returns an iterator over the outputs of f. Like slice::windows(),
the windows during mapping overlap as well. Read more
1.0.0 · Source§fn inspect<F>(self, f: F) -> Inspect<Self, F>
fn inspect<F>(self, f: F) -> Inspect<Self, F>
1.0.0 · Source§fn by_ref(&mut self) -> &mut Selfwhere
Self: Sized,
fn by_ref(&mut self) -> &mut Selfwhere
Self: Sized,
Creates a "by reference" adapter for this instance of Iterator. Read more
Source§fn try_collect<B>(
&mut self,
) -> <<Self::Item as Try>::Residual as Residual<B>>::TryType
fn try_collect<B>( &mut self, ) -> <<Self::Item as Try>::Residual as Residual<B>>::TryType
iterator_try_collect)Source§fn collect_into<E>(self, collection: &mut E) -> &mut E
fn collect_into<E>(self, collection: &mut E) -> &mut E
iter_collect_into)1.0.0 · Source§fn partition<B, F>(self, f: F) -> (B, B)
fn partition<B, F>(self, f: F) -> (B, B)
Source§fn is_partitioned<P>(self, predicate: P) -> bool
fn is_partitioned<P>(self, predicate: P) -> bool
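This is a nightly-only experimental API. (iter_is_partitioned)
Checks if the elements of this iterator are partitioned according to the given predicate,
such that all those that return true precede all those that return false. Read more
1.27.0 · Source§fn try_fold<B, F, R>(&mut self, init: B, f: F) -> R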
fn try_fold<B, F, R>(&mut self, init: B, f: F) -> R
1.27.0 · Source§fn try_for_each<F, R>(&mut self, f: F) -> R
fn try_for_each<F, R>(&mut self, f: F) -> R
1.0.0 · Source§fn fold<B, F>(self, init: B, f: F) -> B
fn fold<B, F>(self, init: B, f: F) -> B
1.51.0 · Source§fn reduce<F>(self, f: F) -> Option<Self::Item>
fn reduce<F>(self, f: F) -> Option<Self::Item>
Source§fn try_reduce<R>(
&mut self,
f: impl FnMut(Self::Item, Self::Item) -> R,
) -> <<R as Try>::Residual as Residual<Option<<R as Try>::Output>>>::TryType
fn try_reduce<R>( &mut self, f: impl FnMut(Self::Item, Self::Item) -> R, ) -> <<R as Try>::Residual as Residual<Option<<R as Try>::Output>>>::TryType
iterator_try_reduce)1.0.0 · Source§fn all<F>(&mut self, f: F) -> bool
fn all<F>(&mut self, f: F) -> bool
1.0.0 · Source§fn any<F>(&mut self, f: F) -> bool
fn any<F>(&mut self, f: F) -> bool
1.0.0 · Source§fn find<P>(&mut self, predicate: P) -> Option<Self::Item>
fn find<P>(&mut self, predicate: P) -> Option<Self::Item>
1.30.0 · Source§fn find_map<B, F>(&mut self, f: F) -> Option<B>
fn find_map<B, F>(&mut self, f: F) -> Option<B>
Source§fn try_find<R>(
&mut self,
f: impl FnMut(&Self::Item) -> R,
) -> <<R as Try>::Residual as Residual<Option<Self::Item>>>::TryType
fn try_find<R>( &mut self, f: impl FnMut(&Self::Item) -> R, ) -> <<R as Try>::Residual as Residual<Option<Self::Item>>>::TryType
try_find)1.0.0 · Source§fn position<P>(&mut self, predicate: P) -> Option<usize>
fn position<P>(&mut self, predicate: P) -> Option<usize>
1.0.0 · Source§fn max(self) -> Option<Self::Item>
fn max(self) -> Option<Self::Item>
1.0.0 · Source§fn min(self) -> Option<Self::Item>
fn min(self) -> Option<Self::Item>
1.6.0 · Source§fn max_by_key<B, F>(self, f: F) -> Option<Self::Item>
fn max_by_key<B, F>(self, f: F) -> Option<Self::Item>
1.15.0 · Source§fn max_by<F>(self, compare: F) -> Option<Self::Item>
fn max_by<F>(self, compare: F) -> Option<Self::Item>
1.6.0 · Source§fn min_by_key<B, F>(self, f: F) -> Option<Self::Item>
fn min_by_key<B, F>(self, f: F) -> Option<Self::Item>
1.15.0 · Source§fn min_by<F>(self, compare: F) -> Option<Self::Item>
fn min_by<F>(self, compare: F) -> Option<Self::Item>
1.0.0 · Source§fn unzip<A, B, FromA, FromB>(self) -> (FromA, FromB)
fn unzip<A, B, FromA, FromB>(self) -> (FromA, FromB)
1.36.0 · Source§fn copied<'a, T>(self) -> Copied<Self>
fn copied<'a, T>(self) -> Copied<Self>
Source§fn array_chunks<const N: usize>(self) -> ArrayChunks<Self, N>where
Self: Sized,
fn array_chunks<const N: usize>(self) -> ArrayChunks<Self, N>where
Self: Sized,
This is a nightly-only experimental API. (iter_array_chunks)
Returns an iterator over N elements of the iterator at a time. Read more
1.11.0 · Source§fn product<P>(self) -> P
fn product<P>(self) -> P
Source§fn cmp_by<I, F>(self, other: I, cmp: F) -> Ordering
fn cmp_by<I, F>(self, other: I, cmp: F) -> Ordering
This is a nightly-only experimental API. (iter_order_by)
Lexicographically compares the elements of this Iterator with those
of another with respect to the specified comparison function. Read more
1.5.0 · Source§fn partial_cmp<I>(self, other: I) -> Option<Ordering>
fn partial_cmp<I>(self, other: I) -> Option<Ordering>
Lexicographically compares the PartialOrd elements of
this Iterator with those of another. The comparison works like short-circuit
evaluation, returning a result without comparing the remaining elements.
As soon as an order can be determined, the evaluation stops and a result is returned. Read more
Source§fn partial_cmp_by<I, F>(self, other: I, partial_cmp: F) -> Option<Ordering> where
Self: Sized,
I: IntoIterator,
F: FnMut(Self::Item, <I as IntoIterator>::Item) -> Option<Ordering>,
fn partial_cmp_by<I, F>(self, other: I, partial_cmp: F) -> Option<Ordering>where
Self: Sized,
I: IntoIterator,
F: FnMut(Self::Item, <I as IntoIterator>::Item) -> Option<Ordering>,
This is a nightly-only experimental API. (iter_order_by)
Lexicographically compares the elements of this Iterator with those
of another with respect to the specified comparison function. Read more
Source§fn eq_by<I, F>(self, other: I, eq: F) -> bool
fn eq_by<I, F>(self, other: I, eq: F) -> bool
iter_order_by)1.5.0 · Source§fn lt<I>(self, other: I) -> bool
fn lt<I>(self, other: I) -> bool
Determines if the elements of this Iterator are lexicographically
less than those of another. Read more
1.5.0 · Source§fn le<I>(self, other: I) -> bool
fn le<I>(self, other: I) -> bool
Determines if the elements of this Iterator are lexicographically
less or equal to those of another. Read more
1.5.0 · Source§fn gt<I>(self, other: I) -> bool
fn gt<I>(self, other: I) -> bool
Determines if the elements of this Iterator are lexicographically
greater than those of another. Read more
1.5.0 · Source§fn ge<I>(self, other: I) -> bool
fn ge<I>(self, other: I) -> bool
Determines if the elements of this Iterator are lexicographically
greater than or equal to those of another. Read more