pub struct HtmlParserConfig {
pub preserve_whitespace: bool,
pub extract_images: bool,
pub extract_links: bool,
pub heading_strategy: HeadingStrategy,
pub max_depth: usize,
pub max_blocks: usize,
pub min_text_length: usize,
}
Configuration for HTML parsing.
Fields§
preserve_whitespace: bool — Whether to preserve whitespace in text nodes
extract_images: bool — Whether to extract images as media blocks
extract_links: bool — Whether to extract links and store href in edges
heading_strategy: HeadingStrategy — Strategy for handling heading levels
max_depth: usize — Maximum nesting depth to process
max_blocks: usize — Maximum number of blocks to create
min_text_length: usize — Minimum text length to create a block (filters noise)
Trait Implementations§
Source§impl Clone for HtmlParserConfig
impl Clone for HtmlParserConfig
Source§fn clone(&self) -> HtmlParserConfig
fn clone(&self) -> HtmlParserConfig
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for HtmlParserConfig
impl Debug for HtmlParserConfig
Auto Trait Implementations§
impl Freeze for HtmlParserConfig
impl RefUnwindSafe for HtmlParserConfig
impl Send for HtmlParserConfig
impl Sync for HtmlParserConfig
impl Unpin for HtmlParserConfig
impl UnsafeUnpin for HtmlParserConfig
impl UnwindSafe for HtmlParserConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more