pub struct ExtractorConfig {
pub max_length: usize,
pub timeout_secs: u64,
pub clean_text: bool,
pub preserve_whitespace: bool,
pub user_agent: String,
pub follow_redirects: bool,
pub max_redirects: usize,
pub sanitize: bool,
pub redact_pii: bool,
pub detect_injection: bool,
}
Configuration for content extraction.
Fields§
max_length: usize — Maximum content length to extract (in characters)
timeout_secs: u64 — Request timeout in seconds
clean_text: bool — Whether to extract clean text (remove HTML tags, scripts, etc.)
preserve_whitespace: bool — Whether to preserve whitespace formatting
user_agent: String — User agent for web requests
follow_redirects: bool — Whether to follow redirects
max_redirects: usize — Maximum number of redirects to follow
sanitize: bool — Whether to sanitize output via hanzo-guard
redact_pii: bool — Whether to redact PII
detect_injection: bool — Whether to detect injection attempts
Implementations§
Source§impl ExtractorConfig
impl ExtractorConfig
Sourcepub fn with_max_length(self, max_length: usize) -> Self
pub fn with_max_length(self, max_length: usize) -> Self
Consumes this config and returns it with a custom maximum content length
Sourcepub fn with_timeout(self, timeout_secs: u64) -> Self
pub fn with_timeout(self, timeout_secs: u64) -> Self
Consumes this config and returns it with a custom request timeout (in seconds)
Sourcepub fn with_clean_text(self, clean: bool) -> Self
pub fn with_clean_text(self, clean: bool) -> Self
Enable or disable text cleaning
Sourcepub fn with_sanitize(self, sanitize: bool) -> Self
pub fn with_sanitize(self, sanitize: bool) -> Self
Enable or disable sanitization
Sourcepub fn with_redact_pii(self, redact: bool) -> Self
pub fn with_redact_pii(self, redact: bool) -> Self
Enable or disable PII redaction
Sourcepub fn with_detect_injection(self, detect: bool) -> Self
pub fn with_detect_injection(self, detect: bool) -> Self
Enable or disable injection detection
Trait Implementations§
Source§impl Clone for ExtractorConfig
impl Clone for ExtractorConfig
Source§fn clone(&self) -> ExtractorConfig
fn clone(&self) -> ExtractorConfig
Returns a duplicate of the value. Read more
1.0.0 (const: unstable) · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for ExtractorConfig
impl Debug for ExtractorConfig
Source§impl Default for ExtractorConfig
impl Default for ExtractorConfig
Source§impl<'de> Deserialize<'de> for ExtractorConfig
impl<'de> Deserialize<'de> for ExtractorConfig
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for ExtractorConfig
impl RefUnwindSafe for ExtractorConfig
impl Send for ExtractorConfig
impl Sync for ExtractorConfig
impl Unpin for ExtractorConfig
impl UnsafeUnpin for ExtractorConfig
impl UnwindSafe for ExtractorConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T
where
    T: Clone,
impl<T> CloneToUninit for T
where
    T: Clone,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more