pub struct UserAgentMiddleware { /* private fields */ }Implementations§
Source§impl UserAgentMiddleware
impl UserAgentMiddleware
Sourcepub fn builder() -> UserAgentMiddlewareBuilder
pub fn builder() -> UserAgentMiddlewareBuilder
Creates a new UserAgentMiddlewareBuilder to start building a UserAgentMiddleware.
Examples found in repository?
examples/quotes_scraper.rs (line 99)
83async fn main() -> Result<(), SpiderError> {
84 tracing_subscriber::fmt()
85 .with_env_filter("info,spider_lib=debug")
86 .without_time()
87 .init();
88
89 let crawler = CrawlerBuilder::<_, ReqwestClientDownloader>::new(QuotesSpider)
90 .add_pipeline(DeduplicationPipeline::new(&["text"]))
91 .add_pipeline(CsvExporterPipeline::<QuoteItem>::new("output/quotes.csv")?)
92 .add_middleware(HttpCacheMiddleware::builder().build()?)
93 .add_middleware(
94 RateLimitMiddleware::builder()
95 .use_token_bucket_limiter(5)
96 .build(),
97 )
98 .add_middleware(RetryMiddleware::default().max_retries(2))
99 .add_middleware(UserAgentMiddleware::builder().build()?)
100 .add_middleware(RobotsTxtMiddleware::new())
101 .add_middleware(
102 RefererMiddleware::new()
103 .same_origin_only(true)
104 .max_chain_length(100)
105 .include_fragment(false),
106 )
107 .with_checkpoint_path("output/quotes.bin")
108 .with_checkpoint_interval(Duration::from_secs(15))
109 .max_concurrent_downloads(5)
110 .max_parser_workers(2)
111 .max_concurrent_pipelines(2)
112 .build()
113 .await?;
114
115 crawler.start_crawl().await?;
116
117 Ok(())
118}Trait Implementations§
Source§impl Debug for UserAgentMiddleware
impl Debug for UserAgentMiddleware
Source§impl<C: Send + Sync> Middleware<C> for UserAgentMiddleware
impl<C: Send + Sync> Middleware<C> for UserAgentMiddleware
fn name(&self) -> &str
fn process_request<'life0, 'life1, 'async_trait>(
&'life0 mut self,
_client: &'life1 C,
request: Request,
) -> Pin<Box<dyn Future<Output = Result<MiddlewareAction<Request>, SpiderError>> + Send + 'async_trait>>where
Self: 'async_trait,
'life0: 'async_trait,
'life1: 'async_trait,
fn process_response<'life0, 'async_trait>(
&'life0 mut self,
response: Response,
) -> Pin<Box<dyn Future<Output = Result<MiddlewareAction<Response>, SpiderError>> + Send + 'async_trait>>where
Self: 'async_trait,
'life0: 'async_trait,
fn handle_error<'life0, 'life1, 'life2, 'async_trait>(
&'life0 mut self,
_request: &'life1 Request,
error: &'life2 SpiderError,
) -> Pin<Box<dyn Future<Output = Result<MiddlewareAction<Request>, SpiderError>> + Send + 'async_trait>>where
Self: 'async_trait,
'life0: 'async_trait,
'life1: 'async_trait,
'life2: 'async_trait,
Auto Trait Implementations§
impl !Freeze for UserAgentMiddleware
impl !RefUnwindSafe for UserAgentMiddleware
impl Send for UserAgentMiddleware
impl Sync for UserAgentMiddleware
impl Unpin for UserAgentMiddleware
impl !UnwindSafe for UserAgentMiddleware
Blanket Implementations§
Source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more