http_cache/
lib.rs

1#![forbid(unsafe_code, future_incompatible)]
2#![deny(
3    missing_docs,
4    missing_debug_implementations,
5    missing_copy_implementations,
6    nonstandard_style,
7    unused_qualifications,
8    unused_import_braces,
9    unused_extern_crates,
10    trivial_casts,
11    trivial_numeric_casts
12)]
13#![allow(clippy::doc_lazy_continuation)]
14#![cfg_attr(docsrs, feature(doc_cfg))]
15//! A caching middleware that follows HTTP caching rules, thanks to
16//! [`http-cache-semantics`](https://github.com/kornelski/rusty-http-cache-semantics).
17//! By default, it uses [`cacache`](https://github.com/zkat/cacache-rs) as the backend cache manager.
18//!
19//! This crate provides the core HTTP caching functionality that can be used to build
20//! caching middleware for various HTTP clients and server frameworks. It implements
21//! RFC 7234 HTTP caching semantics, supporting features like:
22//!
23//! - Automatic cache invalidation for unsafe HTTP methods (PUT, POST, DELETE, PATCH)
24//! - Respect for HTTP cache-control headers
25//! - Conditional requests (ETag, Last-Modified)
26//! - Multiple cache storage backends
27//! - Streaming response support
28//!
29//! ## Basic Usage
30//!
31//! The core types for building HTTP caches:
32//!
33//! ```rust
34//! # #[cfg(feature = "manager-cacache")]
35//! # fn main() {
36//! use http_cache::{CACacheManager, HttpCache, CacheMode, HttpCacheOptions};
37//!
38//! // Create a cache manager with disk storage
39//! let manager = CACacheManager::new("./cache".into(), true);
40//!
41//! // Create an HTTP cache with default behavior
42//! let cache = HttpCache {
43//!     mode: CacheMode::Default,
44//!     manager,
45//!     options: HttpCacheOptions::default(),
46//! };
47//! # }
48//! # #[cfg(not(feature = "manager-cacache"))]
49//! # fn main() {}
50//! ```
51//!
52//! ## Cache Modes
53//!
54//! Different cache modes provide different behaviors:
55//!
56//! ```rust
57//! # #[cfg(feature = "manager-cacache")]
58//! # fn main() {
59//! use http_cache::{CacheMode, HttpCache, CACacheManager, HttpCacheOptions};
60//!
61//! let manager = CACacheManager::new("./cache".into(), true);
62//!
63//! // Default mode: follows HTTP caching rules
64//! let default_cache = HttpCache {
65//!     mode: CacheMode::Default,
66//!     manager: manager.clone(),
67//!     options: HttpCacheOptions::default(),
68//! };
69//!
70//! // NoStore mode: never caches responses
71//! let no_store_cache = HttpCache {
72//!     mode: CacheMode::NoStore,
73//!     manager: manager.clone(),
74//!     options: HttpCacheOptions::default(),
75//! };
76//!
77//! // ForceCache mode: caches responses even if headers suggest otherwise
78//! let force_cache = HttpCache {
79//!     mode: CacheMode::ForceCache,
80//!     manager,
81//!     options: HttpCacheOptions::default(),
82//! };
83//! # }
84//! # #[cfg(not(feature = "manager-cacache"))]
85//! # fn main() {}
86//! ```
87//!
88//! ## Custom Cache Keys
89//!
90//! You can customize how cache keys are generated:
91//!
92//! ```rust
93//! # #[cfg(feature = "manager-cacache")]
94//! # fn main() {
95//! use http_cache::{HttpCacheOptions, CACacheManager, HttpCache, CacheMode};
96//! use std::sync::Arc;
97//! use http::request::Parts;
98//!
99//! let manager = CACacheManager::new("./cache".into(), true);
100//!
101//! let options = HttpCacheOptions {
102//!     cache_key: Some(Arc::new(|req: &Parts| {
103//!         // Custom cache key that includes query parameters
104//!         format!("{}:{}", req.method, req.uri)
105//!     })),
106//!     ..Default::default()
107//! };
108//!
109//! let cache = HttpCache {
110//!     mode: CacheMode::Default,
111//!     manager,
112//!     options,
113//! };
114//! # }
115//! # #[cfg(not(feature = "manager-cacache"))]
116//! # fn main() {}
117//! ```
118//!
119//! ## Maximum TTL Control
120//!
121//! Set a maximum time-to-live for cached responses, particularly useful with `CacheMode::IgnoreRules`:
122//!
123//! ```rust
124//! # #[cfg(feature = "manager-cacache")]
125//! # fn main() {
126//! use http_cache::{HttpCacheOptions, CACacheManager, HttpCache, CacheMode};
127//! use std::time::Duration;
128//!
129//! let manager = CACacheManager::new("./cache".into(), true);
130//!
131//! // Limit cache duration to 5 minutes regardless of server headers
132//! let options = HttpCacheOptions {
133//!     max_ttl: Some(Duration::from_secs(300)), // 5 minutes
134//!     ..Default::default()
135//! };
136//!
137//! let cache = HttpCache {
138//!     mode: CacheMode::IgnoreRules, // Ignore server cache-control headers
139//!     manager,
140//!     options,
141//! };
142//! # }
143//! # #[cfg(not(feature = "manager-cacache"))]
144//! # fn main() {}
145//! ```
146//!
147//! ## Response-Based Cache Mode Override
148//!
149//! Override cache behavior based on the response you receive. This is useful for scenarios like
150//! forcing cache for successful responses even when headers say not to cache, or never caching
151//! error responses like rate limits:
152//!
153//! ```rust
154//! # #[cfg(feature = "manager-cacache")]
155//! # fn main() {
156//! use http_cache::{HttpCacheOptions, CACacheManager, HttpCache, CacheMode};
157//! use std::sync::Arc;
158//!
159//! let manager = CACacheManager::new("./cache".into(), true);
160//!
161//! let options = HttpCacheOptions {
162//!     response_cache_mode_fn: Some(Arc::new(|_request_parts, response| {
163//!         match response.status {
164//!             // Force cache successful responses even if headers say not to cache
165//!             200..=299 => Some(CacheMode::ForceCache),
166//!             // Never cache rate-limited responses
167//!             429 => Some(CacheMode::NoStore),
168//!             // Use default behavior for everything else
169//!             _ => None,
170//!         }
171//!     })),
172//!     ..Default::default()
173//! };
174//!
175//! let cache = HttpCache {
176//!     mode: CacheMode::Default,
177//!     manager,
178//!     options,
179//! };
180//! # }
181//! # #[cfg(not(feature = "manager-cacache"))]
182//! # fn main() {}
183//! ```
184//!
185//! ## Content-Type Based Caching
186//!
187//! You can implement selective caching based on response content types using `response_cache_mode_fn`.
188//! This is useful when you only want to cache certain types of content:
189//!
190//! ```rust
191//! # #[cfg(feature = "manager-cacache")]
192//! # fn main() {
193//! use http_cache::{HttpCacheOptions, CACacheManager, HttpCache, CacheMode};
194//! use std::sync::Arc;
195//!
196//! let manager = CACacheManager::new("./cache".into(), true);
197//!
198//! let options = HttpCacheOptions {
199//!     response_cache_mode_fn: Some(Arc::new(|_request_parts, response| {
200//!         // Check the Content-Type header to decide caching behavior
201//!         if let Some(content_type) = response.headers.get("content-type") {
202//!             match content_type.as_str() {
203//!                 // Cache JSON APIs aggressively
204//!                 ct if ct.starts_with("application/json") => Some(CacheMode::ForceCache),
205//!                 // Cache images with default rules
206//!                 ct if ct.starts_with("image/") => Some(CacheMode::Default),
207//!                 // Cache static assets
208//!                 ct if ct.starts_with("text/css") => Some(CacheMode::ForceCache),
209//!                 ct if ct.starts_with("application/javascript") => Some(CacheMode::ForceCache),
210//!                 // Don't cache HTML pages (dynamic content)
211//!                 ct if ct.starts_with("text/html") => Some(CacheMode::NoStore),
212//!                 // Don't cache unknown content types
213//!                 _ => Some(CacheMode::NoStore),
214//!             }
215//!         } else {
216//!             // No Content-Type header - don't cache
217//!             Some(CacheMode::NoStore)
218//!         }
219//!     })),
220//!     ..Default::default()
221//! };
222//!
223//! let cache = HttpCache {
224//!     mode: CacheMode::Default, // This gets overridden by response_cache_mode_fn
225//!     manager,
226//!     options,
227//! };
228//! # }
229//! # #[cfg(not(feature = "manager-cacache"))]
230//! # fn main() {}
231//! ```
232//!
233//! ## Streaming Support
234//!
235//! For handling large responses without full buffering, use the `StreamingManager`:
236//!
237//! ```rust
238//! # #[cfg(feature = "streaming")]
239//! # {
240//! use http_cache::StreamingBody;
241//! use bytes::Bytes;
242//! use http_body::Body;
243//! use http_body_util::Full;
244//!
245//! // StreamingManager uses foyer for high-performance caching
246//! // Create with: StreamingManager::in_memory(1000).await.unwrap()
247//!
248//! // StreamingBody can handle both buffered and streaming scenarios
249//! let body: StreamingBody<Full<Bytes>> = StreamingBody::buffered(Bytes::from("cached content"));
250//! println!("Body size: {:?}", body.size_hint());
251//! # }
252//! ```
253//!
254//! **Note**: Streaming support requires the `StreamingManager` with the `streaming` feature.
255//! Other cache managers (CACacheManager, MokaManager, QuickManager) do not support streaming
256//! and will buffer response bodies in memory.
257//!
258//! ## Features
259//!
260//! The following features are available. By default `manager-cacache` is enabled.
261//!
262//! - `manager-cacache` (default): enable [cacache](https://github.com/zkat/cacache-rs),
263//! a disk cache, backend manager. Uses tokio runtime.
264//! - `manager-moka` (disabled): enable [moka](https://github.com/moka-rs/moka),
265//! an in-memory cache, backend manager.
266//! - `manager-foyer` (disabled): enable [foyer](https://github.com/foyer-rs/foyer),
267//! a hybrid in-memory + disk cache, backend manager. Uses tokio runtime.
268//! - `http-headers-compat` (disabled): enable backwards compatibility for deserializing cached
269//! responses from older versions that used single-value headers. Enable this if you need to read
270//! cache entries created by older versions of http-cache.
271//! - `streaming` (disabled): enable the `StreamingManager` for streaming cache support.
272//!   Uses foyer as the backend with async-compat for runtime-agnostic operation.
273//! - `with-http-types` (disabled): enable [http-types](https://github.com/http-rs/http-types)
274//! type conversion support
275//!
276//! ### URL Implementation Features
277//!
278//! Exactly one URL implementation must be enabled. These features are **mutually exclusive**:
279//!
280//! - `url-standard` (default): uses the [url](https://github.com/servo/rust-url) crate.
281//!   Note: This brings in the `idna` crate which has a Unicode license.
282//! - `url-ada` (disabled): uses [ada-url](https://github.com/ada-url/rust) for WHATWG-compliant
283//!   URL parsing without the Unicode/IDNA license dependency.
284//!
285//! If you need to avoid the Unicode license, use `url-ada`:
286//!
287//! ```toml
288//! [dependencies]
289//! http-cache = { version = "1.0", default-features = false, features = ["manager-cacache", "url-ada"] }
290//! ```
291//!
292//! ### Legacy bincode features (deprecated)
293//!
294//! These features are deprecated due to [RUSTSEC-2025-0141](https://rustsec.org/advisories/RUSTSEC-2025-0141)
295//! and will be removed in the next major version:
296//!
297//! - `manager-cacache-bincode`: cacache with bincode serialization
298//! - `manager-moka-bincode`: moka with bincode serialization
299//!
300//! **Note**: Only `StreamingManager` (via the `streaming` feature) provides streaming support.
301//! Other managers will buffer response bodies in memory even when used with `StreamingManager`.
302//!
303//! ## Integration
304//!
305//! This crate is designed to be used as a foundation for HTTP client and server middleware.
306//! See the companion crates for specific integrations:
307//!
308//! - [`http-cache-reqwest`](https://docs.rs/http-cache-reqwest) for reqwest client middleware
309//! - [`http-cache-surf`](https://docs.rs/http-cache-surf) for surf client middleware  
310//! - [`http-cache-tower`](https://docs.rs/http-cache-tower) for tower service middleware
311
312// URL feature validation - exactly one URL implementation must be enabled
313#[cfg(all(feature = "url-standard", feature = "url-ada"))]
314compile_error!("features `url-standard` and `url-ada` are mutually exclusive");
315
316#[cfg(not(any(feature = "url-standard", feature = "url-ada")))]
317compile_error!("either feature `url-standard` or `url-ada` must be enabled");
318
319mod body;
320mod error;
321mod managers;
322
323#[cfg(feature = "rate-limiting")]
324pub mod rate_limiting;
325
326use std::{
327    collections::HashMap,
328    convert::TryFrom,
329    fmt::{self, Debug},
330    str::FromStr,
331    sync::Arc,
332    time::{Duration, SystemTime},
333};
334
335use http::{
336    header::CACHE_CONTROL, request, response, HeaderValue, Response, StatusCode,
337};
338use http_cache_semantics::{AfterResponse, BeforeRequest, CachePolicy};
339use serde::{Deserialize, Deserializer, Serialize, Serializer};
340
341// URL type alias - allows users to choose between `url` (default) and `ada-url` crates
342// When using `url-ada` feature, this becomes `ada_url::Url`
343#[cfg(feature = "url-ada")]
344pub use ada_url::Url;
345#[cfg(not(feature = "url-ada"))]
346pub use url::Url;
347
348// ============================================================================
349// URL Helper Functions
350// ============================================================================
351// These functions abstract away API differences between `url` and `ada-url` crates.
352// Internal code should use these helpers instead of calling URL methods directly.
353
354/// Parse a URL string into a `Url` type.
355///
356/// This helper abstracts the parsing API difference between `url` and `ada-url`:
357/// - `url` crate: `Url::parse(s)` returns `Result<Url, ParseError>`
358/// - `ada-url` crate: `Url::parse(s, None)` returns `Result<Url, ParseUrlError>`
359#[inline]
360pub fn url_parse(s: &str) -> Result<Url> {
361    #[cfg(feature = "url-ada")]
362    {
363        Url::parse(s, None).map_err(|e| -> BoxError { e.to_string().into() })
364    }
365    #[cfg(not(feature = "url-ada"))]
366    {
367        Url::parse(s).map_err(|e| -> BoxError { Box::new(e) })
368    }
369}
370
371/// Set the path component of a URL.
372///
373/// API differences:
374/// - `url` crate: `url.set_path(path)`
375/// - `ada-url` crate: `url.set_pathname(Some(path))`
376#[inline]
377pub fn url_set_path(url: &mut Url, path: &str) {
378    #[cfg(feature = "url-ada")]
379    {
380        let _ = url.set_pathname(Some(path));
381    }
382    #[cfg(not(feature = "url-ada"))]
383    {
384        url.set_path(path);
385    }
386}
387
388/// Set the query component of a URL.
389///
390/// API differences:
391/// - `url` crate: `url.set_query(Some(query))` or `url.set_query(None)`
392/// - `ada-url` crate: `url.set_search(Some(query))` or `url.set_search(None)`
393#[inline]
394pub fn url_set_query(url: &mut Url, query: Option<&str>) {
395    #[cfg(feature = "url-ada")]
396    {
397        url.set_search(query);
398    }
399    #[cfg(not(feature = "url-ada"))]
400    {
401        url.set_query(query);
402    }
403}
404
405/// Get the hostname of a URL as a string.
406///
407/// API differences:
408/// - `url` crate: `url.host_str()` returns `Option<&str>`
409/// - `ada-url` crate: `url.hostname()` returns `&str` (empty string if no host)
410#[inline]
411#[must_use]
412pub fn url_hostname(url: &Url) -> Option<&str> {
413    #[cfg(feature = "url-ada")]
414    {
415        let hostname = url.hostname();
416        if hostname.is_empty() {
417            None
418        } else {
419            Some(hostname)
420        }
421    }
422    #[cfg(not(feature = "url-ada"))]
423    {
424        url.host_str()
425    }
426}
427
428/// Get the host of a URL as a string for display purposes (e.g., warning headers).
429///
430/// This returns the host portion as a string, or "unknown" if not available.
431/// Used in places like HTTP Warning headers where we need a displayable host value.
432#[inline]
433#[must_use]
434pub fn url_host_str(url: &Url) -> String {
435    #[cfg(feature = "url-ada")]
436    {
437        let hostname = url.hostname();
438        if hostname.is_empty() {
439            "unknown".to_string()
440        } else {
441            hostname.to_string()
442        }
443    }
444    #[cfg(not(feature = "url-ada"))]
445    {
446        url.host()
447            .map(|h| h.to_string())
448            .unwrap_or_else(|| "unknown".to_string())
449    }
450}
451
452pub use body::StreamingBody;
453pub use error::{
454    BadHeader, BadRequest, BadVersion, BoxError, ClientStreamingError,
455    HttpCacheError, HttpCacheResult, Result, StreamingError,
456};
457
458#[cfg(any(
459    feature = "manager-cacache",
460    feature = "manager-cacache-bincode"
461))]
462pub use managers::cacache::CACacheManager;
463
464#[cfg(feature = "streaming")]
465pub use managers::streaming_cache::StreamingManager;
466
467#[cfg(feature = "manager-moka")]
468pub use managers::moka::MokaManager;
469
470#[cfg(feature = "manager-foyer")]
471pub use managers::foyer::FoyerManager;
472
473#[cfg(feature = "rate-limiting")]
474pub use rate_limiting::{
475    CacheAwareRateLimiter, DirectRateLimiter, DomainRateLimiter,
476};
477
478#[cfg(feature = "rate-limiting")]
479pub use rate_limiting::Quota;
480
481// Exposing the moka cache for convenience, renaming to avoid naming conflicts
482#[cfg(feature = "manager-moka")]
483#[cfg_attr(docsrs, doc(cfg(feature = "manager-moka")))]
484pub use moka::future::{Cache as MokaCache, CacheBuilder as MokaCacheBuilder};
485
486// Custom headers used to indicate cache status (hit or miss)
487/// `x-cache` header: Value will be HIT if the response was served from cache, MISS if not
488pub const XCACHE: &str = "x-cache";
489/// `x-cache-lookup` header: Value will be HIT if a response existed in cache, MISS if not
490pub const XCACHELOOKUP: &str = "x-cache-lookup";
491/// `warning` header: HTTP warning header as per RFC 7234
492const WARNING: &str = "warning";
493
494/// Represents a basic cache status
495/// Used in the custom headers `x-cache` and `x-cache-lookup`
496#[derive(Debug, Copy, Clone)]
497pub enum HitOrMiss {
498    /// Yes, there was a hit
499    HIT,
500    /// No, there was no hit
501    MISS,
502}
503
504impl fmt::Display for HitOrMiss {
505    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
506        match self {
507            Self::HIT => write!(f, "HIT"),
508            Self::MISS => write!(f, "MISS"),
509        }
510    }
511}
512
513/// Represents an HTTP version
514#[derive(Debug, Copy, Clone, PartialEq, Eq, Deserialize, Serialize)]
515#[non_exhaustive]
516pub enum HttpVersion {
517    /// HTTP Version 0.9
518    #[serde(rename = "HTTP/0.9")]
519    Http09,
520    /// HTTP Version 1.0
521    #[serde(rename = "HTTP/1.0")]
522    Http10,
523    /// HTTP Version 1.1
524    #[serde(rename = "HTTP/1.1")]
525    Http11,
526    /// HTTP Version 2.0
527    #[serde(rename = "HTTP/2.0")]
528    H2,
529    /// HTTP Version 3.0
530    #[serde(rename = "HTTP/3.0")]
531    H3,
532}
533
534impl fmt::Display for HttpVersion {
535    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
536        match *self {
537            HttpVersion::Http09 => write!(f, "HTTP/0.9"),
538            HttpVersion::Http10 => write!(f, "HTTP/1.0"),
539            HttpVersion::Http11 => write!(f, "HTTP/1.1"),
540            HttpVersion::H2 => write!(f, "HTTP/2.0"),
541            HttpVersion::H3 => write!(f, "HTTP/3.0"),
542        }
543    }
544}
545
546/// Extract a URL from HTTP request parts for cache key generation
547///
548/// This function reconstructs the full URL from the request parts, handling both
549/// HTTP and HTTPS schemes based on the connection type or explicit headers.
550fn extract_url_from_request_parts(parts: &request::Parts) -> Result<Url> {
551    // First check if the URI is already absolute
552    if let Some(_scheme) = parts.uri.scheme() {
553        // URI is absolute, use it directly
554        return url_parse(&parts.uri.to_string())
555            .map_err(|_| -> BoxError { BadHeader.into() });
556    }
557
558    // Get the host header
559    let host = parts
560        .headers
561        .get("host")
562        .ok_or(BadHeader)?
563        .to_str()
564        .map_err(|_| BadHeader)?;
565
566    // Determine scheme based on host and headers
567    let scheme = determine_scheme(host, &parts.headers)?;
568
569    // Create base URL using the URL helper for cross-crate compatibility
570    let mut base_url = url_parse(&format!("{}://{}/", &scheme, host))
571        .map_err(|_| -> BoxError { BadHeader.into() })?;
572
573    // Set the path and query from the URI using helpers
574    if let Some(path_and_query) = parts.uri.path_and_query() {
575        url_set_path(&mut base_url, path_and_query.path());
576        if let Some(query) = path_and_query.query() {
577            url_set_query(&mut base_url, Some(query));
578        }
579    }
580
581    Ok(base_url)
582}
583
584/// Determine the appropriate scheme for URL construction
585fn determine_scheme(host: &str, headers: &http::HeaderMap) -> Result<String> {
586    // Check for explicit protocol forwarding header first
587    if let Some(forwarded_proto) = headers.get("x-forwarded-proto") {
588        let proto = forwarded_proto.to_str().map_err(|_| BadHeader)?;
589        return match proto {
590            "http" | "https" => Ok(proto.to_string()),
591            _ => Ok("https".to_string()), // Default to secure for unknown protocols
592        };
593    }
594
595    // Check if this looks like a local development host
596    if host.starts_with("localhost") || host.starts_with("127.0.0.1") {
597        Ok("http".to_string())
598    } else {
599        Ok("https".to_string()) // Default to secure for all other hosts
600    }
601}
602
603/// Represents HTTP headers in either legacy or modern format
604#[derive(Debug, Clone)]
605pub enum HttpHeaders {
606    /// Modern header representation - allows multiple values per key
607    Modern(HashMap<String, Vec<String>>),
608    /// Legacy header representation - kept for backward compatibility with deserialization
609    #[cfg(feature = "http-headers-compat")]
610    Legacy(HashMap<String, String>),
611}
612
613// Serialize directly as the inner HashMap (no enum variant wrapper)
614// This ensures compatibility: serialized data is just the raw HashMap
615impl Serialize for HttpHeaders {
616    fn serialize<S>(
617        &self,
618        serializer: S,
619    ) -> std::result::Result<S::Ok, S::Error>
620    where
621        S: Serializer,
622    {
623        #[cfg(feature = "http-headers-compat")]
624        {
625            // Always serialize as Legacy format when compat is enabled
626            match self {
627                HttpHeaders::Modern(modern) => {
628                    // Convert Modern to Legacy format by joining values
629                    let legacy: HashMap<String, String> = modern
630                        .iter()
631                        .map(|(k, v)| (k.clone(), v.join(", ")))
632                        .collect();
633                    legacy.serialize(serializer)
634                }
635                HttpHeaders::Legacy(legacy) => legacy.serialize(serializer),
636            }
637        }
638
639        #[cfg(not(feature = "http-headers-compat"))]
640        {
641            match self {
642                HttpHeaders::Modern(modern) => modern.serialize(serializer),
643            }
644        }
645    }
646}
647
648// Deserialize directly as HashMap based on feature flag
649// With http-headers-compat: reads HashMap<String, String> (legacy alpha.2 format)
650// Without http-headers-compat: reads HashMap<String, Vec<String>> (modern format)
651impl<'de> Deserialize<'de> for HttpHeaders {
652    fn deserialize<D>(deserializer: D) -> std::result::Result<Self, D::Error>
653    where
654        D: Deserializer<'de>,
655    {
656        #[cfg(feature = "http-headers-compat")]
657        {
658            let legacy = HashMap::<String, String>::deserialize(deserializer)?;
659            Ok(HttpHeaders::Legacy(legacy))
660        }
661
662        #[cfg(not(feature = "http-headers-compat"))]
663        {
664            let modern =
665                HashMap::<String, Vec<String>>::deserialize(deserializer)?;
666            Ok(HttpHeaders::Modern(modern))
667        }
668    }
669}
670
671impl HttpHeaders {
672    /// Creates a new empty HttpHeaders in modern format
673    pub fn new() -> Self {
674        HttpHeaders::Modern(HashMap::new())
675    }
676
677    /// Inserts a header key-value pair, replacing any existing values for that key
678    /// Keys are normalized to lowercase per RFC 7230
679    pub fn insert(&mut self, key: String, value: String) {
680        let normalized_key = key.to_ascii_lowercase();
681        match self {
682            #[cfg(feature = "http-headers-compat")]
683            HttpHeaders::Legacy(legacy) => {
684                legacy.insert(normalized_key, value);
685            }
686            HttpHeaders::Modern(modern) => {
687                // Replace existing values with a new single-element vec
688                modern.insert(normalized_key, vec![value]);
689            }
690        }
691    }
692
693    /// Appends a header value, preserving existing values for the same key
694    /// Keys are normalized to lowercase per RFC 7230
695    pub fn append(&mut self, key: String, value: String) {
696        let normalized_key = key.to_ascii_lowercase();
697        match self {
698            #[cfg(feature = "http-headers-compat")]
699            HttpHeaders::Legacy(legacy) => {
700                // Legacy format doesn't support multi-value, fall back to insert
701                legacy.insert(normalized_key, value);
702            }
703            HttpHeaders::Modern(modern) => {
704                modern
705                    .entry(normalized_key)
706                    .or_insert_with(Vec::new)
707                    .push(value);
708            }
709        }
710    }
711
712    /// Retrieves the first value for a given header key
713    /// Keys are normalized to lowercase per RFC 7230
714    pub fn get(&self, key: &str) -> Option<&String> {
715        let normalized_key = key.to_ascii_lowercase();
716        match self {
717            #[cfg(feature = "http-headers-compat")]
718            HttpHeaders::Legacy(legacy) => legacy.get(&normalized_key),
719            HttpHeaders::Modern(modern) => {
720                modern.get(&normalized_key).and_then(|vals| vals.first())
721            }
722        }
723    }
724
725    /// Removes a header key and its associated values
726    /// Keys are normalized to lowercase per RFC 7230
727    pub fn remove(&mut self, key: &str) {
728        let normalized_key = key.to_ascii_lowercase();
729        match self {
730            #[cfg(feature = "http-headers-compat")]
731            HttpHeaders::Legacy(legacy) => {
732                legacy.remove(&normalized_key);
733            }
734            HttpHeaders::Modern(modern) => {
735                modern.remove(&normalized_key);
736            }
737        }
738    }
739
740    /// Checks if a header key exists
741    /// Keys are normalized to lowercase per RFC 7230
742    pub fn contains_key(&self, key: &str) -> bool {
743        let normalized_key = key.to_ascii_lowercase();
744        match self {
745            #[cfg(feature = "http-headers-compat")]
746            HttpHeaders::Legacy(legacy) => legacy.contains_key(&normalized_key),
747            HttpHeaders::Modern(modern) => modern.contains_key(&normalized_key),
748        }
749    }
750
751    /// Returns an iterator over the header key-value pairs
752    pub fn iter(&self) -> HttpHeadersIterator<'_> {
753        match self {
754            #[cfg(feature = "http-headers-compat")]
755            HttpHeaders::Legacy(legacy) => {
756                HttpHeadersIterator { inner: legacy.iter().collect(), index: 0 }
757            }
758            HttpHeaders::Modern(modern) => HttpHeadersIterator {
759                inner: modern
760                    .iter()
761                    .flat_map(|(k, vals)| vals.iter().map(move |v| (k, v)))
762                    .collect(),
763                index: 0,
764            },
765        }
766    }
767}
768
769impl From<&http::HeaderMap> for HttpHeaders {
770    fn from(headers: &http::HeaderMap) -> Self {
771        let mut modern_headers = HashMap::new();
772
773        // Collect all unique header names first
774        let header_names: std::collections::HashSet<_> =
775            headers.keys().collect();
776
777        // For each header name, collect ALL values
778        for name in header_names {
779            let values: Vec<String> = headers
780                .get_all(name)
781                .iter()
782                .filter_map(|v| v.to_str().ok())
783                .map(|s| s.to_string())
784                .collect();
785
786            if !values.is_empty() {
787                modern_headers.insert(name.to_string(), values);
788            }
789        }
790
791        HttpHeaders::Modern(modern_headers)
792    }
793}
794
795impl From<HttpHeaders> for HashMap<String, Vec<String>> {
796    fn from(headers: HttpHeaders) -> Self {
797        match headers {
798            #[cfg(feature = "http-headers-compat")]
799            HttpHeaders::Legacy(legacy) => {
800                legacy.into_iter().map(|(k, v)| (k, vec![v])).collect()
801            }
802            HttpHeaders::Modern(modern) => modern,
803        }
804    }
805}
806
807impl Default for HttpHeaders {
808    fn default() -> Self {
809        HttpHeaders::new()
810    }
811}
812
813impl IntoIterator for HttpHeaders {
814    type Item = (String, String);
815    type IntoIter = HttpHeadersIntoIterator;
816
817    fn into_iter(self) -> Self::IntoIter {
818        HttpHeadersIntoIterator {
819            inner: match self {
820                #[cfg(feature = "http-headers-compat")]
821                HttpHeaders::Legacy(legacy) => legacy.into_iter().collect(),
822                HttpHeaders::Modern(modern) => modern
823                    .into_iter()
824                    .flat_map(|(k, vals)| {
825                        vals.into_iter().map(move |v| (k.clone(), v))
826                    })
827                    .collect(),
828            },
829            index: 0,
830        }
831    }
832}
833
834/// Iterator for HttpHeaders
835#[derive(Debug)]
836pub struct HttpHeadersIntoIterator {
837    inner: Vec<(String, String)>,
838    index: usize,
839}
840
841impl Iterator for HttpHeadersIntoIterator {
842    type Item = (String, String);
843
844    fn next(&mut self) -> Option<Self::Item> {
845        if self.index < self.inner.len() {
846            let item = self.inner[self.index].clone();
847            self.index += 1;
848            Some(item)
849        } else {
850            None
851        }
852    }
853}
854
855impl<'a> IntoIterator for &'a HttpHeaders {
856    type Item = (&'a String, &'a String);
857    type IntoIter = HttpHeadersIterator<'a>;
858
859    fn into_iter(self) -> Self::IntoIter {
860        self.iter()
861    }
862}
863
864/// Iterator for HttpHeaders references
865#[derive(Debug)]
866pub struct HttpHeadersIterator<'a> {
867    inner: Vec<(&'a String, &'a String)>,
868    index: usize,
869}
870
871impl<'a> Iterator for HttpHeadersIterator<'a> {
872    type Item = (&'a String, &'a String);
873
874    fn next(&mut self) -> Option<Self::Item> {
875        if self.index < self.inner.len() {
876            let item = self.inner[self.index];
877            self.index += 1;
878            Some(item)
879        } else {
880            None
881        }
882    }
883}
884
885/// A basic generic type that represents an HTTP response
886#[derive(Debug, Clone, Deserialize, Serialize)]
887pub struct HttpResponse {
888    /// HTTP response body
889    pub body: Vec<u8>,
890    /// HTTP response headers
891    pub headers: HttpHeaders,
892    /// HTTP response status code
893    pub status: u16,
894    /// HTTP response url
895    pub url: Url,
896    /// HTTP response version
897    pub version: HttpVersion,
898    /// Metadata
899    #[serde(default)]
900    pub metadata: Option<Vec<u8>>,
901}
902
903impl HttpResponse {
904    /// Returns `http::response::Parts`
905    pub fn parts(&self) -> Result<response::Parts> {
906        let mut converted =
907            response::Builder::new().status(self.status).body(())?;
908        {
909            let headers = converted.headers_mut();
910            for header in &self.headers {
911                headers.append(
912                    http::header::HeaderName::from_str(header.0.as_str())?,
913                    HeaderValue::from_str(header.1.as_str())?,
914                );
915            }
916        }
917        Ok(converted.into_parts().0)
918    }
919
920    /// Returns the status code of the warning header if present
921    #[must_use]
922    fn warning_code(&self) -> Option<usize> {
923        self.headers.get(WARNING).and_then(|hdr| {
924            hdr.as_str().chars().take(3).collect::<String>().parse().ok()
925        })
926    }
927
928    /// Adds a warning header to a response
929    fn add_warning(&mut self, url: &Url, code: usize, message: &str) {
930        // warning    = "warning" ":" 1#warning-value
931        // warning-value = warn-code SP warn-agent SP warn-text [SP warn-date]
932        // warn-code  = 3DIGIT
933        // warn-agent = ( host [ ":" port ] ) | pseudonym
934        //                 ; the name or pseudonym of the server adding
935        //                 ; the warning header, for use in debugging
936        // warn-text  = quoted-string
937        // warn-date  = <"> HTTP-date <">
938        // (https://tools.ietf.org/html/rfc2616#section-14.46)
939        let host = url_host_str(url);
940        // Escape message to prevent header injection and ensure valid HTTP format
941        let escaped_message =
942            message.replace('"', "'").replace(['\n', '\r'], " ");
943        self.headers.insert(
944            WARNING.to_string(),
945            format!(
946                "{} {} \"{}\" \"{}\"",
947                code,
948                host,
949                escaped_message,
950                httpdate::fmt_http_date(SystemTime::now())
951            ),
952        );
953    }
954
955    /// Removes a warning header from a response
956    fn remove_warning(&mut self) {
957        self.headers.remove(WARNING);
958    }
959
960    /// Update the headers from `http::response::Parts`
961    pub fn update_headers(&mut self, parts: &response::Parts) -> Result<()> {
962        for header in parts.headers.iter() {
963            self.headers.insert(
964                header.0.as_str().to_string(),
965                header.1.to_str()?.to_string(),
966            );
967        }
968        Ok(())
969    }
970
971    /// Checks if the Cache-Control header contains the must-revalidate directive
972    #[must_use]
973    fn must_revalidate(&self) -> bool {
974        self.headers.get(CACHE_CONTROL.as_str()).is_some_and(|val| {
975            val.as_str().to_lowercase().contains("must-revalidate")
976        })
977    }
978
979    /// Adds the custom `x-cache` header to the response
980    pub fn cache_status(&mut self, hit_or_miss: HitOrMiss) {
981        self.headers.insert(XCACHE.to_string(), hit_or_miss.to_string());
982    }
983
984    /// Adds the custom `x-cache-lookup` header to the response
985    pub fn cache_lookup_status(&mut self, hit_or_miss: HitOrMiss) {
986        self.headers.insert(XCACHELOOKUP.to_string(), hit_or_miss.to_string());
987    }
988}
989
990/// A trait providing methods for storing, reading, and removing cache records.
991#[async_trait::async_trait]
992pub trait CacheManager: Send + Sync + 'static {
993    /// Attempts to pull a cached response and related policy from cache.
994    async fn get(
995        &self,
996        cache_key: &str,
997    ) -> Result<Option<(HttpResponse, CachePolicy)>>;
998    /// Attempts to cache a response and related policy.
999    async fn put(
1000        &self,
1001        cache_key: String,
1002        res: HttpResponse,
1003        policy: CachePolicy,
1004    ) -> Result<HttpResponse>;
1005    /// Attempts to remove a record from cache.
1006    async fn delete(&self, cache_key: &str) -> Result<()>;
1007}
1008
1009/// A streaming cache manager that supports streaming request/response bodies
1010/// without buffering them in memory. This is ideal for large responses.
1011#[async_trait::async_trait]
1012pub trait StreamingCacheManager: Send + Sync + 'static {
1013    /// The body type used by this cache manager
1014    type Body: http_body::Body + Send + 'static;
1015
1016    /// Attempts to pull a cached response and related policy from cache with streaming body.
1017    async fn get(
1018        &self,
1019        cache_key: &str,
1020    ) -> Result<Option<(Response<Self::Body>, CachePolicy)>>
1021    where
1022        <Self::Body as http_body::Body>::Data: Send,
1023        <Self::Body as http_body::Body>::Error:
1024            Into<StreamingError> + Send + Sync + 'static;
1025
1026    /// Attempts to cache a response with a streaming body and related policy.
1027    async fn put<B>(
1028        &self,
1029        cache_key: String,
1030        response: Response<B>,
1031        policy: CachePolicy,
1032        request_url: Url,
1033        metadata: Option<Vec<u8>>,
1034    ) -> Result<Response<Self::Body>>
1035    where
1036        B: http_body::Body + Send + 'static,
1037        B::Data: Send,
1038        B::Error: Into<StreamingError>,
1039        <Self::Body as http_body::Body>::Data: Send,
1040        <Self::Body as http_body::Body>::Error:
1041            Into<StreamingError> + Send + Sync + 'static;
1042
1043    /// Converts a generic body to the manager's body type for non-cacheable responses.
1044    /// This is called when a response should not be cached but still needs to be returned
1045    /// with the correct body type.
1046    async fn convert_body<B>(
1047        &self,
1048        response: Response<B>,
1049    ) -> Result<Response<Self::Body>>
1050    where
1051        B: http_body::Body + Send + 'static,
1052        B::Data: Send,
1053        B::Error: Into<StreamingError>,
1054        <Self::Body as http_body::Body>::Data: Send,
1055        <Self::Body as http_body::Body>::Error:
1056            Into<StreamingError> + Send + Sync + 'static;
1057
1058    /// Attempts to remove a record from cache.
1059    async fn delete(&self, cache_key: &str) -> Result<()>;
1060
1061    /// Creates an empty body of the manager's body type.
1062    /// Used for returning 504 Gateway Timeout responses on OnlyIfCached cache misses.
1063    fn empty_body(&self) -> Self::Body;
1064
1065    /// Convert the manager's body type to a reqwest-compatible bytes stream.
1066    /// This enables efficient streaming without collecting the entire body.
1067    #[cfg(feature = "streaming")]
1068    fn body_to_bytes_stream(
1069        body: Self::Body,
1070    ) -> impl futures_util::Stream<
1071        Item = std::result::Result<
1072            bytes::Bytes,
1073            Box<dyn std::error::Error + Send + Sync>,
1074        >,
1075    > + Send
1076    where
1077        <Self::Body as http_body::Body>::Data: Send,
1078        <Self::Body as http_body::Body>::Error: Send + Sync + 'static;
1079}
1080
1081/// Describes the functionality required for interfacing with HTTP client middleware
1082#[async_trait::async_trait]
1083pub trait Middleware: Send {
1084    /// Allows the cache mode to be overridden.
1085    ///
1086    /// This overrides any cache mode set in the configuration, including cache_mode_fn.
1087    fn overridden_cache_mode(&self) -> Option<CacheMode> {
1088        None
1089    }
1090    /// Determines if the request method is either GET or HEAD
1091    fn is_method_get_head(&self) -> bool;
1092    /// Returns a new cache policy with default options
1093    fn policy(&self, response: &HttpResponse) -> Result<CachePolicy>;
1094    /// Returns a new cache policy with custom options
1095    fn policy_with_options(
1096        &self,
1097        response: &HttpResponse,
1098        options: CacheOptions,
1099    ) -> Result<CachePolicy>;
1100    /// Attempts to update the request headers with the passed `http::request::Parts`
1101    fn update_headers(&mut self, parts: &request::Parts) -> Result<()>;
1102    /// Attempts to force the "no-cache" directive on the request
1103    fn force_no_cache(&mut self) -> Result<()>;
1104    /// Attempts to construct `http::request::Parts` from the request
1105    fn parts(&self) -> Result<request::Parts>;
1106    /// Attempts to determine the requested url
1107    fn url(&self) -> Result<Url>;
1108    /// Attempts to determine the request method
1109    fn method(&self) -> Result<String>;
1110    /// Attempts to fetch an upstream resource and return an [`HttpResponse`]
1111    async fn remote_fetch(&mut self) -> Result<HttpResponse>;
1112}
1113
1114/// An interface for HTTP caching that works with composable middleware patterns
1115/// like Tower. This trait separates the concerns of request analysis, cache lookup,
1116/// and response processing into discrete steps.
1117pub trait HttpCacheInterface<B = Vec<u8>>: Send + Sync {
1118    /// Analyze a request to determine cache behavior
1119    fn analyze_request(
1120        &self,
1121        parts: &request::Parts,
1122        mode_override: Option<CacheMode>,
1123    ) -> Result<CacheAnalysis>;
1124
1125    /// Look up a cached response for the given cache key
1126    #[allow(async_fn_in_trait)]
1127    async fn lookup_cached_response(
1128        &self,
1129        key: &str,
1130    ) -> Result<Option<(HttpResponse, CachePolicy)>>;
1131
1132    /// Process a fresh response from upstream and potentially cache it
1133    #[allow(async_fn_in_trait)]
1134    async fn process_response(
1135        &self,
1136        analysis: CacheAnalysis,
1137        response: Response<B>,
1138        metadata: Option<Vec<u8>>,
1139    ) -> Result<Response<B>>;
1140
1141    /// Update request headers for conditional requests (e.g., If-None-Match)
1142    fn prepare_conditional_request(
1143        &self,
1144        parts: &mut request::Parts,
1145        cached_response: &HttpResponse,
1146        policy: &CachePolicy,
1147    ) -> Result<()>;
1148
1149    /// Handle a 304 Not Modified response by returning the cached response
1150    #[allow(async_fn_in_trait)]
1151    async fn handle_not_modified(
1152        &self,
1153        cached_response: HttpResponse,
1154        fresh_parts: &response::Parts,
1155    ) -> Result<HttpResponse>;
1156}
1157
1158/// Streaming version of the HTTP cache interface that supports streaming request/response bodies
1159/// without buffering them in memory. This is ideal for large responses or when memory usage
1160/// is a concern.
1161pub trait HttpCacheStreamInterface: Send + Sync {
1162    /// The body type used by this cache implementation
1163    type Body: http_body::Body + Send + 'static;
1164
1165    /// Analyze a request to determine cache behavior
1166    fn analyze_request(
1167        &self,
1168        parts: &request::Parts,
1169        mode_override: Option<CacheMode>,
1170    ) -> Result<CacheAnalysis>;
1171
1172    /// Look up a cached response for the given cache key, returning a streaming body
1173    #[allow(async_fn_in_trait)]
1174    async fn lookup_cached_response(
1175        &self,
1176        key: &str,
1177    ) -> Result<Option<(Response<Self::Body>, CachePolicy)>>
1178    where
1179        <Self::Body as http_body::Body>::Data: Send,
1180        <Self::Body as http_body::Body>::Error:
1181            Into<StreamingError> + Send + Sync + 'static;
1182
1183    /// Process a fresh response from upstream and potentially cache it with streaming support
1184    #[allow(async_fn_in_trait)]
1185    async fn process_response<B>(
1186        &self,
1187        analysis: CacheAnalysis,
1188        response: Response<B>,
1189        metadata: Option<Vec<u8>>,
1190    ) -> Result<Response<Self::Body>>
1191    where
1192        B: http_body::Body + Send + 'static,
1193        B::Data: Send,
1194        B::Error: Into<StreamingError>,
1195        <Self::Body as http_body::Body>::Data: Send,
1196        <Self::Body as http_body::Body>::Error:
1197            Into<StreamingError> + Send + Sync + 'static;
1198
1199    /// Update request headers for conditional requests (e.g., If-None-Match)
1200    fn prepare_conditional_request(
1201        &self,
1202        parts: &mut request::Parts,
1203        cached_response: &Response<Self::Body>,
1204        policy: &CachePolicy,
1205    ) -> Result<()>;
1206
1207    /// Handle a 304 Not Modified response by returning the cached response
1208    #[allow(async_fn_in_trait)]
1209    async fn handle_not_modified(
1210        &self,
1211        cached_response: Response<Self::Body>,
1212        fresh_parts: &response::Parts,
1213    ) -> Result<Response<Self::Body>>
1214    where
1215        <Self::Body as http_body::Body>::Data: Send,
1216        <Self::Body as http_body::Body>::Error:
1217            Into<StreamingError> + Send + Sync + 'static;
1218}
1219
1220/// Analysis result for a request, containing cache key and caching decisions
1221#[derive(Debug, Clone)]
1222pub struct CacheAnalysis {
1223    /// The cache key for this request
1224    pub cache_key: String,
1225    /// Whether this request should be cached
1226    pub should_cache: bool,
1227    /// The effective cache mode for this request
1228    pub cache_mode: CacheMode,
1229    /// Keys to bust from cache before processing
1230    pub cache_bust_keys: Vec<String>,
1231    /// The request parts for policy creation
1232    pub request_parts: request::Parts,
1233    /// Whether this is a GET or HEAD request
1234    pub is_get_head: bool,
1235}
1236
1237/// Cache mode determines how the HTTP cache behaves for requests.
1238///
1239/// These modes are similar to [make-fetch-happen cache options](https://github.com/npm/make-fetch-happen#--optscache)
1240/// and provide fine-grained control over caching behavior.
1241///
1242/// # Examples
1243///
1244/// ```rust
1245/// # #[cfg(feature = "manager-cacache")]
1246/// # fn main() {
1247/// use http_cache::{CacheMode, HttpCache, CACacheManager, HttpCacheOptions};
1248///
1249/// let manager = CACacheManager::new("./cache".into(), true);
1250///
1251/// // Use different cache modes for different scenarios
1252/// let default_cache = HttpCache {
1253///     mode: CacheMode::Default,        // Standard HTTP caching rules
1254///     manager: manager.clone(),
1255///     options: HttpCacheOptions::default(),
1256/// };
1257///
1258/// let force_cache = HttpCache {
1259///     mode: CacheMode::ForceCache,     // Cache everything, ignore staleness
1260///     manager: manager.clone(),
1261///     options: HttpCacheOptions::default(),
1262/// };
1263///
1264/// let no_cache = HttpCache {
1265///     mode: CacheMode::NoStore,        // Never cache anything
1266///     manager,
1267///     options: HttpCacheOptions::default(),
1268/// };
1269/// # }
1270/// # #[cfg(not(feature = "manager-cacache"))]
1271/// # fn main() {}
1272/// ```
1273#[derive(Debug, Default, Clone, Copy, PartialEq, Eq)]
1274pub enum CacheMode {
1275    /// Standard HTTP caching behavior (recommended for most use cases).
1276    ///
1277    /// This mode:
1278    /// - Checks the cache for fresh responses and uses them
1279    /// - Makes conditional requests for stale responses (revalidation)
1280    /// - Makes normal requests when no cached response exists
1281    /// - Updates the cache with new responses
1282    /// - Falls back to stale responses if revalidation fails
1283    ///
1284    /// This is the most common mode and follows HTTP caching standards closely.
1285    #[default]
1286    Default,
1287
1288    /// Completely bypasses the cache.
1289    ///
1290    /// This mode:
1291    /// - Never reads from the cache
1292    /// - Never writes to the cache
1293    /// - Always makes fresh network requests
1294    ///
1295    /// Use this when you need to ensure every request goes to the origin server.
1296    NoStore,
1297
1298    /// Bypasses cache on request but updates cache with response.
1299    ///
1300    /// This mode:
1301    /// - Ignores any cached responses
1302    /// - Always makes a fresh network request
1303    /// - Updates the cache with the response
1304    ///
1305    /// Equivalent to a "hard refresh" - useful when you know the cache is stale.
1306    Reload,
1307
1308    /// Always revalidates cached responses.
1309    ///
1310    /// This mode:
1311    /// - Makes conditional requests if a cached response exists
1312    /// - Makes normal requests if no cached response exists
1313    /// - Updates the cache with responses
1314    ///
1315    /// Use this when you want to ensure content freshness while still benefiting
1316    /// from conditional requests (304 Not Modified responses).
1317    NoCache,
1318
1319    /// Uses cached responses regardless of staleness.
1320    ///
1321    /// This mode:
1322    /// - Uses any cached response, even if stale
1323    /// - Makes network requests only when no cached response exists
1324    /// - Updates the cache with new responses
1325    ///
1326    /// Useful for offline scenarios or when performance is more important than freshness.
1327    ForceCache,
1328
1329    /// Only serves from cache, never makes network requests.
1330    ///
1331    /// This mode:
1332    /// - Uses any cached response, even if stale
1333    /// - Returns an error if no cached response exists
1334    /// - Never makes network requests
1335    ///
1336    /// Use this for offline-only scenarios or when you want to guarantee
1337    /// no network traffic.
1338    OnlyIfCached,
1339
1340    /// Ignores HTTP caching rules and caches everything.
1341    ///
1342    /// This mode:
1343    /// - Caches all 200 responses regardless of cache-control headers
1344    /// - Uses cached responses regardless of staleness
1345    /// - Makes network requests when no cached response exists
1346    ///
1347    /// Use this when you want aggressive caching and don't want to respect
1348    /// server cache directives.
1349    IgnoreRules,
1350}
1351
1352impl TryFrom<http::Version> for HttpVersion {
1353    type Error = BoxError;
1354
1355    fn try_from(value: http::Version) -> Result<Self> {
1356        Ok(match value {
1357            http::Version::HTTP_09 => Self::Http09,
1358            http::Version::HTTP_10 => Self::Http10,
1359            http::Version::HTTP_11 => Self::Http11,
1360            http::Version::HTTP_2 => Self::H2,
1361            http::Version::HTTP_3 => Self::H3,
1362            _ => return Err(Box::new(BadVersion)),
1363        })
1364    }
1365}
1366
1367impl From<HttpVersion> for http::Version {
1368    fn from(value: HttpVersion) -> Self {
1369        match value {
1370            HttpVersion::Http09 => Self::HTTP_09,
1371            HttpVersion::Http10 => Self::HTTP_10,
1372            HttpVersion::Http11 => Self::HTTP_11,
1373            HttpVersion::H2 => Self::HTTP_2,
1374            HttpVersion::H3 => Self::HTTP_3,
1375        }
1376    }
1377}
1378
1379#[cfg(feature = "http-types")]
1380impl TryFrom<http_types::Version> for HttpVersion {
1381    type Error = BoxError;
1382
1383    fn try_from(value: http_types::Version) -> Result<Self> {
1384        Ok(match value {
1385            http_types::Version::Http0_9 => Self::Http09,
1386            http_types::Version::Http1_0 => Self::Http10,
1387            http_types::Version::Http1_1 => Self::Http11,
1388            http_types::Version::Http2_0 => Self::H2,
1389            http_types::Version::Http3_0 => Self::H3,
1390            _ => return Err(Box::new(BadVersion)),
1391        })
1392    }
1393}
1394
1395#[cfg(feature = "http-types")]
1396impl From<HttpVersion> for http_types::Version {
1397    fn from(value: HttpVersion) -> Self {
1398        match value {
1399            HttpVersion::Http09 => Self::Http0_9,
1400            HttpVersion::Http10 => Self::Http1_0,
1401            HttpVersion::Http11 => Self::Http1_1,
1402            HttpVersion::H2 => Self::Http2_0,
1403            HttpVersion::H3 => Self::Http3_0,
1404        }
1405    }
1406}
1407
1408/// Options struct provided by
1409/// [`http-cache-semantics`](https://github.com/kornelski/rusty-http-cache-semantics).
1410pub use http_cache_semantics::CacheOptions;
1411
1412/// A closure that takes [`http::request::Parts`] and returns a [`String`].
1413/// By default, the cache key is a combination of the request method and uri with a colon in between.
1414pub type CacheKey = Arc<dyn Fn(&request::Parts) -> String + Send + Sync>;
1415
1416/// A closure that takes [`http::request::Parts`] and returns a [`CacheMode`]
1417pub type CacheModeFn = Arc<dyn Fn(&request::Parts) -> CacheMode + Send + Sync>;
1418
1419/// A closure that takes [`http::request::Parts`], [`HttpResponse`] and returns a [`CacheMode`] to override caching behavior based on the response
1420pub type ResponseCacheModeFn = Arc<
1421    dyn Fn(&request::Parts, &HttpResponse) -> Option<CacheMode> + Send + Sync,
1422>;
1423
1424/// A closure that takes [`http::request::Parts`], [`Option<CacheKey>`], the default cache key ([`&str`]) and returns [`Vec<String>`] of keys to bust the cache for.
1425/// An empty vector means that no cache busting will be performed.
1426pub type CacheBust = Arc<
1427    dyn Fn(&request::Parts, &Option<CacheKey>, &str) -> Vec<String>
1428        + Send
1429        + Sync,
1430>;
1431
1432/// Type alias for metadata stored alongside cached responses.
1433/// Users are responsible for serialization/deserialization of this data.
1434pub type HttpCacheMetadata = Vec<u8>;
1435
1436/// A closure that takes [`http::request::Parts`] and [`http::response::Parts`] and returns optional metadata to store with the cached response.
1437/// This allows middleware to compute and store additional information alongside cached responses.
1438pub type MetadataProvider = Arc<
1439    dyn Fn(&request::Parts, &response::Parts) -> Option<HttpCacheMetadata>
1440        + Send
1441        + Sync,
1442>;
1443
1444/// A closure that takes a mutable reference to [`HttpResponse`] and modifies it before caching.
1445pub type ModifyResponse = Arc<dyn Fn(&mut HttpResponse) + Send + Sync>;
1446
1447/// Configuration options for customizing HTTP cache behavior on a per-request basis.
1448///
1449/// This struct allows you to override default caching behavior for individual requests
1450/// by providing custom cache options, cache keys, cache modes, and cache busting logic.
1451///
1452/// # Examples
1453///
1454/// ## Basic Custom Cache Key
1455/// ```rust
1456/// use http_cache::{HttpCacheOptions, CacheKey};
1457/// use http::request::Parts;
1458/// use std::sync::Arc;
1459///
1460/// let options = HttpCacheOptions {
1461///     cache_key: Some(Arc::new(|parts: &Parts| {
1462///         format!("custom:{}:{}", parts.method, parts.uri.path())
1463///     })),
1464///     ..Default::default()
1465/// };
1466/// ```
1467///
1468/// ## Custom Cache Mode per Request
1469/// ```rust
1470/// use http_cache::{HttpCacheOptions, CacheMode, CacheModeFn};
1471/// use http::request::Parts;
1472/// use std::sync::Arc;
1473///
1474/// let options = HttpCacheOptions {
1475///     cache_mode_fn: Some(Arc::new(|parts: &Parts| {
1476///         if parts.headers.contains_key("x-no-cache") {
1477///             CacheMode::NoStore
1478///         } else {
1479///             CacheMode::Default
1480///         }
1481///     })),
1482///     ..Default::default()
1483/// };
1484/// ```
1485///
1486/// ## Response-Based Cache Mode Override
1487/// ```rust
1488/// use http_cache::{HttpCacheOptions, ResponseCacheModeFn, CacheMode};
1489/// use http::request::Parts;
1490/// use http_cache::HttpResponse;
1491/// use std::sync::Arc;
1492///
1493/// let options = HttpCacheOptions {
1494///     response_cache_mode_fn: Some(Arc::new(|_parts: &Parts, response: &HttpResponse| {
1495///         // Force cache 2xx responses even if headers say not to cache
1496///         if response.status >= 200 && response.status < 300 {
1497///             Some(CacheMode::ForceCache)
1498///         } else if response.status == 429 { // Rate limited
1499///             Some(CacheMode::NoStore) // Don't cache rate limit responses
1500///         } else {
1501///             None // Use default behavior
1502///         }
1503///     })),
1504///     ..Default::default()
1505/// };
1506/// ```
1507///
1508/// ## Content-Type Based Cache Mode Override
1509/// ```rust
1510/// use http_cache::{HttpCacheOptions, ResponseCacheModeFn, CacheMode};
1511/// use http::request::Parts;
1512/// use http_cache::HttpResponse;
1513/// use std::sync::Arc;
1514///
1515/// let options = HttpCacheOptions {
1516///     response_cache_mode_fn: Some(Arc::new(|_parts: &Parts, response: &HttpResponse| {
1517///         // Cache different content types with different strategies
1518///         if let Some(content_type) = response.headers.get("content-type") {
1519///             match content_type.as_str() {
1520///                 ct if ct.starts_with("application/json") => Some(CacheMode::ForceCache),
1521///                 ct if ct.starts_with("image/") => Some(CacheMode::Default),
1522///                 ct if ct.starts_with("text/html") => Some(CacheMode::NoStore),
1523///                 _ => None, // Use default behavior for other types
1524///             }
1525///         } else {
1526///             Some(CacheMode::NoStore) // No content-type = don't cache
1527///         }
1528///     })),
1529///     ..Default::default()
1530/// };
1531/// ```
1532///
1533/// ## Cache Busting for Related Resources
1534/// ```rust
1535/// use http_cache::{HttpCacheOptions, CacheBust, CacheKey};
1536/// use http::request::Parts;
1537/// use std::sync::Arc;
1538///
1539/// let options = HttpCacheOptions {
1540///     cache_bust: Some(Arc::new(|parts: &Parts, _cache_key: &Option<CacheKey>, _uri: &str| {
1541///         if parts.method == "POST" && parts.uri.path().starts_with("/api/users") {
1542///             vec![
1543///                 "GET:/api/users".to_string(),
1544///                 "GET:/api/users/list".to_string(),
1545///             ]
1546///         } else {
1547///             vec![]
1548///         }
1549///     })),
1550///     ..Default::default()
1551/// };
1552/// ```
1553///
1554/// ## Storing Metadata with Cached Responses
1555/// ```rust
1556/// use http_cache::{HttpCacheOptions, MetadataProvider};
1557/// use http::{request, response};
1558/// use std::sync::Arc;
1559///
1560/// let options = HttpCacheOptions {
1561///     metadata_provider: Some(Arc::new(|request_parts: &request::Parts, response_parts: &response::Parts| {
1562///         // Store computed information with the cached response
1563///         let content_type = response_parts
1564///             .headers
1565///             .get("content-type")
1566///             .and_then(|v| v.to_str().ok())
1567///             .unwrap_or("unknown");
1568///
1569///         // Return serialized metadata (users handle serialization)
1570///         Some(format!("path={};content-type={}", request_parts.uri.path(), content_type).into_bytes())
1571///     })),
1572///     ..Default::default()
1573/// };
1574/// ```
1575#[derive(Clone)]
1576pub struct HttpCacheOptions {
1577    /// Override the default cache options.
1578    pub cache_options: Option<CacheOptions>,
1579    /// Override the default cache key generator.
1580    pub cache_key: Option<CacheKey>,
1581    /// Override the default cache mode.
1582    pub cache_mode_fn: Option<CacheModeFn>,
1583    /// Override cache behavior based on the response received.
1584    /// This function is called after receiving a response and can override
1585    /// the cache mode for that specific response. Returning `None` means
1586    /// use the default cache mode. This allows fine-grained control over
1587    /// caching behavior based on response status, headers, or content.
1588    pub response_cache_mode_fn: Option<ResponseCacheModeFn>,
1589    /// Bust the caches of the returned keys.
1590    pub cache_bust: Option<CacheBust>,
1591    /// Modifies the response before storing it in the cache.
1592    pub modify_response: Option<ModifyResponse>,
1593    /// Determines if the cache status headers should be added to the response.
1594    pub cache_status_headers: bool,
1595    /// Maximum time-to-live for cached responses.
1596    /// When set, this overrides any longer cache durations specified by the server.
1597    /// Particularly useful with `CacheMode::IgnoreRules` to provide expiration control.
1598    pub max_ttl: Option<Duration>,
1599    /// Rate limiter that applies only on cache misses.
1600    /// When enabled, requests that result in cache hits are returned immediately,
1601    /// while cache misses are rate limited before making network requests.
1602    /// This provides the optimal behavior for web scrapers and similar applications.
1603    #[cfg(feature = "rate-limiting")]
1604    pub rate_limiter: Option<Arc<dyn CacheAwareRateLimiter>>,
1605    /// Optional callback to provide metadata to store alongside cached responses.
1606    /// The callback receives request and response parts and can return metadata bytes.
1607    /// This is useful for storing computed information that should be associated with
1608    /// cached responses without recomputation on cache hits.
1609    pub metadata_provider: Option<MetadataProvider>,
1610}
1611
1612impl Default for HttpCacheOptions {
1613    fn default() -> Self {
1614        Self {
1615            cache_options: None,
1616            cache_key: None,
1617            cache_mode_fn: None,
1618            response_cache_mode_fn: None,
1619            cache_bust: None,
1620            modify_response: None,
1621            cache_status_headers: true,
1622            max_ttl: None,
1623            #[cfg(feature = "rate-limiting")]
1624            rate_limiter: None,
1625            metadata_provider: None,
1626        }
1627    }
1628}
1629
1630impl Debug for HttpCacheOptions {
1631    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1632        #[cfg(feature = "rate-limiting")]
1633        {
1634            f.debug_struct("HttpCacheOptions")
1635                .field("cache_options", &self.cache_options)
1636                .field("cache_key", &"Fn(&request::Parts) -> String")
1637                .field("cache_mode_fn", &"Fn(&request::Parts) -> CacheMode")
1638                .field(
1639                    "response_cache_mode_fn",
1640                    &"Fn(&request::Parts, &HttpResponse) -> Option<CacheMode>",
1641                )
1642                .field("cache_bust", &"Fn(&request::Parts) -> Vec<String>")
1643                .field("modify_response", &"Fn(&mut ModifyResponse)")
1644                .field("cache_status_headers", &self.cache_status_headers)
1645                .field("max_ttl", &self.max_ttl)
1646                .field("rate_limiter", &"Option<CacheAwareRateLimiter>")
1647                .field(
1648                    "metadata_provider",
1649                    &"Fn(&request::Parts, &response::Parts) -> Option<Vec<u8>>",
1650                )
1651                .finish()
1652        }
1653
1654        #[cfg(not(feature = "rate-limiting"))]
1655        {
1656            f.debug_struct("HttpCacheOptions")
1657                .field("cache_options", &self.cache_options)
1658                .field("cache_key", &"Fn(&request::Parts) -> String")
1659                .field("cache_mode_fn", &"Fn(&request::Parts) -> CacheMode")
1660                .field(
1661                    "response_cache_mode_fn",
1662                    &"Fn(&request::Parts, &HttpResponse) -> Option<CacheMode>",
1663                )
1664                .field("cache_bust", &"Fn(&request::Parts) -> Vec<String>")
1665                .field("modify_response", &"Fn(&mut ModifyResponse)")
1666                .field("cache_status_headers", &self.cache_status_headers)
1667                .field("max_ttl", &self.max_ttl)
1668                .field(
1669                    "metadata_provider",
1670                    &"Fn(&request::Parts, &response::Parts) -> Option<Vec<u8>>",
1671                )
1672                .finish()
1673        }
1674    }
1675}
1676
1677impl HttpCacheOptions {
1678    fn create_cache_key(
1679        &self,
1680        parts: &request::Parts,
1681        override_method: Option<&str>,
1682    ) -> String {
1683        if let Some(cache_key) = &self.cache_key {
1684            cache_key(parts)
1685        } else {
1686            format!(
1687                "{}:{}",
1688                override_method.unwrap_or_else(|| parts.method.as_str()),
1689                parts.uri
1690            )
1691        }
1692    }
1693
1694    /// Helper function for other crates to generate cache keys for invalidation
1695    /// This ensures consistent cache key generation across all implementations
1696    pub fn create_cache_key_for_invalidation(
1697        &self,
1698        parts: &request::Parts,
1699        method_override: &str,
1700    ) -> String {
1701        self.create_cache_key(parts, Some(method_override))
1702    }
1703
1704    /// Converts HttpResponse to http::Response with the given body type
1705    pub fn http_response_to_response<B>(
1706        http_response: &HttpResponse,
1707        body: B,
1708    ) -> Result<Response<B>> {
1709        let mut response_builder = Response::builder()
1710            .status(http_response.status)
1711            .version(http_response.version.into());
1712
1713        for (name, value) in &http_response.headers {
1714            if let (Ok(header_name), Ok(header_value)) =
1715                (name.parse::<http::HeaderName>(), value.parse::<HeaderValue>())
1716            {
1717                response_builder =
1718                    response_builder.header(header_name, header_value);
1719            }
1720        }
1721
1722        Ok(response_builder.body(body)?)
1723    }
1724
1725    /// Converts response parts to HttpResponse format for cache mode evaluation
1726    fn parts_to_http_response(
1727        &self,
1728        parts: &response::Parts,
1729        request_parts: &request::Parts,
1730        metadata: Option<Vec<u8>>,
1731    ) -> Result<HttpResponse> {
1732        Ok(HttpResponse {
1733            body: vec![], // We don't need the full body for cache mode decision
1734            headers: (&parts.headers).into(),
1735            status: parts.status.as_u16(),
1736            url: extract_url_from_request_parts(request_parts)?,
1737            version: parts.version.try_into()?,
1738            metadata,
1739        })
1740    }
1741
1742    /// Evaluates response-based cache mode override
1743    fn evaluate_response_cache_mode(
1744        &self,
1745        request_parts: &request::Parts,
1746        http_response: &HttpResponse,
1747        original_mode: CacheMode,
1748    ) -> CacheMode {
1749        if let Some(response_cache_mode_fn) = &self.response_cache_mode_fn {
1750            if let Some(override_mode) =
1751                response_cache_mode_fn(request_parts, http_response)
1752            {
1753                return override_mode;
1754            }
1755        }
1756        original_mode
1757    }
1758
1759    /// Generates metadata for a response using the metadata_provider callback if configured
1760    pub fn generate_metadata(
1761        &self,
1762        request_parts: &request::Parts,
1763        response_parts: &response::Parts,
1764    ) -> Option<HttpCacheMetadata> {
1765        self.metadata_provider
1766            .as_ref()
1767            .and_then(|provider| provider(request_parts, response_parts))
1768    }
1769
1770    /// Modifies the response before caching if a modifier function is provided
1771    fn modify_response_before_caching(&self, response: &mut HttpResponse) {
1772        if let Some(modify_response) = &self.modify_response {
1773            modify_response(response);
1774        }
1775    }
1776
1777    /// Creates a cache policy for the given request and response
1778    fn create_cache_policy(
1779        &self,
1780        request_parts: &request::Parts,
1781        response_parts: &response::Parts,
1782    ) -> CachePolicy {
1783        let cache_options = self.cache_options.unwrap_or_default();
1784
1785        // If max_ttl is specified, we need to modify the response headers to enforce it
1786        if let Some(max_ttl) = self.max_ttl {
1787            // Parse existing cache-control header
1788            let cache_control = response_parts
1789                .headers
1790                .get("cache-control")
1791                .and_then(|v| v.to_str().ok())
1792                .unwrap_or("");
1793
1794            // Extract existing max-age if present
1795            let existing_max_age =
1796                cache_control.split(',').find_map(|directive| {
1797                    let directive = directive.trim();
1798                    if directive.starts_with("max-age=") {
1799                        directive.strip_prefix("max-age=")?.parse::<u64>().ok()
1800                    } else {
1801                        None
1802                    }
1803                });
1804
1805            // Convert max_ttl to seconds
1806            let max_ttl_seconds = max_ttl.as_secs();
1807
1808            // Apply max_ttl by setting max-age to the minimum of existing max-age and max_ttl
1809            let effective_max_age = match existing_max_age {
1810                Some(existing) => std::cmp::min(existing, max_ttl_seconds),
1811                None => max_ttl_seconds,
1812            };
1813
1814            // Build new cache-control header
1815            let mut new_directives = Vec::new();
1816
1817            // Add non-max-age directives from existing cache-control
1818            for directive in cache_control.split(',').map(|d| d.trim()) {
1819                if !directive.starts_with("max-age=") && !directive.is_empty() {
1820                    new_directives.push(directive.to_string());
1821                }
1822            }
1823
1824            // Add our effective max-age
1825            new_directives.push(format!("max-age={}", effective_max_age));
1826
1827            let new_cache_control = new_directives.join(", ");
1828
1829            // Create modified response parts - we have to clone since response::Parts has private fields
1830            let mut modified_response_parts = response_parts.clone();
1831            modified_response_parts.headers.insert(
1832                "cache-control",
1833                HeaderValue::from_str(&new_cache_control)
1834                    .unwrap_or_else(|_| HeaderValue::from_static("max-age=0")),
1835            );
1836
1837            CachePolicy::new_options(
1838                request_parts,
1839                &modified_response_parts,
1840                SystemTime::now(),
1841                cache_options,
1842            )
1843        } else {
1844            CachePolicy::new_options(
1845                request_parts,
1846                response_parts,
1847                SystemTime::now(),
1848                cache_options,
1849            )
1850        }
1851    }
1852
1853    /// Determines if a response should be cached based on cache mode and HTTP semantics
1854    fn should_cache_response(
1855        &self,
1856        effective_cache_mode: CacheMode,
1857        http_response: &HttpResponse,
1858        is_get_head: bool,
1859        policy: &CachePolicy,
1860    ) -> bool {
1861        // HTTP status codes that are cacheable by default (RFC 7234)
1862        let is_cacheable_status = matches!(
1863            http_response.status,
1864            200 | 203 | 204 | 206 | 300 | 301 | 404 | 405 | 410 | 414 | 501
1865        );
1866
1867        if is_cacheable_status {
1868            match effective_cache_mode {
1869                CacheMode::ForceCache => is_get_head,
1870                CacheMode::IgnoreRules => true,
1871                CacheMode::NoStore => false,
1872                _ => is_get_head && policy.is_storable(),
1873            }
1874        } else {
1875            false
1876        }
1877    }
1878
1879    /// Common request analysis logic shared between streaming and non-streaming implementations
1880    fn analyze_request_internal(
1881        &self,
1882        parts: &request::Parts,
1883        mode_override: Option<CacheMode>,
1884        default_mode: CacheMode,
1885    ) -> Result<CacheAnalysis> {
1886        let effective_mode = mode_override
1887            .or_else(|| self.cache_mode_fn.as_ref().map(|f| f(parts)))
1888            .unwrap_or(default_mode);
1889
1890        let is_get_head = parts.method == "GET" || parts.method == "HEAD";
1891        let should_cache = effective_mode == CacheMode::IgnoreRules
1892            || (is_get_head && effective_mode != CacheMode::NoStore);
1893
1894        let cache_key = self.create_cache_key(parts, None);
1895
1896        let cache_bust_keys = if let Some(cache_bust) = &self.cache_bust {
1897            cache_bust(parts, &self.cache_key, &cache_key)
1898        } else {
1899            Vec::new()
1900        };
1901
1902        Ok(CacheAnalysis {
1903            cache_key,
1904            should_cache,
1905            cache_mode: effective_mode,
1906            cache_bust_keys,
1907            request_parts: parts.clone(),
1908            is_get_head,
1909        })
1910    }
1911}
1912
1913/// Caches requests according to http spec.
1914#[derive(Debug, Clone)]
1915pub struct HttpCache<T: CacheManager> {
1916    /// Determines the manager behavior.
1917    pub mode: CacheMode,
1918    /// Manager instance that implements the [`CacheManager`] trait.
1919    /// By default, a manager implementation with [`cacache`](https://github.com/zkat/cacache-rs)
1920    /// as the backend has been provided, see [`CACacheManager`].
1921    pub manager: T,
1922    /// Override the default cache options.
1923    pub options: HttpCacheOptions,
1924}
1925
1926/// Streaming version of HTTP cache that supports streaming request/response bodies
1927/// without buffering them in memory.
1928#[derive(Debug, Clone)]
1929pub struct HttpStreamingCache<T: StreamingCacheManager> {
1930    /// Determines the manager behavior.
1931    pub mode: CacheMode,
1932    /// Manager instance that implements the [`StreamingCacheManager`] trait.
1933    pub manager: T,
1934    /// Override the default cache options.
1935    pub options: HttpCacheOptions,
1936}
1937
1938#[allow(dead_code)]
1939impl<T: CacheManager> HttpCache<T> {
1940    /// Determines if the request should be cached
1941    pub fn can_cache_request(
1942        &self,
1943        middleware: &impl Middleware,
1944    ) -> Result<bool> {
1945        let analysis = self.analyze_request(
1946            &middleware.parts()?,
1947            middleware.overridden_cache_mode(),
1948        )?;
1949        Ok(analysis.should_cache)
1950    }
1951
1952    /// Apply rate limiting if enabled in options
1953    #[cfg(feature = "rate-limiting")]
1954    async fn apply_rate_limiting(&self, url: &Url) {
1955        if let Some(rate_limiter) = &self.options.rate_limiter {
1956            let rate_limit_key = url_hostname(url).unwrap_or("unknown");
1957            rate_limiter.until_key_ready(rate_limit_key).await;
1958        }
1959    }
1960
1961    /// Apply rate limiting if enabled in options (no-op without rate-limiting feature)
1962    #[cfg(not(feature = "rate-limiting"))]
1963    async fn apply_rate_limiting(&self, _url: &Url) {
1964        // No-op when rate limiting feature is not enabled
1965    }
1966
1967    /// Runs the actions to preform when the client middleware is running without the cache
1968    pub async fn run_no_cache(
1969        &self,
1970        middleware: &mut impl Middleware,
1971    ) -> Result<()> {
1972        let parts = middleware.parts()?;
1973
1974        self.manager
1975            .delete(&self.options.create_cache_key(&parts, Some("GET")))
1976            .await
1977            .ok();
1978
1979        let cache_key = self.options.create_cache_key(&parts, None);
1980
1981        if let Some(cache_bust) = &self.options.cache_bust {
1982            for key_to_cache_bust in
1983                cache_bust(&parts, &self.options.cache_key, &cache_key)
1984            {
1985                self.manager.delete(&key_to_cache_bust).await?;
1986            }
1987        }
1988
1989        Ok(())
1990    }
1991
1992    /// Attempts to run the passed middleware along with the cache
1993    pub async fn run(
1994        &self,
1995        mut middleware: impl Middleware,
1996    ) -> Result<HttpResponse> {
1997        // Use the HttpCacheInterface to analyze the request
1998        let analysis = self.analyze_request(
1999            &middleware.parts()?,
2000            middleware.overridden_cache_mode(),
2001        )?;
2002
2003        if !analysis.should_cache {
2004            return self.remote_fetch(&mut middleware).await;
2005        }
2006
2007        // Bust cache keys if needed
2008        for key in &analysis.cache_bust_keys {
2009            self.manager.delete(key).await?;
2010        }
2011
2012        // Look up cached response
2013        if let Some((mut cached_response, policy)) =
2014            self.lookup_cached_response(&analysis.cache_key).await?
2015        {
2016            if self.options.cache_status_headers {
2017                cached_response.cache_lookup_status(HitOrMiss::HIT);
2018            }
2019
2020            // Handle warning headers
2021            if let Some(warning_code) = cached_response.warning_code() {
2022                // https://tools.ietf.org/html/rfc7234#section-4.3.4
2023                //
2024                // If a stored response is selected for update, the cache MUST:
2025                //
2026                // * delete any warning header fields in the stored response with
2027                //   warn-code 1xx (see Section 5.5);
2028                //
2029                // * retain any warning header fields in the stored response with
2030                //   warn-code 2xx;
2031                //
2032                if (100..200).contains(&warning_code) {
2033                    cached_response.remove_warning();
2034                }
2035            }
2036
2037            match analysis.cache_mode {
2038                CacheMode::Default => {
2039                    self.conditional_fetch(middleware, cached_response, policy)
2040                        .await
2041                }
2042                CacheMode::NoCache => {
2043                    middleware.force_no_cache()?;
2044                    let mut res = self.remote_fetch(&mut middleware).await?;
2045                    if self.options.cache_status_headers {
2046                        res.cache_lookup_status(HitOrMiss::HIT);
2047                    }
2048                    Ok(res)
2049                }
2050                CacheMode::ForceCache
2051                | CacheMode::OnlyIfCached
2052                | CacheMode::IgnoreRules => {
2053                    //   112 Disconnected operation
2054                    // SHOULD be included if the cache is intentionally disconnected from
2055                    // the rest of the network for a period of time.
2056                    // (https://tools.ietf.org/html/rfc2616#section-14.46)
2057                    cached_response.add_warning(
2058                        &cached_response.url.clone(),
2059                        112,
2060                        "Disconnected operation",
2061                    );
2062                    if self.options.cache_status_headers {
2063                        cached_response.cache_status(HitOrMiss::HIT);
2064                    }
2065                    Ok(cached_response)
2066                }
2067                _ => self.remote_fetch(&mut middleware).await,
2068            }
2069        } else {
2070            match analysis.cache_mode {
2071                CacheMode::OnlyIfCached => {
2072                    // ENOTCACHED
2073                    let mut res = HttpResponse {
2074                        body: b"GatewayTimeout".to_vec(),
2075                        headers: HttpHeaders::default(),
2076                        status: 504,
2077                        url: middleware.url()?,
2078                        version: HttpVersion::Http11,
2079                        metadata: None,
2080                    };
2081                    if self.options.cache_status_headers {
2082                        res.cache_status(HitOrMiss::MISS);
2083                        res.cache_lookup_status(HitOrMiss::MISS);
2084                    }
2085                    Ok(res)
2086                }
2087                _ => self.remote_fetch(&mut middleware).await,
2088            }
2089        }
2090    }
2091
2092    fn cache_mode(&self, middleware: &impl Middleware) -> Result<CacheMode> {
2093        Ok(if let Some(mode) = middleware.overridden_cache_mode() {
2094            mode
2095        } else if let Some(cache_mode_fn) = &self.options.cache_mode_fn {
2096            cache_mode_fn(&middleware.parts()?)
2097        } else {
2098            self.mode
2099        })
2100    }
2101
2102    async fn remote_fetch(
2103        &self,
2104        middleware: &mut impl Middleware,
2105    ) -> Result<HttpResponse> {
2106        // Apply rate limiting before making the network request
2107        let url = middleware.url()?;
2108        self.apply_rate_limiting(&url).await;
2109
2110        let mut res = middleware.remote_fetch().await?;
2111        if self.options.cache_status_headers {
2112            res.cache_status(HitOrMiss::MISS);
2113            res.cache_lookup_status(HitOrMiss::MISS);
2114        }
2115        let policy = match self.options.cache_options {
2116            Some(options) => middleware.policy_with_options(&res, options)?,
2117            None => middleware.policy(&res)?,
2118        };
2119        let is_get_head = middleware.is_method_get_head();
2120        let mut mode = self.cache_mode(middleware)?;
2121        let parts = middleware.parts()?;
2122
2123        // Allow response-based cache mode override
2124        if let Some(response_cache_mode_fn) =
2125            &self.options.response_cache_mode_fn
2126        {
2127            if let Some(override_mode) = response_cache_mode_fn(&parts, &res) {
2128                mode = override_mode;
2129            }
2130        }
2131
2132        let is_cacheable = self.options.should_cache_response(
2133            mode,
2134            &res,
2135            is_get_head,
2136            &policy,
2137        );
2138
2139        if is_cacheable {
2140            // Generate metadata using the provider callback if configured
2141            let response_parts = res.parts()?;
2142            res.metadata =
2143                self.options.generate_metadata(&parts, &response_parts);
2144
2145            self.options.modify_response_before_caching(&mut res);
2146            Ok(self
2147                .manager
2148                .put(self.options.create_cache_key(&parts, None), res, policy)
2149                .await?)
2150        } else if !is_get_head {
2151            self.manager
2152                .delete(&self.options.create_cache_key(&parts, Some("GET")))
2153                .await
2154                .ok();
2155            Ok(res)
2156        } else {
2157            Ok(res)
2158        }
2159    }
2160
2161    async fn conditional_fetch(
2162        &self,
2163        mut middleware: impl Middleware,
2164        mut cached_res: HttpResponse,
2165        mut policy: CachePolicy,
2166    ) -> Result<HttpResponse> {
2167        let parts = middleware.parts()?;
2168        let before_req = policy.before_request(&parts, SystemTime::now());
2169        match before_req {
2170            BeforeRequest::Fresh(parts) => {
2171                cached_res.update_headers(&parts)?;
2172                if self.options.cache_status_headers {
2173                    cached_res.cache_status(HitOrMiss::HIT);
2174                    cached_res.cache_lookup_status(HitOrMiss::HIT);
2175                }
2176                return Ok(cached_res);
2177            }
2178            BeforeRequest::Stale { request: parts, matches } => {
2179                if matches {
2180                    middleware.update_headers(&parts)?;
2181                }
2182            }
2183        }
2184        let req_url = middleware.url()?;
2185        // Apply rate limiting before revalidation request
2186        self.apply_rate_limiting(&req_url).await;
2187        match middleware.remote_fetch().await {
2188            Ok(mut cond_res) => {
2189                let status = StatusCode::from_u16(cond_res.status)?;
2190                if status.is_server_error() && cached_res.must_revalidate() {
2191                    //   111 Revalidation failed
2192                    //   MUST be included if a cache returns a stale response
2193                    //   because an attempt to revalidate the response failed,
2194                    //   due to an inability to reach the server.
2195                    // (https://tools.ietf.org/html/rfc2616#section-14.46)
2196                    cached_res.add_warning(
2197                        &req_url,
2198                        111,
2199                        "Revalidation failed",
2200                    );
2201                    if self.options.cache_status_headers {
2202                        cached_res.cache_status(HitOrMiss::HIT);
2203                    }
2204                    Ok(cached_res)
2205                } else if cond_res.status == 304 {
2206                    let after_res = policy.after_response(
2207                        &parts,
2208                        &cond_res.parts()?,
2209                        SystemTime::now(),
2210                    );
2211                    match after_res {
2212                        AfterResponse::Modified(new_policy, parts)
2213                        | AfterResponse::NotModified(new_policy, parts) => {
2214                            policy = new_policy;
2215                            cached_res.update_headers(&parts)?;
2216                        }
2217                    }
2218                    if self.options.cache_status_headers {
2219                        cached_res.cache_status(HitOrMiss::HIT);
2220                        cached_res.cache_lookup_status(HitOrMiss::HIT);
2221                    }
2222                    self.options
2223                        .modify_response_before_caching(&mut cached_res);
2224                    let res = self
2225                        .manager
2226                        .put(
2227                            self.options.create_cache_key(&parts, None),
2228                            cached_res,
2229                            policy,
2230                        )
2231                        .await?;
2232                    Ok(res)
2233                } else if cond_res.status == 200 {
2234                    let policy = match self.options.cache_options {
2235                        Some(options) => middleware
2236                            .policy_with_options(&cond_res, options)?,
2237                        None => middleware.policy(&cond_res)?,
2238                    };
2239                    if self.options.cache_status_headers {
2240                        cond_res.cache_status(HitOrMiss::MISS);
2241                        cond_res.cache_lookup_status(HitOrMiss::HIT);
2242                    }
2243                    // Generate metadata using the provider callback if configured
2244                    let response_parts = cond_res.parts()?;
2245                    cond_res.metadata =
2246                        self.options.generate_metadata(&parts, &response_parts);
2247
2248                    self.options.modify_response_before_caching(&mut cond_res);
2249                    let res = self
2250                        .manager
2251                        .put(
2252                            self.options.create_cache_key(&parts, None),
2253                            cond_res,
2254                            policy,
2255                        )
2256                        .await?;
2257                    Ok(res)
2258                } else {
2259                    // Return fresh response for any status other than 304 or 200
2260                    if self.options.cache_status_headers {
2261                        cond_res.cache_status(HitOrMiss::MISS);
2262                        cond_res.cache_lookup_status(HitOrMiss::HIT);
2263                    }
2264                    Ok(cond_res)
2265                }
2266            }
2267            Err(e) => {
2268                if cached_res.must_revalidate() {
2269                    Err(e)
2270                } else {
2271                    //   111 Revalidation failed
2272                    //   MUST be included if a cache returns a stale response
2273                    //   because an attempt to revalidate the response failed,
2274                    //   due to an inability to reach the server.
2275                    // (https://tools.ietf.org/html/rfc2616#section-14.46)
2276                    cached_res.add_warning(
2277                        &req_url,
2278                        111,
2279                        "Revalidation failed",
2280                    );
2281                    if self.options.cache_status_headers {
2282                        cached_res.cache_status(HitOrMiss::HIT);
2283                    }
2284                    Ok(cached_res)
2285                }
2286            }
2287        }
2288    }
2289}
2290
2291impl<T: StreamingCacheManager> HttpCacheStreamInterface
2292    for HttpStreamingCache<T>
2293where
2294    <T::Body as http_body::Body>::Data: Send,
2295    <T::Body as http_body::Body>::Error:
2296        Into<StreamingError> + Send + Sync + 'static,
2297{
2298    type Body = T::Body;
2299
2300    fn analyze_request(
2301        &self,
2302        parts: &request::Parts,
2303        mode_override: Option<CacheMode>,
2304    ) -> Result<CacheAnalysis> {
2305        self.options.analyze_request_internal(parts, mode_override, self.mode)
2306    }
2307
2308    async fn lookup_cached_response(
2309        &self,
2310        key: &str,
2311    ) -> Result<Option<(Response<Self::Body>, CachePolicy)>> {
2312        if let Some((mut response, policy)) = self.manager.get(key).await? {
2313            // Add cache status headers if enabled
2314            if self.options.cache_status_headers {
2315                response.headers_mut().insert(
2316                    XCACHE,
2317                    "HIT".parse().map_err(StreamingError::new)?,
2318                );
2319                response.headers_mut().insert(
2320                    XCACHELOOKUP,
2321                    "HIT".parse().map_err(StreamingError::new)?,
2322                );
2323            }
2324            Ok(Some((response, policy)))
2325        } else {
2326            Ok(None)
2327        }
2328    }
2329
2330    async fn process_response<B>(
2331        &self,
2332        analysis: CacheAnalysis,
2333        response: Response<B>,
2334        metadata: Option<Vec<u8>>,
2335    ) -> Result<Response<Self::Body>>
2336    where
2337        B: http_body::Body + Send + 'static,
2338        B::Data: Send,
2339        B::Error: Into<StreamingError>,
2340        <T::Body as http_body::Body>::Data: Send,
2341        <T::Body as http_body::Body>::Error:
2342            Into<StreamingError> + Send + Sync + 'static,
2343    {
2344        // For non-cacheable requests based on initial analysis, convert them to manager's body type
2345        if !analysis.should_cache {
2346            let mut converted_response =
2347                self.manager.convert_body(response).await?;
2348            // Add cache miss headers
2349            if self.options.cache_status_headers {
2350                converted_response.headers_mut().insert(
2351                    XCACHE,
2352                    "MISS".parse().map_err(StreamingError::new)?,
2353                );
2354                converted_response.headers_mut().insert(
2355                    XCACHELOOKUP,
2356                    "MISS".parse().map_err(StreamingError::new)?,
2357                );
2358            }
2359            return Ok(converted_response);
2360        }
2361
2362        // Bust cache keys if needed
2363        for key in &analysis.cache_bust_keys {
2364            self.manager.delete(key).await?;
2365        }
2366
2367        // Convert response to HttpResponse format for response-based cache mode evaluation
2368        let (parts, body) = response.into_parts();
2369        // Use provided metadata or generate from provider
2370        let effective_metadata = metadata.or_else(|| {
2371            self.options.generate_metadata(&analysis.request_parts, &parts)
2372        });
2373        let http_response = self.options.parts_to_http_response(
2374            &parts,
2375            &analysis.request_parts,
2376            effective_metadata.clone(),
2377        )?;
2378
2379        // Check for response-based cache mode override
2380        let effective_cache_mode = self.options.evaluate_response_cache_mode(
2381            &analysis.request_parts,
2382            &http_response,
2383            analysis.cache_mode,
2384        );
2385
2386        // Reconstruct response for further processing
2387        let response = Response::from_parts(parts, body);
2388
2389        // If response-based override says NoStore, don't cache
2390        if effective_cache_mode == CacheMode::NoStore {
2391            let mut converted_response =
2392                self.manager.convert_body(response).await?;
2393            // Add cache miss headers
2394            if self.options.cache_status_headers {
2395                converted_response.headers_mut().insert(
2396                    XCACHE,
2397                    "MISS".parse().map_err(StreamingError::new)?,
2398                );
2399                converted_response.headers_mut().insert(
2400                    XCACHELOOKUP,
2401                    "MISS".parse().map_err(StreamingError::new)?,
2402                );
2403            }
2404            return Ok(converted_response);
2405        }
2406
2407        // Create policy for the response
2408        let (parts, body) = response.into_parts();
2409        let policy =
2410            self.options.create_cache_policy(&analysis.request_parts, &parts);
2411
2412        // Reconstruct response for caching
2413        let response = Response::from_parts(parts, body);
2414
2415        let should_cache_response = self.options.should_cache_response(
2416            effective_cache_mode,
2417            &http_response,
2418            analysis.is_get_head,
2419            &policy,
2420        );
2421
2422        if should_cache_response {
2423            // Extract URL from request parts for caching
2424            let request_url =
2425                extract_url_from_request_parts(&analysis.request_parts)?;
2426
2427            // Cache the response using the streaming manager
2428            let mut cached_response = self
2429                .manager
2430                .put(
2431                    analysis.cache_key,
2432                    response,
2433                    policy,
2434                    request_url,
2435                    effective_metadata,
2436                )
2437                .await?;
2438
2439            // Add cache miss headers (response is being stored for first time)
2440            if self.options.cache_status_headers {
2441                cached_response.headers_mut().insert(
2442                    XCACHE,
2443                    "MISS".parse().map_err(StreamingError::new)?,
2444                );
2445                cached_response.headers_mut().insert(
2446                    XCACHELOOKUP,
2447                    "MISS".parse().map_err(StreamingError::new)?,
2448                );
2449            }
2450            Ok(cached_response)
2451        } else {
2452            // Don't cache, just convert to manager's body type
2453            let mut converted_response =
2454                self.manager.convert_body(response).await?;
2455            // Add cache miss headers
2456            if self.options.cache_status_headers {
2457                converted_response.headers_mut().insert(
2458                    XCACHE,
2459                    "MISS".parse().map_err(StreamingError::new)?,
2460                );
2461                converted_response.headers_mut().insert(
2462                    XCACHELOOKUP,
2463                    "MISS".parse().map_err(StreamingError::new)?,
2464                );
2465            }
2466            Ok(converted_response)
2467        }
2468    }
2469
2470    fn prepare_conditional_request(
2471        &self,
2472        parts: &mut request::Parts,
2473        _cached_response: &Response<Self::Body>,
2474        policy: &CachePolicy,
2475    ) -> Result<()> {
2476        let before_req = policy.before_request(parts, SystemTime::now());
2477        if let BeforeRequest::Stale { request, .. } = before_req {
2478            parts.headers.extend(request.headers);
2479        }
2480        Ok(())
2481    }
2482
2483    async fn handle_not_modified(
2484        &self,
2485        cached_response: Response<Self::Body>,
2486        fresh_parts: &response::Parts,
2487    ) -> Result<Response<Self::Body>> {
2488        let (mut parts, body) = cached_response.into_parts();
2489
2490        // Update headers from the 304 response
2491        parts.headers.extend(fresh_parts.headers.clone());
2492
2493        Ok(Response::from_parts(parts, body))
2494    }
2495}
2496
2497impl<T: CacheManager> HttpCacheInterface for HttpCache<T> {
2498    fn analyze_request(
2499        &self,
2500        parts: &request::Parts,
2501        mode_override: Option<CacheMode>,
2502    ) -> Result<CacheAnalysis> {
2503        self.options.analyze_request_internal(parts, mode_override, self.mode)
2504    }
2505
2506    async fn lookup_cached_response(
2507        &self,
2508        key: &str,
2509    ) -> Result<Option<(HttpResponse, CachePolicy)>> {
2510        self.manager.get(key).await
2511    }
2512
2513    async fn process_response(
2514        &self,
2515        analysis: CacheAnalysis,
2516        response: Response<Vec<u8>>,
2517        metadata: Option<Vec<u8>>,
2518    ) -> Result<Response<Vec<u8>>> {
2519        if !analysis.should_cache {
2520            return Ok(response);
2521        }
2522
2523        // Bust cache keys if needed
2524        for key in &analysis.cache_bust_keys {
2525            self.manager.delete(key).await?;
2526        }
2527
2528        // Convert response to HttpResponse format
2529        let (parts, body) = response.into_parts();
2530        // Use provided metadata or generate from provider
2531        let effective_metadata = metadata.or_else(|| {
2532            self.options.generate_metadata(&analysis.request_parts, &parts)
2533        });
2534        let mut http_response = self.options.parts_to_http_response(
2535            &parts,
2536            &analysis.request_parts,
2537            effective_metadata,
2538        )?;
2539        http_response.body = body.clone(); // Include the body for buffered cache managers
2540
2541        // Check for response-based cache mode override
2542        let effective_cache_mode = self.options.evaluate_response_cache_mode(
2543            &analysis.request_parts,
2544            &http_response,
2545            analysis.cache_mode,
2546        );
2547
2548        // If response-based override says NoStore, don't cache
2549        if effective_cache_mode == CacheMode::NoStore {
2550            let response = Response::from_parts(parts, body);
2551            return Ok(response);
2552        }
2553
2554        // Create policy and determine if we should cache based on response-based mode
2555        let policy = self.options.create_cache_policy(
2556            &analysis.request_parts,
2557            &http_response.parts()?,
2558        );
2559
2560        let should_cache_response = self.options.should_cache_response(
2561            effective_cache_mode,
2562            &http_response,
2563            analysis.is_get_head,
2564            &policy,
2565        );
2566
2567        if should_cache_response {
2568            let cached_response = self
2569                .manager
2570                .put(analysis.cache_key, http_response, policy)
2571                .await?;
2572
2573            // Convert back to standard Response
2574            let response_parts = cached_response.parts()?;
2575            let mut response = Response::builder()
2576                .status(response_parts.status)
2577                .version(response_parts.version)
2578                .body(cached_response.body)?;
2579
2580            // Copy headers from the response parts
2581            *response.headers_mut() = response_parts.headers;
2582
2583            Ok(response)
2584        } else {
2585            // Don't cache, return original response
2586            let response = Response::from_parts(parts, body);
2587            Ok(response)
2588        }
2589    }
2590
2591    fn prepare_conditional_request(
2592        &self,
2593        parts: &mut request::Parts,
2594        _cached_response: &HttpResponse,
2595        policy: &CachePolicy,
2596    ) -> Result<()> {
2597        let before_req = policy.before_request(parts, SystemTime::now());
2598        if let BeforeRequest::Stale { request, .. } = before_req {
2599            parts.headers.extend(request.headers);
2600        }
2601        Ok(())
2602    }
2603
2604    async fn handle_not_modified(
2605        &self,
2606        mut cached_response: HttpResponse,
2607        fresh_parts: &response::Parts,
2608    ) -> Result<HttpResponse> {
2609        cached_response.update_headers(fresh_parts)?;
2610        if self.options.cache_status_headers {
2611            cached_response.cache_status(HitOrMiss::HIT);
2612            cached_response.cache_lookup_status(HitOrMiss::HIT);
2613        }
2614        Ok(cached_response)
2615    }
2616}
2617
2618#[allow(dead_code)]
2619#[cfg(test)]
2620mod test;
http_cache/lib.rs

http_cache/
lib.rs