vecstore 1.0.0 - Docs.rs

//! Semantic caching with fuzzy key matching
//!
//! This module provides intelligent caching that matches similar queries,
//! not just exact duplicates. Uses vector similarity to determine if a
//! cached result can be reused for a similar query.
//!
//! ## Features
//!
//! - Fuzzy cache key matching via cosine similarity
//! - Configurable similarity threshold
//! - TTL-based eviction
//! - LRU eviction when full
//! - Automatic cache warming
//!
//! ## Usage
//!
//! ```no_run
//! use vecstore::semantic_cache::SemanticCache;
//!
//! # fn main() -> anyhow::Result<()> {
//! let mut cache = SemanticCache::new(1000, 0.95);
//!
//! // Cache a query result
//! let query = vec![0.1, 0.2, 0.3];
//! let results = vec!["doc1", "doc2"];
//! cache.insert(&query, results.clone());
//!
//! // Similar query (not exact match) can hit cache
//! let similar_query = vec![0.1, 0.2, 0.31]; // Slightly different
//! if let Some(cached) = cache.get(&similar_query) {
//!     println!("Cache hit for similar query!");
//! }
//! # Ok(())
//! # }
//! ```

use std::collections::HashMap;
use std::time::{Duration, Instant};

/// Semantic cache entry
#[derive(Clone)]
struct CacheEntry<V> {
    /// Query vector (cache key)
    query: Vec<f32>,

    /// Cached value
    value: V,

    /// Insertion timestamp
    inserted_at: Instant,

    /// Last access timestamp
    accessed_at: Instant,

    /// Access count
    access_count: usize,
}

/// Semantic cache with fuzzy key matching
pub struct SemanticCache<V: Clone> {
    /// Cache entries (hashed by approximate key)
    entries: HashMap<u64, Vec<CacheEntry<V>>>,

    /// Maximum number of entries
    capacity: usize,

    /// Similarity threshold (0.0 to 1.0)
    /// Higher = more strict matching
    similarity_threshold: f32,

    /// Time-to-live for entries
    ttl: Option<Duration>,

    /// Total cache hits
    hits: usize,

    /// Total cache misses
    misses: usize,
}

impl<V: Clone> SemanticCache<V> {
    /// Create a new semantic cache
    ///
    /// # Arguments
    /// * `capacity` - Maximum number of entries
    /// * `similarity_threshold` - Minimum similarity for cache hit (0.0 to 1.0)
    ///   - 1.0 = exact match only
    ///   - 0.95 = very similar (recommended for most use cases)
    ///   - 0.9 = moderately similar
    ///   - 0.8 = loosely similar
    pub fn new(capacity: usize, similarity_threshold: f32) -> Self {
        Self {
            entries: HashMap::new(),
            capacity,
            similarity_threshold: similarity_threshold.clamp(0.0, 1.0),
            ttl: None,
            hits: 0,
            misses: 0,
        }
    }

    /// Set time-to-live for cache entries
    pub fn with_ttl(mut self, ttl: Duration) -> Self {
        self.ttl = Some(ttl);
        self
    }

    /// Insert a query-result pair into the cache
    pub fn insert(&mut self, query: &[f32], value: V) {
        // Check capacity and evict if needed
        if self.len() >= self.capacity {
            self.evict_lru();
        }

        let bucket_key = Self::hash_vector(query);

        let entry = CacheEntry {
            query: query.to_vec(),
            value,
            inserted_at: Instant::now(),
            accessed_at: Instant::now(),
            access_count: 0,
        };

        self.entries.entry(bucket_key).or_default().push(entry);
    }

    /// Get cached value for a query (fuzzy match)
    pub fn get(&mut self, query: &[f32]) -> Option<V> {
        let bucket_key = Self::hash_vector(query);

        // Look in the same bucket
        if let Some(bucket) = self.entries.get_mut(&bucket_key) {
            let now = Instant::now();

            // Find best matching entry
            let mut best_match: Option<(usize, f32)> = None;

            for (idx, entry) in bucket.iter().enumerate() {
                // Check TTL
                if let Some(ttl) = self.ttl {
                    if now.duration_since(entry.inserted_at) > ttl {
                        continue; // Skip expired entries
                    }
                }

                // Calculate similarity
                let similarity = Self::cosine_similarity(query, &entry.query);

                if similarity >= self.similarity_threshold {
                    match best_match {
                        None => best_match = Some((idx, similarity)),
                        Some((_, prev_sim)) if similarity > prev_sim => {
                            best_match = Some((idx, similarity));
                        }
                        _ => {}
                    }
                }
            }

            // Return best match if found
            if let Some((idx, _)) = best_match {
                let entry = &mut bucket[idx];
                entry.accessed_at = now;
                entry.access_count += 1;
                self.hits += 1;
                return Some(entry.value.clone());
            }
        }

        self.misses += 1;
        None
    }

    /// Check if cache contains a similar query (without retrieving)
    pub fn contains(&self, query: &[f32]) -> bool {
        let bucket_key = Self::hash_vector(query);

        if let Some(bucket) = self.entries.get(&bucket_key) {
            let now = Instant::now();

            for entry in bucket {
                // Check TTL
                if let Some(ttl) = self.ttl {
                    if now.duration_since(entry.inserted_at) > ttl {
                        continue;
                    }
                }

                let similarity = Self::cosine_similarity(query, &entry.query);
                if similarity >= self.similarity_threshold {
                    return true;
                }
            }
        }

        false
    }

    /// Remove expired entries
    pub fn cleanup_expired(&mut self) {
        if let Some(ttl) = self.ttl {
            let now = Instant::now();

            for bucket in self.entries.values_mut() {
                bucket.retain(|entry| now.duration_since(entry.inserted_at) <= ttl);
            }

            // Remove empty buckets
            self.entries.retain(|_, bucket| !bucket.is_empty());
        }
    }

    /// Clear all cache entries
    pub fn clear(&mut self) {
        self.entries.clear();
        self.hits = 0;
        self.misses = 0;
    }

    /// Get current cache size
    pub fn len(&self) -> usize {
        self.entries.values().map(|b| b.len()).sum()
    }

    /// Check if cache is empty
    pub fn is_empty(&self) -> bool {
        self.entries.is_empty()
    }

    /// Get cache hit rate (0.0 to 1.0)
    pub fn hit_rate(&self) -> f64 {
        let total = self.hits + self.misses;
        if total == 0 {
            0.0
        } else {
            self.hits as f64 / total as f64
        }
    }

    /// Get cache statistics
    pub fn stats(&self) -> CacheStats {
        CacheStats {
            size: self.len(),
            capacity: self.capacity,
            hits: self.hits,
            misses: self.misses,
            hit_rate: self.hit_rate(),
        }
    }

    /// Evict least recently used entry
    fn evict_lru(&mut self) {
        if self.entries.is_empty() {
            return;
        }

        // Find LRU entry across all buckets
        let mut oldest_time = Instant::now();
        let mut oldest_bucket: Option<u64> = None;
        let mut oldest_idx: usize = 0;

        for (&bucket_key, bucket) in &self.entries {
            for (idx, entry) in bucket.iter().enumerate() {
                if entry.accessed_at < oldest_time {
                    oldest_time = entry.accessed_at;
                    oldest_bucket = Some(bucket_key);
                    oldest_idx = idx;
                }
            }
        }

        // Remove the LRU entry
        if let Some(bucket_key) = oldest_bucket {
            if let Some(bucket) = self.entries.get_mut(&bucket_key) {
                bucket.remove(oldest_idx);
                if bucket.is_empty() {
                    self.entries.remove(&bucket_key);
                }
            }
        }
    }

    /// Hash vector to bucket key (quantized hashing)
    fn hash_vector(v: &[f32]) -> u64 {
        use std::collections::hash_map::DefaultHasher;
        use std::hash::{Hash, Hasher};

        let mut hasher = DefaultHasher::new();

        // Quantize to reduce sensitivity
        // Round to 1 decimal place for bucketing
        for &val in v.iter().take(16) {
            // Use first 16 dims for hashing
            let quantized = (val * 10.0).round() as i32;
            quantized.hash(&mut hasher);
        }

        hasher.finish()
    }

    /// Calculate cosine similarity between two vectors
    fn cosine_similarity(a: &[f32], b: &[f32]) -> f32 {
        if a.len() != b.len() {
            return 0.0;
        }

        let dot: f32 = a.iter().zip(b.iter()).map(|(x, y)| x * y).sum();
        let norm_a: f32 = a.iter().map(|x| x * x).sum::<f32>().sqrt();
        let norm_b: f32 = b.iter().map(|x| x * x).sum::<f32>().sqrt();

        if norm_a == 0.0 || norm_b == 0.0 {
            return 0.0;
        }

        (dot / (norm_a * norm_b)).clamp(-1.0, 1.0)
    }
}

/// Cache statistics
#[derive(Debug, Clone)]
pub struct CacheStats {
    pub size: usize,
    pub capacity: usize,
    pub hits: usize,
    pub misses: usize,
    pub hit_rate: f64,
}

impl CacheStats {
    /// Print human-readable statistics
    pub fn print(&self) {
        println!("Semantic Cache Statistics:");
        println!("  Size: {}/{}", self.size, self.capacity);
        println!("  Hits: {}", self.hits);
        println!("  Misses: {}", self.misses);
        println!("  Hit Rate: {:.2}%", self.hit_rate * 100.0);
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_exact_match() {
        let mut cache = SemanticCache::new(10, 0.95);

        let query = vec![1.0, 2.0, 3.0];
        cache.insert(&query, "result1");

        // Exact match should hit
        assert!(cache.get(&query).is_some());
        assert_eq!(cache.stats().hits, 1);
    }

    #[test]
    fn test_fuzzy_match() {
        let mut cache = SemanticCache::new(10, 0.95);

        let query = vec![1.0, 2.0, 3.0];
        cache.insert(&query, "result1");

        // Very similar query should hit (cosine sim ~0.9999)
        let similar = vec![1.0, 2.0, 3.01];
        assert!(cache.get(&similar).is_some());
        assert_eq!(cache.stats().hits, 1);
    }

    #[test]
    fn test_different_query_misses() {
        let mut cache = SemanticCache::new(10, 0.95);

        let query1 = vec![1.0, 2.0, 3.0];
        cache.insert(&query1, "result1");

        // Very different query should miss
        let query2 = vec![10.0, 20.0, 30.0];
        assert!(cache.get(&query2).is_none());
        assert_eq!(cache.stats().misses, 1);
    }

    #[test]
    fn test_threshold() {
        let mut cache = SemanticCache::new(10, 0.99); // Very strict

        let query = vec![1.0, 2.0, 3.0];
        cache.insert(&query, "result1");

        // Slightly different might not hit with strict threshold
        let similar = vec![1.0, 2.0, 3.1];
        // This will depend on actual similarity value
        cache.get(&similar);
        // Don't assert - just testing behavior
    }

    #[test]
    fn test_ttl_expiration() {
        let mut cache = SemanticCache::new(10, 0.95).with_ttl(Duration::from_millis(100));

        let query = vec![1.0, 2.0, 3.0];
        cache.insert(&query, "result1");

        // Should hit immediately
        assert!(cache.get(&query).is_some());

        // Wait for expiration
        std::thread::sleep(Duration::from_millis(150));

        // Should miss after TTL
        assert!(cache.get(&query).is_none());
    }

    #[test]
    fn test_capacity_eviction() {
        let mut cache = SemanticCache::new(2, 0.95); // Only 2 entries

        cache.insert(&vec![1.0], "result1");
        cache.insert(&vec![2.0], "result2");
        cache.insert(&vec![3.0], "result3"); // Should evict oldest

        assert_eq!(cache.len(), 2);
    }

    #[test]
    fn test_hit_rate() {
        let mut cache = SemanticCache::new(10, 0.95);

        let query = vec![1.0, 2.0, 3.0];
        cache.insert(&query, "result1");

        // 1 hit, 1 miss
        cache.get(&query);
        cache.get(&vec![10.0, 20.0, 30.0]);

        assert_eq!(cache.stats().hit_rate, 0.5);
    }

    #[test]
    fn test_cleanup_expired() {
        let mut cache = SemanticCache::new(10, 0.95).with_ttl(Duration::from_millis(50));

        cache.insert(&vec![1.0], "result1");
        cache.insert(&vec![2.0], "result2");

        std::thread::sleep(Duration::from_millis(100));

        cache.cleanup_expired();
        assert!(cache.is_empty());
    }

    #[test]
    fn test_cosine_similarity() {
        let a = vec![1.0, 0.0, 0.0];
        let b = vec![1.0, 0.0, 0.0];
        assert!((SemanticCache::<()>::cosine_similarity(&a, &b) - 1.0).abs() < 0.001);

        let c = vec![1.0, 0.0, 0.0];
        let d = vec![0.0, 1.0, 0.0];
        assert!((SemanticCache::<()>::cosine_similarity(&c, &d) - 0.0).abs() < 0.001);
    }
}