use serde::{Deserialize, Serialize};
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct SimilaritySearchResult<T> {
pub item: T,
pub similarity: f32,
pub metadata: SimilarityMetadata,
}
#[derive(Debug, Clone, Serialize, Deserialize, Default)]
pub struct SimilarityMetadata {
#[serde(default)]
pub embedding_model: String,
pub embedding_timestamp: Option<chrono::DateTime<chrono::Utc>>,
#[serde(default)]
pub context: serde_json::Value,
}
#[must_use]
pub fn cosine_similarity(a: &[f32], b: &[f32]) -> f32 {
if a.len() != b.len() {
return 0.0;
}
if a.is_empty() {
return 0.0;
}
let dot_product: f32 = a.iter().zip(b.iter()).map(|(x, y)| x * y).sum();
let magnitude_a: f32 = a.iter().map(|x| x * x).sum::<f32>().sqrt();
let magnitude_b: f32 = b.iter().map(|x| x * x).sum::<f32>().sqrt();
if magnitude_a == 0.0 || magnitude_b == 0.0 {
return 0.0;
}
let similarity = dot_product / (magnitude_a * magnitude_b);
(similarity + 1.0) / 2.0
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn test_cosine_similarity() {
let vec1 = vec![1.0, 2.0, 3.0];
let vec2 = vec![1.0, 2.0, 3.0];
let similarity = cosine_similarity(&vec1, &vec2);
assert!((similarity - 1.0).abs() < 0.001);
let vec3 = vec![1.0, 0.0];
let vec4 = vec![0.0, 1.0];
let similarity = cosine_similarity(&vec3, &vec4);
assert!((similarity - 0.5).abs() < 0.001);
let vec5 = vec![1.0, 2.0, 3.0];
let vec6 = vec![-1.0, -2.0, -3.0];
let similarity = cosine_similarity(&vec5, &vec6);
assert!((similarity - 0.0).abs() < 0.001);
let vec7 = vec![1.0, 2.0];
let vec8 = vec![1.0, 2.0, 3.0];
let similarity = cosine_similarity(&vec7, &vec8);
assert_eq!(similarity, 0.0);
}
}