#![warn(missing_docs)]
use std::cmp::max;
/// Returns owned copies of the two inputs ordered as `(shorter, longer)`.
///
/// The comparison uses the UTF-8 byte length of each input. When both inputs
/// have the same byte length, `right` is returned first.
#[inline]
fn get_shorter_longer_strings(left: impl AsRef<str>, right: impl AsRef<str>) -> (String, String) {
    let (left, right) = (left.as_ref(), right.as_ref());
    if left.len() < right.len() {
        (left.to_string(), right.to_string())
    } else {
        (right.to_string(), left.to_string())
    }
}

/// Computes the length of the longest common subsequence of two strings.
///
/// The strings are compared `char` by `char` (Unicode scalar values), so the
/// result is a number of `char`s, not a number of bytes. The argument order
/// does not affect the result.
///
/// Only two rows of the dynamic-programming table are kept, each as wide as
/// the input chosen as "shorter" by byte length, plus one leading zero column.
pub fn lcs_length(left: impl AsRef<str>, right: impl AsRef<str>) -> usize {
    let (shorter, longer) = get_shorter_longer_strings(left, right);

    // The row width must be the number of `char`s, not the byte length:
    // otherwise the final cell read below is never written for non-ASCII text.
    let columns: Vec<char> = shorter.chars().collect();
    let width = columns.len() + 1;

    let mut previous = vec![0usize; width];
    let mut current = vec![0usize; width];

    for row_char in longer.chars() {
        for (col, &col_char) in columns.iter().enumerate() {
            current[col + 1] = if row_char == col_char {
                previous[col] + 1
            } else {
                max(previous[col + 1], current[col])
            };
        }
        // The finished row becomes `previous`. The stale buffer is reused as
        // `current`: cells 1.. are overwritten before being read and cell 0
        // is never written, so it stays 0.
        std::mem::swap(&mut previous, &mut current);
    }

    previous[width - 1]
}

/// Rates how similar two strings are, as a ratio in `0.0..=1.0`.
///
/// The ratio is the longest-common-subsequence length (see [`lcs_length`])
/// divided by the `char` count of the longer input. Both quantities are
/// measured in `char`s, so identical strings always score `1.0`, including
/// non-ASCII ones. Two empty strings are considered identical and score `1.0`.
pub fn compare_similarity(left: impl AsRef<str>, right: impl AsRef<str>) -> f64 {
    let (left, right) = (left.as_ref(), right.as_ref());
    let size = max(left.chars().count(), right.chars().count());
    if size == 0 {
        return 1.0;
    }
    lcs_length(left, right) as f64 / size as f64
}
pub fn find_best_similarity(taregt: impl AsRef<str>, options: &[impl AsRef<str>]) -> Option<(String, f64)> {
match options.len() {
0 => None,
_ => {
let mut high_score: f64 = -1.0;
let mut position: usize = 0;
for (index, option) in options.iter().enumerate() {
let score = compare_similarity(option.as_ref(), taregt.as_ref());
if score > high_score {
high_score = score;
position = index;
}
}
Some((options[position].as_ref().to_string(), high_score))
}
}
}
/// Scores every entry of `options` against the target string.
///
/// The returned vector holds one [`compare_similarity`] score per option, in
/// the same order as `options`. Returns `None` when `options` is empty.
pub fn get_similarity_ratings(taregt: impl AsRef<str>, options: &[impl AsRef<str>]) -> Option<Vec<f64>> {
    if options.is_empty() {
        return None;
    }

    let wanted = taregt.as_ref();
    let ratings = options
        .iter()
        .map(|candidate| compare_similarity(candidate.as_ref(), wanted))
        .collect();
    Some(ratings)
}
#[cfg(test)]
mod tests {
    use crate::*;
    use std::collections::BTreeSet;

    /// "longest" and "stone" share the three-letter subsequence "one".
    #[test]
    fn lcs_works() {
        assert_eq!(lcs_length("longest", "stone"), 3);
    }

    /// A string compared with itself scores a perfect 1.0.
    #[test]
    fn identity_check() {
        assert_eq!(compare_similarity("hello", "hello"), 1.0);
    }

    /// Swapping the arguments must not change the score.
    #[test]
    fn ratio_is_symetrical() {
        let (a, b) = ("longest", "stone");
        let forward = compare_similarity(a, b);
        let backward = compare_similarity(b, a);
        assert_eq!(forward, backward);
    }

    /// Two empty strings are treated as identical.
    #[test]
    fn empty_strings() {
        assert_eq!(compare_similarity("", ""), 1.0);
    }

    /// The best match is found in a plain list of string slices.
    #[test]
    fn find_best() {
        let candidates = vec!["blight", "night", "stride"];
        let (matched, score) = find_best_similarity("fight", &candidates).unwrap();
        assert_eq!(matched, "night");
        assert_eq!(score, 0.8);
    }

    /// The API also accepts an owned target and references collected from a set.
    #[test]
    fn find_best_with_set() {
        let candidates: BTreeSet<&str> = ["blight", "night", "stride"].iter().copied().collect();
        let borrowed: Vec<_> = candidates.iter().collect();
        let (matched, score) = find_best_similarity(String::from("fight"), &borrowed).unwrap();
        assert_eq!(matched, "night");
        assert_eq!(score, 0.8);
    }

    /// Ratings come back one per option, in input order.
    #[test]
    fn similarity_ratings() {
        let candidates = vec!["fill", "night", "ride"];
        let ratings = get_similarity_ratings("fight", &candidates).unwrap();
        assert_eq!(vec![0.4, 0.8, 0.2], ratings);
    }
}