norm 0.1.1

A collection of distance metrics on strings
Documentation
//! This crate provides a collection of different distance metrics on strings.
//!
//! This problem is sometimes referred to as "string similarity search", or
//! more colloquially "fuzzy matching". Given a query string and a number of
//! possible candidate strings, the goal is to:
//!
//! a) filter out the candidates that are too dissimilar from the query;
//!
//! b) rank the remaining candidates by their similarity to the query.
//!
//! Here both of these tasks are accomplished by implementing the [`Metric`]
//! trait. This trait is at the basis of norm's design, and it is implemented
//! by all of our metrics. Reading its documentation is a good place to start.
//!
//! # Performance
//!
//! Performance is a top priority for this crate. Our goal is to have the
//! fastest implementation of every metric algorithm we provide, across all
//! languages. [Here][bench] you can find a number of benchmarks comparing
//! norm's metrics to each other, as well as to other popular libraries.
//!
//! # Examples
//!
//! ```rust
//! # use core::ops::Range;
//! use norm::fzf::{FzfParser, FzfV2};
//! use norm::Metric;
//!
//! let mut fzf = FzfV2::new();
//!
//! let mut parser = FzfParser::new();
//!
//! let query = parser.parse("aa");
//!
//! let cities = ["Geneva", "Ulaanbaatar", "New York City", "Adelaide"];
//!
//! let mut results = cities
//!     .iter()
//!     .copied()
//!     .filter_map(|city| fzf.distance(query, city).map(|dist| (city, dist)))
//!     .collect::<Vec<_>>();
//!
//! // We sort the results by distance in ascending order, so that the best
//! // match will be at the front of the vector.
//! results.sort_by_key(|(_city, dist)| *dist);
//!
//! assert_eq!(results.len(), 2);
//! assert_eq!(results[0].0, "Adelaide");
//! assert_eq!(results[1].0, "Ulaanbaatar");
//!
//! // We can also find out which sub-strings of each candidate matched the
//! // query.
//!
//! let mut ranges: Vec<Range<usize>> = Vec::new();
//!
//! let _ = fzf.distance_and_ranges(query, results[0].0, &mut ranges);
//! assert_eq!(ranges.len(), 2);
//! assert_eq!(ranges[0], 0..1); // "A" in "Adelaide"
//! assert_eq!(ranges[1], 4..5); // "a" in "Adelaide"
//!
//! ranges.clear();
//!
//! let _ = fzf.distance_and_ranges(query, results[1].0, &mut ranges);
//! assert_eq!(ranges.len(), 1);
//! assert_eq!(ranges[0], 2..4); // The first "aa" in "Ulaanbaatar"
//! ```
//!
//! # Features flags
//!
//! - `fzf-v1`: enables the [`FzfV1`](metrics::fzf::FzfV1) metric;
//! - `fzf-v2`: enables the [`FzfV2`](metrics::fzf::FzfV2) metric;
//!
//! [bench]: https://github.com/noib3/fuzzy-benches

#![cfg_attr(docsrs, feature(doc_cfg))]
#![allow(clippy::module_inception)]
#![allow(clippy::needless_range_loop)]
#![allow(clippy::too_many_arguments)]
#![deny(missing_docs)]
#![deny(rustdoc::broken_intra_doc_links)]
#![deny(rustdoc::private_intra_doc_links)]

extern crate alloc;

#[cfg(feature = "__any-metric")]
mod candidate;
mod case_sensitivity;
#[cfg(feature = "__any-metric")]
mod matched_ranges;
mod metric;
#[cfg(feature = "__any-metric")]
mod metrics;
#[cfg(feature = "__any-metric")]
mod normalize;
#[cfg(feature = "__any-metric")]
mod utils;

#[cfg(feature = "__any-metric")]
use candidate::{Candidate, CandidateMatches};
pub use case_sensitivity::CaseSensitivity;
#[cfg(feature = "__any-metric")]
use matched_ranges::MatchedRanges;
pub use metric::Metric;
#[cfg(feature = "__any-metric")]
pub use metrics::*;