EmbeddingManager

Struct EmbeddingManager 

Source
pub struct EmbeddingManager { /* private fields */ }

Implementations§

Source§

impl EmbeddingManager

Source

pub fn new(max_speakers: usize) -> Self

Examples found in repository?
examples/max_speakers.rs (line 10)
4fn main() -> Result<()> {
5    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
6    let (samples, sample_rate) = read_wav(&audio_path)?;
7    let max_speakers = 6;
8
9    let extractor = EmbeddingExtractor::new("src/nn/speaker_identification/model.bpk")?;
10    let mut manager = EmbeddingManager::new(max_speakers);
11    let segmenter = Segmenter::new("src/nn/segmentation/model.bpk")?;
12
13    for segment in segmenter.iter_segments(&samples, sample_rate)? {
14        let segment = segment?;
15        let embedding = extractor.extract(&segment.samples, sample_rate)?;
16
17        let speaker = if manager.is_full() {
18            manager.best_match(&embedding)
19        } else {
20            manager.upsert(&embedding, 0.5)
21        }
22        .map(|s| s.to_string())
23        .unwrap_or_else(|| "?".into());
24
25        println!(
26            "start = {:.2}, end = {:.2}, speaker = {}",
27            segment.start, segment.end, speaker
28        );
29    }
30
31    Ok(())
32}
More examples
Hide additional examples
examples/infinite.rs (line 40)
31fn main() -> Result<()> {
32    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
33    let search_threshold = 0.5;
34
35    let embedding_model_path = "src/nn/speaker_identification/model.bpk";
36    let segmentation_model_path = "src/nn/segmentation/model.bpk";
37
38    let (samples, sample_rate) = pyannote_rs::read_wav(&audio_path)?;
39    let embedding_extractor = EmbeddingExtractor::new(embedding_model_path)?;
40    let mut embedding_manager = EmbeddingManager::new(usize::MAX);
41    let segmenter = Segmenter::new(segmentation_model_path)?;
42
43    for segment in segmenter.iter_segments(&samples, sample_rate)? {
44        match segment {
45            Ok(segment) => {
46                if let Err(error) = process_segment(
47                    segment,
48                    &embedding_extractor,
49                    &mut embedding_manager,
50                    search_threshold,
51                    sample_rate,
52                ) {
53                    eprintln!("Error processing segment: {:?}", error);
54                }
55            }
56            Err(error) => eprintln!("Failed to process segment: {:?}", error),
57        }
58    }
59
60    Ok(())
61}
Source

pub fn upsert(&mut self, embedding: &Embedding, threshold: f32) -> Option<usize>

Try to match a speaker; if none is found above threshold, register a new speaker as long as capacity allows.

Examples found in repository?
examples/infinite.rs (line 18)
8fn process_segment(
9    segment: pyannote_rs::Segment,
10    embedding_extractor: &EmbeddingExtractor,
11    embedding_manager: &mut EmbeddingManager,
12    search_threshold: f32,
13    sample_rate: u32,
14) -> Result<()> {
15    let embedding = embedding_extractor.extract(&segment.samples, sample_rate)?;
16
17    let speaker = embedding_manager
18        .upsert(&embedding, search_threshold)
19        .or_else(|| embedding_manager.best_match(&embedding))
20        .map(|r| r.to_string())
21        .unwrap_or("?".into());
22
23    println!(
24        "start = {:.2}, end = {:.2}, speaker = {}",
25        segment.start, segment.end, speaker
26    );
27
28    Ok(())
29}
More examples
Hide additional examples
examples/max_speakers.rs (line 20)
4fn main() -> Result<()> {
5    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
6    let (samples, sample_rate) = read_wav(&audio_path)?;
7    let max_speakers = 6;
8
9    let extractor = EmbeddingExtractor::new("src/nn/speaker_identification/model.bpk")?;
10    let mut manager = EmbeddingManager::new(max_speakers);
11    let segmenter = Segmenter::new("src/nn/segmentation/model.bpk")?;
12
13    for segment in segmenter.iter_segments(&samples, sample_rate)? {
14        let segment = segment?;
15        let embedding = extractor.extract(&segment.samples, sample_rate)?;
16
17        let speaker = if manager.is_full() {
18            manager.best_match(&embedding)
19        } else {
20            manager.upsert(&embedding, 0.5)
21        }
22        .map(|s| s.to_string())
23        .unwrap_or_else(|| "?".into());
24
25        println!(
26            "start = {:.2}, end = {:.2}, speaker = {}",
27            segment.start, segment.end, speaker
28        );
29    }
30
31    Ok(())
32}
Source

pub fn best_match(&self, embedding: &Embedding) -> Option<usize>

Examples found in repository?
examples/infinite.rs (line 19)
8fn process_segment(
9    segment: pyannote_rs::Segment,
10    embedding_extractor: &EmbeddingExtractor,
11    embedding_manager: &mut EmbeddingManager,
12    search_threshold: f32,
13    sample_rate: u32,
14) -> Result<()> {
15    let embedding = embedding_extractor.extract(&segment.samples, sample_rate)?;
16
17    let speaker = embedding_manager
18        .upsert(&embedding, search_threshold)
19        .or_else(|| embedding_manager.best_match(&embedding))
20        .map(|r| r.to_string())
21        .unwrap_or("?".into());
22
23    println!(
24        "start = {:.2}, end = {:.2}, speaker = {}",
25        segment.start, segment.end, speaker
26    );
27
28    Ok(())
29}
More examples
Hide additional examples
examples/max_speakers.rs (line 18)
4fn main() -> Result<()> {
5    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
6    let (samples, sample_rate) = read_wav(&audio_path)?;
7    let max_speakers = 6;
8
9    let extractor = EmbeddingExtractor::new("src/nn/speaker_identification/model.bpk")?;
10    let mut manager = EmbeddingManager::new(max_speakers);
11    let segmenter = Segmenter::new("src/nn/segmentation/model.bpk")?;
12
13    for segment in segmenter.iter_segments(&samples, sample_rate)? {
14        let segment = segment?;
15        let embedding = extractor.extract(&segment.samples, sample_rate)?;
16
17        let speaker = if manager.is_full() {
18            manager.best_match(&embedding)
19        } else {
20            manager.upsert(&embedding, 0.5)
21        }
22        .map(|s| s.to_string())
23        .unwrap_or_else(|| "?".into());
24
25        println!(
26            "start = {:.2}, end = {:.2}, speaker = {}",
27            segment.start, segment.end, speaker
28        );
29    }
30
31    Ok(())
32}
Source

pub fn speaker_count(&self) -> usize

Source

pub fn is_full(&self) -> bool

Examples found in repository?
examples/max_speakers.rs (line 17)
4fn main() -> Result<()> {
5    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
6    let (samples, sample_rate) = read_wav(&audio_path)?;
7    let max_speakers = 6;
8
9    let extractor = EmbeddingExtractor::new("src/nn/speaker_identification/model.bpk")?;
10    let mut manager = EmbeddingManager::new(max_speakers);
11    let segmenter = Segmenter::new("src/nn/segmentation/model.bpk")?;
12
13    for segment in segmenter.iter_segments(&samples, sample_rate)? {
14        let segment = segment?;
15        let embedding = extractor.extract(&segment.samples, sample_rate)?;
16
17        let speaker = if manager.is_full() {
18            manager.best_match(&embedding)
19        } else {
20            manager.upsert(&embedding, 0.5)
21        }
22        .map(|s| s.to_string())
23        .unwrap_or_else(|| "?".into());
24
25        println!(
26            "start = {:.2}, end = {:.2}, speaker = {}",
27            segment.start, segment.end, speaker
28        );
29    }
30
31    Ok(())
32}
Source

pub fn speakers(&self) -> &HashMap<usize, Embedding>

Trait Implementations§

Source§

impl Clone for EmbeddingManager

Source§

fn clone(&self) -> EmbeddingManager

Returns a duplicate of the value. Read more
1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
Source§

impl Debug for EmbeddingManager

Source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> CloneToUninit for T
where T: Clone,

Source§

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)
Performs copy-assignment from self to dest. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> Pointable for T

Source§

const ALIGN: usize

The alignment of pointer.
Source§

type Init = T

The type for initializers.
Source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a with the given initializer. Read more
Source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
Source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
Source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
Source§

impl<T> Same for T

Source§

type Output = T

Should always be Self
Source§

impl<T> ToOwned for T
where T: Clone,

Source§

type Owned = T

The resulting type after obtaining ownership.
Source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
Source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V