EmbeddingManager

Struct EmbeddingManager 

Source
pub struct EmbeddingManager { /* private fields */ }

Implementations§

Source§

impl EmbeddingManager

Source

pub fn new(max_speakers: usize) -> Self

Examples found in repository?
examples/infinite.rs (line 44)
35fn main() -> Result<(), eyre::Report> {
36    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
37    let search_threshold = 0.5;
38
39    let embedding_model_path = "wespeaker_en_voxceleb_CAM++.onnx";
40    let segmentation_model_path = "segmentation-3.0.onnx";
41
42    let (samples, sample_rate) = pyannote_rs::read_wav(&audio_path)?;
43    let mut embedding_extractor = EmbeddingExtractor::new(embedding_model_path)?;
44    let mut embedding_manager = EmbeddingManager::new(usize::MAX);
45
46    let segments = pyannote_rs::get_segments(&samples, sample_rate, segmentation_model_path)?;
47
48    for segment in segments {
49        if let Ok(segment) = segment {
50            if let Err(error) = process_segment(
51                segment,
52                &mut embedding_extractor,
53                &mut embedding_manager,
54                search_threshold,
55            ) {
56                eprintln!("Error processing segment: {:?}", error);
57            }
58        } else if let Err(error) = segment {
59            eprintln!("Failed to process segment: {:?}", error);
60        }
61    }
62
63    Ok(())
64}
More examples
Hide additional examples
examples/max_speakers.rs (line 9)
3fn main() {
4    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
5    let (samples, sample_rate) = pyannote_rs::read_wav(&audio_path).unwrap();
6    let max_speakers = 6;
7
8    let mut extractor = EmbeddingExtractor::new("wespeaker_en_voxceleb_CAM++.onnx").unwrap();
9    let mut manager = EmbeddingManager::new(6);
10
11    let segments =
12        pyannote_rs::get_segments(&samples, sample_rate, "segmentation-3.0.onnx").unwrap();
13
14    for segment in segments {
15        match segment {
16            Ok(segment) => {
17                if let Ok(embedding) = extractor.compute(&segment.samples) {
18                    let speaker = if manager.get_all_speakers().len() == max_speakers {
19                        manager
20                            .get_best_speaker_match(embedding.collect())
21                            .map(|s| s.to_string())
22                            .unwrap_or("?".into())
23                    } else {
24                        manager
25                            .search_speaker(embedding.collect(), 0.5)
26                            .map(|s| s.to_string())
27                            .unwrap_or("?".into())
28                    };
29                    println!(
30                        "start = {:.2}, end = {:.2}, speaker = {}",
31                        segment.start, segment.end, speaker
32                    );
33                } else {
34                    println!(
35                        "start = {:.2}, end = {:.2}, speaker = ?",
36                        segment.start, segment.end
37                    );
38                }
39            }
40            Err(error) => eprintln!("Failed to process segment: {:?}", error),
41        }
42    }
43}
Source

pub fn search_speaker( &mut self, embedding: Vec<f32>, threshold: f32, ) -> Option<usize>

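Searches for an existing speaker matching the given embedding, or creates a new speaker. Returns the speaker's ID, or None if no speaker is returned.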

Examples found in repository?
examples/infinite.rs (line 22)
10fn process_segment(
11    segment: pyannote_rs::Segment,
12    embedding_extractor: &mut EmbeddingExtractor,
13    embedding_manager: &mut EmbeddingManager,
14    search_threshold: f32,
15) -> Result<(), eyre::Report> {
16    let embedding_result: Vec<f32> = embedding_extractor
17        .compute(&segment.samples)
18        .unwrap()
19        .collect();
20
21    let speaker = embedding_manager
22        .search_speaker(embedding_result.clone(), search_threshold)
23        .ok_or_else(|| embedding_manager.search_speaker(embedding_result, 0.0)) // Ensure always to return speaker
24        .map(|r| r.to_string())
25        .unwrap_or("?".into());
26
27    println!(
28        "start = {:.2}, end = {:.2}, speaker = {}",
29        segment.start, segment.end, speaker
30    );
31
32    Ok(())
33}
More examples
Hide additional examples
examples/max_speakers.rs (line 25)
3fn main() {
4    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
5    let (samples, sample_rate) = pyannote_rs::read_wav(&audio_path).unwrap();
6    let max_speakers = 6;
7
8    let mut extractor = EmbeddingExtractor::new("wespeaker_en_voxceleb_CAM++.onnx").unwrap();
9    let mut manager = EmbeddingManager::new(6);
10
11    let segments =
12        pyannote_rs::get_segments(&samples, sample_rate, "segmentation-3.0.onnx").unwrap();
13
14    for segment in segments {
15        match segment {
16            Ok(segment) => {
17                if let Ok(embedding) = extractor.compute(&segment.samples) {
18                    let speaker = if manager.get_all_speakers().len() == max_speakers {
19                        manager
20                            .get_best_speaker_match(embedding.collect())
21                            .map(|s| s.to_string())
22                            .unwrap_or("?".into())
23                    } else {
24                        manager
25                            .search_speaker(embedding.collect(), 0.5)
26                            .map(|s| s.to_string())
27                            .unwrap_or("?".into())
28                    };
29                    println!(
30                        "start = {:.2}, end = {:.2}, speaker = {}",
31                        segment.start, segment.end, speaker
32                    );
33                } else {
34                    println!(
35                        "start = {:.2}, end = {:.2}, speaker = ?",
36                        segment.start, segment.end
37                    );
38                }
39            }
40            Err(error) => eprintln!("Failed to process segment: {:?}", error),
41        }
42    }
43}
Source

pub fn get_best_speaker_match(&mut self, embedding: Vec<f32>) -> Result<usize>

Examples found in repository?
examples/max_speakers.rs (line 20)
3fn main() {
4    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
5    let (samples, sample_rate) = pyannote_rs::read_wav(&audio_path).unwrap();
6    let max_speakers = 6;
7
8    let mut extractor = EmbeddingExtractor::new("wespeaker_en_voxceleb_CAM++.onnx").unwrap();
9    let mut manager = EmbeddingManager::new(6);
10
11    let segments =
12        pyannote_rs::get_segments(&samples, sample_rate, "segmentation-3.0.onnx").unwrap();
13
14    for segment in segments {
15        match segment {
16            Ok(segment) => {
17                if let Ok(embedding) = extractor.compute(&segment.samples) {
18                    let speaker = if manager.get_all_speakers().len() == max_speakers {
19                        manager
20                            .get_best_speaker_match(embedding.collect())
21                            .map(|s| s.to_string())
22                            .unwrap_or("?".into())
23                    } else {
24                        manager
25                            .search_speaker(embedding.collect(), 0.5)
26                            .map(|s| s.to_string())
27                            .unwrap_or("?".into())
28                    };
29                    println!(
30                        "start = {:.2}, end = {:.2}, speaker = {}",
31                        segment.start, segment.end, speaker
32                    );
33                } else {
34                    println!(
35                        "start = {:.2}, end = {:.2}, speaker = ?",
36                        segment.start, segment.end
37                    );
38                }
39            }
40            Err(error) => eprintln!("Failed to process segment: {:?}", error),
41        }
42    }
43}
Source

pub fn get_all_speakers(&self) -> &HashMap<usize, Array1<f32>>

Examples found in repository?
examples/max_speakers.rs (line 18)
3fn main() {
4    let audio_path = std::env::args().nth(1).expect("Please specify audio file");
5    let (samples, sample_rate) = pyannote_rs::read_wav(&audio_path).unwrap();
6    let max_speakers = 6;
7
8    let mut extractor = EmbeddingExtractor::new("wespeaker_en_voxceleb_CAM++.onnx").unwrap();
9    let mut manager = EmbeddingManager::new(6);
10
11    let segments =
12        pyannote_rs::get_segments(&samples, sample_rate, "segmentation-3.0.onnx").unwrap();
13
14    for segment in segments {
15        match segment {
16            Ok(segment) => {
17                if let Ok(embedding) = extractor.compute(&segment.samples) {
18                    let speaker = if manager.get_all_speakers().len() == max_speakers {
19                        manager
20                            .get_best_speaker_match(embedding.collect())
21                            .map(|s| s.to_string())
22                            .unwrap_or("?".into())
23                    } else {
24                        manager
25                            .search_speaker(embedding.collect(), 0.5)
26                            .map(|s| s.to_string())
27                            .unwrap_or("?".into())
28                    };
29                    println!(
30                        "start = {:.2}, end = {:.2}, speaker = {}",
31                        segment.start, segment.end, speaker
32                    );
33                } else {
34                    println!(
35                        "start = {:.2}, end = {:.2}, speaker = ?",
36                        segment.start, segment.end
37                    );
38                }
39            }
40            Err(error) => eprintln!("Failed to process segment: {:?}", error),
41        }
42    }
43}

Trait Implementations§

Source§

impl Clone for EmbeddingManager

Source§

fn clone(&self) -> EmbeddingManager

Returns a duplicate of the value. Read more
1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
Source§

impl Debug for EmbeddingManager

Source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> CloneToUninit for T
where T: Clone,

Source§

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬 This is a nightly-only experimental API (clone_to_uninit).
Performs copy-assignment from self to dest. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T> Instrument for T

Source§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
Source§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> ToOwned for T
where T: Clone,

Source§

type Owned = T

The resulting type after obtaining ownership.
Source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
Source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<T> WithSubscriber for T

Source§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more