Enum Embedder

Source

/// Semantic embedding engine supporting multiple backends.
///
/// - `Local` (candle): all-MiniLM-L6-v2, 384-dim. Used at the semantic tier.
/// - `Ollama`: nomic-embed-text-v1.5, 768-dim. Used at smart/autonomous tiers.
pub enum Embedder {
    /// Candle-based local embedding (MiniLM-L6-v2, 384-dim).
    ///
    /// The model is shared as a plain `Arc<BertModel>` with no mutex (#1084):
    /// the forward pass takes `&self` and only reads the weights, so parallel
    /// embed calls run concurrently against the same model instead of
    /// serialising on a global lock.
    Local {
        /// Shared, read-only BERT model used for inference.
        model: Arc<BertModel>,
        // NOTE(review): presumably the tokenizer matching the MiniLM model — confirm.
        tokenizer: Arc<Tokenizer>,
        // NOTE(review): presumably the candle device the model runs on — confirm.
        device: Device,
    },
    /// Remote embed client — Ollama-native or OpenAI-compatible wire shape
    /// (#1598). The historical variant name is kept to avoid call-site churn.
    Ollama {
        /// Client that routes to `/api/embed` (Ollama) or `/embeddings` with a
        /// Bearer token (OpenAI-compatible), depending on its provider.
        client: Arc<OllamaClient>,
        // NOTE(review): presumably the remote model identifier sent with each
        // embed request — confirm against the constructors.
        model_name: String,
        /// Vector dimensionality of the model (768 for the historical nomic
        /// default).
        dim: usize,
        /// Latches the outcome of the most recent embed call so the
        /// capabilities surface can report a dead remote endpoint (#1594).
        degraded: Arc<AtomicBool>,
    },
}

Expand description

Semantic embedding engine supporting multiple backends.

Local (candle): all-MiniLM-L6-v2, 384-dim. Used at the semantic tier.
Ollama: nomic-embed-text-v1.5, 768-dim. Used at smart/autonomous tiers.

Variants§

§

Local

Candle-based local embedding (MiniLM-L6-v2, 384-dim).

v0.7.0 #1084 — model is Arc<BertModel> (no mutex). The pre-#1084 design held an Arc<Mutex<BertModel>> and locked the model across the full forward pass; on a multi-tenant HTTP daemon that serialised every embed call on a single global mutex. Candle’s BertModel::forward(&self, ...) is inference-only (weights are read-only mmap’d safetensors) so the mutex was unnecessary; parallel embed calls now run concurrently against the same weights.

Fields

§model: Arc<BertModel>

§tokenizer: Arc<Tokenizer>

§device: Device

§

Ollama

Remote embed client — Ollama-native OR OpenAI-compatible wire shape (#1598). The historical variant name is preserved to avoid call-site churn; the carried crate::llm::OllamaClient routes /api/embed (Ollama) or /embeddings + Bearer (OpenAI-compatible) per its provider. dim is the model’s vector dimensionality (768 for the historical nomic default); degraded latches the outcome of the most recent embed call so the capabilities surface can report a dead remote endpoint truthfully (#1594).

Fields

§client: Arc<OllamaClient>

§model_name: String

§dim: usize

§degraded: Arc<AtomicBool>

Enum Embedder Copy item path

Variants§

Local

Fields

Ollama

Fields

Implementations§

impl Embedder

pub fn new() -> Result<Self>

pub fn new_local() -> Result<Self>

pub fn new_ollama(client: Arc<OllamaClient>) -> Self

pub fn new_remote(client: Arc<OllamaClient>, model_name: String, dim: usize) -> Self

pub fn from_resolved(resolved: &ResolvedEmbeddings, tier_model: Option<EmbeddingModel>) -> Result<Option<Self>>

§Errors

pub fn for_model(model: EmbeddingModel, ollama_client: Option<Arc<OllamaClient>>) -> Result<Self>

pub fn dim(&self) -> usize

pub fn model_description(&self) -> String

pub fn is_degraded(&self) -> bool

pub fn embed(&self, text: &str) -> Result<Vec<f32>>

pub fn embed_query(&self, text: &str) -> Result<Vec<f32>>

pub fn embed_with_role(&self, text: &str, role: EmbedRole) -> Result<Vec<f32>>

pub fn embed_with_status(&self, text: &str) -> (Option<Vec<f32>>, EmbedStatus)

pub fn embed_batch(&self, texts: &[&str]) -> Result<Vec<Vec<f32>>>

pub fn cosine_similarity(a: &[f32], b: &[f32]) -> f32

pub fn cosine_similarity_checked(query: &[f32], stored: &[f32]) -> CosineComparison

pub fn fuse(primary: &[f32], secondary: &[f32], primary_weight: f32) -> Vec<f32>

Trait Implementations§

impl Clone for Embedder

fn clone(&self) -> Embedder

fn clone_from(&mut self, source: &Self)

impl Embed for Embedder

fn embed(&self, text: &str) -> Result<Vec<f32>>

fn embed_query(&self, text: &str) -> Result<Vec<f32>>

fn embed_batch(&self, texts: &[&str]) -> Result<Vec<Vec<f32>>>

fn is_degraded(&self) -> bool

Auto Trait Implementations§

impl !RefUnwindSafe for Embedder

impl !UnwindSafe for Embedder

impl Freeze for Embedder

impl Send for Embedder

impl Sync for Embedder

impl Unpin for Embedder

impl UnsafeUnpin for Embedder

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DynClone for T where T: Clone,

fn __clone_box(&self, _: Private) -> *mut ()

impl<T> ErasedDestructor for T where T: 'static,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> FromRef<T> for T where T: Clone,

fn from_ref(input: &T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<T> ToOwned for T where T: Clone,

Enum Embedder

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DynClone for T
where T: Clone,

impl<T> ErasedDestructor for T
where T: 'static,

impl<T> FromRef<T> for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,