kbolt-core 0.1.6

Core engine for kbolt local-first retrieval
Documentation
use crate::Result;

#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub(crate) enum EmbeddingInputKind {
    Query,
    Document,
}

pub(crate) const DEFAULT_DOCUMENT_BATCH_WINDOW: usize = 64;

pub(crate) trait Embedder: Send + Sync {
    fn embed_batch(&self, kind: EmbeddingInputKind, texts: &[String]) -> Result<Vec<Vec<f32>>>;

    fn preferred_document_batch_window(&self) -> usize {
        DEFAULT_DOCUMENT_BATCH_WINDOW
    }
}

pub(crate) trait EmbeddingDocumentSizer: Send + Sync {
    fn count_document_tokens(&self, text: &str) -> Result<usize>;

    fn fits_within_token_limit_by_byte_len(&self, _byte_len: usize, _max_tokens: usize) -> bool {
        false
    }
}