pub struct LLMWorker { /* private fields */ }

Implementations§
Source§impl LLMWorker
impl LLMWorker
Sourcepub fn new(shared_state: Arc<SharedState>) -> Self
pub fn new(shared_state: Arc<SharedState>) -> Self
Create with shared state (legacy constructor)
Sourcepub fn new_with_backend(backend_url: String) -> Self
pub fn new_with_backend(backend_url: String) -> Self
Create with explicit backend URL
Sourcepub fn set_runtime_manager(&self, runtime_manager: Arc<RuntimeManager>)
pub fn set_runtime_manager(&self, runtime_manager: Arc<RuntimeManager>)
Set the runtime manager
Sourcepub async fn is_runtime_ready(&self) -> bool
pub async fn is_runtime_ready(&self) -> bool
Check if runtime is ready for inference
Sourcepub async fn generate_response(
&self,
_session_id: String,
context: Vec<Message>,
) -> Result<String>
pub async fn generate_response( &self, _session_id: String, context: Vec<Message>, ) -> Result<String>
Generate a complete (non-streaming) response from the LLM.
Sourcepub async fn stream_response(
&self,
messages: Vec<Message>,
max_tokens: u32,
temperature: f32,
) -> Result<impl Stream<Item = Result<String, Error>>>
pub async fn stream_response( &self, messages: Vec<Message>, max_tokens: u32, temperature: f32, ) -> Result<impl Stream<Item = Result<String, Error>>>
Stream response tokens from the LLM as Server-Sent Events. Returns a stream of SSE-formatted strings ready to send to the client.
Sourcepub async fn batch_process(
&self,
prompts: Vec<(String, Vec<Message>)>,
) -> Result<Vec<String>>
pub async fn batch_process( &self, prompts: Vec<(String, Vec<Message>)>, ) -> Result<Vec<String>>
Batch process multiple prompts (non-streaming)
Sourcepub async fn initialize_model(&self, model_path: &str) -> Result<()>
pub async fn initialize_model(&self, model_path: &str) -> Result<()>
Initialize LLM model (no-op for HTTP proxy mode)
Sourcepub async fn generate_embeddings(
&self,
texts: Vec<String>,
) -> Result<Vec<Vec<f32>>>
pub async fn generate_embeddings( &self, texts: Vec<String>, ) -> Result<Vec<Vec<f32>>>
Generate embeddings for one or more text inputs via llama-server’s /v1/embeddings endpoint. This reuses the vectors llama.cpp already computes during inference — no separate model needed. Returns a Vec of embedding vectors (one per input string).
Auto Trait Implementations§
impl !Freeze for LLMWorker
impl !RefUnwindSafe for LLMWorker
impl Send for LLMWorker
impl Sync for LLMWorker
impl Unpin for LLMWorker
impl UnsafeUnpin for LLMWorker
impl !UnwindSafe for LLMWorker
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts
self into a Left variant of Either<Self, Self>
if into_left is true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts
self into a Left variant of Either<Self, Self>
if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more