Struct NativeRuntime

Source

pub struct NativeRuntime { /* private fields */ }

Expand description

Native runtime for local LLM inference.

Uses mistral.rs for high-performance inference on GGUF models. Supports CPU and GPU (Metal on macOS, CUDA on Linux) acceleration.

§Example

use spn_native::inference::NativeRuntime;
use spn_core::LoadConfig;

let mut runtime = NativeRuntime::new()?;
runtime.load("model.gguf".into(), LoadConfig::default()).await?;
let response = runtime.infer("Hello!", Default::default()).await?;

Implementations§

Source §

impl NativeRuntime

Source

pub fn new() -> Self

Create a new native runtime.

The runtime is created without a model loaded. Call load() to load a model before running inference.

Source

pub fn model_path(&self) -> Option<&PathBuf>

Get the path to the currently loaded model.

Source

pub fn config(&self) -> Option<&LoadConfig>

Get the load configuration for the current model.

Trait Implementations§

Source §

impl Clone for NativeRuntime

Source §

fn clone(&self) -> Self

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for NativeRuntime

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Source §

impl Default for NativeRuntime

Source §

fn default() -> Self

Returns the “default value” for a type. Read more

Source §

impl InferenceBackend for NativeRuntime

Available on non-crate feature inference only.

Source §

async fn load( &mut self, _model_path: PathBuf, _config: LoadConfig, ) -> Result<(), NativeError>

Load a model from disk. Read more

Source §

async fn unload(&mut self) -> Result<(), NativeError>

Unload the model from memory. Read more

Source §

fn is_loaded(&self) -> bool

Check if a model is currently loaded.

Source §

fn model_info(&self) -> Option<&ModelInfo>

Get metadata about the loaded model. Read more

Source §

async fn infer( &self, _prompt: &str, _options: ChatOptions, ) -> Result<ChatResponse, NativeError>

Generate a response (non-streaming). Read more

Source §

async fn infer_stream( &self, _prompt: &str, _options: ChatOptions, ) -> Result<impl Stream<Item = Result<String, NativeError>> + Send, NativeError>

Generate a response (streaming). Read more

Auto Trait Implementations§

§

impl UnwindSafe for NativeRuntime

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> DynInferenceBackend for T
where T: InferenceBackend + 'static,

Source §

fn load_dyn( &mut self, model_path: PathBuf, config: LoadConfig, ) -> Pin<Box<dyn Future<Output = Result<(), NativeError>> + Send + '_>>

Load a model from disk (boxed future for object safety).

Source §

fn unload_dyn( &mut self, ) -> Pin<Box<dyn Future<Output = Result<(), NativeError>> + Send + '_>>

Unload the model from memory (boxed future for object safety).

Source §

fn is_loaded_dyn(&self) -> bool

Check if a model is currently loaded.

Source §

fn model_info_dyn(&self) -> Option<ModelInfo>

Get metadata about the loaded model (cloned for object safety).

Source §

fn infer_dyn( &self, prompt: String, options: ChatOptions, ) -> Pin<Box<dyn Future<Output = Result<ChatResponse, NativeError>> + Send + '_>>

Generate a response (boxed future for object safety). Read more

Source §

fn infer_stream_dyn( &self, _prompt: String, _options: ChatOptions, ) -> Pin<Box<dyn Future<Output = Result<Pin<Box<dyn Stream<Item = Result<String, NativeError>> + Send>>, NativeError>> + Send + '_>>

Generate a streaming response (boxed stream for object safety). Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T> Instrument for T

Source §

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

Source §

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

Source §

impl<T, U> Into for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> PolicyExt for T
where T: ?Sized,

Source §

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow only if self and other return Action::Follow. Read more

Source §

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow if either self or other returns Action::Follow. Read more

Source §

impl<T> Same for T

Source §

type Output = T

Should always be Self

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T, U> TryFrom for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto for T
where U: TryFrom<T>,

Source §

type Error = >::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, >::Error>

Performs the conversion.

Source §

impl<T> WithSubscriber for T

Source §

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more

Source §

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more

Struct NativeRuntime Copy item path

§Example

Implementations§

impl NativeRuntime

pub fn new() -> Self

pub fn model_path(&self) -> Option<&PathBuf>

pub fn config(&self) -> Option<&LoadConfig>

Trait Implementations§

impl Clone for NativeRuntime

fn clone(&self) -> Self

fn clone_from(&mut self, source: &Self)

impl Debug for NativeRuntime

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for NativeRuntime

fn default() -> Self

impl InferenceBackend for NativeRuntime

async fn load( &mut self, _model_path: PathBuf, _config: LoadConfig, ) -> Result<(), NativeError>

async fn unload(&mut self) -> Result<(), NativeError>

fn is_loaded(&self) -> bool

fn model_info(&self) -> Option<&ModelInfo>

async fn infer( &self, _prompt: &str, _options: ChatOptions, ) -> Result<ChatResponse, NativeError>

async fn infer_stream( &self, _prompt: &str, _options: ChatOptions, ) -> Result<impl Stream<Item = Result<String, NativeError>> + Send, NativeError>

Auto Trait Implementations§

impl Freeze for NativeRuntime

impl RefUnwindSafe for NativeRuntime

impl Send for NativeRuntime

impl Sync for NativeRuntime

impl Unpin for NativeRuntime

impl UnsafeUnpin for NativeRuntime

impl UnwindSafe for NativeRuntime

Blanket Implementations§

impl<T> Any for Twhere T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for Twhere T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for Twhere T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for Twhere T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DynInferenceBackend for Twhere T: InferenceBackend + 'static,

fn load_dyn( &mut self, model_path: PathBuf, config: LoadConfig, ) -> Pin<Box<dyn Future<Output = Result<(), NativeError>> + Send + '_>>

fn unload_dyn( &mut self, ) -> Pin<Box<dyn Future<Output = Result<(), NativeError>> + Send + '_>>

fn is_loaded_dyn(&self) -> bool

fn model_info_dyn(&self) -> Option<ModelInfo>

fn infer_dyn( &self, prompt: String, options: ChatOptions, ) -> Pin<Box<dyn Future<Output = Result<ChatResponse, NativeError>> + Send + '_>>

fn infer_stream_dyn( &self, _prompt: String, _options: ChatOptions, ) -> Pin<Box<dyn Future<Output = Result<Pin<Box<dyn Stream<Item = Result<String, NativeError>> + Send>>, NativeError>> + Send + '_>>

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for Twhere U: From<T>,

fn into(self) -> U

impl<T> PolicyExt for Twhere T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>where T: Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<T> ToOwned for Twhere T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for Twhere U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for Twhere U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct NativeRuntime

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DynInferenceBackend for T
where T: InferenceBackend + 'static,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,