chat-mlx 0.0.0

Local-inference chat-rs provider (and CLI) for MiniCPM5 / Llama / Qwen models on Apple Silicon via MLX.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
// chat-core's `ChatFailure` is large; boxing every Result is not worth it. The
// other chat-rs providers (e.g. chat-mistralrs) silence this crate-wide too.
#![allow(clippy::result_large_err)]

// Public modules: declared `pub`, so downstream crates can reach their public
// items through the module paths (`api::...`, `engine::...`, `loader::...`,
// `parsers::...`).
pub mod api;
pub mod engine;
pub mod loader;
pub mod parsers;

// Private modules: not nameable from outside the crate. Only the items
// re-exported below are visible to users.
mod builder;
mod client;

// Crate-root re-exports, so callers can import these names directly from the
// crate root instead of spelling out the defining module.
// NOTE(review): `WithModel` / `WithoutModel` look like type-state markers for
// `MlxBuilder` -- confirm against the `builder` module.
pub use builder::{MlxBuilder, WithModel, WithoutModel};
pub use client::{MlxClient, StructuredMode};
// `Quantize` is also reachable as `loader::Quantize`, since `loader` is public;
// this re-export is a convenience alias at the crate root.
pub use loader::Quantize;