1//! AIMX: safe Rust bindings for Apple's [FoundationModels] on-device language
2//! model framework, also known as Apple Intelligence.
3//!
4//! `aimx` is a small, safe Rust API over the system
5//! `FoundationModels.framework`. The model runs locally on supported Apple
6//! hardware, so prompts and responses do not require API keys, network requests,
7//! or a hosted inference provider.
8//!
9//! # API overview
10//!
11//! The crate is organized around a few public concepts:
12//!
13//! - [`AppleIntelligenceModels`] starts session builders with [`AppleIntelligenceModels::session`].
14//! - [`LanguageModelSession`] owns a stateful `LanguageModelSession` transcript.
15//! - [`GenerationOptions`] configures per-request temperature and token limits.
16//! - [`ResponseStream`] implements [`futures_core::Stream`] for incremental text.
17//! - [`GenerationSchema`] and [`GenerationSchemaProperty`] mirror Apple's guided-generation
18//!   schema vocabulary for structured JSON responses.
19//! - [`ToolDefinition`] registers Rust callbacks the model can call during a
20//!   response.
21//! - [`Prompt`], [`SystemInstructions`], [`Temperature`], and [`MaxTokens`] make
22//!   important FFI and generation boundaries explicit.
23//!
24//! Top-level helpers such as [`respond`] are available for one-off prompts, but
25//! production code should usually build a [`LanguageModelSession`] so instructions, tools, and
26//! defaults are visible in one place.
27//!
28//! # Learning model
29//!
30//! AIMX is easiest to learn as three decisions:
31//!
32//! 1. Ask whether Apple Intelligence is available with [`availability`] or
33//!    [`AppleIntelligenceModels::availability`].
34//! 2. Choose either a one-shot helper such as [`respond`] or a reusable
35//!    [`LanguageModelSession`].
36//! 3. Convert application input into typed boundaries such as [`Prompt`],
37//!    [`SystemInstructions`], [`Temperature`], [`MaxTokens`], and
38//!    [`GenerationSchema`] before it reaches the Swift bridge.
39//!
40//! This is the main safety rule of the crate. Raw strings and numbers can enter
41//! at your program boundary; after that, AIMX carries meaning with Rust types
42//! and returns [`Error`] when a value cannot safely cross into
43//! FoundationModels.
44//!
45//! # Platform requirements
46//!
47//! | Requirement | Value |
48//! |---|---|
49//! | macOS | 26 (Tahoe) or later |
50//! | Hardware | Apple Silicon (M1 or later) |
51//! | System setting | Apple Intelligence enabled |
52//! | Build tool | Xcode with the macOS 26 SDK |
53//!
54//! The crate still compiles on unsupported hosts. When the Swift bridge cannot
55//! be built, or when the current machine cannot run Apple Intelligence, public
56//! model APIs return [`Error::Unavailable`] instead of panicking or failing to
57//! link.
58//!
59//! # Quick start
60//!
61//! ```no_run
62//! # async fn example() -> Result<(), aimx::Error> {
63//! use aimx::{is_available, respond};
64//!
65//! if !is_available() {
66//!     eprintln!("Apple Intelligence not available on this device");
67//!     return Ok(());
68//! }
69//!
70//! let answer = respond("What is the capital of France?").await?;
71//! println!("{answer}");
72//! # Ok(()) }
73//! ```
74//!
75//! # Builder-style sessions
76//!
77//! ```no_run
78//! # async fn example() -> Result<(), aimx::Error> {
79//! use aimx::{MaxTokens, AppleIntelligenceModels, Temperature};
80//!
81//! let session = AppleIntelligenceModels::default()
82//!     .session()
83//!     .instructions("You are a concise Rust expert.")
84//!     .temperature(Temperature::new(0.2)?)
85//!     .max_tokens(MaxTokens::new(256)?)
86//!     .build()?;
87//! let r1 = session.respond_to("What is ownership?").await?;
88//! let r2 = session.respond_to("Give me a one-line example.").await?;
89//! println!("{r1}\n{r2}");
90//! # Ok(()) }
91//! ```
92//!
93//! # Generation options
94//!
95//! Use [`GenerationOptions::new`] with [`Temperature`] and [`MaxTokens`] to keep
96//! generation defaults type-safe after input has crossed your application boundary.
97//!
98//! ```
99//! use aimx::{GenerationOptions, MaxTokens, Temperature};
100//!
101//! let precise = GenerationOptions::new()
102//!     .temperature(Temperature::new(0.2)?)
103//!     .max_tokens(MaxTokens::new(256)?);
104//! # Ok::<(), aimx::Error>(())
105//! ```
106//!
107//! # Streaming
108//!
109//! ```no_run
110//! # async fn example() -> Result<(), aimx::Error> {
111//! use aimx::LanguageModelSession;
112//!
113//! let session = LanguageModelSession::new()?;
114//! let stream = session.stream_response("Tell me a short story.")?;
115//! # Ok(()) }
116//! ```
117//!
118//! # Structured generation
119//!
120//! ```no_run
121//! # async fn example() -> Result<(), aimx::Error> {
122//! use serde::Deserialize;
123//! use aimx::{LanguageModelSession, GenerationSchema, GenerationSchemaProperty, GenerationSchemaPropertyType};
124//!
125//! #[derive(Deserialize)]
126//! struct CityInfo { name: String, population: f64, country: String }
127//!
128//! let session = LanguageModelSession::new()?;
129//! let schema = GenerationSchema::new("CityInfo")
130//!     .property(GenerationSchemaProperty::new("name", GenerationSchemaPropertyType::String))
131//!     .property(GenerationSchemaProperty::new("population", GenerationSchemaPropertyType::Double))
132//!     .property(GenerationSchemaProperty::new("country", GenerationSchemaPropertyType::String));
133//!
134//! let info: CityInfo = session.respond_generating("Describe Paris.", &schema).await?;
135//! println!("{} has {} people", info.name, info.population);
136//! # Ok(()) }
137//! ```
138//!
139//! # Tool calling
140//!
141//! ```no_run
142//! # async fn example() -> Result<(), aimx::Error> {
143//! use aimx::{
144//!     AppleIntelligenceModels, GenerationSchema, GenerationSchemaProperty, GenerationSchemaPropertyType, ToolDefinition, ToolOutput,
145//! };
146//!
147//! let tool = ToolDefinition::builder(
148//!     "get_weather",
149//!     "Get current weather for a city",
150//!     GenerationSchema::new("GetWeatherArgs")
151//!         .property(GenerationSchemaProperty::new("city", GenerationSchemaPropertyType::String)
152//!             .description("City name")),
153//! )
154//! .handler(|args| {
155//!     let city = args["city"].as_str().unwrap_or("unknown");
156//!     Ok(ToolOutput::from(format!("Weather in {city}: sunny, 72°F")))
157//! });
158//!
159//! let session = AppleIntelligenceModels::default()
160//!     .session()
161//!     .instructions("You are a weather assistant.")
162//!     .tool(tool)
163//!     .build()?;
164//! let response = session.respond_to("What's the weather in Tokyo?").await?;
165//! println!("{response}");
166//! # Ok(()) }
167//! ```
168//!
169//! # Errors
170//!
171//! All fallible APIs use [`Error`]. The most common variants are:
172//!
173//! - [`Error::Unavailable`] when Apple Intelligence cannot run on this machine.
174//! - [`Error::NullByte`] when prompt or instruction text cannot cross the C FFI
175//!   boundary.
176//! - [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when generation
177//!   options are outside the bridge-supported range.
178//! - [`Error::Generation`] for model or bridge failures during generation.
179//! - [`Error::Json`] for schema serialization or structured-response decoding.
180//!
181//! # Panics
182//!
183//! Public APIs in this crate are designed not to panic for user-provided input.
184//! Validation errors are reported through [`Error`]. Panics inside user-provided
185//! tool handlers are caught and returned as [`ToolCallError`].
186//!
187//! # Safety
188//!
189//! This is a safe Rust wrapper. The private FFI layer owns all `unsafe` calls to
190//! Swift-exported C functions, validates string inputs before crossing the
191//! boundary, and stores opaque Swift handles behind an owned `SessionHandle`.
192//! Callers do not need to uphold any unsafe preconditions.
193//!
194//! # Documentation style
195//!
196//! The public docs intentionally follow the shape recommended by the [rustdoc
197//! book] and the [Rust API Guidelines]: a crate-level overview, examples that
198//! compile where possible, intra-doc links, and explicit error, panic, and
199//! safety sections for fallible or boundary-sensitive APIs. Conceptual docs use
200//! the same teaching order as the tutorial: introduce one idea, show the
201//! smallest useful example, then name the invariant that keeps the example safe.
202//!
203//! [FoundationModels]: https://developer.apple.com/documentation/foundationmodels
204//! [rustdoc book]: https://doc.rust-lang.org/rustdoc/how-to-write-documentation.html
205//! [Rust API Guidelines]: https://rust-lang.github.io/api-guidelines/documentation.html
206
207#![warn(
208    missing_docs,
209    rustdoc::bare_urls,
210    rustdoc::broken_intra_doc_links,
211    rustdoc::invalid_codeblock_attributes
212)]
213#![cfg_attr(
214    not(test),
215    deny(
216        clippy::expect_used,
217        clippy::panic,
218        clippy::todo,
219        clippy::unimplemented,
220        clippy::unwrap_used
221    )
222)]
223
224use std::convert::Infallible;
225use std::ffi::{CStr, CString, NulError};
226use std::future::Future;
227use std::pin::Pin;
228use std::task::{Context as StdContext, Poll};
229
230use futures_channel::mpsc;
231use futures_core::Stream;
232
233#[cfg(aimx_bridge)]
234use std::ffi::{c_char, c_void};
235
236#[cfg(aimx_bridge)]
237use std::ptr::null;
238
239#[cfg(aimx_bridge)]
240use std::ptr::NonNull;
241
242#[cfg(aimx_bridge)]
243use std::sync::Arc;
244
245#[cfg(aimx_bridge)]
246use futures_channel::oneshot;
247
248// ─── FFI declarations ──────────────────────────────────────────────────────────
249
// Raw Swift-exported C entry points for the FoundationModels bridge. These are
// declared only when the build script sets the `aimx_bridge` cfg, i.e. when the
// Swift side could actually be compiled for this host. All callers live in the
// private FFI layer of this crate, which upholds the pointer and lifetime
// invariants (see the crate-level "Safety" section).
#[cfg(aimx_bridge)]
unsafe extern "C" {
    // Availability probe; the i32 code is mapped to `AvailabilityError`
    // elsewhere. NOTE(review): the exact code-to-variant mapping is defined on
    // the Swift side — confirm against the bridge source.
    fn fm_availability_reason() -> i32;
    // Creates a session from nul-terminated instructions text; returns an
    // opaque handle that must eventually be released via `fm_session_destroy`.
    fn fm_session_create(instructions: *const c_char) -> *mut c_void;
    // Session constructor variant that also registers tools. `tools_json`
    // carries the tool schemas; `tool_dispatch` is invoked by Swift with
    // (tool_ctx, tool name, args JSON, completion ctx, completion callback).
    fn fm_session_create_with_tools(
        instructions: *const c_char,
        tools_json: *const c_char,
        tool_ctx: *mut c_void,
        tool_dispatch: extern "C" fn(
            *mut c_void,
            *const c_char,
            *const c_char,
            *mut c_void,
            extern "C" fn(*mut c_void, *const c_char, *const c_char),
        ),
    ) -> *mut c_void;
    // Releases a handle returned by either session constructor.
    fn fm_session_destroy(handle: *mut c_void);
    // One-shot text response. `callback` receives (ctx, response, error);
    // negative temperature / max_tokens act as "use model default" sentinels
    // (see `GenerationConfig::ffi_temperature` / `ffi_max_tokens`).
    fn fm_session_respond(
        handle: *mut c_void,
        prompt: *const c_char,
        temperature: f64,
        max_tokens: i64,
        ctx: *mut c_void,
        callback: extern "C" fn(*mut c_void, *const c_char, *const c_char),
    );
    // Guided-generation response constrained by `schema_json`; callback shape
    // matches `fm_session_respond`.
    fn fm_session_respond_structured(
        handle: *mut c_void,
        prompt: *const c_char,
        schema_json: *const c_char,
        temperature: f64,
        max_tokens: i64,
        ctx: *mut c_void,
        callback: extern "C" fn(*mut c_void, *const c_char, *const c_char),
    );
    // Streaming response: `on_token` fires per text fragment, `on_done` fires
    // once with an error message or null on success.
    fn fm_session_stream(
        handle: *mut c_void,
        prompt: *const c_char,
        temperature: f64,
        max_tokens: i64,
        ctx: *mut c_void,
        on_token: extern "C" fn(*mut c_void, *const c_char),
        on_done: extern "C" fn(*mut c_void, *const c_char),
    );
}
294
295// ─── Cross-target trait bounds ────────────────────────────────────────────────
296
/// `Send` on native targets and a no-op marker on WebAssembly.
#[cfg(not(target_family = "wasm"))]
pub trait WasmCompatSend: Send {}

/// No-op marker on WebAssembly where single-threaded runtimes do not require `Send`.
#[cfg(target_family = "wasm")]
pub trait WasmCompatSend {}

// Blanket impl: on native targets every `Send` type is `WasmCompatSend`, so
// bounds written against this trait cost nothing extra.
#[cfg(not(target_family = "wasm"))]
impl<T> WasmCompatSend for T where T: Send {}

// Blanket impl: on wasm the marker is unconditional, so the same bounds
// compile without requiring `Send` from single-threaded runtimes.
#[cfg(target_family = "wasm")]
impl<T> WasmCompatSend for T {}
310
/// `Sync` on native targets and a no-op marker on WebAssembly.
#[cfg(not(target_family = "wasm"))]
pub trait WasmCompatSync: Sync {}

/// No-op marker on WebAssembly where single-threaded runtimes do not require `Sync`.
#[cfg(target_family = "wasm")]
pub trait WasmCompatSync {}

// Blanket impl: on native targets every `Sync` type qualifies automatically.
#[cfg(not(target_family = "wasm"))]
impl<T> WasmCompatSync for T where T: Sync {}

// Blanket impl: on wasm the marker holds for all types.
#[cfg(target_family = "wasm")]
impl<T> WasmCompatSync for T {}
324
// Generates a transparent string newtype with the crate's standard surface:
// `new`/`as_str`/`into_string`/`is_empty`, `From<String>`/`From<&str>`,
// `AsRef<str>`, `Display`, and symmetric `PartialEq<&str>` comparisons.
// `#[serde(transparent)]` keeps the JSON representation a plain string.
macro_rules! string_newtype {
    ($(#[$meta:meta])* $name:ident) => {
        $(#[$meta])*
        #[derive(Debug, Clone, PartialEq, Eq, Hash, serde::Serialize, serde::Deserialize)]
        #[serde(transparent)]
        pub struct $name(String);

        impl $name {
            /// Creates a new value.
            pub fn new(value: impl Into<String>) -> Self {
                Self(value.into())
            }

            /// Borrows the inner string.
            pub fn as_str(&self) -> &str {
                &self.0
            }

            /// Consumes the wrapper and returns the inner string.
            pub fn into_string(self) -> String {
                self.0
            }

            /// Returns `true` when the wrapped string is empty.
            pub fn is_empty(&self) -> bool {
                self.0.is_empty()
            }
        }

        impl From<String> for $name {
            fn from(value: String) -> Self {
                Self(value)
            }
        }

        impl From<&str> for $name {
            fn from(value: &str) -> Self {
                Self(value.to_owned())
            }
        }

        impl AsRef<str> for $name {
            fn as_ref(&self) -> &str {
                self.as_str()
            }
        }

        impl std::fmt::Display for $name {
            fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
                f.write_str(self.as_str())
            }
        }

        // Symmetric `&str` comparisons so call sites can write
        // `name == "x"` and `"x" == name` without conversions.
        impl PartialEq<&str> for $name {
            fn eq(&self, other: &&str) -> bool {
                self.as_str() == *other
            }
        }

        impl PartialEq<$name> for &str {
            fn eq(&self, other: &$name) -> bool {
                *self == other.as_str()
            }
        }
    };
}
391
// Typed string boundaries. Each invocation below expands to a full newtype via
// `string_newtype!`; the `pub type` aliases preserve names used by earlier
// releases so existing callers keep compiling.
string_newtype!(
    /// Developer-provided system instructions for a session.
    InstructionsText
);
string_newtype!(
    /// UTF-8 prompt text sent to the model.
    PromptText
);
string_newtype!(
    /// Text returned by the model.
    ResponseText
);
/// MLX-style alias for text generated by the model.
pub type GeneratedText = ResponseText;

string_newtype!(
    /// Name of a structured-generation schema.
    GenerationSchemaName
);
/// Compatibility alias for the earlier structured-generation schema-name type.
pub type ResponseSchemaName = GenerationSchemaName;
/// Compatibility alias for the older structured-generation schema-name type.
pub type SchemaName = GenerationSchemaName;

string_newtype!(
    /// Name of a property in a structured-generation schema.
    GenerationSchemaPropertyName
);
/// Compatibility alias for the earlier structured-generation field-name type.
pub type ResponseFieldName = GenerationSchemaPropertyName;
/// Compatibility alias for the older structured-generation field-name type.
pub type SchemaPropertyName = GenerationSchemaPropertyName;

string_newtype!(
    /// Human-readable description attached to a schema or schema property.
    SchemaDescription
);
string_newtype!(
    /// Name the model uses to invoke a tool.
    ToolName
);
string_newtype!(
    /// Human-readable description of a tool.
    ToolDescription
);
string_newtype!(
    /// Successful output returned from a tool call.
    ToolOutput
);
441
442/// Prompt text that has been checked for C-FFI compatibility.
443#[derive(Debug, Clone, PartialEq, Eq)]
444pub struct Prompt {
445    text: String,
446    c_text: CString,
447}
448
449impl Prompt {
450    /// Creates a prompt, rejecting text containing interior null bytes.
451    ///
452    /// Use this when you want to validate user-provided prompt text before
453    /// constructing a [`LanguageModelSession`] or calling [`respond`].
454    ///
455    /// # Examples
456    ///
457    /// ```
458    /// use aimx::Prompt;
459    ///
460    /// let prompt = Prompt::new("Summarize this note")?;
461    /// assert_eq!(prompt.as_str(), "Summarize this note");
462    /// # Ok::<(), aimx::Error>(())
463    /// ```
464    ///
465    /// # Errors
466    ///
467    /// Returns [`Error::NullByte`] if `value` contains an interior null byte.
468    pub fn new(value: impl Into<String>) -> Result<Self, Error> {
469        let text = value.into();
470        let c_text = CString::new(text.clone())?;
471
472        Ok(Self { text, c_text })
473    }
474
475    /// Borrows the prompt as UTF-8 text.
476    pub fn as_str(&self) -> &str {
477        &self.text
478    }
479
480    #[cfg(aimx_bridge)]
481    fn as_ptr(&self) -> *const c_char {
482        self.c_text.as_ptr()
483    }
484}
485
486impl TryFrom<&str> for Prompt {
487    type Error = Error;
488
489    fn try_from(value: &str) -> Result<Self, Self::Error> {
490        Self::new(value)
491    }
492}
493
494impl TryFrom<String> for Prompt {
495    type Error = Error;
496
497    fn try_from(value: String) -> Result<Self, Self::Error> {
498        Self::new(value)
499    }
500}
501
502impl TryFrom<PromptText> for Prompt {
503    type Error = Error;
504
505    fn try_from(value: PromptText) -> Result<Self, Self::Error> {
506        Self::new(value.into_string())
507    }
508}
509
510impl AsRef<str> for Prompt {
511    fn as_ref(&self) -> &str {
512        self.as_str()
513    }
514}
515
516/// Compatibility alias for the older prompt boundary name.
517pub type PromptInput = Prompt;
518
519/// LanguageModelSession instructions that have been checked for C-FFI compatibility.
520#[derive(Debug, Clone, PartialEq, Eq)]
521pub struct SystemInstructions {
522    text: String,
523    c_text: CString,
524}
525
526impl SystemInstructions {
527    /// Creates session instructions, rejecting text containing interior null bytes.
528    ///
529    /// SystemInstructions are developer-controlled system guidance that persists for
530    /// the lifetime of a [`LanguageModelSession`].
531    ///
532    /// # Examples
533    ///
534    /// ```
535    /// use aimx::SystemInstructions;
536    ///
537    /// let instructions = SystemInstructions::new("Answer in one concise paragraph.")?;
538    /// assert_eq!(instructions.as_str(), "Answer in one concise paragraph.");
539    /// # Ok::<(), aimx::Error>(())
540    /// ```
541    ///
542    /// # Errors
543    ///
544    /// Returns [`Error::NullByte`] if `value` contains an interior null byte.
545    pub fn new(value: impl Into<String>) -> Result<Self, Error> {
546        let text = value.into();
547        let c_text = CString::new(text.clone())?;
548
549        Ok(Self { text, c_text })
550    }
551
552    /// Empty system instructions.
553    ///
554    /// This is equivalent to `SystemInstructions::new("")` without the fallible
555    /// allocation path.
556    pub fn empty() -> Self {
557        Self {
558            text: String::new(),
559            c_text: CString::default(),
560        }
561    }
562
563    /// Borrows the instructions as UTF-8 text.
564    pub fn as_str(&self) -> &str {
565        &self.text
566    }
567
568    #[cfg(aimx_bridge)]
569    fn as_ptr(&self) -> *const c_char {
570        self.c_text.as_ptr()
571    }
572}
573
574impl Default for SystemInstructions {
575    fn default() -> Self {
576        Self::empty()
577    }
578}
579
580impl TryFrom<&str> for SystemInstructions {
581    type Error = Error;
582
583    fn try_from(value: &str) -> Result<Self, Self::Error> {
584        Self::new(value)
585    }
586}
587
588impl TryFrom<String> for SystemInstructions {
589    type Error = Error;
590
591    fn try_from(value: String) -> Result<Self, Self::Error> {
592        Self::new(value)
593    }
594}
595
596impl TryFrom<InstructionsText> for SystemInstructions {
597    type Error = Error;
598
599    fn try_from(value: InstructionsText) -> Result<Self, Self::Error> {
600        Self::new(value.into_string())
601    }
602}
603
604/// Compatibility alias for the older system-instructions boundary name.
605pub type Instructions = SystemInstructions;
606
607/// Valid model temperature in the inclusive range `0.0..=2.0`.
608#[derive(Debug, Clone, Copy, PartialEq)]
609pub struct Temperature(f64);
610
611impl Temperature {
612    /// Lowest supported temperature.
613    pub const MIN: f64 = 0.0;
614    /// Highest supported temperature.
615    pub const MAX: f64 = 2.0;
616
617    /// Creates a validated temperature.
618    ///
619    /// Apple Intelligence accepts temperatures in the inclusive range
620    /// [`Temperature::MIN`] through [`Temperature::MAX`]. Lower values make
621    /// output more deterministic; higher values make output more varied.
622    ///
623    /// # Examples
624    ///
625    /// ```
626    /// use aimx::Temperature;
627    ///
628    /// let temperature = Temperature::new(0.2)?;
629    /// assert_eq!(temperature.as_f64(), 0.2);
630    /// # Ok::<(), aimx::Error>(())
631    /// ```
632    ///
633    /// # Errors
634    ///
635    /// Returns [`Error::InvalidTemperature`] when `value` is outside
636    /// `0.0..=2.0` or is `NaN`.
637    pub fn new(value: f64) -> Result<Self, Error> {
638        if (Self::MIN..=Self::MAX).contains(&value) {
639            Ok(Self(value))
640        } else {
641            Err(Error::InvalidTemperature(value))
642        }
643    }
644
645    /// Returns the raw floating-point temperature.
646    pub fn as_f64(self) -> f64 {
647        self.0
648    }
649}
650
651impl TryFrom<f64> for Temperature {
652    type Error = Error;
653
654    fn try_from(value: f64) -> Result<Self, Self::Error> {
655        Self::new(value)
656    }
657}
658
659/// Maximum number of response tokens requested from the model.
660#[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash)]
661pub struct MaxTokens(usize);
662
663impl MaxTokens {
664    /// Highest token limit representable by the Swift bridge.
665    pub const MAX: usize = i64::MAX as usize;
666
667    /// Creates a token limit.
668    ///
669    /// The Rust API stores token counts as [`usize`], but the Swift bridge uses
670    /// `i64`. This constructor rejects values that cannot cross that boundary
671    /// without changing meaning.
672    ///
673    /// # Examples
674    ///
675    /// ```
676    /// use aimx::MaxTokens;
677    ///
678    /// let max_tokens = MaxTokens::new(256)?;
679    /// assert_eq!(max_tokens.get(), 256);
680    /// # Ok::<(), aimx::Error>(())
681    /// ```
682    ///
683    /// # Errors
684    ///
685    /// Returns [`Error::InvalidMaxTokens`] when `value` is greater than
686    /// [`MaxTokens::MAX`].
687    pub fn new(value: usize) -> Result<Self, Error> {
688        if value <= Self::MAX {
689            Ok(Self(value))
690        } else {
691            Err(Error::InvalidMaxTokens(value))
692        }
693    }
694
695    /// Returns the raw token count.
696    pub fn get(self) -> usize {
697        self.0
698    }
699}
700
701impl TryFrom<usize> for MaxTokens {
702    type Error = Error;
703
704    fn try_from(value: usize) -> Result<Self, Self::Error> {
705        Self::new(value)
706    }
707}
708
709/// Error returned by the model or bridge during generation.
710#[derive(Debug, Clone, PartialEq, Eq, thiserror::Error)]
711#[error("{message}")]
712pub struct GenerationError {
713    message: String,
714}
715
716impl GenerationError {
717    /// Creates a generation error with a human-readable message.
718    pub fn new(message: impl Into<String>) -> Self {
719        Self {
720            message: message.into(),
721        }
722    }
723
724    /// Borrows the error message.
725    pub fn as_str(&self) -> &str {
726        &self.message
727    }
728}
729
730impl From<String> for GenerationError {
731    fn from(message: String) -> Self {
732        Self::new(message)
733    }
734}
735
736impl From<&str> for GenerationError {
737    fn from(message: &str) -> Self {
738        Self::new(message)
739    }
740}
741
742/// Error returned by a Rust tool handler.
743#[derive(Debug, Clone, PartialEq, Eq, thiserror::Error)]
744#[error("{message}")]
745pub struct ToolCallError {
746    message: String,
747}
748
749impl ToolCallError {
750    /// Creates a tool-call error with a human-readable message.
751    pub fn new(message: impl Into<String>) -> Self {
752        Self {
753            message: message.into(),
754        }
755    }
756
757    /// Borrows the error message.
758    pub fn as_str(&self) -> &str {
759        &self.message
760    }
761}
762
763impl From<String> for ToolCallError {
764    fn from(message: String) -> Self {
765        Self::new(message)
766    }
767}
768
769impl From<&str> for ToolCallError {
770    fn from(message: &str) -> Self {
771        Self::new(message)
772    }
773}
774
775/// Result type returned by tool handlers.
776pub type ToolResult = Result<ToolOutput, ToolCallError>;
777
// Internal plumbing: generation results produced by FFI callbacks flow back to
// async Rust through these channel types.
type ModelTextResult = Result<ResponseText, GenerationError>;
// Unbounded sender used by streaming callbacks to push incremental results.
type StreamSender = mpsc::UnboundedSender<ModelTextResult>;
// Matching receiver half polled on the Rust side.
type StreamReceiver = mpsc::UnboundedReceiver<ModelTextResult>;
// Type-erased user tool handler stored in tool registrations.
type ToolHandlerBox = Box<dyn ToolHandler>;

// One-shot channel carrying a single (non-streaming) response across the FFI
// callback boundary; bridge-only.
#[cfg(aimx_bridge)]
type ResponseSender = oneshot::Sender<ModelTextResult>;
#[cfg(aimx_bridge)]
type ResponseReceiver = oneshot::Receiver<ModelTextResult>;
// C callback signature shared by respond/structured completions:
// (ctx, response text, error text).
#[cfg(aimx_bridge)]
type ToolResultCallback = extern "C" fn(*mut c_void, *const c_char, *const c_char);
789
790// ─── Error ─────────────────────────────────────────────────────────────────────
791
/// Reasons why Apple Intelligence is not available on the current device.
// NOTE(review): variants presumably correspond to the codes returned by
// `fm_availability_reason`; the mapping itself is not visible in this file —
// confirm against the bridge/FFI layer.
#[derive(Debug, Clone, PartialEq, Eq, thiserror::Error)]
pub enum AvailabilityError {
    /// The device does not have compatible hardware (requires Apple Silicon M1 or later).
    #[error("device is not eligible (requires Apple Silicon M1 or later)")]
    DeviceNotEligible,
    /// Apple Intelligence is supported but has not been enabled in System Settings.
    #[error("Apple Intelligence is not enabled in System Settings")]
    NotEnabled,
    /// The on-device model is still downloading or is otherwise not ready.
    #[error("the on-device model is not ready yet")]
    ModelNotReady,
    /// An unrecognized availability state was returned by the framework.
    #[error("unknown availability state")]
    Unknown,
}

/// Compatibility alias for the older availability error name.
pub type UnavailabilityReason = AvailabilityError;
811
/// Errors returned by this crate.
#[derive(Debug, thiserror::Error)]
pub enum Error {
    /// Apple Intelligence is not available on this device.
    // `#[source]` (rather than `#[from]`) keeps the availability reason in the
    // error chain while requiring explicit construction.
    #[error("Apple Intelligence unavailable: {0}")]
    Unavailable(#[source] AvailabilityError),

    /// The model produced an error during text generation.
    #[error("generation error: {0}")]
    Generation(#[from] GenerationError),

    /// An argument contained a null byte and could not be converted to a C string.
    // Produced via `?` on `CString::new` in `Prompt::new` / `SystemInstructions::new`.
    #[error("argument contains a null byte: {0}")]
    NullByte(#[from] NulError),

    /// A `temperature` value outside the valid range [0.0, 2.0] was supplied.
    #[error("temperature {0} is out of range; expected 0.0 – 2.0")]
    InvalidTemperature(f64),

    /// A `max_tokens` value too large for the AIMX bridge was supplied.
    #[error("max_tokens {0} is out of range; expected no more than i64::MAX")]
    InvalidMaxTokens(usize),

    /// JSON serialisation or deserialisation failed.
    #[error("JSON error: {0}")]
    Json(#[from] serde_json::Error),

    /// A tool invoked by the model returned an error.
    #[error("tool '{name}' failed: {error}")]
    ToolError {
        /// Tool name.
        name: ToolName,
        /// Tool failure.
        #[source]
        error: ToolCallError,
    },
}

// `Infallible` is uninhabited, so this conversion can never execute at
// runtime; the empty match proves that to the compiler. It exists so generic
// code bounded on `TryFrom`/`Into<Error>` also accepts infallible paths.
impl From<Infallible> for Error {
    fn from(error: Infallible) -> Self {
        match error {}
    }
}
855
856// ─── GenerationOptions ─────────────────────────────────────────────────────────
857
858/// Tuning parameters for a single generation request.
859///
860/// Values are optional; `None` uses the model's built-in default. Numeric
861/// settings are stored as [`Temperature`] and [`MaxTokens`] so validated
862/// generation semantics cannot be bypassed after construction.
863#[derive(Debug, Default, Clone)]
864pub struct GenerationOptions {
865    temperature: Option<Temperature>,
866    max_tokens: Option<MaxTokens>,
867}
868
869impl GenerationOptions {
870    /// Creates options using model defaults.
871    pub fn new() -> Self {
872        Self::default()
873    }
874
875    /// Sets the generation temperature.
876    ///
877    /// Range: `0.0` (fully deterministic) to `2.0` (very creative).
878    pub fn temperature(mut self, temperature: Temperature) -> Self {
879        self.temperature = Some(temperature);
880        self
881    }
882
883    /// Alias for [`GenerationOptions::temperature`].
884    pub fn with_temperature(mut self, temperature: Temperature) -> Self {
885        self = self.temperature(temperature);
886        self
887    }
888
889    /// Parses and sets a generation temperature from a raw boundary value.
890    ///
891    /// Prefer [`GenerationOptions::temperature`] when your code already has a
892    /// [`Temperature`]. Use this at IO boundaries such as CLI, JSON, or UI input.
893    ///
894    /// # Errors
895    ///
896    /// Returns [`Error::InvalidTemperature`] when `temperature` is outside
897    /// Apple Intelligence's supported range.
898    pub fn try_temperature(self, temperature: f64) -> Result<Self, Error> {
899        Ok(self.temperature(Temperature::new(temperature)?))
900    }
901
902    /// Sets the maximum number of response tokens.
903    ///
904    /// The model's session has a combined context window of 4 096 tokens
905    /// (instructions + all prompts + all responses). Leaving this unset lets the
906    /// model decide.
907    pub fn max_tokens(mut self, max_tokens: MaxTokens) -> Self {
908        self.max_tokens = Some(max_tokens);
909        self
910    }
911
912    /// Alias for [`GenerationOptions::max_tokens`].
913    pub fn with_max_tokens(mut self, max_tokens: MaxTokens) -> Self {
914        self = self.max_tokens(max_tokens);
915        self
916    }
917
918    /// Parses and sets a maximum token count from a raw boundary value.
919    ///
920    /// Prefer [`GenerationOptions::max_tokens`] when your code already has a
921    /// [`MaxTokens`]. Use this at IO boundaries such as CLI, JSON, or UI input.
922    ///
923    /// # Errors
924    ///
925    /// Returns [`Error::InvalidMaxTokens`] when the value cannot be represented
926    /// by the Swift bridge.
927    pub fn try_max_tokens(self, max_tokens: usize) -> Result<Self, Error> {
928        Ok(self.max_tokens(MaxTokens::new(max_tokens)?))
929    }
930
931    /// Returns the configured typed temperature, if any.
932    pub fn temperature_value(&self) -> Option<Temperature> {
933        self.temperature
934    }
935
936    /// Returns the configured typed maximum response token count, if any.
937    pub fn max_tokens_value(&self) -> Option<MaxTokens> {
938        self.max_tokens
939    }
940
941    /// Validates all configured option values.
942    ///
943    /// Values constructed through this type are already validated. This method
944    /// is kept so generic setup code can verify options before storing them.
945    ///
946    /// # Examples
947    ///
948    /// ```
949    /// use aimx::{GenerationOptions, MaxTokens, Temperature};
950    ///
951    /// let options = GenerationOptions::new()
952    ///     .temperature(Temperature::new(0.4)?)
953    ///     .max_tokens(MaxTokens::new(128)?);
954    /// options.validate()?;
955    /// # Ok::<(), aimx::Error>(())
956    /// ```
957    ///
958    /// # Errors
959    ///
960    /// This method returns errors only if options were constructed through a
961    /// future boundary path that can carry invalid data.
962    pub fn validate(&self) -> Result<(), Error> {
963        GenerationConfig::try_from(self).map(|_| ())
964    }
965
966    fn validated(&self) -> Result<GenerationConfig, Error> {
967        GenerationConfig::try_from(self)
968    }
969}
970
/// Bridge-ready snapshot of [`GenerationOptions`].
///
/// Unset fields are encoded as `-1` sentinels by `ffi_temperature` /
/// `ffi_max_tokens` when crossing the C boundary.
#[derive(Debug, Clone, Copy, Default)]
struct GenerationConfig {
    /// Sampling temperature, if configured.
    temperature: Option<Temperature>,
    /// Maximum response token count, if configured.
    max_tokens: Option<MaxTokens>,
}
976
977impl GenerationConfig {
978    fn ffi_temperature(self) -> f64 {
979        self.temperature.map(Temperature::as_f64).unwrap_or(-1.0)
980    }
981
982    fn ffi_max_tokens(self) -> i64 {
983        self.max_tokens
984            .map(|max_tokens| max_tokens.get() as i64)
985            .unwrap_or(-1)
986    }
987}
988
impl TryFrom<&GenerationOptions> for GenerationConfig {
    type Error = Error;

    // Infallible today: typed `Temperature` / `MaxTokens` values are validated
    // at construction. The fallible signature is kept so future boundary paths
    // that can carry invalid data reuse the same conversion shape (see the
    // docs on `GenerationOptions::validate`).
    fn try_from(options: &GenerationOptions) -> Result<Self, Self::Error> {
        Ok(Self {
            temperature: options.temperature,
            max_tokens: options.max_tokens,
        })
    }
}

// ─── GenerationSchema types for structured generation ────────────────────────────────────

/// The type of a single property in a [`GenerationSchema`].
///
/// `rename_all = "lowercase"` makes variants serialize as `"string"`,
/// `"integer"`, `"double"`, and `"bool"` in the schema JSON.
#[derive(Debug, Clone, serde::Serialize)]
#[serde(rename_all = "lowercase")]
pub enum GenerationSchemaPropertyType {
    /// UTF-8 text.
    String,
    /// Whole number (serialised as JSON integer).
    Integer,
    /// Floating-point number.
    Double,
    /// Boolean true/false.
    Bool,
}

/// Compatibility alias for the older structured-generation property type name.
pub type ResponseFieldType = GenerationSchemaPropertyType;
/// Compatibility alias for the oldest structured-generation property type name.
pub type SchemaPropertyType = GenerationSchemaPropertyType;
1020
/// Whether a [`GenerationSchemaProperty`] must appear in structured output.
#[derive(Debug, Clone, Copy, PartialEq, Eq, Default)]
pub enum GenerationSchemaPropertyRequirement {
    /// The model must include this property (the default).
    #[default]
    Required,
    /// The model may omit this property.
    Optional,
}

impl GenerationSchemaPropertyRequirement {
    /// Returns `true` when the property may be omitted.
    pub fn is_optional(self) -> bool {
        self == Self::Optional
    }

    /// Returns `true` when the property must be present.
    pub fn is_required(self) -> bool {
        !self.is_optional()
    }
}
1042
/// A single property within a [`GenerationSchema`].
///
/// Serialized to the bridge JSON by the hand-written `serde::Serialize`
/// implementation, which emits `description` only when present.
#[derive(Debug, Clone)]
pub struct GenerationSchemaProperty {
    /// Property name (matches the JSON key in the model output).
    pub name: GenerationSchemaPropertyName,
    /// Optional human-readable hint that guides the model.
    pub description: Option<SchemaDescription>,
    /// The expected type of this property.
    pub property_type: GenerationSchemaPropertyType,
    /// Whether the model must include or may omit this property.
    pub requirement: GenerationSchemaPropertyRequirement,
}

/// Compatibility alias for the older structured-generation property name.
pub type ResponseField = GenerationSchemaProperty;
/// Compatibility alias for the oldest structured-generation property name.
pub type SchemaProperty = GenerationSchemaProperty;
1060
1061impl GenerationSchemaProperty {
1062    /// Creates a required property with the given name and type.
1063    pub fn new(
1064        name: impl Into<GenerationSchemaPropertyName>,
1065        property_type: GenerationSchemaPropertyType,
1066    ) -> Self {
1067        Self {
1068            name: name.into(),
1069            description: None,
1070            property_type,
1071            requirement: GenerationSchemaPropertyRequirement::Required,
1072        }
1073    }
1074
1075    /// Attaches a human-readable description that guides the model.
1076    pub fn description(mut self, description: impl Into<SchemaDescription>) -> Self {
1077        self.description = Some(description.into());
1078        self
1079    }
1080
1081    /// Marks this property as optional (the model may omit it).
1082    pub fn optional(mut self) -> Self {
1083        self.requirement = GenerationSchemaPropertyRequirement::Optional;
1084        self
1085    }
1086
1087    /// Marks this property as required.
1088    pub fn required(mut self) -> Self {
1089        self.requirement = GenerationSchemaPropertyRequirement::Required;
1090        self
1091    }
1092}
1093
1094impl serde::Serialize for GenerationSchemaProperty {
1095    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
1096    where
1097        S: serde::Serializer,
1098    {
1099        use serde::ser::SerializeStruct;
1100
1101        let field_count = if self.description.is_some() { 4 } else { 3 };
1102        let mut state = serializer.serialize_struct("GenerationSchemaProperty", field_count)?;
1103        state.serialize_field("name", &self.name)?;
1104        if let Some(description) = &self.description {
1105            state.serialize_field("description", description)?;
1106        }
1107        state.serialize_field("type", &self.property_type)?;
1108        state.serialize_field("optional", &self.requirement.is_optional())?;
1109        state.end()
1110    }
1111}
1112
/// Describes the JSON object shape that the model must produce for structured generation.
///
/// Build one using the builder methods, then pass it to [`LanguageModelSession::generate_object`].
///
/// ```
/// use aimx::{GenerationSchema, GenerationSchemaProperty, GenerationSchemaPropertyType};
///
/// let schema = GenerationSchema::new("Point")
///     .property(GenerationSchemaProperty::new("x", GenerationSchemaPropertyType::Double))
///     .property(GenerationSchemaProperty::new("y", GenerationSchemaPropertyType::Double));
/// ```
#[derive(Debug, Clone, serde::Serialize)]
pub struct GenerationSchema {
    /// Internal type name used by the model's structured generation system.
    pub name: GenerationSchemaName,
    /// Optional description of what this type represents.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<SchemaDescription>,
    /// The properties the model must populate, serialized in insertion order.
    pub properties: Vec<GenerationSchemaProperty>,
}

/// Compatibility alias for the older structured-generation schema name.
pub type ResponseSchema = GenerationSchema;
/// Compatibility alias for the oldest structured-generation schema name.
pub type Schema = GenerationSchema;
1139
1140impl GenerationSchema {
1141    /// Creates a new empty schema with the given type name.
1142    pub fn new(name: impl Into<GenerationSchemaName>) -> Self {
1143        Self {
1144            name: name.into(),
1145            description: None,
1146            properties: Vec::new(),
1147        }
1148    }
1149
1150    /// Attaches a description of this type.
1151    pub fn description(mut self, description: impl Into<SchemaDescription>) -> Self {
1152        self.description = Some(description.into());
1153        self
1154    }
1155
1156    /// Adds a property to this schema.
1157    pub fn property(mut self, property: GenerationSchemaProperty) -> Self {
1158        self.properties.push(property);
1159        self
1160    }
1161}
1162
1163// ─── Tool calling ──────────────────────────────────────────────────────────────
1164
/// A function that the model can invoke when responding to a prompt.
///
/// The handler receives the model's arguments as a [`serde_json::Value`] and must return
/// either a [`ToolOutput`] delivered back to the model or a [`ToolCallError`].
///
/// Build one with [`ToolDefinition::builder`], then attach it to a [`LanguageModelSessionBuilder`].
pub struct ToolDefinition {
    /// Name the model uses to reference this tool. Must be unique within a session.
    pub name: ToolName,
    /// Human-readable description shown to the model.
    pub description: ToolDescription,
    /// GenerationSchema describing the arguments the model must supply when calling this tool.
    pub parameters: GenerationSchema,
    /// Type-erased Rust callback invoked when the model calls this tool.
    handler: ToolHandlerBox,
}
1180
1181impl ToolDefinition {
1182    /// Creates a complete tool definition from a typed handler.
1183    pub fn new(
1184        name: impl Into<ToolName>,
1185        description: impl Into<ToolDescription>,
1186        parameters: GenerationSchema,
1187        handler: impl Fn(serde_json::Value) -> ToolResult + WasmCompatSend + WasmCompatSync + 'static,
1188    ) -> Self {
1189        Self::builder(name, description, parameters).handler(handler)
1190    }
1191
1192    /// Starts building a tool definition.
1193    pub fn builder(
1194        name: impl Into<ToolName>,
1195        description: impl Into<ToolDescription>,
1196        parameters: GenerationSchema,
1197    ) -> ToolDefinitionBuilder {
1198        ToolDefinitionBuilder {
1199            name: name.into(),
1200            description: description.into(),
1201            parameters,
1202        }
1203    }
1204
1205    /// Alias for [`ToolDefinition::new`] that reads well at call sites.
1206    pub fn from_handler(
1207        name: impl Into<ToolName>,
1208        description: impl Into<ToolDescription>,
1209        parameters: GenerationSchema,
1210        handler: impl Fn(serde_json::Value) -> ToolResult + WasmCompatSend + WasmCompatSync + 'static,
1211    ) -> Self {
1212        Self::new(name, description, parameters, handler)
1213    }
1214
1215    #[cfg(aimx_bridge)]
1216    fn bridge_description(&self) -> serde_json::Value {
1217        serde_json::json!({
1218            "name": self.name.as_str(),
1219            "description": self.description.as_str(),
1220            "properties": &self.parameters.properties,
1221        })
1222    }
1223}
1224
/// Builder for [`ToolDefinition`].
///
/// Produced by [`ToolDefinition::builder`]; finish it by attaching the Rust
/// callback with [`ToolDefinitionBuilder::handler`].
#[derive(Debug, Clone)]
pub struct ToolDefinitionBuilder {
    /// Name the model uses to reference the tool.
    name: ToolName,
    /// Human-readable description shown to the model.
    description: ToolDescription,
    /// Argument schema the model must satisfy when calling the tool.
    parameters: GenerationSchema,
}
1232
1233impl ToolDefinitionBuilder {
1234    /// Attaches the Rust handler and returns a complete tool definition.
1235    pub fn handler(
1236        self,
1237        handler: impl Fn(serde_json::Value) -> ToolResult + WasmCompatSend + WasmCompatSync + 'static,
1238    ) -> ToolDefinition {
1239        ToolDefinition {
1240            name: self.name,
1241            description: self.description,
1242            parameters: self.parameters,
1243            handler: Box::new(handler),
1244        }
1245    }
1246}
1247
/// Trait boundary implemented by callable Rust tools.
pub trait Tool: std::fmt::Debug + WasmCompatSend + WasmCompatSync {
    /// Returns the tool name visible to the model.
    fn name(&self) -> &ToolName;

    /// Returns the human-readable tool description visible to the model.
    fn description(&self) -> &ToolDescription;

    /// Returns the JSON argument schema visible to the model.
    fn parameters(&self) -> &GenerationSchema;

    /// Executes the tool with model-supplied arguments.
    ///
    /// # Errors
    ///
    /// Returns [`ToolCallError`] when the handler cannot satisfy the model's
    /// request. The error text is forwarded back through the bridge as the tool
    /// result error.
    fn call(&self, args: serde_json::Value) -> ToolResult;
}

impl Tool for ToolDefinition {
    fn name(&self) -> &ToolName {
        &self.name
    }

    fn description(&self) -> &ToolDescription {
        &self.description
    }

    fn parameters(&self) -> &GenerationSchema {
        &self.parameters
    }

    // Routed through `call_tool_handler` so a panicking handler becomes a
    // `ToolCallError` instead of unwinding.
    fn call(&self, args: serde_json::Value) -> ToolResult {
        call_tool_handler(self.handler.as_ref(), args)
    }
}

/// Object-safe adapter so boxed handler closures can be stored and invoked
/// uniformly (see the boxed `handler` field on `ToolDefinition`).
trait ToolHandler: WasmCompatSend + WasmCompatSync {
    /// Invokes the handler with the model-supplied JSON arguments.
    fn call(&self, args: serde_json::Value) -> ToolResult;
}

// Blanket impl: any matching closure or function is a `ToolHandler`.
impl<F> ToolHandler for F
where
    F: Fn(serde_json::Value) -> ToolResult + WasmCompatSend + WasmCompatSync,
{
    fn call(&self, args: serde_json::Value) -> ToolResult {
        self(args)
    }
}
1299
1300fn call_tool_handler(handler: &dyn ToolHandler, args: serde_json::Value) -> ToolResult {
1301    match std::panic::catch_unwind(std::panic::AssertUnwindSafe(|| handler.call(args))) {
1302        Ok(result) => result,
1303        Err(payload) => Err(ToolCallError::new(format!(
1304            "tool handler panicked: {}",
1305            panic_payload_message(payload.as_ref())
1306        ))),
1307    }
1308}
1309
/// Extracts a human-readable message from a caught panic payload.
///
/// Panics raised with a string literal carry `&'static str`; formatted panics
/// carry `String`. Any other payload type yields a fixed placeholder.
fn panic_payload_message(payload: &(dyn std::any::Any + Send)) -> String {
    payload
        .downcast_ref::<&'static str>()
        .map(|message| (*message).to_owned())
        .or_else(|| payload.downcast_ref::<String>().cloned())
        .unwrap_or_else(|| "non-string panic payload".to_owned())
}
1321
impl std::fmt::Debug for ToolDefinition {
    // Hand-written because the boxed handler closure cannot implement `Debug`;
    // `finish_non_exhaustive` signals the omitted field.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.debug_struct("ToolDefinition")
            .field("name", &self.name)
            .field("description", &self.description)
            .finish_non_exhaustive()
    }
}

/// Internal context that holds tool handlers. A raw pointer to this is passed to Swift
/// as `tool_ctx` and lives for the full `LanguageModelSession` lifetime via `Arc`.
#[cfg(aimx_bridge)]
struct ToolsContext {
    /// (name, handler) pairs, looked up linearly by name at dispatch time.
    tools: Vec<(ToolName, ToolHandlerBox)>,
}
1337
#[cfg(aimx_bridge)]
impl ToolsContext {
    /// Consumes tool definitions, keeping only the (name, handler) pairs
    /// needed at dispatch time.
    fn from_definitions(tools: Vec<ToolDefinition>) -> Arc<Self> {
        let mut pairs = Vec::with_capacity(tools.len());
        for tool in tools {
            pairs.push((tool.name, tool.handler));
        }
        Arc::new(Self { tools: pairs })
    }

    /// Dispatches a model-initiated call to the matching handler by name.
    fn call(&self, name: &str, args: serde_json::Value) -> ToolResult {
        for (tool_name, handler) in &self.tools {
            if tool_name.as_str() == name {
                // Panic-safe invocation shared with the `Tool` impl.
                return call_tool_handler(handler.as_ref(), args);
            }
        }
        Err(ToolCallError::new(format!("unknown tool: {name}")))
    }
}
1361
1362// ─── Availability ──────────────────────────────────────────────────────────────
1363
// Raw availability codes produced by `fm_availability_reason` and decoded in
// `availability`. Presumably mirrored on the Swift side of the bridge — keep
// in sync when changing either.
const FM_AVAILABLE: i32 = 0;
const FM_DEVICE_NOT_ELIGIBLE: i32 = 1;
const FM_NOT_ENABLED: i32 = 2;
const FM_MODEL_NOT_READY: i32 = 3;
1368
1369/// Returns `true` if Apple Intelligence is available and ready on this device.
1370///
1371/// This is a cheap synchronous check. See [`availability`] for the specific reason
1372/// when this returns `false`.
1373pub fn is_available() -> bool {
1374    availability().is_ok()
1375}
1376
/// Returns `Ok(())` if Apple Intelligence is ready.
///
/// # Errors
///
/// Returns [`AvailabilityError`] describing why the local model cannot be
/// used on the current machine.
pub fn availability() -> Result<(), AvailabilityError> {
    #[cfg(aimx_bridge)]
    {
        // SAFETY: `fm_availability_reason` takes no arguments and returns a
        // plain i32 status code; presumably it only reads system state —
        // confirm against the Swift bridge implementation.
        let code = unsafe { fm_availability_reason() };
        match code {
            FM_AVAILABLE => Ok(()),
            FM_DEVICE_NOT_ELIGIBLE => Err(AvailabilityError::DeviceNotEligible),
            FM_NOT_ENABLED => Err(AvailabilityError::NotEnabled),
            FM_MODEL_NOT_READY => Err(AvailabilityError::ModelNotReady),
            // Forward-compatible: codes added by newer bridges map to Unknown.
            _ => Err(AvailabilityError::Unknown),
        }
    }
    // Without the bridge (non-Apple builds) the model can never be used, so
    // report the device as not eligible.
    #[cfg(not(aimx_bridge))]
    Err(AvailabilityError::DeviceNotEligible)
}
1398
1399// ─── Apple/MLX-style model handle, builders, and trait boundary ──────────────
1400
/// Handle for Apple's default on-device system language model.
///
/// Zero-sized: all state lives in the bridge, so the handle is free to copy.
#[derive(Debug, Default, Clone, Copy)]
pub struct AppleIntelligenceModels {
    // Prevents construction and exhaustive matching outside this crate so the
    // type can grow fields later without breaking callers.
    _private: (),
}
1406
1407impl AppleIntelligenceModels {
1408    /// Creates a handle to the default system language model.
1409    pub fn new() -> Self {
1410        Self::default()
1411    }
1412
1413    /// Returns `Ok(())` when Apple Intelligence is ready for this model.
1414    ///
1415    /// This mirrors Swift's `SystemLanguageModel.default.availability` shape,
1416    /// but maps unavailable states into [`AvailabilityError`].
1417    ///
1418    /// # Errors
1419    ///
1420    /// Returns [`AvailabilityError`] describing why the local model cannot be
1421    /// used on the current machine.
1422    pub fn availability(&self) -> Result<(), AvailabilityError> {
1423        availability()
1424    }
1425
1426    /// Returns `true` when the default system language model is available.
1427    pub fn is_available(&self) -> bool {
1428        self.availability().is_ok()
1429    }
1430
1431    /// Starts building a stateful session.
1432    pub fn session(&self) -> LanguageModelSessionBuilder {
1433        LanguageModelSessionBuilder::new()
1434    }
1435
1436    /// Alias for [`AppleIntelligenceModels::session`] for users coming from Rig's agent builders.
1437    pub fn agent(&self) -> LanguageModelSessionBuilder {
1438        self.session()
1439    }
1440
1441    /// Sends a single prompt in a fresh session and returns plain response text.
1442    ///
1443    /// # Errors
1444    ///
1445    /// Returns [`Error::NullByte`] for prompt text that cannot cross the C FFI
1446    /// boundary, [`Error::Unavailable`] when Apple Intelligence is unavailable,
1447    /// or [`Error::Generation`] when the model or bridge fails.
1448    pub async fn respond<P>(&self, prompt: P) -> Result<String, Error>
1449    where
1450        P: TryInto<Prompt>,
1451        P::Error: Into<Error>,
1452    {
1453        Ok(self.generate_text(prompt).await?.into_string())
1454    }
1455
1456    /// MLX-style alias for [`AppleIntelligenceModels::generate_text`].
1457    ///
1458    /// # Errors
1459    ///
1460    /// Returns the same error variants as [`AppleIntelligenceModels::generate_text`].
1461    pub async fn generate<P>(&self, prompt: P) -> Result<GeneratedText, Error>
1462    where
1463        P: TryInto<Prompt>,
1464        P::Error: Into<Error>,
1465    {
1466        self.generate_text(prompt).await
1467    }
1468
1469    /// MLX-style alias for [`AppleIntelligenceModels::generate_text_with_options`].
1470    ///
1471    /// # Errors
1472    ///
1473    /// Returns the same error variants as [`AppleIntelligenceModels::generate_text_with_options`].
1474    pub async fn generate_with_options<P>(
1475        &self,
1476        prompt: P,
1477        options: &GenerationOptions,
1478    ) -> Result<GeneratedText, Error>
1479    where
1480        P: TryInto<Prompt>,
1481        P::Error: Into<Error>,
1482    {
1483        self.generate_text_with_options(prompt, options).await
1484    }
1485
1486    /// Sends a single prompt in a fresh session and returns typed response text.
1487    ///
1488    /// # Errors
1489    ///
1490    /// Returns the same error variants as [`AppleIntelligenceModels::respond`].
1491    pub async fn complete<P>(&self, prompt: P) -> Result<ResponseText, Error>
1492    where
1493        P: TryInto<Prompt>,
1494        P::Error: Into<Error>,
1495    {
1496        self.generate_text(prompt).await
1497    }
1498
1499    /// Generates typed response text in a fresh session.
1500    ///
1501    /// # Errors
1502    ///
1503    /// Returns the same error variants as [`AppleIntelligenceModels::respond`].
1504    pub async fn generate_text<P>(&self, prompt: P) -> Result<ResponseText, Error>
1505    where
1506        P: TryInto<Prompt>,
1507        P::Error: Into<Error>,
1508    {
1509        let options = GenerationOptions::default();
1510        self.generate_text_with_options(prompt, &options).await
1511    }
1512
1513    /// Generates typed response text in a fresh session with explicit options.
1514    ///
1515    /// # Errors
1516    ///
1517    /// Returns [`Error::NullByte`] for invalid prompt text,
1518    /// [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] for invalid
1519    /// options, [`Error::Unavailable`] when Apple Intelligence is unavailable,
1520    /// or [`Error::Generation`] when the model or bridge fails.
1521    pub async fn generate_text_with_options<P>(
1522        &self,
1523        prompt: P,
1524        options: &GenerationOptions,
1525    ) -> Result<ResponseText, Error>
1526    where
1527        P: TryInto<Prompt>,
1528        P::Error: Into<Error>,
1529    {
1530        LanguageModel::generate_text_with_options(self, prompt, options.clone()).await
1531    }
1532
1533    /// Streams response text from a fresh session.
1534    ///
1535    /// # Errors
1536    ///
1537    /// Returns the same error variants as [`AppleIntelligenceModels::generate_text`].
1538    pub fn stream_text<P>(&self, prompt: P) -> Result<ResponseStream, Error>
1539    where
1540        P: TryInto<Prompt>,
1541        P::Error: Into<Error>,
1542    {
1543        let options = GenerationOptions::default();
1544        self.stream_text_with_options(prompt, &options)
1545    }
1546
1547    /// Streams response text from a fresh session with explicit options.
1548    ///
1549    /// # Errors
1550    ///
1551    /// Returns the same error variants as [`AppleIntelligenceModels::generate_text_with_options`].
1552    pub fn stream_text_with_options<P>(
1553        &self,
1554        prompt: P,
1555        options: &GenerationOptions,
1556    ) -> Result<ResponseStream, Error>
1557    where
1558        P: TryInto<Prompt>,
1559        P::Error: Into<Error>,
1560    {
1561        LanguageModel::stream_text_with_options(self, prompt, options.clone())
1562    }
1563
1564    /// MLX-style alias for [`AppleIntelligenceModels::stream_text`].
1565    ///
1566    /// # Errors
1567    ///
1568    /// Returns the same error variants as [`AppleIntelligenceModels::stream_text`].
1569    pub fn stream_generate<P>(&self, prompt: P) -> Result<ResponseStream, Error>
1570    where
1571        P: TryInto<Prompt>,
1572        P::Error: Into<Error>,
1573    {
1574        self.stream_text(prompt)
1575    }
1576
1577    /// MLX-style alias for [`AppleIntelligenceModels::stream_text_with_options`].
1578    ///
1579    /// # Errors
1580    ///
1581    /// Returns the same error variants as [`AppleIntelligenceModels::stream_text_with_options`].
1582    pub fn stream_generate_with_options<P>(
1583        &self,
1584        prompt: P,
1585        options: &GenerationOptions,
1586    ) -> Result<ResponseStream, Error>
1587    where
1588        P: TryInto<Prompt>,
1589        P::Error: Into<Error>,
1590    {
1591        self.stream_text_with_options(prompt, options)
1592    }
1593}
1594
/// Compatibility alias for Apple's framework-facing system-language-model name.
pub type SystemLanguageModel = AppleIntelligenceModels;
/// Compatibility alias for the earlier provider handle name.
pub type FoundationModels = AppleIntelligenceModels;
/// Compatibility alias for the older provider handle name.
pub type Client = AppleIntelligenceModels;

impl LanguageModel for AppleIntelligenceModels {
    fn generate_text_with_options<P>(
        &self,
        prompt: P,
        options: GenerationOptions,
    ) -> impl Future<Output = Result<ResponseText, Error>> + '_
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        // Convert the prompt and set up the session builder eagerly — before
        // the returned future is first polled — so `P` never needs to live
        // inside the future. A conversion failure is captured as an `Err` and
        // surfaced only when the future is awaited.
        let prompt = prompt.try_into().map_err(Into::into);
        let builder = self.session().options(options.clone());

        async move {
            let prompt = prompt?;
            let session = builder.build()?;
            session.generate_prompt_with_options(prompt, &options).await
        }
    }

    fn stream_text_with_options<P>(
        &self,
        prompt: P,
        options: GenerationOptions,
    ) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        // Stream setup is fully synchronous: conversion, session creation, and
        // stream startup all fail here, before any item is produced.
        let prompt = prompt.try_into().map_err(Into::into)?;
        let session = self.session().options(options.clone()).build()?;
        session.stream_text_with_options(prompt, &options)
    }
}
1636
/// Provider-agnostic language-model boundary used by sessions and provider handles.
///
/// Both required methods take [`GenerationOptions`] by value; default-option
/// conveniences live on concrete types and on extension traits such as
/// [`GenerateText`].
pub trait LanguageModel {
    /// Generates response text for a prompt with explicit generation options.
    ///
    /// # Errors
    ///
    /// Implementations return [`Error`] when prompt conversion, option
    /// validation, session creation, or model generation fails.
    fn generate_text_with_options<P>(
        &self,
        prompt: P,
        options: GenerationOptions,
    ) -> impl Future<Output = Result<ResponseText, Error>> + '_
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>;

    /// Streams response text for a prompt with explicit generation options.
    ///
    /// # Errors
    ///
    /// Implementations return [`Error`] when prompt conversion, option
    /// validation, session creation, or stream startup fails.
    fn stream_text_with_options<P>(
        &self,
        prompt: P,
        options: GenerationOptions,
    ) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>;
}

/// Compatibility trait for older completion-oriented naming.
pub trait CompletionModel: LanguageModel {
    /// Generates response text for a prompt with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns [`Error`] when prompt conversion, option validation, session
    /// creation, or model generation fails.
    fn completion<P>(
        &self,
        prompt: P,
        options: GenerationOptions,
    ) -> impl Future<Output = Result<ResponseText, Error>> + '_
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        // Default body: forwards to the modern name.
        self.generate_text_with_options(prompt, options)
    }

    /// Streams response text for a prompt with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns [`Error`] when prompt conversion, option validation, session
    /// creation, or stream startup fails.
    fn stream_completion<P>(
        &self,
        prompt: P,
        options: GenerationOptions,
    ) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        // Default body: forwards to the modern name.
        self.stream_text_with_options(prompt, options)
    }
}

// Blanket impl: every language model gets the legacy completion vocabulary.
impl<T> CompletionModel for T where T: LanguageModel {}
1710
/// Convenience trait for sending prompts with default generation options.
pub trait GenerateText: LanguageModel {
    /// Sends a prompt with default generation options.
    ///
    /// # Errors
    ///
    /// Returns [`Error`] when prompt conversion or the underlying generation
    /// request fails.
    fn prompt<P>(&self, prompt: P) -> impl Future<Output = Result<ResponseText, Error>> + '_
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        // Convert eagerly so the returned future does not have to own `P`;
        // a conversion failure surfaces when the future is awaited.
        let prompt = prompt.try_into().map_err(Into::into);

        async move {
            let prompt = prompt?;
            self.generate_text_with_options(prompt, GenerationOptions::default())
                .await
        }
    }
}

// Blanket impl: any language model can be prompted with defaults.
impl<T> GenerateText for T where T: LanguageModel {}

/// Builder for [`LanguageModelSession`].
#[derive(Debug)]
pub struct LanguageModelSessionBuilder {
    /// Persistent system instructions; starts as empty text (see `new`).
    instructions: InstructionsText,
    /// Tool definitions handed to the session at build time.
    tools: Vec<ToolDefinition>,
    /// Defaults applied when a request does not carry explicit options.
    default_options: GenerationOptions,
}
1743
1744impl LanguageModelSessionBuilder {
1745    /// Creates an empty session builder.
1746    pub fn new() -> Self {
1747        Self {
1748            instructions: InstructionsText::new(""),
1749            tools: Vec::new(),
1750            default_options: GenerationOptions::default(),
1751        }
1752    }
1753
1754    /// Sets persistent system instructions for the session.
1755    pub fn instructions(mut self, instructions: impl Into<InstructionsText>) -> Self {
1756        self.instructions = instructions.into();
1757        self
1758    }
1759
1760    /// Alias for [`LanguageModelSessionBuilder::instructions`] using Rig terminology.
1761    pub fn preamble(self, instructions: impl Into<InstructionsText>) -> Self {
1762        self.instructions(instructions)
1763    }
1764
1765    /// Adds one callable tool.
1766    pub fn tool(mut self, tool: ToolDefinition) -> Self {
1767        self.tools.push(tool);
1768        self
1769    }
1770
1771    /// Adds multiple callable tools.
1772    pub fn tools(mut self, tools: impl IntoIterator<Item = ToolDefinition>) -> Self {
1773        self.tools.extend(tools);
1774        self
1775    }
1776
1777    /// Sets the typed default temperature used by [`LanguageModelSession::respond_to`] and [`LanguageModelSession::stream_response`].
1778    pub fn temperature(mut self, temperature: Temperature) -> Self {
1779        self.default_options = self.default_options.temperature(temperature);
1780        self
1781    }
1782
1783    /// Alias for [`LanguageModelSessionBuilder::temperature`].
1784    pub fn with_temperature(mut self, temperature: Temperature) -> Self {
1785        self = self.temperature(temperature);
1786        self
1787    }
1788
1789    /// Parses and sets the default temperature from a raw boundary value.
1790    ///
1791    /// # Errors
1792    ///
1793    /// Returns [`Error::InvalidTemperature`] when `temperature` is outside
1794    /// Apple Intelligence's supported range.
1795    pub fn try_temperature(mut self, temperature: f64) -> Result<Self, Error> {
1796        self.default_options = self.default_options.try_temperature(temperature)?;
1797        Ok(self)
1798    }
1799
1800    /// Sets the default maximum response tokens.
1801    pub fn max_tokens(mut self, max_tokens: MaxTokens) -> Self {
1802        self.default_options = self.default_options.max_tokens(max_tokens);
1803        self
1804    }
1805
1806    /// Alias for [`LanguageModelSessionBuilder::max_tokens`].
1807    pub fn with_max_tokens(mut self, max_tokens: MaxTokens) -> Self {
1808        self = self.max_tokens(max_tokens);
1809        self
1810    }
1811
1812    /// Parses and sets the default maximum response token count from a raw boundary value.
1813    ///
1814    /// # Errors
1815    ///
1816    /// Returns [`Error::InvalidMaxTokens`] when `max_tokens` cannot be represented
1817    /// by the Swift bridge.
1818    pub fn try_max_tokens(mut self, max_tokens: usize) -> Result<Self, Error> {
1819        self.default_options = self.default_options.try_max_tokens(max_tokens)?;
1820        Ok(self)
1821    }
1822
1823    /// Replaces all default generation options.
1824    pub fn options(mut self, options: GenerationOptions) -> Self {
1825        self.default_options = options;
1826        self
1827    }
1828
1829    /// Builds a stateful model session.
1830    ///
1831    /// # Examples
1832    ///
1833    /// ```no_run
1834    /// # fn example() -> Result<(), aimx::Error> {
1835    /// use aimx::{AppleIntelligenceModels, Temperature};
1836    ///
1837    /// let session = AppleIntelligenceModels::default()
1838    ///     .session()
1839    ///     .instructions("Answer in short paragraphs.")
1840    ///     .temperature(Temperature::new(0.2)?)
1841    ///     .build()?;
1842    /// # let _ = session;
1843    /// # Ok(()) }
1844    /// ```
1845    ///
1846    /// # Errors
1847    ///
1848    /// Returns [`Error::NullByte`] for invalid instructions,
1849    /// [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] for invalid
1850    /// defaults, [`Error::Json`] if tool metadata cannot be serialized, or
1851    /// [`Error::Unavailable`] when Apple Intelligence is not ready.
1852    pub fn build(self) -> Result<LanguageModelSession, Error> {
1853        let instructions = SystemInstructions::try_from(self.instructions)?;
1854        LanguageModelSession::create(instructions, self.tools, self.default_options)
1855    }
1856}
1857
1858impl Default for LanguageModelSessionBuilder {
1859    fn default() -> Self {
1860        Self::new()
1861    }
1862}
1863
/// Compatibility alias for the older session-builder name.
///
/// Prefer [`LanguageModelSessionBuilder`] in new code.
pub type SessionBuilder = LanguageModelSessionBuilder;
1866
1867// ─── Convenience top-level functions ──────────────────────────────────────────
1868
1869/// Sends a single prompt to the model and returns the response text.
1870///
1871/// Each call creates a fresh session with no prior context. For multi-turn
1872/// conversations use [`LanguageModelSession`] directly.
1873///
1874/// # Errors
1875///
1876/// Returns [`Error::NullByte`] for prompt text that cannot cross the C FFI
1877/// boundary, [`Error::Unavailable`] when Apple Intelligence is unavailable, or
1878/// [`Error::Generation`] when the model or bridge fails.
1879pub async fn respond<P>(prompt: P) -> Result<String, Error>
1880where
1881    P: TryInto<Prompt>,
1882    P::Error: Into<Error>,
1883{
1884    AppleIntelligenceModels::default().respond(prompt).await
1885}
1886
1887/// Like [`respond`] but allows tuning generation via [`GenerationOptions`].
1888///
1889/// # Errors
1890///
1891/// Returns every error documented by [`respond`]. It can also return
1892/// [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when `options`
1893/// contains out-of-range values.
1894pub async fn respond_with_options<P>(
1895    prompt: P,
1896    options: &GenerationOptions,
1897) -> Result<String, Error>
1898where
1899    P: TryInto<Prompt>,
1900    P::Error: Into<Error>,
1901{
1902    Ok(AppleIntelligenceModels::default()
1903        .generate_with_options(prompt, options)
1904        .await?
1905        .into_string())
1906}
1907
1908/// MLX-style top-level text generation helper.
1909///
1910/// Each call creates a fresh session with no prior context. For multi-turn
1911/// conversations use [`LanguageModelSession`] directly.
1912///
1913/// # Errors
1914///
1915/// Returns every error documented by [`respond`].
1916pub async fn generate<P>(prompt: P) -> Result<String, Error>
1917where
1918    P: TryInto<Prompt>,
1919    P::Error: Into<Error>,
1920{
1921    respond(prompt).await
1922}
1923
1924/// MLX-style top-level generation helper with explicit generation options.
1925///
1926/// # Errors
1927///
1928/// Returns every error documented by [`respond_with_options`].
1929pub async fn generate_with_options<P>(
1930    prompt: P,
1931    options: &GenerationOptions,
1932) -> Result<String, Error>
1933where
1934    P: TryInto<Prompt>,
1935    P::Error: Into<Error>,
1936{
1937    respond_with_options(prompt, options).await
1938}
1939
1940/// MLX-style top-level streaming helper.
1941///
1942/// # Errors
1943///
1944/// Returns [`Error::NullByte`] for invalid prompt text,
1945/// [`Error::Unavailable`] when Apple Intelligence is unavailable, or
1946/// [`Error::Generation`] if stream startup fails.
1947pub fn stream_generate<P>(prompt: P) -> Result<ResponseStream, Error>
1948where
1949    P: TryInto<Prompt>,
1950    P::Error: Into<Error>,
1951{
1952    AppleIntelligenceModels::default().stream_generate(prompt)
1953}
1954
1955/// MLX-style top-level streaming helper with explicit generation options.
1956///
1957/// # Errors
1958///
1959/// Returns every error documented by [`stream_generate`]. It can also return
1960/// [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when `options`
1961/// contains out-of-range values.
1962pub fn stream_generate_with_options<P>(
1963    prompt: P,
1964    options: &GenerationOptions,
1965) -> Result<ResponseStream, Error>
1966where
1967    P: TryInto<Prompt>,
1968    P::Error: Into<Error>,
1969{
1970    AppleIntelligenceModels::default().stream_generate_with_options(prompt, options)
1971}
1972
1973// ─── LanguageModelSession ───────────────────────────────────────────────────────────────────
1974
/// Owned opaque pointer to Swift's ARC-retained session holder.
///
/// Produced by the bridge's session-create calls and released in `Drop`
/// via `fm_session_destroy`.
#[cfg(aimx_bridge)]
#[derive(Debug)]
struct SessionHandle(NonNull<c_void>);
1979
#[cfg(aimx_bridge)]
impl SessionHandle {
    /// Wraps a raw bridge pointer, rejecting null handles.
    fn from_raw(handle: *mut c_void) -> Result<Self, Error> {
        match NonNull::new(handle) {
            Some(ptr) => Ok(Self(ptr)),
            None => Err(Error::Unavailable(AvailabilityError::Unknown)),
        }
    }

    /// Returns the raw pointer for FFI calls.
    fn as_ptr(&self) -> *mut c_void {
        self.0.as_ptr()
    }
}
1992
#[cfg(aimx_bridge)]
impl Drop for SessionHandle {
    fn drop(&mut self) {
        // Release the Swift-side session when the last Rust owner goes away.
        unsafe {
            // SAFETY: `self.0` is the non-null pointer obtained from the bridge's
            // session-create call, and `Drop` runs at most once per handle.
            fm_session_destroy(self.as_ptr());
        }
    }
}
2001
// SAFETY: assumed sound because the session type's docs state the Swift session
// handles concurrent calls via its internal async actor; the handle itself is an
// opaque pointer the Rust side never dereferences — TODO(review): confirm the
// Swift holder imposes no thread affinity.
#[cfg(aimx_bridge)]
unsafe impl Send for SessionHandle {}

// SAFETY: same reasoning as the `Send` impl above; shared references only expose
// the raw pointer value, and all mutation happens on the Swift side.
#[cfg(aimx_bridge)]
unsafe impl Sync for SessionHandle {}
2007
/// A stateful conversation session backed by a `LanguageModelSession`.
///
/// The session automatically maintains a conversation transcript, so each
/// successive call to [`respond_to`][LanguageModelSession::respond_to] has access to the full
/// prior context (subject to the 4 096-token context window limit).
///
/// # Thread safety
///
/// `LanguageModelSession` is `Send + Sync`. Concurrent calls are forwarded to the underlying
/// Swift session, which handles them via its internal async actor. Note however
/// that concurrent calls will interleave entries in the transcript in an
/// unspecified order; for predictable multi-turn behaviour call sequentially.
///
/// # Drop behaviour
///
/// Dropping a `LanguageModelSession` releases the caller's session reference.
/// In-flight generation futures and active [`ResponseStream`]s hold their own
/// cloned handle reference until Swift invokes the completion callback, so
/// cancellation cannot release the Swift session while the bridge still needs it.
pub struct LanguageModelSession {
    /// Options applied when a call does not supply its own [`GenerationOptions`].
    default_options: GenerationOptions,
    /// Shared ownership of the Swift session; clones keep it alive across callbacks.
    #[cfg(aimx_bridge)]
    handle: Arc<SessionHandle>,
    /// Keeps the tool handlers alive for the full session lifetime.
    /// A raw pointer to the Arc payload is passed to Swift as `tool_ctx`.
    #[cfg(aimx_bridge)]
    _tools: Option<Arc<ToolsContext>>,
}
2036
2037impl std::fmt::Debug for LanguageModelSession {
2038    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
2039        f.debug_struct("LanguageModelSession")
2040            .field("default_options", &self.default_options)
2041            .finish_non_exhaustive()
2042    }
2043}
2044
impl LanguageModelSession {
    /// Starts building a session.
    pub fn builder() -> LanguageModelSessionBuilder {
        LanguageModelSessionBuilder::new()
    }

    /// Creates a new session with no system instructions.
    ///
    /// # Errors
    ///
    /// Returns [`Error::Unavailable`] when Apple Intelligence is unavailable.
    pub fn new() -> Result<Self, Error> {
        Self::builder().build()
    }

    /// Creates a new session with the given system instructions.
    ///
    /// SystemInstructions act as a persistent system prompt that guides all subsequent
    /// responses in this session. They must come from developer code, never from
    /// user input, to prevent prompt-injection attacks.
    ///
    /// # Errors
    ///
    /// Returns [`Error::NullByte`] if the instructions cannot cross the C FFI
    /// boundary, or [`Error::Unavailable`] when Apple Intelligence is
    /// unavailable.
    pub fn with_instructions<I>(instructions: I) -> Result<Self, Error>
    where
        I: TryInto<SystemInstructions>,
        I::Error: Into<Error>,
    {
        let instructions = instructions.try_into().map_err(Into::into)?;
        Self::create(instructions, Vec::new(), GenerationOptions::default())
    }

    /// Creates a session pre-loaded with the given tools.
    ///
    /// The model will use these tools automatically when appropriate during `respond` calls.
    /// Tool names must be unique within the session.
    ///
    /// # Errors
    ///
    /// Returns [`Error::NullByte`] if the instructions or serialized tool
    /// metadata cannot cross the C FFI boundary, [`Error::Json`] if tool
    /// metadata serialization fails, or [`Error::Unavailable`] when Apple
    /// Intelligence is unavailable.
    pub fn with_tools<I>(instructions: I, tools: Vec<ToolDefinition>) -> Result<Self, Error>
    where
        I: TryInto<SystemInstructions>,
        I::Error: Into<Error>,
    {
        let instructions = instructions.try_into().map_err(Into::into)?;
        Self::create(instructions, tools, GenerationOptions::default())
    }

    /// Shared constructor: validates defaults and availability, then picks the
    /// bridge or stub path depending on the `aimx_bridge` cfg.
    fn create(
        instructions: SystemInstructions,
        tools: Vec<ToolDefinition>,
        default_options: GenerationOptions,
    ) -> Result<Self, Error> {
        // Fail fast on bad defaults and platform unavailability before touching FFI.
        default_options.validate()?;
        availability().map_err(Error::Unavailable)?;

        #[cfg(aimx_bridge)]
        {
            Self::create_bridge_session(instructions, tools, default_options)
        }
        #[cfg(not(aimx_bridge))]
        {
            let _ = (instructions, tools, default_options);
            Err(Error::Unavailable(AvailabilityError::DeviceNotEligible))
        }
    }

    /// Routes to the plain or tool-enabled bridge constructor.
    #[cfg(aimx_bridge)]
    fn create_bridge_session(
        instructions: SystemInstructions,
        tools: Vec<ToolDefinition>,
        default_options: GenerationOptions,
    ) -> Result<Self, Error> {
        if tools.is_empty() {
            return Self::create_plain_bridge_session(instructions, default_options);
        }

        Self::create_tool_bridge_session(instructions, tools, default_options)
    }

    /// Creates a Swift session without tool support.
    #[cfg(aimx_bridge)]
    fn create_plain_bridge_session(
        instructions: SystemInstructions,
        default_options: GenerationOptions,
    ) -> Result<Self, Error> {
        // SAFETY: `instructions` owns a valid NUL-terminated string for the
        // duration of the call; a null return is rejected by `from_raw` below.
        let handle = unsafe { fm_session_create(instructions.as_ptr()) };

        Ok(Self {
            default_options,
            handle: Arc::new(SessionHandle::from_raw(handle)?),
            _tools: None,
        })
    }

    /// Creates a Swift session with registered tool callbacks.
    #[cfg(aimx_bridge)]
    fn create_tool_bridge_session(
        instructions: SystemInstructions,
        tools: Vec<ToolDefinition>,
        default_options: GenerationOptions,
    ) -> Result<Self, Error> {
        // Serialize tool metadata to JSON so Swift can register matching tools.
        let tool_descriptions = tools
            .iter()
            .map(ToolDefinition::bridge_description)
            .collect::<Vec<_>>();
        let c_tools_json = CString::new(serde_json::to_vec(&tool_descriptions)?)?;
        let tools_ctx = ToolsContext::from_definitions(tools);
        // NOTE: `Arc::as_ptr` does not bump the refcount — the `_tools` field
        // stored below is what keeps the payload alive while Swift may call back.
        let tool_ctx_ptr = Arc::as_ptr(&tools_ctx) as *mut c_void;

        // SAFETY: all pointers are valid for the duration of the call; `tool_ctx_ptr`
        // must outlive the Swift session, which `_tools` guarantees for this struct's
        // lifetime — relies on the bridge not using it after session destruction.
        let handle = unsafe {
            fm_session_create_with_tools(
                instructions.as_ptr(),
                c_tools_json.as_ptr(),
                tool_ctx_ptr,
                tool_dispatch,
            )
        };

        Ok(Self {
            default_options,
            handle: Arc::new(SessionHandle::from_raw(handle)?),
            _tools: Some(tools_ctx),
        })
    }

    /// Sends a prompt and returns the full response text.
    ///
    /// The response is appended to this session's transcript, so subsequent
    /// calls have access to prior context.
    ///
    /// # Errors
    ///
    /// Returns [`Error::NullByte`] for invalid prompt text, or
    /// [`Error::Generation`] when the model or bridge fails.
    pub async fn respond<P>(&self, prompt: P) -> Result<String, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        Ok(self.respond_to(prompt).await?.into_string())
    }

    /// Apple-style typed response method matching Swift's `respond(to:)`.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond`].
    pub async fn respond_to<P>(&self, prompt: P) -> Result<ResponseText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_to_with_options(prompt, &self.default_options)
            .await
    }

    /// Sends a prompt and returns typed response text.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_to`].
    pub async fn complete<P>(&self, prompt: P) -> Result<ResponseText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_to(prompt).await
    }

    /// MLX-style typed response alias.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_to`].
    pub async fn generate<P>(&self, prompt: P) -> Result<GeneratedText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_to(prompt).await
    }

    /// Generates typed response text and appends the exchange to this session's transcript.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_to`].
    pub async fn generate_text<P>(&self, prompt: P) -> Result<ResponseText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_to(prompt).await
    }

    /// Like [`respond`][LanguageModelSession::respond] but allows tuning generation.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::respond`]. It can also
    /// return [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when
    /// `options` contains out-of-range values.
    pub async fn respond_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<String, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        Ok(self
            .respond_to_with_options(prompt, options)
            .await?
            .into_string())
    }

    /// Apple-style typed response method with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::respond`]. It can also
    /// return [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when
    /// `options` contains out-of-range values.
    pub async fn respond_to_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<ResponseText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        let prompt = prompt.try_into().map_err(Into::into)?;
        self.generate_prompt_with_options(prompt, options).await
    }

    /// Like [`complete`][LanguageModelSession::complete] but allows tuning generation.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_with_options`].
    pub async fn complete_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<ResponseText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_to_with_options(prompt, options).await
    }

    /// MLX-style typed response alias with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_to_with_options`].
    pub async fn generate_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<GeneratedText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_to_with_options(prompt, options).await
    }

    /// Generates typed response text with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_with_options`].
    pub async fn generate_text_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<ResponseText, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_to_with_options(prompt, options).await
    }

    /// Core single-response path: validates options, then dispatches the prompt
    /// over the bridge and awaits the one-shot completion callback.
    async fn generate_prompt_with_options(
        &self,
        prompt: Prompt,
        options: &GenerationOptions,
    ) -> Result<ResponseText, Error> {
        let config = options.validated()?;
        #[cfg(aimx_bridge)]
        {
            let handle = Arc::clone(&self.handle);
            let (tx, rx) = oneshot::channel::<ModelTextResult>();
            // Ownership of `ctx` is handed to Swift; the completion callback is
            // expected to reclaim the box. The cloned `_handle` keeps the Swift
            // session alive until that callback fires (see the Drop notes above).
            let ctx = Box::into_raw(Box::new(ResponseContext {
                tx,
                _handle: handle,
            })) as *mut c_void;

            // SAFETY: `handle`, `prompt`, and `ctx` are valid non-null pointers for
            // the call; relies on the bridge contract that `respond_callback` is
            // invoked exactly once with `ctx`.
            unsafe {
                fm_session_respond(
                    self.handle.as_ptr(),
                    prompt.as_ptr(),
                    config.ffi_temperature(),
                    config.ffi_max_tokens(),
                    ctx,
                    respond_callback,
                );
            }

            receive_response(rx).await
        }
        #[cfg(not(aimx_bridge))]
        {
            let _ = (prompt, config);
            Err(Error::Unavailable(AvailabilityError::DeviceNotEligible))
        }
    }

    /// Sends a prompt and deserialises the response into `T` using the provided schema.
    ///
    /// The model generates output conforming to `schema` and this method deserialises it.
    /// Derive [`serde::Deserialize`] on `T` and ensure the field names match the schema
    /// property names exactly.
    ///
    /// # Errors
    ///
    /// Returns [`Error::NullByte`] for invalid prompt text, [`Error::Json`] if
    /// the schema or model response cannot be serialized or deserialized, or
    /// [`Error::Generation`] when the model or bridge fails.
    pub async fn respond_as<T, P>(&self, prompt: P, schema: &GenerationSchema) -> Result<T, Error>
    where
        T: serde::de::DeserializeOwned,
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_generating(prompt, schema).await
    }

    /// Apple-style guided-generation method for a dynamic [`GenerationSchema`].
    ///
    /// This mirrors Swift's `respond(to:generating:)` terminology while
    /// deserializing the generated JSON into `T`.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::respond_as`].
    pub async fn respond_generating<T, P>(
        &self,
        prompt: P,
        schema: &GenerationSchema,
    ) -> Result<T, Error>
    where
        T: serde::de::DeserializeOwned,
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_generating_with_options(prompt, schema, &self.default_options)
            .await
    }

    /// Generates structured output and deserialises it into `T`.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_as`].
    pub async fn generate_object<T, P>(
        &self,
        prompt: P,
        schema: &GenerationSchema,
    ) -> Result<T, Error>
    where
        T: serde::de::DeserializeOwned,
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_generating(prompt, schema).await
    }

    /// Like [`respond_as`][LanguageModelSession::respond_as] but allows tuning generation.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::respond_as`]. It can also
    /// return [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when
    /// `options` contains out-of-range values.
    pub async fn respond_as_with_options<T, P>(
        &self,
        prompt: P,
        schema: &GenerationSchema,
        options: &GenerationOptions,
    ) -> Result<T, Error>
    where
        T: serde::de::DeserializeOwned,
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_generating_with_options(prompt, schema, options)
            .await
    }

    /// Apple-style guided-generation method with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::respond_as_with_options`].
    pub async fn respond_generating_with_options<T, P>(
        &self,
        prompt: P,
        schema: &GenerationSchema,
        options: &GenerationOptions,
    ) -> Result<T, Error>
    where
        T: serde::de::DeserializeOwned,
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        let prompt = prompt.try_into().map_err(Into::into)?;
        let config = options.validated()?;

        self.respond_generating_prompt_with_config(prompt, schema, config)
            .await
    }

    /// Generates structured output with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::respond_as_with_options`].
    pub async fn generate_object_with_options<T, P>(
        &self,
        prompt: P,
        schema: &GenerationSchema,
        options: &GenerationOptions,
    ) -> Result<T, Error>
    where
        T: serde::de::DeserializeOwned,
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.respond_generating_with_options(prompt, schema, options)
            .await
    }

    /// Core guided-generation path: serializes the schema, dispatches over the
    /// bridge, and deserialises the returned JSON into `T`.
    async fn respond_generating_prompt_with_config<T>(
        &self,
        prompt: Prompt,
        schema: &GenerationSchema,
        config: GenerationConfig,
    ) -> Result<T, Error>
    where
        T: serde::de::DeserializeOwned,
    {
        #[cfg(aimx_bridge)]
        {
            let handle = Arc::clone(&self.handle);
            let (tx, rx) = oneshot::channel::<ModelTextResult>();
            // Same ownership hand-off as the plain-response path: Swift's callback
            // reclaims `ctx`, and the cloned `_handle` keeps the session alive.
            let ctx = Box::into_raw(Box::new(ResponseContext {
                tx,
                _handle: handle,
            })) as *mut c_void;
            let c_schema_json = CString::new(serde_json::to_vec(schema)?)?;

            // SAFETY: all pointers are valid for the call; relies on the bridge
            // contract that `respond_callback` is invoked exactly once with `ctx`.
            unsafe {
                fm_session_respond_structured(
                    self.handle.as_ptr(),
                    prompt.as_ptr(),
                    c_schema_json.as_ptr(),
                    config.ffi_temperature(),
                    config.ffi_max_tokens(),
                    ctx,
                    respond_callback,
                );
            }

            let json = receive_response(rx).await?.into_string();
            serde_json::from_str(&json).map_err(Error::from)
        }
        #[cfg(not(aimx_bridge))]
        {
            let _ = (prompt, schema, config);
            Err(Error::Unavailable(AvailabilityError::DeviceNotEligible))
        }
    }

    /// Returns a [`ResponseStream`] that yields text chunks as the model generates them.
    ///
    /// Each yielded chunk is an incremental snapshot of the response text. Drive the
    /// stream with your preferred async executor.
    ///
    /// ```no_run
    /// # async fn example() -> Result<(), aimx::Error> {
    /// use aimx::LanguageModelSession;
    ///
    /// let session = LanguageModelSession::new()?;
    /// let stream = session.stream_response("Count to ten.")?;
    /// # Ok(()) }
    /// ```
    ///
    /// # Errors
    ///
    /// Returns [`Error::NullByte`] for invalid prompt text, or
    /// [`Error::Generation`] if stream startup fails. Individual stream items
    /// can also yield [`Error::Generation`] after the stream has been created.
    pub fn stream<P>(&self, prompt: P) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.stream_response(prompt)
    }

    /// Apple-style streaming method matching Swift's `streamResponse(to:)`.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::stream`].
    pub fn stream_response<P>(&self, prompt: P) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.stream_response_with_options(prompt, &self.default_options)
    }

    /// MLX-style streaming alias matching `stream_generate`.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::stream_response`].
    pub fn stream_generate<P>(&self, prompt: P) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.stream_response(prompt)
    }

    /// Streams response text with this session's default generation options.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::stream_response`].
    pub fn stream_text<P>(&self, prompt: P) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.stream_response(prompt)
    }

    /// Like [`stream`][LanguageModelSession::stream] but allows tuning generation.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::stream`]. It can also return
    /// [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when
    /// `options` contains out-of-range values.
    pub fn stream_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.stream_response_with_options(prompt, options)
    }

    /// Apple-style streaming method with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::stream`]. It can also return
    /// [`Error::InvalidTemperature`] or [`Error::InvalidMaxTokens`] when
    /// `options` contains out-of-range values.
    pub fn stream_response_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        let prompt = prompt.try_into().map_err(Into::into)?;
        let config = options.validated()?;

        self.stream_prompt_with_config(prompt, config)
    }

    /// MLX-style streaming alias with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns every error documented by [`LanguageModelSession::stream_response_with_options`].
    pub fn stream_generate_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.stream_response_with_options(prompt, options)
    }

    /// Streams response text with explicit generation options.
    ///
    /// # Errors
    ///
    /// Returns the same error variants as [`LanguageModelSession::stream_with_options`].
    pub fn stream_text_with_options<P>(
        &self,
        prompt: P,
        options: &GenerationOptions,
    ) -> Result<ResponseStream, Error>
    where
        P: TryInto<Prompt>,
        P::Error: Into<Error>,
    {
        self.stream_response_with_options(prompt, options)
    }

    /// Core streaming path: dispatches the prompt over the bridge and returns a
    /// stream fed by per-token callbacks until the done callback closes it.
    fn stream_prompt_with_config(
        &self,
        prompt: Prompt,
        config: GenerationConfig,
    ) -> Result<ResponseStream, Error> {
        #[cfg(aimx_bridge)]
        {
            let handle = Arc::clone(&self.handle);
            let (tx, rx) = mpsc::unbounded::<ModelTextResult>();
            // `ctx` ownership passes to Swift; the done callback is expected to
            // reclaim it. The cloned `_handle` keeps the session alive meanwhile.
            let ctx = Box::into_raw(Box::new(StreamContext {
                tx,
                _handle: handle,
            })) as *mut c_void;

            // SAFETY: all pointers are valid for the call; relies on the bridge
            // contract that the token/done callbacks receive this `ctx` and that
            // the done callback fires exactly once.
            unsafe {
                fm_session_stream(
                    self.handle.as_ptr(),
                    prompt.as_ptr(),
                    config.ffi_temperature(),
                    config.ffi_max_tokens(),
                    ctx,
                    stream_token_callback,
                    stream_done_callback,
                );
            }

            Ok(ResponseStream { rx })
        }
        #[cfg(not(aimx_bridge))]
        {
            let _ = (prompt, config);
            Err(Error::Unavailable(AvailabilityError::DeviceNotEligible))
        }
    }
}
2716
/// Compatibility alias for the older session type name.
///
/// Prefer [`LanguageModelSession`] in new code.
pub type Session = LanguageModelSession;
2719
2720impl LanguageModel for LanguageModelSession {
2721    fn generate_text_with_options<P>(
2722        &self,
2723        prompt: P,
2724        options: GenerationOptions,
2725    ) -> impl Future<Output = Result<ResponseText, Error>> + '_
2726    where
2727        P: TryInto<Prompt>,
2728        P::Error: Into<Error>,
2729    {
2730        let prompt = prompt.try_into().map_err(Into::into);
2731
2732        async move {
2733            let prompt = prompt?;
2734            self.generate_prompt_with_options(prompt, &options).await
2735        }
2736    }
2737
2738    fn stream_text_with_options<P>(
2739        &self,
2740        prompt: P,
2741        options: GenerationOptions,
2742    ) -> Result<ResponseStream, Error>
2743    where
2744        P: TryInto<Prompt>,
2745        P::Error: Into<Error>,
2746    {
2747        LanguageModelSession::stream_text_with_options(self, prompt, &options)
2748    }
2749}
2750
2751// ─── ResponseStream ────────────────────────────────────────────────────────────
2752
/// An async stream of text chunks produced by [`LanguageModelSession::stream`].
///
/// Each item is `Ok(ResponseText)` for a new chunk, or `Err(Error)` if generation failed.
/// The stream ends when the model finishes generating.
///
/// Implements [`futures_core::Stream`]; use with `.next()` from `StreamExt` or
/// any executor that can drive `Stream`.
pub struct ResponseStream {
    // Receiving half of the channel fed by the FFI stream callbacks; the
    // stream ends when the sending `StreamContext` is dropped.
    rx: StreamReceiver,
}
2763
2764impl Stream for ResponseStream {
2765    type Item = Result<ResponseText, Error>;
2766
2767    fn poll_next(mut self: Pin<&mut Self>, cx: &mut StdContext<'_>) -> Poll<Option<Self::Item>> {
2768        Pin::new(&mut self.rx)
2769            .poll_next(cx)
2770            .map(|opt| opt.map(|r| r.map_err(Error::from)))
2771    }
2772}
2773
/// Awaits the single-shot response channel, translating both channel
/// cancellation and generation failures into [`Error`].
#[cfg(aimx_bridge)]
async fn receive_response(receiver: ResponseReceiver) -> Result<ResponseText, Error> {
    match receiver.await {
        // The callback fired: propagate its success or failure.
        Ok(outcome) => outcome.map_err(Error::from),
        // The sender was dropped without ever sending a value.
        Err(_) => Err(GenerationError::new("session was dropped before responding").into()),
    }
}
2781
2782// ─── FFI callbacks ─────────────────────────────────────────────────────────────
2783
/// Single-shot response context owned by Swift until `respond_callback`.
#[cfg(aimx_bridge)]
struct ResponseContext {
    // Oneshot sender fulfilled at most once by `respond_callback`.
    tx: ResponseSender,
    // Keeps the session handle alive while Swift holds the raw context pointer.
    _handle: Arc<SessionHandle>,
}
2790
/// Callback for text and structured generation. Called exactly once by Swift.
///
/// Exactly one of `result` / `error` is expected to be non-null; if both are
/// null an explicit error is sent so the awaiting side does not misreport the
/// failure as a dropped session.
#[cfg(aimx_bridge)]
extern "C" fn respond_callback(ctx: *mut c_void, result: *const c_char, error: *const c_char) {
    // Safety: ctx is always a Box<ResponseContext> allocated by a single-shot
    // generation call and consumed by this exactly-once callback.
    let context = unsafe { Box::from_raw(ctx as *mut ResponseContext) };

    if let Some(msg) = callback_owned_text(error) {
        context.tx.send(Err(GenerationError::from(msg))).ok();
    } else if let Some(text) = callback_owned_text(result) {
        context.tx.send(Ok(ResponseText::from(text))).ok();
    } else {
        // Defensive: previously a both-null invocation dropped the sender
        // silently, and `receive_response` then reported the misleading
        // "session was dropped before responding". Surface the real problem.
        context
            .tx
            .send(Err(GenerationError::new(
                "bridge returned neither a result nor an error",
            )))
            .ok();
    }
}
2804
/// Copies an optional C string from a bridge callback into an owned `String`.
///
/// Returns `None` for a null pointer. Invalid UTF-8 is replaced lossily rather
/// than rejected, since callback text is informational.
#[cfg(aimx_bridge)]
fn callback_owned_text(ptr: *const c_char) -> Option<String> {
    if ptr.is_null() {
        return None;
    }

    // Safety: non-null pointers passed to the bridge callbacks are valid,
    // NUL-terminated C strings for the duration of the call.
    let text = unsafe { CStr::from_ptr(ptr) };
    Some(text.to_string_lossy().into_owned())
}
2813
/// Internal state for a streaming request; owned by Swift via raw pointer until stream_done_callback.
#[cfg(aimx_bridge)]
struct StreamContext {
    // Sending half read by `ResponseStream`; dropping it ends the stream.
    tx: StreamSender,
    // Keeps the session handle alive while Swift may still invoke callbacks.
    _handle: Arc<SessionHandle>,
}
2820
/// Token callback for streaming. May be called many times before stream_done_callback.
/// Borrows — never takes ownership of — the `StreamContext` behind `ctx`.
#[cfg(aimx_bridge)]
extern "C" fn stream_token_callback(ctx: *mut c_void, token: *const c_char) {
    // Safety: ctx is a Box<StreamContext> allocated in stream_with_options; it remains
    // valid until stream_done_callback drops it.
    let stream_ctx = unsafe { &*(ctx as *const StreamContext) };
    // A null token pointer carries no text; skip it without ending the stream.
    let Some(text) = callback_owned_text(token) else {
        return;
    };
    // Failure here means the Rust ResponseStream was dropped; ignore silently.
    stream_ctx
        .tx
        .unbounded_send(Ok(ResponseText::from(text)))
        .ok();
}
2836
/// Done callback for streaming. Called exactly once; takes ownership of StreamContext.
#[cfg(aimx_bridge)]
extern "C" fn stream_done_callback(ctx: *mut c_void, error: *const c_char) {
    // Safety: takes ownership of the Box<StreamContext> that was created in stream_with_options.
    let stream_ctx = unsafe { Box::from_raw(ctx as *mut StreamContext) };
    // A non-null error becomes the stream's final item. A failed send means
    // the Rust receiver was already dropped, which is fine to ignore.
    if let Some(msg) = callback_owned_text(error) {
        stream_ctx
            .tx
            .unbounded_send(Err(GenerationError::from(msg)))
            .ok();
    }
    // stream_ctx drops here, closing the channel and ending the ResponseStream.
}
2850
/// Dispatches a tool call from Swift to the appropriate Rust handler in `ToolsContext`.
/// Calls `result_cb(result_ctx, result, null)` or `result_cb(result_ctx, null, error)`.
#[cfg(aimx_bridge)]
extern "C" fn tool_dispatch(
    ctx: *mut c_void,
    name_ptr: *const c_char,
    args_ptr: *const c_char,
    result_ctx: *mut c_void,
    result_cb: ToolResultCallback,
) {
    // Split into a pure dispatch step and a reply step so every outcome —
    // including pointer-validation failures — is reported through result_cb.
    let result = dispatch_tool_call(ctx, name_ptr, args_ptr);
    send_tool_result(result_ctx, result_cb, result);
}
2864
/// Validates the raw tool-call pointers and runs the named Rust tool handler.
///
/// The closure given to `with_callback_text` itself returns a `ToolResult`,
/// so the trailing `?` unwraps the outer "callback text was present" layer and
/// the inner handler result becomes this function's return value.
#[cfg(aimx_bridge)]
fn dispatch_tool_call(
    ctx: *mut c_void,
    name_ptr: *const c_char,
    args_ptr: *const c_char,
) -> ToolResult {
    if ctx.is_null() {
        return Err(ToolCallError::new("missing tool context"));
    }

    // Safety: ctx is Arc::as_ptr(&tools_ctx) cast to *mut c_void; the Arc outlives this call.
    let tools = unsafe { &*(ctx as *const ToolsContext) };
    with_callback_text(name_ptr, "tool name", |name| {
        let args = parse_tool_args(args_ptr)?;
        tools.call(name, args)
    })?
}
2882
/// Parses the JSON argument payload Swift supplies for a tool call.
#[cfg(aimx_bridge)]
fn parse_tool_args(args_ptr: *const c_char) -> Result<serde_json::Value, ToolCallError> {
    if args_ptr.is_null() {
        return Err(ToolCallError::new("missing tool arguments"));
    }

    // Safety: non-null argument pointers from the bridge are valid C strings.
    let raw = unsafe { CStr::from_ptr(args_ptr) };
    match serde_json::from_slice(raw.to_bytes()) {
        Ok(value) => Ok(value),
        Err(error) => Err(ToolCallError::new(format!("invalid tool args JSON: {error}"))),
    }
}
2893
/// Runs `f` on the (lossily decoded) text behind `ptr`, or reports it missing.
///
/// `label` names the field in the error message produced for a null pointer.
#[cfg(aimx_bridge)]
fn with_callback_text<R>(
    ptr: *const c_char,
    label: &str,
    f: impl FnOnce(&str) -> R,
) -> Result<R, ToolCallError> {
    if ptr.is_null() {
        return Err(ToolCallError::new(format!("missing {label}")));
    }

    // Safety: non-null callback pointers are valid, NUL-terminated C strings.
    let decoded = unsafe { CStr::from_ptr(ptr).to_string_lossy() };
    Ok(f(decoded.as_ref()))
}
2907
/// Routes a handler outcome to the matching Swift-visible reply channel.
#[cfg(aimx_bridge)]
fn send_tool_result(result_ctx: *mut c_void, result_cb: ToolResultCallback, result: ToolResult) {
    match result {
        Err(failure) => send_tool_error(result_ctx, result_cb, failure.as_str()),
        Ok(payload) => send_tool_output(result_ctx, result_cb, payload),
    }
}
2915
/// Delivers a successful tool result to Swift, falling back to the error
/// channel when the output cannot be represented as a C string.
#[cfg(aimx_bridge)]
fn send_tool_output(result_ctx: *mut c_void, result_cb: ToolResultCallback, output: ToolOutput) {
    let text = output.into_string();
    match CString::new(text) {
        Err(error) => send_tool_error(
            result_ctx,
            result_cb,
            &format!("tool result contains a null byte: {error}"),
        ),
        // The CString lives until the end of this arm, so the pointer is
        // valid for the duration of the callback invocation.
        Ok(c_output) => result_cb(result_ctx, c_output.as_ptr(), null()),
    }
}
2927
/// Delivers a tool failure message to Swift; if even the message cannot be a
/// C string, substitutes the pre-encoded static fallback.
#[cfg(aimx_bridge)]
fn send_tool_error(result_ctx: *mut c_void, result_cb: ToolResultCallback, message: &str) {
    if let Ok(c_error) = CString::new(message) {
        result_cb(result_ctx, null(), c_error.as_ptr());
    } else {
        result_cb(
            result_ctx,
            null(),
            TOOL_ERROR_ENCODING_FAILURE.as_ptr().cast::<c_char>(),
        );
    }
}
2939
// Pre-encoded fallback message (with trailing NUL, so it is directly usable as
// a C string) for when the real error text itself contains a null byte.
#[cfg(aimx_bridge)]
const TOOL_ERROR_ENCODING_FAILURE: &[u8] = b"tool error contains a null byte\0";
2942
2943// ─── Tests ─────────────────────────────────────────────────────────────────────
2944
#[cfg(test)]
mod tests {
    use super::*;
    use proptest::prelude::*;

    // ── Always-runnable unit tests ────────────────────────────────────────────

    #[test]
    fn test_is_available_returns_without_panic() {
        let _ = is_available();
    }

    #[test]
    fn test_availability_result_is_consistent() {
        let avail = availability();
        assert_eq!(is_available(), avail.is_ok());
    }

    #[test]
    fn test_options_default_is_valid() -> Result<(), Error> {
        let opts = GenerationOptions::default();
        assert!(opts.validate().is_ok());
        let config = opts.validated()?;
        // Unset temperature and max-tokens surface as -1 at the FFI boundary.
        assert_eq!(config.ffi_temperature(), -1.0);
        assert_eq!(config.ffi_max_tokens(), -1);
        Ok(())
    }

    #[test]
    fn test_options_valid_temperature() -> Result<(), Error> {
        for (temp, expected_ffi) in [(0.0_f64, 0.0), (1.0, 1.0), (2.0, 2.0)] {
            let opts = GenerationOptions::new().try_temperature(temp)?;
            assert!(
                opts.validate().is_ok(),
                "temperature {temp} should be valid"
            );
            let config = opts.validated()?;
            assert_eq!(config.ffi_temperature(), expected_ffi);
        }
        Ok(())
    }

    #[test]
    fn test_options_invalid_temperature() {
        for temp in [-f64::INFINITY, -0.1_f64, 2.001, f64::INFINITY, f64::NAN] {
            assert!(
                GenerationOptions::new().try_temperature(temp).is_err(),
                "temperature {temp} should be invalid"
            );
        }
    }

    #[test]
    fn test_options_invalid_max_tokens() {
        // On targets where usize is narrower than i64, MaxTokens::MAX + 1
        // would overflow usize; skip there.
        if usize::BITS < i64::BITS {
            return;
        }

        let invalid = MaxTokens::MAX + 1;

        assert!(matches!(
            GenerationOptions::new().try_max_tokens(invalid),
            Err(Error::InvalidMaxTokens(value)) if value == invalid
        ));
        assert!(matches!(
            MaxTokens::new(invalid),
            Err(Error::InvalidMaxTokens(value)) if value == invalid
        ));
    }

    #[test]
    fn test_session_creation_fails_gracefully_when_unavailable() {
        if is_available() {
            return; // skip — integration tests cover the available path
        }
        assert!(matches!(
            LanguageModelSession::new(),
            Err(Error::Unavailable(_))
        ));
    }

    #[test]
    fn test_null_byte_in_prompt_returns_error() {
        let result = futures_executor::block_on(respond("hello\0world"));
        assert!(matches!(result, Err(Error::NullByte(_))));
    }

    #[test]
    fn test_prompt_and_instruction_inputs_reject_null_bytes_before_availability() {
        let prompt = Prompt::try_from("hello\0world");
        let instructions = SystemInstructions::try_from("system\0prompt");

        assert!(matches!(prompt, Err(Error::NullByte(_))));
        assert!(matches!(instructions, Err(Error::NullByte(_))));
    }

    #[test]
    fn test_session_builder_validates_options_before_availability() {
        let result = AppleIntelligenceModels::default()
            .session()
            .instructions("Valid system prompt")
            .try_temperature(2.5)
            .and_then(LanguageModelSessionBuilder::build);

        assert!(matches!(result, Err(Error::InvalidTemperature(value)) if value == 2.5));
    }

    #[test]
    fn test_options_expose_typed_values() -> Result<(), Error> {
        let temperature = Temperature::new(0.4)?;
        let max_tokens = MaxTokens::new(128)?;
        let opts = GenerationOptions::new()
            .temperature(temperature)
            .max_tokens(max_tokens);

        assert_eq!(opts.temperature_value(), Some(temperature));
        assert_eq!(opts.max_tokens_value(), Some(max_tokens));
        Ok(())
    }

    #[test]
    fn test_schema_property_requirement_serializes_as_optional_flag() -> Result<(), Error> {
        let schema = GenerationSchema::new("Answer")
            .property(GenerationSchemaProperty::new(
                "required",
                GenerationSchemaPropertyType::String,
            ))
            .property(
                GenerationSchemaProperty::new("maybe", GenerationSchemaPropertyType::String)
                    .optional(),
            );

        let json = serde_json::to_value(schema)?;

        assert_eq!(json["properties"][0]["optional"], false);
        assert_eq!(json["properties"][1]["optional"], true);
        assert!(GenerationSchemaPropertyRequirement::Required.is_required());
        assert!(GenerationSchemaPropertyRequirement::Optional.is_optional());
        Ok(())
    }

    #[test]
    fn test_session_builder_validates_instructions_before_availability() {
        let result = AppleIntelligenceModels::default()
            .session()
            .instructions("bad\0instructions")
            .build();

        assert!(matches!(result, Err(Error::NullByte(_))));
    }

    #[test]
    fn test_string_newtypes_round_trip_through_display_and_inner_value() {
        let cases = [
            PromptText::new("prompt").into_string(),
            ResponseText::new("response").to_string(),
            GenerationSchemaName::new("GenerationSchema").to_string(),
            GenerationSchemaPropertyName::new("field").to_string(),
            ToolName::new("tool").to_string(),
            ToolOutput::new("output").to_string(),
        ];

        assert_eq!(
            cases,
            [
                "prompt",
                "response",
                "GenerationSchema",
                "field",
                "tool",
                "output"
            ]
        );
    }

    #[test]
    fn test_schema_builder() -> Result<(), Error> {
        let schema = GenerationSchema::new("Point")
            .description("A 2D point")
            .property(
                GenerationSchemaProperty::new("x", GenerationSchemaPropertyType::Double)
                    .description("X axis"),
            )
            .property(GenerationSchemaProperty::new(
                "y",
                GenerationSchemaPropertyType::Double,
            ));
        assert_eq!(schema.name, "Point");
        assert_eq!(schema.properties.len(), 2);
        let json = serde_json::to_string(&schema)?;
        assert!(json.contains("\"x\""));
        assert!(json.contains("\"double\""));
        Ok(())
    }

    #[test]
    fn test_tool_definition_builder() -> Result<(), ToolCallError> {
        let tool = ToolDefinition::builder(
            "add",
            "Add two numbers",
            GenerationSchema::new("AddArgs")
                .property(GenerationSchemaProperty::new(
                    "a",
                    GenerationSchemaPropertyType::Double,
                ))
                .property(GenerationSchemaProperty::new(
                    "b",
                    GenerationSchemaPropertyType::Double,
                )),
        )
        .handler(|args| {
            let a = args["a"].as_f64().unwrap_or(0.0);
            let b = args["b"].as_f64().unwrap_or(0.0);
            Ok(ToolOutput::from(format!("{}", a + b)))
        });
        assert_eq!(tool.name, "add");
        let result = tool.call(serde_json::json!({"a": 3.0, "b": 4.0}));
        assert_eq!(result?, "7");
        Ok(())
    }

    #[test]
    fn test_tool_definition_new_and_trait_boundary() -> Result<(), ToolCallError> {
        let tool = ToolDefinition::new(
            "echo",
            "Echo an input string",
            GenerationSchema::new("EchoArgs").property(GenerationSchemaProperty::new(
                "value",
                GenerationSchemaPropertyType::String,
            )),
            |args| {
                args["value"]
                    .as_str()
                    .map(ToolOutput::from)
                    .ok_or_else(|| ToolCallError::new("missing value"))
            },
        );

        assert_eq!(tool.name().as_str(), "echo");
        assert_eq!(tool.description().as_str(), "Echo an input string");
        assert_eq!(tool.parameters().name, "EchoArgs");
        assert_eq!(tool.call(serde_json::json!({"value": "hello"}))?, "hello");
        assert!(tool.call(serde_json::json!({})).is_err());
        Ok(())
    }

    #[test]
    fn test_tool_handler_panic_returns_tool_error() {
        let tool = ToolDefinition::new(
            "panic_tool",
            "Tool that fails inside user code",
            GenerationSchema::new("PanicArgs"),
            |_| -> ToolResult {
                std::panic::resume_unwind(Box::new("boom"));
            },
        );

        let error = tool.call(serde_json::json!({})).err();

        assert!(
            error
                .as_ref()
                .is_some_and(|error| error.as_str().contains("tool handler panicked: boom")),
            "expected panic to be converted into ToolCallError"
        );
    }

    // Property tests: the typed boundaries must agree exactly with the
    // C-string null-byte and numeric-range invariants they guard.
    proptest! {
        #[test]
        fn proptest_prompt_input_matches_c_string_null_boundary(input in ".*") {
            let result = Prompt::try_from(input.as_str());

            if input.contains('\0') {
                prop_assert!(matches!(result, Err(Error::NullByte(_))));
            } else {
                match result {
                    Ok(prompt) => prop_assert_eq!(prompt.as_str(), input.as_str()),
                    Err(error) => prop_assert!(false, "unexpected prompt error: {error}"),
                }
            }
        }

        #[test]
        fn proptest_instructions_match_c_string_null_boundary(input in ".*") {
            let result = SystemInstructions::try_from(input.as_str());

            if input.contains('\0') {
                prop_assert!(matches!(result, Err(Error::NullByte(_))));
            } else {
                match result {
                    Ok(instructions) => prop_assert_eq!(instructions.as_str(), input.as_str()),
                    Err(error) => prop_assert!(false, "unexpected instructions error: {error}"),
                }
            }
        }

        #[test]
        fn proptest_temperature_validation_matches_closed_interval(temp in any::<f64>()) {
            let result = Temperature::new(temp);

            if (Temperature::MIN..=Temperature::MAX).contains(&temp) {
                match result {
                    Ok(temperature) => prop_assert_eq!(temperature.as_f64(), temp),
                    Err(error) => prop_assert!(false, "unexpected temperature error: {error}"),
                }
            } else {
                // Compare bit patterns so the NaN case also round-trips.
                prop_assert!(matches!(result, Err(Error::InvalidTemperature(value)) if value.to_bits() == temp.to_bits()));
            }
        }

        #[test]
        fn proptest_generation_options_preserve_max_tokens(max_tokens in any::<usize>()) {
            if max_tokens <= MaxTokens::MAX {
                match GenerationOptions::new().try_max_tokens(max_tokens) {
                    Ok(opts) => match opts.validated() {
                        Ok(config) => prop_assert_eq!(config.ffi_max_tokens(), max_tokens as i64),
                        Err(error) => prop_assert!(false, "unexpected options error: {error}"),
                    },
                    Err(error) => prop_assert!(false, "unexpected max token error: {error}"),
                }
            } else {
                prop_assert!(matches!(
                    GenerationOptions::new().try_max_tokens(max_tokens),
                    Err(Error::InvalidMaxTokens(value)) if value == max_tokens
                ));
            }
        }
    }

    // ── Integration tests (require Apple Intelligence) ─────────────────────────
    //
    // Run with:  cargo test -- --include-ignored

    #[test]
    #[ignore = "requires Apple Intelligence (macOS 26+, Apple Silicon, AI enabled)"]
    fn test_simple_respond() -> Result<(), Error> {
        let response =
            futures_executor::block_on(respond("Reply with only the number: what is 2 + 2?"))?;
        assert!(
            response.as_str().contains('4'),
            "expected '4' in: {response:?}"
        );
        Ok(())
    }

    #[test]
    #[ignore = "requires Apple Intelligence"]
    fn test_respond_with_low_temperature() -> Result<(), Error> {
        let opts = GenerationOptions::new().temperature(Temperature::new(0.0)?);
        let r = futures_executor::block_on(respond_with_options(
            "Reply with only the word: capital of France?",
            &opts,
        ))?;
        assert!(
            r.as_str().to_lowercase().contains("paris"),
            "expected Paris in: {r:?}"
        );
        Ok(())
    }

    #[test]
    #[ignore = "requires Apple Intelligence"]
    fn test_multi_turn_session() -> Result<(), Error> {
        let session = LanguageModelSession::with_instructions(
            "Reply to every message with exactly one word.",
        )?;
        let r1 = futures_executor::block_on(session.respond_to("Say hello."))?;
        let r2 = futures_executor::block_on(session.respond_to("Say goodbye."))?;
        assert!(!r1.is_empty(), "first response was empty");
        assert!(!r2.is_empty(), "second response was empty");
        Ok(())
    }

    #[test]
    #[ignore = "requires Apple Intelligence"]
    fn test_streaming_yields_chunks() -> Result<(), Error> {
        let session = LanguageModelSession::new()?;
        let stream = session.stream_response("Count: one two three")?;

        let chunks: Vec<ResponseText> =
            futures_executor::block_on_stream(stream).collect::<Result<_, _>>()?;

        assert!(!chunks.is_empty(), "stream produced no chunks");
        let full = chunks
            .into_iter()
            .map(ResponseText::into_string)
            .collect::<Vec<_>>()
            .join("");
        assert!(!full.is_empty(), "concatenated response was empty");
        Ok(())
    }

    #[test]
    #[ignore = "requires Apple Intelligence"]
    fn test_structured_generation() -> Result<(), Error> {
        use serde::Deserialize;

        #[derive(Debug, Deserialize)]
        struct MathAnswer {
            value: f64,
            explanation: String,
        }

        let session = LanguageModelSession::new()?;
        let schema = GenerationSchema::new("MathAnswer")
            .description("A numeric answer with a brief explanation")
            .property(
                GenerationSchemaProperty::new("value", GenerationSchemaPropertyType::Double)
                    .description("The numeric result"),
            )
            .property(
                GenerationSchemaProperty::new("explanation", GenerationSchemaPropertyType::String)
                    .description("One-sentence explanation"),
            );

        let answer: MathAnswer =
            futures_executor::block_on(session.respond_generating("What is 6 × 7?", &schema))?;

        assert!(
            (answer.value - 42.0).abs() < 0.5,
            "expected 42, got {}",
            answer.value
        );
        assert!(!answer.explanation.is_empty(), "explanation was empty");
        Ok(())
    }

    #[test]
    #[ignore = "requires Apple Intelligence"]
    fn test_tool_calling() -> Result<(), Error> {
        let tool = ToolDefinition::builder(
            "add_numbers",
            "Add two numbers together and return the sum",
            GenerationSchema::new("AddArgs")
                .property(
                    GenerationSchemaProperty::new("a", GenerationSchemaPropertyType::Double)
                        .description("First number"),
                )
                .property(
                    GenerationSchemaProperty::new("b", GenerationSchemaPropertyType::Double)
                        .description("Second number"),
                ),
        )
        .handler(|args| {
            let a = args["a"].as_f64().unwrap_or(0.0);
            let b = args["b"].as_f64().unwrap_or(0.0);
            Ok(ToolOutput::from(format!("{}", a + b)))
        });

        let session = LanguageModelSession::with_tools(
            "You are a calculator. Use the add_numbers tool when asked to add.",
            vec![tool],
        )?;

        let response = futures_executor::block_on(session.respond_to("What is 15 + 27?"))?;

        assert!(
            response.as_str().contains("42"),
            "expected 42 in response: {response:?}"
        );
        Ok(())
    }
}