Skip to main content

rig_core/providers/openai/completion/
mod.rs

1// ================================================================
2// OpenAI Completion API
3// ================================================================
4
5use super::{
6    client::{ApiErrorResponse, ApiResponse},
7    streaming::StreamingCompletionResponse,
8};
9use crate::completion::{
10    CompletionError, CompletionRequest as CoreCompletionRequest, GetTokenUsage,
11};
12use crate::http_client::{self, HttpClientExt};
13use crate::message::{AudioMediaType, DocumentSourceKind, ImageDetail, MimeType};
14use crate::one_or_many::string_or_one_or_many;
15use crate::telemetry::{ProviderResponseExt, SpanCombinator};
16use crate::wasm_compat::{WasmCompatSend, WasmCompatSync};
17use crate::{OneOrMany, completion, json_utils, message};
18use serde::{Deserialize, Serialize, Serializer};
19use std::convert::Infallible;
20use std::fmt;
21use tracing::{Instrument, Level, enabled, info_span};
22
23use std::str::FromStr;
24
25pub mod streaming;
26
27/// Serializes user content as a plain string when there's a single text item,
28/// otherwise as an array of content parts.
29fn serialize_user_content<S>(
30    content: &OneOrMany<UserContent>,
31    serializer: S,
32) -> Result<S::Ok, S::Error>
33where
34    S: Serializer,
35{
36    if content.len() == 1
37        && let UserContent::Text { text, .. } = content.first_ref()
38    {
39        return serializer.serialize_str(text);
40    }
41    content.serialize(serializer)
42}
43
44/// `gpt-5.5` completion model
45pub const GPT_5_5: &str = "gpt-5.5";
46
47/// `gpt-5.2` completion model
48pub const GPT_5_2: &str = "gpt-5.2";
49
50/// `gpt-5.1` completion model
51pub const GPT_5_1: &str = "gpt-5.1";
52
53/// `gpt-5` completion model
54pub const GPT_5: &str = "gpt-5";
55/// `gpt-5` completion model
56pub const GPT_5_MINI: &str = "gpt-5-mini";
57/// `gpt-5` completion model
58pub const GPT_5_NANO: &str = "gpt-5-nano";
59
60/// `gpt-4.5-preview` completion model
61pub const GPT_4_5_PREVIEW: &str = "gpt-4.5-preview";
62/// `gpt-4.5-preview-2025-02-27` completion model
63pub const GPT_4_5_PREVIEW_2025_02_27: &str = "gpt-4.5-preview-2025-02-27";
64/// `gpt-4o-2024-11-20` completion model (this is newer than 4o)
65pub const GPT_4O_2024_11_20: &str = "gpt-4o-2024-11-20";
66/// `gpt-4o` completion model
67pub const GPT_4O: &str = "gpt-4o";
68/// `gpt-4o-mini` completion model
69pub const GPT_4O_MINI: &str = "gpt-4o-mini";
70/// `gpt-4o-2024-05-13` completion model
71pub const GPT_4O_2024_05_13: &str = "gpt-4o-2024-05-13";
72/// `gpt-4-turbo` completion model
73pub const GPT_4_TURBO: &str = "gpt-4-turbo";
74/// `gpt-4-turbo-2024-04-09` completion model
75pub const GPT_4_TURBO_2024_04_09: &str = "gpt-4-turbo-2024-04-09";
76/// `gpt-4-turbo-preview` completion model
77pub const GPT_4_TURBO_PREVIEW: &str = "gpt-4-turbo-preview";
78/// `gpt-4-0125-preview` completion model
79pub const GPT_4_0125_PREVIEW: &str = "gpt-4-0125-preview";
80/// `gpt-4-1106-preview` completion model
81pub const GPT_4_1106_PREVIEW: &str = "gpt-4-1106-preview";
82/// `gpt-4-vision-preview` completion model
83pub const GPT_4_VISION_PREVIEW: &str = "gpt-4-vision-preview";
84/// `gpt-4-1106-vision-preview` completion model
85pub const GPT_4_1106_VISION_PREVIEW: &str = "gpt-4-1106-vision-preview";
86/// `gpt-4` completion model
87pub const GPT_4: &str = "gpt-4";
88/// `gpt-4-0613` completion model
89pub const GPT_4_0613: &str = "gpt-4-0613";
90/// `gpt-4-32k` completion model
91pub const GPT_4_32K: &str = "gpt-4-32k";
92/// `gpt-4-32k-0613` completion model
93pub const GPT_4_32K_0613: &str = "gpt-4-32k-0613";
94
95/// `o4-mini-2025-04-16` completion model
96pub const O4_MINI_2025_04_16: &str = "o4-mini-2025-04-16";
97/// `o4-mini` completion model
98pub const O4_MINI: &str = "o4-mini";
99/// `o3` completion model
100pub const O3: &str = "o3";
101/// `o3-mini` completion model
102pub const O3_MINI: &str = "o3-mini";
103/// `o3-mini-2025-01-31` completion model
104pub const O3_MINI_2025_01_31: &str = "o3-mini-2025-01-31";
105/// `o1-pro` completion model
106pub const O1_PRO: &str = "o1-pro";
107/// `o1`` completion model
108pub const O1: &str = "o1";
109/// `o1-2024-12-17` completion model
110pub const O1_2024_12_17: &str = "o1-2024-12-17";
111/// `o1-preview` completion model
112pub const O1_PREVIEW: &str = "o1-preview";
113/// `o1-preview-2024-09-12` completion model
114pub const O1_PREVIEW_2024_09_12: &str = "o1-preview-2024-09-12";
115/// `o1-mini completion model
116pub const O1_MINI: &str = "o1-mini";
117/// `o1-mini-2024-09-12` completion model
118pub const O1_MINI_2024_09_12: &str = "o1-mini-2024-09-12";
119
120/// `gpt-4.1-mini` completion model
121pub const GPT_4_1_MINI: &str = "gpt-4.1-mini";
122/// `gpt-4.1-nano` completion model
123pub const GPT_4_1_NANO: &str = "gpt-4.1-nano";
124/// `gpt-4.1-2025-04-14` completion model
125pub const GPT_4_1_2025_04_14: &str = "gpt-4.1-2025-04-14";
126/// `gpt-4.1` completion model
127pub const GPT_4_1: &str = "gpt-4.1";
128
129impl From<ApiErrorResponse> for CompletionError {
130    fn from(err: ApiErrorResponse) -> Self {
131        CompletionError::ProviderError(err.message)
132    }
133}
134
135#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
136#[serde(tag = "role", rename_all = "lowercase")]
137pub enum Message {
138    #[serde(alias = "developer")]
139    System {
140        #[serde(deserialize_with = "string_or_one_or_many")]
141        content: OneOrMany<SystemContent>,
142        #[serde(skip_serializing_if = "Option::is_none")]
143        name: Option<String>,
144    },
145    User {
146        #[serde(
147            deserialize_with = "string_or_one_or_many",
148            serialize_with = "serialize_user_content"
149        )]
150        content: OneOrMany<UserContent>,
151        #[serde(skip_serializing_if = "Option::is_none")]
152        name: Option<String>,
153    },
154    Assistant {
155        #[serde(
156            default,
157            deserialize_with = "json_utils::string_or_vec",
158            skip_serializing_if = "Vec::is_empty",
159            serialize_with = "serialize_assistant_content_vec"
160        )]
161        content: Vec<AssistantContent>,
162        // OpenAI-compatible providers expose hidden reasoning on this non-standard
163        // field, and some require it to be echoed back on assistant tool-call turns.
164        #[serde(skip_serializing_if = "Option::is_none", rename = "reasoning_content")]
165        reasoning: Option<String>,
166        #[serde(skip_serializing_if = "Option::is_none")]
167        refusal: Option<String>,
168        #[serde(skip_serializing_if = "Option::is_none")]
169        audio: Option<AudioAssistant>,
170        #[serde(skip_serializing_if = "Option::is_none")]
171        name: Option<String>,
172        #[serde(
173            default,
174            deserialize_with = "json_utils::null_or_vec",
175            skip_serializing_if = "Vec::is_empty"
176        )]
177        tool_calls: Vec<ToolCall>,
178    },
179    #[serde(rename = "tool")]
180    ToolResult {
181        tool_call_id: String,
182        content: ToolResultContentValue,
183    },
184}
185
186impl Message {
187    pub fn system(content: &str) -> Self {
188        Message::System {
189            content: OneOrMany::one(content.to_owned().into()),
190            name: None,
191        }
192    }
193}
194
195fn history_contains_tool_result(messages: &[Message]) -> bool {
196    messages
197        .iter()
198        .any(|message| matches!(message, Message::ToolResult { .. }))
199}
200
201#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
202pub struct AudioAssistant {
203    pub id: String,
204}
205
206#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
207pub struct SystemContent {
208    #[serde(default)]
209    pub r#type: SystemContentType,
210    pub text: String,
211}
212
213#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
214#[serde(rename_all = "lowercase")]
215pub enum SystemContentType {
216    #[default]
217    Text,
218}
219
220#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
221#[serde(tag = "type", rename_all = "lowercase")]
222pub enum AssistantContent {
223    Text { text: String },
224    Refusal { refusal: String },
225}
226
227impl From<AssistantContent> for completion::AssistantContent {
228    fn from(value: AssistantContent) -> Self {
229        match value {
230            AssistantContent::Text { text, .. } => completion::AssistantContent::text(text),
231            AssistantContent::Refusal { refusal } => completion::AssistantContent::text(refusal),
232        }
233    }
234}
235
236#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
237#[serde(tag = "type", rename_all = "lowercase")]
238pub enum UserContent {
239    Text {
240        text: String,
241    },
242    #[serde(rename = "image_url")]
243    Image {
244        image_url: ImageUrl,
245    },
246    Audio {
247        input_audio: InputAudio,
248    },
249    /// File content part for documents such as PDFs.
250    ///
251    /// Maps to OpenAI's `{"type":"file","file":{...}}` content type. Either
252    /// `file_data` (a base64 data URI like `data:application/pdf;base64,...`)
253    /// or `file_id` (a previously uploaded file reference) must be set.
254    File {
255        file: FileData,
256    },
257}
258
259#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
260pub struct ImageUrl {
261    pub url: String,
262    #[serde(default)]
263    pub detail: ImageDetail,
264}
265
266#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
267pub struct InputAudio {
268    pub data: String,
269    pub format: AudioMediaType,
270}
271
272/// File payload for [`UserContent::File`].
273///
274/// At least one of `file_data` or `file_id` must be set for the content part
275/// to be accepted by OpenAI's chat completions API. `filename` is optional
276/// but recommended.
277#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
278pub struct FileData {
279    /// Inline file data as a base64 data URI, e.g.
280    /// `data:application/pdf;base64,JVBERi0xLjQK...`.
281    #[serde(skip_serializing_if = "Option::is_none")]
282    pub file_data: Option<String>,
283    /// Identifier of a previously uploaded file (OpenAI Files API).
284    #[serde(skip_serializing_if = "Option::is_none")]
285    pub file_id: Option<String>,
286    /// Display name of the file. Recommended for inline `file_data`.
287    #[serde(skip_serializing_if = "Option::is_none")]
288    pub filename: Option<String>,
289}
290
291#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
292pub struct ToolResultContent {
293    #[serde(default)]
294    r#type: ToolResultContentType,
295    pub text: String,
296}
297
298#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
299#[serde(rename_all = "lowercase")]
300pub enum ToolResultContentType {
301    #[default]
302    Text,
303}
304
305impl FromStr for ToolResultContent {
306    type Err = Infallible;
307
308    fn from_str(s: &str) -> Result<Self, Self::Err> {
309        Ok(s.to_owned().into())
310    }
311}
312
313impl From<String> for ToolResultContent {
314    fn from(s: String) -> Self {
315        ToolResultContent {
316            r#type: ToolResultContentType::default(),
317            text: s,
318        }
319    }
320}
321
322#[derive(Debug, Serialize, Deserialize, Clone, PartialEq)]
323#[serde(untagged)]
324pub enum ToolResultContentValue {
325    Array(Vec<ToolResultContent>),
326    String(String),
327}
328
329impl ToolResultContentValue {
330    pub fn from_string(s: String, use_array_format: bool) -> Self {
331        if use_array_format {
332            ToolResultContentValue::Array(vec![ToolResultContent::from(s)])
333        } else {
334            ToolResultContentValue::String(s)
335        }
336    }
337
338    pub fn as_text(&self) -> String {
339        match self {
340            ToolResultContentValue::Array(arr) => arr
341                .iter()
342                .map(|c| c.text.clone())
343                .collect::<Vec<_>>()
344                .join("\n"),
345            ToolResultContentValue::String(s) => s.clone(),
346        }
347    }
348
349    pub fn to_array(&self) -> Self {
350        match self {
351            ToolResultContentValue::Array(_) => self.clone(),
352            ToolResultContentValue::String(s) => {
353                ToolResultContentValue::Array(vec![ToolResultContent::from(s.clone())])
354            }
355        }
356    }
357}
358
359#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
360pub struct ToolCall {
361    pub id: String,
362    #[serde(default)]
363    pub r#type: ToolType,
364    pub function: Function,
365}
366
367#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
368#[serde(rename_all = "lowercase")]
369pub enum ToolType {
370    #[default]
371    Function,
372}
373
374/// Function definition for a tool, with optional strict mode
375#[derive(Debug, Deserialize, Serialize, Clone)]
376pub struct FunctionDefinition {
377    pub name: String,
378    pub description: String,
379    pub parameters: serde_json::Value,
380    #[serde(skip_serializing_if = "Option::is_none")]
381    pub strict: Option<bool>,
382}
383
384#[derive(Debug, Deserialize, Serialize, Clone)]
385pub struct ToolDefinition {
386    pub r#type: String,
387    pub function: FunctionDefinition,
388}
389
390impl From<completion::ToolDefinition> for ToolDefinition {
391    fn from(tool: completion::ToolDefinition) -> Self {
392        Self {
393            r#type: "function".into(),
394            function: FunctionDefinition {
395                name: tool.name,
396                description: tool.description,
397                parameters: tool.parameters,
398                strict: None,
399            },
400        }
401    }
402}
403
404impl ToolDefinition {
405    /// Apply strict mode to this tool definition.
406    /// This sets `strict: true` and sanitizes the schema to meet OpenAI requirements.
407    pub fn with_strict(mut self) -> Self {
408        self.function.strict = Some(true);
409        super::sanitize_schema(&mut self.function.parameters);
410        self
411    }
412}
413
414#[derive(Default, Clone, Debug, Deserialize, Serialize, PartialEq)]
415#[serde(rename_all = "snake_case")]
416pub enum ToolChoice {
417    #[default]
418    Auto,
419    None,
420    Required,
421}
422
423impl TryFrom<crate::message::ToolChoice> for ToolChoice {
424    type Error = CompletionError;
425    fn try_from(value: crate::message::ToolChoice) -> Result<Self, Self::Error> {
426        let res = match value {
427            message::ToolChoice::Specific { .. } => {
428                return Err(CompletionError::ProviderError(
429                    "Provider doesn't support only using specific tools".to_string(),
430                ));
431            }
432            message::ToolChoice::Auto => Self::Auto,
433            message::ToolChoice::None => Self::None,
434            message::ToolChoice::Required => Self::Required,
435        };
436
437        Ok(res)
438    }
439}
440
441#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
442pub struct Function {
443    pub name: String,
444    #[serde(
445        serialize_with = "json_utils::stringified_json::serialize",
446        deserialize_with = "json_utils::stringified_json::deserialize_maybe_stringified"
447    )]
448    pub arguments: serde_json::Value,
449}
450
451impl TryFrom<message::ToolResult> for Message {
452    type Error = message::MessageError;
453
454    fn try_from(value: message::ToolResult) -> Result<Self, Self::Error> {
455        let text = value
456            .content
457            .into_iter()
458            .map(|content| {
459                match content {
460                message::ToolResultContent::Text(message::Text { text, .. }) => Ok(text),
461                message::ToolResultContent::Image(_) => Err(message::MessageError::ConversionError(
462                    "OpenAI does not support images in tool results. Tool results must be text."
463                        .into(),
464                )),
465            }
466            })
467            .collect::<Result<Vec<_>, _>>()?
468            .join("\n");
469
470        Ok(Message::ToolResult {
471            tool_call_id: value.id,
472            content: ToolResultContentValue::String(text),
473        })
474    }
475}
476
477impl TryFrom<message::UserContent> for UserContent {
478    type Error = message::MessageError;
479
480    fn try_from(value: message::UserContent) -> Result<Self, Self::Error> {
481        match value {
482            message::UserContent::Text(message::Text { text, .. }) => Ok(UserContent::Text { text }),
483            message::UserContent::Image(message::Image {
484                data,
485                detail,
486                media_type,
487                ..
488            }) => match data {
489                DocumentSourceKind::Url(url) => Ok(UserContent::Image {
490                    image_url: ImageUrl {
491                        url,
492                        detail: detail.unwrap_or_default(),
493                    },
494                }),
495                DocumentSourceKind::Base64(data) => {
496                    let url = format!(
497                        "data:{};base64,{}",
498                        media_type.map(|i| i.to_mime_type()).ok_or(
499                            message::MessageError::ConversionError(
500                                "OpenAI Image URI must have media type".into()
501                            )
502                        )?,
503                        data
504                    );
505
506                    let detail = detail.unwrap_or_default();
507
508                    Ok(UserContent::Image {
509                        image_url: ImageUrl { url, detail },
510                    })
511                }
512                DocumentSourceKind::Raw(_) => Err(message::MessageError::ConversionError(
513                    "Raw files not supported, encode as base64 first".into(),
514                )),
515                DocumentSourceKind::FileId(_) => Err(message::MessageError::ConversionError(
516                    "File IDs are not supported for images".into(),
517                )),
518                DocumentSourceKind::Unknown => Err(message::MessageError::ConversionError(
519                    "Document has no body".into(),
520                )),
521                doc => Err(message::MessageError::ConversionError(format!(
522                    "Unsupported document type: {doc:?}"
523                ))),
524            },
525            message::UserContent::Document(message::Document {
526                data: DocumentSourceKind::FileId(file_id),
527                ..
528            }) => Ok(UserContent::File {
529                file: FileData {
530                    file_data: None,
531                    file_id: Some(file_id),
532                    filename: None,
533                },
534            }),
535            message::UserContent::Document(message::Document {
536                data,
537                media_type: Some(message::DocumentMediaType::PDF),
538                ..
539            }) => match data {
540                DocumentSourceKind::Base64(b64) => Ok(UserContent::File {
541                    file: FileData {
542                        file_data: Some(format!("data:application/pdf;base64,{b64}")),
543                        file_id: None,
544                        filename: Some("document.pdf".to_string()),
545                    },
546                }),
547                DocumentSourceKind::Url(_) => Err(message::MessageError::ConversionError(
548                    "OpenAI chat completions does not accept URL files; use the Responses API or pass base64-encoded bytes".into(),
549                )),
550                DocumentSourceKind::Raw(_) => Err(message::MessageError::ConversionError(
551                    "Raw files not supported, encode as base64 first".into(),
552                )),
553                DocumentSourceKind::String(_) => Err(message::MessageError::ConversionError(
554                    "PDF documents must be base64-encoded, not raw strings".into(),
555                )),
556                DocumentSourceKind::FileId(_) => Err(message::MessageError::ConversionError(
557                    "File ID documents should be converted without media type constraints".into(),
558                )),
559                DocumentSourceKind::Unknown => Err(message::MessageError::ConversionError(
560                    "Document has no body".into(),
561                )),
562            },
563            message::UserContent::Document(message::Document { data, .. }) => {
564                if let DocumentSourceKind::Base64(text) | DocumentSourceKind::String(text) = data {
565                    Ok(UserContent::Text { text })
566                } else {
567                    Err(message::MessageError::ConversionError(
568                        "Documents must be base64 or a string".into(),
569                    ))
570                }
571            }
572            message::UserContent::Audio(message::Audio {
573                data, media_type, ..
574            }) => match data {
575                DocumentSourceKind::Base64(data) => Ok(UserContent::Audio {
576                    input_audio: InputAudio {
577                        data,
578                        format: match media_type {
579                            Some(media_type) => media_type,
580                            None => AudioMediaType::MP3,
581                        },
582                    },
583                }),
584                DocumentSourceKind::Url(_) => Err(message::MessageError::ConversionError(
585                    "URLs are not supported for audio".into(),
586                )),
587                DocumentSourceKind::Raw(_) => Err(message::MessageError::ConversionError(
588                    "Raw files are not supported for audio".into(),
589                )),
590                DocumentSourceKind::FileId(_) => Err(message::MessageError::ConversionError(
591                    "File IDs are not supported for audio".into(),
592                )),
593                DocumentSourceKind::Unknown => Err(message::MessageError::ConversionError(
594                    "Audio has no body".into(),
595                )),
596                audio => Err(message::MessageError::ConversionError(format!(
597                    "Unsupported audio type: {audio:?}"
598                ))),
599            },
600            message::UserContent::ToolResult(_) => Err(message::MessageError::ConversionError(
601                "Tool result is in unsupported format".into(),
602            )),
603            message::UserContent::Video(_) => Err(message::MessageError::ConversionError(
604                "Video is in unsupported format".into(),
605            )),
606        }
607    }
608}
609
610impl TryFrom<OneOrMany<message::UserContent>> for Vec<Message> {
611    type Error = message::MessageError;
612
613    fn try_from(value: OneOrMany<message::UserContent>) -> Result<Self, Self::Error> {
614        let (tool_results, other_content): (Vec<_>, Vec<_>) = value
615            .into_iter()
616            .partition(|content| matches!(content, message::UserContent::ToolResult(_)));
617
618        // If there are messages with both tool results and user content, openai will only
619        //  handle tool results. It's unlikely that there will be both.
620        if !tool_results.is_empty() {
621            tool_results
622                .into_iter()
623                .map(|content| match content {
624                    message::UserContent::ToolResult(tool_result) => tool_result.try_into(),
625                    _ => Err(message::MessageError::ConversionError(
626                        "expected tool result content while converting OpenAI input".into(),
627                    )),
628                })
629                .collect::<Result<Vec<_>, _>>()
630        } else {
631            let other_content: Vec<UserContent> = other_content
632                .into_iter()
633                .map(|content| content.try_into())
634                .collect::<Result<Vec<_>, _>>()?;
635
636            let other_content = OneOrMany::many(other_content).map_err(|_| {
637                message::MessageError::ConversionError(
638                    "OpenAI user message did not contain any non-tool content".into(),
639                )
640            })?;
641
642            Ok(vec![Message::User {
643                content: other_content,
644                name: None,
645            }])
646        }
647    }
648}
649
650impl TryFrom<OneOrMany<message::AssistantContent>> for Vec<Message> {
651    type Error = message::MessageError;
652
653    fn try_from(value: OneOrMany<message::AssistantContent>) -> Result<Self, Self::Error> {
654        let mut text_content = Vec::new();
655        let mut tool_calls = Vec::new();
656        let mut reasoning_text = String::new();
657
658        for content in value {
659            match content {
660                message::AssistantContent::Text(text) => text_content.push(text),
661                message::AssistantContent::ToolCall(tool_call) => tool_calls.push(tool_call),
662                message::AssistantContent::Reasoning(reasoning) => {
663                    reasoning_text.push_str(&reasoning.display_text());
664                }
665                message::AssistantContent::Image(_) => {
666                    return Err(message::MessageError::ConversionError(
667                        "OpenAI assistant messages do not support image content in chat completions"
668                            .into(),
669                    ));
670                }
671            }
672        }
673
674        if text_content.is_empty() && tool_calls.is_empty() {
675            return Ok(vec![]);
676        }
677
678        Ok(vec![Message::Assistant {
679            content: text_content
680                .into_iter()
681                .map(|content| content.text.into())
682                .collect::<Vec<_>>(),
683            reasoning: if reasoning_text.is_empty() {
684                None
685            } else {
686                Some(reasoning_text)
687            },
688            refusal: None,
689            audio: None,
690            name: None,
691            tool_calls: tool_calls
692                .into_iter()
693                .map(|tool_call| tool_call.into())
694                .collect::<Vec<_>>(),
695        }])
696    }
697}
698
699impl TryFrom<message::Message> for Vec<Message> {
700    type Error = message::MessageError;
701
702    fn try_from(message: message::Message) -> Result<Self, Self::Error> {
703        match message {
704            message::Message::System { content } => Ok(vec![Message::system(&content)]),
705            message::Message::User { content } => content.try_into(),
706            message::Message::Assistant { content, .. } => content.try_into(),
707        }
708    }
709}
710
711impl From<message::ToolCall> for ToolCall {
712    fn from(tool_call: message::ToolCall) -> Self {
713        Self {
714            id: tool_call.id,
715            r#type: ToolType::default(),
716            function: Function {
717                name: tool_call.function.name,
718                arguments: tool_call.function.arguments,
719            },
720        }
721    }
722}
723
724impl From<ToolCall> for message::ToolCall {
725    fn from(tool_call: ToolCall) -> Self {
726        Self {
727            id: tool_call.id,
728            call_id: None,
729            function: message::ToolFunction {
730                name: tool_call.function.name,
731                arguments: tool_call.function.arguments,
732            },
733            signature: None,
734            additional_params: None,
735        }
736    }
737}
738
739impl TryFrom<Message> for message::Message {
740    type Error = message::MessageError;
741
742    fn try_from(message: Message) -> Result<Self, Self::Error> {
743        Ok(match message {
744            Message::User { content, .. } => message::Message::User {
745                content: content.map(|content| content.into()),
746            },
747            Message::Assistant {
748                content,
749                tool_calls,
750                reasoning,
751                ..
752            } => {
753                let mut assistant_content = Vec::new();
754
755                if let Some(reasoning) = reasoning
756                    && !reasoning.is_empty()
757                {
758                    assistant_content.push(message::AssistantContent::reasoning(reasoning));
759                }
760
761                assistant_content.extend(content.into_iter().map(|content| match content {
762                    AssistantContent::Text { text, .. } => message::AssistantContent::text(text),
763                    AssistantContent::Refusal { refusal } => {
764                        message::AssistantContent::text(refusal)
765                    }
766                }));
767
768                assistant_content.extend(
769                    tool_calls
770                        .into_iter()
771                        .map(|tool_call| Ok(message::AssistantContent::ToolCall(tool_call.into())))
772                        .collect::<Result<Vec<_>, _>>()?,
773                );
774
775                message::Message::Assistant {
776                    id: None,
777                    content: OneOrMany::many(assistant_content).map_err(|_| {
778                        message::MessageError::ConversionError(
779                            "Neither `content` nor `tool_calls` was provided to the Message"
780                                .to_owned(),
781                        )
782                    })?,
783                }
784            }
785
786            Message::ToolResult {
787                tool_call_id,
788                content,
789            } => message::Message::User {
790                content: OneOrMany::one(message::UserContent::tool_result(
791                    tool_call_id,
792                    OneOrMany::one(message::ToolResultContent::text(content.as_text())),
793                )),
794            },
795
796            // System messages should get stripped out when converting messages, this is just a
797            // stop gap to avoid obnoxious error handling or panic occurring.
798            Message::System { content, .. } => message::Message::User {
799                content: content.map(|content| message::UserContent::text(content.text)),
800            },
801        })
802    }
803}
804
805impl From<UserContent> for message::UserContent {
806    fn from(content: UserContent) -> Self {
807        match content {
808            UserContent::Text { text, .. } => message::UserContent::text(text),
809            UserContent::Image { image_url } => {
810                message::UserContent::image_url(image_url.url, None, Some(image_url.detail))
811            }
812            UserContent::Audio { input_audio } => {
813                message::UserContent::audio(input_audio.data, Some(input_audio.format))
814            }
815            UserContent::File {
816                file: FileData {
817                    file_data, file_id, ..
818                },
819            } => match file_data {
820                Some(data_url) => {
821                    let kind = match data_url.strip_prefix("data:application/pdf;base64,") {
822                        Some(b64) => DocumentSourceKind::Base64(b64.to_string()),
823                        None => DocumentSourceKind::String(data_url),
824                    };
825                    message::UserContent::Document(message::Document {
826                        data: kind,
827                        media_type: Some(message::DocumentMediaType::PDF),
828                        additional_params: None,
829                    })
830                }
831                None => match file_id {
832                    Some(id) => message::UserContent::Document(message::Document {
833                        data: DocumentSourceKind::FileId(id),
834                        media_type: None,
835                        additional_params: None,
836                    }),
837                    None => message::UserContent::text(String::new()),
838                },
839            },
840        }
841    }
842}
843
844impl From<String> for UserContent {
845    fn from(s: String) -> Self {
846        UserContent::Text { text: s }
847    }
848}
849
850impl FromStr for UserContent {
851    type Err = Infallible;
852
853    fn from_str(s: &str) -> Result<Self, Self::Err> {
854        Ok(UserContent::Text {
855            text: s.to_string(),
856        })
857    }
858}
859
860impl From<String> for AssistantContent {
861    fn from(s: String) -> Self {
862        AssistantContent::Text { text: s }
863    }
864}
865
866impl FromStr for AssistantContent {
867    type Err = Infallible;
868
869    fn from_str(s: &str) -> Result<Self, Self::Err> {
870        Ok(AssistantContent::Text {
871            text: s.to_string(),
872        })
873    }
874}
875impl From<String> for SystemContent {
876    fn from(s: String) -> Self {
877        SystemContent {
878            r#type: SystemContentType::default(),
879            text: s,
880        }
881    }
882}
883
884impl FromStr for SystemContent {
885    type Err = Infallible;
886
887    fn from_str(s: &str) -> Result<Self, Self::Err> {
888        Ok(SystemContent {
889            r#type: SystemContentType::default(),
890            text: s.to_string(),
891        })
892    }
893}
894
895#[derive(Debug, Deserialize, Serialize)]
896pub struct CompletionResponse {
897    pub id: String,
898    pub object: String,
899    pub created: u64,
900    pub model: String,
901    pub system_fingerprint: Option<String>,
902    pub choices: Vec<Choice>,
903    pub usage: Option<Usage>,
904}
905
906impl TryFrom<CompletionResponse> for completion::CompletionResponse<CompletionResponse> {
907    type Error = CompletionError;
908
909    fn try_from(response: CompletionResponse) -> Result<Self, Self::Error> {
910        let choice = response.choices.first().ok_or_else(|| {
911            CompletionError::ResponseError("Response contained no choices".to_owned())
912        })?;
913
914        let content = match &choice.message {
915            Message::Assistant {
916                content,
917                tool_calls,
918                reasoning,
919                ..
920            } => {
921                let mut content = content
922                    .iter()
923                    .filter_map(|c| {
924                        let s = match c {
925                            AssistantContent::Text { text, .. } => text,
926                            AssistantContent::Refusal { refusal } => refusal,
927                        };
928                        if s.is_empty() {
929                            None
930                        } else {
931                            Some(completion::AssistantContent::text(s))
932                        }
933                    })
934                    .collect::<Vec<_>>();
935
936                if let Some(reasoning) = reasoning {
937                    // llama.cpp exposes hidden reasoning on a separate non-standard field.
938                    // Keep it structured here so the non-streaming path matches streaming
939                    // behavior and does not pollute plain-text response surfaces.
940                    content.push(completion::AssistantContent::reasoning(reasoning));
941                }
942
943                content.extend(
944                    tool_calls
945                        .iter()
946                        .map(|call| {
947                            completion::AssistantContent::tool_call(
948                                &call.id,
949                                &call.function.name,
950                                call.function.arguments.clone(),
951                            )
952                        })
953                        .collect::<Vec<_>>(),
954                );
955                Ok(content)
956            }
957            _ => Err(CompletionError::ResponseError(
958                "Response did not contain a valid message or tool call".into(),
959            )),
960        }?;
961
962        let choice = OneOrMany::many(content).map_err(|_| {
963            CompletionError::ResponseError(
964                "Response contained no message or tool call (empty)".to_owned(),
965            )
966        })?;
967
968        let usage = response
969            .usage
970            .as_ref()
971            .map(|usage| completion::Usage {
972                input_tokens: usage.prompt_tokens as u64,
973                output_tokens: (usage.total_tokens - usage.prompt_tokens) as u64,
974                total_tokens: usage.total_tokens as u64,
975                cached_input_tokens: usage
976                    .prompt_tokens_details
977                    .as_ref()
978                    .map(|d| d.cached_tokens as u64)
979                    .unwrap_or(0),
980                cache_creation_input_tokens: 0,
981                tool_use_prompt_tokens: 0,
982                reasoning_tokens: 0,
983            })
984            .unwrap_or_default();
985
986        Ok(completion::CompletionResponse {
987            choice,
988            usage,
989            raw_response: response,
990            message_id: None,
991        })
992    }
993}
994
995impl ProviderResponseExt for CompletionResponse {
996    type OutputMessage = Choice;
997    type Usage = Usage;
998
999    fn get_response_id(&self) -> Option<String> {
1000        Some(self.id.to_owned())
1001    }
1002
1003    fn get_response_model_name(&self) -> Option<String> {
1004        Some(self.model.to_owned())
1005    }
1006
1007    fn get_output_messages(&self) -> Vec<Self::OutputMessage> {
1008        self.choices.clone()
1009    }
1010
1011    fn get_text_response(&self) -> Option<String> {
1012        let response = self
1013            .choices
1014            .iter()
1015            .filter_map(|choice| assistant_message_text_response(&choice.message))
1016            .collect::<Vec<_>>()
1017            .join("\n");
1018
1019        if response.is_empty() {
1020            None
1021        } else {
1022            Some(response)
1023        }
1024    }
1025
1026    fn get_usage(&self) -> Option<Self::Usage> {
1027        self.usage.clone()
1028    }
1029}
1030
1031fn assistant_message_text_response(message: &Message) -> Option<String> {
1032    let Message::Assistant {
1033        content, refusal, ..
1034    } = message
1035    else {
1036        return None;
1037    };
1038
1039    let mut segments = content
1040        .iter()
1041        .filter_map(|content| match content {
1042            AssistantContent::Text { text, .. } => (!text.is_empty()).then(|| text.clone()),
1043            AssistantContent::Refusal { refusal } => (!refusal.is_empty()).then(|| refusal.clone()),
1044        })
1045        .collect::<Vec<_>>();
1046
1047    if segments.is_empty()
1048        && let Some(refusal) = refusal.as_ref().filter(|refusal| !refusal.is_empty())
1049    {
1050        segments.push(refusal.clone());
1051    }
1052
1053    if segments.is_empty() {
1054        None
1055    } else {
1056        Some(segments.join("\n"))
1057    }
1058}
1059
1060#[derive(Clone, Debug, Serialize, Deserialize)]
1061pub struct Choice {
1062    pub index: usize,
1063    pub message: Message,
1064    pub logprobs: Option<serde_json::Value>,
1065    pub finish_reason: String,
1066}
1067
1068#[derive(Clone, Debug, Deserialize, Serialize, Default)]
1069pub struct PromptTokensDetails {
1070    /// Cached tokens from prompt caching
1071    #[serde(default)]
1072    pub cached_tokens: usize,
1073}
1074
1075#[derive(Clone, Debug, Deserialize, Serialize)]
1076pub struct Usage {
1077    pub prompt_tokens: usize,
1078    pub total_tokens: usize,
1079    #[serde(skip_serializing_if = "Option::is_none")]
1080    pub prompt_tokens_details: Option<PromptTokensDetails>,
1081}
1082
1083impl Usage {
1084    pub fn new() -> Self {
1085        Self {
1086            prompt_tokens: 0,
1087            total_tokens: 0,
1088            prompt_tokens_details: None,
1089        }
1090    }
1091}
1092
1093impl Default for Usage {
1094    fn default() -> Self {
1095        Self::new()
1096    }
1097}
1098
1099impl fmt::Display for Usage {
1100    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1101        let Usage {
1102            prompt_tokens,
1103            total_tokens,
1104            ..
1105        } = self;
1106        write!(
1107            f,
1108            "Prompt tokens: {prompt_tokens} Total tokens: {total_tokens}"
1109        )
1110    }
1111}
1112
1113impl GetTokenUsage for Usage {
1114    fn token_usage(&self) -> crate::completion::Usage {
1115        crate::providers::internal::completion_usage(
1116            self.prompt_tokens as u64,
1117            (self.total_tokens - self.prompt_tokens) as u64,
1118            self.total_tokens as u64,
1119            self.prompt_tokens_details
1120                .as_ref()
1121                .map(|d| d.cached_tokens as u64)
1122                .unwrap_or(0),
1123        )
1124    }
1125}
1126
1127#[doc(hidden)]
1128#[derive(Clone)]
1129pub struct GenericCompletionModel<Ext = super::OpenAICompletionsExt, H = reqwest::Client> {
1130    pub(crate) client: crate::client::Client<Ext, H>,
1131    pub model: String,
1132    pub strict_tools: bool,
1133    pub tool_result_array_content: bool,
1134}
1135
1136/// The completion model struct for OpenAI's Chat Completions API.
1137///
1138/// This preserves the historical public generic shape where the first generic
1139/// parameter is the HTTP client type.
1140pub type CompletionModel<H = reqwest::Client> =
1141    GenericCompletionModel<super::OpenAICompletionsExt, H>;
1142
1143impl<Ext, H> GenericCompletionModel<Ext, H>
1144where
1145    crate::client::Client<Ext, H>: std::fmt::Debug + Clone + 'static,
1146    Ext: crate::client::Provider + Clone + 'static,
1147{
1148    pub fn new(client: crate::client::Client<Ext, H>, model: impl Into<String>) -> Self {
1149        Self {
1150            client,
1151            model: model.into(),
1152            strict_tools: false,
1153            tool_result_array_content: false,
1154        }
1155    }
1156
1157    pub fn with_model(client: crate::client::Client<Ext, H>, model: &str) -> Self {
1158        Self {
1159            client,
1160            model: model.into(),
1161            strict_tools: false,
1162            tool_result_array_content: false,
1163        }
1164    }
1165
1166    /// Enable strict mode for tool schemas.
1167    ///
1168    /// When enabled, tool schemas are automatically sanitized to meet OpenAI's strict mode requirements:
1169    /// - `additionalProperties: false` is added to all objects
1170    /// - All properties are marked as required
1171    /// - `strict: true` is set on each function definition
1172    ///
1173    /// This allows OpenAI to guarantee that the model's tool calls will match the schema exactly.
1174    pub fn with_strict_tools(mut self) -> Self {
1175        self.strict_tools = true;
1176        self
1177    }
1178
1179    pub fn with_tool_result_array_content(mut self) -> Self {
1180        self.tool_result_array_content = true;
1181        self
1182    }
1183}
1184
1185#[derive(Debug, Serialize, Deserialize, Clone)]
1186pub struct CompletionRequest {
1187    model: String,
1188    messages: Vec<Message>,
1189    #[serde(skip_serializing_if = "Vec::is_empty")]
1190    tools: Vec<ToolDefinition>,
1191    #[serde(skip_serializing_if = "Option::is_none")]
1192    tool_choice: Option<ToolChoice>,
1193    #[serde(skip_serializing_if = "Option::is_none")]
1194    temperature: Option<f64>,
1195    #[serde(skip_serializing_if = "Option::is_none")]
1196    max_tokens: Option<u64>,
1197    #[serde(flatten)]
1198    additional_params: Option<serde_json::Value>,
1199}
1200
1201pub struct OpenAIRequestParams {
1202    pub model: String,
1203    pub request: CoreCompletionRequest,
1204    pub strict_tools: bool,
1205    pub tool_result_array_content: bool,
1206}
1207
1208impl TryFrom<OpenAIRequestParams> for CompletionRequest {
1209    type Error = CompletionError;
1210
1211    fn try_from(params: OpenAIRequestParams) -> Result<Self, Self::Error> {
1212        let OpenAIRequestParams {
1213            model,
1214            request: req,
1215            strict_tools,
1216            tool_result_array_content,
1217        } = params;
1218        let chat_history = req.chat_history_with_documents();
1219
1220        let CoreCompletionRequest {
1221            model: request_model,
1222            preamble,
1223            chat_history: _,
1224            tools,
1225            temperature,
1226            max_tokens,
1227            additional_params,
1228            tool_choice,
1229            output_schema,
1230            ..
1231        } = req;
1232
1233        let mut partial_history = Vec::new();
1234        partial_history.extend(chat_history);
1235
1236        let mut full_history: Vec<Message> =
1237            preamble.map_or_else(Vec::new, |preamble| vec![Message::system(&preamble)]);
1238
1239        full_history.extend(
1240            partial_history
1241                .into_iter()
1242                .map(message::Message::try_into)
1243                .collect::<Result<Vec<Vec<Message>>, _>>()?
1244                .into_iter()
1245                .flatten()
1246                .collect::<Vec<_>>(),
1247        );
1248
1249        if full_history.is_empty() {
1250            return Err(CompletionError::RequestError(
1251                std::io::Error::new(
1252                    std::io::ErrorKind::InvalidInput,
1253                    "OpenAI Chat Completions request has no provider-compatible messages after conversion",
1254                )
1255                .into(),
1256            ));
1257        }
1258
1259        if tool_result_array_content {
1260            for msg in &mut full_history {
1261                if let Message::ToolResult { content, .. } = msg {
1262                    *content = content.to_array();
1263                }
1264            }
1265        }
1266
1267        let history_has_tool_result = history_contains_tool_result(&full_history);
1268
1269        let tool_choice = tool_choice.map(ToolChoice::try_from).transpose()?;
1270
1271        let tools: Vec<ToolDefinition> = tools
1272            .into_iter()
1273            .map(|tool| {
1274                let def = ToolDefinition::from(tool);
1275                if strict_tools { def.with_strict() } else { def }
1276            })
1277            .collect();
1278
1279        // Some OpenAI-compatible backends such as llama.cpp will skip tool execution
1280        // if `response_format` is sent on the first turn alongside tools. Delay the
1281        // schema until after the conversation contains a tool result.
1282        let should_apply_response_format =
1283            output_schema.is_some() && (tools.is_empty() || history_has_tool_result);
1284
1285        // Map output_schema to OpenAI's response_format and merge into additional_params
1286        let additional_params = if let Some(schema) = output_schema
1287            && should_apply_response_format
1288        {
1289            let name = schema
1290                .as_object()
1291                .and_then(|o| o.get("title"))
1292                .and_then(|v| v.as_str())
1293                .unwrap_or("response_schema")
1294                .to_string();
1295            let mut schema_value = schema.to_value();
1296            super::sanitize_schema(&mut schema_value);
1297            let response_format = serde_json::json!({
1298                "response_format": {
1299                    "type": "json_schema",
1300                    "json_schema": {
1301                        "name": name,
1302                        "strict": true,
1303                        "schema": schema_value
1304                    }
1305                }
1306            });
1307            Some(match additional_params {
1308                Some(existing) => json_utils::merge(existing, response_format),
1309                None => response_format,
1310            })
1311        } else {
1312            additional_params
1313        };
1314
1315        let res = Self {
1316            model: request_model.unwrap_or(model),
1317            messages: full_history,
1318            tools,
1319            tool_choice,
1320            temperature,
1321            max_tokens,
1322            additional_params,
1323        };
1324
1325        Ok(res)
1326    }
1327}
1328
1329impl TryFrom<(String, CoreCompletionRequest)> for CompletionRequest {
1330    type Error = CompletionError;
1331
1332    fn try_from((model, req): (String, CoreCompletionRequest)) -> Result<Self, Self::Error> {
1333        CompletionRequest::try_from(OpenAIRequestParams {
1334            model,
1335            request: req,
1336            strict_tools: false,
1337            tool_result_array_content: false,
1338        })
1339    }
1340}
1341
1342impl crate::telemetry::ProviderRequestExt for CompletionRequest {
1343    type InputMessage = Message;
1344
1345    fn get_input_messages(&self) -> Vec<Self::InputMessage> {
1346        self.messages.clone()
1347    }
1348
1349    fn get_system_prompt(&self) -> Option<String> {
1350        let first_message = self.messages.first()?;
1351
1352        let Message::System { ref content, .. } = first_message.clone() else {
1353            return None;
1354        };
1355
1356        let SystemContent { text, .. } = content.first();
1357
1358        Some(text)
1359    }
1360
1361    fn get_prompt(&self) -> Option<String> {
1362        let last_message = self.messages.last()?;
1363
1364        let Message::User { ref content, .. } = last_message.clone() else {
1365            return None;
1366        };
1367
1368        let UserContent::Text { text, .. } = content.first() else {
1369            return None;
1370        };
1371
1372        Some(text)
1373    }
1374
1375    fn get_model_name(&self) -> String {
1376        self.model.clone()
1377    }
1378}
1379
1380impl GenericCompletionModel<super::OpenAICompletionsExt, reqwest::Client> {
1381    pub fn into_agent_builder(self) -> crate::agent::AgentBuilder<Self> {
1382        crate::agent::AgentBuilder::new(self)
1383    }
1384}
1385
1386impl<Ext, H> completion::CompletionModel for GenericCompletionModel<Ext, H>
1387where
1388    crate::client::Client<Ext, H>:
1389        HttpClientExt + Clone + WasmCompatSend + WasmCompatSync + 'static,
1390    Ext: crate::client::Provider
1391        + crate::client::DebugExt
1392        + Clone
1393        + WasmCompatSend
1394        + WasmCompatSync
1395        + 'static,
1396    H: Clone + Default + std::fmt::Debug + WasmCompatSend + WasmCompatSync + 'static,
1397{
1398    type Response = CompletionResponse;
1399    type StreamingResponse = StreamingCompletionResponse;
1400
1401    type Client = crate::client::Client<Ext, H>;
1402
1403    fn make(client: &Self::Client, model: impl Into<String>) -> Self {
1404        Self::new(client.clone(), model)
1405    }
1406
1407    async fn completion(
1408        &self,
1409        completion_request: CoreCompletionRequest,
1410    ) -> Result<completion::CompletionResponse<CompletionResponse>, CompletionError> {
1411        let span = if tracing::Span::current().is_disabled() {
1412            info_span!(
1413                target: "rig::completions",
1414                "chat",
1415                gen_ai.operation.name = "chat",
1416                gen_ai.provider.name = "openai",
1417                gen_ai.request.model = self.model,
1418                gen_ai.system_instructions = &completion_request.preamble,
1419                gen_ai.response.id = tracing::field::Empty,
1420                gen_ai.response.model = tracing::field::Empty,
1421                gen_ai.usage.output_tokens = tracing::field::Empty,
1422                gen_ai.usage.input_tokens = tracing::field::Empty,
1423                gen_ai.usage.cache_read.input_tokens = tracing::field::Empty,
1424            )
1425        } else {
1426            tracing::Span::current()
1427        };
1428
1429        let request = CompletionRequest::try_from(OpenAIRequestParams {
1430            model: self.model.to_owned(),
1431            request: completion_request,
1432            strict_tools: self.strict_tools,
1433            tool_result_array_content: self.tool_result_array_content,
1434        })?;
1435
1436        if enabled!(Level::TRACE) {
1437            tracing::trace!(
1438                target: "rig::completions",
1439                "OpenAI Chat Completions completion request: {}",
1440                serde_json::to_string_pretty(&request)?
1441            );
1442        }
1443
1444        let body = serde_json::to_vec(&request)?;
1445
1446        let req = self
1447            .client
1448            .post("/chat/completions")?
1449            .body(body)
1450            .map_err(|e| CompletionError::HttpError(e.into()))?;
1451
1452        async move {
1453            let response = self.client.send(req).await?;
1454
1455            if response.status().is_success() {
1456                let text = http_client::text(response).await?;
1457
1458                match serde_json::from_str::<ApiResponse<CompletionResponse>>(&text)? {
1459                    ApiResponse::Ok(response) => {
1460                        let span = tracing::Span::current();
1461                        span.record_response_metadata(&response);
1462                        span.record_token_usage(&response.usage);
1463
1464                        if enabled!(Level::TRACE) {
1465                            tracing::trace!(
1466                                target: "rig::completions",
1467                                "OpenAI Chat Completions completion response: {}",
1468                                serde_json::to_string_pretty(&response)?
1469                            );
1470                        }
1471
1472                        response.try_into()
1473                    }
1474                    ApiResponse::Err(err) => Err(CompletionError::ProviderError(err.message)),
1475                }
1476            } else {
1477                let text = http_client::text(response).await?;
1478                Err(CompletionError::ProviderError(text))
1479            }
1480        }
1481        .instrument(span)
1482        .await
1483    }
1484
1485    async fn stream(
1486        &self,
1487        request: CoreCompletionRequest,
1488    ) -> Result<
1489        crate::streaming::StreamingCompletionResponse<Self::StreamingResponse>,
1490        CompletionError,
1491    > {
1492        GenericCompletionModel::stream(self, request).await
1493    }
1494}
1495
1496fn serialize_assistant_content_vec<S>(
1497    value: &Vec<AssistantContent>,
1498    serializer: S,
1499) -> Result<S::Ok, S::Error>
1500where
1501    S: Serializer,
1502{
1503    if value.is_empty() {
1504        serializer.serialize_str("")
1505    } else {
1506        value.serialize(serializer)
1507    }
1508}
1509
1510#[cfg(test)]
1511mod tests {
1512    use super::*;
1513    use crate::completion::CompletionRequestBuilder;
1514    use crate::telemetry::ProviderResponseExt;
1515    use crate::test_utils::MockCompletionModel;
1516    use std::collections::HashMap;
1517
1518    fn test_document(id: &str, text: &str) -> crate::completion::Document {
1519        crate::completion::Document {
1520            id: id.to_string(),
1521            text: text.to_string(),
1522            additional_props: HashMap::new(),
1523        }
1524    }
1525
1526    #[test]
1527    fn test_openai_request_uses_request_model_override() {
1528        let request = crate::completion::CompletionRequest {
1529            model: Some("gpt-4.1".to_string()),
1530            preamble: None,
1531            chat_history: crate::OneOrMany::one("Hello".into()),
1532            documents: vec![],
1533            tools: vec![],
1534            temperature: None,
1535            max_tokens: None,
1536            tool_choice: None,
1537            additional_params: None,
1538            output_schema: None,
1539        };
1540
1541        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
1542            model: "gpt-4o-mini".to_string(),
1543            request,
1544            strict_tools: false,
1545            tool_result_array_content: false,
1546        })
1547        .expect("request conversion should succeed");
1548        let serialized =
1549            serde_json::to_value(openai_request).expect("serialization should succeed");
1550
1551        assert_eq!(serialized["model"], "gpt-4.1");
1552    }
1553
1554    #[test]
1555    fn test_openai_request_uses_default_model_when_override_unset() {
1556        let request = crate::completion::CompletionRequest {
1557            model: None,
1558            preamble: None,
1559            chat_history: crate::OneOrMany::one("Hello".into()),
1560            documents: vec![],
1561            tools: vec![],
1562            temperature: None,
1563            max_tokens: None,
1564            tool_choice: None,
1565            additional_params: None,
1566            output_schema: None,
1567        };
1568
1569        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
1570            model: "gpt-4o-mini".to_string(),
1571            request,
1572            strict_tools: false,
1573            tool_result_array_content: false,
1574        })
1575        .expect("request conversion should succeed");
1576        let serialized =
1577            serde_json::to_value(openai_request).expect("serialization should succeed");
1578
1579        assert_eq!(serialized["model"], "gpt-4o-mini");
1580    }
1581
1582    #[test]
1583    fn openai_chat_request_keeps_documents_after_system_messages() {
1584        let request = CompletionRequestBuilder::new(MockCompletionModel::default(), "Prompt")
1585            .message(crate::completion::Message::system("System prompt"))
1586            .message(crate::completion::Message::user("Earlier user turn"))
1587            .message(crate::completion::Message::assistant(
1588                "Earlier assistant turn",
1589            ))
1590            .document(test_document("doc1", "Document text."))
1591            .build();
1592
1593        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
1594            model: "gpt-4o-mini".to_string(),
1595            request,
1596            strict_tools: false,
1597            tool_result_array_content: false,
1598        })
1599        .expect("request conversion should succeed");
1600
1601        let serialized =
1602            serde_json::to_value(&openai_request.messages).expect("messages should serialize");
1603        let messages = serialized.as_array().expect("messages should be an array");
1604
1605        assert_eq!(messages.len(), 5);
1606        assert_eq!(messages[0]["role"], "system");
1607        assert_eq!(messages[1]["role"], "user");
1608        assert!(
1609            messages[1].to_string().contains("<file id: doc1>"),
1610            "document message should follow system message: {messages:?}"
1611        );
1612        assert_eq!(messages[2]["role"], "user");
1613        assert!(
1614            messages[2].to_string().contains("Earlier user turn"),
1615            "prior user history should follow document message: {messages:?}"
1616        );
1617        assert_eq!(messages[3]["role"], "assistant");
1618        assert!(
1619            messages[3].to_string().contains("Earlier assistant turn"),
1620            "prior assistant history should follow prior user history: {messages:?}"
1621        );
1622        assert_eq!(messages[4]["role"], "user");
1623        assert!(
1624            messages[4].to_string().contains("Prompt"),
1625            "prompt should remain last: {messages:?}"
1626        );
1627    }
1628
1629    #[test]
1630    fn openai_chat_direct_request_keeps_documents_after_system_messages() {
1631        let request = CoreCompletionRequest {
1632            model: None,
1633            preamble: None,
1634            chat_history: crate::OneOrMany::many(vec![
1635                crate::completion::Message::system("System prompt"),
1636                crate::completion::Message::assistant("Earlier assistant turn"),
1637                crate::completion::Message::system("Mid-conversation instruction"),
1638                crate::completion::Message::user("Prompt"),
1639            ])
1640            .unwrap(),
1641            documents: vec![test_document("doc1", "Document text.")],
1642            tools: vec![],
1643            temperature: None,
1644            max_tokens: None,
1645            tool_choice: None,
1646            additional_params: None,
1647            output_schema: None,
1648        };
1649
1650        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
1651            model: "gpt-4o-mini".to_string(),
1652            request,
1653            strict_tools: false,
1654            tool_result_array_content: false,
1655        })
1656        .expect("request conversion should succeed");
1657
1658        let serialized =
1659            serde_json::to_value(&openai_request.messages).expect("messages should serialize");
1660        let messages = serialized.as_array().expect("messages should be an array");
1661
1662        assert_eq!(messages.len(), 5);
1663        assert_eq!(messages[0]["role"], "system");
1664        assert_eq!(messages[1]["role"], "user");
1665        assert!(
1666            messages[1].to_string().contains("<file id: doc1>"),
1667            "document message should follow leading system messages: {messages:?}"
1668        );
1669        assert_eq!(messages[2]["role"], "assistant");
1670        assert_eq!(messages[3]["role"], "system");
1671        assert_eq!(messages[4]["role"], "user");
1672        assert_eq!(
1673            messages
1674                .iter()
1675                .filter(|message| message.to_string().contains("<file id: doc1>"))
1676                .count(),
1677            1,
1678            "document message should appear exactly once: {messages:?}"
1679        );
1680    }
1681
1682    #[test]
1683    fn assistant_reasoning_alone_is_dropped() {
1684        let assistant_content = OneOrMany::one(message::AssistantContent::reasoning("hidden"));
1685
1686        let converted: Vec<Message> = assistant_content
1687            .try_into()
1688            .expect("conversion should work");
1689
1690        assert!(converted.is_empty());
1691    }
1692
1693    // Regression test: providers that serve thinking models over the OpenAI
1694    // Chat Completions schema (DeepSeek-R1, GLM-4.6, Qwen3-Thinking) return
1695    // 400 "thinking is enabled but reasoning_content is missing" on the next
1696    // turn if the prior assistant tool-call message didn't echo the reasoning.
1697    #[test]
1698    fn assistant_reasoning_is_attached_to_tool_call_message() {
1699        let assistant_content = OneOrMany::many(vec![
1700            message::AssistantContent::reasoning("hidden"),
1701            message::AssistantContent::text("visible"),
1702            message::AssistantContent::tool_call(
1703                "call_1",
1704                "subtract",
1705                serde_json::json!({"x": 2, "y": 1}),
1706            ),
1707        ])
1708        .expect("non-empty assistant content");
1709
1710        let converted: Vec<Message> = assistant_content
1711            .try_into()
1712            .expect("conversion should work");
1713        assert_eq!(converted.len(), 1);
1714
1715        match &converted[0] {
1716            Message::Assistant {
1717                content,
1718                tool_calls,
1719                reasoning,
1720                ..
1721            } => {
1722                assert_eq!(
1723                    content,
1724                    &vec![AssistantContent::Text {
1725                        text: "visible".to_string()
1726                    }]
1727                );
1728                assert_eq!(tool_calls.len(), 1);
1729                assert_eq!(tool_calls[0].id, "call_1");
1730                assert_eq!(tool_calls[0].function.name, "subtract");
1731                assert_eq!(
1732                    tool_calls[0].function.arguments,
1733                    serde_json::json!({"x": 2, "y": 1})
1734                );
1735                assert_eq!(reasoning.as_deref(), Some("hidden"));
1736            }
1737            _ => panic!("expected assistant message"),
1738        }
1739
1740        let json = serde_json::to_value(&converted[0]).expect("serialize");
1741        assert_eq!(json["reasoning_content"], "hidden");
1742    }
1743
1744    #[test]
1745    fn assistant_reasoning_roundtrips_back_to_rig_message() {
1746        let assistant = Message::Assistant {
1747            content: vec![AssistantContent::Text {
1748                text: "visible".to_string(),
1749            }],
1750            reasoning: Some("hidden".to_string()),
1751            refusal: None,
1752            audio: None,
1753            name: None,
1754            tool_calls: vec![],
1755        };
1756
1757        let rig_msg: message::Message = assistant.try_into().expect("convert back");
1758
1759        let message::Message::Assistant { content, .. } = rig_msg else {
1760            panic!("expected assistant");
1761        };
1762
1763        let items: Vec<_> = content.into_iter().collect();
1764        assert_eq!(items.len(), 2);
1765        assert!(matches!(items[0], message::AssistantContent::Reasoning(_)));
1766        assert!(matches!(items[1], message::AssistantContent::Text(_)));
1767    }
1768
1769    #[test]
1770    fn provider_response_text_response_reads_assistant_multipart_output() {
1771        let response = CompletionResponse {
1772            id: "resp_123".to_owned(),
1773            object: "chat.completion".to_owned(),
1774            created: 0,
1775            model: GPT_4O.to_owned(),
1776            system_fingerprint: None,
1777            choices: vec![Choice {
1778                index: 0,
1779                message: Message::Assistant {
1780                    content: vec![
1781                        AssistantContent::Text {
1782                            text: "first".to_owned(),
1783                        },
1784                        AssistantContent::Refusal {
1785                            refusal: "second".to_owned(),
1786                        },
1787                        AssistantContent::Text {
1788                            text: "third".to_owned(),
1789                        },
1790                    ],
1791                    reasoning: Some("hidden".to_owned()),
1792                    refusal: None,
1793                    audio: None,
1794                    name: None,
1795                    tool_calls: vec![],
1796                },
1797                logprobs: None,
1798                finish_reason: "stop".to_owned(),
1799            }],
1800            usage: None,
1801        };
1802
1803        assert_eq!(
1804            response.get_text_response(),
1805            Some("first\nsecond\nthird".to_owned())
1806        );
1807    }
1808
1809    #[test]
1810    fn provider_response_text_response_falls_back_to_assistant_refusal_field() {
1811        let response = CompletionResponse {
1812            id: "resp_123".to_owned(),
1813            object: "chat.completion".to_owned(),
1814            created: 0,
1815            model: GPT_4O.to_owned(),
1816            system_fingerprint: None,
1817            choices: vec![Choice {
1818                index: 0,
1819                message: Message::Assistant {
1820                    content: vec![],
1821                    reasoning: None,
1822                    refusal: Some("blocked".to_owned()),
1823                    audio: None,
1824                    name: None,
1825                    tool_calls: vec![],
1826                },
1827                logprobs: None,
1828                finish_reason: "stop".to_owned(),
1829            }],
1830            usage: None,
1831        };
1832
1833        assert_eq!(response.get_text_response(), Some("blocked".to_owned()));
1834    }
1835
1836    #[test]
1837    fn test_max_tokens_is_forwarded_to_request() {
1838        let request = crate::completion::CompletionRequest {
1839            model: None,
1840            preamble: None,
1841            chat_history: crate::OneOrMany::one("Hello".into()),
1842            documents: vec![],
1843            tools: vec![],
1844            temperature: None,
1845            max_tokens: Some(4096),
1846            tool_choice: None,
1847            additional_params: None,
1848            output_schema: None,
1849        };
1850
1851        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
1852            model: "gpt-4o-mini".to_string(),
1853            request,
1854            strict_tools: false,
1855            tool_result_array_content: false,
1856        })
1857        .expect("request conversion should succeed");
1858        let serialized =
1859            serde_json::to_value(openai_request).expect("serialization should succeed");
1860
1861        assert_eq!(serialized["max_tokens"], 4096);
1862    }
1863
1864    #[test]
1865    fn test_max_tokens_omitted_when_none() {
1866        let request = crate::completion::CompletionRequest {
1867            model: None,
1868            preamble: None,
1869            chat_history: crate::OneOrMany::one("Hello".into()),
1870            documents: vec![],
1871            tools: vec![],
1872            temperature: None,
1873            max_tokens: None,
1874            tool_choice: None,
1875            additional_params: None,
1876            output_schema: None,
1877        };
1878
1879        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
1880            model: "gpt-4o-mini".to_string(),
1881            request,
1882            strict_tools: false,
1883            tool_result_array_content: false,
1884        })
1885        .expect("request conversion should succeed");
1886        let serialized =
1887            serde_json::to_value(openai_request).expect("serialization should succeed");
1888
1889        assert!(serialized.get("max_tokens").is_none());
1890    }
1891
1892    #[test]
1893    fn request_conversion_errors_when_all_messages_are_filtered() {
1894        let request = CoreCompletionRequest {
1895            model: None,
1896            preamble: None,
1897            chat_history: OneOrMany::one(message::Message::Assistant {
1898                id: None,
1899                content: OneOrMany::one(message::AssistantContent::reasoning("hidden")),
1900            }),
1901            documents: vec![],
1902            tools: vec![],
1903            temperature: None,
1904            max_tokens: None,
1905            tool_choice: None,
1906            additional_params: None,
1907            output_schema: None,
1908        };
1909
1910        let result = CompletionRequest::try_from(OpenAIRequestParams {
1911            model: "gpt-4o-mini".to_string(),
1912            request,
1913            strict_tools: false,
1914            tool_result_array_content: false,
1915        });
1916
1917        assert!(matches!(result, Err(CompletionError::RequestError(_))));
1918    }
1919
1920    #[test]
1921    fn request_conversion_omits_response_format_on_initial_tool_turn() {
1922        let request = CoreCompletionRequest {
1923            model: None,
1924            preamble: None,
1925            chat_history: OneOrMany::one(message::Message::user(
1926                "Hello, whats the weather in London?",
1927            )),
1928            documents: vec![],
1929            tools: vec![completion::ToolDefinition {
1930                name: "weather".to_string(),
1931                description: "Get the weather".to_string(),
1932                parameters: serde_json::json!({
1933                    "type": "object",
1934                    "properties": {
1935                        "city": { "type": "string" }
1936                    },
1937                    "required": ["city"]
1938                }),
1939            }],
1940            temperature: None,
1941            max_tokens: None,
1942            tool_choice: None,
1943            additional_params: None,
1944            output_schema: Some(
1945                serde_json::from_value(serde_json::json!({
1946                    "title": "WeatherResponse",
1947                    "type": "object",
1948                    "properties": {
1949                        "city": { "type": "string" },
1950                        "weather": { "type": "string" }
1951                    },
1952                    "required": ["city", "weather"]
1953                }))
1954                .expect("schema should deserialize"),
1955            ),
1956        };
1957
1958        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
1959            model: "gpt-4o-mini".to_string(),
1960            request,
1961            strict_tools: false,
1962            tool_result_array_content: false,
1963        })
1964        .expect("request conversion should succeed");
1965
1966        let serialized =
1967            serde_json::to_value(openai_request).expect("serialization should succeed");
1968
1969        assert!(
1970            serialized.get("response_format").is_none(),
1971            "initial tool turn should omit response_format: {serialized:?}"
1972        );
1973    }
1974
1975    #[test]
1976    fn request_conversion_restores_response_format_after_tool_result() {
1977        let request = CoreCompletionRequest {
1978            model: None,
1979            preamble: None,
1980            chat_history: OneOrMany::many(vec![
1981                message::Message::user("Hello, whats the weather in London?"),
1982                message::Message::Assistant {
1983                    id: None,
1984                    content: OneOrMany::one(message::AssistantContent::tool_call(
1985                        "call_1",
1986                        "weather",
1987                        serde_json::json!({ "city": "London" }),
1988                    )),
1989                },
1990                message::Message::tool_result(
1991                    "call_1",
1992                    "The weather in London is all fire and brimstone",
1993                ),
1994            ])
1995            .expect("history should be non-empty"),
1996            documents: vec![],
1997            tools: vec![completion::ToolDefinition {
1998                name: "weather".to_string(),
1999                description: "Get the weather".to_string(),
2000                parameters: serde_json::json!({
2001                    "type": "object",
2002                    "properties": {
2003                        "city": { "type": "string" }
2004                    },
2005                    "required": ["city"]
2006                }),
2007            }],
2008            temperature: None,
2009            max_tokens: None,
2010            tool_choice: None,
2011            additional_params: None,
2012            output_schema: Some(
2013                serde_json::from_value(serde_json::json!({
2014                    "title": "WeatherResponse",
2015                    "type": "object",
2016                    "properties": {
2017                        "city": { "type": "string" },
2018                        "weather": { "type": "string" }
2019                    },
2020                    "required": ["city", "weather"]
2021                }))
2022                .expect("schema should deserialize"),
2023            ),
2024        };
2025
2026        let openai_request = CompletionRequest::try_from(OpenAIRequestParams {
2027            model: "gpt-4o-mini".to_string(),
2028            request,
2029            strict_tools: false,
2030            tool_result_array_content: false,
2031        })
2032        .expect("request conversion should succeed");
2033
2034        let serialized =
2035            serde_json::to_value(openai_request).expect("serialization should succeed");
2036
2037        assert!(
2038            serialized.get("response_format").is_some(),
2039            "follow-up turn should restore response_format: {serialized:?}"
2040        );
2041    }
2042
2043    #[test]
2044    fn deserialize_llama_cpp_tool_call() {
2045        let request = r#"{
2046            "choices": [{
2047                "finish_reason": "tool_calls",
2048                "index": 0,
2049                "message": {
2050                    "role": "assistant",
2051                    "content": "",
2052                    "tool_calls": [{ "type": "function", "function": { "name": "hello_world", "arguments": { "city": "Paris" } }, "id": "xxx" }]
2053                }
2054            }],
2055            "created": 0,
2056            "model": "gpt-4o-mini",
2057            "system_fingerprint": "fp_xxx",
2058            "object": "chat.completion",
2059            "usage": { "completion_tokens": 13, "prompt_tokens": 255, "total_tokens": 268 },
2060            "id": "xxx"
2061        }
2062        "#;
2063        let response = serde_json::from_str::<ApiResponse<CompletionResponse>>(request).unwrap();
2064
2065        let ApiResponse::Ok(response) = response else {
2066            panic!("expected successful completion response");
2067        };
2068        assert_eq!(response.choices.len(), 1);
2069
2070        let Message::Assistant { tool_calls, .. } = &response.choices[0].message else {
2071            panic!("expected assistant message");
2072        };
2073        assert_eq!(tool_calls.len(), 1);
2074        assert_eq!(tool_calls[0].id, "xxx");
2075        assert_eq!(tool_calls[0].function.name, "hello_world");
2076        assert_eq!(
2077            tool_calls[0].function.arguments,
2078            serde_json::json!({"city": "Paris"})
2079        );
2080    }
2081
2082    #[test]
2083    fn deserialize_openai_stringified_tool_call() {
2084        let request = r#"{
2085            "choices": [{
2086                "finish_reason": "tool_calls",
2087                "index": 0,
2088                "message": {
2089                    "role": "assistant",
2090                    "content": "",
2091                    "tool_calls": [{ "type": "function", "function": { "name": "hello_world", "arguments": "{\"city\":\"Paris\"}" }, "id": "xxx" }]
2092                }
2093            }],
2094            "created": 0,
2095            "model": "gpt-4o-mini",
2096            "system_fingerprint": "fp_xxx",
2097            "object": "chat.completion",
2098            "usage": { "completion_tokens": 13, "prompt_tokens": 255, "total_tokens": 268 },
2099            "id": "xxx"
2100        }
2101        "#;
2102        let response = serde_json::from_str::<ApiResponse<CompletionResponse>>(request).unwrap();
2103
2104        let ApiResponse::Ok(response) = response else {
2105            panic!("expected successful completion response");
2106        };
2107        assert_eq!(response.choices.len(), 1);
2108
2109        let Message::Assistant { tool_calls, .. } = &response.choices[0].message else {
2110            panic!("expected assistant message");
2111        };
2112        assert_eq!(tool_calls.len(), 1);
2113        assert_eq!(tool_calls[0].id, "xxx");
2114        assert_eq!(tool_calls[0].function.name, "hello_world");
2115        assert_eq!(
2116            tool_calls[0].function.arguments,
2117            serde_json::json!({"city": "Paris"})
2118        );
2119    }
2120
2121    #[test]
2122    fn deserialize_llama_cpp_response_with_reasoning_content() {
2123        let request = r#"
2124        {
2125            "choices": [
2126                {
2127                    "finish_reason": "stop",
2128                    "index": 0,
2129                    "message": {
2130                        "role": "assistant",
2131                        "content": "",
2132                        "reasoning_content": "Now I understand the structure better. I need to: ..."
2133                    }
2134                }
2135            ],
2136            "created": 1776750378,
2137            "model": "unsloth/Qwen3.6-35B-A3B-GGUF:Q8_0",
2138            "system_fingerprint": "fp_xxx",
2139            "object": "chat.completion",
2140            "usage": {
2141                "completion_tokens": 920,
2142                "prompt_tokens": 27806,
2143                "total_tokens": 28726,
2144                "prompt_tokens_details": { "cached_tokens": 18698 }
2145            },
2146            "id": "chatcmpl-xxxx",
2147            "timings": {
2148                "cache_n": 18698,
2149                "prompt_n": 9108,
2150                "prompt_ms": 226645.81,
2151                "prompt_per_token_ms": 24.884256697408873,
2152                "prompt_per_second": 40.186050648807495,
2153                "predicted_n": 920,
2154                "predicted_ms": 177167.955,
2155                "predicted_per_token_ms": 192.57386413043477,
2156                "predicted_per_second": 5.192812661860888
2157            }
2158        }
2159        "#;
2160        let response = serde_json::from_str::<ApiResponse<CompletionResponse>>(request).unwrap();
2161        let ApiResponse::Ok(response) = response else {
2162            panic!("expected successful completion response");
2163        };
2164
2165        let response: completion::CompletionResponse<CompletionResponse> =
2166            response.try_into().unwrap();
2167
2168        assert_eq!(response.choice.len(), 1);
2169
2170        let completion::message::AssistantContent::Reasoning(reasoning) = response.choice.first()
2171        else {
2172            panic!("expected assistant content to be reasoning");
2173        };
2174        assert_eq!(
2175            reasoning.first_text(),
2176            Some("Now I understand the structure better. I need to: ...")
2177        );
2178    }
2179
2180    #[test]
2181    fn pdf_base64_document_serializes_as_file_content_part() {
2182        let doc = message::UserContent::Document(message::Document {
2183            data: DocumentSourceKind::Base64("JVBERi0xLjQK".into()),
2184            media_type: Some(message::DocumentMediaType::PDF),
2185            additional_params: None,
2186        });
2187        let converted: UserContent = doc.try_into().expect("conversion should succeed");
2188        let json = serde_json::to_value(&converted).expect("serialize");
2189
2190        assert_eq!(json["type"], "file");
2191        assert_eq!(
2192            json["file"]["file_data"],
2193            "data:application/pdf;base64,JVBERi0xLjQK"
2194        );
2195        assert_eq!(json["file"]["filename"], "document.pdf");
2196        assert!(json["file"].get("file_id").is_none());
2197    }
2198
2199    #[test]
2200    fn file_id_document_serializes_as_file_content_part() {
2201        let doc = message::UserContent::Document(message::Document {
2202            data: DocumentSourceKind::FileId("file_abc".into()),
2203            media_type: None,
2204            additional_params: None,
2205        });
2206        let converted: UserContent = doc.try_into().expect("conversion should succeed");
2207        let json = serde_json::to_value(&converted).expect("serialize");
2208
2209        assert_eq!(json["type"], "file");
2210        assert_eq!(json["file"]["file_id"], "file_abc");
2211        assert!(json["file"].get("file_data").is_none());
2212    }
2213
2214    #[test]
2215    fn base64_image_without_detail_defaults_to_auto() {
2216        let image = message::UserContent::Image(message::Image {
2217            data: DocumentSourceKind::Base64("iVBORw0KGgo=".into()),
2218            media_type: Some(message::ImageMediaType::PNG),
2219            detail: None,
2220            additional_params: None,
2221        });
2222        let converted: UserContent = image.try_into().expect("conversion should succeed");
2223        let UserContent::Image { image_url } = converted else {
2224            panic!("expected image content");
2225        };
2226
2227        assert_eq!(image_url.url, "data:image/png;base64,iVBORw0KGgo=");
2228        assert_eq!(image_url.detail, ImageDetail::Auto);
2229    }
2230
2231    // Regression guard: callers passing markdown/plain text wrapped in
2232    // `UserContent::Document` should keep getting flattened to `text`.
2233    #[test]
2234    fn non_pdf_document_still_serializes_as_text() {
2235        let doc = message::UserContent::Document(message::Document {
2236            data: DocumentSourceKind::String("# Markdown".into()),
2237            media_type: None,
2238            additional_params: None,
2239        });
2240        let converted: UserContent = doc.try_into().expect("conversion should succeed");
2241        let json = serde_json::to_value(&converted).expect("serialize");
2242
2243        assert_eq!(json["type"], "text");
2244        assert_eq!(json["text"], "# Markdown");
2245    }
2246
2247    #[test]
2248    fn pdf_url_document_returns_conversion_error() {
2249        let doc = message::UserContent::Document(message::Document {
2250            data: DocumentSourceKind::Url("https://example.com/x.pdf".into()),
2251            media_type: Some(message::DocumentMediaType::PDF),
2252            additional_params: None,
2253        });
2254        let res: Result<UserContent, _> = doc.try_into();
2255        assert!(matches!(
2256            res,
2257            Err(message::MessageError::ConversionError(_))
2258        ));
2259    }
2260
2261    #[test]
2262    fn pdf_raw_document_returns_conversion_error() {
2263        let doc = message::UserContent::Document(message::Document {
2264            data: DocumentSourceKind::Raw(b"%PDF-1.4\n".to_vec()),
2265            media_type: Some(message::DocumentMediaType::PDF),
2266            additional_params: None,
2267        });
2268        let res: Result<UserContent, _> = doc.try_into();
2269        assert!(matches!(
2270            res,
2271            Err(message::MessageError::ConversionError(_))
2272        ));
2273    }
2274
2275    #[test]
2276    fn file_user_content_deserializes_from_wire_json() {
2277        let raw = r#"{"type":"file","file":{"file_data":"data:application/pdf;base64,AAAA","filename":"x.pdf"}}"#;
2278        let parsed: UserContent = serde_json::from_str(raw).expect("deserialize");
2279        let UserContent::File { file } = parsed else {
2280            panic!("expected File variant");
2281        };
2282        assert_eq!(
2283            file.file_data.as_deref(),
2284            Some("data:application/pdf;base64,AAAA")
2285        );
2286        assert_eq!(file.filename.as_deref(), Some("x.pdf"));
2287        assert!(file.file_id.is_none());
2288    }
2289
2290    #[test]
2291    fn file_variant_round_trips_back_to_pdf_document() {
2292        let wire = UserContent::File {
2293            file: FileData {
2294                file_data: Some("data:application/pdf;base64,QUJD".to_string()),
2295                file_id: None,
2296                filename: Some("document.pdf".to_string()),
2297            },
2298        };
2299        let rig: message::UserContent = wire.into();
2300        let message::UserContent::Document(doc) = rig else {
2301            panic!("expected Document");
2302        };
2303        assert_eq!(doc.media_type, Some(message::DocumentMediaType::PDF));
2304        assert!(matches!(doc.data, DocumentSourceKind::Base64(ref b) if b == "QUJD"));
2305    }
2306
2307    #[test]
2308    fn file_variant_with_file_id_only_round_trips_to_document_file_id() {
2309        let wire = UserContent::File {
2310            file: FileData {
2311                file_data: None,
2312                file_id: Some("file_abc".to_string()),
2313                filename: None,
2314            },
2315        };
2316        let rig: message::UserContent = wire.into();
2317        let message::UserContent::Document(doc) = rig else {
2318            panic!("expected Document");
2319        };
2320        assert_eq!(doc.media_type, None);
2321        assert!(matches!(doc.data, DocumentSourceKind::FileId(ref id) if id == "file_abc"));
2322
2323        let converted: UserContent = message::UserContent::Document(doc)
2324            .try_into()
2325            .expect("conversion should succeed");
2326        let json = serde_json::to_value(&converted).expect("serialize");
2327
2328        assert_eq!(json["type"], "file");
2329        assert_eq!(json["file"]["file_id"], "file_abc");
2330        assert!(json["file"].get("file_data").is_none());
2331    }
2332
2333    // Guards against `OneOrMany::many` flattening at the User content site:
2334    // a mixed text + PDF message must produce one User message with both parts.
2335    #[test]
2336    fn mixed_text_and_pdf_user_message_produces_two_content_parts() {
2337        let user = message::Message::User {
2338            content: OneOrMany::many(vec![
2339                message::UserContent::text("What is in this PDF?"),
2340                message::UserContent::Document(message::Document {
2341                    data: DocumentSourceKind::Base64("JVBERi0K".into()),
2342                    media_type: Some(message::DocumentMediaType::PDF),
2343                    additional_params: None,
2344                }),
2345            ])
2346            .expect("non-empty content"),
2347        };
2348        let converted: Vec<Message> = user.try_into().expect("conversion should succeed");
2349        assert_eq!(converted.len(), 1);
2350        let Message::User { content, .. } = &converted[0] else {
2351            panic!("expected user message");
2352        };
2353        let parts: Vec<&UserContent> = content.iter().collect();
2354        assert_eq!(parts.len(), 2);
2355        assert!(matches!(parts[0], UserContent::Text { .. }));
2356        assert!(matches!(parts[1], UserContent::File { .. }));
2357    }
2358}