1use super::{ApiErrorResponse, ApiResponse, Client, streaming::StreamingCompletionResponse};
6use crate::completion::{CompletionError, CompletionRequest};
7use crate::message::{AudioMediaType, ImageDetail};
8use crate::one_or_many::string_or_one_or_many;
9use crate::{OneOrMany, completion, json_utils, message};
10use serde::{Deserialize, Serialize};
11use serde_json::{Value, json};
12use std::convert::Infallible;
13use std::fmt;
14
15use std::str::FromStr;
16
17pub mod streaming;
18
/// Model name `o4-mini-2025-04-16`.
pub const O4_MINI_2025_04_16: &str = "o4-mini-2025-04-16";
/// Model name `o4-mini`.
pub const O4_MINI: &str = "o4-mini";
/// Model name `o3`.
pub const O3: &str = "o3";
/// Model name `o3-mini`.
pub const O3_MINI: &str = "o3-mini";
/// Model name `o3-mini-2025-01-31`.
pub const O3_MINI_2025_01_31: &str = "o3-mini-2025-01-31";
/// Model name `o1-pro`.
pub const O1_PRO: &str = "o1-pro";
/// Model name `o1`.
pub const O1: &str = "o1";
/// Model name `o1-2024-12-17`.
pub const O1_2024_12_17: &str = "o1-2024-12-17";
/// Model name `o1-preview`.
pub const O1_PREVIEW: &str = "o1-preview";
/// Model name `o1-preview-2024-09-12`.
pub const O1_PREVIEW_2024_09_12: &str = "o1-preview-2024-09-12";
/// Model name `o1-mini`.
pub const O1_MINI: &str = "o1-mini";
/// Model name `o1-mini-2024-09-12`.
pub const O1_MINI_2024_09_12: &str = "o1-mini-2024-09-12";
43
/// Model name `gpt-4.1-mini`.
pub const GPT_4_1_MINI: &str = "gpt-4.1-mini";
/// Model name `gpt-4.1-nano`.
pub const GPT_4_1_NANO: &str = "gpt-4.1-nano";
/// Model name `gpt-4.1-2025-04-14`.
pub const GPT_4_1_2025_04_14: &str = "gpt-4.1-2025-04-14";
/// Model name `gpt-4.1`.
pub const GPT_4_1: &str = "gpt-4.1";
/// Model name `gpt-4.5-preview`.
pub const GPT_4_5_PREVIEW: &str = "gpt-4.5-preview";
/// Model name `gpt-4.5-preview-2025-02-27`.
pub const GPT_4_5_PREVIEW_2025_02_27: &str = "gpt-4.5-preview-2025-02-27";
/// Model name `gpt-4o-2024-11-20`.
pub const GPT_4O_2024_11_20: &str = "gpt-4o-2024-11-20";
/// Model name `gpt-4o`.
pub const GPT_4O: &str = "gpt-4o";
/// Model name `gpt-4o-mini`.
pub const GPT_4O_MINI: &str = "gpt-4o-mini";
/// Model name `gpt-4o-2024-05-13`.
pub const GPT_4O_2024_05_13: &str = "gpt-4o-2024-05-13";
/// Model name `gpt-4-turbo`.
pub const GPT_4_TURBO: &str = "gpt-4-turbo";
/// Model name `gpt-4-turbo-2024-04-09`.
pub const GPT_4_TURBO_2024_04_09: &str = "gpt-4-turbo-2024-04-09";
/// Model name `gpt-4-turbo-preview`.
pub const GPT_4_TURBO_PREVIEW: &str = "gpt-4-turbo-preview";
/// Model name `gpt-4-0125-preview`.
pub const GPT_4_0125_PREVIEW: &str = "gpt-4-0125-preview";
/// Model name `gpt-4-1106-preview`.
pub const GPT_4_1106_PREVIEW: &str = "gpt-4-1106-preview";
/// Model name `gpt-4-vision-preview`.
pub const GPT_4_VISION_PREVIEW: &str = "gpt-4-vision-preview";
/// Model name `gpt-4-1106-vision-preview`.
pub const GPT_4_1106_VISION_PREVIEW: &str = "gpt-4-1106-vision-preview";
/// Model name `gpt-4`.
pub const GPT_4: &str = "gpt-4";
/// Model name `gpt-4-0613`.
pub const GPT_4_0613: &str = "gpt-4-0613";
/// Model name `gpt-4-32k`.
pub const GPT_4_32K: &str = "gpt-4-32k";
/// Model name `gpt-4-32k-0613`.
pub const GPT_4_32K_0613: &str = "gpt-4-32k-0613";
/// Model name `gpt-3.5-turbo`.
pub const GPT_35_TURBO: &str = "gpt-3.5-turbo";
/// Model name `gpt-3.5-turbo-0125`.
pub const GPT_35_TURBO_0125: &str = "gpt-3.5-turbo-0125";
/// Model name `gpt-3.5-turbo-1106`.
pub const GPT_35_TURBO_1106: &str = "gpt-3.5-turbo-1106";
/// Model name `gpt-3.5-turbo-instruct`.
pub const GPT_35_TURBO_INSTRUCT: &str = "gpt-3.5-turbo-instruct";
94
95impl From<ApiErrorResponse> for CompletionError {
96 fn from(err: ApiErrorResponse) -> Self {
97 CompletionError::ProviderError(err.message)
98 }
99}
100
/// A chat message in the provider's wire format.
///
/// Serialized as an internally tagged enum: the variant is selected by a
/// `role` field holding the lowercase variant name (`tool` for
/// [`Message::ToolResult`]).
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(tag = "role", rename_all = "lowercase")]
pub enum Message {
    /// A system message. When deserializing, the role `developer` is accepted
    /// as an alias for `system`.
    #[serde(alias = "developer")]
    System {
        /// Content parts, deserialized through `string_or_one_or_many`
        /// (presumably a bare string or one/many parts — confirm against that helper).
        #[serde(deserialize_with = "string_or_one_or_many")]
        content: OneOrMany<SystemContent>,
        /// Optional name; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        name: Option<String>,
    },
    /// A user message.
    User {
        /// Content parts, deserialized through `string_or_one_or_many`
        /// (presumably a bare string or one/many parts — confirm against that helper).
        #[serde(deserialize_with = "string_or_one_or_many")]
        content: OneOrMany<UserContent>,
        /// Optional name; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        name: Option<String>,
    },
    /// An assistant message, optionally carrying tool calls.
    Assistant {
        /// Content parts; defaults to an empty vector when the field is absent
        /// and is deserialized through `json_utils::string_or_vec`.
        #[serde(default, deserialize_with = "json_utils::string_or_vec")]
        content: Vec<AssistantContent>,
        /// Optional refusal text; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        refusal: Option<String>,
        /// Optional audio reference; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        audio: Option<AudioAssistant>,
        /// Optional name; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        name: Option<String>,
        /// Tool calls; defaults to empty when absent, is deserialized through
        /// `json_utils::null_or_vec`, and is omitted from the serialized form
        /// when empty.
        #[serde(
            default,
            deserialize_with = "json_utils::null_or_vec",
            skip_serializing_if = "Vec::is_empty"
        )]
        tool_calls: Vec<ToolCall>,
    },
    /// The result of a tool call; carried on the wire with role `tool`.
    #[serde(rename = "tool")]
    ToolResult {
        /// Id of the tool call this result belongs to.
        tool_call_id: String,
        /// Result content parts.
        content: OneOrMany<ToolResultContent>,
    },
}
139
140impl Message {
141 pub fn system(content: &str) -> Self {
142 Message::System {
143 content: OneOrMany::one(content.to_owned().into()),
144 name: None,
145 }
146 }
147}
148
/// Audio reference attached to an assistant message; it carries only an `id`.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct AudioAssistant {
    /// The `id` value as it appears in the serialized form.
    id: String,
}
153
/// One content part of a system message.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct SystemContent {
    /// Part type; falls back to the default variant when missing from the input.
    #[serde(default)]
    r#type: SystemContentType,
    /// The text of this part.
    text: String,
}
160
/// Type tag of a [`SystemContent`] part, serialized in lowercase.
#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(rename_all = "lowercase")]
pub enum SystemContentType {
    /// Text content (serialized as `text`); this is the default.
    #[default]
    Text,
}
167
/// One content part of an assistant message, tagged by a lowercase `type` field.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(tag = "type", rename_all = "lowercase")]
pub enum AssistantContent {
    /// Regular text output (`"type": "text"`).
    Text { text: String },
    /// A refusal message (`"type": "refusal"`).
    Refusal { refusal: String },
}
174
175impl From<AssistantContent> for completion::AssistantContent {
176 fn from(value: AssistantContent) -> Self {
177 match value {
178 AssistantContent::Text { text } => completion::AssistantContent::text(text),
179 AssistantContent::Refusal { refusal } => completion::AssistantContent::text(refusal),
180 }
181 }
182}
183
184#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
185#[serde(tag = "type", rename_all = "lowercase")]
186pub enum UserContent {
187 Text {
188 text: String,
189 },
190 #[serde(rename = "image_url")]
191 Image {
192 image_url: ImageUrl,
193 },
194 Audio {
195 input_audio: InputAudio,
196 },
197}
198
/// Payload of an image content part.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct ImageUrl {
    /// The image location or data, sent as the `url` field.
    pub url: String,
    /// Requested detail level; falls back to `ImageDetail::default()` when
    /// missing from the input.
    #[serde(default)]
    pub detail: ImageDetail,
}
205
/// Payload of an audio content part.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct InputAudio {
    /// The audio data as a string (presumably base64-encoded — confirm with callers).
    pub data: String,
    /// Media type of the audio data.
    pub format: AudioMediaType,
}
211
/// One content part of a tool result message.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct ToolResultContent {
    /// Part type; falls back to the default variant when missing from the input.
    #[serde(default)]
    r#type: ToolResultContentType,
    /// The text of this part.
    pub text: String,
}
218
/// Type tag of a [`ToolResultContent`] part, serialized in lowercase.
#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(rename_all = "lowercase")]
pub enum ToolResultContentType {
    /// Text content (serialized as `text`); this is the default.
    #[default]
    Text,
}
225
226impl FromStr for ToolResultContent {
227 type Err = Infallible;
228
229 fn from_str(s: &str) -> Result<Self, Self::Err> {
230 Ok(s.to_owned().into())
231 }
232}
233
234impl From<String> for ToolResultContent {
235 fn from(s: String) -> Self {
236 ToolResultContent {
237 r#type: ToolResultContentType::default(),
238 text: s,
239 }
240 }
241}
242
/// A tool call requested in an assistant message.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct ToolCall {
    /// Identifier of this tool call.
    pub id: String,
    /// Kind of tool; falls back to the default variant when missing from the input.
    #[serde(default)]
    pub r#type: ToolType,
    /// The function to call and its arguments.
    pub function: Function,
}
250
/// Kind of a [`ToolCall`], serialized in lowercase.
#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(rename_all = "lowercase")]
pub enum ToolType {
    /// A function tool (serialized as `function`); this is the default.
    #[default]
    Function,
}
257
/// A tool definition as sent in the request's `tools` array.
#[derive(Debug, Deserialize, Serialize, Clone)]
pub struct ToolDefinition {
    /// Tool kind as a free-form string (the `From` conversion in this file sets `"function"`).
    pub r#type: String,
    /// The generic tool definition being wrapped.
    pub function: completion::ToolDefinition,
}
263
264impl From<completion::ToolDefinition> for ToolDefinition {
265 fn from(tool: completion::ToolDefinition) -> Self {
266 Self {
267 r#type: "function".into(),
268 function: tool,
269 }
270 }
271}
272
/// The function part of a [`ToolCall`]: which function to call and with what arguments.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct Function {
    /// Name of the function to call.
    pub name: String,
    /// Call arguments as a JSON value; (de)serialized through
    /// `json_utils::stringified_json` (presumably a JSON-encoded string on the
    /// wire — confirm against that helper).
    #[serde(with = "json_utils::stringified_json")]
    pub arguments: serde_json::Value,
}
279
280impl TryFrom<message::Message> for Vec<Message> {
281 type Error = message::MessageError;
282
283 fn try_from(message: message::Message) -> Result<Self, Self::Error> {
284 match message {
285 message::Message::User { content } => {
286 let (tool_results, other_content): (Vec<_>, Vec<_>) = content
287 .into_iter()
288 .partition(|content| matches!(content, message::UserContent::ToolResult(_)));
289
290 if !tool_results.is_empty() {
293 tool_results
294 .into_iter()
295 .map(|content| match content {
296 message::UserContent::ToolResult(message::ToolResult {
297 id,
298 content,
299 ..
300 }) => Ok::<_, message::MessageError>(Message::ToolResult {
301 tool_call_id: id,
302 content: content.try_map(|content| match content {
303 message::ToolResultContent::Text(message::Text { text }) => {
304 Ok(text.into())
305 }
306 _ => Err(message::MessageError::ConversionError(
307 "Tool result content does not support non-text".into(),
308 )),
309 })?,
310 }),
311 _ => unreachable!(),
312 })
313 .collect::<Result<Vec<_>, _>>()
314 } else {
315 let other_content = OneOrMany::many(other_content).expect(
316 "There must be other content here if there were no tool result content",
317 );
318
319 Ok(vec![Message::User {
320 content: other_content.map(|content| match content {
321 message::UserContent::Text(message::Text { text }) => {
322 UserContent::Text { text }
323 }
324 message::UserContent::Image(message::Image {
325 data, detail, ..
326 }) => UserContent::Image {
327 image_url: ImageUrl {
328 url: data,
329 detail: detail.unwrap_or_default(),
330 },
331 },
332 message::UserContent::Document(message::Document { data, .. }) => {
333 UserContent::Text { text: data }
334 }
335 message::UserContent::Audio(message::Audio {
336 data,
337 media_type,
338 ..
339 }) => UserContent::Audio {
340 input_audio: InputAudio {
341 data,
342 format: match media_type {
343 Some(media_type) => media_type,
344 None => AudioMediaType::MP3,
345 },
346 },
347 },
348 _ => unreachable!(),
349 }),
350 name: None,
351 }])
352 }
353 }
354 message::Message::Assistant { content, .. } => {
355 let (text_content, tool_calls) = content.into_iter().fold(
356 (Vec::new(), Vec::new()),
357 |(mut texts, mut tools), content| {
358 match content {
359 message::AssistantContent::Text(text) => texts.push(text),
360 message::AssistantContent::ToolCall(tool_call) => tools.push(tool_call),
361 }
362 (texts, tools)
363 },
364 );
365
366 Ok(vec![Message::Assistant {
369 content: text_content
370 .into_iter()
371 .map(|content| content.text.into())
372 .collect::<Vec<_>>(),
373 refusal: None,
374 audio: None,
375 name: None,
376 tool_calls: tool_calls
377 .into_iter()
378 .map(|tool_call| tool_call.into())
379 .collect::<Vec<_>>(),
380 }])
381 }
382 }
383 }
384}
385
386impl From<message::ToolCall> for ToolCall {
387 fn from(tool_call: message::ToolCall) -> Self {
388 Self {
389 id: tool_call.id,
390 r#type: ToolType::default(),
391 function: Function {
392 name: tool_call.function.name,
393 arguments: tool_call.function.arguments,
394 },
395 }
396 }
397}
398
399impl From<ToolCall> for message::ToolCall {
400 fn from(tool_call: ToolCall) -> Self {
401 Self {
402 id: tool_call.id,
403 call_id: None,
404 function: message::ToolFunction {
405 name: tool_call.function.name,
406 arguments: tool_call.function.arguments,
407 },
408 }
409 }
410}
411
412impl TryFrom<Message> for message::Message {
413 type Error = message::MessageError;
414
415 fn try_from(message: Message) -> Result<Self, Self::Error> {
416 Ok(match message {
417 Message::User { content, .. } => message::Message::User {
418 content: content.map(|content| content.into()),
419 },
420 Message::Assistant {
421 content,
422 tool_calls,
423 ..
424 } => {
425 let mut content = content
426 .into_iter()
427 .map(|content| match content {
428 AssistantContent::Text { text } => message::AssistantContent::text(text),
429
430 AssistantContent::Refusal { refusal } => {
433 message::AssistantContent::text(refusal)
434 }
435 })
436 .collect::<Vec<_>>();
437
438 content.extend(
439 tool_calls
440 .into_iter()
441 .map(|tool_call| Ok(message::AssistantContent::ToolCall(tool_call.into())))
442 .collect::<Result<Vec<_>, _>>()?,
443 );
444
445 message::Message::Assistant {
446 id: None,
447 content: OneOrMany::many(content).map_err(|_| {
448 message::MessageError::ConversionError(
449 "Neither `content` nor `tool_calls` was provided to the Message"
450 .to_owned(),
451 )
452 })?,
453 }
454 }
455
456 Message::ToolResult {
457 tool_call_id,
458 content,
459 } => message::Message::User {
460 content: OneOrMany::one(message::UserContent::tool_result(
461 tool_call_id,
462 content.map(|content| message::ToolResultContent::text(content.text)),
463 )),
464 },
465
466 Message::System { content, .. } => message::Message::User {
469 content: content.map(|content| message::UserContent::text(content.text)),
470 },
471 })
472 }
473}
474
475impl From<UserContent> for message::UserContent {
476 fn from(content: UserContent) -> Self {
477 match content {
478 UserContent::Text { text } => message::UserContent::text(text),
479 UserContent::Image { image_url } => message::UserContent::image(
480 image_url.url,
481 Some(message::ContentFormat::default()),
482 None,
483 Some(image_url.detail),
484 ),
485 UserContent::Audio { input_audio } => message::UserContent::audio(
486 input_audio.data,
487 Some(message::ContentFormat::default()),
488 Some(input_audio.format),
489 ),
490 }
491 }
492}
493
494impl From<String> for UserContent {
495 fn from(s: String) -> Self {
496 UserContent::Text { text: s }
497 }
498}
499
500impl FromStr for UserContent {
501 type Err = Infallible;
502
503 fn from_str(s: &str) -> Result<Self, Self::Err> {
504 Ok(UserContent::Text {
505 text: s.to_string(),
506 })
507 }
508}
509
510impl From<String> for AssistantContent {
511 fn from(s: String) -> Self {
512 AssistantContent::Text { text: s }
513 }
514}
515
516impl FromStr for AssistantContent {
517 type Err = Infallible;
518
519 fn from_str(s: &str) -> Result<Self, Self::Err> {
520 Ok(AssistantContent::Text {
521 text: s.to_string(),
522 })
523 }
524}
525impl From<String> for SystemContent {
526 fn from(s: String) -> Self {
527 SystemContent {
528 r#type: SystemContentType::default(),
529 text: s,
530 }
531 }
532}
533
534impl FromStr for SystemContent {
535 type Err = Infallible;
536
537 fn from_str(s: &str) -> Result<Self, Self::Err> {
538 Ok(SystemContent {
539 r#type: SystemContentType::default(),
540 text: s.to_string(),
541 })
542 }
543}
544
/// Raw chat completion response body as returned by the provider.
#[derive(Debug, Deserialize)]
pub struct CompletionResponse {
    /// Identifier of the response.
    pub id: String,
    /// Value of the `object` field.
    pub object: String,
    /// Value of the `created` field (presumably a Unix timestamp — confirm).
    pub created: u64,
    /// Name of the model reported in the response.
    pub model: String,
    /// Optional system fingerprint reported by the provider.
    pub system_fingerprint: Option<String>,
    /// Returned choices; the generic conversion in this file uses only the first.
    pub choices: Vec<Choice>,
    /// Token usage, when the provider reports it.
    pub usage: Option<Usage>,
}
555
556impl TryFrom<CompletionResponse> for completion::CompletionResponse<CompletionResponse> {
557 type Error = CompletionError;
558
559 fn try_from(response: CompletionResponse) -> Result<Self, Self::Error> {
560 let choice = response.choices.first().ok_or_else(|| {
561 CompletionError::ResponseError("Response contained no choices".to_owned())
562 })?;
563
564 let content = match &choice.message {
565 Message::Assistant {
566 content,
567 tool_calls,
568 ..
569 } => {
570 let mut content = content
571 .iter()
572 .filter_map(|c| {
573 let s = match c {
574 AssistantContent::Text { text } => text,
575 AssistantContent::Refusal { refusal } => refusal,
576 };
577 if s.is_empty() {
578 None
579 } else {
580 Some(completion::AssistantContent::text(s))
581 }
582 })
583 .collect::<Vec<_>>();
584
585 content.extend(
586 tool_calls
587 .iter()
588 .map(|call| {
589 completion::AssistantContent::tool_call(
590 &call.id,
591 &call.function.name,
592 call.function.arguments.clone(),
593 )
594 })
595 .collect::<Vec<_>>(),
596 );
597 Ok(content)
598 }
599 _ => Err(CompletionError::ResponseError(
600 "Response did not contain a valid message or tool call".into(),
601 )),
602 }?;
603
604 let choice = OneOrMany::many(content).map_err(|_| {
605 CompletionError::ResponseError(
606 "Response contained no message or tool call (empty)".to_owned(),
607 )
608 })?;
609
610 let usage = response
611 .usage
612 .as_ref()
613 .map(|usage| completion::Usage {
614 input_tokens: usage.prompt_tokens as u64,
615 output_tokens: (usage.total_tokens - usage.prompt_tokens) as u64,
616 total_tokens: usage.total_tokens as u64,
617 })
618 .unwrap_or_default();
619
620 Ok(completion::CompletionResponse {
621 choice,
622 usage,
623 raw_response: response,
624 })
625 }
626}
627
/// One entry of a completion response's `choices` array.
#[derive(Debug, Serialize, Deserialize)]
pub struct Choice {
    /// Position of this choice in the response.
    pub index: usize,
    /// The message produced for this choice.
    pub message: Message,
    /// Log-probability data, kept as untyped JSON when present.
    pub logprobs: Option<serde_json::Value>,
    /// Value of the `finish_reason` field, kept as a plain string.
    pub finish_reason: String,
}
635
/// Token usage reported with a completion response.
#[derive(Clone, Debug, Deserialize)]
pub struct Usage {
    /// Number of tokens in the prompt.
    pub prompt_tokens: usize,
    /// Total number of tokens reported for the request.
    pub total_tokens: usize,
}
641
642impl fmt::Display for Usage {
643 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
644 let Usage {
645 prompt_tokens,
646 total_tokens,
647 } = self;
648 write!(
649 f,
650 "Prompt tokens: {prompt_tokens} Total tokens: {total_tokens}"
651 )
652 }
653}
654
/// A completion model handle: a client paired with a model name.
#[derive(Clone)]
pub struct CompletionModel {
    /// Client used to send requests.
    pub(crate) client: Client,
    /// Model name placed in the request's `model` field.
    pub model: String,
}
661
662impl CompletionModel {
663 pub fn new(client: Client, model: &str) -> Self {
664 Self {
665 client,
666 model: model.to_string(),
667 }
668 }
669
670 pub fn into_agent_builder(self) -> crate::agent::AgentBuilder<Self> {
671 crate::agent::AgentBuilder::new(self)
672 }
673
674 pub(crate) fn create_completion_request(
675 &self,
676 completion_request: CompletionRequest,
677 ) -> Result<Value, CompletionError> {
678 let mut partial_history = vec![];
680 if let Some(docs) = completion_request.normalized_documents() {
681 partial_history.push(docs);
682 }
683 partial_history.extend(completion_request.chat_history);
684
685 let mut full_history: Vec<Message> = completion_request
687 .preamble
688 .map_or_else(Vec::new, |preamble| vec![Message::system(&preamble)]);
689
690 full_history.extend(
692 partial_history
693 .into_iter()
694 .map(message::Message::try_into)
695 .collect::<Result<Vec<Vec<Message>>, _>>()?
696 .into_iter()
697 .flatten()
698 .collect::<Vec<_>>(),
699 );
700
701 let request = if completion_request.tools.is_empty() {
702 serde_json::json!({
703 "model": self.model,
704 "messages": full_history,
705
706 })
707 } else {
708 json!({
709 "model": self.model,
710 "messages": full_history,
711 "tools": completion_request.tools.into_iter().map(ToolDefinition::from).collect::<Vec<_>>(),
712 "tool_choice": "auto",
713 })
714 };
715
716 let request = if let Some(temperature) = completion_request.temperature {
719 json_utils::merge(
720 request,
721 json!({
722 "temperature": temperature,
723 }),
724 )
725 } else {
726 request
727 };
728
729 let request = if let Some(params) = completion_request.additional_params {
730 json_utils::merge(request, params)
731 } else {
732 request
733 };
734
735 Ok(request)
736 }
737}
738
739impl completion::CompletionModel for CompletionModel {
740 type Response = CompletionResponse;
741 type StreamingResponse = StreamingCompletionResponse;
742
743 #[cfg_attr(feature = "worker", worker::send)]
744 async fn completion(
745 &self,
746 completion_request: CompletionRequest,
747 ) -> Result<completion::CompletionResponse<CompletionResponse>, CompletionError> {
748 let request = self.create_completion_request(completion_request)?;
749
750 let response = self
751 .client
752 .post("/chat/completions")
753 .json(&request)
754 .send()
755 .await?;
756
757 if response.status().is_success() {
758 let t = response.text().await?;
759 tracing::debug!(target: "rig", "OpenAI completion error: {}", t);
760
761 match serde_json::from_str::<ApiResponse<CompletionResponse>>(&t)? {
762 ApiResponse::Ok(response) => {
763 tracing::info!(target: "rig",
764 "OpenAI completion token usage: {:?}",
765 response.usage.clone().map(|usage| format!("{}", usage.total_tokens)).unwrap_or("N/A".to_string())
766 );
767 response.try_into()
768 }
769 ApiResponse::Err(err) => Err(CompletionError::ProviderError(err.message)),
770 }
771 } else {
772 Err(CompletionError::ProviderError(response.text().await?))
773 }
774 }
775
776 #[cfg_attr(feature = "worker", worker::send)]
777 async fn stream(
778 &self,
779 request: CompletionRequest,
780 ) -> Result<
781 crate::streaming::StreamingCompletionResponse<Self::StreamingResponse>,
782 CompletionError,
783 > {
784 CompletionModel::stream(self, request).await
785 }
786}