rig/providers/openai/completion/
mod.rs

1// ================================================================
2// OpenAI Completion API
3// ================================================================
4
5use super::{ApiErrorResponse, ApiResponse, Client, streaming::StreamingCompletionResponse};
6use crate::completion::{CompletionError, CompletionRequest};
7use crate::message::{AudioMediaType, ImageDetail};
8use crate::one_or_many::string_or_one_or_many;
9use crate::{OneOrMany, completion, json_utils, message};
10use serde::{Deserialize, Serialize};
11use serde_json::{Value, json};
12use std::convert::Infallible;
13use std::fmt;
14
15use std::str::FromStr;
16
17pub mod streaming;
18
// ---- Reasoning ("o"-series) models ----

/// `o4-mini-2025-04-16` completion model
pub const O4_MINI_2025_04_16: &str = "o4-mini-2025-04-16";
/// `o4-mini` completion model
pub const O4_MINI: &str = "o4-mini";
/// `o3` completion model
pub const O3: &str = "o3";
/// `o3-mini` completion model
pub const O3_MINI: &str = "o3-mini";
/// `o3-mini-2025-01-31` completion model
pub const O3_MINI_2025_01_31: &str = "o3-mini-2025-01-31";
/// `o1-pro` completion model
pub const O1_PRO: &str = "o1-pro";
/// `o1` completion model
pub const O1: &str = "o1";
/// `o1-2024-12-17` completion model
pub const O1_2024_12_17: &str = "o1-2024-12-17";
/// `o1-preview` completion model
pub const O1_PREVIEW: &str = "o1-preview";
/// `o1-preview-2024-09-12` completion model
pub const O1_PREVIEW_2024_09_12: &str = "o1-preview-2024-09-12";
/// `o1-mini` completion model
pub const O1_MINI: &str = "o1-mini";
/// `o1-mini-2024-09-12` completion model
pub const O1_MINI_2024_09_12: &str = "o1-mini-2024-09-12";

// ---- GPT-series models ----

/// `gpt-4.1-mini` completion model
pub const GPT_4_1_MINI: &str = "gpt-4.1-mini";
/// `gpt-4.1-nano` completion model
pub const GPT_4_1_NANO: &str = "gpt-4.1-nano";
/// `gpt-4.1-2025-04-14` completion model
pub const GPT_4_1_2025_04_14: &str = "gpt-4.1-2025-04-14";
/// `gpt-4.1` completion model
pub const GPT_4_1: &str = "gpt-4.1";
/// `gpt-4.5-preview` completion model
pub const GPT_4_5_PREVIEW: &str = "gpt-4.5-preview";
/// `gpt-4.5-preview-2025-02-27` completion model
pub const GPT_4_5_PREVIEW_2025_02_27: &str = "gpt-4.5-preview-2025-02-27";
/// `gpt-4o-2024-11-20` completion model (this is newer than 4o)
pub const GPT_4O_2024_11_20: &str = "gpt-4o-2024-11-20";
/// `gpt-4o` completion model
pub const GPT_4O: &str = "gpt-4o";
/// `gpt-4o-mini` completion model
pub const GPT_4O_MINI: &str = "gpt-4o-mini";
/// `gpt-4o-2024-05-13` completion model
pub const GPT_4O_2024_05_13: &str = "gpt-4o-2024-05-13";
/// `gpt-4-turbo` completion model
pub const GPT_4_TURBO: &str = "gpt-4-turbo";
/// `gpt-4-turbo-2024-04-09` completion model
pub const GPT_4_TURBO_2024_04_09: &str = "gpt-4-turbo-2024-04-09";
/// `gpt-4-turbo-preview` completion model
pub const GPT_4_TURBO_PREVIEW: &str = "gpt-4-turbo-preview";
/// `gpt-4-0125-preview` completion model
pub const GPT_4_0125_PREVIEW: &str = "gpt-4-0125-preview";
/// `gpt-4-1106-preview` completion model
pub const GPT_4_1106_PREVIEW: &str = "gpt-4-1106-preview";
/// `gpt-4-vision-preview` completion model
pub const GPT_4_VISION_PREVIEW: &str = "gpt-4-vision-preview";
/// `gpt-4-1106-vision-preview` completion model
pub const GPT_4_1106_VISION_PREVIEW: &str = "gpt-4-1106-vision-preview";
/// `gpt-4` completion model
pub const GPT_4: &str = "gpt-4";
/// `gpt-4-0613` completion model
pub const GPT_4_0613: &str = "gpt-4-0613";
/// `gpt-4-32k` completion model
pub const GPT_4_32K: &str = "gpt-4-32k";
/// `gpt-4-32k-0613` completion model
pub const GPT_4_32K_0613: &str = "gpt-4-32k-0613";
/// `gpt-3.5-turbo` completion model
pub const GPT_35_TURBO: &str = "gpt-3.5-turbo";
/// `gpt-3.5-turbo-0125` completion model
pub const GPT_35_TURBO_0125: &str = "gpt-3.5-turbo-0125";
/// `gpt-3.5-turbo-1106` completion model
pub const GPT_35_TURBO_1106: &str = "gpt-3.5-turbo-1106";
/// `gpt-3.5-turbo-instruct` completion model
pub const GPT_35_TURBO_INSTRUCT: &str = "gpt-3.5-turbo-instruct";
94
95impl From<ApiErrorResponse> for CompletionError {
96    fn from(err: ApiErrorResponse) -> Self {
97        CompletionError::ProviderError(err.message)
98    }
99}
100
/// A chat message in this module's wire format, discriminated by its `role` field.
///
/// Variant names are (de)serialized in lowercase (`system`, `user`, `assistant`), except
/// [`Message::ToolResult`], which is explicitly renamed to `tool`.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(tag = "role", rename_all = "lowercase")]
pub enum Message {
    /// System instructions. The role `developer` is accepted as an alias when deserializing.
    #[serde(alias = "developer")]
    System {
        // NOTE(review): `string_or_one_or_many` presumably accepts either a bare string or a
        // list of content parts -- confirm against `crate::one_or_many`.
        #[serde(deserialize_with = "string_or_one_or_many")]
        content: OneOrMany<SystemContent>,
        /// Optional participant name; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        name: Option<String>,
    },
    /// A message authored by the user (text, image or audio parts).
    User {
        #[serde(deserialize_with = "string_or_one_or_many")]
        content: OneOrMany<UserContent>,
        /// Optional participant name; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        name: Option<String>,
    },
    /// A message produced by the model: text/refusal parts and/or tool calls.
    Assistant {
        /// Content parts; defaults to an empty list when the field is absent.
        #[serde(default, deserialize_with = "json_utils::string_or_vec")]
        content: Vec<AssistantContent>,
        /// Refusal text, if any; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        refusal: Option<String>,
        /// Audio reference, if any; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        audio: Option<AudioAssistant>,
        /// Optional participant name; omitted from the serialized form when `None`.
        #[serde(skip_serializing_if = "Option::is_none")]
        name: Option<String>,
        /// Tool calls requested by the model. Defaults to empty when absent and is left out
        /// of the serialized form when empty.
        // NOTE(review): `null_or_vec` presumably maps an explicit `null` to an empty list.
        #[serde(
            default,
            deserialize_with = "json_utils::null_or_vec",
            skip_serializing_if = "Vec::is_empty"
        )]
        tool_calls: Vec<ToolCall>,
    },
    /// The result of a tool invocation, serialized with role `tool`.
    #[serde(rename = "tool")]
    ToolResult {
        /// Identifier of the tool call this result answers.
        tool_call_id: String,
        content: OneOrMany<ToolResultContent>,
    },
}
139
140impl Message {
141    pub fn system(content: &str) -> Self {
142        Message::System {
143            content: OneOrMany::one(content.to_owned().into()),
144            name: None,
145        }
146    }
147}
148
/// Audio reference carried in the `audio` field of [`Message::Assistant`].
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct AudioAssistant {
    /// Identifier of the audio item.
    id: String,
}
153
/// A single content part of a system message.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct SystemContent {
    /// Kind of content; falls back to [`SystemContentType::Text`] when absent from the input.
    #[serde(default)]
    r#type: SystemContentType,
    /// The text of this part.
    text: String,
}
160
/// Kinds of system content; serialized in lowercase. `Text` is the only (and default) kind.
#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(rename_all = "lowercase")]
pub enum SystemContentType {
    #[default]
    Text,
}
167
/// A content part of an assistant message, discriminated by a lowercase `type` field
/// (`text` or `refusal`).
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(tag = "type", rename_all = "lowercase")]
pub enum AssistantContent {
    /// Ordinary text output.
    Text { text: String },
    /// A refusal message.
    Refusal { refusal: String },
}
174
175impl From<AssistantContent> for completion::AssistantContent {
176    fn from(value: AssistantContent) -> Self {
177        match value {
178            AssistantContent::Text { text } => completion::AssistantContent::text(text),
179            AssistantContent::Refusal { refusal } => completion::AssistantContent::text(refusal),
180        }
181    }
182}
183
/// A content part of a user message, discriminated by a `type` field.
///
/// Variant names are serialized in lowercase unless renamed: `text`, `image_url`, `audio`.
// NOTE(review): `Audio` is emitted with `"type": "audio"` because of `rename_all`; the OpenAI
// Chat Completions API appears to document this part as `"input_audio"` -- confirm against
// the API reference before relying on audio input.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(tag = "type", rename_all = "lowercase")]
pub enum UserContent {
    /// Plain text.
    Text {
        text: String,
    },
    /// An image referenced through an [`ImageUrl`]; serialized with type `image_url`.
    #[serde(rename = "image_url")]
    Image {
        image_url: ImageUrl,
    },
    /// Audio input described by an [`InputAudio`].
    Audio {
        input_audio: InputAudio,
    },
}
198
/// Image payload of [`UserContent::Image`].
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct ImageUrl {
    /// Image location or data string, passed through unchanged from the generic image content.
    pub url: String,
    /// Requested detail level; uses `ImageDetail::default()` when absent from the input.
    #[serde(default)]
    pub detail: ImageDetail,
}
205
/// Audio payload of [`UserContent::Audio`].
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct InputAudio {
    /// Audio data string, passed through unchanged from the generic audio content.
    // NOTE(review): presumably base64-encoded -- confirm against callers.
    pub data: String,
    /// Media type of `data`.
    pub format: AudioMediaType,
}
211
/// A single content part of a tool result message.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct ToolResultContent {
    /// Kind of content; falls back to [`ToolResultContentType::Text`] when absent from the input.
    #[serde(default)]
    r#type: ToolResultContentType,
    /// The textual tool output.
    pub text: String,
}
218
/// Kinds of tool result content; serialized in lowercase. `Text` is the only (and default) kind.
#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(rename_all = "lowercase")]
pub enum ToolResultContentType {
    #[default]
    Text,
}
225
226impl FromStr for ToolResultContent {
227    type Err = Infallible;
228
229    fn from_str(s: &str) -> Result<Self, Self::Err> {
230        Ok(s.to_owned().into())
231    }
232}
233
234impl From<String> for ToolResultContent {
235    fn from(s: String) -> Self {
236        ToolResultContent {
237            r#type: ToolResultContentType::default(),
238            text: s,
239        }
240    }
241}
242
/// A tool invocation requested by the model inside an assistant message.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct ToolCall {
    /// Identifier of this call; tool results refer back to it through `tool_call_id`.
    pub id: String,
    /// Kind of tool; falls back to [`ToolType::Function`] when absent from the input.
    #[serde(default)]
    pub r#type: ToolType,
    /// The function to call and its arguments.
    pub function: Function,
}
250
/// Kinds of tool; serialized in lowercase. `Function` is the only (and default) kind.
#[derive(Default, Debug, Serialize, Deserialize, PartialEq, Clone)]
#[serde(rename_all = "lowercase")]
pub enum ToolType {
    #[default]
    Function,
}
257
/// A tool definition as sent in the request's `tools` array: the generic
/// [`completion::ToolDefinition`] wrapped together with a `type` string.
#[derive(Debug, Deserialize, Serialize, Clone)]
pub struct ToolDefinition {
    /// Kind of tool; the `From<completion::ToolDefinition>` conversion sets this to `"function"`.
    pub r#type: String,
    /// The wrapped generic tool definition.
    pub function: completion::ToolDefinition,
}
263
264impl From<completion::ToolDefinition> for ToolDefinition {
265    fn from(tool: completion::ToolDefinition) -> Self {
266        Self {
267            r#type: "function".into(),
268            function: tool,
269        }
270    }
271}
272
/// The function part of a [`ToolCall`]: which function to invoke and with what arguments.
#[derive(Debug, Serialize, Deserialize, PartialEq, Clone)]
pub struct Function {
    /// Name of the function to call.
    pub name: String,
    /// Call arguments as a JSON value.
    // NOTE(review): `stringified_json` presumably (de)serializes this value as a JSON-encoded
    // string on the wire -- confirm against `json_utils`.
    #[serde(with = "json_utils::stringified_json")]
    pub arguments: serde_json::Value,
}
279
280impl TryFrom<message::Message> for Vec<Message> {
281    type Error = message::MessageError;
282
283    fn try_from(message: message::Message) -> Result<Self, Self::Error> {
284        match message {
285            message::Message::User { content } => {
286                let (tool_results, other_content): (Vec<_>, Vec<_>) = content
287                    .into_iter()
288                    .partition(|content| matches!(content, message::UserContent::ToolResult(_)));
289
290                // If there are messages with both tool results and user content, openai will only
291                //  handle tool results. It's unlikely that there will be both.
292                if !tool_results.is_empty() {
293                    tool_results
294                        .into_iter()
295                        .map(|content| match content {
296                            message::UserContent::ToolResult(message::ToolResult {
297                                id,
298                                content,
299                                ..
300                            }) => Ok::<_, message::MessageError>(Message::ToolResult {
301                                tool_call_id: id,
302                                content: content.try_map(|content| match content {
303                                    message::ToolResultContent::Text(message::Text { text }) => {
304                                        Ok(text.into())
305                                    }
306                                    _ => Err(message::MessageError::ConversionError(
307                                        "Tool result content does not support non-text".into(),
308                                    )),
309                                })?,
310                            }),
311                            _ => unreachable!(),
312                        })
313                        .collect::<Result<Vec<_>, _>>()
314                } else {
315                    let other_content = OneOrMany::many(other_content).expect(
316                        "There must be other content here if there were no tool result content",
317                    );
318
319                    Ok(vec![Message::User {
320                        content: other_content.map(|content| match content {
321                            message::UserContent::Text(message::Text { text }) => {
322                                UserContent::Text { text }
323                            }
324                            message::UserContent::Image(message::Image {
325                                data, detail, ..
326                            }) => UserContent::Image {
327                                image_url: ImageUrl {
328                                    url: data,
329                                    detail: detail.unwrap_or_default(),
330                                },
331                            },
332                            message::UserContent::Document(message::Document { data, .. }) => {
333                                UserContent::Text { text: data }
334                            }
335                            message::UserContent::Audio(message::Audio {
336                                data,
337                                media_type,
338                                ..
339                            }) => UserContent::Audio {
340                                input_audio: InputAudio {
341                                    data,
342                                    format: match media_type {
343                                        Some(media_type) => media_type,
344                                        None => AudioMediaType::MP3,
345                                    },
346                                },
347                            },
348                            _ => unreachable!(),
349                        }),
350                        name: None,
351                    }])
352                }
353            }
354            message::Message::Assistant { content, .. } => {
355                let (text_content, tool_calls) = content.into_iter().fold(
356                    (Vec::new(), Vec::new()),
357                    |(mut texts, mut tools), content| {
358                        match content {
359                            message::AssistantContent::Text(text) => texts.push(text),
360                            message::AssistantContent::ToolCall(tool_call) => tools.push(tool_call),
361                        }
362                        (texts, tools)
363                    },
364                );
365
366                // `OneOrMany` ensures at least one `AssistantContent::Text` or `ToolCall` exists,
367                //  so either `content` or `tool_calls` will have some content.
368                Ok(vec![Message::Assistant {
369                    content: text_content
370                        .into_iter()
371                        .map(|content| content.text.into())
372                        .collect::<Vec<_>>(),
373                    refusal: None,
374                    audio: None,
375                    name: None,
376                    tool_calls: tool_calls
377                        .into_iter()
378                        .map(|tool_call| tool_call.into())
379                        .collect::<Vec<_>>(),
380                }])
381            }
382        }
383    }
384}
385
386impl From<message::ToolCall> for ToolCall {
387    fn from(tool_call: message::ToolCall) -> Self {
388        Self {
389            id: tool_call.id,
390            r#type: ToolType::default(),
391            function: Function {
392                name: tool_call.function.name,
393                arguments: tool_call.function.arguments,
394            },
395        }
396    }
397}
398
399impl From<ToolCall> for message::ToolCall {
400    fn from(tool_call: ToolCall) -> Self {
401        Self {
402            id: tool_call.id,
403            call_id: None,
404            function: message::ToolFunction {
405                name: tool_call.function.name,
406                arguments: tool_call.function.arguments,
407            },
408        }
409    }
410}
411
412impl TryFrom<Message> for message::Message {
413    type Error = message::MessageError;
414
415    fn try_from(message: Message) -> Result<Self, Self::Error> {
416        Ok(match message {
417            Message::User { content, .. } => message::Message::User {
418                content: content.map(|content| content.into()),
419            },
420            Message::Assistant {
421                content,
422                tool_calls,
423                ..
424            } => {
425                let mut content = content
426                    .into_iter()
427                    .map(|content| match content {
428                        AssistantContent::Text { text } => message::AssistantContent::text(text),
429
430                        // TODO: Currently, refusals are converted into text, but should be
431                        //  investigated for generalization.
432                        AssistantContent::Refusal { refusal } => {
433                            message::AssistantContent::text(refusal)
434                        }
435                    })
436                    .collect::<Vec<_>>();
437
438                content.extend(
439                    tool_calls
440                        .into_iter()
441                        .map(|tool_call| Ok(message::AssistantContent::ToolCall(tool_call.into())))
442                        .collect::<Result<Vec<_>, _>>()?,
443                );
444
445                message::Message::Assistant {
446                    id: None,
447                    content: OneOrMany::many(content).map_err(|_| {
448                        message::MessageError::ConversionError(
449                            "Neither `content` nor `tool_calls` was provided to the Message"
450                                .to_owned(),
451                        )
452                    })?,
453                }
454            }
455
456            Message::ToolResult {
457                tool_call_id,
458                content,
459            } => message::Message::User {
460                content: OneOrMany::one(message::UserContent::tool_result(
461                    tool_call_id,
462                    content.map(|content| message::ToolResultContent::text(content.text)),
463                )),
464            },
465
466            // System messages should get stripped out when converting messages, this is just a
467            // stop gap to avoid obnoxious error handling or panic occurring.
468            Message::System { content, .. } => message::Message::User {
469                content: content.map(|content| message::UserContent::text(content.text)),
470            },
471        })
472    }
473}
474
475impl From<UserContent> for message::UserContent {
476    fn from(content: UserContent) -> Self {
477        match content {
478            UserContent::Text { text } => message::UserContent::text(text),
479            UserContent::Image { image_url } => message::UserContent::image(
480                image_url.url,
481                Some(message::ContentFormat::default()),
482                None,
483                Some(image_url.detail),
484            ),
485            UserContent::Audio { input_audio } => message::UserContent::audio(
486                input_audio.data,
487                Some(message::ContentFormat::default()),
488                Some(input_audio.format),
489            ),
490        }
491    }
492}
493
494impl From<String> for UserContent {
495    fn from(s: String) -> Self {
496        UserContent::Text { text: s }
497    }
498}
499
500impl FromStr for UserContent {
501    type Err = Infallible;
502
503    fn from_str(s: &str) -> Result<Self, Self::Err> {
504        Ok(UserContent::Text {
505            text: s.to_string(),
506        })
507    }
508}
509
510impl From<String> for AssistantContent {
511    fn from(s: String) -> Self {
512        AssistantContent::Text { text: s }
513    }
514}
515
516impl FromStr for AssistantContent {
517    type Err = Infallible;
518
519    fn from_str(s: &str) -> Result<Self, Self::Err> {
520        Ok(AssistantContent::Text {
521            text: s.to_string(),
522        })
523    }
524}
525impl From<String> for SystemContent {
526    fn from(s: String) -> Self {
527        SystemContent {
528            r#type: SystemContentType::default(),
529            text: s,
530        }
531    }
532}
533
534impl FromStr for SystemContent {
535    type Err = Infallible;
536
537    fn from_str(s: &str) -> Result<Self, Self::Err> {
538        Ok(SystemContent {
539            r#type: SystemContentType::default(),
540            text: s.to_string(),
541        })
542    }
543}
544
/// Raw body of a successful chat completion response, as deserialized from JSON.
#[derive(Debug, Deserialize)]
pub struct CompletionResponse {
    /// Identifier of the completion.
    pub id: String,
    /// Object type string reported in the response.
    pub object: String,
    /// Creation time reported in the response.
    // NOTE(review): presumably a Unix timestamp in seconds -- confirm against the API reference.
    pub created: u64,
    /// Name of the model that produced the completion.
    pub model: String,
    /// Backend fingerprint, when reported.
    pub system_fingerprint: Option<String>,
    /// Generated choices; only the first one is used when converting to the generic response.
    pub choices: Vec<Choice>,
    /// Token accounting, when reported.
    pub usage: Option<Usage>,
}
555
556impl TryFrom<CompletionResponse> for completion::CompletionResponse<CompletionResponse> {
557    type Error = CompletionError;
558
559    fn try_from(response: CompletionResponse) -> Result<Self, Self::Error> {
560        let choice = response.choices.first().ok_or_else(|| {
561            CompletionError::ResponseError("Response contained no choices".to_owned())
562        })?;
563
564        let content = match &choice.message {
565            Message::Assistant {
566                content,
567                tool_calls,
568                ..
569            } => {
570                let mut content = content
571                    .iter()
572                    .filter_map(|c| {
573                        let s = match c {
574                            AssistantContent::Text { text } => text,
575                            AssistantContent::Refusal { refusal } => refusal,
576                        };
577                        if s.is_empty() {
578                            None
579                        } else {
580                            Some(completion::AssistantContent::text(s))
581                        }
582                    })
583                    .collect::<Vec<_>>();
584
585                content.extend(
586                    tool_calls
587                        .iter()
588                        .map(|call| {
589                            completion::AssistantContent::tool_call(
590                                &call.id,
591                                &call.function.name,
592                                call.function.arguments.clone(),
593                            )
594                        })
595                        .collect::<Vec<_>>(),
596                );
597                Ok(content)
598            }
599            _ => Err(CompletionError::ResponseError(
600                "Response did not contain a valid message or tool call".into(),
601            )),
602        }?;
603
604        let choice = OneOrMany::many(content).map_err(|_| {
605            CompletionError::ResponseError(
606                "Response contained no message or tool call (empty)".to_owned(),
607            )
608        })?;
609
610        let usage = response
611            .usage
612            .as_ref()
613            .map(|usage| completion::Usage {
614                input_tokens: usage.prompt_tokens as u64,
615                output_tokens: (usage.total_tokens - usage.prompt_tokens) as u64,
616                total_tokens: usage.total_tokens as u64,
617            })
618            .unwrap_or_default();
619
620        Ok(completion::CompletionResponse {
621            choice,
622            usage,
623            raw_response: response,
624        })
625    }
626}
627
/// One generated alternative inside a [`CompletionResponse`].
#[derive(Debug, Serialize, Deserialize)]
pub struct Choice {
    /// Position of this choice in the response.
    pub index: usize,
    /// The generated message.
    pub message: Message,
    /// Log-probability data, kept as untyped JSON when present.
    pub logprobs: Option<serde_json::Value>,
    /// Reason reported for why generation stopped.
    pub finish_reason: String,
}
635
/// Token accounting reported with a completion response.
#[derive(Clone, Debug, Deserialize)]
pub struct Usage {
    /// Number of tokens in the prompt.
    pub prompt_tokens: usize,
    /// Total number of tokens reported for the request.
    pub total_tokens: usize,
}
641
642impl fmt::Display for Usage {
643    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
644        let Usage {
645            prompt_tokens,
646            total_tokens,
647        } = self;
648        write!(
649            f,
650            "Prompt tokens: {prompt_tokens} Total tokens: {total_tokens}"
651        )
652    }
653}
654
/// A completion model bound to a client: the handle used to build and send completion
/// requests for one named model.
#[derive(Clone)]
pub struct CompletionModel {
    /// Client used to send requests.
    pub(crate) client: Client,
    /// Name of the model (e.g.: gpt-3.5-turbo-1106)
    pub model: String,
}
661
662impl CompletionModel {
663    pub fn new(client: Client, model: &str) -> Self {
664        Self {
665            client,
666            model: model.to_string(),
667        }
668    }
669
670    pub fn into_agent_builder(self) -> crate::agent::AgentBuilder<Self> {
671        crate::agent::AgentBuilder::new(self)
672    }
673
674    pub(crate) fn create_completion_request(
675        &self,
676        completion_request: CompletionRequest,
677    ) -> Result<Value, CompletionError> {
678        // Build up the order of messages (context, chat_history)
679        let mut partial_history = vec![];
680        if let Some(docs) = completion_request.normalized_documents() {
681            partial_history.push(docs);
682        }
683        partial_history.extend(completion_request.chat_history);
684
685        // Initialize full history with preamble (or empty if non-existent)
686        let mut full_history: Vec<Message> = completion_request
687            .preamble
688            .map_or_else(Vec::new, |preamble| vec![Message::system(&preamble)]);
689
690        // Convert and extend the rest of the history
691        full_history.extend(
692            partial_history
693                .into_iter()
694                .map(message::Message::try_into)
695                .collect::<Result<Vec<Vec<Message>>, _>>()?
696                .into_iter()
697                .flatten()
698                .collect::<Vec<_>>(),
699        );
700
701        let request = if completion_request.tools.is_empty() {
702            serde_json::json!({
703                "model": self.model,
704                "messages": full_history,
705
706            })
707        } else {
708            json!({
709                "model": self.model,
710                "messages": full_history,
711                "tools": completion_request.tools.into_iter().map(ToolDefinition::from).collect::<Vec<_>>(),
712                "tool_choice": "auto",
713            })
714        };
715
716        // only include temperature if it exists
717        // because some models don't support temperature
718        let request = if let Some(temperature) = completion_request.temperature {
719            json_utils::merge(
720                request,
721                json!({
722                    "temperature": temperature,
723                }),
724            )
725        } else {
726            request
727        };
728
729        let request = if let Some(params) = completion_request.additional_params {
730            json_utils::merge(request, params)
731        } else {
732            request
733        };
734
735        Ok(request)
736    }
737}
738
739impl completion::CompletionModel for CompletionModel {
740    type Response = CompletionResponse;
741    type StreamingResponse = StreamingCompletionResponse;
742
743    #[cfg_attr(feature = "worker", worker::send)]
744    async fn completion(
745        &self,
746        completion_request: CompletionRequest,
747    ) -> Result<completion::CompletionResponse<CompletionResponse>, CompletionError> {
748        let request = self.create_completion_request(completion_request)?;
749
750        let response = self
751            .client
752            .post("/chat/completions")
753            .json(&request)
754            .send()
755            .await?;
756
757        if response.status().is_success() {
758            let t = response.text().await?;
759            tracing::debug!(target: "rig", "OpenAI completion error: {}", t);
760
761            match serde_json::from_str::<ApiResponse<CompletionResponse>>(&t)? {
762                ApiResponse::Ok(response) => {
763                    tracing::info!(target: "rig",
764                        "OpenAI completion token usage: {:?}",
765                        response.usage.clone().map(|usage| format!("{}", usage.total_tokens)).unwrap_or("N/A".to_string())
766                    );
767                    response.try_into()
768                }
769                ApiResponse::Err(err) => Err(CompletionError::ProviderError(err.message)),
770            }
771        } else {
772            Err(CompletionError::ProviderError(response.text().await?))
773        }
774    }
775
776    #[cfg_attr(feature = "worker", worker::send)]
777    async fn stream(
778        &self,
779        request: CompletionRequest,
780    ) -> Result<
781        crate::streaming::StreamingCompletionResponse<Self::StreamingResponse>,
782        CompletionError,
783    > {
784        CompletionModel::stream(self, request).await
785    }
786}