rig/providers/huggingface/
client.rs

1use crate::client::{
2    self, BearerAuth, Capabilities, Capable, DebugExt, Nothing, Provider, ProviderBuilder,
3    ProviderClient,
4};
5use crate::http_client;
6#[cfg(feature = "image")]
7use crate::image_generation::ImageGenerationError;
8use crate::transcription::TranscriptionError;
9use std::fmt::Debug;
10use std::fmt::Display;
11
12#[derive(Debug, Clone, PartialEq, Default)]
13pub enum SubProvider {
14    #[default]
15    HFInference,
16    Together,
17    SambaNova,
18    Fireworks,
19    Hyperbolic,
20    Nebius,
21    Novita,
22    Custom(String),
23}
24
25impl SubProvider {
26    /// Get the chat completion endpoint for the SubProvider
27    /// Required because Huggingface Inference requires the model
28    /// in the url and in the request body.
29    pub fn completion_endpoint(&self, _model: &str) -> String {
30        "v1/chat/completions".to_string()
31    }
32
33    /// Get the transcription endpoint for the SubProvider
34    /// Required because Huggingface Inference requires the model
35    /// in the url and in the request body.
36    pub fn transcription_endpoint(&self, model: &str) -> Result<String, TranscriptionError> {
37        match self {
38            SubProvider::HFInference => Ok(format!("/{model}")),
39            _ => Err(TranscriptionError::ProviderError(format!(
40                "transcription endpoint is not supported yet for {self}"
41            ))),
42        }
43    }
44
45    /// Get the image generation endpoint for the SubProvider
46    /// Required because Huggingface Inference requires the model
47    /// in the url and in the request body.
48    #[cfg(feature = "image")]
49    pub fn image_generation_endpoint(&self, model: &str) -> Result<String, ImageGenerationError> {
50        match self {
51            SubProvider::HFInference => Ok(format!("/{model}")),
52            _ => Err(ImageGenerationError::ProviderError(format!(
53                "image generation endpoint is not supported yet for {self}"
54            ))),
55        }
56    }
57
58    pub fn model_identifier(&self, model: &str) -> String {
59        match self {
60            SubProvider::Fireworks => format!("accounts/fireworks/models/{model}"),
61            _ => model.to_string(),
62        }
63    }
64}
65
66impl From<&str> for SubProvider {
67    fn from(s: &str) -> Self {
68        SubProvider::Custom(s.to_string())
69    }
70}
71
72impl From<String> for SubProvider {
73    fn from(value: String) -> Self {
74        SubProvider::Custom(value)
75    }
76}
77
78impl Display for SubProvider {
79    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
80        let route = match self {
81            SubProvider::HFInference => "hf-inference/models".to_string(),
82            SubProvider::Together => "together".to_string(),
83            SubProvider::SambaNova => "sambanova".to_string(),
84            SubProvider::Fireworks => "fireworks-ai".to_string(),
85            SubProvider::Hyperbolic => "hyperbolic".to_string(),
86            SubProvider::Nebius => "nebius".to_string(),
87            SubProvider::Novita => "novita".to_string(),
88            SubProvider::Custom(route) => route.clone(),
89        };
90
91        write!(f, "{route}")
92    }
93}
94
95// ================================================================
96// Main Huggingface Client
97// ================================================================
98const HUGGINGFACE_API_BASE_URL: &str = "https://router.huggingface.co";
99
100#[derive(Debug, Default, Clone)]
101pub struct HuggingFaceExt {
102    subprovider: SubProvider,
103}
104
105#[derive(Debug, Default, Clone)]
106pub struct HuggingFaceBuilder {
107    subprovider: SubProvider,
108}
109
110type HuggingFaceApiKey = BearerAuth;
111
112pub type Client<H = reqwest::Client> = client::Client<HuggingFaceExt, H>;
113pub type ClientBuilder<H = reqwest::Client> =
114    client::ClientBuilder<HuggingFaceBuilder, HuggingFaceApiKey, H>;
115
116impl Provider for HuggingFaceExt {
117    type Builder = HuggingFaceBuilder;
118
119    const VERIFY_PATH: &'static str = "/api/whoami-v2";
120
121    fn build<H>(
122        builder: &client::ClientBuilder<Self::Builder, HuggingFaceApiKey, H>,
123    ) -> http_client::Result<Self> {
124        Ok(Self {
125            subprovider: builder.ext().subprovider.clone(),
126        })
127    }
128}
129
130impl<H> Capabilities<H> for HuggingFaceExt {
131    type Completion = Capable<super::completion::CompletionModel<H>>;
132    type Embeddings = Nothing;
133    type Transcription = Capable<super::transcription::TranscriptionModel<H>>;
134    #[cfg(feature = "image")]
135    type ImageGeneration = Capable<super::image_generation::ImageGenerationModel<H>>;
136
137    #[cfg(feature = "audio")]
138    type AudioGeneration = Nothing;
139}
140
141impl DebugExt for HuggingFaceExt {
142    fn fields(&self) -> impl Iterator<Item = (&'static str, &dyn Debug)> {
143        std::iter::once(("subprovider", (&self.subprovider as &dyn Debug)))
144    }
145}
146
147impl ProviderBuilder for HuggingFaceBuilder {
148    type Output = HuggingFaceExt;
149    type ApiKey = HuggingFaceApiKey;
150
151    const BASE_URL: &'static str = HUGGINGFACE_API_BASE_URL;
152}
153
154impl ProviderClient for Client {
155    type Input = String;
156
157    /// Create a new Huggingface client from the `HUGGINGFACE_API_KEY` environment variable.
158    /// Panics if the environment variable is not set.
159    fn from_env() -> Self {
160        let api_key = std::env::var("HUGGINGFACE_API_KEY").expect("HUGGINGFACE_API_KEY is not set");
161
162        Self::new(&api_key).unwrap()
163    }
164
165    fn from_val(input: Self::Input) -> Self {
166        Self::new(&input).unwrap()
167    }
168}
169
170impl<H> ClientBuilder<H> {
171    pub fn subprovider(mut self, subprovider: SubProvider) -> Self {
172        *self.ext_mut() = HuggingFaceBuilder { subprovider };
173        self
174    }
175}
176
177impl<H> Client<H> {
178    pub(crate) fn subprovider(&self) -> &SubProvider {
179        &self.ext().subprovider
180    }
181}