Skip to main content

vtcode_config/models/model_id/
capabilities.rs

1use crate::models::Provider;
2
3use super::ModelId;
4
// Real catalog tables for every build that is not a docs.rs build. The
// included file is read from Cargo's `OUT_DIR`; presumably it is written by
// the crate's build script — confirm against `build.rs`.
#[cfg(not(docsrs))]
// NOTE(review): `dead_code` is presumably allowed because this file only uses
// part of the generated API (e.g. `ENTRIES` is not referenced here) — confirm.
#[allow(dead_code)]
mod capability_generated {
    include!(concat!(env!("OUT_DIR"), "/model_capabilities.rs"));
}
10
// Stand-in for the generated module when building with `cfg(docsrs)`: it
// exposes the item names and signatures the rest of this file relies on, but
// with empty tables and lookups that always miss.
// NOTE(review): presumably needed because the generated catalog file is not
// available in docs.rs builds — confirm against the build script.
#[cfg(docsrs)]
#[allow(dead_code)]
mod capability_generated {
    /// Pricing figures attached to a catalog [`Entry`]; every figure is optional.
    #[derive(Clone, Copy)]
    pub struct Pricing {
        pub input: Option<f64>,
        pub output: Option<f64>,
        pub cache_read: Option<f64>,
        pub cache_write: Option<f64>,
    }

    /// One catalog row. The field set matches what `generated_catalog_entry`
    /// copies into the public `ModelCatalogEntry`.
    #[derive(Clone, Copy)]
    pub struct Entry {
        pub provider: &'static str,
        pub id: &'static str,
        pub display_name: &'static str,
        pub description: &'static str,
        pub context_window: usize,
        pub max_output_tokens: Option<usize>,
        pub reasoning: bool,
        pub tool_call: bool,
        pub vision: bool,
        pub input_modalities: &'static [&'static str],
        pub caching: bool,
        pub structured_output: bool,
        pub pricing: Pricing,
    }

    /// Empty in the stub: no catalog rows are available.
    pub const ENTRIES: &[Entry] = &[];
    /// Empty in the stub: no provider keys are available.
    pub const PROVIDERS: &[&str] = &[];

    /// Stub lookup: always returns `None`, whatever the provider and id.
    pub fn metadata_for(_provider: &str, _id: &str) -> Option<Entry> {
        None
    }

    /// Stub lookup: always returns `None`, whatever the provider.
    pub fn models_for_provider(_provider: &str) -> Option<&'static [&'static str]> {
        None
    }
}
50
/// Pricing portion of the catalog metadata generated from `docs/models.json`.
///
/// Every figure is optional.
/// NOTE(review): the unit and currency of these values are not visible in this
/// file — confirm against the catalog source before displaying them.
#[derive(Clone, Copy, Debug, PartialEq)]
pub struct ModelPricing {
    /// Price for input, when the catalog provides one.
    pub input: Option<f64>,
    /// Price for output, when the catalog provides one.
    pub output: Option<f64>,
    /// Price for cache reads, when the catalog provides one.
    pub cache_read: Option<f64>,
    /// Price for cache writes, when the catalog provides one.
    pub cache_write: Option<f64>,
}
59
/// Public view of a single model's catalog metadata.
///
/// Values are copied field-by-field from the generated capability table by
/// `generated_catalog_entry`; all string data is `'static`.
#[derive(Clone, Copy, Debug, PartialEq)]
pub struct ModelCatalogEntry {
    /// Provider key as stored in the generated catalog.
    pub provider: &'static str,
    /// Model identifier as stored in the generated catalog.
    pub id: &'static str,
    /// Display name for the model.
    pub display_name: &'static str,
    /// Free-form description of the model.
    pub description: &'static str,
    /// Context window size (presumably in tokens — confirm against the catalog).
    pub context_window: usize,
    /// Maximum number of output tokens, when the catalog records one.
    pub max_output_tokens: Option<usize>,
    /// Catalog flag: reasoning.
    pub reasoning: bool,
    /// Catalog flag: tool calls. Consulted by `ModelId::supports_tool_calls`.
    pub tool_call: bool,
    /// Catalog flag: vision.
    pub vision: bool,
    /// Input modality names. Returned by `ModelId::input_modalities`.
    pub input_modalities: &'static [&'static str],
    /// Catalog flag: caching.
    pub caching: bool,
    /// Catalog flag: structured output.
    pub structured_output: bool,
    /// Pricing figures for this model.
    pub pricing: ModelPricing,
}
76
/// Normalizes a caller-supplied provider name to the key used by the generated catalog.
///
/// Matching is ASCII case-insensitive. `"google"` is accepted as an alias for
/// `"gemini"`. Every key produced by `capability_provider_key` is recognised, so
/// spellings such as `"Copilot"` or `"OpenCode-Zen"` resolve to the same lowercase
/// key that a `Provider` value would. Names that match no known key are returned
/// unchanged (original casing preserved) and are left for the catalog lookup to
/// accept or reject.
fn catalog_provider_key(provider: &str) -> &str {
    // Canonical catalog keys; keep in sync with `capability_provider_key`.
    const CANONICAL_KEYS: &[&str] = &[
        "gemini",
        "openai",
        "anthropic",
        "copilot",
        "deepseek",
        "openrouter",
        "ollama",
        "lmstudio",
        "moonshot",
        "zai",
        "minimax",
        "mimo",
        "mistral",
        "huggingface",
        "opencode-zen",
        "opencode-go",
        "qwen",
        "poolside",
    ];

    // "google" is the only alias that maps to a differently named key.
    if provider.eq_ignore_ascii_case("google") {
        return "gemini";
    }

    CANONICAL_KEYS
        .iter()
        .copied()
        .find(|key| provider.eq_ignore_ascii_case(key))
        .unwrap_or(provider)
}
106
/// Maps a [`Provider`] to the lowercase key passed to the generated capability
/// catalog (see `ModelId::generated_capabilities`).
///
/// The match has no wildcard arm, so adding a `Provider` variant fails to
/// compile until a key is chosen for it here.
fn capability_provider_key(provider: Provider) -> &'static str {
    match provider {
        Provider::Gemini => "gemini",
        Provider::OpenAI => "openai",
        Provider::Anthropic => "anthropic",
        Provider::Copilot => "copilot",
        Provider::DeepSeek => "deepseek",
        Provider::OpenRouter => "openrouter",
        Provider::Ollama => "ollama",
        Provider::LmStudio => "lmstudio",
        Provider::Moonshot => "moonshot",
        Provider::ZAI => "zai",
        Provider::Minimax => "minimax",
        Provider::MiMo => "mimo",
        Provider::Mistral => "mistral",
        Provider::HuggingFace => "huggingface",
        // The OpenCode keys are the only ones that contain a hyphen.
        Provider::OpenCodeZen => "opencode-zen",
        Provider::OpenCodeGo => "opencode-go",
        Provider::Qwen => "qwen",
        Provider::Poolside => "poolside",
    }
}
129
130fn generated_catalog_entry(provider: &str, id: &str) -> Option<ModelCatalogEntry> {
131    capability_generated::metadata_for(catalog_provider_key(provider), id).map(|entry| {
132        ModelCatalogEntry {
133            provider: entry.provider,
134            id: entry.id,
135            display_name: entry.display_name,
136            description: entry.description,
137            context_window: entry.context_window,
138            max_output_tokens: entry.max_output_tokens,
139            reasoning: entry.reasoning,
140            tool_call: entry.tool_call,
141            vision: entry.vision,
142            input_modalities: entry.input_modalities,
143            caching: entry.caching,
144            structured_output: entry.structured_output,
145            pricing: ModelPricing {
146                input: entry.pricing.input,
147                output: entry.pricing.output,
148                cache_read: entry.pricing.cache_read,
149                cache_write: entry.pricing.cache_write,
150            },
151        }
152    })
153}
154
/// Returns the catalog metadata for model `id` of `provider`, if the generated
/// catalog has an entry for it.
///
/// Public entry point; delegates to `generated_catalog_entry`, which normalizes
/// the provider name before the lookup.
pub fn model_catalog_entry(provider: &str, id: &str) -> Option<ModelCatalogEntry> {
    generated_catalog_entry(provider, id)
}
158
/// Returns the model identifiers the generated catalog lists for `provider`,
/// or `None` when the catalog has no list for that provider.
///
/// The provider name is normalized with `catalog_provider_key` before the lookup.
pub fn supported_models_for_provider(provider: &str) -> Option<&'static [&'static str]> {
    capability_generated::models_for_provider(catalog_provider_key(provider))
}
162
/// Returns the provider keys exposed by the generated catalog
/// (`capability_generated::PROVIDERS`); empty in `cfg(docsrs)` builds.
pub fn catalog_provider_keys() -> &'static [&'static str] {
    capability_generated::PROVIDERS
}
166
167impl ModelId {
    /// Generated catalog entry for this model, if one exists.
    ///
    /// Looks the model up by its provider's catalog key and its string id.
    fn generated_capabilities(&self) -> Option<ModelCatalogEntry> {
        generated_catalog_entry(capability_provider_key(self.provider()), self.as_str())
    }
171
172    /// Preferred built-in lightweight sibling or lower-tier fallback for this model.
173    pub fn preferred_lightweight_variant(&self) -> Option<Self> {
174        match self {
175            ModelId::Gemini31ProPreview | ModelId::Gemini31ProPreviewCustomTools => {
176                Some(ModelId::Gemini31FlashLitePreview)
177            }
178            ModelId::GPT55 | ModelId::GPT54 | ModelId::GPT54Pro => Some(ModelId::GPT54Mini),
179            ModelId::OpenCodeZenGPT54 => Some(ModelId::OpenCodeZenGPT54Mini),
180            ModelId::GPT52
181            | ModelId::GPT52Codex
182            | ModelId::GPT53Codex
183            | ModelId::GPT51Codex
184            | ModelId::GPT51CodexMax
185            | ModelId::GPT5
186            | ModelId::GPT5Codex => Some(ModelId::GPT5Mini),
187            ModelId::ClaudeOpus48
188            | ModelId::ClaudeOpus47
189            | ModelId::ClaudeOpus46
190            | ModelId::ClaudeSonnet46
191            | ModelId::ClaudeMythosPreview => Some(ModelId::ClaudeHaiku45),
192            ModelId::CopilotGPT54 => Some(ModelId::CopilotGPT54Mini),
193            ModelId::CopilotGPT52Codex | ModelId::CopilotGPT51CodexMax => {
194                Some(ModelId::CopilotGPT54Mini)
195            }
196            ModelId::DeepSeekV4Pro => Some(ModelId::DeepSeekV4Flash),
197            ModelId::HuggingFaceDeepseekV4ProTogether => {
198                Some(ModelId::HuggingFaceDeepseekV4FlashNovita)
199            }
200            ModelId::OllamaDeepseekV4ProCloud => Some(ModelId::OllamaDeepseekV4FlashCloud),
201            ModelId::ZaiGlm51 => Some(ModelId::ZaiGlm5),
202            ModelId::MinimaxM27 => Some(ModelId::MinimaxM25),
203            ModelId::OpenCodeGoMinimaxM27 => Some(ModelId::OpenCodeGoMinimaxM25),
204            ModelId::PoolsideLagunaM1 => Some(ModelId::PoolsideLagunaXs2),
205            _ => None,
206        }
207    }
208
209    /// Attempt to find a non-reasoning variant for this model.
210    pub fn non_reasoning_variant(&self) -> Option<Self> {
211        if let Some(meta) = self.openrouter_metadata() {
212            if !meta.reasoning {
213                return None;
214            }
215
216            let vendor = meta.vendor;
217            let mut candidates: Vec<Self> = Self::openrouter_vendor_groups()
218                .into_iter()
219                .find(|(candidate_vendor, _)| *candidate_vendor == vendor)
220                .map(|(_, models)| {
221                    models
222                        .iter()
223                        .copied()
224                        .filter(|candidate| candidate != self)
225                        .filter(|candidate| {
226                            candidate
227                                .openrouter_metadata()
228                                .map(|other| !other.reasoning)
229                                .unwrap_or(false)
230                        })
231                        .collect()
232                })
233                .unwrap_or_default();
234
235            if candidates.is_empty() {
236                return None;
237            }
238
239            candidates.sort_by_key(|candidate| {
240                candidate
241                    .openrouter_metadata()
242                    .map(|data| (!data.efficient, data.display))
243                    .unwrap_or((true, ""))
244            });
245
246            return candidates.into_iter().next();
247        }
248
249        let direct = match self {
250            ModelId::Gemini31ProPreview
251            | ModelId::Gemini31ProPreviewCustomTools
252            | ModelId::Gemini31FlashLitePreview => Some(ModelId::Gemini3FlashPreview),
253            ModelId::GPT55
254            | ModelId::GPT52
255            | ModelId::GPT54
256            | ModelId::GPT54Pro
257            | ModelId::GPT54Nano
258            | ModelId::GPT54Mini
259            | ModelId::GPT5 => Some(ModelId::GPT5Mini),
260            ModelId::OpenCodeZenGPT54 => Some(ModelId::OpenCodeZenGPT54Mini),
261            ModelId::CopilotGPT52Codex | ModelId::CopilotGPT54 => Some(ModelId::CopilotGPT54Mini),
262            ModelId::DeepSeekV4Pro => Some(ModelId::DeepSeekV4Flash),
263            ModelId::HuggingFaceDeepseekV4ProTogether => {
264                Some(ModelId::HuggingFaceDeepseekV4FlashNovita)
265            }
266            ModelId::OllamaDeepseekV4ProCloud => Some(ModelId::OllamaDeepseekV4FlashCloud),
267            ModelId::ZaiGlm5 | ModelId::ZaiGlm51 => Some(ModelId::OllamaGlm5Cloud),
268            ModelId::ClaudeOpus48
269            | ModelId::ClaudeOpus47
270            | ModelId::ClaudeOpus46
271            | ModelId::ClaudeSonnet46
272            | ModelId::ClaudeMythosPreview => Some(ModelId::ClaudeSonnet46),
273            ModelId::OpenCodeGoMinimaxM27 => Some(ModelId::OpenCodeGoMinimaxM25),
274            ModelId::MinimaxM27 | ModelId::MinimaxM25 => None,
275            _ => None,
276        };
277
278        direct.and_then(|candidate| {
279            if candidate.supports_reasoning_effort() {
280                None
281            } else {
282                Some(candidate)
283            }
284        })
285    }
286
    /// Check if this is a "flash" variant (optimized for speed)
    ///
    /// Pure membership test against the hard-coded list below; no catalog or
    /// OpenRouter metadata is consulted.
    pub fn is_flash_variant(&self) -> bool {
        matches!(
            self,
            ModelId::Gemini3FlashPreview
                | ModelId::Gemini31FlashLitePreview
                | ModelId::OpenRouterStepfunStep35FlashFree
                // NOTE(review): the only entry without "Flash" in its name — confirm.
                | ModelId::OpenRouterNvidiaNemotron3Super120bA12bFree
                | ModelId::OllamaGemini3FlashPreviewCloud
                | ModelId::HuggingFaceStep35Flash
                | ModelId::HuggingFaceDeepseekV4FlashNovita
        )
    }
300
    /// Check if this is a "pro" variant (optimized for capability)
    ///
    /// Pure membership test against the hard-coded list below; no catalog or
    /// OpenRouter metadata is consulted.
    pub fn is_pro_variant(&self) -> bool {
        matches!(
            self,
            ModelId::Gemini31ProPreview
                | ModelId::Gemini31ProPreviewCustomTools
                | ModelId::OpenRouterGoogleGemini31ProPreview
                | ModelId::GPT55
                | ModelId::GPT5
                | ModelId::GPT52
                | ModelId::GPT52Codex
                | ModelId::GPT54
                | ModelId::GPT54Pro
                | ModelId::GPT53Codex
                | ModelId::GPT51Codex
                | ModelId::GPT51CodexMax
                | ModelId::CopilotGPT52Codex
                | ModelId::CopilotGPT51CodexMax
                | ModelId::CopilotGPT54
                | ModelId::CopilotClaudeSonnet46
                | ModelId::GPT5Codex
                | ModelId::ClaudeOpus48
                | ModelId::ClaudeOpus47
                | ModelId::ClaudeOpus46
                | ModelId::ClaudeSonnet46
                | ModelId::ClaudeMythosPreview
                | ModelId::OpenCodeZenGPT54
                | ModelId::OpenCodeZenClaudeSonnet46
                | ModelId::OpenCodeZenGlm51
                | ModelId::OpenCodeZenKimiK25
                | ModelId::OpenCodeGoGlm51
                | ModelId::OpenCodeGoKimiK25
                | ModelId::OpenCodeGoMinimaxM27
                | ModelId::DeepSeekV4Pro
                | ModelId::ZaiGlm5
                | ModelId::ZaiGlm51
                // NOTE(review): the next two are also listed in `is_flash_variant`,
                // so they report as both "flash" and "pro" — confirm intent.
                | ModelId::OpenRouterStepfunStep35FlashFree
                | ModelId::OpenRouterNvidiaNemotron3Super120bA12bFree
                | ModelId::MinimaxM27
                | ModelId::MinimaxM25
                | ModelId::OpenCodeGoMinimaxM25
                | ModelId::OllamaGlm5Cloud
                | ModelId::OllamaGlm51Cloud
                | ModelId::OllamaNemotron3SuperCloud
                | ModelId::OllamaMinimaxM25Cloud
                | ModelId::HuggingFaceQwen3CoderNextNovita
                | ModelId::HuggingFaceQwen35397BA17BTogether
                | ModelId::HuggingFaceDeepseekV4ProTogether
                | ModelId::OpenRouterMoonshotaiKimiK26
                | ModelId::PoolsideLagunaM1
        )
    }
353
354    /// Check if this is an optimized/efficient variant
355    pub fn is_efficient_variant(&self) -> bool {
356        if let Some(meta) = self.openrouter_metadata() {
357            return meta.efficient;
358        }
359        matches!(
360            self,
361            ModelId::Gemini3FlashPreview
362                | ModelId::Gemini31FlashLitePreview
363                | ModelId::GPT5Mini
364                | ModelId::GPT5Nano
365                | ModelId::CopilotGPT54Mini
366                | ModelId::ClaudeHaiku45
367                | ModelId::OpenCodeZenGPT54Mini
368                | ModelId::OpenCodeGoMinimaxM25
369                | ModelId::DeepSeekV4Flash
370                | ModelId::HuggingFaceStep35Flash
371                | ModelId::HuggingFaceDeepseekV4FlashNovita
372                | ModelId::PoolsideLagunaXs2
373        )
374    }
375
376    /// Check if this is a top-tier model
377    pub fn is_top_tier(&self) -> bool {
378        if let Some(meta) = self.openrouter_metadata() {
379            return meta.top_tier;
380        }
381        matches!(
382            self,
383            ModelId::Gemini31ProPreview
384                | ModelId::Gemini31ProPreviewCustomTools
385                | ModelId::OpenRouterGoogleGemini31ProPreview
386                | ModelId::Gemini3FlashPreview
387                | ModelId::Gemini31FlashLitePreview
388                | ModelId::GPT55
389                | ModelId::GPT5
390                | ModelId::GPT52
391                | ModelId::GPT52Codex
392                | ModelId::GPT54
393                | ModelId::GPT54Pro
394                | ModelId::GPT53Codex
395                | ModelId::GPT51Codex
396                | ModelId::GPT51CodexMax
397                | ModelId::GPT5Codex
398                | ModelId::ClaudeOpus48
399                | ModelId::ClaudeOpus47
400                | ModelId::ClaudeOpus46
401                | ModelId::ClaudeSonnet46
402                | ModelId::ClaudeMythosPreview
403                | ModelId::OpenCodeZenGPT54
404                | ModelId::OpenCodeZenClaudeSonnet46
405                | ModelId::OpenCodeZenGlm51
406                | ModelId::OpenCodeZenKimiK25
407                | ModelId::OpenCodeGoGlm51
408                | ModelId::OpenCodeGoKimiK25
409                | ModelId::OpenCodeGoMinimaxM27
410                | ModelId::DeepSeekV4Pro
411                | ModelId::ZaiGlm5
412                | ModelId::ZaiGlm51
413                | ModelId::OpenRouterStepfunStep35FlashFree
414                | ModelId::HuggingFaceQwen3CoderNextNovita
415                | ModelId::HuggingFaceQwen35397BA17BTogether
416                | ModelId::HuggingFaceDeepseekV4FlashNovita
417                | ModelId::HuggingFaceDeepseekV4ProTogether
418                | ModelId::OpenRouterMoonshotaiKimiK26
419                | ModelId::PoolsideLagunaM1
420        )
421    }
422
423    /// Determine whether the model is a reasoning-capable variant
424    pub fn is_reasoning_variant(&self) -> bool {
425        if let Some(meta) = self.openrouter_metadata() {
426            return meta.reasoning;
427        }
428        self.provider().supports_reasoning_effort(self.as_str())
429    }
430
431    /// Determine whether the model supports tool calls/function execution
432    pub fn supports_tool_calls(&self) -> bool {
433        if let Some(meta) = self.generated_capabilities() {
434            return meta.tool_call;
435        }
436        if let Some(meta) = self.openrouter_metadata() {
437            return meta.tool_call;
438        }
439        true
440    }
441
442    /// Ordered list of supported input modalities when VT Code has metadata for this model.
443    pub fn input_modalities(&self) -> &'static [&'static str] {
444        self.generated_capabilities()
445            .map(|meta| meta.input_modalities)
446            .unwrap_or(&[])
447    }
448
    /// Get the generation/version string for this model
    ///
    /// Models with OpenRouter metadata return the generation recorded there.
    /// All others are looked up in the table below, and models missing from the
    /// table yield `"unknown"`. The strings are free-form labels whose format
    /// differs between providers (e.g. `"5.4"`, `"k2.5"`, `"deepseek-v4-pro"`).
    pub fn generation(&self) -> &'static str {
        if let Some(meta) = self.openrouter_metadata() {
            return meta.generation;
        }
        match self {
            // Gemini generations
            ModelId::Gemini31ProPreview | ModelId::Gemini31ProPreviewCustomTools => "3.1",
            ModelId::Gemini31FlashLitePreview => "3.1-lite",
            ModelId::Gemini3FlashPreview => "3",
            // OpenAI generations
            ModelId::GPT55 => "5.5",
            ModelId::GPT52 | ModelId::GPT52Codex => "5.2",
            ModelId::GPT54 | ModelId::GPT54Pro | ModelId::GPT54Nano | ModelId::GPT54Mini => "5.4",
            ModelId::GPT53Codex => "5.3",
            ModelId::GPT51Codex | ModelId::GPT51CodexMax => "5.1",
            // NOTE(review): the gpt-oss models share "5" with the GPT-5 family here,
            // while their Ollama/Hugging Face counterparts below use "oss" — confirm.
            ModelId::GPT5
            | ModelId::GPT5Codex
            | ModelId::GPT5Mini
            | ModelId::GPT5Nano
            | ModelId::OpenAIGptOss20b
            | ModelId::OpenAIGptOss120b => "5",
            // Anthropic generations
            ModelId::ClaudeOpus48 => "4.8",
            ModelId::ClaudeOpus47 => "4.7",
            ModelId::ClaudeOpus46 => "4.6",
            ModelId::ClaudeSonnet46 => "4.6",
            ModelId::ClaudeHaiku45 => "4.5",
            ModelId::ClaudeMythosPreview => "preview",
            // DeepSeek generations
            ModelId::DeepSeekV4Pro | ModelId::DeepSeekV4Flash => "4",
            // Z.AI generations
            ModelId::ZaiGlm5 => "5",
            ModelId::ZaiGlm51 => "5.1",
            // OpenCode (Zen / Go) generations
            ModelId::OpenCodeZenGPT54 | ModelId::OpenCodeZenGPT54Mini => "5.4",
            ModelId::OpenCodeZenClaudeSonnet46 => "4.6",
            ModelId::OpenCodeZenGlm51 | ModelId::OpenCodeGoGlm51 => "5.1",
            ModelId::OpenCodeZenKimiK25 | ModelId::OpenCodeGoKimiK25 => "k2.5",
            ModelId::OpenCodeGoMinimaxM25 => "m2.5",
            ModelId::OpenCodeGoMinimaxM27 => "m2.7",
            // Ollama generations (mostly model-family names rather than versions)
            ModelId::OllamaGptOss20b => "oss",
            ModelId::OllamaGptOss20bCloud => "oss-cloud",
            ModelId::OllamaGptOss120bCloud => "oss-cloud",
            // NOTE(review): a Qwen model labelled "oss" — confirm this is intended.
            ModelId::OllamaQwen317b => "oss",
            // NOTE(review): the only label carrying a ":cloud" suffix — confirm.
            ModelId::OllamaQwen3CoderNext => "qwen3-coder-next:cloud",
            ModelId::OllamaDeepseekV32Cloud => "deepseek-v3.2",
            ModelId::OllamaDeepseekV4FlashCloud => "deepseek-v4-flash",
            ModelId::OllamaDeepseekV4ProCloud => "deepseek-v4-pro",
            ModelId::OllamaQwen3Next80bCloud => "qwen3-next",
            ModelId::OllamaMinimaxM2Cloud => "minimax-m2",
            ModelId::OllamaMinimaxM27Cloud => "minimax-m2.7",
            ModelId::OllamaGlm5Cloud => "glm-5",
            ModelId::OllamaGlm51Cloud => "glm-5.1",
            ModelId::OllamaMinimaxM25Cloud => "minimax-m2.5",
            ModelId::OllamaKimiK26Cloud => "kimi-k2.6",
            ModelId::OllamaNemotron3SuperCloud => "nemotron-3",
            ModelId::OllamaGemini3FlashPreviewCloud => "gemini-3",
            ModelId::OllamaLagunaXs2 => "laguna-xs.2",
            // MiniMax models
            ModelId::MinimaxM27 => "M2.7",
            ModelId::MinimaxM25 => "M2.5",
            // Moonshot models
            ModelId::MoonshotKimiK26 => "k2.6",
            ModelId::MoonshotKimiK25 => "k2.5",
            // Hugging Face generations
            ModelId::HuggingFaceDeepseekV32 => "V3.2-Exp",
            ModelId::HuggingFaceOpenAIGptOss20b => "oss",
            ModelId::HuggingFaceOpenAIGptOss120b => "oss",
            ModelId::HuggingFaceMinimaxM25Novita => "m2.5",
            ModelId::HuggingFaceDeepseekV32Novita => "v3.2",
            ModelId::HuggingFaceXiaomiMimoV2FlashNovita => "v2-flash",
            ModelId::HuggingFaceGlm5Novita => "5",
            ModelId::HuggingFaceGlm51ZaiOrg => "5.1",
            ModelId::HuggingFaceKimiK26Novita => "k2.6",
            ModelId::HuggingFaceDeepseekV4FlashNovita => "v4-flash",
            ModelId::HuggingFaceDeepseekV4ProTogether => "v4-pro",
            ModelId::HuggingFaceStep35Flash => "3.5",
            // The OpenRouter variant only reaches this arm when
            // `openrouter_metadata()` returned `None` for it above.
            ModelId::HuggingFaceQwen3CoderNextNovita | ModelId::OpenRouterQwen3CoderNext => {
                "qwen3-coder-next"
            }
            // Poolside models
            ModelId::PoolsideLagunaM1 => "laguna-m.1",
            ModelId::PoolsideLagunaXs2 => "laguna-xs.2",
            // Qwen models
            ModelId::Qwen37Max => "3.7",
            ModelId::Qwen36Flash | ModelId::Qwen36Plus => "3.6",
            ModelId::QwenDeepSeekV4Flash | ModelId::QwenDeepSeekV4Pro => "v4",
            ModelId::QwenGlm51 => "5.1",
            // Anything not listed above has no recorded generation.
            _ => "unknown",
        }
    }
540
    /// Determine if this model supports GPT-5.1+/5.2+/5.3+ shell tool type
    ///
    /// Pure membership test: true only for the OpenAI models listed below, false
    /// for every other model, including the Copilot and OpenCode GPT variants.
    pub fn supports_shell_tool(&self) -> bool {
        matches!(
            self,
            ModelId::GPT55
                | ModelId::GPT52
                | ModelId::GPT52Codex
                | ModelId::GPT54
                | ModelId::GPT54Pro
                | ModelId::GPT53Codex
                | ModelId::GPT51Codex
                | ModelId::GPT51CodexMax
                | ModelId::GPT5Codex
        )
    }
556
    /// Determine if this model supports optimized apply_patch tool
    ///
    /// Currently always `false` for every model; the method is a placeholder.
    pub fn supports_apply_patch_tool(&self) -> bool {
        false // Placeholder for future optimization
    }
561}