Skip to main content

vtcode_config/models/model_id/
capabilities.rs

1use crate::models::Provider;
2
3use super::ModelId;
4
5#[cfg(not(docsrs))]
6#[allow(dead_code)]
7mod capability_generated {
8    include!(concat!(env!("OUT_DIR"), "/model_capabilities.rs"));
9}
10
// Stand-in for the generated catalog when building under `cfg(docsrs)`.
// It exposes the same item names as the code in this file expects from the
// generated module, but with empty tables and lookups that always miss.
#[cfg(docsrs)]
// Nothing in the stub is guaranteed to be referenced.
#[allow(dead_code)]
mod capability_generated {
    /// Pricing figures attached to a catalog entry; each one is optional.
    #[derive(Copy, Clone)]
    pub struct Pricing {
        pub input: Option<f64>,
        pub output: Option<f64>,
        pub cache_read: Option<f64>,
        pub cache_write: Option<f64>,
    }

    /// One row of the model catalog.
    #[derive(Copy, Clone)]
    pub struct Entry {
        pub provider: &'static str,
        pub id: &'static str,
        pub display_name: &'static str,
        pub description: &'static str,
        pub context_window: usize,
        pub max_output_tokens: Option<usize>,
        pub reasoning: bool,
        pub tool_call: bool,
        pub vision: bool,
        pub input_modalities: &'static [&'static str],
        pub caching: bool,
        pub structured_output: bool,
        pub pricing: Pricing,
    }

    /// Empty catalog: the stub carries no entries.
    pub const ENTRIES: &[Entry] = &[];
    /// Empty provider list: the stub knows no providers.
    pub const PROVIDERS: &[&str] = &[];

    /// Always `None`; the stub has no metadata to look up.
    pub fn metadata_for(_provider: &str, _id: &str) -> Option<Entry> {
        None
    }

    /// Always `None`; the stub lists no models for any provider.
    pub fn models_for_provider(_provider: &str) -> Option<&'static [&'static str]> {
        None
    }
}
50
/// Pricing portion of the catalog metadata generated from `docs/models.json`.
///
/// Every figure is optional; `None` means the catalog carries no value for it.
/// NOTE(review): currency and unit are not visible here — confirm against the
/// catalog schema before displaying these numbers.
#[derive(Debug, Clone, Copy, PartialEq)]
pub struct ModelPricing {
    /// Price for input, when known.
    pub input: Option<f64>,
    /// Price for output, when known.
    pub output: Option<f64>,
    /// Price for cache reads, when known.
    pub cache_read: Option<f64>,
    /// Price for cache writes, when known.
    pub cache_write: Option<f64>,
}
59
60#[derive(Clone, Copy, Debug, PartialEq)]
61pub struct ModelCatalogEntry {
62    pub provider: &'static str,
63    pub id: &'static str,
64    pub display_name: &'static str,
65    pub description: &'static str,
66    pub context_window: usize,
67    pub max_output_tokens: Option<usize>,
68    pub reasoning: bool,
69    pub tool_call: bool,
70    pub vision: bool,
71    pub input_modalities: &'static [&'static str],
72    pub caching: bool,
73    pub structured_output: bool,
74    pub pricing: ModelPricing,
75}
76
/// Normalizes a caller-supplied provider name to the key used by the catalog.
///
/// Matching is ASCII case-insensitive. Known aliases (`google` for `gemini`,
/// `llama.cpp` for `llamacpp`) are folded onto their canonical key. Every key
/// produced by `capability_provider_key` is recognised here, so spellings such
/// as `"Copilot"` or `"QWEN"` resolve to the lowercase catalog key rather than
/// silently missing the lookup.
///
/// Names that match nothing in the table are returned unchanged, so callers
/// can still query providers this table does not know about.
fn catalog_provider_key(provider: &str) -> &str {
    // (accepted spelling, canonical catalog key)
    const PROVIDER_ALIASES: &[(&str, &str)] = &[
        ("google", "gemini"),
        ("gemini", "gemini"),
        ("openai", "openai"),
        ("anthropic", "anthropic"),
        ("copilot", "copilot"),
        ("deepseek", "deepseek"),
        ("openrouter", "openrouter"),
        ("ollama", "ollama"),
        ("lmstudio", "lmstudio"),
        ("llamacpp", "llamacpp"),
        ("llama.cpp", "llamacpp"),
        ("moonshot", "moonshot"),
        ("zai", "zai"),
        ("minimax", "minimax"),
        ("mimo", "mimo"),
        ("mistral", "mistral"),
        ("huggingface", "huggingface"),
        ("opencode-zen", "opencode-zen"),
        ("opencode-go", "opencode-go"),
        ("qwen", "qwen"),
        ("stepfun", "stepfun"),
        ("poolside", "poolside"),
    ];

    PROVIDER_ALIASES
        .iter()
        .find(|&&(alias, _)| provider.eq_ignore_ascii_case(alias))
        .map_or(provider, |&(_, key)| key)
}
112
113fn capability_provider_key(provider: Provider) -> &'static str {
114    match provider {
115        Provider::Gemini => "gemini",
116        Provider::OpenAI => "openai",
117        Provider::Anthropic => "anthropic",
118        Provider::Copilot => "copilot",
119        Provider::DeepSeek => "deepseek",
120        Provider::OpenRouter => "openrouter",
121        Provider::Ollama => "ollama",
122        Provider::LmStudio => "lmstudio",
123        Provider::LlamaCpp => "llamacpp",
124        Provider::Moonshot => "moonshot",
125        Provider::ZAI => "zai",
126        Provider::Minimax => "minimax",
127        Provider::MiMo => "mimo",
128        Provider::Mistral => "mistral",
129        Provider::HuggingFace => "huggingface",
130        Provider::OpenCodeZen => "opencode-zen",
131        Provider::OpenCodeGo => "opencode-go",
132        Provider::Qwen => "qwen",
133        Provider::StepFun => "stepfun",
134        Provider::Poolside => "poolside",
135    }
136}
137
138fn generated_catalog_entry(provider: &str, id: &str) -> Option<ModelCatalogEntry> {
139    capability_generated::metadata_for(catalog_provider_key(provider), id).map(|entry| {
140        ModelCatalogEntry {
141            provider: entry.provider,
142            id: entry.id,
143            display_name: entry.display_name,
144            description: entry.description,
145            context_window: entry.context_window,
146            max_output_tokens: entry.max_output_tokens,
147            reasoning: entry.reasoning,
148            tool_call: entry.tool_call,
149            vision: entry.vision,
150            input_modalities: entry.input_modalities,
151            caching: entry.caching,
152            structured_output: entry.structured_output,
153            pricing: ModelPricing {
154                input: entry.pricing.input,
155                output: entry.pricing.output,
156                cache_read: entry.pricing.cache_read,
157                cache_write: entry.pricing.cache_write,
158            },
159        }
160    })
161}
162
163pub fn model_catalog_entry(provider: &str, id: &str) -> Option<ModelCatalogEntry> {
164    generated_catalog_entry(provider, id)
165}
166
167pub fn supported_models_for_provider(provider: &str) -> Option<&'static [&'static str]> {
168    capability_generated::models_for_provider(catalog_provider_key(provider))
169}
170
171pub fn catalog_provider_keys() -> &'static [&'static str] {
172    capability_generated::PROVIDERS
173}
174
175impl ModelId {
176    fn generated_capabilities(&self) -> Option<ModelCatalogEntry> {
177        generated_catalog_entry(capability_provider_key(self.provider()), self.as_str())
178    }
179
180    /// Preferred built-in lightweight sibling or lower-tier fallback for this model.
181    pub fn preferred_lightweight_variant(&self) -> Option<Self> {
182        match self {
183            ModelId::Gemini31ProPreview | ModelId::Gemini31ProPreviewCustomTools => {
184                Some(ModelId::Gemini31FlashLitePreview)
185            }
186            ModelId::GPT55 | ModelId::GPT54 | ModelId::GPT54Pro => Some(ModelId::GPT54Mini),
187            ModelId::OpenCodeZenGPT54 => Some(ModelId::OpenCodeZenGPT54Mini),
188            ModelId::GPT53Codex => Some(ModelId::GPT54Mini),
189            ModelId::ClaudeOpus48 | ModelId::ClaudeSonnet46 | ModelId::ClaudeMythosPreview => {
190                Some(ModelId::ClaudeHaiku45)
191            }
192            ModelId::CopilotGPT54 => Some(ModelId::CopilotGPT54Mini),
193            ModelId::CopilotGPT52Codex | ModelId::CopilotGPT51CodexMax => {
194                Some(ModelId::CopilotGPT54Mini)
195            }
196            ModelId::DeepSeekV4Pro => Some(ModelId::DeepSeekV4Flash),
197            ModelId::HuggingFaceDeepseekV4ProTogether => {
198                Some(ModelId::HuggingFaceDeepseekV4FlashNovita)
199            }
200            ModelId::HuggingFaceDeepseekV4ProNovita => {
201                Some(ModelId::HuggingFaceDeepseekV4FlashNovita)
202            }
203            ModelId::OllamaDeepseekV4ProCloud => Some(ModelId::OllamaDeepseekV4FlashCloud),
204            ModelId::ZaiGlm51 => Some(ModelId::ZaiGlm5),
205            ModelId::MinimaxM27 => Some(ModelId::MinimaxM25),
206            ModelId::OpenCodeGoMinimaxM27 => Some(ModelId::OpenCodeGoMinimaxM25),
207            ModelId::StepFun37Flash => None,
208            ModelId::PoolsideLagunaM1 => Some(ModelId::PoolsideLagunaXs2),
209            _ => None,
210        }
211    }
212
213    /// Attempt to find a non-reasoning variant for this model.
214    pub fn non_reasoning_variant(&self) -> Option<Self> {
215        if let Some(meta) = self.openrouter_metadata() {
216            if !meta.reasoning {
217                return None;
218            }
219
220            let vendor = meta.vendor;
221            let mut candidates: Vec<Self> = Self::openrouter_vendor_groups()
222                .into_iter()
223                .find(|(candidate_vendor, _)| *candidate_vendor == vendor)
224                .map(|(_, models)| {
225                    models
226                        .iter()
227                        .copied()
228                        .filter(|candidate| candidate != self)
229                        .filter(|candidate| {
230                            candidate
231                                .openrouter_metadata()
232                                .map(|other| !other.reasoning)
233                                .unwrap_or(false)
234                        })
235                        .collect()
236                })
237                .unwrap_or_default();
238
239            if candidates.is_empty() {
240                return None;
241            }
242
243            candidates.sort_by_key(|candidate| {
244                candidate
245                    .openrouter_metadata()
246                    .map(|data| (!data.efficient, data.display))
247                    .unwrap_or((true, ""))
248            });
249
250            return candidates.into_iter().next();
251        }
252
253        let direct = match self {
254            ModelId::Gemini31ProPreview
255            | ModelId::Gemini31ProPreviewCustomTools
256            | ModelId::Gemini31FlashLitePreview => Some(ModelId::Gemini35Flash),
257            ModelId::GPT55
258            | ModelId::GPT54
259            | ModelId::GPT54Pro
260            | ModelId::GPT54Nano
261            | ModelId::GPT54Mini => Some(ModelId::GPT54Mini),
262            ModelId::OpenCodeZenGPT54 => Some(ModelId::OpenCodeZenGPT54Mini),
263            ModelId::CopilotGPT52Codex | ModelId::CopilotGPT54 => Some(ModelId::CopilotGPT54Mini),
264            ModelId::DeepSeekV4Pro => Some(ModelId::DeepSeekV4Flash),
265            ModelId::HuggingFaceDeepseekV4ProTogether => {
266                Some(ModelId::HuggingFaceDeepseekV4FlashNovita)
267            }
268            ModelId::HuggingFaceDeepseekV4ProNovita => {
269                Some(ModelId::HuggingFaceDeepseekV4FlashNovita)
270            }
271            ModelId::OllamaDeepseekV4ProCloud => Some(ModelId::OllamaDeepseekV4FlashCloud),
272            ModelId::ZaiGlm5 | ModelId::ZaiGlm51 => Some(ModelId::OllamaGlm5Cloud),
273            ModelId::ClaudeOpus48 | ModelId::ClaudeSonnet46 | ModelId::ClaudeMythosPreview => {
274                Some(ModelId::ClaudeSonnet46)
275            }
276            ModelId::OpenCodeGoMinimaxM27 => Some(ModelId::OpenCodeGoMinimaxM25),
277            ModelId::MinimaxM27 | ModelId::MinimaxM25 => None,
278            _ => None,
279        };
280
281        direct.and_then(|candidate| {
282            if candidate.supports_reasoning_effort() {
283                None
284            } else {
285                Some(candidate)
286            }
287        })
288    }
289
290    /// Check if this is a "flash" variant (optimized for speed)
291    pub fn is_flash_variant(&self) -> bool {
292        matches!(
293            self,
294            ModelId::Gemini31FlashLitePreview
295                | ModelId::Gemini35Flash
296                | ModelId::OpenRouterStepfunStep35FlashFree
297                | ModelId::OpenRouterNvidiaNemotron3Super120bA12bFree
298                | ModelId::HuggingFaceStep35Flash
299                | ModelId::StepFun37Flash
300                | ModelId::HuggingFaceDeepseekV4FlashNovita
301        )
302    }
303
304    /// Check if this is a "pro" variant (optimized for capability)
305    pub fn is_pro_variant(&self) -> bool {
306        matches!(
307            self,
308            ModelId::Gemini31ProPreview
309                | ModelId::Gemini31ProPreviewCustomTools
310                | ModelId::OpenRouterGoogleGemini31ProPreview
311                | ModelId::GPT55
312                | ModelId::GPT54
313                | ModelId::GPT54Pro
314                | ModelId::GPT53Codex
315                | ModelId::CopilotGPT52Codex
316                | ModelId::CopilotGPT51CodexMax
317                | ModelId::CopilotGPT54
318                | ModelId::CopilotClaudeSonnet46
319                | ModelId::ClaudeOpus48
320                | ModelId::ClaudeSonnet46
321                | ModelId::ClaudeMythosPreview
322                | ModelId::OpenCodeZenGPT54
323                | ModelId::OpenCodeZenClaudeSonnet46
324                | ModelId::OpenCodeZenGlm51
325                | ModelId::OpenCodeGoGlm51
326                | ModelId::OpenCodeGoMinimaxM27
327                | ModelId::DeepSeekV4Pro
328                | ModelId::ZaiGlm5
329                | ModelId::ZaiGlm51
330                | ModelId::OpenRouterStepfunStep35FlashFree
331                | ModelId::OpenRouterNvidiaNemotron3Super120bA12bFree
332                | ModelId::MinimaxM27
333                | ModelId::MinimaxM25
334                | ModelId::OpenCodeGoMinimaxM25
335                | ModelId::OllamaGlm5Cloud
336                | ModelId::OllamaGlm51Cloud
337                | ModelId::OllamaNemotron3SuperCloud
338                | ModelId::OllamaMinimaxM25Cloud
339                | ModelId::HuggingFaceQwen3CoderNextNovita
340                | ModelId::HuggingFaceQwen35397BA17BTogether
341                | ModelId::HuggingFaceDeepseekV4ProTogether
342                | ModelId::HuggingFaceGlm51Deepinfra
343                | ModelId::HuggingFaceMinimaxM27Novita
344                | ModelId::HuggingFaceDeepseekV4ProNovita
345                | ModelId::OpenRouterMoonshotaiKimiK26
346                | ModelId::PoolsideLagunaM1
347        )
348    }
349
350    /// Check if this is an optimized/efficient variant
351    pub fn is_efficient_variant(&self) -> bool {
352        if let Some(meta) = self.openrouter_metadata() {
353            return meta.efficient;
354        }
355        matches!(
356            self,
357            ModelId::Gemini31FlashLitePreview
358                | ModelId::Gemini35Flash
359                | ModelId::GPT54Mini
360                | ModelId::CopilotGPT54Mini
361                | ModelId::ClaudeHaiku45
362                | ModelId::OpenCodeZenGPT54Mini
363                | ModelId::OpenCodeGoMinimaxM25
364                | ModelId::DeepSeekV4Flash
365                | ModelId::HuggingFaceStep35Flash
366                | ModelId::HuggingFaceDeepseekV4FlashNovita
367                | ModelId::PoolsideLagunaXs2
368        )
369    }
370
371    /// Check if this is a top-tier model
372    pub fn is_top_tier(&self) -> bool {
373        if let Some(meta) = self.openrouter_metadata() {
374            return meta.top_tier;
375        }
376        matches!(
377            self,
378            ModelId::Gemini31ProPreview
379                | ModelId::Gemini31ProPreviewCustomTools
380                | ModelId::OpenRouterGoogleGemini31ProPreview
381                | ModelId::Gemini31FlashLitePreview
382                | ModelId::Gemini35Flash
383                | ModelId::GPT55
384                | ModelId::GPT54
385                | ModelId::GPT54Pro
386                | ModelId::GPT53Codex
387                | ModelId::ClaudeOpus48
388                | ModelId::ClaudeSonnet46
389                | ModelId::ClaudeMythosPreview
390                | ModelId::OpenCodeZenGPT54
391                | ModelId::OpenCodeZenClaudeSonnet46
392                | ModelId::OpenCodeZenGlm51
393                | ModelId::OpenCodeGoGlm51
394                | ModelId::OpenCodeGoMinimaxM27
395                | ModelId::DeepSeekV4Pro
396                | ModelId::ZaiGlm5
397                | ModelId::ZaiGlm51
398                | ModelId::OpenRouterStepfunStep35FlashFree
399                | ModelId::HuggingFaceQwen3CoderNextNovita
400                | ModelId::HuggingFaceQwen35397BA17BTogether
401                | ModelId::HuggingFaceDeepseekV4FlashNovita
402                | ModelId::HuggingFaceDeepseekV4ProTogether
403                | ModelId::HuggingFaceGlm51Deepinfra
404                | ModelId::HuggingFaceMinimaxM27Novita
405                | ModelId::HuggingFaceDeepseekV4ProNovita
406                | ModelId::OpenRouterMoonshotaiKimiK26
407                | ModelId::PoolsideLagunaM1
408        )
409    }
410
411    /// Determine whether the model is a reasoning-capable variant
412    pub fn is_reasoning_variant(&self) -> bool {
413        if let Some(meta) = self.openrouter_metadata() {
414            return meta.reasoning;
415        }
416        self.provider().supports_reasoning_effort(self.as_str())
417    }
418
419    /// Determine whether the model supports tool calls/function execution
420    pub fn supports_tool_calls(&self) -> bool {
421        if let Some(meta) = self.generated_capabilities() {
422            return meta.tool_call;
423        }
424        if let Some(meta) = self.openrouter_metadata() {
425            return meta.tool_call;
426        }
427        true
428    }
429
430    /// Ordered list of supported input modalities when VT Code has metadata for this model.
431    pub fn input_modalities(&self) -> &'static [&'static str] {
432        self.generated_capabilities()
433            .map(|meta| meta.input_modalities)
434            .unwrap_or(&[])
435    }
436
437    /// Get the generation/version string for this model
438    pub fn generation(&self) -> &'static str {
439        if let Some(meta) = self.openrouter_metadata() {
440            return meta.generation;
441        }
442        match self {
443            // Gemini generations
444            ModelId::Gemini31ProPreview | ModelId::Gemini31ProPreviewCustomTools => "3.1",
445            ModelId::Gemini31FlashLitePreview => "3.1-lite",
446            // OpenAI generations
447            ModelId::GPT55 => "5.5",
448            ModelId::GPT54 | ModelId::GPT54Pro | ModelId::GPT54Nano | ModelId::GPT54Mini => "5.4",
449            ModelId::GPT53Codex => "5.3",
450            ModelId::OpenAIGptOss20b | ModelId::OpenAIGptOss120b => "5",
451            // Anthropic generations
452            ModelId::ClaudeOpus48 => "4.8",
453            ModelId::ClaudeSonnet46 => "4.6",
454            ModelId::ClaudeHaiku45 => "4.5",
455            ModelId::ClaudeMythosPreview => "preview",
456            // DeepSeek generations
457            ModelId::DeepSeekV4Pro | ModelId::DeepSeekV4Flash => "4",
458            // Z.AI generations
459            ModelId::ZaiGlm5 => "5",
460            ModelId::ZaiGlm51 => "5.1",
461            ModelId::Gemini35Flash => "3.5",
462            ModelId::OpenCodeZenGPT54 | ModelId::OpenCodeZenGPT54Mini => "5.4",
463            ModelId::OpenCodeZenClaudeSonnet46 => "4.6",
464            ModelId::OpenCodeZenGlm51 | ModelId::OpenCodeGoGlm51 => "5.1",
465            ModelId::OpenCodeGoMinimaxM25 => "m2.5",
466            ModelId::OpenCodeGoMinimaxM27 => "m2.7",
467            ModelId::OllamaGptOss20b => "oss",
468            ModelId::OllamaGptOss20bCloud => "oss-cloud",
469            ModelId::OllamaGptOss120bCloud => "oss-cloud",
470            ModelId::OllamaQwen317b => "oss",
471            ModelId::OllamaQwen3CoderNext => "qwen3-coder-next:cloud",
472            ModelId::OllamaDeepseekV4FlashCloud => "deepseek-v4-flash",
473            ModelId::OllamaDeepseekV4ProCloud => "deepseek-v4-pro",
474            ModelId::OllamaQwen3Next80bCloud => "qwen3-next",
475            ModelId::OllamaMinimaxM2Cloud => "minimax-m2",
476            ModelId::OllamaMinimaxM27Cloud => "minimax-m2.7",
477            ModelId::OllamaGlm5Cloud => "glm-5",
478            ModelId::OllamaGlm51Cloud => "glm-5.1",
479            ModelId::OllamaMinimaxM25Cloud => "minimax-m2.5",
480            ModelId::OllamaKimiK26Cloud => "kimi-k2.6",
481            ModelId::OllamaNemotron3SuperCloud => "nemotron-3",
482            ModelId::OllamaLagunaXs2 => "laguna-xs.2",
483            ModelId::LlamaCppQwen3627b => "3.6",
484            ModelId::LlamaCppQwen3635bA3b => "3.6",
485            ModelId::LlamaCppGemma426bA4b => "4",
486            ModelId::LlamaCppGemma4E4b => "4",
487            ModelId::LlamaCppGptOss20b => "oss",
488            ModelId::LlamaCppStep35Flash => "3.5",
489            // MiniMax models
490            ModelId::MinimaxM27 => "M2.7",
491            ModelId::MinimaxM25 => "M2.5",
492            // Moonshot models
493            ModelId::MoonshotKimiK26 => "k2.6",
494            // Hugging Face generations
495            ModelId::HuggingFaceOpenAIGptOss20b => "oss",
496            ModelId::HuggingFaceOpenAIGptOss120b => "oss",
497            ModelId::HuggingFaceMinimaxM25Novita => "m2.5",
498            ModelId::HuggingFaceMinimaxM27Novita => "m2.7",
499            ModelId::HuggingFaceGlm5Novita => "5",
500            ModelId::HuggingFaceGlm51ZaiOrg => "5.1",
501            ModelId::HuggingFaceGlm51Deepinfra => "5.1",
502            ModelId::HuggingFaceKimiK26Novita => "k2.6",
503            ModelId::HuggingFaceDeepseekV4FlashNovita => "v4-flash",
504            ModelId::HuggingFaceDeepseekV4ProTogether => "v4-pro",
505            ModelId::HuggingFaceDeepseekV4ProNovita => "v4-pro",
506            ModelId::HuggingFaceStep35Flash => "3.5",
507            ModelId::HuggingFaceQwen3CoderNextNovita | ModelId::OpenRouterQwen3CoderNext => {
508                "qwen3-coder-next"
509            }
510            // Poolside models
511            ModelId::PoolsideLagunaM1 => "laguna-m.1",
512            ModelId::PoolsideLagunaXs2 => "laguna-xs.2",
513            // Qwen models
514            ModelId::Qwen37Max => "3.7",
515            ModelId::Qwen36Flash | ModelId::Qwen36Plus => "3.6",
516            ModelId::QwenDeepSeekV4Flash | ModelId::QwenDeepSeekV4Pro => "v4",
517            ModelId::QwenGlm51 => "5.1",
518            _ => "unknown",
519        }
520    }
521
522    /// Determine if this model supports GPT-5.1+/5.2+/5.3+ shell tool type
523    pub fn supports_shell_tool(&self) -> bool {
524        matches!(
525            self,
526            ModelId::GPT55 | ModelId::GPT54 | ModelId::GPT54Pro | ModelId::GPT53Codex
527        )
528    }
529
530    /// Determine if this model supports optimized apply_patch tool
531    pub fn supports_apply_patch_tool(&self) -> bool {
532        false // Placeholder for future optimization
533    }
534}