// vtcode_config/models/model_id.rs
1use serde::{Deserialize, Serialize};
2
3mod as_str;
4mod capabilities;
5mod collection;
6mod defaults;
7mod description;
8mod display;
9mod format;
10mod openrouter;
11mod parse;
12mod provider;
13
14pub use capabilities::{
15 ModelCatalogEntry, ModelPricing, catalog_provider_keys, model_catalog_entry,
16 supported_models_for_provider,
17};
18
19/// Centralized enum for all supported model identifiers
20#[cfg_attr(feature = "schema", derive(schemars::JsonSchema))]
21#[derive(Clone, Copy, Debug, Default, PartialEq, Eq, Hash, Serialize, Deserialize)]
22pub enum ModelId {
23 // Gemini models
24 /// Gemini 3.1 Pro Preview - Latest Gemini 3.1 Pro flagship
25 Gemini31ProPreview,
26 /// Gemini 3.1 Pro Preview Custom Tools - Optimized for custom tools & bash
27 Gemini31ProPreviewCustomTools,
28 /// Gemini 3.1 Flash Lite Preview - Most cost-efficient model, offering fastest performance for high-frequency, lightweight tasks
29 Gemini31FlashLitePreview,
30 /// Gemini 3 Flash Preview - Our most intelligent model built for speed, combining frontier intelligence with superior search and grounding
31 #[default]
32 Gemini3FlashPreview,
33
34 // OpenAI models
35 /// GPT-5 - Latest most capable OpenAI model (2025-08-07)
36 GPT5,
37 /// GPT-5.2 - Latest flagship general-purpose OpenAI model (2025-12-11)
38 GPT52,
39 /// GPT-5.2 Codex - Code-focused GPT-5.2 variant optimized for agentic coding with xhigh reasoning support
40 GPT52Codex,
41 /// GPT-5.4 - Mainline frontier GPT model for general-purpose and coding work
42 GPT54,
43 /// GPT-5.4 Pro - Higher-compute GPT-5.4 variant for difficult problems
44 GPT54Pro,
45 /// GPT-5.4 Nano - Lightweight GPT-5.4 variant optimized for speed and cost-efficiency
46 GPT54Nano,
47 /// GPT-5.4 Mini - Compact GPT-5.4 variant for cost-effective tasks with reduced reasoning overhead
48 GPT54Mini,
49 /// GPT-5.3 Codex - Code-focused GPT-5.3 variant optimized for agentic coding with reasoning effort support (low, medium, high, xhigh)
50 GPT53Codex,
51 /// GPT-5.1 Codex - Code-focused GPT-5.1 variant optimized for agentic coding
52 GPT51Codex,
53 /// GPT-5.1 Codex Max - Higher-compute GPT-5.1 Codex variant for longer-running engineering tasks
54 GPT51CodexMax,
55 /// GPT-5 Mini - Latest efficient OpenAI model (2025-08-07)
56 GPT5Mini,
57 /// GPT-5 Nano - Latest most cost-effective OpenAI model (2025-08-07)
58 GPT5Nano,
59 /// GPT-5 Codex - Code-focused GPT-5 variant optimized for agentic coding
60 GPT5Codex,
61 /// GPT-OSS 20B - OpenAI's open-source 20B parameter model using harmony
62 OpenAIGptOss20b,
63 /// GPT-OSS 120B - OpenAI's open-source 120B parameter model using harmony
64 OpenAIGptOss120b,
65
66 // Anthropic models
67 /// Claude Opus 4.6 - Next-gen flagship Anthropic model with extended thinking
68 ClaudeOpus46,
69 /// Claude Sonnet 4.6 - Balanced flagship Anthropic model with extended thinking
70 ClaudeSonnet46,
71 /// Claude Haiku 4.5 - Latest efficient Anthropic model (2025-10-15)
72 ClaudeHaiku45,
73 /// GitHub Copilot auto model selection
74 CopilotAuto,
75 /// GitHub Copilot GPT-5.2 Codex
76 CopilotGPT52Codex,
77 /// GitHub Copilot GPT-5.1 Codex Max
78 CopilotGPT51CodexMax,
79 /// GitHub Copilot GPT-5.4
80 CopilotGPT54,
81 /// GitHub Copilot GPT-5.4 Mini
82 CopilotGPT54Mini,
83 /// GitHub Copilot Claude Sonnet 4.6
84 CopilotClaudeSonnet46,
85
86 // DeepSeek models
87 /// DeepSeek V3.2 Chat - Fast non-thinking mode
88 DeepSeekChat,
89 /// DeepSeek V3.2 Reasoner - Thinking mode with structured reasoning output
90 DeepSeekReasoner,
91 // Hugging Face models
92 /// DeepSeek V3.2 via Hugging Face router
93 HuggingFaceDeepseekV32,
94 /// OpenAI GPT-OSS 20B via Hugging Face router
95 HuggingFaceOpenAIGptOss20b,
96 /// OpenAI GPT-OSS 120B via Hugging Face router
97 HuggingFaceOpenAIGptOss120b,
98 /// DeepSeek V3.2 via Novita on Hugging Face router
99 HuggingFaceDeepseekV32Novita,
100 /// Xiaomi MiMo-V2-Flash via Novita on Hugging Face router
101 HuggingFaceXiaomiMimoV2FlashNovita,
102 /// MiniMax M2.5 via Novita on Hugging Face router
103 HuggingFaceMinimaxM25Novita,
104 /// Z.AI GLM-5 via Novita on Hugging Face router
105 HuggingFaceGlm5Novita,
106 /// Z.AI GLM-5.1 via zai-org provider on Hugging Face router
107 HuggingFaceGlm51ZaiOrg,
108 /// Qwen3-Coder-Next via Novita inference provider on Hugging Face router
109 HuggingFaceQwen3CoderNextNovita,
110 /// Qwen3.5-397B-A17B via Together inference provider on Hugging Face router
111 HuggingFaceQwen35397BA17BTogether,
112 /// Step 3.5 Flash via Hugging Face router
113 HuggingFaceStep35Flash,
114
115 /// GLM-5 - Flagship Z.ai foundation model for complex systems
116 ZaiGlm5,
117 /// GLM-5.1 - Next-gen Z.ai foundation model with improved reasoning
118 ZaiGlm51,
119
120 // Moonshot models
121 /// Kimi K2.5 - Moonshot.ai's flagship reasoning model
122 MoonshotKimiK25,
123
124 // Ollama models
125 /// GPT-OSS 20B - Open-weight GPT-OSS 20B model served via Ollama locally
126 OllamaGptOss20b,
127 /// GPT-OSS 20B Cloud - Cloud-hosted GPT-OSS 20B served via Ollama Cloud
128 OllamaGptOss20bCloud,
129 /// GPT-OSS 120B Cloud - Cloud-hosted GPT-OSS 120B served via Ollama Cloud
130 OllamaGptOss120bCloud,
131 /// Qwen3 1.7B - Qwen3 1.7B model served via Ollama
132 OllamaQwen317b,
133 /// Qwen3 Coder Next - Coding-optimized Qwen3 Next model served via Ollama locally
134 OllamaQwen3CoderNext,
135 /// DeepSeek V3.2 Cloud - DeepSeek V3.2 reasoning deployment via Ollama Cloud
136 OllamaDeepseekV32Cloud,
137 /// Qwen3 Next 80B Cloud - Next-generation Qwen3 80B via Ollama Cloud
138 OllamaQwen3Next80bCloud,
139 /// MiniMax-M2 Cloud - Cloud-hosted MiniMax-M2 model served via Ollama Cloud
140 OllamaMinimaxM2Cloud,
141 /// MiniMax-M2.7 Cloud - Cloud-hosted MiniMax-M2.7 model served via Ollama Cloud
142 OllamaMinimaxM27Cloud,
143 /// GLM-5 Cloud - Cloud-hosted GLM-5 model served via Ollama Cloud
144 OllamaGlm5Cloud,
145 /// GLM-5.1 Cloud - Cloud-hosted GLM-5.1 model served via Ollama Cloud
146 OllamaGlm51Cloud,
147 /// MiniMax-M2.5 Cloud - Cloud-hosted MiniMax-M2.5 model served via Ollama Cloud
148 OllamaMinimaxM25Cloud,
149 /// Gemini 3 Flash Preview Cloud - Google Gemini 3 Flash Preview via Ollama Cloud
150 OllamaGemini3FlashPreviewCloud,
151 /// Nemotron 3 Super Cloud - NVIDIA Nemotron 3 Super 120B via Ollama Cloud
152 OllamaNemotron3SuperCloud,
153
154 // MiniMax models
155 /// MiniMax-M2.7 - Recursive self-improvement flagship with 204.8K context
156 MinimaxM27,
157 /// MiniMax-M2.5 - Latest MiniMax model with further improvements in reasoning and coding
158 MinimaxM25,
159
160 // OpenRouter models
161 /// Qwen3 32B - Dense 32B Qwen3 deployment
162 OpenRouterQwen332b,
163 /// Qwen3 30B A3B - Active-parameter 30B Qwen3 model
164 OpenRouterQwen330bA3b,
165 /// Qwen3 30B A3B Instruct 2507 - Instruction-tuned Qwen3 30B A3B
166 OpenRouterQwen330bA3bInstruct2507,
167 /// Qwen3 30B A3B Thinking 2507 - Deliberative Qwen3 30B A3B release
168 OpenRouterQwen330bA3bThinking2507,
169 /// Qwen3 14B - Lightweight Qwen3 14B model
170 OpenRouterQwen314b,
171 /// Qwen3 8B - Compact Qwen3 8B deployment
172 OpenRouterQwen38b,
173 /// Qwen3 Next 80B A3B Instruct - Next-generation Qwen3 instruction model
174 OpenRouterQwen3Next80bA3bInstruct,
175 /// Qwen3 Next 80B A3B Thinking - Next-generation Qwen3 reasoning release
176 OpenRouterQwen3Next80bA3bThinking,
177 /// Qwen3.5-397B-A17B - Native vision-language model with linear attention and sparse MoE, 1M context window
178 OpenRouterQwen35Plus0215,
179 /// Qwen3 Coder - Qwen3-based coding model tuned for IDE workflows
180 OpenRouterQwen3Coder,
181 /// Qwen3 Coder Plus - Premium Qwen3 coding model with long context
182 OpenRouterQwen3CoderPlus,
183 /// Qwen3 Coder Flash - Latency optimised Qwen3 coding model
184 OpenRouterQwen3CoderFlash,
185 /// Qwen3 Coder 30B A3B Instruct - Large Mixture-of-Experts coding deployment
186 OpenRouterQwen3Coder30bA3bInstruct,
187 /// Qwen3 Coder Next - Next-generation Qwen3 coding model with enhanced reasoning
188 OpenRouterQwen3CoderNext,
189 /// DeepSeek V3.2 Chat - Official chat model via OpenRouter
190 OpenRouterDeepseekChat,
191 /// DeepSeek V3.2 - Standard model with thinking support via OpenRouter
192 OpenRouterDeepSeekV32,
193 /// DeepSeek V3.2 Reasoner - Thinking mode via OpenRouter
194 OpenRouterDeepseekReasoner,
195 /// DeepSeek V3.2 Speciale - Enhanced reasoning model (no tool-use)
196 OpenRouterDeepSeekV32Speciale,
197 /// DeepSeek V3.2 Exp - Experimental DeepSeek V3.2 listing
198 OpenRouterDeepSeekV32Exp,
199 /// DeepSeek Chat v3.1 - Advanced DeepSeek model via OpenRouter
200 OpenRouterDeepSeekChatV31,
201 /// DeepSeek R1 - DeepSeek R1 reasoning model with chain-of-thought
202 OpenRouterDeepSeekR1,
203 /// OpenAI gpt-oss-120b - Open-weight 120B reasoning model via OpenRouter
204 OpenRouterOpenAIGptOss120b,
205 /// OpenAI gpt-oss-120b:free - Open-weight 120B reasoning model free tier via OpenRouter
206 OpenRouterOpenAIGptOss120bFree,
207 /// OpenAI gpt-oss-20b - Open-weight 20B deployment via OpenRouter
208 OpenRouterOpenAIGptOss20b,
209 /// OpenAI GPT-5 - OpenAI GPT-5 model accessed through OpenRouter
210 OpenRouterOpenAIGpt5,
211 /// OpenAI GPT-5 Chat - Chat optimised GPT-5 endpoint without tool use
212 OpenRouterOpenAIGpt5Chat,
213
214 /// Gemini 3.1 Pro Preview - Google's latest Gemini 3.1 Pro model via OpenRouter
215 OpenRouterGoogleGemini31ProPreview,
216
217 /// Claude Sonnet 4.5 - Anthropic Claude Sonnet 4.5 listing
218 OpenRouterAnthropicClaudeSonnet45,
219 /// Claude Sonnet 4.6 - Anthropic Claude Sonnet 4.6 listing
220 OpenRouterAnthropicClaudeSonnet46,
221 /// Claude Haiku 4.5 - Anthropic Claude Haiku 4.5 listing
222 OpenRouterAnthropicClaudeHaiku45,
223 /// Mistral Large 3 2512 - Mistral Large 3 2512 model via OpenRouter
224 OpenRouterMistralaiMistralLarge2512,
225 /// DeepSeek V3.1 Nex N1 - Nex AGI DeepSeek V3.1 Nex N1 model via OpenRouter
226 OpenRouterNexAgiDeepseekV31NexN1,
227 /// Step 3.5 Flash (free) - StepFun's most capable open-source reasoning model via OpenRouter
228 OpenRouterStepfunStep35FlashFree,
229 /// Nemotron 3 Super (free) - NVIDIA's 120B hybrid MoE model via OpenRouter
230 OpenRouterNvidiaNemotron3Super120bA12bFree,
231 /// GLM-5 - Z.AI GLM-5 flagship foundation model via OpenRouter
232 OpenRouterZaiGlm5,
233 /// GLM-5.1 - Z.AI GLM-5.1 next-gen foundation model via OpenRouter
234 OpenRouterZaiGlm51,
235 /// MiniMax-M2.5 - MiniMax flagship model via OpenRouter
236 OpenRouterMinimaxM25,
237}