1use std::collections::HashMap;
2
3use codewhale_config::ProviderKind;
4use serde::{Deserialize, Serialize};
5
6#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
8pub enum ModelFamily {
9 DeepSeek,
10 Anthropic,
11 OpenAI,
12 Google,
13 Meta,
14 Mistral,
15 Qwen,
16 Grok,
17 Cohere,
18 GptOss,
19 Inferencer,
20}
21
22#[derive(Debug, Clone, Serialize, Deserialize)]
28pub struct ModelInfo {
29 pub id: String,
31 pub provider: ProviderKind,
33 pub aliases: Vec<String>,
35 pub supports_tools: bool,
37 pub supports_reasoning: bool,
39}
40
41#[derive(Debug, Clone, Serialize, Deserialize)]
46pub struct ModelResolution {
47 pub requested: Option<String>,
49 pub resolved: ModelInfo,
51 pub used_fallback: bool,
53 pub fallback_chain: Vec<String>,
55}
56
57#[derive(Debug, Clone)]
63pub struct ModelRegistry {
64 models: Vec<ModelInfo>,
65 alias_map: HashMap<String, usize>,
66}
67
68impl Default for ModelRegistry {
70 fn default() -> Self {
71 let models = vec![
72 ModelInfo {
73 id: "deepseek-v4-pro".to_string(),
74 provider: ProviderKind::Deepseek,
75 aliases: vec![],
76 supports_tools: true,
77 supports_reasoning: true,
78 },
79 ModelInfo {
80 id: "deepseek-v4-flash".to_string(),
81 provider: ProviderKind::Deepseek,
82 aliases: vec![
83 "deepseek-chat".to_string(),
84 "deepseek-reasoner".to_string(),
85 "deepseek-r1".to_string(),
86 "deepseek-v3".to_string(),
87 "deepseek-v3.2".to_string(),
88 ],
89 supports_tools: true,
90 supports_reasoning: true,
91 },
92 ModelInfo {
93 id: "deepseek-ai/deepseek-v4-pro".to_string(),
94 provider: ProviderKind::NvidiaNim,
95 aliases: vec![
96 "deepseek-v4-pro".to_string(),
97 "nvidia-deepseek-v4-pro".to_string(),
98 "nim-deepseek-v4-pro".to_string(),
99 ],
100 supports_tools: true,
101 supports_reasoning: true,
102 },
103 ModelInfo {
104 id: "deepseek-ai/deepseek-v4-flash".to_string(),
105 provider: ProviderKind::NvidiaNim,
106 aliases: vec![
107 "deepseek-v4-flash".to_string(),
108 "deepseek-chat".to_string(),
109 "deepseek-reasoner".to_string(),
110 "nvidia-deepseek-v4-flash".to_string(),
111 "nim-deepseek-v4-flash".to_string(),
112 ],
113 supports_tools: true,
114 supports_reasoning: true,
115 },
116 ModelInfo {
117 id: "deepseek-v4-pro".to_string(),
118 provider: ProviderKind::Openai,
119 aliases: vec!["openai-compatible-deepseek-v4-pro".to_string()],
120 supports_tools: true,
121 supports_reasoning: true,
122 },
123 ModelInfo {
124 id: "deepseek-v4-flash".to_string(),
125 provider: ProviderKind::Openai,
126 aliases: vec!["openai-compatible-deepseek-v4-flash".to_string()],
127 supports_tools: true,
128 supports_reasoning: true,
129 },
130 ModelInfo {
131 id: "deepseek-ai/deepseek-v4-flash".to_string(),
132 provider: ProviderKind::Atlascloud,
133 aliases: vec![
134 "deepseek-v4-flash".to_string(),
135 "atlascloud-deepseek-v4-flash".to_string(),
136 ],
137 supports_tools: true,
138 supports_reasoning: true,
139 },
140 ModelInfo {
141 id: "deepseek-ai/deepseek-v4-pro".to_string(),
142 provider: ProviderKind::Atlascloud,
143 aliases: vec![
144 "deepseek-v4-pro".to_string(),
145 "atlascloud-deepseek-v4-pro".to_string(),
146 ],
147 supports_tools: true,
148 supports_reasoning: true,
149 },
150 ModelInfo {
151 id: "deepseek-reasoner".to_string(),
152 provider: ProviderKind::WanjieArk,
153 aliases: vec![
154 "wanjie-deepseek-reasoner".to_string(),
155 "ark-wanjie-deepseek-reasoner".to_string(),
156 ],
157 supports_tools: true,
158 supports_reasoning: true,
159 },
160 ModelInfo {
161 id: "DeepSeek-V4-Pro".to_string(),
162 provider: ProviderKind::Volcengine,
163 aliases: vec![
164 "deepseek-v4-pro".to_string(),
165 "volcengine-deepseek-v4-pro".to_string(),
166 "ark-deepseek-v4-pro".to_string(),
167 ],
168 supports_tools: true,
169 supports_reasoning: true,
170 },
171 ModelInfo {
172 id: "DeepSeek-V4-Flash".to_string(),
173 provider: ProviderKind::Volcengine,
174 aliases: vec![
175 "deepseek-v4-flash".to_string(),
176 "deepseek-chat".to_string(),
177 "volcengine-deepseek-v4-flash".to_string(),
178 "ark-deepseek-v4-flash".to_string(),
179 ],
180 supports_tools: true,
181 supports_reasoning: true,
182 },
183 ModelInfo {
184 id: "trinity-large-thinking".to_string(),
185 provider: ProviderKind::Arcee,
186 aliases: vec![
187 "trinity".to_string(),
188 "arcee-trinity".to_string(),
189 "arcee-trinity-large-thinking".to_string(),
190 ],
191 supports_tools: true,
192 supports_reasoning: true,
193 },
194 ModelInfo {
195 id: "deepseek/deepseek-v4-pro".to_string(),
196 provider: ProviderKind::Openrouter,
197 aliases: vec![
198 "deepseek-v4-pro".to_string(),
199 "openrouter-deepseek-v4-pro".to_string(),
200 ],
201 supports_tools: true,
202 supports_reasoning: true,
203 },
204 ModelInfo {
205 id: "deepseek/deepseek-v4-flash".to_string(),
206 provider: ProviderKind::Openrouter,
207 aliases: vec![
208 "deepseek-v4-flash".to_string(),
209 "deepseek-chat".to_string(),
210 "deepseek-reasoner".to_string(),
211 "openrouter-deepseek-v4-flash".to_string(),
212 ],
213 supports_tools: true,
214 supports_reasoning: true,
215 },
216 ModelInfo {
217 id: "arcee-ai/trinity-large-thinking".to_string(),
218 provider: ProviderKind::Openrouter,
219 aliases: vec![
220 "trinity".to_string(),
221 "trinity-large-thinking".to_string(),
222 "arcee-trinity-large-thinking".to_string(),
223 ],
224 supports_tools: true,
225 supports_reasoning: true,
226 },
227 ModelInfo {
228 id: "xiaomi/mimo-v2.5-pro".to_string(),
229 provider: ProviderKind::Openrouter,
230 aliases: vec![
231 "openrouter-mimo-v2.5-pro".to_string(),
232 "openrouter-xiaomi-mimo-v2.5-pro".to_string(),
233 ],
234 supports_tools: true,
235 supports_reasoning: true,
236 },
237 ModelInfo {
238 id: "xiaomi/mimo-v2.5".to_string(),
239 provider: ProviderKind::Openrouter,
240 aliases: vec![
241 "openrouter-mimo-v2.5".to_string(),
242 "openrouter-xiaomi-mimo-v2.5".to_string(),
243 ],
244 supports_tools: true,
245 supports_reasoning: true,
246 },
247 ModelInfo {
248 id: "qwen/qwen3.6-flash".to_string(),
249 provider: ProviderKind::Openrouter,
250 aliases: vec!["qwen3.6-flash".to_string(), "qwen-3.6-flash".to_string()],
251 supports_tools: true,
252 supports_reasoning: true,
253 },
254 ModelInfo {
255 id: "qwen/qwen3.6-35b-a3b".to_string(),
256 provider: ProviderKind::Openrouter,
257 aliases: vec![
258 "qwen3.6-35b-a3b".to_string(),
259 "qwen-3.6-35b-a3b".to_string(),
260 ],
261 supports_tools: true,
262 supports_reasoning: true,
263 },
264 ModelInfo {
265 id: "qwen/qwen3.6-max-preview".to_string(),
266 provider: ProviderKind::Openrouter,
267 aliases: vec![
268 "qwen3.6-max-preview".to_string(),
269 "qwen-3.6-max-preview".to_string(),
270 "qwen-max-preview".to_string(),
271 ],
272 supports_tools: true,
273 supports_reasoning: true,
274 },
275 ModelInfo {
276 id: "qwen/qwen3.6-27b".to_string(),
277 provider: ProviderKind::Openrouter,
278 aliases: vec!["qwen3.6-27b".to_string(), "qwen-3.6-27b".to_string()],
279 supports_tools: true,
280 supports_reasoning: true,
281 },
282 ModelInfo {
283 id: "qwen/qwen3.6-plus".to_string(),
284 provider: ProviderKind::Openrouter,
285 aliases: vec!["qwen3.6-plus".to_string(), "qwen-3.6-plus".to_string()],
286 supports_tools: true,
287 supports_reasoning: true,
288 },
289 ModelInfo {
290 id: "moonshotai/kimi-k2.6".to_string(),
291 provider: ProviderKind::Openrouter,
292 aliases: vec!["openrouter-kimi-k2.6".to_string()],
293 supports_tools: true,
294 supports_reasoning: true,
295 },
296 ModelInfo {
297 id: "minimax/minimax-m3".to_string(),
298 provider: ProviderKind::Openrouter,
299 aliases: vec![
300 "minimax-m3".to_string(),
301 "minimax-m-3".to_string(),
302 "openrouter-minimax-m3".to_string(),
303 ],
304 supports_tools: true,
305 supports_reasoning: true,
306 },
307 ModelInfo {
308 id: "z-ai/glm-5.1".to_string(),
309 provider: ProviderKind::Openrouter,
310 aliases: vec!["glm-5.1".to_string(), "zai-glm-5.1".to_string()],
311 supports_tools: true,
312 supports_reasoning: true,
313 },
314 ModelInfo {
315 id: "tencent/hy3-preview".to_string(),
316 provider: ProviderKind::Openrouter,
317 aliases: vec!["hy3-preview".to_string(), "tencent-hy3-preview".to_string()],
318 supports_tools: true,
319 supports_reasoning: true,
320 },
321 ModelInfo {
322 id: "google/gemma-4-31b-it".to_string(),
323 provider: ProviderKind::Openrouter,
324 aliases: vec!["gemma-4-31b".to_string(), "gemma-4-31b-it".to_string()],
325 supports_tools: true,
326 supports_reasoning: true,
327 },
328 ModelInfo {
329 id: "google/gemma-4-26b-a4b-it".to_string(),
330 provider: ProviderKind::Openrouter,
331 aliases: vec![
332 "gemma-4-26b-a4b".to_string(),
333 "gemma-4-26b-a4b-it".to_string(),
334 ],
335 supports_tools: true,
336 supports_reasoning: true,
337 },
338 ModelInfo {
339 id: "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free".to_string(),
340 provider: ProviderKind::Openrouter,
341 aliases: vec![
342 "nemotron-3-nano-omni".to_string(),
343 "nemotron-3-nano-omni-reasoning".to_string(),
344 ],
345 supports_tools: true,
346 supports_reasoning: true,
347 },
348 ModelInfo {
349 id: "mimo-v2.5-pro".to_string(),
350 provider: ProviderKind::XiaomiMimo,
351 aliases: vec![
352 "mimo".to_string(),
353 "pro".to_string(),
354 "xiaomi-mimo-v2.5-pro".to_string(),
355 "xiaomi-mimo-v2-5-pro".to_string(),
356 ],
357 supports_tools: true,
358 supports_reasoning: true,
359 },
360 ModelInfo {
361 id: "mimo-v2.5".to_string(),
362 provider: ProviderKind::XiaomiMimo,
363 aliases: vec![
364 "omni".to_string(),
365 "mimo-omni".to_string(),
366 "v2.5-omni".to_string(),
367 "mimo-v2.5-omni".to_string(),
368 "xiaomi-mimo-v2.5".to_string(),
369 "xiaomi-mimo-v2.5-omni".to_string(),
370 ],
371 supports_tools: true,
372 supports_reasoning: true,
373 },
374 ModelInfo {
375 id: "mimo-v2.5-asr".to_string(),
376 provider: ProviderKind::XiaomiMimo,
377 aliases: vec![
378 "asr".to_string(),
379 "speech-to-text".to_string(),
380 "transcribe".to_string(),
381 ],
382 supports_tools: false,
383 supports_reasoning: false,
384 },
385 ModelInfo {
386 id: "mimo-v2.5-tts".to_string(),
387 provider: ProviderKind::XiaomiMimo,
388 aliases: vec![
389 "tts".to_string(),
390 "speech".to_string(),
391 "mimo-tts".to_string(),
392 ],
393 supports_tools: false,
394 supports_reasoning: false,
395 },
396 ModelInfo {
397 id: "mimo-v2.5-tts-voicedesign".to_string(),
398 provider: ProviderKind::XiaomiMimo,
399 aliases: vec![
400 "voicedesign".to_string(),
401 "voice-design".to_string(),
402 "mimo-voice-design".to_string(),
403 ],
404 supports_tools: false,
405 supports_reasoning: false,
406 },
407 ModelInfo {
408 id: "mimo-v2.5-tts-voiceclone".to_string(),
409 provider: ProviderKind::XiaomiMimo,
410 aliases: vec![
411 "voiceclone".to_string(),
412 "voice-clone".to_string(),
413 "mimo-voice-clone".to_string(),
414 ],
415 supports_tools: false,
416 supports_reasoning: false,
417 },
418 ModelInfo {
419 id: "mimo-v2-tts".to_string(),
420 provider: ProviderKind::XiaomiMimo,
421 aliases: vec!["mimo-v2-speech".to_string()],
422 supports_tools: false,
423 supports_reasoning: false,
424 },
425 ModelInfo {
426 id: "deepseek/deepseek-v4-pro".to_string(),
427 provider: ProviderKind::Novita,
428 aliases: vec![
429 "deepseek-v4-pro".to_string(),
430 "novita-deepseek-v4-pro".to_string(),
431 ],
432 supports_tools: true,
433 supports_reasoning: true,
434 },
435 ModelInfo {
436 id: "deepseek/deepseek-v4-flash".to_string(),
437 provider: ProviderKind::Novita,
438 aliases: vec![
439 "deepseek-v4-flash".to_string(),
440 "deepseek-chat".to_string(),
441 "deepseek-reasoner".to_string(),
442 "novita-deepseek-v4-flash".to_string(),
443 ],
444 supports_tools: true,
445 supports_reasoning: true,
446 },
447 ModelInfo {
448 id: "accounts/fireworks/models/deepseek-v4-pro".to_string(),
449 provider: ProviderKind::Fireworks,
450 aliases: vec![
451 "deepseek-v4-pro".to_string(),
452 "fireworks-deepseek-v4-pro".to_string(),
453 ],
454 supports_tools: true,
455 supports_reasoning: true,
456 },
457 ModelInfo {
458 id: "deepseek-ai/DeepSeek-V4-Pro".to_string(),
459 provider: ProviderKind::Siliconflow,
460 aliases: vec![
461 "deepseek-v4-pro".to_string(),
462 "deepseek-reasoner".to_string(),
463 "deepseek-r1".to_string(),
464 "siliconflow-deepseek-v4-pro".to_string(),
465 ],
466 supports_tools: true,
467 supports_reasoning: true,
468 },
469 ModelInfo {
470 id: "deepseek-ai/DeepSeek-V4-Flash".to_string(),
471 provider: ProviderKind::Siliconflow,
472 aliases: vec![
473 "deepseek-v4-flash".to_string(),
474 "deepseek-chat".to_string(),
475 "deepseek-v3".to_string(),
476 "siliconflow-deepseek-v4-flash".to_string(),
477 ],
478 supports_tools: true,
479 supports_reasoning: true,
480 },
481 ModelInfo {
482 id: "trinity-large-preview".to_string(),
483 provider: ProviderKind::Arcee,
484 aliases: vec!["arcee-trinity-large-preview".to_string()],
485 supports_tools: true,
486 supports_reasoning: false,
487 },
488 ModelInfo {
489 id: "kimi-k2.6".to_string(),
490 provider: ProviderKind::Moonshot,
491 aliases: vec![
492 "kimi".to_string(),
493 "kimi-k2".to_string(),
494 "moonshot-kimi-k2.6".to_string(),
495 ],
496 supports_tools: true,
497 supports_reasoning: true,
498 },
499 ModelInfo {
500 id: "deepseek-ai/DeepSeek-V4-Pro".to_string(),
501 provider: ProviderKind::Sglang,
502 aliases: vec![
503 "deepseek-v4-pro".to_string(),
504 "sglang-deepseek-v4-pro".to_string(),
505 ],
506 supports_tools: true,
507 supports_reasoning: true,
508 },
509 ModelInfo {
510 id: "deepseek-ai/DeepSeek-V4-Flash".to_string(),
511 provider: ProviderKind::Sglang,
512 aliases: vec![
513 "deepseek-v4-flash".to_string(),
514 "deepseek-chat".to_string(),
515 "deepseek-reasoner".to_string(),
516 "sglang-deepseek-v4-flash".to_string(),
517 ],
518 supports_tools: true,
519 supports_reasoning: true,
520 },
521 ModelInfo {
522 id: "deepseek-ai/DeepSeek-V4-Pro".to_string(),
523 provider: ProviderKind::Vllm,
524 aliases: vec![
525 "deepseek-v4-pro".to_string(),
526 "vllm-deepseek-v4-pro".to_string(),
527 ],
528 supports_tools: true,
529 supports_reasoning: true,
530 },
531 ModelInfo {
532 id: "deepseek-ai/DeepSeek-V4-Flash".to_string(),
533 provider: ProviderKind::Vllm,
534 aliases: vec![
535 "deepseek-v4-flash".to_string(),
536 "deepseek-chat".to_string(),
537 "deepseek-reasoner".to_string(),
538 "vllm-deepseek-v4-flash".to_string(),
539 ],
540 supports_tools: true,
541 supports_reasoning: true,
542 },
543 ModelInfo {
544 id: "deepseek-coder:1.3b".to_string(),
545 provider: ProviderKind::Ollama,
546 aliases: vec![],
547 supports_tools: true,
548 supports_reasoning: false,
549 },
550 ModelInfo {
551 id: "deepseek-ai/DeepSeek-V4-Pro".to_string(),
552 provider: ProviderKind::Huggingface,
553 aliases: vec![
554 "deepseek-v4-pro".to_string(),
555 "hf-deepseek-v4-pro".to_string(),
556 ],
557 supports_tools: true,
558 supports_reasoning: true,
559 },
560 ModelInfo {
561 id: "deepseek-ai/DeepSeek-V4-Flash".to_string(),
562 provider: ProviderKind::Huggingface,
563 aliases: vec![
564 "deepseek-v4-flash".to_string(),
565 "deepseek-chat".to_string(),
566 "deepseek-reasoner".to_string(),
567 "hf-deepseek-v4-flash".to_string(),
568 ],
569 supports_tools: true,
570 supports_reasoning: true,
571 },
572 ];
573 Self::new(models)
574 }
575}
576
577impl ModelRegistry {
578 #[must_use]
584 pub fn new(models: Vec<ModelInfo>) -> Self {
585 let mut alias_map = HashMap::new();
586 for (idx, model) in models.iter().enumerate() {
587 alias_map.entry(normalize(&model.id)).or_insert(idx);
588 for alias in &model.aliases {
589 alias_map.entry(normalize(alias)).or_insert(idx);
590 }
591 }
592 Self { models, alias_map }
593 }
594
595 #[must_use]
597 pub fn list(&self) -> Vec<ModelInfo> {
598 self.models.clone()
599 }
600
601 #[must_use]
613 pub fn resolve(
614 &self,
615 requested: Option<&str>,
616 provider_hint: Option<ProviderKind>,
617 ) -> ModelResolution {
618 let mut fallback_chain = Vec::new();
619
620 if let Some(name) = requested {
621 fallback_chain.push(format!("requested:{name}"));
622 if provider_hint == Some(ProviderKind::Ollama) {
623 return ModelResolution {
624 requested: Some(name.to_string()),
625 resolved: ModelInfo {
626 id: name.trim().to_string(),
627 provider: ProviderKind::Ollama,
628 aliases: Vec::new(),
629 supports_tools: true,
630 supports_reasoning: false,
631 },
632 used_fallback: false,
633 fallback_chain,
634 };
635 }
636 if let Some(provider) = provider_hint
637 && let Some(model) = self
638 .models
639 .iter()
640 .find(|m| m.provider == provider && model_matches(m, name))
641 .cloned()
642 {
643 return ModelResolution {
644 requested: Some(name.to_string()),
645 resolved: model,
646 used_fallback: false,
647 fallback_chain,
648 };
649 }
650 if provider_hint == Some(ProviderKind::Atlascloud)
651 && let Some(model) = atlascloud_passthrough_model(name)
652 {
653 return ModelResolution {
654 requested: Some(name.to_string()),
655 resolved: model,
656 used_fallback: false,
657 fallback_chain,
658 };
659 }
660 if provider_hint == Some(ProviderKind::Arcee)
661 && let Some(model) = arcee_passthrough_model(name)
662 {
663 return ModelResolution {
664 requested: Some(name.to_string()),
665 resolved: model,
666 used_fallback: false,
667 fallback_chain,
668 };
669 }
670 if provider_hint == Some(ProviderKind::XiaomiMimo)
671 && let Some(model) = xiaomi_mimo_passthrough_model(name)
672 {
673 return ModelResolution {
674 requested: Some(name.to_string()),
675 resolved: model,
676 used_fallback: false,
677 fallback_chain,
678 };
679 }
680 if let Some(idx) = self.alias_map.get(&normalize(name)) {
681 return ModelResolution {
682 requested: Some(name.to_string()),
683 resolved: preserve_requested_model_id_case(self.models[*idx].clone(), name),
684 used_fallback: false,
685 fallback_chain,
686 };
687 }
688 }
689
690 let provider = provider_hint.unwrap_or(ProviderKind::Deepseek);
691 fallback_chain.push(format!("provider_default:{}", provider.as_str()));
692 if let Some(model) = self.models.iter().find(|m| m.provider == provider).cloned() {
693 return ModelResolution {
694 requested: requested.map(ToOwned::to_owned),
695 resolved: model,
696 used_fallback: true,
697 fallback_chain,
698 };
699 }
700
701 let final_fallback = self.models.first().cloned().unwrap_or(ModelInfo {
702 id: "deepseek-v4-pro".to_string(),
703 provider: ProviderKind::Deepseek,
704 aliases: Vec::new(),
705 supports_tools: true,
706 supports_reasoning: true,
707 });
708 fallback_chain.push("global_default:deepseek-v4-pro".to_string());
709 ModelResolution {
710 requested: requested.map(ToOwned::to_owned),
711 resolved: final_fallback,
712 used_fallback: true,
713 fallback_chain,
714 }
715 }
716}
717
718fn normalize(value: &str) -> String {
719 value.trim().to_ascii_lowercase()
720}
721
722#[must_use]
723pub fn model_family(model_id: &str) -> ModelFamily {
725 let normalized = normalize(model_id);
726 if normalized.is_empty() {
727 return ModelFamily::Inferencer;
728 }
729
730 if normalized.contains("deepseek") {
731 return ModelFamily::DeepSeek;
732 }
733 if normalized.contains("claude") || normalized.contains("anthropic") {
734 return ModelFamily::Anthropic;
735 }
736 if normalized.contains("gpt-oss") || normalized.contains("gpt_oss") {
737 return ModelFamily::GptOss;
738 }
739 if normalized.starts_with("gpt-")
740 || normalized.contains("/gpt-")
741 || normalized.contains("openai/")
742 {
743 return ModelFamily::OpenAI;
744 }
745 if normalized.contains("gemini")
746 || normalized.contains("gemma")
747 || normalized.contains("google/")
748 {
749 return ModelFamily::Google;
750 }
751 if normalized.contains("llama") || normalized.contains("meta-") || normalized.contains("meta/")
752 {
753 return ModelFamily::Meta;
754 }
755 if normalized.contains("mistral")
756 || normalized.contains("mixtral")
757 || normalized.contains("codestral")
758 {
759 return ModelFamily::Mistral;
760 }
761 if normalized.contains("qwen") {
762 return ModelFamily::Qwen;
763 }
764 if normalized.contains("grok") {
765 return ModelFamily::Grok;
766 }
767 if normalized.contains("cohere") || normalized.contains("command-r") {
768 return ModelFamily::Cohere;
769 }
770
771 ModelFamily::Inferencer
772}
773
774fn model_matches(model: &ModelInfo, requested: &str) -> bool {
775 let requested = normalize(requested);
776 normalize(&model.id) == requested
777 || model
778 .aliases
779 .iter()
780 .any(|alias| normalize(alias) == requested)
781}
782
783fn preserve_requested_model_id_case(mut model: ModelInfo, requested: &str) -> ModelInfo {
784 let requested = requested.trim();
785 if model.id.eq_ignore_ascii_case(requested) {
786 model.id = requested.to_string();
787 }
788 model
789}
790
791fn atlascloud_passthrough_model(requested: &str) -> Option<ModelInfo> {
792 let requested = requested.trim();
793 if requested.is_empty() || !requested.contains('/') {
794 return None;
795 }
796
797 Some(ModelInfo {
798 id: requested.to_string(),
799 provider: ProviderKind::Atlascloud,
800 aliases: Vec::new(),
801 supports_tools: true,
802 supports_reasoning: true,
803 })
804}
805
806fn arcee_passthrough_model(requested: &str) -> Option<ModelInfo> {
807 let requested = requested.trim();
808 if requested.is_empty() {
809 return None;
810 }
811 let supports_reasoning = requested.to_ascii_lowercase().contains("thinking");
812
813 Some(ModelInfo {
814 id: requested.to_string(),
815 provider: ProviderKind::Arcee,
816 aliases: Vec::new(),
817 supports_tools: true,
818 supports_reasoning,
819 })
820}
821
822fn xiaomi_mimo_passthrough_model(requested: &str) -> Option<ModelInfo> {
823 let requested = requested.trim();
824 if requested.is_empty() || requested.chars().any(char::is_control) {
825 return None;
826 }
827
828 Some(ModelInfo {
829 id: requested.to_string(),
830 provider: ProviderKind::XiaomiMimo,
831 aliases: Vec::new(),
832 supports_tools: true,
833 supports_reasoning: true,
834 })
835}
836
837#[cfg(test)]
838mod tests {
839 use super::*;
840
841 #[test]
842 fn deepseek_v4_pro_alias_stays_deepseek_by_default() {
843 let registry = ModelRegistry::default();
844 let resolved = registry.resolve(Some("deepseek-v4-pro"), None);
845
846 assert_eq!(resolved.resolved.provider, ProviderKind::Deepseek);
847 assert_eq!(resolved.resolved.id, "deepseek-v4-pro");
848 }
849
850 #[test]
851 fn deepseek_v4_pro_alias_resolves_to_nvidia_nim_when_provider_hinted() {
852 let registry = ModelRegistry::default();
853 let resolved = registry.resolve(Some("deepseek-v4-pro"), Some(ProviderKind::NvidiaNim));
854
855 assert_eq!(resolved.resolved.provider, ProviderKind::NvidiaNim);
856 assert_eq!(resolved.resolved.id, "deepseek-ai/deepseek-v4-pro");
857 }
858
859 #[test]
860 fn nvidia_nim_default_uses_catalog_model_id() {
861 let registry = ModelRegistry::default();
862 let resolved = registry.resolve(None, Some(ProviderKind::NvidiaNim));
863
864 assert_eq!(resolved.resolved.provider, ProviderKind::NvidiaNim);
865 assert_eq!(resolved.resolved.id, "deepseek-ai/deepseek-v4-pro");
866 }
867
868 #[test]
869 fn deepseek_v4_flash_alias_resolves_to_nvidia_nim_when_provider_hinted() {
870 let registry = ModelRegistry::default();
871 let resolved = registry.resolve(Some("deepseek-v4-flash"), Some(ProviderKind::NvidiaNim));
872
873 assert_eq!(resolved.resolved.provider, ProviderKind::NvidiaNim);
874 assert_eq!(resolved.resolved.id, "deepseek-ai/deepseek-v4-flash");
875 }
876
877 #[test]
878 fn atlascloud_default_uses_namespaced_model_id() {
879 let registry = ModelRegistry::default();
880 let resolved = registry.resolve(None, Some(ProviderKind::Atlascloud));
881
882 assert_eq!(resolved.resolved.provider, ProviderKind::Atlascloud);
883 assert_eq!(resolved.resolved.id, "deepseek-ai/deepseek-v4-flash");
884 assert!(resolved.resolved.supports_reasoning);
885 }
886
887 #[test]
888 fn deepseek_v4_flash_alias_resolves_to_atlascloud_when_provider_hinted() {
889 let registry = ModelRegistry::default();
890 let resolved = registry.resolve(Some("deepseek-v4-flash"), Some(ProviderKind::Atlascloud));
891
892 assert_eq!(resolved.resolved.provider, ProviderKind::Atlascloud);
893 assert_eq!(resolved.resolved.id, "deepseek-ai/deepseek-v4-flash");
894 }
895
896 #[test]
897 fn deepseek_v4_pro_alias_resolves_to_atlascloud_when_provider_hinted() {
898 let registry = ModelRegistry::default();
899 let resolved = registry.resolve(Some("deepseek-v4-pro"), Some(ProviderKind::Atlascloud));
900
901 assert_eq!(resolved.resolved.provider, ProviderKind::Atlascloud);
902 assert_eq!(resolved.resolved.id, "deepseek-ai/deepseek-v4-pro");
903 }
904
905 #[test]
906 fn atlascloud_provider_hint_passes_through_explicit_model_id() {
907 let registry = ModelRegistry::default();
908 let resolved =
909 registry.resolve(Some("openai/gpt-5.2-chat"), Some(ProviderKind::Atlascloud));
910
911 assert_eq!(resolved.resolved.provider, ProviderKind::Atlascloud);
912 assert_eq!(resolved.resolved.id, "openai/gpt-5.2-chat");
913 assert!(resolved.resolved.supports_tools);
914 assert!(resolved.resolved.supports_reasoning);
915 assert!(!resolved.used_fallback);
916 }
917
918 #[test]
919 fn atlascloud_provider_hint_preserves_explicit_model_id_case() {
920 let registry = ModelRegistry::default();
921 let resolved = registry.resolve(Some("Qwen/Qwen3-Coder"), Some(ProviderKind::Atlascloud));
922
923 assert_eq!(resolved.resolved.provider, ProviderKind::Atlascloud);
924 assert_eq!(resolved.resolved.id, "Qwen/Qwen3-Coder");
925 assert!(!resolved.used_fallback);
926 }
927
928 #[test]
929 fn atlascloud_plain_unknown_model_still_uses_provider_default() {
930 let registry = ModelRegistry::default();
931 let resolved = registry.resolve(Some("not-in-atlas"), Some(ProviderKind::Atlascloud));
932
933 assert_eq!(resolved.resolved.provider, ProviderKind::Atlascloud);
934 assert_eq!(resolved.resolved.id, "deepseek-ai/deepseek-v4-flash");
935 assert!(resolved.used_fallback);
936 }
937
938 #[test]
939 fn openrouter_default_uses_namespaced_model_id() {
940 let registry = ModelRegistry::default();
941 let resolved = registry.resolve(None, Some(ProviderKind::Openrouter));
942
943 assert_eq!(resolved.resolved.provider, ProviderKind::Openrouter);
944 assert_eq!(resolved.resolved.id, "deepseek/deepseek-v4-pro");
945 }
946
947 #[test]
948 fn xiaomi_mimo_default_uses_canonical_model_id() {
949 let registry = ModelRegistry::default();
950 let resolved = registry.resolve(None, Some(ProviderKind::XiaomiMimo));
951
952 assert_eq!(resolved.resolved.provider, ProviderKind::XiaomiMimo);
953 assert_eq!(resolved.resolved.id, "mimo-v2.5-pro");
954 assert!(resolved.resolved.supports_reasoning);
955 }
956
957 #[test]
958 fn xiaomi_mimo_tts_aliases_resolve_when_provider_hinted() {
959 let registry = ModelRegistry::default();
960 let resolved = registry.resolve(Some("tts"), Some(ProviderKind::XiaomiMimo));
961 assert_eq!(resolved.resolved.provider, ProviderKind::XiaomiMimo);
962 assert_eq!(resolved.resolved.id, "mimo-v2.5-tts");
963 assert!(!resolved.resolved.supports_tools);
964 assert!(!resolved.resolved.supports_reasoning);
965
966 let resolved = registry.resolve(Some("voice-design"), Some(ProviderKind::XiaomiMimo));
967 assert_eq!(resolved.resolved.id, "mimo-v2.5-tts-voicedesign");
968
969 let resolved = registry.resolve(Some("voiceclone"), Some(ProviderKind::XiaomiMimo));
970 assert_eq!(resolved.resolved.id, "mimo-v2.5-tts-voiceclone");
971 }
972
973 #[test]
974 fn xiaomi_mimo_chat_aliases_resolve_when_provider_hinted() {
975 let registry = ModelRegistry::default();
976
977 let resolved = registry.resolve(Some("omni"), Some(ProviderKind::XiaomiMimo));
978 assert_eq!(resolved.resolved.provider, ProviderKind::XiaomiMimo);
979 assert_eq!(resolved.resolved.id, "mimo-v2.5");
980 assert!(resolved.resolved.supports_tools);
981 }
982
983 #[test]
984 fn xiaomi_mimo_provider_hint_preserves_custom_model_id() {
985 let registry = ModelRegistry::default();
986 let resolved =
987 registry.resolve(Some("account-custom-mimo"), Some(ProviderKind::XiaomiMimo));
988
989 assert_eq!(resolved.resolved.provider, ProviderKind::XiaomiMimo);
990 assert_eq!(resolved.resolved.id, "account-custom-mimo");
991 assert!(!resolved.used_fallback);
992 }
993
994 #[test]
995 fn xiaomi_mimo_provider_hint_does_not_reclassify_openrouter_model_id() {
996 let registry = ModelRegistry::default();
997 let resolved = registry.resolve(
998 Some("deepseek/deepseek-v4-pro"),
999 Some(ProviderKind::XiaomiMimo),
1000 );
1001
1002 assert_eq!(resolved.resolved.provider, ProviderKind::XiaomiMimo);
1003 assert_eq!(resolved.resolved.id, "deepseek/deepseek-v4-pro");
1004 assert!(!resolved.used_fallback);
1005 }
1006
1007 #[test]
1008 fn wanjie_ark_default_uses_reasoner_model_id() {
1009 let registry = ModelRegistry::default();
1010 let resolved = registry.resolve(None, Some(ProviderKind::WanjieArk));
1011
1012 assert_eq!(resolved.resolved.provider, ProviderKind::WanjieArk);
1013 assert_eq!(resolved.resolved.id, "deepseek-reasoner");
1014 assert!(resolved.resolved.supports_reasoning);
1015 }
1016
1017 #[test]
1018 fn novita_default_uses_namespaced_model_id() {
1019 let registry = ModelRegistry::default();
1020 let resolved = registry.resolve(None, Some(ProviderKind::Novita));
1021
1022 assert_eq!(resolved.resolved.provider, ProviderKind::Novita);
1023 assert_eq!(resolved.resolved.id, "deepseek/deepseek-v4-pro");
1024 }
1025
1026 #[test]
1027 fn fireworks_default_uses_canonical_model_id() {
1028 let registry = ModelRegistry::default();
1029 let resolved = registry.resolve(None, Some(ProviderKind::Fireworks));
1030
1031 assert_eq!(resolved.resolved.provider, ProviderKind::Fireworks);
1032 assert_eq!(
1033 resolved.resolved.id,
1034 "accounts/fireworks/models/deepseek-v4-pro"
1035 );
1036 }
1037
1038 #[test]
1039 fn siliconflow_default_uses_canonical_pro_model_id() {
1040 let registry = ModelRegistry::default();
1041 let resolved = registry.resolve(None, Some(ProviderKind::Siliconflow));
1042
1043 assert_eq!(resolved.resolved.provider, ProviderKind::Siliconflow);
1044 assert_eq!(resolved.resolved.id, "deepseek-ai/DeepSeek-V4-Pro");
1045 assert!(resolved.resolved.supports_reasoning);
1046 }
1047
1048 #[test]
1049 fn arcee_default_uses_direct_trinity_large_thinking_model_id() {
1050 let registry = ModelRegistry::default();
1051 let resolved = registry.resolve(None, Some(ProviderKind::Arcee));
1052
1053 assert_eq!(resolved.resolved.provider, ProviderKind::Arcee);
1054 assert_eq!(resolved.resolved.id, "trinity-large-thinking");
1055 assert!(resolved.resolved.supports_reasoning);
1056 }
1057
1058 #[test]
1059 fn arcee_trinity_alias_resolves_to_direct_large_thinking_not_openrouter() {
1060 let registry = ModelRegistry::default();
1061 let resolved = registry.resolve(Some("trinity"), Some(ProviderKind::Arcee));
1062
1063 assert_eq!(resolved.resolved.provider, ProviderKind::Arcee);
1064 assert_eq!(resolved.resolved.id, "trinity-large-thinking");
1065 assert!(resolved.resolved.supports_reasoning);
1066 }
1067
1068 #[test]
1069 fn arcee_trinity_mini_remains_explicit_compatibility_model() {
1070 let registry = ModelRegistry::default();
1071 let resolved = registry.resolve(Some("trinity-mini"), Some(ProviderKind::Arcee));
1072
1073 assert_eq!(resolved.resolved.provider, ProviderKind::Arcee);
1074 assert_eq!(resolved.resolved.id, "trinity-mini");
1075 assert!(!resolved.resolved.supports_reasoning);
1076 }
1077
1078 #[test]
1079 fn arcee_provider_hint_preserves_explicit_future_model_id() {
1080 let registry = ModelRegistry::default();
1081 let resolved = registry.resolve(Some("trinity-large-next"), Some(ProviderKind::Arcee));
1082
1083 assert_eq!(resolved.resolved.provider, ProviderKind::Arcee);
1084 assert_eq!(resolved.resolved.id, "trinity-large-next");
1085 assert!(!resolved.resolved.supports_reasoning);
1086 assert!(!resolved.used_fallback);
1087 }
1088
1089 #[test]
1090 fn deepseek_reasoner_alias_resolves_to_siliconflow_pro_when_provider_hinted() {
1091 let registry = ModelRegistry::default();
1092 let resolved = registry.resolve(Some("deepseek-reasoner"), Some(ProviderKind::Siliconflow));
1093
1094 assert_eq!(resolved.resolved.provider, ProviderKind::Siliconflow);
1095 assert_eq!(resolved.resolved.id, "deepseek-ai/DeepSeek-V4-Pro");
1096 }
1097
1098 #[test]
1099 fn deepseek_v4_flash_alias_resolves_to_siliconflow_flash_when_provider_hinted() {
1100 let registry = ModelRegistry::default();
1101 let resolved = registry.resolve(Some("deepseek-v4-flash"), Some(ProviderKind::Siliconflow));
1102
1103 assert_eq!(resolved.resolved.provider, ProviderKind::Siliconflow);
1104 assert_eq!(resolved.resolved.id, "deepseek-ai/DeepSeek-V4-Flash");
1105 }
1106
1107 #[test]
1108 fn sglang_default_uses_canonical_model_id() {
1109 let registry = ModelRegistry::default();
1110 let resolved = registry.resolve(None, Some(ProviderKind::Sglang));
1111
1112 assert_eq!(resolved.resolved.provider, ProviderKind::Sglang);
1113 assert_eq!(resolved.resolved.id, "deepseek-ai/DeepSeek-V4-Pro");
1114 }
1115
1116 #[test]
1117 fn deepseek_v4_flash_alias_resolves_to_openrouter_when_provider_hinted() {
1118 let registry = ModelRegistry::default();
1119 let resolved = registry.resolve(Some("deepseek-v4-flash"), Some(ProviderKind::Openrouter));
1120
1121 assert_eq!(resolved.resolved.provider, ProviderKind::Openrouter);
1122 assert_eq!(resolved.resolved.id, "deepseek/deepseek-v4-flash");
1123 }
1124
1125 #[test]
1126 fn recent_openrouter_large_model_aliases_resolve_when_provider_hinted() {
1127 let registry = ModelRegistry::default();
1128
1129 for (alias, expected) in [
1130 ("trinity-large-thinking", "arcee-ai/trinity-large-thinking"),
1131 ("qwen3.6-flash", "qwen/qwen3.6-flash"),
1132 ("qwen3.6-35b-a3b", "qwen/qwen3.6-35b-a3b"),
1133 ("qwen3.6-max-preview", "qwen/qwen3.6-max-preview"),
1134 ("qwen3.6-plus", "qwen/qwen3.6-plus"),
1135 ("gemma-4-31b-it", "google/gemma-4-31b-it"),
1136 ("glm-5.1", "z-ai/glm-5.1"),
1137 ("minimax-m3", "minimax/minimax-m3"),
1138 ("openrouter-mimo-v2.5-pro", "xiaomi/mimo-v2.5-pro"),
1139 ("openrouter-kimi-k2.6", "moonshotai/kimi-k2.6"),
1140 ] {
1141 let resolved = registry.resolve(Some(alias), Some(ProviderKind::Openrouter));
1142
1143 assert_eq!(resolved.resolved.provider, ProviderKind::Openrouter);
1144 assert_eq!(resolved.resolved.id, expected);
1145 assert!(resolved.resolved.supports_tools);
1146 assert!(resolved.resolved.supports_reasoning);
1147 }
1148 }
1149
1150 #[test]
1151 fn deepseek_v4_flash_alias_resolves_to_novita_when_provider_hinted() {
1152 let registry = ModelRegistry::default();
1153 let resolved = registry.resolve(Some("deepseek-v4-flash"), Some(ProviderKind::Novita));
1154
1155 assert_eq!(resolved.resolved.provider, ProviderKind::Novita);
1156 assert_eq!(resolved.resolved.id, "deepseek/deepseek-v4-flash");
1157 }
1158
1159 #[test]
1160 fn deepseek_v4_flash_alias_resolves_to_sglang_when_provider_hinted() {
1161 let registry = ModelRegistry::default();
1162 let resolved = registry.resolve(Some("deepseek-v4-flash"), Some(ProviderKind::Sglang));
1163
1164 assert_eq!(resolved.resolved.provider, ProviderKind::Sglang);
1165 assert_eq!(resolved.resolved.id, "deepseek-ai/DeepSeek-V4-Flash");
1166 }
1167
1168 #[test]
1169 fn vllm_default_uses_canonical_model_id() {
1170 let registry = ModelRegistry::default();
1171 let resolved = registry.resolve(None, Some(ProviderKind::Vllm));
1172
1173 assert_eq!(resolved.resolved.provider, ProviderKind::Vllm);
1174 assert_eq!(resolved.resolved.id, "deepseek-ai/DeepSeek-V4-Pro");
1175 }
1176
1177 #[test]
1178 fn ollama_default_uses_small_local_model_id() {
1179 let registry = ModelRegistry::default();
1180 let resolved = registry.resolve(None, Some(ProviderKind::Ollama));
1181
1182 assert_eq!(resolved.resolved.provider, ProviderKind::Ollama);
1183 assert_eq!(resolved.resolved.id, "deepseek-coder:1.3b");
1184 assert!(!resolved.resolved.supports_reasoning);
1185 }
1186
1187 #[test]
1188 fn ollama_requested_model_tag_is_preserved() {
1189 let registry = ModelRegistry::default();
1190 let resolved = registry.resolve(Some("qwen2.5-coder:7b"), Some(ProviderKind::Ollama));
1191
1192 assert_eq!(resolved.resolved.provider, ProviderKind::Ollama);
1193 assert_eq!(resolved.resolved.id, "qwen2.5-coder:7b");
1194 assert!(!resolved.used_fallback);
1195 }
1196
1197 #[test]
1198 fn deepseek_v4_flash_alias_resolves_to_vllm_when_provider_hinted() {
1199 let registry = ModelRegistry::default();
1200 let resolved = registry.resolve(Some("deepseek-v4-flash"), Some(ProviderKind::Vllm));
1201
1202 assert_eq!(resolved.resolved.provider, ProviderKind::Vllm);
1203 assert_eq!(resolved.resolved.id, "deepseek-ai/DeepSeek-V4-Flash");
1204 }
1205
1206 #[test]
1207 fn preserves_requested_model_casing_for_third_party_providers() {
1208 let registry = ModelRegistry::default();
1209 let resolved = registry.resolve(Some("DeepSeek-V4-Pro"), None);
1210
1211 assert_eq!(resolved.resolved.provider, ProviderKind::Deepseek);
1212 assert_eq!(resolved.resolved.id, "DeepSeek-V4-Pro");
1213 }
1214
1215 #[test]
1216 fn registry_casing_takes_priority_over_requested_casing_with_provider_hint() {
1217 let registry = ModelRegistry::default();
1218 let resolved = registry.resolve(Some("DeepSeek-V4-Pro"), Some(ProviderKind::Deepseek));
1219
1220 assert_eq!(resolved.resolved.provider, ProviderKind::Deepseek);
1221 assert_eq!(resolved.resolved.id, "deepseek-v4-pro");
1223 }
1224
1225 #[test]
1226 fn preserves_requested_model_casing_without_surrounding_whitespace() {
1227 let registry = ModelRegistry::default();
1228 let resolved = registry.resolve(Some(" DeepSeek-V4-Pro "), None);
1229
1230 assert_eq!(resolved.resolved.provider, ProviderKind::Deepseek);
1231 assert_eq!(resolved.resolved.id, "DeepSeek-V4-Pro");
1232 }
1233
1234 #[test]
1235 fn alias_match_does_not_override_requested_casing() {
1236 let registry = ModelRegistry::default();
1237 let resolved = registry.resolve(Some("deepseek-reasoner"), None);
1238
1239 assert_eq!(resolved.resolved.provider, ProviderKind::Deepseek);
1240 assert_eq!(resolved.resolved.id, "deepseek-v4-flash");
1241 }
1242
1243 #[test]
1244 fn model_family_classifies_known_model_ids() {
1245 assert_eq!(model_family("deepseek-v4-pro"), ModelFamily::DeepSeek);
1246 assert_eq!(model_family("openai/gpt-5.4"), ModelFamily::OpenAI);
1247 assert_eq!(
1248 model_family("anthropic/claude-opus-4-7"),
1249 ModelFamily::Anthropic
1250 );
1251 assert_eq!(
1252 model_family("meta-llama/llama-3.3-70b-instruct"),
1253 ModelFamily::Meta
1254 );
1255 assert_eq!(model_family("Qwen/Qwen3-Coder"), ModelFamily::Qwen);
1256 }
1257
1258 #[test]
1259 fn model_family_uses_underlying_model_for_router_ids() {
1260 assert_eq!(
1261 model_family("groq/llama-3.3-70b-versatile"),
1262 ModelFamily::Meta
1263 );
1264 assert_eq!(
1265 model_family("openrouter/openai/gpt-5.4"),
1266 ModelFamily::OpenAI
1267 );
1268 assert_eq!(
1269 model_family("fireworks/accounts/fireworks/models/deepseek-v4-pro"),
1270 ModelFamily::DeepSeek
1271 );
1272 }
1273
1274 #[test]
1275 fn model_family_covers_prominent_google_and_mistral_model_names() {
1276 assert_eq!(model_family("google/gemma-3-27b-it"), ModelFamily::Google);
1277 assert_eq!(
1278 model_family("mistralai/mixtral-8x22b"),
1279 ModelFamily::Mistral
1280 );
1281 assert_eq!(model_family("codestral-latest"), ModelFamily::Mistral);
1282 }
1283
1284 #[test]
1285 fn model_family_falls_back_to_inferencer_for_unknown_models() {
1286 assert_eq!(
1287 model_family("custom-gateway/my-private-model"),
1288 ModelFamily::Inferencer
1289 );
1290 assert_eq!(model_family(""), ModelFamily::Inferencer);
1291 }
1292}