use crate::pricing::ModelPrice;
/// Date stamp associated with this price table, stored as the string `"2026-05-01"`.
///
/// NOTE(review): presumably a `YYYY-MM-DD` date marking when the price data was
/// last refreshed from upstream — confirm against whatever generates this file.
pub const PRICES_UPDATED: &str = "2026-05-01";
/// Human-readable label naming the source of the price data.
///
/// NOTE(review): presumably identifies the upstream dataset the `GENERATED`
/// table was built from — confirm against whatever generates this file.
pub const PRICES_SOURCE: &str = "litellm community registry";
pub const GENERATED: &[(&str, ModelPrice)] = &[
("Qwen/Qwen3-235B-A22B-Instruct-2507-tput", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 6.0, max_input_tokens: Some(262000) }),
("Qwen/Qwen3-235B-A22B-Thinking-2507", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 3.0, max_input_tokens: Some(256000) }),
("Qwen/Qwen3-235B-A22B-fp8-tput", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(40000) }),
("Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(256000) }),
("Qwen/Qwen3-Next-80B-A3B-Instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.5, max_input_tokens: Some(262144) }),
("Qwen/Qwen3-Next-80B-A3B-Thinking", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.5, max_input_tokens: Some(262144) }),
("Qwen/Qwen3.5-397B-A17B", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.6, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/chronos-hermes-13b-v2", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/code-llama-13b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-13b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-13b-python", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-34b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-34b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-34b-python", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-70b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/code-llama-70b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/code-llama-70b-python", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/code-llama-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-7b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-llama-7b-python", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/code-qwen-1p5-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(65536) }),
("accounts/fireworks/models/codegemma-2b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/codegemma-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/cogito-671b-v2-p1", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(163840) }),
("accounts/fireworks/models/cogito-v1-preview-llama-3b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/cogito-v1-preview-llama-70b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/cogito-v1-preview-llama-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/cogito-v1-preview-qwen-14b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/cogito-v1-preview-qwen-32b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/dbrx-instruct", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/deepseek-coder-1b-base", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/deepseek-coder-33b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/deepseek-coder-7b-base", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/deepseek-coder-7b-base-v1p5", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/deepseek-coder-7b-instruct-v1p5", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/deepseek-coder-v2-instruct", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(65536) }),
("accounts/fireworks/models/deepseek-coder-v2-lite-base", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(163840) }),
("accounts/fireworks/models/deepseek-coder-v2-lite-instruct", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(163840) }),
("accounts/fireworks/models/deepseek-prover-v2", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(163840) }),
("accounts/fireworks/models/deepseek-r1", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 8.0, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/deepseek-r1-0528", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 8.0, max_input_tokens: Some(160000) }),
("accounts/fireworks/models/deepseek-r1-0528-distill-qwen3-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/deepseek-r1-basic", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.19, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/deepseek-r1-distill-llama-70b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/deepseek-r1-distill-llama-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/deepseek-r1-distill-qwen-14b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/deepseek-r1-distill-qwen-1p5b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/deepseek-r1-distill-qwen-32b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/deepseek-r1-distill-qwen-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/deepseek-v2-lite-chat", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(163840) }),
("accounts/fireworks/models/deepseek-v2p5", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/deepseek-v3", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/deepseek-v3-0324", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(163840) }),
("accounts/fireworks/models/deepseek-v3p1", ModelPrice { input_per_mtok: 0.56, output_per_mtok: 1.68, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/deepseek-v3p1-terminus", ModelPrice { input_per_mtok: 0.56, output_per_mtok: 1.68, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/deepseek-v3p2", ModelPrice { input_per_mtok: 0.56, output_per_mtok: 1.68, max_input_tokens: Some(163840) }),
("accounts/fireworks/models/devstral-small-2505", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/dobby-mini-unhinged-plus-llama-3-1-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/dobby-unhinged-llama-3-3-70b-new", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/dolphin-2-9-2-qwen2-72b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/dolphin-2p6-mixtral-8x7b", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/ernie-4p5-21b-a3b-pt", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/ernie-4p5-300b-a47b-pt", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/fare-20b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/firefunction-v1", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/firefunction-v2", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/firellava-13b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/firesearch-ocr-v6", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/flux-1-dev", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/flux-1-dev-controlnet-union", ModelPrice { input_per_mtok: 0.001, output_per_mtok: 0.001, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/flux-1-schnell", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/gemma-2b-it", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/gemma-3-27b-it", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/gemma-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/gemma-7b-it", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/gemma2-9b-it", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/glm-4p5", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.19, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/glm-4p5-air", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/glm-4p5v", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/glm-4p6", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.19, max_input_tokens: Some(202800) }),
("accounts/fireworks/models/glm-4p7", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(202800) }),
("accounts/fireworks/models/gpt-oss-120b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/gpt-oss-20b", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/gpt-oss-safeguard-120b", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/gpt-oss-safeguard-20b", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/hermes-2-pro-mistral-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/internvl3-38b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/internvl3-78b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/internvl3-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/kat-coder", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/kat-dev-32b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/kat-dev-72b-exp", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/kimi-k2-instruct", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/kimi-k2-instruct-0905", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/kimi-k2-thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/kimi-k2p5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/llama-guard-2-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/llama-guard-3-1b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama-guard-3-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama-v2-13b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llama-v2-13b-chat", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llama-v2-70b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llama-v2-70b-chat", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(2048) }),
("accounts/fireworks/models/llama-v2-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llama-v2-7b-chat", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llama-v3-70b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/llama-v3-70b-instruct-hf", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/llama-v3-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/llama-v3-8b-instruct-hf", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/llama-v3p1-405b-instruct", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 3.0, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/llama-v3p1-405b-instruct-long", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llama-v3p1-70b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama-v3p1-70b-instruct-1b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llama-v3p1-8b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/llama-v3p1-nemotron-70b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama-v3p2-11b-vision-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/llama-v3p2-1b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama-v3p2-1b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/llama-v3p2-3b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama-v3p2-3b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/llama-v3p2-90b-vision-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/llama-v3p3-70b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama4-maverick-instruct-basic", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llama4-scout-instruct-basic", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/llamaguard-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/llava-yi-34b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/minimax-m1-80k", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/minimax-m2", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/minimax-m2p1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(204800) }),
("accounts/fireworks/models/ministral-3-14b-instruct-2512", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(256000) }),
("accounts/fireworks/models/ministral-3-3b-instruct-2512", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(256000) }),
("accounts/fireworks/models/ministral-3-8b-instruct-2512", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(256000) }),
("accounts/fireworks/models/mistral-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mistral-7b-instruct-4k", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mistral-7b-instruct-v0p2", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mistral-7b-instruct-v3", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mistral-7b-v0p2", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mistral-large-3-fp8", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(256000) }),
("accounts/fireworks/models/mistral-nemo-base-2407", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/mistral-nemo-instruct-2407", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/mistral-small-24b-instruct-2501", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mixtral-8x22b", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(65536) }),
("accounts/fireworks/models/mixtral-8x22b-instruct", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(65536) }),
("accounts/fireworks/models/mixtral-8x22b-instruct-hf", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(65536) }),
("accounts/fireworks/models/mixtral-8x7b", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mixtral-8x7b-instruct", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mixtral-8x7b-instruct-hf", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/mythomax-l2-13b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/nemotron-nano-v2-12b-vl", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/nous-capybara-7b-v1p9", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/nous-hermes-2-mixtral-8x7b-dpo", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/nous-hermes-2-yi-34b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/nous-hermes-llama2-13b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/nous-hermes-llama2-70b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/nous-hermes-llama2-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/nvidia-nemotron-nano-12b-v2", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/nvidia-nemotron-nano-9b-v2", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/openchat-3p5-0106-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/openhermes-2-mistral-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/openhermes-2p5-mistral-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/openorca-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/phi-2-3b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(2048) }),
("accounts/fireworks/models/phi-3-mini-128k-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/phi-3-vision-128k-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32064) }),
("accounts/fireworks/models/phind-code-llama-34b-python-v1", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/phind-code-llama-34b-v1", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/phind-code-llama-34b-v2", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/pythia-12b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(2048) }),
("accounts/fireworks/models/qwen-qwq-32b-preview", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen-v2p5-14b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen-v2p5-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen1p5-72b-chat", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2-72b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2-7b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2-vl-2b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2-vl-72b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2-vl-7b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-0p5b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-14b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen2p5-1p5b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-32b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen2p5-32b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-72b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen2p5-72b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-7b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-0p5b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-0p5b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-14b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-14b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-1p5b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-1p5b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-32b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-32b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/qwen2p5-coder-32b-instruct-128k", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen2p5-coder-32b-instruct-32k-rope", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-32b-instruct-64k", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(65536) }),
("accounts/fireworks/models/qwen2p5-coder-3b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-3b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-coder-7b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/qwen2p5-math-72b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/qwen2p5-vl-32b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/qwen2p5-vl-3b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/qwen2p5-vl-72b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/qwen2p5-vl-7b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/qwen3-0p6b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(40960) }),
("accounts/fireworks/models/qwen3-14b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(40960) }),
("accounts/fireworks/models/qwen3-1p7b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen3-1p7b-fp8-draft", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-1p7b-fp8-draft-131072", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen3-1p7b-fp8-draft-40960", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(40960) }),
("accounts/fireworks/models/qwen3-235b-a22b", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen3-235b-a22b-instruct-2507", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-235b-a22b-thinking-2507", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-30b-a3b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen3-30b-a3b-instruct-2507", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-30b-a3b-thinking-2507", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-32b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/qwen3-4b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(40960) }),
("accounts/fireworks/models/qwen3-4b-instruct-2507", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(40960) }),
("accounts/fireworks/models/qwen3-coder-30b-a3b-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-coder-480b-a35b-instruct", ModelPrice { input_per_mtok: 0.45, output_per_mtok: 1.8, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-coder-480b-instruct-bf16", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/qwen3-next-80b-a3b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/qwen3-next-80b-a3b-thinking", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/qwen3-vl-235b-a22b-instruct", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-vl-235b-a22b-thinking", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-vl-30b-a3b-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-vl-30b-a3b-thinking", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("accounts/fireworks/models/qwen3-vl-32b-instruct", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/qwen3-vl-8b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/qwq-32b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("accounts/fireworks/models/rolm-ocr", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("accounts/fireworks/models/snorkel-mistral-7b-pairrm-dpo", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/stablecode-3b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/starcoder-16b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/starcoder-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("accounts/fireworks/models/starcoder2-15b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/starcoder2-3b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/starcoder2-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("accounts/fireworks/models/toppy-m-7b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/yi-34b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/yi-34b-200k-capybara", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(200000) }),
("accounts/fireworks/models/yi-34b-chat", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/yi-6b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("accounts/fireworks/models/yi-large", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 3.0, max_input_tokens: Some(32768) }),
("accounts/fireworks/models/zephyr-7b-beta", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("ai21.j2-mid-v1", ModelPrice { input_per_mtok: 12.5, output_per_mtok: 12.5, max_input_tokens: Some(8191) }),
("ai21.j2-ultra-v1", ModelPrice { input_per_mtok: 18.8, output_per_mtok: 18.8, max_input_tokens: Some(8191) }),
("ai21.jamba-1-5-large-v1:0", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(256000) }),
("ai21.jamba-1-5-mini-v1:0", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.4, max_input_tokens: Some(256000) }),
("ai21.jamba-instruct-v1:0", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.7, max_input_tokens: Some(70000) }),
("amazon-nova/nova-lite-v1", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.24, max_input_tokens: Some(300000) }),
("amazon-nova/nova-micro-v1", ModelPrice { input_per_mtok: 0.035, output_per_mtok: 0.14, max_input_tokens: Some(128000) }),
("amazon-nova/nova-premier-v1", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 12.5, max_input_tokens: Some(1000000) }),
("amazon-nova/nova-pro-v1", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 3.2, max_input_tokens: Some(300000) }),
("amazon.nova-2-lite-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1000000) }),
("amazon.nova-2-pro-preview-20251202-v1:0", ModelPrice { input_per_mtok: 2.1875, output_per_mtok: 17.5, max_input_tokens: Some(1000000) }),
("amazon.nova-lite-v1:0", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.24, max_input_tokens: Some(300000) }),
("amazon.nova-micro-v1:0", ModelPrice { input_per_mtok: 0.035, output_per_mtok: 0.14, max_input_tokens: Some(128000) }),
("amazon.nova-pro-v1:0", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 3.2, max_input_tokens: Some(300000) }),
("amazon.titan-text-express-v1", ModelPrice { input_per_mtok: 1.3, output_per_mtok: 1.7, max_input_tokens: Some(42000) }),
("amazon.titan-text-lite-v1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.4, max_input_tokens: Some(42000) }),
("amazon.titan-text-premier-v1:0", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(42000) }),
("anthropic.claude-3-5-haiku-20241022-v1:0", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 4.0, max_input_tokens: Some(200000) }),
("anthropic.claude-3-5-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("anthropic.claude-3-5-sonnet-20241022-v2:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("anthropic.claude-3-7-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.6, output_per_mtok: 18.0, max_input_tokens: Some(200000) }),
("anthropic.claude-3-7-sonnet-20250219-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("anthropic.claude-3-haiku-20240307-v1:0", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("anthropic.claude-3-opus-20240229-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("anthropic.claude-3-sonnet-20240229-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("anthropic.claude-haiku-4-5@20251001", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("anthropic.claude-instant-v1", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 2.4, max_input_tokens: Some(100000) }),
("anthropic.claude-opus-4-1-20250805-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("anthropic.claude-opus-4-20250514-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("anthropic.claude-opus-4-5-20251101-v1:0", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("anthropic.claude-opus-4-6-v1", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("anthropic.claude-opus-4-7", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("anthropic.claude-sonnet-4-20250514-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("anthropic.claude-sonnet-4-6", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("anthropic.claude-v1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("anthropic.claude-v2:1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("anthropic/claude-3.5-haiku", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: None }),
("anthropic/claude-3.5-sonnet", ModelPrice { input_per_mtok: 3.75, output_per_mtok: 18.75, max_input_tokens: None }),
("anthropic/claude-3.7-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: None }),
("anthropic/claude-4-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: None }),
("anthropic/claude-4.5-haiku", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: None }),
("anthropic/claude-4.5-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: None }),
("anyscale/HuggingFaceH4/zephyr-7b-beta", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(16384) }),
("anyscale/codellama/CodeLlama-34b-Instruct-hf", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(4096) }),
("anyscale/codellama/CodeLlama-70b-Instruct-hf", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(4096) }),
("anyscale/google/gemma-7b-it", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(8192) }),
("anyscale/meta-llama/Llama-2-13b-chat-hf", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.25, max_input_tokens: Some(4096) }),
("anyscale/meta-llama/Llama-2-70b-chat-hf", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(4096) }),
("anyscale/meta-llama/Llama-2-7b-chat-hf", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(4096) }),
("anyscale/meta-llama/Meta-Llama-3-70B-Instruct", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(8192) }),
("anyscale/meta-llama/Meta-Llama-3-8B-Instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(8192) }),
("anyscale/mistralai/Mistral-7B-Instruct-v0.1", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(16384) }),
("anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(65536) }),
("anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(16384) }),
("ap-northeast-1/anthropic.claude-instant-v1", ModelPrice { input_per_mtok: 2.23, output_per_mtok: 7.55, max_input_tokens: Some(100000) }),
("ap-northeast-1/anthropic.claude-v1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("ap-northeast-1/anthropic.claude-v2:1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("ap-northeast-1/deepseek.v3.2", ModelPrice { input_per_mtok: 0.74, output_per_mtok: 2.22, max_input_tokens: Some(163840) }),
("ap-northeast-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("ap-northeast-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("ap-northeast-1/moonshotai.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.73, output_per_mtok: 3.03, max_input_tokens: Some(262144) }),
("ap-northeast-1/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 3.6, max_input_tokens: Some(262144) }),
("ap-northeast-1/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.44, max_input_tokens: Some(262144) }),
("ap-south-1/deepseek.v3.2", ModelPrice { input_per_mtok: 0.74, output_per_mtok: 2.22, max_input_tokens: Some(163840) }),
("ap-south-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 3.18, output_per_mtok: 4.2, max_input_tokens: Some(8192) }),
("ap-south-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 0.72, max_input_tokens: Some(8192) }),
("ap-south-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("ap-south-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("ap-south-1/moonshotai.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.71, output_per_mtok: 2.94, max_input_tokens: Some(262144) }),
("ap-south-1/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 3.6, max_input_tokens: Some(262144) }),
("ap-south-1/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.44, max_input_tokens: Some(262144) }),
("ap-southeast-2/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.309, output_per_mtok: 1.236, max_input_tokens: Some(1000000) }),
("ap-southeast-3/deepseek.v3.2", ModelPrice { input_per_mtok: 0.74, output_per_mtok: 2.22, max_input_tokens: Some(163840) }),
("ap-southeast-3/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("ap-southeast-3/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("ap-southeast-3/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 3.6, max_input_tokens: Some(262144) }),
("ap-southeast-3/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.44, max_input_tokens: Some(262144) }),
("apac.amazon.nova-2-lite-v1:0", ModelPrice { input_per_mtok: 0.33, output_per_mtok: 2.75, max_input_tokens: Some(1000000) }),
("apac.amazon.nova-2-pro-preview-20251202-v1:0", ModelPrice { input_per_mtok: 2.1875, output_per_mtok: 17.5, max_input_tokens: Some(1000000) }),
("apac.amazon.nova-lite-v1:0", ModelPrice { input_per_mtok: 0.063, output_per_mtok: 0.252, max_input_tokens: Some(300000) }),
("apac.amazon.nova-micro-v1:0", ModelPrice { input_per_mtok: 0.037, output_per_mtok: 0.148, max_input_tokens: Some(128000) }),
("apac.amazon.nova-pro-v1:0", ModelPrice { input_per_mtok: 0.84, output_per_mtok: 3.36, max_input_tokens: Some(300000) }),
("apac.anthropic.claude-3-5-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("apac.anthropic.claude-3-5-sonnet-20241022-v2:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("apac.anthropic.claude-3-haiku-20240307-v1:0", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("apac.anthropic.claude-3-sonnet-20240229-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("apac.anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 5.5, max_input_tokens: Some(200000) }),
("apac.anthropic.claude-sonnet-4-20250514-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("au.anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 5.5, max_input_tokens: Some(200000) }),
("au.anthropic.claude-opus-4-6-v1", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 27.5, max_input_tokens: Some(1000000) }),
("au.anthropic.claude-opus-4-7", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 27.5, max_input_tokens: Some(1000000) }),
("au.anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("au.anthropic.claude-sonnet-4-6", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(1000000) }),
("azure_ai/Llama-3.2-11B-Vision-Instruct", ModelPrice { input_per_mtok: 0.37, output_per_mtok: 0.37, max_input_tokens: Some(128000) }),
("azure_ai/Llama-3.2-90B-Vision-Instruct", ModelPrice { input_per_mtok: 2.04, output_per_mtok: 2.04, max_input_tokens: Some(128000) }),
("azure_ai/Llama-3.3-70B-Instruct", ModelPrice { input_per_mtok: 0.71, output_per_mtok: 0.71, max_input_tokens: Some(128000) }),
("azure_ai/Llama-4-Maverick-17B-128E-Instruct-FP8", ModelPrice { input_per_mtok: 1.41, output_per_mtok: 0.35, max_input_tokens: Some(1000000) }),
("azure_ai/Llama-4-Scout-17B-16E-Instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.78, max_input_tokens: Some(10000000) }),
("azure_ai/MAI-DS-R1", ModelPrice { input_per_mtok: 1.35, output_per_mtok: 5.4, max_input_tokens: Some(128000) }),
("azure_ai/Meta-Llama-3-70B-Instruct", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 0.37, max_input_tokens: Some(8192) }),
("azure_ai/Meta-Llama-3.1-405B-Instruct", ModelPrice { input_per_mtok: 5.33, output_per_mtok: 16.0, max_input_tokens: Some(128000) }),
("azure_ai/Meta-Llama-3.1-70B-Instruct", ModelPrice { input_per_mtok: 2.68, output_per_mtok: 3.54, max_input_tokens: Some(128000) }),
("azure_ai/Meta-Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.61, max_input_tokens: Some(128000) }),
("azure_ai/Phi-3-medium-128k-instruct", ModelPrice { input_per_mtok: 0.17, output_per_mtok: 0.68, max_input_tokens: Some(128000) }),
("azure_ai/Phi-3-medium-4k-instruct", ModelPrice { input_per_mtok: 0.17, output_per_mtok: 0.68, max_input_tokens: Some(4096) }),
("azure_ai/Phi-3-mini-128k-instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.52, max_input_tokens: Some(128000) }),
("azure_ai/Phi-3-mini-4k-instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.52, max_input_tokens: Some(4096) }),
("azure_ai/Phi-3-small-128k-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("azure_ai/Phi-3-small-8k-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("azure_ai/Phi-3.5-MoE-instruct", ModelPrice { input_per_mtok: 0.16, output_per_mtok: 0.64, max_input_tokens: Some(128000) }),
("azure_ai/Phi-3.5-mini-instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.52, max_input_tokens: Some(128000) }),
("azure_ai/Phi-3.5-vision-instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.52, max_input_tokens: Some(128000) }),
("azure_ai/Phi-4", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.5, max_input_tokens: Some(16384) }),
("azure_ai/Phi-4-mini-instruct", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("azure_ai/Phi-4-mini-reasoning", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.32, max_input_tokens: Some(131072) }),
("azure_ai/Phi-4-multimodal-instruct", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.32, max_input_tokens: Some(131072) }),
("azure_ai/Phi-4-reasoning", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.5, max_input_tokens: Some(32768) }),
("azure_ai/claude-haiku-4-5", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("azure_ai/claude-opus-4-1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("azure_ai/claude-opus-4-5", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("azure_ai/claude-opus-4-6", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("azure_ai/claude-opus-4-7", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("azure_ai/claude-sonnet-4-5", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("azure_ai/claude-sonnet-4-6", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("azure_ai/deepseek-r1", ModelPrice { input_per_mtok: 1.35, output_per_mtok: 5.4, max_input_tokens: Some(128000) }),
("azure_ai/deepseek-v3", ModelPrice { input_per_mtok: 1.14, output_per_mtok: 4.56, max_input_tokens: Some(128000) }),
("azure_ai/deepseek-v3-0324", ModelPrice { input_per_mtok: 1.14, output_per_mtok: 4.56, max_input_tokens: Some(128000) }),
("azure_ai/deepseek-v3.2", ModelPrice { input_per_mtok: 0.58, output_per_mtok: 1.68, max_input_tokens: Some(163840) }),
("azure_ai/deepseek-v3.2-speciale", ModelPrice { input_per_mtok: 0.58, output_per_mtok: 1.68, max_input_tokens: Some(163840) }),
("azure_ai/global/grok-3", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("azure_ai/global/grok-3-mini", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.27, max_input_tokens: Some(131072) }),
("azure_ai/gpt-oss-120b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("azure_ai/grok-3", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("azure_ai/grok-3-mini", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.27, max_input_tokens: Some(131072) }),
("azure_ai/grok-4", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("azure_ai/grok-4-1-fast-non-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("azure_ai/grok-4-1-fast-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("azure_ai/grok-4-fast-non-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("azure_ai/grok-4-fast-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("azure_ai/grok-code-fast-1", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.5, max_input_tokens: Some(131072) }),
("azure_ai/jais-30b-chat", ModelPrice { input_per_mtok: 3200.0, output_per_mtok: 9710.0, max_input_tokens: Some(8192) }),
("azure_ai/jamba-instruct", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.7, max_input_tokens: Some(70000) }),
("azure_ai/kimi-k2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("azure_ai/ministral-3b", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.04, max_input_tokens: Some(128000) }),
("azure_ai/mistral-large", ModelPrice { input_per_mtok: 4.0, output_per_mtok: 12.0, max_input_tokens: Some(32000) }),
("azure_ai/mistral-large-2407", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("azure_ai/mistral-large-3", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(256000) }),
("azure_ai/mistral-large-latest", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("azure_ai/mistral-medium-2505", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(131072) }),
("azure_ai/mistral-nemo", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(131072) }),
("azure_ai/mistral-small", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32000) }),
("azure_ai/mistral-small-2503", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(128000) }),
("azure_ai/model_router", ModelPrice { input_per_mtok: 0.14, output_per_mtok: 0.0, max_input_tokens: None }),
("babbage-002", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.4, max_input_tokens: Some(16384) }),
("baseten/MiniMaxAI/MiniMax-M2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: None }),
("baseten/deepseek-ai/DeepSeek-V3-0324", ModelPrice { input_per_mtok: 0.77, output_per_mtok: 0.77, max_input_tokens: None }),
("baseten/deepseek-ai/DeepSeek-V3.1", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: None }),
("baseten/moonshotai/Kimi-K2-Instruct-0905", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: None }),
("baseten/moonshotai/Kimi-K2-Thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: None }),
("baseten/moonshotai/Kimi-K2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: None }),
("baseten/nvidia/Nemotron-120B-A12B", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.75, max_input_tokens: None }),
("baseten/openai/gpt-oss-120b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.5, max_input_tokens: None }),
("baseten/zai-org/GLM-4.6", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: None }),
("baseten/zai-org/GLM-4.7", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: None }),
("baseten/zai-org/GLM-5", ModelPrice { input_per_mtok: 0.95, output_per_mtok: 3.15, max_input_tokens: None }),
("bedrock_mantle/openai.gpt-oss-120b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("bedrock_mantle/openai.gpt-oss-20b", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("bedrock_mantle/openai.gpt-oss-safeguard-120b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("bedrock_mantle/openai.gpt-oss-safeguard-20b", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("bytedance/ui-tars-1.5-7b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("ca-central-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 3.05, output_per_mtok: 4.03, max_input_tokens: Some(8192) }),
("ca-central-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 0.69, max_input_tokens: Some(8192) }),
("cerebras/gpt-oss-120b", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 0.75, max_input_tokens: Some(131072) }),
("cerebras/llama-3.3-70b", ModelPrice { input_per_mtok: 0.85, output_per_mtok: 1.2, max_input_tokens: Some(128000) }),
("cerebras/llama3.1-70b", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("cerebras/llama3.1-8b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("cerebras/qwen-3-32b", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.8, max_input_tokens: Some(128000) }),
("cerebras/zai-glm-4.6", ModelPrice { input_per_mtok: 2.25, output_per_mtok: 2.75, max_input_tokens: Some(128000) }),
("cerebras/zai-glm-4.7", ModelPrice { input_per_mtok: 2.25, output_per_mtok: 2.75, max_input_tokens: Some(128000) }),
("chatdolphin", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(16384) }),
("chatgpt-4o-latest", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("claude-3-5-haiku", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("claude-3-5-haiku@20241022", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("claude-3-5-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-3-5-sonnet@20240620", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-3-7-sonnet-20250219", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-3-7-sonnet@20250219", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-3-haiku", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("claude-3-haiku-20240307", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("claude-3-haiku@20240307", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("claude-3-opus", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-3-opus-20240229", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-3-opus@20240229", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-3-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-3-sonnet@20240229", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-3.5-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-3.7-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-4-opus-20250514", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-4-sonnet-20250514", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("claude-haiku-4-5", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("claude-haiku-4-5-20251001", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("claude-haiku-4-5@20251001", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("claude-haiku-4.5", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("claude-opus-4", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-opus-4-1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-opus-4-1-20250805", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-opus-4-1@20250805", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-opus-4-20250514", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-opus-4-5", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("claude-opus-4-5-20251101", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("claude-opus-4-5@20251101", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("claude-opus-4-6", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("claude-opus-4-6-20260205", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("claude-opus-4-6@default", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("claude-opus-4-7", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("claude-opus-4-7-20260416", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("claude-opus-4-7@default", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("claude-opus-4.1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-opus-4.5", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("claude-opus-4.6", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("claude-opus-4@20250514", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("claude-sonnet-4", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("claude-sonnet-4-20250514", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("claude-sonnet-4-5", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-sonnet-4-5-20250929", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-sonnet-4-5@20250929", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("claude-sonnet-4-6", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("claude-sonnet-4-6@default", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("claude-sonnet-4.5", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("claude-sonnet-4.6", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("claude-sonnet-4@20250514", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("cloudflare/@cf/meta/llama-2-7b-chat-fp16", ModelPrice { input_per_mtok: 1.923, output_per_mtok: 1.923, max_input_tokens: Some(3072) }),
("cloudflare/@cf/meta/llama-2-7b-chat-int8", ModelPrice { input_per_mtok: 1.923, output_per_mtok: 1.923, max_input_tokens: Some(2048) }),
("cloudflare/@cf/mistral/mistral-7b-instruct-v0.1", ModelPrice { input_per_mtok: 1.923, output_per_mtok: 1.923, max_input_tokens: Some(8192) }),
("cloudflare/@hf/thebloke/codellama-7b-instruct-awq", ModelPrice { input_per_mtok: 1.923, output_per_mtok: 1.923, max_input_tokens: Some(4096) }),
("codellama-34b-instruct", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 1.4, max_input_tokens: Some(16384) }),
("codellama-70b-instruct", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 2.8, max_input_tokens: Some(16384) }),
("codestral-2", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("codestral-2405", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32000) }),
("codestral-2501", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("codestral-2508", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.9, max_input_tokens: Some(256000) }),
("codestral-2@001", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("codestral-latest", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32000) }),
("codestral-mamba-latest", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.25, max_input_tokens: Some(256000) }),
("codestral@2405", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("codestral@latest", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("codex-mini", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 6.0, max_input_tokens: Some(200000) }),
("codex-mini-latest", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 6.0, max_input_tokens: Some(200000) }),
("cohere.command-light-text-v14", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.6, max_input_tokens: Some(4096) }),
("cohere.command-r-plus-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("cohere.command-r-v1:0", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(128000) }),
("cohere.command-text-v14", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 2.0, max_input_tokens: Some(4096) }),
("command", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 2.0, max_input_tokens: Some(4096) }),
("command-a-03-2025", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(256000) }),
("command-light", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.6, max_input_tokens: Some(4096) }),
("command-nightly", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 2.0, max_input_tokens: Some(4096) }),
("command-r", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("command-r-08-2024", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("command-r-plus", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("command-r-plus-08-2024", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("command-r7b-12-2024", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.0375, max_input_tokens: Some(128000) }),
("computer-use-preview", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 12.0, max_input_tokens: Some(8192) }),
("dashscope/qwen-coder", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.5, max_input_tokens: Some(1000000) }),
("dashscope/qwen-max", ModelPrice { input_per_mtok: 1.6, output_per_mtok: 6.4, max_input_tokens: Some(30720) }),
("dashscope/qwen-plus", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.2, max_input_tokens: Some(129024) }),
("dashscope/qwen-plus-2025-01-25", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.2, max_input_tokens: Some(129024) }),
("dashscope/qwen-plus-2025-04-28", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.2, max_input_tokens: Some(129024) }),
("dashscope/qwen-plus-2025-07-14", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.2, max_input_tokens: Some(129024) }),
("dashscope/qwen-turbo", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.2, max_input_tokens: Some(129024) }),
("dashscope/qwen-turbo-2024-11-01", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.2, max_input_tokens: Some(1000000) }),
("dashscope/qwen-turbo-2025-04-28", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.2, max_input_tokens: Some(1000000) }),
("dashscope/qwen-turbo-latest", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.2, max_input_tokens: Some(1000000) }),
("dashscope/qwen3-next-80b-a3b-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("dashscope/qwen3-next-80b-a3b-thinking", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("dashscope/qwen3-vl-235b-a22b-instruct", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: Some(131072) }),
("dashscope/qwen3-vl-235b-a22b-thinking", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 4.0, max_input_tokens: Some(131072) }),
("dashscope/qwen3-vl-32b-instruct", ModelPrice { input_per_mtok: 0.16, output_per_mtok: 0.64, max_input_tokens: Some(131072) }),
("dashscope/qwen3-vl-32b-thinking", ModelPrice { input_per_mtok: 0.16, output_per_mtok: 2.87, max_input_tokens: Some(131072) }),
("dashscope/qwq-plus", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 2.4, max_input_tokens: Some(98304) }),
("databricks/databricks-claude-3-7-sonnet", ModelPrice { input_per_mtok: 2.99999, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("databricks/databricks-claude-haiku-4-5", ModelPrice { input_per_mtok: 1.00002, output_per_mtok: 5.00003, max_input_tokens: Some(200000) }),
("databricks/databricks-claude-opus-4", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("databricks/databricks-claude-opus-4-1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("databricks/databricks-claude-opus-4-5", ModelPrice { input_per_mtok: 5.00003, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("databricks/databricks-claude-sonnet-4", ModelPrice { input_per_mtok: 2.99999, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("databricks/databricks-claude-sonnet-4-1", ModelPrice { input_per_mtok: 2.99999, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("databricks/databricks-claude-sonnet-4-5", ModelPrice { input_per_mtok: 2.99999, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("databricks/databricks-gemini-2-5-flash", ModelPrice { input_per_mtok: 0.30002, output_per_mtok: 2.49998, max_input_tokens: Some(1048576) }),
("databricks/databricks-gemini-2-5-pro", ModelPrice { input_per_mtok: 1.24999, output_per_mtok: 9.99999, max_input_tokens: Some(1048576) }),
("databricks/databricks-gemma-3-12b", ModelPrice { input_per_mtok: 0.15001, output_per_mtok: 0.50001, max_input_tokens: Some(128000) }),
("databricks/databricks-gpt-5", ModelPrice { input_per_mtok: 1.24999, output_per_mtok: 9.99999, max_input_tokens: Some(272000) }),
("databricks/databricks-gpt-5-1", ModelPrice { input_per_mtok: 1.24999, output_per_mtok: 9.99999, max_input_tokens: Some(272000) }),
("databricks/databricks-gpt-5-mini", ModelPrice { input_per_mtok: 0.24997, output_per_mtok: 1.99997, max_input_tokens: Some(272000) }),
("databricks/databricks-gpt-5-nano", ModelPrice { input_per_mtok: 0.04998, output_per_mtok: 0.39998, max_input_tokens: Some(272000) }),
("databricks/databricks-gpt-oss-120b", ModelPrice { input_per_mtok: 0.15001, output_per_mtok: 0.59997, max_input_tokens: Some(131072) }),
("databricks/databricks-gpt-oss-20b", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.30002, max_input_tokens: Some(131072) }),
("databricks/databricks-llama-2-70b-chat", ModelPrice { input_per_mtok: 0.50001, output_per_mtok: 1.50003, max_input_tokens: Some(4096) }),
("databricks/databricks-llama-4-maverick", ModelPrice { input_per_mtok: 0.50001, output_per_mtok: 1.50003, max_input_tokens: Some(128000) }),
("databricks/databricks-meta-llama-3-1-405b-instruct", ModelPrice { input_per_mtok: 5.00003, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("databricks/databricks-meta-llama-3-1-8b-instruct", ModelPrice { input_per_mtok: 0.15001, output_per_mtok: 0.45003, max_input_tokens: Some(200000) }),
("databricks/databricks-meta-llama-3-3-70b-instruct", ModelPrice { input_per_mtok: 0.50001, output_per_mtok: 1.50003, max_input_tokens: Some(128000) }),
("databricks/databricks-meta-llama-3-70b-instruct", ModelPrice { input_per_mtok: 1.00002, output_per_mtok: 2.99999, max_input_tokens: Some(128000) }),
("databricks/databricks-mixtral-8x7b-instruct", ModelPrice { input_per_mtok: 0.50001, output_per_mtok: 1.00002, max_input_tokens: Some(4096) }),
("databricks/databricks-mpt-30b-instruct", ModelPrice { input_per_mtok: 1.00002, output_per_mtok: 1.00002, max_input_tokens: Some(8192) }),
("databricks/databricks-mpt-7b-instruct", ModelPrice { input_per_mtok: 0.50001, output_per_mtok: 0.0, max_input_tokens: Some(8192) }),
("davinci-002", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(16384) }),
("deepinfra/Gryphe/MythoMax-L2-13b", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.09, max_input_tokens: Some(4096) }),
("deepinfra/NousResearch/Hermes-3-Llama-3.1-405B", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(131072) }),
("deepinfra/NousResearch/Hermes-3-Llama-3.1-70B", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("deepinfra/Qwen/QwQ-32B", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("deepinfra/Qwen/Qwen2.5-72B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.39, max_input_tokens: Some(32768) }),
("deepinfra/Qwen/Qwen2.5-7B-Instruct", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.1, max_input_tokens: Some(32768) }),
("deepinfra/Qwen/Qwen2.5-VL-32B-Instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("deepinfra/Qwen/Qwen3-14B", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.24, max_input_tokens: Some(40960) }),
("deepinfra/Qwen/Qwen3-235B-A22B", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.54, max_input_tokens: Some(40960) }),
("deepinfra/Qwen/Qwen3-235B-A22B-Instruct-2507", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("deepinfra/Qwen/Qwen3-235B-A22B-Thinking-2507", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.9, max_input_tokens: Some(262144) }),
("deepinfra/Qwen/Qwen3-30B-A3B", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.29, max_input_tokens: Some(40960) }),
("deepinfra/Qwen/Qwen3-32B", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.28, max_input_tokens: Some(40960) }),
("deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: Some(262144) }),
("deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", ModelPrice { input_per_mtok: 0.29, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("deepinfra/Qwen/Qwen3-Next-80B-A3B-Instruct", ModelPrice { input_per_mtok: 0.14, output_per_mtok: 1.4, max_input_tokens: Some(262144) }),
("deepinfra/Qwen/Qwen3-Next-80B-A3B-Thinking", ModelPrice { input_per_mtok: 0.14, output_per_mtok: 1.4, max_input_tokens: Some(262144) }),
("deepinfra/Sao10K/L3-8B-Lunaris-v1-Turbo", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.05, max_input_tokens: Some(8192) }),
("deepinfra/Sao10K/L3.1-70B-Euryale-v2.2", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 0.75, max_input_tokens: Some(131072) }),
("deepinfra/Sao10K/L3.3-70B-Euryale-v2.3", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 0.75, max_input_tokens: Some(131072) }),
("deepinfra/allenai/olmOCR-7B-0725-FP8", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.5, max_input_tokens: Some(16384) }),
("deepinfra/anthropic/claude-3-7-sonnet-latest", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("deepinfra/anthropic/claude-4-opus", ModelPrice { input_per_mtok: 16.5, output_per_mtok: 82.5, max_input_tokens: Some(200000) }),
("deepinfra/anthropic/claude-4-sonnet", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("deepinfra/deepseek-ai/DeepSeek-R1", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 2.4, max_input_tokens: Some(163840) }),
("deepinfra/deepseek-ai/DeepSeek-R1-0528", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 2.15, max_input_tokens: Some(163840) }),
("deepinfra/deepseek-ai/DeepSeek-R1-0528-Turbo", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32768) }),
("deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("deepinfra/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 0.27, max_input_tokens: Some(131072) }),
("deepinfra/deepseek-ai/DeepSeek-R1-Turbo", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(40960) }),
("deepinfra/deepseek-ai/DeepSeek-V3", ModelPrice { input_per_mtok: 0.38, output_per_mtok: 0.89, max_input_tokens: Some(163840) }),
("deepinfra/deepseek-ai/DeepSeek-V3-0324", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.88, max_input_tokens: Some(163840) }),
("deepinfra/deepseek-ai/DeepSeek-V3.1", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.0, max_input_tokens: Some(163840) }),
("deepinfra/deepseek-ai/DeepSeek-V3.1-Terminus", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.0, max_input_tokens: Some(163840) }),
("deepinfra/google/gemini-2.0-flash-001", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1000000) }),
("deepinfra/google/gemini-2.5-flash", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1000000) }),
("deepinfra/google/gemini-2.5-pro", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(1000000) }),
("deepinfra/google/gemma-3-12b-it", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("deepinfra/google/gemma-3-27b-it", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.16, max_input_tokens: Some(131072) }),
("deepinfra/google/gemma-3-4b-it", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.08, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Llama-3.2-11B-Vision-Instruct", ModelPrice { input_per_mtok: 0.049, output_per_mtok: 0.049, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Llama-3.2-3B-Instruct", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.02, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Llama-3.3-70B-Instruct", ModelPrice { input_per_mtok: 0.23, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.39, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(1048576) }),
("deepinfra/meta-llama/Llama-4-Scout-17B-16E-Instruct", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.3, max_input_tokens: Some(327680) }),
("deepinfra/meta-llama/Llama-Guard-3-8B", ModelPrice { input_per_mtok: 0.055, output_per_mtok: 0.055, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Llama-Guard-4-12B", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.18, max_input_tokens: Some(163840) }),
("deepinfra/meta-llama/Meta-Llama-3-8B-Instruct", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.06, max_input_tokens: Some(8192) }),
("deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.28, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.05, max_input_tokens: Some(131072) }),
("deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.03, max_input_tokens: Some(131072) }),
("deepinfra/microsoft/WizardLM-2-8x22B", ModelPrice { input_per_mtok: 0.48, output_per_mtok: 0.48, max_input_tokens: Some(65536) }),
("deepinfra/microsoft/phi-4", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.14, max_input_tokens: Some(16384) }),
("deepinfra/mistralai/Mistral-Nemo-Instruct-2407", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.04, max_input_tokens: Some(131072) }),
("deepinfra/mistralai/Mistral-Small-24B-Instruct-2501", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.08, max_input_tokens: Some(32768) }),
("deepinfra/mistralai/Mistral-Small-3.2-24B-Instruct-2506", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.4, max_input_tokens: Some(32768) }),
("deepinfra/moonshotai/Kimi-K2-Instruct", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 2.0, max_input_tokens: Some(131072) }),
("deepinfra/moonshotai/Kimi-K2-Instruct-0905", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 2.0, max_input_tokens: Some(262144) }),
("deepinfra/nvidia/Llama-3.1-Nemotron-70B-Instruct", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("deepinfra/nvidia/Llama-3.3-Nemotron-Super-49B-v1.5", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("deepinfra/nvidia/NVIDIA-Nemotron-Nano-9B-v2", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.16, max_input_tokens: Some(131072) }),
("deepinfra/openai/gpt-oss-120b", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.45, max_input_tokens: Some(131072) }),
("deepinfra/openai/gpt-oss-20b", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.15, max_input_tokens: Some(131072) }),
("deepinfra/zai-org/GLM-4.5", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: Some(131072) }),
("deepseek-ai/DeepSeek-R1", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 7.0, max_input_tokens: Some(128000) }),
("deepseek-ai/DeepSeek-R1-0528-tput", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.19, max_input_tokens: Some(128000) }),
("deepseek-ai/DeepSeek-V3", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 1.25, max_input_tokens: Some(65536) }),
("deepseek-ai/DeepSeek-V3.1", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.7, max_input_tokens: Some(128000) }),
("deepseek-ai/deepseek-r1", ModelPrice { input_per_mtok: 3.75, output_per_mtok: 10.0, max_input_tokens: Some(65536) }),
("deepseek-ai/deepseek-r1-0528-maas", ModelPrice { input_per_mtok: 1.35, output_per_mtok: 5.4, max_input_tokens: Some(65336) }),
("deepseek-ai/deepseek-v3", ModelPrice { input_per_mtok: 1.45, output_per_mtok: 1.45, max_input_tokens: Some(65536) }),
("deepseek-ai/deepseek-v3.1", ModelPrice { input_per_mtok: 0.672, output_per_mtok: 2.016, max_input_tokens: Some(163840) }),
("deepseek-ai/deepseek-v3.1-maas", ModelPrice { input_per_mtok: 1.35, output_per_mtok: 5.4, max_input_tokens: Some(163840) }),
("deepseek-ai/deepseek-v3.2-maas", ModelPrice { input_per_mtok: 0.56, output_per_mtok: 1.68, max_input_tokens: Some(163840) }),
("deepseek-chat", ModelPrice { input_per_mtok: 0.28, output_per_mtok: 0.42, max_input_tokens: Some(131072) }),
("deepseek-chat-v3-0324", ModelPrice { input_per_mtok: 0.14, output_per_mtok: 0.28, max_input_tokens: Some(65536) }),
("deepseek-chat-v3.1", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.8, max_input_tokens: Some(163840) }),
("deepseek-coder", ModelPrice { input_per_mtok: 0.14, output_per_mtok: 0.28, max_input_tokens: Some(128000) }),
("deepseek-r1", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.19, max_input_tokens: Some(65536) }),
("deepseek-r1-0528", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 2.15, max_input_tokens: Some(65336) }),
("deepseek-reasoner", ModelPrice { input_per_mtok: 0.28, output_per_mtok: 0.42, max_input_tokens: Some(131072) }),
("deepseek-v3", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.1, max_input_tokens: Some(65536) }),
("deepseek-v3.2", ModelPrice { input_per_mtok: 0.28, output_per_mtok: 0.4, max_input_tokens: Some(163840) }),
("deepseek-v3.2-exp", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.4, max_input_tokens: Some(163840) }),
("deepseek.v3-v1:0", ModelPrice { input_per_mtok: 0.58, output_per_mtok: 1.68, max_input_tokens: Some(163840) }),
("deepseek.v3.2", ModelPrice { input_per_mtok: 0.62, output_per_mtok: 1.85, max_input_tokens: Some(163840) }),
("devstral-2512", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(256000) }),
("devstral-latest", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(256000) }),
("devstral-medium-2507", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("devstral-medium-latest", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(256000) }),
("devstral-small-2505", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(128000) }),
("devstral-small-2507", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(128000) }),
("devstral-small-latest", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(256000) }),
("dolphin", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: Some(16384) }),
("eu-central-1/anthropic.claude-instant-v1", ModelPrice { input_per_mtok: 2.48, output_per_mtok: 8.38, max_input_tokens: Some(100000) }),
("eu-central-1/anthropic.claude-v1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("eu-central-1/anthropic.claude-v2:1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("eu-central-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("eu-central-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("eu-central-1/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.44, max_input_tokens: Some(262144) }),
("eu-north-1/deepseek.v3.2", ModelPrice { input_per_mtok: 0.74, output_per_mtok: 2.22, max_input_tokens: Some(163840) }),
("eu-north-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("eu-north-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("eu-north-1/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 3.6, max_input_tokens: Some(262144) }),
("eu-south-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("eu-south-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("eu-south-1/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.44, max_input_tokens: Some(262144) }),
("eu-west-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 2.86, output_per_mtok: 3.78, max_input_tokens: Some(8192) }),
("eu-west-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.32, output_per_mtok: 0.65, max_input_tokens: Some(8192) }),
("eu-west-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("eu-west-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("eu-west-1/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.44, max_input_tokens: Some(262144) }),
("eu-west-2/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 3.45, output_per_mtok: 4.55, max_input_tokens: Some(8192) }),
("eu-west-2/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.39, output_per_mtok: 0.78, max_input_tokens: Some(8192) }),
("eu-west-2/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.47, output_per_mtok: 1.86, max_input_tokens: Some(196000) }),
("eu-west-2/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.47, output_per_mtok: 1.86, max_input_tokens: Some(1000000) }),
("eu-west-2/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.78, output_per_mtok: 1.86, max_input_tokens: Some(262144) }),
("eu-west-3/mistral.mistral-7b-instruct-v0:2", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.26, max_input_tokens: Some(32000) }),
("eu-west-3/mistral.mistral-large-2402-v1:0", ModelPrice { input_per_mtok: 10.4, output_per_mtok: 31.2, max_input_tokens: Some(32000) }),
("eu-west-3/mistral.mixtral-8x7b-instruct-v0:1", ModelPrice { input_per_mtok: 0.59, output_per_mtok: 0.91, max_input_tokens: Some(32000) }),
("eu.amazon.nova-2-lite-v1:0", ModelPrice { input_per_mtok: 0.33, output_per_mtok: 2.75, max_input_tokens: Some(1000000) }),
("eu.amazon.nova-2-pro-preview-20251202-v1:0", ModelPrice { input_per_mtok: 2.1875, output_per_mtok: 17.5, max_input_tokens: Some(1000000) }),
("eu.amazon.nova-lite-v1:0", ModelPrice { input_per_mtok: 0.078, output_per_mtok: 0.312, max_input_tokens: Some(300000) }),
("eu.amazon.nova-micro-v1:0", ModelPrice { input_per_mtok: 0.046, output_per_mtok: 0.184, max_input_tokens: Some(128000) }),
("eu.amazon.nova-pro-v1:0", ModelPrice { input_per_mtok: 1.05, output_per_mtok: 4.2, max_input_tokens: Some(300000) }),
("eu.anthropic.claude-3-5-haiku-20241022-v1:0", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-3-5-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-3-5-sonnet-20241022-v2:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-3-7-sonnet-20250219-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-3-haiku-20240307-v1:0", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-3-opus-20240229-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-3-sonnet-20240229-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 5.5, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-opus-4-1-20250805-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-opus-4-20250514-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-opus-4-5-20251101-v1:0", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-opus-4-6-v1", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 27.5, max_input_tokens: Some(1000000) }),
("eu.anthropic.claude-opus-4-7", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 27.5, max_input_tokens: Some(1000000) }),
("eu.anthropic.claude-sonnet-4-20250514-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("eu.anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("eu.anthropic.claude-sonnet-4-6", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(1000000) }),
("eu.deepseek.v3.2", ModelPrice { input_per_mtok: 0.74, output_per_mtok: 2.22, max_input_tokens: Some(163840) }),
("eu.meta.llama3-2-1b-instruct-v1:0", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.13, max_input_tokens: Some(128000) }),
("eu.meta.llama3-2-3b-instruct-v1:0", ModelPrice { input_per_mtok: 0.19, output_per_mtok: 0.19, max_input_tokens: Some(128000) }),
("eu.mistral.pixtral-large-2502-v1:0", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("eu/gpt-4o-2024-08-06", ModelPrice { input_per_mtok: 2.75, output_per_mtok: 11.0, max_input_tokens: Some(128000) }),
("eu/gpt-4o-2024-11-20", ModelPrice { input_per_mtok: 2.75, output_per_mtok: 11.0, max_input_tokens: Some(128000) }),
("eu/gpt-4o-mini-2024-07-18", ModelPrice { input_per_mtok: 0.165, output_per_mtok: 0.66, max_input_tokens: Some(128000) }),
("eu/gpt-4o-mini-realtime-preview-2024-12-17", ModelPrice { input_per_mtok: 0.66, output_per_mtok: 2.64, max_input_tokens: Some(128000) }),
("eu/gpt-4o-realtime-preview-2024-10-01", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 22.0, max_input_tokens: Some(128000) }),
("eu/gpt-4o-realtime-preview-2024-12-17", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 22.0, max_input_tokens: Some(128000) }),
("eu/gpt-5-2025-08-07", ModelPrice { input_per_mtok: 1.375, output_per_mtok: 11.0, max_input_tokens: Some(272000) }),
("eu/gpt-5-mini-2025-08-07", ModelPrice { input_per_mtok: 0.275, output_per_mtok: 2.2, max_input_tokens: Some(272000) }),
("eu/gpt-5-nano-2025-08-07", ModelPrice { input_per_mtok: 0.055, output_per_mtok: 0.44, max_input_tokens: Some(272000) }),
("eu/gpt-5.1", ModelPrice { input_per_mtok: 1.38, output_per_mtok: 11.0, max_input_tokens: Some(272000) }),
("eu/gpt-5.1-chat", ModelPrice { input_per_mtok: 1.38, output_per_mtok: 11.0, max_input_tokens: Some(128000) }),
("eu/gpt-5.1-codex", ModelPrice { input_per_mtok: 1.38, output_per_mtok: 11.0, max_input_tokens: Some(272000) }),
("eu/gpt-5.1-codex-mini", ModelPrice { input_per_mtok: 0.275, output_per_mtok: 2.2, max_input_tokens: Some(272000) }),
("eu/o1-2024-12-17", ModelPrice { input_per_mtok: 16.5, output_per_mtok: 66.0, max_input_tokens: Some(200000) }),
("eu/o1-mini-2024-09-12", ModelPrice { input_per_mtok: 1.21, output_per_mtok: 4.84, max_input_tokens: Some(128000) }),
("eu/o1-preview-2024-09-12", ModelPrice { input_per_mtok: 16.5, output_per_mtok: 66.0, max_input_tokens: Some(128000) }),
("eu/o3-mini-2025-01-31", ModelPrice { input_per_mtok: 1.21, output_per_mtok: 4.84, max_input_tokens: Some(200000) }),
("fireworks-ai-4.1b-to-16b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: None }),
("fireworks-ai-56b-to-176b", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: None }),
("fireworks-ai-above-16b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: None }),
("fireworks-ai-embedding-150m-to-350m", ModelPrice { input_per_mtok: 0.016, output_per_mtok: 0.0, max_input_tokens: None }),
("fireworks-ai-embedding-up-to-150m", ModelPrice { input_per_mtok: 0.008, output_per_mtok: 0.0, max_input_tokens: None }),
("fireworks-ai-moe-up-to-56b", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 0.5, max_input_tokens: None }),
("fireworks-ai-up-to-4b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: None }),
("friendliai/meta-llama-3.1-70b-instruct", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("friendliai/meta-llama-3.1-8b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(8192) }),
("ft:babbage-002", ModelPrice { input_per_mtok: 1.6, output_per_mtok: 1.6, max_input_tokens: Some(16384) }),
("ft:davinci-002", ModelPrice { input_per_mtok: 12.0, output_per_mtok: 12.0, max_input_tokens: Some(16384) }),
("ft:gpt-3.5-turbo", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 6.0, max_input_tokens: Some(16385) }),
("ft:gpt-3.5-turbo-0125", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 6.0, max_input_tokens: Some(16385) }),
("ft:gpt-3.5-turbo-0613", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 6.0, max_input_tokens: Some(4096) }),
("ft:gpt-3.5-turbo-1106", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 6.0, max_input_tokens: Some(16385) }),
("ft:gpt-4-0613", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 60.0, max_input_tokens: Some(8192) }),
("ft:gpt-4.1-2025-04-14", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 12.0, max_input_tokens: Some(1047576) }),
("ft:gpt-4.1-mini-2025-04-14", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 3.2, max_input_tokens: Some(1047576) }),
("ft:gpt-4.1-nano-2025-04-14", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.8, max_input_tokens: Some(1047576) }),
("ft:gpt-4o-2024-08-06", ModelPrice { input_per_mtok: 3.75, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("ft:gpt-4o-2024-11-20", ModelPrice { input_per_mtok: 3.75, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("ft:gpt-4o-mini-2024-07-18", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(128000) }),
("ft:o4-mini-2025-04-16", ModelPrice { input_per_mtok: 4.0, output_per_mtok: 16.0, max_input_tokens: Some(200000) }),
("gemini-2.0-flash", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1048576) }),
("gemini-2.0-flash-001", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(1048576) }),
("gemini-2.0-flash-lite", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(1048576) }),
("gemini-2.0-flash-lite-001", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(1048576) }),
("gemini-2.5-computer-use-preview-10-2025", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gemini-2.5-flash", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemini-2.5-flash-lite", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1048576) }),
("gemini-2.5-flash-lite-preview-06-17", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1048576) }),
("gemini-2.5-flash-lite-preview-09-2025", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1048576) }),
("gemini-2.5-flash-native-audio-latest", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemini-2.5-flash-native-audio-preview-09-2025", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemini-2.5-flash-native-audio-preview-12-2025", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemini-2.5-flash-preview-09-2025", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemini-2.5-pro", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(1048576) }),
("gemini-2.5-pro-preview-tts", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(1048576) }),
("gemini-3-flash-preview", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 3.0, max_input_tokens: Some(1048576) }),
("gemini-3-pro-preview", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 12.0, max_input_tokens: Some(1048576) }),
("gemini-3.1-flash-lite-preview", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.5, max_input_tokens: Some(1048576) }),
("gemini-3.1-flash-live-preview", ModelPrice { input_per_mtok: 0.75, output_per_mtok: 4.5, max_input_tokens: Some(131072) }),
("gemini-3.1-pro-preview", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 12.0, max_input_tokens: Some(1048576) }),
("gemini-3.1-pro-preview-customtools", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 12.0, max_input_tokens: Some(1048576) }),
("gemini-exp-1206", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemini-flash-latest", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemini-flash-lite-latest", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1048576) }),
("gemini-gemma-2-27b-it", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 1.05, max_input_tokens: Some(8192) }),
("gemini-gemma-2-9b-it", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 1.05, max_input_tokens: Some(8192) }),
("gemini-pro-latest", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(1048576) }),
("gemini-robotics-er-1.5-preview", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("gemma-7b-it", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.08, max_input_tokens: Some(8192) }),
("glm-4p7", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(202800) }),
("global-standard/gpt-4o-2024-08-06", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("global-standard/gpt-4o-2024-11-20", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("global-standard/gpt-4o-mini", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("global.amazon.nova-2-lite-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1000000) }),
("global.anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("global.anthropic.claude-opus-4-5-20251101-v1:0", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("global.anthropic.claude-opus-4-6-v1", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("global.anthropic.claude-opus-4-7", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(1000000) }),
("global.anthropic.claude-sonnet-4-20250514-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("global.anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("global.anthropic.claude-sonnet-4-6", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("global/gpt-4o-2024-08-06", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("global/gpt-4o-2024-11-20", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("global/gpt-5.1", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("global/gpt-5.1-chat", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("global/gpt-5.1-codex", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("global/gpt-5.1-codex-mini", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 2.0, max_input_tokens: Some(272000) }),
("gmi/MiniMaxAI/MiniMax-M2.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(196608) }),
("gmi/Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.4, max_input_tokens: Some(262144) }),
("gmi/anthropic/claude-opus-4", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(409600) }),
("gmi/anthropic/claude-opus-4.5", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(409600) }),
("gmi/anthropic/claude-sonnet-4", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(409600) }),
("gmi/anthropic/claude-sonnet-4.5", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(409600) }),
("gmi/deepseek-ai/DeepSeek-V3-0324", ModelPrice { input_per_mtok: 0.28, output_per_mtok: 0.88, max_input_tokens: Some(163840) }),
("gmi/deepseek-ai/DeepSeek-V3.2", ModelPrice { input_per_mtok: 0.28, output_per_mtok: 0.4, max_input_tokens: Some(163840) }),
("gmi/google/gemini-3-flash-preview", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 3.0, max_input_tokens: Some(1048576) }),
("gmi/google/gemini-3-pro-preview", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 12.0, max_input_tokens: Some(1048576) }),
("gmi/moonshotai/Kimi-K2-Thinking", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("gmi/openai/gpt-4o", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(131072) }),
("gmi/openai/gpt-4o-mini", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("gmi/openai/gpt-5", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(409600) }),
("gmi/openai/gpt-5.1", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(409600) }),
("gmi/openai/gpt-5.2", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(409600) }),
("gmi/zai-org/GLM-4.7-FP8", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(202752) }),
("google.gemma-3-12b-it", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.29, max_input_tokens: Some(128000) }),
("google.gemma-3-27b-it", ModelPrice { input_per_mtok: 0.23, output_per_mtok: 0.38, max_input_tokens: Some(128000) }),
("google.gemma-3-4b-it", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.08, max_input_tokens: Some(128000) }),
("google/gemini-2.0-flash-001", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1048576) }),
("google/gemini-2.5-flash", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 2.5, max_input_tokens: Some(1048576) }),
("google/gemini-2.5-pro", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(1048576) }),
("google/gemini-3-flash-preview", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 3.0, max_input_tokens: Some(1048576) }),
("google/gemini-3-pro", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 12.0, max_input_tokens: None }),
("google/gemini-3-pro-preview", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 12.0, max_input_tokens: Some(1048576) }),
("google/gemini-3.1-flash-lite-preview", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.5, max_input_tokens: Some(1048576) }),
("google/gemini-3.1-pro-preview", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 12.0, max_input_tokens: Some(1048576) }),
("gpt-3.5-turbo", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 2.0, max_input_tokens: Some(16385) }),
("gpt-3.5-turbo-0125", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(16385) }),
("gpt-3.5-turbo-1106", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 2.0, max_input_tokens: Some(16385) }),
("gpt-3.5-turbo-16k", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 4.0, max_input_tokens: Some(16385) }),
("gpt-3.5-turbo-instruct", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 2.0, max_input_tokens: Some(8192) }),
("gpt-3.5-turbo-instruct-0914", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 2.0, max_input_tokens: Some(8192) }),
("gpt-35-turbo", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(4097) }),
("gpt-35-turbo-0125", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(16384) }),
("gpt-35-turbo-1106", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 2.0, max_input_tokens: Some(16384) }),
("gpt-35-turbo-16k", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 4.0, max_input_tokens: Some(16385) }),
("gpt-35-turbo-16k-0613", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 4.0, max_input_tokens: Some(16385) }),
("gpt-35-turbo-instruct", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 2.0, max_input_tokens: Some(4097) }),
("gpt-35-turbo-instruct-0914", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 2.0, max_input_tokens: Some(4097) }),
("gpt-4", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 60.0, max_input_tokens: Some(8192) }),
("gpt-4-0125-preview", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 30.0, max_input_tokens: Some(128000) }),
("gpt-4-0314", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 60.0, max_input_tokens: Some(8192) }),
("gpt-4-0613", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 60.0, max_input_tokens: Some(8192) }),
("gpt-4-1106-preview", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 30.0, max_input_tokens: Some(128000) }),
("gpt-4-32k", ModelPrice { input_per_mtok: 60.0, output_per_mtok: 120.0, max_input_tokens: Some(32768) }),
("gpt-4-32k-0613", ModelPrice { input_per_mtok: 60.0, output_per_mtok: 120.0, max_input_tokens: Some(32768) }),
("gpt-4-turbo", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 30.0, max_input_tokens: Some(128000) }),
("gpt-4-turbo-2024-04-09", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 30.0, max_input_tokens: Some(128000) }),
("gpt-4-turbo-preview", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 30.0, max_input_tokens: Some(128000) }),
("gpt-4-turbo-vision-preview", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 30.0, max_input_tokens: Some(128000) }),
("gpt-4.1", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(1047576) }),
("gpt-4.1-2025-04-14", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(1047576) }),
("gpt-4.1-mini", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: Some(1047576) }),
("gpt-4.1-mini-2025-04-14", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: Some(1047576) }),
("gpt-4.1-nano", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1047576) }),
("gpt-4.1-nano-2025-04-14", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1047576) }),
("gpt-4.5-preview", ModelPrice { input_per_mtok: 75.0, output_per_mtok: 150.0, max_input_tokens: Some(128000) }),
("gpt-4o", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-4o-2024-05-13", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("gpt-4o-2024-08-06", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-4o-2024-11-20", ModelPrice { input_per_mtok: 2.75, output_per_mtok: 11.0, max_input_tokens: Some(128000) }),
("gpt-4o-audio-preview", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-4o-audio-preview-2024-12-17", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-4o-audio-preview-2025-06-03", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-4o-mini", ModelPrice { input_per_mtok: 0.165, output_per_mtok: 0.66, max_input_tokens: Some(128000) }),
("gpt-4o-mini-2024-07-18", ModelPrice { input_per_mtok: 0.165, output_per_mtok: 0.66, max_input_tokens: Some(128000) }),
("gpt-4o-mini-audio-preview", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("gpt-4o-mini-audio-preview-2024-12-17", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-4o-mini-realtime-preview", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gpt-4o-mini-realtime-preview-2024-12-17", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gpt-4o-mini-search-preview", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("gpt-4o-mini-search-preview-2025-03-11", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("gpt-4o-realtime-preview", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 20.0, max_input_tokens: Some(128000) }),
("gpt-4o-realtime-preview-2024-10-01", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 20.0, max_input_tokens: Some(128000) }),
("gpt-4o-realtime-preview-2024-12-17", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 20.0, max_input_tokens: Some(128000) }),
("gpt-4o-realtime-preview-2025-06-03", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 20.0, max_input_tokens: Some(128000) }),
("gpt-4o-search-preview", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-4o-search-preview-2025-03-11", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-5", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5-2025-08-07", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5-chat", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-5-chat-latest", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-5-codex", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5-mini", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 2.0, max_input_tokens: Some(272000) }),
("gpt-5-mini-2025-08-07", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 2.0, max_input_tokens: Some(272000) }),
("gpt-5-nano", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.4, max_input_tokens: Some(272000) }),
("gpt-5-nano-2025-08-07", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.4, max_input_tokens: Some(272000) }),
("gpt-5-pro", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 120.0, max_input_tokens: Some(272000) }),
("gpt-5-pro-2025-10-06", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 120.0, max_input_tokens: Some(128000) }),
("gpt-5-search-api", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5-search-api-2025-10-14", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5.1", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5.1-2025-11-13", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5.1-chat", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-5.1-chat-2025-11-13", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-5.1-chat-latest", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-5.1-codex", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5.1-codex-2025-11-13", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(272000) }),
("gpt-5.1-codex-max", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(400000) }),
("gpt-5.1-codex-mini", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 2.0, max_input_tokens: Some(272000) }),
("gpt-5.1-codex-mini-2025-11-13", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 2.0, max_input_tokens: Some(272000) }),
("gpt-5.2", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(272000) }),
("gpt-5.2-2025-12-11", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(272000) }),
("gpt-5.2-chat", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(128000) }),
("gpt-5.2-chat-2025-12-11", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(128000) }),
("gpt-5.2-chat-latest", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(128000) }),
("gpt-5.2-codex", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(272000) }),
("gpt-5.2-pro", ModelPrice { input_per_mtok: 21.0, output_per_mtok: 168.0, max_input_tokens: Some(272000) }),
("gpt-5.2-pro-2025-12-11", ModelPrice { input_per_mtok: 21.0, output_per_mtok: 168.0, max_input_tokens: Some(272000) }),
("gpt-5.3-chat", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(128000) }),
("gpt-5.3-chat-latest", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(128000) }),
("gpt-5.3-codex", ModelPrice { input_per_mtok: 1.75, output_per_mtok: 14.0, max_input_tokens: Some(272000) }),
("gpt-5.4", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 15.0, max_input_tokens: Some(1050000) }),
("gpt-5.4-2026-03-05", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 15.0, max_input_tokens: Some(1050000) }),
("gpt-5.4-mini", ModelPrice { input_per_mtok: 0.75, output_per_mtok: 4.5, max_input_tokens: Some(1050000) }),
("gpt-5.4-mini-2026-03-17", ModelPrice { input_per_mtok: 0.75, output_per_mtok: 4.5, max_input_tokens: Some(1050000) }),
("gpt-5.4-nano", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.25, max_input_tokens: Some(1050000) }),
("gpt-5.4-nano-2026-03-17", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.25, max_input_tokens: Some(1050000) }),
("gpt-5.4-pro", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 180.0, max_input_tokens: Some(1050000) }),
("gpt-5.4-pro-2026-03-05", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 180.0, max_input_tokens: Some(1050000) }),
("gpt-5.5", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 30.0, max_input_tokens: Some(1050000) }),
("gpt-5.5-2026-04-23", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 30.0, max_input_tokens: Some(1050000) }),
("gpt-5.5-pro", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 180.0, max_input_tokens: Some(1050000) }),
("gpt-5.5-pro-2026-04-23", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 180.0, max_input_tokens: Some(1050000) }),
("gpt-audio", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-audio-1.5", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-audio-1.5-2026-02-23", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-audio-2025-08-28", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("gpt-audio-mini", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gpt-audio-mini-2025-10-06", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gpt-audio-mini-2025-12-15", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gpt-oss-120b", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.8, max_input_tokens: Some(131072) }),
("gpt-oss-120b-maas", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("gpt-oss-20b", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("gpt-oss-20b-maas", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("gpt-realtime", ModelPrice { input_per_mtok: 4.0, output_per_mtok: 16.0, max_input_tokens: Some(32000) }),
("gpt-realtime-1.5", ModelPrice { input_per_mtok: 4.0, output_per_mtok: 16.0, max_input_tokens: Some(32000) }),
("gpt-realtime-1.5-2026-02-23", ModelPrice { input_per_mtok: 4.0, output_per_mtok: 16.0, max_input_tokens: Some(32000) }),
("gpt-realtime-2025-08-28", ModelPrice { input_per_mtok: 4.0, output_per_mtok: 16.0, max_input_tokens: Some(32000) }),
("gpt-realtime-mini", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gpt-realtime-mini-2025-10-06", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gpt-realtime-mini-2025-12-15", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("gradient_ai/anthropic-claude-3-opus", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(1024) }),
("gradient_ai/anthropic-claude-3.5-haiku", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 4.0, max_input_tokens: Some(1024) }),
("gradient_ai/anthropic-claude-3.5-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1024) }),
("gradient_ai/anthropic-claude-3.7-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1024) }),
("gradient_ai/deepseek-r1-distill-llama-70b", ModelPrice { input_per_mtok: 0.99, output_per_mtok: 0.99, max_input_tokens: Some(8000) }),
("gradient_ai/llama3-8b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(512) }),
("gradient_ai/llama3.3-70b-instruct", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 0.65, max_input_tokens: Some(2048) }),
("gradient_ai/mistral-nemo-instruct-2407", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.3, max_input_tokens: Some(512) }),
("gradient_ai/openai-o3", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(100000) }),
("gradient_ai/openai-o3-mini", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(100000) }),
("grok-2", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(131072) }),
("grok-2-1212", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(131072) }),
("grok-2-latest", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(131072) }),
("grok-2-vision", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(32768) }),
("grok-2-vision-1212", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(32768) }),
("grok-2-vision-latest", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(32768) }),
("grok-3", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("grok-3-beta", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("grok-3-fast-beta", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(131072) }),
("grok-3-fast-latest", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(131072) }),
("grok-3-latest", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("grok-3-mini", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("grok-3-mini-beta", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("grok-3-mini-fast", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 4.0, max_input_tokens: Some(131072) }),
("grok-3-mini-fast-beta", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 4.0, max_input_tokens: Some(131072) }),
("grok-3-mini-fast-latest", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 4.0, max_input_tokens: Some(131072) }),
("grok-3-mini-latest", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("grok-4", ModelPrice { input_per_mtok: 7.2, output_per_mtok: 36.0, max_input_tokens: Some(256000) }),
("grok-4-0709", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(256000) }),
("grok-4-1-fast", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(2000000) }),
("grok-4-1-fast-non-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(2000000) }),
("grok-4-1-fast-non-reasoning-latest", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(2000000) }),
("grok-4-1-fast-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(2000000) }),
("grok-4-1-fast-reasoning-latest", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(2000000) }),
("grok-4-fast-non-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(2000000) }),
("grok-4-fast-reasoning", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.5, max_input_tokens: Some(2000000) }),
("grok-4-latest", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(256000) }),
("grok-4.20-0309-reasoning", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(2000000) }),
("grok-4.20-beta-0309-non-reasoning", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(2000000) }),
("grok-4.20-beta-0309-reasoning", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(2000000) }),
("grok-4.20-multi-agent-beta-0309", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(2000000) }),
("grok-beta", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("grok-code-fast", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.5, max_input_tokens: Some(256000) }),
("grok-code-fast-1", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.5, max_input_tokens: Some(256000) }),
("grok-code-fast-1-0825", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.5, max_input_tokens: Some(256000) }),
("grok-vision-beta", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 15.0, max_input_tokens: Some(8192) }),
("gryphe/mythomax-l2-13b", ModelPrice { input_per_mtok: 1.875, output_per_mtok: 1.875, max_input_tokens: Some(8192) }),
("hyperbolic/NousResearch/Hermes-3-Llama-3.1-70B", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("hyperbolic/Qwen/QwQ-32B", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("hyperbolic/Qwen/Qwen2.5-72B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("hyperbolic/Qwen/Qwen2.5-Coder-32B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("hyperbolic/Qwen/Qwen3-235B-A22B", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(131072) }),
("hyperbolic/deepseek-ai/DeepSeek-R1", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.4, max_input_tokens: Some(32768) }),
("hyperbolic/deepseek-ai/DeepSeek-R1-0528", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.25, max_input_tokens: Some(131072) }),
("hyperbolic/deepseek-ai/DeepSeek-V3", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(32768) }),
("hyperbolic/deepseek-ai/DeepSeek-V3-0324", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.4, max_input_tokens: Some(32768) }),
("hyperbolic/meta-llama/Llama-3.2-3B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("hyperbolic/meta-llama/Llama-3.3-70B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("hyperbolic/meta-llama/Meta-Llama-3-70B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("hyperbolic/meta-llama/Meta-Llama-3.1-405B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("hyperbolic/meta-llama/Meta-Llama-3.1-70B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("hyperbolic/meta-llama/Meta-Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("hyperbolic/moonshotai/Kimi-K2-Instruct", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(131072) }),
("ibm-granite/granite-3.3-8b-instruct", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.25, max_input_tokens: None }),
("invoke/anthropic.claude-3-5-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("j2-light", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 3.0, max_input_tokens: Some(8192) }),
("j2-mid", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 10.0, max_input_tokens: Some(8192) }),
("j2-ultra", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 15.0, max_input_tokens: Some(8192) }),
("jamba-1.5", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.4, max_input_tokens: Some(256000) }),
("jamba-1.5-large", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(256000) }),
("jamba-1.5-large@001", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(256000) }),
("jamba-1.5-mini", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.4, max_input_tokens: Some(256000) }),
("jamba-1.5-mini@001", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.4, max_input_tokens: Some(256000) }),
("jamba-large-1.6", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(256000) }),
("jamba-large-1.7", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(256000) }),
("jamba-mini-1.6", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.4, max_input_tokens: Some(256000) }),
("jamba-mini-1.7", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.4, max_input_tokens: Some(256000) }),
("jp.anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 5.5, max_input_tokens: Some(200000) }),
("jp.anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("kimi-k2p5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("labs-devstral-small-2512", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(256000) }),
("lambda_ai/deepseek-llama3.3-70b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("lambda_ai/deepseek-r1-0528", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("lambda_ai/deepseek-r1-671b", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 0.8, max_input_tokens: Some(131072) }),
("lambda_ai/deepseek-v3-0324", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("lambda_ai/hermes3-405b", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 0.8, max_input_tokens: Some(131072) }),
("lambda_ai/hermes3-70b", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("lambda_ai/hermes3-8b", ModelPrice { input_per_mtok: 0.025, output_per_mtok: 0.04, max_input_tokens: Some(131072) }),
("lambda_ai/lfm-40b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("lambda_ai/lfm-7b", ModelPrice { input_per_mtok: 0.025, output_per_mtok: 0.04, max_input_tokens: Some(131072) }),
("lambda_ai/llama-4-maverick-17b-128e-instruct-fp8", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("lambda_ai/llama-4-scout-17b-16e-instruct", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.1, max_input_tokens: Some(16384) }),
("lambda_ai/llama3.1-405b-instruct-fp8", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 0.8, max_input_tokens: Some(131072) }),
("lambda_ai/llama3.1-70b-instruct-fp8", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("lambda_ai/llama3.1-8b-instruct", ModelPrice { input_per_mtok: 0.025, output_per_mtok: 0.04, max_input_tokens: Some(131072) }),
("lambda_ai/llama3.1-nemotron-70b-instruct-fp8", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("lambda_ai/llama3.2-11b-vision-instruct", ModelPrice { input_per_mtok: 0.015, output_per_mtok: 0.025, max_input_tokens: Some(131072) }),
("lambda_ai/llama3.2-3b-instruct", ModelPrice { input_per_mtok: 0.015, output_per_mtok: 0.025, max_input_tokens: Some(131072) }),
("lambda_ai/llama3.3-70b-instruct-fp8", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("lambda_ai/qwen25-coder-32b-instruct", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("lambda_ai/qwen3-32b-fp8", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("llama-2-70b-chat", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 2.8, max_input_tokens: Some(4096) }),
("llama-3.1-70b-instruct", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(131072) }),
("llama-3.1-8b-instant", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.08, max_input_tokens: Some(128000) }),
("llama-3.1-8b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(131072) }),
("llama-3.3-70b-versatile", ModelPrice { input_per_mtok: 0.59, output_per_mtok: 0.79, max_input_tokens: Some(128000) }),
("llamagate/codellama-7b", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.12, max_input_tokens: Some(16384) }),
("llamagate/deepseek-coder-6.7b", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.12, max_input_tokens: Some(16384) }),
("llamagate/deepseek-r1-7b-qwen", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.15, max_input_tokens: Some(131072) }),
("llamagate/deepseek-r1-8b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.2, max_input_tokens: Some(65536) }),
("llamagate/dolphin3-8b", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("llamagate/gemma3-4b", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.08, max_input_tokens: Some(128000) }),
("llamagate/llama-3.1-8b", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.05, max_input_tokens: Some(131072) }),
("llamagate/llama-3.2-3b", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.08, max_input_tokens: Some(131072) }),
("llamagate/llava-7b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.2, max_input_tokens: Some(4096) }),
("llamagate/mistral-7b-v0.3", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.15, max_input_tokens: Some(32768) }),
("llamagate/openthinker-7b", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.15, max_input_tokens: Some(32768) }),
("llamagate/qwen2.5-coder-7b", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.12, max_input_tokens: Some(32768) }),
("llamagate/qwen3-8b", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.14, max_input_tokens: Some(32768) }),
("llamagate/qwen3-vl-8b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.55, max_input_tokens: Some(32768) }),
("luminous-base", ModelPrice { input_per_mtok: 30.0, output_per_mtok: 33.0, max_input_tokens: Some(2048) }),
("luminous-base-control", ModelPrice { input_per_mtok: 37.5, output_per_mtok: 41.25, max_input_tokens: Some(2048) }),
("luminous-extended", ModelPrice { input_per_mtok: 45.0, output_per_mtok: 49.5, max_input_tokens: Some(2048) }),
("luminous-extended-control", ModelPrice { input_per_mtok: 56.25, output_per_mtok: 61.875, max_input_tokens: Some(2048) }),
("luminous-supreme", ModelPrice { input_per_mtok: 175.0, output_per_mtok: 192.5, max_input_tokens: Some(2048) }),
("luminous-supreme-control", ModelPrice { input_per_mtok: 218.75, output_per_mtok: 240.625, max_input_tokens: Some(2048) }),
("magistral-medium-1-2-2509", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(40000) }),
("magistral-medium-2506", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(40000) }),
("magistral-medium-2509", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(40000) }),
("magistral-medium-latest", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(40000) }),
("magistral-small-1-2-2509", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(40000) }),
("magistral-small-2506", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(40000) }),
("magistral-small-latest", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(40000) }),
("mancer/weaver", ModelPrice { input_per_mtok: 5.625, output_per_mtok: 5.625, max_input_tokens: Some(8000) }),
("meta-llama/Llama-3.3-70B-Instruct-Turbo", ModelPrice { input_per_mtok: 0.88, output_per_mtok: 0.88, max_input_tokens: None }),
("meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 0.85, max_input_tokens: None }),
("meta-llama/Llama-4-Scout-17B-16E-Instruct", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.59, max_input_tokens: None }),
("meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", ModelPrice { input_per_mtok: 3.5, output_per_mtok: 3.5, max_input_tokens: None }),
("meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo", ModelPrice { input_per_mtok: 0.88, output_per_mtok: 0.88, max_input_tokens: None }),
("meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.18, max_input_tokens: None }),
("meta-llama/llama-3-70b-instruct", ModelPrice { input_per_mtok: 0.59, output_per_mtok: 0.79, max_input_tokens: Some(8192) }),
("meta-llama/llama-4-maverick-17b-128e-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("meta-llama/llama-4-scout-17b-16e-instruct", ModelPrice { input_per_mtok: 0.11, output_per_mtok: 0.34, max_input_tokens: Some(131072) }),
("meta-llama/llama-guard-4-12b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("meta.llama2-13b-chat-v1", ModelPrice { input_per_mtok: 0.75, output_per_mtok: 1.0, max_input_tokens: Some(4096) }),
("meta.llama2-70b-chat-v1", ModelPrice { input_per_mtok: 1.95, output_per_mtok: 2.56, max_input_tokens: Some(4096) }),
("meta.llama3-1-405b-instruct-v1:0", ModelPrice { input_per_mtok: 5.32, output_per_mtok: 16.0, max_input_tokens: Some(128000) }),
("meta.llama3-1-70b-instruct-v1:0", ModelPrice { input_per_mtok: 0.99, output_per_mtok: 0.99, max_input_tokens: Some(128000) }),
("meta.llama3-1-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.22, max_input_tokens: Some(128000) }),
("meta.llama3-2-11b-instruct-v1:0", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 0.35, max_input_tokens: Some(128000) }),
("meta.llama3-2-1b-instruct-v1:0", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("meta.llama3-2-3b-instruct-v1:0", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("meta.llama3-2-90b-instruct-v1:0", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("meta.llama3-3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 2.65, output_per_mtok: 3.5, max_input_tokens: Some(8192) }),
("meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("meta.llama4-maverick-17b-instruct-v1:0", ModelPrice { input_per_mtok: 0.24, output_per_mtok: 0.97, max_input_tokens: Some(128000) }),
("meta.llama4-scout-17b-instruct-v1:0", ModelPrice { input_per_mtok: 0.17, output_per_mtok: 0.66, max_input_tokens: Some(128000) }),
("meta/llama-2-13b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.5, max_input_tokens: Some(4096) }),
("meta/llama-2-13b-chat", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.5, max_input_tokens: Some(4096) }),
("meta/llama-2-70b", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 2.75, max_input_tokens: Some(4096) }),
("meta/llama-2-70b-chat", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 2.75, max_input_tokens: Some(4096) }),
("meta/llama-2-7b", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.25, max_input_tokens: Some(4096) }),
("meta/llama-2-7b-chat", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.25, max_input_tokens: Some(4096) }),
("meta/llama-3-70b", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 2.75, max_input_tokens: Some(8192) }),
("meta/llama-3-70b-instruct", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 2.75, max_input_tokens: Some(8192) }),
("meta/llama-3-8b", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.25, max_input_tokens: Some(8086) }),
("meta/llama-3-8b-instruct", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.25, max_input_tokens: Some(8086) }),
("meta/llama-3.1-405b-instruct-maas", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 16.0, max_input_tokens: Some(128000) }),
("meta/llama-4-maverick-17b-128e-instruct-maas", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 1.15, max_input_tokens: Some(1000000) }),
("meta/llama-4-maverick-17b-16e-instruct-maas", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 1.15, max_input_tokens: Some(1000000) }),
("meta/llama-4-scout-17b-128e-instruct-maas", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.7, max_input_tokens: Some(10000000) }),
("meta/llama-4-scout-17b-16e-instruct-maas", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.7, max_input_tokens: Some(10000000) }),
("minimax-m2p1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(204800) }),
("minimax.minimax-m2", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(128000) }),
("minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(196000) }),
("minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(1000000) }),
("minimax/MiniMax-M2", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(200000) }),
("minimax/MiniMax-M2.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(1000000) }),
("minimax/MiniMax-M2.1-lightning", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.4, max_input_tokens: Some(1000000) }),
("minimax/MiniMax-M2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(1000000) }),
("minimax/MiniMax-M2.5-lightning", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.4, max_input_tokens: Some(1000000) }),
("minimax/minimax-m2", ModelPrice { input_per_mtok: 0.255, output_per_mtok: 1.02, max_input_tokens: Some(204800) }),
("minimax/minimax-m2.1", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.2, max_input_tokens: Some(204000) }),
("minimax/minimax-m2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.1, max_input_tokens: Some(196608) }),
("minimaxai/minimax-m2-maas", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(196608) }),
("ministral-3-14b-2512", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(262144) }),
("ministral-3-3b-2512", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("ministral-3-8b-2512", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(262144) }),
("mistral-7b-instruct", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.28, max_input_tokens: Some(4096) }),
("mistral-large-2402", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(32000) }),
("mistral-large-2407", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 9.0, max_input_tokens: Some(128000) }),
("mistral-large-2411", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("mistral-large-2512", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(262144) }),
("mistral-large-3", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(262144) }),
("mistral-large-latest", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(262144) }),
("mistral-large@2407", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("mistral-large@2411-001", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("mistral-large@latest", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("mistral-medium", ModelPrice { input_per_mtok: 2.7, output_per_mtok: 8.1, max_input_tokens: Some(32000) }),
("mistral-medium-2312", ModelPrice { input_per_mtok: 2.7, output_per_mtok: 8.1, max_input_tokens: Some(32000) }),
("mistral-medium-2505", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(131072) }),
("mistral-medium-3", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("mistral-medium-3-1-2508", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(131072) }),
("mistral-medium-3@001", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("mistral-medium-latest", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(131072) }),
("mistral-nemo@2407", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 3.0, max_input_tokens: Some(128000) }),
("mistral-nemo@latest", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("mistral-small", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32000) }),
("mistral-small-2503", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(128000) }),
("mistral-small-2503@001", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32000) }),
("mistral-small-3-2-2506", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.18, max_input_tokens: Some(131072) }),
("mistral-small-latest", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.18, max_input_tokens: Some(131072) }),
("mistral-tiny", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.25, max_input_tokens: Some(32000) }),
("mistral.devstral-2-123b", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(256000) }),
("mistral.magistral-small-2509", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(128000) }),
("mistral.ministral-3-14b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("mistral.ministral-3-3b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("mistral.ministral-3-8b-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("mistral.mistral-7b-instruct-v0:2", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.2, max_input_tokens: Some(32000) }),
("mistral.mistral-large-2402-v1:0", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(32000) }),
("mistral.mistral-large-2407-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 9.0, max_input_tokens: Some(128000) }),
("mistral.mistral-large-3-675b-instruct", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(128000) }),
("mistral.mistral-small-2402-v1:0", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32000) }),
("mistral.mixtral-8x7b-instruct-v0:1", ModelPrice { input_per_mtok: 0.45, output_per_mtok: 0.7, max_input_tokens: Some(32000) }),
("mistral.voxtral-mini-3b-2507", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.04, max_input_tokens: Some(128000) }),
("mistral.voxtral-small-24b-2507", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(128000) }),
("mistralai/Mixtral-8x7B-Instruct-v0.1", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: None }),
("mistralai/codestral-2", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("mistralai/codestral-2@001", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("mistralai/devstral-2512", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("mistralai/ministral-14b-2512", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(262144) }),
("mistralai/ministral-3b-2512", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("mistralai/ministral-8b-2512", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(262144) }),
("mistralai/mistral-7b-instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.13, max_input_tokens: Some(8192) }),
("mistralai/mistral-7b-instruct-v0.2", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.25, max_input_tokens: Some(4096) }),
("mistralai/mistral-7b-v0.1", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.25, max_input_tokens: Some(4096) }),
("mistralai/mistral-large", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(32000) }),
("mistralai/mistral-large-2512", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(262144) }),
("mistralai/mistral-medium-3", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("mistralai/mistral-medium-3@001", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("mistralai/mistral-small-3.1-24b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32000) }),
("mistralai/mistral-small-3.2-24b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32000) }),
("mistralai/mixtral-8x22b-instruct", ModelPrice { input_per_mtok: 0.65, output_per_mtok: 0.65, max_input_tokens: Some(65536) }),
("mistralai/mixtral-8x7b-instruct-v0.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.0, max_input_tokens: Some(4096) }),
("mixtral-8x7b-instruct", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.28, max_input_tokens: Some(4096) }),
("moonshot.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(128000) }),
("moonshot/kimi-k2-0711-preview", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(131072) }),
("moonshot/kimi-k2-0905-preview", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("moonshot/kimi-k2-thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("moonshot/kimi-k2-thinking-turbo", ModelPrice { input_per_mtok: 1.15, output_per_mtok: 8.0, max_input_tokens: Some(262144) }),
("moonshot/kimi-k2-turbo-preview", ModelPrice { input_per_mtok: 1.15, output_per_mtok: 8.0, max_input_tokens: Some(262144) }),
("moonshot/kimi-k2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("moonshot/kimi-k2.6", ModelPrice { input_per_mtok: 0.95, output_per_mtok: 4.0, max_input_tokens: Some(262144) }),
("moonshot/kimi-latest", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(131072) }),
("moonshot/kimi-latest-128k", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(131072) }),
("moonshot/kimi-latest-32k", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32768) }),
("moonshot/kimi-latest-8k", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 2.0, max_input_tokens: Some(8192) }),
("moonshot/kimi-thinking-preview", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(131072) }),
("moonshot/moonshot-v1-128k", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(131072) }),
("moonshot/moonshot-v1-128k-0430", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(131072) }),
("moonshot/moonshot-v1-128k-vision-preview", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(131072) }),
("moonshot/moonshot-v1-32k", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32768) }),
("moonshot/moonshot-v1-32k-0430", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32768) }),
("moonshot/moonshot-v1-32k-vision-preview", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(32768) }),
("moonshot/moonshot-v1-8k", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 2.0, max_input_tokens: Some(8192) }),
("moonshot/moonshot-v1-8k-0430", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 2.0, max_input_tokens: Some(8192) }),
("moonshot/moonshot-v1-8k-vision-preview", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 2.0, max_input_tokens: Some(8192) }),
("moonshot/moonshot-v1-auto", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(131072) }),
("moonshotai.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.73, output_per_mtok: 3.03, max_input_tokens: Some(262144) }),
("moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.03, max_input_tokens: Some(262144) }),
("moonshotai/Kimi-K2-Instruct", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: None }),
("moonshotai/Kimi-K2-Instruct-0905", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("moonshotai/Kimi-K2.5", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 2.8, max_input_tokens: Some(256000) }),
("moonshotai/kimi-k2-instruct-0905", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("moonshotai/kimi-k2-thinking-maas", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(256000) }),
("moonshotai/kimi-k2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("morph/morph-v3-fast", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 1.2, max_input_tokens: Some(16000) }),
("morph/morph-v3-large", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 1.9, max_input_tokens: Some(16000) }),
("nebius/NousResearch/Hermes-3-Llama-3.1-405B", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(128000) }),
("nebius/Qwen/QwQ-32B", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.45, max_input_tokens: Some(32768) }),
("nebius/Qwen/Qwen2-VL-72B-Instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("nebius/Qwen/Qwen2-VL-7B-Instruct", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.06, max_input_tokens: Some(131072) }),
("nebius/Qwen/Qwen2.5-32B-Instruct", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("nebius/Qwen/Qwen2.5-72B-Instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.4, max_input_tokens: Some(128000) }),
("nebius/Qwen/Qwen2.5-Coder-7B", ModelPrice { input_per_mtok: 0.01, output_per_mtok: 0.03, max_input_tokens: Some(32768) }),
("nebius/Qwen/Qwen2.5-VL-72B-Instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("nebius/Qwen/Qwen3-14B", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.24, max_input_tokens: Some(32768) }),
("nebius/Qwen/Qwen3-235B-A22B", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("nebius/Qwen/Qwen3-30B-A3B", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("nebius/Qwen/Qwen3-32B", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32768) }),
("nebius/Qwen/Qwen3-4B", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.24, max_input_tokens: Some(32768) }),
("nebius/deepseek-ai/DeepSeek-R1", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 2.4, max_input_tokens: Some(128000) }),
("nebius/deepseek-ai/DeepSeek-R1-0528", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 2.4, max_input_tokens: Some(164000) }),
("nebius/deepseek-ai/DeepSeek-R1-Distill-Llama-70B", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.75, max_input_tokens: Some(128000) }),
("nebius/deepseek-ai/DeepSeek-V3", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(128000) }),
("nebius/deepseek-ai/DeepSeek-V3-0324", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(128000) }),
("nebius/google/gemma-3-27b-it", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("nebius/meta-llama/Llama-3.3-70B-Instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.4, max_input_tokens: Some(128000) }),
("nebius/meta-llama/Llama-Guard-3-8B", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.06, max_input_tokens: Some(128000) }),
("nebius/meta-llama/Meta-Llama-3.1-405B-Instruct", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.0, max_input_tokens: Some(128000) }),
("nebius/meta-llama/Meta-Llama-3.1-70B-Instruct", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.4, max_input_tokens: Some(128000) }),
("nebius/meta-llama/Meta-Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.06, max_input_tokens: Some(128000) }),
("nebius/mistralai/Mistral-Nemo-Instruct-2407", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.12, max_input_tokens: Some(128000) }),
("nebius/nvidia/Llama-3.1-Nemotron-Ultra-253B-v1", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.8, max_input_tokens: Some(128000) }),
("nebius/nvidia/Llama-3.3-Nemotron-Super-49B-v1", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("novita/Sao10K/L3-8B-Stheno-v3.2", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.05, max_input_tokens: Some(8192) }),
("novita/baichuan/baichuan-m2-32b", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.07, max_input_tokens: Some(131072) }),
("novita/baidu/ernie-4.5-21B-a3b", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.28, max_input_tokens: Some(120000) }),
("novita/baidu/ernie-4.5-21B-a3b-thinking", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.28, max_input_tokens: Some(131072) }),
("novita/baidu/ernie-4.5-300b-a47b-paddle", ModelPrice { input_per_mtok: 0.28, output_per_mtok: 1.1, max_input_tokens: Some(123000) }),
("novita/baidu/ernie-4.5-vl-28b-a3b", ModelPrice { input_per_mtok: 0.14, output_per_mtok: 0.56, max_input_tokens: Some(30000) }),
("novita/baidu/ernie-4.5-vl-28b-a3b-thinking", ModelPrice { input_per_mtok: 0.39, output_per_mtok: 0.39, max_input_tokens: Some(131072) }),
("novita/baidu/ernie-4.5-vl-424b-a47b", ModelPrice { input_per_mtok: 0.42, output_per_mtok: 1.25, max_input_tokens: Some(123000) }),
("novita/deepseek/deepseek-ocr", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.03, max_input_tokens: Some(8192) }),
("novita/deepseek/deepseek-prover-v2-671b", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 2.5, max_input_tokens: Some(160000) }),
("novita/deepseek/deepseek-r1-0528", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 2.5, max_input_tokens: Some(163840) }),
("novita/deepseek/deepseek-r1-0528-qwen3-8b", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.09, max_input_tokens: Some(128000) }),
("novita/deepseek/deepseek-r1-distill-llama-70b", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 0.8, max_input_tokens: Some(8192) }),
("novita/deepseek/deepseek-r1-distill-qwen-14b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(32768) }),
("novita/deepseek/deepseek-r1-distill-qwen-32b", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.3, max_input_tokens: Some(64000) }),
("novita/deepseek/deepseek-r1-turbo", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 2.5, max_input_tokens: Some(64000) }),
("novita/deepseek/deepseek-v3-0324", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.12, max_input_tokens: Some(163840) }),
("novita/deepseek/deepseek-v3-turbo", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.3, max_input_tokens: Some(64000) }),
("novita/deepseek/deepseek-v3.1", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.0, max_input_tokens: Some(131072) }),
("novita/deepseek/deepseek-v3.1-terminus", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 1.0, max_input_tokens: Some(131072) }),
("novita/deepseek/deepseek-v3.2", ModelPrice { input_per_mtok: 0.269, output_per_mtok: 0.4, max_input_tokens: Some(163840) }),
("novita/deepseek/deepseek-v3.2-exp", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 0.41, max_input_tokens: Some(163840) }),
("novita/google/gemma-3-12b-it", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.1, max_input_tokens: Some(131072) }),
("novita/google/gemma-3-27b-it", ModelPrice { input_per_mtok: 0.119, output_per_mtok: 0.2, max_input_tokens: Some(98304) }),
("novita/gryphe/mythomax-l2-13b", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.09, max_input_tokens: Some(4096) }),
("novita/kwaipilot/kat-coder-pro", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(256000) }),
("novita/meta-llama/llama-3-70b-instruct", ModelPrice { input_per_mtok: 0.51, output_per_mtok: 0.74, max_input_tokens: Some(8192) }),
("novita/meta-llama/llama-3-8b-instruct", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.04, max_input_tokens: Some(8192) }),
("novita/meta-llama/llama-3.1-8b-instruct", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.05, max_input_tokens: Some(16384) }),
("novita/meta-llama/llama-3.2-3b-instruct", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.05, max_input_tokens: Some(32768) }),
("novita/meta-llama/llama-3.3-70b-instruct", ModelPrice { input_per_mtok: 0.135, output_per_mtok: 0.4, max_input_tokens: Some(131072) }),
("novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8", ModelPrice { input_per_mtok: 0.27, output_per_mtok: 0.85, max_input_tokens: Some(1048576) }),
("novita/meta-llama/llama-4-scout-17b-16e-instruct", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.59, max_input_tokens: Some(131072) }),
("novita/microsoft/wizardlm-2-8x22b", ModelPrice { input_per_mtok: 0.62, output_per_mtok: 0.62, max_input_tokens: Some(65535) }),
("novita/minimax/minimax-m2", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(204800) }),
("novita/minimax/minimax-m2.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(204800) }),
("novita/minimaxai/minimax-m1-80k", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.2, max_input_tokens: Some(1000000) }),
("novita/mistralai/mistral-nemo", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.17, max_input_tokens: Some(60288) }),
("novita/moonshotai/kimi-k2-0905", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("novita/moonshotai/kimi-k2-instruct", ModelPrice { input_per_mtok: 0.57, output_per_mtok: 2.3, max_input_tokens: Some(131072) }),
("novita/moonshotai/kimi-k2-thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("novita/nousresearch/hermes-2-pro-llama-3-8b", ModelPrice { input_per_mtok: 0.14, output_per_mtok: 0.14, max_input_tokens: Some(8192) }),
("novita/openai/gpt-oss-120b", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.25, max_input_tokens: Some(131072) }),
("novita/openai/gpt-oss-20b", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.15, max_input_tokens: Some(131072) }),
("novita/paddlepaddle/paddleocr-vl", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.02, max_input_tokens: Some(16384) }),
("novita/qwen/qwen-2.5-72b-instruct", ModelPrice { input_per_mtok: 0.38, output_per_mtok: 0.4, max_input_tokens: Some(32000) }),
("novita/qwen/qwen-mt-plus", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.75, max_input_tokens: Some(16384) }),
("novita/qwen/qwen2.5-7b-instruct", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.07, max_input_tokens: Some(32000) }),
("novita/qwen/qwen2.5-vl-72b-instruct", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 0.8, max_input_tokens: Some(32768) }),
("novita/qwen/qwen3-235b-a22b-fp8", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.8, max_input_tokens: Some(40960) }),
("novita/qwen/qwen3-235b-a22b-instruct-2507", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.58, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-235b-a22b-thinking-2507", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 3.0, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-30b-a3b-fp8", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.45, max_input_tokens: Some(40960) }),
("novita/qwen/qwen3-32b-fp8", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.45, max_input_tokens: Some(40960) }),
("novita/qwen/qwen3-4b-fp8", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.03, max_input_tokens: Some(128000) }),
("novita/qwen/qwen3-8b-fp8", ModelPrice { input_per_mtok: 0.035, output_per_mtok: 0.138, max_input_tokens: Some(128000) }),
("novita/qwen/qwen3-coder-30b-a3b-instruct", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.27, max_input_tokens: Some(160000) }),
("novita/qwen/qwen3-coder-480b-a35b-instruct", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.3, max_input_tokens: Some(262144) }),
("novita/qwen/qwen3-max", ModelPrice { input_per_mtok: 2.11, output_per_mtok: 8.45, max_input_tokens: Some(262144) }),
("novita/qwen/qwen3-next-80b-a3b-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.5, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-next-80b-a3b-thinking", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.5, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-omni-30b-a3b-instruct", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.97, max_input_tokens: Some(65536) }),
("novita/qwen/qwen3-omni-30b-a3b-thinking", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.97, max_input_tokens: Some(65536) }),
("novita/qwen/qwen3-vl-235b-a22b-instruct", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.5, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-vl-235b-a22b-thinking", ModelPrice { input_per_mtok: 0.98, output_per_mtok: 3.95, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-vl-30b-a3b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.7, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-vl-30b-a3b-thinking", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.0, max_input_tokens: Some(131072) }),
("novita/qwen/qwen3-vl-8b-instruct", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("novita/sao10k/l3-70b-euryale-v2.1", ModelPrice { input_per_mtok: 1.48, output_per_mtok: 1.48, max_input_tokens: Some(8192) }),
("novita/sao10k/l3-8b-lunaris", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.05, max_input_tokens: Some(8192) }),
("novita/sao10k/l31-70b-euryale-v2.2", ModelPrice { input_per_mtok: 1.48, output_per_mtok: 1.48, max_input_tokens: Some(8192) }),
("novita/skywork/r1v4-lite", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("novita/xiaomimimo/mimo-v2-flash", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(262144) }),
("novita/zai-org/autoglm-phone-9b-multilingual", ModelPrice { input_per_mtok: 0.035, output_per_mtok: 0.138, max_input_tokens: Some(65536) }),
("novita/zai-org/glm-4.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(131072) }),
("novita/zai-org/glm-4.5-air", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.85, max_input_tokens: Some(131072) }),
("novita/zai-org/glm-4.5v", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.8, max_input_tokens: Some(65536) }),
("novita/zai-org/glm-4.6", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.2, max_input_tokens: Some(204800) }),
("novita/zai-org/glm-4.6v", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.9, max_input_tokens: Some(131072) }),
("novita/zai-org/glm-4.7", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(204800) }),
("nscale/Qwen/QwQ-32B", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.2, max_input_tokens: None }),
("nscale/Qwen/Qwen2.5-Coder-32B-Instruct", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.2, max_input_tokens: None }),
("nscale/Qwen/Qwen2.5-Coder-3B-Instruct", ModelPrice { input_per_mtok: 0.01, output_per_mtok: 0.03, max_input_tokens: None }),
("nscale/Qwen/Qwen2.5-Coder-7B-Instruct", ModelPrice { input_per_mtok: 0.01, output_per_mtok: 0.03, max_input_tokens: None }),
("nscale/deepseek-ai/DeepSeek-R1-Distill-Llama-70B", ModelPrice { input_per_mtok: 0.375, output_per_mtok: 0.375, max_input_tokens: None }),
("nscale/deepseek-ai/DeepSeek-R1-Distill-Llama-8B", ModelPrice { input_per_mtok: 0.025, output_per_mtok: 0.025, max_input_tokens: None }),
("nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.09, max_input_tokens: None }),
("nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.07, max_input_tokens: None }),
("nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: None }),
("nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: None }),
("nscale/meta-llama/Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 0.03, output_per_mtok: 0.03, max_input_tokens: None }),
("nscale/meta-llama/Llama-3.3-70B-Instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: None }),
("nscale/meta-llama/Llama-4-Scout-17B-16E-Instruct", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.29, max_input_tokens: None }),
("nscale/mistralai/mixtral-8x22b-instruct-v0.1", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: None }),
("nvidia.nemotron-nano-12b-v2", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("nvidia.nemotron-nano-3-30b", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.24, max_input_tokens: Some(262144) }),
("nvidia.nemotron-nano-9b-v2", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.23, max_input_tokens: Some(128000) }),
("nvidia.nemotron-super-3-120b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.65, max_input_tokens: Some(256000) }),
("o1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 60.0, max_input_tokens: Some(200000) }),
("o1-2024-12-17", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 60.0, max_input_tokens: Some(200000) }),
("o1-mini", ModelPrice { input_per_mtok: 1.21, output_per_mtok: 4.84, max_input_tokens: Some(128000) }),
("o1-mini-2024-09-12", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(128000) }),
("o1-preview", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 60.0, max_input_tokens: Some(128000) }),
("o1-preview-2024-09-12", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 60.0, max_input_tokens: Some(128000) }),
("o1-pro", ModelPrice { input_per_mtok: 150.0, output_per_mtok: 600.0, max_input_tokens: Some(200000) }),
("o1-pro-2025-03-19", ModelPrice { input_per_mtok: 150.0, output_per_mtok: 600.0, max_input_tokens: Some(200000) }),
("o3", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(200000) }),
("o3-2025-04-16", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(200000) }),
("o3-deep-research", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 40.0, max_input_tokens: Some(200000) }),
("o3-deep-research-2025-06-26", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 40.0, max_input_tokens: Some(200000) }),
("o3-mini", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(200000) }),
("o3-mini-2025-01-31", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(200000) }),
("o3-mini-high", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(128000) }),
("o3-pro", ModelPrice { input_per_mtok: 20.0, output_per_mtok: 80.0, max_input_tokens: Some(200000) }),
("o3-pro-2025-06-10", ModelPrice { input_per_mtok: 20.0, output_per_mtok: 80.0, max_input_tokens: Some(200000) }),
("o4-mini", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(200000) }),
("o4-mini-2025-04-16", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(200000) }),
("o4-mini-deep-research", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(200000) }),
("o4-mini-deep-research-2025-06-26", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(200000) }),
("oci/cohere.command-a-03-2025", ModelPrice { input_per_mtok: 1.56, output_per_mtok: 1.56, max_input_tokens: Some(256000) }),
("oci/cohere.command-a-reasoning-08-2025", ModelPrice { input_per_mtok: 1.56, output_per_mtok: 1.56, max_input_tokens: Some(256000) }),
("oci/cohere.command-a-translate-08-2025", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.09, max_input_tokens: Some(256000) }),
("oci/cohere.command-a-vision-07-2025", ModelPrice { input_per_mtok: 1.56, output_per_mtok: 1.56, max_input_tokens: Some(128000) }),
("oci/cohere.command-latest", ModelPrice { input_per_mtok: 1.56, output_per_mtok: 1.56, max_input_tokens: Some(128000) }),
("oci/cohere.command-plus-latest", ModelPrice { input_per_mtok: 1.56, output_per_mtok: 1.56, max_input_tokens: Some(128000) }),
("oci/cohere.command-r-08-2024", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("oci/cohere.command-r-plus-08-2024", ModelPrice { input_per_mtok: 1.56, output_per_mtok: 1.56, max_input_tokens: Some(128000) }),
("oci/google.gemini-2.5-flash", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(1048576) }),
("oci/google.gemini-2.5-flash-lite", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(1048576) }),
("oci/google.gemini-2.5-pro", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: Some(1048576) }),
("oci/meta.llama-3.1-405b-instruct", ModelPrice { input_per_mtok: 10.68, output_per_mtok: 10.68, max_input_tokens: Some(128000) }),
("oci/meta.llama-3.1-70b-instruct", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("oci/meta.llama-3.2-11b-vision-instruct", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("oci/meta.llama-3.2-90b-vision-instruct", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("oci/meta.llama-3.3-70b-instruct", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("oci/meta.llama-3.3-70b-instruct-fp8-dynamic", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("oci/meta.llama-4-maverick-17b-128e-instruct-fp8", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(512000) }),
("oci/meta.llama-4-scout-17b-16e-instruct", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(192000) }),
("oci/xai.grok-3", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("oci/xai.grok-3-fast", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(131072) }),
("oci/xai.grok-3-mini", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("oci/xai.grok-3-mini-fast", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 4.0, max_input_tokens: Some(131072) }),
("oci/xai.grok-4", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("oci/xai.grok-4-fast", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(131072) }),
("oci/xai.grok-4.1-fast", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(131072) }),
("oci/xai.grok-4.20", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("oci/xai.grok-4.20-multi-agent", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("oci/xai.grok-code-fast-1", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(131072) }),
("open-codestral-mamba", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.25, max_input_tokens: Some(256000) }),
("open-mistral-7b", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 0.25, max_input_tokens: Some(32000) }),
("open-mistral-nemo", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.3, max_input_tokens: Some(128000) }),
("open-mistral-nemo-2407", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.3, max_input_tokens: Some(128000) }),
("open-mixtral-8x22b", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(65336) }),
("open-mixtral-8x7b", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 0.7, max_input_tokens: Some(32000) }),
("openai.gpt-oss-120b-1:0", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("openai.gpt-oss-20b-1:0", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.3, max_input_tokens: Some(128000) }),
("openai.gpt-oss-safeguard-120b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("openai.gpt-oss-safeguard-20b", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.2, max_input_tokens: Some(128000) }),
("openai/gpt-4.1", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: None }),
("openai/gpt-4.1-mini", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: None }),
("openai/gpt-4.1-nano", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: None }),
("openai/gpt-4o", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: None }),
("openai/gpt-4o-mini", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: None }),
("openai/gpt-5", ModelPrice { input_per_mtok: 1.25, output_per_mtok: 10.0, max_input_tokens: None }),
("openai/gpt-5-mini", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 2.0, max_input_tokens: None }),
("openai/gpt-5-nano", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.4, max_input_tokens: None }),
("openai/gpt-oss-120b", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.72, max_input_tokens: Some(131072) }),
("openai/gpt-oss-20b", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("openai/gpt-oss-safeguard-20b", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("openai/o1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 60.0, max_input_tokens: None }),
("openai/o1-mini", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: None }),
("openai/o4-mini", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 4.0, max_input_tokens: None }),
("ovhcloud/DeepSeek-R1-Distill-Llama-70B", ModelPrice { input_per_mtok: 0.67, output_per_mtok: 0.67, max_input_tokens: Some(131000) }),
("ovhcloud/Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(131000) }),
("ovhcloud/Meta-Llama-3_1-70B-Instruct", ModelPrice { input_per_mtok: 0.67, output_per_mtok: 0.67, max_input_tokens: Some(131000) }),
("ovhcloud/Meta-Llama-3_3-70B-Instruct", ModelPrice { input_per_mtok: 0.67, output_per_mtok: 0.67, max_input_tokens: Some(131000) }),
("ovhcloud/Mistral-7B-Instruct-v0.3", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(127000) }),
("ovhcloud/Mistral-Nemo-Instruct-2407", ModelPrice { input_per_mtok: 0.13, output_per_mtok: 0.13, max_input_tokens: Some(118000) }),
("ovhcloud/Mistral-Small-3.2-24B-Instruct-2506", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.28, max_input_tokens: Some(128000) }),
("ovhcloud/Mixtral-8x7B-Instruct-v0.1", ModelPrice { input_per_mtok: 0.63, output_per_mtok: 0.63, max_input_tokens: Some(32000) }),
("ovhcloud/Qwen2.5-Coder-32B-Instruct", ModelPrice { input_per_mtok: 0.87, output_per_mtok: 0.87, max_input_tokens: Some(32000) }),
("ovhcloud/Qwen2.5-VL-72B-Instruct", ModelPrice { input_per_mtok: 0.91, output_per_mtok: 0.91, max_input_tokens: Some(32000) }),
("ovhcloud/Qwen3-32B", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.23, max_input_tokens: Some(32000) }),
("ovhcloud/gpt-oss-120b", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.4, max_input_tokens: Some(131000) }),
("ovhcloud/gpt-oss-20b", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.15, max_input_tokens: Some(131000) }),
("ovhcloud/llava-v1.6-mistral-7b-hf", ModelPrice { input_per_mtok: 0.29, output_per_mtok: 0.29, max_input_tokens: Some(32000) }),
("ovhcloud/mamba-codestral-7B-v0.1", ModelPrice { input_per_mtok: 0.19, output_per_mtok: 0.19, max_input_tokens: Some(256000) }),
("palm/chat-bison", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.125, max_input_tokens: Some(8192) }),
("palm/chat-bison-001", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.125, max_input_tokens: Some(8192) }),
("palm/text-bison", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.125, max_input_tokens: Some(8192) }),
("palm/text-bison-001", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.125, max_input_tokens: Some(8192) }),
("palm/text-bison-safety-off", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.125, max_input_tokens: Some(8192) }),
("palm/text-bison-safety-recitation-off", ModelPrice { input_per_mtok: 0.125, output_per_mtok: 0.125, max_input_tokens: Some(8192) }),
("pixtral-12b-2409", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("pixtral-large-2411", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("pixtral-large-latest", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("pplx-70b-chat", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 2.8, max_input_tokens: Some(4096) }),
("pplx-70b-online", ModelPrice { input_per_mtok: 0.0, output_per_mtok: 2.8, max_input_tokens: Some(4096) }),
("pplx-7b-chat", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.28, max_input_tokens: Some(8192) }),
("pplx-7b-online", ModelPrice { input_per_mtok: 0.0, output_per_mtok: 0.28, max_input_tokens: Some(4096) }),
("qwen.qwen3-235b-a22b-2507-v1:0", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.88, max_input_tokens: Some(262144) }),
("qwen.qwen3-32b-v1:0", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("qwen.qwen3-coder-30b-a3b-v1:0", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("qwen.qwen3-coder-480b-a35b-v1:0", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 1.8, max_input_tokens: Some(262000) }),
("qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("qwen.qwen3-next-80b-a3b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.2, max_input_tokens: Some(128000) }),
("qwen.qwen3-vl-235b-a22b", ModelPrice { input_per_mtok: 0.53, output_per_mtok: 2.66, max_input_tokens: Some(128000) }),
("qwen/qwen-2.5-coder-32b-instruct", ModelPrice { input_per_mtok: 0.18, output_per_mtok: 0.18, max_input_tokens: Some(33792) }),
("qwen/qwen-vl-plus", ModelPrice { input_per_mtok: 0.21, output_per_mtok: 0.63, max_input_tokens: Some(8192) }),
("qwen/qwen3-235b-a22b-2507", ModelPrice { input_per_mtok: 0.071, output_per_mtok: 0.1, max_input_tokens: Some(262144) }),
("qwen/qwen3-235b-a22b-instruct-2507", ModelPrice { input_per_mtok: 0.264, output_per_mtok: 1.06, max_input_tokens: None }),
("qwen/qwen3-235b-a22b-instruct-2507-maas", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.0, max_input_tokens: Some(262144) }),
("qwen/qwen3-235b-a22b-thinking-2507", ModelPrice { input_per_mtok: 0.11, output_per_mtok: 0.6, max_input_tokens: Some(262144) }),
("qwen/qwen3-32b", ModelPrice { input_per_mtok: 0.29, output_per_mtok: 0.59, max_input_tokens: Some(131000) }),
("qwen/qwen3-coder", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.95, max_input_tokens: Some(262100) }),
("qwen/qwen3-coder-480b-a35b-instruct-maas", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 4.0, max_input_tokens: Some(262144) }),
("qwen/qwen3-coder-plus", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(997952) }),
("qwen/qwen3-next-80b-a3b-instruct-maas", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("qwen/qwen3-next-80b-a3b-thinking-maas", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("qwen/qwen3.5-122b-a10b", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.0, max_input_tokens: Some(262144) }),
("qwen/qwen3.5-27b", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.4, max_input_tokens: Some(262144) }),
("qwen/qwen3.5-35b-a3b", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 2.0, max_input_tokens: Some(262144) }),
("qwen/qwen3.5-397b-a17b", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.6, max_input_tokens: Some(262144) }),
("qwen/qwen3.5-flash-02-23", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1000000) }),
("qwen/qwen3.5-plus-02-15", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 2.4, max_input_tokens: Some(1000000) }),
("replicateopenai/gpt-oss-20b", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.36, max_input_tokens: None }),
("sa-east-1/deepseek.v3.2", ModelPrice { input_per_mtok: 0.74, output_per_mtok: 2.22, max_input_tokens: Some(163840) }),
("sa-east-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 4.45, output_per_mtok: 5.88, max_input_tokens: Some(8192) }),
("sa-east-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.01, max_input_tokens: Some(8192) }),
("sa-east-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(196000) }),
("sa-east-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.36, output_per_mtok: 1.44, max_input_tokens: Some(1000000) }),
("sa-east-1/moonshotai.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.73, output_per_mtok: 3.03, max_input_tokens: Some(262144) }),
("sa-east-1/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 3.6, max_input_tokens: Some(262144) }),
("sa-east-1/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.44, max_input_tokens: Some(262144) }),
("sambanova/DeepSeek-R1", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 7.0, max_input_tokens: Some(32768) }),
("sambanova/DeepSeek-R1-Distill-Llama-70B", ModelPrice { input_per_mtok: 0.7, output_per_mtok: 1.4, max_input_tokens: Some(131072) }),
("sambanova/DeepSeek-V3-0324", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 4.5, max_input_tokens: Some(32768) }),
("sambanova/DeepSeek-V3.1", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 4.5, max_input_tokens: Some(32768) }),
("sambanova/Llama-4-Maverick-17B-128E-Instruct", ModelPrice { input_per_mtok: 0.63, output_per_mtok: 1.8, max_input_tokens: Some(131072) }),
("sambanova/Llama-4-Scout-17B-16E-Instruct", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.7, max_input_tokens: Some(8192) }),
("sambanova/Meta-Llama-3.1-405B-Instruct", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 10.0, max_input_tokens: Some(16384) }),
("sambanova/Meta-Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.2, max_input_tokens: Some(16384) }),
("sambanova/Meta-Llama-3.2-1B-Instruct", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.08, max_input_tokens: Some(16384) }),
("sambanova/Meta-Llama-3.2-3B-Instruct", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.16, max_input_tokens: Some(4096) }),
("sambanova/Meta-Llama-3.3-70B-Instruct", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.2, max_input_tokens: Some(131072) }),
("sambanova/Meta-Llama-Guard-3-8B", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.3, max_input_tokens: Some(16384) }),
("sambanova/QwQ-32B", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.0, max_input_tokens: Some(16384) }),
("sambanova/Qwen2-Audio-7B-Instruct", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 100.0, max_input_tokens: Some(4096) }),
("sambanova/Qwen3-32B", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 0.8, max_input_tokens: Some(8192) }),
("sambanova/gpt-oss-120b", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 4.5, max_input_tokens: Some(131072) }),
("sonar", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(128000) }),
("sonar-deep-research", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(128000) }),
("sonar-medium-chat", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.8, max_input_tokens: Some(16384) }),
("sonar-medium-online", ModelPrice { input_per_mtok: 0.0, output_per_mtok: 1.8, max_input_tokens: Some(12000) }),
("sonar-pro", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("sonar-reasoning", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(128000) }),
("sonar-reasoning-pro", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(128000) }),
("sonar-small-chat", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.28, max_input_tokens: Some(16384) }),
("sonar-small-online", ModelPrice { input_per_mtok: 0.0, output_per_mtok: 0.28, max_input_tokens: Some(12000) }),
("switchpoint/router", ModelPrice { input_per_mtok: 0.85, output_per_mtok: 3.4, max_input_tokens: Some(131072) }),
("text-unicorn", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 28.0, max_input_tokens: Some(8192) }),
("text-unicorn@001", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 28.0, max_input_tokens: Some(8192) }),
("together-ai-21.1b-41b", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 0.8, max_input_tokens: None }),
("together-ai-4.1b-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: None }),
("together-ai-41.1b-80b", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: None }),
("together-ai-8.1b-21b", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.3, max_input_tokens: Some(1000) }),
("together-ai-81.1b-110b", ModelPrice { input_per_mtok: 1.8, output_per_mtok: 1.8, max_input_tokens: None }),
("together-ai-up-to-4b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: None }),
("undi95/remm-slerp-l2-13b", ModelPrice { input_per_mtok: 1.875, output_per_mtok: 1.875, max_input_tokens: Some(6144) }),
("us-east-1/anthropic.claude-instant-v1", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 2.4, max_input_tokens: Some(100000) }),
("us-east-1/anthropic.claude-v1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("us-east-1/anthropic.claude-v2:1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("us-east-1/deepseek.v3.2", ModelPrice { input_per_mtok: 0.62, output_per_mtok: 1.85, max_input_tokens: Some(163840) }),
("us-east-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 2.65, output_per_mtok: 3.5, max_input_tokens: Some(8192) }),
("us-east-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("us-east-1/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(196000) }),
("us-east-1/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(1000000) }),
("us-east-1/mistral.mistral-7b-instruct-v0:2", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.2, max_input_tokens: Some(32000) }),
("us-east-1/mistral.mistral-large-2402-v1:0", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(32000) }),
("us-east-1/mistral.mixtral-8x7b-instruct-v0:1", ModelPrice { input_per_mtok: 0.45, output_per_mtok: 0.7, max_input_tokens: Some(32000) }),
("us-east-1/moonshotai.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("us-east-1/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("us-east-1/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("us-east-2/deepseek.v3.2", ModelPrice { input_per_mtok: 0.62, output_per_mtok: 1.85, max_input_tokens: Some(163840) }),
("us-east-2/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(196000) }),
("us-east-2/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(1000000) }),
("us-east-2/moonshotai.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("us-east-2/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("us-east-2/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("us-gov-east-1/amazon.nova-pro-v1:0", ModelPrice { input_per_mtok: 0.96, output_per_mtok: 3.84, max_input_tokens: Some(300000) }),
("us-gov-east-1/amazon.titan-text-express-v1", ModelPrice { input_per_mtok: 1.3, output_per_mtok: 1.7, max_input_tokens: Some(42000) }),
("us-gov-east-1/amazon.titan-text-lite-v1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.4, max_input_tokens: Some(42000) }),
("us-gov-east-1/amazon.titan-text-premier-v1:0", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(42000) }),
("us-gov-east-1/anthropic.claude-3-5-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.6, output_per_mtok: 18.0, max_input_tokens: Some(200000) }),
("us-gov-east-1/anthropic.claude-3-haiku-20240307-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.5, max_input_tokens: Some(200000) }),
("us-gov-east-1/anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 6.0, max_input_tokens: Some(200000) }),
("us-gov-east-1/anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("us-gov-east-1/claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("us-gov-east-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 2.65, output_per_mtok: 3.5, max_input_tokens: Some(8000) }),
("us-gov-east-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.65, max_input_tokens: Some(8000) }),
("us-gov-west-1/amazon.nova-pro-v1:0", ModelPrice { input_per_mtok: 0.96, output_per_mtok: 3.84, max_input_tokens: Some(300000) }),
("us-gov-west-1/amazon.titan-text-express-v1", ModelPrice { input_per_mtok: 1.3, output_per_mtok: 1.7, max_input_tokens: Some(42000) }),
("us-gov-west-1/amazon.titan-text-lite-v1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.4, max_input_tokens: Some(42000) }),
("us-gov-west-1/amazon.titan-text-premier-v1:0", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(42000) }),
("us-gov-west-1/anthropic.claude-3-5-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.6, output_per_mtok: 18.0, max_input_tokens: Some(200000) }),
("us-gov-west-1/anthropic.claude-3-7-sonnet-20250219-v1:0", ModelPrice { input_per_mtok: 3.6, output_per_mtok: 18.0, max_input_tokens: Some(200000) }),
("us-gov-west-1/anthropic.claude-3-haiku-20240307-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.5, max_input_tokens: Some(200000) }),
("us-gov-west-1/anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 6.0, max_input_tokens: Some(200000) }),
("us-gov-west-1/anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("us-gov-west-1/claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("us-gov-west-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 2.65, output_per_mtok: 3.5, max_input_tokens: Some(8000) }),
("us-gov-west-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.65, max_input_tokens: Some(8000) }),
("us-gov.anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("us-west-1/meta.llama3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 2.65, output_per_mtok: 3.5, max_input_tokens: Some(8192) }),
("us-west-1/meta.llama3-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("us-west-2/anthropic.claude-instant-v1", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 2.4, max_input_tokens: Some(100000) }),
("us-west-2/anthropic.claude-v1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("us-west-2/anthropic.claude-v2:1", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(100000) }),
("us-west-2/deepseek.v3.2", ModelPrice { input_per_mtok: 0.62, output_per_mtok: 1.85, max_input_tokens: Some(163840) }),
("us-west-2/minimax.minimax-m2.1", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(196000) }),
("us-west-2/minimax.minimax-m2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(1000000) }),
("us-west-2/mistral.mistral-7b-instruct-v0:2", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.2, max_input_tokens: Some(32000) }),
("us-west-2/mistral.mistral-large-2402-v1:0", ModelPrice { input_per_mtok: 8.0, output_per_mtok: 24.0, max_input_tokens: Some(32000) }),
("us-west-2/mistral.mixtral-8x7b-instruct-v0:1", ModelPrice { input_per_mtok: 0.45, output_per_mtok: 0.7, max_input_tokens: Some(32000) }),
("us-west-2/moonshotai.kimi-k2-thinking", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(262144) }),
("us-west-2/moonshotai.kimi-k2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("us-west-2/qwen.qwen3-coder-next", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.2, max_input_tokens: Some(262144) }),
("us.amazon.nova-2-lite-v1:0", ModelPrice { input_per_mtok: 0.33, output_per_mtok: 2.75, max_input_tokens: Some(1000000) }),
("us.amazon.nova-2-pro-preview-20251202-v1:0", ModelPrice { input_per_mtok: 2.1875, output_per_mtok: 17.5, max_input_tokens: Some(1000000) }),
("us.amazon.nova-lite-v1:0", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.24, max_input_tokens: Some(300000) }),
("us.amazon.nova-micro-v1:0", ModelPrice { input_per_mtok: 0.035, output_per_mtok: 0.14, max_input_tokens: Some(128000) }),
("us.amazon.nova-premier-v1:0", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 12.5, max_input_tokens: Some(1000000) }),
("us.amazon.nova-pro-v1:0", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 3.2, max_input_tokens: Some(300000) }),
("us.anthropic.claude-3-5-haiku-20241022-v1:0", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 4.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-3-5-sonnet-20240620-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-3-5-sonnet-20241022-v2:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-3-7-sonnet-20250219-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-3-haiku-20240307-v1:0", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("us.anthropic.claude-3-opus-20240229-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-3-sonnet-20240229-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-haiku-4-5-20251001-v1:0", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 5.5, max_input_tokens: Some(200000) }),
("us.anthropic.claude-opus-4-1-20250805-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-opus-4-20250514-v1:0", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("us.anthropic.claude-opus-4-5-20251101-v1:0", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 27.5, max_input_tokens: Some(200000) }),
("us.anthropic.claude-opus-4-6-v1", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 27.5, max_input_tokens: Some(1000000) }),
("us.anthropic.claude-opus-4-7", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 27.5, max_input_tokens: Some(1000000) }),
("us.anthropic.claude-sonnet-4-20250514-v1:0", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("us.anthropic.claude-sonnet-4-5-20250929-v1:0", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(200000) }),
("us.anthropic.claude-sonnet-4-6", ModelPrice { input_per_mtok: 3.3, output_per_mtok: 16.5, max_input_tokens: Some(1000000) }),
("us.deepseek.r1-v1:0", ModelPrice { input_per_mtok: 1.35, output_per_mtok: 5.4, max_input_tokens: Some(128000) }),
("us.deepseek.v3.2", ModelPrice { input_per_mtok: 0.62, output_per_mtok: 1.85, max_input_tokens: Some(163840) }),
("us.meta.llama3-1-405b-instruct-v1:0", ModelPrice { input_per_mtok: 5.32, output_per_mtok: 16.0, max_input_tokens: Some(128000) }),
("us.meta.llama3-1-70b-instruct-v1:0", ModelPrice { input_per_mtok: 0.99, output_per_mtok: 0.99, max_input_tokens: Some(128000) }),
("us.meta.llama3-1-8b-instruct-v1:0", ModelPrice { input_per_mtok: 0.22, output_per_mtok: 0.22, max_input_tokens: Some(128000) }),
("us.meta.llama3-2-11b-instruct-v1:0", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 0.35, max_input_tokens: Some(128000) }),
("us.meta.llama3-2-1b-instruct-v1:0", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("us.meta.llama3-2-3b-instruct-v1:0", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("us.meta.llama3-2-90b-instruct-v1:0", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("us.meta.llama3-3-70b-instruct-v1:0", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("us.meta.llama4-maverick-17b-instruct-v1:0", ModelPrice { input_per_mtok: 0.24, output_per_mtok: 0.97, max_input_tokens: Some(128000) }),
("us.meta.llama4-scout-17b-instruct-v1:0", ModelPrice { input_per_mtok: 0.17, output_per_mtok: 0.66, max_input_tokens: Some(128000) }),
("us.mistral.pixtral-large-2502-v1:0", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("us.writer.palmyra-x4-v1:0", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("us.writer.palmyra-x5-v1:0", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 6.0, max_input_tokens: Some(1000000) }),
("us/gpt-4.1-2025-04-14", ModelPrice { input_per_mtok: 2.2, output_per_mtok: 8.8, max_input_tokens: Some(1047576) }),
("us/gpt-4.1-mini-2025-04-14", ModelPrice { input_per_mtok: 0.44, output_per_mtok: 1.76, max_input_tokens: Some(1047576) }),
("us/gpt-4.1-nano-2025-04-14", ModelPrice { input_per_mtok: 0.11, output_per_mtok: 0.44, max_input_tokens: Some(1047576) }),
("us/gpt-4o-2024-08-06", ModelPrice { input_per_mtok: 2.75, output_per_mtok: 11.0, max_input_tokens: Some(128000) }),
("us/gpt-4o-2024-11-20", ModelPrice { input_per_mtok: 2.75, output_per_mtok: 11.0, max_input_tokens: Some(128000) }),
("us/gpt-4o-mini-2024-07-18", ModelPrice { input_per_mtok: 0.165, output_per_mtok: 0.66, max_input_tokens: Some(128000) }),
("us/gpt-4o-mini-realtime-preview-2024-12-17", ModelPrice { input_per_mtok: 0.66, output_per_mtok: 2.64, max_input_tokens: Some(128000) }),
("us/gpt-4o-realtime-preview-2024-10-01", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 22.0, max_input_tokens: Some(128000) }),
("us/gpt-4o-realtime-preview-2024-12-17", ModelPrice { input_per_mtok: 5.5, output_per_mtok: 22.0, max_input_tokens: Some(128000) }),
("us/gpt-5-2025-08-07", ModelPrice { input_per_mtok: 1.375, output_per_mtok: 11.0, max_input_tokens: Some(272000) }),
("us/gpt-5-mini-2025-08-07", ModelPrice { input_per_mtok: 0.275, output_per_mtok: 2.2, max_input_tokens: Some(272000) }),
("us/gpt-5-nano-2025-08-07", ModelPrice { input_per_mtok: 0.055, output_per_mtok: 0.44, max_input_tokens: Some(272000) }),
("us/gpt-5.1", ModelPrice { input_per_mtok: 1.38, output_per_mtok: 11.0, max_input_tokens: Some(272000) }),
("us/gpt-5.1-chat", ModelPrice { input_per_mtok: 1.38, output_per_mtok: 11.0, max_input_tokens: Some(128000) }),
("us/gpt-5.1-codex", ModelPrice { input_per_mtok: 1.38, output_per_mtok: 11.0, max_input_tokens: Some(272000) }),
("us/gpt-5.1-codex-mini", ModelPrice { input_per_mtok: 0.275, output_per_mtok: 2.2, max_input_tokens: Some(272000) }),
("us/o1-2024-12-17", ModelPrice { input_per_mtok: 16.5, output_per_mtok: 66.0, max_input_tokens: Some(200000) }),
("us/o1-mini-2024-09-12", ModelPrice { input_per_mtok: 1.21, output_per_mtok: 4.84, max_input_tokens: Some(128000) }),
("us/o1-preview-2024-09-12", ModelPrice { input_per_mtok: 16.5, output_per_mtok: 66.0, max_input_tokens: Some(128000) }),
("us/o3-2025-04-16", ModelPrice { input_per_mtok: 2.2, output_per_mtok: 8.8, max_input_tokens: Some(200000) }),
("us/o3-mini-2025-01-31", ModelPrice { input_per_mtok: 1.21, output_per_mtok: 4.84, max_input_tokens: Some(200000) }),
("us/o4-mini-2025-04-16", ModelPrice { input_per_mtok: 1.21, output_per_mtok: 4.84, max_input_tokens: Some(200000) }),
("v0/v0-1.0-md", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("v0/v0-1.5-lg", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(512000) }),
("v0/v0-1.5-md", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/alibaba/qwen-3-14b", ModelPrice { input_per_mtok: 0.08, output_per_mtok: 0.24, max_input_tokens: Some(40960) }),
("vercel_ai_gateway/alibaba/qwen-3-235b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(40960) }),
("vercel_ai_gateway/alibaba/qwen-3-30b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(40960) }),
("vercel_ai_gateway/alibaba/qwen-3-32b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(40960) }),
("vercel_ai_gateway/alibaba/qwen3-coder", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: Some(262144) }),
("vercel_ai_gateway/amazon/nova-lite", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.24, max_input_tokens: Some(300000) }),
("vercel_ai_gateway/amazon/nova-micro", ModelPrice { input_per_mtok: 0.035, output_per_mtok: 0.14, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/amazon/nova-pro", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 3.2, max_input_tokens: Some(300000) }),
("vercel_ai_gateway/amazon/titan-embed-text-v2", ModelPrice { input_per_mtok: 0.02, output_per_mtok: 0.0, max_input_tokens: None }),
("vercel_ai_gateway/anthropic/claude-3-5-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-3-5-sonnet-20241022", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-3-7-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-3-haiku", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.25, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-3-opus", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-3.5-haiku", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 4.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-3.5-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-3.7-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-4-opus", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-4-sonnet", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-haiku-4.5", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-opus-4", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-opus-4.1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 75.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-opus-4.5", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-opus-4.6", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-sonnet-4", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/anthropic/claude-sonnet-4.5", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(1000000) }),
("vercel_ai_gateway/cohere/command-a", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(256000) }),
("vercel_ai_gateway/cohere/command-r", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/cohere/command-r-plus", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/cohere/embed-v4.0", ModelPrice { input_per_mtok: 0.12, output_per_mtok: 0.0, max_input_tokens: None }),
("vercel_ai_gateway/deepseek/deepseek-r1", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.19, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/deepseek/deepseek-r1-distill-llama-70b", ModelPrice { input_per_mtok: 0.75, output_per_mtok: 0.99, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/deepseek/deepseek-v3", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 0.9, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/google/gemini-2.0-flash", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(1048576) }),
("vercel_ai_gateway/google/gemini-2.0-flash-lite", ModelPrice { input_per_mtok: 0.075, output_per_mtok: 0.3, max_input_tokens: Some(1048576) }),
("vercel_ai_gateway/google/gemini-2.5-flash", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 2.5, max_input_tokens: Some(1000000) }),
("vercel_ai_gateway/google/gemini-2.5-pro", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(1048576) }),
("vercel_ai_gateway/google/gemma-2-9b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("vercel_ai_gateway/inception/mercury-coder-small", ModelPrice { input_per_mtok: 0.25, output_per_mtok: 1.0, max_input_tokens: Some(32000) }),
("vercel_ai_gateway/meta/llama-3-70b", ModelPrice { input_per_mtok: 0.59, output_per_mtok: 0.79, max_input_tokens: Some(8192) }),
("vercel_ai_gateway/meta/llama-3-8b", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.08, max_input_tokens: Some(8192) }),
("vercel_ai_gateway/meta/llama-3.1-70b", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/meta/llama-3.1-8b", ModelPrice { input_per_mtok: 0.05, output_per_mtok: 0.08, max_input_tokens: Some(131000) }),
("vercel_ai_gateway/meta/llama-3.2-11b", ModelPrice { input_per_mtok: 0.16, output_per_mtok: 0.16, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/meta/llama-3.2-1b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/meta/llama-3.2-3b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/meta/llama-3.2-90b", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/meta/llama-3.3-70b", ModelPrice { input_per_mtok: 0.72, output_per_mtok: 0.72, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/meta/llama-4-maverick", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.6, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/meta/llama-4-scout", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/mistral/codestral", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.9, max_input_tokens: Some(256000) }),
("vercel_ai_gateway/mistral/codestral-embed", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.0, max_input_tokens: None }),
("vercel_ai_gateway/mistral/devstral-small", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.28, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/mistral/magistral-medium", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 5.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/mistral/magistral-small", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/mistral/ministral-3b", ModelPrice { input_per_mtok: 0.04, output_per_mtok: 0.04, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/mistral/ministral-8b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/mistral/mistral-embed", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.0, max_input_tokens: None }),
("vercel_ai_gateway/mistral/mistral-large", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(32000) }),
("vercel_ai_gateway/mistral/mistral-saba-24b", ModelPrice { input_per_mtok: 0.79, output_per_mtok: 0.79, max_input_tokens: Some(32768) }),
("vercel_ai_gateway/mistral/mistral-small", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32000) }),
("vercel_ai_gateway/mistral/mixtral-8x22b-instruct", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 1.2, max_input_tokens: Some(65536) }),
("vercel_ai_gateway/mistral/pixtral-12b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/mistral/pixtral-large", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 6.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/moonshotai/kimi-k2", ModelPrice { input_per_mtok: 0.55, output_per_mtok: 2.2, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/morph/morph-v3-fast", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 1.2, max_input_tokens: Some(32768) }),
("vercel_ai_gateway/morph/morph-v3-large", ModelPrice { input_per_mtok: 0.9, output_per_mtok: 1.9, max_input_tokens: Some(32768) }),
("vercel_ai_gateway/openai/gpt-3.5-turbo", ModelPrice { input_per_mtok: 0.5, output_per_mtok: 1.5, max_input_tokens: Some(16385) }),
("vercel_ai_gateway/openai/gpt-3.5-turbo-instruct", ModelPrice { input_per_mtok: 1.5, output_per_mtok: 2.0, max_input_tokens: Some(8192) }),
("vercel_ai_gateway/openai/gpt-4-turbo", ModelPrice { input_per_mtok: 10.0, output_per_mtok: 30.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/openai/gpt-4.1", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(1047576) }),
("vercel_ai_gateway/openai/gpt-4.1-mini", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.6, max_input_tokens: Some(1047576) }),
("vercel_ai_gateway/openai/gpt-4.1-nano", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.4, max_input_tokens: Some(1047576) }),
("vercel_ai_gateway/openai/gpt-4o", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/openai/gpt-4o-mini", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/openai/o1", ModelPrice { input_per_mtok: 15.0, output_per_mtok: 60.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/openai/o3", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/openai/o3-mini", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/openai/o4-mini", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.4, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/perplexity/sonar", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 1.0, max_input_tokens: Some(127000) }),
("vercel_ai_gateway/perplexity/sonar-pro", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(200000) }),
("vercel_ai_gateway/perplexity/sonar-reasoning", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 5.0, max_input_tokens: Some(127000) }),
("vercel_ai_gateway/perplexity/sonar-reasoning-pro", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 8.0, max_input_tokens: Some(127000) }),
("vercel_ai_gateway/vercel/v0-1.0-md", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/vercel/v0-1.5-md", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/xai/grok-2", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/xai/grok-2-vision", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 10.0, max_input_tokens: Some(32768) }),
("vercel_ai_gateway/xai/grok-3", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/xai/grok-3-fast", ModelPrice { input_per_mtok: 5.0, output_per_mtok: 25.0, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/xai/grok-3-mini", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 0.5, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/xai/grok-3-mini-fast", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 4.0, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/xai/grok-4", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(256000) }),
("vercel_ai_gateway/zai/glm-4.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(131072) }),
("vercel_ai_gateway/zai/glm-4.5-air", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.1, max_input_tokens: Some(128000) }),
("vercel_ai_gateway/zai/glm-4.6", ModelPrice { input_per_mtok: 0.45, output_per_mtok: 1.8, max_input_tokens: Some(200000) }),
("wandb/MiniMaxAI/MiniMax-M2.5", ModelPrice { input_per_mtok: 0.3, output_per_mtok: 1.2, max_input_tokens: Some(197000) }),
("wandb/Qwen/Qwen3-235B-A22B-Instruct-2507", ModelPrice { input_per_mtok: 10000.0, output_per_mtok: 10000.0, max_input_tokens: Some(262144) }),
("wandb/Qwen/Qwen3-235B-A22B-Thinking-2507", ModelPrice { input_per_mtok: 10000.0, output_per_mtok: 10000.0, max_input_tokens: Some(262144) }),
("wandb/Qwen/Qwen3-Coder-480B-A35B-Instruct", ModelPrice { input_per_mtok: 1e+05, output_per_mtok: 1.5e+05, max_input_tokens: Some(262144) }),
("wandb/deepseek-ai/DeepSeek-R1-0528", ModelPrice { input_per_mtok: 1.35e+05, output_per_mtok: 5.4e+05, max_input_tokens: Some(161000) }),
("wandb/deepseek-ai/DeepSeek-V3-0324", ModelPrice { input_per_mtok: 1.14e+05, output_per_mtok: 2.75e+05, max_input_tokens: Some(161000) }),
("wandb/deepseek-ai/DeepSeek-V3.1", ModelPrice { input_per_mtok: 55000.0, output_per_mtok: 1.65e+05, max_input_tokens: Some(128000) }),
("wandb/meta-llama/Llama-3.1-8B-Instruct", ModelPrice { input_per_mtok: 22000.0, output_per_mtok: 22000.0, max_input_tokens: Some(128000) }),
("wandb/meta-llama/Llama-3.3-70B-Instruct", ModelPrice { input_per_mtok: 71000.0, output_per_mtok: 71000.0, max_input_tokens: Some(128000) }),
("wandb/meta-llama/Llama-4-Scout-17B-16E-Instruct", ModelPrice { input_per_mtok: 17000.0, output_per_mtok: 66000.0, max_input_tokens: Some(64000) }),
("wandb/microsoft/Phi-4-mini-instruct", ModelPrice { input_per_mtok: 8000.0, output_per_mtok: 35000.0, max_input_tokens: Some(128000) }),
("wandb/moonshotai/Kimi-K2-Instruct", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.5, max_input_tokens: Some(128000) }),
("wandb/moonshotai/Kimi-K2.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 3.0, max_input_tokens: Some(262144) }),
("wandb/openai/gpt-oss-120b", ModelPrice { input_per_mtok: 15000.0, output_per_mtok: 60000.0, max_input_tokens: Some(131072) }),
("wandb/openai/gpt-oss-20b", ModelPrice { input_per_mtok: 5000.0, output_per_mtok: 20000.0, max_input_tokens: Some(131072) }),
("wandb/zai-org/GLM-4.5", ModelPrice { input_per_mtok: 55000.0, output_per_mtok: 2e+05, max_input_tokens: Some(131072) }),
("watsonx/bigscience/mt0-xxl-13b", ModelPrice { input_per_mtok: 500.0, output_per_mtok: 2000.0, max_input_tokens: Some(8192) }),
("watsonx/core42/jais-13b-chat", ModelPrice { input_per_mtok: 500.0, output_per_mtok: 2000.0, max_input_tokens: Some(8192) }),
("watsonx/google/flan-t5-xl-3b", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("watsonx/ibm/granite-13b-chat-v2", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("watsonx/ibm/granite-13b-instruct-v2", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("watsonx/ibm/granite-3-3-8b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("watsonx/ibm/granite-3-8b-instruct", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("watsonx/ibm/granite-4-h-small", ModelPrice { input_per_mtok: 0.06, output_per_mtok: 0.25, max_input_tokens: Some(20480) }),
("watsonx/ibm/granite-guardian-3-2-2b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(8192) }),
("watsonx/ibm/granite-guardian-3-3-8b", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 0.2, max_input_tokens: Some(8192) }),
("watsonx/ibm/granite-ttm-1024-96-r2", ModelPrice { input_per_mtok: 0.38, output_per_mtok: 0.38, max_input_tokens: Some(512) }),
("watsonx/ibm/granite-ttm-1536-96-r2", ModelPrice { input_per_mtok: 0.38, output_per_mtok: 0.38, max_input_tokens: Some(512) }),
("watsonx/ibm/granite-ttm-512-96-r2", ModelPrice { input_per_mtok: 0.38, output_per_mtok: 0.38, max_input_tokens: Some(512) }),
("watsonx/ibm/granite-vision-3-2-2b", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(8192) }),
("watsonx/meta-llama/llama-3-2-11b-vision-instruct", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 0.35, max_input_tokens: Some(128000) }),
("watsonx/meta-llama/llama-3-2-1b-instruct", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("watsonx/meta-llama/llama-3-2-3b-instruct", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.15, max_input_tokens: Some(128000) }),
("watsonx/meta-llama/llama-3-2-90b-vision-instruct", ModelPrice { input_per_mtok: 2.0, output_per_mtok: 2.0, max_input_tokens: Some(128000) }),
("watsonx/meta-llama/llama-3-3-70b-instruct", ModelPrice { input_per_mtok: 0.71, output_per_mtok: 0.71, max_input_tokens: Some(128000) }),
("watsonx/meta-llama/llama-4-maverick-17b", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 1.4, max_input_tokens: Some(128000) }),
("watsonx/meta-llama/llama-guard-3-11b-vision", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 0.35, max_input_tokens: Some(128000) }),
("watsonx/mistralai/mistral-large", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 10.0, max_input_tokens: Some(131072) }),
("watsonx/mistralai/mistral-medium-2505", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("watsonx/mistralai/mistral-small-2503", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32000) }),
("watsonx/mistralai/mistral-small-3-1-24b-instruct-2503", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.3, max_input_tokens: Some(32000) }),
("watsonx/mistralai/pixtral-12b-2409", ModelPrice { input_per_mtok: 0.35, output_per_mtok: 0.35, max_input_tokens: Some(128000) }),
("watsonx/openai/gpt-oss-120b", ModelPrice { input_per_mtok: 0.15, output_per_mtok: 0.6, max_input_tokens: Some(8192) }),
("watsonx/sdaia/allam-1-13b-instruct", ModelPrice { input_per_mtok: 1.8, output_per_mtok: 1.8, max_input_tokens: Some(8192) }),
("writer.palmyra-x4-v1:0", ModelPrice { input_per_mtok: 2.5, output_per_mtok: 10.0, max_input_tokens: Some(128000) }),
("writer.palmyra-x5-v1:0", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 6.0, max_input_tokens: Some(1000000) }),
("x-ai/grok-4", ModelPrice { input_per_mtok: 3.0, output_per_mtok: 15.0, max_input_tokens: Some(256000) }),
("xiaomi/mimo-v2-flash", ModelPrice { input_per_mtok: 0.09, output_per_mtok: 0.29, max_input_tokens: Some(262144) }),
("z-ai/glm-4.6", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.75, max_input_tokens: Some(202800) }),
("z-ai/glm-4.6:exacto", ModelPrice { input_per_mtok: 0.45, output_per_mtok: 1.9, max_input_tokens: Some(202800) }),
("z-ai/glm-4.7", ModelPrice { input_per_mtok: 0.4, output_per_mtok: 1.5, max_input_tokens: Some(202752) }),
("z-ai/glm-4.7-flash", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.4, max_input_tokens: Some(200000) }),
("z-ai/glm-5", ModelPrice { input_per_mtok: 0.8, output_per_mtok: 2.56, max_input_tokens: Some(202752) }),
("zai-org/GLM-4.5-Air-FP8", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.1, max_input_tokens: Some(128000) }),
("zai-org/GLM-4.6", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(200000) }),
("zai-org/GLM-4.7", ModelPrice { input_per_mtok: 0.45, output_per_mtok: 2.0, max_input_tokens: Some(200000) }),
("zai-org/glm-4.7-maas", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(200000) }),
("zai-org/glm-5-maas", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.2, max_input_tokens: Some(200000) }),
("zai.glm-4.7", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(200000) }),
("zai.glm-4.7-flash", ModelPrice { input_per_mtok: 0.07, output_per_mtok: 0.4, max_input_tokens: Some(200000) }),
("zai.glm-5", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.2, max_input_tokens: Some(200000) }),
("zai/glm-4-32b-0414-128k", ModelPrice { input_per_mtok: 0.1, output_per_mtok: 0.1, max_input_tokens: Some(128000) }),
("zai/glm-4.5", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(128000) }),
("zai/glm-4.5-air", ModelPrice { input_per_mtok: 0.2, output_per_mtok: 1.1, max_input_tokens: Some(128000) }),
("zai/glm-4.5-airx", ModelPrice { input_per_mtok: 1.1, output_per_mtok: 4.5, max_input_tokens: Some(128000) }),
("zai/glm-4.5-x", ModelPrice { input_per_mtok: 2.2, output_per_mtok: 8.9, max_input_tokens: Some(128000) }),
("zai/glm-4.5v", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 1.8, max_input_tokens: Some(128000) }),
("zai/glm-4.6", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(200000) }),
("zai/glm-4.7", ModelPrice { input_per_mtok: 0.6, output_per_mtok: 2.2, max_input_tokens: Some(200000) }),
("zai/glm-5", ModelPrice { input_per_mtok: 1.0, output_per_mtok: 3.2, max_input_tokens: Some(200000) }),
("zai/glm-5-code", ModelPrice { input_per_mtok: 1.2, output_per_mtok: 5.0, max_input_tokens: Some(200000) }),
];