[[model]]
provider = "openai"
model = "gpt-5.5"
max_input_tokens = 200000
max_output_tokens = 16000
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "openai"
model = "gpt-5.4"
max_input_tokens = 200000
max_output_tokens = 16000
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "openai"
model = "gpt-4o"
max_input_tokens = 128000
max_output_tokens = 16000
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "openai"
model = "gpt-4o-mini"
max_input_tokens = 128000
max_output_tokens = 16000
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "openai"
model = "o3"
max_input_tokens = 200000
max_output_tokens = 100000
capabilities = ["text", "tools", "json_mode", "reasoning", "streaming"]
[[model]]
provider = "openai"
model = "o4-mini"
max_input_tokens = 200000
max_output_tokens = 100000
capabilities = ["text", "tools", "json_mode", "reasoning", "streaming"]
[[model]]
provider = "openai"
model = "text-embedding-3-small"
max_input_tokens = 8191
max_output_tokens = 0
capabilities = ["text"]
[[model]]
provider = "openai"
model = "text-embedding-3-large"
max_input_tokens = 8191
max_output_tokens = 0
capabilities = ["text"]
[[model]]
provider = "anthropic"
model = "claude-haiku-4-5"
max_input_tokens = 200000
max_output_tokens = 8192
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "anthropic"
model = "claude-sonnet-4-6"
max_input_tokens = 200000
max_output_tokens = 8192
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "anthropic"
model = "claude-opus-4-7"
max_input_tokens = 200000
max_output_tokens = 8192
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "gemini"
model = "gemini-3.1-flash-lite"
max_input_tokens = 1000000
max_output_tokens = 8192
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "gemini"
model = "gemini-3.5-flash"
max_input_tokens = 1000000
max_output_tokens = 8192
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "gemini"
model = "gemini-3.1-pro"
max_input_tokens = 2000000
max_output_tokens = 8192
capabilities = ["text", "vision", "tools", "json_mode", "streaming", "prompt_caching"]
[[model]]
provider = "mistral"
model = "mistral-large-latest"
max_input_tokens = 128000
max_output_tokens = 4096
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "mistral"
model = "mistral-medium-latest"
max_input_tokens = 128000
max_output_tokens = 4096
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "mistral"
model = "mistral-small-latest"
max_input_tokens = 128000
max_output_tokens = 4096
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "mistral"
model = "codestral-latest"
max_input_tokens = 256000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "mistral"
model = "pixtral-large-latest"
max_input_tokens = 128000
max_output_tokens = 4096
capabilities = ["text", "vision", "tools", "json_mode", "streaming"]
[[model]]
provider = "groq"
model = "llama-3.3-70b-versatile"
max_input_tokens = 128000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "groq"
model = "llama-3.1-8b-instant"
max_input_tokens = 128000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "groq"
model = "deepseek-r1-distill-llama-70b"
max_input_tokens = 128000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming", "reasoning"]
[[model]]
provider = "groq"
model = "mixtral-8x7b-32768"
max_input_tokens = 32768
max_output_tokens = 4096
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "together"
model = "meta-llama/Meta-Llama-3.3-70B-Instruct-Turbo"
max_input_tokens = 128000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "together"
model = "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo"
max_input_tokens = 128000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "together"
model = "Qwen/Qwen2.5-72B-Instruct-Turbo"
max_input_tokens = 32768
max_output_tokens = 4096
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "together"
model = "deepseek-ai/DeepSeek-V3"
max_input_tokens = 64000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "openrouter"
model = "anthropic/claude-sonnet-4-6"
max_input_tokens = 200000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "openrouter"
model = "openai/gpt-5.5"
max_input_tokens = 200000
max_output_tokens = 16000
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "openrouter"
model = "google/gemini-3.1-pro"
max_input_tokens = 1000000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "openrouter"
model = "meta-llama/llama-3.3-70b-instruct"
max_input_tokens = 128000
max_output_tokens = 8192
capabilities = ["text", "tools", "json_mode", "streaming"]
[[model]]
provider = "openrouter"
model = "mistralai/mistral-large"
max_input_tokens = 128000
max_output_tokens = 4096
capabilities = ["text", "tools", "json_mode", "streaming"]