# Network listener settings.
[server]
# "0.0.0.0" is the IPv4 wildcard address.
# NOTE(review): if the consumer binds to this value, the service (and the
# dashboard, while `dashboard = true`) is reachable on every interface —
# confirm that exposure is intended, or use "127.0.0.1" for local-only use.
host = "0.0.0.0"
port = 8090
dashboard = true
# Request logging.
[logging]
enabled = true
# Relative path; the ".jsonl" extension suggests one JSON object per line.
# NOTE(review): presumably resolved against the process working directory — confirm.
path = "logs/requests.jsonl"
# Provider entry: OpenAI-format endpoint on localhost:8080.
# The `name` value is what `[[routers]]` candidates and the pareto-router
# tiers use to refer to this provider.
[[providers]]
name = "local-llama"
format = "openai"
# No `api_key_env` is set for this provider.
base_url = "http://localhost:8080/v1"
# Currency unit is not stated in this file.
cost_per_1m_tokens = 0.0
# NOTE(review): the scale of `quality` is not defined here; values in this
# file range from 60 to 95 — presumably higher is better, confirm.
quality = 60
# Milliseconds and tokens per second, per the key names.
latency_ms = 900
throughput_tokens_per_sec = 20
# Provider entry: Ollama-format endpoint on localhost:11434.
# This is the only provider in the file that uses `format = "ollama"`.
[[providers]]
name = "ollama"
format = "ollama"
# No `api_key_env` is set for this provider.
base_url = "http://localhost:11434"
# Currency unit is not stated in this file.
cost_per_1m_tokens = 0.0
quality = 75
# Milliseconds and tokens per second, per the key names.
latency_ms = 600
throughput_tokens_per_sec = 30
# Provider entry: Cloudflare endpoint using the OpenAI request format.
[[providers]]
name = "cloudflare"
format = "openai"
# The path segment after `/accounts/` is a hard-coded account ID; anyone
# reusing this file with a different account must edit the URL.
# NOTE(review): consider whether this ID should live in version control.
base_url = "https://api.cloudflare.com/client/v4/accounts/e4847a910eddf0d11d40af276cc478b7/ai/v1"
# NOTE(review): presumably the name of an environment variable holding the
# credential, not the credential itself — confirm against the consumer.
api_key_env = "CLOUDFLARE_API_TOKEN"
# Currency unit is not stated in this file.
cost_per_1m_tokens = 0.2
quality = 80
# Milliseconds and tokens per second, per the key names.
latency_ms = 500
throughput_tokens_per_sec = 60
# Provider entry: OpenAI API.
[[providers]]
name = "openai"
format = "openai"
base_url = "https://api.openai.com/v1"
# NOTE(review): presumably the name of an environment variable holding the
# API key, not the key itself — confirm against the consumer.
api_key_env = "OPENAI_API_KEY"
# Currency unit is not stated in this file.
cost_per_1m_tokens = 5.0
quality = 90
# Milliseconds and tokens per second, per the key names.
latency_ms = 400
throughput_tokens_per_sec = 80
# Provider entry: Anthropic API. The only provider using `format = "anthropic"`.
[[providers]]
name = "anthropic"
format = "anthropic"
# Unlike the "openai" and "cloudflare" entries, this URL has no `/v1` suffix.
# NOTE(review): presumably the anthropic format handler appends its own
# path — confirm before changing.
base_url = "https://api.anthropic.com"
# NOTE(review): presumably the name of an environment variable holding the
# API key, not the key itself — confirm against the consumer.
api_key_env = "ANTHROPIC_API_KEY"
# Currency unit is not stated in this file. Highest cost and highest
# `quality` value among the providers listed here.
cost_per_1m_tokens = 15.0
quality = 95
# Milliseconds and tokens per second, per the key names.
latency_ms = 600
throughput_tokens_per_sec = 70
# Keyword classifier configuration.
[classifiers.keyword]
enabled = true

# Tag name -> keywords associated with that tag.
# NOTE(review): matching rules (case sensitivity, substring vs. whole word)
# are decided by the consumer and are not visible in this file.
[classifiers.keyword.tags]
vision = [
    "image",
    "photo",
    "picture",
    "screenshot",
    "visual",
    "diagram",
    "chart",
]
video = [
    "video",
    "clip",
    "footage",
    "frame",
    "timestamp",
]
# "def " and "fn " carry a trailing space that is part of the keyword;
# do not trim it when editing.
code = [
    "function",
    "class",
    "import",
    "def ",
    "fn ",
    "bug",
    "error",
    "stack trace",
    "compile",
    "runtime",
    "algorithm",
    "refactor",
    "debug",
]
nsfw = [
    "nsfw",
    "adult",
    "explicit",
    "erotic",
    "nude",
    "naked",
    "sexual",
    "xxx",
    "porn",
    "hentai",
    "fetish",
    "lewd",
]
# Router entry of type "random" with its pool of candidate models.
[[routers]]
type = "random"
# Each candidate pairs a provider with a model identifier. Every `provider`
# value here corresponds to the `name` of a `[[providers]]` entry.
# Inline tables are kept on one line each (required by TOML 1.0).
candidates = [
    # Local endpoints
    { provider = "local-llama", model = "llama3.2-3b" },
    { provider = "ollama", model = "llama3.1:8b" },
    { provider = "ollama", model = "deepseek-r1:latest" },
    { provider = "ollama", model = "gemma3:latest" },
    # Cloudflare
    { provider = "cloudflare", model = "@cf/meta/llama-3.1-8b-instruct" },
    { provider = "cloudflare", model = "@cf/meta/llama-3.2-3b-instruct" },
    { provider = "cloudflare", model = "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b" },
    { provider = "cloudflare", model = "@cf/google/gemma-3-12b-it" },
    # OpenAI
    { provider = "openai", model = "gpt-4o-mini" },
    { provider = "openai", model = "gpt-4o" },
    # Anthropic
    { provider = "anthropic", model = "claude-haiku-4-5-20251001" },
    { provider = "anthropic", model = "claude-sonnet-4-6" },
]
# "response-healing" plugin toggle; no other options are set for it here.
[plugins.response-healing]
enabled = true
# "pareto-router" plugin. Currently disabled, so the settings below are
# presumably inert until `enabled` is switched to true.
[plugins.pareto-router]
enabled = false
# Must name one of the keys under `[plugins.pareto-router.tiers]`.
default_tier = "medium"
# Tier name -> list of provider names (values match `[[providers]]` `name` fields).
[plugins.pareto-router.tiers]
low = ["local-llama"]
medium = ["ollama"]
# NOTE(review): `high` lists the same provider as `medium`, so the two tiers
# are indistinguishable. The higher-`quality` providers defined in this file
# ("cloudflare", "openai", "anthropic") are not used by any tier — confirm
# whether this is a deliberate local-only setup or a placeholder.
high = ["ollama"]