modelmux 0.3.1

ModelMux is a high-performance Rust gateway that translates OpenAI-compatible API requests into Vertex AI (Claude) requests, with support for streaming, tool calling, and production-grade reliability.
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# Sample environment configuration for the gateway.
# Values in angle brackets (<location>, <organization>, <model>, <key>) are
# placeholders that must be replaced before use.
# NOTE(review): the meaning of each variable below is inferred from its name;
# confirm against the project's configuration documentation.

# Presumably toggles emission of CORS response headers — TODO confirm.
SET_CORS_HEADERS=true
# Log verbosity. `trace` is conventionally the most verbose level; consider a
# quieter level outside of debugging.
LOG_LEVEL=trace
# Presumably the address and port the server binds to — verify.
HOST=localhost
PORT=3000
# Base URL of the upstream API; fill in <location> (appears twice) and <organization>.
LLM_URL="https://<location>.googleapis.com/v1/projects/<organization>/locations/<location>/publishers/"
# Endpoint path for chat requests; presumably appended to LLM_URL — confirm.
LLM_CHAT_ENDPOINT="anthropic/models/<model>:streamRawPredict"
# Model identifier; should presumably match the <model> used in LLM_CHAT_ENDPOINT.
LLM_MODEL="<model>"
LLM_PROVIDER="Vertex AI"
# Service account credential. The "ewo...==" shape suggests base64-encoded
# JSON — TODO confirm the expected encoding. Treat as a secret; do not commit
# a real key to version control.
GCP_SERVICE_ACCOUNT_KEY="ewo...<key>...=="
# Model limits and sampling parameters.
# NOTE(review): units (tokens vs. words) are assumed from the names — confirm.
LLM_CONTEXT_SIZE=200000
LLM_WORD_LIMIT=150000
LLM_TEMPERATURE=0.9
# Optional setting, disabled by default; uncomment to enable.
#LLM_TOP_P=0.1
LLM_MAX_TOKENS=8000
# Optional setting, disabled by default; uncomment to enable.
# LLM_REPETITION_PENALTY=1.1