1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
# >>> DO NOT EDIT THIS FILE <<<
# IMPORTANT: THIS FILE WILL BE UPDATED WITH EACH AIPACK UPDATE
# To customize AIPACK, edit the sibling `./config-user.toml` with the values to add or override.
# Thus, `config-default.toml` will be loaded first, and `config-user.toml` will be merged on top of it to create the
# global configuration for aipack. This can then be overridden by the workspace `.aipack/config.toml` and agent-specific options.
[]
# `model` is required to run an agent.
# This will be the fallback if not defined in `./config-user.toml` or a workspace-level `config.toml`.
#
# Supported models from:
# - OpenAI, Gemini, Anthropic, Ollama (local), xAI, Cohere, DeepSeek,
# - Fireworks.Ai, Nebius, Groq, Together.ai
# - For OpenAI & Gemini models, you can use `-low`, `-medium`, `-high` suffixes to control reasoning budget (e.g., `gpt-5-mini-high`)
# - AIPACK with the Genai library will try to match the appropriate provider; if not found, it will fall back to localhost Ollama
# - Can specify a model with namespacing for example `fireworks::kimi-k2-instruct`
#
# For reasoning models, like gpt-5, gemini-2.5-flash, and claude-sonnet-4-5-20250929, reasoning suffixes
# such as `-minimal`, `-low`, `-medium`, `-high` (or even `-zero` for flash) can be used on model names or even on model aliases.
#
# e.g.,
# OpenAI: "gpt-5.4", "gpt-5.4-codex", "gpt-5.4-codex-mini" (with optional `-low`, `-medium`, `-high`, `-xhigh`, `-max` suffixes)
# Gemini: "gemini-3.1-pro-preview", "gemini-3.1-flash-zero" (with `-zero` for flash, `-low`, `-medium`, `-high` suffixes)
# Anthropic: "claude-sonnet-4-6"
# Fireworks: "fireworks::qwen3-coder-480b-a35b-instruct"
# Ollama: "phi4:14b", "gemma3:4b", "gemma3:27b", "deepseek-r1:70b", "llama4:scout" (or any locally installed Ollama)
= "gpt-5.4" # or an alias from below (e.g., "flash", "gpro")
# Temperature (by default unset)
# temperature = 0.0
# How many inputs can be processed at the same time (Defaults to 2 if absent)
= 2
# Model Aliases
#
# These are default model aliases that can be used.
#
# These will be updated over time as versions are updated.
#
# Customize global model aliases in `./config-user.toml`.
#
# Recommendation: Use simple alias names with `_` and `-` (like those below or in `config-default.toml`).
#
# Note 1: If an alias name contains `.` or other special characters, wrap it in double quotes
# (names using only letters, digits, `_`, and `-` do not need quotes).
# e.g., `"my.nano" = "gpt-5.4-nano"`
#
# Note 2: Aliases can be added or overridden in the workspace `.aipack/config.toml` or via agent options.
#
# Note 3: For reasoning models, the reasoning suffixes `-low`, `-medium`, `-high`, `-xhigh`, `-max` can be used
# on full model names and also on aliases (the suffix carries over; for example, `sonnet-low`).
#
[]
# -- Anthropic
# Also support `-max`, `-high`, `-medium`, or `-low` suffixes.
= "claude-opus-4-7"
= "claude-sonnet-4-6"
= "claude-sonnet-4-6"
= "claude-haiku-4-5"
# -- OpenAI
# Also support `-xhigh`, `-high`, `-medium`, or `-low` suffixes.
# e.g., `gpt-5-low`, `gpt-5-nano-high`
= "gpt-5.4"
= "gpt-5.4-mini"
= "gpt-5.4-nano"
= "gpt-5.4" # much better than gpt-5.3-codex
# -- Google
# As shown below, Gemini model names also support the use of `-high`, `-medium`, or `-low` suffixes,
# in addition to the `-zero` suffix for Flash or pro
= "gemini-3.1-pro-preview"
= "gemini-3-flash-preview"
= "gemini-3.1-flash-lite-preview"
# -- Fireworks (namespaced with `fireworks::_model_name`)
= "fireworks::qwen3-coder-480b-a35b-instruct"
= "fireworks::qwen3-235b-a22b-instruct-2507"
= "accounts/fireworks/models/qwen3-235b-a22b-thinking-2507" # can be full fireworks name
= "fireworks::kimi-k2-instruct"
= "fireworks::glm-4p5"
= "fireworks::glm-4p5-air"
= "fireworks::gpt-oss-120b"
= "fireworks::gpt-oss-120b"
= "fireworks::gpt-oss-20b"
= "fireworks::gpt-oss-20b"
# -- DeepSeek (from deepseek.com)
= "deepseek-reasoner"