1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
//! Model pricing configuration
//!
//! Loaded from `~/.opencrabs/usage_pricing.toml` at runtime.
//! No compiled-in fallback — if the file is missing or broken, an error is returned.
//! Users can edit the file live — changes take effect on next `/usage` open.
use serde::{Deserialize, Serialize};
use std::collections::HashMap;
/// A single model pricing entry.
/// `prefix` is matched as a substring of the model name (case-insensitive).
/// First match wins, so put more specific prefixes before general ones.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct PricingEntry {
pub prefix: String,
pub input_per_m: f64,
pub output_per_m: f64,
/// Cache write cost per million tokens (defaults to 1.25x input_per_m if absent)
#[serde(default)]
pub cache_write_per_m: Option<f64>,
/// Cache read cost per million tokens (defaults to 0.1x input_per_m if absent)
#[serde(default)]
pub cache_read_per_m: Option<f64>,
}
/// Per-provider block in the TOML file.
/// TOML format: `[providers.anthropic]\nentries = [...]`
#[derive(Debug, Clone, Serialize, Deserialize, Default)]
pub struct ProviderBlock {
#[serde(default)]
pub entries: Vec<PricingEntry>,
}
/// The full pricing table, keyed by provider name (for display only).
#[derive(Debug, Clone, Serialize, Deserialize, Default)]
pub struct PricingConfig {
#[serde(default)]
pub providers: HashMap<String, ProviderBlock>,
}
impl PricingConfig {
/// Calculate cost for a model + token counts (no cache breakdown).
/// Treats all input tokens at the regular input rate.
pub fn calculate_cost(&self, model: &str, input_tokens: u32, output_tokens: u32) -> f64 {
self.calculate_cost_with_cache(model, input_tokens, output_tokens, 0, 0)
}
/// Calculate cost with full cache breakdown.
/// `input_tokens` = non-cached input only.
/// Cache write defaults to 1.25x input rate, cache read to 0.1x.
pub fn calculate_cost_with_cache(
&self,
model: &str,
input_tokens: u32,
output_tokens: u32,
cache_creation_tokens: u32,
cache_read_tokens: u32,
) -> f64 {
let m = model.to_lowercase();
for block in self.providers.values() {
for entry in &block.entries {
if m.contains(&entry.prefix.to_lowercase()) {
let input = (input_tokens as f64 / 1_000_000.0) * entry.input_per_m;
let output = (output_tokens as f64 / 1_000_000.0) * entry.output_per_m;
let cache_write_rate =
entry.cache_write_per_m.unwrap_or(entry.input_per_m * 1.25);
let cache_read_rate = entry.cache_read_per_m.unwrap_or(entry.input_per_m * 0.1);
let cache_write =
(cache_creation_tokens as f64 / 1_000_000.0) * cache_write_rate;
let cache_read = (cache_read_tokens as f64 / 1_000_000.0) * cache_read_rate;
return input + output + cache_write + cache_read;
}
}
}
0.0
}
/// Estimate cost from a combined token count using an 80/20 input/output split.
/// Returns None if model is unknown.
pub fn estimate_cost(&self, model: &str, token_count: i64) -> Option<f64> {
let m = model.to_lowercase();
// Try direct match first
if let Some(cost) = self.try_match(&m, token_count) {
return Some(cost);
}
// If no match, try prepending common provider prefixes
// (normalized names like "opus-4-6" need "claude-" to match TOML entries)
let prefixes = [
"claude-",
"gpt-",
"gemini-",
"deepseek-",
"llama-",
"qwen",
"kimi-",
"zhipu-",
"glm-",
];
for p in &prefixes {
let prefixed = format!("{}{}", p, m);
if let Some(cost) = self.try_match(&prefixed, token_count) {
return Some(cost);
}
}
None
}
/// Internal helper: try to match a model string against all pricing entries.
fn try_match(&self, model_lower: &str, token_count: i64) -> Option<f64> {
for block in self.providers.values() {
for entry in &block.entries {
if model_lower.contains(&entry.prefix.to_lowercase()) {
let input = (token_count as f64 * 0.80 / 1_000_000.0) * entry.input_per_m;
let output = (token_count as f64 * 0.20 / 1_000_000.0) * entry.output_per_m;
return Some(input + output);
}
}
}
None
}
/// Load from ~/.opencrabs/usage_pricing.toml.
/// Supports both the current schema (`[providers.X] entries = [...]`) and the
/// legacy on-disk schema (`[[usage.pricing.X]]` array-of-tables).
/// Falls back to the embedded example file if the user file doesn't exist
/// (useful for tests and CI environments).
/// Returns an error only if both the user file and embedded example fail to parse.
///
/// **Additive baseline merge:** after parsing the user file, the
/// embedded example is parsed too and any `(provider, prefix)` pair
/// present in the baseline but missing from the user file is
/// appended. The merged file is written back to disk so subsequent
/// loads see the new entries without re-running the merge. This is
/// how MiniMax-M3 / future model releases reach users who already
/// have a `usage_pricing.toml` from an earlier install — without
/// this, the seed-on-missing pattern leaves their pricing table
/// frozen at whatever shipped on their first install.
///
/// The merge is strictly additive: user customisations (renamed
/// prefixes, hand-tweaked rates) are NEVER overwritten. Only
/// prefixes the user doesn't have at all get appended.
pub fn load() -> Result<Self, String> {
let path = crate::config::opencrabs_home().join("usage_pricing.toml");
let content = match std::fs::read_to_string(&path) {
Ok(c) => c,
Err(_) => {
// Fall back to embedded example (tests, CI, fresh installs)
let example = include_str!("../../usage_pricing.toml.example");
return Self::parse_content(example, "embedded example");
}
};
let mut user_cfg = Self::parse_content(&content, &format!("{:?}", path))?;
// Additive merge with embedded baseline. Skip on parse failure
// of the baseline — we never want a bad bundled example to
// mask a working user file.
let baseline_example = include_str!("../../usage_pricing.toml.example");
if let Ok(baseline_cfg) = Self::parse_content(baseline_example, "embedded example baseline")
{
let added = user_cfg.merge_missing_from(&baseline_cfg);
if added > 0 {
tracing::info!(
target: "pricing",
added,
path = ?path,
"merged new baseline pricing entries into user pricing file (additive only)"
);
let new_content = Self::serialize_to_toml(&user_cfg);
if let Err(e) = std::fs::write(&path, &new_content) {
tracing::warn!(
target: "pricing",
error = %e,
path = ?path,
"failed to persist merged pricing back to disk — entries are in-memory only \
this session, will re-merge on next load"
);
}
}
}
Ok(user_cfg)
}
/// Append any `(provider, prefix)` from `other` that does not exist
/// in `self`. Returns the number of entries appended. Idempotent:
/// running twice with the same baseline adds zero on the second
/// call. Matching is case-insensitive on the `prefix` field —
/// `minimax-m3` and `MiniMax-M3` count as the same entry.
pub fn merge_missing_from(&mut self, other: &PricingConfig) -> usize {
let mut added = 0;
for (prov_name, baseline_block) in &other.providers {
let user_block = self.providers.entry(prov_name.clone()).or_default();
for baseline_entry in &baseline_block.entries {
let needle = baseline_entry.prefix.to_lowercase();
if !user_block
.entries
.iter()
.any(|e| e.prefix.to_lowercase() == needle)
{
user_block.entries.push(baseline_entry.clone());
added += 1;
}
}
}
added
}
/// Parse TOML content with both schema variants.
fn parse_content(content: &str, source: &str) -> Result<Self, String> {
// Try current schema first.
if let Ok(cfg) = toml::from_str::<PricingConfig>(content)
&& !cfg.providers.is_empty()
{
return Ok(cfg);
}
// Try legacy schema: [[usage.pricing.<provider>]] entries
if let Ok(cfg) = Self::load_legacy(content)
&& !cfg.providers.is_empty()
{
tracing::warn!(
"usage_pricing.toml uses old format — please update it to the new schema. \
See usage_pricing.toml.example in the repo"
);
let new_content = Self::serialize_to_toml(&cfg);
// Only write back if source is a real file path (not embedded example)
if source != "embedded example" {
let path = crate::config::opencrabs_home().join("usage_pricing.toml");
let _ = std::fs::write(&path, new_content);
}
return Ok(cfg);
}
Err(format!(
"usage_pricing.toml from {} failed to parse with both schemas.\n\
Check the file syntax or re-copy from usage_pricing.toml.example",
source
))
}
/// Parse the legacy `[[usage.pricing.<provider>]]` format.
fn load_legacy(content: &str) -> Result<Self, toml::de::Error> {
#[derive(serde::Deserialize)]
struct LegacyRoot {
usage: Option<LegacyUsage>,
}
#[derive(serde::Deserialize)]
struct LegacyUsage {
pricing: Option<toml::Value>,
}
let root: LegacyRoot = toml::from_str(content)?;
let pricing_val = root
.usage
.and_then(|u| u.pricing)
.unwrap_or(toml::Value::Table(toml::map::Map::new()));
let mut providers: HashMap<String, ProviderBlock> = HashMap::new();
if let toml::Value::Table(table) = pricing_val {
for (provider_name, entries_val) in table {
if let toml::Value::Array(arr) = entries_val {
let entries: Vec<PricingEntry> =
arr.into_iter().filter_map(|v| v.try_into().ok()).collect();
if !entries.is_empty() {
providers.insert(provider_name, ProviderBlock { entries });
}
}
}
}
Ok(PricingConfig { providers })
}
/// Serialize a PricingConfig back to the canonical TOML schema.
fn serialize_to_toml(cfg: &PricingConfig) -> String {
let mut out = String::from(
"# OpenCrabs Usage Pricing — auto-migrated to current schema.\n\
# Edit freely. Changes take effect immediately on next /usage open.\n\
# prefix is matched case-insensitively as a substring of the model name.\n\
# Costs are per 1 million tokens (USD).\n\n",
);
let mut providers: Vec<(&String, &ProviderBlock)> = cfg.providers.iter().collect();
providers.sort_by_key(|(k, _)| k.as_str());
for (name, block) in providers {
out.push_str(&format!("[providers.{}]\nentries = [\n", name));
for e in &block.entries {
let mut row = format!(
" {{ prefix = {:?}, input_per_m = {}, output_per_m = {}",
e.prefix, e.input_per_m, e.output_per_m
);
// Preserve optional cache rates — without this the
// additive merge would silently drop MiniMax-M3's
// cache_read_per_m on the first write-back, leaving
// the user paying the default 0.1x input fallback
// instead of the real $0.12/M list rate.
if let Some(cw) = e.cache_write_per_m {
row.push_str(&format!(", cache_write_per_m = {cw}"));
}
if let Some(cr) = e.cache_read_per_m {
row.push_str(&format!(", cache_read_per_m = {cr}"));
}
row.push_str(" },\n");
out.push_str(&row);
}
out.push_str("]\n\n");
}
out
}
/// Copy `usage_pricing.toml.example` to brain directory on first run only.
/// Existing users: see release notes for instructions to diff and update their file.
pub fn seed_from_example() {
let path = crate::config::opencrabs_home().join("usage_pricing.toml");
if path.exists() {
return; // User owns this file. Never overwrite.
}
let example_content = include_str!("../../usage_pricing.toml.example");
if let Err(e) = std::fs::write(&path, example_content) {
tracing::error!("Failed to seed usage_pricing.toml from example: {}", e);
} else {
tracing::info!("Seeded usage_pricing.toml from example");
}
}
}