use orbok_core::{OrbokError, OrbokResult, StorageCategory, now_iso8601};
use orbok_db::Catalog;
use orbok_db::repo::StorageAccountingRepository;
use rusqlite::params;
use std::path::Path;
/// Measures storage usage for every [`StorageCategory`], persists each
/// measurement through [`StorageAccountingRepository::upsert`], and returns the
/// recorded `(category, size_bytes, item_count)` rows in the order they were
/// written.
///
/// Measurements are best-effort: a failed SQL query or a failed
/// `std::fs::metadata` call contributes zero (or the default page size for
/// `PRAGMA page_size`) instead of aborting the run.
///
/// How each category is measured:
/// - `PersistentCatalog`: size of the catalog file, or `page_count * page_size`
///   when the catalog path is `:memory:`; the count is the number of sources
///   whose status is not `'removed'`.
/// - `KeywordIndex`, `SearchCache`, `Logs`: row count multiplied by a fixed
///   per-row byte figure (the size is an estimate, not a measurement).
/// - `VectorIndex`: summed `LENGTH(vector_blob)` of active embeddings.
/// - `SnippetCache`: summed `size_bytes` of the snippet cache rows.
/// - `TemporaryExtraction`: size of the file at `cache_db_path`; the count is
///   the number of succeeded extraction records.
/// - `ModelFiles`: always recorded as zero bytes / zero items.
///
/// # Errors
///
/// Returns the error from `upsert` as soon as one category fails to persist;
/// categories already written stay written.
pub fn update_storage_accounting(
    catalog: &Catalog,
    cache_db_path: &Path,
) -> OrbokResult<Vec<(StorageCategory, u64, u64)>> {
    // Fixed per-row byte figures used for categories whose size is estimated.
    const KEYWORD_RECORD_BYTES: u64 = 256;
    const SEARCH_RESULT_BYTES: u64 = 512;
    const EVENT_BYTES: u64 = 256;
    // Fallback used when `PRAGMA page_size` cannot be read.
    const DEFAULT_PAGE_SIZE: i64 = 4096;

    /// Converts a SQLite integer to `u64`, clamping negatives to zero so a
    /// corrupt value cannot wrap around into an enormous unsigned number.
    fn non_negative(value: i64) -> u64 {
        value.max(0).unsigned_abs()
    }

    /// Runs a single-column integer query, yielding `fallback` when it fails.
    /// The catalog guard is released before this function returns.
    fn scalar(catalog: &Catalog, sql: &str, fallback: i64) -> u64 {
        let conn = catalog.lock();
        let value: i64 = conn.query_row(sql, [], |r| r.get(0)).unwrap_or(fallback);
        non_negative(value)
    }

    /// Runs a two-column `(count, total)` integer query, yielding `(0, 0)` when
    /// it fails. The catalog guard is released before this function returns.
    fn count_and_total(catalog: &Catalog, sql: &str) -> (u64, u64) {
        let conn = catalog.lock();
        let (count, total): (i64, i64) = conn
            .query_row(sql, [], |r| Ok((r.get(0)?, r.get(1)?)))
            .unwrap_or((0, 0));
        (non_negative(count), non_negative(total))
    }

    let storage = StorageAccountingRepository::new(catalog);
    let mut rows = Vec::new();

    // Persists one measurement and remembers it for the return value. A macro
    // rather than a closure so that `?` propagates out of the enclosing
    // function and the category expression does not have to be `Copy`.
    // NOTE(review): no catalog guard is held when this runs — presumably
    // `upsert` takes the catalog lock itself; confirm before holding one here.
    macro_rules! measure {
        ($cat:expr, $size:expr, $count:expr) => {{
            let (size, count): (u64, u64) = ($size, $count);
            storage.upsert($cat, size, count)?;
            rows.push(($cat, size, count));
        }};
    }

    // Persistent catalog: an in-memory database has no file to stat, so its
    // size is derived from SQLite's page accounting instead.
    let catalog_path = catalog.path();
    let catalog_bytes = if catalog_path.to_str() == Some(":memory:") {
        scalar(catalog, "PRAGMA page_count", 0)
            .saturating_mul(scalar(catalog, "PRAGMA page_size", DEFAULT_PAGE_SIZE))
    } else {
        std::fs::metadata(catalog_path).map(|m| m.len()).unwrap_or(0)
    };
    let source_count = scalar(
        catalog,
        "SELECT COUNT(*) FROM sources WHERE status != 'removed'",
        0,
    );
    measure!(StorageCategory::PersistentCatalog, catalog_bytes, source_count);

    // Keyword index: size is estimated from the number of active records.
    let kw_count = scalar(
        catalog,
        "SELECT COUNT(*) FROM keyword_index_records WHERE status='active'",
        0,
    );
    measure!(
        StorageCategory::KeywordIndex,
        kw_count.saturating_mul(KEYWORD_RECORD_BYTES),
        kw_count
    );

    // Vector index: actual blob bytes of active embeddings.
    let (emb_count, emb_bytes) = count_and_total(
        catalog,
        "SELECT COUNT(*), COALESCE(SUM(LENGTH(vector_blob)), 0) FROM embeddings WHERE status='active'",
    );
    measure!(StorageCategory::VectorIndex, emb_bytes, emb_count);

    // Snippet cache: sizes are stored per row.
    let (snip_count, snip_bytes) = count_and_total(
        catalog,
        "SELECT COUNT(*), COALESCE(SUM(size_bytes), 0) FROM snippet_cache",
    );
    measure!(StorageCategory::SnippetCache, snip_bytes, snip_count);

    // Search result cache: size is estimated from the row count.
    let sr_count = scalar(catalog, "SELECT COUNT(*) FROM search_result_cache", 0);
    measure!(
        StorageCategory::SearchCache,
        sr_count.saturating_mul(SEARCH_RESULT_BYTES),
        sr_count
    );

    // Temporary extraction: size of the cache database file on disk, counted
    // by succeeded extraction records. The file is sized before the count
    // query, matching the order in which the values are reported.
    let cache_bytes = std::fs::metadata(cache_db_path)
        .map(|m| m.len())
        .unwrap_or(0);
    let extract_count = scalar(
        catalog,
        "SELECT COUNT(*) FROM extraction_records WHERE status='succeeded'",
        0,
    );
    measure!(StorageCategory::TemporaryExtraction, cache_bytes, extract_count);

    // Logs: size is estimated from the number of application events.
    let evt_count = scalar(catalog, "SELECT COUNT(*) FROM app_events", 0);
    measure!(
        StorageCategory::Logs,
        evt_count.saturating_mul(EVENT_BYTES),
        evt_count
    );

    // Model files are not measured here; a zero row is still recorded.
    measure!(StorageCategory::ModelFiles, 0, 0);

    Ok(rows)
}