Skip to main content

sqlite_graphrag/
memory_guard.rs

1//! Memory guard: checks RAM availability before loading the ONNX model.
2//!
3//! Loading the model via `fastembed` consumes approximately
4//! [`crate::constants::EMBEDDING_LOAD_EXPECTED_RSS_MB`] MiB of resident memory.
5//! Without this guard, multiple parallel invocations can exhaust RAM and trigger
6//! OOM (Out-Of-Memory), stalling the system.
7//!
8//! This guard queries the OS via `sysinfo` before any heavy initialisation,
9//! aborting with [`crate::errors::AppError::LowMemory`] (exit 77) when the
10//! configured floor is not met.
11
12use sysinfo::{
13    get_current_pid, MemoryRefreshKind, ProcessRefreshKind, ProcessesToUpdate, RefreshKind, System,
14    UpdateKind,
15};
16
17use crate::errors::AppError;
18
19/// Returns the current available memory in MiB.
20pub fn available_memory_mb() -> u64 {
21    let sys =
22        System::new_with_specifics(RefreshKind::new().with_memory(MemoryRefreshKind::everything()));
23    let available_bytes = sys.available_memory();
24    available_bytes / (1024 * 1024)
25}
26
27/// Returns the current process RSS in MiB when available.
28pub fn current_process_memory_mb() -> Option<u64> {
29    let pid = get_current_pid().ok()?;
30    let mut sys =
31        System::new_with_specifics(RefreshKind::new().with_memory(MemoryRefreshKind::everything()));
32    sys.refresh_processes_specifics(
33        ProcessesToUpdate::Some(&[pid]),
34        true,
35        ProcessRefreshKind::new()
36            .with_memory()
37            .with_exe(UpdateKind::OnlyIfNotSet),
38    );
39    sys.process(pid).map(|p| p.memory() / (1024 * 1024))
40}
41
42/// Calculates the safe concurrency ceiling for heavy embedding workloads.
43///
44/// Canonical formula:
45/// `permits = min(cpus, available_memory_mb / ram_per_task_mb) * 0.5`
46///
47/// The result is clamped between `1` and `max_concurrency`.
48pub fn calculate_safe_concurrency(
49    available_mb: u64,
50    cpu_count: usize,
51    ram_per_task_mb: u64,
52    max_concurrency: usize,
53) -> usize {
54    let cpu_count = cpu_count.max(1);
55    let max_concurrency = max_concurrency.max(1);
56    let ram_per_task_mb = ram_per_task_mb.max(1);
57
58    let memory_bound = (available_mb / ram_per_task_mb) as usize;
59    let resource_bound = cpu_count.min(memory_bound).max(1);
60    let safe_with_margin = (resource_bound / 2).max(1);
61
62    safe_with_margin.min(max_concurrency)
63}
64
65/// Checks whether sufficient memory is available to start loading the model.
66///
67/// # Parameters
68/// - `min_mb`: minimum floor in MiB of available memory (typically
69///   [`crate::constants::MIN_AVAILABLE_MEMORY_MB`]).
70///
71/// # Errors
72/// Returns [`AppError::LowMemory`] when `available_mb < min_mb`.
73///
74/// # Returns
75/// Returns `Ok(available_mb)` with the actual available memory in MiB.
76pub fn check_available_memory(min_mb: u64) -> Result<u64, AppError> {
77    let available_mb = available_memory_mb();
78
79    if available_mb < min_mb {
80        return Err(AppError::LowMemory {
81            available_mb,
82            required_mb: min_mb,
83        });
84    }
85
86    Ok(available_mb)
87}
88
89#[cfg(test)]
90mod tests {
91    use super::*;
92
93    #[test]
94    fn check_available_memory_with_zero_always_passes() {
95        let result = check_available_memory(0);
96        assert!(result.is_ok(), "min_mb=0 must always pass, got: {result:?}");
97        let mb = result.unwrap();
98        assert!(mb > 0, "system must report positive memory");
99    }
100
101    #[test]
102    fn check_available_memory_with_huge_value_fails() {
103        let result = check_available_memory(u64::MAX);
104        assert!(
105            matches!(result, Err(AppError::LowMemory { .. })),
106            "u64::MAX MiB must fail with LowMemory, got: {result:?}"
107        );
108    }
109
110    #[test]
111    fn low_memory_error_contains_correct_values() {
112        match check_available_memory(u64::MAX) {
113            Err(AppError::LowMemory {
114                available_mb,
115                required_mb,
116            }) => {
117                assert_eq!(required_mb, u64::MAX);
118                assert!(available_mb < u64::MAX);
119            }
120            other => unreachable!("expected LowMemory, got: {other:?}"),
121        }
122    }
123
124    #[test]
125    fn calculate_safe_concurrency_respects_half_margin() {
126        let permits = calculate_safe_concurrency(8_000, 8, 1_000, 4);
127        assert_eq!(permits, 4);
128    }
129
130    #[test]
131    fn calculate_safe_concurrency_never_returns_zero() {
132        let permits = calculate_safe_concurrency(100, 1, 10_000, 4);
133        assert_eq!(permits, 1);
134    }
135
136    #[test]
137    fn calculate_safe_concurrency_respects_max_ceiling() {
138        let permits = calculate_safe_concurrency(128_000, 64, 500, 4);
139        assert_eq!(permits, 4);
140    }
141
142    #[test]
143    fn current_process_memory_mb_returns_some_value() {
144        let rss = current_process_memory_mb();
145        assert!(rss.is_some());
146    }
147}