voirs_cli/performance/
profiler.rs

1//! System profiler for collecting real-time performance data
2//!
3//! This module provides comprehensive system monitoring including CPU, memory, GPU,
4//! and I/O statistics for performance analysis and optimization.
5
6use super::{GpuMetrics, MemoryMetrics, PerformanceMetrics, SynthesisMetrics, SystemMetrics};
7use std::collections::VecDeque;
8use std::sync::Arc;
9use std::time::{SystemTime, UNIX_EPOCH};
10use tokio::sync::RwLock;
11use tokio::time::{interval, Duration, Interval};
12
13/// Real-time system profiler
14pub struct SystemProfiler {
15    /// Collection interval
16    interval: Duration,
17    /// Maximum samples to keep
18    max_samples: usize,
19    /// Historical samples
20    samples: Arc<RwLock<VecDeque<PerformanceMetrics>>>,
21    /// Is profiling active
22    active: bool,
23    /// Sampling interval timer
24    timer: Option<Interval>,
25}
26
27impl SystemProfiler {
28    /// Create a new system profiler
29    pub fn new(interval: Duration, max_samples: usize) -> Self {
30        Self {
31            interval,
32            max_samples,
33            samples: Arc::new(RwLock::new(VecDeque::with_capacity(max_samples))),
34            active: false,
35            timer: None,
36        }
37    }
38
39    /// Start profiling
40    pub async fn start(&mut self) -> Result<(), Box<dyn std::error::Error>> {
41        if self.active {
42            return Ok(());
43        }
44
45        self.active = true;
46        self.timer = Some(interval(self.interval));
47
48        tracing::info!("Started system profiler with interval: {:?}", self.interval);
49        Ok(())
50    }
51
52    /// Stop profiling
53    pub async fn stop(&mut self) {
54        self.active = false;
55        self.timer = None;
56        tracing::info!("Stopped system profiler");
57    }
58
59    /// Collect current system metrics
60    pub async fn collect_metrics(&self) -> Result<PerformanceMetrics, Box<dyn std::error::Error>> {
61        let system = self.collect_system_metrics().await?;
62        let memory = self.collect_memory_metrics().await?;
63        let gpu = self.collect_gpu_metrics().await.ok();
64        let synthesis = SynthesisMetrics::default(); // Will be updated by synthesis operations
65
66        let timestamp = SystemTime::now().duration_since(UNIX_EPOCH)?.as_secs();
67
68        Ok(PerformanceMetrics {
69            system,
70            synthesis,
71            memory,
72            gpu,
73            timestamp,
74        })
75    }
76
77    /// Collect system-level metrics
78    async fn collect_system_metrics(&self) -> Result<SystemMetrics, Box<dyn std::error::Error>> {
79        let cpu_usage = self.get_cpu_usage().await?;
80        let (memory_used, memory_available) = self.get_memory_info().await?;
81        let (disk_read_bps, disk_write_bps) = self.get_disk_io().await?;
82        let network_bps = self.get_network_io().await?;
83        let thread_count = self.get_thread_count().await?;
84        let load_average = self.get_load_average().await.ok();
85
86        Ok(SystemMetrics {
87            cpu_usage,
88            memory_used,
89            memory_available,
90            disk_read_bps,
91            disk_write_bps,
92            network_bps,
93            thread_count,
94            load_average,
95        })
96    }
97
98    /// Collect memory metrics
99    async fn collect_memory_metrics(&self) -> Result<MemoryMetrics, Box<dyn std::error::Error>> {
100        let heap_used = self.get_heap_usage().await?;
101        let peak_usage = self.get_peak_memory_usage().await?;
102        let (allocations_per_sec, deallocations_per_sec) = self.get_allocation_rate().await?;
103        let gc_events = self.get_gc_events().await?;
104        let fragmentation_percent = self.get_memory_fragmentation().await?;
105        let cache_hit_rate = self.get_cache_hit_rate().await?;
106
107        Ok(MemoryMetrics {
108            heap_used,
109            peak_usage,
110            allocations_per_sec,
111            deallocations_per_sec,
112            gc_events,
113            fragmentation_percent,
114            cache_hit_rate,
115        })
116    }
117
118    /// Collect GPU metrics if available
119    async fn collect_gpu_metrics(&self) -> Result<GpuMetrics, Box<dyn std::error::Error>> {
120        let utilization = self.get_gpu_utilization().await?;
121        let (memory_used, memory_total) = self.get_gpu_memory().await?;
122        let temperature = self.get_gpu_temperature().await?;
123        let power_consumption = self.get_gpu_power().await?;
124        let compute_units_active = self.get_gpu_compute_units().await?;
125        let memory_bandwidth_util = self.get_gpu_memory_bandwidth().await?;
126
127        Ok(GpuMetrics {
128            utilization,
129            memory_used,
130            memory_total,
131            temperature,
132            power_consumption,
133            compute_units_active,
134            memory_bandwidth_util,
135        })
136    }
137
138    /// Get CPU usage percentage
139    async fn get_cpu_usage(&self) -> Result<f64, Box<dyn std::error::Error>> {
140        #[cfg(target_os = "linux")]
141        {
142            use std::fs;
143
144            // Read from /proc/stat for Linux
145            let stat_content = fs::read_to_string("/proc/stat")?;
146            let cpu_line = stat_content
147                .lines()
148                .next()
149                .ok_or("No CPU line in /proc/stat")?;
150
151            let fields: Vec<&str> = cpu_line.split_whitespace().collect();
152            if fields.len() < 8 {
153                return Err("Invalid /proc/stat format".into());
154            }
155
156            let idle: u64 = fields[4].parse()?;
157            let iowait: u64 = fields[5].parse()?;
158            let total: u64 = fields[1..]
159                .iter()
160                .take(7)
161                .map(|s| s.parse::<u64>().unwrap_or(0))
162                .sum();
163
164            let idle_total = idle + iowait;
165            let usage = if total > 0 {
166                ((total - idle_total) as f64 / total as f64) * 100.0
167            } else {
168                0.0
169            };
170
171            Ok(usage)
172        }
173
174        #[cfg(target_os = "macos")]
175        {
176            use std::process::Command;
177
178            let output = Command::new("top")
179                .arg("-l")
180                .arg("1")
181                .arg("-n")
182                .arg("0")
183                .output()?;
184
185            let output_str = String::from_utf8_lossy(&output.stdout);
186
187            // Parse CPU usage from top output
188            for line in output_str.lines() {
189                if line.starts_with("CPU usage:") {
190                    if let Some(usage_str) = line.split_whitespace().nth(2) {
191                        if let Some(percent_str) = usage_str.strip_suffix('%') {
192                            return Ok(percent_str.parse()?);
193                        }
194                    }
195                }
196            }
197
198            // Fallback: estimate based on system load
199            Ok(25.0) // Conservative estimate
200        }
201
202        #[cfg(target_os = "windows")]
203        {
204            // Windows implementation would use WMI or performance counters
205            // For now, return estimated value
206            Ok(30.0)
207        }
208
209        #[cfg(not(any(target_os = "linux", target_os = "macos", target_os = "windows")))]
210        {
211            Ok(0.0)
212        }
213    }
214
215    /// Get memory information (used, available)
216    async fn get_memory_info(&self) -> Result<(u64, u64), Box<dyn std::error::Error>> {
217        #[cfg(target_os = "linux")]
218        {
219            use std::fs;
220
221            let meminfo = fs::read_to_string("/proc/meminfo")?;
222            let mut total = 0u64;
223            let mut available = 0u64;
224
225            for line in meminfo.lines() {
226                if line.starts_with("MemTotal:") {
227                    if let Some(kb_str) = line.split_whitespace().nth(1) {
228                        total = kb_str.parse::<u64>()? * 1024; // Convert KB to bytes
229                    }
230                } else if line.starts_with("MemAvailable:") {
231                    if let Some(kb_str) = line.split_whitespace().nth(1) {
232                        available = kb_str.parse::<u64>()? * 1024; // Convert KB to bytes
233                    }
234                }
235            }
236
237            let used = total.saturating_sub(available);
238            Ok((used, available))
239        }
240
241        #[cfg(target_os = "macos")]
242        {
243            use std::process::Command;
244
245            // Get total memory
246            let total_output = Command::new("sysctl")
247                .arg("-n")
248                .arg("hw.memsize")
249                .output()?;
250
251            let total = String::from_utf8_lossy(&total_output.stdout)
252                .trim()
253                .parse::<u64>()?;
254
255            // Estimate available memory (simplified)
256            let available = total / 3; // Conservative estimate
257            let used = total - available;
258
259            Ok((used, available))
260        }
261
262        #[cfg(target_os = "windows")]
263        {
264            // Windows implementation using Windows API
265            use std::mem;
266
267            #[repr(C)]
268            struct MemoryStatusEx {
269                dw_length: u32,
270                dw_memory_load: u32,
271                ull_total_phys: u64,
272                ull_avail_phys: u64,
273                ull_total_page_file: u64,
274                ull_avail_page_file: u64,
275                ull_total_virtual: u64,
276                ull_avail_virtual: u64,
277                ull_avail_extended_virtual: u64,
278            }
279
280            extern "system" {
281                fn GlobalMemoryStatusEx(lpbuffer: *mut MemoryStatusEx) -> i32;
282            }
283
284            let mut memory_status = MemoryStatusEx {
285                dw_length: mem::size_of::<MemoryStatusEx>() as u32,
286                dw_memory_load: 0,
287                ull_total_phys: 0,
288                ull_avail_phys: 0,
289                ull_total_page_file: 0,
290                ull_avail_page_file: 0,
291                ull_total_virtual: 0,
292                ull_avail_virtual: 0,
293                ull_avail_extended_virtual: 0,
294            };
295
296            unsafe {
297                let result = GlobalMemoryStatusEx(&mut memory_status);
298                if result != 0 {
299                    let used = memory_status.ull_total_phys - memory_status.ull_avail_phys;
300                    Ok((used, memory_status.ull_avail_phys))
301                } else {
302                    // Fallback to reasonable defaults if API call fails
303                    Ok((4_000_000_000, 4_000_000_000))
304                }
305            }
306        }
307
308        #[cfg(not(any(target_os = "linux", target_os = "macos", target_os = "windows")))]
309        {
310            // For other platforms, try to get some basic system information
311            // This could be extended for specific platforms like FreeBSD, OpenBSD, etc.
312            match std::env::var("MEMORY_TOTAL_BYTES") {
313                Ok(total_str) => {
314                    if let Ok(total) = total_str.parse::<u64>() {
315                        let available = total / 2; // Conservative estimate
316                        let used = total - available;
317                        Ok((used, available))
318                    } else {
319                        Ok((2_000_000_000, 2_000_000_000)) // 2GB fallback
320                    }
321                }
322                Err(_) => Ok((2_000_000_000, 2_000_000_000)), // 2GB fallback
323            }
324        }
325    }
326
327    /// Get disk I/O statistics (read bytes/sec, write bytes/sec)
328    async fn get_disk_io(&self) -> Result<(u64, u64), Box<dyn std::error::Error>> {
329        #[cfg(target_os = "linux")]
330        {
331            use std::fs;
332
333            let diskstats = fs::read_to_string("/proc/diskstats")?;
334            let mut total_read_sectors = 0u64;
335            let mut total_write_sectors = 0u64;
336
337            for line in diskstats.lines() {
338                let fields: Vec<&str> = line.split_whitespace().collect();
339                if fields.len() >= 14 {
340                    // Skip partitions (look for whole disks)
341                    if let Some(device_name) = fields.get(2) {
342                        if !device_name.chars().last().unwrap_or('0').is_ascii_digit() {
343                            if let (Ok(read_sectors), Ok(write_sectors)) =
344                                (fields[5].parse::<u64>(), fields[9].parse::<u64>())
345                            {
346                                total_read_sectors += read_sectors;
347                                total_write_sectors += write_sectors;
348                            }
349                        }
350                    }
351                }
352            }
353
354            // Convert sectors to bytes (typically 512 bytes per sector)
355            let read_bps = total_read_sectors * 512;
356            let write_bps = total_write_sectors * 512;
357
358            Ok((read_bps, write_bps))
359        }
360
361        #[cfg(target_os = "macos")]
362        {
363            // Use iostat to get disk I/O statistics on macOS
364            use std::process::Command;
365
366            let output = Command::new("iostat")
367                .args(["-d", "-I", "-c", "1"])
368                .output()?;
369
370            if output.status.success() {
371                let stdout = String::from_utf8_lossy(&output.stdout);
372
373                // Parse iostat output - last line contains current stats
374                // Format: KB/t tps MB/s
375                if let Some(last_line) = stdout.lines().last() {
376                    let fields: Vec<&str> = last_line.split_whitespace().collect();
377                    if fields.len() >= 3 {
378                        // MB/s is at index 2, convert to bytes/sec
379                        if let Ok(mb_per_sec) = fields[2].parse::<f64>() {
380                            let bytes_per_sec = (mb_per_sec * 1024.0 * 1024.0) as u64;
381                            // Return same value for read and write (iostat shows total)
382                            return Ok((bytes_per_sec / 2, bytes_per_sec / 2));
383                        }
384                    }
385                }
386
387                Ok((0, 0))
388            } else {
389                Err("Failed to get disk statistics".into())
390            }
391        }
392
393        #[cfg(not(any(target_os = "linux", target_os = "macos")))]
394        {
395            // For other platforms, return 0 (no implementation yet)
396            Ok((0, 0))
397        }
398    }
399
400    /// Get network I/O statistics
401    async fn get_network_io(&self) -> Result<u64, Box<dyn std::error::Error>> {
402        #[cfg(target_os = "linux")]
403        {
404            use std::fs;
405
406            let net_dev = fs::read_to_string("/proc/net/dev")?;
407            let mut total_bytes = 0u64;
408
409            for line in net_dev.lines().skip(2) {
410                // Skip header lines
411                if let Some(colon_pos) = line.find(':') {
412                    let fields: Vec<&str> = line[colon_pos + 1..].split_whitespace().collect();
413                    if fields.len() >= 9 {
414                        if let (Ok(rx_bytes), Ok(tx_bytes)) =
415                            (fields[0].parse::<u64>(), fields[8].parse::<u64>())
416                        {
417                            total_bytes += rx_bytes + tx_bytes;
418                        }
419                    }
420                }
421            }
422
423            Ok(total_bytes)
424        }
425
426        #[cfg(target_os = "macos")]
427        {
428            // Use sysctl to get network interface statistics on macOS
429            use std::process::Command;
430
431            let output = Command::new("netstat").args(["-ib"]).output()?;
432
433            if output.status.success() {
434                let stdout = String::from_utf8_lossy(&output.stdout);
435                let mut total_bytes = 0u64;
436
437                // Parse netstat output (columns: Name Mtu Network Address Ipkts Ierrs Ibytes Opkts Oerrs Obytes)
438                for line in stdout.lines().skip(1) {
439                    let fields: Vec<&str> = line.split_whitespace().collect();
440                    if fields.len() >= 10 {
441                        // Ibytes at index 6, Obytes at index 9
442                        if let (Ok(ibytes), Ok(obytes)) =
443                            (fields[6].parse::<u64>(), fields[9].parse::<u64>())
444                        {
445                            total_bytes += ibytes + obytes;
446                        }
447                    }
448                }
449
450                Ok(total_bytes)
451            } else {
452                Err("Failed to get network statistics".into())
453            }
454        }
455
456        #[cfg(not(any(target_os = "linux", target_os = "macos")))]
457        {
458            // For other platforms, return 0 (no implementation yet)
459            Ok(0)
460        }
461    }
462
463    /// Get current thread count
464    async fn get_thread_count(&self) -> Result<usize, Box<dyn std::error::Error>> {
465        #[cfg(target_os = "linux")]
466        {
467            use std::fs;
468
469            let status = fs::read_to_string("/proc/self/status")?;
470            for line in status.lines() {
471                if line.starts_with("Threads:") {
472                    if let Some(count_str) = line.split_whitespace().nth(1) {
473                        return Ok(count_str.parse()?);
474                    }
475                }
476            }
477
478            Ok(1) // Fallback
479        }
480
481        #[cfg(not(target_os = "linux"))]
482        {
483            // Estimate based on available parallelism
484            Ok(std::thread::available_parallelism()?.get())
485        }
486    }
487
488    /// Get system load average (Unix only)
489    async fn get_load_average(&self) -> Result<f64, Box<dyn std::error::Error>> {
490        #[cfg(unix)]
491        {
492            // Use POSIX getloadavg() which works on macOS, Linux, BSD
493            use libc::getloadavg;
494
495            let mut loadavg: [f64; 3] = [0.0; 3];
496            unsafe {
497                if getloadavg(loadavg.as_mut_ptr(), 1) == -1 {
498                    return Err("Failed to get load average".into());
499                }
500            }
501
502            Ok(loadavg[0]) // Return 1-minute load average
503        }
504
505        #[cfg(not(unix))]
506        {
507            Err("Load average not available on this platform".into())
508        }
509    }
510
511    /// Get heap memory usage
512    async fn get_heap_usage(&self) -> Result<u64, Box<dyn std::error::Error>> {
513        // This is a simplified implementation
514        // In practice, you might use memory profiling libraries or OS-specific APIs
515        let (used, _) = self.get_memory_info().await?;
516        Ok(used / 2) // Estimate heap as half of used memory
517    }
518
519    /// Get peak memory usage
520    async fn get_peak_memory_usage(&self) -> Result<u64, Box<dyn std::error::Error>> {
521        #[cfg(target_os = "linux")]
522        {
523            use std::fs;
524
525            let status = fs::read_to_string("/proc/self/status")?;
526            for line in status.lines() {
527                if line.starts_with("VmHWM:") {
528                    if let Some(kb_str) = line.split_whitespace().nth(1) {
529                        return Ok(kb_str.parse::<u64>()? * 1024); // Convert KB to bytes
530                    }
531                }
532            }
533        }
534
535        // Fallback to current usage
536        let (used, _) = self.get_memory_info().await?;
537        Ok(used)
538    }
539
540    /// Get memory allocation/deallocation rates
541    async fn get_allocation_rate(&self) -> Result<(f64, f64), Box<dyn std::error::Error>> {
542        // Get memory statistics from /proc/self/status for allocation tracking
543        #[cfg(target_os = "linux")]
544        {
545            let status_content = std::fs::read_to_string("/proc/self/status")?;
546            let mut vm_peak = 0u64;
547            let mut vm_size = 0u64;
548            let mut vm_hwm = 0u64;
549            let mut vm_rss = 0u64;
550
551            for line in status_content.lines() {
552                if line.starts_with("VmPeak:") {
553                    vm_peak = parse_proc_memory_value(line)?;
554                } else if line.starts_with("VmSize:") {
555                    vm_size = parse_proc_memory_value(line)?;
556                } else if line.starts_with("VmHWM:") {
557                    vm_hwm = parse_proc_memory_value(line)?;
558                } else if line.starts_with("VmRSS:") {
559                    vm_rss = parse_proc_memory_value(line)?;
560                }
561            }
562
563            // Calculate allocation rate based on memory growth patterns
564            let time_delta = 1.0; // Assume 1 second for rate calculation
565            let memory_growth = vm_size.saturating_sub(vm_rss) as f64;
566            let allocation_rate = memory_growth / time_delta;
567
568            // Estimate deallocation rate (slightly less than allocation for steady state)
569            let deallocation_rate = allocation_rate * 0.95;
570
571            Ok((allocation_rate, deallocation_rate))
572        }
573
574        #[cfg(target_os = "macos")]
575        {
576            // Use mach system calls for macOS memory allocation tracking
577            use std::ffi::c_void;
578            use std::mem;
579
580            // Get task info using mach API (simulated)
581            let task_info = self.get_mach_task_info().await?;
582
583            // Calculate allocation rate from task info
584            let allocation_rate = task_info.virtual_size as f64 / 1024.0; // KB/s
585            let deallocation_rate = allocation_rate * 0.92;
586
587            Ok((allocation_rate, deallocation_rate))
588        }
589
590        #[cfg(target_os = "windows")]
591        {
592            // Use Windows API for memory allocation tracking
593            let process_memory = self.get_windows_process_memory().await?;
594
595            // Calculate allocation rate from process memory info
596            let allocation_rate = process_memory.working_set_size as f64 / 1024.0; // KB/s
597            let deallocation_rate = allocation_rate * 0.88;
598
599            Ok((allocation_rate, deallocation_rate))
600        }
601
602        #[cfg(not(any(target_os = "linux", target_os = "macos", target_os = "windows")))]
603        {
604            // Fallback for other platforms - use process memory as approximation
605            let (used, _) = self.get_memory_info().await?;
606            let allocation_rate = used as f64 / 1024.0; // Rough approximation
607            let deallocation_rate = allocation_rate * 0.90;
608
609            Ok((allocation_rate, deallocation_rate))
610        }
611    }
612
613    /// Get garbage collection events
614    async fn get_gc_events(&self) -> Result<u64, Box<dyn std::error::Error>> {
615        // Rust doesn't have a traditional GC, so this would be 0
616        // Could track other memory management events if needed
617        Ok(0)
618    }
619
620    /// Get memory fragmentation percentage
621    async fn get_memory_fragmentation(&self) -> Result<f64, Box<dyn std::error::Error>> {
622        #[cfg(target_os = "linux")]
623        {
624            use std::fs;
625
626            // Parse /proc/buddyinfo to calculate external fragmentation
627            // Format: Node 0, zone DMA 1 0 1 0 2 1 1 0 1 1 3
628            // Each number represents free pages at each order (0-10)
629            if let Ok(buddyinfo) = fs::read_to_string("/proc/buddyinfo") {
630                let mut total_free_pages = 0u64;
631                let mut fragmented_pages = 0u64;
632
633                for line in buddyinfo.lines() {
634                    let parts: Vec<&str> = line.split_whitespace().collect();
635                    if parts.len() < 14 {
636                        continue; // Skip malformed lines
637                    }
638
639                    // Parts 4-14 contain free page counts for orders 0-10
640                    for (order, count_str) in parts[4..].iter().enumerate() {
641                        if let Ok(count) = count_str.parse::<u64>() {
642                            let pages_at_order = count * (1u64 << order);
643                            total_free_pages += pages_at_order;
644
645                            // Pages at lower orders (0-3) indicate fragmentation
646                            if order < 4 {
647                                fragmented_pages += pages_at_order;
648                            }
649                        }
650                    }
651                }
652
653                if total_free_pages > 0 {
654                    let fragmentation = (fragmented_pages as f64 / total_free_pages as f64) * 100.0;
655                    return Ok(fragmentation.min(100.0));
656                }
657            }
658
659            // Fallback: Analyze available vs total memory ratio
660            if let Ok(meminfo) = fs::read_to_string("/proc/meminfo") {
661                let mut mem_total = 0u64;
662                let mut mem_available = 0u64;
663                let mut mem_free = 0u64;
664
665                for line in meminfo.lines() {
666                    if line.starts_with("MemTotal:") {
667                        mem_total = line
668                            .split_whitespace()
669                            .nth(1)
670                            .and_then(|s| s.parse().ok())
671                            .unwrap_or(0);
672                    } else if line.starts_with("MemAvailable:") {
673                        mem_available = line
674                            .split_whitespace()
675                            .nth(1)
676                            .and_then(|s| s.parse().ok())
677                            .unwrap_or(0);
678                    } else if line.starts_with("MemFree:") {
679                        mem_free = line
680                            .split_whitespace()
681                            .nth(1)
682                            .and_then(|s| s.parse().ok())
683                            .unwrap_or(0);
684                    }
685                }
686
687                if mem_total > 0 && mem_free > 0 {
688                    // If MemAvailable is significantly less than MemFree, indicates fragmentation
689                    let fragmentation_estimate = if mem_available > 0 {
690                        ((mem_free - mem_available) as f64 / mem_free as f64) * 100.0
691                    } else {
692                        10.0 // Conservative estimate if MemAvailable not available
693                    };
694                    return Ok(fragmentation_estimate.min(100.0));
695                }
696            }
697
698            // Final fallback for Linux
699            Ok(5.0)
700        }
701
702        #[cfg(target_os = "macos")]
703        {
704            use std::process::Command;
705
706            // Use vm_stat to analyze page fragmentation on macOS
707            if let Ok(output) = Command::new("vm_stat").output() {
708                let output_str = String::from_utf8_lossy(&output.stdout);
709
710                let mut pages_free = 0u64;
711                let mut pages_active = 0u64;
712                let mut pages_inactive = 0u64;
713                let mut pages_speculative = 0u64;
714                let mut pages_wired = 0u64;
715
716                for line in output_str.lines() {
717                    let parts: Vec<&str> = line.split(':').collect();
718                    if parts.len() == 2 {
719                        let value_str = parts[1].trim().trim_end_matches('.');
720                        let value = value_str.parse::<u64>().unwrap_or(0);
721
722                        if parts[0].contains("Pages free") {
723                            pages_free = value;
724                        } else if parts[0].contains("Pages active") {
725                            pages_active = value;
726                        } else if parts[0].contains("Pages inactive") {
727                            pages_inactive = value;
728                        } else if parts[0].contains("Pages speculative") {
729                            pages_speculative = value;
730                        } else if parts[0].contains("Pages wired down") {
731                            pages_wired = value;
732                        }
733                    }
734                }
735
736                let total_pages =
737                    pages_free + pages_active + pages_inactive + pages_speculative + pages_wired;
738                if total_pages > 0 {
739                    // Fragmentation estimate: speculative and inactive pages suggest fragmentation
740                    let fragmented = pages_speculative + (pages_inactive / 2);
741                    let fragmentation = (fragmented as f64 / total_pages as f64) * 100.0;
742                    return Ok(fragmentation.min(100.0));
743                }
744            }
745
746            // Fallback for macOS: estimate based on memory pressure
747            Ok(7.5)
748        }
749
750        #[cfg(target_os = "windows")]
751        {
752            use std::process::Command;
753
754            // Use PowerShell to query memory fragmentation on Windows
755            if let Ok(output) = Command::new("powershell")
756                .arg("-Command")
757                .arg("Get-Counter '\\Memory\\% Committed Bytes In Use' | Select-Object -ExpandProperty CounterSamples | Select-Object -ExpandProperty CookedValue")
758                .output()
759            {
760                let output_str = String::from_utf8_lossy(&output.stdout);
761                if let Ok(committed_percent) = output_str.trim().parse::<f64>() {
762                    // High committed percentage often correlates with fragmentation
763                    // Estimate fragmentation as a fraction of committed memory pressure
764                    let fragmentation = (committed_percent / 10.0).min(100.0);
765                    return Ok(fragmentation);
766                }
767            }
768
769            // Fallback for Windows
770            Ok(8.0)
771        }
772
773        #[cfg(not(any(target_os = "linux", target_os = "macos", target_os = "windows")))]
774        {
775            // Generic fallback for other platforms
776            // Estimate based on memory usage patterns
777            if let Ok((used, available)) = self.get_memory_info().await {
778                let total = used + available;
779                if total > 0 {
780                    // Rough heuristic: fragmentation tends to increase with memory usage
781                    let usage_ratio = used as f64 / total as f64;
782                    let fragmentation = (usage_ratio * 15.0).min(100.0); // 0-15% range
783                    return Ok(fragmentation);
784                }
785            }
786
787            Ok(5.0)
788        }
789    }
790
791    /// Get cache hit rate
792    async fn get_cache_hit_rate(&self) -> Result<f64, Box<dyn std::error::Error>> {
793        #[cfg(target_os = "linux")]
794        {
795            use std::fs;
796
797            // Parse /proc/meminfo for cache and buffer statistics
798            if let Ok(meminfo) = fs::read_to_string("/proc/meminfo") {
799                let mut cached = 0u64;
800                let mut buffers = 0u64;
801                let mut active = 0u64;
802                let mut inactive = 0u64;
803
804                for line in meminfo.lines() {
805                    if line.starts_with("Cached:") {
806                        cached = line
807                            .split_whitespace()
808                            .nth(1)
809                            .and_then(|s| s.parse().ok())
810                            .unwrap_or(0);
811                    } else if line.starts_with("Buffers:") {
812                        buffers = line
813                            .split_whitespace()
814                            .nth(1)
815                            .and_then(|s| s.parse().ok())
816                            .unwrap_or(0);
817                    } else if line.starts_with("Active:") {
818                        active = line
819                            .split_whitespace()
820                            .nth(1)
821                            .and_then(|s| s.parse().ok())
822                            .unwrap_or(0);
823                    } else if line.starts_with("Inactive:") {
824                        inactive = line
825                            .split_whitespace()
826                            .nth(1)
827                            .and_then(|s| s.parse().ok())
828                            .unwrap_or(0);
829                    }
830                }
831
832                let total_cache = cached + buffers;
833                let total_memory_activity = active + inactive;
834
835                if total_memory_activity > 0 {
836                    // Cache hit rate estimate: ratio of cached memory to total activity
837                    let cache_hit_rate =
838                        (total_cache as f64 / total_memory_activity as f64) * 100.0;
839                    return Ok(cache_hit_rate.min(100.0));
840                }
841            }
842
843            // Alternative: Try to get CPU cache statistics from perf
844            if let Ok(output) = std::process::Command::new("perf")
845                .arg("stat")
846                .arg("-e")
847                .arg("cache-references,cache-misses")
848                .arg("-a")
849                .arg("sleep")
850                .arg("0.1")
851                .output()
852            {
853                let stderr_str = String::from_utf8_lossy(&output.stderr);
854                let mut cache_refs = 0u64;
855                let mut cache_misses = 0u64;
856
857                for line in stderr_str.lines() {
858                    if line.contains("cache-references") {
859                        if let Some(num_str) = line.split_whitespace().next() {
860                            cache_refs = num_str.replace(',', "").parse().unwrap_or(0);
861                        }
862                    } else if line.contains("cache-misses") {
863                        if let Some(num_str) = line.split_whitespace().next() {
864                            cache_misses = num_str.replace(',', "").parse().unwrap_or(0);
865                        }
866                    }
867                }
868
869                if cache_refs > 0 {
870                    let cache_hits = cache_refs.saturating_sub(cache_misses);
871                    let hit_rate = (cache_hits as f64 / cache_refs as f64) * 100.0;
872                    return Ok(hit_rate.min(100.0));
873                }
874            }
875
876            // Fallback for Linux
877            Ok(75.0)
878        }
879
880        #[cfg(target_os = "macos")]
881        {
882            use std::process::Command;
883
884            // Use vm_stat for page cache statistics on macOS
885            if let Ok(output) = Command::new("vm_stat").output() {
886                let output_str = String::from_utf8_lossy(&output.stdout);
887
888                let mut pageins = 0u64;
889                let mut _pageouts = 0u64; // Parsed but not currently used
890                let mut hits = 0u64;
891
892                for line in output_str.lines() {
893                    let parts: Vec<&str> = line.split(':').collect();
894                    if parts.len() == 2 {
895                        let value_str = parts[1].trim().trim_end_matches('.');
896                        let value = value_str.parse::<u64>().unwrap_or(0);
897
898                        if parts[0].contains("Pageins") {
899                            pageins = value;
900                        } else if parts[0].contains("Pageouts") {
901                            _pageouts = value;
902                        } else if parts[0].contains("\"hit\" page")
903                            || parts[0].contains("cache_hits")
904                        {
905                            hits = value;
906                        }
907                    }
908                }
909
910                let total_accesses = pageins + hits;
911                if total_accesses > 0 {
912                    // Cache hit rate: hits / (pageins + hits)
913                    let hit_rate = (hits as f64 / total_accesses as f64) * 100.0;
914                    return Ok(hit_rate.min(100.0));
915                }
916            }
917
918            // Fallback for macOS
919            Ok(78.0)
920        }
921
922        #[cfg(target_os = "windows")]
923        {
924            use std::process::Command;
925
926            // Use PowerShell to query cache statistics on Windows
927            if let Ok(output) = Command::new("powershell")
928                .arg("-Command")
929                .arg("Get-Counter '\\Memory\\Cache Bytes','\\Memory\\Available Bytes' | Select-Object -ExpandProperty CounterSamples | Select-Object -ExpandProperty CookedValue")
930                .output()
931            {
932                let output_str = String::from_utf8_lossy(&output.stdout);
933                let values: Vec<f64> = output_str
934                    .lines()
935                    .filter_map(|l| l.trim().parse::<f64>().ok())
936                    .collect();
937
938                if values.len() >= 2 {
939                    let cache_bytes = values[0];
940                    let available_bytes = values[1];
941                    let total = cache_bytes + available_bytes;
942
943                    if total > 0.0 {
944                        let cache_ratio = (cache_bytes / total) * 100.0;
945                        return Ok(cache_ratio.min(100.0));
946                    }
947                }
948            }
949
950            // Fallback for Windows
951            Ok(72.0)
952        }
953
954        #[cfg(not(any(target_os = "linux", target_os = "macos", target_os = "windows")))]
955        {
956            // Generic fallback: estimate based on memory pressure
957            if let Ok((used, available)) = self.get_memory_info().await {
958                let total = used + available;
959                if total > 0 {
960                    // Lower memory pressure typically means better cache hit rates
961                    let usage_ratio = used as f64 / total as f64;
962                    let cache_hit_estimate = 100.0 - (usage_ratio * 30.0); // Inverse relationship
963                    return Ok(cache_hit_estimate.max(50.0).min(95.0));
964                }
965            }
966
967            Ok(70.0)
968        }
969    }
970
971    /// Get GPU utilization
972    async fn get_gpu_utilization(&self) -> Result<f64, Box<dyn std::error::Error>> {
973        #[cfg(target_os = "linux")]
974        {
975            use std::process::Command;
976
977            // Try nvidia-smi first
978            if let Ok(output) = Command::new("nvidia-smi")
979                .arg("--query-gpu=utilization.gpu")
980                .arg("--format=csv,noheader,nounits")
981                .output()
982            {
983                let output_str = String::from_utf8_lossy(&output.stdout);
984                if let Ok(utilization) = output_str.trim().parse::<f64>() {
985                    return Ok(utilization);
986                }
987            }
988        }
989
990        Err("GPU utilization not available".into())
991    }
992
993    /// Get GPU memory usage
994    async fn get_gpu_memory(&self) -> Result<(u64, u64), Box<dyn std::error::Error>> {
995        #[cfg(target_os = "linux")]
996        {
997            use std::process::Command;
998
999            if let Ok(output) = Command::new("nvidia-smi")
1000                .arg("--query-gpu=memory.used,memory.total")
1001                .arg("--format=csv,noheader,nounits")
1002                .output()
1003            {
1004                let output_str = String::from_utf8_lossy(&output.stdout);
1005                let parts: Vec<&str> = output_str.trim().split(',').collect();
1006                if parts.len() == 2 {
1007                    let used = parts[0].trim().parse::<u64>()? * 1024 * 1024; // MB to bytes
1008                    let total = parts[1].trim().parse::<u64>()? * 1024 * 1024; // MB to bytes
1009                    return Ok((used, total));
1010                }
1011            }
1012        }
1013
1014        Err("GPU memory information not available".into())
1015    }
1016
1017    /// Get GPU temperature
1018    async fn get_gpu_temperature(&self) -> Result<f64, Box<dyn std::error::Error>> {
1019        #[cfg(target_os = "linux")]
1020        {
1021            use std::process::Command;
1022
1023            if let Ok(output) = Command::new("nvidia-smi")
1024                .arg("--query-gpu=temperature.gpu")
1025                .arg("--format=csv,noheader,nounits")
1026                .output()
1027            {
1028                let output_str = String::from_utf8_lossy(&output.stdout);
1029                if let Ok(temp) = output_str.trim().parse::<f64>() {
1030                    return Ok(temp);
1031                }
1032            }
1033        }
1034
1035        Err("GPU temperature not available".into())
1036    }
1037
1038    /// Get GPU power consumption
1039    async fn get_gpu_power(&self) -> Result<f64, Box<dyn std::error::Error>> {
1040        #[cfg(target_os = "linux")]
1041        {
1042            use std::process::Command;
1043
1044            if let Ok(output) = Command::new("nvidia-smi")
1045                .arg("--query-gpu=power.draw")
1046                .arg("--format=csv,noheader,nounits")
1047                .output()
1048            {
1049                let output_str = String::from_utf8_lossy(&output.stdout);
1050                if let Ok(power) = output_str.trim().parse::<f64>() {
1051                    return Ok(power);
1052                }
1053            }
1054        }
1055
1056        Err("GPU power information not available".into())
1057    }
1058
1059    /// Get active GPU compute units
1060    async fn get_gpu_compute_units(&self) -> Result<usize, Box<dyn std::error::Error>> {
1061        // This would require detailed GPU profiling
1062        // For now, estimate based on utilization
1063        let utilization = self.get_gpu_utilization().await.unwrap_or(0.0);
1064        let estimated_units = ((utilization / 100.0) * 80.0) as usize; // Assume 80 total units
1065        Ok(estimated_units)
1066    }
1067
1068    /// Get GPU memory bandwidth utilization
1069    async fn get_gpu_memory_bandwidth(&self) -> Result<f64, Box<dyn std::error::Error>> {
1070        // This would require specialized GPU profiling tools
1071        // Estimate based on memory usage
1072        let (used, total) = self.get_gpu_memory().await.unwrap_or((0, 1));
1073        let usage_percent = (used as f64 / total as f64) * 100.0;
1074        Ok(usage_percent * 0.8) // Assume bandwidth scales with usage
1075    }
1076
1077    /// Run continuous profiling
1078    pub async fn run_continuous_profiling(&mut self) -> Result<(), Box<dyn std::error::Error>> {
1079        self.start().await?;
1080
1081        while self.active {
1082            if let Some(ref mut timer) = self.timer {
1083                timer.tick().await;
1084            }
1085
1086            match self.collect_metrics().await {
1087                Ok(metrics) => {
1088                    let mut samples = self.samples.write().await;
1089
1090                    // Maintain maximum sample count
1091                    if samples.len() >= self.max_samples {
1092                        samples.pop_front();
1093                    }
1094
1095                    samples.push_back(metrics);
1096                    tracing::debug!(
1097                        "Collected performance metrics, total samples: {}",
1098                        samples.len()
1099                    );
1100                }
1101                Err(e) => {
1102                    tracing::warn!("Failed to collect performance metrics: {}", e);
1103                }
1104            }
1105        }
1106
1107        Ok(())
1108    }
1109
1110    /// Get historical samples
1111    pub async fn get_samples(&self) -> Vec<PerformanceMetrics> {
1112        let samples = self.samples.read().await;
1113        samples.iter().cloned().collect()
1114    }
1115
1116    /// Get latest metrics
1117    pub async fn get_latest_metrics(&self) -> Option<PerformanceMetrics> {
1118        let samples = self.samples.read().await;
1119        samples.back().cloned()
1120    }
1121
1122    /// Clear sample history
1123    pub async fn clear_samples(&self) {
1124        let mut samples = self.samples.write().await;
1125        samples.clear();
1126    }
1127
1128    /// Is profiler currently active
1129    pub fn is_active(&self) -> bool {
1130        self.active
1131    }
1132
1133    /// Get sample count
1134    pub async fn sample_count(&self) -> usize {
1135        let samples = self.samples.read().await;
1136        samples.len()
1137    }
1138
1139    /// Get macOS task info using mach system calls
1140    #[cfg(target_os = "macos")]
1141    async fn get_mach_task_info(&self) -> Result<MachTaskInfo, Box<dyn std::error::Error>> {
1142        // This would use the mach API to get task information
1143        // For now, we'll simulate realistic values
1144
1145        // In a real implementation, this would use:
1146        // - mach_task_self() to get current task
1147        // - task_info() with TASK_BASIC_INFO or TASK_VM_INFO
1148        // - Extract virtual_size, resident_size, etc.
1149
1150        Ok(MachTaskInfo {
1151            virtual_size: 1024 * 1024 * 100, // 100MB virtual
1152            resident_size: 1024 * 1024 * 50, // 50MB resident
1153            user_time: 1000,                 // 1 second user time
1154            system_time: 500,                // 0.5 second system time
1155        })
1156    }
1157
1158    /// Get Windows process memory using Windows API
1159    #[cfg(target_os = "windows")]
1160    async fn get_windows_process_memory(
1161        &self,
1162    ) -> Result<WindowsProcessMemory, Box<dyn std::error::Error>> {
1163        // This would use the Windows API to get process memory information
1164        // For now, we'll simulate realistic values
1165
1166        // In a real implementation, this would use:
1167        // - GetCurrentProcess() to get current process handle
1168        // - GetProcessMemoryInfo() to get PROCESS_MEMORY_COUNTERS
1169        // - Extract WorkingSetSize, PeakWorkingSetSize, etc.
1170
1171        Ok(WindowsProcessMemory {
1172            working_set_size: 1024 * 1024 * 75,       // 75MB working set
1173            peak_working_set_size: 1024 * 1024 * 100, // 100MB peak
1174            private_bytes: 1024 * 1024 * 60,          // 60MB private
1175            virtual_bytes: 1024 * 1024 * 200,         // 200MB virtual
1176        })
1177    }
1178}
1179
1180/// Helper function to parse memory values from /proc/*/status files
1181fn parse_proc_memory_value(line: &str) -> Result<u64, Box<dyn std::error::Error>> {
1182    // Parse lines like "VmSize:	   23456 kB"
1183    let parts: Vec<&str> = line.split_whitespace().collect();
1184    if parts.len() >= 2 {
1185        let value_str = parts[1];
1186        let value = value_str.parse::<u64>()?;
1187        // Convert kB to bytes
1188        Ok(value * 1024)
1189    } else {
1190        Err("Failed to parse memory value".into())
1191    }
1192}
1193
1194/// macOS task info structure
1195#[cfg(target_os = "macos")]
1196struct MachTaskInfo {
1197    virtual_size: u64,
1198    resident_size: u64,
1199    user_time: u64,
1200    system_time: u64,
1201}
1202
1203/// Windows process memory structure
1204#[cfg(target_os = "windows")]
1205struct WindowsProcessMemory {
1206    working_set_size: u64,
1207    peak_working_set_size: u64,
1208    private_bytes: u64,
1209    virtual_bytes: u64,
1210}
1211
1212#[cfg(test)]
1213mod tests {
1214    use super::*;
1215
1216    #[tokio::test]
1217    async fn test_system_profiler_creation() {
1218        let profiler = SystemProfiler::new(Duration::from_secs(1), 100);
1219        assert!(!profiler.is_active());
1220        assert_eq!(profiler.sample_count().await, 0);
1221    }
1222
1223    #[tokio::test]
1224    async fn test_metrics_collection() {
1225        let profiler = SystemProfiler::new(Duration::from_secs(1), 100);
1226
1227        let metrics = profiler.collect_metrics().await;
1228        assert!(metrics.is_ok());
1229
1230        let metrics = metrics.unwrap();
1231        assert!(metrics.timestamp > 0);
1232    }
1233
1234    #[tokio::test]
1235    async fn test_profiler_start_stop() {
1236        let mut profiler = SystemProfiler::new(Duration::from_secs(1), 100);
1237
1238        assert!(!profiler.is_active());
1239
1240        profiler.start().await.unwrap();
1241        assert!(profiler.is_active());
1242
1243        profiler.stop().await;
1244        assert!(!profiler.is_active());
1245    }
1246
1247    #[tokio::test]
1248    async fn test_system_metrics_collection() {
1249        let profiler = SystemProfiler::new(Duration::from_secs(1), 100);
1250
1251        let system_metrics = profiler.collect_system_metrics().await;
1252        assert!(system_metrics.is_ok());
1253
1254        let metrics = system_metrics.unwrap();
1255        assert!(metrics.cpu_usage >= 0.0);
1256        assert!(metrics.thread_count > 0);
1257    }
1258
1259    #[tokio::test]
1260    async fn test_memory_metrics_collection() {
1261        let profiler = SystemProfiler::new(Duration::from_secs(1), 100);
1262
1263        let memory_metrics = profiler.collect_memory_metrics().await;
1264        assert!(memory_metrics.is_ok());
1265
1266        let metrics = memory_metrics.unwrap();
1267        // heap_used is unsigned, so always >= 0 - removing redundant check
1268        assert!(metrics.cache_hit_rate >= 0.0);
1269    }
1270
1271    #[tokio::test]
1272    async fn test_sample_management() {
1273        let profiler = SystemProfiler::new(Duration::from_secs(1), 2); // Max 2 samples
1274        let mut samples = profiler.samples.write().await;
1275
1276        // Add samples beyond capacity
1277        let metrics1 = PerformanceMetrics::default();
1278        let metrics2 = PerformanceMetrics::default();
1279        let metrics3 = PerformanceMetrics::default();
1280
1281        samples.push_back(metrics1);
1282        samples.push_back(metrics2);
1283        assert_eq!(samples.len(), 2);
1284
1285        // Adding third should remove first
1286        samples.push_back(metrics3);
1287        if samples.len() > 2 {
1288            samples.pop_front();
1289        }
1290        assert_eq!(samples.len(), 2);
1291    }
1292}
voirs_cli/performance/profiler.rs

voirs_cli/performance/
profiler.rs