oximedia_gpu/
memory.rs

1//! GPU memory management and allocation tracking
2//!
3//! This module provides memory allocation tracking, usage statistics,
4//! and memory pool management for GPU buffers.
5
6use crate::{GpuBuffer, GpuDevice, GpuError, Result};
7use parking_lot::RwLock;
8use std::collections::HashMap;
9use std::sync::atomic::{AtomicU64, Ordering};
10use std::sync::Arc;
11
12/// Memory allocation statistics
13#[derive(Debug, Clone, Copy, Default)]
14pub struct MemoryStats {
15    /// Total bytes allocated
16    pub total_allocated: u64,
17    /// Total bytes freed
18    pub total_freed: u64,
19    /// Current bytes in use
20    pub current_usage: u64,
21    /// Peak memory usage
22    pub peak_usage: u64,
23    /// Number of active allocations
24    pub allocation_count: u64,
25}
26
27impl MemoryStats {
28    /// Get the current memory usage in bytes
29    #[must_use]
30    pub fn current_bytes(&self) -> u64 {
31        self.current_usage
32    }
33
34    /// Get the current memory usage in megabytes
35    #[must_use]
36    pub fn current_mb(&self) -> f64 {
37        self.current_usage as f64 / (1024.0 * 1024.0)
38    }
39
40    /// Get the peak memory usage in bytes
41    #[must_use]
42    pub fn peak_bytes(&self) -> u64 {
43        self.peak_usage
44    }
45
46    /// Get the peak memory usage in megabytes
47    #[must_use]
48    pub fn peak_mb(&self) -> f64 {
49        self.peak_usage as f64 / (1024.0 * 1024.0)
50    }
51}
52
53/// Memory allocator for GPU buffers
54pub struct MemoryAllocator {
55    device: Arc<wgpu::Device>,
56    total_allocated: AtomicU64,
57    total_freed: AtomicU64,
58    current_usage: AtomicU64,
59    peak_usage: AtomicU64,
60    allocation_count: AtomicU64,
61}
62
63impl MemoryAllocator {
64    /// Create a new memory allocator
65    #[must_use]
66    pub fn new(device: &GpuDevice) -> Self {
67        Self {
68            device: Arc::clone(device.device()),
69            total_allocated: AtomicU64::new(0),
70            total_freed: AtomicU64::new(0),
71            current_usage: AtomicU64::new(0),
72            peak_usage: AtomicU64::new(0),
73            allocation_count: AtomicU64::new(0),
74        }
75    }
76
77    /// Track a memory allocation
78    pub fn track_allocation(&self, size: u64) {
79        self.total_allocated.fetch_add(size, Ordering::Relaxed);
80        let current = self.current_usage.fetch_add(size, Ordering::Relaxed) + size;
81        self.allocation_count.fetch_add(1, Ordering::Relaxed);
82
83        // Update peak usage
84        let mut peak = self.peak_usage.load(Ordering::Relaxed);
85        while current > peak {
86            match self.peak_usage.compare_exchange_weak(
87                peak,
88                current,
89                Ordering::Relaxed,
90                Ordering::Relaxed,
91            ) {
92                Ok(_) => break,
93                Err(x) => peak = x,
94            }
95        }
96    }
97
98    /// Track a memory deallocation
99    pub fn track_deallocation(&self, size: u64) {
100        self.total_freed.fetch_add(size, Ordering::Relaxed);
101        self.current_usage.fetch_sub(size, Ordering::Relaxed);
102        self.allocation_count.fetch_sub(1, Ordering::Relaxed);
103    }
104
105    /// Get current memory statistics
106    pub fn stats(&self) -> MemoryStats {
107        MemoryStats {
108            total_allocated: self.total_allocated.load(Ordering::Relaxed),
109            total_freed: self.total_freed.load(Ordering::Relaxed),
110            current_usage: self.current_usage.load(Ordering::Relaxed),
111            peak_usage: self.peak_usage.load(Ordering::Relaxed),
112            allocation_count: self.allocation_count.load(Ordering::Relaxed),
113        }
114    }
115
116    /// Reset statistics
117    pub fn reset_stats(&self) {
118        self.total_allocated.store(0, Ordering::Relaxed);
119        self.total_freed.store(0, Ordering::Relaxed);
120        self.current_usage.store(0, Ordering::Relaxed);
121        self.peak_usage.store(0, Ordering::Relaxed);
122        self.allocation_count.store(0, Ordering::Relaxed);
123    }
124
125    /// Get the device reference
126    pub fn device(&self) -> &Arc<wgpu::Device> {
127        &self.device
128    }
129}
130
131/// Memory pool for reusing GPU buffers
132pub struct MemoryPool {
133    #[allow(dead_code)]
134    device: Arc<wgpu::Device>,
135    allocator: Arc<MemoryAllocator>,
136    pools: RwLock<HashMap<u64, Vec<GpuBuffer>>>,
137}
138
139impl MemoryPool {
140    /// Create a new memory pool
141    #[must_use]
142    pub fn new(device: &GpuDevice) -> Self {
143        Self {
144            device: Arc::clone(device.device()),
145            allocator: Arc::new(MemoryAllocator::new(device)),
146            pools: RwLock::new(HashMap::new()),
147        }
148    }
149
150    /// Allocate a buffer from the pool
151    ///
152    /// If a buffer of the requested size is available in the pool, it will be reused.
153    /// Otherwise, a new buffer will be allocated.
154    ///
155    /// # Arguments
156    ///
157    /// * `device` - GPU device
158    /// * `size` - Buffer size in bytes
159    /// * `buffer_type` - Type of buffer to allocate
160    ///
161    /// # Errors
162    ///
163    /// Returns an error if buffer allocation fails.
164    pub fn allocate(
165        &self,
166        device: &GpuDevice,
167        size: u64,
168        buffer_type: crate::buffer::BufferType,
169    ) -> Result<GpuBuffer> {
170        // Try to reuse a buffer from the pool
171        {
172            let mut pools = self.pools.write();
173            if let Some(pool) = pools.get_mut(&size) {
174                if let Some(buffer) = pool.pop() {
175                    return Ok(buffer);
176                }
177            }
178        }
179
180        // Allocate a new buffer
181        let buffer = GpuBuffer::new(device, size, buffer_type)?;
182        self.allocator.track_allocation(size);
183
184        Ok(buffer)
185    }
186
187    /// Return a buffer to the pool for reuse
188    ///
189    /// # Arguments
190    ///
191    /// * `buffer` - Buffer to return to the pool
192    pub fn deallocate(&self, buffer: GpuBuffer) {
193        let size = buffer.size();
194        let mut pools = self.pools.write();
195        pools.entry(size).or_default().push(buffer);
196    }
197
198    /// Clear the memory pool
199    pub fn clear(&self) {
200        let mut pools = self.pools.write();
201        for (size, buffers) in pools.drain() {
202            let total_size = size * buffers.len() as u64;
203            self.allocator.track_deallocation(total_size);
204        }
205    }
206
207    /// Get the number of buffers in the pool
208    pub fn pool_size(&self) -> usize {
209        let pools = self.pools.read();
210        pools.values().map(std::vec::Vec::len).sum()
211    }
212
213    /// Get memory statistics
214    pub fn stats(&self) -> MemoryStats {
215        self.allocator.stats()
216    }
217
218    /// Get the allocator
219    pub fn allocator(&self) -> &Arc<MemoryAllocator> {
220        &self.allocator
221    }
222}
223
224/// RAII wrapper for automatic buffer deallocation
225pub struct ManagedBuffer {
226    buffer: Option<GpuBuffer>,
227    pool: Arc<MemoryPool>,
228}
229
230impl ManagedBuffer {
231    /// Create a new managed buffer
232    pub fn new(buffer: GpuBuffer, pool: Arc<MemoryPool>) -> Self {
233        Self {
234            buffer: Some(buffer),
235            pool,
236        }
237    }
238
239    /// Get a reference to the buffer.
240    ///
241    /// # Panics
242    ///
243    /// Panics if the buffer has already been released via [`ManagedBuffer::take`].
244    /// Under normal usage this cannot happen because `take()` consumes `self`.
245    #[must_use]
246    pub fn buffer(&self) -> &GpuBuffer {
247        self.buffer
248            .as_ref()
249            .unwrap_or_else(|| unreachable!("ManagedBuffer accessed after buffer was released"))
250    }
251
252    /// Fallible variant of [`ManagedBuffer::buffer`].
253    ///
254    /// # Errors
255    ///
256    /// Returns [`GpuError::Internal`] if the buffer has already been released.
257    pub fn try_buffer(&self) -> Result<&GpuBuffer> {
258        self.buffer
259            .as_ref()
260            .ok_or_else(|| GpuError::Internal("Buffer already released".to_string()))
261    }
262
263    /// Take ownership of the buffer, preventing automatic deallocation.
264    ///
265    /// # Errors
266    ///
267    /// Returns [`GpuError::Internal`] if the buffer has already been released.
268    pub fn take(mut self) -> Result<GpuBuffer> {
269        self.buffer
270            .take()
271            .ok_or_else(|| GpuError::Internal("Buffer already released".to_string()))
272    }
273}
274
275impl Drop for ManagedBuffer {
276    fn drop(&mut self) {
277        if let Some(buffer) = self.buffer.take() {
278            self.pool.deallocate(buffer);
279        }
280    }
281}
282
283impl std::ops::Deref for ManagedBuffer {
284    type Target = GpuBuffer;
285
286    fn deref(&self) -> &Self::Target {
287        self.buffer()
288    }
289}
290
291#[cfg(test)]
292mod tests {
293    use super::*;
294
295    #[test]
296    fn test_memory_stats() {
297        let stats = MemoryStats {
298            total_allocated: 1024 * 1024 * 100, // 100 MB
299            total_freed: 1024 * 1024 * 20,      // 20 MB
300            current_usage: 1024 * 1024 * 80,    // 80 MB
301            peak_usage: 1024 * 1024 * 90,       // 90 MB
302            allocation_count: 10,
303        };
304
305        assert_eq!(stats.current_bytes(), 1024 * 1024 * 80);
306        assert!((stats.current_mb() - 80.0).abs() < 0.01);
307        assert_eq!(stats.peak_bytes(), 1024 * 1024 * 90);
308        assert!((stats.peak_mb() - 90.0).abs() < 0.01);
309    }
310
311    #[test]
312    #[ignore] // Requires GPU hardware; run with --ignored
313    fn test_memory_allocator_tracking() {
314        let Ok(gpu_device) = crate::device::GpuDevice::new(None) else {
315            return;
316        };
317        let allocator = MemoryAllocator::new(&gpu_device);
318
319        allocator.track_allocation(1024);
320        allocator.track_allocation(2048);
321
322        let stats = allocator.stats();
323        assert_eq!(stats.total_allocated, 3072);
324        assert_eq!(stats.current_usage, 3072);
325        assert_eq!(stats.allocation_count, 2);
326
327        allocator.track_deallocation(1024);
328
329        let stats = allocator.stats();
330        assert_eq!(stats.total_freed, 1024);
331        assert_eq!(stats.current_usage, 2048);
332        assert_eq!(stats.allocation_count, 1);
333    }
334
335    #[test]
336    fn test_memory_allocator_tracking_no_gpu() {
337        // Test tracking logic without GPU initialization using atomic counters directly.
338        let total_allocated = AtomicU64::new(0);
339        let total_freed = AtomicU64::new(0);
340        let current_usage = AtomicU64::new(0);
341        let allocation_count = AtomicU64::new(0);
342
343        // Simulate track_allocation(1024)
344        total_allocated.fetch_add(1024, Ordering::Relaxed);
345        current_usage.fetch_add(1024, Ordering::Relaxed);
346        allocation_count.fetch_add(1, Ordering::Relaxed);
347
348        // Simulate track_allocation(2048)
349        total_allocated.fetch_add(2048, Ordering::Relaxed);
350        current_usage.fetch_add(2048, Ordering::Relaxed);
351        allocation_count.fetch_add(1, Ordering::Relaxed);
352
353        assert_eq!(total_allocated.load(Ordering::Relaxed), 3072);
354        assert_eq!(current_usage.load(Ordering::Relaxed), 3072);
355        assert_eq!(allocation_count.load(Ordering::Relaxed), 2);
356
357        // Simulate track_deallocation(1024)
358        total_freed.fetch_add(1024, Ordering::Relaxed);
359        current_usage.fetch_sub(1024, Ordering::Relaxed);
360        allocation_count.fetch_sub(1, Ordering::Relaxed);
361
362        assert_eq!(total_freed.load(Ordering::Relaxed), 1024);
363        assert_eq!(current_usage.load(Ordering::Relaxed), 2048);
364        assert_eq!(allocation_count.load(Ordering::Relaxed), 1);
365    }
366}
oximedia_gpu/memory.rs

oximedia_gpu/
memory.rs