// ruvector_core/cache_optimized.rs

use std::alloc::{alloc, dealloc, Layout};
use std::ptr;

/// Allocation alignment target: one CPU cache line on common x86/ARM parts.
const CACHE_LINE_SIZE: usize = 64;
/// Structure-of-Arrays (SoA) storage for fixed-dimension f32 vectors,
/// aligned to a cache line.
///
/// Component `d` of vector `i` lives at `data[d * capacity + i]`, so all
/// values of one dimension are contiguous and can be streamed sequentially
/// (see `dimension_slice` / `batch_euclidean_distances`).
#[repr(align(64))]
pub struct SoAVectorStorage {
    // Number of vectors currently stored (valid columns per dimension row).
    count: usize,
    // Number of f32 components per vector; fixed at construction.
    dimensions: usize,
    // Allocated vector slots per dimension row; kept a power of two
    // (`new` rounds up, `grow` doubles).
    capacity: usize,
    // Raw 64-byte-aligned buffer of `dimensions * capacity` f32s,
    // allocated/freed manually via `std::alloc`.
    data: *mut f32,
}
28
impl SoAVectorStorage {
    /// Upper bound on per-vector dimensionality.
    const MAX_DIMENSIONS: usize = 65536;
    /// Upper bound on requested capacity (16M slots). A power of two, so the
    /// `next_power_of_two` rounding below can never push past it.
    const MAX_CAPACITY: usize = 1 << 24;

    /// Creates storage for `dimensions`-component vectors with room for at
    /// least `initial_capacity` vectors (rounded up to a power of two).
    /// The buffer is zero-initialized and cache-line aligned.
    ///
    /// # Panics
    /// Panics if `dimensions` is 0 or exceeds `MAX_DIMENSIONS`, if
    /// `initial_capacity` exceeds `MAX_CAPACITY`, or if the element count /
    /// byte size overflows `usize`. Diverges via `handle_alloc_error` when
    /// the allocation itself fails.
    pub fn new(dimensions: usize, initial_capacity: usize) -> Self {
        assert!(
            dimensions > 0 && dimensions <= Self::MAX_DIMENSIONS,
            "dimensions must be between 1 and {}",
            Self::MAX_DIMENSIONS
        );
        assert!(
            initial_capacity <= Self::MAX_CAPACITY,
            "initial_capacity exceeds maximum of {}",
            Self::MAX_CAPACITY
        );

        // 0 rounds up to 1, so the layout below is never zero-sized.
        let capacity = initial_capacity.next_power_of_two();

        let total_elements = dimensions
            .checked_mul(capacity)
            .expect("dimensions * capacity overflow");
        let total_bytes = total_elements
            .checked_mul(std::mem::size_of::<f32>())
            .expect("total size overflow");

        let layout =
            Layout::from_size_align(total_bytes, CACHE_LINE_SIZE).expect("invalid memory layout");

        // SAFETY: `layout` has non-zero size and a power-of-two alignment.
        let data = unsafe { alloc(layout) as *mut f32 };
        // BUG FIX: the original wrote through `data` unconditionally; a
        // failed allocation returns null and the write would be UB.
        if data.is_null() {
            std::alloc::handle_alloc_error(layout);
        }

        // SAFETY: `data` is non-null and owns `total_elements` f32 slots.
        unsafe {
            ptr::write_bytes(data, 0, total_elements);
        }

        Self {
            count: 0,
            dimensions,
            capacity,
            data,
        }
    }
79
80 pub fn push(&mut self, vector: &[f32]) {
82 assert_eq!(vector.len(), self.dimensions);
83
84 if self.count >= self.capacity {
85 self.grow();
86 }
87
88 for (dim_idx, &value) in vector.iter().enumerate() {
90 let offset = dim_idx * self.capacity + self.count;
91 unsafe {
92 *self.data.add(offset) = value;
93 }
94 }
95
96 self.count += 1;
97 }
98
99 pub fn get(&self, index: usize, output: &mut [f32]) {
101 assert!(index < self.count);
102 assert_eq!(output.len(), self.dimensions);
103
104 for dim_idx in 0..self.dimensions {
105 let offset = dim_idx * self.capacity + index;
106 output[dim_idx] = unsafe { *self.data.add(offset) };
107 }
108 }
109
110 pub fn dimension_slice(&self, dim_idx: usize) -> &[f32] {
113 assert!(dim_idx < self.dimensions);
114 let offset = dim_idx * self.capacity;
115 unsafe { std::slice::from_raw_parts(self.data.add(offset), self.count) }
116 }
117
118 pub fn dimension_slice_mut(&mut self, dim_idx: usize) -> &mut [f32] {
120 assert!(dim_idx < self.dimensions);
121 let offset = dim_idx * self.capacity;
122 unsafe { std::slice::from_raw_parts_mut(self.data.add(offset), self.count) }
123 }
124
    /// Number of vectors currently stored.
    pub fn len(&self) -> usize {
        self.count
    }

    /// Returns `true` when no vectors are stored.
    pub fn is_empty(&self) -> bool {
        self.count == 0
    }

    /// Number of f32 components per vector (fixed at construction).
    pub fn dimensions(&self) -> usize {
        self.dimensions
    }
139
140 fn grow(&mut self) {
142 let new_capacity = self.capacity * 2;
143 let new_total_elements = self.dimensions * new_capacity;
144
145 let new_layout = Layout::from_size_align(
146 new_total_elements * std::mem::size_of::<f32>(),
147 CACHE_LINE_SIZE,
148 )
149 .unwrap();
150
151 let new_data = unsafe { alloc(new_layout) as *mut f32 };
152
153 for dim_idx in 0..self.dimensions {
155 let old_offset = dim_idx * self.capacity;
156 let new_offset = dim_idx * new_capacity;
157
158 unsafe {
159 ptr::copy_nonoverlapping(
160 self.data.add(old_offset),
161 new_data.add(new_offset),
162 self.count,
163 );
164 }
165 }
166
167 let old_layout = Layout::from_size_align(
169 self.dimensions * self.capacity * std::mem::size_of::<f32>(),
170 CACHE_LINE_SIZE,
171 )
172 .unwrap();
173
174 unsafe {
175 dealloc(self.data as *mut u8, old_layout);
176 }
177
178 self.data = new_data;
179 self.capacity = new_capacity;
180 }
181
182 pub fn batch_euclidean_distances(&self, query: &[f32], output: &mut [f32]) {
185 assert_eq!(query.len(), self.dimensions);
186 assert_eq!(output.len(), self.count);
187
188 output.fill(0.0);
190
191 for dim_idx in 0..self.dimensions {
193 let dim_slice = self.dimension_slice(dim_idx);
194 let query_val = query[dim_idx];
195
196 for vec_idx in 0..self.count {
198 let diff = dim_slice[vec_idx] - query_val;
199 output[vec_idx] += diff * diff;
200 }
201 }
202
203 for distance in output.iter_mut() {
205 *distance = distance.sqrt();
206 }
207 }
208}
209
impl Drop for SoAVectorStorage {
    fn drop(&mut self) {
        // Reconstruct the layout the buffer was allocated with. `grow`
        // updates `capacity` together with `data`, so this size/alignment
        // always matches the live allocation.
        let layout = Layout::from_size_align(
            self.dimensions * self.capacity * std::mem::size_of::<f32>(),
            CACHE_LINE_SIZE,
        )
        .unwrap();

        // SAFETY: `self.data` was obtained from `alloc` with this exact
        // layout and is freed nowhere else.
        unsafe {
            dealloc(self.data as *mut u8, layout);
        }
    }
}
223
// SAFETY: the struct exclusively owns its heap buffer through `data`; no
// other aliasing handle to the allocation exists, and all mutation requires
// `&mut self`, so transferring ownership (Send) or sharing `&self` (Sync)
// across threads cannot race. NOTE(review): this relies on no method leaking
// the raw pointer — holds for the code visible here.
unsafe impl Send for SoAVectorStorage {}
unsafe impl Sync for SoAVectorStorage {}
226
#[cfg(test)]
mod tests {
    use super::*;

    /// Round-trips vectors through `push` / `get`.
    #[test]
    fn test_soa_storage() {
        let mut storage = SoAVectorStorage::new(3, 4);
        let rows = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0]];
        for row in &rows {
            storage.push(row);
        }

        assert_eq!(storage.len(), 2);

        let mut fetched = vec![0.0; 3];
        for (idx, row) in rows.iter().enumerate() {
            storage.get(idx, &mut fetched);
            assert_eq!(fetched.as_slice(), &row[..]);
        }
    }

    /// Verifies the SoA layout: a dimension slice holds that component of
    /// every stored vector, in insertion order.
    #[test]
    fn test_dimension_slice() {
        let mut storage = SoAVectorStorage::new(3, 4);
        for row in &[[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]] {
            storage.push(row);
        }

        assert_eq!(storage.dimension_slice(0), &[1.0, 4.0, 7.0]);
        assert_eq!(storage.dimension_slice(1), &[2.0, 5.0, 8.0]);
    }

    /// Distances from the x-axis basis vector to the three basis vectors:
    /// 0 to itself, sqrt(2) ≈ 1.414 to the other two.
    #[test]
    fn test_batch_distances() {
        let mut storage = SoAVectorStorage::new(3, 4);
        for basis in &[[1.0, 0.0, 0.0], [0.0, 1.0, 0.0], [0.0, 0.0, 1.0]] {
            storage.push(basis);
        }

        let mut distances = vec![0.0; 3];
        storage.batch_euclidean_distances(&[1.0, 0.0, 0.0], &mut distances);

        assert!((distances[0] - 0.0).abs() < 0.001);
        assert!((distances[1] - 1.414).abs() < 0.01);
        assert!((distances[2] - 1.414).abs() < 0.01);
    }
}