scouter_events/queue/spc/
feature_queue.rs

1use crate::error::FeatureQueueError;
2use crate::queue::traits::FeatureQueue;
3use core::result::Result::Ok;
4use ndarray::prelude::*;
5use ndarray::Array2;
6use scouter_drift::spc::monitor::SpcMonitor;
7use scouter_types::spc::SpcDriftProfile;
8use scouter_types::QueueExt;
9use scouter_types::{Feature, ServerRecords};
10use std::collections::HashMap;
11use tracing::instrument;
12use tracing::{debug, error};
13
14pub struct SpcFeatureQueue {
15    pub drift_profile: SpcDriftProfile,
16    pub empty_queue: HashMap<String, Vec<f64>>,
17    pub monitor: SpcMonitor,
18    pub feature_names: Vec<String>,
19}
20
21impl SpcFeatureQueue {
22    #[instrument(skip(drift_profile))]
23    pub fn new(drift_profile: SpcDriftProfile) -> Self {
24        let empty_queue: HashMap<String, Vec<f64>> = drift_profile
25            .config
26            .alert_config
27            .features_to_monitor
28            .iter()
29            .map(|feature| (feature.clone(), Vec::new()))
30            .collect();
31
32        let feature_names = empty_queue.keys().cloned().collect();
33
34        SpcFeatureQueue {
35            drift_profile,
36            empty_queue,
37            monitor: SpcMonitor::new(),
38            feature_names,
39        }
40    }
41
42    #[instrument(skip(self, features), name = "insert_spc")]
43    pub fn insert(
44        &self,
45        features: &[Feature],
46        queue: &mut HashMap<String, Vec<f64>>,
47    ) -> Result<(), FeatureQueueError> {
48        let feat_map = &self.drift_profile.config.feature_map;
49
50        debug!("Inserting features into queue");
51        features.iter().for_each(|feature| {
52            let name = feature.name().to_string();
53
54            if self.feature_names.contains(&name) {
55                if let Some(queue) = queue.get_mut(&name) {
56                    if let Ok(value) = feature.to_float(feat_map) {
57                        queue.push(value);
58                    }
59                }
60            } else {
61                error!("Feature {} not found in drift profile", name);
62            }
63        });
64
65        Ok(())
66    }
67
68    // Create drift records from queue items
69    //
70    // returns: DriftServerRecords
71    #[instrument(skip(self), name = "Create Server Records")]
72    pub fn create_drift_records(
73        &self,
74        queue: HashMap<String, Vec<f64>>,
75    ) -> Result<ServerRecords, FeatureQueueError> {
76        // filter out empty queues
77        let (arrays, feature_names): (Vec<_>, Vec<_>) = queue
78            .iter()
79            .filter(|(_, values)| !values.is_empty())
80            .map(|(feature, values)| {
81                (
82                    Array2::from_shape_vec((values.len(), 1), values.clone()).unwrap(),
83                    feature.clone(),
84                )
85            })
86            .unzip();
87        let n = arrays[0].dim().0;
88        if arrays.iter().any(|array| array.dim().0 != n) {
89            error!("Shape mismatch");
90            return Err(FeatureQueueError::DriftRecordError(
91                "Shape mismatch".to_string(),
92            ));
93        }
94
95        let concatenated = ndarray::concatenate(
96            Axis(1),
97            &arrays.iter().map(|a| a.view()).collect::<Vec<_>>(),
98        )
99        .map_err(|e| {
100            error!("Failed to concatenate arrays: {:?}", e);
101            FeatureQueueError::DriftRecordError(format!("Failed to concatenate arrays: {e:?}"))
102        })?;
103
104        let records = self
105            .monitor
106            .sample_data(&feature_names, &concatenated.view(), &self.drift_profile)
107            .map_err(|e| {
108                error!("Failed to create drift record: {:?}", e);
109                FeatureQueueError::DriftRecordError(format!("Failed to create drift record: {e:?}"))
110            })?;
111
112        Ok(records)
113    }
114}
115
116impl FeatureQueue for SpcFeatureQueue {
117    fn create_drift_records_from_batch<T: QueueExt>(
118        &self,
119        batch: Vec<T>,
120    ) -> Result<ServerRecords, FeatureQueueError> {
121        // clones the empty map (so we don't need to recreate it on each call)
122        let mut queue = self.empty_queue.clone();
123
124        for elem in batch {
125            self.insert(elem.features(), &mut queue)?;
126        }
127
128        self.create_drift_records(queue)
129    }
130}
131
#[cfg(test)]
mod tests {
    use super::*;
    use ndarray::Array;
    use ndarray_rand::rand_distr::Uniform;
    use ndarray_rand::RandomExt;
    use scouter_types::spc::{SpcAlertConfig, SpcDriftConfig};
    use scouter_types::Features;

    /// Builds a queue from a three-feature profile, inserts nine records and
    /// checks the resulting drift records survive a JSON and a bytes
    /// round trip.
    #[test]
    fn test_feature_queue_new() {
        let training_data = Array::random((1030, 3), Uniform::new(0., 10.));

        let feature_names: Vec<String> = ["feature_1", "feature_2", "feature_3"]
            .iter()
            .map(|name| name.to_string())
            .collect();

        let monitor = SpcMonitor::new();
        let alert_config = SpcAlertConfig {
            features_to_monitor: feature_names.clone(),
            ..Default::default()
        };
        let config = SpcDriftConfig::new(
            Some("name".to_string()),
            Some("repo".to_string()),
            None,
            None,
            None,
            Some(alert_config),
            None,
        )
        .unwrap();

        let profile = monitor
            .create_2d_drift_profile(&feature_names, &training_data.view(), &config)
            .unwrap();
        assert_eq!(profile.features.len(), 3);

        let feature_queue = SpcFeatureQueue::new(profile);
        assert_eq!(feature_queue.empty_queue.len(), 3);

        // Nine identical records, each carrying one value per feature.
        let batch_features: Vec<Features> = (0..9)
            .map(|_| Features {
                features: vec![
                    Feature::int("feature_1".to_string(), 1),
                    Feature::int("feature_2".to_string(), 2),
                    Feature::int("feature_3".to_string(), 3),
                ],
                entity_type: scouter_types::EntityType::Feature,
            })
            .collect();

        let mut queue = feature_queue.empty_queue.clone();
        for entry in &batch_features {
            feature_queue.insert(&entry.features, &mut queue).unwrap();
        }

        // Every monitored feature must have received all nine values.
        for name in &feature_names {
            assert_eq!(queue.get(name).unwrap().len(), 9);
        }

        let records = feature_queue
            .create_drift_records_from_batch(batch_features)
            .unwrap();
        assert_eq!(records.records.len(), 3);

        // serialize records
        let json_records = records.model_dump_json();
        assert!(!json_records.is_empty());

        // deserialize records
        let parsed: ServerRecords = serde_json::from_str(&json_records).unwrap();
        assert_eq!(parsed.records.len(), 3);

        // convert to bytes and back
        let reloaded = ServerRecords::load_from_bytes(json_records.as_bytes()).unwrap();
        assert_eq!(reloaded.records.len(), 3);
    }
}