scouter_events/queue/spc/
feature_queue.rs

1use crate::error::FeatureQueueError;
2use crate::queue::traits::FeatureQueue;
3use core::result::Result::Ok;
4use ndarray::prelude::*;
5use ndarray::Array2;
6use scouter_drift::spc::monitor::SpcMonitor;
7use scouter_types::spc::SpcDriftProfile;
8use scouter_types::QueueExt;
9use scouter_types::{Feature, ServerRecords};
10use std::collections::HashMap;
11use tracing::instrument;
12use tracing::{debug, error};
13
14pub struct SpcFeatureQueue {
15    pub drift_profile: SpcDriftProfile,
16    pub empty_queue: HashMap<String, Vec<f64>>,
17    pub monitor: SpcMonitor,
18    pub feature_names: Vec<String>,
19}
20
21impl SpcFeatureQueue {
22    #[instrument(skip(drift_profile))]
23    pub fn new(drift_profile: SpcDriftProfile) -> Self {
24        let empty_queue: HashMap<String, Vec<f64>> = drift_profile
25            .config
26            .alert_config
27            .features_to_monitor
28            .iter()
29            .map(|feature| (feature.clone(), Vec::new()))
30            .collect();
31
32        let feature_names = empty_queue.keys().cloned().collect();
33
34        SpcFeatureQueue {
35            drift_profile,
36            empty_queue,
37            monitor: SpcMonitor::new(),
38            feature_names,
39        }
40    }
41
42    #[instrument(skip(self, features), name = "insert_spc")]
43    pub fn insert(
44        &self,
45        features: &[Feature],
46        queue: &mut HashMap<String, Vec<f64>>,
47    ) -> Result<(), FeatureQueueError> {
48        let feat_map = &self.drift_profile.config.feature_map;
49
50        debug!("Inserting features into queue");
51        features.iter().for_each(|feature| {
52            let name = feature.name().to_string();
53
54            if self.feature_names.contains(&name) {
55                if let Some(queue) = queue.get_mut(&name) {
56                    if let Ok(value) = feature.to_float(feat_map) {
57                        queue.push(value);
58                    }
59                }
60            }
61        });
62
63        Ok(())
64    }
65
66    // Create drift records from queue items
67    //
68    // returns: DriftServerRecords
69    #[instrument(skip(self), name = "Create Server Records")]
70    pub fn create_drift_records(
71        &self,
72        queue: HashMap<String, Vec<f64>>,
73    ) -> Result<ServerRecords, FeatureQueueError> {
74        // filter out empty queues
75        let (arrays, feature_names): (Vec<_>, Vec<_>) = queue
76            .iter()
77            .filter(|(_, values)| !values.is_empty())
78            .map(|(feature, values)| {
79                (
80                    Array2::from_shape_vec((values.len(), 1), values.clone()).unwrap(),
81                    feature.clone(),
82                )
83            })
84            .unzip();
85        let n = arrays[0].dim().0;
86        if arrays.iter().any(|array| array.dim().0 != n) {
87            error!("Shape mismatch");
88            return Err(FeatureQueueError::DriftRecordError(
89                "Shape mismatch".to_string(),
90            ));
91        }
92
93        let concatenated = ndarray::concatenate(
94            Axis(1),
95            &arrays.iter().map(|a| a.view()).collect::<Vec<_>>(),
96        )
97        .map_err(|e| {
98            error!("Failed to concatenate arrays: {:?}", e);
99            FeatureQueueError::DriftRecordError(format!("Failed to concatenate arrays: {:?}", e))
100        })?;
101
102        let records = self
103            .monitor
104            .sample_data(&feature_names, &concatenated.view(), &self.drift_profile)
105            .map_err(|e| {
106                error!("Failed to create drift record: {:?}", e);
107                FeatureQueueError::DriftRecordError(format!(
108                    "Failed to create drift record: {:?}",
109                    e
110                ))
111            })?;
112
113        Ok(records)
114    }
115}
116
117impl FeatureQueue for SpcFeatureQueue {
118    fn create_drift_records_from_batch<T: QueueExt>(
119        &self,
120        batch: Vec<T>,
121    ) -> Result<ServerRecords, FeatureQueueError> {
122        // clones the empty map (so we don't need to recreate it on each call)
123        let mut queue = self.empty_queue.clone();
124
125        for elem in batch {
126            self.insert(elem.features(), &mut queue)?;
127        }
128
129        self.create_drift_records(queue)
130    }
131}
132
#[cfg(test)]
mod tests {
    use super::*;

    use ndarray::Array;
    use ndarray_rand::rand_distr::Uniform;
    use ndarray_rand::RandomExt;
    use scouter_types::spc::{SpcAlertConfig, SpcDriftConfig};
    use scouter_types::Features;

    /// Builds a queue from a three-feature profile, inserts nine feature sets,
    /// and checks the queue contents, the generated records, and that the
    /// records survive a JSON and a bytes round trip.
    #[test]
    fn test_feature_queue_new() {
        let training_data = Array::random((1030, 3), Uniform::new(0., 10.));

        let feature_names: Vec<String> = ["feature_1", "feature_2", "feature_3"]
            .iter()
            .map(|name| name.to_string())
            .collect();

        let alert_config = SpcAlertConfig {
            features_to_monitor: feature_names.clone(),
            ..Default::default()
        };
        let drift_config = SpcDriftConfig::new(
            Some("name".to_string()),
            Some("repo".to_string()),
            None,
            None,
            None,
            Some(alert_config),
            None,
        )
        .unwrap();

        let profile = SpcMonitor::new()
            .create_2d_drift_profile(&feature_names, &training_data.view(), &drift_config)
            .unwrap();
        assert_eq!(profile.features.len(), 3);

        let feature_queue = SpcFeatureQueue::new(profile);
        assert_eq!(feature_queue.empty_queue.len(), 3);

        // Nine identical feature sets, each carrying all three features.
        let batch: Vec<Features> = (0..9)
            .map(|_| Features {
                features: vec![
                    Feature::int("feature_1".to_string(), 1),
                    Feature::int("feature_2".to_string(), 2),
                    Feature::int("feature_3".to_string(), 3),
                ],
                entity_type: scouter_types::EntityType::Feature,
            })
            .collect();

        let mut queue = feature_queue.empty_queue.clone();
        for item in &batch {
            feature_queue.insert(&item.features, &mut queue).unwrap();
        }

        for name in &feature_names {
            assert_eq!(queue.get(name).unwrap().len(), 9);
        }

        let records = feature_queue
            .create_drift_records_from_batch(batch)
            .unwrap();
        assert_eq!(records.records.len(), 3);

        // serialize records
        let json_records = records.model_dump_json();
        assert!(!json_records.is_empty());

        // deserialize records
        let decoded: ServerRecords = serde_json::from_str(&json_records).unwrap();
        assert_eq!(decoded.records.len(), 3);

        // convert to bytes and back
        let reloaded = ServerRecords::load_from_bytes(json_records.as_bytes()).unwrap();
        assert_eq!(reloaded.records.len(), 3);
    }
}
221}