dag/nameset/
lazy.rs

1/*
2 * Copyright (c) Meta Platforms, Inc. and affiliates.
3 *
4 * This source code is licensed under the MIT license found in the
5 * LICENSE file in the root directory of this source tree.
6 */
7
8use std::any::Any;
9use std::fmt;
10use std::sync::Arc;
11
12use futures::lock::Mutex;
13use futures::lock::MutexGuard;
14use futures::StreamExt;
15use indexmap::IndexSet;
16
17use super::AsyncNameSetQuery;
18use super::BoxVertexStream;
19use super::Hints;
20use crate::Result;
21use crate::VertexName;
22
23/// A set backed by a lazy iterator of names.
24pub struct LazySet {
25    inner: Arc<Mutex<Inner>>,
26    hints: Hints,
27}
28
29struct Inner {
30    iter: BoxVertexStream,
31    visited: IndexSet<VertexName>,
32    state: State,
33}
34
35impl Inner {
36    async fn load_more(&mut self, n: usize, mut out: Option<&mut Vec<VertexName>>) -> Result<()> {
37        if matches!(self.state, State::Complete | State::Error) {
38            return Ok(());
39        }
40        for _ in 0..n {
41            match self.iter.next().await {
42                Some(Ok(name)) => {
43                    if let Some(ref mut out) = out {
44                        out.push(name.clone());
45                    }
46                    self.visited.insert(name);
47                }
48                None => {
49                    self.state = State::Complete;
50                    break;
51                }
52                Some(Err(err)) => {
53                    self.state = State::Error;
54                    return Err(err);
55                }
56            }
57        }
58        Ok(())
59    }
60}
61
/// Progress of the source stream of a `LazySet`.
#[derive(Copy, Clone, Debug, PartialEq)]
enum State {
    /// The stream has not reported its end yet; more names may follow.
    Incomplete,
    /// The stream returned `None`; `visited` holds every name.
    Complete,
    /// The stream yielded an error; it is not polled again afterwards.
    Error,
}
68
69pub struct Iter {
70    inner: Arc<Mutex<Inner>>,
71    index: usize,
72}
73
74impl Iter {
75    async fn next(&mut self) -> Option<Result<VertexName>> {
76        loop {
77            let mut inner = self.inner.lock().await;
78            match inner.state {
79                State::Error => break None,
80                State::Complete if inner.visited.len() <= self.index => break None,
81                State::Complete | State::Incomplete => {
82                    let value = inner.visited.get_index(self.index).cloned();
83                    match value {
84                        Some(value) => {
85                            self.index += 1;
86                            break Some(Ok(value));
87                        }
88                        None => {
89                            // Data not available. Load more.
90                            if let Err(err) = inner.load_more(1, None).await {
91                                return Some(Err(err));
92                            }
93                            continue;
94                        }
95                    }
96                }
97            }
98        }
99    }
100
101    fn into_stream(self) -> BoxVertexStream {
102        Box::pin(futures::stream::unfold(self, |mut state| async move {
103            let result = state.next().await;
104            result.map(|r| (r, state))
105        }))
106    }
107}
108
109impl fmt::Debug for LazySet {
110    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
111        f.write_str("<lazy ")?;
112        if let Some(inner) = self.inner.try_lock() {
113            let limit = f.width().unwrap_or(3);
114            f.debug_list()
115                .entries(inner.visited.iter().take(limit))
116                .finish()?;
117            let remaining = inner.visited.len().max(limit) - limit;
118            match (remaining, inner.state) {
119                (0, State::Incomplete) => f.write_str(" + ? more")?,
120                (n, State::Incomplete) => write!(f, "+ {} + ? more", n)?,
121                (0, _) => {}
122                (n, _) => write!(f, " + {} more", n)?,
123            }
124        } else {
125            f.write_str(" ?")?;
126        }
127        f.write_str(">")?;
128        Ok(())
129    }
130}
131
132impl LazySet {
133    pub fn from_iter<I>(names: I, hints: Hints) -> Self
134    where
135        I: IntoIterator<Item = Result<VertexName>> + 'static,
136        <I as IntoIterator>::IntoIter: Send + Sync,
137    {
138        let stream = futures::stream::iter(names);
139        Self::from_stream(Box::pin(stream), hints)
140    }
141
142    pub fn from_stream(names: BoxVertexStream, hints: Hints) -> Self {
143        let inner = Inner {
144            iter: names,
145            visited: IndexSet::new(),
146            state: State::Incomplete,
147        };
148        Self {
149            inner: Arc::new(Mutex::new(inner)),
150            hints,
151        }
152    }
153
154    async fn load_all(&self) -> Result<MutexGuard<'_, Inner>> {
155        let mut inner = self.inner.lock().await;
156        inner.load_more(usize::max_value(), None).await?;
157        Ok(inner)
158    }
159}
160
161#[async_trait::async_trait]
162impl AsyncNameSetQuery for LazySet {
163    async fn iter(&self) -> Result<BoxVertexStream> {
164        let inner = self.inner.clone();
165        let iter = Iter { inner, index: 0 };
166        Ok(iter.into_stream())
167    }
168
169    async fn iter_rev(&self) -> Result<BoxVertexStream> {
170        let inner = self.load_all().await?;
171        let iter = inner.visited.clone().into_iter().rev().map(Ok);
172        let stream = futures::stream::iter(iter);
173        Ok(Box::pin(stream))
174    }
175
176    async fn count(&self) -> Result<usize> {
177        let inner = self.load_all().await?;
178        Ok(inner.visited.len())
179    }
180
181    async fn last(&self) -> Result<Option<VertexName>> {
182        let inner = self.load_all().await?;
183        Ok(inner.visited.iter().rev().nth(0).cloned())
184    }
185
186    async fn contains(&self, name: &VertexName) -> Result<bool> {
187        let mut inner = self.inner.lock().await;
188        if inner.visited.contains(name) {
189            return Ok(true);
190        } else {
191            let mut loaded = Vec::new();
192            loop {
193                loaded.clear();
194                inner.load_more(1, Some(&mut loaded)).await?;
195                debug_assert!(loaded.len() <= 1);
196                if loaded.is_empty() {
197                    break;
198                }
199                if loaded.first() == Some(name) {
200                    return Ok(true);
201                }
202            }
203        }
204        Ok(false)
205    }
206
207    async fn contains_fast(&self, name: &VertexName) -> Result<Option<bool>> {
208        let inner = self.inner.lock().await;
209        if inner.visited.contains(name) {
210            return Ok(Some(true));
211        } else if inner.state != State::Incomplete {
212            return Ok(Some(false));
213        }
214        Ok(None)
215    }
216
217    fn as_any(&self) -> &dyn Any {
218        self
219    }
220
221    fn hints(&self) -> &Hints {
222        &self.hints
223    }
224}
225
#[cfg(test)]
mod tests {
    use std::collections::HashSet;

    use super::super::tests::*;
    use super::*;

    /// Build a `LazySet` whose source yields one name per input byte,
    /// in input order (duplicates included).
    fn lazy_set(a: &[u8]) -> LazySet {
        let names = a.to_vec().into_iter().map(|b| Ok(to_name(b)));
        LazySet::from_iter(names, Hints::default())
    }

    #[test]
    fn test_lazy_basic() -> Result<()> {
        // The input contains duplicates (0x22 and 0x11 appear twice).
        let set = lazy_set(b"\x11\x33\x22\x77\x22\x55\x11");
        check_invariants(&set)?;

        // Forward iteration keeps first-seen order and drops duplicates.
        assert_eq!(shorten_iter(ni(set.iter())), ["11", "33", "22", "77", "55"]);
        assert_eq!(
            shorten_iter(ni(set.iter_rev())),
            ["55", "77", "22", "33", "11"]
        );

        assert!(!nb(set.is_empty())?);
        assert_eq!(nb(set.count())?, 5);
        assert_eq!(shorten_name(nb(set.first())?.unwrap()), "11");
        assert_eq!(shorten_name(nb(set.last())?.unwrap()), "55");
        Ok(())
    }

    #[test]
    fn test_debug() {
        // Empty source: unknown until something forces a full load.
        let set = lazy_set(b"");
        assert_eq!(format!("{:?}", &set), "<lazy [] + ? more>");
        nb(set.count()).unwrap();
        assert_eq!(format!("{:?}", &set), "<lazy []>");

        // Each `next()` below loads one more name into the shared state,
        // which the Debug output reflects.
        let set = lazy_set(b"\x11\x33\x22");
        assert_eq!(format!("{:?}", &set), "<lazy [] + ? more>");
        let mut iter = ni(set.iter()).unwrap();
        iter.next();
        assert_eq!(format!("{:?}", &set), "<lazy [1111] + ? more>");
        iter.next();
        assert_eq!(format!("{:?}", &set), "<lazy [1111, 3333] + ? more>");
        iter.next();
        // Width 2 limits the listing to two names.
        assert_eq!(format!("{:2.2?}", &set), "<lazy [11, 33]+ 1 + ? more>");
        // This call reaches the end of the source, so "? more" disappears.
        iter.next();
        assert_eq!(format!("{:1.3?}", &set), "<lazy [111] + 2 more>");
    }

    quickcheck::quickcheck! {
        fn test_lazy_quickcheck(a: Vec<u8>) -> bool {
            let set = lazy_set(&a);
            check_invariants(&set).unwrap();

            let count = nb(set.count()).unwrap();
            assert!(count <= a.len());

            // The set must hold exactly the distinct input bytes.
            let unique: HashSet<u8> = a.iter().copied().collect();
            assert_eq!(count, unique.len());

            true
        }
    }
}