guided_digraph 0.1.1

A data structure for incremental live and dead state detection in an abstract transition system
Documentation
/*
    A directed graph implementation that is used by the different
    implementations of the state graph interface.

    Supports:
    - Adding vertices with names of type V, labeled by type T
    - Adding edges either in forward or backward direction.
      Although the forward and backward may correspond in some implementations,
      for some of the algorithms we want to support (Jump and BFGT)
      it is more flexible to add them separately.
    - Merging vertices in O(1) time (the two vertex names are now aliases)
      (requires a merge function T x T -> T)
      Note: this is a simple graph. self-loops are ignored after a merge.
    - Iterating through the edges at a vertex (O(1) per edge)
      Note: this iterates over original edges; currently doesn't
      support "cleaning" edges by removing duplicates and self-loops
      in case of merged vertices.
    - Generic search functions: DFS forward and backward, or topological
      search backward. For more documentation on these, see search.rs.

    If T implements Default, additionally supports "ensure" functionality
    (i.e. add a vertex default if it doesn't exist already).
*/

use super::debug_counter::DebugCounter;
use super::search::{DepthFirstSearch, TopologicalSearch};
use disjoint_sets::UnionFind;
use std::collections::{HashMap, LinkedList};
use std::fmt::Debug;
use std::hash::Hash;
use std::iter;

// Newtypes to keep different types of ID straight
#[derive(Clone, Copy, Debug, Default, Eq, Hash, PartialEq)]
struct UniqueID(usize);
#[derive(Clone, Copy, Debug, Default, Eq, Hash, PartialEq)]
struct CanonicalID(usize);

#[derive(Debug)]
pub struct DiGraph<V, T> {
    vertex_ids: HashMap<V, UniqueID>,
    id_vertices: HashMap<UniqueID, V>,
    id_find: UnionFind<usize>,
    labels: HashMap<CanonicalID, T>,
    fwd_edges: HashMap<CanonicalID, LinkedList<UniqueID>>,
    bck_edges: HashMap<CanonicalID, LinkedList<UniqueID>>,
    // Debug mode statistics
    space: DebugCounter,
    time: DebugCounter,
}
impl<V, T> Default for DiGraph<V, T> {
    // Can't derive automatically because we don't want to assume V: Default
    // (Basically: derive macro isn't smart enough)
    fn default() -> Self {
        Self {
            vertex_ids: Default::default(),
            id_vertices: Default::default(),
            id_find: Default::default(),
            labels: Default::default(),
            fwd_edges: Default::default(),
            bck_edges: Default::default(),
            space: Default::default(),
            time: Default::default(),
        }
    }
}
impl<V, T> DiGraph<V, T>
where
    V: Copy + Clone + Debug + Eq + Hash + PartialEq,
    T: Debug + PartialEq,
{
    /*
        Exposed API
    */
    pub fn new() -> Self {
        Default::default()
    }
    pub fn is_seen(&self, v: V) -> bool {
        self.time.inc();
        self.vertex_ids.contains_key(&v)
    }
    pub fn get_label(&self, v: V) -> Option<&T> {
        self.time.inc();
        self.get_canon_id(v).and_then(|id| self.labels.get(&id))
    }
    pub fn get_label_mut(&mut self, v: V) -> Option<&mut T> {
        self.time.inc();
        self.get_canon_id(v).and_then(move |id| self.labels.get_mut(&id))
    }
    pub fn overwrite_vertex(&mut self, v: V, label: T) {
        // overwrites if already seen
        if self.is_seen(v) {
            let canon_id = self.get_canon_id_unwrapped(v);
            self.labels.insert(canon_id, label);
            self.time.inc();
        } else {
            self.add_vertex_core(v, label);
        }
    }
    pub fn is_same_vertex(&self, v1: V, v2: V) -> bool {
        self.time.inc();
        let id1 = self.get_canon_id(v1);
        let id2 = self.get_canon_id(v2);
        v1 == v2 || id1.is_some() && id1 == id2
    }
    pub fn get_canon_vertex(&self, v: V) -> V {
        match self.get_canon_id(v) {
            Some(CanonicalID(id)) => {
                *self.id_vertices.get(&UniqueID(id)).unwrap()
            }
            None => v,
        }
    }
    pub fn iter_vertices(&self) -> impl Iterator<Item = V> + '_ {
        // For merged vertices, includes only one copy
        self.labels
            .keys()
            .copied()
            .map(|CanonicalID(id)| UniqueID(id))
            .map(move |uid| self.id_vertices[&uid])
            .inspect(move |_| self.time.inc())
    }
    pub fn iter_vertices_all(&self) -> impl Iterator<Item = V> + '_ {
        // Includes every original vertex even when merged
        self.vertex_ids.keys().copied()
    }
    pub fn iter_fwd_edges(&self, v: V) -> impl Iterator<Item = V> + '_ {
        // Note that when vertices are merged, edges aren't. So the same vertex
        // could appear more than once in the iterator; but iter_edges enforces
        // that self-loops are filtered out.
        debug_assert!(self.is_seen(v));
        self.iter_edges(v, &self.fwd_edges)
    }
    pub fn iter_bck_edges(&self, v: V) -> impl Iterator<Item = V> + '_ {
        // Note that when vertices are merged, edges aren't. So the same vertex
        // could appear more than once in the iterator; but iter_edges enforces
        // that self-loops are filtered out.
        debug_assert!(self.is_seen(v));
        self.iter_edges(v, &self.bck_edges)
    }
    pub fn merge_using<F>(&mut self, v1: V, v2: V, merge_fun: F)
    where
        F: Fn(T, T) -> T,
    {
        // Panics if v1 or v2 aren't seen
        // Uses function F to merge labels
        debug_assert!(self.is_seen(v1));
        debug_assert!(self.is_seen(v2));

        self.time.inc();
        let canon1 = self.get_canon_id_unwrapped(v1);
        let canon2 = self.get_canon_id_unwrapped(v2);
        if canon1 != canon2 {
            self.id_find.union(canon1.0, canon2.0);
            let new = CanonicalID(self.id_find.find(canon1.0));
            debug_assert_eq!(new.0, self.id_find.find(canon2.0));
            debug_assert!(new == canon1 || new == canon2);
            let old = if new == canon1 { canon2 } else { canon1 };
            // Merge labels using merge_fun
            let label1 = self.labels.remove(&old).unwrap();
            let label2 = self.labels.remove(&new).unwrap();
            self.labels.insert(new, merge_fun(label1, label2));
            // Merge edges -- note the following are O(1)
            let mut old_fwd = self.fwd_edges.remove(&old).unwrap();
            let mut old_bck = self.bck_edges.remove(&old).unwrap();
            self.fwd_edges.get_mut(&new).unwrap().append(&mut old_fwd);
            self.bck_edges.get_mut(&new).unwrap().append(&mut old_bck);
        }
        // Could return new vertex here; for now we return nothing.
    }
    pub fn merge(&mut self, v1: V, v2: V) {
        // Panics if v1 or v2 aren't seen, or if their labels differ
        debug_assert_eq!(self.get_label(v1), self.get_label(v2));
        self.merge_using(v1, v2, |t1, t2| {
            debug_assert_eq!(t1, t2);
            t1
        });
    }
    pub fn dfs_fwd<'a>(
        &'a self,
        source: V,
        include: impl (Fn(V) -> bool) + Clone + 'a,
    ) -> impl Iterator<Item = V> + 'a {
        // Depth-first search forward from 'sources', NOT including 'sources',
        // and excluding vertices in the graph not satisfying 'include'.
        // Precondition: everything in 'sources' should be seen
        DepthFirstSearch::new(
            iter::once(self.get_canon_vertex(source)),
            move |v| {
                let include = include.clone();
                self.iter_fwd_edges(v).filter(move |&w| include(w))
            },
        )
    }
    pub fn dfs_bck<'a>(
        &'a self,
        source: V,
        include: impl (Fn(V) -> bool) + Clone + 'a,
    ) -> impl Iterator<Item = V> + 'a {
        // Depth-first search backward from 'sources', NOT including 'sources',
        // and excluding vertices in the graph not satisfying 'include'.
        // Precondition: everything in 'sources' should be seen
        DepthFirstSearch::new(
            iter::once(self.get_canon_vertex(source)),
            move |v| {
                let include = include.clone();
                self.iter_bck_edges(v).filter(move |&w| include(w))
            },
        )
    }
    pub fn topo_search_bck<'a>(
        &'a self,
        source: V,
        include_bck: impl (Fn(V) -> bool) + Clone + 'a,
        include_fwd: impl (Fn(V) -> bool) + Clone + 'a,
    ) -> impl Iterator<Item = V> + 'a {
        // Visit vertices starting from 'source' in a topologically
        // sorted order going backwards. The guarantee is that for each vertex
        // v returned by the search, all forward vertices from v (restricted to
        // those in 'include_fwd') have already been returned, and v is either
        // 'source' or a backward vertex from an already returned
        // vertex (restricted to those in 'include_bck').
        // The search includes 'source' if it qualifies for these conditions.
        // Remember that self-loops in the graph are ignored after a merge, so
        // these conditions skip self-loop edges.
        // See search::TopologicalSearch for more details.
        TopologicalSearch::new(
            iter::once(self.get_canon_vertex(source)),
            move |v| {
                let include_bck = include_bck.clone();
                self.iter_bck_edges(v).filter(move |&w| include_bck(w))
            },
            move |v| {
                let include_fwd = include_fwd.clone();
                self.iter_fwd_edges(v).filter(move |&w| include_fwd(w))
            },
        )
    }

    /*
        Debug mode statistics
        These panic if not in debug mode.
    */
    pub fn get_space(&self) -> usize {
        self.space.get()
    }
    pub fn get_time(&self) -> usize {
        self.time.get()
    }

    /*
        Internal
    */
    fn add_vertex_core(&mut self, v: V, label: T) {
        // Panics if v is seen
        debug_assert!(!self.is_seen(v));
        let new_id = self.id_find.alloc();
        let unique_id = UniqueID(new_id);
        let canon_id = CanonicalID(new_id);
        debug_assert_eq!(self.id_find.find(new_id), new_id);
        debug_assert!(!self.vertex_ids.contains_key(&v));
        debug_assert!(!self.id_vertices.contains_key(&unique_id));
        debug_assert!(!self.labels.contains_key(&canon_id));
        debug_assert!(!self.fwd_edges.contains_key(&canon_id));
        debug_assert!(!self.bck_edges.contains_key(&canon_id));
        self.vertex_ids.insert(v, unique_id);
        self.id_vertices.insert(unique_id, v);
        self.labels.insert(canon_id, label);
        self.fwd_edges.insert(canon_id, LinkedList::new());
        self.bck_edges.insert(canon_id, LinkedList::new());
        self.time.inc();
        self.space.inc();
    }
    fn add_edge_fwd_core(&mut self, v1: V, v2: V) {
        // Add fwd-edge v1 -> v2
        // Precondition: v1 and v2 are seen
        debug_assert!(self.is_seen(v1));
        debug_assert!(self.is_seen(v2));
        let canon1 = self.get_canon_id_unwrapped(v1);
        let canon2 = self.get_canon_id_unwrapped(v2);
        if canon1 != canon2 {
            self.fwd_edges
                .get_mut(&canon1)
                .unwrap()
                .push_back(UniqueID(canon2.0));
            self.space.inc();
        }
        self.time.inc();
    }
    fn add_edge_bck_core(&mut self, v1: V, v2: V) {
        // Add back-edge v2 -> v1 corresponding to fwd-edge v1 -> v2
        // Precondition: v1 and v2 are seen
        debug_assert!(self.is_seen(v1));
        debug_assert!(self.is_seen(v2));
        let canon1 = self.get_canon_id_unwrapped(v1);
        let canon2 = self.get_canon_id_unwrapped(v2);
        if canon1 != canon2 {
            self.bck_edges
                .get_mut(&canon2)
                .unwrap()
                .push_back(UniqueID(canon1.0));
            self.space.inc();
        }
        self.time.inc();
    }
    fn get_canon_id(&self, v: V) -> Option<CanonicalID> {
        self.vertex_ids
            .get(&v)
            .map(|id| self.id_find.find(id.0))
            .map(CanonicalID)
    }
    fn get_canon_id_unwrapped(&self, v: V) -> CanonicalID {
        let id = self.vertex_ids.get(&v).unwrap();
        CanonicalID(self.id_find.find(id.0))
    }
    fn iter_edges<'a>(
        &'a self,
        v: V,
        edges: &'a HashMap<CanonicalID, LinkedList<UniqueID>>,
    ) -> impl Iterator<Item = V> + 'a {
        self.time.inc();
        let canon = self.get_canon_id_unwrapped(v);
        edges[&canon]
            .iter()
            .inspect(move |_| self.time.inc())
            .map(move |id| self.id_find.find(id.0))
            .filter(move |&id| id != canon.0)
            .map(move |id| self.id_vertices.get(&UniqueID(id)).unwrap())
            .copied()
    }
}

/*
    Additional functionality when T: Default
*/
impl<V, T> DiGraph<V, T>
where
    V: Copy + Clone + Debug + Eq + Hash + PartialEq,
    T: Debug + Default + PartialEq,
{
    pub fn ensure_vertex(&mut self, v: V) {
        // if not already seen, adds the default value
        if self.is_seen(v) {
            // increment time since there was a function call
            self.time.inc();
        } else {
            self.add_vertex_core(v, Default::default());
        }
    }
    pub fn ensure_edge_fwd(&mut self, v1: V, v2: V) {
        // add a fwd-edge, ensuring the vertices exist first
        self.ensure_vertex(v1);
        self.ensure_vertex(v2);
        self.add_edge_fwd_core(v1, v2);
    }
    pub fn ensure_edge_bck(&mut self, v1: V, v2: V) {
        // add a bck-edge corresponding to fwd-edge from v1 to v2,
        // ensuring the vertices exist first
        self.ensure_vertex(v1);
        self.ensure_vertex(v2);
        self.add_edge_bck_core(v1, v2);
    }
    pub fn ensure_edge(&mut self, v1: V, v2: V) {
        // add an edge, ensuring the vertices exist first
        self.ensure_vertex(v1);
        self.ensure_vertex(v2);
        self.add_edge_fwd_core(v1, v2);
        self.add_edge_bck_core(v1, v2);
    }
}