Make topological sort fully general. (#1138)

* Make topological sort fully general. * Detect missing provenance. * Never gonna underflow. --------- Co-authored-by: porcuquine <[email protected]>
lurk-lab · Feb 17, 2024 · f2d70f4 · f2d70f4 · github-actions · Feb 17, 2024
1 parent 6621d24
commit f2d70f4
Showing 1 changed file with 49 additions and 20 deletions.
diff --git a/src/coroutine/memoset/mod.rs b/src/coroutine/memoset/mod.rs
@@ -617,40 +617,57 @@ impl<F: LurkField, Q: Query<F>> Scope<Q, LogMemo<F>, F> {
     // }
 
     fn compute_provenances(&self, store: &Store<F>) -> HashMap<ZPtr<Tag, F>, ZPtr<Tag, F>> {
-        let base_cases = self
+        let mut provenances = HashMap::default();
+        let mut ready = HashSet::new();
+
+        let mut missing_dependency_counts: HashMap<&Ptr, usize> = self
             .queries
             .keys()
-            .filter(|key| {
-                if let Some(deps) = self.dependencies.get(key) {
-                    deps.is_empty()
-                } else {
-                    true
+            .map(|key| {
+                let dep_count = self.dependencies.get(key).map_or(0, |x| x.len());
+
+                if dep_count == 0 {
+                    // Queries are ready if they have no missing dependencies.
+                    // Initially, this will be the base cases -- which have no dependencies.
+                    ready.insert(key);
                 }
+                (key, dep_count)
             })
-            .collect::<HashSet<_>>();
-        let mut todo = base_cases;
-        let mut provenances = HashMap::default();
-
-        while !todo.is_empty() {
-            todo = self.extend_provenances(store, &mut provenances, todo);
+            .collect();
+
+        while !ready.is_empty() {
+            ready = self.extend_provenances(
+                store,
+                &mut provenances,
+                ready,
+                &mut missing_dependency_counts,
+            );
         }
 
+        assert_eq!(
+            self.queries.len(),
+            provenances.len(),
+            "incomplete provenance computation (probably a forbidden cyclic query)"
+        );
+
         provenances
             .iter()
             .map(|(k, v)| (store.hash_ptr(k), store.hash_ptr(v)))
             .collect()
     }
 
-    fn extend_provenances(
-        &self,
+    fn extend_provenances<'a>(
+        &'a self,
         store: &Store<F>,
         provenances: &mut HashMap<Ptr, Ptr>,
-        todo: HashSet<&Ptr>,
+        ready: HashSet<&Ptr>,
+        missing_dependency_counts: &mut HashMap<&'a Ptr, usize>,
     ) -> HashSet<&Ptr> {
         let mut next = HashSet::new();
-
-        for query in todo.into_iter() {
+        for query in ready.into_iter() {
             if provenances.get(query).is_some() {
+                // Skip if already complete. This should not happen if called by `compute_provenances` when computing
+                // all provenances from scratch, but it could happen if we compute more incrementally in the future.
                 continue;
             };
 
@@ -669,9 +686,21 @@ impl<F: LurkField, Q: Query<F>> Scope<Q, LogMemo<F>, F> {
 
             if let Some(dependents) = self.dependents.get(query) {
                 for dependent in dependents {
-                    if provenances.get(dependent).is_none() {
-                        next.insert(dependent);
-                    }
+                    missing_dependency_counts
+                        .entry(dependent)
+                        .and_modify(|missing_count| {
+                            // NOTE: A query only becomes the `dependent` here when one of its dependencies is
+                            // processed. Any query with `missing_count` 0 has no unprocessed dependencies to trigger
+                            // the following update. Therefore, the underflow guarded against below should never occur
+                            // if the implicit topological sort worked correctly. Any failure suggests the algorithm has
+                            // been broken accidentally.
+                            *missing_count = missing_count
+                                .checked_sub(1)
+                                .expect("topological sort has been broken; a dependency was processed out of order");
+                            if *missing_count == 0 {
+                                next.insert(dependent);
+                            }
+                        });
                 }
             };