src/main/java/com/google/devtools/build/lib/graph/Digraph.java - bazel - Git at Google

 // Copyright 2014 The Bazel Authors. All rights reserved.
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //    http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 package com.google.devtools.build.lib.graph;

 import static java.util.Comparator.comparing;
 import static java.util.Comparator.comparingLong;

 import com.google.common.base.Preconditions;
 import com.google.common.collect.ImmutableList;
 import com.google.common.collect.ImmutableSet;
 import java.util.ArrayList;
 import java.util.Collection;
 import java.util.Collections;
 import java.util.Comparator;
 import java.util.HashMap;
 import java.util.HashSet;
 import java.util.LinkedList;
 import java.util.List;
 import java.util.Map;
 import java.util.PriorityQueue;
 import java.util.Set;
 import java.util.concurrent.ConcurrentHashMap;
 import javax.annotation.Nullable;

 /**
  * {@code Digraph} a generic directed graph or "digraph", suitable for modeling asymmetric binary
  * relations.
  *
  * <p>An instance <code>G = &lt;V,E&gt;</code> consists of a set of nodes or vertices <code>V</code>
  * , and a set of directed edges <code>E</code>, which is a subset of <code>V &times; V</code>. This
  * permits self-edges but does not represent multiple edges between the same pair of nodes.
  *
  * <p>Nodes may be labeled with values of any type (type parameter T). All nodes within a graph have
  * distinct labels. The null pointer is not a valid label.
  *
  * <p>The package supports various operations for modeling partial order relations, and supports
  * input/output in AT&amp;T's 'dot' format. See http://www.research.att.com/sw/tools/graphviz/.
  *
  * <p>Some invariants:
  *
  * <ul>
  *   <li>Each graph instances "owns" the nodes is creates. The behaviour of operations on nodes a
  *       graph does not own is undefined.
  *   <li>{@code Digraph} assumes immutability of node labels, much like {@link HashMap} assumes it
  *       for keys.
  *   <li>Mutating the underlying graph invalidates any sets and iterators backed by it.
  *   <li>Nodes can be added and removed concurrently. Edges can be added and removed concurrently
  *       too. While it is thread safe to add or remove edge, these operations are not atomic. Graph
  *       can be observable in inconsistent state during this operations, for instance: edge linked
  *       to only one node.
  *   <li>
  * </ul>
  *
  * <p>Each node stores successor and predecessor adjacency sets using a representation that
  * dynamically changes with size: small sets are stored as arrays, large sets using hash tables.
  * This representation provides significant space and time performance improvements upon two prior
  * versions: the earliest used only HashSets; a later version used linked lists, as described in
  * Cormen, Leiserson &amp; Rivest.
  */
 public final class Digraph<T> implements Cloneable {

   /** Maps labels to nodes, which are in strict 1:1 correspondence. */
   private final Map<T, Node<T>> nodes = new ConcurrentHashMap<>();

   /**
    * Construct an empty Digraph.
    */
   public Digraph() {}

   /**
    * Sanity-check: assert that a node is indeed a member of this graph and not
    * another one.  Perform this check whenever a function is supplied a node by
    * the user.
    */
   private final void checkNode(Node<T> node) {
     if (getNode(node.getLabel()) != node) {
       throw new IllegalArgumentException("node " + node
                                          + " is not a member of this graph");
     }
   }

   /**
    * Adds a directed edge between the nodes labelled 'from' and 'to', creating
    * them if necessary.
    *
    * @return true iff the edge was not already present.
    */
   public boolean addEdge(T from, T to) {
     Node<T> fromNode = createNode(from);
     Node<T> toNode   = createNode(to);
     return addEdge(fromNode, toNode);
   }

   /**
    * Adds a directed edge between the specified nodes, which must exist and
    * belong to this graph.
    *
    * @return true iff the edge was not already present.
    *
    * Note: multi-edges are ignored.  Self-edges are permitted.
    */
   public boolean addEdge(Node<T> fromNode, Node<T> toNode) {
     checkNode(fromNode);
     checkNode(toNode);
     return fromNode.addEdge(toNode);
   }

   /**
    * Returns true iff the graph contains an edge between the
    * specified nodes, which must exist and belong to this graph.
    */
   public boolean containsEdge(Node<T> fromNode, Node<T> toNode) {
     checkNode(fromNode);
     checkNode(toNode);
     // TODO(bazel-team): (2009) iterate only over the shorter of from.succs, to.preds.
     return fromNode.getSuccessors().contains(toNode);
   }

   /**
    * Removes the edge between the specified nodes.  Idempotent: attempts to
    * remove non-existent edges have no effect.
    *
    * @return true iff graph changed.
    */
   public boolean removeEdge(Node<T> fromNode, Node<T> toNode) {
     checkNode(fromNode);
     checkNode(toNode);
     return fromNode.removeEdge(toNode);
   }

   /**
    * Remove all nodes and edges.
    */
   public void clear() {
     nodes.clear();
   }

   @Override
   public String toString() {
     return "Digraph[" + getNodeCount() + " nodes]";
   }

   @Override
   public int hashCode() {
     throw new UnsupportedOperationException(); // avoid nondeterminism
   }

   /**
    * Returns true iff the two graphs are equivalent, i.e. have the same set
    * of node labels, with the same connectivity relation.
    *
    * O(n^2) in the worst case, i.e. equivalence.  The algorithm could be speed up by
    * close to a factor 2 in the worst case by a more direct implementation instead
    * of using isSubgraph twice.
    */
   @Override
   public boolean equals(Object thatObject) {
     /* If this graph is a subgraph of thatObject, then we know that thatObject is of
      * type Digraph<?> and thatObject can be cast to this type.
      */
     return isSubgraph(thatObject) && ((Digraph<?>) thatObject).isSubgraph(this);
   }

   /**
    * Returns true iff this graph is a subgraph of the argument. This means that this graph's nodes
    * are a subset of those of the argument; moreover, for each node of this graph the set of
    * successors is a subset of those of the corresponding node in the argument graph.
    *
    * This algorithm is O(n^2), but linear in the total sizes of the graphs.
    */
   public boolean isSubgraph(Object thatObject) {
     if (this == thatObject) {
       return true;
     }
     if (!(thatObject instanceof Digraph)) {
       return false;
     }

     @SuppressWarnings("unchecked")
     Digraph<T> that = (Digraph<T>) thatObject;
     if (this.getNodeCount() > that.getNodeCount()) {
       return false;
     }
     for (Node<T> n1: nodes.values()) {
       Node<T> n2 = that.getNodeMaybe(n1.getLabel());
       if (n2 == null) {
         return false; // 'that' is missing a node
       }

       // Now compare the successor relations.
       // Careful:
       // - We can't do simple equality on the succs-sets because the
       //   nodes belong to two different graphs!
       // - There's no need to check both predecessor and successor
       //   relations, either one is sufficient.
       Collection<Node<T>> n1succs = n1.getSuccessors();
       Collection<Node<T>> n2succs = n2.getSuccessors();
       if (n1succs.size() > n2succs.size()) {
         return false;
       }
       // foreach successor of n1, ensure n2 has a similarly-labeled succ.
       for (Node<T> succ1: n1succs) {
         Node<T> succ2 = that.getNodeMaybe(succ1.getLabel());
         if (succ2 == null) {
           return false;
         }
         if (!n2succs.contains(succ2)) {
           return false;
         }
       }
     }
     return true;
   }

   /**
    * Returns a duplicate graph with the same set of node labels and the same
    * connectivity relation.  The labels themselves are not cloned.
    */
   @Override
   public Digraph<T> clone() {
     final Digraph<T> that = new Digraph<T>();
     visitNodesBeforeEdges(
         new AbstractGraphVisitor<T>() {
           @Override
           public void visitEdge(Node<T> lhs, Node<T> rhs) {
             that.addEdge(lhs.getLabel(), rhs.getLabel());
           }

           @Override
           public void visitNode(Node<T> node) {
             that.createNode(node.getLabel());
           }
         },
         nodes.values(),
         null);
     return that;
   }

   /** Returns a deterministic immutable copy of the nodes of this graph. */
   public Collection<Node<T>> getNodes(final Comparator<? super T> comparator) {
     return ImmutableList.sortedCopyOf(comparing(Node::getLabel, comparator), nodes.values());
   }

   /**
    * Returns an immutable view of the nodes of this graph.
    *
    * Note: we have to return Collection and not Set because values() returns
    * one: the 'nodes' HashMap doesn't know that it is injective.  :-(
    */
   public Collection<Node<T>> getNodes() {
     return Collections.unmodifiableCollection(nodes.values());
   }

   /**
    * @return the set of root nodes: those with no predecessors.
    *
    * NOTE: in a cyclic graph, there may be nodes that are not reachable from
    * any "root".
    */
   public Set<Node<T>> getRoots() {
     Set<Node<T>> roots = new HashSet<>();
     for (Node<T> node: nodes.values()) {
       if (!node.hasPredecessors()) {
         roots.add(node);
       }
     }
     return roots;
   }

   /**
    * @return the set of leaf nodes: those with no successors.
    */
   public Set<Node<T>> getLeaves() {
     Set<Node<T>> leaves = new HashSet<>();
     for (Node<T> node: nodes.values()) {
       if (!node.hasSuccessors()) {
         leaves.add(node);
       }
     }
     return leaves;
   }

   /**
    * @return an immutable view of the set of labels of this graph's nodes.
    */
   public Set<T> getLabels() {
     return Collections.unmodifiableSet(nodes.keySet());
   }

   /**
    * Finds and returns the node with the specified label.  If there is no such
    * node, an exception is thrown.  The null pointer is not a valid label.
    *
    * @return the node whose label is "label".
    * @throws IllegalArgumentException if no node was found with the specified
    * label.
    */
   public Node<T> getNode(T label) {
     if (label == null) {
       throw new NullPointerException();
     }
     Node<T> node = nodes.get(label);
     if (node == null) {
       throw new IllegalArgumentException("No such node label: " + label);
     }
     return node;
   }

   /**
    * Find the node with the specified label.  Returns null if it doesn't exist.
    * The null pointer is not a valid label.
    *
    * @return the node whose label is "label", or null if it was not found.
    */
   public Node<T> getNodeMaybe(T label) {
     if (label == null) {
       throw new NullPointerException();
     }
     return nodes.get(label);
   }

   /**
    * @return the number of nodes in the graph.
    */
   public int getNodeCount() {
     return nodes.size();
   }

   /**
    * @return the number of edges in the graph.
    *
    * Note: expensive! Useful when asserting against mutations though.
    */
   public int getEdgeCount() {
     int edges = 0;
     for (Node<T> node: nodes.values()) {
       edges += node.getSuccessors().size();
     }
     return edges;
   }

   /**
    * Find or create a node with the specified label. This is the <i>only</i> factory of Nodes. The
    * null pointer is not a valid label.
    */
   public Node<T> createNode(T label) {
     return nodes.computeIfAbsent(label, Digraph::createNodeNative);
   }

   private static <T> Node<T> createNodeNative(T label) {
     Preconditions.checkNotNull(label);
     return new Node<>(label);
   }

   /******************************************************************
    *                                                                *
    *                        Graph Algorithms                        *
    *                                                                *
    ******************************************************************/

   /**
    * These only manipulate the graph through methods defined above.
    */

   /**
    * Returns true iff the graph is cyclic.  Time: O(n).
    */
   public boolean isCyclic() {

     // To detect cycles, we use a colored depth-first search. All nodes are
     // initially marked white.  When a node is encountered, it is marked grey,
     // and when its descendants are completely visited, it is marked black.
     // If a grey node is ever encountered, then there is a cycle.
     final Object WHITE = null; // i.e. not present in nodeToColor, the default.
     final Object GREY  = new Object();
     final Object BLACK = new Object();
     final Map<Node<T>, Object> nodeToColor = new HashMap<>(); // empty => all white

     class CycleDetector { /* defining a class gives us lexical scope */
       boolean visit(Node<T> node) {
         nodeToColor.put(node, GREY);
         for (Node<T> succ: node.getSuccessors()) {
           if (nodeToColor.get(succ) == GREY) {
             return true;
           } else if (nodeToColor.get(succ) == WHITE) {
             if (visit(succ)) {
               return true;
             }
           }
         }
         nodeToColor.put(node, BLACK);
         return false;
       }
     }

     CycleDetector detector = new CycleDetector();
     for (Node<T> node: nodes.values()) {
       if (nodeToColor.get(node) == WHITE) {
         if (detector.visit(node)) {
           return true;
         }
       }
     }
     return false;
   }

   /**
    * Returns the strong component graph of "this".  That is, returns a new
    * acyclic graph in which all strongly-connected components in the original
    * graph have been "fused" into a single node.
    *
    * @return a new graph, whose node labels are sets of nodes of the
    * original graph.  (Do not get confused as to which graph each
    * set of Nodes belongs!)
    */
   public Digraph<Set<Node<T>>> getStrongComponentGraph() {
     Collection<Set<Node<T>>> sccs = getStronglyConnectedComponents();
     Digraph<Set<Node<T>>> scGraph = createImageUnderPartition(sccs);
     scGraph.removeSelfEdges(); // scGraph should be acyclic: no self-edges
     return scGraph;
   }

   /**
    * Returns a partition of the nodes of this graph into sets, each set being
    * one strongly-connected component of the graph.
    */
   public Collection<Set<Node<T>>> getStronglyConnectedComponents() {
     final List<Set<Node<T>>> sccs = new ArrayList<>();
     NodeSetReceiver<T> r = sccs::add;
     SccVisitor<T> v = new SccVisitor<>();
     for (Node<T> node : nodes.values()) {
       v.visit(r, node);
     }
     return sccs;
   }

   /**
    * <p> Given a partition of the graph into sets of nodes, returns the image
    * of this graph under the function which maps each node to the
    * partition-set in which it appears.  The labels of the new graph are the
    * (immutable) sets of the partition, and the edges of the new graph are the
    * edges of the original graph, mapped via the same function. </p>
    *
    * <p> Note: the resulting graph may contain self-edges.  If these are not
    * wanted, call <code>removeSelfEdges()</code>> on the result. </p>
    *
    * <p> Interesting special case: if the partition is the set of
    * strongly-connected components, the result of this function is the
    * strong-component graph. </p>
    */
   public Digraph<Set<Node<T>>>
     createImageUnderPartition(Collection<Set<Node<T>>> partition) {

     // Build mapping function: each node label is mapped to its equiv class:
     Map<T, Set<Node<T>>> labelToImage = new HashMap<>();
     for (Set<Node<T>> set: partition) {
       // It's important to use immutable sets of node labels when sets are keys
       // in a map; see ImmutableSet class for explanation.
       Set<Node<T>> imageSet = ImmutableSet.copyOf(set);
       for (Node<T> node: imageSet) {
         labelToImage.put(node.getLabel(), imageSet);
       }
     }

     if (labelToImage.size() != getNodeCount()) {
       throw new IllegalArgumentException(
           "createImageUnderPartition(): argument is not a partition");
     }

     return createImageUnderMapping(labelToImage);
   }

   /**
    * Returns the image of this graph in a given function, expressed as a
    * mapping from labels to some other domain.
    */
   public <IMAGE> Digraph<IMAGE>
     createImageUnderMapping(Map<T, IMAGE> map) {
     Digraph<IMAGE> imageGraph = new Digraph<>();

     for (Node<T> fromNode: nodes.values()) {
       T fromLabel = fromNode.getLabel();

       IMAGE fromImage = map.get(fromLabel);
       if (fromImage == null) {
         throw new IllegalArgumentException(
             "Incomplete function: undefined for " + fromLabel);
       }
       imageGraph.createNode(fromImage);

       for (Node<T> toNode: fromNode.getSuccessors()) {
         T toLabel = toNode.getLabel();

         IMAGE toImage = map.get(toLabel);
         if (toImage == null) {
           throw new IllegalArgumentException(
             "Incomplete function: undefined for " + toLabel);
         }
         imageGraph.addEdge(fromImage, toImage);
       }
     }

     return imageGraph;
   }

   /**
    * Removes any self-edges (x,x) in this graph.
    */
   public void removeSelfEdges() {
     for (Node<T> node: nodes.values()) {
       removeEdge(node, node);
     }
   }

   /**
    * Finds the shortest directed path from "fromNode" to "toNode".  The path is
    * returned as an ordered list of nodes, including both endpoints.  Returns
    * null if there is no path.  Uses breadth-first search.  Running time is
    * O(n).
    */
   public List<Node<T>> getShortestPath(Node<T> fromNode,
                                            Node<T> toNode) {
     checkNode(fromNode);
     checkNode(toNode);

     if (fromNode == toNode) {
       return Collections.singletonList(fromNode);
     }

     Map<Node<T>, Node<T>> pathPredecessor = new HashMap<>();

     Set<Node<T>> marked = new HashSet<>();

     LinkedList<Node<T>> queue = new LinkedList<>();
     queue.addLast(fromNode);
     marked.add(fromNode);

     while (!queue.isEmpty()) {
       Node<T> u = queue.removeFirst();
       for (Node<T> v: u.getSuccessors()) {
         if (marked.add(v)) {
           pathPredecessor.put(v, u);
           if (v == toNode) {
             return getPathToTreeNode(pathPredecessor, v); // found a path
           }
           queue.addLast(v);
         }
       }
     }
     return null; // no path
   }

   /**
    * Given a tree (expressed as a map from each node to its parent), and a
    * starting node, returns the path from the root of the tree to 'node' as a
    * list.
    */
   public static <X> List<X> getPathToTreeNode(Map<X, X> tree, X node) {
     List<X> path = new ArrayList<>();
     while (node != null) {
       path.add(node);
       node = tree.get(node); // get parent
     }
     Collections.reverse(path);
     return path;
   }

   /**
    * Returns the nodes of an acyclic graph in topological order
    * [a.k.a "reverse post-order" of depth-first search.]
    *
    * A topological order is one such that, if (u, v) is a path in
    * acyclic graph G, then u is before v in the topological order.
    * In other words "tails before heads" or "roots before leaves".
    *
    * @return The nodes of the graph, in a topological order
    */
   public List<Node<T>> getTopologicalOrder() {
     List<Node<T>> order = getPostorder();
     Collections.reverse(order);
     return order;
   }

   /**
    * Returns the nodes of an acyclic graph in topological order
    * [a.k.a "reverse post-order" of depth-first search.]
    *
    * A topological order is one such that, if (u, v) is a path in
    * acyclic graph G, then u is before v in the topological order.
    * In other words "tails before heads" or "roots before leaves".
    *
    * If an ordering is given, returns a specific topological order from the set
    * of all topological orders; if no ordering given, returns an arbitrary
    * (nondeterministic) one, but is a bit faster because no sorting needs to be
    * done for each node.
    *
    * @param edgeOrder the ordering in which edges originating from the same node
    *     are visited.
    * @return The nodes of the graph, in a topological order
    */
   public List<Node<T>> getTopologicalOrder(Comparator<? super T> edgeOrder) {
     CollectingVisitor<T> visitor = new CollectingVisitor<>();
     DFS<T> visitation = new DFS<>(DFS.Order.POSTORDER, edgeOrder, false);
     visitor.beginVisit();
     for (Node<T> node : getNodes(edgeOrder)) {
       visitation.visit(node, visitor);
     }
     visitor.endVisit();

     List<Node<T>> order = visitor.getVisitedNodes();
     Collections.reverse(order);
     return order;
   }

   /**
    * Returns the nodes of an acyclic graph in post-order.
    */
   public List<Node<T>> getPostorder() {
     CollectingVisitor<T> collectingVisitor = new CollectingVisitor<>();
     visitPostorder(collectingVisitor);
     return collectingVisitor.getVisitedNodes();
   }

   /**
    * Returns the (immutable) set of nodes reachable from node 'n' (reflexive
    * transitive closure).
    */
   public Set<Node<T>> getFwdReachable(Node<T> n) {
     return getFwdReachable(Collections.singleton(n));
   }

   /**
    * Returns the (immutable) set of nodes reachable from any node in {@code
    * startNodes} (reflexive transitive closure).
    */
   public Set<Node<T>> getFwdReachable(Collection<Node<T>> startNodes) {
     // This method is intentionally not static, to permit future expansion.
     DFS<T> dfs = new DFS<T>(DFS.Order.PREORDER, false);
     for (Node<T> n : startNodes) {
       dfs.visit(n, new AbstractGraphVisitor<>());
     }
     return dfs.getMarked();
   }

   /**
    * Returns the (immutable) set of nodes that reach node 'n' (reflexive
    * transitive closure).
    */
   public Set<Node<T>> getBackReachable(Node<T> n) {
     return getBackReachable(Collections.singleton(n));
   }

   /**
    * Returns the (immutable) set of nodes that reach some node in {@code
    * startNodes} (reflexive transitive closure).
    */
   public Set<Node<T>> getBackReachable(Collection<Node<T>> startNodes) {
     // This method is intentionally not static, to permit future expansion.
     DFS<T> dfs = new DFS<T>(DFS.Order.PREORDER, true);
     for (Node<T> n : startNodes) {
       dfs.visit(n, new AbstractGraphVisitor<>());
     }
     return dfs.getMarked();
   }

   /**
    * Removes the specified node in the graph.
    *
    * <p>If preserveOrder flag is set than after removing node this method connects all predecessors
    * and successors.
    *
    * <p>Let's consider graph
    *
    * <pre>
    * a -> n -> c
    * b -> n -> d
    * </pre>
    *
    * After n removed the following edges will be added
    *
    * <pre>
    * a -> c
    * a -> d
    * b -> c
    * b -> d
    * </pre>
    *
    * @param node the node to remove (must be in the graph).
    * @param preserveOrder see removeNode(T, boolean).
    */
   public Collection<Node<T>> removeNode(Node<T> node, boolean preserveOrder) {
     checkNode(node);

     Collection<Node<T>> predecessors = node.removeAllPredecessors();
     Collection<Node<T>> successors = node.removeAllSuccessors();

     List<Node<T>> neighbours = Collections.emptyList();

     if (preserveOrder) {
       neighbours = new ArrayList<>(successors.size() + predecessors.size());
       neighbours.addAll(successors);
       neighbours.addAll(predecessors);

       for (Node<T> p : predecessors) {
         for (Node<T> s : successors) {
           p.addEdge(s);
         }
       }
     }

     Object del = nodes.remove(node.getLabel());
     if (del != node) {
       throw new IllegalStateException(del + " " + node);
     }

     return neighbours;
   }

   /**
    * Extracts the subgraph G' of this graph G, containing exactly the nodes
    * specified by the labels in V', and preserving the original
    * <i>transitive</i> graph relation among those nodes. </p>
    *
    * @param subset a subset of the labels of this graph; the resulting graph
    * will have only the nodes with these labels.
    */
   public Digraph<T> extractSubgraph(final Set<T> subset) {
     Digraph<T> subgraph = this.clone();
     subgraph.subgraph(subset);
     return subgraph;
   }

   /**
    * Removes all nodes from this graph except those whose label is an element of {@code keepLabels}.
    * Edges are added so as to preserve the <i>transitive</i> closure relation.
    *
    * @param keepLabels a subset of the labels of this graph; the resulting graph will have only the
    *     nodes with these labels.
    */
   private void subgraph(final Set<T> keepLabels) {
     // This algorithm does the following:
     // Let keep = nodes that have labels in keepLabels.
     // Let toRemove = nodes \ keep. reachables = successors and predecessors of keep in nodes.
     // reachables is the subset of nodes of remove that are an immediate neighbor of some node in
     // keep.
     //
     // Removes all nodes of reachables from keepLabels.
     // Until reachables is empty:
     //   Takes n from reachables
     //   for all s in succ(n)
     //     for all p in pred(n)
     //       add the edge (p, s)
     //     add s to reachables
     //   for all p in pred(n)
     //     add p to reachables
     //   Remove n and its edges
     //
     // A few adjustments are needed to do the whole computation.

     final Set<Node<T>> toRemove = new HashSet<>();
     final Set<Node<T>> keepNeighbors = new HashSet<>();

     // Look for all nodes if they are to be kept or removed
     for (Node<T> node : nodes.values()) {
       if (keepLabels.contains(node.getLabel())) {
         // Node is to be kept
         keepNeighbors.addAll(node.getPredecessors());
         keepNeighbors.addAll(node.getSuccessors());
       } else {
         // node is to be removed.
         toRemove.add(node);
       }
     }

     if (toRemove.isEmpty()) {
       // This premature return is needed to avoid 0-size priority queue creation.
       return;
     }

     // We use a priority queue to look for low-order nodes first so we don't propagate the high
     // number of paths of high-order nodes making the time consumption explode.
     // For perfect results we should reorder the set each time we add a new edge but this would
     // be too expensive, so this is a good enough approximation.
     final PriorityQueue<Node<T>> reachables =
         new PriorityQueue<>(
             toRemove.size(),
             comparingLong(arg -> (long) arg.numPredecessors() * (long) arg.numSuccessors()));

     // Construct the reachables queue with the list of successors and predecessors of keep in
     // toRemove.
     keepNeighbors.retainAll(toRemove);
     reachables.addAll(keepNeighbors);
     toRemove.removeAll(reachables);

     // Remove nodes, least connected first, preserving reachability.
     while (!reachables.isEmpty()) {

       Node<T> node = reachables.poll();

       Collection<Node<T>> neighbours = removeNode(node, /*preserveOrder*/ true);

       for (Node<T> neighbour : neighbours) {
         if (toRemove.remove(neighbour)) {
           reachables.add(neighbour);
         }
       }
     }

     // Final cleanup for non-reachable nodes.
     for (Node<T> node : toRemove) {
       removeNode(node, false);
     }
   }

   @FunctionalInterface
   private interface NodeSetReceiver<T> {
     void accept(Set<Node<T>> nodes);
   }

   /**
    * Find strongly connected components using path-based strong component
    * algorithm. This has the advantage over the default method of returning
    * the components in postorder.
    *
    * We visit nodes depth-first, keeping track of the order that
    * we visit them in (preorder). Our goal is to find the smallest node (in
    * this preorder of visitation) reachable from a given node. We keep track of the
    * smallest node pointed to so far at the top of a stack. If we ever find an
    * already-visited node, then if it is not already part of a component, we
    * pop nodes from that stack until we reach this already-visited node's number
    * or an even smaller one.
    *
    * Once the depth-first visitation of a node is complete, if this node's
    * number is at the top of the stack, then it is the "first" element visited
    * in its strongly connected component. Hence we pop all elements that were
    * pushed onto the visitation stack and put them in a strongly connected
    * component with this one, then send a passed-in {@link Digraph.NodeSetReceiver} this component.
    */
   private class SccVisitor<T> {
     // Nodes already assigned to a strongly connected component.
     private final Set<Node<T>> assigned = new HashSet<>();

     // The order each node was visited in.
     private final Map<Node<T>, Integer> preorder = new HashMap<>();

     // Stack of all nodes visited whose SCC has not yet been determined. When an SCC is found,
     // that SCC is an initial segment of this stack, and is popped off. Every time a new node is
     // visited, it is put on this stack.
     private final List<Node<T>> stack = new ArrayList<>();

     // Stack of visited indices for the first-visited nodes in each of their known-so-far
     // strongly connected components. A node pushes its index on when it is visited. If any of
     // its successors have already been visited and are not in an already-found strongly connected
     // component, then, since the successor was already visited, it and this node must be part of a
     // cycle. So every node visited since the successor is actually in the same strongly connected
     // component. In this case, preorderStack is popped until the top is at most the successor's
     // index.
     //
     // After all descendants of a node have been visited, if the top element of preorderStack is
     // still the current node's index, then it was the first element visited of the current strongly
     // connected component. So all nodes on {@code stack} down to the current node are in its
     // strongly connected component. And the node's index is popped from preorderStack.
     private final List<Integer> preorderStack = new ArrayList<>();

     // Index of node being visited.
     private int counter = 0;

     private void visit(NodeSetReceiver<T> visitor, Node<T> node) {
       if (preorder.containsKey(node)) {
         // This can only happen if this was a non-recursive call, and a previous
         // visit call had already visited node.
         return;
       }
       preorder.put(node, counter);
       stack.add(node);
       preorderStack.add(counter++);
       int preorderLength = preorderStack.size();
       for (Node<T> succ : node.getSuccessors()) {
         Integer succPreorder = preorder.get(succ);
         if (succPreorder == null) {
           visit(visitor, succ);
         } else {
           // Does succ not already belong to an SCC? If it doesn't, then it
           // must be in the same SCC as node. The "starting node" of this SCC
           // must have been visited before succ (or is succ itself).
           if (!assigned.contains(succ)) {
             while (preorderStack.get(preorderStack.size() - 1) > succPreorder) {
               preorderStack.remove(preorderStack.size() - 1);
             }
           }
         }
       }
       if (preorderLength == preorderStack.size()) {
         // If the length of the preorderStack is unchanged, we did not find any earlier-visited
         // nodes that were part of a cycle with this node. So this node is the first-visited
         // element in its strongly connected component, and we collect the component.
         preorderStack.remove(preorderStack.size() - 1);
         Set<Node<T>> scc = new HashSet<>();
         Node<T> compNode;
         do {
           compNode = stack.remove(stack.size() - 1);
           assigned.add(compNode);
           scc.add(compNode);
         } while (!node.equals(compNode));
         visitor.accept(scc);
       }
     }
   }

   /********************************************************************
    *                                                                  *
    *                    Orders, traversals and visitors               *
    *                                                                  *
    ********************************************************************/

   /**
    * A visitation over all the nodes in the graph that invokes
    * <code>visitor.visitNode()</code> for each node in a depth-first
    * post-order: each node is visited <i>after</i> each of its successors; the
    * order in which edges are traversed is the order in which they were added
    * to the graph.  <code>visitor.visitEdge()</code> is not called.
    *
    * @param startNodes the set of nodes from which to begin the visitation.
    */
   public void visitPostorder(GraphVisitor<T> visitor,
                              Iterable<Node<T>> startNodes) {
     visitDepthFirst(visitor, DFS.Order.POSTORDER, false, startNodes);
   }

   /**
    * Equivalent to {@code visitPostorder(visitor, getNodes())}.
    */
   public void visitPostorder(GraphVisitor<T> visitor) {
     visitPostorder(visitor, nodes.values());
   }

   /**
    * A visitation over all the nodes in the graph that invokes
    * <code>visitor.visitNode()</code> for each node in a depth-first
    * pre-order: each node is visited <i>before</i> each of its successors; the
    * order in which edges are traversed is the order in which they were added
    * to the graph.  <code>visitor.visitEdge()</code> is not called.
    *
    * @param startNodes the set of nodes from which to begin the visitation.
    */
   public void visitPreorder(GraphVisitor<T> visitor,
                             Iterable<Node<T>> startNodes) {
     visitDepthFirst(visitor, DFS.Order.PREORDER, false, startNodes);
   }

   /**
    * Equivalent to {@code visitPreorder(visitor, getNodes())}.
    */
   public void visitPreorder(GraphVisitor<T> visitor) {
     visitPreorder(visitor, nodes.values());
   }

   /**
    * A visitation over all the nodes in the graph in depth-first order.  See
    * DFS constructor for meaning of 'order' and 'transpose' parameters.
    *
    * @param startNodes the set of nodes from which to begin the visitation.
    */
   public void visitDepthFirst(GraphVisitor<T> visitor,
                               DFS.Order order,
                               boolean transpose,
                               Iterable<Node<T>> startNodes) {
     DFS<T> visitation = new DFS<>(order, transpose);
     visitor.beginVisit();
     for (Node<T> node: startNodes) {
       visitation.visit(node, visitor);
     }
     visitor.endVisit();
   }

   private static <T> Comparator<Node<T>> makeNodeComparator(
       final Comparator<? super T> comparator) {
     return comparing(Node::getLabel, comparator::compare);
   }

   /**
    * Given {@code unordered}, a collection of nodes and a (possibly null) {@code comparator} for
    * their labels, returns a sorted collection if {@code comparator} is non-null, otherwise returns
    * {@code unordered}.
    */
   private static <T> Collection<Node<T>> maybeOrderCollection(
       Collection<Node<T>> unordered, @Nullable final Comparator<? super T> comparator) {
     return comparator == null
         ? unordered
         : ImmutableList.sortedCopyOf(makeNodeComparator(comparator), unordered);
   }

   private void visitNodesBeforeEdges(
       GraphVisitor<T> visitor,
       Iterable<Node<T>> startNodes,
       @Nullable Comparator<? super T> comparator) {
     visitor.beginVisit();
     for (Node<T> fromNode: startNodes) {
       visitor.visitNode(fromNode);
       for (Node<T> toNode : maybeOrderCollection(fromNode.getSuccessors(), comparator)) {
         visitor.visitEdge(fromNode, toNode);
       }
     }
     visitor.endVisit();
   }

   /**
    * A visitation over the graph that visits all nodes and edges in topological order
    * such that each node is visited before any edge coming out of that node; ties among nodes are
    * broken using the provided {@code comparator} if not null; edges are visited in order specified
    * by the comparator, <b>not</b> topological order of the target nodes.
    */
   public void visitNodesBeforeEdges(
       GraphVisitor<T> visitor, @Nullable Comparator<? super T> comparator) {
     visitNodesBeforeEdges(
         visitor,
         comparator == null ? getTopologicalOrder() : getTopologicalOrder(comparator),
         comparator);
   }
 }