-
Notifications
You must be signed in to change notification settings - Fork 16
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Add lowest_common_ancestor
algorithm
#35
Changes from all commits
fc99019
8c9bbba
699b13d
3260183
00a4a4a
0293eb7
52db2cb
45b1583
7ee35fc
bd77bac
34315db
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,104 @@ | ||
# Copyright (c) 2024-2025, NVIDIA CORPORATION. | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
import cupy as cp | ||
import networkx as nx | ||
import numpy as np | ||
import pylibcugraph as plc | ||
|
||
from nx_cugraph.convert import _to_directed_graph | ||
from nx_cugraph.utils import ( | ||
_groupby, | ||
index_dtype, | ||
networkx_algorithm, | ||
not_implemented_for, | ||
) | ||
|
||
__all__ = ["lowest_common_ancestor"] | ||
|
||
|
||
@not_implemented_for("undirected") | ||
@networkx_algorithm(is_incomplete=True, version_added="24.12", _plc="bfs") | ||
def lowest_common_ancestor(G, node1, node2, default=None): | ||
"""May not always raise NetworkXError for graphs that are not DAGs.""" | ||
G = _to_directed_graph(G) | ||
|
||
# if not nxcg.is_directed_acyclic_graph(G): # TODO | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Do we need to wait on this before merging? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. It would be nice to, but I don't think it's super important in practice so I would say no. We add a note to the docstring. If/when PLC can help answer whether a graph is a DAG, then we should add The difference is that if the graph is not a DAG, then we may still give an answer or we may raise as networkx does. It's common to know whether your graph is a DAG or not (often by construction). |
||
# raise nx.NetworkXError("LCA only defined on directed acyclic graphs.") | ||
|
||
if G._N == 0: | ||
raise nx.NetworkXPointlessConcept("LCA meaningless on null graphs.") | ||
if node1 not in G: | ||
nodes = {node1} | ||
raise nx.NodeNotFound(f"Node(s) {nodes} from pair {(node1, node2)} not in G.") | ||
if node2 not in G: | ||
nodes = {node2} | ||
raise nx.NodeNotFound(f"Node(s) {nodes} from pair {(node1, node2)} not in G.") | ||
|
||
# Ancestor BFS from node1 | ||
node1_index = node1 if G.key_to_id is None else G.key_to_id[node1] | ||
node2_index = node2 if G.key_to_id is None else G.key_to_id[node2] | ||
if node1_index == node2_index: # Handle trivial case | ||
return node1 | ||
plc_graph = G._get_plc_graph(switch_indices=True) | ||
distances1, predecessors1, node_ids1 = plc.bfs( | ||
handle=plc.ResourceHandle(), | ||
graph=plc_graph, | ||
sources=cp.array([node1_index], index_dtype), | ||
direction_optimizing=False, # True for undirected only | ||
depth_limit=-1, | ||
compute_predecessors=False, | ||
do_expensive_check=False, | ||
) | ||
mask1 = distances1 != np.iinfo(distances1.dtype).max | ||
node_ids1 = node_ids1[mask1] | ||
|
||
# Ancestor BFS from node2 | ||
distances2, predecessors2, node_ids2 = plc.bfs( | ||
handle=plc.ResourceHandle(), | ||
graph=plc_graph, | ||
sources=cp.array([node2_index], index_dtype), | ||
direction_optimizing=False, # True for undirected only | ||
depth_limit=-1, | ||
compute_predecessors=False, | ||
do_expensive_check=False, | ||
) | ||
mask2 = distances2 != np.iinfo(distances2.dtype).max | ||
node_ids2 = node_ids2[mask2] | ||
|
||
# Find all common ancestors | ||
common_ids = cp.intersect1d(node_ids1, node_ids2, assume_unique=True) | ||
if common_ids.size == 0: | ||
return default | ||
if common_ids.size == 1: | ||
# Only one; it must be the lowest common ancestor | ||
node_index = common_ids[0].tolist() | ||
return node_index if G.key_to_id is None else G.id_to_key[node_index] | ||
|
||
# Find nodes from `common_ids` that have no predecessors from `common_ids`. | ||
# TODO: create utility functions for getting neighbors, predecessors, | ||
# and successors of nodes, which may simplify this code. | ||
mask = cp.isin(G.src_indices, common_ids) & (G.src_indices != G.dst_indices) | ||
groups = _groupby(G.src_indices[mask], G.dst_indices[mask]) | ||
# Walk along successors until we reach a lowest common ancestor | ||
node_index = next(iter(groups)) # Choose arbitrary element | ||
seen = set() | ||
while True: | ||
if node_index in seen: | ||
raise nx.NetworkXError("LCA only defined on directed acyclic graphs.") | ||
lower_ancestors = cp.intersect1d(groups[node_index], common_ids) | ||
if lower_ancestors.size == 0: | ||
break | ||
seen.add(node_index) | ||
node_index = lower_ancestors[0].tolist() # Arbitrary element | ||
return node_index if G.key_to_id is None else G.id_to_key[node_index] |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Does adding this make the algorithm automatically raise errors on undirected graphs?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Yes. It's a decorator from networkx.
We place it before
@networkx_algorithm
, because NetworkX already checks and raises if the input graph is undirected before dispatching to backends:https://github.com/networkx/networkx/blob/9beaf7a0b59fe21775cd93862d9c7b28152a2d8c/networkx/algorithms/lowest_common_ancestors.py#L115-L117
In other words, we use the same decorator so the algorithm behaves correctly when used directly such as
nxcg.lowest_common_ancestor(G)
.