PyPI - pyg-nightly - Versions diffs - 2.6.0.dev20240704__py3-none-any.whl → 2.8.0.dev20251207__py3-none-any.whl - Mend

pyg-nightly 2.6.0.dev20240704__py3-none-any.whl → 2.8.0.dev20251207__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of pyg-nightly might be problematic. Click here for more details.

Files changed (268) hide show

{pyg_nightly-2.6.0.dev20240704.dist-info → pyg_nightly-2.8.0.dev20251207.dist-info}/METADATA +81 -58
{pyg_nightly-2.6.0.dev20240704.dist-info → pyg_nightly-2.8.0.dev20251207.dist-info}/RECORD +265 -221
{pyg_nightly-2.6.0.dev20240704.dist-info → pyg_nightly-2.8.0.dev20251207.dist-info}/WHEEL +1 -1
pyg_nightly-2.8.0.dev20251207.dist-info/licenses/LICENSE +19 -0
torch_geometric/__init__.py +34 -1
torch_geometric/_compile.py +11 -3
torch_geometric/_onnx.py +228 -0
torch_geometric/config_mixin.py +8 -3
torch_geometric/config_store.py +1 -1
torch_geometric/contrib/__init__.py +1 -1
torch_geometric/contrib/explain/pgm_explainer.py +1 -1
torch_geometric/data/__init__.py +19 -1
torch_geometric/data/batch.py +2 -2
torch_geometric/data/collate.py +1 -3
torch_geometric/data/data.py +110 -6
torch_geometric/data/database.py +19 -5
torch_geometric/data/dataset.py +14 -9
torch_geometric/data/extract.py +1 -1
torch_geometric/data/feature_store.py +17 -22
torch_geometric/data/graph_store.py +3 -2
torch_geometric/data/hetero_data.py +139 -7
torch_geometric/data/hypergraph_data.py +2 -2
torch_geometric/data/in_memory_dataset.py +2 -2
torch_geometric/data/lightning/datamodule.py +42 -28
torch_geometric/data/storage.py +9 -1
torch_geometric/datasets/__init__.py +20 -1
torch_geometric/datasets/actor.py +7 -9
torch_geometric/datasets/airfrans.py +17 -20
torch_geometric/datasets/airports.py +8 -10
torch_geometric/datasets/amazon.py +8 -11
torch_geometric/datasets/amazon_book.py +8 -9
torch_geometric/datasets/amazon_products.py +7 -9
torch_geometric/datasets/aminer.py +8 -9
torch_geometric/datasets/aqsol.py +10 -13
torch_geometric/datasets/attributed_graph_dataset.py +8 -10
torch_geometric/datasets/ba_multi_shapes.py +10 -12
torch_geometric/datasets/ba_shapes.py +5 -6
torch_geometric/datasets/brca_tgca.py +1 -1
torch_geometric/datasets/city.py +157 -0
torch_geometric/datasets/dbp15k.py +1 -1
torch_geometric/datasets/gdelt_lite.py +3 -2
torch_geometric/datasets/ged_dataset.py +3 -2
torch_geometric/datasets/git_mol_dataset.py +263 -0
torch_geometric/datasets/gnn_benchmark_dataset.py +3 -2
torch_geometric/datasets/hgb_dataset.py +2 -2
torch_geometric/datasets/hm.py +1 -1
torch_geometric/datasets/instruct_mol_dataset.py +134 -0
torch_geometric/datasets/linkx_dataset.py +4 -3
torch_geometric/datasets/lrgb.py +3 -5
torch_geometric/datasets/malnet_tiny.py +2 -1
torch_geometric/datasets/md17.py +3 -3
torch_geometric/datasets/medshapenet.py +145 -0
torch_geometric/datasets/mnist_superpixels.py +2 -3
torch_geometric/datasets/modelnet.py +1 -1
torch_geometric/datasets/molecule_gpt_dataset.py +492 -0
torch_geometric/datasets/molecule_net.py +3 -2
torch_geometric/datasets/neurograph.py +1 -3
torch_geometric/datasets/ogb_mag.py +1 -1
torch_geometric/datasets/opf.py +19 -5
torch_geometric/datasets/pascal_pf.py +1 -1
torch_geometric/datasets/pcqm4m.py +2 -1
torch_geometric/datasets/ppi.py +2 -1
torch_geometric/datasets/protein_mpnn_dataset.py +451 -0
torch_geometric/datasets/qm7.py +1 -1
torch_geometric/datasets/qm9.py +3 -2
torch_geometric/datasets/shrec2016.py +2 -2
torch_geometric/datasets/snap_dataset.py +8 -4
torch_geometric/datasets/tag_dataset.py +462 -0
torch_geometric/datasets/teeth3ds.py +269 -0
torch_geometric/datasets/web_qsp_dataset.py +342 -0
torch_geometric/datasets/wikics.py +2 -1
torch_geometric/datasets/wikidata.py +2 -1
torch_geometric/deprecation.py +1 -1
torch_geometric/distributed/__init__.py +13 -0
torch_geometric/distributed/dist_loader.py +2 -2
torch_geometric/distributed/local_feature_store.py +3 -2
torch_geometric/distributed/local_graph_store.py +2 -1
torch_geometric/distributed/partition.py +9 -8
torch_geometric/distributed/rpc.py +3 -3
torch_geometric/edge_index.py +35 -22
torch_geometric/explain/algorithm/attention_explainer.py +219 -29
torch_geometric/explain/algorithm/base.py +2 -2
torch_geometric/explain/algorithm/captum.py +1 -1
torch_geometric/explain/algorithm/captum_explainer.py +2 -1
torch_geometric/explain/algorithm/gnn_explainer.py +406 -69
torch_geometric/explain/algorithm/graphmask_explainer.py +8 -8
torch_geometric/explain/algorithm/pg_explainer.py +305 -47
torch_geometric/explain/explainer.py +2 -2
torch_geometric/explain/explanation.py +89 -5
torch_geometric/explain/metric/faithfulness.py +1 -1
torch_geometric/graphgym/checkpoint.py +2 -1
torch_geometric/graphgym/config.py +3 -2
torch_geometric/graphgym/imports.py +15 -4
torch_geometric/graphgym/logger.py +1 -1
torch_geometric/graphgym/loss.py +1 -1
torch_geometric/graphgym/models/encoder.py +2 -2
torch_geometric/graphgym/models/layer.py +1 -1
torch_geometric/graphgym/utils/comp_budget.py +4 -3
torch_geometric/hash_tensor.py +798 -0
torch_geometric/index.py +16 -7
torch_geometric/inspector.py +6 -2
torch_geometric/io/fs.py +27 -0
torch_geometric/io/tu.py +2 -3
torch_geometric/llm/__init__.py +9 -0
torch_geometric/llm/large_graph_indexer.py +741 -0
torch_geometric/llm/models/__init__.py +23 -0
torch_geometric/llm/models/g_retriever.py +251 -0
torch_geometric/llm/models/git_mol.py +336 -0
torch_geometric/llm/models/glem.py +397 -0
torch_geometric/llm/models/llm.py +470 -0
torch_geometric/llm/models/llm_judge.py +158 -0
torch_geometric/llm/models/molecule_gpt.py +222 -0
torch_geometric/llm/models/protein_mpnn.py +333 -0
torch_geometric/llm/models/sentence_transformer.py +188 -0
torch_geometric/llm/models/txt2kg.py +353 -0
torch_geometric/llm/models/vision_transformer.py +38 -0
torch_geometric/llm/rag_loader.py +154 -0
torch_geometric/llm/utils/__init__.py +10 -0
torch_geometric/llm/utils/backend_utils.py +443 -0
torch_geometric/llm/utils/feature_store.py +169 -0
torch_geometric/llm/utils/graph_store.py +199 -0
torch_geometric/llm/utils/vectorrag.py +125 -0
torch_geometric/loader/cluster.py +6 -5
torch_geometric/loader/graph_saint.py +2 -1
torch_geometric/loader/ibmb_loader.py +4 -4
torch_geometric/loader/link_loader.py +1 -1
torch_geometric/loader/link_neighbor_loader.py +2 -1
torch_geometric/loader/mixin.py +6 -5
torch_geometric/loader/neighbor_loader.py +1 -1
torch_geometric/loader/neighbor_sampler.py +2 -2
torch_geometric/loader/prefetch.py +4 -3
torch_geometric/loader/temporal_dataloader.py +2 -2
torch_geometric/loader/utils.py +10 -10
torch_geometric/metrics/__init__.py +23 -2
torch_geometric/metrics/link_pred.py +755 -85
torch_geometric/nn/__init__.py +1 -0
torch_geometric/nn/aggr/__init__.py +2 -0
torch_geometric/nn/aggr/base.py +1 -1
torch_geometric/nn/aggr/equilibrium.py +1 -1
torch_geometric/nn/aggr/fused.py +1 -1
torch_geometric/nn/aggr/patch_transformer.py +149 -0
torch_geometric/nn/aggr/set_transformer.py +1 -1
torch_geometric/nn/aggr/utils.py +9 -4
torch_geometric/nn/attention/__init__.py +9 -1
torch_geometric/nn/attention/polynormer.py +107 -0
torch_geometric/nn/attention/qformer.py +71 -0
torch_geometric/nn/attention/sgformer.py +99 -0
torch_geometric/nn/conv/__init__.py +2 -0
torch_geometric/nn/conv/appnp.py +1 -1
torch_geometric/nn/conv/collect.jinja +6 -3
torch_geometric/nn/conv/cugraph/gat_conv.py +8 -2
torch_geometric/nn/conv/cugraph/rgcn_conv.py +3 -0
torch_geometric/nn/conv/cugraph/sage_conv.py +3 -0
torch_geometric/nn/conv/dna_conv.py +1 -1
torch_geometric/nn/conv/eg_conv.py +7 -7
torch_geometric/nn/conv/gat_conv.py +33 -4
torch_geometric/nn/conv/gatv2_conv.py +35 -4
torch_geometric/nn/conv/gen_conv.py +1 -1
torch_geometric/nn/conv/general_conv.py +1 -1
torch_geometric/nn/conv/gravnet_conv.py +2 -1
torch_geometric/nn/conv/hetero_conv.py +3 -2
torch_geometric/nn/conv/meshcnn_conv.py +487 -0
torch_geometric/nn/conv/message_passing.py +6 -5
torch_geometric/nn/conv/mixhop_conv.py +1 -1
torch_geometric/nn/conv/rgcn_conv.py +2 -1
torch_geometric/nn/conv/sg_conv.py +1 -1
torch_geometric/nn/conv/spline_conv.py +2 -1
torch_geometric/nn/conv/ssg_conv.py +1 -1
torch_geometric/nn/conv/transformer_conv.py +5 -3
torch_geometric/nn/data_parallel.py +5 -4
torch_geometric/nn/dense/linear.py +5 -24
torch_geometric/nn/encoding.py +17 -3
torch_geometric/nn/fx.py +17 -15
torch_geometric/nn/model_hub.py +5 -16
torch_geometric/nn/models/__init__.py +11 -0
torch_geometric/nn/models/attentive_fp.py +1 -1
torch_geometric/nn/models/attract_repel.py +148 -0
torch_geometric/nn/models/basic_gnn.py +2 -1
torch_geometric/nn/models/captum.py +1 -1
torch_geometric/nn/models/deep_graph_infomax.py +1 -1
torch_geometric/nn/models/dimenet.py +2 -2
torch_geometric/nn/models/dimenet_utils.py +4 -2
torch_geometric/nn/models/gpse.py +1083 -0
torch_geometric/nn/models/graph_unet.py +13 -4
torch_geometric/nn/models/lpformer.py +783 -0
torch_geometric/nn/models/metapath2vec.py +1 -1
torch_geometric/nn/models/mlp.py +4 -2
torch_geometric/nn/models/node2vec.py +1 -1
torch_geometric/nn/models/polynormer.py +206 -0
torch_geometric/nn/models/rev_gnn.py +3 -3
torch_geometric/nn/models/schnet.py +2 -1
torch_geometric/nn/models/sgformer.py +219 -0
torch_geometric/nn/models/signed_gcn.py +1 -1
torch_geometric/nn/models/visnet.py +2 -2
torch_geometric/nn/norm/batch_norm.py +17 -7
torch_geometric/nn/norm/diff_group_norm.py +7 -2
torch_geometric/nn/norm/graph_norm.py +9 -4
torch_geometric/nn/norm/instance_norm.py +5 -1
torch_geometric/nn/norm/layer_norm.py +15 -7
torch_geometric/nn/norm/msg_norm.py +8 -2
torch_geometric/nn/pool/__init__.py +15 -9
torch_geometric/nn/pool/cluster_pool.py +144 -0
torch_geometric/nn/pool/connect/base.py +1 -3
torch_geometric/nn/pool/edge_pool.py +1 -1
torch_geometric/nn/pool/knn.py +13 -10
torch_geometric/nn/pool/select/base.py +1 -4
torch_geometric/nn/summary.py +1 -1
torch_geometric/nn/to_hetero_module.py +4 -3
torch_geometric/nn/to_hetero_transformer.py +3 -3
torch_geometric/nn/to_hetero_with_bases_transformer.py +5 -5
torch_geometric/profile/__init__.py +2 -0
torch_geometric/profile/nvtx.py +66 -0
torch_geometric/profile/profiler.py +18 -9
torch_geometric/profile/utils.py +20 -5
torch_geometric/sampler/__init__.py +2 -1
torch_geometric/sampler/base.py +337 -8
torch_geometric/sampler/hgt_sampler.py +11 -1
torch_geometric/sampler/neighbor_sampler.py +298 -25
torch_geometric/sampler/utils.py +93 -5
torch_geometric/testing/__init__.py +4 -0
torch_geometric/testing/decorators.py +35 -5
torch_geometric/testing/distributed.py +1 -1
torch_geometric/transforms/__init__.py +4 -0
torch_geometric/transforms/add_gpse.py +49 -0
torch_geometric/transforms/add_metapaths.py +10 -8
torch_geometric/transforms/add_positional_encoding.py +2 -2
torch_geometric/transforms/base_transform.py +2 -1
torch_geometric/transforms/delaunay.py +65 -15
torch_geometric/transforms/face_to_edge.py +32 -3
torch_geometric/transforms/gdc.py +8 -9
torch_geometric/transforms/largest_connected_components.py +1 -1
torch_geometric/transforms/mask.py +5 -1
torch_geometric/transforms/node_property_split.py +1 -1
torch_geometric/transforms/normalize_features.py +3 -3
torch_geometric/transforms/pad.py +1 -1
torch_geometric/transforms/random_link_split.py +1 -1
torch_geometric/transforms/remove_duplicated_edges.py +4 -2
torch_geometric/transforms/remove_self_loops.py +36 -0
torch_geometric/transforms/rooted_subgraph.py +1 -1
torch_geometric/transforms/svd_feature_reduction.py +1 -1
torch_geometric/transforms/virtual_node.py +2 -1
torch_geometric/typing.py +82 -17
torch_geometric/utils/__init__.py +6 -1
torch_geometric/utils/_lexsort.py +0 -9
torch_geometric/utils/_negative_sampling.py +28 -13
torch_geometric/utils/_normalize_edge_index.py +46 -0
torch_geometric/utils/_scatter.py +126 -164
torch_geometric/utils/_sort_edge_index.py +0 -2
torch_geometric/utils/_spmm.py +16 -14
torch_geometric/utils/_subgraph.py +4 -0
torch_geometric/utils/_tree_decomposition.py +1 -1
torch_geometric/utils/_trim_to_layer.py +2 -2
torch_geometric/utils/augmentation.py +1 -1
torch_geometric/utils/convert.py +17 -10
torch_geometric/utils/cross_entropy.py +34 -13
torch_geometric/utils/embedding.py +91 -2
torch_geometric/utils/geodesic.py +28 -25
torch_geometric/utils/influence.py +279 -0
torch_geometric/utils/map.py +14 -10
torch_geometric/utils/nested.py +1 -1
torch_geometric/utils/smiles.py +3 -3
torch_geometric/utils/sparse.py +32 -24
torch_geometric/visualization/__init__.py +2 -1
torch_geometric/visualization/graph.py +250 -5
torch_geometric/warnings.py +11 -2
torch_geometric/nn/nlp/__init__.py +0 -7
torch_geometric/nn/nlp/llm.py +0 -283
torch_geometric/nn/nlp/sentence_transformer.py +0 -94

torch_geometric/utils/embedding.py CHANGED Viewed

@@ -1,9 +1,11 @@
 import warnings
-from typing import Any, List
+from typing import Any, Dict, List, Optional, Type
 import torch
 from torch import Tensor
+from torch_geometric.typing import NodeType
 def get_embeddings(
     model: torch.nn.Module,
@@ -40,7 +42,8 @@ def get_embeddings(
             hook_handles.append(module.register_forward_hook(hook))
     if len(hook_handles) == 0:
-        warnings.warn("The 'model' does not have any 'MessagePassing' layers")
+        warnings.warn("The 'model' does not have any 'MessagePassing' layers",
+                      stacklevel=2)
     training = model.training
     model.eval()
@@ -52,3 +55,89 @@ def get_embeddings(
         handle.remove()
     return embeddings
+def get_embeddings_hetero(
+    model: torch.nn.Module,
+    supported_models: Optional[List[Type[torch.nn.Module]]] = None,
+    *args: Any,
+    **kwargs: Any,
+) -> Dict[NodeType, List[Tensor]]:
+    """Returns the output embeddings of all
+    :class:`~torch_geometric.nn.conv.MessagePassing` layers in a heterogeneous
+    :obj:`model`, organized by node type.
+    Internally, this method registers forward hooks on all modules that process
+    heterogeneous graphs in the model and runs the forward pass of the model.
+    For heterogeneous models, the output is a dictionary where each key is a
+    node type and each value is a list of embeddings from different layers.
+    Args:
+        model (torch.nn.Module): The heterogeneous GNN model.
+        supported_models (List[Type[torch.nn.Module]], optional): A list of
+            supported model classes. If not provided, defaults to
+            [HGTConv, HANConv, HeteroConv].
+        *args: Arguments passed to the model.
+        **kwargs (optional): Additional keyword arguments passed to the model.
+    Returns:
+        Dict[NodeType, List[Tensor]]: A dictionary mapping each node type to
+        a list of embeddings from different layers.
+    """
+    from torch_geometric.nn import HANConv, HeteroConv, HGTConv
+    if not supported_models:
+        supported_models = [HGTConv, HANConv, HeteroConv]
+    # Dictionary to store node embeddings by type
+    node_embeddings_dict: Dict[NodeType, List[Tensor]] = {}
+    # Hook function to capture node embeddings
+    def hook(model: torch.nn.Module, inputs: Any, outputs: Any) -> None:
+        # Check if the outputs is a dictionary mapping node types to embeddings
+        if isinstance(outputs, dict) and outputs:
+            # Store embeddings for each node type
+            for node_type, embedding in outputs.items():
+                # Made sure that the outputs are a dictionary mapping node
+                # types to embeddings and remove the false positives.
+                if node_type not in node_embeddings_dict:
+                    node_embeddings_dict[node_type] = []
+                node_embeddings_dict[node_type].append(embedding.clone())
+    # List to store hook handles
+    hook_handles = []
+    # Find ModuleDict objects in the model
+    for _, module in model.named_modules():
+        # Handle the native heterogeneous models, e.g. HGTConv, HANConv
+        # and HeteroConv, etc.
+        if isinstance(module, tuple(supported_models)):
+            hook_handles.append(module.register_forward_hook(hook))
+        else:
+            # Handle the heterogeneous models that are generated by calling
+            # to_hetero() on the homogeneous models.
+            submodules = list(module.children())
+            submodules_contains_module_dict = any([
+                isinstance(submodule, torch.nn.ModuleDict)
+                for submodule in submodules
+            ])
+            if submodules_contains_module_dict:
+                hook_handles.append(module.register_forward_hook(hook))
+    if len(hook_handles) == 0:
+        warnings.warn(
+            "The 'model' does not have any heterogenous "
+            "'MessagePassing' layers", stacklevel=2)
+    # Run the model forward pass
+    training = model.training
+    model.eval()
+    with torch.no_grad():
+        model(*args, **kwargs)
+    model.train(training)
+    # Clean up hooks
+    for handle in hook_handles:
+        handle.remove()
+    return node_embeddings_dict

torch_geometric/utils/geodesic.py CHANGED Viewed

@@ -2,6 +2,7 @@ import multiprocessing as mp
 import warnings
 from typing import Optional
+import numpy as np
 import torch
 from torch import Tensor
@@ -65,9 +66,10 @@ def geodesic_distance(  # noqa: D417
     if 'dest' in kwargs:
         dst = kwargs['dest']
-        warnings.warn("'dest' attribute in 'geodesic_distance' is deprecated "
-                      "and will be removed in a future release. Use the 'dst' "
-                      "argument instead.")
+        warnings.warn(
+            "'dest' attribute in 'geodesic_distance' is deprecated "
+            "and will be removed in a future release. Use the 'dst' "
+            "argument instead.", stacklevel=2)
     max_distance = float('inf') if max_distance is None else max_distance
@@ -82,54 +84,55 @@ def geodesic_distance(  # noqa: D417
     dtype = pos.dtype
-    pos = pos.detach().cpu().to(torch.double).numpy()
-    face = face.detach().t().cpu().to(torch.int).numpy()
+    pos_np = pos.detach().cpu().to(torch.double).numpy()
+    face_np = face.detach().t().cpu().to(torch.int).numpy()
     if src is None and dst is None:
-        out = gdist.local_gdist_matrix(pos, face,
-                                       max_distance * scale).toarray() / scale
+        out = gdist.local_gdist_matrix(
+            pos_np,
+            face_np,
+            max_distance * scale,
+        ).toarray() / scale
         return torch.from_numpy(out).to(dtype)
     if src is None:
-        src = torch.arange(pos.shape[0], dtype=torch.int).numpy()
+        src_np = torch.arange(pos.size(0), dtype=torch.int).numpy()
     else:
-        src = src.detach().cpu().to(torch.int).numpy()
-    assert src is not None
+        src_np = src.detach().cpu().to(torch.int).numpy()
-    dst = None if dst is None else dst.detach().cpu().to(torch.int).numpy()
+    dst_np = None if dst is None else dst.detach().cpu().to(torch.int).numpy()
     def _parallel_loop(
-        pos: Tensor,
-        face: Tensor,
-        src: Tensor,
-        dst: Optional[Tensor],
+        pos_np: np.ndarray,
+        face_np: np.ndarray,
+        src_np: np.ndarray,
+        dst_np: Optional[np.ndarray],
         max_distance: float,
         scale: float,
         i: int,
         dtype: torch.dtype,
     ) -> Tensor:
-        s = src[i:i + 1]
-        d = None if dst is None else dst[i:i + 1]
-        out = gdist.compute_gdist(pos, face, s, d, max_distance * scale)
+        s = src_np[i:i + 1]
+        d = None if dst_np is None else dst_np[i:i + 1]
+        out = gdist.compute_gdist(pos_np, face_np, s, d, max_distance * scale)
         out = out / scale
         return torch.from_numpy(out).to(dtype)
     num_workers = mp.cpu_count() if num_workers <= -1 else num_workers
     if num_workers > 0:
         with mp.Pool(num_workers) as pool:
-            outs = pool.starmap(
-                _parallel_loop,
-                [(pos, face, src, dst, max_distance, scale, i, dtype)
-                 for i in range(len(src))])
+            data = [(pos_np, face_np, src_np, dst_np, max_distance, scale, i,
+                     dtype) for i in range(len(src_np))]
+            outs = pool.starmap(_parallel_loop, data)
     else:
         outs = [
-            _parallel_loop(pos, face, src, dst, max_distance, scale, i, dtype)
-            for i in range(len(src))
+            _parallel_loop(pos_np, face_np, src_np, dst_np, max_distance,
+                           scale, i, dtype) for i in range(len(src_np))
         ]
     out = torch.cat(outs, dim=0)
     if dst is None:
-        out = out.view(-1, pos.shape[0])
+        out = out.view(-1, pos.size(0))
     return out

torch_geometric/utils/influence.py ADDED Viewed

@@ -0,0 +1,279 @@
+from typing import List, Tuple, Union, cast
+import torch
+from torch import Tensor
+from torch.autograd.functional import jacobian
+from tqdm.auto import tqdm
+from torch_geometric.data import Data
+from torch_geometric.utils import k_hop_subgraph
+def k_hop_subsets_rough(
+    node_idx: int,
+    num_hops: int,
+    edge_index: Tensor,
+    num_nodes: int,
+) -> List[Tensor]:
+    r"""Return *rough* (possibly overlapping) *k*-hop node subsets.
+    This is a thin wrapper around
+    :func:`torch_geometric.utils.k_hop_subgraph` that *additionally* returns
+    **all** intermediate hop subsets rather than the full union only.
+    Parameters
+    ----------
+    node_idx: int
+        Index or indices of the central node(s).
+    num_hops: int
+        Number of hops *k*.
+    edge_index: Tensor
+        Edge index in COO format with shape :math:`[2, \text{num_edges}]`.
+    num_nodes: int
+        Total number of nodes in the graph. Required to allocate the masks.
+    Returns:
+    -------
+    List[Tensor]
+        A list ``[H₀, H₁, …, H_k]`` where ``H₀`` contains the seed node(s) and
+        ``H_i`` (for *i*>0) contains **all** nodes that are exactly *i* hops
+        away in the *expanded* neighbourhood (i.e. overlaps are *not*
+        removed).
+    """
+    col, row = edge_index
+    node_mask = row.new_empty(num_nodes, dtype=torch.bool)
+    edge_mask = row.new_empty(row.size(0), dtype=torch.bool)
+    node_idx_ = torch.tensor([node_idx], device=row.device)
+    subsets = [node_idx_]
+    for _ in range(num_hops):
+        node_mask.zero_()
+        node_mask[subsets[-1]] = True
+        torch.index_select(node_mask, 0, row, out=edge_mask)
+        subsets.append(col[edge_mask])
+    return subsets
+def k_hop_subsets_exact(
+    node_idx: int,
+    num_hops: int,
+    edge_index: Tensor,
+    num_nodes: int,
+    device: Union[torch.device, str],
+) -> List[Tensor]:
+    """Return **disjoint** *k*-hop subsets.
+    This function refines :func:`k_hop_subsets_rough` by removing nodes that
+    have already appeared in previous hops, ensuring that each subset contains
+    nodes *exactly* *i* hops away from the seed.
+    """
+    rough_subsets = k_hop_subsets_rough(node_idx, num_hops, edge_index,
+                                        num_nodes)
+    exact_subsets: List[List[int]] = [rough_subsets[0].tolist()]
+    visited: set[int] = set(exact_subsets[0])
+    for hop_subset in rough_subsets[1:]:
+        fresh = set(hop_subset.tolist()) - visited
+        visited |= fresh
+        exact_subsets.append(list(fresh))
+    return [
+        torch.tensor(s, device=device, dtype=edge_index.dtype)
+        for s in exact_subsets
+    ]
+def jacobian_l1(
+    model: torch.nn.Module,
+    data: Data,
+    max_hops: int,
+    node_idx: int,
+    device: Union[torch.device, str],
+    *,
+    vectorize: bool = True,
+) -> Tensor:
+    """Compute the **L1 norm** of the Jacobian for a given node.
+    The Jacobian is evaluated w.r.t. the node features of the *k*-hop induced
+    sub‑graph centred at ``node_idx``. The result is *folded back* onto the
+    **original** node index space so that the returned tensor has length
+    ``data.num_nodes``, where the influence score will be zero for nodes
+    outside the *k*-hop subgraph.
+    Notes:
+    -----
+    *   The function assumes that the model *and* ``data.x`` share the same
+        floating‑point precision (e.g. both ``float32`` or both ``float16``).
+    """
+    # Build the induced *k*-hop sub‑graph (with node re‑labelling).
+    edge_index = cast(Tensor, data.edge_index)
+    x = cast(Tensor, data.x)
+    k_hop_nodes, sub_edge_index, mapping, _ = k_hop_subgraph(
+        node_idx, max_hops, edge_index, relabel_nodes=True)
+    # get the location of the *center* node inside the sub‑graph
+    root_pos = cast(int, mapping[0])
+    # Move tensors & model to the correct device
+    device = torch.device(device)
+    sub_x = x[k_hop_nodes].to(device)
+    sub_edge_index = sub_edge_index.to(device)
+    model = model.to(device)
+    # Jacobian evaluation
+    def _forward(x: Tensor) -> Tensor:
+        return model(x, sub_edge_index)[root_pos]
+    jac = jacobian(_forward, sub_x, vectorize=vectorize)
+    influence_sub = jac.abs().sum(dim=(0, 2))  # Sum of L1 norm
+    num_nodes = cast(int, data.num_nodes)
+    # Scatter the influence scores back to the *global* node space
+    influence_full = torch.zeros(num_nodes, dtype=influence_sub.dtype,
+                                 device=device)
+    influence_full[k_hop_nodes] = influence_sub
+    return influence_full
+def jacobian_l1_agg_per_hop(
+    model: torch.nn.Module,
+    data: Data,
+    max_hops: int,
+    node_idx: int,
+    device: Union[torch.device, str],
+    vectorize: bool = True,
+) -> Tensor:
+    """Aggregate Jacobian L1 norms **per hop** for node_idx.
+    Returns a vector ``[I_0, I_1, …, I_k]`` where ``I_i`` is the *total*
+    influence exerted by nodes that are exactly *i* hops away from
+    ``node_idx``.
+    """
+    num_nodes = cast(int, data.num_nodes)
+    edge_index = cast(Tensor, data.edge_index)
+    influence = jacobian_l1(model, data, max_hops, node_idx, device,
+                            vectorize=vectorize)
+    hop_subsets = k_hop_subsets_exact(node_idx, max_hops, edge_index,
+                                      num_nodes, influence.device)
+    single_node_influence_per_hop = [influence[s].sum() for s in hop_subsets]
+    return torch.tensor(single_node_influence_per_hop, device=influence.device)
+def avg_total_influence(
+    influence_all_nodes: Tensor,
+    normalize: bool = True,
+) -> Tensor:
+    """Compute the mean influence per hop over all seed nodes, optionally
+    normalized by the hop-0 influence.
+    """
+    avg_total_influences = torch.mean(influence_all_nodes, dim=0)
+    if normalize:  # normalize by hop_0 (jacobian of the center node feature)
+        avg_total_influences = avg_total_influences / avg_total_influences[0]
+    return avg_total_influences
+def influence_weighted_receptive_field(T: Tensor) -> float:
+    """Compute the *influence‑weighted receptive field* ``R``.
+    Given an influence matrix ``T`` of shape ``[N, k+1]`` (i‑th row contains
+    the per‑hop influences of node *i*), the receptive field breadth *R* is
+    defined as the expected hop distance when weighting by influence.
+    A larger *R* indicates that, on average, influence comes from **farther**
+    hops.
+    """
+    normalised = T / torch.sum(T, dim=1, keepdim=True)
+    hops = torch.arange(T.shape[1]).float()  # 0 … k
+    breadth = normalised @ hops  # shape (N,)
+    return breadth.mean().item()
+def total_influence(
+    model: torch.nn.Module,
+    data: Data,
+    max_hops: int,
+    num_samples: Union[int, None] = None,
+    normalize: bool = True,
+    average: bool = True,
+    device: Union[torch.device, str] = "cpu",
+    vectorize: bool = True,
+) -> Tuple[Tensor, float]:
+    r"""Compute Jacobian‑based influence aggregates for *multiple* seed nodes,
+    as introduced in the
+    `"Towards Quantifying Long-Range Interactions in Graph Machine Learning:
+    a Large Graph Dataset and a Measurement"
+    <https://arxiv.org/abs/2503.09008>`_ paper.
+    This measurement quantifies how a GNN model's output at a node is
+    influenced by features of other nodes at increasing hop distances.
+    Specifically, for every sampled node :math:`v`, this method
+    1. evaluates the **L1‑norm** of the Jacobian of the model output at
+       :math:`v` w.r.t. the node features of its *k*-hop induced sub‑graph;
+    2. sums these scores **per hop** to obtain the influence vector
+       :math:`(I_{0}, I_{1}, \dots, I_{k})`;
+    3. optionally averages those vectors over all sampled nodes and
+       optionally normalises them by :math:`I_{0}`.
+    Please refer to Section 4 of the paper for a more detailed definition.
+    Args:
+        model (torch.nn.Module): A PyTorch Geometric‑compatible model with
+            forward signature ``model(x, edge_index) -> Tensor``.
+        data (torch_geometric.data.Data): Graph data object providing at least
+            :obj:`x` (node features) and :obj:`edge_index` (connectivity).
+        max_hops (int): Maximum hop distance :math:`k`.
+        num_samples (int, optional): Number of random seed nodes to evaluate.
+            If :obj:`None`, all nodes are used. (default: :obj:`None`)
+        normalize (bool, optional): If :obj:`True`, normalize each hop‑wise
+            influence by the influence of hop 0. (default: :obj:`True`)
+        average (bool, optional): If :obj:`True`, return the hop‑wise **mean**
+            over all seed nodes (shape ``[k+1]``).
+            If :obj:`False`, return the full influence matrix of shape
+            ``[N, k+1]``. (default: :obj:`True`)
+        device (torch.device or str, optional): Device on which to perform the
+            computation. (default: :obj:`"cpu"`)
+        vectorize (bool, optional): Forwarded to
+            :func:`torch.autograd.functional.jacobian`.  Keeping this
+            :obj:`True` is often faster but increases memory usage.
+            (default: :obj:`True`)
+    Returns:
+        Tuple[Tensor, float]:
+            * **avg_influence** (*Tensor*):
+              shape ``[k+1]`` if :obj:`average=True`;
+              shape ``[N, k+1]`` otherwise.
+            * **R** (*float*): Influence‑weighted receptive‑field breadth
+              returned by :func:`influence_weighted_receptive_field`.
+    Example::
+        >>> avg_I, R = total_influence(model, data, max_hops=3,
+        ...                            num_samples=1000)
+        >>> avg_I
+        tensor([1.0000, 0.1273, 0.0142, 0.0019])
+        >>> R
+        0.216
+    """
+    num_samples = data.num_nodes if num_samples is None else num_samples
+    num_nodes = cast(int, data.num_nodes)
+    nodes = torch.randperm(num_nodes)[:num_samples].tolist()
+    influence_all_nodes: List[Tensor] = [
+        jacobian_l1_agg_per_hop(model, data, max_hops, n, device,
+                                vectorize=vectorize)
+        for n in tqdm(nodes, desc="Influence")
+    ]
+    allnodes = torch.vstack(influence_all_nodes).detach().cpu()
+    # Average total influence at each hop
+    if average:
+        avg_influence = avg_total_influence(allnodes, normalize=normalize)
+    else:
+        avg_influence = allnodes
+    # Influence‑weighted receptive field
+    R = influence_weighted_receptive_field(allnodes)
+    return avg_influence, R

torch_geometric/utils/map.py CHANGED Viewed

@@ -1,4 +1,3 @@
-import warnings
 from typing import Optional, Tuple, Union
 import numpy as np
@@ -6,6 +5,10 @@ import torch
 from torch import Tensor
 from torch.utils.dlpack import from_dlpack
+from torch_geometric.warnings import WarningCache
+_warning_cache = WarningCache()
 def map_index(
     src: Tensor,
@@ -14,7 +17,7 @@ def map_index(
     inclusive: bool = False,
 ) -> Tuple[Tensor, Optional[Tensor]]:
     r"""Maps indices in :obj:`src` to the positional value of their
-    corresponding occurence in :obj:`index`.
+    corresponding occurrence in :obj:`index`.
     Indices must be strictly positive.
     Args:
@@ -93,10 +96,10 @@ def map_index(
             WITH_CUDF = True
         except ImportError:
             import pandas as pd
-            warnings.warn("Using CPU-based processing within 'map_index' "
-                          "which may cause slowdowns and device "
-                          "synchronization. Consider installing 'cudf' to "
-                          "accelerate computation")
+            _warning_cache.warn("Using CPU-based processing within "
+                                "'map_index' which may cause slowdowns and "
+                                "device synchronization. Consider installing "
+                                "'cudf' to accelerate computation")
     else:
         import pandas as pd
@@ -148,10 +151,11 @@ def map_index(
         if inclusive:
             try:
                 out = from_dlpack(result['right_ser'].to_dlpack())
-            except ValueError:
-                raise ValueError("Found invalid entries in 'src' that do not "
-                                 "have a corresponding entry in 'index'. Set "
-                                 "`inclusive=False` to ignore these entries.")
+            except ValueError as e:
+                raise ValueError(
+                    "Found invalid entries in 'src' that do not "
+                    "have a corresponding entry in 'index'. Set "
+                    "`inclusive=False` to ignore these entries.") from e
         else:
             out = from_dlpack(result['right_ser'].fillna(-1).to_dlpack())

torch_geometric/utils/nested.py CHANGED Viewed

@@ -43,7 +43,7 @@ def to_nested_tensor(
         xs = [x]
     # This currently copies the data, although `x` is already contiguous.
-    # Sadly, there does not exist any (public) API to preven this :(
+    # Sadly, there does not exist any (public) API to prevent this :(
     return torch.nested.as_nested_tensor(xs)

torch_geometric/utils/smiles.py CHANGED Viewed

@@ -91,7 +91,7 @@ def from_rdmol(mol: Any) -> 'torch_geometric.data.Data':
     assert isinstance(mol, Chem.Mol)
     xs: List[List[int]] = []
-    for atom in mol.GetAtoms():  # type: ignore
+    for atom in mol.GetAtoms():
         row: List[int] = []
         row.append(x_map['atomic_num'].index(atom.GetAtomicNum()))
         row.append(x_map['chirality'].index(str(atom.GetChiralTag())))
@@ -108,7 +108,7 @@ def from_rdmol(mol: Any) -> 'torch_geometric.data.Data':
     x = torch.tensor(xs, dtype=torch.long).view(-1, 9)
     edge_indices, edge_attrs = [], []
-    for bond in mol.GetBonds():  # type: ignore
+    for bond in mol.GetBonds():
         i = bond.GetBeginAtomIdx()
         j = bond.GetEndAtomIdx()
@@ -148,7 +148,7 @@ def from_smiles(
     """
     from rdkit import Chem, RDLogger
-    RDLogger.DisableLog('rdApp.*')  # type: ignore
+    RDLogger.DisableLog('rdApp.*')  # type: ignore[attr-defined]
     mol = Chem.MolFromSmiles(smiles)

pyg-nightly 2.6.0.dev20240704__py3-none-any.whl → 2.8.0.dev20251207__py3-none-any.whl

Potentially problematic release.

pyg-nightly 2.6.0.dev20240704__py3-none-any.whl → 2.8.0.dev20251207__py3-none-any.whl