PyPI - scikit-network - Versions diffs - 0.28.3__cp39-cp39-macosx_12_0_arm64.whl - Mend

scikit-network 0.28.3__cp39-cp39-macosx_12_0_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of scikit-network might be problematic. Click here for more details.

Files changed (240) hide show

scikit_network-0.28.3.dist-info/AUTHORS.rst +41 -0
scikit_network-0.28.3.dist-info/LICENSE +34 -0
scikit_network-0.28.3.dist-info/METADATA +457 -0
scikit_network-0.28.3.dist-info/RECORD +240 -0
scikit_network-0.28.3.dist-info/WHEEL +5 -0
scikit_network-0.28.3.dist-info/top_level.txt +1 -0
sknetwork/__init__.py +21 -0
sknetwork/classification/__init__.py +8 -0
sknetwork/classification/base.py +84 -0
sknetwork/classification/base_rank.py +143 -0
sknetwork/classification/diffusion.py +134 -0
sknetwork/classification/knn.py +162 -0
sknetwork/classification/metrics.py +205 -0
sknetwork/classification/pagerank.py +66 -0
sknetwork/classification/propagation.py +152 -0
sknetwork/classification/tests/__init__.py +1 -0
sknetwork/classification/tests/test_API.py +35 -0
sknetwork/classification/tests/test_diffusion.py +37 -0
sknetwork/classification/tests/test_knn.py +24 -0
sknetwork/classification/tests/test_metrics.py +53 -0
sknetwork/classification/tests/test_pagerank.py +20 -0
sknetwork/classification/tests/test_propagation.py +24 -0
sknetwork/classification/vote.cpython-39-darwin.so +0 -0
sknetwork/classification/vote.pyx +58 -0
sknetwork/clustering/__init__.py +7 -0
sknetwork/clustering/base.py +102 -0
sknetwork/clustering/kmeans.py +142 -0
sknetwork/clustering/louvain.py +255 -0
sknetwork/clustering/louvain_core.cpython-39-darwin.so +0 -0
sknetwork/clustering/louvain_core.pyx +134 -0
sknetwork/clustering/metrics.py +91 -0
sknetwork/clustering/postprocess.py +66 -0
sknetwork/clustering/propagation_clustering.py +108 -0
sknetwork/clustering/tests/__init__.py +1 -0
sknetwork/clustering/tests/test_API.py +37 -0
sknetwork/clustering/tests/test_kmeans.py +47 -0
sknetwork/clustering/tests/test_louvain.py +104 -0
sknetwork/clustering/tests/test_metrics.py +50 -0
sknetwork/clustering/tests/test_post_processing.py +23 -0
sknetwork/clustering/tests/test_postprocess.py +39 -0
sknetwork/data/__init__.py +5 -0
sknetwork/data/load.py +408 -0
sknetwork/data/models.py +459 -0
sknetwork/data/parse.py +621 -0
sknetwork/data/test_graphs.py +84 -0
sknetwork/data/tests/__init__.py +1 -0
sknetwork/data/tests/test_API.py +30 -0
sknetwork/data/tests/test_load.py +95 -0
sknetwork/data/tests/test_models.py +52 -0
sknetwork/data/tests/test_parse.py +253 -0
sknetwork/data/tests/test_test_graphs.py +30 -0
sknetwork/data/tests/test_toy_graphs.py +68 -0
sknetwork/data/toy_graphs.py +619 -0
sknetwork/embedding/__init__.py +10 -0
sknetwork/embedding/base.py +90 -0
sknetwork/embedding/force_atlas.py +197 -0
sknetwork/embedding/louvain_embedding.py +174 -0
sknetwork/embedding/louvain_hierarchy.py +142 -0
sknetwork/embedding/metrics.py +66 -0
sknetwork/embedding/random_projection.py +133 -0
sknetwork/embedding/spectral.py +214 -0
sknetwork/embedding/spring.py +198 -0
sknetwork/embedding/svd.py +363 -0
sknetwork/embedding/tests/__init__.py +1 -0
sknetwork/embedding/tests/test_API.py +73 -0
sknetwork/embedding/tests/test_force_atlas.py +35 -0
sknetwork/embedding/tests/test_louvain_embedding.py +33 -0
sknetwork/embedding/tests/test_louvain_hierarchy.py +19 -0
sknetwork/embedding/tests/test_metrics.py +29 -0
sknetwork/embedding/tests/test_random_projection.py +28 -0
sknetwork/embedding/tests/test_spectral.py +84 -0
sknetwork/embedding/tests/test_spring.py +50 -0
sknetwork/embedding/tests/test_svd.py +37 -0
sknetwork/flow/__init__.py +3 -0
sknetwork/flow/flow.py +73 -0
sknetwork/flow/tests/__init__.py +1 -0
sknetwork/flow/tests/test_flow.py +17 -0
sknetwork/flow/tests/test_utils.py +69 -0
sknetwork/flow/utils.py +91 -0
sknetwork/gnn/__init__.py +10 -0
sknetwork/gnn/activation.py +117 -0
sknetwork/gnn/base.py +155 -0
sknetwork/gnn/base_activation.py +89 -0
sknetwork/gnn/base_layer.py +109 -0
sknetwork/gnn/gnn_classifier.py +381 -0
sknetwork/gnn/layer.py +153 -0
sknetwork/gnn/layers.py +127 -0
sknetwork/gnn/loss.py +180 -0
sknetwork/gnn/neighbor_sampler.py +65 -0
sknetwork/gnn/optimizer.py +163 -0
sknetwork/gnn/tests/__init__.py +1 -0
sknetwork/gnn/tests/test_activation.py +56 -0
sknetwork/gnn/tests/test_base.py +79 -0
sknetwork/gnn/tests/test_base_layer.py +37 -0
sknetwork/gnn/tests/test_gnn_classifier.py +192 -0
sknetwork/gnn/tests/test_layers.py +80 -0
sknetwork/gnn/tests/test_loss.py +33 -0
sknetwork/gnn/tests/test_neigh_sampler.py +23 -0
sknetwork/gnn/tests/test_optimizer.py +43 -0
sknetwork/gnn/tests/test_utils.py +93 -0
sknetwork/gnn/utils.py +219 -0
sknetwork/hierarchy/__init__.py +7 -0
sknetwork/hierarchy/base.py +69 -0
sknetwork/hierarchy/louvain_hierarchy.py +264 -0
sknetwork/hierarchy/metrics.py +234 -0
sknetwork/hierarchy/paris.cpython-39-darwin.so +0 -0
sknetwork/hierarchy/paris.pyx +317 -0
sknetwork/hierarchy/postprocess.py +350 -0
sknetwork/hierarchy/tests/__init__.py +1 -0
sknetwork/hierarchy/tests/test_API.py +25 -0
sknetwork/hierarchy/tests/test_algos.py +29 -0
sknetwork/hierarchy/tests/test_metrics.py +62 -0
sknetwork/hierarchy/tests/test_postprocess.py +57 -0
sknetwork/hierarchy/tests/test_ward.py +25 -0
sknetwork/hierarchy/ward.py +94 -0
sknetwork/linalg/__init__.py +9 -0
sknetwork/linalg/basics.py +37 -0
sknetwork/linalg/diteration.cpython-39-darwin.so +0 -0
sknetwork/linalg/diteration.pyx +49 -0
sknetwork/linalg/eig_solver.py +93 -0
sknetwork/linalg/laplacian.py +15 -0
sknetwork/linalg/normalization.py +66 -0
sknetwork/linalg/operators.py +225 -0
sknetwork/linalg/polynome.py +76 -0
sknetwork/linalg/ppr_solver.py +170 -0
sknetwork/linalg/push.cpython-39-darwin.so +0 -0
sknetwork/linalg/push.pyx +73 -0
sknetwork/linalg/sparse_lowrank.py +142 -0
sknetwork/linalg/svd_solver.py +91 -0
sknetwork/linalg/tests/__init__.py +1 -0
sknetwork/linalg/tests/test_eig.py +44 -0
sknetwork/linalg/tests/test_laplacian.py +18 -0
sknetwork/linalg/tests/test_normalization.py +38 -0
sknetwork/linalg/tests/test_operators.py +70 -0
sknetwork/linalg/tests/test_polynome.py +38 -0
sknetwork/linalg/tests/test_ppr.py +50 -0
sknetwork/linalg/tests/test_sparse_lowrank.py +61 -0
sknetwork/linalg/tests/test_svd.py +38 -0
sknetwork/linkpred/__init__.py +4 -0
sknetwork/linkpred/base.py +80 -0
sknetwork/linkpred/first_order.py +508 -0
sknetwork/linkpred/first_order_core.cpython-39-darwin.so +0 -0
sknetwork/linkpred/first_order_core.pyx +315 -0
sknetwork/linkpred/postprocessing.py +98 -0
sknetwork/linkpred/tests/__init__.py +1 -0
sknetwork/linkpred/tests/test_API.py +49 -0
sknetwork/linkpred/tests/test_postprocessing.py +21 -0
sknetwork/path/__init__.py +4 -0
sknetwork/path/metrics.py +148 -0
sknetwork/path/search.py +65 -0
sknetwork/path/shortest_path.py +186 -0
sknetwork/path/tests/__init__.py +1 -0
sknetwork/path/tests/test_metrics.py +29 -0
sknetwork/path/tests/test_search.py +25 -0
sknetwork/path/tests/test_shortest_path.py +45 -0
sknetwork/ranking/__init__.py +9 -0
sknetwork/ranking/base.py +56 -0
sknetwork/ranking/betweenness.cpython-39-darwin.so +0 -0
sknetwork/ranking/betweenness.pyx +99 -0
sknetwork/ranking/closeness.py +95 -0
sknetwork/ranking/harmonic.py +82 -0
sknetwork/ranking/hits.py +94 -0
sknetwork/ranking/katz.py +81 -0
sknetwork/ranking/pagerank.py +107 -0
sknetwork/ranking/postprocess.py +25 -0
sknetwork/ranking/tests/__init__.py +1 -0
sknetwork/ranking/tests/test_API.py +34 -0
sknetwork/ranking/tests/test_betweenness.py +38 -0
sknetwork/ranking/tests/test_closeness.py +34 -0
sknetwork/ranking/tests/test_hits.py +20 -0
sknetwork/ranking/tests/test_pagerank.py +69 -0
sknetwork/regression/__init__.py +4 -0
sknetwork/regression/base.py +56 -0
sknetwork/regression/diffusion.py +190 -0
sknetwork/regression/tests/__init__.py +1 -0
sknetwork/regression/tests/test_API.py +34 -0
sknetwork/regression/tests/test_diffusion.py +48 -0
sknetwork/sknetwork.py +3 -0
sknetwork/topology/__init__.py +9 -0
sknetwork/topology/dag.py +74 -0
sknetwork/topology/dag_core.cpython-39-darwin.so +0 -0
sknetwork/topology/dag_core.pyx +38 -0
sknetwork/topology/kcliques.cpython-39-darwin.so +0 -0
sknetwork/topology/kcliques.pyx +193 -0
sknetwork/topology/kcore.cpython-39-darwin.so +0 -0
sknetwork/topology/kcore.pyx +120 -0
sknetwork/topology/structure.py +234 -0
sknetwork/topology/tests/__init__.py +1 -0
sknetwork/topology/tests/test_cliques.py +28 -0
sknetwork/topology/tests/test_cores.py +21 -0
sknetwork/topology/tests/test_dag.py +26 -0
sknetwork/topology/tests/test_structure.py +99 -0
sknetwork/topology/tests/test_triangles.py +42 -0
sknetwork/topology/tests/test_wl_coloring.py +49 -0
sknetwork/topology/tests/test_wl_kernel.py +31 -0
sknetwork/topology/triangles.cpython-39-darwin.so +0 -0
sknetwork/topology/triangles.pyx +166 -0
sknetwork/topology/weisfeiler_lehman.py +163 -0
sknetwork/topology/weisfeiler_lehman_core.cpython-39-darwin.so +0 -0
sknetwork/topology/weisfeiler_lehman_core.pyx +116 -0
sknetwork/utils/__init__.py +40 -0
sknetwork/utils/base.py +35 -0
sknetwork/utils/check.py +354 -0
sknetwork/utils/co_neighbor.py +71 -0
sknetwork/utils/format.py +219 -0
sknetwork/utils/kmeans.py +89 -0
sknetwork/utils/knn.py +166 -0
sknetwork/utils/knn1d.cpython-39-darwin.so +0 -0
sknetwork/utils/knn1d.pyx +80 -0
sknetwork/utils/membership.py +82 -0
sknetwork/utils/minheap.cpython-39-darwin.so +0 -0
sknetwork/utils/minheap.pxd +22 -0
sknetwork/utils/minheap.pyx +111 -0
sknetwork/utils/neighbors.py +115 -0
sknetwork/utils/seeds.py +75 -0
sknetwork/utils/simplex.py +140 -0
sknetwork/utils/tests/__init__.py +1 -0
sknetwork/utils/tests/test_base.py +28 -0
sknetwork/utils/tests/test_bunch.py +16 -0
sknetwork/utils/tests/test_check.py +190 -0
sknetwork/utils/tests/test_co_neighbor.py +43 -0
sknetwork/utils/tests/test_format.py +61 -0
sknetwork/utils/tests/test_kmeans.py +21 -0
sknetwork/utils/tests/test_knn.py +32 -0
sknetwork/utils/tests/test_membership.py +24 -0
sknetwork/utils/tests/test_neighbors.py +41 -0
sknetwork/utils/tests/test_projection_simplex.py +33 -0
sknetwork/utils/tests/test_seeds.py +67 -0
sknetwork/utils/tests/test_verbose.py +15 -0
sknetwork/utils/tests/test_ward.py +20 -0
sknetwork/utils/timeout.py +38 -0
sknetwork/utils/verbose.py +37 -0
sknetwork/utils/ward.py +60 -0
sknetwork/visualization/__init__.py +4 -0
sknetwork/visualization/colors.py +34 -0
sknetwork/visualization/dendrograms.py +229 -0
sknetwork/visualization/graphs.py +819 -0
sknetwork/visualization/tests/__init__.py +1 -0
sknetwork/visualization/tests/test_dendrograms.py +53 -0
sknetwork/visualization/tests/test_graphs.py +167 -0

sknetwork/embedding/tests/test_spring.py ADDED Viewed

@@ -0,0 +1,50 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""tests for spring embeddings"""
+import unittest
+from sknetwork.data.test_graphs import *
+from sknetwork.embedding import Spring
+class TestEmbeddings(unittest.TestCase):
+    """Shape and argument-validation checks for the ``Spring`` layout."""
+    def test_shape(self):
+        """The layout has one row per node and as many columns as requested components."""
+        for graph in (test_graph(), test_digraph()):
+            n_nodes = graph.shape[0]
+            # No n_components given: the test expects a two-column layout.
+            flat = Spring().fit_transform(graph)
+            self.assertEqual((n_nodes, 2), flat.shape)
+            spatial = Spring(n_components=3).fit_transform(graph)
+            self.assertEqual((n_nodes, 3), spatial.shape)
+    def test_pos_init(self):
+        """Initial positions can be given by name at construction or as an array at fit time."""
+        graph = test_graph()
+        expected_shape = (graph.shape[0], 2)
+        algo = Spring(strength=0.1, position_init='spectral', tol=1e3)
+        first = algo.fit_transform(graph)
+        self.assertEqual(expected_shape, first.shape)
+        # Feed the previous layout back in as the starting point.
+        second = algo.fit_transform(graph, position_init=first)
+        self.assertEqual(expected_shape, second.shape)
+    def test_approx_radius(self):
+        """Setting ``approx_radius`` still yields a layout of the usual shape."""
+        graph = test_graph()
+        n_nodes = graph.shape[0]
+        algo = Spring(approx_radius=1.)
+        positions = algo.fit_transform(graph)
+        self.assertEqual((n_nodes, 2), positions.shape)
+    def test_errors(self):
+        """Invalid ``position_init`` values are rejected."""
+        graph = test_graph()
+        # Unknown initializer name at construction time.
+        with self.assertRaises(ValueError):
+            Spring(position_init='toto')
+        # Array given at fit time whose shape the test expects to be refused.
+        with self.assertRaises(ValueError):
+            Spring().fit(graph, position_init=np.ones((2, 2)))
+        # A string given at fit time is expected to raise a type error.
+        with self.assertRaises(TypeError):
+            # noinspection PyTypeChecker
+            Spring().fit(graph, position_init='toto')

sknetwork/embedding/tests/test_svd.py ADDED Viewed

@@ -0,0 +1,37 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""tests for svd"""
+import unittest
+import numpy as np
+from sknetwork.data import star_wars
+from sknetwork.embedding import GSVD, SVD, PCA
+from sknetwork.linalg import LanczosSVD
+class TestSVD(unittest.TestCase):
+    """Smoke tests for the SVD-based embeddings with different solvers."""
+    def test_options(self):
+        """Fit GSVD, PCA and SVD on the Star Wars biadjacency matrix and check embedding shapes."""
+        biadjacency = star_wars(metadata=False)
+        n_row, n_col = biadjacency.shape
+        min_dim = min(biadjacency.shape) - 1
+        # Five components are requested; the fit is expected to warn and
+        # the resulting embeddings to have min_dim columns.
+        halko_gsvd = GSVD(n_components=5, regularization=0., solver='halko')
+        with self.assertWarns(Warning):
+            halko_gsvd.fit(biadjacency)
+        self.assertEqual(halko_gsvd.embedding_row_.shape, (n_row, min_dim))
+        self.assertEqual(halko_gsvd.embedding_col_.shape, (n_col, min_dim))
+        # Lanczos solver with regularization; predict is only checked to run on a random row vector.
+        lanczos_gsvd = GSVD(n_components=1, regularization=0.1, solver='lanczos')
+        lanczos_gsvd.fit(biadjacency)
+        lanczos_gsvd.predict(np.random.rand(n_col))
+        # Solver given by name.
+        pca = PCA(n_components=min_dim, solver='lanczos')
+        pca.fit(biadjacency)
+        self.assertEqual(pca.embedding_row_.shape, (n_row, min_dim))
+        # Solver given as an object.
+        svd = SVD(n_components=min_dim, solver=LanczosSVD())
+        svd.fit(biadjacency)
+        self.assertEqual(svd.embedding_row_.shape, (n_row, min_dim))

sknetwork/flow/__init__.py ADDED Viewed

@@ -0,0 +1,3 @@
+"""flow module"""
+from sknetwork.flow.utils import get_residual_graph, flow_is_feasible, find_excess
+from sknetwork.flow.push_relabel import get_max_flow

sknetwork/flow/flow.py ADDED Viewed

@@ -0,0 +1,73 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""
+Created on July 7, 2022.
+@author: Henry L. Carscadden <hcarscad@gmail.com>
+"""
+from scipy import sparse
+import numpy as np
+from sknetwork.flow.utils import get_residual_graph
+from sknetwork.flow.flow_core import push
+def residual_to_flow(adjacency: sparse.csr_matrix, residual: sparse.csr_matrix, preflow: sparse.csr_matrix):
+    """Read the flow back from the reverse arcs of a residual graph.
+    For every nonzero entry ``(u, v)`` of ``adjacency``, ``preflow[u, v]`` is overwritten with ``residual[v, u]``.
+    Parameters
+    ----------
+    adjacency : sparse.csr_matrix
+        Adjacency matrix whose nonzero entries select the edges to fill in.
+    residual : sparse.csr_matrix
+        Residual graph; the value on the reversed edge is taken as the flow.
+    preflow : sparse.csr_matrix
+        Matrix receiving the flow values. It is modified in place.
+    Returns
+    -------
+    preflow : sparse.csr_matrix
+        The same object as the ``preflow`` argument, after the update.
+    """
+    sources, targets = adjacency.nonzero()
+    for u, v in zip(sources, targets):
+        preflow[u, v] = residual[v, u]
+    return preflow
+def push_relabel(adjacency: sparse.csr_matrix, src: int, sink: int):
+    """Find a maximum flow with the classic push-relabel algorithm.
+    Parameters
+    ----------
+    adjacency : sparse.csr_matrix
+        The adjacency matrix of the graph with weights containing the edge capacities.
+    src : int
+        The node that is the source of the flow.
+    sink : int
+        The node that receives the flow.
+    Returns
+    -------
+    flow : sparse.csr_matrix
+        A maximum flow for the graph.
+    References
+    ----------
+    Goldberg, A V; Tarjan, R E (1986). A new approach to the maximum flow problem.
+    Proceedings of the eighteenth annual ACM symposium on Theory of computing – STOC 86.
+    """
+    # Initialize the preflow: same sparsity pattern as the adjacency, all values zero.
+    # NOTE(review): values are stored as int32, so non-integer capacities would
+    # presumably be truncated on assignment below - confirm.
+    preflow_vals = np.zeros(dtype=np.int32, shape=(adjacency.nnz,))
+    preflow = sparse.csr_matrix((preflow_vals, adjacency.indices, adjacency.indptr), shape=adjacency.shape)
+    # Initialize the heights to 0.
+    heights = np.zeros(shape=(adjacency.shape[0],), dtype=np.int32)
+    # Set the height of the src to n, the number of nodes.
+    heights[src] = adjacency.shape[0]
+    # Create the excess flow array (one entry per node).
+    excess_flow = np.zeros(shape=(adjacency.shape[0],), dtype=np.int32)
+    # Send all the possible flow out of the source: saturate each outgoing edge
+    # and record the amount as excess on the receiving node.
+    for dest_node in adjacency.indices[adjacency.indptr[src]:adjacency.indptr[src + 1]]:
+        edge_capacity = adjacency[src, dest_node]
+        preflow[src, dest_node] = edge_capacity
+        if edge_capacity > 0:
+            excess_flow[dest_node] = edge_capacity
+    # Initialize the residual graph from the initial preflow.
+    residual = get_residual_graph(adjacency, preflow)
+    non_zero_indices = excess_flow.nonzero()[0]
+    # While there are nodes with nonzero excess, push or relabel.
+    # NOTE(review): `push` comes from the compiled `flow_core` module and is not
+    # visible here; it presumably updates `residual` and `excess_flow` in place and
+    # returns whether a push happened. Termination relies on it also handling
+    # excess that reaches `src` or `sink` - confirm.
+    while non_zero_indices.size > 0:
+        # Visit every node that currently has nonzero excess.
+        for curr_node in non_zero_indices:
+            pushed = push(residual, curr_node, src, sink, heights, excess_flow)
+            # Relabel step: no push was possible, so raise the node by one level.
+            if not pushed:
+                heights[curr_node] = heights[curr_node] + 1
+        # Recompute the set of active nodes after the sweep.
+        non_zero_indices = excess_flow.nonzero()[0]
+    # Convert the final residual graph back into a flow on the original edges.
+    return residual_to_flow(adjacency, residual, preflow)

sknetwork/flow/tests/__init__.py ADDED Viewed

@@ -0,0 +1 @@
+"Tests for flow"

sknetwork/flow/tests/test_flow.py ADDED Viewed

@@ -0,0 +1,17 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""tests for push_relabel.py"""
+import unittest
+from sknetwork.flow import get_max_flow, find_excess
+from scipy import sparse
+class TestFlow(unittest.TestCase):
+    """End-to-end check of the maximum-flow solver on a small 7-node network."""
+    def test_push_relabel_1(self):
+        """The flow entering the sink is 3 and every intermediate node has zero excess."""
+        capacities = [
+            [0, 2, 3, 0, 0, 0, 0],
+            [0, 0, 0, 3, 0, 0, 0],
+            [0, 0, 0, 2, 0, 0, 0],
+            [0, 0, 0, 0, 1, 3, 0],
+            [0, 0, 0, 0, 0, 0, 2],
+            [0, 0, 0, 0, 0, 0, 2],
+            [0, 0, 0, 0, 0, 0, 0],
+        ]
+        network = sparse.csr_matrix(capacities)
+        max_flow = get_max_flow(network, 0, 6)
+        self.assertEqual(3, max_flow[:, 6].sum())
+        # Nodes 1..5 are neither source nor sink, so inflow must equal outflow.
+        for node in range(1, 6):
+            self.assertEqual(0, find_excess(max_flow, node))

sknetwork/flow/tests/test_utils.py ADDED Viewed

@@ -0,0 +1,69 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""tests for utils.py"""
+import unittest
+from sknetwork.flow import get_residual_graph, flow_is_feasible, find_excess
+from scipy.sparse import csr_matrix
+class TestUtils(unittest.TestCase):
+    """Tests for the flow helpers, all on the same 7-node capacity network (source 0, sink 6)."""
+    def test_get_residual_graph(self):
+        """Every nonzero entry of the expected residual graph matches the computed one."""
+        adjacency = csr_matrix([[0, 2, 3, 0, 0, 0, 0], [0, 0, 0, 3, 0, 0, 0],
+                                [0, 0, 0, 2, 0, 0, 0], [0, 0, 0, 0, 1, 3, 0], [0, 0, 0, 0, 0, 0, 2],
+                                [0, 0, 0, 0, 0, 0, 2], [0, 0, 0, 0, 0, 0, 0]])
+        flow = csr_matrix([[0, 1, 0, 0, 0, 0, 0], [0, 0, 0, 1, 0, 0, 0],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 1, 0, 0], [0, 0, 0, 0, 0, 0, 1],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0]])
+        residual = csr_matrix([[0, 1, 3, 0, 0, 0, 0], [1, 0, 0, 2, 0, 0, 0],
+                               [0, 0, 0, 2, 0, 0, 0], [0, 1, 0, 0, 0, 3, 0], [0, 0, 0, 1, 0, 0, 1],
+                               [0, 0, 0, 0, 0, 0, 2], [0, 0, 0, 0, 0, 0, 0]])
+        # get_residual_graph takes only the capacities and the flow (no source/sink).
+        res_out = get_residual_graph(adjacency, flow)
+        rows, cols = residual.nonzero()
+        for row, col in zip(rows, cols):
+            self.assertEqual(residual[row, col], res_out[row, col])
+    def test_flow_is_feasible_1(self):
+        """Node 1 receives 1 unit but sends 2: conservation is violated."""
+        adjacency = csr_matrix([[0, 2, 3, 0, 0, 0, 0], [0, 0, 0, 3, 0, 0, 0],
+                                [0, 0, 0, 2, 0, 0, 0], [0, 0, 0, 0, 1, 3, 0], [0, 0, 0, 0, 0, 0, 2],
+                                [0, 0, 0, 0, 0, 0, 2], [0, 0, 0, 0, 0, 0, 0]])
+        flow = csr_matrix([[0, 1, 0, 0, 0, 0, 0], [0, 0, 0, 2, 0, 0, 0],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 1, 0, 0], [0, 0, 0, 0, 0, 0, 1],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0]])
+        self.assertFalse(flow_is_feasible(adjacency, flow, 0, 6))
+    def test_flow_is_feasible_2(self):
+        """Edge 3 -> 4 carries 2 units over a capacity of 1 and node 4 does not conserve flow."""
+        adjacency = csr_matrix([[0, 2, 3, 0, 0, 0, 0], [0, 0, 0, 3, 0, 0, 0],
+                                [0, 0, 0, 2, 0, 0, 0], [0, 0, 0, 0, 1, 3, 0], [0, 0, 0, 0, 0, 0, 2],
+                                [0, 0, 0, 0, 0, 0, 2], [0, 0, 0, 0, 0, 0, 0]])
+        flow = csr_matrix([[0, 2, 0, 0, 0, 0, 0], [0, 0, 0, 2, 0, 0, 0],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 2, 0, 0], [0, 0, 0, 0, 0, 0, 1],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0]])
+        self.assertFalse(flow_is_feasible(adjacency, flow, 0, 6))
+    def test_flow_is_feasible_3(self):
+        """One unit routed along 0 -> 1 -> 3 -> 4 -> 6 is a feasible flow."""
+        adjacency = csr_matrix([[0, 2, 3, 0, 0, 0, 0], [0, 0, 0, 3, 0, 0, 0],
+                                [0, 0, 0, 2, 0, 0, 0], [0, 0, 0, 0, 1, 3, 0], [0, 0, 0, 0, 0, 0, 2],
+                                [0, 0, 0, 0, 0, 0, 2], [0, 0, 0, 0, 0, 0, 0]])
+        flow = csr_matrix([[0, 1, 0, 0, 0, 0, 0], [0, 0, 0, 1, 0, 0, 0],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 1, 0, 0], [0, 0, 0, 0, 0, 0, 1],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0]])
+        self.assertTrue(flow_is_feasible(adjacency, flow, 0, 6))
+    def test_flow_is_feasible_4(self):
+        """A flow matrix with a missing row has the wrong shape and is rejected."""
+        adjacency = csr_matrix([[0, 2, 3, 0, 0, 0, 0], [0, 0, 0, 3, 0, 0, 0],
+                                [0, 0, 0, 2, 0, 0, 0], [0, 0, 0, 0, 1, 3, 0], [0, 0, 0, 0, 0, 0, 2],
+                                [0, 0, 0, 0, 0, 0, 2], [0, 0, 0, 0, 0, 0, 0]])
+        flow = csr_matrix([[0, 1, 0, 0, 0, 0, 0], [0, 0, 0, 1, 0, 0, 0],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 1, 0, 0], [0, 0, 0, 0, 0, 0, 1],
+                           [0, 0, 0, 0, 0, 0, 0]])
+        self.assertRaises(ValueError, flow_is_feasible, adjacency, flow, 0, 6)
+    def test_flow_is_feasible_5(self):
+        """Edge 0 -> 1 carries 10 units over a capacity of 2.
+        Previously named ``test_flow_is_feasible_3``, which silently replaced the
+        feasible-flow test of the same name so that it never ran.
+        """
+        adjacency = csr_matrix([[0, 2, 3, 0, 0, 0, 0], [0, 0, 0, 3, 0, 0, 0],
+                                [0, 0, 0, 2, 0, 0, 0], [0, 0, 0, 0, 1, 3, 0], [0, 0, 0, 0, 0, 0, 2],
+                                [0, 0, 0, 0, 0, 0, 2], [0, 0, 0, 0, 0, 0, 0]])
+        flow = csr_matrix([[0, 10, 0, 0, 0, 0, 0], [0, 0, 0, 1, 0, 0, 0],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 1, 0, 0], [0, 0, 0, 0, 0, 0, 1],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0]])
+        self.assertFalse(flow_is_feasible(adjacency, flow, 0, 6))
+    def test_find_excess(self):
+        """Node 1 receives one unit and forwards one unit, so its excess is zero."""
+        flow = csr_matrix([[0, 1, 0, 0, 0, 0, 0], [0, 0, 0, 1, 0, 0, 0],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 1, 0, 0], [0, 0, 0, 0, 0, 0, 1],
+                           [0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0]])
+        # assertEqual: the assertEquals alias is deprecated and removed in Python 3.12.
+        self.assertEqual(0, find_excess(flow, 1))

sknetwork/flow/utils.py ADDED Viewed

@@ -0,0 +1,91 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""
+Created on July 4, 2022.
+@author: Henry L. Carscadden <hcarscad@gmail.com>
+"""
+from scipy import sparse
+import numpy as np
+def find_excess(flow: sparse.csr_matrix, node: int):
+    """Compute the excess of a node in a preflow: total inflow minus total outflow.
+    Parameters
+    ----------
+    flow: sparse.csr_matrix
+        The matrix showing the flows in the proposed solution (entry ``[i, j]`` is the flow from ``i`` to ``j``).
+    node : int
+        Node to compute the excess on.
+    Returns
+    -------
+    excess: int
+        Sum of column ``node`` minus sum of row ``node``.
+    """
+    incoming = flow[:, node].sum()
+    outgoing = flow[node, :].sum()
+    return incoming - outgoing
+def flow_is_feasible(adjacency: sparse.csr_matrix, flow: sparse.csr_matrix, src: int, sink: int):
+    """Check whether a flow satisfies the capacity and flow conservation constraints.
+    Parameters
+    ----------
+    adjacency : sparse.csr_matrix
+        The adjacency matrix of the graph with weights containing the edge capacities.
+    flow: sparse.csr_matrix
+        The matrix showing the flows in the proposed solution.
+    src : int
+        The node that is the source of the flow.
+    sink : int
+        The node that receives the flow.
+    Returns
+    -------
+    feasible: bool
+        Whether the flow is feasible, i.e., both the capacity and flow conservation constraints are satisfied.
+    Raises
+    ------
+    ValueError
+        If ``flow`` does not have the same shape as ``adjacency``.
+    """
+    if adjacency.shape != flow.shape:
+        raise ValueError("The flow has the incorrect shape.")
+    # Capacity constraint, checked on every entry: flow on a pair that is not an
+    # edge (capacity 0) is a violation too, not only flow above an existing capacity.
+    if (flow > adjacency).nnz > 0:
+        return False
+    # Conservation constraint, checked on every node except the source and the sink.
+    # This includes nodes without outgoing edges, which must not accumulate flow.
+    outflow = np.asarray(flow.sum(axis=1)).ravel()
+    inflow = np.asarray(flow.sum(axis=0)).ravel()
+    is_inner = np.ones(adjacency.shape[0], dtype=bool)
+    is_inner[[src, sink]] = False
+    return bool(np.all(inflow[is_inner] == outflow[is_inner]))
+def get_residual_graph(adjacency: sparse.csr_matrix, flow: sparse.csr_matrix):
+    """Build the residual graph of a flow, as used by maximum flow algorithms.
+    Each edge ``(u, v)`` of the graph contributes a forward arc ``(u, v)`` weighted by the
+    remaining capacity and a reverse arc ``(v, u)`` weighted by the current flow.
+    Parameters
+    ----------
+    adjacency : sparse.csr_matrix
+        The adjacency matrix of the graph with weights containing the edge capacities.
+    flow: sparse.csr_matrix
+        The matrix showing the flows in the proposed solution.
+    Returns
+    -------
+    residual: sparse.csr_matrix
+        The adjacency matrix of the residual graph (integer weights).
+    """
+    rows, cols = adjacency.nonzero()
+    n_edges = rows.size
+    # The builtin ``int`` replaces the ``np.int`` alias, which was removed in NumPy 1.24.
+    row_ind = np.zeros(2 * n_edges, dtype=int)
+    col_ind = np.zeros(2 * n_edges, dtype=int)
+    data = np.zeros(2 * n_edges, dtype=int)
+    for k, (row, col) in enumerate(zip(rows, cols)):
+        forward, backward = 2 * k, 2 * k + 1
+        edge_flow = flow[row, col]
+        # Forward arc: capacity still available on the edge.
+        row_ind[forward], col_ind[forward] = row, col
+        data[forward] = adjacency[row, col] - edge_flow
+        # Reverse arc: flow that can be cancelled.
+        row_ind[backward], col_ind[backward] = col, row
+        data[backward] = edge_flow
+    # Arcs landing on the same entry (a graph with both (u, v) and (v, u)) are summed.
+    residual = sparse.csr_matrix((data, (row_ind, col_ind)), shape=adjacency.shape)
+    return residual

sknetwork/gnn/__init__.py ADDED Viewed

@@ -0,0 +1,10 @@
+"""gnn module"""
+from sknetwork.gnn.base import BaseGNN
+from sknetwork.gnn.base_activation import BaseActivation, BaseLoss
+from sknetwork.gnn.base_layer import BaseLayer
+from sknetwork.gnn.gnn_classifier import GNNClassifier
+from sknetwork.gnn.layer import Convolution
+from sknetwork.gnn.neighbor_sampler import UniformNeighborSampler
+from sknetwork.gnn.activation import ReLu, Sigmoid, Softmax
+from sknetwork.gnn.loss import BinaryCrossEntropy, CrossEntropy
+from sknetwork.gnn.optimizer import BaseOptimizer, GD, ADAM

sknetwork/gnn/activation.py ADDED Viewed

@@ -0,0 +1,117 @@
+#!/usr/bin/env python3
+# coding: utf-8
+"""
+Created in April 2022
+@author: Simon Delarue <sdelarue@enst.fr>
+@author: Thomas Bonald <bonald@enst.fr>
+"""
+from typing import Union
+import numpy as np
+from scipy import special
+from sknetwork.gnn.base_activation import BaseActivation
+class ReLu(BaseActivation):
+    """Rectified Linear Unit activation:
+    :math:`\\sigma(x) = \\max(0, x)`
+    """
+    def __init__(self):
+        super().__init__('ReLu')
+    @staticmethod
+    def output(signal: np.ndarray) -> np.ndarray:
+        """Apply ReLu elementwise: negative entries are replaced by 0."""
+        rectified = np.maximum(signal, 0)
+        return rectified
+    @staticmethod
+    def gradient(signal: np.ndarray, direction: np.ndarray) -> np.ndarray:
+        """Gradient of ReLu: ``direction`` is kept where ``signal`` is positive and zeroed elsewhere."""
+        is_active = signal > 0
+        return direction * is_active
+class Sigmoid(BaseActivation):
+    """Sigmoid (logistic) activation:
+    :math:`\\sigma(x) = \\frac{1}{1+e^{-x}}`
+    """
+    def __init__(self):
+        super().__init__('Sigmoid')
+    @staticmethod
+    def output(signal: np.ndarray) -> np.ndarray:
+        """Apply the sigmoid elementwise (computed with ``scipy.special.expit``)."""
+        activated = special.expit(signal)
+        return activated
+    @staticmethod
+    def gradient(signal: np.ndarray, direction: np.ndarray) -> np.ndarray:
+        """Gradient of the sigmoid: ``s * (1 - s) * direction`` where ``s`` is the sigmoid of ``signal``."""
+        s = Sigmoid.output(signal)
+        return s * (1 - s) * direction
+class Softmax(BaseActivation):
+    """Softmax activation function:
+    :math:`\\sigma(x) =
+    (\\frac{e^{x_1}}{\\sum_{i=1}^N e^{x_i}},\\ldots,\\frac{e^{x_N}}{\\sum_{i=1}^N e^{x_i}})`
+    where :math:`N` is the number of channels.
+    """
+    def __init__(self):
+        super().__init__('Softmax')
+    @staticmethod
+    def output(signal: np.ndarray) -> np.ndarray:
+        """Apply the softmax along axis 1, so that each row sums to 1."""
+        probabilities = special.softmax(signal, axis=1)
+        return probabilities
+    @staticmethod
+    def gradient(signal: np.ndarray, direction: np.ndarray) -> np.ndarray:
+        """Gradient of the softmax: for each row, ``p * (d - <p, d>)`` with ``p`` the softmax of the row."""
+        probabilities = Softmax.output(signal)
+        # Row-wise inner product between the softmax output and the direction.
+        row_dots = (probabilities * direction).sum(axis=1)
+        centered = (direction.T - row_dots).T
+        return probabilities * centered
+def get_activation(activation: Union[BaseActivation, str] = 'identity') -> BaseActivation:
+    """Get the activation function.
+    Parameters
+    ----------
+    activation : Union[BaseActivation, str]
+        Activation function.
+        If a name is given, can be either ``'Identity'``, ``'ReLu'``, ``'Sigmoid'`` or ``'Softmax'``
+        (case-insensitive; the empty string also selects the identity).
+        If a custom activation function is given, must be of class BaseActivation.
+    Returns
+    -------
+    activation : BaseActivation
+        Activation function. An object given as input is returned unchanged.
+    Raises
+    ------
+    TypeError
+        Error raised if the input is not a string or an object of class BaseActivation.
+    ValueError
+        Error raised if the name of the activation function is unknown.
+    """
+    if isinstance(activation, BaseActivation):
+        return activation
+    # isinstance (rather than an exact type comparison) also accepts str subclasses such as numpy.str_.
+    if not isinstance(activation, str):
+        raise TypeError("Activation must be a string or an object of type \"BaseActivation\".")
+    # The identity is the base class itself, built with its default arguments.
+    known_activations = {
+        'identity': BaseActivation,
+        '': BaseActivation,
+        'relu': ReLu,
+        'sigmoid': Sigmoid,
+        'softmax': Softmax,
+    }
+    activation_class = known_activations.get(activation.lower())
+    if activation_class is None:
+        raise ValueError("Activation must be either \"Identity\", \"ReLu\", \"Sigmoid\" or \"Softmax\".")
+    return activation_class()

sknetwork/gnn/base.py ADDED Viewed

@@ -0,0 +1,155 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""
+Created on July 2022
+@author: Simon Delarue <sdelarue@enst.fr>
+@author: Thomas Bonald <bonald@enst.fr>
+"""
+from typing import Union
+import numpy as np
+from collections import defaultdict
+from scipy import sparse
+from sknetwork.gnn.loss import BaseLoss, get_loss
+from sknetwork.gnn.optimizer import BaseOptimizer, get_optimizer
+from sknetwork.utils.verbose import VerboseMixin
+class BaseGNN(VerboseMixin):
+    """Base class for GNNs.
+    Holds the loss, the optimizer and the list of layers, and implements backpropagation.
+    Subclasses must implement ``fit`` and ``predict``.
+    Parameters
+    ----------
+    loss : str or custom loss (default = ``'CrossEntropy'``)
+        Loss function.
+    optimizer : str or custom optimizer (default = ``'Adam'``)
+        Optimizer used for training.
+        * ``'Adam'``, a stochastic gradient-based optimizer.
+        * ``'GD'``, gradient descent.
+    learning_rate : float
+        Learning rate.
+    verbose : bool
+        Verbose mode
+    Attributes
+    ----------
+    layers: list
+        List of layers.
+    labels_: np.ndarray
+        Predicted labels.
+    history_: dict
+        Training history per epoch: {'embedding', 'loss', 'train_accuracy', 'test_accuracy'}.
+    """
+    def __init__(self, loss: Union[BaseLoss, str] = 'CrossEntropy', optimizer: Union[BaseOptimizer, str] = 'Adam',
+                 learning_rate: float = 0.01, verbose: bool = False):
+        VerboseMixin.__init__(self, verbose)
+        # Names are resolved to objects by the helpers of the loss and optimizer modules.
+        self.optimizer = get_optimizer(optimizer, learning_rate)
+        self.loss = get_loss(loss)
+        self.layers = []
+        # Per-layer derivatives, filled in by ``backward``.
+        self.derivative_weight = []
+        self.derivative_bias = []
+        self.train_mask = None
+        self.test_mask = None
+        self.val_mask = None
+        self.embedding_ = None
+        self.output_ = None
+        self.labels_ = None
+        # Missing keys start as empty lists.
+        self.history_ = defaultdict(list)
+    def fit(self, *args, **kwargs):
+        """Fit Algorithm to the data. Must be implemented by subclasses."""
+        raise NotImplementedError
+    def predict(self, *args, **kwargs):
+        """Predict labels. Must be implemented by subclasses."""
+        raise NotImplementedError
+    def fit_predict(self, *args, **kwargs) -> np.ndarray:
+        """Fit algorithm to the data and return the labels. Same parameters as the ``fit`` method.
+        Returns
+        -------
+        labels : np.ndarray
+            Labels of the nodes, as returned by ``predict`` called without arguments.
+        """
+        self.fit(*args, **kwargs)
+        return self.predict()
+    def fit_transform(self, *args, **kwargs) -> np.ndarray:
+        """Fit algorithm to the data and return the embedding of the nodes. Same parameters as the ``fit`` method.
+        Returns
+        -------
+        embedding : np.ndarray
+            Embedding of the nodes (attribute ``embedding_``).
+        """
+        self.fit(*args, **kwargs)
+        return self.embedding_
+    def backward(self, features: sparse.csr_matrix, labels: np.ndarray, mask: np.ndarray):
+        """Compute backpropagation.
+        The derivatives are stored in ``derivative_weight`` and ``derivative_bias``,
+        one entry per layer, in the same order as ``layers``. Nothing is returned.
+        Parameters
+        ----------
+        features : sparse.csr_matrix
+            Features, array of shape (n_nodes, n_features).
+        labels : np.ndarray
+            Labels, array of shape (n_nodes,).
+        mask: np.ndarray
+            Boolean mask, array of shape (n_nodes,).
+        """
+        derivative_weight = []
+        derivative_bias = []
+        # discard missing labels (negative labels are treated as missing)
+        mask = mask & (labels >= 0)
+        labels = labels[mask]
+        # backpropagation, from the last layer to the first
+        n_layers = len(self.layers)
+        layers_reverse: list = list(reversed(self.layers))
+        # Gradient of the loss at the last layer, restricted to the masked nodes.
+        # NOTE(review): ``embedding`` is presumably the pre-activation signal of a layer
+        # and ``output`` its post-activation value - confirm against the layer classes.
+        signal = layers_reverse[0].embedding
+        signal = signal[mask]
+        gradient = layers_reverse[0].activation.loss_gradient(signal, labels)
+        for i in range(n_layers):
+            # Input of the current layer: output of the previous layer, or the features for the first layer.
+            if i < n_layers - 1:
+                signal = layers_reverse[i + 1].output
+            else:
+                signal = features
+            signal = signal[mask]
+            derivative_weight.append(signal.T.dot(gradient))
+            # The bias derivative is the mean of the gradient over the masked nodes.
+            derivative_bias.append(np.mean(gradient, axis=0, keepdims=True))
+            # Propagate the gradient to the previous layer through the weights and its activation.
+            if i < n_layers - 1:
+                signal = layers_reverse[i + 1].embedding
+                signal = signal[mask]
+                direction = layers_reverse[i].weight.dot(gradient.T).T
+                gradient = layers_reverse[i + 1].activation.gradient(signal, direction)
+        # Derivatives were collected last layer first; restore the order of ``layers``.
+        self.derivative_weight = list(reversed(derivative_weight))
+        self.derivative_bias = list(reversed(derivative_bias))
+    def _check_fitted(self):
+        """Return ``self`` if the model has an output, otherwise raise a ValueError."""
+        if self.output_ is None:
+            raise ValueError("This embedding instance is not fitted yet. "
+                             "Call 'fit' with appropriate arguments before using this method.")
+        else:
+            return self
+    def __repr__(self) -> str:
+        """String representation of the `GNN`, layers by layers.
+        Returns
+        -------
+        str
+            Class name followed by one indented line per layer, between parentheses.
+        """
+        string = f'{self.__class__.__name__}(\n'
+        for layer in self.layers:
+            string += f'  {layer}\n'
+        string += ')'
+        return string