PyPI - nystrom-ncut - Versions diffs - 0.0.1__py3-none-any.whl → 0.0.3__py3-none-any.whl - Mend

nystrom-ncut 0.0.1__py3-none-any.whl → 0.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

nystrom_ncut/__init__.py +4 -4
nystrom_ncut/common.py +20 -0
nystrom_ncut/ncut_pytorch.py +190 -473
nystrom_ncut/nystrom.py +4 -2
nystrom_ncut/propagation_utils.py +19 -61
nystrom_ncut/visualize_utils.py +11 -100
{nystrom_ncut-0.0.1.dist-info → nystrom_ncut-0.0.3.dist-info}/METADATA +1 -1
nystrom_ncut-0.0.3.dist-info/RECORD +11 -0
nystrom_ncut/new_ncut_pytorch.py +0 -241
nystrom_ncut-0.0.1.dist-info/RECORD +0 -11
{nystrom_ncut-0.0.1.dist-info → nystrom_ncut-0.0.3.dist-info}/LICENSE +0 -0
{nystrom_ncut-0.0.1.dist-info → nystrom_ncut-0.0.3.dist-info}/WHEEL +0 -0
{nystrom_ncut-0.0.1.dist-info → nystrom_ncut-0.0.3.dist-info}/top_level.txt +0 -0

nystrom_ncut/new_ncut_pytorch.py DELETED Viewed

@@ -1,241 +0,0 @@
-import logging
-from typing import Literal, Tuple
-import torch
-from .nystrom import (
-    EigSolverOptions,
-    OnlineKernel,
-    OnlineNystrom,
-    solve_eig,
-)
-from .propagation_utils import (
-    affinity_from_features,
-    run_subgraph_sampling,
-)
-DistanceOptions = Literal["cosine", "euclidean", "rbf"]
-class LaplacianKernel(OnlineKernel):
-    def __init__(
-        self,
-        affinity_focal_gamma: float,
-        distance: DistanceOptions,
-        eig_solver: EigSolverOptions,
-    ):
-        self.affinity_focal_gamma = affinity_focal_gamma
-        self.distance: DistanceOptions = distance
-        self.eig_solver: EigSolverOptions = eig_solver
-        # Anchor matrices
-        self.anchor_features: torch.Tensor = None               # [n x d]
-        self.A: torch.Tensor = None                             # [n x n]
-        self.Ainv: torch.Tensor = None                          # [n x n]
-        # Updated matrices
-        self.a_r: torch.Tensor = None                           # [n]
-        self.b_r: torch.Tensor = None                           # [n]
-    def fit(self, features: torch.Tensor) -> None:
-        self.anchor_features = features                         # [n x d]
-        self.A = affinity_from_features(
-            self.anchor_features,                               # [n x d]
-            affinity_focal_gamma=self.affinity_focal_gamma,
-            distance=self.distance,
-            fill_diagonal=False,
-        )                                                       # [n x n]
-        U, L = solve_eig(
-            self.A,
-            num_eig=features.shape[-1] + 1,
-            eig_solver=self.eig_solver,
-        )                                                       # [n x (d + 1)], [d + 1]
-        self.Ainv = U @ torch.diag(1 / L) @ U.mT                # [n x n]
-        self.a_r = torch.sum(self.A, dim=-1)                    # [n]
-        self.b_r = torch.zeros_like(self.a_r)                   # [n]
-    def update(self, features: torch.Tensor) -> torch.Tensor:
-        B = affinity_from_features(
-            self.anchor_features,                               # [n x d]
-            features,                                           # [m x d]
-            affinity_focal_gamma=self.affinity_focal_gamma,
-            distance=self.distance,
-            fill_diagonal=False,
-        )                                                       # [n x m]
-        b_r = torch.sum(B, dim=-1)                              # [n]
-        b_c = torch.sum(B, dim=-2)                              # [m]
-        self.b_r = self.b_r + b_r                               # [n]
-        rowscale = self.a_r + self.b_r                          # [n]
-        colscale = b_c + B.mT @ self.Ainv @ self.b_r            # [m]
-        scale = (rowscale[:, None] * colscale) ** -0.5          # [n x m]
-        return (B * scale).mT                                   # [m x n]
-    def transform(self, features: torch.Tensor = None) -> torch.Tensor:
-        rowscale = self.a_r + self.b_r                          # [n]
-        if features is None:
-            B = self.A                                          # [n x n]
-            colscale = rowscale                                 # [n]
-        else:
-            B = affinity_from_features(
-                self.anchor_features,                           # [n x d]
-                features,                                       # [m x d]
-                affinity_focal_gamma=self.affinity_focal_gamma,
-                distance=self.distance,
-                fill_diagonal=False,
-            )                                                   # [n x m]
-            b_c = torch.sum(B, dim=-2)                          # [m]
-            colscale = b_c + B.mT @ self.Ainv @ self.b_r        # [m]
-        scale = (rowscale[:, None] * colscale) ** -0.5          # [n x m]
-        return (B * scale).mT                                   # [m x n]
-class NewNCUT(OnlineNystrom):
-    """Nystrom Normalized Cut for large scale graph."""
-    def __init__(
-        self,
-        num_eig: int = 100,
-        affinity_focal_gamma: float = 1.0,
-        num_sample: int = 10000,
-        sample_method: Literal["farthest", "random"] = "farthest",
-        distance: DistanceOptions = "cosine",
-        eig_solver: EigSolverOptions = "svd_lowrank",
-        normalize_features: bool = None,
-        device: str = None,
-        move_output_to_cpu: bool = False,
-        matmul_chunk_size: int = 8096,
-    ):
-        """
-        Args:
-            num_eig (int): number of top eigenvectors to return
-            affinity_focal_gamma (float): affinity matrix temperature, lower t reduce the not-so-connected edge weights,
-                smaller t result in more sharp eigenvectors.
-            num_sample (int): number of samples for Nystrom-like approximation,
-                reduce only if memory is not enough, increase for better approximation
-            sample_method (str): subgraph sampling, ['farthest', 'random'].
-                farthest point sampling is recommended for better Nystrom-approximation accuracy
-            distance (str): distance metric for affinity matrix, ['cosine', 'euclidean', 'rbf'].
-            eig_solver (str): eigen decompose solver, ['svd_lowrank', 'lobpcg', 'svd', 'eigh'].
-            normalize_features (bool): normalize input features before computing affinity matrix,
-                default 'None' is True for cosine distance, False for euclidean distance and rbf
-            device (str): device to use for eigen computation,
-                move to GPU to speeds up a bit (~5x faster)
-            move_output_to_cpu (bool): move output to CPU, set to True if you have memory issue
-            matmul_chunk_size (int): chunk size for large-scale matrix multiplication
-        """
-        OnlineNystrom.__init__(
-            self,
-            n_components=num_eig,
-            kernel=LaplacianKernel(affinity_focal_gamma, distance, eig_solver),
-            eig_solver=eig_solver,
-            chunk_size=matmul_chunk_size,
-        )
-        self.num_sample = num_sample
-        self.sample_method = sample_method
-        self.distance = distance
-        self.normalize_features = normalize_features
-        if self.normalize_features is None:
-            if distance in ["cosine"]:
-                self.normalize_features = True
-            if distance in ["euclidean", "rbf"]:
-                self.normalize_features = False
-        self.device = device
-        self.move_output_to_cpu = move_output_to_cpu
-        self.matmul_chunk_size = matmul_chunk_size
-    def _fit_helper(
-        self,
-        features: torch.Tensor,
-        precomputed_sampled_indices: torch.Tensor,
-    ) -> Tuple[torch.Tensor, torch.Tensor]:
-        # move subgraph gpu to speed up
-        original_device = features.device
-        device = original_device if self.device is None else self.device
-        _n = features.shape[0]
-        if self.num_sample >= _n:
-            logging.info(
-                f"NCUT nystrom num_sample is larger than number of input samples, nyström approximation is not needed, setting num_sample={_n}"
-            )
-            self.num_sample = _n
-        # check if features dimension greater than num_eig
-        if self.eig_solver in ["svd_lowrank", "lobpcg"]:
-            assert (
-                _n >= self.n_components * 2
-            ), "number of nodes should be greater than 2*num_eig"
-        elif self.eig_solver in ["svd", "eigh"]:
-            assert (
-                _n >= self.n_components
-            ), "number of nodes should be greater than num_eig"
-        assert self.distance in ["cosine", "euclidean", "rbf"], "distance should be 'cosine', 'euclidean', 'rbf'"
-        if self.normalize_features:
-            # features need to be normalized for affinity matrix computation (cosine distance)
-            features = torch.nn.functional.normalize(features, dim=-1)
-        if precomputed_sampled_indices is not None:
-            sampled_indices = precomputed_sampled_indices
-        else:
-            sampled_indices = run_subgraph_sampling(
-                features,
-                num_sample=self.num_sample,
-                sample_method=self.sample_method,
-            )
-        sampled_features = features[sampled_indices].to(device)
-        OnlineNystrom.fit(self, sampled_features)
-        _n_not_sampled = _n - len(sampled_features)
-        if _n_not_sampled > 0:
-            unsampled_indices = torch.full((_n,), True).scatter(0, sampled_indices, False)
-            unsampled_features = features[unsampled_indices].to(device)
-            V_unsampled, _ = OnlineNystrom.update(self, unsampled_features)
-        else:
-            unsampled_indices = V_unsampled = None
-        return unsampled_indices, V_unsampled
-    def fit(
-        self,
-        features: torch.Tensor,
-        precomputed_sampled_indices: torch.Tensor = None,
-    ):
-        """Fit Nystrom Normalized Cut on the input features.
-        Args:
-            features (torch.Tensor): input features, shape (n_samples, n_features)
-            precomputed_sampled_indices (torch.Tensor): precomputed sampled indices, shape (num_sample,)
-                override the sample_method, if not None
-        Returns:
-            (NCUT): self
-        """
-        NewNCUT._fit_helper(self, features, precomputed_sampled_indices)
-        return self
-    def fit_transform(
-        self,
-        features: torch.Tensor,
-        precomputed_sampled_indices: torch.Tensor = None,
-    ) -> Tuple[torch.Tensor, torch.Tensor]:
-        """
-        Args:
-            features (torch.Tensor): input features, shape (n_samples, n_features)
-            precomputed_sampled_indices (torch.Tensor): precomputed sampled indices, shape (num_sample,)
-                override the sample_method, if not None
-        Returns:
-            (torch.Tensor): eigen_vectors, shape (n_samples, num_eig)
-            (torch.Tensor): eigen_values, sorted in descending order, shape (num_eig,)
-        """
-        unsampled_indices, V_unsampled = NewNCUT._fit_helper(self, features, precomputed_sampled_indices)
-        V_sampled, L = OnlineNystrom.transform(self)
-        if unsampled_indices is not None:
-            V = torch.zeros((len(unsampled_indices), self.n_components))
-            V[~unsampled_indices] = V_sampled
-            V[unsampled_indices] = V_unsampled
-        else:
-            V = V_sampled
-        return V, L

nystrom_ncut-0.0.1.dist-info/RECORD DELETED Viewed

@@ -1,11 +0,0 @@
-nystrom_ncut/__init__.py,sha256=K8a7o9oP9jhG9auqsAFt1KPQMElRUP3_TFxBmRUz8-o,544
-nystrom_ncut/ncut_pytorch.py,sha256=f4VHCgOP3tEjn5NIr2wFE4hAGnQIWV6P6W4xuMt0d0I,22426
-nystrom_ncut/new_ncut_pytorch.py,sha256=wPG-OAcew4kw0mDMLQPJOetz-9sBfvFmexL7n0JVYjc,10419
-nystrom_ncut/nystrom.py,sha256=UOXfhgz-xB2FtKYfn-cwMDNkgCWrM-3yXHtPxOrgEV4,8569
-nystrom_ncut/propagation_utils.py,sha256=quykDk1RgFyHEUloRBcapSocq9Wvkk3hG_TYx-Tue6A,13813
-nystrom_ncut/visualize_utils.py,sha256=3TEdXF_H7sBUQFz1nK3QemmlKqRteo5BKkno1LozVTg,21840
-nystrom_ncut-0.0.1.dist-info/LICENSE,sha256=2bm9uFabQZ3Ykb_SaSU_uUbAj2-htc6WJQmS_65qD00,1073
-nystrom_ncut-0.0.1.dist-info/METADATA,sha256=kj900xV7RSfTSW8jyzjhrGV2z1Ttzn5UoTFOlHpfZg8,6058
-nystrom_ncut-0.0.1.dist-info/WHEEL,sha256=A3WOREP4zgxI0fKrHUG8DC8013e3dK3n7a6HDbcEIwE,91
-nystrom_ncut-0.0.1.dist-info/top_level.txt,sha256=j7g_j0S048EvguFFnGgD5Ewd3r2H6klsxd5A4dd-wHw,13
-nystrom_ncut-0.0.1.dist-info/RECORD,,

{nystrom_ncut-0.0.1.dist-info → nystrom_ncut-0.0.3.dist-info}/LICENSE RENAMED Viewed

File without changes

{nystrom_ncut-0.0.1.dist-info → nystrom_ncut-0.0.3.dist-info}/WHEEL RENAMED Viewed

File without changes

{nystrom_ncut-0.0.1.dist-info → nystrom_ncut-0.0.3.dist-info}/top_level.txt RENAMED Viewed

File without changes

nystrom-ncut 0.0.1__py3-none-any.whl → 0.0.3__py3-none-any.whl

nystrom-ncut 0.0.1__py3-none-any.whl → 0.0.3__py3-none-any.whl