PyPI - imageatlas - Versions diffs - 0.1.0__tar.gz → 0.1.1__tar.gz - Mend

imageatlas 0.1.0tar.gz → 0.1.1tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (58) hide show

{imageatlas-0.1.0 → imageatlas-0.1.1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: imageatlas
-Version: 0.1.0
+Version: 0.1.1
 Summary: ImageAtlas: A toolkit for organizing, cleaning and analysing your image datasets.
 Author-email: Ahmad Javed <ahmadjaved97@gmail.com>
 Maintainer-email: Ahmad Javed <ahmadjaved97@gmail.com>
@@ -63,6 +63,7 @@ Requires-Dist: openpyxl; extra == "full"
 Dynamic: license-file
 # ImageAtlas
+[![PyPI Downloads](https://static.pepy.tech/personalized-badge/imageatlas?period=total&units=INTERNATIONAL_SYSTEM&left_color=BLACK&right_color=GREEN&left_text=Downloads)](https://pepy.tech/projects/imageatlas)
 ## Overview
@@ -86,6 +87,12 @@ pip install imageatlas
 pip install imageatlas[full]
 ```
+**Note on CLIP**: If you wish to use the CLIP model, you must install it manually from GitHub using:
+```
+pip install git+https://github.com/openai/CLIP.git
+```
 **From Source**
 ```
 git clone https://github.com/ahmadjaved97/ImageAtlas.git

{imageatlas-0.1.0 → imageatlas-0.1.1}/README.md RENAMED Viewed

@@ -1,4 +1,5 @@
 # ImageAtlas
+[![PyPI Downloads](https://static.pepy.tech/personalized-badge/imageatlas?period=total&units=INTERNATIONAL_SYSTEM&left_color=BLACK&right_color=GREEN&left_text=Downloads)](https://pepy.tech/projects/imageatlas)
 ## Overview
@@ -22,6 +23,12 @@ pip install imageatlas
 pip install imageatlas[full]
 ```
+**Note on CLIP**: If you wish to use the CLIP model, you must install it manually from GitHub using:
+```
+pip install git+https://github.com/openai/CLIP.git
+```
 **From Source**
 ```
 git clone https://github.com/ahmadjaved97/ImageAtlas.git

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/__init__.py RENAMED Viewed

@@ -2,7 +2,7 @@
 ImageAtlas: A toolkit for organizing, cleaning and analysing your image datasets.
 """
-__version__ = '0.1.0'
+__version__ = '0.1.1'
 # 1. High level API (The everything tool)

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/clustering/__init__.py RENAMED Viewed

@@ -1,7 +1,15 @@
+"""
+Clustering Algorithms module.
+This module provides various clustering algorithms with a unified interface for clustering
+on image features.
+"""
 from .base import ClusteringResult, ClusteringAlgorithm
 from .kmeans import KMeansClustering
 from .hdbscan_clustering import HDBSCANClustering
 from .gmm import GMMClustering
+from .factory import create_clustering_algorithm, get_available_algorithms
@@ -11,4 +19,6 @@ __all__ = [
     'KMeansClustering',
     'HDBSCANClustering',
     'GMMClustering',
+    'create_clustering_algorithm',
+    'get_available_algorithms'
 ]

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/clustering/base.py RENAMED Viewed

@@ -8,7 +8,13 @@ import numpy as np
 class ClusteringResult:
     """
     Container for clustering Results.
+    Attributes:
+       cluster_labels: Array of cluster assignments for each sample.
+       cluster_dict: Dictionary mapping cluster IDs to list of sample indices.
+       n_clusters: Number of clusters found.
+       metadata: Additional algorithm-specific metadata.
     """
     cluster_labels: np.ndarray
     cluster_dict: Dict[int, List[int]]
     n_clusters: int
@@ -49,11 +55,18 @@ class ClusteringResult:
 class ClusteringAlgorithm(ABC):
     """
     Abstract base class for all clustering algorithms.
+    All the clustering algorithms must implement the fit_predict method and
+    provide a consistent interface for clustering operations.
     """
     def __init__(self, random_state=42, **kwargs):
         """
         Initialize the clustering algorithm.
+        Args:
+            random_state: Random seed for reproducibility.
+            **kwargs: Additional algorithm related parameters.
         """
         self.random_state = random_state
         self.params = kwargs
@@ -64,6 +77,12 @@ class ClusteringAlgorithm(ABC):
     def fit_predict(self, features) -> ClusteringResult:
         """
         Fit the clustering algorithm and predict cluster labels.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+        Returns:
+            ClusteringResult object containing cluster assignments and metadata.
         """
         pass
@@ -77,7 +96,14 @@ class ClusteringAlgorithm(ABC):
     def _validate_features(self, features:np.ndarray) -> None:
         """
         Validate the input feature matrix.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features) to validate.
+        Raises:
+            ValueError: If features are invalid.
         """
         if not isinstance(features, np.ndarray):
             raise ValueError(f"Feature must be a numpy array, got {type(features)}")
@@ -93,6 +119,13 @@ class ClusteringAlgorithm(ABC):
     def _create_cluster_dict(self, cluster_labels, filenames=None):
         """
         Create a dictionary mapping cluster IDs to indices or filenames
+        Args:
+            cluster_labels: Array of cluster assignments.
+            filenames: Optional list of filenames corresponding to images.
+        Returns:
+            Dictionary mapping cluster IDs to lists of indices or filenames
         """
         cluster_dict = {}

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/clustering/factory.py RENAMED Viewed

@@ -22,6 +22,27 @@ def create_clustering_algorithm(
 ) -> ClusteringAlgorithm:
     """
     Factory function to create clustering algorithms.
+    Args:
+        method: Name of the clustering algorithm ('kmeans', 'gmm', 'hdbscan')
+        **kwargs: Algorithm specific parameters
+    Returns:
+        Instance of the requested clustering algorithm
+    Raises:
+        ValueError: If clustering method is not supported.
+    Examples:
+        >>> # Create KMeans with 5 clusters
+        >>> clusterer = create_clustering_algorithm('kmeans', n_clusters=5)
+        >>>  # Create GMM with full covariance
+        >>> clusterer = create_clustering_algorithm('gmm', n_components=8, covariance_type='full')
+        >>> # Create HDBSCAN with auto parameters
+        >>> clusterer = create_clustering_algorithm('hdbscan', auto_params=True)
     """
     method = method.lower()
@@ -39,5 +60,8 @@ def create_clustering_algorithm(
 def get_available_algorithms():
     """
     Get a list of available clustering algorithms.
+    Returns:
+        List of algorithm names.
     """
     return sorted(CLUSTERING_ALGORITHMS.keys())

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/clustering/gmm.py RENAMED Viewed

@@ -10,6 +10,14 @@ from .base import ClusteringAlgorithm, ClusteringResult
 class GMMClustering(ClusteringAlgorithm):
     """
     Gaussian Mixture Model clustering algorithm.
+    Args:
+        n_components: Number of mixture components (clusters)
+        covariance_type: Type of covariance parameters ('full', 'diag', 'tied', 'spherical')
+        max_iter: Maximum number of EM iterations
+        n_init: Number of initializations to perform
+        reg_covar: Regularization added to diagonal of covariance (prevents singular matrices)
+        random_state: Random seed for reproducibility
     """
     def __init__(
@@ -46,10 +54,16 @@ class GMMClustering(ClusteringAlgorithm):
         """
         Fit GMM and predict cluster labels.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+            filenames: Optional list of filenames for cluster mapping
+        Returns:
+            ClusteringResult object with cluster assignments.
         """
         self._validate_features(features)
-        print('fshape: ', features.shape)
         n_samples = features.shape[0]
@@ -110,6 +124,15 @@ class GMMClustering(ClusteringAlgorithm):
     def predict(self, features):
         """
         Predict cluster label for new samples.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+        Returns:
+            Array of cluster labels
+        Raises:
+            RuntimeError: If model has not been fitted yet.
         """
         if not self.is_fitted or self._model is None:
@@ -121,6 +144,15 @@ class GMMClustering(ClusteringAlgorithm):
     def predict_proba(self, features):
         """
         Predict probability of each cluster for new samples.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+        Returns:
+            Array of per-cluster probabilities for each sample
+        Raises:
+            RuntimeError: If model has not been fitted yet.
         """
         if not self.is_fitted or self._model is None:
@@ -132,6 +164,9 @@ class GMMClustering(ClusteringAlgorithm):
     def get_cluster_means(self):
         """
         Get cluster means (centers) if model is fitted.
+        Returns:
+            Array of cluster centers or None if not fitted.
         """
         if self.is_fitted and self._model is not None:
@@ -142,6 +177,12 @@ class GMMClustering(ClusteringAlgorithm):
     def score(self, features):
         """
         Compute the log-likelihood of the data under the model.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+        Returns:
+            Log-likelihood score
         """
         if not self.is_fitted or self._model is None:

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/clustering/hdbscan_clustering.py RENAMED Viewed

@@ -7,7 +7,16 @@ from .base import ClusteringAlgorithm, ClusteringResult
 class HDBSCANClustering(ClusteringAlgorithm):
     """
-    HDBSCAN algorithm.
+    HDBSCAN (Hierarchical Density-Based Spatial Clustering) Algorithm.
+    Args:
+        min_cluster_size: Minimum number of samples in a cluster
+        min_samples: Number of samples in a neighborhood for core points.
+        metric: Distance metric to use
+        cluster_selection_method: Method for selecting clusters ('eom' or 'leaf')
+        auto_params: Whether to automatically set parameters based on dataset size
+        random_state: Random seed (note: HDBSCAN is deterministic, this is for consistency)
     """
     def __init__(
@@ -37,6 +46,12 @@ class HDBSCANClustering(ClusteringAlgorithm):
     def _auto_select_params(self, n_samples):
         """
         Automatically select HDBSCAN parameters based on dataset size.
+        Args:
+            n_samples: Number of samples in the dataset.
+        Returns:
+            Tuple of (min_cluster_size, min_samples)
         """
         if n_samples < 100:
@@ -62,6 +77,10 @@ class HDBSCANClustering(ClusteringAlgorithm):
         """
         Fit HDBSCAN and predict cluster labels.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+            filenames: Optional list of filenames for cluster mapping.
         """
         try:
@@ -137,6 +156,11 @@ class HDBSCANClustering(ClusteringAlgorithm):
     def get_outlier_score(self):
         """
         Get outlier score for each sample.
+        Higher scores indicate more likely outliers.
+        Returns:
+            Array of outlier scores or None if model is not fitted.
         """
         if self.is_fitted and self._model is not None:
@@ -147,6 +171,9 @@ class HDBSCANClustering(ClusteringAlgorithm):
     def get_condensed_tree(self):
         """
         Get condensed cluster hierarchy tree.
+        Returns:
+            Condensed cluster hierarchy tree or None if model is not fitted.
         """
         if self.is_fitted and self._model is not None:

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/clustering/kmeans.py RENAMED Viewed

@@ -10,6 +10,14 @@ from typing import Optional
 class KMeansClustering(ClusteringAlgorithm):
     """
     K-Means clustering algorithm.
+    Args:
+        n_clusters: Number of clusters to form
+        n_init: Number of times to run with different centroid seeds
+        max_iter: Maximum number of iterations
+        use_minibatch: Whether to use MiniBatchKMeans for large datasets
+        batch_size: Batch size for MiniBatchKMeans
+        random_state: Random seed for reproducibility
     """
     def __init__(
@@ -42,6 +50,13 @@ class KMeansClustering(ClusteringAlgorithm):
         """
         Fit K-Means and predict cluster labels.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+            filenames: Optional list of filenames for cluster mapping
+        Returns:
+            ClusteringResult object with cluster assignments.
         """
         self._validate_features(features)
@@ -108,6 +123,15 @@ class KMeansClustering(ClusteringAlgorithm):
     def predict(self, features):
         """
         Predict cluster label for new samples.
+        Args:
+            features: Feature matrix of shape (n_samples, n_features)
+        Returns:
+            Array of cluster labels
+        Raises:
+            RuntimeError: If model has not yet been fitted.
         """
         if not self.is_fitted or self._model == None:
@@ -119,6 +143,9 @@ class KMeansClustering(ClusteringAlgorithm):
     def get_cluster_centers(self):
         """
         Get cluster centers if model is fitted.
+        Returns:
+            Array of cluster centers or None if not fitted.
         """
         if self.is_fitted and self._model is not None:
             return self._model.cluster_centers_

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/cache.py RENAMED Viewed

@@ -121,7 +121,7 @@ class HDF5Cache(FeatureCache):
             path = path + ".h5"
         if not self.exists(path):
-            raise FileNotFoundError("fCache file not found: {path}")
+            raise FileNotFoundError(f"Cache file not found: {path}")
         with h5py.File(path, 'r') as f:
             # Load filenames

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: imageatlas
-Version: 0.1.0
+Version: 0.1.1
 Summary: ImageAtlas: A toolkit for organizing, cleaning and analysing your image datasets.
 Author-email: Ahmad Javed <ahmadjaved97@gmail.com>
 Maintainer-email: Ahmad Javed <ahmadjaved97@gmail.com>
@@ -63,6 +63,7 @@ Requires-Dist: openpyxl; extra == "full"
 Dynamic: license-file
 # ImageAtlas
+[![PyPI Downloads](https://static.pepy.tech/personalized-badge/imageatlas?period=total&units=INTERNATIONAL_SYSTEM&left_color=BLACK&right_color=GREEN&left_text=Downloads)](https://pepy.tech/projects/imageatlas)
 ## Overview
@@ -86,6 +87,12 @@ pip install imageatlas
 pip install imageatlas[full]
 ```
+**Note on CLIP**: If you wish to use the CLIP model, you must install it manually from GitHub using:
+```
+pip install git+https://github.com/openai/CLIP.git
+```
 **From Source**
 ```
 git clone https://github.com/ahmadjaved97/ImageAtlas.git

{imageatlas-0.1.0 → imageatlas-0.1.1}/CHANGELOG.md RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/CONTRIBUTING.md RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/LICENSE RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/MANIFEST.in RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/examples/example_apis.ipynb RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/examples/example_complete_workflow.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/core/__init__.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/core/clusterer.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/core/results.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/__init__.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/adapter.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/batch.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/__init__.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/base.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/clip.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/convnext.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/dinov2.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/efficientnet.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/factory.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/mobilenet.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/resnet.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/swin.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/vgg.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/extractors/vit.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/loaders.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/metadata.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/features/pipeline.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/reduction/__init__.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/reduction/base.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/reduction/factory.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/reduction/pca.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/reduction/tsne.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/reduction/umap_reducer.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/visualization/__init__.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas/visualization/grids.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas.egg-info/SOURCES.txt RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas.egg-info/requires.txt RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/imageatlas.egg-info/top_level.txt RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/pyproject.toml RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/requirements.txt RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/setup.cfg RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/tests/test_batch_processing.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/tests/test_core_api.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/tests/test_features_pipeline.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/tests/test_reduction_module.py RENAMED Viewed

File without changes

{imageatlas-0.1.0 → imageatlas-0.1.1}/tests/test_visualization.py RENAMED Viewed

File without changes

imageatlas 0.1.0__tar.gz → 0.1.1__tar.gz

imageatlas 0.1.0tar.gz → 0.1.1tar.gz