PyPI - pyvisim - Versions diffs - 0.1.0__tar.gz - Mend

pyvisim 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

pyvisim-0.1.0/LICENSE +21 -0
pyvisim-0.1.0/PKG-INFO +158 -0
pyvisim-0.1.0/README.md +133 -0
pyvisim-0.1.0/pyvisim/__init__.py +5 -0
pyvisim-0.1.0/pyvisim/_base_classes.py +51 -0
pyvisim-0.1.0/pyvisim/_config.py +56 -0
pyvisim-0.1.0/pyvisim/_errors.py +10 -0
pyvisim-0.1.0/pyvisim/_utils.py +948 -0
pyvisim-0.1.0/pyvisim/datasets/__init__.py +1 -0
pyvisim-0.1.0/pyvisim/datasets/datasets.py +141 -0
pyvisim-0.1.0/pyvisim/encoders/__init__.py +9 -0
pyvisim-0.1.0/pyvisim/encoders/_base_encoder.py +275 -0
pyvisim-0.1.0/pyvisim/encoders/fisher_vector.py +110 -0
pyvisim-0.1.0/pyvisim/encoders/pipeline.py +126 -0
pyvisim-0.1.0/pyvisim/encoders/vlad.py +97 -0
pyvisim-0.1.0/pyvisim/eval.py +145 -0
pyvisim-0.1.0/pyvisim/features/__init__.py +2 -0
pyvisim-0.1.0/pyvisim/features/_features.py +290 -0
pyvisim-0.1.0/pyvisim/losses/__init__.py +0 -0
pyvisim-0.1.0/pyvisim/losses/_losses.py +204 -0
pyvisim-0.1.0/pyvisim.egg-info/PKG-INFO +158 -0
pyvisim-0.1.0/pyvisim.egg-info/SOURCES.txt +25 -0
pyvisim-0.1.0/pyvisim.egg-info/dependency_links.txt +1 -0
pyvisim-0.1.0/pyvisim.egg-info/requires.txt +1 -0
pyvisim-0.1.0/pyvisim.egg-info/top_level.txt +1 -0
pyvisim-0.1.0/setup.cfg +4 -0
pyvisim-0.1.0/setup.py +23 -0

pyvisim-0.1.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2024 Nhat Huy Vu
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

pyvisim-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,158 @@
+Metadata-Version: 2.2
+Name: pyvisim
+Version: 0.1.0
+Summary: A Python library for image similarity analysis using Image Encoders and Neural Networks
+Home-page: https://github.com/MechaCritter/Python-Visual-Similarity
+Author: Nhat Huy Vu
+Author-email: vunhathuy234@gmail.com
+License: MIT
+Classifier: Programming Language :: Python :: 3
+Classifier: Operating System :: OS Independent
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: opencv-python>=4.5.3
+Dynamic: author
+Dynamic: author-email
+Dynamic: classifier
+Dynamic: description
+Dynamic: description-content-type
+Dynamic: home-page
+Dynamic: license
+Dynamic: requires-dist
+Dynamic: requires-python
+Dynamic: summary
+<!-- Logo -->
+<p align="center">
+  <img src="res/images/logo.png" alt="pyvisim" width="1418" />
+</p>
+<!-- Added badges to convey project readiness/branding (example placeholders) -->
+![License](https://img.shields.io/badge/license-MIT-brightgreen)
+![Version](https://img.shields.io/badge/version-0.1.0-blue)
+![Status](https://img.shields.io/badge/status-pre--release-orange)
+![Python](https://img.shields.io/badge/Python-3.10%2B-brightgreen)
+![Contributions](https://img.shields.io/badge/contributions-welcome-brightgreen)
+# Welcome to `pyvisim`!
+`pyvisim` is a Python library for computing image similarities using encoding methods such as Fisher Vectors, VLAD
+and Siamese Networks.
+This project was made by me in cooperation with the __Lehrstuhl für Automatisierung und Informationssysteme__
+at the Technical University of Munich.
+## Table of Contents
+1. [Why **pyvisim**](#why-pyvisim)
+2. [Installation](#installation)
+3. [Contributing](#contributing)
+4. [Get in Touch](#get-in-touch)
+5. [TODO](#todo)
+6. [License](#license)
+7. [Acknowledgements](#acknowledgements)
+8. [References](#references)
+## Why `pyvisim`?
+`pyvisim` is designed to provide a simple and efficient way to compare images. The use-cases include:
+1. **Image Retrieval**
+   Retrieve the top-k most similar images from a dataset.
+   - Use encoding methods like VLAD or Fisher Vectors to quickly find the most relevant matches. Please visit
+   [this Jupyter notebook](examples/vlad_fisher_with_vgg16_embeddings_image_retrieval.ipynb) for an example.
+   - Example use: Building a fast image search engine for photo management software.
+2. **Deep Learning Embeddings**
+   - Generate VLAD or Fisher vectors from neural network embeddings, e.g., VGG16 or other models.
+   - Enhance your deep learning pipeline by leveraging traditional encoding methods on top of CNN features.
+3. **Image Clustering**
+   - Cluster images based on their similarities to group them by category or content. An example and benchmarking
+    can be found in [this notebook](examples/clustering_images_using_fv.ipynb).
+   - Useful for organizing unlabeled data or generating pseudo-labels for further training.
+4. **Pipeline for Combining Multiple Encoders**
+   - Chain various encoders in a single pipeline. An example can be found in [this notebook](examples/pipeline.ipynb).
+   - Achieve more robust similarity metrics by blending different feature representations.
+5. **Siamese Network (Coming Soon!)**
+   - Train a neural network to learn a similarity function directly from pairs/triples of images.
+   - Possible use cases include face recognition, signature verification, or any image-based identity matching.
+## Installation
+Currently, the package still needs to be tested and validated before being uploaded to PyPI. To use the library, you can
+clone the repository and install the package locally:
+```bash
+git clone # TODO: Add the link to the repository
+cd similarity_metrics_of_images
+pip install .
+```
+All experiments in this project were conducted on the Oxford Flower Dataset <sup>[7](#references)</sup>, for which I
+have created a custom dataset class. To use this class, import it as follows:
+```python
+from pyvisim.datasets import OxfordFlowerDataset
+```
+In order to replicate the experiments done in this project, follow the preprocessing steps in
+the [datasets README](pyvisim/datasets/README.md).
+## Contributing
+We love contributions of all kinds—whether it’s suggesting new features, fixing bugs, or writing docs! Here’s how you
+can get involved:
+1. **Fork** this repository.
+2. **Create a new branch** for your changes.
+3. **Open a pull request** with a clear description of your idea or fix.
+We welcome all feedback and hope to build a supportive community around pyvisim!
+## Get in Touch
+If you have any questions or just want to say hi, feel free to:
+- Open an issue on [GitHub](https://github.com/MechaCritter/similarity_metrics_of_images/issues).
+- Write me an email at [vunhathuy234@gmail.com](mailto:vunhathuy234@gmail.com).
+- Connect on [LinkedIn](https://www.linkedin.com/in/nhat-huy-vu-80495111b/) to follow my work and share your thoughts.
+## TODO
+The features below are planned for future releases:
+- Implement proper **unit tests** to validate the functionality of the package before uploading to PyPI.
+- Implement the **siamese network**.
+- Add **tensor sketch approximation** and **mutual information** analysis for Fisher Vector, according to this
+paper by Weixia Zhang, Jia Yan, Wenxuan Shi, Tianpeng Feng, and Dexiang Deng <sup>[1](#references)</sup>
+- Add support for **vision transformers** for the `DeepConvFeature` class.
+You are welcome to implement any of these features or suggest new ones!
+## License
+This project is licensed under the terms of the MIT license.
+## Acknowledgements
+I would like to thank the __Lehrstuhl für Automatisierung und Informationssysteme__ at the Technical University of Munich
+for their support, guidance and provision of computational resources for this project, without which this project would
+not have been possible. I would also like to thank my supervisor, <add name>, for his guidance, as well as Dr. <add name>
+for her valuable feedback and suggestions.
+## References
+[1] Weixia Zhang, Jia Yan, Wenxuan Shi, Tianpeng Feng, and Dexiang Deng, "Refining Deep Convolutional Features for
+Improving Fine-Grained Image Recognition," EURASIP Journal on Image and Video Processing, 2017. \
+[2] Relja Arandjelović and Andrew Zisserman, 'All About VLAD', Department of Engineering Science, University of Oxford. \
+[3] E. Spyromitros-Xioufis, S. Papadopoulos, I. Kompatsiaris, G. Tsoumakas, and I. Vlahavas, "An Empirical Study on the
+Combination of SURF Features with VLAD Vectors for Image Search," Informatics and Telematics Institute, Center for Research and
+Technology Hellas, Thessaloniki, Greece; Department of Informatics, Aristotle University of Thessaloniki, Greece. \
+[4] Relja Arandjelović and Andrew Zisserman, "Three things everyone should know to improve object retrieval," Department of
+Engineering Science, University of Oxford. \
+[5] Hervé Jégou, Florent Perronnin, Matthijs Douze, Jorge Sánchez, Patrick Pérez, and Cordelia Schmid, "Aggregating Local
+Image Descriptors into Compact Codes," IEEE. \
+[6] Liangliang Wang and Deepu Rajan, "An Image Similarity Descriptor for Classification Tasks," J. Vis. Commun.
+Image R., vol. 71, pp. 102847, 2020. \
+[7] [Oxford Flower Dataset](https://www.robots.ox.ac.uk/~vgg/data/flowers/102/).

pyvisim-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,133 @@
+<!-- Logo -->
+<p align="center">
+  <img src="res/images/logo.png" alt="pyvisim" width="1418" />
+</p>
+<!-- Added badges to convey project readiness/branding (example placeholders) -->
+![License](https://img.shields.io/badge/license-MIT-brightgreen)
+![Version](https://img.shields.io/badge/version-0.1.0-blue)
+![Status](https://img.shields.io/badge/status-pre--release-orange)
+![Python](https://img.shields.io/badge/Python-3.10%2B-brightgreen)
+![Contributions](https://img.shields.io/badge/contributions-welcome-brightgreen)
+# Welcome to `pyvisim`!
+`pyvisim` is a Python library for computing image similarities using encoding methods such as Fisher Vectors, VLAD
+and Siamese Networks.
+This project was made by me in cooperation with the __Lehrstuhl für Automatisierung und Informationssysteme__
+at the Technical University of Munich.
+## Table of Contents
+1. [Why **pyvisim**](#why-pyvisim)
+2. [Installation](#installation)
+3. [Contributing](#contributing)
+4. [Get in Touch](#get-in-touch)
+5. [TODO](#todo)
+6. [License](#license)
+7. [Acknowledgements](#acknowledgements)
+8. [References](#references)
+## Why `pyvisim`?
+`pyvisim` is designed to provide a simple and efficient way to compare images. The use-cases include:
+1. **Image Retrieval**
+   Retrieve the top-k most similar images from a dataset.
+   - Use encoding methods like VLAD or Fisher Vectors to quickly find the most relevant matches. Please visit
+   [this Jupyter notebook](examples/vlad_fisher_with_vgg16_embeddings_image_retrieval.ipynb) for an example.
+   - Example use: Building a fast image search engine for photo management software.
+2. **Deep Learning Embeddings**
+   - Generate VLAD or Fisher vectors from neural network embeddings, e.g., VGG16 or other models.
+   - Enhance your deep learning pipeline by leveraging traditional encoding methods on top of CNN features.
+3. **Image Clustering**
+   - Cluster images based on their similarities to group them by category or content. An example and benchmarking
+    can be found in [this notebook](examples/clustering_images_using_fv.ipynb).
+   - Useful for organizing unlabeled data or generating pseudo-labels for further training.
+4. **Pipeline for Combining Multiple Encoders**
+   - Chain various encoders in a single pipeline. An example can be found in [this notebook](examples/pipeline.ipynb).
+   - Achieve more robust similarity metrics by blending different feature representations.
+5. **Siamese Network (Coming Soon!)**
+   - Train a neural network to learn a similarity function directly from pairs/triples of images.
+   - Possible use cases include face recognition, signature verification, or any image-based identity matching.
+## Installation
+Currently, the package still needs to be tested and validated before being uploaded to PyPI. To use the library, you can
+clone the repository and install the package locally:
+```bash
+git clone # TODO: Add the link to the repository
+cd similarity_metrics_of_images
+pip install .
+```
+All experiments in this project were conducted on the Oxford Flower Dataset <sup>[7](#references)</sup>, for which I
+have created a custom dataset class. To use this class, import it as follows:
+```python
+from pyvisim.datasets import OxfordFlowerDataset
+```
+In order to replicate the experiments done in this project, follow the preprocessing steps in
+the [datasets README](pyvisim/datasets/README.md).
+## Contributing
+We love contributions of all kinds—whether it’s suggesting new features, fixing bugs, or writing docs! Here’s how you
+can get involved:
+1. **Fork** this repository.
+2. **Create a new branch** for your changes.
+3. **Open a pull request** with a clear description of your idea or fix.
+We welcome all feedback and hope to build a supportive community around pyvisim!
+## Get in Touch
+If you have any questions or just want to say hi, feel free to:
+- Open an issue on [GitHub](https://github.com/MechaCritter/similarity_metrics_of_images/issues).
+- Write me an email at [vunhathuy234@gmail.com](mailto:vunhathuy234@gmail.com).
+- Connect on [LinkedIn](https://www.linkedin.com/in/nhat-huy-vu-80495111b/) to follow my work and share your thoughts.
+## TODO
+The features below are planned for future releases:
+- Implement proper **unit tests** to validate the functionality of the package before uploading to PyPI.
+- Implement the **siamese network**.
+- Add **tensor sketch approximation** and **mutual information** analysis for Fisher Vector, according to this
+paper by Weixia Zhang, Jia Yan, Wenxuan Shi, Tianpeng Feng, and Dexiang Deng <sup>[1](#references)</sup>
+- Add support for **vision transformers** for the `DeepConvFeature` class.
+You are welcome to implement any of these features or suggest new ones!
+## License
+This project is licensed under the terms of the MIT license.
+## Acknowledgements
+I would like to thank the __Lehrstuhl für Automatisierung und Informationssysteme__ at the Technical University of Munich
+for their support, guidance and provision of computational resources for this project, without which this project would
+not have been possible. I would also like to thank my supervisor, <add name>, for his guidance, as well as Dr. <add name>
+for her valuable feedback and suggestions.
+## References
+[1] Weixia Zhang, Jia Yan, Wenxuan Shi, Tianpeng Feng, and Dexiang Deng, "Refining Deep Convolutional Features for
+Improving Fine-Grained Image Recognition," EURASIP Journal on Image and Video Processing, 2017. \
+[2] Relja Arandjelović and Andrew Zisserman, 'All About VLAD', Department of Engineering Science, University of Oxford. \
+[3] E. Spyromitros-Xioufis, S. Papadopoulos, I. Kompatsiaris, G. Tsoumakas, and I. Vlahavas, "An Empirical Study on the
+Combination of SURF Features with VLAD Vectors for Image Search," Informatics and Telematics Institute, Center for Research and
+Technology Hellas, Thessaloniki, Greece; Department of Informatics, Aristotle University of Thessaloniki, Greece. \
+[4] Relja Arandjelović and Andrew Zisserman, "Three things everyone should know to improve object retrieval," Department of
+Engineering Science, University of Oxford. \
+[5] Hervé Jégou, Florent Perronnin, Matthijs Douze, Jorge Sánchez, Patrick Pérez, and Cordelia Schmid, "Aggregating Local
+Image Descriptors into Compact Codes," IEEE. \
+[6] Liangliang Wang and Deepu Rajan, "An Image Similarity Descriptor for Classification Tasks," J. Vis. Commun.
+Image R., vol. 71, pp. 102847, 2020. \
+[7] [Oxford Flower Dataset](https://www.robots.ox.ac.uk/~vgg/data/flowers/102/).

pyvisim-0.1.0/pyvisim/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+"""
+PyVisim: A Python library for image similarity analysis using Image Encoders and Neural Networks.
+"""
+__all__ = ['datasets', 'encoders', 'features', 'eval']  # submodule names pulled in by `from pyvisim import *`; nothing is imported eagerly here

pyvisim-0.1.0/pyvisim/_base_classes.py ADDED Viewed

@@ -0,0 +1,51 @@
+import abc
+import logging
+import numpy as np
+class SimilarityMetric(abc.ABC):
+    """
+    Abstract base for all similarity encoders.
+    All concrete similarity metric classes must inherit from this class.
+    """
+    _logger = logging.getLogger('Similarity_Metrics')
+    @abc.abstractmethod
+    def similarity_score(self, image1: np.ndarray, image2: np.ndarray) -> float:
+        """
+        Compute a similarity score between two images.
+        :param image1: First image
+        :param image2: Second image
+        :return: A similarity score
+        """
+        pass
+class FeatureExtractorBase(abc.ABC):
+    """
+    Abstract interface for extracting features from images.
+    A feature extractor transforms an image (NumPy array) into a
+    set of feature vectors (NumPy array).
+    """
+    _logger = logging.getLogger("Feature_Extractor")
+    def __init__(self):
+        pass
+    @abc.abstractmethod
+    def __call__(self, image: np.ndarray) -> np.ndarray:
+        """
+        Extracts features from an image.
+        :param image: Input image (NumPy array).
+        :return: Feature descriptors (NumPy array).
+        """
+        raise NotImplementedError
+    @property
+    @abc.abstractmethod
+    def output_dim(self) -> int:
+        """
+        The dimensionality (D) of each feature vector, i.e., shape[1] of the output.
+        """
+        raise NotImplementedError

pyvisim-0.1.0/pyvisim/_config.py ADDED Viewed

@@ -0,0 +1,56 @@
+import logging
+import logging.config
+import pathlib
+import yaml
+import torch
+# -Config for the dataset- # ROOT is the directory two levels above this file, i.e. the parent of the package directory.
+ROOT = pathlib.Path(__file__).parent.parent
+LOG_FILE_PATH = ROOT / "res/logs/log_msgs.log"  # injected as the "file_handler" filename by setup_logging()
+# - Device - # When True, get_device() raises RuntimeError instead of falling back to the CPU if CUDA is unavailable.
+ENFORCE_CUDA = True
+def get_device():
+    """Get device (if available)"""
+    global ENFORCE_CUDA
+    if ENFORCE_CUDA:
+        if not torch.cuda.is_available():
+            raise RuntimeError("CUDA is not available. Please check your computer's configuration.")
+        return torch.device("cuda")
+    return torch.device("cuda" if torch.cuda.is_available() else "cpu")
+DEVICE = get_device()  # evaluated at import time; raises RuntimeError when ENFORCE_CUDA is True and CUDA is unavailable
+print(f"Device used: {DEVICE}")  # NOTE(review): writes to stdout on every first import of this module
+# -Paths for the Excavator dataset- # Plain strings rooted at ROOT; the validation paths are unset (None).
+TRAIN_IMG_DATA_PATH_EXCAVATOR= rf"{ROOT}/excavator_dataset_w_masks/train"
+TRAIN_MASK_DATA_PATH_EXCAVATOR = rf"{ROOT}/excavator_dataset_w_masks/train_annot"
+TEST_IMG_DATA_PATH_EXCAVATOR = rf"{ROOT}/excavator_dataset_w_masks/test"
+TEST_MASK_DATA_PATH_EXCAVATOR = rf"{ROOT}/excavator_dataset_w_masks/test_annot"
+VALID_IMG_DATA_PATH_EXCAVATOR = None
+VALID_MASK_DATA_PATH_EXCAVATOR = None
+# -Paths for the Flower dataset- # Image folder plus the label and set-id .mat files, all rooted at ROOT.
+IMG_DATA_PATH_FLOWER = rf"{ROOT}/oxford_flower_dataset/images"
+LABELS_PATH_FLOWER = rf"{ROOT}/oxford_flower_dataset/imagelabels.mat"
+SETID_PATH_FLOWER = rf"{ROOT}/oxford_flower_dataset/setid.mat"
+# - Logging - #
+def setup_logging(default_path=rf"{ROOT}/res/logging_config.yaml", default_level=logging.INFO):
+    """Setup logging configuration"""
+    try:
+        with open(default_path, 'rt') as f:
+            config = yaml.safe_load(f.read())
+        try:
+            config["handlers"]["file_handler"]["filename"] = str(LOG_FILE_PATH)
+        except Exception as e:
+            print(f"Error in Logging Configuration: {e}. Cannot set output path for log file.")
+        logging.config.dictConfig(config)
+    except Exception as e:
+        print(f"Error in Logging Configuration: {e}")
+        logging.basicConfig(level=default_level, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')

pyvisim-0.1.0/pyvisim/_errors.py ADDED Viewed

@@ -0,0 +1,10 @@
+"""
+Includes exceptions for the package.
+"""
+class InvalidImageError(Exception):
+    """
+    Raised when an image is not provided.
+    """
+    def __init__(self, message: str = "Input is not a valid image."):
+        super().__init__(message)