PyPI - datasketch - Versions diffs - 1.7.0__tar.gz → 1.9.0__tar.gz - Mend

datasketch 1.7.0__tar.gz → 1.9.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (44) hide show

datasketch-1.9.0/.gitignore +87 -0
datasketch-1.9.0/PKG-INFO +262 -0
datasketch-1.7.0/PKG-INFO → datasketch-1.9.0/README.rst +121 -70
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/__init__.py +34 -9
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/b_bit_minhash.py +57 -72
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/experimental/__init__.py +4 -7
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/experimental/aio/lsh.py +110 -118
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/experimental/aio/storage.py +138 -122
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/hashfunc.py +6 -3
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/hnsw.py +103 -151
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/hyperloglog.py +55 -66
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/lean_minhash.py +25 -25
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/lsh.py +199 -134
datasketch-1.9.0/datasketch/lsh_bloom.py +377 -0
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/lshensemble.py +39 -46
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/lshensemble_partition.py +34 -33
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/lshforest.py +28 -36
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/minhash.py +176 -49
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/storage.py +188 -233
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/weighted_minhash.py +28 -30
datasketch-1.9.0/pyproject.toml +197 -0
datasketch-1.7.0/README.rst +0 -88
datasketch-1.7.0/datasketch/lsh_bloom.py +0 -335
datasketch-1.7.0/datasketch/version.py +0 -1
datasketch-1.7.0/datasketch.egg-info/PKG-INFO +0 -153
datasketch-1.7.0/datasketch.egg-info/SOURCES.txt +0 -38
datasketch-1.7.0/datasketch.egg-info/dependency_links.txt +0 -1
datasketch-1.7.0/datasketch.egg-info/requires.txt +0 -43
datasketch-1.7.0/datasketch.egg-info/top_level.txt +0 -1
datasketch-1.7.0/setup.cfg +0 -4
datasketch-1.7.0/setup.py +0 -91
datasketch-1.7.0/test/test_hnsw.py +0 -306
datasketch-1.7.0/test/test_hyperloglog.py +0 -177
datasketch-1.7.0/test/test_lean_minhash.py +0 -190
datasketch-1.7.0/test/test_lsh.py +0 -451
datasketch-1.7.0/test/test_lsh_cassandra.py +0 -269
datasketch-1.7.0/test/test_lshbloom.py +0 -126
datasketch-1.7.0/test/test_lshensemble.py +0 -92
datasketch-1.7.0/test/test_lshforest.py +0 -149
datasketch-1.7.0/test/test_minhash.py +0 -203
datasketch-1.7.0/test/test_weighted_minhash.py +0 -108
{datasketch-1.7.0 → datasketch-1.9.0}/LICENSE +0 -0
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/experimental/aio/__init__.py +0 -0
{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/hyperloglog_const.py +0 -0

datasketch-1.9.0/.gitignore ADDED Viewed

@@ -0,0 +1,87 @@
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+# C extensions
+*.so
+# VIM stuff
+*.swp
+# Distribution / packaging
+.Python
+env/
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+*.egg-info/
+.installed.cfg
+*.egg
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*,cover
+# Translations
+*.mo
+*.pot
+# Django stuff:
+*.log
+# Sphinx documentation
+docs/_build/
+# PyBuilder
+target/
+# Documentation
+.doctrees
+_build
+doctrees
+# Jetbrains
+.idea
+# Benchmark files
+benchmark/**/*.inp.gz
+# Benchmark output
+benchmark/**/*.sqlite
+# Benchmark plots
+benchmark/**/*.png
+benchmark/**/*.pdf
+# Virtual env
+.venv
+# IDE
+.vscode
+# MacOS
+.DS_Store

datasketch-1.9.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,262 @@
+Metadata-Version: 2.4
+Name: datasketch
+Version: 1.9.0
+Summary: Probabilistic data structures for processing and searching very large datasets
+Project-URL: Homepage, https://ekzhu.github.io/datasketch
+Project-URL: Bug Tracker, https://github.com/ekzhu/datasketch/issues
+Project-URL: Documentation, https://ekzhu.github.io/datasketch
+Project-URL: Source, https://github.com/ekzhu/datasketch
+Author-email: ekzhu <ekzhu@cs.toronto.edu>
+License: MIT
+License-File: LICENSE
+Keywords: database,datamining
+Classifier: Development Status :: 5 - Production/Stable
+Classifier: Intended Audience :: Developers
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3.9
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Classifier: Topic :: Database
+Classifier: Topic :: Scientific/Engineering :: Information Analysis
+Requires-Python: >=3.9
+Requires-Dist: numpy>=1.11
+Requires-Dist: scipy>=1.0.0
+Provides-Extra: benchmark
+Requires-Dist: matplotlib>=3.1.2; extra == 'benchmark'
+Requires-Dist: nltk>=3.4.5; extra == 'benchmark'
+Requires-Dist: pandas>=0.25.3; extra == 'benchmark'
+Requires-Dist: pyfarmhash>=0.2.2; extra == 'benchmark'
+Requires-Dist: pyhash>=0.9.3; extra == 'benchmark'
+Requires-Dist: scikit-learn>=0.21.3; extra == 'benchmark'
+Requires-Dist: scipy>=1.3.3; extra == 'benchmark'
+Requires-Dist: setsimilaritysearch>=0.1.7; extra == 'benchmark'
+Provides-Extra: bloom
+Requires-Dist: pybloomfilter3>=0.7.2; extra == 'bloom'
+Provides-Extra: cassandra
+Requires-Dist: cassandra-driver>=3.20; extra == 'cassandra'
+Provides-Extra: experimental-aio
+Requires-Dist: aiounittest; extra == 'experimental-aio'
+Requires-Dist: motor>3.6.0; extra == 'experimental-aio'
+Provides-Extra: redis
+Requires-Dist: redis>=2.10.0; extra == 'redis'
+Provides-Extra: test
+Requires-Dist: cassandra-driver>=3.20; extra == 'test'
+Requires-Dist: coverage; extra == 'test'
+Requires-Dist: mock>=2.0.0; extra == 'test'
+Requires-Dist: mockredispy; extra == 'test'
+Requires-Dist: nose-exclude>=0.5.0; extra == 'test'
+Requires-Dist: nose>=1.3.7; extra == 'test'
+Requires-Dist: pymongo>=3.9.0; extra == 'test'
+Requires-Dist: pytest; extra == 'test'
+Requires-Dist: pytest-asyncio; extra == 'test'
+Requires-Dist: pytest-cov; extra == 'test'
+Requires-Dist: pytest-rerunfailures; extra == 'test'
+Requires-Dist: redis>=2.10.0; extra == 'test'
+Description-Content-Type: text/x-rst
+datasketch: Big Data Looks Small
+================================
+.. image:: https://static.pepy.tech/badge/datasketch/month
+    :target: https://pepy.tech/project/datasketch
+.. image:: https://zenodo.org/badge/DOI/10.5281/zenodo.598238.svg
+   :target: https://zenodo.org/doi/10.5281/zenodo.598238
+.. image:: https://codecov.io/gh/ekzhu/datasketch/branch/master/graph/badge.svg
+    :target: https://codecov.io/gh/ekzhu/datasketch
+datasketch gives you probabilistic data structures that can process and
+search very large amounts of data super fast, with little loss of
+accuracy.
+This package contains the following data sketches:
++-------------------------+-----------------------------------------------+
+| Data Sketch             | Usage                                         |
++=========================+===============================================+
+| `MinHash`_              | estimate Jaccard similarity and cardinality   |
++-------------------------+-----------------------------------------------+
+| `Weighted MinHash`_     | estimate weighted Jaccard similarity          |
++-------------------------+-----------------------------------------------+
+| `HyperLogLog`_          | estimate cardinality                          |
++-------------------------+-----------------------------------------------+
+| `HyperLogLog++`_        | estimate cardinality                          |
++-------------------------+-----------------------------------------------+
+The following indexes for data sketches are provided to support
+sub-linear query time:
++---------------------------+-----------------------------+------------------------+
+| Index                     | For Data Sketch             | Supported Query Type   |
++===========================+=============================+========================+
+| `MinHash LSH`_            | MinHash, Weighted MinHash   | Jaccard Threshold      |
++---------------------------+-----------------------------+------------------------+
+| `LSHBloom`_               | MinHash, Weighted MinHash   | Jaccard Threshold      |
++---------------------------+-----------------------------+------------------------+
+| `MinHash LSH Forest`_     | MinHash, Weighted MinHash   | Jaccard Top-K          |
++---------------------------+-----------------------------+------------------------+
+| `MinHash LSH Ensemble`_   | MinHash                     | Containment Threshold  |
++---------------------------+-----------------------------+------------------------+
+| `HNSW`_                   | Any                         | Custom Metric Top-K    |
++---------------------------+-----------------------------+------------------------+
+datasketch must be used with Python 3.9 or above, NumPy 1.11 or above, and SciPy 1.0.0 or above.
+Note that `MinHash LSH`_ and `MinHash LSH Ensemble`_ also support Redis and Cassandra
+storage layers (see `MinHash LSH at Scale`_).
+Install
+-------
+To install datasketch using ``pip``:
+.. code-block:: bash
+    pip install datasketch
+This will also install NumPy and SciPy as dependencies.
+To install with Redis dependency:
+.. code-block:: bash
+    pip install datasketch[redis]
+To install with Cassandra dependency:
+.. code-block:: bash
+    pip install datasketch[cassandra]
+To install with Bloom filter dependency:
+.. code-block:: bash
+    pip install datasketch[bloom]
+.. _`MinHash`: https://ekzhu.github.io/datasketch/minhash.html
+.. _`Weighted MinHash`: https://ekzhu.github.io/datasketch/weightedminhash.html
+.. _`HyperLogLog`: https://ekzhu.github.io/datasketch/hyperloglog.html
+.. _`HyperLogLog++`: https://ekzhu.github.io/datasketch/hyperloglog.html#hyperloglog-plusplus
+.. _`MinHash LSH`: https://ekzhu.github.io/datasketch/lsh.html
+.. _`MinHash LSH Forest`: https://ekzhu.github.io/datasketch/lshforest.html
+.. _`MinHash LSH Ensemble`: https://ekzhu.github.io/datasketch/lshensemble.html
+.. _`LSHBloom`: https://ekzhu.github.io/datasketch/lshbloom.html
+.. _`Minhash LSH at Scale`: https://ekzhu.github.io/datasketch/lsh.html#minhash-lsh-at-scale
+.. _`HNSW`: https://ekzhu.github.io/datasketch/documentation.html#hnsw
+Contributing
+------------
+We welcome contributions from everyone. Whether you're fixing bugs, adding features, improving documentation, or helping with tests, your contributions are valuable.
+Development Setup
+^^^^^^^^^^^^^^^^^
+The project uses ``uv`` for fast and reliable Python package management. Follow these steps to set up your development environment:
+1. **Install uv**: Follow the official installation guide at https://docs.astral.sh/uv/getting-started/installation/
+2. **Clone the repository**:
+   .. code-block:: bash
+       git clone https://github.com/ekzhu/datasketch.git
+       cd datasketch
+3. **Set up the environment**:
+   .. code-block:: bash
+       # Create a virtual environment
+       # (Optional: specify Python version with --python 3.x)
+       uv venv
+       # Activate the virtual environment (optional, uv run commands work without it)
+       source .venv/bin/activate
+       # Install all dependencies
+       uv sync
+4. **Verify installation**:
+   .. code-block:: bash
+       # Run tests to ensure everything works
+       uv run pytest
+5. **Optional dependencies** (for specific development needs):
+   .. code-block:: bash
+       # For testing
+       uv sync --extra test
+       # For Cassandra support
+       uv sync --extra cassandra
+       # For Redis support
+       uv sync --extra redis
+       # For all extras
+       uv sync --all-extras
+Learn more about ``uv`` at https://docs.astral.sh/uv/
+Development Workflow
+^^^^^^^^^^^^^^^^^^^^
+1. **Fork the repository** on GitHub if you haven't already.
+2. **Create a feature branch** for your changes:
+   .. code-block:: bash
+       git checkout -b feature/your-feature-name
+       # Or for bug fixes:
+       git checkout -b fix/issue-description
+3. **Make your changes** following the project's coding standards.
+4. **Run the tests** to ensure nothing is broken:
+   .. code-block:: bash
+       uv run pytest
+5. **Check code quality** with ruff:
+   .. code-block:: bash
+       # Check for issues
+       uvx ruff check .
+       # Auto-fix formatting issues
+       uvx ruff format .
+6. **Commit your changes** with a clear, descriptive commit message:
+   .. code-block:: bash
+       git commit -m "Add feature: brief description of what was changed"
+7. **Push to your fork** and create a pull request on GitHub:
+   .. code-block:: bash
+       git push origin your-branch-name
+8. **Respond to feedback** from maintainers and iterate on your changes.
+Guidelines
+^^^^^^^^^^
+- Follow PEP 8 style guidelines
+- Write tests for new features
+- Update documentation as needed
+- Keep commits focused and atomic
+- Be respectful in discussions
+For more information, check the `GitHub issues <https://github.com/ekzhu/datasketch/issues>`_ for current priorities or areas needing help. You can also join the discussion on `project roadmap and priorities <https://github.com/ekzhu/datasketch/discussions/252>`_.

datasketch-1.7.0/PKG-INFO → datasketch-1.9.0/README.rst RENAMED Viewed

@@ -1,68 +1,3 @@
-Metadata-Version: 2.4
-Name: datasketch
-Version: 1.7.0
-Summary: Probabilistic data structures for processing and searching very large datasets
-Home-page: https://ekzhu.github.io/datasketch
-Author: ekzhu
-Author-email: ekzhu@cs.toronto.edu
-License: MIT
-Project-URL: Source, https://github.com/ekzhu/datasketch
-Keywords: database datamining
-Classifier: Development Status :: 5 - Production/Stable
-Classifier: Intended Audience :: Developers
-Classifier: Topic :: Database
-Classifier: Topic :: Scientific/Engineering :: Information Analysis
-Classifier: License :: OSI Approved :: MIT License
-Classifier: Programming Language :: Python :: 3.8
-Classifier: Programming Language :: Python :: 3.9
-Classifier: Programming Language :: Python :: 3.10
-Classifier: Programming Language :: Python :: 3.11
-Classifier: Programming Language :: Python :: 3.12
-License-File: LICENSE
-Requires-Dist: numpy>=1.11
-Requires-Dist: scipy>=1.0.0
-Provides-Extra: cassandra
-Requires-Dist: cassandra-driver>=3.20; extra == "cassandra"
-Provides-Extra: redis
-Requires-Dist: redis>=2.10.0; extra == "redis"
-Provides-Extra: bloom
-Requires-Dist: pybloomfilter3>=0.7.2; python_version >= "3.9" and extra == "bloom"
-Requires-Dist: pybloomfiltermmap3==0.6.0; python_version < "3.9" and extra == "bloom"
-Provides-Extra: benchmark
-Requires-Dist: pyhash>=0.9.3; extra == "benchmark"
-Requires-Dist: matplotlib>=3.1.2; extra == "benchmark"
-Requires-Dist: scikit-learn>=0.21.3; extra == "benchmark"
-Requires-Dist: scipy>=1.3.3; extra == "benchmark"
-Requires-Dist: pandas>=0.25.3; extra == "benchmark"
-Requires-Dist: SetSimilaritySearch>=0.1.7; extra == "benchmark"
-Requires-Dist: pyfarmhash>=0.2.2; extra == "benchmark"
-Requires-Dist: nltk>=3.4.5; extra == "benchmark"
-Provides-Extra: test
-Requires-Dist: cassandra-driver>=3.20; extra == "test"
-Requires-Dist: redis>=2.10.0; extra == "test"
-Requires-Dist: mock>=2.0.0; extra == "test"
-Requires-Dist: mockredispy; extra == "test"
-Requires-Dist: coverage; extra == "test"
-Requires-Dist: pymongo>=3.9.0; extra == "test"
-Requires-Dist: nose>=1.3.7; extra == "test"
-Requires-Dist: nose-exclude>=0.5.0; extra == "test"
-Requires-Dist: pytest; extra == "test"
-Provides-Extra: experimental-aio
-Requires-Dist: aiounittest; python_version >= "3.8" and extra == "experimental-aio"
-Requires-Dist: motor>3.6.0; python_version >= "3.8" and extra == "experimental-aio"
-Dynamic: author
-Dynamic: author-email
-Dynamic: classifier
-Dynamic: description
-Dynamic: home-page
-Dynamic: keywords
-Dynamic: license
-Dynamic: license-file
-Dynamic: project-url
-Dynamic: provides-extra
-Dynamic: requires-dist
-Dynamic: summary
 datasketch: Big Data Looks Small
 ================================
@@ -72,6 +7,9 @@ datasketch: Big Data Looks Small
 .. image:: https://zenodo.org/badge/DOI/10.5281/zenodo.598238.svg
    :target: https://zenodo.org/doi/10.5281/zenodo.598238
+.. image:: https://codecov.io/gh/ekzhu/datasketch/branch/master/graph/badge.svg
+    :target: https://codecov.io/gh/ekzhu/datasketch
 datasketch gives you probabilistic data structures that can process and
 search very large amounts of data super fast, with little loss of
 accuracy.
@@ -107,7 +45,7 @@ sub-linear query time:
 | `HNSW`_                   | Any                         | Custom Metric Top-K    |
 +---------------------------+-----------------------------+------------------------+
-datasketch must be used with Python 3.8 or above, NumPy 1.11 or above, and Scipy.
+datasketch must be used with Python 3.9 or above, NumPy 1.11 or above, and SciPy 1.0.0 or above.
 Note that `MinHash LSH`_ and `MinHash LSH Ensemble`_ also support Redis and Cassandra
 storage layers (see `MinHash LSH at Scale`_).
@@ -117,7 +55,7 @@ Install
 To install datasketch using ``pip``:
-::
+.. code-block:: bash
     pip install datasketch
@@ -125,19 +63,19 @@ This will also install NumPy as dependency.
 To install with Redis dependency:
-::
+.. code-block:: bash
     pip install datasketch[redis]
 To install with Cassandra dependency:
-::
+.. code-block:: bash
     pip install datasketch[cassandra]
 To install with Bloom filter dependency:
-::
+.. code-block:: bash
     pip install datasketch[bloom]
@@ -151,3 +89,116 @@ To install with Bloom filter dependency:
 .. _`LSHBloom`: https://ekzhu.github.io/datasketch/lshbloom.html
 .. _`Minhash LSH at Scale`: https://ekzhu.github.io/datasketch/lsh.html#minhash-lsh-at-scale
 .. _`HNSW`: https://ekzhu.github.io/datasketch/documentation.html#hnsw
+Contributing
+------------
+We welcome contributions from everyone. Whether you're fixing bugs, adding features, improving documentation, or helping with tests, your contributions are valuable.
+Development Setup
+^^^^^^^^^^^^^^^^^
+The project uses ``uv`` for fast and reliable Python package management. Follow these steps to set up your development environment:
+1. **Install uv**: Follow the official installation guide at https://docs.astral.sh/uv/getting-started/installation/
+2. **Clone the repository**:
+   .. code-block:: bash
+       git clone https://github.com/ekzhu/datasketch.git
+       cd datasketch
+3. **Set up the environment**:
+   .. code-block:: bash
+       # Create a virtual environment
+       # (Optional: specify Python version with --python 3.x)
+       uv venv
+       # Activate the virtual environment (optional, uv run commands work without it)
+       source .venv/bin/activate
+       # Install all dependencies
+       uv sync
+4. **Verify installation**:
+   .. code-block:: bash
+       # Run tests to ensure everything works
+       uv run pytest
+5. **Optional dependencies** (for specific development needs):
+   .. code-block:: bash
+       # For testing
+       uv sync --extra test
+       # For Cassandra support
+       uv sync --extra cassandra
+       # For Redis support
+       uv sync --extra redis
+       # For all extras
+       uv sync --all-extras
+Learn more about ``uv`` at https://docs.astral.sh/uv/
+Development Workflow
+^^^^^^^^^^^^^^^^^^^^
+1. **Fork the repository** on GitHub if you haven't already.
+2. **Create a feature branch** for your changes:
+   .. code-block:: bash
+       git checkout -b feature/your-feature-name
+       # Or for bug fixes:
+       git checkout -b fix/issue-description
+3. **Make your changes** following the project's coding standards.
+4. **Run the tests** to ensure nothing is broken:
+   .. code-block:: bash
+       uv run pytest
+5. **Check code quality** with ruff:
+   .. code-block:: bash
+       # Check for issues
+       uvx ruff check .
+       # Auto-fix formatting issues
+       uvx ruff format .
+6. **Commit your changes** with a clear, descriptive commit message:
+   .. code-block:: bash
+       git commit -m "Add feature: brief description of what was changed"
+7. **Push to your fork** and create a pull request on GitHub:
+   .. code-block:: bash
+       git push origin your-branch-name
+8. **Respond to feedback** from maintainers and iterate on your changes.
+Guidelines
+^^^^^^^^^^
+- Follow PEP 8 style guidelines
+- Write tests for new features
+- Update documentation as needed
+- Keep commits focused and atomic
+- Be respectful in discussions
+For more information, check the `GitHub issues <https://github.com/ekzhu/datasketch/issues>`_ for current priorities or areas needing help. You can also join the discussion on `project roadmap and priorities <https://github.com/ekzhu/datasketch/discussions/252>`_.

{datasketch-1.7.0 → datasketch-1.9.0}/datasketch/__init__.py RENAMED Viewed

@@ -1,18 +1,43 @@
-from datasketch.hyperloglog import HyperLogLog, HyperLogLogPlusPlus
-from datasketch.minhash import MinHash
+import importlib.metadata
+from typing import Final
+try:
+    _version = importlib.metadata.version(__name__)
+except importlib.metadata.PackageNotFoundError:
+    _version = "0.0.0"  # Fallback for development mode
+__version__: Final[str] = _version
 from datasketch.b_bit_minhash import bBitMinHash
+from datasketch.hashfunc import sha1_hash32
+from datasketch.hnsw import HNSW
+from datasketch.hyperloglog import HyperLogLog, HyperLogLogPlusPlus
+from datasketch.lean_minhash import LeanMinHash
 from datasketch.lsh import MinHashLSH
 from datasketch.lsh_bloom import MinHashLSHBloom
-from datasketch.weighted_minhash import WeightedMinHash, WeightedMinHashGenerator
-from datasketch.lshforest import MinHashLSHForest
 from datasketch.lshensemble import MinHashLSHEnsemble
-from datasketch.lean_minhash import LeanMinHash
-from datasketch.hashfunc import sha1_hash32
-from datasketch.hnsw import HNSW
+from datasketch.lshforest import MinHashLSHForest
+from datasketch.minhash import MinHash
+from datasketch.weighted_minhash import WeightedMinHash, WeightedMinHashGenerator
 # Alias
 WeightedMinHashLSH = MinHashLSH
 WeightedMinHashLSHForest = MinHashLSHForest
-# Version
-from datasketch.version import __version__
+__all__ = [
+    "HNSW",
+    "HyperLogLog",
+    "HyperLogLogPlusPlus",
+    "LeanMinHash",
+    "MinHash",
+    "MinHashLSH",
+    "MinHashLSHBloom",
+    "MinHashLSHEnsemble",
+    "MinHashLSHForest",
+    "WeightedMinHash",
+    "WeightedMinHashGenerator",
+    "WeightedMinHashLSH",
+    "WeightedMinHashLSHForest",
+    "bBitMinHash",
+    "sha1_hash32",
+]

datasketch 1.7.0__tar.gz → 1.9.0__tar.gz

datasketch 1.7.0__tar.gz → 1.9.0__tar.gz