photo-stack-finder 0.1.7__py3-none-any.whl → 0.1.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (68)
  1. orchestrator/__init__.py +2 -2
  2. orchestrator/app.py +6 -11
  3. orchestrator/build_pipeline.py +19 -21
  4. orchestrator/orchestrator_runner.py +11 -8
  5. orchestrator/pipeline_builder.py +126 -126
  6. orchestrator/pipeline_orchestrator.py +604 -604
  7. orchestrator/review_persistence.py +162 -162
  8. orchestrator/static/orchestrator.css +76 -76
  9. orchestrator/static/orchestrator.html +11 -5
  10. orchestrator/static/orchestrator.js +3 -1
  11. overlap_metrics/__init__.py +1 -1
  12. overlap_metrics/config.py +135 -135
  13. overlap_metrics/core.py +284 -284
  14. overlap_metrics/estimators.py +292 -292
  15. overlap_metrics/metrics.py +307 -307
  16. overlap_metrics/registry.py +99 -99
  17. overlap_metrics/utils.py +104 -104
  18. photo_compare/__init__.py +1 -1
  19. photo_compare/base.py +285 -285
  20. photo_compare/config.py +225 -225
  21. photo_compare/distance.py +15 -15
  22. photo_compare/feature_methods.py +173 -173
  23. photo_compare/file_hash.py +29 -29
  24. photo_compare/hash_methods.py +99 -99
  25. photo_compare/histogram_methods.py +118 -118
  26. photo_compare/pixel_methods.py +58 -58
  27. photo_compare/structural_methods.py +104 -104
  28. photo_compare/types.py +28 -28
  29. {photo_stack_finder-0.1.7.dist-info → photo_stack_finder-0.1.8.dist-info}/METADATA +21 -22
  30. photo_stack_finder-0.1.8.dist-info/RECORD +75 -0
  31. scripts/orchestrate.py +12 -10
  32. utils/__init__.py +4 -3
  33. utils/base_pipeline_stage.py +171 -171
  34. utils/base_ports.py +176 -176
  35. utils/benchmark_utils.py +823 -823
  36. utils/channel.py +74 -74
  37. utils/comparison_gates.py +40 -21
  38. utils/compute_benchmarks.py +355 -355
  39. utils/compute_identical.py +94 -24
  40. utils/compute_indices.py +235 -235
  41. utils/compute_perceptual_hash.py +127 -127
  42. utils/compute_perceptual_match.py +240 -240
  43. utils/compute_sha_bins.py +64 -20
  44. utils/compute_template_similarity.py +1 -1
  45. utils/compute_versions.py +483 -483
  46. utils/config.py +8 -5
  47. utils/data_io.py +83 -83
  48. utils/graph_context.py +44 -44
  49. utils/logger.py +2 -2
  50. utils/models.py +2 -2
  51. utils/photo_file.py +90 -91
  52. utils/pipeline_graph.py +334 -334
  53. utils/pipeline_stage.py +408 -408
  54. utils/plot_helpers.py +123 -123
  55. utils/ports.py +136 -136
  56. utils/progress.py +415 -415
  57. utils/report_builder.py +139 -139
  58. utils/review_types.py +55 -55
  59. utils/review_utils.py +10 -19
  60. utils/sequence.py +10 -8
  61. utils/sequence_clustering.py +1 -1
  62. utils/template.py +57 -57
  63. utils/template_parsing.py +71 -0
  64. photo_stack_finder-0.1.7.dist-info/RECORD +0 -74
  65. {photo_stack_finder-0.1.7.dist-info → photo_stack_finder-0.1.8.dist-info}/WHEEL +0 -0
  66. {photo_stack_finder-0.1.7.dist-info → photo_stack_finder-0.1.8.dist-info}/entry_points.txt +0 -0
  67. {photo_stack_finder-0.1.7.dist-info → photo_stack_finder-0.1.8.dist-info}/licenses/LICENSE +0 -0
  68. {photo_stack_finder-0.1.7.dist-info → photo_stack_finder-0.1.8.dist-info}/top_level.txt +0 -0
@@ -1,173 +1,173 @@
1
- """Feature-based similarity methods with caching support."""
2
-
3
- from __future__ import annotations
4
-
5
- from abc import abstractmethod
6
-
7
- import cv2 as cv
8
- import numpy as np
9
- import numpy.typing as npt
10
- from PIL import Image
11
-
12
- from .base import ComparisonMethodName, SimilarityMethod
13
-
14
-
15
- class FeatureMethodBase(SimilarityMethod[npt.NDArray[np.float32] | npt.NDArray[np.uint8]]):
16
- """Base class for feature-based similarity methods."""
17
-
18
- def __init__(self, method_name: ComparisonMethodName, match_threshold: float) -> None:
19
- super().__init__(method_name)
20
- self.match_threshold = match_threshold
21
-
22
- @abstractmethod
23
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.float32] | npt.NDArray[np.uint8]:
24
- """Implement the actual preparation logic for feature descriptors."""
25
- pass
26
-
27
- @abstractmethod
28
- def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
29
- """Get the appropriate matcher for this feature type."""
30
- pass
31
-
32
- def _compare_prepared(
33
- self,
34
- prep1: npt.NDArray[np.float32] | npt.NDArray[np.uint8],
35
- prep2: npt.NDArray[np.float32] | npt.NDArray[np.uint8],
36
- ) -> float:
37
- """Compare feature descriptors using matching ratio."""
38
- min_features: int = min(len(prep1), len(prep2))
39
- if min_features < 2:
40
- return 0.0 # Not enough features to compare
41
-
42
- matcher: cv.FlannBasedMatcher | cv.BFMatcher = self._get_matcher()
43
- matches: list[tuple[cv.DMatch, ...]] = matcher.knnMatch(prep1, prep2, k=2)
44
-
45
- good_matches: list[cv.DMatch] = []
46
- for match_pair in matches:
47
- if len(match_pair) == 2:
48
- m, n = match_pair
49
- if m.distance < self.match_threshold * n.distance:
50
- good_matches.append(m)
51
-
52
- return len(good_matches) / min_features
53
-
54
-
55
- class SIFTMethod(FeatureMethodBase):
56
- """SIFT (Scale-Invariant Feature Transform) keypoint method."""
57
-
58
- LOWE_RATIO_THRESHOLD = 0.7 # Algorithmic constant
59
-
60
- def __init__(self, max_features: int = 0, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
61
- super().__init__("sift", match_threshold)
62
- self.max_features = max_features
63
-
64
- def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
65
- """SIFT uses FLANN matcher for float descriptors."""
66
- return cv.FlannBasedMatcher()
67
-
68
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.float32]:
69
- """Prepare SIFT keypoint descriptors for the image."""
70
- img = Image.fromarray(pixels, mode="RGB")
71
- img = img.convert("L")
72
- gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
73
-
74
- # noinspection PyUnresolvedReferences
75
- sift: cv.SIFT = cv.SIFT_create(nfeatures=self.max_features)
76
- _keypoints, desc = sift.detectAndCompute(gray, None)
77
-
78
- if desc is None:
79
- # Return empty array with correct shape (0 features, 128 dimensions)
80
- return np.array([], dtype=np.float32).reshape(0, 128)
81
-
82
- # SIFT always returns float32 descriptors
83
- return desc.astype(np.float32)
84
-
85
-
86
- class AKAZEMethod(FeatureMethodBase):
87
- """AKAZE (Accelerated-KAZE) keypoint method."""
88
-
89
- LOWE_RATIO_THRESHOLD = 0.75 # May need slight adjustment for binary features
90
-
91
- def __init__(self, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
92
- super().__init__("akaze", match_threshold)
93
-
94
- def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
95
- """AKAZE uses BF matcher for binary descriptors."""
96
- return cv.BFMatcher(cv.NORM_HAMMING, crossCheck=False)
97
-
98
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.uint8]:
99
- """Prepare AKAZE keypoint descriptors for the image."""
100
- img = Image.fromarray(pixels, mode="RGB")
101
- img = img.convert("L")
102
- gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
103
-
104
- # noinspection PyUnresolvedReferences
105
- akaze = cv.AKAZE_create()
106
- _keypoints, desc = akaze.detectAndCompute(gray, None)
107
-
108
- if desc is None:
109
- # Return empty array with correct shape (0 features, 61 bytes for AKAZE)
110
- return np.array([], dtype=np.uint8).reshape(0, 61)
111
-
112
- # AKAZE returns binary (uint8) descriptors
113
- return desc.astype(np.uint8)
114
-
115
-
116
- class ORBMethod(FeatureMethodBase):
117
- """ORB (Oriented FAST and Rotated BRIEF) keypoint method."""
118
-
119
- LOWE_RATIO_THRESHOLD = 0.75 # May need slight adjustment for binary features
120
-
121
- def __init__(self, max_features: int = 0, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
122
- super().__init__("orb", match_threshold)
123
- self.max_features = max_features
124
-
125
- def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
126
- """ORB uses BF matcher for binary descriptors."""
127
- return cv.BFMatcher(cv.NORM_HAMMING, crossCheck=False)
128
-
129
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.uint8]:
130
- """Prepare ORB keypoint descriptors for the image."""
131
- img = Image.fromarray(pixels, mode="RGB")
132
- img = img.convert("L")
133
- gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
134
-
135
- orb = cv.ORB_create(nfeatures=self.max_features)
136
- _keypoints, desc = orb.detectAndCompute(gray, None)
137
-
138
- if desc is None:
139
- # Return empty array with correct shape (0 features, 32 bytes for ORB)
140
- return np.array([], dtype=np.uint8).reshape(0, 32)
141
-
142
- # ORB returns binary (uint8) descriptors
143
- return desc.astype(np.uint8)
144
-
145
-
146
- class BRISKMethod(FeatureMethodBase):
147
- """BRISK (Binary Robust Invariant Scalable Keypoints) method."""
148
-
149
- LOWE_RATIO_THRESHOLD = 0.75 # May need slight adjustment for binary features
150
-
151
- def __init__(self, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
152
- super().__init__("brisk", match_threshold)
153
-
154
- def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
155
- """BRISK uses BF matcher for binary descriptors."""
156
- return cv.BFMatcher(cv.NORM_HAMMING, crossCheck=False)
157
-
158
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.uint8]:
159
- """Prepare BRISK keypoint descriptors for the image."""
160
- img = Image.fromarray(pixels, mode="RGB")
161
- img = img.convert("L")
162
- gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
163
-
164
- # noinspection PyUnresolvedReferences
165
- brisk = cv.BRISK_create()
166
- _keypoints, desc = brisk.detectAndCompute(gray, None)
167
-
168
- if desc is None:
169
- # Return empty array with correct shape (0 features, 64 bytes for BRISK)
170
- return np.array([], dtype=np.uint8).reshape(0, 64)
171
-
172
- # BRISK returns binary (uint8) descriptors
173
- return desc.astype(np.uint8)
1
+ """Feature-based similarity methods with caching support."""
2
+
3
+ from __future__ import annotations
4
+
5
+ from abc import abstractmethod
6
+
7
+ import cv2 as cv
8
+ import numpy as np
9
+ import numpy.typing as npt
10
+ from PIL import Image
11
+
12
+ from .base import ComparisonMethodName, SimilarityMethod
13
+
14
+
15
+ class FeatureMethodBase(SimilarityMethod[npt.NDArray[np.float32] | npt.NDArray[np.uint8]]):
16
+ """Base class for feature-based similarity methods."""
17
+
18
+ def __init__(self, method_name: ComparisonMethodName, match_threshold: float) -> None:
19
+ super().__init__(method_name)
20
+ self.match_threshold = match_threshold
21
+
22
+ @abstractmethod
23
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.float32] | npt.NDArray[np.uint8]:
24
+ """Implement the actual preparation logic for feature descriptors."""
25
+ pass
26
+
27
+ @abstractmethod
28
+ def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
29
+ """Get the appropriate matcher for this feature type."""
30
+ pass
31
+
32
+ def _compare_prepared(
33
+ self,
34
+ prep1: npt.NDArray[np.float32] | npt.NDArray[np.uint8],
35
+ prep2: npt.NDArray[np.float32] | npt.NDArray[np.uint8],
36
+ ) -> float:
37
+ """Compare feature descriptors using matching ratio."""
38
+ min_features: int = min(len(prep1), len(prep2))
39
+ if min_features < 2:
40
+ return 0.0 # Not enough features to compare
41
+
42
+ matcher: cv.FlannBasedMatcher | cv.BFMatcher = self._get_matcher()
43
+ matches: list[tuple[cv.DMatch, ...]] = matcher.knnMatch(prep1, prep2, k=2)
44
+
45
+ good_matches: list[cv.DMatch] = []
46
+ for match_pair in matches:
47
+ if len(match_pair) == 2:
48
+ m, n = match_pair
49
+ if m.distance < self.match_threshold * n.distance:
50
+ good_matches.append(m)
51
+
52
+ return len(good_matches) / min_features
53
+
54
+
55
+ class SIFTMethod(FeatureMethodBase):
56
+ """SIFT (Scale-Invariant Feature Transform) keypoint method."""
57
+
58
+ LOWE_RATIO_THRESHOLD = 0.7 # Algorithmic constant
59
+
60
+ def __init__(self, max_features: int = 0, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
61
+ super().__init__("sift", match_threshold)
62
+ self.max_features = max_features
63
+
64
+ def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
65
+ """SIFT uses FLANN matcher for float descriptors."""
66
+ return cv.FlannBasedMatcher()
67
+
68
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.float32]:
69
+ """Prepare SIFT keypoint descriptors for the image."""
70
+ img = Image.fromarray(pixels, mode="RGB")
71
+ img = img.convert("L")
72
+ gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
73
+
74
+ # noinspection PyUnresolvedReferences
75
+ sift: cv.SIFT = cv.SIFT_create(nfeatures=self.max_features)
76
+ _keypoints, desc = sift.detectAndCompute(gray, None)
77
+
78
+ if desc is None:
79
+ # Return empty array with correct shape (0 features, 128 dimensions)
80
+ return np.array([], dtype=np.float32).reshape(0, 128)
81
+
82
+ # SIFT always returns float32 descriptors
83
+ return desc.astype(np.float32)
84
+
85
+
86
+ class AKAZEMethod(FeatureMethodBase):
87
+ """AKAZE (Accelerated-KAZE) keypoint method."""
88
+
89
+ LOWE_RATIO_THRESHOLD = 0.75 # May need slight adjustment for binary features
90
+
91
+ def __init__(self, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
92
+ super().__init__("akaze", match_threshold)
93
+
94
+ def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
95
+ """AKAZE uses BF matcher for binary descriptors."""
96
+ return cv.BFMatcher(cv.NORM_HAMMING, crossCheck=False)
97
+
98
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.uint8]:
99
+ """Prepare AKAZE keypoint descriptors for the image."""
100
+ img = Image.fromarray(pixels, mode="RGB")
101
+ img = img.convert("L")
102
+ gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
103
+
104
+ # noinspection PyUnresolvedReferences
105
+ akaze = cv.AKAZE_create()
106
+ _keypoints, desc = akaze.detectAndCompute(gray, None)
107
+
108
+ if desc is None:
109
+ # Return empty array with correct shape (0 features, 61 bytes for AKAZE)
110
+ return np.array([], dtype=np.uint8).reshape(0, 61)
111
+
112
+ # AKAZE returns binary (uint8) descriptors
113
+ return desc.astype(np.uint8)
114
+
115
+
116
+ class ORBMethod(FeatureMethodBase):
117
+ """ORB (Oriented FAST and Rotated BRIEF) keypoint method."""
118
+
119
+ LOWE_RATIO_THRESHOLD = 0.75 # May need slight adjustment for binary features
120
+
121
+ def __init__(self, max_features: int = 0, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
122
+ super().__init__("orb", match_threshold)
123
+ self.max_features = max_features
124
+
125
+ def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
126
+ """ORB uses BF matcher for binary descriptors."""
127
+ return cv.BFMatcher(cv.NORM_HAMMING, crossCheck=False)
128
+
129
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.uint8]:
130
+ """Prepare ORB keypoint descriptors for the image."""
131
+ img = Image.fromarray(pixels, mode="RGB")
132
+ img = img.convert("L")
133
+ gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
134
+
135
+ orb = cv.ORB_create(nfeatures=self.max_features)
136
+ _keypoints, desc = orb.detectAndCompute(gray, None)
137
+
138
+ if desc is None:
139
+ # Return empty array with correct shape (0 features, 32 bytes for ORB)
140
+ return np.array([], dtype=np.uint8).reshape(0, 32)
141
+
142
+ # ORB returns binary (uint8) descriptors
143
+ return desc.astype(np.uint8)
144
+
145
+
146
+ class BRISKMethod(FeatureMethodBase):
147
+ """BRISK (Binary Robust Invariant Scalable Keypoints) method."""
148
+
149
+ LOWE_RATIO_THRESHOLD = 0.75 # May need slight adjustment for binary features
150
+
151
+ def __init__(self, match_threshold: float = LOWE_RATIO_THRESHOLD) -> None:
152
+ super().__init__("brisk", match_threshold)
153
+
154
+ def _get_matcher(self) -> cv.FlannBasedMatcher | cv.BFMatcher:
155
+ """BRISK uses BF matcher for binary descriptors."""
156
+ return cv.BFMatcher(cv.NORM_HAMMING, crossCheck=False)
157
+
158
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> npt.NDArray[np.uint8]:
159
+ """Prepare BRISK keypoint descriptors for the image."""
160
+ img = Image.fromarray(pixels, mode="RGB")
161
+ img = img.convert("L")
162
+ gray: npt.NDArray[np.uint8] = np.array(img.resize((512, 512), Image.Resampling.LANCZOS))
163
+
164
+ # noinspection PyUnresolvedReferences
165
+ brisk = cv.BRISK_create()
166
+ _keypoints, desc = brisk.detectAndCompute(gray, None)
167
+
168
+ if desc is None:
169
+ # Return empty array with correct shape (0 features, 64 bytes for BRISK)
170
+ return np.array([], dtype=np.uint8).reshape(0, 64)
171
+
172
+ # BRISK returns binary (uint8) descriptors
173
+ return desc.astype(np.uint8)
@@ -1,29 +1,29 @@
1
- """File hashing utilities for duplicate detection."""
2
-
3
- from __future__ import annotations
4
-
5
- import hashlib
6
- from pathlib import Path
7
-
8
-
9
- def file_sha256(path: Path) -> str:
10
- """Compute SHA256 hash of file contents."""
11
- # Python 3.11+ streaming helper with default buffering for efficiency
12
- # Default buffering (typically 8KB) is critical for WSL/network filesystems
13
- with path.open("rb") as f:
14
- return hashlib.file_digest(f, "sha256").hexdigest()
15
-
16
-
17
- def binary_files_equal(pa: Path, pb: Path, chunk_size: int = 1 << 20) -> bool:
18
- """Return True iff files `a` and `b` are byte-for-byte identical."""
19
- sa, sb = pa.stat(), pb.stat()
20
- if sa.st_size != sb.st_size:
21
- return False
22
- with pa.open("rb") as fa, pb.open("rb") as fb:
23
- while True:
24
- ca = fa.read(chunk_size)
25
- cb = fb.read(chunk_size)
26
- if ca != cb:
27
- return False
28
- if not ca: # reached EOF on both
29
- return True
1
+ """File hashing utilities for duplicate detection."""
2
+
3
+ from __future__ import annotations
4
+
5
+ import hashlib
6
+ from pathlib import Path
7
+
8
+
9
+ def file_sha256(path: Path) -> str:
10
+ """Compute SHA256 hash of file contents."""
11
+ # Python 3.11+ streaming helper with default buffering for efficiency
12
+ # Default buffering (typically 8KB) is critical for WSL/network filesystems
13
+ with path.open("rb") as f:
14
+ return hashlib.file_digest(f, "sha256").hexdigest()
15
+
16
+
17
+ def binary_files_equal(pa: Path, pb: Path, chunk_size: int = 1 << 20) -> bool:
18
+ """Return True iff files `a` and `b` are byte-for-byte identical."""
19
+ sa, sb = pa.stat(), pb.stat()
20
+ if sa.st_size != sb.st_size:
21
+ return False
22
+ with pa.open("rb") as fa, pb.open("rb") as fb:
23
+ while True:
24
+ ca = fa.read(chunk_size)
25
+ cb = fb.read(chunk_size)
26
+ if ca != cb:
27
+ return False
28
+ if not ca: # reached EOF on both
29
+ return True
@@ -1,99 +1,99 @@
1
- """Hash-based similarity methods with caching support."""
2
-
3
- from __future__ import annotations
4
-
5
- import imagehash
6
- import numpy as np
7
- import numpy.typing as npt
8
- from PIL import Image
9
-
10
- from .base import BinningSimilarityMethod
11
- from .distance import hamming_similarity
12
-
13
-
14
- class AHashMethod(BinningSimilarityMethod[bytes, bytes]):
15
- """Average hash method - very fast, basic similarity detection."""
16
-
17
- def __init__(self, hash_size: int) -> None:
18
- super().__init__("ahash")
19
- self.hash_size = hash_size
20
-
21
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
22
- """Prepare average hash for the image."""
23
- img = Image.fromarray(pixels, mode="RGB")
24
- hash_obj = imagehash.average_hash(img, self.hash_size)
25
- return np.packbits(hash_obj.hash).tobytes()
26
-
27
- def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
28
- """Compare hash bytes using Hamming similarity."""
29
- return hamming_similarity(prep1, prep2)
30
-
31
- def _get_bin_key(self, prepared: bytes) -> bytes:
32
- """Use the hash itself as the bin key for exact matches."""
33
- return prepared
34
-
35
-
36
- class DHashMethod(BinningSimilarityMethod[bytes, bytes]):
37
- """Difference hash method - good for detecting crops and borders."""
38
-
39
- def __init__(self, hash_size: int) -> None:
40
- super().__init__("dhash")
41
- self.hash_size = hash_size
42
-
43
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
44
- """Prepare difference hash for the image."""
45
- img = Image.fromarray(pixels, mode="RGB")
46
- hash_obj = imagehash.dhash(img, self.hash_size)
47
- return np.packbits(hash_obj.hash).tobytes()
48
-
49
- def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
50
- """Compare hash bytes using Hamming similarity."""
51
- return hamming_similarity(prep1, prep2)
52
-
53
- def _get_bin_key(self, prepared: bytes) -> bytes:
54
- """Use the hash itself as the bin key for exact matches."""
55
- return prepared
56
-
57
-
58
- class PHashMethod(BinningSimilarityMethod[bytes, bytes]):
59
- """Perceptual hash method - DCT based, robust to minor changes."""
60
-
61
- def __init__(self, hash_size: int) -> None:
62
- super().__init__("phash")
63
- self.hash_size = hash_size
64
-
65
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
66
- """Prepare perceptual hash for the image."""
67
- img = Image.fromarray(pixels, mode="RGB")
68
- hash_obj = imagehash.phash(img, self.hash_size)
69
- return np.packbits(hash_obj.hash).tobytes()
70
-
71
- def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
72
- """Compare hash bytes using Hamming similarity."""
73
- return hamming_similarity(prep1, prep2)
74
-
75
- def _get_bin_key(self, prepared: bytes) -> bytes:
76
- """Use the hash itself as the bin key for exact matches."""
77
- return prepared
78
-
79
-
80
- class WHashMethod(BinningSimilarityMethod[bytes, bytes]):
81
- """Wavelet hash method - good for texture detection."""
82
-
83
- def __init__(self, hash_size: int) -> None:
84
- super().__init__("whash")
85
- self.hash_size = hash_size
86
-
87
- def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
88
- """Prepare wavelet hash for the image."""
89
- img = Image.fromarray(pixels, mode="RGB")
90
- hash_obj = imagehash.whash(img, self.hash_size)
91
- return np.packbits(hash_obj.hash).tobytes()
92
-
93
- def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
94
- """Compare hash bytes using Hamming similarity."""
95
- return hamming_similarity(prep1, prep2)
96
-
97
- def _get_bin_key(self, prepared: bytes) -> bytes:
98
- """Use the hash itself as the bin key for exact matches."""
99
- return prepared
1
+ """Hash-based similarity methods with caching support."""
2
+
3
+ from __future__ import annotations
4
+
5
+ import imagehash
6
+ import numpy as np
7
+ import numpy.typing as npt
8
+ from PIL import Image
9
+
10
+ from .base import BinningSimilarityMethod
11
+ from .distance import hamming_similarity
12
+
13
+
14
+ class AHashMethod(BinningSimilarityMethod[bytes, bytes]):
15
+ """Average hash method - very fast, basic similarity detection."""
16
+
17
+ def __init__(self, hash_size: int) -> None:
18
+ super().__init__("ahash")
19
+ self.hash_size = hash_size
20
+
21
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
22
+ """Prepare average hash for the image."""
23
+ img = Image.fromarray(pixels, mode="RGB")
24
+ hash_obj = imagehash.average_hash(img, self.hash_size)
25
+ return np.packbits(hash_obj.hash).tobytes()
26
+
27
+ def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
28
+ """Compare hash bytes using Hamming similarity."""
29
+ return hamming_similarity(prep1, prep2)
30
+
31
+ def _get_bin_key(self, prepared: bytes) -> bytes:
32
+ """Use the hash itself as the bin key for exact matches."""
33
+ return prepared
34
+
35
+
36
+ class DHashMethod(BinningSimilarityMethod[bytes, bytes]):
37
+ """Difference hash method - good for detecting crops and borders."""
38
+
39
+ def __init__(self, hash_size: int) -> None:
40
+ super().__init__("dhash")
41
+ self.hash_size = hash_size
42
+
43
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
44
+ """Prepare difference hash for the image."""
45
+ img = Image.fromarray(pixels, mode="RGB")
46
+ hash_obj = imagehash.dhash(img, self.hash_size)
47
+ return np.packbits(hash_obj.hash).tobytes()
48
+
49
+ def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
50
+ """Compare hash bytes using Hamming similarity."""
51
+ return hamming_similarity(prep1, prep2)
52
+
53
+ def _get_bin_key(self, prepared: bytes) -> bytes:
54
+ """Use the hash itself as the bin key for exact matches."""
55
+ return prepared
56
+
57
+
58
+ class PHashMethod(BinningSimilarityMethod[bytes, bytes]):
59
+ """Perceptual hash method - DCT based, robust to minor changes."""
60
+
61
+ def __init__(self, hash_size: int) -> None:
62
+ super().__init__("phash")
63
+ self.hash_size = hash_size
64
+
65
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
66
+ """Prepare perceptual hash for the image."""
67
+ img = Image.fromarray(pixels, mode="RGB")
68
+ hash_obj = imagehash.phash(img, self.hash_size)
69
+ return np.packbits(hash_obj.hash).tobytes()
70
+
71
+ def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
72
+ """Compare hash bytes using Hamming similarity."""
73
+ return hamming_similarity(prep1, prep2)
74
+
75
+ def _get_bin_key(self, prepared: bytes) -> bytes:
76
+ """Use the hash itself as the bin key for exact matches."""
77
+ return prepared
78
+
79
+
80
+ class WHashMethod(BinningSimilarityMethod[bytes, bytes]):
81
+ """Wavelet hash method - good for texture detection."""
82
+
83
+ def __init__(self, hash_size: int) -> None:
84
+ super().__init__("whash")
85
+ self.hash_size = hash_size
86
+
87
+ def _prepare_single(self, pixels: npt.NDArray[np.uint8]) -> bytes:
88
+ """Prepare wavelet hash for the image."""
89
+ img = Image.fromarray(pixels, mode="RGB")
90
+ hash_obj = imagehash.whash(img, self.hash_size)
91
+ return np.packbits(hash_obj.hash).tobytes()
92
+
93
+ def _compare_prepared(self, prep1: bytes, prep2: bytes) -> float:
94
+ """Compare hash bytes using Hamming similarity."""
95
+ return hamming_similarity(prep1, prep2)
96
+
97
+ def _get_bin_key(self, prepared: bytes) -> bytes:
98
+ """Use the hash itself as the bin key for exact matches."""
99
+ return prepared