dgenerate-ultralytics-headless 8.3.253__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dgenerate_ultralytics_headless-8.3.253.dist-info/METADATA +405 -0
- dgenerate_ultralytics_headless-8.3.253.dist-info/RECORD +299 -0
- dgenerate_ultralytics_headless-8.3.253.dist-info/WHEEL +5 -0
- dgenerate_ultralytics_headless-8.3.253.dist-info/entry_points.txt +3 -0
- dgenerate_ultralytics_headless-8.3.253.dist-info/licenses/LICENSE +661 -0
- dgenerate_ultralytics_headless-8.3.253.dist-info/top_level.txt +1 -0
- tests/__init__.py +23 -0
- tests/conftest.py +59 -0
- tests/test_cli.py +131 -0
- tests/test_cuda.py +216 -0
- tests/test_engine.py +157 -0
- tests/test_exports.py +309 -0
- tests/test_integrations.py +151 -0
- tests/test_python.py +777 -0
- tests/test_solutions.py +371 -0
- ultralytics/__init__.py +48 -0
- ultralytics/assets/bus.jpg +0 -0
- ultralytics/assets/zidane.jpg +0 -0
- ultralytics/cfg/__init__.py +1028 -0
- ultralytics/cfg/datasets/Argoverse.yaml +78 -0
- ultralytics/cfg/datasets/DOTAv1.5.yaml +37 -0
- ultralytics/cfg/datasets/DOTAv1.yaml +36 -0
- ultralytics/cfg/datasets/GlobalWheat2020.yaml +68 -0
- ultralytics/cfg/datasets/HomeObjects-3K.yaml +32 -0
- ultralytics/cfg/datasets/ImageNet.yaml +2025 -0
- ultralytics/cfg/datasets/Objects365.yaml +447 -0
- ultralytics/cfg/datasets/SKU-110K.yaml +58 -0
- ultralytics/cfg/datasets/TT100K.yaml +346 -0
- ultralytics/cfg/datasets/VOC.yaml +102 -0
- ultralytics/cfg/datasets/VisDrone.yaml +87 -0
- ultralytics/cfg/datasets/african-wildlife.yaml +25 -0
- ultralytics/cfg/datasets/brain-tumor.yaml +22 -0
- ultralytics/cfg/datasets/carparts-seg.yaml +44 -0
- ultralytics/cfg/datasets/coco-pose.yaml +64 -0
- ultralytics/cfg/datasets/coco.yaml +118 -0
- ultralytics/cfg/datasets/coco128-seg.yaml +101 -0
- ultralytics/cfg/datasets/coco128.yaml +101 -0
- ultralytics/cfg/datasets/coco8-grayscale.yaml +103 -0
- ultralytics/cfg/datasets/coco8-multispectral.yaml +104 -0
- ultralytics/cfg/datasets/coco8-pose.yaml +47 -0
- ultralytics/cfg/datasets/coco8-seg.yaml +101 -0
- ultralytics/cfg/datasets/coco8.yaml +101 -0
- ultralytics/cfg/datasets/construction-ppe.yaml +32 -0
- ultralytics/cfg/datasets/crack-seg.yaml +22 -0
- ultralytics/cfg/datasets/dog-pose.yaml +52 -0
- ultralytics/cfg/datasets/dota8-multispectral.yaml +38 -0
- ultralytics/cfg/datasets/dota8.yaml +35 -0
- ultralytics/cfg/datasets/hand-keypoints.yaml +50 -0
- ultralytics/cfg/datasets/kitti.yaml +27 -0
- ultralytics/cfg/datasets/lvis.yaml +1240 -0
- ultralytics/cfg/datasets/medical-pills.yaml +21 -0
- ultralytics/cfg/datasets/open-images-v7.yaml +663 -0
- ultralytics/cfg/datasets/package-seg.yaml +22 -0
- ultralytics/cfg/datasets/signature.yaml +21 -0
- ultralytics/cfg/datasets/tiger-pose.yaml +41 -0
- ultralytics/cfg/datasets/xView.yaml +155 -0
- ultralytics/cfg/default.yaml +130 -0
- ultralytics/cfg/models/11/yolo11-cls-resnet18.yaml +17 -0
- ultralytics/cfg/models/11/yolo11-cls.yaml +33 -0
- ultralytics/cfg/models/11/yolo11-obb.yaml +50 -0
- ultralytics/cfg/models/11/yolo11-pose.yaml +51 -0
- ultralytics/cfg/models/11/yolo11-seg.yaml +50 -0
- ultralytics/cfg/models/11/yolo11.yaml +50 -0
- ultralytics/cfg/models/11/yoloe-11-seg.yaml +48 -0
- ultralytics/cfg/models/11/yoloe-11.yaml +48 -0
- ultralytics/cfg/models/12/yolo12-cls.yaml +32 -0
- ultralytics/cfg/models/12/yolo12-obb.yaml +48 -0
- ultralytics/cfg/models/12/yolo12-pose.yaml +49 -0
- ultralytics/cfg/models/12/yolo12-seg.yaml +48 -0
- ultralytics/cfg/models/12/yolo12.yaml +48 -0
- ultralytics/cfg/models/rt-detr/rtdetr-l.yaml +53 -0
- ultralytics/cfg/models/rt-detr/rtdetr-resnet101.yaml +45 -0
- ultralytics/cfg/models/rt-detr/rtdetr-resnet50.yaml +45 -0
- ultralytics/cfg/models/rt-detr/rtdetr-x.yaml +57 -0
- ultralytics/cfg/models/v10/yolov10b.yaml +45 -0
- ultralytics/cfg/models/v10/yolov10l.yaml +45 -0
- ultralytics/cfg/models/v10/yolov10m.yaml +45 -0
- ultralytics/cfg/models/v10/yolov10n.yaml +45 -0
- ultralytics/cfg/models/v10/yolov10s.yaml +45 -0
- ultralytics/cfg/models/v10/yolov10x.yaml +45 -0
- ultralytics/cfg/models/v3/yolov3-spp.yaml +49 -0
- ultralytics/cfg/models/v3/yolov3-tiny.yaml +40 -0
- ultralytics/cfg/models/v3/yolov3.yaml +49 -0
- ultralytics/cfg/models/v5/yolov5-p6.yaml +62 -0
- ultralytics/cfg/models/v5/yolov5.yaml +51 -0
- ultralytics/cfg/models/v6/yolov6.yaml +56 -0
- ultralytics/cfg/models/v8/yoloe-v8-seg.yaml +48 -0
- ultralytics/cfg/models/v8/yoloe-v8.yaml +48 -0
- ultralytics/cfg/models/v8/yolov8-cls-resnet101.yaml +28 -0
- ultralytics/cfg/models/v8/yolov8-cls-resnet50.yaml +28 -0
- ultralytics/cfg/models/v8/yolov8-cls.yaml +32 -0
- ultralytics/cfg/models/v8/yolov8-ghost-p2.yaml +58 -0
- ultralytics/cfg/models/v8/yolov8-ghost-p6.yaml +60 -0
- ultralytics/cfg/models/v8/yolov8-ghost.yaml +50 -0
- ultralytics/cfg/models/v8/yolov8-obb.yaml +49 -0
- ultralytics/cfg/models/v8/yolov8-p2.yaml +57 -0
- ultralytics/cfg/models/v8/yolov8-p6.yaml +59 -0
- ultralytics/cfg/models/v8/yolov8-pose-p6.yaml +60 -0
- ultralytics/cfg/models/v8/yolov8-pose.yaml +50 -0
- ultralytics/cfg/models/v8/yolov8-rtdetr.yaml +49 -0
- ultralytics/cfg/models/v8/yolov8-seg-p6.yaml +59 -0
- ultralytics/cfg/models/v8/yolov8-seg.yaml +49 -0
- ultralytics/cfg/models/v8/yolov8-world.yaml +51 -0
- ultralytics/cfg/models/v8/yolov8-worldv2.yaml +49 -0
- ultralytics/cfg/models/v8/yolov8.yaml +49 -0
- ultralytics/cfg/models/v9/yolov9c-seg.yaml +41 -0
- ultralytics/cfg/models/v9/yolov9c.yaml +41 -0
- ultralytics/cfg/models/v9/yolov9e-seg.yaml +64 -0
- ultralytics/cfg/models/v9/yolov9e.yaml +64 -0
- ultralytics/cfg/models/v9/yolov9m.yaml +41 -0
- ultralytics/cfg/models/v9/yolov9s.yaml +41 -0
- ultralytics/cfg/models/v9/yolov9t.yaml +41 -0
- ultralytics/cfg/trackers/botsort.yaml +21 -0
- ultralytics/cfg/trackers/bytetrack.yaml +12 -0
- ultralytics/data/__init__.py +26 -0
- ultralytics/data/annotator.py +66 -0
- ultralytics/data/augment.py +2801 -0
- ultralytics/data/base.py +435 -0
- ultralytics/data/build.py +437 -0
- ultralytics/data/converter.py +855 -0
- ultralytics/data/dataset.py +834 -0
- ultralytics/data/loaders.py +704 -0
- ultralytics/data/scripts/download_weights.sh +18 -0
- ultralytics/data/scripts/get_coco.sh +61 -0
- ultralytics/data/scripts/get_coco128.sh +18 -0
- ultralytics/data/scripts/get_imagenet.sh +52 -0
- ultralytics/data/split.py +138 -0
- ultralytics/data/split_dota.py +344 -0
- ultralytics/data/utils.py +798 -0
- ultralytics/engine/__init__.py +1 -0
- ultralytics/engine/exporter.py +1580 -0
- ultralytics/engine/model.py +1125 -0
- ultralytics/engine/predictor.py +508 -0
- ultralytics/engine/results.py +1522 -0
- ultralytics/engine/trainer.py +977 -0
- ultralytics/engine/tuner.py +449 -0
- ultralytics/engine/validator.py +387 -0
- ultralytics/hub/__init__.py +166 -0
- ultralytics/hub/auth.py +151 -0
- ultralytics/hub/google/__init__.py +174 -0
- ultralytics/hub/session.py +422 -0
- ultralytics/hub/utils.py +162 -0
- ultralytics/models/__init__.py +9 -0
- ultralytics/models/fastsam/__init__.py +7 -0
- ultralytics/models/fastsam/model.py +79 -0
- ultralytics/models/fastsam/predict.py +169 -0
- ultralytics/models/fastsam/utils.py +23 -0
- ultralytics/models/fastsam/val.py +38 -0
- ultralytics/models/nas/__init__.py +7 -0
- ultralytics/models/nas/model.py +98 -0
- ultralytics/models/nas/predict.py +56 -0
- ultralytics/models/nas/val.py +38 -0
- ultralytics/models/rtdetr/__init__.py +7 -0
- ultralytics/models/rtdetr/model.py +63 -0
- ultralytics/models/rtdetr/predict.py +88 -0
- ultralytics/models/rtdetr/train.py +89 -0
- ultralytics/models/rtdetr/val.py +216 -0
- ultralytics/models/sam/__init__.py +25 -0
- ultralytics/models/sam/amg.py +275 -0
- ultralytics/models/sam/build.py +365 -0
- ultralytics/models/sam/build_sam3.py +377 -0
- ultralytics/models/sam/model.py +169 -0
- ultralytics/models/sam/modules/__init__.py +1 -0
- ultralytics/models/sam/modules/blocks.py +1067 -0
- ultralytics/models/sam/modules/decoders.py +495 -0
- ultralytics/models/sam/modules/encoders.py +794 -0
- ultralytics/models/sam/modules/memory_attention.py +298 -0
- ultralytics/models/sam/modules/sam.py +1160 -0
- ultralytics/models/sam/modules/tiny_encoder.py +979 -0
- ultralytics/models/sam/modules/transformer.py +344 -0
- ultralytics/models/sam/modules/utils.py +512 -0
- ultralytics/models/sam/predict.py +3940 -0
- ultralytics/models/sam/sam3/__init__.py +3 -0
- ultralytics/models/sam/sam3/decoder.py +546 -0
- ultralytics/models/sam/sam3/encoder.py +529 -0
- ultralytics/models/sam/sam3/geometry_encoders.py +415 -0
- ultralytics/models/sam/sam3/maskformer_segmentation.py +286 -0
- ultralytics/models/sam/sam3/model_misc.py +199 -0
- ultralytics/models/sam/sam3/necks.py +129 -0
- ultralytics/models/sam/sam3/sam3_image.py +339 -0
- ultralytics/models/sam/sam3/text_encoder_ve.py +307 -0
- ultralytics/models/sam/sam3/vitdet.py +547 -0
- ultralytics/models/sam/sam3/vl_combiner.py +160 -0
- ultralytics/models/utils/__init__.py +1 -0
- ultralytics/models/utils/loss.py +466 -0
- ultralytics/models/utils/ops.py +315 -0
- ultralytics/models/yolo/__init__.py +7 -0
- ultralytics/models/yolo/classify/__init__.py +7 -0
- ultralytics/models/yolo/classify/predict.py +90 -0
- ultralytics/models/yolo/classify/train.py +202 -0
- ultralytics/models/yolo/classify/val.py +216 -0
- ultralytics/models/yolo/detect/__init__.py +7 -0
- ultralytics/models/yolo/detect/predict.py +122 -0
- ultralytics/models/yolo/detect/train.py +227 -0
- ultralytics/models/yolo/detect/val.py +507 -0
- ultralytics/models/yolo/model.py +430 -0
- ultralytics/models/yolo/obb/__init__.py +7 -0
- ultralytics/models/yolo/obb/predict.py +56 -0
- ultralytics/models/yolo/obb/train.py +79 -0
- ultralytics/models/yolo/obb/val.py +302 -0
- ultralytics/models/yolo/pose/__init__.py +7 -0
- ultralytics/models/yolo/pose/predict.py +65 -0
- ultralytics/models/yolo/pose/train.py +110 -0
- ultralytics/models/yolo/pose/val.py +248 -0
- ultralytics/models/yolo/segment/__init__.py +7 -0
- ultralytics/models/yolo/segment/predict.py +109 -0
- ultralytics/models/yolo/segment/train.py +69 -0
- ultralytics/models/yolo/segment/val.py +307 -0
- ultralytics/models/yolo/world/__init__.py +5 -0
- ultralytics/models/yolo/world/train.py +173 -0
- ultralytics/models/yolo/world/train_world.py +178 -0
- ultralytics/models/yolo/yoloe/__init__.py +22 -0
- ultralytics/models/yolo/yoloe/predict.py +162 -0
- ultralytics/models/yolo/yoloe/train.py +287 -0
- ultralytics/models/yolo/yoloe/train_seg.py +122 -0
- ultralytics/models/yolo/yoloe/val.py +206 -0
- ultralytics/nn/__init__.py +27 -0
- ultralytics/nn/autobackend.py +964 -0
- ultralytics/nn/modules/__init__.py +182 -0
- ultralytics/nn/modules/activation.py +54 -0
- ultralytics/nn/modules/block.py +1947 -0
- ultralytics/nn/modules/conv.py +669 -0
- ultralytics/nn/modules/head.py +1183 -0
- ultralytics/nn/modules/transformer.py +793 -0
- ultralytics/nn/modules/utils.py +159 -0
- ultralytics/nn/tasks.py +1768 -0
- ultralytics/nn/text_model.py +356 -0
- ultralytics/py.typed +1 -0
- ultralytics/solutions/__init__.py +41 -0
- ultralytics/solutions/ai_gym.py +108 -0
- ultralytics/solutions/analytics.py +264 -0
- ultralytics/solutions/config.py +107 -0
- ultralytics/solutions/distance_calculation.py +123 -0
- ultralytics/solutions/heatmap.py +125 -0
- ultralytics/solutions/instance_segmentation.py +86 -0
- ultralytics/solutions/object_blurrer.py +89 -0
- ultralytics/solutions/object_counter.py +190 -0
- ultralytics/solutions/object_cropper.py +87 -0
- ultralytics/solutions/parking_management.py +280 -0
- ultralytics/solutions/queue_management.py +93 -0
- ultralytics/solutions/region_counter.py +133 -0
- ultralytics/solutions/security_alarm.py +151 -0
- ultralytics/solutions/similarity_search.py +219 -0
- ultralytics/solutions/solutions.py +828 -0
- ultralytics/solutions/speed_estimation.py +114 -0
- ultralytics/solutions/streamlit_inference.py +260 -0
- ultralytics/solutions/templates/similarity-search.html +156 -0
- ultralytics/solutions/trackzone.py +88 -0
- ultralytics/solutions/vision_eye.py +67 -0
- ultralytics/trackers/__init__.py +7 -0
- ultralytics/trackers/basetrack.py +115 -0
- ultralytics/trackers/bot_sort.py +257 -0
- ultralytics/trackers/byte_tracker.py +469 -0
- ultralytics/trackers/track.py +116 -0
- ultralytics/trackers/utils/__init__.py +1 -0
- ultralytics/trackers/utils/gmc.py +339 -0
- ultralytics/trackers/utils/kalman_filter.py +482 -0
- ultralytics/trackers/utils/matching.py +154 -0
- ultralytics/utils/__init__.py +1450 -0
- ultralytics/utils/autobatch.py +118 -0
- ultralytics/utils/autodevice.py +205 -0
- ultralytics/utils/benchmarks.py +728 -0
- ultralytics/utils/callbacks/__init__.py +5 -0
- ultralytics/utils/callbacks/base.py +233 -0
- ultralytics/utils/callbacks/clearml.py +146 -0
- ultralytics/utils/callbacks/comet.py +625 -0
- ultralytics/utils/callbacks/dvc.py +197 -0
- ultralytics/utils/callbacks/hub.py +110 -0
- ultralytics/utils/callbacks/mlflow.py +134 -0
- ultralytics/utils/callbacks/neptune.py +126 -0
- ultralytics/utils/callbacks/platform.py +453 -0
- ultralytics/utils/callbacks/raytune.py +42 -0
- ultralytics/utils/callbacks/tensorboard.py +123 -0
- ultralytics/utils/callbacks/wb.py +188 -0
- ultralytics/utils/checks.py +1020 -0
- ultralytics/utils/cpu.py +85 -0
- ultralytics/utils/dist.py +123 -0
- ultralytics/utils/downloads.py +529 -0
- ultralytics/utils/errors.py +35 -0
- ultralytics/utils/events.py +113 -0
- ultralytics/utils/export/__init__.py +7 -0
- ultralytics/utils/export/engine.py +237 -0
- ultralytics/utils/export/imx.py +325 -0
- ultralytics/utils/export/tensorflow.py +231 -0
- ultralytics/utils/files.py +219 -0
- ultralytics/utils/git.py +137 -0
- ultralytics/utils/instance.py +484 -0
- ultralytics/utils/logger.py +506 -0
- ultralytics/utils/loss.py +849 -0
- ultralytics/utils/metrics.py +1563 -0
- ultralytics/utils/nms.py +337 -0
- ultralytics/utils/ops.py +664 -0
- ultralytics/utils/patches.py +201 -0
- ultralytics/utils/plotting.py +1047 -0
- ultralytics/utils/tal.py +404 -0
- ultralytics/utils/torch_utils.py +984 -0
- ultralytics/utils/tqdm.py +443 -0
- ultralytics/utils/triton.py +112 -0
- ultralytics/utils/tuner.py +168 -0
|
@@ -0,0 +1,219 @@
|
|
|
1
|
+
# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
import os
|
|
6
|
+
from pathlib import Path
|
|
7
|
+
from typing import Any
|
|
8
|
+
|
|
9
|
+
import numpy as np
|
|
10
|
+
from PIL import Image
|
|
11
|
+
|
|
12
|
+
from ultralytics.data.utils import IMG_FORMATS
|
|
13
|
+
from ultralytics.utils import LOGGER, TORCH_VERSION
|
|
14
|
+
from ultralytics.utils.checks import check_requirements
|
|
15
|
+
from ultralytics.utils.torch_utils import TORCH_2_4, select_device
|
|
16
|
+
|
|
17
|
+
os.environ["KMP_DUPLICATE_LIB_OK"] = "TRUE" # Avoid OpenMP conflict on some systems
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
class VisualAISearch:
|
|
21
|
+
"""A semantic image search system that leverages OpenCLIP for generating high-quality image and text embeddings and
|
|
22
|
+
FAISS for fast similarity-based retrieval.
|
|
23
|
+
|
|
24
|
+
This class aligns image and text embeddings in a shared semantic space, enabling users to search large collections
|
|
25
|
+
of images using natural language queries with high accuracy and speed.
|
|
26
|
+
|
|
27
|
+
Attributes:
|
|
28
|
+
data (str): Directory containing images.
|
|
29
|
+
device (str): Computation device, e.g., 'cpu' or 'cuda'.
|
|
30
|
+
faiss_index (str): Path to the FAISS index file.
|
|
31
|
+
data_path_npy (str): Path to the numpy file storing image paths.
|
|
32
|
+
data_dir (Path): Path object for the data directory.
|
|
33
|
+
model: Loaded CLIP model.
|
|
34
|
+
index: FAISS index for similarity search.
|
|
35
|
+
image_paths (list[str]): List of image file paths.
|
|
36
|
+
|
|
37
|
+
Methods:
|
|
38
|
+
extract_image_feature: Extract CLIP embedding from an image.
|
|
39
|
+
extract_text_feature: Extract CLIP embedding from text.
|
|
40
|
+
load_or_build_index: Load existing FAISS index or build new one.
|
|
41
|
+
search: Perform semantic search for similar images.
|
|
42
|
+
|
|
43
|
+
Examples:
|
|
44
|
+
Initialize and search for images
|
|
45
|
+
>>> searcher = VisualAISearch(data="path/to/images", device="cuda")
|
|
46
|
+
>>> results = searcher.search("a cat sitting on a chair", k=10)
|
|
47
|
+
"""
|
|
48
|
+
|
|
49
|
+
def __init__(self, **kwargs: Any) -> None:
|
|
50
|
+
"""Initialize the VisualAISearch class with FAISS index and CLIP model."""
|
|
51
|
+
assert TORCH_2_4, f"VisualAISearch requires torch>=2.4 (found torch=={TORCH_VERSION})"
|
|
52
|
+
from ultralytics.nn.text_model import build_text_model
|
|
53
|
+
|
|
54
|
+
check_requirements("faiss-cpu")
|
|
55
|
+
|
|
56
|
+
self.faiss = __import__("faiss")
|
|
57
|
+
self.faiss_index = "faiss.index"
|
|
58
|
+
self.data_path_npy = "paths.npy"
|
|
59
|
+
self.data_dir = Path(kwargs.get("data", "images"))
|
|
60
|
+
self.device = select_device(kwargs.get("device", "cpu"))
|
|
61
|
+
|
|
62
|
+
if not self.data_dir.exists():
|
|
63
|
+
from ultralytics.utils import ASSETS_URL
|
|
64
|
+
|
|
65
|
+
LOGGER.warning(f"{self.data_dir} not found. Downloading images.zip from {ASSETS_URL}/images.zip")
|
|
66
|
+
from ultralytics.utils.downloads import safe_download
|
|
67
|
+
|
|
68
|
+
safe_download(url=f"{ASSETS_URL}/images.zip", unzip=True, retry=3)
|
|
69
|
+
self.data_dir = Path("images")
|
|
70
|
+
|
|
71
|
+
self.model = build_text_model("clip:ViT-B/32", device=self.device)
|
|
72
|
+
|
|
73
|
+
self.index = None
|
|
74
|
+
self.image_paths = []
|
|
75
|
+
|
|
76
|
+
self.load_or_build_index()
|
|
77
|
+
|
|
78
|
+
def extract_image_feature(self, path: Path) -> np.ndarray:
|
|
79
|
+
"""Extract CLIP image embedding from the given image path."""
|
|
80
|
+
return self.model.encode_image(Image.open(path)).detach().cpu().numpy()
|
|
81
|
+
|
|
82
|
+
def extract_text_feature(self, text: str) -> np.ndarray:
|
|
83
|
+
"""Extract CLIP text embedding from the given text query."""
|
|
84
|
+
return self.model.encode_text(self.model.tokenize([text])).detach().cpu().numpy()
|
|
85
|
+
|
|
86
|
+
def load_or_build_index(self) -> None:
|
|
87
|
+
"""Load existing FAISS index or build a new one from image features.
|
|
88
|
+
|
|
89
|
+
Checks if FAISS index and image paths exist on disk. If found, loads them directly. Otherwise, builds a new
|
|
90
|
+
index by extracting features from all images in the data directory, normalizes the features, and saves both the
|
|
91
|
+
index and image paths for future use.
|
|
92
|
+
"""
|
|
93
|
+
# Check if the FAISS index and corresponding image paths already exist
|
|
94
|
+
if Path(self.faiss_index).exists() and Path(self.data_path_npy).exists():
|
|
95
|
+
LOGGER.info("Loading existing FAISS index...")
|
|
96
|
+
self.index = self.faiss.read_index(self.faiss_index) # Load the FAISS index from disk
|
|
97
|
+
self.image_paths = np.load(self.data_path_npy) # Load the saved image path list
|
|
98
|
+
return # Exit the function as the index is successfully loaded
|
|
99
|
+
|
|
100
|
+
# If the index doesn't exist, start building it from scratch
|
|
101
|
+
LOGGER.info("Building FAISS index from images...")
|
|
102
|
+
vectors = [] # List to store feature vectors of images
|
|
103
|
+
|
|
104
|
+
# Iterate over all image files in the data directory
|
|
105
|
+
for file in self.data_dir.iterdir():
|
|
106
|
+
# Skip files that are not valid image formats
|
|
107
|
+
if file.suffix.lower().lstrip(".") not in IMG_FORMATS:
|
|
108
|
+
continue
|
|
109
|
+
try:
|
|
110
|
+
# Extract feature vector for the image and add to the list
|
|
111
|
+
vectors.append(self.extract_image_feature(file))
|
|
112
|
+
self.image_paths.append(file.name) # Store the corresponding image name
|
|
113
|
+
except Exception as e:
|
|
114
|
+
LOGGER.warning(f"Skipping {file.name}: {e}")
|
|
115
|
+
|
|
116
|
+
# If no vectors were successfully created, raise an error
|
|
117
|
+
if not vectors:
|
|
118
|
+
raise RuntimeError("No image embeddings could be generated.")
|
|
119
|
+
|
|
120
|
+
vectors = np.vstack(vectors).astype("float32") # Stack all vectors into a NumPy array and convert to float32
|
|
121
|
+
self.faiss.normalize_L2(vectors) # Normalize vectors to unit length for cosine similarity
|
|
122
|
+
|
|
123
|
+
self.index = self.faiss.IndexFlatIP(vectors.shape[1]) # Create a new FAISS index using inner product
|
|
124
|
+
self.index.add(vectors) # Add the normalized vectors to the FAISS index
|
|
125
|
+
self.faiss.write_index(self.index, self.faiss_index) # Save the newly built FAISS index to disk
|
|
126
|
+
np.save(self.data_path_npy, np.array(self.image_paths)) # Save the list of image paths to disk
|
|
127
|
+
|
|
128
|
+
LOGGER.info(f"Indexed {len(self.image_paths)} images.")
|
|
129
|
+
|
|
130
|
+
def search(self, query: str, k: int = 30, similarity_thresh: float = 0.1) -> list[str]:
|
|
131
|
+
"""Return top-k semantically similar images to the given query.
|
|
132
|
+
|
|
133
|
+
Args:
|
|
134
|
+
query (str): Natural language text query to search for.
|
|
135
|
+
k (int, optional): Maximum number of results to return.
|
|
136
|
+
similarity_thresh (float, optional): Minimum similarity threshold for filtering results.
|
|
137
|
+
|
|
138
|
+
Returns:
|
|
139
|
+
(list[str]): List of image filenames ranked by similarity score.
|
|
140
|
+
|
|
141
|
+
Examples:
|
|
142
|
+
Search for images matching a query
|
|
143
|
+
>>> searcher = VisualAISearch(data="images")
|
|
144
|
+
>>> results = searcher.search("red car", k=5, similarity_thresh=0.2)
|
|
145
|
+
"""
|
|
146
|
+
text_feat = self.extract_text_feature(query).astype("float32")
|
|
147
|
+
self.faiss.normalize_L2(text_feat)
|
|
148
|
+
|
|
149
|
+
D, index = self.index.search(text_feat, k)
|
|
150
|
+
results = [
|
|
151
|
+
(self.image_paths[i], float(D[0][idx])) for idx, i in enumerate(index[0]) if D[0][idx] >= similarity_thresh
|
|
152
|
+
]
|
|
153
|
+
results.sort(key=lambda x: x[1], reverse=True)
|
|
154
|
+
|
|
155
|
+
LOGGER.info("\nRanked Results:")
|
|
156
|
+
for name, score in results:
|
|
157
|
+
LOGGER.info(f" - {name} | Similarity: {score:.4f}")
|
|
158
|
+
|
|
159
|
+
return [r[0] for r in results]
|
|
160
|
+
|
|
161
|
+
def __call__(self, query: str) -> list[str]:
|
|
162
|
+
"""Direct call interface for the search function."""
|
|
163
|
+
return self.search(query)
|
|
164
|
+
|
|
165
|
+
|
|
166
|
+
class SearchApp:
|
|
167
|
+
"""A Flask-based web interface for semantic image search with natural language queries.
|
|
168
|
+
|
|
169
|
+
This class provides a clean, responsive frontend that enables users to input natural language queries and instantly
|
|
170
|
+
view the most relevant images retrieved from the indexed database.
|
|
171
|
+
|
|
172
|
+
Attributes:
|
|
173
|
+
render_template: Flask template rendering function.
|
|
174
|
+
request: Flask request object.
|
|
175
|
+
searcher (VisualAISearch): Instance of the VisualAISearch class.
|
|
176
|
+
app (Flask): Flask application instance.
|
|
177
|
+
|
|
178
|
+
Methods:
|
|
179
|
+
index: Process user queries and display search results.
|
|
180
|
+
run: Start the Flask web application.
|
|
181
|
+
|
|
182
|
+
Examples:
|
|
183
|
+
Start a search application
|
|
184
|
+
>>> app = SearchApp(data="path/to/images", device="cuda")
|
|
185
|
+
>>> app.run(debug=True)
|
|
186
|
+
"""
|
|
187
|
+
|
|
188
|
+
def __init__(self, data: str = "images", device: str | None = None) -> None:
|
|
189
|
+
"""Initialize the SearchApp with VisualAISearch backend.
|
|
190
|
+
|
|
191
|
+
Args:
|
|
192
|
+
data (str, optional): Path to directory containing images to index and search.
|
|
193
|
+
device (str, optional): Device to run inference on (e.g. 'cpu', 'cuda').
|
|
194
|
+
"""
|
|
195
|
+
check_requirements("flask>=3.0.1")
|
|
196
|
+
from flask import Flask, render_template, request
|
|
197
|
+
|
|
198
|
+
self.render_template = render_template
|
|
199
|
+
self.request = request
|
|
200
|
+
self.searcher = VisualAISearch(data=data, device=device)
|
|
201
|
+
self.app = Flask(
|
|
202
|
+
__name__,
|
|
203
|
+
template_folder="templates",
|
|
204
|
+
static_folder=Path(data).resolve(), # Absolute path to serve images
|
|
205
|
+
static_url_path="/images", # URL prefix for images
|
|
206
|
+
)
|
|
207
|
+
self.app.add_url_rule("/", view_func=self.index, methods=["GET", "POST"])
|
|
208
|
+
|
|
209
|
+
def index(self) -> str:
|
|
210
|
+
"""Process user query and display search results in the web interface."""
|
|
211
|
+
results = []
|
|
212
|
+
if self.request.method == "POST":
|
|
213
|
+
query = self.request.form.get("query", "").strip()
|
|
214
|
+
results = self.searcher(query)
|
|
215
|
+
return self.render_template("similarity-search.html", results=results)
|
|
216
|
+
|
|
217
|
+
def run(self, debug: bool = False) -> None:
|
|
218
|
+
"""Start the Flask web application server."""
|
|
219
|
+
self.app.run(debug=debug)
|