PyPI - dgenerate-ultralytics-headless - Versions diffs - 8.3.134__py3-none-any.whl - Mend

dgenerate-ultralytics-headless 8.3.134__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (272) hide show

dgenerate_ultralytics_headless-8.3.134.dist-info/METADATA +400 -0
dgenerate_ultralytics_headless-8.3.134.dist-info/RECORD +272 -0
dgenerate_ultralytics_headless-8.3.134.dist-info/WHEEL +5 -0
dgenerate_ultralytics_headless-8.3.134.dist-info/entry_points.txt +3 -0
dgenerate_ultralytics_headless-8.3.134.dist-info/licenses/LICENSE +661 -0
dgenerate_ultralytics_headless-8.3.134.dist-info/top_level.txt +1 -0
tests/__init__.py +22 -0
tests/conftest.py +83 -0
tests/test_cli.py +138 -0
tests/test_cuda.py +215 -0
tests/test_engine.py +131 -0
tests/test_exports.py +236 -0
tests/test_integrations.py +154 -0
tests/test_python.py +694 -0
tests/test_solutions.py +187 -0
ultralytics/__init__.py +30 -0
ultralytics/assets/bus.jpg +0 -0
ultralytics/assets/zidane.jpg +0 -0
ultralytics/cfg/__init__.py +1023 -0
ultralytics/cfg/datasets/Argoverse.yaml +77 -0
ultralytics/cfg/datasets/DOTAv1.5.yaml +37 -0
ultralytics/cfg/datasets/DOTAv1.yaml +36 -0
ultralytics/cfg/datasets/GlobalWheat2020.yaml +68 -0
ultralytics/cfg/datasets/HomeObjects-3K.yaml +33 -0
ultralytics/cfg/datasets/ImageNet.yaml +2025 -0
ultralytics/cfg/datasets/Objects365.yaml +443 -0
ultralytics/cfg/datasets/SKU-110K.yaml +58 -0
ultralytics/cfg/datasets/VOC.yaml +106 -0
ultralytics/cfg/datasets/VisDrone.yaml +77 -0
ultralytics/cfg/datasets/african-wildlife.yaml +25 -0
ultralytics/cfg/datasets/brain-tumor.yaml +23 -0
ultralytics/cfg/datasets/carparts-seg.yaml +44 -0
ultralytics/cfg/datasets/coco-pose.yaml +42 -0
ultralytics/cfg/datasets/coco.yaml +118 -0
ultralytics/cfg/datasets/coco128-seg.yaml +101 -0
ultralytics/cfg/datasets/coco128.yaml +101 -0
ultralytics/cfg/datasets/coco8-multispectral.yaml +104 -0
ultralytics/cfg/datasets/coco8-pose.yaml +26 -0
ultralytics/cfg/datasets/coco8-seg.yaml +101 -0
ultralytics/cfg/datasets/coco8.yaml +101 -0
ultralytics/cfg/datasets/crack-seg.yaml +22 -0
ultralytics/cfg/datasets/dog-pose.yaml +24 -0
ultralytics/cfg/datasets/dota8-multispectral.yaml +38 -0
ultralytics/cfg/datasets/dota8.yaml +35 -0
ultralytics/cfg/datasets/hand-keypoints.yaml +26 -0
ultralytics/cfg/datasets/lvis.yaml +1240 -0
ultralytics/cfg/datasets/medical-pills.yaml +22 -0
ultralytics/cfg/datasets/open-images-v7.yaml +666 -0
ultralytics/cfg/datasets/package-seg.yaml +22 -0
ultralytics/cfg/datasets/signature.yaml +21 -0
ultralytics/cfg/datasets/tiger-pose.yaml +25 -0
ultralytics/cfg/datasets/xView.yaml +155 -0
ultralytics/cfg/default.yaml +127 -0
ultralytics/cfg/models/11/yolo11-cls-resnet18.yaml +17 -0
ultralytics/cfg/models/11/yolo11-cls.yaml +33 -0
ultralytics/cfg/models/11/yolo11-obb.yaml +50 -0
ultralytics/cfg/models/11/yolo11-pose.yaml +51 -0
ultralytics/cfg/models/11/yolo11-seg.yaml +50 -0
ultralytics/cfg/models/11/yolo11.yaml +50 -0
ultralytics/cfg/models/11/yoloe-11-seg.yaml +48 -0
ultralytics/cfg/models/11/yoloe-11.yaml +48 -0
ultralytics/cfg/models/12/yolo12-cls.yaml +32 -0
ultralytics/cfg/models/12/yolo12-obb.yaml +48 -0
ultralytics/cfg/models/12/yolo12-pose.yaml +49 -0
ultralytics/cfg/models/12/yolo12-seg.yaml +48 -0
ultralytics/cfg/models/12/yolo12.yaml +48 -0
ultralytics/cfg/models/rt-detr/rtdetr-l.yaml +53 -0
ultralytics/cfg/models/rt-detr/rtdetr-resnet101.yaml +45 -0
ultralytics/cfg/models/rt-detr/rtdetr-resnet50.yaml +45 -0
ultralytics/cfg/models/rt-detr/rtdetr-x.yaml +57 -0
ultralytics/cfg/models/v10/yolov10b.yaml +45 -0
ultralytics/cfg/models/v10/yolov10l.yaml +45 -0
ultralytics/cfg/models/v10/yolov10m.yaml +45 -0
ultralytics/cfg/models/v10/yolov10n.yaml +45 -0
ultralytics/cfg/models/v10/yolov10s.yaml +45 -0
ultralytics/cfg/models/v10/yolov10x.yaml +45 -0
ultralytics/cfg/models/v3/yolov3-spp.yaml +49 -0
ultralytics/cfg/models/v3/yolov3-tiny.yaml +40 -0
ultralytics/cfg/models/v3/yolov3.yaml +49 -0
ultralytics/cfg/models/v5/yolov5-p6.yaml +62 -0
ultralytics/cfg/models/v5/yolov5.yaml +51 -0
ultralytics/cfg/models/v6/yolov6.yaml +56 -0
ultralytics/cfg/models/v8/yoloe-v8-seg.yaml +45 -0
ultralytics/cfg/models/v8/yoloe-v8.yaml +45 -0
ultralytics/cfg/models/v8/yolov8-cls-resnet101.yaml +28 -0
ultralytics/cfg/models/v8/yolov8-cls-resnet50.yaml +28 -0
ultralytics/cfg/models/v8/yolov8-cls.yaml +32 -0
ultralytics/cfg/models/v8/yolov8-ghost-p2.yaml +58 -0
ultralytics/cfg/models/v8/yolov8-ghost-p6.yaml +60 -0
ultralytics/cfg/models/v8/yolov8-ghost.yaml +50 -0
ultralytics/cfg/models/v8/yolov8-obb.yaml +49 -0
ultralytics/cfg/models/v8/yolov8-p2.yaml +57 -0
ultralytics/cfg/models/v8/yolov8-p6.yaml +59 -0
ultralytics/cfg/models/v8/yolov8-pose-p6.yaml +60 -0
ultralytics/cfg/models/v8/yolov8-pose.yaml +50 -0
ultralytics/cfg/models/v8/yolov8-rtdetr.yaml +49 -0
ultralytics/cfg/models/v8/yolov8-seg-p6.yaml +59 -0
ultralytics/cfg/models/v8/yolov8-seg.yaml +49 -0
ultralytics/cfg/models/v8/yolov8-world.yaml +51 -0
ultralytics/cfg/models/v8/yolov8-worldv2.yaml +49 -0
ultralytics/cfg/models/v8/yolov8.yaml +49 -0
ultralytics/cfg/models/v9/yolov9c-seg.yaml +41 -0
ultralytics/cfg/models/v9/yolov9c.yaml +41 -0
ultralytics/cfg/models/v9/yolov9e-seg.yaml +64 -0
ultralytics/cfg/models/v9/yolov9e.yaml +64 -0
ultralytics/cfg/models/v9/yolov9m.yaml +41 -0
ultralytics/cfg/models/v9/yolov9s.yaml +41 -0
ultralytics/cfg/models/v9/yolov9t.yaml +41 -0
ultralytics/cfg/trackers/botsort.yaml +22 -0
ultralytics/cfg/trackers/bytetrack.yaml +14 -0
ultralytics/data/__init__.py +26 -0
ultralytics/data/annotator.py +66 -0
ultralytics/data/augment.py +2945 -0
ultralytics/data/base.py +438 -0
ultralytics/data/build.py +258 -0
ultralytics/data/converter.py +754 -0
ultralytics/data/dataset.py +834 -0
ultralytics/data/loaders.py +676 -0
ultralytics/data/scripts/download_weights.sh +18 -0
ultralytics/data/scripts/get_coco.sh +61 -0
ultralytics/data/scripts/get_coco128.sh +18 -0
ultralytics/data/scripts/get_imagenet.sh +52 -0
ultralytics/data/split.py +125 -0
ultralytics/data/split_dota.py +325 -0
ultralytics/data/utils.py +777 -0
ultralytics/engine/__init__.py +1 -0
ultralytics/engine/exporter.py +1519 -0
ultralytics/engine/model.py +1156 -0
ultralytics/engine/predictor.py +502 -0
ultralytics/engine/results.py +1840 -0
ultralytics/engine/trainer.py +853 -0
ultralytics/engine/tuner.py +243 -0
ultralytics/engine/validator.py +377 -0
ultralytics/hub/__init__.py +168 -0
ultralytics/hub/auth.py +137 -0
ultralytics/hub/google/__init__.py +176 -0
ultralytics/hub/session.py +446 -0
ultralytics/hub/utils.py +248 -0
ultralytics/models/__init__.py +9 -0
ultralytics/models/fastsam/__init__.py +7 -0
ultralytics/models/fastsam/model.py +61 -0
ultralytics/models/fastsam/predict.py +181 -0
ultralytics/models/fastsam/utils.py +24 -0
ultralytics/models/fastsam/val.py +40 -0
ultralytics/models/nas/__init__.py +7 -0
ultralytics/models/nas/model.py +102 -0
ultralytics/models/nas/predict.py +58 -0
ultralytics/models/nas/val.py +39 -0
ultralytics/models/rtdetr/__init__.py +7 -0
ultralytics/models/rtdetr/model.py +63 -0
ultralytics/models/rtdetr/predict.py +84 -0
ultralytics/models/rtdetr/train.py +85 -0
ultralytics/models/rtdetr/val.py +191 -0
ultralytics/models/sam/__init__.py +6 -0
ultralytics/models/sam/amg.py +260 -0
ultralytics/models/sam/build.py +358 -0
ultralytics/models/sam/model.py +170 -0
ultralytics/models/sam/modules/__init__.py +1 -0
ultralytics/models/sam/modules/blocks.py +1129 -0
ultralytics/models/sam/modules/decoders.py +515 -0
ultralytics/models/sam/modules/encoders.py +854 -0
ultralytics/models/sam/modules/memory_attention.py +299 -0
ultralytics/models/sam/modules/sam.py +1006 -0
ultralytics/models/sam/modules/tiny_encoder.py +1002 -0
ultralytics/models/sam/modules/transformer.py +351 -0
ultralytics/models/sam/modules/utils.py +394 -0
ultralytics/models/sam/predict.py +1605 -0
ultralytics/models/utils/__init__.py +1 -0
ultralytics/models/utils/loss.py +455 -0
ultralytics/models/utils/ops.py +268 -0
ultralytics/models/yolo/__init__.py +7 -0
ultralytics/models/yolo/classify/__init__.py +7 -0
ultralytics/models/yolo/classify/predict.py +88 -0
ultralytics/models/yolo/classify/train.py +233 -0
ultralytics/models/yolo/classify/val.py +215 -0
ultralytics/models/yolo/detect/__init__.py +7 -0
ultralytics/models/yolo/detect/predict.py +124 -0
ultralytics/models/yolo/detect/train.py +217 -0
ultralytics/models/yolo/detect/val.py +451 -0
ultralytics/models/yolo/model.py +354 -0
ultralytics/models/yolo/obb/__init__.py +7 -0
ultralytics/models/yolo/obb/predict.py +66 -0
ultralytics/models/yolo/obb/train.py +81 -0
ultralytics/models/yolo/obb/val.py +283 -0
ultralytics/models/yolo/pose/__init__.py +7 -0
ultralytics/models/yolo/pose/predict.py +79 -0
ultralytics/models/yolo/pose/train.py +154 -0
ultralytics/models/yolo/pose/val.py +394 -0
ultralytics/models/yolo/segment/__init__.py +7 -0
ultralytics/models/yolo/segment/predict.py +113 -0
ultralytics/models/yolo/segment/train.py +123 -0
ultralytics/models/yolo/segment/val.py +428 -0
ultralytics/models/yolo/world/__init__.py +5 -0
ultralytics/models/yolo/world/train.py +119 -0
ultralytics/models/yolo/world/train_world.py +176 -0
ultralytics/models/yolo/yoloe/__init__.py +22 -0
ultralytics/models/yolo/yoloe/predict.py +169 -0
ultralytics/models/yolo/yoloe/train.py +298 -0
ultralytics/models/yolo/yoloe/train_seg.py +124 -0
ultralytics/models/yolo/yoloe/val.py +191 -0
ultralytics/nn/__init__.py +29 -0
ultralytics/nn/autobackend.py +842 -0
ultralytics/nn/modules/__init__.py +182 -0
ultralytics/nn/modules/activation.py +53 -0
ultralytics/nn/modules/block.py +1966 -0
ultralytics/nn/modules/conv.py +712 -0
ultralytics/nn/modules/head.py +880 -0
ultralytics/nn/modules/transformer.py +713 -0
ultralytics/nn/modules/utils.py +164 -0
ultralytics/nn/tasks.py +1627 -0
ultralytics/nn/text_model.py +351 -0
ultralytics/solutions/__init__.py +41 -0
ultralytics/solutions/ai_gym.py +116 -0
ultralytics/solutions/analytics.py +252 -0
ultralytics/solutions/config.py +106 -0
ultralytics/solutions/distance_calculation.py +124 -0
ultralytics/solutions/heatmap.py +127 -0
ultralytics/solutions/instance_segmentation.py +84 -0
ultralytics/solutions/object_blurrer.py +90 -0
ultralytics/solutions/object_counter.py +195 -0
ultralytics/solutions/object_cropper.py +84 -0
ultralytics/solutions/parking_management.py +273 -0
ultralytics/solutions/queue_management.py +93 -0
ultralytics/solutions/region_counter.py +120 -0
ultralytics/solutions/security_alarm.py +154 -0
ultralytics/solutions/similarity_search.py +172 -0
ultralytics/solutions/solutions.py +724 -0
ultralytics/solutions/speed_estimation.py +110 -0
ultralytics/solutions/streamlit_inference.py +196 -0
ultralytics/solutions/templates/similarity-search.html +160 -0
ultralytics/solutions/trackzone.py +88 -0
ultralytics/solutions/vision_eye.py +68 -0
ultralytics/trackers/__init__.py +7 -0
ultralytics/trackers/basetrack.py +124 -0
ultralytics/trackers/bot_sort.py +260 -0
ultralytics/trackers/byte_tracker.py +480 -0
ultralytics/trackers/track.py +125 -0
ultralytics/trackers/utils/__init__.py +1 -0
ultralytics/trackers/utils/gmc.py +376 -0
ultralytics/trackers/utils/kalman_filter.py +493 -0
ultralytics/trackers/utils/matching.py +157 -0
ultralytics/utils/__init__.py +1435 -0
ultralytics/utils/autobatch.py +106 -0
ultralytics/utils/autodevice.py +174 -0
ultralytics/utils/benchmarks.py +695 -0
ultralytics/utils/callbacks/__init__.py +5 -0
ultralytics/utils/callbacks/base.py +234 -0
ultralytics/utils/callbacks/clearml.py +153 -0
ultralytics/utils/callbacks/comet.py +552 -0
ultralytics/utils/callbacks/dvc.py +205 -0
ultralytics/utils/callbacks/hub.py +108 -0
ultralytics/utils/callbacks/mlflow.py +138 -0
ultralytics/utils/callbacks/neptune.py +140 -0
ultralytics/utils/callbacks/raytune.py +43 -0
ultralytics/utils/callbacks/tensorboard.py +132 -0
ultralytics/utils/callbacks/wb.py +185 -0
ultralytics/utils/checks.py +897 -0
ultralytics/utils/dist.py +119 -0
ultralytics/utils/downloads.py +499 -0
ultralytics/utils/errors.py +43 -0
ultralytics/utils/export.py +219 -0
ultralytics/utils/files.py +221 -0
ultralytics/utils/instance.py +499 -0
ultralytics/utils/loss.py +813 -0
ultralytics/utils/metrics.py +1356 -0
ultralytics/utils/ops.py +885 -0
ultralytics/utils/patches.py +143 -0
ultralytics/utils/plotting.py +1011 -0
ultralytics/utils/tal.py +416 -0
ultralytics/utils/torch_utils.py +990 -0
ultralytics/utils/triton.py +116 -0
ultralytics/utils/tuner.py +159 -0

ultralytics/models/__init__.py ADDED Viewed

@@ -0,0 +1,9 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from .fastsam import FastSAM
+from .nas import NAS
+from .rtdetr import RTDETR
+from .sam import SAM
+from .yolo import YOLO, YOLOE, YOLOWorld
+__all__ = "YOLO", "RTDETR", "SAM", "FastSAM", "NAS", "YOLOWorld", "YOLOE"  # allow simpler import

ultralytics/models/fastsam/__init__.py ADDED Viewed

@@ -0,0 +1,7 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from .model import FastSAM
+from .predict import FastSAMPredictor
+from .val import FastSAMValidator
+__all__ = "FastSAMPredictor", "FastSAM", "FastSAMValidator"

ultralytics/models/fastsam/model.py ADDED Viewed

@@ -0,0 +1,61 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from pathlib import Path
+from ultralytics.engine.model import Model
+from .predict import FastSAMPredictor
+from .val import FastSAMValidator
+class FastSAM(Model):
+    """
+    FastSAM model interface for segment anything tasks.
+    This class extends the base Model class to provide specific functionality for the FastSAM (Fast Segment Anything Model)
+    implementation, allowing for efficient and accurate image segmentation.
+    Attributes:
+        model (str): Path to the pre-trained FastSAM model file.
+        task (str): The task type, set to "segment" for FastSAM models.
+    Examples:
+        >>> from ultralytics import FastSAM
+        >>> model = FastSAM("last.pt")
+        >>> results = model.predict("ultralytics/assets/bus.jpg")
+    """
+    def __init__(self, model="FastSAM-x.pt"):
+        """Initialize the FastSAM model with the specified pre-trained weights."""
+        if str(model) == "FastSAM.pt":
+            model = "FastSAM-x.pt"
+        assert Path(model).suffix not in {".yaml", ".yml"}, "FastSAM models only support pre-trained models."
+        super().__init__(model=model, task="segment")
+    def predict(self, source, stream=False, bboxes=None, points=None, labels=None, texts=None, **kwargs):
+        """
+        Perform segmentation prediction on image or video source.
+        Supports prompted segmentation with bounding boxes, points, labels, and texts. The method packages these
+        prompts and passes them to the parent class predict method.
+        Args:
+            source (str | PIL.Image | numpy.ndarray): Input source for prediction, can be a file path, URL, PIL image,
+                or numpy array.
+            stream (bool): Whether to enable real-time streaming mode for video inputs.
+            bboxes (list): Bounding box coordinates for prompted segmentation in format [[x1, y1, x2, y2], ...].
+            points (list): Point coordinates for prompted segmentation in format [[x, y], ...].
+            labels (list): Class labels for prompted segmentation.
+            texts (list): Text prompts for segmentation guidance.
+            **kwargs (Any): Additional keyword arguments passed to the predictor.
+        Returns:
+            (list): List of Results objects containing the prediction results.
+        """
+        prompts = dict(bboxes=bboxes, points=points, labels=labels, texts=texts)
+        return super().predict(source, stream, prompts=prompts, **kwargs)
+    @property
+    def task_map(self):
+        """Returns a dictionary mapping segment task to corresponding predictor and validator classes."""
+        return {"segment": {"predictor": FastSAMPredictor, "validator": FastSAMValidator}}

ultralytics/models/fastsam/predict.py ADDED Viewed

@@ -0,0 +1,181 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+import torch
+from PIL import Image
+from ultralytics.models.yolo.segment import SegmentationPredictor
+from ultralytics.utils import DEFAULT_CFG, checks
+from ultralytics.utils.metrics import box_iou
+from ultralytics.utils.ops import scale_masks
+from .utils import adjust_bboxes_to_image_border
+class FastSAMPredictor(SegmentationPredictor):
+    """
+    FastSAMPredictor is specialized for fast SAM (Segment Anything Model) segmentation prediction tasks.
+    This class extends the SegmentationPredictor, customizing the prediction pipeline specifically for fast SAM. It
+    adjusts post-processing steps to incorporate mask prediction and non-maximum suppression while optimizing for
+    single-class segmentation.
+    Attributes:
+        prompts (dict): Dictionary containing prompt information for segmentation (bboxes, points, labels, texts).
+        device (torch.device): Device on which model and tensors are processed.
+        clip_model (Any, optional): CLIP model for text-based prompting, loaded on demand.
+        clip_preprocess (Any, optional): CLIP preprocessing function for images, loaded on demand.
+    Methods:
+        postprocess: Applies box postprocessing for FastSAM predictions.
+        prompt: Performs image segmentation inference based on various prompt types.
+        _clip_inference: Performs CLIP inference to calculate similarity between images and text prompts.
+        set_prompts: Sets prompts to be used during inference.
+    """
+    def __init__(self, cfg=DEFAULT_CFG, overrides=None, _callbacks=None):
+        """
+        Initialize the FastSAMPredictor with configuration and callbacks.
+        This initializes a predictor specialized for Fast SAM (Segment Anything Model) segmentation tasks. The predictor
+        extends SegmentationPredictor with custom post-processing for mask prediction and non-maximum suppression
+        optimized for single-class segmentation.
+        Args:
+            cfg (dict): Configuration for the predictor. Defaults to Ultralytics DEFAULT_CFG.
+            overrides (dict, optional): Configuration overrides.
+            _callbacks (list, optional): List of callback functions.
+        """
+        super().__init__(cfg, overrides, _callbacks)
+        self.prompts = {}
+    def postprocess(self, preds, img, orig_imgs):
+        """
+        Apply postprocessing to FastSAM predictions and handle prompts.
+        Args:
+            preds (List[torch.Tensor]): Raw predictions from the model.
+            img (torch.Tensor): Input image tensor that was fed to the model.
+            orig_imgs (List[numpy.ndarray]): Original images before preprocessing.
+        Returns:
+            (List[Results]): Processed results with prompts applied.
+        """
+        bboxes = self.prompts.pop("bboxes", None)
+        points = self.prompts.pop("points", None)
+        labels = self.prompts.pop("labels", None)
+        texts = self.prompts.pop("texts", None)
+        results = super().postprocess(preds, img, orig_imgs)
+        for result in results:
+            full_box = torch.tensor(
+                [0, 0, result.orig_shape[1], result.orig_shape[0]], device=preds[0].device, dtype=torch.float32
+            )
+            boxes = adjust_bboxes_to_image_border(result.boxes.xyxy, result.orig_shape)
+            idx = torch.nonzero(box_iou(full_box[None], boxes) > 0.9).flatten()
+            if idx.numel() != 0:
+                result.boxes.xyxy[idx] = full_box
+        return self.prompt(results, bboxes=bboxes, points=points, labels=labels, texts=texts)
+    def prompt(self, results, bboxes=None, points=None, labels=None, texts=None):
+        """
+        Perform image segmentation inference based on cues like bounding boxes, points, and text prompts.
+        Args:
+            results (Results | List[Results]): Original inference results from FastSAM models without any prompts.
+            bboxes (np.ndarray | List, optional): Bounding boxes with shape (N, 4), in XYXY format.
+            points (np.ndarray | List, optional): Points indicating object locations with shape (N, 2), in pixels.
+            labels (np.ndarray | List, optional): Labels for point prompts, shape (N, ). 1 = foreground, 0 = background.
+            texts (str | List[str], optional): Textual prompts, a list containing string objects.
+        Returns:
+            (List[Results]): Output results filtered and determined by the provided prompts.
+        """
+        if bboxes is None and points is None and texts is None:
+            return results
+        prompt_results = []
+        if not isinstance(results, list):
+            results = [results]
+        for result in results:
+            if len(result) == 0:
+                prompt_results.append(result)
+                continue
+            masks = result.masks.data
+            if masks.shape[1:] != result.orig_shape:
+                masks = scale_masks(masks[None], result.orig_shape)[0]
+            # bboxes prompt
+            idx = torch.zeros(len(result), dtype=torch.bool, device=self.device)
+            if bboxes is not None:
+                bboxes = torch.as_tensor(bboxes, dtype=torch.int32, device=self.device)
+                bboxes = bboxes[None] if bboxes.ndim == 1 else bboxes
+                bbox_areas = (bboxes[:, 3] - bboxes[:, 1]) * (bboxes[:, 2] - bboxes[:, 0])
+                mask_areas = torch.stack([masks[:, b[1] : b[3], b[0] : b[2]].sum(dim=(1, 2)) for b in bboxes])
+                full_mask_areas = torch.sum(masks, dim=(1, 2))
+                union = bbox_areas[:, None] + full_mask_areas - mask_areas
+                idx[torch.argmax(mask_areas / union, dim=1)] = True
+            if points is not None:
+                points = torch.as_tensor(points, dtype=torch.int32, device=self.device)
+                points = points[None] if points.ndim == 1 else points
+                if labels is None:
+                    labels = torch.ones(points.shape[0])
+                labels = torch.as_tensor(labels, dtype=torch.int32, device=self.device)
+                assert len(labels) == len(points), (
+                    f"Excepted `labels` got same size as `point`, but got {len(labels)} and {len(points)}"
+                )
+                point_idx = (
+                    torch.ones(len(result), dtype=torch.bool, device=self.device)
+                    if labels.sum() == 0  # all negative points
+                    else torch.zeros(len(result), dtype=torch.bool, device=self.device)
+                )
+                for point, label in zip(points, labels):
+                    point_idx[torch.nonzero(masks[:, point[1], point[0]], as_tuple=True)[0]] = bool(label)
+                idx |= point_idx
+            if texts is not None:
+                if isinstance(texts, str):
+                    texts = [texts]
+                crop_ims, filter_idx = [], []
+                for i, b in enumerate(result.boxes.xyxy.tolist()):
+                    x1, y1, x2, y2 = (int(x) for x in b)
+                    if masks[i].sum() <= 100:
+                        filter_idx.append(i)
+                        continue
+                    crop_ims.append(Image.fromarray(result.orig_img[y1:y2, x1:x2, ::-1]))
+                similarity = self._clip_inference(crop_ims, texts)
+                text_idx = torch.argmax(similarity, dim=-1)  # (M, )
+                if len(filter_idx):
+                    text_idx += (torch.tensor(filter_idx, device=self.device)[None] <= int(text_idx)).sum(0)
+                idx[text_idx] = True
+            prompt_results.append(result[idx])
+        return prompt_results
+    def _clip_inference(self, images, texts):
+        """
+        Perform CLIP inference to calculate similarity between images and text prompts.
+        Args:
+            images (List[PIL.Image]): List of source images, each should be PIL.Image with RGB channel order.
+            texts (List[str]): List of prompt texts, each should be a string object.
+        Returns:
+            (torch.Tensor): Similarity matrix between given images and texts with shape (M, N).
+        """
+        try:
+            import clip
+        except ImportError:
+            checks.check_requirements("git+https://github.com/ultralytics/CLIP.git")
+            import clip
+        if (not hasattr(self, "clip_model")) or (not hasattr(self, "clip_preprocess")):
+            self.clip_model, self.clip_preprocess = clip.load("ViT-B/32", device=self.device)
+        images = torch.stack([self.clip_preprocess(image).to(self.device) for image in images])
+        tokenized_text = clip.tokenize(texts).to(self.device)
+        image_features = self.clip_model.encode_image(images)
+        text_features = self.clip_model.encode_text(tokenized_text)
+        image_features /= image_features.norm(dim=-1, keepdim=True)  # (N, 512)
+        text_features /= text_features.norm(dim=-1, keepdim=True)  # (M, 512)
+        return (image_features * text_features[:, None]).sum(-1)  # (M, N)
+    def set_prompts(self, prompts):
+        """Set prompts to be used during inference."""
+        self.prompts = prompts

ultralytics/models/fastsam/utils.py ADDED Viewed

@@ -0,0 +1,24 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+def adjust_bboxes_to_image_border(boxes, image_shape, threshold=20):
+    """
+    Adjust bounding boxes to stick to image border if they are within a certain threshold.
+    Args:
+        boxes (torch.Tensor): Bounding boxes with shape (n, 4) in xyxy format.
+        image_shape (Tuple[int, int]): Image dimensions as (height, width).
+        threshold (int): Pixel threshold for considering a box close to the border.
+    Returns:
+       boxes (torch.Tensor): Adjusted bounding boxes with shape (n, 4).
+    """
+    # Image dimensions
+    h, w = image_shape
+    # Adjust boxes that are close to image borders
+    boxes[boxes[:, 0] < threshold, 0] = 0  # x1
+    boxes[boxes[:, 1] < threshold, 1] = 0  # y1
+    boxes[boxes[:, 2] > w - threshold, 2] = w  # x2
+    boxes[boxes[:, 3] > h - threshold, 3] = h  # y2
+    return boxes

ultralytics/models/fastsam/val.py ADDED Viewed

@@ -0,0 +1,40 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from ultralytics.models.yolo.segment import SegmentationValidator
+from ultralytics.utils.metrics import SegmentMetrics
+class FastSAMValidator(SegmentationValidator):
+    """
+    Custom validation class for fast SAM (Segment Anything Model) segmentation in Ultralytics YOLO framework.
+    Extends the SegmentationValidator class, customizing the validation process specifically for fast SAM. This class
+    sets the task to 'segment' and uses the SegmentMetrics for evaluation. Additionally, plotting features are disabled
+    to avoid errors during validation.
+    Attributes:
+        dataloader (torch.utils.data.DataLoader): The data loader object used for validation.
+        save_dir (Path): The directory where validation results will be saved.
+        pbar (tqdm.tqdm): A progress bar object for displaying validation progress.
+        args (SimpleNamespace): Additional arguments for customization of the validation process.
+        _callbacks (list): List of callback functions to be invoked during validation.
+    """
+    def __init__(self, dataloader=None, save_dir=None, pbar=None, args=None, _callbacks=None):
+        """
+        Initialize the FastSAMValidator class, setting the task to 'segment' and metrics to SegmentMetrics.
+        Args:
+            dataloader (torch.utils.data.DataLoader): Dataloader to be used for validation.
+            save_dir (Path, optional): Directory to save results.
+            pbar (tqdm.tqdm): Progress bar for displaying progress.
+            args (SimpleNamespace): Configuration for the validator.
+            _callbacks (list): List of callback functions to be invoked during validation.
+        Notes:
+            Plots for ConfusionMatrix and other related metrics are disabled in this class to avoid errors.
+        """
+        super().__init__(dataloader, save_dir, pbar, args, _callbacks)
+        self.args.task = "segment"
+        self.args.plots = False  # disable ConfusionMatrix and other plots to avoid errors
+        self.metrics = SegmentMetrics(save_dir=self.save_dir)

ultralytics/models/nas/__init__.py ADDED Viewed

@@ -0,0 +1,7 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from .model import NAS
+from .predict import NASPredictor
+from .val import NASValidator
+__all__ = "NASPredictor", "NASValidator", "NAS"

ultralytics/models/nas/model.py ADDED Viewed

@@ -0,0 +1,102 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+"""
+YOLO-NAS model interface.
+Examples:
+    >>> from ultralytics import NAS
+    >>> model = NAS("yolo_nas_s")
+    >>> results = model.predict("ultralytics/assets/bus.jpg")
+"""
+from pathlib import Path
+import torch
+from ultralytics.engine.model import Model
+from ultralytics.utils import DEFAULT_CFG_DICT
+from ultralytics.utils.downloads import attempt_download_asset
+from ultralytics.utils.torch_utils import model_info
+from .predict import NASPredictor
+from .val import NASValidator
+class NAS(Model):
+    """
+    YOLO NAS model for object detection.
+    This class provides an interface for the YOLO-NAS models and extends the `Model` class from Ultralytics engine.
+    It is designed to facilitate the task of object detection using pre-trained or custom-trained YOLO-NAS models.
+    Attributes:
+        model (torch.nn.Module): The loaded YOLO-NAS model.
+        task (str): The task type for the model, defaults to 'detect'.
+        predictor (NASPredictor): The predictor instance for making predictions.
+        validator (NASValidator): The validator instance for model validation.
+    Examples:
+        >>> from ultralytics import NAS
+        >>> model = NAS("yolo_nas_s")
+        >>> results = model.predict("ultralytics/assets/bus.jpg")
+    Notes:
+        YOLO-NAS models only support pre-trained models. Do not provide YAML configuration files.
+    """
+    def __init__(self, model: str = "yolo_nas_s.pt") -> None:
+        """Initialize the NAS model with the provided or default model."""
+        assert Path(model).suffix not in {".yaml", ".yml"}, "YOLO-NAS models only support pre-trained models."
+        super().__init__(model, task="detect")
+    def _load(self, weights: str, task=None) -> None:
+        """
+        Load an existing NAS model weights or create a new NAS model with pretrained weights.
+        Args:
+            weights (str): Path to the model weights file or model name.
+            task (str, optional): Task type for the model.
+        """
+        import super_gradients
+        suffix = Path(weights).suffix
+        if suffix == ".pt":
+            self.model = torch.load(attempt_download_asset(weights))
+        elif suffix == "":
+            self.model = super_gradients.training.models.get(weights, pretrained_weights="coco")
+        # Override the forward method to ignore additional arguments
+        def new_forward(x, *args, **kwargs):
+            """Ignore additional __call__ arguments."""
+            return self.model._original_forward(x)
+        self.model._original_forward = self.model.forward
+        self.model.forward = new_forward
+        # Standardize model
+        self.model.fuse = lambda verbose=True: self.model
+        self.model.stride = torch.tensor([32])
+        self.model.names = dict(enumerate(self.model._class_names))
+        self.model.is_fused = lambda: False  # for info()
+        self.model.yaml = {}  # for info()
+        self.model.pt_path = weights  # for export()
+        self.model.task = "detect"  # for export()
+        self.model.args = {**DEFAULT_CFG_DICT, **self.overrides}  # for export()
+        self.model.eval()
+    def info(self, detailed: bool = False, verbose: bool = True):
+        """
+        Log model information.
+        Args:
+            detailed (bool): Show detailed information about model.
+            verbose (bool): Controls verbosity.
+        Returns:
+            (dict): Model information dictionary.
+        """
+        return model_info(self.model, detailed=detailed, verbose=verbose, imgsz=640)
+    @property
+    def task_map(self):
+        """Return a dictionary mapping tasks to respective predictor and validator classes."""
+        return {"detect": {"predictor": NASPredictor, "validator": NASValidator}}

ultralytics/models/nas/predict.py ADDED Viewed

@@ -0,0 +1,58 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+import torch
+from ultralytics.models.yolo.detect.predict import DetectionPredictor
+from ultralytics.utils import ops
+class NASPredictor(DetectionPredictor):
+    """
+    Ultralytics YOLO NAS Predictor for object detection.
+    This class extends the `DetectionPredictor` from Ultralytics engine and is responsible for post-processing the
+    raw predictions generated by the YOLO NAS models. It applies operations like non-maximum suppression and
+    scaling the bounding boxes to fit the original image dimensions.
+    Attributes:
+        args (Namespace): Namespace containing various configurations for post-processing including confidence threshold,
+            IoU threshold, agnostic NMS flag, maximum detections, and class filtering options.
+        model (torch.nn.Module): The YOLO NAS model used for inference.
+        batch (list): Batch of inputs for processing.
+    Examples:
+        >>> from ultralytics import NAS
+        >>> model = NAS("yolo_nas_s")
+        >>> predictor = model.predictor
+        Assume that raw_preds, img, orig_imgs are available
+        >>> results = predictor.postprocess(raw_preds, img, orig_imgs)
+    Notes:
+        Typically, this class is not instantiated directly. It is used internally within the `NAS` class.
+    """
+    def postprocess(self, preds_in, img, orig_imgs):
+        """
+        Postprocess NAS model predictions to generate final detection results.
+        This method takes raw predictions from a YOLO NAS model, converts bounding box formats, and applies
+        post-processing operations to generate the final detection results compatible with Ultralytics
+        result visualization and analysis tools.
+        Args:
+            preds_in (list): Raw predictions from the NAS model, typically containing bounding boxes and class scores.
+            img (torch.Tensor): Input image tensor that was fed to the model, with shape (B, C, H, W).
+            orig_imgs (list | torch.Tensor | np.ndarray): Original images before preprocessing, used for scaling
+                coordinates back to original dimensions.
+        Returns:
+            (list): List of Results objects containing the processed predictions for each image in the batch.
+        Examples:
+            >>> predictor = NAS("yolo_nas_s").predictor
+            >>> results = predictor.postprocess(raw_preds, img, orig_imgs)
+        """
+        boxes = ops.xyxy2xywh(preds_in[0][0])
+        preds = torch.cat((boxes, preds_in[0][1]), -1).permute(0, 2, 1)  # concatenate with class scores
+        return super().postprocess(preds, img, orig_imgs)

ultralytics/models/nas/val.py ADDED Viewed

@@ -0,0 +1,39 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+import torch
+from ultralytics.models.yolo.detect import DetectionValidator
+from ultralytics.utils import ops
+__all__ = ["NASValidator"]
+class NASValidator(DetectionValidator):
+    """
+    Ultralytics YOLO NAS Validator for object detection.
+    Extends `DetectionValidator` from the Ultralytics models package and is designed to post-process the raw predictions
+    generated by YOLO NAS models. It performs non-maximum suppression to remove overlapping and low-confidence boxes,
+    ultimately producing the final detections.
+    Attributes:
+        args (Namespace): Namespace containing various configurations for post-processing, such as confidence and IoU
+            thresholds.
+        lb (torch.Tensor): Optional tensor for multilabel NMS.
+    Examples:
+        >>> from ultralytics import NAS
+        >>> model = NAS("yolo_nas_s")
+        >>> validator = model.validator
+        Assumes that raw_preds are available
+        >>> final_preds = validator.postprocess(raw_preds)
+    Notes:
+        This class is generally not instantiated directly but is used internally within the `NAS` class.
+    """
+    def postprocess(self, preds_in):
+        """Apply Non-maximum suppression to prediction outputs."""
+        boxes = ops.xyxy2xywh(preds_in[0][0])  # Convert bounding box format from xyxy to xywh
+        preds = torch.cat((boxes, preds_in[0][1]), -1).permute(0, 2, 1)  # Concatenate boxes with scores and permute
+        return super().postprocess(preds)

ultralytics/models/rtdetr/__init__.py ADDED Viewed

@@ -0,0 +1,7 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from .model import RTDETR
+from .predict import RTDETRPredictor
+from .val import RTDETRValidator
+__all__ = "RTDETRPredictor", "RTDETRValidator", "RTDETR"

ultralytics/models/rtdetr/model.py ADDED Viewed

@@ -0,0 +1,63 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+"""
+Interface for Baidu's RT-DETR, a Vision Transformer-based real-time object detector.
+RT-DETR offers real-time performance and high accuracy, excelling in accelerated backends like CUDA with TensorRT.
+It features an efficient hybrid encoder and IoU-aware query selection for enhanced detection accuracy.
+References:
+    https://arxiv.org/pdf/2304.08069.pdf
+"""
+from ultralytics.engine.model import Model
+from ultralytics.nn.tasks import RTDETRDetectionModel
+from .predict import RTDETRPredictor
+from .train import RTDETRTrainer
+from .val import RTDETRValidator
+class RTDETR(Model):
+    """
+    Interface for Baidu's RT-DETR model, a Vision Transformer-based real-time object detector.
+    This model provides real-time performance with high accuracy. It supports efficient hybrid encoding, IoU-aware query
+    selection, and adaptable inference speed.
+    Attributes:
+        model (str): Path to the pre-trained model.
+    Examples:
+        >>> from ultralytics import RTDETR
+        >>> model = RTDETR("rtdetr-l.pt")
+        >>> results = model("image.jpg")
+    """
+    def __init__(self, model: str = "rtdetr-l.pt") -> None:
+        """
+        Initialize the RT-DETR model with the given pre-trained model file.
+        Args:
+            model (str): Path to the pre-trained model. Supports .pt, .yaml, and .yml formats.
+        Raises:
+            NotImplementedError: If the model file extension is not 'pt', 'yaml', or 'yml'.
+        """
+        super().__init__(model=model, task="detect")
+    @property
+    def task_map(self) -> dict:
+        """
+        Returns a task map for RT-DETR, associating tasks with corresponding Ultralytics classes.
+        Returns:
+            (dict): A dictionary mapping task names to Ultralytics task classes for the RT-DETR model.
+        """
+        return {
+            "detect": {
+                "predictor": RTDETRPredictor,
+                "validator": RTDETRValidator,
+                "trainer": RTDETRTrainer,
+                "model": RTDETRDetectionModel,
+            }
+        }