PyPI - ultralytics - Versions diffs - 8.1.28__py3-none-any.whl → 8.3.62__py3-none-any.whl - Mend

ultralytics 8.1.28__py3-none-any.whl → 8.3.62__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (247)

tests/__init__.py +22 -0
tests/conftest.py +83 -0
tests/test_cli.py +122 -0
tests/test_cuda.py +155 -0
tests/test_engine.py +131 -0
tests/test_exports.py +216 -0
tests/test_integrations.py +150 -0
tests/test_python.py +615 -0
tests/test_solutions.py +94 -0
ultralytics/__init__.py +11 -8
ultralytics/cfg/__init__.py +569 -131
ultralytics/cfg/datasets/Argoverse.yaml +2 -1
ultralytics/cfg/datasets/DOTAv1.5.yaml +3 -2
ultralytics/cfg/datasets/DOTAv1.yaml +3 -2
ultralytics/cfg/datasets/GlobalWheat2020.yaml +3 -2
ultralytics/cfg/datasets/ImageNet.yaml +2 -1
ultralytics/cfg/datasets/Objects365.yaml +5 -4
ultralytics/cfg/datasets/SKU-110K.yaml +2 -1
ultralytics/cfg/datasets/VOC.yaml +3 -2
ultralytics/cfg/datasets/VisDrone.yaml +6 -5
ultralytics/cfg/datasets/african-wildlife.yaml +25 -0
ultralytics/cfg/datasets/brain-tumor.yaml +23 -0
ultralytics/cfg/datasets/carparts-seg.yaml +3 -2
ultralytics/cfg/datasets/coco-pose.yaml +7 -6
ultralytics/cfg/datasets/coco.yaml +3 -2
ultralytics/cfg/datasets/coco128-seg.yaml +4 -3
ultralytics/cfg/datasets/coco128.yaml +4 -3
ultralytics/cfg/datasets/coco8-pose.yaml +3 -2
ultralytics/cfg/datasets/coco8-seg.yaml +3 -2
ultralytics/cfg/datasets/coco8.yaml +3 -2
ultralytics/cfg/datasets/crack-seg.yaml +3 -2
ultralytics/cfg/datasets/dog-pose.yaml +24 -0
ultralytics/cfg/datasets/dota8.yaml +3 -2
ultralytics/cfg/datasets/hand-keypoints.yaml +26 -0
ultralytics/cfg/datasets/lvis.yaml +1236 -0
ultralytics/cfg/datasets/medical-pills.yaml +22 -0
ultralytics/cfg/datasets/open-images-v7.yaml +2 -1
ultralytics/cfg/datasets/package-seg.yaml +5 -4
ultralytics/cfg/datasets/signature.yaml +21 -0
ultralytics/cfg/datasets/tiger-pose.yaml +3 -2
ultralytics/cfg/datasets/xView.yaml +2 -1
ultralytics/cfg/default.yaml +14 -11
ultralytics/cfg/models/11/yolo11-cls-resnet18.yaml +24 -0
ultralytics/cfg/models/11/yolo11-cls.yaml +33 -0
ultralytics/cfg/models/11/yolo11-obb.yaml +50 -0
ultralytics/cfg/models/11/yolo11-pose.yaml +51 -0
ultralytics/cfg/models/11/yolo11-seg.yaml +50 -0
ultralytics/cfg/models/11/yolo11.yaml +50 -0
ultralytics/cfg/models/rt-detr/rtdetr-l.yaml +5 -2
ultralytics/cfg/models/rt-detr/rtdetr-resnet101.yaml +5 -2
ultralytics/cfg/models/rt-detr/rtdetr-resnet50.yaml +5 -2
ultralytics/cfg/models/rt-detr/rtdetr-x.yaml +5 -2
ultralytics/cfg/models/v10/yolov10b.yaml +45 -0
ultralytics/cfg/models/v10/yolov10l.yaml +45 -0
ultralytics/cfg/models/v10/yolov10m.yaml +45 -0
ultralytics/cfg/models/v10/yolov10n.yaml +45 -0
ultralytics/cfg/models/v10/yolov10s.yaml +45 -0
ultralytics/cfg/models/v10/yolov10x.yaml +45 -0
ultralytics/cfg/models/v3/yolov3-spp.yaml +5 -2
ultralytics/cfg/models/v3/yolov3-tiny.yaml +5 -2
ultralytics/cfg/models/v3/yolov3.yaml +5 -2
ultralytics/cfg/models/v5/yolov5-p6.yaml +5 -2
ultralytics/cfg/models/v5/yolov5.yaml +5 -2
ultralytics/cfg/models/v6/yolov6.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-cls-resnet101.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-cls-resnet50.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-cls.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-ghost-p2.yaml +6 -2
ultralytics/cfg/models/v8/yolov8-ghost-p6.yaml +6 -2
ultralytics/cfg/models/v8/yolov8-ghost.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-obb.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-p2.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-p6.yaml +10 -7
ultralytics/cfg/models/v8/yolov8-pose-p6.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-pose.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-rtdetr.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-seg-p6.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-seg.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-world.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-worldv2.yaml +5 -2
ultralytics/cfg/models/v8/yolov8.yaml +5 -2
ultralytics/cfg/models/v9/yolov9c-seg.yaml +41 -0
ultralytics/cfg/models/v9/yolov9c.yaml +30 -25
ultralytics/cfg/models/v9/yolov9e-seg.yaml +64 -0
ultralytics/cfg/models/v9/yolov9e.yaml +46 -42
ultralytics/cfg/models/v9/yolov9m.yaml +41 -0
ultralytics/cfg/models/v9/yolov9s.yaml +41 -0
ultralytics/cfg/models/v9/yolov9t.yaml +41 -0
ultralytics/cfg/solutions/default.yaml +24 -0
ultralytics/cfg/trackers/botsort.yaml +8 -5
ultralytics/cfg/trackers/bytetrack.yaml +8 -5
ultralytics/data/__init__.py +14 -3
ultralytics/data/annotator.py +37 -15
ultralytics/data/augment.py +1783 -289
ultralytics/data/base.py +62 -27
ultralytics/data/build.py +36 -8
ultralytics/data/converter.py +196 -36
ultralytics/data/dataset.py +233 -94
ultralytics/data/loaders.py +199 -96
ultralytics/data/split_dota.py +39 -29
ultralytics/data/utils.py +110 -40
ultralytics/engine/__init__.py +1 -1
ultralytics/engine/exporter.py +569 -242
ultralytics/engine/model.py +604 -252
ultralytics/engine/predictor.py +22 -11
ultralytics/engine/results.py +1228 -218
ultralytics/engine/trainer.py +190 -129
ultralytics/engine/tuner.py +18 -18
ultralytics/engine/validator.py +18 -15
ultralytics/hub/__init__.py +31 -13
ultralytics/hub/auth.py +11 -7
ultralytics/hub/google/__init__.py +159 -0
ultralytics/hub/session.py +128 -94
ultralytics/hub/utils.py +20 -21
ultralytics/models/__init__.py +4 -2
ultralytics/models/fastsam/__init__.py +2 -3
ultralytics/models/fastsam/model.py +26 -4
ultralytics/models/fastsam/predict.py +127 -63
ultralytics/models/fastsam/utils.py +1 -44
ultralytics/models/fastsam/val.py +1 -1
ultralytics/models/nas/__init__.py +1 -1
ultralytics/models/nas/model.py +21 -10
ultralytics/models/nas/predict.py +3 -6
ultralytics/models/nas/val.py +4 -4
ultralytics/models/rtdetr/__init__.py +1 -1
ultralytics/models/rtdetr/model.py +1 -1
ultralytics/models/rtdetr/predict.py +6 -8
ultralytics/models/rtdetr/train.py +6 -2
ultralytics/models/rtdetr/val.py +3 -3
ultralytics/models/sam/__init__.py +3 -3
ultralytics/models/sam/amg.py +29 -23
ultralytics/models/sam/build.py +211 -13
ultralytics/models/sam/model.py +91 -30
ultralytics/models/sam/modules/__init__.py +1 -1
ultralytics/models/sam/modules/blocks.py +1129 -0
ultralytics/models/sam/modules/decoders.py +381 -53
ultralytics/models/sam/modules/encoders.py +515 -324
ultralytics/models/sam/modules/memory_attention.py +237 -0
ultralytics/models/sam/modules/sam.py +969 -21
ultralytics/models/sam/modules/tiny_encoder.py +425 -154
ultralytics/models/sam/modules/transformer.py +159 -60
ultralytics/models/sam/modules/utils.py +293 -0
ultralytics/models/sam/predict.py +1263 -132
ultralytics/models/utils/__init__.py +1 -1
ultralytics/models/utils/loss.py +36 -24
ultralytics/models/utils/ops.py +3 -7
ultralytics/models/yolo/__init__.py +3 -3
ultralytics/models/yolo/classify/__init__.py +1 -1
ultralytics/models/yolo/classify/predict.py +7 -8
ultralytics/models/yolo/classify/train.py +17 -22
ultralytics/models/yolo/classify/val.py +8 -4
ultralytics/models/yolo/detect/__init__.py +1 -1
ultralytics/models/yolo/detect/predict.py +3 -5
ultralytics/models/yolo/detect/train.py +11 -4
ultralytics/models/yolo/detect/val.py +90 -52
ultralytics/models/yolo/model.py +14 -9
ultralytics/models/yolo/obb/__init__.py +1 -1
ultralytics/models/yolo/obb/predict.py +2 -2
ultralytics/models/yolo/obb/train.py +5 -3
ultralytics/models/yolo/obb/val.py +41 -23
ultralytics/models/yolo/pose/__init__.py +1 -1
ultralytics/models/yolo/pose/predict.py +3 -5
ultralytics/models/yolo/pose/train.py +2 -2
ultralytics/models/yolo/pose/val.py +51 -17
ultralytics/models/yolo/segment/__init__.py +1 -1
ultralytics/models/yolo/segment/predict.py +3 -5
ultralytics/models/yolo/segment/train.py +2 -2
ultralytics/models/yolo/segment/val.py +60 -19
ultralytics/models/yolo/world/__init__.py +5 -0
ultralytics/models/yolo/world/train.py +92 -0
ultralytics/models/yolo/world/train_world.py +109 -0
ultralytics/nn/__init__.py +1 -1
ultralytics/nn/autobackend.py +228 -93
ultralytics/nn/modules/__init__.py +39 -14
ultralytics/nn/modules/activation.py +21 -0
ultralytics/nn/modules/block.py +527 -67
ultralytics/nn/modules/conv.py +24 -7
ultralytics/nn/modules/head.py +177 -34
ultralytics/nn/modules/transformer.py +6 -5
ultralytics/nn/modules/utils.py +1 -2
ultralytics/nn/tasks.py +225 -77
ultralytics/solutions/__init__.py +30 -1
ultralytics/solutions/ai_gym.py +96 -143
ultralytics/solutions/analytics.py +247 -0
ultralytics/solutions/distance_calculation.py +78 -135
ultralytics/solutions/heatmap.py +93 -247
ultralytics/solutions/object_counter.py +184 -259
ultralytics/solutions/parking_management.py +246 -0
ultralytics/solutions/queue_management.py +112 -0
ultralytics/solutions/region_counter.py +116 -0
ultralytics/solutions/security_alarm.py +144 -0
ultralytics/solutions/solutions.py +178 -0
ultralytics/solutions/speed_estimation.py +86 -174
ultralytics/solutions/streamlit_inference.py +190 -0
ultralytics/solutions/trackzone.py +68 -0
ultralytics/trackers/__init__.py +1 -1
ultralytics/trackers/basetrack.py +32 -13
ultralytics/trackers/bot_sort.py +61 -28
ultralytics/trackers/byte_tracker.py +83 -51
ultralytics/trackers/track.py +21 -6
ultralytics/trackers/utils/__init__.py +1 -1
ultralytics/trackers/utils/gmc.py +62 -48
ultralytics/trackers/utils/kalman_filter.py +166 -35
ultralytics/trackers/utils/matching.py +40 -21
ultralytics/utils/__init__.py +511 -239
ultralytics/utils/autobatch.py +40 -22
ultralytics/utils/benchmarks.py +266 -85
ultralytics/utils/callbacks/__init__.py +1 -1
ultralytics/utils/callbacks/base.py +1 -3
ultralytics/utils/callbacks/clearml.py +7 -6
ultralytics/utils/callbacks/comet.py +39 -17
ultralytics/utils/callbacks/dvc.py +1 -1
ultralytics/utils/callbacks/hub.py +16 -16
ultralytics/utils/callbacks/mlflow.py +28 -24
ultralytics/utils/callbacks/neptune.py +6 -2
ultralytics/utils/callbacks/raytune.py +3 -4
ultralytics/utils/callbacks/tensorboard.py +18 -18
ultralytics/utils/callbacks/wb.py +27 -20
ultralytics/utils/checks.py +160 -100
ultralytics/utils/dist.py +2 -1
ultralytics/utils/downloads.py +44 -37
ultralytics/utils/errors.py +1 -1
ultralytics/utils/files.py +72 -38
ultralytics/utils/instance.py +41 -19
ultralytics/utils/loss.py +84 -56
ultralytics/utils/metrics.py +61 -56
ultralytics/utils/ops.py +94 -89
ultralytics/utils/patches.py +30 -14
ultralytics/utils/plotting.py +600 -269
ultralytics/utils/tal.py +67 -26
ultralytics/utils/torch_utils.py +302 -102
ultralytics/utils/triton.py +2 -1
ultralytics/utils/tuner.py +21 -12
ultralytics-8.3.62.dist-info/METADATA +370 -0
ultralytics-8.3.62.dist-info/RECORD +241 -0
{ultralytics-8.1.28.dist-info → ultralytics-8.3.62.dist-info}/WHEEL +1 -1
ultralytics/data/explorer/__init__.py +0 -5
ultralytics/data/explorer/explorer.py +0 -472
ultralytics/data/explorer/gui/__init__.py +0 -1
ultralytics/data/explorer/gui/dash.py +0 -268
ultralytics/data/explorer/utils.py +0 -166
ultralytics/models/fastsam/prompt.py +0 -357
ultralytics-8.1.28.dist-info/METADATA +0 -373
ultralytics-8.1.28.dist-info/RECORD +0 -197
{ultralytics-8.1.28.dist-info → ultralytics-8.3.62.dist-info}/LICENSE +0 -0
{ultralytics-8.1.28.dist-info → ultralytics-8.3.62.dist-info}/entry_points.txt +0 -0
{ultralytics-8.1.28.dist-info → ultralytics-8.3.62.dist-info}/top_level.txt +0 -0

ultralytics/models/yolo/model.py CHANGED Viewed

@@ -1,21 +1,21 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from pathlib import Path
 from ultralytics.engine.model import Model
 from ultralytics.models import yolo
 from ultralytics.nn.tasks import ClassificationModel, DetectionModel, OBBModel, PoseModel, SegmentationModel, WorldModel
-from ultralytics.utils import yaml_load, ROOT
+from ultralytics.utils import ROOT, yaml_load
 class YOLO(Model):
     """YOLO (You Only Look Once) object detection model."""
-    def __init__(self, model="yolov8n.pt", task=None, verbose=False):
+    def __init__(self, model="yolo11n.pt", task=None, verbose=False):
         """Initialize YOLO model, switching to YOLOWorld if model filename contains '-world'."""
         path = Path(model)
         if "-world" in path.stem and path.suffix in {".pt", ".yaml", ".yml"}:  # if YOLOWorld PyTorch model
-            new_instance = YOLOWorld(path)
+            new_instance = YOLOWorld(path, verbose=verbose)
             self.__class__ = type(new_instance)
             self.__dict__ = new_instance.__dict__
         else:
@@ -62,14 +62,18 @@ class YOLO(Model):
 class YOLOWorld(Model):
     """YOLO-World object detection model."""
-    def __init__(self, model="yolov8s-world.pt") -> None:
+    def __init__(self, model="yolov8s-world.pt", verbose=False) -> None:
         """
-        Initializes the YOLOv8-World model with the given pre-trained model file. Supports *.pt and *.yaml formats.
+        Initialize YOLOv8-World model with a pre-trained model file.
+        Loads a YOLOv8-World model for object detection. If no custom class names are provided, it assigns default
+        COCO class names.
         Args:
-            model (str | Path): Path to the pre-trained model. Defaults to 'yolov8s-world.pt'.
+            model (str | Path): Path to the pre-trained model file. Supports *.pt and *.yaml formats.
+            verbose (bool): If True, prints additional information during initialization.
         """
-        super().__init__(model=model, task="detect")
+        super().__init__(model=model, task="detect", verbose=verbose)
         # Assign default COCO class names when there are no custom names
         if not hasattr(self.model, "names"):
@@ -83,6 +87,7 @@ class YOLOWorld(Model):
                 "model": WorldModel,
                 "validator": yolo.detect.DetectionValidator,
                 "predictor": yolo.detect.DetectionPredictor,
+                "trainer": yolo.world.WorldTrainer,
             }
         }
@@ -91,7 +96,7 @@ class YOLOWorld(Model):
         Set classes.
         Args:
-            classes (List(str)): A list of categories i.e ["person"].
+            classes (List(str)): A list of categories i.e. ["person"].
         """
         self.model.set_classes(classes)
         # Remove background if it's given

ultralytics/models/yolo/obb/__init__.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from .predict import OBBPredictor
 from .train import OBBTrainer

ultralytics/models/yolo/obb/predict.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 import torch
@@ -16,7 +16,7 @@ class OBBPredictor(DetectionPredictor):
         from ultralytics.utils import ASSETS
         from ultralytics.models.yolo.obb import OBBPredictor
-        args = dict(model='yolov8n-obb.pt', source=ASSETS)
+        args = dict(model="yolov8n-obb.pt", source=ASSETS)
         predictor = OBBPredictor(overrides=args)
         predictor.predict_cli()
         ```

ultralytics/models/yolo/obb/train.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from copy import copy
@@ -15,7 +15,7 @@ class OBBTrainer(yolo.detect.DetectionTrainer):
         ```python
         from ultralytics.models.yolo.obb import OBBTrainer
-        args = dict(model='yolov8n-obb.pt', data='dota8.yaml', epochs=3)
+        args = dict(model="yolov8n-obb.pt", data="dota8.yaml", epochs=3)
         trainer = OBBTrainer(overrides=args)
         trainer.train()
         ```
@@ -39,4 +39,6 @@ class OBBTrainer(yolo.detect.DetectionTrainer):
     def get_validator(self):
         """Return an instance of OBBValidator for validation of YOLO model."""
         self.loss_names = "box_loss", "cls_loss", "dfl_loss"
-        return yolo.obb.OBBValidator(self.test_loader, save_dir=self.save_dir, args=copy(self.args))
+        return yolo.obb.OBBValidator(
+            self.test_loader, save_dir=self.save_dir, args=copy(self.args), _callbacks=self.callbacks
+        )

ultralytics/models/yolo/obb/val.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from pathlib import Path
@@ -18,9 +18,9 @@ class OBBValidator(DetectionValidator):
         ```python
         from ultralytics.models.yolo.obb import OBBValidator
-        args = dict(model='yolov8n-obb.pt', data='dota8.yaml')
+        args = dict(model="yolov8n-obb.pt", data="dota8.yaml")
         validator = OBBValidator(args=args)
-        validator(model=args['model'])
+        validator(model=args["model"])
         ```
     """
@@ -45,24 +45,36 @@ class OBBValidator(DetectionValidator):
             labels=self.lb,
             nc=self.nc,
             multi_label=True,
-            agnostic=self.args.single_cls,
+            agnostic=self.args.single_cls or self.args.agnostic_nms,
             max_det=self.args.max_det,
             rotated=True,
         )
     def _process_batch(self, detections, gt_bboxes, gt_cls):
         """
-        Return correct prediction matrix.
+        Perform computation of the correct prediction matrix for a batch of detections and ground truth bounding boxes.
         Args:
-            detections (torch.Tensor): Tensor of shape [N, 7] representing detections.
-                Each detection is of the format: x1, y1, x2, y2, conf, class, angle.
-            gt_bboxes (torch.Tensor): Tensor of shape [M, 5] representing rotated boxes.
-                Each box is of the format: x1, y1, x2, y2, angle.
-            labels (torch.Tensor): Tensor of shape [M] representing labels.
+            detections (torch.Tensor): A tensor of shape (N, 7) representing the detected bounding boxes and associated
+                data. Each detection is represented as (x1, y1, x2, y2, conf, class, angle).
+            gt_bboxes (torch.Tensor): A tensor of shape (M, 5) representing the ground truth bounding boxes. Each box is
+                represented as (x1, y1, x2, y2, angle).
+            gt_cls (torch.Tensor): A tensor of shape (M,) representing class labels for the ground truth bounding boxes.
         Returns:
-            (torch.Tensor): Correct prediction matrix of shape [N, 10] for 10 IoU levels.
+            (torch.Tensor): The correct prediction matrix with shape (N, 10), which includes 10 IoU (Intersection over
+                Union) levels for each detection, indicating the accuracy of predictions compared to the ground truth.
+        Example:
+            ```python
+            detections = torch.rand(100, 7)  # 100 sample detections
+            gt_bboxes = torch.rand(50, 5)  # 50 sample ground truth boxes
+            gt_cls = torch.randint(0, 5, (50,))  # 50 ground truth class labels
+            correct_matrix = OBBValidator._process_batch(detections, gt_bboxes, gt_cls)
+            ```
+        Note:
+            This method relies on `batch_probiou` to calculate IoU between detections and ground truth bounding boxes.
         """
         iou = batch_probiou(gt_bboxes, torch.cat([detections[:, :4], detections[:, -1:]], dim=-1))
         return self.match_predictions(detections[:, 5], gt_cls, iou)
@@ -78,7 +90,7 @@ class OBBValidator(DetectionValidator):
         if len(cls):
             bbox[..., :4].mul_(torch.tensor(imgsz, device=self.device)[[1, 0, 1, 0]])  # target boxes
             ops.scale_boxes(imgsz, bbox, ori_shape, ratio_pad=ratio_pad, xywh=True)  # native-space labels
-        return dict(cls=cls, bbox=bbox, ori_shape=ori_shape, imgsz=imgsz, ratio_pad=ratio_pad)
+        return {"cls": cls, "bbox": bbox, "ori_shape": ori_shape, "imgsz": imgsz, "ratio_pad": ratio_pad}
     def _prepare_pred(self, pred, pbatch):
         """Prepares and returns a batch for OBB validation with scaled and padded bounding boxes."""
@@ -118,13 +130,19 @@ class OBBValidator(DetectionValidator):
     def save_one_txt(self, predn, save_conf, shape, file):
         """Save YOLO detections to a txt file in normalized coordinates in a specific format."""
-        gn = torch.tensor(shape)[[1, 0]]  # normalization gain whwh
-        for *xywh, conf, cls, angle in predn.tolist():
-            xywha = torch.tensor([*xywh, angle]).view(1, 5)
-            xyxyxyxy = (ops.xywhr2xyxyxyxy(xywha) / gn).view(-1).tolist()  # normalized xywh
-            line = (cls, *xyxyxyxy, conf) if save_conf else (cls, *xyxyxyxy)  # label format
-            with open(file, "a") as f:
-                f.write(("%g " * len(line)).rstrip() % line + "\n")
+        import numpy as np
+        from ultralytics.engine.results import Results
+        rboxes = torch.cat([predn[:, :4], predn[:, -1:]], dim=-1)
+        # xywh, r, conf, cls
+        obb = torch.cat([rboxes, predn[:, 4:6]], dim=-1)
+        Results(
+            np.zeros((shape[0], shape[1]), dtype=np.uint8),
+            path=None,
+            names=self.names,
+            obb=obb,
+        ).save_txt(file, save_conf=save_conf)
     def eval_json(self, stats):
         """Evaluates YOLO output in JSON format and returns performance statistics."""
@@ -142,10 +160,10 @@ class OBBValidator(DetectionValidator):
             for d in data:
                 image_id = d["image_id"]
                 score = d["score"]
-                classname = self.names[d["category_id"]].replace(" ", "-")
+                classname = self.names[d["category_id"] - 1].replace(" ", "-")
                 p = d["poly"]
-                with open(f'{pred_txt / f"Task1_{classname}"}.txt', "a") as f:
+                with open(f"{pred_txt / f'Task1_{classname}'}.txt", "a") as f:
                     f.writelines(f"{image_id} {score} {p[0]} {p[1]} {p[2]} {p[3]} {p[4]} {p[5]} {p[6]} {p[7]}\n")
             # Save merged results, this could result slightly lower map than using official merging script,
             # because of the probiou calculation.
@@ -157,7 +175,7 @@ class OBBValidator(DetectionValidator):
                 image_id = d["image_id"].split("__")[0]
                 pattern = re.compile(r"\d+___\d+")
                 x, y = (int(c) for c in re.findall(pattern, d["image_id"])[0].split("___"))
-                bbox, score, cls = d["rbox"], d["score"], d["category_id"]
+                bbox, score, cls = d["rbox"], d["score"], d["category_id"] - 1
                 bbox[0] += x
                 bbox[1] += y
                 bbox.extend([score, cls])
@@ -179,7 +197,7 @@ class OBBValidator(DetectionValidator):
                     p = [round(i, 3) for i in x[:-2]]  # poly
                     score = round(x[-2], 3)
-                    with open(f'{pred_merged_txt / f"Task1_{classname}"}.txt', "a") as f:
+                    with open(f"{pred_merged_txt / f'Task1_{classname}'}.txt", "a") as f:
                         f.writelines(f"{image_id} {score} {p[0]} {p[1]} {p[2]} {p[3]} {p[4]} {p[5]} {p[6]} {p[7]}\n")
         return stats

ultralytics/models/yolo/pose/__init__.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from .predict import PosePredictor
 from .train import PoseTrainer

ultralytics/models/yolo/pose/predict.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from ultralytics.engine.results import Results
 from ultralytics.models.yolo.detect.predict import DetectionPredictor
@@ -14,7 +14,7 @@ class PosePredictor(DetectionPredictor):
         from ultralytics.utils import ASSETS
         from ultralytics.models.yolo.pose import PosePredictor
-        args = dict(model='yolov8n-pose.pt', source=ASSETS)
+        args = dict(model="yolov8n-pose.pt", source=ASSETS)
         predictor = PosePredictor(overrides=args)
         predictor.predict_cli()
         ```
@@ -46,12 +46,10 @@ class PosePredictor(DetectionPredictor):
             orig_imgs = ops.convert_torch2numpy_batch(orig_imgs)
         results = []
-        for i, pred in enumerate(preds):
-            orig_img = orig_imgs[i]
+        for pred, orig_img, img_path in zip(preds, orig_imgs, self.batch[0]):
             pred[:, :4] = ops.scale_boxes(img.shape[2:], pred[:, :4], orig_img.shape).round()
             pred_kpts = pred[:, 6:].view(len(pred), *self.model.kpt_shape) if len(pred) else pred[:, 6:]
             pred_kpts = ops.scale_coords(img.shape[2:], pred_kpts, orig_img.shape)
-            img_path = self.batch[0][i]
             results.append(
                 Results(orig_img, path=img_path, names=self.model.names, boxes=pred[:, :6], keypoints=pred_kpts)
             )

ultralytics/models/yolo/pose/train.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from copy import copy
@@ -16,7 +16,7 @@ class PoseTrainer(yolo.detect.DetectionTrainer):
         ```python
         from ultralytics.models.yolo.pose import PoseTrainer
-        args = dict(model='yolov8n-pose.pt', data='coco8-pose.yaml', epochs=3)
+        args = dict(model="yolov8n-pose.pt", data="coco8-pose.yaml", epochs=3)
         trainer = PoseTrainer(overrides=args)
         trainer.train()
         ```

ultralytics/models/yolo/pose/val.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from pathlib import Path
@@ -20,7 +20,7 @@ class PoseValidator(DetectionValidator):
         ```python
         from ultralytics.models.yolo.pose import PoseValidator
-        args = dict(model='yolov8n-pose.pt', data='coco8-pose.yaml')
+        args = dict(model="yolov8n-pose.pt", data="coco8-pose.yaml")
         validator = PoseValidator(args=args)
         validator()
         ```
@@ -69,7 +69,7 @@ class PoseValidator(DetectionValidator):
             self.args.iou,
             labels=self.lb,
             multi_label=True,
-            agnostic=self.args.single_cls,
+            agnostic=self.args.single_cls or self.args.agnostic_nms,
             max_det=self.args.max_det,
             nc=self.nc,
         )
@@ -81,7 +81,7 @@ class PoseValidator(DetectionValidator):
         is_pose = self.kpt_shape == [17, 3]
         nkpt = self.kpt_shape[0]
         self.sigma = OKS_SIGMA if is_pose else np.ones(nkpt) / nkpt
-        self.stats = dict(tp_p=[], tp=[], conf=[], pred_cls=[], target_cls=[])
+        self.stats = dict(tp_p=[], tp=[], conf=[], pred_cls=[], target_cls=[], target_img=[])
     def _prepare_batch(self, si, batch):
         """Prepares a batch for processing by converting keypoints to float and moving to device."""
@@ -118,6 +118,7 @@ class PoseValidator(DetectionValidator):
             cls, bbox = pbatch.pop("cls"), pbatch.pop("bbox")
             nl = len(cls)
             stat["target_cls"] = cls
+            stat["target_img"] = cls.unique()
             if npr == 0:
                 if nl:
                     for k in self.stats.keys():
@@ -137,8 +138,8 @@ class PoseValidator(DetectionValidator):
             if nl:
                 stat["tp"] = self._process_batch(predn, bbox, cls)
                 stat["tp_p"] = self._process_batch(predn, bbox, cls, pred_kpts, pbatch["kpts"])
-                if self.args.plots:
-                    self.confusion_matrix.process_batch(predn, bbox, cls)
+            if self.args.plots:
+                self.confusion_matrix.process_batch(predn, bbox, cls)
             for k in self.stats.keys():
                 self.stats[k].append(stat[k])
@@ -146,24 +147,45 @@ class PoseValidator(DetectionValidator):
             # Save
             if self.args.save_json:
                 self.pred_to_json(predn, batch["im_file"][si])
-            # if self.args.save_txt:
-            #    save_one_txt(predn, save_conf, shape, file=save_dir / 'labels' / f'{path.stem}.txt')
+            if self.args.save_txt:
+                self.save_one_txt(
+                    predn,
+                    pred_kpts,
+                    self.args.save_conf,
+                    pbatch["ori_shape"],
+                    self.save_dir / "labels" / f"{Path(batch['im_file'][si]).stem}.txt",
+                )
     def _process_batch(self, detections, gt_bboxes, gt_cls, pred_kpts=None, gt_kpts=None):
         """
-        Return correct prediction matrix.
+        Return correct prediction matrix by computing Intersection over Union (IoU) between detections and ground truth.
         Args:
-            detections (torch.Tensor): Tensor of shape [N, 6] representing detections.
-                Each detection is of the format: x1, y1, x2, y2, conf, class.
-            labels (torch.Tensor): Tensor of shape [M, 5] representing labels.
-                Each label is of the format: class, x1, y1, x2, y2.
-            pred_kpts (torch.Tensor, optional): Tensor of shape [N, 51] representing predicted keypoints.
-                51 corresponds to 17 keypoints each with 3 values.
-            gt_kpts (torch.Tensor, optional): Tensor of shape [N, 51] representing ground truth keypoints.
+            detections (torch.Tensor): Tensor with shape (N, 6) representing detection boxes and scores, where each
+                detection is of the format (x1, y1, x2, y2, conf, class).
+            gt_bboxes (torch.Tensor): Tensor with shape (M, 4) representing ground truth bounding boxes, where each
+                box is of the format (x1, y1, x2, y2).
+            gt_cls (torch.Tensor): Tensor with shape (M,) representing ground truth class indices.
+            pred_kpts (torch.Tensor | None): Optional tensor with shape (N, 51) representing predicted keypoints, where
+                51 corresponds to 17 keypoints each having 3 values.
+            gt_kpts (torch.Tensor | None): Optional tensor with shape (N, 51) representing ground truth keypoints.
         Returns:
-            torch.Tensor: Correct prediction matrix of shape [N, 10] for 10 IoU levels.
+            torch.Tensor: A tensor with shape (N, 10) representing the correct prediction matrix for 10 IoU levels,
+                where N is the number of detections.
+        Example:
+            ```python
+            detections = torch.rand(100, 6)  # 100 predictions: (x1, y1, x2, y2, conf, class)
+            gt_bboxes = torch.rand(50, 4)  # 50 ground truth boxes: (x1, y1, x2, y2)
+            gt_cls = torch.randint(0, 2, (50,))  # 50 ground truth class indices
+            pred_kpts = torch.rand(100, 51)  # 100 predicted keypoints
+            gt_kpts = torch.rand(50, 51)  # 50 ground truth keypoints
+            correct_preds = _process_batch(detections, gt_bboxes, gt_cls, pred_kpts, gt_kpts)
+            ```
+        Note:
+            `0.53` scale factor used in area computation is referenced from https://github.com/jin-s13/xtcocoapi/blob/master/xtcocotools/cocoeval.py#L384.
         """
         if pred_kpts is not None and gt_kpts is not None:
             # `0.53` is from https://github.com/jin-s13/xtcocoapi/blob/master/xtcocotools/cocoeval.py#L384
@@ -201,6 +223,18 @@ class PoseValidator(DetectionValidator):
             on_plot=self.on_plot,
         )  # pred
+    def save_one_txt(self, predn, pred_kpts, save_conf, shape, file):
+        """Save YOLO detections to a txt file in normalized coordinates in a specific format."""
+        from ultralytics.engine.results import Results
+        Results(
+            np.zeros((shape[0], shape[1]), dtype=np.uint8),
+            path=None,
+            names=self.names,
+            boxes=predn[:, :6],
+            keypoints=pred_kpts,
+        ).save_txt(file, save_conf=save_conf)
     def pred_to_json(self, predn, filename):
         """Converts YOLO predictions to COCO JSON format."""
         stem = Path(filename).stem

ultralytics/models/yolo/segment/__init__.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from .predict import SegmentationPredictor
 from .train import SegmentationTrainer

ultralytics/models/yolo/segment/predict.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from ultralytics.engine.results import Results
 from ultralytics.models.yolo.detect.predict import DetectionPredictor
@@ -14,7 +14,7 @@ class SegmentationPredictor(DetectionPredictor):
         from ultralytics.utils import ASSETS
         from ultralytics.models.yolo.segment import SegmentationPredictor
-        args = dict(model='yolov8n-seg.pt', source=ASSETS)
+        args = dict(model="yolov8n-seg.pt", source=ASSETS)
         predictor = SegmentationPredictor(overrides=args)
         predictor.predict_cli()
         ```
@@ -42,9 +42,7 @@ class SegmentationPredictor(DetectionPredictor):
         results = []
         proto = preds[1][-1] if isinstance(preds[1], tuple) else preds[1]  # tuple if PyTorch model or array if exported
-        for i, pred in enumerate(p):
-            orig_img = orig_imgs[i]
-            img_path = self.batch[0][i]
+        for i, (pred, orig_img, img_path) in enumerate(zip(p, orig_imgs, self.batch[0])):
             if not len(pred):  # save empty boxes
                 masks = None
             elif self.args.retina_masks:

ultralytics/models/yolo/segment/train.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from copy import copy
@@ -16,7 +16,7 @@ class SegmentationTrainer(yolo.detect.DetectionTrainer):
         ```python
         from ultralytics.models.yolo.segment import SegmentationTrainer
-        args = dict(model='yolov8n-seg.pt', data='coco8-seg.yaml', epochs=3)
+        args = dict(model="yolov8n-seg.pt", data="coco8-seg.yaml", epochs=3)
         trainer = SegmentationTrainer(overrides=args)
         trainer.train()
         ```

ultralytics/models/yolo/segment/val.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from multiprocessing.pool import ThreadPool
 from pathlib import Path
@@ -22,7 +22,7 @@ class SegmentationValidator(DetectionValidator):
         ```python
         from ultralytics.models.yolo.segment import SegmentationValidator
-        args = dict(model='yolov8n-seg.pt', data='coco8-seg.yaml')
+        args = dict(model="yolov8n-seg.pt", data="coco8-seg.yaml")
         validator = SegmentationValidator(args=args)
         validator()
         ```
@@ -48,10 +48,9 @@ class SegmentationValidator(DetectionValidator):
         self.plot_masks = []
         if self.args.save_json:
             check_requirements("pycocotools>=2.0.6")
-            self.process = ops.process_mask_upsample  # more accurate
-        else:
-            self.process = ops.process_mask  # faster
-        self.stats = dict(tp_m=[], tp=[], conf=[], pred_cls=[], target_cls=[])
+        # more accurate vs faster
+        self.process = ops.process_mask_native if self.args.save_json or self.args.save_txt else ops.process_mask
+        self.stats = dict(tp_m=[], tp=[], conf=[], pred_cls=[], target_cls=[], target_img=[])
     def get_desc(self):
         """Return a formatted description of evaluation metrics."""
@@ -77,7 +76,7 @@ class SegmentationValidator(DetectionValidator):
             self.args.iou,
             labels=self.lb,
             multi_label=True,
-            agnostic=self.args.single_cls,
+            agnostic=self.args.single_cls or self.args.agnostic_nms,
             max_det=self.args.max_det,
             nc=self.nc,
         )
@@ -112,6 +111,7 @@ class SegmentationValidator(DetectionValidator):
             cls, bbox = pbatch.pop("cls"), pbatch.pop("bbox")
             nl = len(cls)
             stat["target_cls"] = cls
+            stat["target_img"] = cls.unique()
             if npr == 0:
                 if nl:
                     for k in self.stats.keys():
@@ -135,8 +135,8 @@ class SegmentationValidator(DetectionValidator):
                 stat["tp_m"] = self._process_batch(
                     predn, bbox, cls, pred_masks, gt_masks, self.args.overlap_mask, masks=True
                 )
-                if self.args.plots:
-                    self.confusion_matrix.process_batch(predn, bbox, cls)
+            if self.args.plots:
+                self.confusion_matrix.process_batch(predn, bbox, cls)
             for k in self.stats.keys():
                 self.stats[k].append(stat[k])
@@ -147,14 +147,23 @@ class SegmentationValidator(DetectionValidator):
             # Save
             if self.args.save_json:
-                pred_masks = ops.scale_image(
-                    pred_masks.permute(1, 2, 0).contiguous().cpu().numpy(),
+                self.pred_to_json(
+                    predn,
+                    batch["im_file"][si],
+                    ops.scale_image(
+                        pred_masks.permute(1, 2, 0).contiguous().cpu().numpy(),
+                        pbatch["ori_shape"],
+                        ratio_pad=batch["ratio_pad"][si],
+                    ),
+                )
+            if self.args.save_txt:
+                self.save_one_txt(
+                    predn,
+                    pred_masks,
+                    self.args.save_conf,
                     pbatch["ori_shape"],
-                    ratio_pad=batch["ratio_pad"][si],
+                    self.save_dir / "labels" / f"{Path(batch['im_file'][si]).stem}.txt",
                 )
-                self.pred_to_json(predn, batch["im_file"][si], pred_masks)
-            # if self.args.save_txt:
-            #    save_one_txt(predn, save_conf, shape, file=save_dir / 'labels' / f'{path.stem}.txt')
     def finalize_metrics(self, *args, **kwargs):
         """Sets speed and confusion matrix for evaluation metrics."""
@@ -163,14 +172,34 @@ class SegmentationValidator(DetectionValidator):
     def _process_batch(self, detections, gt_bboxes, gt_cls, pred_masks=None, gt_masks=None, overlap=False, masks=False):
         """
-        Return correct prediction matrix.
+        Compute correct prediction matrix for a batch based on bounding boxes and optional masks.
         Args:
-            detections (array[N, 6]), x1, y1, x2, y2, conf, class
-            labels (array[M, 5]), class, x1, y1, x2, y2
+            detections (torch.Tensor): Tensor of shape (N, 6) representing detected bounding boxes and
+                associated confidence scores and class indices. Each row is of the format [x1, y1, x2, y2, conf, class].
+            gt_bboxes (torch.Tensor): Tensor of shape (M, 4) representing ground truth bounding box coordinates.
+                Each row is of the format [x1, y1, x2, y2].
+            gt_cls (torch.Tensor): Tensor of shape (M,) representing ground truth class indices.
+            pred_masks (torch.Tensor | None): Tensor representing predicted masks, if available. The shape should
+                match the ground truth masks.
+            gt_masks (torch.Tensor | None): Tensor of shape (M, H, W) representing ground truth masks, if available.
+            overlap (bool): Flag indicating if overlapping masks should be considered.
+            masks (bool): Flag indicating if the batch contains mask data.
         Returns:
-            correct (array[N, 10]), for 10 IoU levels
+            (torch.Tensor): A correct prediction matrix of shape (N, 10), where 10 represents different IoU levels.
+        Note:
+            - If `masks` is True, the function computes IoU between predicted and ground truth masks.
+            - If `overlap` is True and `masks` is True, overlapping masks are taken into account when computing IoU.
+        Example:
+            ```python
+            detections = torch.tensor([[25, 30, 200, 300, 0.8, 1], [50, 60, 180, 290, 0.75, 0]])
+            gt_bboxes = torch.tensor([[24, 29, 199, 299], [55, 65, 185, 295]])
+            gt_cls = torch.tensor([1, 0])
+            correct_preds = validator._process_batch(detections, gt_bboxes, gt_cls)
+            ```
         """
         if masks:
             if overlap:
@@ -214,6 +243,18 @@ class SegmentationValidator(DetectionValidator):
         )  # pred
         self.plot_masks.clear()
+    def save_one_txt(self, predn, pred_masks, save_conf, shape, file):
+        """Save YOLO detections to a txt file in normalized coordinates in a specific format."""
+        from ultralytics.engine.results import Results
+        Results(
+            np.zeros((shape[0], shape[1]), dtype=np.uint8),
+            path=None,
+            names=self.names,
+            boxes=predn[:, :6],
+            masks=pred_masks,
+        ).save_txt(file, save_conf=save_conf)
     def pred_to_json(self, predn, filename, pred_masks):
         """
         Save one JSON result.

ultralytics/models/yolo/world/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from .train import WorldTrainer
+__all__ = ["WorldTrainer"]

ultralytics 8.1.28__py3-none-any.whl → 8.3.62__py3-none-any.whl

ultralytics 8.1.28__py3-none-any.whl → 8.3.62__py3-none-any.whl