PyPI - ultralytics - Versions diffs - 8.1.29__py3-none-any.whl → 8.3.63__py3-none-any.whl - Mend

ultralytics 8.1.29-py3-none-any.whl → 8.3.63-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (247)

tests/__init__.py +22 -0
tests/conftest.py +83 -0
tests/test_cli.py +122 -0
tests/test_cuda.py +155 -0
tests/test_engine.py +131 -0
tests/test_exports.py +216 -0
tests/test_integrations.py +150 -0
tests/test_python.py +615 -0
tests/test_solutions.py +94 -0
ultralytics/__init__.py +11 -8
ultralytics/cfg/__init__.py +569 -131
ultralytics/cfg/datasets/Argoverse.yaml +2 -1
ultralytics/cfg/datasets/DOTAv1.5.yaml +3 -2
ultralytics/cfg/datasets/DOTAv1.yaml +3 -2
ultralytics/cfg/datasets/GlobalWheat2020.yaml +3 -2
ultralytics/cfg/datasets/ImageNet.yaml +2 -1
ultralytics/cfg/datasets/Objects365.yaml +5 -4
ultralytics/cfg/datasets/SKU-110K.yaml +2 -1
ultralytics/cfg/datasets/VOC.yaml +3 -2
ultralytics/cfg/datasets/VisDrone.yaml +6 -5
ultralytics/cfg/datasets/african-wildlife.yaml +25 -0
ultralytics/cfg/datasets/brain-tumor.yaml +23 -0
ultralytics/cfg/datasets/carparts-seg.yaml +3 -2
ultralytics/cfg/datasets/coco-pose.yaml +7 -6
ultralytics/cfg/datasets/coco.yaml +3 -2
ultralytics/cfg/datasets/coco128-seg.yaml +4 -3
ultralytics/cfg/datasets/coco128.yaml +4 -3
ultralytics/cfg/datasets/coco8-pose.yaml +3 -2
ultralytics/cfg/datasets/coco8-seg.yaml +3 -2
ultralytics/cfg/datasets/coco8.yaml +3 -2
ultralytics/cfg/datasets/crack-seg.yaml +3 -2
ultralytics/cfg/datasets/dog-pose.yaml +24 -0
ultralytics/cfg/datasets/dota8.yaml +3 -2
ultralytics/cfg/datasets/hand-keypoints.yaml +26 -0
ultralytics/cfg/datasets/lvis.yaml +1236 -0
ultralytics/cfg/datasets/medical-pills.yaml +22 -0
ultralytics/cfg/datasets/open-images-v7.yaml +2 -1
ultralytics/cfg/datasets/package-seg.yaml +5 -4
ultralytics/cfg/datasets/signature.yaml +21 -0
ultralytics/cfg/datasets/tiger-pose.yaml +3 -2
ultralytics/cfg/datasets/xView.yaml +2 -1
ultralytics/cfg/default.yaml +14 -11
ultralytics/cfg/models/11/yolo11-cls-resnet18.yaml +24 -0
ultralytics/cfg/models/11/yolo11-cls.yaml +33 -0
ultralytics/cfg/models/11/yolo11-obb.yaml +50 -0
ultralytics/cfg/models/11/yolo11-pose.yaml +51 -0
ultralytics/cfg/models/11/yolo11-seg.yaml +50 -0
ultralytics/cfg/models/11/yolo11.yaml +50 -0
ultralytics/cfg/models/rt-detr/rtdetr-l.yaml +5 -2
ultralytics/cfg/models/rt-detr/rtdetr-resnet101.yaml +5 -2
ultralytics/cfg/models/rt-detr/rtdetr-resnet50.yaml +5 -2
ultralytics/cfg/models/rt-detr/rtdetr-x.yaml +5 -2
ultralytics/cfg/models/v10/yolov10b.yaml +45 -0
ultralytics/cfg/models/v10/yolov10l.yaml +45 -0
ultralytics/cfg/models/v10/yolov10m.yaml +45 -0
ultralytics/cfg/models/v10/yolov10n.yaml +45 -0
ultralytics/cfg/models/v10/yolov10s.yaml +45 -0
ultralytics/cfg/models/v10/yolov10x.yaml +45 -0
ultralytics/cfg/models/v3/yolov3-spp.yaml +5 -2
ultralytics/cfg/models/v3/yolov3-tiny.yaml +5 -2
ultralytics/cfg/models/v3/yolov3.yaml +5 -2
ultralytics/cfg/models/v5/yolov5-p6.yaml +5 -2
ultralytics/cfg/models/v5/yolov5.yaml +5 -2
ultralytics/cfg/models/v6/yolov6.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-cls-resnet101.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-cls-resnet50.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-cls.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-ghost-p2.yaml +6 -2
ultralytics/cfg/models/v8/yolov8-ghost-p6.yaml +6 -2
ultralytics/cfg/models/v8/yolov8-ghost.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-obb.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-p2.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-p6.yaml +10 -7
ultralytics/cfg/models/v8/yolov8-pose-p6.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-pose.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-rtdetr.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-seg-p6.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-seg.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-world.yaml +5 -2
ultralytics/cfg/models/v8/yolov8-worldv2.yaml +5 -2
ultralytics/cfg/models/v8/yolov8.yaml +5 -2
ultralytics/cfg/models/v9/yolov9c-seg.yaml +41 -0
ultralytics/cfg/models/v9/yolov9c.yaml +30 -25
ultralytics/cfg/models/v9/yolov9e-seg.yaml +64 -0
ultralytics/cfg/models/v9/yolov9e.yaml +46 -42
ultralytics/cfg/models/v9/yolov9m.yaml +41 -0
ultralytics/cfg/models/v9/yolov9s.yaml +41 -0
ultralytics/cfg/models/v9/yolov9t.yaml +41 -0
ultralytics/cfg/solutions/default.yaml +24 -0
ultralytics/cfg/trackers/botsort.yaml +8 -5
ultralytics/cfg/trackers/bytetrack.yaml +8 -5
ultralytics/data/__init__.py +14 -3
ultralytics/data/annotator.py +37 -15
ultralytics/data/augment.py +1783 -289
ultralytics/data/base.py +62 -27
ultralytics/data/build.py +37 -8
ultralytics/data/converter.py +196 -36
ultralytics/data/dataset.py +233 -94
ultralytics/data/loaders.py +199 -96
ultralytics/data/split_dota.py +39 -29
ultralytics/data/utils.py +111 -41
ultralytics/engine/__init__.py +1 -1
ultralytics/engine/exporter.py +579 -244
ultralytics/engine/model.py +604 -252
ultralytics/engine/predictor.py +22 -11
ultralytics/engine/results.py +1228 -218
ultralytics/engine/trainer.py +191 -129
ultralytics/engine/tuner.py +18 -18
ultralytics/engine/validator.py +18 -15
ultralytics/hub/__init__.py +31 -13
ultralytics/hub/auth.py +11 -7
ultralytics/hub/google/__init__.py +159 -0
ultralytics/hub/session.py +128 -94
ultralytics/hub/utils.py +20 -21
ultralytics/models/__init__.py +4 -2
ultralytics/models/fastsam/__init__.py +2 -3
ultralytics/models/fastsam/model.py +26 -4
ultralytics/models/fastsam/predict.py +127 -63
ultralytics/models/fastsam/utils.py +1 -44
ultralytics/models/fastsam/val.py +1 -1
ultralytics/models/nas/__init__.py +1 -1
ultralytics/models/nas/model.py +21 -10
ultralytics/models/nas/predict.py +3 -6
ultralytics/models/nas/val.py +4 -4
ultralytics/models/rtdetr/__init__.py +1 -1
ultralytics/models/rtdetr/model.py +1 -1
ultralytics/models/rtdetr/predict.py +6 -8
ultralytics/models/rtdetr/train.py +6 -2
ultralytics/models/rtdetr/val.py +3 -3
ultralytics/models/sam/__init__.py +3 -3
ultralytics/models/sam/amg.py +29 -23
ultralytics/models/sam/build.py +211 -13
ultralytics/models/sam/model.py +91 -30
ultralytics/models/sam/modules/__init__.py +1 -1
ultralytics/models/sam/modules/blocks.py +1129 -0
ultralytics/models/sam/modules/decoders.py +381 -53
ultralytics/models/sam/modules/encoders.py +515 -324
ultralytics/models/sam/modules/memory_attention.py +237 -0
ultralytics/models/sam/modules/sam.py +969 -21
ultralytics/models/sam/modules/tiny_encoder.py +425 -154
ultralytics/models/sam/modules/transformer.py +159 -60
ultralytics/models/sam/modules/utils.py +293 -0
ultralytics/models/sam/predict.py +1263 -132
ultralytics/models/utils/__init__.py +1 -1
ultralytics/models/utils/loss.py +36 -24
ultralytics/models/utils/ops.py +3 -7
ultralytics/models/yolo/__init__.py +3 -3
ultralytics/models/yolo/classify/__init__.py +1 -1
ultralytics/models/yolo/classify/predict.py +7 -8
ultralytics/models/yolo/classify/train.py +17 -22
ultralytics/models/yolo/classify/val.py +8 -4
ultralytics/models/yolo/detect/__init__.py +1 -1
ultralytics/models/yolo/detect/predict.py +3 -5
ultralytics/models/yolo/detect/train.py +11 -4
ultralytics/models/yolo/detect/val.py +90 -52
ultralytics/models/yolo/model.py +14 -9
ultralytics/models/yolo/obb/__init__.py +1 -1
ultralytics/models/yolo/obb/predict.py +2 -2
ultralytics/models/yolo/obb/train.py +5 -3
ultralytics/models/yolo/obb/val.py +41 -23
ultralytics/models/yolo/pose/__init__.py +1 -1
ultralytics/models/yolo/pose/predict.py +3 -5
ultralytics/models/yolo/pose/train.py +2 -2
ultralytics/models/yolo/pose/val.py +51 -17
ultralytics/models/yolo/segment/__init__.py +1 -1
ultralytics/models/yolo/segment/predict.py +3 -5
ultralytics/models/yolo/segment/train.py +2 -2
ultralytics/models/yolo/segment/val.py +60 -19
ultralytics/models/yolo/world/__init__.py +5 -0
ultralytics/models/yolo/world/train.py +92 -0
ultralytics/models/yolo/world/train_world.py +109 -0
ultralytics/nn/__init__.py +1 -1
ultralytics/nn/autobackend.py +228 -93
ultralytics/nn/modules/__init__.py +39 -14
ultralytics/nn/modules/activation.py +21 -0
ultralytics/nn/modules/block.py +526 -66
ultralytics/nn/modules/conv.py +24 -7
ultralytics/nn/modules/head.py +177 -34
ultralytics/nn/modules/transformer.py +6 -5
ultralytics/nn/modules/utils.py +1 -2
ultralytics/nn/tasks.py +226 -82
ultralytics/solutions/__init__.py +30 -1
ultralytics/solutions/ai_gym.py +96 -143
ultralytics/solutions/analytics.py +247 -0
ultralytics/solutions/distance_calculation.py +78 -135
ultralytics/solutions/heatmap.py +93 -247
ultralytics/solutions/object_counter.py +184 -259
ultralytics/solutions/parking_management.py +246 -0
ultralytics/solutions/queue_management.py +112 -0
ultralytics/solutions/region_counter.py +116 -0
ultralytics/solutions/security_alarm.py +144 -0
ultralytics/solutions/solutions.py +178 -0
ultralytics/solutions/speed_estimation.py +86 -174
ultralytics/solutions/streamlit_inference.py +190 -0
ultralytics/solutions/trackzone.py +68 -0
ultralytics/trackers/__init__.py +1 -1
ultralytics/trackers/basetrack.py +32 -13
ultralytics/trackers/bot_sort.py +61 -28
ultralytics/trackers/byte_tracker.py +83 -51
ultralytics/trackers/track.py +21 -6
ultralytics/trackers/utils/__init__.py +1 -1
ultralytics/trackers/utils/gmc.py +62 -48
ultralytics/trackers/utils/kalman_filter.py +166 -35
ultralytics/trackers/utils/matching.py +40 -21
ultralytics/utils/__init__.py +511 -239
ultralytics/utils/autobatch.py +40 -22
ultralytics/utils/benchmarks.py +266 -85
ultralytics/utils/callbacks/__init__.py +1 -1
ultralytics/utils/callbacks/base.py +1 -3
ultralytics/utils/callbacks/clearml.py +7 -6
ultralytics/utils/callbacks/comet.py +39 -17
ultralytics/utils/callbacks/dvc.py +1 -1
ultralytics/utils/callbacks/hub.py +16 -16
ultralytics/utils/callbacks/mlflow.py +28 -24
ultralytics/utils/callbacks/neptune.py +6 -2
ultralytics/utils/callbacks/raytune.py +3 -4
ultralytics/utils/callbacks/tensorboard.py +18 -18
ultralytics/utils/callbacks/wb.py +27 -20
ultralytics/utils/checks.py +172 -100
ultralytics/utils/dist.py +2 -1
ultralytics/utils/downloads.py +40 -34
ultralytics/utils/errors.py +1 -1
ultralytics/utils/files.py +72 -38
ultralytics/utils/instance.py +41 -19
ultralytics/utils/loss.py +83 -55
ultralytics/utils/metrics.py +61 -56
ultralytics/utils/ops.py +94 -89
ultralytics/utils/patches.py +30 -14
ultralytics/utils/plotting.py +600 -269
ultralytics/utils/tal.py +67 -26
ultralytics/utils/torch_utils.py +305 -112
ultralytics/utils/triton.py +2 -1
ultralytics/utils/tuner.py +21 -12
ultralytics-8.3.63.dist-info/METADATA +370 -0
ultralytics-8.3.63.dist-info/RECORD +241 -0
{ultralytics-8.1.29.dist-info → ultralytics-8.3.63.dist-info}/WHEEL +1 -1
ultralytics/data/explorer/__init__.py +0 -5
ultralytics/data/explorer/explorer.py +0 -472
ultralytics/data/explorer/gui/__init__.py +0 -1
ultralytics/data/explorer/gui/dash.py +0 -268
ultralytics/data/explorer/utils.py +0 -166
ultralytics/models/fastsam/prompt.py +0 -357
ultralytics-8.1.29.dist-info/METADATA +0 -373
ultralytics-8.1.29.dist-info/RECORD +0 -197
{ultralytics-8.1.29.dist-info → ultralytics-8.3.63.dist-info}/LICENSE +0 -0
{ultralytics-8.1.29.dist-info → ultralytics-8.3.63.dist-info}/entry_points.txt +0 -0
{ultralytics-8.1.29.dist-info → ultralytics-8.3.63.dist-info}/top_level.txt +0 -0

ultralytics/models/utils/__init__.py CHANGED Viewed

@@ -1 +1 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license

ultralytics/models/utils/loss.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 import torch
 import torch.nn as nn
@@ -6,6 +6,7 @@ import torch.nn.functional as F
 from ultralytics.utils.loss import FocalLoss, VarifocalLoss
 from ultralytics.utils.metrics import bbox_iou
 from .ops import HungarianMatcher
@@ -33,15 +34,19 @@ class DETRLoss(nn.Module):
         self, nc=80, loss_gain=None, aux_loss=True, use_fl=True, use_vfl=False, use_uni_match=False, uni_match_ind=0
     ):
         """
-        DETR loss function.
+        Initialize DETR loss function with customizable components and gains.
+        Uses default loss_gain if not provided. Initializes HungarianMatcher with
+        preset cost gains. Supports auxiliary losses and various loss types.
         Args:
-            nc (int): The number of classes.
-            loss_gain (dict): The coefficient of loss.
-            aux_loss (bool): If 'aux_loss = True', loss at each decoder layer are to be used.
-            use_vfl (bool): Use VarifocalLoss or not.
-            use_uni_match (bool): Whether to use a fixed layer to assign labels for auxiliary branch.
-            uni_match_ind (int): The fixed indices of a layer.
+            nc (int): Number of classes.
+            loss_gain (dict): Coefficients for different loss components.
+            aux_loss (bool): Use auxiliary losses from each decoder layer.
+            use_fl (bool): Use FocalLoss.
+            use_vfl (bool): Use VarifocalLoss.
+            use_uni_match (bool): Use fixed layer for auxiliary branch label assignment.
+            uni_match_ind (int): Index of fixed layer for uni_match.
         """
         super().__init__()
@@ -81,9 +86,7 @@ class DETRLoss(nn.Module):
         return {name_class: loss_cls.squeeze() * self.loss_gain["class"]}
     def _get_loss_bbox(self, pred_bboxes, gt_bboxes, postfix=""):
-        """Calculates and returns the bounding box loss and GIoU loss for the predicted and ground truth bounding
-        boxes.
-        """
+        """Computes bounding box and GIoU losses for predicted and ground truth bounding boxes."""
         # Boxes: [b, query, 4], gt_bbox: list[[n, 4]]
         name_bbox = f"loss_bbox{postfix}"
         name_giou = f"loss_giou{postfix}"
@@ -240,23 +243,32 @@ class DETRLoss(nn.Module):
         if len(gt_bboxes):
             gt_scores[idx] = bbox_iou(pred_bboxes.detach(), gt_bboxes, xywh=True).squeeze(-1)
-        loss = {}
-        loss.update(self._get_loss_class(pred_scores, targets, gt_scores, len(gt_bboxes), postfix))
-        loss.update(self._get_loss_bbox(pred_bboxes, gt_bboxes, postfix))
-        # if masks is not None and gt_mask is not None:
-        #     loss.update(self._get_loss_mask(masks, gt_mask, match_indices, postfix))
-        return loss
+        return {
+            **self._get_loss_class(pred_scores, targets, gt_scores, len(gt_bboxes), postfix),
+            **self._get_loss_bbox(pred_bboxes, gt_bboxes, postfix),
+            # **(self._get_loss_mask(masks, gt_mask, match_indices, postfix) if masks is not None and gt_mask is not None else {})
+        }
     def forward(self, pred_bboxes, pred_scores, batch, postfix="", **kwargs):
         """
+        Calculate loss for predicted bounding boxes and scores.
         Args:
-            pred_bboxes (torch.Tensor): [l, b, query, 4]
-            pred_scores (torch.Tensor): [l, b, query, num_classes]
-            batch (dict): A dict includes:
-                gt_cls (torch.Tensor) with shape [num_gts, ],
-                gt_bboxes (torch.Tensor): [num_gts, 4],
-                gt_groups (List(int)): a list of batch size length includes the number of gts of each image.
-            postfix (str): postfix of loss name.
+            pred_bboxes (torch.Tensor): Predicted bounding boxes, shape [l, b, query, 4].
+            pred_scores (torch.Tensor): Predicted class scores, shape [l, b, query, num_classes].
+            batch (dict): Batch information containing:
+                cls (torch.Tensor): Ground truth classes, shape [num_gts].
+                bboxes (torch.Tensor): Ground truth bounding boxes, shape [num_gts, 4].
+                gt_groups (List[int]): Number of ground truths for each image in the batch.
+            postfix (str): Postfix for loss names.
+            **kwargs (Any): Additional arguments, may include 'match_indices'.
+        Returns:
+            (dict): Computed losses, including main and auxiliary (if enabled).
+        Note:
+            Uses last elements of pred_bboxes and pred_scores for main loss, and the rest for auxiliary losses if
+            self.aux_loss is True.
         """
         self.device = pred_bboxes.device
         match_indices = kwargs.get("match_indices", None)

ultralytics/models/utils/ops.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 import torch
 import torch.nn as nn
@@ -32,9 +32,7 @@ class HungarianMatcher(nn.Module):
     """
     def __init__(self, cost_gain=None, use_fl=True, with_mask=False, num_sample_points=12544, alpha=0.25, gamma=2.0):
-        """Initializes HungarianMatcher with cost coefficients, Focal Loss, mask prediction, sample points, and alpha
-        gamma factors.
-        """
+        """Initializes a HungarianMatcher module for optimal assignment of predicted and ground truth bounding boxes."""
         super().__init__()
         if cost_gain is None:
             cost_gain = {"class": 1, "bbox": 5, "giou": 2, "mask": 1, "dice": 1}
@@ -70,7 +68,6 @@ class HungarianMatcher(nn.Module):
                 For each batch element, it holds:
                     len(index_i) = len(index_j) = min(num_queries, num_target_boxes)
         """
         bs, nq, nc = pred_scores.shape
         if sum(gt_groups) == 0:
@@ -133,7 +130,7 @@ class HungarianMatcher(nn.Module):
     #     sample_points = torch.cat([a.repeat(b, 1, 1, 1) for a, b in zip(sample_points, num_gts) if b > 0])
     #     tgt_mask = F.grid_sample(tgt_mask, sample_points, align_corners=False).squeeze([1, 2])
     #
-    #     with torch.cuda.amp.autocast(False):
+    #     with torch.amp.autocast("cuda", enabled=False):
     #         # binary cross entropy cost
     #         pos_cost_mask = F.binary_cross_entropy_with_logits(out_mask, torch.ones_like(out_mask), reduction='none')
     #         neg_cost_mask = F.binary_cross_entropy_with_logits(out_mask, torch.zeros_like(out_mask), reduction='none')
@@ -175,7 +172,6 @@ def get_cdn_group(
             bounding boxes, attention mask and meta information for denoising. If not in training mode or 'num_dn'
             is less than or equal to 0, the function returns None for all elements in the tuple.
     """
     if (not training) or num_dn <= 0:
         return None, None, None, None
     gt_groups = batch["gt_groups"]

ultralytics/models/yolo/__init__.py CHANGED Viewed

@@ -1,7 +1,7 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
-from ultralytics.models.yolo import classify, detect, obb, pose, segment
+from ultralytics.models.yolo import classify, detect, obb, pose, segment, world
 from .model import YOLO, YOLOWorld
-__all__ = "classify", "segment", "detect", "pose", "obb", "YOLO", "YOLOWorld"
+__all__ = "classify", "segment", "detect", "pose", "obb", "world", "YOLO", "YOLOWorld"

ultralytics/models/yolo/classify/__init__.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from ultralytics.models.yolo.classify.predict import ClassificationPredictor
 from ultralytics.models.yolo.classify.train import ClassificationTrainer

ultralytics/models/yolo/classify/predict.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 import cv2
 import torch
@@ -21,7 +21,7 @@ class ClassificationPredictor(BasePredictor):
         from ultralytics.utils import ASSETS
         from ultralytics.models.yolo.classify import ClassificationPredictor
-        args = dict(model='yolov8n-cls.pt', source=ASSETS)
+        args = dict(model="yolov8n-cls.pt", source=ASSETS)
         predictor = ClassificationPredictor(overrides=args)
         predictor.predict_cli()
         ```
@@ -53,9 +53,8 @@ class ClassificationPredictor(BasePredictor):
         if not isinstance(orig_imgs, list):  # input images are a torch.Tensor, not a list
             orig_imgs = ops.convert_torch2numpy_batch(orig_imgs)
-        results = []
-        for i, pred in enumerate(preds):
-            orig_img = orig_imgs[i]
-            img_path = self.batch[0][i]
-            results.append(Results(orig_img, path=img_path, names=self.model.names, probs=pred))
-        return results
+        preds = preds[0] if isinstance(preds, (list, tuple)) else preds
+        return [
+            Results(orig_img, path=img_path, names=self.model.names, probs=pred)
+            for pred, orig_img, img_path in zip(preds, orig_imgs, self.batch[0])
+        ]

ultralytics/models/yolo/classify/train.py CHANGED Viewed

@@ -1,13 +1,14 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+from copy import copy
 import torch
-import torchvision
 from ultralytics.data import ClassificationDataset, build_dataloader
 from ultralytics.engine.trainer import BaseTrainer
 from ultralytics.models import yolo
-from ultralytics.nn.tasks import ClassificationModel, attempt_load_one_weight
-from ultralytics.utils import DEFAULT_CFG, LOGGER, RANK, colorstr
+from ultralytics.nn.tasks import ClassificationModel
+from ultralytics.utils import DEFAULT_CFG, LOGGER, RANK
 from ultralytics.utils.plotting import plot_images, plot_results
 from ultralytics.utils.torch_utils import is_parallel, strip_optimizer, torch_distributed_zero_first
@@ -23,7 +24,7 @@ class ClassificationTrainer(BaseTrainer):
         ```python
         from ultralytics.models.yolo.classify import ClassificationTrainer
-        args = dict(model='yolov8n-cls.pt', data='imagenet10', epochs=3)
+        args = dict(model="yolov8n-cls.pt", data="imagenet10", epochs=3)
         trainer = ClassificationTrainer(overrides=args)
         trainer.train()
         ```
@@ -59,23 +60,16 @@ class ClassificationTrainer(BaseTrainer):
     def setup_model(self):
         """Load, create or download model for any task."""
-        if isinstance(self.model, torch.nn.Module):  # if model is loaded beforehand. No setup needed
-            return
-        model, ckpt = str(self.model), None
-        # Load a YOLO model locally, from torchvision, or from Ultralytics assets
-        if model.endswith(".pt"):
-            self.model, ckpt = attempt_load_one_weight(model, device="cpu")
-            for p in self.model.parameters():
-                p.requires_grad = True  # for training
-        elif model.split(".")[-1] in ("yaml", "yml"):
-            self.model = self.get_model(cfg=model)
-        elif model in torchvision.models.__dict__:
-            self.model = torchvision.models.__dict__[model](weights="IMAGENET1K_V1" if self.args.pretrained else None)
+        import torchvision  # scope for faster 'import ultralytics'
+        if str(self.model) in torchvision.models.__dict__:
+            self.model = torchvision.models.__dict__[self.model](
+                weights="IMAGENET1K_V1" if self.args.pretrained else None
+            )
+            ckpt = None
         else:
-            FileNotFoundError(f"ERROR: model={model} not found locally or online. Please check model name.")
+            ckpt = super().setup_model()
         ClassificationModel.reshape_outputs(self.model, self.data["nc"])
         return ckpt
     def build_dataset(self, img_path, mode="train", batch=None):
@@ -115,7 +109,9 @@ class ClassificationTrainer(BaseTrainer):
     def get_validator(self):
         """Returns an instance of ClassificationValidator for validation."""
         self.loss_names = ["loss"]
-        return yolo.classify.ClassificationValidator(self.test_loader, self.save_dir, _callbacks=self.callbacks)
+        return yolo.classify.ClassificationValidator(
+            self.test_loader, self.save_dir, args=copy(self.args), _callbacks=self.callbacks
+        )
     def label_loss_items(self, loss_items=None, prefix="train"):
         """
@@ -145,7 +141,6 @@ class ClassificationTrainer(BaseTrainer):
                     self.metrics = self.validator(model=f)
                     self.metrics.pop("fitness", None)
                     self.run_callbacks("on_fit_epoch_end")
-        LOGGER.info(f"Results saved to {colorstr('bold', self.save_dir)}")
     def plot_training_samples(self, batch, ni):
         """Plots training samples with their annotations."""

ultralytics/models/yolo/classify/val.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 import torch
@@ -20,7 +20,7 @@ class ClassificationValidator(BaseValidator):
         ```python
         from ultralytics.models.yolo.classify import ClassificationValidator
-        args = dict(model='yolov8n-cls.pt', data='imagenet10')
+        args = dict(model="yolov8n-cls.pt", data="imagenet10")
         validator = ClassificationValidator(args=args)
         validator()
         ```
@@ -56,8 +56,8 @@ class ClassificationValidator(BaseValidator):
     def update_metrics(self, preds, batch):
         """Updates running metrics with model predictions and batch targets."""
         n5 = min(len(self.names), 5)
-        self.pred.append(preds.argsort(1, descending=True)[:, :n5])
-        self.targets.append(batch["cls"])
+        self.pred.append(preds.argsort(1, descending=True)[:, :n5].type(torch.int32).cpu())
+        self.targets.append(batch["cls"].type(torch.int32).cpu())
     def finalize_metrics(self, *args, **kwargs):
         """Finalizes metrics of the model such as confusion_matrix and speed."""
@@ -71,6 +71,10 @@ class ClassificationValidator(BaseValidator):
         self.metrics.confusion_matrix = self.confusion_matrix
         self.metrics.save_dir = self.save_dir
+    def postprocess(self, preds):
+        """Preprocesses the classification predictions."""
+        return preds[0] if isinstance(preds, (list, tuple)) else preds
     def get_stats(self):
         """Returns a dictionary of metrics obtained by processing targets and predictions."""
         self.metrics.process(self.targets, self.pred)

ultralytics/models/yolo/detect/__init__.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from .predict import DetectionPredictor
 from .train import DetectionTrainer

ultralytics/models/yolo/detect/predict.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 from ultralytics.engine.predictor import BasePredictor
 from ultralytics.engine.results import Results
@@ -14,7 +14,7 @@ class DetectionPredictor(BasePredictor):
         from ultralytics.utils import ASSETS
         from ultralytics.models.yolo.detect import DetectionPredictor
-        args = dict(model='yolov8n.pt', source=ASSETS)
+        args = dict(model="yolo11n.pt", source=ASSETS)
         predictor = DetectionPredictor(overrides=args)
         predictor.predict_cli()
         ```
@@ -35,9 +35,7 @@ class DetectionPredictor(BasePredictor):
             orig_imgs = ops.convert_torch2numpy_batch(orig_imgs)
         results = []
-        for i, pred in enumerate(preds):
-            orig_img = orig_imgs[i]
+        for pred, orig_img, img_path in zip(preds, orig_imgs, self.batch[0]):
             pred[:, :4] = ops.scale_boxes(img.shape[2:], pred[:, :4], orig_img.shape)
-            img_path = self.batch[0][i]
             results.append(Results(orig_img, path=img_path, names=self.model.names, boxes=pred))
         return results

ultralytics/models/yolo/detect/train.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 import math
 import random
@@ -24,7 +24,7 @@ class DetectionTrainer(BaseTrainer):
         ```python
         from ultralytics.models.yolo.detect import DetectionTrainer
-        args = dict(model='yolov8n.pt', data='coco8.yaml', epochs=3)
+        args = dict(model="yolo11n.pt", data="coco8.yaml", epochs=3)
         trainer = DetectionTrainer(overrides=args)
         trainer.train()
         ```
@@ -44,7 +44,7 @@ class DetectionTrainer(BaseTrainer):
     def get_dataloader(self, dataset_path, batch_size=16, rank=0, mode="train"):
         """Construct and return dataloader."""
-        assert mode in ["train", "val"]
+        assert mode in {"train", "val"}, f"Mode must be 'train' or 'val', not {mode}."
         with torch_distributed_zero_first(rank):  # init dataset *.cache only once if DDP
             dataset = self.build_dataset(dataset_path, mode, batch_size)
         shuffle = mode == "train"
@@ -60,7 +60,7 @@ class DetectionTrainer(BaseTrainer):
         if self.args.multi_scale:
             imgs = batch["img"]
             sz = (
-                random.randrange(self.args.imgsz * 0.5, self.args.imgsz * 1.5 + self.stride)
+                random.randrange(int(self.args.imgsz * 0.5), int(self.args.imgsz * 1.5 + self.stride))
                 // self.stride
                 * self.stride
             )  # size
@@ -141,3 +141,10 @@ class DetectionTrainer(BaseTrainer):
         boxes = np.concatenate([lb["bboxes"] for lb in self.train_loader.dataset.labels], 0)
         cls = np.concatenate([lb["cls"] for lb in self.train_loader.dataset.labels], 0)
         plot_labels(boxes, cls.squeeze(), names=self.data["names"], save_dir=self.save_dir, on_plot=self.on_plot)
+    def auto_batch(self):
+        """Get batch size by calculating memory occupation of model."""
+        train_dataset = self.build_dataset(self.trainset, mode="train", batch=16)
+        # 4 for mosaic augmentation
+        max_num_obj = max(len(label["cls"]) for label in train_dataset.labels) * 4
+        return super().auto_batch(max_num_obj)

ultralytics/models/yolo/detect/val.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 import os
 from pathlib import Path
@@ -22,7 +22,7 @@ class DetectionValidator(BaseValidator):
         ```python
         from ultralytics.models.yolo.detect import DetectionValidator
-        args = dict(model='yolov8n.pt', data='coco8.yaml')
+        args = dict(model="yolo11n.pt", data="coco8.yaml")
         validator = DetectionValidator(args=args)
         validator()
         ```
@@ -32,13 +32,20 @@ class DetectionValidator(BaseValidator):
         """Initialize detection model with necessary variables and settings."""
         super().__init__(dataloader, save_dir, pbar, args, _callbacks)
         self.nt_per_class = None
+        self.nt_per_image = None
         self.is_coco = False
+        self.is_lvis = False
         self.class_map = None
         self.args.task = "detect"
         self.metrics = DetMetrics(save_dir=self.save_dir, on_plot=self.on_plot)
         self.iouv = torch.linspace(0.5, 0.95, 10)  # IoU vector for mAP@0.5:0.95
         self.niou = self.iouv.numel()
         self.lb = []  # for autolabelling
+        if self.args.save_hybrid:
+            LOGGER.warning(
+                "WARNING ⚠️ 'save_hybrid=True' will append ground truth to predictions for autolabelling.\n"
+                "WARNING ⚠️ 'save_hybrid=True' will cause incorrect mAP.\n"
+            )
     def preprocess(self, batch):
         """Preprocesses batch of images for YOLO training."""
@@ -51,23 +58,24 @@ class DetectionValidator(BaseValidator):
             height, width = batch["img"].shape[2:]
             nb = len(batch["img"])
             bboxes = batch["bboxes"] * torch.tensor((width, height, width, height), device=self.device)
-            self.lb = (
-                [
-                    torch.cat([batch["cls"][batch["batch_idx"] == i], bboxes[batch["batch_idx"] == i]], dim=-1)
-                    for i in range(nb)
-                ]
-                if self.args.save_hybrid
-                else []
-            )  # for autolabelling
+            self.lb = [
+                torch.cat([batch["cls"][batch["batch_idx"] == i], bboxes[batch["batch_idx"] == i]], dim=-1)
+                for i in range(nb)
+            ]
         return batch
     def init_metrics(self, model):
         """Initialize evaluation metrics for YOLO."""
         val = self.data.get(self.args.split, "")  # validation path
-        self.is_coco = isinstance(val, str) and "coco" in val and val.endswith(f"{os.sep}val2017.txt")  # is COCO
-        self.class_map = converter.coco80_to_coco91_class() if self.is_coco else list(range(1000))
-        self.args.save_json |= self.is_coco and not self.training  # run on final val if training COCO
+        self.is_coco = (
+            isinstance(val, str)
+            and "coco" in val
+            and (val.endswith(f"{os.sep}val2017.txt") or val.endswith(f"{os.sep}test-dev2017.txt"))
+        )  # is COCO
+        self.is_lvis = isinstance(val, str) and "lvis" in val and not self.is_coco  # is LVIS
+        self.class_map = converter.coco80_to_coco91_class() if self.is_coco else list(range(1, len(model.names) + 1))
+        self.args.save_json |= self.args.val and (self.is_coco or self.is_lvis) and not self.training  # run final val
         self.names = model.names
         self.nc = len(model.names)
         self.metrics.names = self.names
@@ -75,7 +83,7 @@ class DetectionValidator(BaseValidator):
         self.confusion_matrix = ConfusionMatrix(nc=self.nc, conf=self.args.conf)
         self.seen = 0
         self.jdict = []
-        self.stats = dict(tp=[], conf=[], pred_cls=[], target_cls=[])
+        self.stats = dict(tp=[], conf=[], pred_cls=[], target_cls=[], target_img=[])
     def get_desc(self):
         """Return a formatted string summarizing class metrics of YOLO model."""
@@ -89,7 +97,7 @@ class DetectionValidator(BaseValidator):
             self.args.iou,
             labels=self.lb,
             multi_label=True,
-            agnostic=self.args.single_cls,
+            agnostic=self.args.single_cls or self.args.agnostic_nms,
             max_det=self.args.max_det,
         )
@@ -104,7 +112,7 @@ class DetectionValidator(BaseValidator):
         if len(cls):
             bbox = ops.xywh2xyxy(bbox) * torch.tensor(imgsz, device=self.device)[[1, 0, 1, 0]]  # target boxes
             ops.scale_boxes(imgsz, bbox, ori_shape, ratio_pad=ratio_pad)  # native-space labels
-        return dict(cls=cls, bbox=bbox, ori_shape=ori_shape, imgsz=imgsz, ratio_pad=ratio_pad)
+        return {"cls": cls, "bbox": bbox, "ori_shape": ori_shape, "imgsz": imgsz, "ratio_pad": ratio_pad}
     def _prepare_pred(self, pred, pbatch):
         """Prepares a batch of images and annotations for validation."""
@@ -128,6 +136,7 @@ class DetectionValidator(BaseValidator):
             cls, bbox = pbatch.pop("cls"), pbatch.pop("bbox")
             nl = len(cls)
             stat["target_cls"] = cls
+            stat["target_img"] = cls.unique()
             if npr == 0:
                 if nl:
                     for k in self.stats.keys():
@@ -146,8 +155,8 @@ class DetectionValidator(BaseValidator):
             # Evaluate
             if nl:
                 stat["tp"] = self._process_batch(predn, bbox, cls)
-                if self.args.plots:
-                    self.confusion_matrix.process_batch(predn, bbox, cls)
+            if self.args.plots:
+                self.confusion_matrix.process_batch(predn, bbox, cls)
             for k in self.stats.keys():
                 self.stats[k].append(stat[k])
@@ -155,8 +164,12 @@ class DetectionValidator(BaseValidator):
             if self.args.save_json:
                 self.pred_to_json(predn, batch["im_file"][si])
             if self.args.save_txt:
-                file = self.save_dir / "labels" / f'{Path(batch["im_file"][si]).stem}.txt'
-                self.save_one_txt(predn, self.args.save_conf, pbatch["ori_shape"], file)
+                self.save_one_txt(
+                    predn,
+                    self.args.save_conf,
+                    pbatch["ori_shape"],
+                    self.save_dir / "labels" / f"{Path(batch['im_file'][si]).stem}.txt",
+                )
     def finalize_metrics(self, *args, **kwargs):
         """Set final values for metrics speed and confusion matrix."""
@@ -166,11 +179,11 @@ class DetectionValidator(BaseValidator):
     def get_stats(self):
         """Returns metrics statistics and results dictionary."""
         stats = {k: torch.cat(v, 0).cpu().numpy() for k, v in self.stats.items()}  # to numpy
+        self.nt_per_class = np.bincount(stats["target_cls"].astype(int), minlength=self.nc)
+        self.nt_per_image = np.bincount(stats["target_img"].astype(int), minlength=self.nc)
+        stats.pop("target_img", None)
         if len(stats) and stats["tp"].any():
             self.metrics.process(**stats)
-        self.nt_per_class = np.bincount(
-            stats["target_cls"].astype(int), minlength=self.nc
-        )  # number of targets per class
         return self.metrics.results_dict
     def print_results(self):
@@ -183,7 +196,9 @@ class DetectionValidator(BaseValidator):
         # Print results per class
         if self.args.verbose and not self.training and self.nc > 1 and len(self.stats):
             for i, c in enumerate(self.metrics.ap_class_index):
-                LOGGER.info(pf % (self.names[c], self.seen, self.nt_per_class[c], *self.metrics.class_result(i)))
+                LOGGER.info(
+                    pf % (self.names[c], self.nt_per_image[c], self.nt_per_class[c], *self.metrics.class_result(i))
+                )
         if self.args.plots:
             for normalize in True, False:
@@ -196,13 +211,18 @@ class DetectionValidator(BaseValidator):
         Return correct prediction matrix.
         Args:
-            detections (torch.Tensor): Tensor of shape [N, 6] representing detections.
-                Each detection is of the format: x1, y1, x2, y2, conf, class.
-            labels (torch.Tensor): Tensor of shape [M, 5] representing labels.
-                Each label is of the format: class, x1, y1, x2, y2.
+            detections (torch.Tensor): Tensor of shape (N, 6) representing detections where each detection is
+                (x1, y1, x2, y2, conf, class).
+            gt_bboxes (torch.Tensor): Tensor of shape (M, 4) representing ground-truth bounding box coordinates. Each
+                bounding box is of the format: (x1, y1, x2, y2).
+            gt_cls (torch.Tensor): Tensor of shape (M,) representing target class indices.
         Returns:
-            (torch.Tensor): Correct prediction matrix of shape [N, 10] for 10 IoU levels.
+            (torch.Tensor): Correct prediction matrix of shape (N, 10) for 10 IoU levels.
+        Note:
+            The function does not return any value directly usable for metrics calculation. Instead, it provides an
+            intermediate representation used for evaluating predictions against ground truth.
         """
         iou = box_iou(gt_bboxes, detections[:, :4])
         return self.match_predictions(detections[:, 5], gt_cls, iou)
@@ -249,12 +269,14 @@ class DetectionValidator(BaseValidator):
     def save_one_txt(self, predn, save_conf, shape, file):
         """Save YOLO detections to a txt file in normalized coordinates in a specific format."""
-        gn = torch.tensor(shape)[[1, 0, 1, 0]]  # normalization gain whwh
-        for *xyxy, conf, cls in predn.tolist():
-            xywh = (ops.xyxy2xywh(torch.tensor(xyxy).view(1, 4)) / gn).view(-1).tolist()  # normalized xywh
-            line = (cls, *xywh, conf) if save_conf else (cls, *xywh)  # label format
-            with open(file, "a") as f:
-                f.write(("%g " * len(line)).rstrip() % line + "\n")
+        from ultralytics.engine.results import Results
+        Results(
+            np.zeros((shape[0], shape[1]), dtype=np.uint8),
+            path=None,
+            names=self.names,
+            boxes=predn[:, :6],
+        ).save_txt(file, save_conf=save_conf)
     def pred_to_json(self, predn, filename):
         """Serialize YOLO predictions to COCO json format."""
@@ -274,26 +296,42 @@ class DetectionValidator(BaseValidator):
     def eval_json(self, stats):
         """Evaluates YOLO output in JSON format and returns performance statistics."""
-        if self.args.save_json and self.is_coco and len(self.jdict):
-            anno_json = self.data["path"] / "annotations/instances_val2017.json"  # annotations
+        if self.args.save_json and (self.is_coco or self.is_lvis) and len(self.jdict):
             pred_json = self.save_dir / "predictions.json"  # predictions
-            LOGGER.info(f"\nEvaluating pycocotools mAP using {pred_json} and {anno_json}...")
+            anno_json = (
+                self.data["path"]
+                / "annotations"
+                / ("instances_val2017.json" if self.is_coco else f"lvis_v1_{self.args.split}.json")
+            )  # annotations
+            pkg = "pycocotools" if self.is_coco else "lvis"
+            LOGGER.info(f"\nEvaluating {pkg} mAP using {pred_json} and {anno_json}...")
             try:  # https://github.com/cocodataset/cocoapi/blob/master/PythonAPI/pycocoEvalDemo.ipynb
-                check_requirements("pycocotools>=2.0.6")
-                from pycocotools.coco import COCO  # noqa
-                from pycocotools.cocoeval import COCOeval  # noqa
-                for x in anno_json, pred_json:
+                for x in pred_json, anno_json:
                     assert x.is_file(), f"{x} file not found"
-                anno = COCO(str(anno_json))  # init annotations api
-                pred = anno.loadRes(str(pred_json))  # init predictions api (must pass string, not Path)
-                eval = COCOeval(anno, pred, "bbox")
+                check_requirements("pycocotools>=2.0.6" if self.is_coco else "lvis>=0.5.3")
                 if self.is_coco:
-                    eval.params.imgIds = [int(Path(x).stem) for x in self.dataloader.dataset.im_files]  # images to eval
-                eval.evaluate()
-                eval.accumulate()
-                eval.summarize()
-                stats[self.metrics.keys[-1]], stats[self.metrics.keys[-2]] = eval.stats[:2]  # update mAP50-95 and mAP50
+                    from pycocotools.coco import COCO  # noqa
+                    from pycocotools.cocoeval import COCOeval  # noqa
+                    anno = COCO(str(anno_json))  # init annotations api
+                    pred = anno.loadRes(str(pred_json))  # init predictions api (must pass string, not Path)
+                    val = COCOeval(anno, pred, "bbox")
+                else:
+                    from lvis import LVIS, LVISEval
+                    anno = LVIS(str(anno_json))  # init annotations api
+                    pred = anno._load_json(str(pred_json))  # init predictions api (must pass string, not Path)
+                    val = LVISEval(anno, pred, "bbox")
+                val.params.imgIds = [int(Path(x).stem) for x in self.dataloader.dataset.im_files]  # images to eval
+                val.evaluate()
+                val.accumulate()
+                val.summarize()
+                if self.is_lvis:
+                    val.print_results()  # explicitly call print_results
+                # update mAP50-95 and mAP50
+                stats[self.metrics.keys[-1]], stats[self.metrics.keys[-2]] = (
+                    val.stats[:2] if self.is_coco else [val.results["AP50"], val.results["AP"]]
+                )
             except Exception as e:
-                LOGGER.warning(f"pycocotools unable to run: {e}")
+                LOGGER.warning(f"{pkg} unable to run: {e}")
         return stats

ultralytics 8.1.29__py3-none-any.whl → 8.3.63__py3-none-any.whl

ultralytics 8.1.29__py3-none-any.whl → 8.3.63__py3-none-any.whl