PyPI - ultralytics - Versions diffs - 8.3.89__py3-none-any.whl → 8.3.91__py3-none-any.whl - Mend

ultralytics-8.3.89-py3-none-any.whl → ultralytics-8.3.91-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (156)

tests/conftest.py +2 -2
tests/test_cli.py +13 -11
tests/test_cuda.py +10 -1
tests/test_exports.py +2 -2
tests/test_integrations.py +1 -5
tests/test_python.py +16 -16
tests/test_solutions.py +9 -9
ultralytics/__init__.py +1 -1
ultralytics/cfg/__init__.py +3 -1
ultralytics/cfg/models/11/yolo11-cls.yaml +5 -5
ultralytics/cfg/models/11/yolo11-obb.yaml +5 -5
ultralytics/cfg/models/11/yolo11-pose.yaml +5 -5
ultralytics/cfg/models/11/yolo11-seg.yaml +5 -5
ultralytics/cfg/models/11/yolo11.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-ghost-p2.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-ghost-p6.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-ghost.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-obb.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-p6.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-rtdetr.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-world.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-worldv2.yaml +5 -5
ultralytics/cfg/models/v8/yolov8.yaml +5 -5
ultralytics/cfg/models/v9/yolov9c-seg.yaml +1 -1
ultralytics/cfg/models/v9/yolov9c.yaml +1 -1
ultralytics/cfg/models/v9/yolov9e-seg.yaml +1 -1
ultralytics/cfg/models/v9/yolov9e.yaml +1 -1
ultralytics/cfg/models/v9/yolov9m.yaml +1 -1
ultralytics/cfg/models/v9/yolov9s.yaml +1 -1
ultralytics/cfg/models/v9/yolov9t.yaml +1 -1
ultralytics/data/annotator.py +9 -14
ultralytics/data/base.py +118 -30
ultralytics/data/build.py +63 -24
ultralytics/data/converter.py +5 -5
ultralytics/data/dataset.py +207 -53
ultralytics/data/loaders.py +1 -0
ultralytics/data/split_dota.py +39 -12
ultralytics/data/utils.py +15 -19
ultralytics/engine/exporter.py +24 -23
ultralytics/engine/model.py +67 -88
ultralytics/engine/predictor.py +106 -21
ultralytics/engine/trainer.py +32 -23
ultralytics/engine/tuner.py +21 -18
ultralytics/engine/validator.py +75 -41
ultralytics/hub/__init__.py +12 -13
ultralytics/hub/auth.py +9 -12
ultralytics/hub/session.py +76 -21
ultralytics/hub/utils.py +19 -17
ultralytics/models/fastsam/model.py +20 -11
ultralytics/models/fastsam/predict.py +36 -16
ultralytics/models/fastsam/utils.py +5 -5
ultralytics/models/fastsam/val.py +6 -6
ultralytics/models/nas/model.py +22 -11
ultralytics/models/nas/predict.py +9 -4
ultralytics/models/nas/val.py +5 -5
ultralytics/models/rtdetr/model.py +20 -11
ultralytics/models/rtdetr/predict.py +18 -15
ultralytics/models/rtdetr/train.py +20 -16
ultralytics/models/rtdetr/val.py +42 -6
ultralytics/models/sam/__init__.py +1 -1
ultralytics/models/sam/amg.py +50 -4
ultralytics/models/sam/model.py +8 -14
ultralytics/models/sam/modules/decoders.py +18 -21
ultralytics/models/sam/modules/encoders.py +25 -46
ultralytics/models/sam/modules/memory_attention.py +19 -15
ultralytics/models/sam/modules/sam.py +18 -25
ultralytics/models/sam/modules/tiny_encoder.py +19 -29
ultralytics/models/sam/modules/transformer.py +35 -57
ultralytics/models/sam/modules/utils.py +15 -15
ultralytics/models/sam/predict.py +0 -3
ultralytics/models/utils/loss.py +87 -36
ultralytics/models/utils/ops.py +26 -31
ultralytics/models/yolo/classify/predict.py +24 -3
ultralytics/models/yolo/classify/train.py +77 -10
ultralytics/models/yolo/classify/val.py +40 -15
ultralytics/models/yolo/detect/predict.py +23 -10
ultralytics/models/yolo/detect/train.py +85 -15
ultralytics/models/yolo/detect/val.py +145 -21
ultralytics/models/yolo/model.py +1 -2
ultralytics/models/yolo/obb/predict.py +12 -4
ultralytics/models/yolo/obb/train.py +7 -0
ultralytics/models/yolo/obb/val.py +25 -7
ultralytics/models/yolo/pose/predict.py +22 -6
ultralytics/models/yolo/pose/train.py +17 -1
ultralytics/models/yolo/pose/val.py +46 -21
ultralytics/models/yolo/segment/predict.py +22 -8
ultralytics/models/yolo/segment/train.py +6 -0
ultralytics/models/yolo/segment/val.py +100 -14
ultralytics/models/yolo/world/train.py +38 -8
ultralytics/models/yolo/world/train_world.py +39 -10
ultralytics/nn/autobackend.py +28 -14
ultralytics/nn/modules/__init__.py +3 -0
ultralytics/nn/modules/activation.py +12 -3
ultralytics/nn/modules/block.py +587 -84
ultralytics/nn/modules/conv.py +418 -54
ultralytics/nn/modules/head.py +3 -4
ultralytics/nn/modules/transformer.py +320 -34
ultralytics/nn/modules/utils.py +17 -3
ultralytics/nn/tasks.py +221 -69
ultralytics/solutions/ai_gym.py +2 -2
ultralytics/solutions/analytics.py +4 -4
ultralytics/solutions/heatmap.py +4 -4
ultralytics/solutions/instance_segmentation.py +10 -4
ultralytics/solutions/object_blurrer.py +2 -2
ultralytics/solutions/object_counter.py +2 -2
ultralytics/solutions/object_cropper.py +2 -2
ultralytics/solutions/parking_management.py +9 -9
ultralytics/solutions/queue_management.py +1 -1
ultralytics/solutions/region_counter.py +2 -2
ultralytics/solutions/security_alarm.py +7 -7
ultralytics/solutions/solutions.py +7 -4
ultralytics/solutions/speed_estimation.py +2 -2
ultralytics/solutions/streamlit_inference.py +6 -6
ultralytics/solutions/trackzone.py +9 -2
ultralytics/solutions/vision_eye.py +4 -4
ultralytics/trackers/basetrack.py +1 -1
ultralytics/trackers/bot_sort.py +23 -22
ultralytics/trackers/byte_tracker.py +4 -4
ultralytics/trackers/track.py +2 -1
ultralytics/trackers/utils/gmc.py +26 -27
ultralytics/trackers/utils/kalman_filter.py +31 -29
ultralytics/trackers/utils/matching.py +7 -7
ultralytics/utils/__init__.py +32 -27
ultralytics/utils/autobatch.py +5 -5
ultralytics/utils/benchmarks.py +111 -18
ultralytics/utils/callbacks/base.py +3 -3
ultralytics/utils/callbacks/clearml.py +11 -11
ultralytics/utils/callbacks/comet.py +42 -24
ultralytics/utils/callbacks/dvc.py +11 -10
ultralytics/utils/callbacks/hub.py +8 -8
ultralytics/utils/callbacks/mlflow.py +1 -1
ultralytics/utils/callbacks/neptune.py +12 -10
ultralytics/utils/callbacks/raytune.py +1 -1
ultralytics/utils/callbacks/tensorboard.py +6 -6
ultralytics/utils/callbacks/wb.py +16 -16
ultralytics/utils/checks.py +116 -35
ultralytics/utils/dist.py +15 -2
ultralytics/utils/downloads.py +13 -9
ultralytics/utils/files.py +12 -13
ultralytics/utils/instance.py +112 -45
ultralytics/utils/loss.py +28 -33
ultralytics/utils/metrics.py +246 -181
ultralytics/utils/ops.py +61 -53
ultralytics/utils/patches.py +8 -6
ultralytics/utils/plotting.py +65 -45
ultralytics/utils/tal.py +88 -57
ultralytics/utils/torch_utils.py +181 -33
ultralytics/utils/triton.py +13 -3
ultralytics/utils/tuner.py +8 -16
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/METADATA +1 -1
ultralytics-8.3.91.dist-info/RECORD +250 -0
ultralytics-8.3.89.dist-info/RECORD +0 -250
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/LICENSE +0 -0
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/WHEEL +0 -0
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/entry_points.txt +0 -0
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/top_level.txt +0 -0

ultralytics/utils/ops.py CHANGED Viewed

@@ -18,6 +18,11 @@ class Profile(contextlib.ContextDecorator):
     """
     YOLOv8 Profile class. Use as a decorator with @Profile() or as a context manager with 'with Profile():'.
+    Attributes:
+        t (float): Accumulated time.
+        device (torch.device): Device used for model inference.
+        cuda (bool): Whether CUDA is being used.
     Examples:
         >>> from ultralytics.utils.ops import Profile
         >>> with Profile(device=device) as dt:
@@ -30,8 +35,8 @@ class Profile(contextlib.ContextDecorator):
         Initialize the Profile class.
         Args:
-            t (float): Initial time. Defaults to 0.0.
-            device (torch.device): Devices used for model inference. Defaults to None (cpu).
+            t (float): Initial time.
+            device (torch.device): Device used for model inference.
         """
         self.t = t
         self.device = device
@@ -63,12 +68,12 @@ def segment2box(segment, width=640, height=640):
     Convert 1 segment label to 1 box label, applying inside-image constraint, i.e. (xy1, xy2, ...) to (xyxy).
     Args:
-        segment (torch.Tensor): the segment label
-        width (int): the width of the image. Defaults to 640
-        height (int): The height of the image. Defaults to 640
+        segment (torch.Tensor): The segment label.
+        width (int): The width of the image.
+        height (int): The height of the image.
     Returns:
-        (np.ndarray): the minimum and maximum x and y values of the segment.
+        (np.ndarray): The minimum and maximum x and y values of the segment.
     """
     x, y = segment.T  # segment xy
     # any 3 out of 4 sides are outside the image, clip coordinates first, https://github.com/ultralytics/ultralytics/pull/18294
@@ -87,21 +92,20 @@ def segment2box(segment, width=640, height=640):
 def scale_boxes(img1_shape, boxes, img0_shape, ratio_pad=None, padding=True, xywh=False):
     """
-    Rescales bounding boxes (in the format of xyxy by default) from the shape of the image they were originally
-    specified in (img1_shape) to the shape of a different image (img0_shape).
+    Rescale bounding boxes from img1_shape to img0_shape.
     Args:
         img1_shape (tuple): The shape of the image that the bounding boxes are for, in the format of (height, width).
-        boxes (torch.Tensor): the bounding boxes of the objects in the image, in the format of (x1, y1, x2, y2)
-        img0_shape (tuple): the shape of the target image, in the format of (height, width).
-        ratio_pad (tuple): a tuple of (ratio, pad) for scaling the boxes. If not provided, the ratio and pad will be
+        boxes (torch.Tensor): The bounding boxes of the objects in the image, in the format of (x1, y1, x2, y2).
+        img0_shape (tuple): The shape of the target image, in the format of (height, width).
+        ratio_pad (tuple): A tuple of (ratio, pad) for scaling the boxes. If not provided, the ratio and pad will be
             calculated based on the size difference between the two images.
         padding (bool): If True, assuming the boxes is based on image augmented by yolo style. If False then do regular
             rescaling.
-        xywh (bool): The box format is xywh or not, default=False.
+        xywh (bool): The box format is xywh or not.
     Returns:
-        boxes (torch.Tensor): The scaled bounding boxes, in the format of (x1, y1, x2, y2)
+        (torch.Tensor): The scaled bounding boxes, in the format of (x1, y1, x2, y2).
     """
     if ratio_pad is None:  # calculate from img0_shape
         gain = min(img1_shape[0] / img0_shape[0], img1_shape[1] / img0_shape[1])  # gain  = old / new
@@ -146,8 +150,8 @@ def nms_rotated(boxes, scores, threshold=0.45, use_triu=True):
     Args:
         boxes (torch.Tensor): Rotated bounding boxes, shape (N, 5), format xywhr.
         scores (torch.Tensor): Confidence scores, shape (N,).
-        threshold (float, optional): IoU threshold. Defaults to 0.45.
-        use_triu (bool, optional): Whether to use `torch.triu` operator. It'd be useful for disable it
+        threshold (float): IoU threshold.
+        use_triu (bool): Whether to use `torch.triu` operator. It'd be useful for disable it
             when exporting obb models to some formats that do not support `torch.triu`.
     Returns:
@@ -210,7 +214,7 @@ def non_max_suppression(
             list contains the apriori labels for a given image. The list should be in the format
             output by a dataloader, with each label being a tuple of (class_index, x1, y1, x2, y2).
         max_det (int): The maximum number of boxes to keep after NMS.
-        nc (int, optional): The number of classes output by the model. Any indices after this will be considered masks.
+        nc (int): The number of classes output by the model. Any indices after this will be considered masks.
         max_time_img (float): The maximum time (seconds) for processing one image.
         max_nms (int): The maximum number of boxes into torchvision.ops.nms().
         max_wh (int): The maximum box width and height in pixels.
@@ -333,7 +337,7 @@ def clip_boxes(boxes, shape):
     Takes a list of bounding boxes and a shape (height, width) and clips the bounding boxes to the shape.
     Args:
-        boxes (torch.Tensor): The bounding boxes to clip.
+        boxes (torch.Tensor | numpy.ndarray): The bounding boxes to clip.
         shape (tuple): The shape of the image.
     Returns:
@@ -359,7 +363,7 @@ def clip_coords(coords, shape):
         shape (tuple): A tuple of integers representing the size of the image in the format (height, width).
     Returns:
-        (torch.Tensor | numpy.ndarray): Clipped coordinates
+        (torch.Tensor | numpy.ndarray): Clipped coordinates.
     """
     if isinstance(coords, torch.Tensor):  # faster individually (WARNING: inplace .clamp_() Apple MPS bug)
         coords[..., 0] = coords[..., 0].clamp(0, shape[1])  # x
@@ -451,10 +455,11 @@ def xywhn2xyxy(x, w=640, h=640, padw=0, padh=0):
     Args:
         x (np.ndarray | torch.Tensor): The bounding box coordinates.
-        w (int): Width of the image. Defaults to 640
-        h (int): Height of the image. Defaults to 640
-        padw (int): Padding width. Defaults to 0
-        padh (int): Padding height. Defaults to 0
+        w (int): Width of the image.
+        h (int): Height of the image.
+        padw (int): Padding width.
+        padh (int): Padding height.
     Returns:
         y (np.ndarray | torch.Tensor): The coordinates of the bounding box in the format [x1, y1, x2, y2] where
             x1,y1 is the top-left corner, x2,y2 is the bottom-right corner of the bounding box.
@@ -475,10 +480,10 @@ def xyxy2xywhn(x, w=640, h=640, clip=False, eps=0.0):
     Args:
         x (np.ndarray | torch.Tensor): The input bounding box coordinates in (x1, y1, x2, y2) format.
-        w (int): The width of the image. Defaults to 640
-        h (int): The height of the image. Defaults to 640
-        clip (bool): If True, the boxes will be clipped to the image boundaries. Defaults to False
-        eps (float): The minimum value of the box's width and height. Defaults to 0.0
+        w (int): The width of the image.
+        h (int): The height of the image.
+        clip (bool): If True, the boxes will be clipped to the image boundaries.
+        eps (float): The minimum value of the box's width and height.
     Returns:
         y (np.ndarray | torch.Tensor): The bounding box coordinates in (x, y, width, height, normalized) format
@@ -598,13 +603,13 @@ def xywhr2xyxyxyxy(x):
 def ltwh2xyxy(x):
     """
-    It converts the bounding box from [x1, y1, w, h] to [x1, y1, x2, y2] where xy1=top-left, xy2=bottom-right.
+    Convert bounding box from [x1, y1, w, h] to [x1, y1, x2, y2] where xy1=top-left, xy2=bottom-right.
     Args:
-        x (np.ndarray | torch.Tensor): the input image
+        x (np.ndarray | torch.Tensor): The input image.
     Returns:
-        y (np.ndarray | torch.Tensor): the xyxy coordinates of the bounding boxes.
+        (np.ndarray | torch.Tensor): The xyxy coordinates of the bounding boxes.
     """
     y = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
     y[..., 2] = x[..., 2] + x[..., 0]  # width
@@ -614,13 +619,13 @@ def ltwh2xyxy(x):
 def segments2boxes(segments):
     """
-    It converts segment labels to box labels, i.e. (cls, xy1, xy2, ...) to (cls, xywh).
+    Convert segment labels to box labels, i.e. (cls, xy1, xy2, ...) to (cls, xywh).
     Args:
-        segments (list): list of segments, each segment is a list of points, each point is a list of x, y coordinates
+        segments (List): List of segments, each segment is a list of points, each point is a list of x, y coordinates.
     Returns:
-        (np.ndarray): the xywh coordinates of the bounding boxes.
+        (np.ndarray): The xywh coordinates of the bounding boxes.
     """
     boxes = []
     for s in segments:
@@ -634,11 +639,11 @@ def resample_segments(segments, n=1000):
     Inputs a list of segments (n,2) and returns a list of segments (n,2) up-sampled to n points each.
     Args:
-        segments (list): a list of (n,2) arrays, where n is the number of points in the segment.
-        n (int): number of points to resample the segment to. Defaults to 1000
+        segments (List): A list of (n,2) arrays, where n is the number of points in the segment.
+        n (int): Number of points to resample the segment to.
     Returns:
-        segments (list): the resampled segments.
+        segments (List): The resampled segments.
     """
     for i, s in enumerate(segments):
         if len(s) == n:
@@ -655,14 +660,14 @@ def resample_segments(segments, n=1000):
 def crop_mask(masks, boxes):
     """
-    It takes a mask and a bounding box, and returns a mask that is cropped to the bounding box.
+    Crop masks to bounding boxes.
     Args:
-        masks (torch.Tensor): [n, h, w] tensor of masks
-        boxes (torch.Tensor): [n, 4] tensor of bbox coordinates in relative point form
+        masks (torch.Tensor): [n, h, w] tensor of masks.
+        boxes (torch.Tensor): [n, 4] tensor of bbox coordinates in relative point form.
     Returns:
-        (torch.Tensor): The masks are being cropped to the bounding box.
+        (torch.Tensor): Cropped masks.
     """
     _, h, w = masks.shape
     x1, y1, x2, y2 = torch.chunk(boxes[:, :, None], 4, 1)  # x1 shape(n,1,1)
@@ -681,7 +686,7 @@ def process_mask(protos, masks_in, bboxes, shape, upsample=False):
         masks_in (torch.Tensor): A tensor of shape [n, mask_dim], where n is the number of masks after NMS.
         bboxes (torch.Tensor): A tensor of shape [n, 4], where n is the number of masks after NMS.
         shape (tuple): A tuple of integers representing the size of the input image in the format (h, w).
-        upsample (bool): A flag to indicate whether to upsample the mask to the original image size. Default is False.
+        upsample (bool): A flag to indicate whether to upsample the mask to the original image size.
     Returns:
         (torch.Tensor): A binary mask tensor of shape [n, h, w], where n is the number of masks after NMS, and h and w
@@ -707,16 +712,16 @@ def process_mask(protos, masks_in, bboxes, shape, upsample=False):
 def process_mask_native(protos, masks_in, bboxes, shape):
     """
-    It takes the output of the mask head, and crops it after upsampling to the bounding boxes.
+    Apply masks to bounding boxes using the output of the mask head with native upsampling.
     Args:
-        protos (torch.Tensor): [mask_dim, mask_h, mask_w]
+        protos (torch.Tensor): [mask_dim, mask_h, mask_w].
         masks_in (torch.Tensor): [n, mask_dim], n is number of masks after nms.
         bboxes (torch.Tensor): [n, 4], n is number of masks after nms.
         shape (tuple): The size of the input image (h,w).
     Returns:
-        masks (torch.Tensor): The returned masks with dimensions [h, w, n].
+        (torch.Tensor): The returned masks with dimensions [h, w, n].
     """
     c, mh, mw = protos.shape  # CHW
     masks = (masks_in @ protos.float().view(c, -1)).view(-1, mh, mw)
@@ -734,6 +739,9 @@ def scale_masks(masks, shape, padding=True):
         shape (tuple): Height and width.
         padding (bool): If True, assuming the boxes is based on image augmented by yolo style. If False then do regular
             rescaling.
+    Returns:
+        (torch.Tensor): Rescaled masks.
     """
     mh, mw = masks.shape[2:]
     gain = min(mh / shape[0], mw / shape[1])  # gain  = old / new
@@ -755,10 +763,10 @@ def scale_coords(img1_shape, coords, img0_shape, ratio_pad=None, normalize=False
     Args:
         img1_shape (tuple): The shape of the image that the coords are from.
-        coords (torch.Tensor): the coords to be scaled of shape n,2.
-        img0_shape (tuple): the shape of the image that the segmentation is being applied to.
-        ratio_pad (tuple): the ratio of the image size to the padded image size.
-        normalize (bool): If True, the coordinates will be normalized to the range [0, 1]. Defaults to False.
+        coords (torch.Tensor): The coords to be scaled of shape n,2.
+        img0_shape (tuple): The shape of the image that the segmentation is being applied to.
+        ratio_pad (tuple): The ratio of the image size to the padded image size.
+        normalize (bool): If True, the coordinates will be normalized to the range [0, 1].
         padding (bool): If True, assuming the boxes is based on image augmented by yolo style. If False then do regular
             rescaling.
@@ -805,14 +813,14 @@ def regularize_rboxes(rboxes):
 def masks2segments(masks, strategy="all"):
     """
-    It takes a list of masks(n,h,w) and returns a list of segments(n,xy).
+    Convert masks to segments.
     Args:
-        masks (torch.Tensor): the output of the model, which is a tensor of shape (batch_size, 160, 160)
-        strategy (str): 'all' or 'largest'. Defaults to all
+        masks (torch.Tensor): The output of the model, which is a tensor of shape (batch_size, 160, 160).
+        strategy (str): 'all' or 'largest'.
     Returns:
-        segments (List): list of segment masks
+        (List): List of segment masks.
     """
     from ultralytics.data.converter import merge_multi_segment
@@ -852,10 +860,10 @@ def clean_str(s):
     Cleans a string by replacing special characters with '_' character.
     Args:
-        s (str): a string needing special characters replaced
+        s (str): A string needing special characters replaced.
     Returns:
-        (str): a string with special characters replaced by an underscore _
+        (str): A string with special characters replaced by an underscore _.
     """
     return re.sub(pattern="[|@#!¡·$€%&()=?¿^*;:,¨´><+]", repl="_", string=s)

ultralytics/utils/patches.py CHANGED Viewed

@@ -18,7 +18,7 @@ def imread(filename: str, flags: int = cv2.IMREAD_COLOR):
     Args:
         filename (str): Path to the file to read.
-        flags (int, optional): Flag that can take values of cv2.IMREAD_*. Defaults to cv2.IMREAD_COLOR.
+        flags (int, optional): Flag that can take values of cv2.IMREAD_*.
     Returns:
         (np.ndarray): The read image.
@@ -33,7 +33,7 @@ def imwrite(filename: str, img: np.ndarray, params=None):
     Args:
         filename (str): Path to the file to write.
         img (np.ndarray): Image to write.
-        params (list of ints, optional): Additional parameters. See OpenCV documentation.
+        params (List[int], optional): Additional parameters for image encoding.
     Returns:
         (bool): True if the file was written, False otherwise.
@@ -47,7 +47,7 @@ def imwrite(filename: str, img: np.ndarray, params=None):
 def imshow(winname: str, mat: np.ndarray):
     """
-    Displays an image in the specified window.
+    Display an image in the specified window.
     Args:
         winname (str): Name of the window.
@@ -88,11 +88,13 @@ def torch_load(*args, **kwargs):
 def torch_save(*args, **kwargs):
     """
-    Optionally use dill to serialize lambda functions where pickle does not, adding robustness with 3 retries and
-    exponential standoff in case of save failure.
+    Save PyTorch objects with retry mechanism for robustness.
+    This function wraps torch.save with 3 retries and exponential backoff in case of save failures, which can occur
+    due to device flushing delays or antivirus scanning.
     Args:
-        *args (tuple): Positional arguments to pass to torch.save.
+        *args (Any): Positional arguments to pass to torch.save.
         **kwargs (Any): Keyword arguments to pass to torch.save.
     """
     for i in range(4):  # 3 retries

ultralytics/utils/plotting.py CHANGED Viewed

@@ -25,9 +25,9 @@ class Colors:
     RGB values.
     Attributes:
-        palette (list of tuple): List of RGB color values.
+        palette (List[Tuple]): List of RGB color values.
         n (int): The number of colors in the palette.
-        pose_palette (np.ndarray): A specific color palette array with dtype np.uint8.
+        pose_palette (np.ndarray): A specific color palette array for pose estimation with dtype np.uint8.
     Examples:
         >>> from ultralytics.utils.plotting import Colors
@@ -142,13 +142,13 @@ class Colors:
         )
     def __call__(self, i, bgr=False):
-        """Converts hex color codes to RGB values."""
+        """Convert hex color codes to RGB values."""
         c = self.palette[int(i) % self.n]
         return (c[2], c[1], c[0]) if bgr else c
     @staticmethod
     def hex2rgb(h):
-        """Converts hex color codes to RGB values (i.e. default PIL order)."""
+        """Convert hex color codes to RGB values (i.e. default PIL order)."""
         return tuple(int(h[1 + i : 1 + i + 2], 16) for i in (0, 2, 4))
@@ -160,13 +160,15 @@ class Annotator:
     Ultralytics Annotator for train/val mosaics and JPGs and predictions annotations.
     Attributes:
-        im (Image.Image or numpy array): The image to annotate.
+        im (Image.Image or np.ndarray): The image to annotate.
         pil (bool): Whether to use PIL or cv2 for drawing annotations.
         font (ImageFont.truetype or ImageFont.load_default): Font used for text annotations.
         lw (float): Line width for drawing.
         skeleton (List[List[int]]): Skeleton structure for keypoints.
         limb_color (List[int]): Color palette for limbs.
         kpt_color (List[int]): Color palette for keypoints.
+        dark_colors (set): Set of colors considered dark for text contrast.
+        light_colors (set): Set of colors considered light for text contrast.
     Examples:
         >>> from ultralytics.utils.plotting import Annotator
@@ -256,7 +258,7 @@ class Annotator:
             txt_color (tuple, optional): The color of the text (R, G, B).
         Returns:
-            txt_color (tuple): Text color for label
+            (tuple): Text color for label.
         Examples:
             >>> from ultralytics.utils.plotting import Annotator
@@ -273,14 +275,14 @@ class Annotator:
     def box_label(self, box, label="", color=(128, 128, 128), txt_color=(255, 255, 255), rotated=False):
         """
-        Draws a bounding box to image with label.
+        Draw a bounding box on an image with a given label.
         Args:
             box (tuple): The bounding box coordinates (x1, y1, x2, y2).
-            label (str): The text label to be displayed.
+            label (str, optional): The text label to be displayed.
             color (tuple, optional): The background color of the rectangle (B, G, R).
             txt_color (tuple, optional): The color of the text (R, G, B).
-            rotated (bool, optional): Variable used to check if task is OBB
+            rotated (bool, optional): Whether the task is oriented bounding box detection.
         Examples:
             >>> from ultralytics.utils.plotting import Annotator
@@ -340,11 +342,11 @@ class Annotator:
         Plot masks on image.
         Args:
-            masks (tensor): Predicted masks on cuda, shape: [n, h, w]
-            colors (List[List[Int]]): Colors for predicted masks, [[r, g, b] * n]
-            im_gpu (tensor): Image is in cuda, shape: [3, h, w], range: [0, 1]
-            alpha (float): Mask transparency: 0.0 fully transparent, 1.0 opaque
-            retina_masks (bool): Whether to use high resolution masks or not. Defaults to False.
+            masks (torch.Tensor): Predicted masks on cuda, shape: [n, h, w]
+            colors (List[List[int]]): Colors for predicted masks, [[r, g, b] * n]
+            im_gpu (torch.Tensor): Image is in cuda, shape: [3, h, w], range: [0, 1]
+            alpha (float, optional): Mask transparency: 0.0 fully transparent, 1.0 opaque.
+            retina_masks (bool, optional): Whether to use high resolution masks or not.
         """
         if self.pil:
             # Convert to numpy first
@@ -377,11 +379,11 @@ class Annotator:
         Args:
             kpts (torch.Tensor): Keypoints, shape [17, 3] (x, y, confidence).
-            shape (tuple, optional): Image shape (h, w). Defaults to (640, 640).
-            radius (int, optional): Keypoint radius. Defaults to 5.
-            kpt_line (bool, optional): Draw lines between keypoints. Defaults to True.
-            conf_thres (float, optional): Confidence threshold. Defaults to 0.25.
-            kpt_color (tuple, optional): Keypoint color (B, G, R). Defaults to None.
+            shape (tuple, optional): Image shape (h, w).
+            radius (int, optional): Keypoint radius.
+            kpt_line (bool, optional): Draw lines between keypoints.
+            conf_thres (float, optional): Confidence threshold.
+            kpt_color (tuple, optional): Keypoint color (B, G, R).
         Note:
             - `kpt_line=True` currently only supports human pose plotting.
@@ -436,7 +438,16 @@ class Annotator:
         self.draw.rectangle(xy, fill, outline, width)
     def text(self, xy, text, txt_color=(255, 255, 255), anchor="top", box_style=False):
-        """Adds text to an image using PIL or cv2."""
+        """
+        Add text to an image using PIL or cv2.
+        Args:
+            xy (List[int]): Top-left coordinates for text placement.
+            text (str): Text to be drawn.
+            txt_color (tuple, optional): Text color (R, G, B).
+            anchor (str, optional): Text anchor position ('top' or 'bottom').
+            box_style (bool, optional): Whether to draw text with a background box.
+        """
         if anchor == "bottom":  # start y from font bottom
             w, h = self.font.getsize(text)  # text width, height
             xy[1] += 1 - h
@@ -492,7 +503,7 @@ class Annotator:
     @staticmethod
     def get_bbox_dimension(bbox=None):
         """
-        Calculate the area of a bounding box.
+        Calculate the dimensions and area of a bounding box.
         Args:
             bbox (tuple): Bounding box coordinates in the format (x_min, y_min, x_max, y_max).
@@ -517,7 +528,16 @@ class Annotator:
 @TryExcept()  # known issue https://github.com/ultralytics/yolov5/issues/5395
 @plt_settings()
 def plot_labels(boxes, cls, names=(), save_dir=Path(""), on_plot=None):
-    """Plot training labels including class histograms and box statistics."""
+    """
+    Plot training labels including class histograms and box statistics.
+    Args:
+        boxes (np.ndarray): Bounding box coordinates in format [x, y, width, height].
+        cls (np.ndarray): Class indices.
+        names (Dict, optional): Dictionary mapping class indices to class names.
+        save_dir (Path, optional): Directory to save the plot.
+        on_plot (Callable, optional): Function to call after plot is saved.
+    """
     import pandas  # scope for faster 'import ultralytics'
     import seaborn  # scope for faster 'import ultralytics'
@@ -580,16 +600,16 @@ def save_one_box(xyxy, im, file=Path("im.jpg"), gain=1.02, pad=10, square=False,
     Args:
         xyxy (torch.Tensor or list): A tensor or list representing the bounding box in xyxy format.
-        im (numpy.ndarray): The input image.
-        file (Path, optional): The path where the cropped image will be saved. Defaults to 'im.jpg'.
-        gain (float, optional): A multiplicative factor to increase the size of the bounding box. Defaults to 1.02.
-        pad (int, optional): The number of pixels to add to the width and height of the bounding box. Defaults to 10.
-        square (bool, optional): If True, the bounding box will be transformed into a square. Defaults to False.
-        BGR (bool, optional): If True, the image will be saved in BGR format, otherwise in RGB. Defaults to False.
-        save (bool, optional): If True, the cropped image will be saved to disk. Defaults to True.
+        im (np.ndarray): The input image.
+        file (Path, optional): The path where the cropped image will be saved.
+        gain (float, optional): A multiplicative factor to increase the size of the bounding box.
+        pad (int, optional): The number of pixels to add to the width and height of the bounding box.
+        square (bool, optional): If True, the bounding box will be transformed into a square.
+        BGR (bool, optional): If True, the image will be saved in BGR format, otherwise in RGB.
+        save (bool, optional): If True, the cropped image will be saved to disk.
     Returns:
-        (numpy.ndarray): The cropped image.
+        (np.ndarray): The cropped image.
     Examples:
         >>> from ultralytics.utils.plotting import save_one_box
@@ -653,7 +673,7 @@ def plot_images(
         conf_thres: Confidence threshold for displaying detections.
     Returns:
-        np.ndarray: Plotted image grid as a numpy array if save is False, None otherwise.
+        (np.ndarray): Plotted image grid as a numpy array if save is False, None otherwise.
     Note:
         This function supports both tensor and numpy array inputs. It will automatically
@@ -693,6 +713,7 @@ def plot_images(
     # Annotate
     fs = int((h + w) * ns * 0.01)  # font size
+    fs = max(fs, 18)  # ensure that the font size is large enough to be easily readable.
     annotator = Annotator(mosaic, line_width=round(fs / 10), font_size=fs, pil=True, example=names)
     for i in range(bs):
         x, y = int(w * (i // ns)), int(h * (i % ns))  # block origin
@@ -789,13 +810,12 @@ def plot_results(file="path/to/results.csv", dir="", segment=False, pose=False,
     pose estimation, and classification. Plots are saved as 'results.png' in the directory where the CSV is located.
     Args:
-        file (str, optional): Path to the CSV file containing the training results. Defaults to 'path/to/results.csv'.
-        dir (str, optional): Directory where the CSV file is located if 'file' is not provided. Defaults to ''.
-        segment (bool, optional): Flag to indicate if the data is for segmentation. Defaults to False.
-        pose (bool, optional): Flag to indicate if the data is for pose estimation. Defaults to False.
-        classify (bool, optional): Flag to indicate if the data is for classification. Defaults to False.
+        file (str, optional): Path to the CSV file containing the training results.
+        dir (str, optional): Directory where the CSV file is located if 'file' is not provided.
+        segment (bool, optional): Flag to indicate if the data is for segmentation.
+        pose (bool, optional): Flag to indicate if the data is for pose estimation.
+        classify (bool, optional): Flag to indicate if the data is for classification.
         on_plot (callable, optional): Callback function to be executed after plotting. Takes filename as an argument.
-            Defaults to None.
     Examples:
         >>> from ultralytics.utils.plotting import plot_results
@@ -845,15 +865,15 @@ def plot_results(file="path/to/results.csv", dir="", segment=False, pose=False,
 def plt_color_scatter(v, f, bins=20, cmap="viridis", alpha=0.8, edgecolors="none"):
     """
-    Plots a scatter plot with points colored based on a 2D histogram.
+    Plot a scatter plot with points colored based on a 2D histogram.
     Args:
         v (array-like): Values for the x-axis.
         f (array-like): Values for the y-axis.
-        bins (int, optional): Number of bins for the histogram. Defaults to 20.
-        cmap (str, optional): Colormap for the scatter plot. Defaults to 'viridis'.
-        alpha (float, optional): Alpha for the scatter plot. Defaults to 0.8.
-        edgecolors (str, optional): Edge colors for the scatter plot. Defaults to 'none'.
+        bins (int, optional): Number of bins for the histogram.
+        cmap (str, optional): Colormap for the scatter plot.
+        alpha (float, optional): Alpha for the scatter plot.
+        edgecolors (str, optional): Edge colors for the scatter plot.
     Examples:
         >>> v = np.random.rand(100)
@@ -880,7 +900,7 @@ def plot_tune_results(csv_file="tune_results.csv"):
     in the CSV, color-coded based on fitness scores. The best-performing configurations are highlighted on the plots.
     Args:
-        csv_file (str, optional): Path to the CSV file containing the tuning results. Defaults to 'tune_results.csv'.
+        csv_file (str, optional): Path to the CSV file containing the tuning results.
     Examples:
         >>> plot_tune_results("path/to/tune_results.csv")
@@ -959,8 +979,8 @@ def feature_visualization(x, module_type, stage, n=32, save_dir=Path("runs/detec
         x (torch.Tensor): Features to be visualized.
         module_type (str): Module type.
         stage (int): Module stage within the model.
-        n (int, optional): Maximum number of feature maps to plot. Defaults to 32.
-        save_dir (Path, optional): Directory to save results. Defaults to Path('runs/detect/exp').
+        n (int, optional): Maximum number of feature maps to plot.
+        save_dir (Path, optional): Directory to save results.
     """
     for m in {"Detect", "Segment", "Pose", "Classify", "OBB", "RTDETRDecoder"}:  # all model heads
         if m in module_type:

ultralytics 8.3.89__py3-none-any.whl → 8.3.91__py3-none-any.whl

ultralytics 8.3.89__py3-none-any.whl → 8.3.91__py3-none-any.whl