PyPI - ultralytics - Versions diffs - 8.3.89__py3-none-any.whl → 8.3.91__py3-none-any.whl - Mend

ultralytics 8.3.89__py3-none-any.whl → 8.3.91__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (156) hide show

tests/conftest.py +2 -2
tests/test_cli.py +13 -11
tests/test_cuda.py +10 -1
tests/test_exports.py +2 -2
tests/test_integrations.py +1 -5
tests/test_python.py +16 -16
tests/test_solutions.py +9 -9
ultralytics/__init__.py +1 -1
ultralytics/cfg/__init__.py +3 -1
ultralytics/cfg/models/11/yolo11-cls.yaml +5 -5
ultralytics/cfg/models/11/yolo11-obb.yaml +5 -5
ultralytics/cfg/models/11/yolo11-pose.yaml +5 -5
ultralytics/cfg/models/11/yolo11-seg.yaml +5 -5
ultralytics/cfg/models/11/yolo11.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-ghost-p2.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-ghost-p6.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-ghost.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-obb.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-p6.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-rtdetr.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-world.yaml +5 -5
ultralytics/cfg/models/v8/yolov8-worldv2.yaml +5 -5
ultralytics/cfg/models/v8/yolov8.yaml +5 -5
ultralytics/cfg/models/v9/yolov9c-seg.yaml +1 -1
ultralytics/cfg/models/v9/yolov9c.yaml +1 -1
ultralytics/cfg/models/v9/yolov9e-seg.yaml +1 -1
ultralytics/cfg/models/v9/yolov9e.yaml +1 -1
ultralytics/cfg/models/v9/yolov9m.yaml +1 -1
ultralytics/cfg/models/v9/yolov9s.yaml +1 -1
ultralytics/cfg/models/v9/yolov9t.yaml +1 -1
ultralytics/data/annotator.py +9 -14
ultralytics/data/base.py +118 -30
ultralytics/data/build.py +63 -24
ultralytics/data/converter.py +5 -5
ultralytics/data/dataset.py +207 -53
ultralytics/data/loaders.py +1 -0
ultralytics/data/split_dota.py +39 -12
ultralytics/data/utils.py +15 -19
ultralytics/engine/exporter.py +24 -23
ultralytics/engine/model.py +67 -88
ultralytics/engine/predictor.py +106 -21
ultralytics/engine/trainer.py +32 -23
ultralytics/engine/tuner.py +21 -18
ultralytics/engine/validator.py +75 -41
ultralytics/hub/__init__.py +12 -13
ultralytics/hub/auth.py +9 -12
ultralytics/hub/session.py +76 -21
ultralytics/hub/utils.py +19 -17
ultralytics/models/fastsam/model.py +20 -11
ultralytics/models/fastsam/predict.py +36 -16
ultralytics/models/fastsam/utils.py +5 -5
ultralytics/models/fastsam/val.py +6 -6
ultralytics/models/nas/model.py +22 -11
ultralytics/models/nas/predict.py +9 -4
ultralytics/models/nas/val.py +5 -5
ultralytics/models/rtdetr/model.py +20 -11
ultralytics/models/rtdetr/predict.py +18 -15
ultralytics/models/rtdetr/train.py +20 -16
ultralytics/models/rtdetr/val.py +42 -6
ultralytics/models/sam/__init__.py +1 -1
ultralytics/models/sam/amg.py +50 -4
ultralytics/models/sam/model.py +8 -14
ultralytics/models/sam/modules/decoders.py +18 -21
ultralytics/models/sam/modules/encoders.py +25 -46
ultralytics/models/sam/modules/memory_attention.py +19 -15
ultralytics/models/sam/modules/sam.py +18 -25
ultralytics/models/sam/modules/tiny_encoder.py +19 -29
ultralytics/models/sam/modules/transformer.py +35 -57
ultralytics/models/sam/modules/utils.py +15 -15
ultralytics/models/sam/predict.py +0 -3
ultralytics/models/utils/loss.py +87 -36
ultralytics/models/utils/ops.py +26 -31
ultralytics/models/yolo/classify/predict.py +24 -3
ultralytics/models/yolo/classify/train.py +77 -10
ultralytics/models/yolo/classify/val.py +40 -15
ultralytics/models/yolo/detect/predict.py +23 -10
ultralytics/models/yolo/detect/train.py +85 -15
ultralytics/models/yolo/detect/val.py +145 -21
ultralytics/models/yolo/model.py +1 -2
ultralytics/models/yolo/obb/predict.py +12 -4
ultralytics/models/yolo/obb/train.py +7 -0
ultralytics/models/yolo/obb/val.py +25 -7
ultralytics/models/yolo/pose/predict.py +22 -6
ultralytics/models/yolo/pose/train.py +17 -1
ultralytics/models/yolo/pose/val.py +46 -21
ultralytics/models/yolo/segment/predict.py +22 -8
ultralytics/models/yolo/segment/train.py +6 -0
ultralytics/models/yolo/segment/val.py +100 -14
ultralytics/models/yolo/world/train.py +38 -8
ultralytics/models/yolo/world/train_world.py +39 -10
ultralytics/nn/autobackend.py +28 -14
ultralytics/nn/modules/__init__.py +3 -0
ultralytics/nn/modules/activation.py +12 -3
ultralytics/nn/modules/block.py +587 -84
ultralytics/nn/modules/conv.py +418 -54
ultralytics/nn/modules/head.py +3 -4
ultralytics/nn/modules/transformer.py +320 -34
ultralytics/nn/modules/utils.py +17 -3
ultralytics/nn/tasks.py +221 -69
ultralytics/solutions/ai_gym.py +2 -2
ultralytics/solutions/analytics.py +4 -4
ultralytics/solutions/heatmap.py +4 -4
ultralytics/solutions/instance_segmentation.py +10 -4
ultralytics/solutions/object_blurrer.py +2 -2
ultralytics/solutions/object_counter.py +2 -2
ultralytics/solutions/object_cropper.py +2 -2
ultralytics/solutions/parking_management.py +9 -9
ultralytics/solutions/queue_management.py +1 -1
ultralytics/solutions/region_counter.py +2 -2
ultralytics/solutions/security_alarm.py +7 -7
ultralytics/solutions/solutions.py +7 -4
ultralytics/solutions/speed_estimation.py +2 -2
ultralytics/solutions/streamlit_inference.py +6 -6
ultralytics/solutions/trackzone.py +9 -2
ultralytics/solutions/vision_eye.py +4 -4
ultralytics/trackers/basetrack.py +1 -1
ultralytics/trackers/bot_sort.py +23 -22
ultralytics/trackers/byte_tracker.py +4 -4
ultralytics/trackers/track.py +2 -1
ultralytics/trackers/utils/gmc.py +26 -27
ultralytics/trackers/utils/kalman_filter.py +31 -29
ultralytics/trackers/utils/matching.py +7 -7
ultralytics/utils/__init__.py +32 -27
ultralytics/utils/autobatch.py +5 -5
ultralytics/utils/benchmarks.py +111 -18
ultralytics/utils/callbacks/base.py +3 -3
ultralytics/utils/callbacks/clearml.py +11 -11
ultralytics/utils/callbacks/comet.py +42 -24
ultralytics/utils/callbacks/dvc.py +11 -10
ultralytics/utils/callbacks/hub.py +8 -8
ultralytics/utils/callbacks/mlflow.py +1 -1
ultralytics/utils/callbacks/neptune.py +12 -10
ultralytics/utils/callbacks/raytune.py +1 -1
ultralytics/utils/callbacks/tensorboard.py +6 -6
ultralytics/utils/callbacks/wb.py +16 -16
ultralytics/utils/checks.py +116 -35
ultralytics/utils/dist.py +15 -2
ultralytics/utils/downloads.py +13 -9
ultralytics/utils/files.py +12 -13
ultralytics/utils/instance.py +112 -45
ultralytics/utils/loss.py +28 -33
ultralytics/utils/metrics.py +246 -181
ultralytics/utils/ops.py +61 -53
ultralytics/utils/patches.py +8 -6
ultralytics/utils/plotting.py +65 -45
ultralytics/utils/tal.py +88 -57
ultralytics/utils/torch_utils.py +181 -33
ultralytics/utils/triton.py +13 -3
ultralytics/utils/tuner.py +8 -16
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/METADATA +1 -1
ultralytics-8.3.91.dist-info/RECORD +250 -0
ultralytics-8.3.89.dist-info/RECORD +0 -250
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/LICENSE +0 -0
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/WHEEL +0 -0
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/entry_points.txt +0 -0
{ultralytics-8.3.89.dist-info → ultralytics-8.3.91.dist-info}/top_level.txt +0 -0

ultralytics/nn/modules/conv.py CHANGED Viewed

@@ -35,40 +35,112 @@ def autopad(k, p=None, d=1):  # kernel, padding, dilation
 class Conv(nn.Module):
-    """Standard convolution with args(ch_in, ch_out, kernel, stride, padding, groups, dilation, activation)."""
+    """
+    Standard convolution module with batch normalization and activation.
+    Attributes:
+        conv (nn.Conv2d): Convolutional layer.
+        bn (nn.BatchNorm2d): Batch normalization layer.
+        act (nn.Module): Activation function layer.
+        default_act (nn.Module): Default activation function (SiLU).
+    """
     default_act = nn.SiLU()  # default activation
     def __init__(self, c1, c2, k=1, s=1, p=None, g=1, d=1, act=True):
-        """Initialize Conv layer with given arguments including activation."""
+        """
+        Initialize Conv layer with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            p (int, optional): Padding.
+            g (int): Groups.
+            d (int): Dilation.
+            act (bool | nn.Module): Activation function.
+        """
         super().__init__()
         self.conv = nn.Conv2d(c1, c2, k, s, autopad(k, p, d), groups=g, dilation=d, bias=False)
         self.bn = nn.BatchNorm2d(c2)
         self.act = self.default_act if act is True else act if isinstance(act, nn.Module) else nn.Identity()
     def forward(self, x):
-        """Apply convolution, batch normalization and activation to input tensor."""
+        """
+        Apply convolution, batch normalization and activation to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.act(self.bn(self.conv(x)))
     def forward_fuse(self, x):
-        """Apply convolution and activation without batch normalization."""
+        """
+        Apply convolution and activation without batch normalization.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.act(self.conv(x))
 class Conv2(Conv):
-    """Simplified RepConv module with Conv fusing."""
+    """
+    Simplified RepConv module with Conv fusing.
+    Attributes:
+        conv (nn.Conv2d): Main 3x3 convolutional layer.
+        cv2 (nn.Conv2d): Additional 1x1 convolutional layer.
+        bn (nn.BatchNorm2d): Batch normalization layer.
+        act (nn.Module): Activation function layer.
+    """
     def __init__(self, c1, c2, k=3, s=1, p=None, g=1, d=1, act=True):
-        """Initialize Conv layer with given arguments including activation."""
+        """
+        Initialize Conv2 layer with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            p (int, optional): Padding.
+            g (int): Groups.
+            d (int): Dilation.
+            act (bool | nn.Module): Activation function.
+        """
         super().__init__(c1, c2, k, s, p, g=g, d=d, act=act)
         self.cv2 = nn.Conv2d(c1, c2, 1, s, autopad(1, p, d), groups=g, dilation=d, bias=False)  # add 1x1 conv
     def forward(self, x):
-        """Apply convolution, batch normalization and activation to input tensor."""
+        """
+        Apply convolution, batch normalization and activation to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.act(self.bn(self.conv(x) + self.cv2(x)))
     def forward_fuse(self, x):
-        """Apply fused convolution, batch normalization and activation to input tensor."""
+        """
+        Apply fused convolution, batch normalization and activation to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.act(self.bn(self.conv(x)))
     def fuse_convs(self):
@@ -83,106 +155,257 @@ class Conv2(Conv):
 class LightConv(nn.Module):
     """
-    Light convolution with args(ch_in, ch_out, kernel).
+    Light convolution module with 1x1 and depthwise convolutions.
+    This implementation is based on the PaddleDetection HGNetV2 backbone.
-    https://github.com/PaddlePaddle/PaddleDetection/blob/develop/ppdet/modeling/backbones/hgnet_v2.py
+    Attributes:
+        conv1 (Conv): 1x1 convolution layer.
+        conv2 (DWConv): Depthwise convolution layer.
     """
     def __init__(self, c1, c2, k=1, act=nn.ReLU()):
-        """Initialize Conv layer with given arguments including activation."""
+        """
+        Initialize LightConv layer with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size for depthwise convolution.
+            act (nn.Module): Activation function.
+        """
         super().__init__()
         self.conv1 = Conv(c1, c2, 1, act=False)
         self.conv2 = DWConv(c2, c2, k, act=act)
     def forward(self, x):
-        """Apply 2 convolutions to input tensor."""
+        """
+        Apply 2 convolutions to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.conv2(self.conv1(x))
 class DWConv(Conv):
-    """Depth-wise convolution."""
+    """Depth-wise convolution module."""
-    def __init__(self, c1, c2, k=1, s=1, d=1, act=True):  # ch_in, ch_out, kernel, stride, dilation, activation
-        """Initialize Depth-wise convolution with given parameters."""
+    def __init__(self, c1, c2, k=1, s=1, d=1, act=True):
+        """
+        Initialize depth-wise convolution with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            d (int): Dilation.
+            act (bool | nn.Module): Activation function.
+        """
         super().__init__(c1, c2, k, s, g=math.gcd(c1, c2), d=d, act=act)
 class DWConvTranspose2d(nn.ConvTranspose2d):
-    """Depth-wise transpose convolution."""
+    """Depth-wise transpose convolution module."""
-    def __init__(self, c1, c2, k=1, s=1, p1=0, p2=0):  # ch_in, ch_out, kernel, stride, padding, padding_out
-        """Initialize DWConvTranspose2d class with given parameters."""
+    def __init__(self, c1, c2, k=1, s=1, p1=0, p2=0):
+        """
+        Initialize depth-wise transpose convolution with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            p1 (int): Padding.
+            p2 (int): Output padding.
+        """
         super().__init__(c1, c2, k, s, p1, p2, groups=math.gcd(c1, c2))
 class ConvTranspose(nn.Module):
-    """Convolution transpose 2d layer."""
+    """
+    Convolution transpose module with optional batch normalization and activation.
+    Attributes:
+        conv_transpose (nn.ConvTranspose2d): Transposed convolution layer.
+        bn (nn.BatchNorm2d | nn.Identity): Batch normalization layer.
+        act (nn.Module): Activation function layer.
+        default_act (nn.Module): Default activation function (SiLU).
+    """
     default_act = nn.SiLU()  # default activation
     def __init__(self, c1, c2, k=2, s=2, p=0, bn=True, act=True):
-        """Initialize ConvTranspose2d layer with batch normalization and activation function."""
+        """
+        Initialize ConvTranspose layer with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            p (int): Padding.
+            bn (bool): Use batch normalization.
+            act (bool | nn.Module): Activation function.
+        """
         super().__init__()
         self.conv_transpose = nn.ConvTranspose2d(c1, c2, k, s, p, bias=not bn)
         self.bn = nn.BatchNorm2d(c2) if bn else nn.Identity()
         self.act = self.default_act if act is True else act if isinstance(act, nn.Module) else nn.Identity()
     def forward(self, x):
-        """Applies transposed convolutions, batch normalization and activation to input."""
+        """
+        Apply transposed convolution, batch normalization and activation to input.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.act(self.bn(self.conv_transpose(x)))
     def forward_fuse(self, x):
-        """Applies activation and convolution transpose operation to input."""
+        """
+        Apply activation and convolution transpose operation to input.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.act(self.conv_transpose(x))
 class Focus(nn.Module):
-    """Focus wh information into c-space."""
+    """
+    Focus module for concentrating feature information.
+    Slices input tensor into 4 parts and concatenates them in the channel dimension.
+    Attributes:
+        conv (Conv): Convolution layer.
+    """
     def __init__(self, c1, c2, k=1, s=1, p=None, g=1, act=True):
-        """Initializes Focus object with user defined channel, convolution, padding, group and activation values."""
+        """
+        Initialize Focus module with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            p (int, optional): Padding.
+            g (int): Groups.
+            act (bool | nn.Module): Activation function.
+        """
         super().__init__()
         self.conv = Conv(c1 * 4, c2, k, s, p, g, act=act)
         # self.contract = Contract(gain=2)
     def forward(self, x):
         """
-        Applies convolution to concatenated tensor and returns the output.
+        Apply Focus operation and convolution to input tensor.
         Input shape is (b,c,w,h) and output shape is (b,4c,w/2,h/2).
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
         """
         return self.conv(torch.cat((x[..., ::2, ::2], x[..., 1::2, ::2], x[..., ::2, 1::2], x[..., 1::2, 1::2]), 1))
         # return self.conv(self.contract(x))
 class GhostConv(nn.Module):
-    """Ghost Convolution https://github.com/huawei-noah/ghostnet."""
+    """
+    Ghost Convolution module.
+    Generates more features with fewer parameters by using cheap operations.
+    Attributes:
+        cv1 (Conv): Primary convolution.
+        cv2 (Conv): Cheap operation convolution.
+    References:
+        https://github.com/huawei-noah/ghostnet
+    """
     def __init__(self, c1, c2, k=1, s=1, g=1, act=True):
-        """Initializes Ghost Convolution module with primary and cheap operations for efficient feature learning."""
+        """
+        Initialize Ghost Convolution module with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            g (int): Groups.
+            act (bool | nn.Module): Activation function.
+        """
         super().__init__()
         c_ = c2 // 2  # hidden channels
         self.cv1 = Conv(c1, c_, k, s, None, g, act=act)
         self.cv2 = Conv(c_, c_, 5, 1, None, c_, act=act)
     def forward(self, x):
-        """Forward propagation through a Ghost Bottleneck layer with skip connection."""
+        """
+        Apply Ghost Convolution to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor with concatenated features.
+        """
         y = self.cv1(x)
         return torch.cat((y, self.cv2(y)), 1)
 class RepConv(nn.Module):
     """
-    RepConv is a basic rep-style block, including training and deploy status.
+    RepConv module with training and deploy modes.
+    This module is used in RT-DETR and can fuse convolutions during inference for efficiency.
+    Attributes:
+        conv1 (Conv): 3x3 convolution.
+        conv2 (Conv): 1x1 convolution.
+        bn (nn.BatchNorm2d, optional): Batch normalization for identity branch.
+        act (nn.Module): Activation function.
+        default_act (nn.Module): Default activation function (SiLU).
-    This module is used in RT-DETR.
-    Based on https://github.com/DingXiaoH/RepVGG/blob/main/repvgg.py
+    References:
+        https://github.com/DingXiaoH/RepVGG/blob/main/repvgg.py
     """
     default_act = nn.SiLU()  # default activation
     def __init__(self, c1, c2, k=3, s=1, p=1, g=1, d=1, act=True, bn=False, deploy=False):
-        """Initializes Light Convolution layer with inputs, outputs & optional activation function."""
+        """
+        Initialize RepConv module with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            c2 (int): Number of output channels.
+            k (int): Kernel size.
+            s (int): Stride.
+            p (int): Padding.
+            g (int): Groups.
+            d (int): Dilation.
+            act (bool | nn.Module): Activation function.
+            bn (bool): Use batch normalization for identity branch.
+            deploy (bool): Deploy mode for inference.
+        """
         super().__init__()
         assert k == 3 and p == 1
         self.g = g
@@ -195,16 +418,39 @@ class RepConv(nn.Module):
         self.conv2 = Conv(c1, c2, 1, s, p=(p - k // 2), g=g, act=False)
     def forward_fuse(self, x):
-        """Forward process."""
+        """
+        Forward pass for deploy mode.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         return self.act(self.conv(x))
     def forward(self, x):
-        """Forward process."""
+        """
+        Forward pass for training mode.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Output tensor.
+        """
         id_out = 0 if self.bn is None else self.bn(x)
         return self.act(self.conv1(x) + self.conv2(x) + id_out)
     def get_equivalent_kernel_bias(self):
-        """Returns equivalent kernel and bias by adding 3x3 kernel, 1x1 kernel and identity kernel with their biases."""
+        """
+        Calculate equivalent kernel and bias by fusing convolutions.
+        Returns:
+            (tuple): Tuple containing:
+                - Equivalent kernel (torch.Tensor)
+                - Equivalent bias (torch.Tensor)
+        """
         kernel3x3, bias3x3 = self._fuse_bn_tensor(self.conv1)
         kernel1x1, bias1x1 = self._fuse_bn_tensor(self.conv2)
         kernelid, biasid = self._fuse_bn_tensor(self.bn)
@@ -212,14 +458,32 @@ class RepConv(nn.Module):
     @staticmethod
     def _pad_1x1_to_3x3_tensor(kernel1x1):
-        """Pads a 1x1 tensor to a 3x3 tensor."""
+        """
+        Pad a 1x1 kernel to 3x3 size.
+        Args:
+            kernel1x1 (torch.Tensor): 1x1 convolution kernel.
+        Returns:
+            (torch.Tensor): Padded 3x3 kernel.
+        """
         if kernel1x1 is None:
             return 0
         else:
             return torch.nn.functional.pad(kernel1x1, [1, 1, 1, 1])
     def _fuse_bn_tensor(self, branch):
-        """Generates appropriate kernels and biases for convolution by fusing branches of the neural network."""
+        """
+        Fuse batch normalization with convolution weights.
+        Args:
+            branch (Conv | nn.BatchNorm2d | None): Branch to fuse.
+        Returns:
+            (tuple): Tuple containing:
+                - Fused kernel (torch.Tensor)
+                - Fused bias (torch.Tensor)
+        """
         if branch is None:
             return 0, 0
         if isinstance(branch, Conv):
@@ -247,7 +511,7 @@ class RepConv(nn.Module):
         return kernel * t, beta - running_mean * gamma / std
     def fuse_convs(self):
-        """Combines two convolution layers into a single layer and removes unused attributes from the class."""
+        """Fuse convolutions for inference by creating a single equivalent convolution."""
         if hasattr(self, "conv"):
             return
         kernel, bias = self.get_equivalent_kernel_bias()
@@ -276,25 +540,63 @@ class RepConv(nn.Module):
 class ChannelAttention(nn.Module):
-    """Channel-attention module https://github.com/open-mmlab/mmdetection/tree/v3.0.0rc1/configs/rtmdet."""
+    """
+    Channel-attention module for feature recalibration.
+    Applies attention weights to channels based on global average pooling.
+    Attributes:
+        pool (nn.AdaptiveAvgPool2d): Global average pooling.
+        fc (nn.Conv2d): Fully connected layer implemented as 1x1 convolution.
+        act (nn.Sigmoid): Sigmoid activation for attention weights.
+    References:
+        https://github.com/open-mmlab/mmdetection/tree/v3.0.0rc1/configs/rtmdet
+    """
     def __init__(self, channels: int) -> None:
-        """Initializes the class and sets the basic configurations and instance variables required."""
+        """
+        Initialize Channel-attention module.
+        Args:
+            channels (int): Number of input channels.
+        """
         super().__init__()
         self.pool = nn.AdaptiveAvgPool2d(1)
         self.fc = nn.Conv2d(channels, channels, 1, 1, 0, bias=True)
         self.act = nn.Sigmoid()
     def forward(self, x: torch.Tensor) -> torch.Tensor:
-        """Applies forward pass using activation on convolutions of the input, optionally using batch normalization."""
+        """
+        Apply channel attention to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Channel-attended output tensor.
+        """
         return x * self.act(self.fc(self.pool(x)))
 class SpatialAttention(nn.Module):
-    """Spatial-attention module."""
+    """
+    Spatial-attention module for feature recalibration.
+    Applies attention weights to spatial dimensions based on channel statistics.
+    Attributes:
+        cv1 (nn.Conv2d): Convolution layer for spatial attention.
+        act (nn.Sigmoid): Sigmoid activation for attention weights.
+    """
     def __init__(self, kernel_size=7):
-        """Initialize Spatial-attention module with kernel size argument."""
+        """
+        Initialize Spatial-attention module.
+        Args:
+            kernel_size (int): Size of the convolutional kernel (3 or 7).
+        """
         super().__init__()
         assert kernel_size in {3, 7}, "kernel size must be 3 or 7"
         padding = 3 if kernel_size == 7 else 1
@@ -302,49 +604,111 @@ class SpatialAttention(nn.Module):
         self.act = nn.Sigmoid()
     def forward(self, x):
-        """Apply channel and spatial attention on input for feature recalibration."""
+        """
+        Apply spatial attention to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Spatial-attended output tensor.
+        """
         return x * self.act(self.cv1(torch.cat([torch.mean(x, 1, keepdim=True), torch.max(x, 1, keepdim=True)[0]], 1)))
 class CBAM(nn.Module):
-    """Convolutional Block Attention Module."""
+    """
+    Convolutional Block Attention Module.
+    Combines channel and spatial attention mechanisms for comprehensive feature refinement.
+    Attributes:
+        channel_attention (ChannelAttention): Channel attention module.
+        spatial_attention (SpatialAttention): Spatial attention module.
+    """
     def __init__(self, c1, kernel_size=7):
-        """Initialize CBAM with given input channel (c1) and kernel size."""
+        """
+        Initialize CBAM with given parameters.
+        Args:
+            c1 (int): Number of input channels.
+            kernel_size (int): Size of the convolutional kernel for spatial attention.
+        """
         super().__init__()
         self.channel_attention = ChannelAttention(c1)
         self.spatial_attention = SpatialAttention(kernel_size)
     def forward(self, x):
-        """Applies the forward pass through C1 module."""
+        """
+        Apply channel and spatial attention sequentially to input tensor.
+        Args:
+            x (torch.Tensor): Input tensor.
+        Returns:
+            (torch.Tensor): Attended output tensor.
+        """
         return self.spatial_attention(self.channel_attention(x))
 class Concat(nn.Module):
-    """Concatenate a list of tensors along dimension."""
+    """
+    Concatenate a list of tensors along specified dimension.
+    Attributes:
+        d (int): Dimension along which to concatenate tensors.
+    """
     def __init__(self, dimension=1):
-        """Concatenates a list of tensors along a specified dimension."""
+        """
+        Initialize Concat module.
+        Args:
+            dimension (int): Dimension along which to concatenate tensors.
+        """
         super().__init__()
         self.d = dimension
     def forward(self, x):
-        """Forward pass for the YOLOv8 mask Proto module."""
+        """
+        Concatenate input tensors along specified dimension.
+        Args:
+            x (List[torch.Tensor]): List of input tensors.
+        Returns:
+            (torch.Tensor): Concatenated tensor.
+        """
         return torch.cat(x, self.d)
 class Index(nn.Module):
-    """Returns a particular index of the input."""
+    """
+    Returns a particular index of the input.
+    Attributes:
+        index (int): Index to select from input.
+    """
     def __init__(self, index=0):
-        """Returns a particular index of the input."""
+        """
+        Initialize Index module.
+        Args:
+            index (int): Index to select from input.
+        """
         super().__init__()
         self.index = index
     def forward(self, x):
         """
-        Forward pass.
+        Select and return a particular index from input.
+        Args:
+            x (List[torch.Tensor]): List of input tensors.
-        Expects a list of tensors as input.
+        Returns:
+            (torch.Tensor): Selected tensor.
         """
         return x[self.index]

ultralytics 8.3.89__py3-none-any.whl → 8.3.91__py3-none-any.whl

ultralytics 8.3.89__py3-none-any.whl → 8.3.91__py3-none-any.whl