PyPI - dgenerate-ultralytics-headless - Versions diffs - 8.3.137__py3-none-any.whl → 8.3.224__py3-none-any.whl - Mend

dgenerate-ultralytics-headless 8.3.137__py3-none-any.whl → 8.3.224__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (215) hide show

{dgenerate_ultralytics_headless-8.3.137.dist-info → dgenerate_ultralytics_headless-8.3.224.dist-info}/METADATA +41 -34
dgenerate_ultralytics_headless-8.3.224.dist-info/RECORD +285 -0
{dgenerate_ultralytics_headless-8.3.137.dist-info → dgenerate_ultralytics_headless-8.3.224.dist-info}/WHEEL +1 -1
tests/__init__.py +7 -6
tests/conftest.py +15 -39
tests/test_cli.py +17 -17
tests/test_cuda.py +17 -8
tests/test_engine.py +36 -10
tests/test_exports.py +98 -37
tests/test_integrations.py +12 -15
tests/test_python.py +126 -82
tests/test_solutions.py +319 -135
ultralytics/__init__.py +27 -9
ultralytics/cfg/__init__.py +83 -87
ultralytics/cfg/datasets/Argoverse.yaml +4 -4
ultralytics/cfg/datasets/DOTAv1.5.yaml +2 -2
ultralytics/cfg/datasets/DOTAv1.yaml +2 -2
ultralytics/cfg/datasets/GlobalWheat2020.yaml +2 -2
ultralytics/cfg/datasets/HomeObjects-3K.yaml +4 -5
ultralytics/cfg/datasets/ImageNet.yaml +3 -3
ultralytics/cfg/datasets/Objects365.yaml +24 -20
ultralytics/cfg/datasets/SKU-110K.yaml +9 -9
ultralytics/cfg/datasets/VOC.yaml +10 -13
ultralytics/cfg/datasets/VisDrone.yaml +43 -33
ultralytics/cfg/datasets/african-wildlife.yaml +5 -5
ultralytics/cfg/datasets/brain-tumor.yaml +4 -5
ultralytics/cfg/datasets/carparts-seg.yaml +5 -5
ultralytics/cfg/datasets/coco-pose.yaml +26 -4
ultralytics/cfg/datasets/coco.yaml +4 -4
ultralytics/cfg/datasets/coco128-seg.yaml +2 -2
ultralytics/cfg/datasets/coco128.yaml +2 -2
ultralytics/cfg/datasets/coco8-grayscale.yaml +103 -0
ultralytics/cfg/datasets/coco8-multispectral.yaml +2 -2
ultralytics/cfg/datasets/coco8-pose.yaml +23 -2
ultralytics/cfg/datasets/coco8-seg.yaml +2 -2
ultralytics/cfg/datasets/coco8.yaml +2 -2
ultralytics/cfg/datasets/construction-ppe.yaml +32 -0
ultralytics/cfg/datasets/crack-seg.yaml +5 -5
ultralytics/cfg/datasets/dog-pose.yaml +32 -4
ultralytics/cfg/datasets/dota8-multispectral.yaml +2 -2
ultralytics/cfg/datasets/dota8.yaml +2 -2
ultralytics/cfg/datasets/hand-keypoints.yaml +29 -4
ultralytics/cfg/datasets/lvis.yaml +9 -9
ultralytics/cfg/datasets/medical-pills.yaml +4 -5
ultralytics/cfg/datasets/open-images-v7.yaml +7 -10
ultralytics/cfg/datasets/package-seg.yaml +5 -5
ultralytics/cfg/datasets/signature.yaml +4 -4
ultralytics/cfg/datasets/tiger-pose.yaml +20 -4
ultralytics/cfg/datasets/xView.yaml +5 -5
ultralytics/cfg/default.yaml +96 -93
ultralytics/cfg/trackers/botsort.yaml +16 -17
ultralytics/cfg/trackers/bytetrack.yaml +9 -11
ultralytics/data/__init__.py +4 -4
ultralytics/data/annotator.py +12 -12
ultralytics/data/augment.py +531 -564
ultralytics/data/base.py +76 -81
ultralytics/data/build.py +206 -42
ultralytics/data/converter.py +179 -78
ultralytics/data/dataset.py +121 -121
ultralytics/data/loaders.py +114 -91
ultralytics/data/split.py +28 -15
ultralytics/data/split_dota.py +67 -48
ultralytics/data/utils.py +110 -89
ultralytics/engine/exporter.py +422 -460
ultralytics/engine/model.py +224 -252
ultralytics/engine/predictor.py +94 -89
ultralytics/engine/results.py +345 -595
ultralytics/engine/trainer.py +231 -134
ultralytics/engine/tuner.py +279 -73
ultralytics/engine/validator.py +53 -46
ultralytics/hub/__init__.py +26 -28
ultralytics/hub/auth.py +30 -16
ultralytics/hub/google/__init__.py +34 -36
ultralytics/hub/session.py +53 -77
ultralytics/hub/utils.py +23 -109
ultralytics/models/__init__.py +1 -1
ultralytics/models/fastsam/__init__.py +1 -1
ultralytics/models/fastsam/model.py +36 -18
ultralytics/models/fastsam/predict.py +33 -44
ultralytics/models/fastsam/utils.py +4 -5
ultralytics/models/fastsam/val.py +12 -14
ultralytics/models/nas/__init__.py +1 -1
ultralytics/models/nas/model.py +16 -20
ultralytics/models/nas/predict.py +12 -14
ultralytics/models/nas/val.py +4 -5
ultralytics/models/rtdetr/__init__.py +1 -1
ultralytics/models/rtdetr/model.py +9 -9
ultralytics/models/rtdetr/predict.py +22 -17
ultralytics/models/rtdetr/train.py +20 -16
ultralytics/models/rtdetr/val.py +79 -59
ultralytics/models/sam/__init__.py +8 -2
ultralytics/models/sam/amg.py +53 -38
ultralytics/models/sam/build.py +29 -31
ultralytics/models/sam/model.py +33 -38
ultralytics/models/sam/modules/blocks.py +159 -182
ultralytics/models/sam/modules/decoders.py +38 -47
ultralytics/models/sam/modules/encoders.py +114 -133
ultralytics/models/sam/modules/memory_attention.py +38 -31
ultralytics/models/sam/modules/sam.py +114 -93
ultralytics/models/sam/modules/tiny_encoder.py +268 -291
ultralytics/models/sam/modules/transformer.py +59 -66
ultralytics/models/sam/modules/utils.py +55 -72
ultralytics/models/sam/predict.py +745 -341
ultralytics/models/utils/loss.py +118 -107
ultralytics/models/utils/ops.py +118 -71
ultralytics/models/yolo/__init__.py +1 -1
ultralytics/models/yolo/classify/predict.py +28 -26
ultralytics/models/yolo/classify/train.py +50 -81
ultralytics/models/yolo/classify/val.py +68 -61
ultralytics/models/yolo/detect/predict.py +12 -15
ultralytics/models/yolo/detect/train.py +56 -46
ultralytics/models/yolo/detect/val.py +279 -223
ultralytics/models/yolo/model.py +167 -86
ultralytics/models/yolo/obb/predict.py +7 -11
ultralytics/models/yolo/obb/train.py +23 -25
ultralytics/models/yolo/obb/val.py +107 -99
ultralytics/models/yolo/pose/__init__.py +1 -1
ultralytics/models/yolo/pose/predict.py +12 -14
ultralytics/models/yolo/pose/train.py +31 -69
ultralytics/models/yolo/pose/val.py +119 -254
ultralytics/models/yolo/segment/predict.py +21 -25
ultralytics/models/yolo/segment/train.py +12 -66
ultralytics/models/yolo/segment/val.py +126 -305
ultralytics/models/yolo/world/train.py +53 -45
ultralytics/models/yolo/world/train_world.py +51 -32
ultralytics/models/yolo/yoloe/__init__.py +7 -7
ultralytics/models/yolo/yoloe/predict.py +30 -37
ultralytics/models/yolo/yoloe/train.py +89 -71
ultralytics/models/yolo/yoloe/train_seg.py +15 -17
ultralytics/models/yolo/yoloe/val.py +56 -41
ultralytics/nn/__init__.py +9 -11
ultralytics/nn/autobackend.py +179 -107
ultralytics/nn/modules/__init__.py +67 -67
ultralytics/nn/modules/activation.py +8 -7
ultralytics/nn/modules/block.py +302 -323
ultralytics/nn/modules/conv.py +61 -104
ultralytics/nn/modules/head.py +488 -186
ultralytics/nn/modules/transformer.py +183 -123
ultralytics/nn/modules/utils.py +15 -20
ultralytics/nn/tasks.py +327 -203
ultralytics/nn/text_model.py +81 -65
ultralytics/py.typed +1 -0
ultralytics/solutions/__init__.py +12 -12
ultralytics/solutions/ai_gym.py +19 -27
ultralytics/solutions/analytics.py +36 -26
ultralytics/solutions/config.py +29 -28
ultralytics/solutions/distance_calculation.py +23 -24
ultralytics/solutions/heatmap.py +17 -19
ultralytics/solutions/instance_segmentation.py +21 -19
ultralytics/solutions/object_blurrer.py +16 -17
ultralytics/solutions/object_counter.py +48 -53
ultralytics/solutions/object_cropper.py +22 -16
ultralytics/solutions/parking_management.py +61 -58
ultralytics/solutions/queue_management.py +19 -19
ultralytics/solutions/region_counter.py +63 -50
ultralytics/solutions/security_alarm.py +22 -25
ultralytics/solutions/similarity_search.py +107 -60
ultralytics/solutions/solutions.py +343 -262
ultralytics/solutions/speed_estimation.py +35 -31
ultralytics/solutions/streamlit_inference.py +104 -40
ultralytics/solutions/templates/similarity-search.html +31 -24
ultralytics/solutions/trackzone.py +24 -24
ultralytics/solutions/vision_eye.py +11 -12
ultralytics/trackers/__init__.py +1 -1
ultralytics/trackers/basetrack.py +18 -27
ultralytics/trackers/bot_sort.py +48 -39
ultralytics/trackers/byte_tracker.py +94 -94
ultralytics/trackers/track.py +7 -16
ultralytics/trackers/utils/gmc.py +37 -69
ultralytics/trackers/utils/kalman_filter.py +68 -76
ultralytics/trackers/utils/matching.py +13 -17
ultralytics/utils/__init__.py +251 -275
ultralytics/utils/autobatch.py +19 -7
ultralytics/utils/autodevice.py +68 -38
ultralytics/utils/benchmarks.py +169 -130
ultralytics/utils/callbacks/base.py +12 -13
ultralytics/utils/callbacks/clearml.py +14 -15
ultralytics/utils/callbacks/comet.py +139 -66
ultralytics/utils/callbacks/dvc.py +19 -27
ultralytics/utils/callbacks/hub.py +8 -6
ultralytics/utils/callbacks/mlflow.py +6 -10
ultralytics/utils/callbacks/neptune.py +11 -19
ultralytics/utils/callbacks/platform.py +73 -0
ultralytics/utils/callbacks/raytune.py +3 -4
ultralytics/utils/callbacks/tensorboard.py +9 -12
ultralytics/utils/callbacks/wb.py +33 -30
ultralytics/utils/checks.py +163 -114
ultralytics/utils/cpu.py +89 -0
ultralytics/utils/dist.py +24 -20
ultralytics/utils/downloads.py +176 -146
ultralytics/utils/errors.py +11 -13
ultralytics/utils/events.py +113 -0
ultralytics/utils/export/__init__.py +7 -0
ultralytics/utils/{export.py → export/engine.py} +81 -63
ultralytics/utils/export/imx.py +294 -0
ultralytics/utils/export/tensorflow.py +217 -0
ultralytics/utils/files.py +33 -36
ultralytics/utils/git.py +137 -0
ultralytics/utils/instance.py +105 -120
ultralytics/utils/logger.py +404 -0
ultralytics/utils/loss.py +99 -61
ultralytics/utils/metrics.py +649 -478
ultralytics/utils/nms.py +337 -0
ultralytics/utils/ops.py +263 -451
ultralytics/utils/patches.py +70 -31
ultralytics/utils/plotting.py +253 -223
ultralytics/utils/tal.py +48 -61
ultralytics/utils/torch_utils.py +244 -251
ultralytics/utils/tqdm.py +438 -0
ultralytics/utils/triton.py +22 -23
ultralytics/utils/tuner.py +11 -10
dgenerate_ultralytics_headless-8.3.137.dist-info/RECORD +0 -272
{dgenerate_ultralytics_headless-8.3.137.dist-info → dgenerate_ultralytics_headless-8.3.224.dist-info}/entry_points.txt +0 -0
{dgenerate_ultralytics_headless-8.3.137.dist-info → dgenerate_ultralytics_headless-8.3.224.dist-info}/licenses/LICENSE +0 -0
{dgenerate_ultralytics_headless-8.3.137.dist-info → dgenerate_ultralytics_headless-8.3.224.dist-info}/top_level.txt +0 -0

ultralytics/nn/modules/block.py CHANGED Viewed

@@ -1,6 +1,8 @@
 # Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
 """Block modules."""
+from __future__ import annotations
 import torch
 import torch.nn as nn
 import torch.nn.functional as F
@@ -11,64 +13,67 @@ from .conv import Conv, DWConv, GhostConv, LightConv, RepConv, autopad
 from .transformer import TransformerBlock
 __all__ = (
-    "DFL",
-    "HGBlock",
-    "HGStem",
-    "SPP",
-    "SPPF",
     "C1",
     "C2",
+    "C2PSA",
     "C3",
+    "C3TR",
+    "CIB",
+    "DFL",
+    "ELAN1",
+    "PSA",
+    "SPP",
+    "SPPELAN",
+    "SPPF",
+    "AConv",
+    "ADown",
+    "Attention",
+    "BNContrastiveHead",
+    "Bottleneck",
+    "BottleneckCSP",
     "C2f",
     "C2fAttn",
-    "ImagePoolingAttn",
-    "ContrastiveHead",
-    "BNContrastiveHead",
-    "C3x",
-    "C3TR",
+    "C2fCIB",
+    "C2fPSA",
     "C3Ghost",
+    "C3k2",
+    "C3x",
+    "CBFuse",
+    "CBLinear",
+    "ContrastiveHead",
     "GhostBottleneck",
-    "Bottleneck",
-    "BottleneckCSP",
+    "HGBlock",
+    "HGStem",
+    "ImagePoolingAttn",
     "Proto",
     "RepC3",
-    "ResNetLayer",
     "RepNCSPELAN4",
-    "ELAN1",
-    "ADown",
-    "AConv",
-    "SPPELAN",
-    "CBFuse",
-    "CBLinear",
-    "C3k2",
-    "C2fPSA",
-    "C2PSA",
     "RepVGGDW",
-    "CIB",
-    "C2fCIB",
-    "Attention",
-    "PSA",
+    "ResNetLayer",
     "SCDown",
     "TorchVision",
 )
 class DFL(nn.Module):
-    """
-    Integral module of Distribution Focal Loss (DFL).
+    """Integral module of Distribution Focal Loss (DFL).
     Proposed in Generalized Focal Loss https://ieeexplore.ieee.org/document/9792391
     """
-    def __init__(self, c1=16):
-        """Initialize a convolutional layer with a given number of input channels."""
+    def __init__(self, c1: int = 16):
+        """Initialize a convolutional layer with a given number of input channels.
+        Args:
+            c1 (int): Number of input channels.
+        """
         super().__init__()
         self.conv = nn.Conv2d(c1, 1, 1, bias=False).requires_grad_(False)
         x = torch.arange(c1, dtype=torch.float)
         self.conv.weight.data[:] = nn.Parameter(x.view(1, c1, 1, 1))
         self.c1 = c1
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply the DFL module to input tensor and return transformed output."""
         b, _, a = x.shape  # batch, channels, anchors
         return self.conv(x.view(b, 4, self.c1, a).transpose(2, 1).softmax(1)).view(b, 4, a)
@@ -78,9 +83,8 @@ class DFL(nn.Module):
 class Proto(nn.Module):
     """Ultralytics YOLO models mask Proto module for segmentation models."""
-    def __init__(self, c1, c_=256, c2=32):
-        """
-        Initialize the Ultralytics YOLO models mask Proto module with specified number of protos and masks.
+    def __init__(self, c1: int, c_: int = 256, c2: int = 32):
+        """Initialize the Ultralytics YOLO models mask Proto module with specified number of protos and masks.
         Args:
             c1 (int): Input channels.
@@ -93,21 +97,19 @@ class Proto(nn.Module):
         self.cv2 = Conv(c_, c_, k=3)
         self.cv3 = Conv(c_, c2)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Perform a forward pass through layers using an upsampled input image."""
         return self.cv3(self.cv2(self.upsample(self.cv1(x))))
 class HGStem(nn.Module):
-    """
-    StemBlock of PPHGNetV2 with 5 convolutions and one maxpool2d.
+    """StemBlock of PPHGNetV2 with 5 convolutions and one maxpool2d.
     https://github.com/PaddlePaddle/PaddleDetection/blob/develop/ppdet/modeling/backbones/hgnet_v2.py
     """
-    def __init__(self, c1, cm, c2):
-        """
-        Initialize the StemBlock of PPHGNetV2.
+    def __init__(self, c1: int, cm: int, c2: int):
+        """Initialize the StemBlock of PPHGNetV2.
         Args:
             c1 (int): Input channels.
@@ -122,7 +124,7 @@ class HGStem(nn.Module):
         self.stem4 = Conv(cm, c2, 1, 1, act=nn.ReLU())
         self.pool = nn.MaxPool2d(kernel_size=2, stride=1, padding=0, ceil_mode=True)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass of a PPHGNetV2 backbone layer."""
         x = self.stem1(x)
         x = F.pad(x, [0, 1, 0, 1])
@@ -137,15 +139,23 @@ class HGStem(nn.Module):
 class HGBlock(nn.Module):
-    """
-    HG_Block of PPHGNetV2 with 2 convolutions and LightConv.
+    """HG_Block of PPHGNetV2 with 2 convolutions and LightConv.
     https://github.com/PaddlePaddle/PaddleDetection/blob/develop/ppdet/modeling/backbones/hgnet_v2.py
     """
-    def __init__(self, c1, cm, c2, k=3, n=6, lightconv=False, shortcut=False, act=nn.ReLU()):
-        """
-        Initialize HGBlock with specified parameters.
+    def __init__(
+        self,
+        c1: int,
+        cm: int,
+        c2: int,
+        k: int = 3,
+        n: int = 6,
+        lightconv: bool = False,
+        shortcut: bool = False,
+        act: nn.Module = nn.ReLU(),
+    ):
+        """Initialize HGBlock with specified parameters.
         Args:
             c1 (int): Input channels.
@@ -164,7 +174,7 @@ class HGBlock(nn.Module):
         self.ec = Conv(c2 // 2, c2, 1, 1, act=act)  # excitation conv
         self.add = shortcut and c1 == c2
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass of a PPHGNetV2 backbone layer."""
         y = [x]
         y.extend(m(y[-1]) for m in self.m)
@@ -175,14 +185,13 @@ class HGBlock(nn.Module):
 class SPP(nn.Module):
     """Spatial Pyramid Pooling (SPP) layer https://arxiv.org/abs/1406.4729."""
-    def __init__(self, c1, c2, k=(5, 9, 13)):
-        """
-        Initialize the SPP layer with input/output channels and pooling kernel sizes.
+    def __init__(self, c1: int, c2: int, k: tuple[int, ...] = (5, 9, 13)):
+        """Initialize the SPP layer with input/output channels and pooling kernel sizes.
         Args:
             c1 (int): Input channels.
             c2 (int): Output channels.
-            k (Tuple[int, int, int]): Kernel sizes for max pooling.
+            k (tuple): Kernel sizes for max pooling.
         """
         super().__init__()
         c_ = c1 // 2  # hidden channels
@@ -190,7 +199,7 @@ class SPP(nn.Module):
         self.cv2 = Conv(c_ * (len(k) + 1), c2, 1, 1)
         self.m = nn.ModuleList([nn.MaxPool2d(kernel_size=x, stride=1, padding=x // 2) for x in k])
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass of the SPP layer, performing spatial pyramid pooling."""
         x = self.cv1(x)
         return self.cv2(torch.cat([x] + [m(x) for m in self.m], 1))
@@ -199,9 +208,8 @@ class SPP(nn.Module):
 class SPPF(nn.Module):
     """Spatial Pyramid Pooling - Fast (SPPF) layer for YOLOv5 by Glenn Jocher."""
-    def __init__(self, c1, c2, k=5):
-        """
-        Initialize the SPPF layer with given input/output channels and kernel size.
+    def __init__(self, c1: int, c2: int, k: int = 5):
+        """Initialize the SPPF layer with given input/output channels and kernel size.
         Args:
             c1 (int): Input channels.
@@ -217,7 +225,7 @@ class SPPF(nn.Module):
         self.cv2 = Conv(c_ * 4, c2, 1, 1)
         self.m = nn.MaxPool2d(kernel_size=k, stride=1, padding=k // 2)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply sequential pooling operations to input and return concatenated feature maps."""
         y = [self.cv1(x)]
         y.extend(self.m(y[-1]) for _ in range(3))
@@ -227,9 +235,8 @@ class SPPF(nn.Module):
 class C1(nn.Module):
     """CSP Bottleneck with 1 convolution."""
-    def __init__(self, c1, c2, n=1):
-        """
-        Initialize the CSP Bottleneck with 1 convolution.
+    def __init__(self, c1: int, c2: int, n: int = 1):
+        """Initialize the CSP Bottleneck with 1 convolution.
         Args:
             c1 (int): Input channels.
@@ -240,7 +247,7 @@ class C1(nn.Module):
         self.cv1 = Conv(c1, c2, 1, 1)
         self.m = nn.Sequential(*(Conv(c2, c2, 3) for _ in range(n)))
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply convolution and residual connection to input tensor."""
         y = self.cv1(x)
         return self.m(y) + y
@@ -249,9 +256,8 @@ class C1(nn.Module):
 class C2(nn.Module):
     """CSP Bottleneck with 2 convolutions."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5):
-        """
-        Initialize a CSP Bottleneck with 2 convolutions.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5):
+        """Initialize a CSP Bottleneck with 2 convolutions.
         Args:
             c1 (int): Input channels.
@@ -268,7 +274,7 @@ class C2(nn.Module):
         # self.attention = ChannelAttention(2 * self.c)  # or SpatialAttention()
         self.m = nn.Sequential(*(Bottleneck(self.c, self.c, shortcut, g, k=((3, 3), (3, 3)), e=1.0) for _ in range(n)))
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through the CSP bottleneck with 2 convolutions."""
         a, b = self.cv1(x).chunk(2, 1)
         return self.cv2(torch.cat((self.m(a), b), 1))
@@ -277,9 +283,8 @@ class C2(nn.Module):
 class C2f(nn.Module):
     """Faster Implementation of CSP Bottleneck with 2 convolutions."""
-    def __init__(self, c1, c2, n=1, shortcut=False, g=1, e=0.5):
-        """
-        Initialize a CSP bottleneck with 2 convolutions.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = False, g: int = 1, e: float = 0.5):
+        """Initialize a CSP bottleneck with 2 convolutions.
         Args:
             c1 (int): Input channels.
@@ -295,13 +300,13 @@ class C2f(nn.Module):
         self.cv2 = Conv((2 + n) * self.c, c2, 1)  # optional act=FReLU(c2)
         self.m = nn.ModuleList(Bottleneck(self.c, self.c, shortcut, g, k=((3, 3), (3, 3)), e=1.0) for _ in range(n))
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through C2f layer."""
         y = list(self.cv1(x).chunk(2, 1))
         y.extend(m(y[-1]) for m in self.m)
         return self.cv2(torch.cat(y, 1))
-    def forward_split(self, x):
+    def forward_split(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass using split() instead of chunk()."""
         y = self.cv1(x).split((self.c, self.c), 1)
         y = [y[0], y[1]]
@@ -312,9 +317,8 @@ class C2f(nn.Module):
 class C3(nn.Module):
     """CSP Bottleneck with 3 convolutions."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5):
-        """
-        Initialize the CSP Bottleneck with 3 convolutions.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5):
+        """Initialize the CSP Bottleneck with 3 convolutions.
         Args:
             c1 (int): Input channels.
@@ -331,7 +335,7 @@ class C3(nn.Module):
         self.cv3 = Conv(2 * c_, c2, 1)  # optional act=FReLU(c2)
         self.m = nn.Sequential(*(Bottleneck(c_, c_, shortcut, g, k=((1, 1), (3, 3)), e=1.0) for _ in range(n)))
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through the CSP bottleneck with 3 convolutions."""
         return self.cv3(torch.cat((self.m(self.cv1(x)), self.cv2(x)), 1))
@@ -339,9 +343,8 @@ class C3(nn.Module):
 class C3x(C3):
     """C3 module with cross-convolutions."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5):
-        """
-        Initialize C3 module with cross-convolutions.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5):
+        """Initialize C3 module with cross-convolutions.
         Args:
             c1 (int): Input channels.
@@ -359,9 +362,8 @@ class C3x(C3):
 class RepC3(nn.Module):
     """Rep C3."""
-    def __init__(self, c1, c2, n=3, e=1.0):
-        """
-        Initialize CSP Bottleneck with a single convolution.
+    def __init__(self, c1: int, c2: int, n: int = 3, e: float = 1.0):
+        """Initialize CSP Bottleneck with a single convolution.
         Args:
             c1 (int): Input channels.
@@ -376,7 +378,7 @@ class RepC3(nn.Module):
         self.m = nn.Sequential(*[RepConv(c_, c_) for _ in range(n)])
         self.cv3 = Conv(c_, c2, 1, 1) if c_ != c2 else nn.Identity()
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass of RepC3 module."""
         return self.cv3(self.m(self.cv1(x)) + self.cv2(x))
@@ -384,9 +386,8 @@ class RepC3(nn.Module):
 class C3TR(C3):
     """C3 module with TransformerBlock()."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5):
-        """
-        Initialize C3 module with TransformerBlock.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5):
+        """Initialize C3 module with TransformerBlock.
         Args:
             c1 (int): Input channels.
@@ -404,9 +405,8 @@ class C3TR(C3):
 class C3Ghost(C3):
     """C3 module with GhostBottleneck()."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5):
-        """
-        Initialize C3 module with GhostBottleneck.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5):
+        """Initialize C3 module with GhostBottleneck.
         Args:
             c1 (int): Input channels.
@@ -424,9 +424,8 @@ class C3Ghost(C3):
 class GhostBottleneck(nn.Module):
     """Ghost Bottleneck https://github.com/huawei-noah/Efficient-AI-Backbones."""
-    def __init__(self, c1, c2, k=3, s=1):
-        """
-        Initialize Ghost Bottleneck module.
+    def __init__(self, c1: int, c2: int, k: int = 3, s: int = 1):
+        """Initialize Ghost Bottleneck module.
         Args:
             c1 (int): Input channels.
@@ -445,7 +444,7 @@ class GhostBottleneck(nn.Module):
             nn.Sequential(DWConv(c1, c1, k, s, act=False), Conv(c1, c2, 1, 1, act=False)) if s == 2 else nn.Identity()
         )
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply skip connection and concatenation to input tensor."""
         return self.conv(x) + self.shortcut(x)
@@ -453,16 +452,17 @@ class GhostBottleneck(nn.Module):
 class Bottleneck(nn.Module):
     """Standard bottleneck."""
-    def __init__(self, c1, c2, shortcut=True, g=1, k=(3, 3), e=0.5):
-        """
-        Initialize a standard bottleneck module.
+    def __init__(
+        self, c1: int, c2: int, shortcut: bool = True, g: int = 1, k: tuple[int, int] = (3, 3), e: float = 0.5
+    ):
+        """Initialize a standard bottleneck module.
         Args:
             c1 (int): Input channels.
             c2 (int): Output channels.
             shortcut (bool): Whether to use shortcut connection.
             g (int): Groups for convolutions.
-            k (Tuple[int, int]): Kernel sizes for convolutions.
+            k (tuple): Kernel sizes for convolutions.
             e (float): Expansion ratio.
         """
         super().__init__()
@@ -471,7 +471,7 @@ class Bottleneck(nn.Module):
         self.cv2 = Conv(c_, c2, k[1], 1, g=g)
         self.add = shortcut and c1 == c2
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply bottleneck with optional shortcut connection."""
         return x + self.cv2(self.cv1(x)) if self.add else self.cv2(self.cv1(x))
@@ -479,9 +479,8 @@ class Bottleneck(nn.Module):
 class BottleneckCSP(nn.Module):
     """CSP Bottleneck https://github.com/WongKinYiu/CrossStagePartialNetworks."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5):
-        """
-        Initialize CSP Bottleneck.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5):
+        """Initialize CSP Bottleneck.
         Args:
             c1 (int): Input channels.
@@ -501,7 +500,7 @@ class BottleneckCSP(nn.Module):
         self.act = nn.SiLU()
         self.m = nn.Sequential(*(Bottleneck(c_, c_, shortcut, g, e=1.0) for _ in range(n)))
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply CSP bottleneck with 3 convolutions."""
         y1 = self.cv3(self.m(self.cv1(x)))
         y2 = self.cv2(x)
@@ -511,9 +510,8 @@ class BottleneckCSP(nn.Module):
 class ResNetBlock(nn.Module):
     """ResNet block with standard convolution layers."""
-    def __init__(self, c1, c2, s=1, e=4):
-        """
-        Initialize ResNet block.
+    def __init__(self, c1: int, c2: int, s: int = 1, e: int = 4):
+        """Initialize ResNet block.
         Args:
             c1 (int): Input channels.
@@ -528,7 +526,7 @@ class ResNetBlock(nn.Module):
         self.cv3 = Conv(c2, c3, k=1, act=False)
         self.shortcut = nn.Sequential(Conv(c1, c3, k=1, s=s, act=False)) if s != 1 or c1 != c3 else nn.Identity()
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through the ResNet block."""
         return F.relu(self.cv3(self.cv2(self.cv1(x))) + self.shortcut(x))
@@ -536,9 +534,8 @@ class ResNetBlock(nn.Module):
 class ResNetLayer(nn.Module):
     """ResNet layer with multiple ResNet blocks."""
-    def __init__(self, c1, c2, s=1, is_first=False, n=1, e=4):
-        """
-        Initialize ResNet layer.
+    def __init__(self, c1: int, c2: int, s: int = 1, is_first: bool = False, n: int = 1, e: int = 4):
+        """Initialize ResNet layer.
         Args:
             c1 (int): Input channels.
@@ -560,7 +557,7 @@ class ResNetLayer(nn.Module):
             blocks.extend([ResNetBlock(e * c2, c2, 1, e=e) for _ in range(n - 1)])
             self.layer = nn.Sequential(*blocks)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through the ResNet layer."""
         return self.layer(x)
@@ -568,9 +565,8 @@ class ResNetLayer(nn.Module):
 class MaxSigmoidAttnBlock(nn.Module):
     """Max Sigmoid attention block."""
-    def __init__(self, c1, c2, nh=1, ec=128, gc=512, scale=False):
-        """
-        Initialize MaxSigmoidAttnBlock.
+    def __init__(self, c1: int, c2: int, nh: int = 1, ec: int = 128, gc: int = 512, scale: bool = False):
+        """Initialize MaxSigmoidAttnBlock.
         Args:
             c1 (int): Input channels.
@@ -589,9 +585,8 @@ class MaxSigmoidAttnBlock(nn.Module):
         self.proj_conv = Conv(c1, c2, k=3, s=1, act=False)
         self.scale = nn.Parameter(torch.ones(1, nh, 1, 1)) if scale else 1.0
-    def forward(self, x, guide):
-        """
-        Forward pass of MaxSigmoidAttnBlock.
+    def forward(self, x: torch.Tensor, guide: torch.Tensor) -> torch.Tensor:
+        """Forward pass of MaxSigmoidAttnBlock.
         Args:
             x (torch.Tensor): Input tensor.
@@ -622,9 +617,19 @@ class MaxSigmoidAttnBlock(nn.Module):
 class C2fAttn(nn.Module):
     """C2f module with an additional attn module."""
-    def __init__(self, c1, c2, n=1, ec=128, nh=1, gc=512, shortcut=False, g=1, e=0.5):
-        """
-        Initialize C2f module with attention mechanism.
+    def __init__(
+        self,
+        c1: int,
+        c2: int,
+        n: int = 1,
+        ec: int = 128,
+        nh: int = 1,
+        gc: int = 512,
+        shortcut: bool = False,
+        g: int = 1,
+        e: float = 0.5,
+    ):
+        """Initialize C2f module with attention mechanism.
         Args:
             c1 (int): Input channels.
@@ -644,9 +649,8 @@ class C2fAttn(nn.Module):
         self.m = nn.ModuleList(Bottleneck(self.c, self.c, shortcut, g, k=((3, 3), (3, 3)), e=1.0) for _ in range(n))
         self.attn = MaxSigmoidAttnBlock(self.c, self.c, gc=gc, ec=ec, nh=nh)
-    def forward(self, x, guide):
-        """
-        Forward pass through C2f layer with attention.
+    def forward(self, x: torch.Tensor, guide: torch.Tensor) -> torch.Tensor:
+        """Forward pass through C2f layer with attention.
         Args:
             x (torch.Tensor): Input tensor.
@@ -660,9 +664,8 @@ class C2fAttn(nn.Module):
         y.append(self.attn(y[-1], guide))
         return self.cv2(torch.cat(y, 1))
-    def forward_split(self, x, guide):
-        """
-        Forward pass using split() instead of chunk().
+    def forward_split(self, x: torch.Tensor, guide: torch.Tensor) -> torch.Tensor:
+        """Forward pass using split() instead of chunk().
         Args:
             x (torch.Tensor): Input tensor.
@@ -680,9 +683,10 @@ class C2fAttn(nn.Module):
 class ImagePoolingAttn(nn.Module):
     """ImagePoolingAttn: Enhance the text embeddings with image-aware information."""
-    def __init__(self, ec=256, ch=(), ct=512, nh=8, k=3, scale=False):
-        """
-        Initialize ImagePoolingAttn module.
+    def __init__(
+        self, ec: int = 256, ch: tuple[int, ...] = (), ct: int = 512, nh: int = 8, k: int = 3, scale: bool = False
+    ):
+        """Initialize ImagePoolingAttn module.
         Args:
             ec (int): Embedding channels.
@@ -708,12 +712,11 @@ class ImagePoolingAttn(nn.Module):
         self.hc = ec // nh
         self.k = k
-    def forward(self, x, text):
-        """
-        Forward pass of ImagePoolingAttn.
+    def forward(self, x: list[torch.Tensor], text: torch.Tensor) -> torch.Tensor:
+        """Forward pass of ImagePoolingAttn.
         Args:
-            x (List[torch.Tensor]): List of input feature maps.
+            x (list[torch.Tensor]): List of input feature maps.
             text (torch.Tensor): Text embeddings.
         Returns:
@@ -752,9 +755,8 @@ class ContrastiveHead(nn.Module):
         self.bias = nn.Parameter(torch.tensor([-10.0]))
         self.logit_scale = nn.Parameter(torch.ones([]) * torch.tensor(1 / 0.07).log())
-    def forward(self, x, w):
-        """
-        Forward function of contrastive learning.
+    def forward(self, x: torch.Tensor, w: torch.Tensor) -> torch.Tensor:
+        """Forward function of contrastive learning.
         Args:
             x (torch.Tensor): Image features.
@@ -770,16 +772,14 @@ class ContrastiveHead(nn.Module):
 class BNContrastiveHead(nn.Module):
-    """
-    Batch Norm Contrastive Head using batch norm instead of l2-normalization.
+    """Batch Norm Contrastive Head using batch norm instead of l2-normalization.
     Args:
         embed_dims (int): Embed dimensions of text and image features.
     """
     def __init__(self, embed_dims: int):
-        """
-        Initialize BNContrastiveHead.
+        """Initialize BNContrastiveHead.
         Args:
             embed_dims (int): Embedding dimensions for features.
@@ -798,17 +798,12 @@ class BNContrastiveHead(nn.Module):
         del self.logit_scale
         self.forward = self.forward_fuse
-    def forward_fuse(self, x, w):
-        """
-        Passes input out unchanged.
-        TODO: Update or remove?
-        """
+    def forward_fuse(self, x: torch.Tensor, w: torch.Tensor) -> torch.Tensor:
+        """Passes input out unchanged."""
         return x
-    def forward(self, x, w):
-        """
-        Forward function of contrastive learning with batch normalization.
+    def forward(self, x: torch.Tensor, w: torch.Tensor) -> torch.Tensor:
+        """Forward function of contrastive learning with batch normalization.
         Args:
             x (torch.Tensor): Image features.
@@ -827,16 +822,17 @@ class BNContrastiveHead(nn.Module):
 class RepBottleneck(Bottleneck):
     """Rep bottleneck."""
-    def __init__(self, c1, c2, shortcut=True, g=1, k=(3, 3), e=0.5):
-        """
-        Initialize RepBottleneck.
+    def __init__(
+        self, c1: int, c2: int, shortcut: bool = True, g: int = 1, k: tuple[int, int] = (3, 3), e: float = 0.5
+    ):
+        """Initialize RepBottleneck.
         Args:
             c1 (int): Input channels.
             c2 (int): Output channels.
             shortcut (bool): Whether to use shortcut connection.
             g (int): Groups for convolutions.
-            k (Tuple[int, int]): Kernel sizes for convolutions.
+            k (tuple): Kernel sizes for convolutions.
             e (float): Expansion ratio.
         """
         super().__init__(c1, c2, shortcut, g, k, e)
@@ -847,9 +843,8 @@ class RepBottleneck(Bottleneck):
 class RepCSP(C3):
     """Repeatable Cross Stage Partial Network (RepCSP) module for efficient feature extraction."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5):
-        """
-        Initialize RepCSP layer.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5):
+        """Initialize RepCSP layer.
         Args:
             c1 (int): Input channels.
@@ -867,9 +862,8 @@ class RepCSP(C3):
 class RepNCSPELAN4(nn.Module):
     """CSP-ELAN."""
-    def __init__(self, c1, c2, c3, c4, n=1):
-        """
-        Initialize CSP-ELAN layer.
+    def __init__(self, c1: int, c2: int, c3: int, c4: int, n: int = 1):
+        """Initialize CSP-ELAN layer.
         Args:
             c1 (int): Input channels.
@@ -885,13 +879,13 @@ class RepNCSPELAN4(nn.Module):
         self.cv3 = nn.Sequential(RepCSP(c4, c4, n), Conv(c4, c4, 3, 1))
         self.cv4 = Conv(c3 + (2 * c4), c2, 1, 1)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through RepNCSPELAN4 layer."""
         y = list(self.cv1(x).chunk(2, 1))
         y.extend((m(y[-1])) for m in [self.cv2, self.cv3])
         return self.cv4(torch.cat(y, 1))
-    def forward_split(self, x):
+    def forward_split(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass using split() instead of chunk()."""
         y = list(self.cv1(x).split((self.c, self.c), 1))
         y.extend(m(y[-1]) for m in [self.cv2, self.cv3])
@@ -901,9 +895,8 @@ class RepNCSPELAN4(nn.Module):
 class ELAN1(RepNCSPELAN4):
     """ELAN1 module with 4 convolutions."""
-    def __init__(self, c1, c2, c3, c4):
-        """
-        Initialize ELAN1 layer.
+    def __init__(self, c1: int, c2: int, c3: int, c4: int):
+        """Initialize ELAN1 layer.
         Args:
             c1 (int): Input channels.
@@ -922,9 +915,8 @@ class ELAN1(RepNCSPELAN4):
 class AConv(nn.Module):
     """AConv."""
-    def __init__(self, c1, c2):
-        """
-        Initialize AConv module.
+    def __init__(self, c1: int, c2: int):
+        """Initialize AConv module.
         Args:
             c1 (int): Input channels.
@@ -933,7 +925,7 @@ class AConv(nn.Module):
         super().__init__()
         self.cv1 = Conv(c1, c2, 3, 2, 1)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through AConv layer."""
         x = torch.nn.functional.avg_pool2d(x, 2, 1, 0, False, True)
         return self.cv1(x)
@@ -942,9 +934,8 @@ class AConv(nn.Module):
 class ADown(nn.Module):
     """ADown."""
-    def __init__(self, c1, c2):
-        """
-        Initialize ADown module.
+    def __init__(self, c1: int, c2: int):
+        """Initialize ADown module.
         Args:
             c1 (int): Input channels.
@@ -955,7 +946,7 @@ class ADown(nn.Module):
         self.cv1 = Conv(c1 // 2, self.c, 3, 2, 1)
         self.cv2 = Conv(c1 // 2, self.c, 1, 1, 0)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through ADown layer."""
         x = torch.nn.functional.avg_pool2d(x, 2, 1, 0, False, True)
         x1, x2 = x.chunk(2, 1)
@@ -968,9 +959,8 @@ class ADown(nn.Module):
 class SPPELAN(nn.Module):
     """SPP-ELAN."""
-    def __init__(self, c1, c2, c3, k=5):
-        """
-        Initialize SPP-ELAN block.
+    def __init__(self, c1: int, c2: int, c3: int, k: int = 5):
+        """Initialize SPP-ELAN block.
         Args:
             c1 (int): Input channels.
@@ -986,7 +976,7 @@ class SPPELAN(nn.Module):
         self.cv4 = nn.MaxPool2d(kernel_size=k, stride=1, padding=k // 2)
         self.cv5 = Conv(4 * c3, c2, 1, 1)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through SPPELAN layer."""
         y = [self.cv1(x)]
         y.extend(m(y[-1]) for m in [self.cv2, self.cv3, self.cv4])
@@ -996,13 +986,12 @@ class SPPELAN(nn.Module):
 class CBLinear(nn.Module):
     """CBLinear."""
-    def __init__(self, c1, c2s, k=1, s=1, p=None, g=1):
-        """
-        Initialize CBLinear module.
+    def __init__(self, c1: int, c2s: list[int], k: int = 1, s: int = 1, p: int | None = None, g: int = 1):
+        """Initialize CBLinear module.
         Args:
             c1 (int): Input channels.
-            c2s (List[int]): List of output channel sizes.
+            c2s (list[int]): List of output channel sizes.
             k (int): Kernel size.
             s (int): Stride.
             p (int | None): Padding.
@@ -1012,7 +1001,7 @@ class CBLinear(nn.Module):
         self.c2s = c2s
         self.conv = nn.Conv2d(c1, sum(c2s), k, s, autopad(k, p), groups=g, bias=True)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> list[torch.Tensor]:
         """Forward pass through CBLinear layer."""
         return self.conv(x).split(self.c2s, dim=1)
@@ -1020,22 +1009,20 @@ class CBLinear(nn.Module):
 class CBFuse(nn.Module):
     """CBFuse."""
-    def __init__(self, idx):
-        """
-        Initialize CBFuse module.
+    def __init__(self, idx: list[int]):
+        """Initialize CBFuse module.
         Args:
-            idx (List[int]): Indices for feature selection.
+            idx (list[int]): Indices for feature selection.
         """
         super().__init__()
         self.idx = idx
-    def forward(self, xs):
-        """
-        Forward pass through CBFuse layer.
+    def forward(self, xs: list[torch.Tensor]) -> torch.Tensor:
+        """Forward pass through CBFuse layer.
         Args:
-            xs (List[torch.Tensor]): List of input tensors.
+            xs (list[torch.Tensor]): List of input tensors.
         Returns:
             (torch.Tensor): Fused output tensor.
@@ -1048,9 +1035,8 @@ class CBFuse(nn.Module):
 class C3f(nn.Module):
     """Faster Implementation of CSP Bottleneck with 2 convolutions."""
-    def __init__(self, c1, c2, n=1, shortcut=False, g=1, e=0.5):
-        """
-        Initialize CSP bottleneck layer with two convolutions.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = False, g: int = 1, e: float = 0.5):
+        """Initialize CSP bottleneck layer with two convolutions.
         Args:
             c1 (int): Input channels.
@@ -1067,7 +1053,7 @@ class C3f(nn.Module):
         self.cv3 = Conv((2 + n) * c_, c2, 1)  # optional act=FReLU(c2)
         self.m = nn.ModuleList(Bottleneck(c_, c_, shortcut, g, k=((3, 3), (3, 3)), e=1.0) for _ in range(n))
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Forward pass through C3f layer."""
         y = [self.cv2(x), self.cv1(x)]
         y.extend(m(y[-1]) for m in self.m)
@@ -1077,9 +1063,10 @@ class C3f(nn.Module):
 class C3k2(C2f):
     """Faster Implementation of CSP Bottleneck with 2 convolutions."""
-    def __init__(self, c1, c2, n=1, c3k=False, e=0.5, g=1, shortcut=True):
-        """
-        Initialize C3k2 module.
+    def __init__(
+        self, c1: int, c2: int, n: int = 1, c3k: bool = False, e: float = 0.5, g: int = 1, shortcut: bool = True
+    ):
+        """Initialize C3k2 module.
         Args:
             c1 (int): Input channels.
@@ -1099,9 +1086,8 @@ class C3k2(C2f):
 class C3k(C3):
     """C3k is a CSP bottleneck module with customizable kernel sizes for feature extraction in neural networks."""
-    def __init__(self, c1, c2, n=1, shortcut=True, g=1, e=0.5, k=3):
-        """
-        Initialize C3k module.
+    def __init__(self, c1: int, c2: int, n: int = 1, shortcut: bool = True, g: int = 1, e: float = 0.5, k: int = 3):
+        """Initialize C3k module.
         Args:
             c1 (int): Input channels.
@@ -1121,9 +1107,8 @@ class C3k(C3):
 class RepVGGDW(torch.nn.Module):
     """RepVGGDW is a class that represents a depth wise separable convolutional block in RepVGG architecture."""
-    def __init__(self, ed) -> None:
-        """
-        Initialize RepVGGDW module.
+    def __init__(self, ed: int) -> None:
+        """Initialize RepVGGDW module.
         Args:
             ed (int): Input and output channels.
@@ -1134,9 +1119,8 @@ class RepVGGDW(torch.nn.Module):
         self.dim = ed
         self.act = nn.SiLU()
-    def forward(self, x):
-        """
-        Perform a forward pass of the RepVGGDW block.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Perform a forward pass of the RepVGGDW block.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1146,9 +1130,8 @@ class RepVGGDW(torch.nn.Module):
         """
         return self.act(self.conv(x) + self.conv1(x))
-    def forward_fuse(self, x):
-        """
-        Perform a forward pass of the RepVGGDW block without fusing the convolutions.
+    def forward_fuse(self, x: torch.Tensor) -> torch.Tensor:
+        """Perform a forward pass of the RepVGGDW block without fusing the convolutions.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1160,8 +1143,7 @@ class RepVGGDW(torch.nn.Module):
     @torch.no_grad()
     def fuse(self):
-        """
-        Fuse the convolutional layers in the RepVGGDW block.
+        """Fuse the convolutional layers in the RepVGGDW block.
         This method fuses the convolutional layers and updates the weights and biases accordingly.
         """
@@ -1186,8 +1168,7 @@ class RepVGGDW(torch.nn.Module):
 class CIB(nn.Module):
-    """
-    Conditional Identity Block (CIB) module.
+    """Conditional Identity Block (CIB) module.
     Args:
         c1 (int): Number of input channels.
@@ -1197,9 +1178,8 @@ class CIB(nn.Module):
         lk (bool, optional): Whether to use RepVGGDW for the third convolutional layer. Defaults to False.
     """
-    def __init__(self, c1, c2, shortcut=True, e=0.5, lk=False):
-        """
-        Initialize the CIB module.
+    def __init__(self, c1: int, c2: int, shortcut: bool = True, e: float = 0.5, lk: bool = False):
+        """Initialize the CIB module.
         Args:
             c1 (int): Input channels.
@@ -1220,9 +1200,8 @@ class CIB(nn.Module):
         self.add = shortcut and c1 == c2
-    def forward(self, x):
-        """
-        Forward pass of the CIB module.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Forward pass of the CIB module.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1234,8 +1213,7 @@ class CIB(nn.Module):
 class C2fCIB(C2f):
-    """
-    C2fCIB class represents a convolutional block with C2f and CIB modules.
+    """C2fCIB class represents a convolutional block with C2f and CIB modules.
     Args:
         c1 (int): Number of input channels.
@@ -1247,9 +1225,10 @@ class C2fCIB(C2f):
         e (float, optional): Expansion ratio for CIB modules. Defaults to 0.5.
     """
-    def __init__(self, c1, c2, n=1, shortcut=False, lk=False, g=1, e=0.5):
-        """
-        Initialize C2fCIB module.
+    def __init__(
+        self, c1: int, c2: int, n: int = 1, shortcut: bool = False, lk: bool = False, g: int = 1, e: float = 0.5
+    ):
+        """Initialize C2fCIB module.
         Args:
             c1 (int): Input channels.
@@ -1265,8 +1244,7 @@ class C2fCIB(C2f):
 class Attention(nn.Module):
-    """
-    Attention module that performs self-attention on the input tensor.
+    """Attention module that performs self-attention on the input tensor.
     Args:
         dim (int): The input tensor dimension.
@@ -1283,9 +1261,8 @@ class Attention(nn.Module):
         pe (Conv): Convolutional layer for positional encoding.
     """
-    def __init__(self, dim, num_heads=8, attn_ratio=0.5):
-        """
-        Initialize multi-head attention module.
+    def __init__(self, dim: int, num_heads: int = 8, attn_ratio: float = 0.5):
+        """Initialize multi-head attention module.
         Args:
             dim (int): Input dimension.
@@ -1303,9 +1280,8 @@ class Attention(nn.Module):
         self.proj = Conv(dim, dim, 1, act=False)
         self.pe = Conv(dim, dim, 3, 1, g=dim, act=False)
-    def forward(self, x):
-        """
-        Forward pass of the Attention module.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Forward pass of the Attention module.
         Args:
             x (torch.Tensor): The input tensor.
@@ -1328,8 +1304,7 @@ class Attention(nn.Module):
 class PSABlock(nn.Module):
-    """
-    PSABlock class implementing a Position-Sensitive Attention block for neural networks.
+    """PSABlock class implementing a Position-Sensitive Attention block for neural networks.
     This class encapsulates the functionality for applying multi-head attention and feed-forward neural network layers
     with optional shortcut connections.
@@ -1349,9 +1324,8 @@ class PSABlock(nn.Module):
         >>> output_tensor = psablock(input_tensor)
     """
-    def __init__(self, c, attn_ratio=0.5, num_heads=4, shortcut=True) -> None:
-        """
-        Initialize the PSABlock.
+    def __init__(self, c: int, attn_ratio: float = 0.5, num_heads: int = 4, shortcut: bool = True) -> None:
+        """Initialize the PSABlock.
         Args:
             c (int): Input and output channels.
@@ -1365,9 +1339,8 @@ class PSABlock(nn.Module):
         self.ffn = nn.Sequential(Conv(c, c * 2, 1), Conv(c * 2, c, 1, act=False))
         self.add = shortcut
-    def forward(self, x):
-        """
-        Execute a forward pass through PSABlock.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Execute a forward pass through PSABlock.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1381,8 +1354,7 @@ class PSABlock(nn.Module):
 class PSA(nn.Module):
-    """
-    PSA class for implementing Position-Sensitive Attention in neural networks.
+    """PSA class for implementing Position-Sensitive Attention in neural networks.
     This class encapsulates the functionality for applying position-sensitive attention and feed-forward networks to
     input tensors, enhancing feature extraction and processing capabilities.
@@ -1404,9 +1376,8 @@ class PSA(nn.Module):
         >>> output_tensor = psa.forward(input_tensor)
     """
-    def __init__(self, c1, c2, e=0.5):
-        """
-        Initialize PSA module.
+    def __init__(self, c1: int, c2: int, e: float = 0.5):
+        """Initialize PSA module.
         Args:
             c1 (int): Input channels.
@@ -1422,9 +1393,8 @@ class PSA(nn.Module):
         self.attn = Attention(self.c, attn_ratio=0.5, num_heads=self.c // 64)
         self.ffn = nn.Sequential(Conv(self.c, self.c * 2, 1), Conv(self.c * 2, self.c, 1, act=False))
-    def forward(self, x):
-        """
-        Execute forward pass in PSA module.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Execute forward pass in PSA module.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1439,8 +1409,7 @@ class PSA(nn.Module):
 class C2PSA(nn.Module):
-    """
-    C2PSA module with attention mechanism for enhanced feature extraction and processing.
+    """C2PSA module with attention mechanism for enhanced feature extraction and processing.
     This module implements a convolutional block with attention mechanisms to enhance feature extraction and processing
     capabilities. It includes a series of PSABlock modules for self-attention and feed-forward operations.
@@ -1454,18 +1423,17 @@ class C2PSA(nn.Module):
     Methods:
         forward: Performs a forward pass through the C2PSA module, applying attention and feed-forward operations.
-    Notes:
-        This module essentially is the same as PSA module, but refactored to allow stacking more PSABlock modules.
     Examples:
         >>> c2psa = C2PSA(c1=256, c2=256, n=3, e=0.5)
         >>> input_tensor = torch.randn(1, 256, 64, 64)
         >>> output_tensor = c2psa(input_tensor)
+    Notes:
+        This module essentially is the same as PSA module, but refactored to allow stacking more PSABlock modules.
     """
-    def __init__(self, c1, c2, n=1, e=0.5):
-        """
-        Initialize C2PSA module.
+    def __init__(self, c1: int, c2: int, n: int = 1, e: float = 0.5):
+        """Initialize C2PSA module.
         Args:
             c1 (int): Input channels.
@@ -1481,9 +1449,8 @@ class C2PSA(nn.Module):
         self.m = nn.Sequential(*(PSABlock(self.c, attn_ratio=0.5, num_heads=self.c // 64) for _ in range(n)))
-    def forward(self, x):
-        """
-        Process the input tensor through a series of PSA blocks.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Process the input tensor through a series of PSA blocks.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1497,10 +1464,10 @@ class C2PSA(nn.Module):
 class C2fPSA(C2f):
-    """
-    C2fPSA module with enhanced feature extraction using PSA blocks.
+    """C2fPSA module with enhanced feature extraction using PSA blocks.
-    This class extends the C2f module by incorporating PSA blocks for improved attention mechanisms and feature extraction.
+    This class extends the C2f module by incorporating PSA blocks for improved attention mechanisms and feature
+    extraction.
     Attributes:
         c (int): Number of hidden channels.
@@ -1521,9 +1488,8 @@ class C2fPSA(C2f):
         >>> print(output.shape)
     """
-    def __init__(self, c1, c2, n=1, e=0.5):
-        """
-        Initialize C2fPSA module.
+    def __init__(self, c1: int, c2: int, n: int = 1, e: float = 0.5):
+        """Initialize C2fPSA module.
         Args:
             c1 (int): Input channels.
@@ -1537,8 +1503,7 @@ class C2fPSA(C2f):
 class SCDown(nn.Module):
-    """
-    SCDown module for downsampling with separable convolutions.
+    """SCDown module for downsampling with separable convolutions.
     This module performs downsampling using a combination of pointwise and depthwise convolutions, which helps in
     efficiently reducing the spatial dimensions of the input tensor while maintaining the channel information.
@@ -1560,9 +1525,8 @@ class SCDown(nn.Module):
         torch.Size([1, 128, 64, 64])
     """
-    def __init__(self, c1, c2, k, s):
-        """
-        Initialize SCDown module.
+    def __init__(self, c1: int, c2: int, k: int, s: int):
+        """Initialize SCDown module.
         Args:
             c1 (int): Input channels.
@@ -1574,9 +1538,8 @@ class SCDown(nn.Module):
         self.cv1 = Conv(c1, c2, 1, 1)
         self.cv2 = Conv(c2, c2, k=k, s=s, g=c2, act=False)
-    def forward(self, x):
-        """
-        Apply convolution and downsampling to the input tensor.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Apply convolution and downsampling to the input tensor.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1588,25 +1551,26 @@ class SCDown(nn.Module):
 class TorchVision(nn.Module):
-    """
-    TorchVision module to allow loading any torchvision model.
+    """TorchVision module to allow loading any torchvision model.
-    This class provides a way to load a model from the torchvision library, optionally load pre-trained weights, and customize the model by truncating or unwrapping layers.
-    Attributes:
-        m (nn.Module): The loaded torchvision model, possibly truncated and unwrapped.
+    This class provides a way to load a model from the torchvision library, optionally load pre-trained weights, and
+    customize the model by truncating or unwrapping layers.
     Args:
         model (str): Name of the torchvision model to load.
         weights (str, optional): Pre-trained weights to load. Default is "DEFAULT".
-        unwrap (bool, optional): If True, unwraps the model to a sequential containing all but the last `truncate` layers. Default is True.
+        unwrap (bool, optional): Unwraps the model to a sequential containing all but the last `truncate` layers.
         truncate (int, optional): Number of layers to truncate from the end if `unwrap` is True. Default is 2.
         split (bool, optional): Returns output from intermediate child modules as list. Default is False.
+    Attributes:
+        m (nn.Module): The loaded torchvision model, possibly truncated and unwrapped.
     """
-    def __init__(self, model, weights="DEFAULT", unwrap=True, truncate=2, split=False):
-        """
-        Load the model and weights from torchvision.
+    def __init__(
+        self, model: str, weights: str = "DEFAULT", unwrap: bool = True, truncate: int = 2, split: bool = False
+    ):
+        """Load the model and weights from torchvision.
         Args:
             model (str): Name of the torchvision model to load.
@@ -1632,15 +1596,14 @@ class TorchVision(nn.Module):
             self.split = False
             self.m.head = self.m.heads = nn.Identity()
-    def forward(self, x):
-        """
-        Forward pass through the model.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Forward pass through the model.
         Args:
             x (torch.Tensor): Input tensor.
         Returns:
-            (torch.Tensor | List[torch.Tensor]): Output tensor or list of tensors.
+            (torch.Tensor | list[torch.Tensor]): Output tensor or list of tensors.
         """
         if self.split:
             y = [x]
@@ -1651,8 +1614,7 @@ class TorchVision(nn.Module):
 class AAttn(nn.Module):
-    """
-    Area-attention module for YOLO models, providing efficient attention mechanisms.
+    """Area-attention module for YOLO models, providing efficient attention mechanisms.
     This module implements an area-based attention mechanism that processes input features in a spatially-aware manner,
     making it particularly effective for object detection tasks.
@@ -1676,14 +1638,13 @@ class AAttn(nn.Module):
         torch.Size([1, 256, 32, 32])
     """
-    def __init__(self, dim, num_heads, area=1):
-        """
-        Initialize an Area-attention module for YOLO models.
+    def __init__(self, dim: int, num_heads: int, area: int = 1):
+        """Initialize an Area-attention module for YOLO models.
         Args:
             dim (int): Number of hidden channels.
             num_heads (int): Number of heads into which the attention mechanism is divided.
-            area (int): Number of areas the feature map is divided, default is 1.
+            area (int): Number of areas the feature map is divided.
         """
         super().__init__()
         self.area = area
@@ -1696,9 +1657,8 @@ class AAttn(nn.Module):
         self.proj = Conv(all_head_dim, dim, 1, act=False)
         self.pe = Conv(all_head_dim, dim, 7, 1, 3, g=dim, act=False)
-    def forward(self, x):
-        """
-        Process the input tensor through the area-attention.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Process the input tensor through the area-attention.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1737,8 +1697,7 @@ class AAttn(nn.Module):
 class ABlock(nn.Module):
-    """
-    Area-attention block module for efficient feature extraction in YOLO models.
+    """Area-attention block module for efficient feature extraction in YOLO models.
     This module implements an area-attention mechanism combined with a feed-forward network for processing feature maps.
     It uses a novel area-based attention approach that is more efficient than traditional self-attention while
@@ -1760,9 +1719,8 @@ class ABlock(nn.Module):
         torch.Size([1, 256, 32, 32])
     """
-    def __init__(self, dim, num_heads, mlp_ratio=1.2, area=1):
-        """
-        Initialize an Area-attention block module.
+    def __init__(self, dim: int, num_heads: int, mlp_ratio: float = 1.2, area: int = 1):
+        """Initialize an Area-attention block module.
         Args:
             dim (int): Number of input channels.
@@ -1778,9 +1736,8 @@ class ABlock(nn.Module):
         self.apply(self._init_weights)
-    def _init_weights(self, m):
-        """
-        Initialize weights using a truncated normal distribution.
+    def _init_weights(self, m: nn.Module):
+        """Initialize weights using a truncated normal distribution.
         Args:
             m (nn.Module): Module to initialize.
@@ -1790,9 +1747,8 @@ class ABlock(nn.Module):
             if m.bias is not None:
                 nn.init.constant_(m.bias, 0)
-    def forward(self, x):
-        """
-        Forward pass through ABlock.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Forward pass through ABlock.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1805,8 +1761,7 @@ class ABlock(nn.Module):
 class A2C2f(nn.Module):
-    """
-    Area-Attention C2f module for enhanced feature extraction with area-based attention mechanisms.
+    """Area-Attention C2f module for enhanced feature extraction with area-based attention mechanisms.
     This module extends the C2f architecture by incorporating area-attention and ABlock layers for improved feature
     processing. It supports both area-attention and standard convolution modes.
@@ -1828,9 +1783,20 @@ class A2C2f(nn.Module):
         torch.Size([1, 512, 32, 32])
     """
-    def __init__(self, c1, c2, n=1, a2=True, area=1, residual=False, mlp_ratio=2.0, e=0.5, g=1, shortcut=True):
-        """
-        Initialize Area-Attention C2f module.
+    def __init__(
+        self,
+        c1: int,
+        c2: int,
+        n: int = 1,
+        a2: bool = True,
+        area: int = 1,
+        residual: bool = False,
+        mlp_ratio: float = 2.0,
+        e: float = 0.5,
+        g: int = 1,
+        shortcut: bool = True,
+    ):
+        """Initialize Area-Attention C2f module.
         Args:
             c1 (int): Number of input channels.
@@ -1859,9 +1825,8 @@ class A2C2f(nn.Module):
             for _ in range(n)
         )
-    def forward(self, x):
-        """
-        Forward pass through A2C2f layer.
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Forward pass through A2C2f layer.
         Args:
             x (torch.Tensor): Input tensor.
@@ -1873,20 +1838,26 @@ class A2C2f(nn.Module):
         y.extend(m(y[-1]) for m in self.m)
         y = self.cv2(torch.cat(y, 1))
         if self.gamma is not None:
-            return x + self.gamma.view(-1, len(self.gamma), 1, 1) * y
+            return x + self.gamma.view(-1, self.gamma.shape[0], 1, 1) * y
         return y
 class SwiGLUFFN(nn.Module):
     """SwiGLU Feed-Forward Network for transformer-based architectures."""
-    def __init__(self, gc, ec, e=4) -> None:
-        """Initialize SwiGLU FFN with input dimension, output dimension, and expansion factor."""
+    def __init__(self, gc: int, ec: int, e: int = 4) -> None:
+        """Initialize SwiGLU FFN with input dimension, output dimension, and expansion factor.
+        Args:
+            gc (int): Guide channels.
+            ec (int): Embedding channels.
+            e (int): Expansion factor.
+        """
         super().__init__()
         self.w12 = nn.Linear(gc, e * ec)
         self.w3 = nn.Linear(e * ec // 2, ec)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply SwiGLU transformation to input features."""
         x12 = self.w12(x)
         x1, x2 = x12.chunk(2, dim=-1)
@@ -1897,8 +1868,12 @@ class SwiGLUFFN(nn.Module):
 class Residual(nn.Module):
     """Residual connection wrapper for neural network modules."""
-    def __init__(self, m) -> None:
-        """Initialize residual module with the wrapped module."""
+    def __init__(self, m: nn.Module) -> None:
+        """Initialize residual module with the wrapped module.
+        Args:
+            m (nn.Module): Module to wrap with residual connection.
+        """
         super().__init__()
         self.m = m
         nn.init.zeros_(self.m.w3.bias)
@@ -1906,7 +1881,7 @@ class Residual(nn.Module):
         # nn.init.constant_(self.m.w3.weight, 1e-6)
         nn.init.zeros_(self.m.w3.weight)
-    def forward(self, x):
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
         """Apply residual connection to input features."""
         return x + self.m(x)
@@ -1914,8 +1889,14 @@ class Residual(nn.Module):
 class SAVPE(nn.Module):
     """Spatial-Aware Visual Prompt Embedding module for feature enhancement."""
-    def __init__(self, ch, c3, embed):
-        """Initialize SAVPE module with channels, intermediate channels, and embedding dimension."""
+    def __init__(self, ch: list[int], c3: int, embed: int):
+        """Initialize SAVPE module with channels, intermediate channels, and embedding dimension.
+        Args:
+            ch (list[int]): List of input channel dimensions.
+            c3 (int): Intermediate channels.
+            embed (int): Embedding dimension.
+        """
         super().__init__()
         self.cv1 = nn.ModuleList(
             nn.Sequential(
@@ -1935,7 +1916,7 @@ class SAVPE(nn.Module):
         self.cv5 = nn.Conv2d(1, self.c, 3, padding=1)
         self.cv6 = nn.Sequential(Conv(2 * self.c, self.c, 3), nn.Conv2d(self.c, self.c, 3, padding=1))
-    def forward(self, x, vp):
+    def forward(self, x: list[torch.Tensor], vp: torch.Tensor) -> torch.Tensor:
         """Process input features and visual prompts to generate enhanced embeddings."""
         y = [self.cv2[i](xi) for i, xi in enumerate(x)]
         y = self.cv4(torch.cat(y, dim=1))
@@ -1958,9 +1939,7 @@ class SAVPE(nn.Module):
         vp = vp.reshape(B, Q, 1, -1)
         score = y * vp + torch.logical_not(vp) * torch.finfo(y.dtype).min
-        score = F.softmax(score, dim=-1, dtype=torch.float).to(score.dtype)
+        score = F.softmax(score, dim=-1).to(y.dtype)
         aggregated = score.transpose(-2, -3) @ x.reshape(B, self.c, C // self.c, -1).transpose(-1, -2)
         return F.normalize(aggregated.transpose(-2, -3).reshape(B, Q, -1), dim=-1, p=2)

dgenerate-ultralytics-headless 8.3.137__py3-none-any.whl → 8.3.224__py3-none-any.whl

dgenerate-ultralytics-headless 8.3.137__py3-none-any.whl → 8.3.224__py3-none-any.whl