birder 0.4.1__py3-none-any.whl → 0.4.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- birder/__init__.py +2 -0
- birder/common/fs_ops.py +81 -1
- birder/common/training_cli.py +12 -2
- birder/common/training_utils.py +73 -12
- birder/data/collators/detection.py +3 -1
- birder/datahub/_lib.py +15 -6
- birder/datahub/evaluation.py +591 -0
- birder/eval/__init__.py +0 -0
- birder/eval/__main__.py +74 -0
- birder/eval/_embeddings.py +50 -0
- birder/eval/adversarial.py +315 -0
- birder/eval/benchmarks/__init__.py +0 -0
- birder/eval/benchmarks/awa2.py +357 -0
- birder/eval/benchmarks/bioscan5m.py +198 -0
- birder/eval/benchmarks/fishnet.py +318 -0
- birder/eval/benchmarks/flowers102.py +210 -0
- birder/eval/benchmarks/fungiclef.py +261 -0
- birder/eval/benchmarks/nabirds.py +202 -0
- birder/eval/benchmarks/newt.py +262 -0
- birder/eval/benchmarks/plankton.py +255 -0
- birder/eval/benchmarks/plantdoc.py +259 -0
- birder/eval/benchmarks/plantnet.py +252 -0
- birder/eval/classification.py +235 -0
- birder/eval/methods/__init__.py +0 -0
- birder/eval/methods/ami.py +78 -0
- birder/eval/methods/knn.py +71 -0
- birder/eval/methods/linear.py +152 -0
- birder/eval/methods/mlp.py +178 -0
- birder/eval/methods/simpleshot.py +100 -0
- birder/eval/methods/svm.py +92 -0
- birder/inference/classification.py +23 -2
- birder/inference/detection.py +35 -15
- birder/net/_vit_configs.py +5 -0
- birder/net/cait.py +3 -3
- birder/net/coat.py +3 -3
- birder/net/cswin_transformer.py +2 -1
- birder/net/deit.py +1 -1
- birder/net/deit3.py +1 -1
- birder/net/detection/__init__.py +2 -0
- birder/net/detection/base.py +41 -18
- birder/net/detection/deformable_detr.py +74 -50
- birder/net/detection/detr.py +29 -26
- birder/net/detection/efficientdet.py +42 -25
- birder/net/detection/faster_rcnn.py +53 -21
- birder/net/detection/fcos.py +42 -23
- birder/net/detection/lw_detr.py +1204 -0
- birder/net/detection/plain_detr.py +60 -47
- birder/net/detection/retinanet.py +47 -35
- birder/net/detection/rt_detr_v1.py +49 -46
- birder/net/detection/rt_detr_v2.py +95 -102
- birder/net/detection/ssd.py +47 -31
- birder/net/detection/ssdlite.py +2 -2
- birder/net/detection/yolo_v2.py +33 -18
- birder/net/detection/yolo_v3.py +35 -33
- birder/net/detection/yolo_v4.py +35 -20
- birder/net/detection/yolo_v4_tiny.py +1 -2
- birder/net/edgevit.py +3 -3
- birder/net/efficientvit_msft.py +1 -1
- birder/net/flexivit.py +1 -1
- birder/net/hiera.py +44 -67
- birder/net/hieradet.py +2 -2
- birder/net/maxvit.py +2 -2
- birder/net/mim/fcmae.py +2 -2
- birder/net/mim/mae_hiera.py +9 -16
- birder/net/mnasnet.py +2 -2
- birder/net/nextvit.py +4 -4
- birder/net/resnext.py +2 -2
- birder/net/rope_deit3.py +2 -2
- birder/net/rope_flexivit.py +2 -2
- birder/net/rope_vit.py +2 -2
- birder/net/simple_vit.py +1 -1
- birder/net/squeezenet.py +1 -1
- birder/net/ssl/capi.py +32 -25
- birder/net/ssl/dino_v2.py +12 -15
- birder/net/ssl/franca.py +26 -19
- birder/net/van.py +2 -2
- birder/net/vit.py +21 -3
- birder/net/vit_parallel.py +1 -1
- birder/net/vit_sam.py +62 -16
- birder/net/xcit.py +1 -1
- birder/ops/msda.py +46 -16
- birder/scripts/benchmark.py +35 -8
- birder/scripts/predict.py +14 -1
- birder/scripts/predict_detection.py +7 -1
- birder/scripts/train.py +27 -11
- birder/scripts/train_capi.py +13 -10
- birder/scripts/train_detection.py +18 -7
- birder/scripts/train_franca.py +10 -2
- birder/scripts/train_kd.py +28 -11
- birder/tools/adversarial.py +5 -0
- birder/tools/convert_model.py +101 -43
- birder/tools/quantize_model.py +33 -16
- birder/version.py +1 -1
- {birder-0.4.1.dist-info → birder-0.4.4.dist-info}/METADATA +17 -10
- {birder-0.4.1.dist-info → birder-0.4.4.dist-info}/RECORD +99 -75
- {birder-0.4.1.dist-info → birder-0.4.4.dist-info}/WHEEL +1 -1
- birder/scripts/evaluate.py +0 -176
- {birder-0.4.1.dist-info → birder-0.4.4.dist-info}/entry_points.txt +0 -0
- {birder-0.4.1.dist-info → birder-0.4.4.dist-info}/licenses/LICENSE +0 -0
- {birder-0.4.1.dist-info → birder-0.4.4.dist-info}/top_level.txt +0 -0
birder/__init__.py
CHANGED
@@ -1,5 +1,6 @@
 from birder.common.fs_ops import load_model_with_cfg
 from birder.common.fs_ops import load_pretrained_model
+from birder.common.fs_ops import load_pretrained_model_and_transform
 from birder.common.lib import get_channels_from_signature
 from birder.common.lib import get_size_from_signature
 from birder.data.transforms.classification import inference_preset as classification_transform
@@ -17,5 +18,6 @@ __all__ = [
     "list_pretrained_models",
     "load_model_with_cfg",
     "load_pretrained_model",
+    "load_pretrained_model_and_transform",
     "__version__",
 ]
birder/common/fs_ops.py
CHANGED
@@ -2,6 +2,7 @@ import json
 import logging
 import os
 import re
+from collections.abc import Callable
 from collections.abc import Iterator
 from pathlib import Path
 from typing import Any
@@ -24,6 +25,8 @@ from birder.common.lib import get_network_name
 from birder.common.lib import get_pretrained_model_url
 from birder.conf import settings
 from birder.data.transforms.classification import RGBType
+from birder.data.transforms.classification import inference_preset
+from birder.data.transforms.detection import InferenceTransform
 from birder.model_registry import Task
 from birder.model_registry import registry
 from birder.model_registry.manifest import FileFormatType
@@ -801,7 +804,8 @@ def load_detection_model(
         for param in net.parameters():
             param.requires_grad_(False)

-        net.eval()
+        if pt2 is False:  # NOTE: Remove when GraphModule add support for 'eval'
+            net.eval()

     if len(backbone_loaded_config) == 0:
         backbone_custom_config = None
@@ -918,6 +922,82 @@ def load_pretrained_model(
     raise ValueError(f"Unknown model type: {model_metadata['task']}")


+def load_pretrained_model_and_transform(
+    weights: str,
+    *,
+    dst: Optional[str | Path] = None,
+    file_format: FileFormatType = "pt",
+    inference: bool = True,
+    device: Optional[torch.device] = None,
+    dtype: Optional[torch.dtype] = None,
+    custom_config: Optional[dict[str, Any]] = None,
+    progress_bar: bool = True,
+    classification_kwargs: Optional[dict[str, Any]] = None,
+    detection_kwargs: Optional[dict[str, Any]] = None,
+) -> tuple[BaseNet | DetectionBaseNet, ModelInfo | DetectionModelInfo, Callable[..., torch.Tensor]]:
+    """
+    Loads a pre-trained model and builds the matching inference transform
+
+    This is a convenience helper for the common inference path where the model and
+    its default preprocessing are needed together. Classification models use
+    inference_preset, detection models use InferenceTransform.
+
+    Parameters
+    ----------
+    weights
+        Name of the pre-trained weights to load from the model registry.
+    dst
+        Destination path where the model weights will be downloaded or loaded from.
+    file_format
+        Model format (e.g. pt, pt2, safetensors, etc.)
+    inference
+        Flag to prepare the model for inference mode.
+    device
+        The device to load the model on (cpu/cuda).
+    dtype
+        Data type for model parameters and computations (e.g., torch.float32, torch.float16).
+    custom_config
+        Additional model configuration that overrides or extends the predefined configuration.
+    progress_bar
+        Whether to display a progress bar during file download.
+    classification_kwargs
+        Optional keyword arguments forwarded to inference_preset.
+    detection_kwargs
+        Optional keyword arguments forwarded to InferenceTransform. If dynamic_size is
+        not provided it defaults to the model signature value.
+
+    Returns
+    -------
+    A tuple containing three elements:
+        - A PyTorch module (neural network model) loaded with pre-trained weights.
+        - Model info containing class mappings, signature, and RGB stats.
+        - An inference transform matching the model task.
+    """
+
+    net, model_info = load_pretrained_model(
+        weights,
+        dst=dst,
+        file_format=file_format,
+        inference=inference,
+        device=device,
+        dtype=dtype,
+        custom_config=custom_config,
+        progress_bar=progress_bar,
+    )
+
+    size = lib.get_size_from_signature(model_info.signature)
+    transform: Callable[..., torch.Tensor]
+    if isinstance(model_info, DetectionModelInfo):
+        detection_args = {} if detection_kwargs is None else dict(detection_kwargs)
+        detection_args.setdefault("dynamic_size", model_info.signature["dynamic"])
+        transform = InferenceTransform(size, model_info.rgb_stats, **detection_args)
+    else:
+        classification_args = {} if classification_kwargs is None else dict(classification_kwargs)
+        transform = inference_preset(size, model_info.rgb_stats, **classification_args)
+
+    return (net, model_info, transform)
+
+
 def load_model_with_cfg(
     cfg: dict[str, Any] | str | Path, weights_path: Optional[str | Path]
 ) -> tuple[torch.nn.Module, dict[str, Any]]:
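The new load_pretrained_model_and_transform helper is also exported at the package root (see the __init__.py diff above). A minimal usage sketch; the weights name below is a placeholder, and passing a PIL image assumes the classification preset behaves like a standard torchvision transform:

import torch
from PIL import Image

import birder

# "some_weights_name" is a placeholder; pick any entry from birder.list_pretrained_models()
net, model_info, transform = birder.load_pretrained_model_and_transform("some_weights_name", inference=True)

img = Image.open("example.jpeg")
with torch.inference_mode():
    logits = net(transform(img).unsqueeze(0))  # transform yields a CHW tensor, so add the batch dim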
birder/common/training_cli.py
CHANGED
@@ -56,7 +56,9 @@ def add_optimization_args(parser: argparse.ArgumentParser, default_batch_size: i
     )


-def add_lr_wd_args(parser: argparse.ArgumentParser, backbone_lr: bool = False, wd_end: bool = False) -> None:
+def add_lr_wd_args(
+    parser: argparse.ArgumentParser, backbone_lr: bool = False, wd_end: bool = False, backbone_layer_decay: bool = False
+) -> None:
     group = parser.add_argument_group("Learning rate and regularization parameters")
     group.add_argument("--lr", type=float, default=0.1, metavar="LR", help="base learning rate")
     group.add_argument("--bias-lr", type=float, metavar="LR", help="learning rate of biases")
@@ -92,6 +94,9 @@ def add_lr_wd_args(parser: argparse.ArgumentParser, backbone_lr: bool = False, w
         help="custom weight decay for specific layers by name (e.g., offset_conv=0.0)",
     )
     group.add_argument("--layer-decay", type=float, help="layer-wise learning rate decay (LLRD)")
+    if backbone_layer_decay is True:
+        group.add_argument("--backbone-layer-decay", type=float, help="backbone layer-wise learning rate decay (LLRD)")
+
     group.add_argument("--layer-decay-min-scale", type=float, help="minimum layer scale factor clamp value")
     group.add_argument(
         "--layer-decay-no-opt-scale", type=float, help="layer scale threshold below which parameters are frozen"
@@ -480,8 +485,13 @@ def add_dataloader_args(
     )


-def add_precision_args(parser: argparse.ArgumentParser) -> None:
+def add_precision_args(parser: argparse.ArgumentParser, channels_last: bool = False) -> None:
     group = parser.add_argument_group("Precision parameters")
+    if channels_last is True:
+        group.add_argument(
+            "--channels-last", default=False, action="store_true", help="use channels-last memory format"
+        )
+
     group.add_argument(
         "--model-dtype",
         type=str,
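A sketch of how a training script can opt in to the new switches; the wiring below is illustrative rather than copied from any birder script:

import argparse

from birder.common import training_cli

parser = argparse.ArgumentParser()
training_cli.add_lr_wd_args(parser, backbone_lr=True, backbone_layer_decay=True)
training_cli.add_precision_args(parser, channels_last=True)

args = parser.parse_args(["--backbone-layer-decay", "0.8", "--channels-last"])
print(args.backbone_layer_decay, args.channels_last)  # 0.8 True

Both additions are opt-in: scripts that do not pass backbone_layer_decay=True or channels_last=True keep their previous argument surface.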
birder/common/training_utils.py
CHANGED
@@ -343,7 +343,7 @@ def count_layers(model: torch.nn.Module) -> int:
     return num_layers


-# pylint: disable=protected-access,too-many-locals,too-many-branches
+# pylint: disable=protected-access,too-many-locals,too-many-branches,too-many-statements
 def optimizer_parameter_groups(
     model: torch.nn.Module,
     weight_decay: float,
@@ -352,6 +352,7 @@ def optimizer_parameter_groups(
     custom_keys_weight_decay: Optional[list[tuple[str, float]]] = None,
     custom_layer_weight_decay: Optional[dict[str, float]] = None,
     layer_decay: Optional[float] = None,
+    backbone_layer_decay: Optional[float] = None,
     layer_decay_min_scale: Optional[float] = None,
     layer_decay_no_opt_scale: Optional[float] = None,
     bias_lr: Optional[float] = None,
@@ -388,6 +389,8 @@ def optimizer_parameter_groups(
         Applied to parameters whose names contain the specified keys.
     layer_decay
         Layer-wise learning rate decay factor.
+    backbone_layer_decay
+        Layer-wise learning rate decay factor for backbone parameters only.
     layer_decay_min_scale
         Minimum learning rate scale factor when using layer decay. Prevents layers from having too small learning rates.
     layer_decay_no_opt_scale
@@ -434,6 +437,27 @@
     if layer_decay is not None:
         logger.warning("Assigning lr scaling (layer decay) without a block group map")

+    backbone_group_map: dict[str, int] = {}
+    backbone_num_layers = 0
+    if backbone_layer_decay is not None:
+        backbone_module = getattr(model, "backbone", None)
+        if backbone_module is None:
+            logger.warning("Backbone layer decay requested but model has no backbone")
+            backbone_layer_decay = None
+        else:
+            backbone_block_group_regex = getattr(backbone_module, "block_group_regex", None)
+            if backbone_block_group_regex is not None:
+                names = [n for n, _ in backbone_module.named_parameters()]
+                groups = group_by_regex(names, backbone_block_group_regex)
+                backbone_group_map = {
+                    f"backbone.{item}": index for index, sublist in enumerate(groups) for item in sublist
+                }
+                backbone_num_layers = len(groups)
+            else:
+                backbone_group_map = {}
+                backbone_num_layers = count_layers(backbone_module)
+                logger.warning("Assigning lr scaling (backbone layer decay) without a block group map")
+
     # Build layer scale
     if layer_decay_min_scale is None:
         layer_decay_min_scale = 0.0
@@ -444,14 +468,28 @@
     layer_scales = [max(layer_decay_min_scale, layer_decay ** (layer_max - i)) for i in range(num_layers)]
     logger.info(f"Layer scaling ranges from {min(layer_scales)} to {max(layer_scales)} across {num_layers} layers")

+    backbone_layer_scales = []
+    if backbone_layer_decay is not None:
+        backbone_layer_max = backbone_num_layers - 1
+        backbone_layer_scales = [
+            max(layer_decay_min_scale, backbone_layer_decay ** (backbone_layer_max - i))
+            for i in range(backbone_num_layers)
+        ]
+        logger.info(
+            "Backbone layer scaling ranges from "
+            f"{min(backbone_layer_scales)} to {max(backbone_layer_scales)} across {backbone_num_layers} layers"
+        )
+
     # Set weight decay and layer decay
     idx = 0
+    backbone_idx = 0
     params = []
     module_stack_with_prefix = [(model, "")]
     visited_modules = []
     while len(module_stack_with_prefix) > 0:  # pylint: disable=too-many-nested-blocks
         skip_module = False
         module, prefix = module_stack_with_prefix.pop()
+        is_backbone_module = prefix == "backbone" or prefix.startswith("backbone.")
         if id(module) in visited_modules:
             skip_module = True

@@ -460,23 +498,35 @@
         for name, p in module.named_parameters(recurse=False):
             target_name = f"{prefix}.{name}" if prefix != "" else name
             idx = group_map.get(target_name, idx)
+            is_backbone_param = target_name.startswith("backbone.")
+            if backbone_layer_decay is not None and is_backbone_param is True:
+                backbone_idx = backbone_group_map.get(target_name, backbone_idx)
             if skip_module is True:
                 break

             parameters_found = True
             if p.requires_grad is False:
                 continue
-            if layer_decay_no_opt_scale is not None:
-                if layer_scales[idx] < layer_decay_no_opt_scale:
-                    p.requires_grad_(False)
+            if layer_decay_no_opt_scale is not None:
+                if backbone_layer_decay is not None and is_backbone_param is True:
+                    if backbone_layer_scales and backbone_layer_scales[backbone_idx] < layer_decay_no_opt_scale:
+                        p.requires_grad_(False)
+                elif layer_decay is not None:
+                    if layer_scales[idx] < layer_decay_no_opt_scale:
+                        p.requires_grad_(False)

             is_custom_key = False
             if custom_keys_weight_decay is not None:
                 for key, custom_wd in custom_keys_weight_decay:
                     target_name_for_custom_key = f"{prefix}.{name}" if prefix != "" and "." in key else name
                     if key == target_name_for_custom_key:
-                        # Calculate lr_scale (from layer_decay or custom_layer_lr_scale)
-
+                        # Calculate lr_scale (from layer_decay/backbone_layer_decay or custom_layer_lr_scale)
+                        if layer_decay is not None and (backbone_layer_decay is None or is_backbone_param is False):
+                            lr_scale = layer_scales[idx]
+                        elif backbone_layer_decay is not None and is_backbone_param is True:
+                            lr_scale = backbone_layer_scales[backbone_idx]
+                        else:
+                            lr_scale = 1.0
                         if custom_layer_lr_scale is not None:
                             for layer_name_key, custom_scale in custom_layer_lr_scale.items():
                                 if layer_name_key in target_name:
@@ -500,8 +550,8 @@
                         # Apply learning rate based on priority: bias_lr > backbone_lr > lr_scale
                         if bias_lr is not None and target_name.endswith(".bias") is True:
                             d["lr"] = bias_lr
-                        elif backbone_lr is not None and target_name.startswith("backbone.") is True:
-                            d["lr"] = backbone_lr
+                        elif backbone_lr is not None and is_backbone_param is True:
+                            d["lr"] = backbone_lr * lr_scale if backbone_layer_decay is not None else backbone_lr
                         elif lr_scale != 1.0:
                             d["lr"] = base_lr * lr_scale

@@ -522,8 +572,13 @@
                     wd = custom_wd_value
                     break

-            # Calculate lr_scale (from layer_decay or custom_layer_lr_scale)
-
+            # Calculate lr_scale (from layer_decay/backbone_layer_decay or custom_layer_lr_scale)
+            if layer_decay is not None and (backbone_layer_decay is None or is_backbone_param is False):
+                lr_scale = layer_scales[idx]
+            elif backbone_layer_decay is not None and is_backbone_param is True:
+                lr_scale = backbone_layer_scales[backbone_idx]
+            else:
+                lr_scale = 1.0
             if custom_layer_lr_scale is not None:
                 for layer_name_key, custom_scale in custom_layer_lr_scale.items():
                     if layer_name_key in target_name:
@@ -539,8 +594,8 @@
             # Apply learning rate based on priority: bias_lr > backbone_lr > lr_scale
             if bias_lr is not None and target_name.endswith(".bias") is True:
                 d["lr"] = bias_lr
-            elif backbone_lr is not None and target_name.startswith("backbone.") is True:
-                d["lr"] = backbone_lr
+            elif backbone_lr is not None and is_backbone_param is True:
+                d["lr"] = backbone_lr * lr_scale if backbone_layer_decay is not None else backbone_lr
             elif lr_scale != 1.0:
                 d["lr"] = base_lr * lr_scale

@@ -548,6 +603,8 @@

         if parameters_found is True:
             idx += 1
+            if is_backbone_module is True:
+                backbone_idx += 1

         for child_name, child_module in reversed(list(module.named_children())):
             child_prefix = f"{prefix}.{child_name}" if prefix != "" else child_name
@@ -1108,12 +1165,16 @@ def init_training(
         device_id = torch.cuda.current_device()

     if args.use_deterministic_algorithms is True:
+        log.debug("Turning on deterministic algorithms")
         torch.backends.cudnn.benchmark = False
         torch.use_deterministic_algorithms(True)
     elif cudnn_dynamic_size is True:
         # Dynamic sizes: avoid per-size algorithm selection overhead.
+        log.debug("Turning off cudnn")
         torch.backends.cudnn.enabled = False
+        torch.backends.cudnn.benchmark = False
     else:
+        log.debug("Turning on cudnn")
         torch.backends.cudnn.enabled = True
         torch.backends.cudnn.benchmark = True

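The backbone scales follow the same rule as the global layer scales, scale_i = max(min_scale, decay ** (num_layers - 1 - i)), so earlier backbone groups get geometrically smaller learning rates. A worked example of the arithmetic, assuming four backbone groups, a decay of 0.8, and no minimum clamp:

backbone_layer_decay = 0.8
backbone_num_layers = 4
layer_decay_min_scale = 0.0

backbone_layer_max = backbone_num_layers - 1
scales = [
    max(layer_decay_min_scale, backbone_layer_decay ** (backbone_layer_max - i))
    for i in range(backbone_num_layers)
]
print(scales)  # approx [0.512, 0.64, 0.8, 1.0]; the earliest group trains slowest

When --backbone-lr is also given, each backbone parameter group then gets backbone_lr * scale instead of the base lr, per the d["lr"] assignment above.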
birder/data/collators/detection.py
CHANGED
@@ -15,7 +15,9 @@ def collate_fn(batch: list[tuple[Any, ...]]) -> tuple[Any, ...]:
     return tuple(zip(*batch))


-def batch_images(
+def batch_images(
+    images: list[torch.Tensor], size_divisible: int
+) -> tuple[torch.Tensor, torch.Tensor, list[tuple[int, int]]]:
     """
     Batch list of image tensors of different sizes into a single batch.
     Pad with zeros all images to the shape of the largest image in the list.
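batch_images now returns a padded batch tensor, a second tensor, and the original image sizes. A minimal sketch of zero-pad batching in that shape; it assumes, as in DETR-style collators, that the second tensor is a boolean padding mask. This is an illustration, not the birder implementation:

import torch

def batch_images_sketch(
    images: list[torch.Tensor], size_divisible: int = 32
) -> tuple[torch.Tensor, torch.Tensor, list[tuple[int, int]]]:
    # Pad every CHW image with zeros up to the largest (H, W) in the list,
    # rounded up to a multiple of size_divisible
    stride = size_divisible
    max_h = -(-max(img.shape[-2] for img in images) // stride) * stride
    max_w = -(-max(img.shape[-1] for img in images) // stride) * stride

    batch = images[0].new_zeros((len(images), images[0].shape[0], max_h, max_w))
    mask = torch.ones((len(images), max_h, max_w), dtype=torch.bool)  # True marks padding
    sizes: list[tuple[int, int]] = []
    for i, img in enumerate(images):
        (_, h, w) = img.shape
        batch[i, :, :h, :w].copy_(img)
        mask[i, :h, :w] = False
        sizes.append((h, w))

    return (batch, mask, sizes)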
birder/datahub/_lib.py
CHANGED
@@ -1,5 +1,6 @@
 import logging
 import tarfile
+import zipfile
 from pathlib import Path

 from birder.common import cli
@@ -26,9 +27,17 @@ def download_url(url: str, target: str | Path, sha256: str, progress_bar: bool =

 def extract_archive(from_path: str | Path, to_path: str | Path) -> None:
     logger.info(f"Extracting {from_path} to {to_path}")
-    with tarfile.open(from_path, "r") as tar:
-        if hasattr(tarfile, "data_filter") is True:
-            tar.extractall(to_path, filter="data")
-        else:
-            # NOTE: Remove once minimum Python version is 3.12 or above
-            tar.extractall(to_path)  # nosec # tarfile_unsafe_members
+    if isinstance(from_path, str):
+        from_path = Path(from_path)
+
+    if from_path.suffix == ".zip":
+        with zipfile.ZipFile(from_path, "r") as zf:
+            zf.extractall(to_path)  # nosec # tarfile_unsafe_members
+
+    else:
+        with tarfile.open(from_path, "r") as tar:
+            if hasattr(tarfile, "data_filter") is True:
+                tar.extractall(to_path, filter="data")
+            else:
+                # NOTE: Remove once minimum Python version is 3.12 or above
+                tar.extractall(to_path)  # nosec # tarfile_unsafe_members