PyPI - inference-models - Versions diffs - 0.18.3__py3-none-any.whl - Mend

inference-models 0.18.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (195)

inference_models/__init__.py +36 -0
inference_models/configuration.py +72 -0
inference_models/constants.py +2 -0
inference_models/entities.py +5 -0
inference_models/errors.py +137 -0
inference_models/logger.py +52 -0
inference_models/model_pipelines/__init__.py +0 -0
inference_models/model_pipelines/auto_loaders/__init__.py +0 -0
inference_models/model_pipelines/auto_loaders/core.py +120 -0
inference_models/model_pipelines/auto_loaders/pipelines_registry.py +36 -0
inference_models/model_pipelines/face_and_gaze_detection/__init__.py +0 -0
inference_models/model_pipelines/face_and_gaze_detection/mediapipe_l2cs.py +200 -0
inference_models/models/__init__.py +0 -0
inference_models/models/auto_loaders/__init__.py +0 -0
inference_models/models/auto_loaders/access_manager.py +168 -0
inference_models/models/auto_loaders/auto_negotiation.py +1329 -0
inference_models/models/auto_loaders/auto_resolution_cache.py +129 -0
inference_models/models/auto_loaders/constants.py +7 -0
inference_models/models/auto_loaders/core.py +1341 -0
inference_models/models/auto_loaders/dependency_models.py +52 -0
inference_models/models/auto_loaders/entities.py +57 -0
inference_models/models/auto_loaders/models_registry.py +497 -0
inference_models/models/auto_loaders/presentation_utils.py +333 -0
inference_models/models/auto_loaders/ranking.py +413 -0
inference_models/models/auto_loaders/utils.py +31 -0
inference_models/models/base/__init__.py +0 -0
inference_models/models/base/classification.py +123 -0
inference_models/models/base/depth_estimation.py +62 -0
inference_models/models/base/documents_parsing.py +111 -0
inference_models/models/base/embeddings.py +66 -0
inference_models/models/base/instance_segmentation.py +87 -0
inference_models/models/base/keypoints_detection.py +93 -0
inference_models/models/base/object_detection.py +143 -0
inference_models/models/base/semantic_segmentation.py +74 -0
inference_models/models/base/types.py +5 -0
inference_models/models/clip/__init__.py +0 -0
inference_models/models/clip/clip_onnx.py +148 -0
inference_models/models/clip/clip_pytorch.py +104 -0
inference_models/models/clip/preprocessing.py +162 -0
inference_models/models/common/__init__.py +0 -0
inference_models/models/common/cuda.py +30 -0
inference_models/models/common/model_packages.py +25 -0
inference_models/models/common/onnx.py +379 -0
inference_models/models/common/roboflow/__init__.py +0 -0
inference_models/models/common/roboflow/model_packages.py +361 -0
inference_models/models/common/roboflow/post_processing.py +436 -0
inference_models/models/common/roboflow/pre_processing.py +1332 -0
inference_models/models/common/torch.py +20 -0
inference_models/models/common/trt.py +266 -0
inference_models/models/deep_lab_v3_plus/__init__.py +0 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_onnx.py +282 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_torch.py +264 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_trt.py +313 -0
inference_models/models/depth_anything_v2/__init__.py +0 -0
inference_models/models/depth_anything_v2/depth_anything_v2_hf.py +77 -0
inference_models/models/dinov3/__init__.py +0 -0
inference_models/models/dinov3/dinov3_classification_onnx.py +348 -0
inference_models/models/dinov3/dinov3_classification_torch.py +323 -0
inference_models/models/doctr/__init__.py +0 -0
inference_models/models/doctr/doctr_torch.py +304 -0
inference_models/models/easy_ocr/__init__.py +0 -0
inference_models/models/easy_ocr/easy_ocr_torch.py +222 -0
inference_models/models/florence2/__init__.py +0 -0
inference_models/models/florence2/florence2_hf.py +897 -0
inference_models/models/grounding_dino/__init__.py +0 -0
inference_models/models/grounding_dino/grounding_dino_torch.py +227 -0
inference_models/models/l2cs/__init__.py +0 -0
inference_models/models/l2cs/l2cs_onnx.py +216 -0
inference_models/models/mediapipe_face_detection/__init__.py +0 -0
inference_models/models/mediapipe_face_detection/face_detection.py +203 -0
inference_models/models/moondream2/__init__.py +0 -0
inference_models/models/moondream2/moondream2_hf.py +281 -0
inference_models/models/owlv2/__init__.py +0 -0
inference_models/models/owlv2/cache.py +182 -0
inference_models/models/owlv2/entities.py +112 -0
inference_models/models/owlv2/owlv2_hf.py +695 -0
inference_models/models/owlv2/reference_dataset.py +291 -0
inference_models/models/paligemma/__init__.py +0 -0
inference_models/models/paligemma/paligemma_hf.py +209 -0
inference_models/models/perception_encoder/__init__.py +0 -0
inference_models/models/perception_encoder/perception_encoder_pytorch.py +197 -0
inference_models/models/perception_encoder/vision_encoder/__init__.py +0 -0
inference_models/models/perception_encoder/vision_encoder/config.py +160 -0
inference_models/models/perception_encoder/vision_encoder/pe.py +742 -0
inference_models/models/perception_encoder/vision_encoder/rope.py +344 -0
inference_models/models/perception_encoder/vision_encoder/tokenizer.py +342 -0
inference_models/models/perception_encoder/vision_encoder/transforms.py +33 -0
inference_models/models/qwen25vl/__init__.py +1 -0
inference_models/models/qwen25vl/qwen25vl_hf.py +285 -0
inference_models/models/resnet/__init__.py +0 -0
inference_models/models/resnet/resnet_classification_onnx.py +330 -0
inference_models/models/resnet/resnet_classification_torch.py +305 -0
inference_models/models/resnet/resnet_classification_trt.py +369 -0
inference_models/models/rfdetr/__init__.py +0 -0
inference_models/models/rfdetr/backbone_builder.py +101 -0
inference_models/models/rfdetr/class_remapping.py +41 -0
inference_models/models/rfdetr/common.py +115 -0
inference_models/models/rfdetr/default_labels.py +108 -0
inference_models/models/rfdetr/dinov2_with_windowed_attn.py +1330 -0
inference_models/models/rfdetr/misc.py +26 -0
inference_models/models/rfdetr/ms_deform_attn.py +180 -0
inference_models/models/rfdetr/ms_deform_attn_func.py +60 -0
inference_models/models/rfdetr/position_encoding.py +166 -0
inference_models/models/rfdetr/post_processor.py +83 -0
inference_models/models/rfdetr/projector.py +373 -0
inference_models/models/rfdetr/rfdetr_backbone_pytorch.py +394 -0
inference_models/models/rfdetr/rfdetr_base_pytorch.py +807 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_onnx.py +206 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_pytorch.py +373 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_trt.py +227 -0
inference_models/models/rfdetr/rfdetr_object_detection_onnx.py +244 -0
inference_models/models/rfdetr/rfdetr_object_detection_pytorch.py +470 -0
inference_models/models/rfdetr/rfdetr_object_detection_trt.py +270 -0
inference_models/models/rfdetr/segmentation_head.py +273 -0
inference_models/models/rfdetr/transformer.py +767 -0
inference_models/models/roboflow_instant/__init__.py +0 -0
inference_models/models/roboflow_instant/roboflow_instant_hf.py +141 -0
inference_models/models/sam/__init__.py +0 -0
inference_models/models/sam/cache.py +147 -0
inference_models/models/sam/entities.py +25 -0
inference_models/models/sam/sam_torch.py +675 -0
inference_models/models/sam2/__init__.py +0 -0
inference_models/models/sam2/cache.py +162 -0
inference_models/models/sam2/entities.py +43 -0
inference_models/models/sam2/sam2_torch.py +905 -0
inference_models/models/sam2_rt/__init__.py +0 -0
inference_models/models/sam2_rt/sam2_pytorch.py +119 -0
inference_models/models/smolvlm/__init__.py +0 -0
inference_models/models/smolvlm/smolvlm_hf.py +245 -0
inference_models/models/trocr/__init__.py +0 -0
inference_models/models/trocr/trocr_hf.py +53 -0
inference_models/models/vit/__init__.py +0 -0
inference_models/models/vit/vit_classification_huggingface.py +319 -0
inference_models/models/vit/vit_classification_onnx.py +326 -0
inference_models/models/vit/vit_classification_trt.py +365 -0
inference_models/models/yolact/__init__.py +1 -0
inference_models/models/yolact/yolact_instance_segmentation_onnx.py +336 -0
inference_models/models/yolact/yolact_instance_segmentation_trt.py +361 -0
inference_models/models/yolo_world/__init__.py +1 -0
inference_models/models/yolonas/__init__.py +0 -0
inference_models/models/yolonas/nms.py +44 -0
inference_models/models/yolonas/yolonas_object_detection_onnx.py +204 -0
inference_models/models/yolonas/yolonas_object_detection_trt.py +230 -0
inference_models/models/yolov10/__init__.py +0 -0
inference_models/models/yolov10/yolov10_object_detection_onnx.py +187 -0
inference_models/models/yolov10/yolov10_object_detection_trt.py +215 -0
inference_models/models/yolov11/__init__.py +0 -0
inference_models/models/yolov11/yolov11_onnx.py +28 -0
inference_models/models/yolov11/yolov11_torch_script.py +25 -0
inference_models/models/yolov11/yolov11_trt.py +21 -0
inference_models/models/yolov12/__init__.py +0 -0
inference_models/models/yolov12/yolov12_onnx.py +7 -0
inference_models/models/yolov12/yolov12_torch_script.py +7 -0
inference_models/models/yolov12/yolov12_trt.py +7 -0
inference_models/models/yolov5/__init__.py +0 -0
inference_models/models/yolov5/nms.py +99 -0
inference_models/models/yolov5/yolov5_instance_segmentation_onnx.py +225 -0
inference_models/models/yolov5/yolov5_instance_segmentation_trt.py +255 -0
inference_models/models/yolov5/yolov5_object_detection_onnx.py +192 -0
inference_models/models/yolov5/yolov5_object_detection_trt.py +218 -0
inference_models/models/yolov7/__init__.py +0 -0
inference_models/models/yolov7/yolov7_instance_segmentation_onnx.py +226 -0
inference_models/models/yolov7/yolov7_instance_segmentation_trt.py +253 -0
inference_models/models/yolov8/__init__.py +0 -0
inference_models/models/yolov8/yolov8_classification_onnx.py +181 -0
inference_models/models/yolov8/yolov8_instance_segmentation_onnx.py +239 -0
inference_models/models/yolov8/yolov8_instance_segmentation_torch_script.py +201 -0
inference_models/models/yolov8/yolov8_instance_segmentation_trt.py +268 -0
inference_models/models/yolov8/yolov8_key_points_detection_onnx.py +263 -0
inference_models/models/yolov8/yolov8_key_points_detection_torch_script.py +218 -0
inference_models/models/yolov8/yolov8_key_points_detection_trt.py +287 -0
inference_models/models/yolov8/yolov8_object_detection_onnx.py +213 -0
inference_models/models/yolov8/yolov8_object_detection_torch_script.py +166 -0
inference_models/models/yolov8/yolov8_object_detection_trt.py +231 -0
inference_models/models/yolov9/__init__.py +0 -0
inference_models/models/yolov9/yolov9_onnx.py +7 -0
inference_models/models/yolov9/yolov9_torch_script.py +7 -0
inference_models/models/yolov9/yolov9_trt.py +7 -0
inference_models/runtime_introspection/__init__.py +0 -0
inference_models/runtime_introspection/core.py +410 -0
inference_models/utils/__init__.py +0 -0
inference_models/utils/download.py +608 -0
inference_models/utils/environment.py +28 -0
inference_models/utils/file_system.py +51 -0
inference_models/utils/hashing.py +7 -0
inference_models/utils/imports.py +48 -0
inference_models/utils/onnx_introspection.py +17 -0
inference_models/weights_providers/__init__.py +0 -0
inference_models/weights_providers/core.py +20 -0
inference_models/weights_providers/entities.py +159 -0
inference_models/weights_providers/roboflow.py +601 -0
inference_models-0.18.3.dist-info/METADATA +466 -0
inference_models-0.18.3.dist-info/RECORD +195 -0
inference_models-0.18.3.dist-info/WHEEL +5 -0
inference_models-0.18.3.dist-info/top_level.txt +1 -0

inference_models/models/auto_loaders/dependency_models.py ADDED Viewed

@@ -0,0 +1,52 @@
+from typing import Any, Dict, List, Optional, Tuple, Union
+import torch
+from pydantic import BaseModel, ConfigDict, Field, ValidationError
+from inference_models.configuration import DEFAULT_DEVICE
+from inference_models.errors import DependencyModelParametersValidationError
+from inference_models.models.auto_loaders.entities import BackendType
+from inference_models.weights_providers.entities import Quantization
+class DependencyModelParameters(BaseModel):
+    # Bundle of options used to initialise a dependent model.
+    # `extra="allow"` keeps keys that are not declared below - they are exposed
+    # through the `kwargs` property. `arbitrary_types_allowed=True` is
+    # presumably required because of the `torch.device` field - TODO confirm.
+    model_config = ConfigDict(arbitrary_types_allowed=True, extra="allow")
+    # The only field without a default value.
+    model_id_or_path: str
+    model_package_id: Optional[str] = None
+    # Single backend or a list of backends, each given as a string or `BackendType`.
+    backend: Optional[Union[str, BackendType, List[Union[str, BackendType]]]] = None
+    # Either one int or a pair of ints.
+    # NOTE(review): the pair presumably denotes a (min, max) range - confirm.
+    batch_size: Optional[Union[int, Tuple[int, int]]] = None
+    # Single quantization or a list, each given as a string or `Quantization`.
+    quantization: Optional[
+        Union[str, Quantization, List[Union[str, Quantization]]]
+    ] = None
+    onnx_execution_providers: Optional[List[Union[str, tuple]]] = None
+    device: torch.device = DEFAULT_DEVICE
+    default_onnx_trt_options: bool = True
+    nms_fusion_preferences: Optional[Union[bool, dict]] = None
+    model_type: Optional[str] = None
+    task_type: Optional[str] = None
+    @property
+    def kwargs(self) -> Dict[str, Any]:
+        """Return the undeclared (extra) options; an empty dict when there are none."""
+        extras = self.model_extra
+        return extras if extras else {}
+def prepare_dependency_model_parameters(
+    model_parameters: Union[str, dict, DependencyModelParameters]
+) -> DependencyModelParameters:
+    """Normalise a dependent-model specification into `DependencyModelParameters`.
+
+    Args:
+        model_parameters: One of:
+            * a string - used as `model_id_or_path`, every other option keeps
+              its default,
+            * a dictionary - validated against `DependencyModelParameters`,
+            * any other value (expected: a `DependencyModelParameters`
+              instance) - returned unchanged, without validation.
+
+    Returns:
+        The parameters object for the dependent model.
+
+    Raises:
+        DependencyModelParametersValidationError: If a dictionary was given
+            and it does not pass validation; the original pydantic
+            `ValidationError` is attached as the cause.
+    """
+    if isinstance(model_parameters, str):
+        return DependencyModelParameters(model_id_or_path=model_parameters)
+    if not isinstance(model_parameters, dict):
+        # Neither a string nor a dictionary - hand the value back as-is.
+        return model_parameters
+    try:
+        return DependencyModelParameters.model_validate(model_parameters)
+    except ValidationError as error:
+        raise DependencyModelParametersValidationError(
+            message="Could not validate parameters to initialise dependent model - if you run locally, make sure "
+            "that you initialise model properly, as at least one parameter specified in "
+            "dictionary with model options is invalid. If you use Roboflow hosted offering, contact us to "
+            "get help.",
+            help_url="https://todo",
+        ) from error

inference_models/models/auto_loaders/entities.py ADDED Viewed

@@ -0,0 +1,57 @@
+from dataclasses import dataclass
+from enum import Enum
+from typing import Optional, Union
+from inference_models.models.base.classification import (
+    ClassificationModel,
+    MultiLabelClassificationModel,
+)
+from inference_models.models.base.depth_estimation import DepthEstimationModel
+from inference_models.models.base.documents_parsing import StructuredOCRModel
+from inference_models.models.base.embeddings import TextImageEmbeddingModel
+from inference_models.models.base.instance_segmentation import InstanceSegmentationModel
+from inference_models.models.base.keypoints_detection import KeyPointsDetectionModel
+from inference_models.models.base.object_detection import (
+    ObjectDetectionModel,
+    OpenVocabularyObjectDetectionModel,
+)
+# Alias: model architectures are identified by plain strings.
+ModelArchitecture = str
+# Alias: a task type is a string, or None.
+TaskType = Optional[str]
+# File name of the model configuration JSON.
+# NOTE(review): presumably looked up inside a model package directory - confirm against callers.
+MODEL_CONFIG_FILE_NAME = "model_config.json"
+class BackendType(str, Enum):
+    """Closed set of backend identifiers.
+
+    Members also subclass `str`, so each one compares equal to its string
+    value (for example `BackendType.ONNX == "onnx"`).
+    """
+    TORCH = "torch"
+    TORCH_SCRIPT = "torch-script"
+    ONNX = "onnx"
+    TRT = "trt"
+    HF = "hugging-face"
+    ULTRALYTICS = "ultralytics"
+    MEDIAPIPE = "mediapipe"
+    CUSTOM = "custom"
+# Union of the base model interfaces imported at the top of this module.
+# NOTE(review): no semantic-segmentation base class is part of this union -
+# confirm whether that omission is intentional.
+AnyModel = Union[
+    ClassificationModel,
+    MultiLabelClassificationModel,
+    DepthEstimationModel,
+    StructuredOCRModel,
+    TextImageEmbeddingModel,
+    InstanceSegmentationModel,
+    KeyPointsDetectionModel,
+    ObjectDetectionModel,
+    OpenVocabularyObjectDetectionModel,
+]
+@dataclass(frozen=True)
+class InferenceModelConfig:
+    """Frozen record of model configuration values.
+
+    Holds the architecture, task type and backend type together with the
+    module and class names; every field accepts `None`.
+    """
+    model_architecture: Optional[ModelArchitecture]
+    task_type: TaskType
+    backend_type: Optional[BackendType]
+    model_module: Optional[str]
+    model_class: Optional[str]
+    def is_library_model(self) -> bool:
+        """Return True only when both the architecture and the backend type are set."""
+        if self.model_architecture is None:
+            return False
+        return self.backend_type is not None

inference_models/models/auto_loaders/models_registry.py ADDED Viewed

@@ -0,0 +1,497 @@
+from dataclasses import dataclass, field
+from typing import Dict, Optional, Set, Tuple, Union
+from inference_models.errors import ModelImplementationLoaderError
+from inference_models.models.auto_loaders.entities import (
+    BackendType,
+    ModelArchitecture,
+    TaskType,
+)
+from inference_models.utils.imports import LazyClass
+# Task-type identifiers. In this module they serve (among others) as the task
+# component of the `REGISTERED_MODELS` keys.
+OBJECT_DETECTION_TASK = "object-detection"
+INSTANCE_SEGMENTATION_TASK = "instance-segmentation"
+SEMANTIC_SEGMENTATION_TASK = "semantic-segmentation"
+KEYPOINT_DETECTION_TASK = "keypoint-detection"
+VLM_TASK = "vlm"
+EMBEDDING_TASK = "embedding"
+CLASSIFICATION_TASK = "classification"
+MULTI_LABEL_CLASSIFICATION_TASK = "multi-label-classification"
+DEPTH_ESTIMATION_TASK = "depth-estimation"
+STRUCTURED_OCR_TASK = "structured-ocr"
+TEXT_ONLY_OCR_TASK = "text-only-ocr"
+GAZE_DETECTION_TASK = "gaze-detection"
+OPEN_VOCABULARY_OBJECT_DETECTION_TASK = "open-vocabulary-object-detection"
+INTERACTIVE_INSTANCE_SEGMENTATION_TASK = "interactive-instance-segmentation"
+@dataclass(frozen=True)
+class RegistryEntry:
+    """Frozen registry value: a `LazyClass` reference plus an optional feature set."""
+    model_class: LazyClass
+    # Defaults to None when no features are declared; entries in this module
+    # that do declare features use {"nms_fused"}.
+    supported_model_features: Optional[Set[str]] = None
+REGISTERED_MODELS: Dict[
+    Tuple[ModelArchitecture, TaskType, BackendType], Union[LazyClass, RegistryEntry]
+] = {
+    ("yolonas", OBJECT_DETECTION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.yolonas.yolonas_object_detection_onnx",
+        class_name="YOLONasForObjectDetectionOnnx",
+    ),
+    ("yolonas", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolonas.yolonas_object_detection_trt",
+        class_name="YOLONasForObjectDetectionTRT",
+    ),
+    ("yolov5", OBJECT_DETECTION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.yolov5.yolov5_object_detection_onnx",
+        class_name="YOLOv5ForObjectDetectionOnnx",
+    ),
+    ("yolov5", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov5.yolov5_object_detection_trt",
+        class_name="YOLOv5ForObjectDetectionTRT",
+    ),
+    ("yolov5", INSTANCE_SEGMENTATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.yolov5.yolov5_instance_segmentation_onnx",
+        class_name="YOLOv5ForInstanceSegmentationOnnx",
+    ),
+    ("yolov5", INSTANCE_SEGMENTATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov5.yolov5_instance_segmentation_trt",
+        class_name="YOLOv5ForInstanceSegmentationTRT",
+    ),
+    ("yolov7", INSTANCE_SEGMENTATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.yolov7.yolov7_instance_segmentation_onnx",
+        class_name="YOLOv7ForInstanceSegmentationOnnx",
+    ),
+    ("yolov7", INSTANCE_SEGMENTATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov7.yolov7_instance_segmentation_trt",
+        class_name="YOLOv7ForInstanceSegmentationTRT",
+    ),
+    ("yolov8", CLASSIFICATION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov8.yolov8_classification_onnx",
+            class_name="YOLOv8ForClassificationOnnx",
+        ),
+    ),
+    ("yolov8", OBJECT_DETECTION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov8.yolov8_object_detection_onnx",
+            class_name="YOLOv8ForObjectDetectionOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov8", OBJECT_DETECTION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov8.yolov8_object_detection_torch_script",
+            class_name="YOLOv8ForObjectDetectionTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov8", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov8.yolov8_object_detection_trt",
+        class_name="YOLOv8ForObjectDetectionTRT",
+    ),
+    ("yolov8", KEYPOINT_DETECTION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov8.yolov8_key_points_detection_onnx",
+            class_name="YOLOv8ForKeyPointsDetectionOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov8", KEYPOINT_DETECTION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov8.yolov8_key_points_detection_torch_script",
+            class_name="YOLOv8ForKeyPointsDetectionTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov8", KEYPOINT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov8.yolov8_key_points_detection_trt",
+        class_name="YOLOv8ForKeyPointsDetectionTRT",
+    ),
+    ("yolov8", INSTANCE_SEGMENTATION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov8.yolov8_instance_segmentation_onnx",
+            class_name="YOLOv8ForInstanceSegmentationOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov8", INSTANCE_SEGMENTATION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov8.yolov8_instance_segmentation_torch_script",
+            class_name="YOLOv8ForInstanceSegmentationTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov8", INSTANCE_SEGMENTATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov8.yolov8_instance_segmentation_trt",
+        class_name="YOLOv8ForInstanceSegmentationTRT",
+    ),
+    ("yolov9", OBJECT_DETECTION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov9.yolov9_onnx",
+            class_name="YOLOv9ForObjectDetectionOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov9", OBJECT_DETECTION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov9.yolov9_torch_script",
+            class_name="YOLOv9ForObjectDetectionTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov9", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov9.yolov9_trt",
+        class_name="YOLOv9ForObjectDetectionTRT",
+    ),
+    ("yolov10", OBJECT_DETECTION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.yolov10.yolov10_object_detection_onnx",
+        class_name="YOLOv10ForObjectDetectionOnnx",
+    ),
+    ("yolov10", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov10.yolov10_object_detection_trt",
+        class_name="YOLOv10ForObjectDetectionTRT",
+    ),
+    ("yolov11", CLASSIFICATION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov11.yolov11_onnx",
+            class_name="YOLOv11ForClassificationOnnx",
+        ),
+    ),
+    ("yolov11", OBJECT_DETECTION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov11.yolov11_onnx",
+            class_name="YOLOv11ForObjectDetectionOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov11", OBJECT_DETECTION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov11.yolov11_torch_script",
+            class_name="YOLOv11ForObjectDetectionTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov11", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov11.yolov11_trt",
+        class_name="YOLOv11ForObjectDetectionTRT",
+    ),
+    ("yolov11", KEYPOINT_DETECTION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov11.yolov11_onnx",
+            class_name="YOLOv11ForForKeyPointsDetectionOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov11", KEYPOINT_DETECTION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov11.yolov11_torch_script",
+            class_name="YOLOv11ForForKeyPointsDetectionTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov11", KEYPOINT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov11.yolov11_trt",
+        class_name="YOLOv11ForForKeyPointsDetectionTRT",
+    ),
+    ("yolov11", INSTANCE_SEGMENTATION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov11.yolov11_onnx",
+            class_name="YOLOv11ForInstanceSegmentationOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov11", INSTANCE_SEGMENTATION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov11.yolov11_torch_script",
+            class_name="YOLOv11ForInstanceSegmentationTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov11", INSTANCE_SEGMENTATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov11.yolov11_trt",
+        class_name="YOLOv11ForInstanceSegmentationTRT",
+    ),
+    ("yolov12", OBJECT_DETECTION_TASK, BackendType.ONNX): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov12.yolov12_onnx",
+            class_name="YOLOv12ForObjectDetectionOnnx",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov12", OBJECT_DETECTION_TASK, BackendType.TORCH_SCRIPT): RegistryEntry(
+        model_class=LazyClass(
+            module_name="inference_models.models.yolov12.yolov12_torch_script",
+            class_name="YOLOv12ForObjectDetectionTorchScript",
+        ),
+        supported_model_features={"nms_fused"},
+    ),
+    ("yolov12", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolov12.yolov12_trt",
+        class_name="YOLOv12ForObjectDetectionTRT",
+    ),
+    ("paligemma-2", VLM_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.paligemma.paligemma_hf",
+        class_name="PaliGemmaHF",
+    ),
+    ("paligemma", VLM_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.paligemma.paligemma_hf",
+        class_name="PaliGemmaHF",
+    ),
+    ("smolvlm-v2", VLM_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.smolvlm.smolvlm_hf",
+        class_name="SmolVLMHF",
+    ),
+    ("qwen25vl", VLM_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.qwen25vl.qwen25vl_hf",
+        class_name="Qwen25VLHF",
+    ),
+    ("florence-2", VLM_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.florence2.florence2_hf",
+        class_name="Florence2HF",
+    ),
+    ("clip", EMBEDDING_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.clip.clip_pytorch",
+        class_name="ClipTorch",
+    ),
+    ("clip", EMBEDDING_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.clip.clip_onnx",
+        class_name="ClipOnnx",
+    ),
+    ("perception-encoder", EMBEDDING_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.perception_encoder.perception_encoder_pytorch",
+        class_name="PerceptionEncoderTorch",
+    ),
+    ("rfdetr", OBJECT_DETECTION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.rfdetr.rfdetr_object_detection_trt",
+        class_name="RFDetrForObjectDetectionTRT",
+    ),
+    ("rfdetr", OBJECT_DETECTION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.rfdetr.rfdetr_object_detection_pytorch",
+        class_name="RFDetrForObjectDetectionTorch",
+    ),
+    ("rfdetr", OBJECT_DETECTION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.rfdetr.rfdetr_object_detection_onnx",
+        class_name="RFDetrForObjectDetectionONNX",
+    ),
+    ("rfdetr", INSTANCE_SEGMENTATION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.rfdetr.rfdetr_instance_segmentation_pytorch",
+        class_name="RFDetrForInstanceSegmentationTorch",
+    ),
+    ("rfdetr", INSTANCE_SEGMENTATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.rfdetr.rfdetr_instance_segmentation_onnx",
+        class_name="RFDetrForInstanceSegmentationOnnx",
+    ),
+    ("rfdetr", INSTANCE_SEGMENTATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.rfdetr.rfdetr_instance_segmentation_trt",
+        class_name="RFDetrForInstanceSegmentationTRT",
+    ),
+    ("moondream2", VLM_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.moondream2.moondream2_hf",
+        class_name="MoonDream2HF",
+    ),
+    ("vit", CLASSIFICATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.vit.vit_classification_onnx",
+        class_name="VITForClassificationOnnx",
+    ),
+    ("vit", MULTI_LABEL_CLASSIFICATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.vit.vit_classification_onnx",
+        class_name="VITForMultiLabelClassificationOnnx",
+    ),
+    ("vit", CLASSIFICATION_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.vit.vit_classification_huggingface",
+        class_name="VITForClassificationHF",
+    ),
+    ("vit", MULTI_LABEL_CLASSIFICATION_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.vit.vit_classification_huggingface",
+        class_name="VITForMultiLabelClassificationHF",
+    ),
+    ("vit", CLASSIFICATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.vit.vit_classification_trt",
+        class_name="VITForClassificationTRT",
+    ),
+    ("vit", MULTI_LABEL_CLASSIFICATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.vit.vit_classification_trt",
+        class_name="VITForMultiLabelClassificationTRT",
+    ),
+    ("resnet", CLASSIFICATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.resnet.resnet_classification_onnx",
+        class_name="ResNetForClassificationOnnx",
+    ),
+    ("resnet", MULTI_LABEL_CLASSIFICATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.resnet.resnet_classification_onnx",
+        class_name="ResNetForMultiLabelClassificationOnnx",
+    ),
+    ("resnet", CLASSIFICATION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.resnet.resnet_classification_torch",
+        class_name="ResNetForClassificationTorch",
+    ),
+    ("resnet", MULTI_LABEL_CLASSIFICATION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.resnet.resnet_classification_torch",
+        class_name="ResNetForMultiLabelClassificationTorch",
+    ),
+    ("resnet", CLASSIFICATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.resnet.resnet_classification_trt",
+        class_name="ResNetForClassificationTRT",
+    ),
+    ("resnet", MULTI_LABEL_CLASSIFICATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.resnet.resnet_classification_trt",
+        class_name="ResNetForMultiLabelClassificationTRT",
+    ),
+    ("segment-anything-2-rt", INSTANCE_SEGMENTATION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.sam2_rt.sam2_pytorch",
+        class_name="SAM2ForStream",
+    ),
+    ("deep-lab-v3-plus", SEMANTIC_SEGMENTATION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.deep_lab_v3_plus.deep_lab_v3_plus_segmentation_torch",
+        class_name="DeepLabV3PlusForSemanticSegmentationTorch",
+    ),
+    ("deep-lab-v3-plus", SEMANTIC_SEGMENTATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.deep_lab_v3_plus.deep_lab_v3_plus_segmentation_onnx",
+        class_name="DeepLabV3PlusForSemanticSegmentationOnnx",
+    ),
+    ("deep-lab-v3-plus", SEMANTIC_SEGMENTATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.deep_lab_v3_plus.deep_lab_v3_plus_segmentation_trt",
+        class_name="DeepLabV3PlusForSemanticSegmentationTRT",
+    ),
+    ("yolact", INSTANCE_SEGMENTATION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.yolact.yolact_instance_segmentation_onnx",
+        class_name="YOLOACTForInstanceSegmentationOnnx",
+    ),
+    ("yolact", INSTANCE_SEGMENTATION_TASK, BackendType.TRT): LazyClass(
+        module_name="inference_models.models.yolact.yolact_instance_segmentation_trt",
+        class_name="YOLOACTForInstanceSegmentationTRT",
+    ),
+    ("depth-anything-v2", DEPTH_ESTIMATION_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.depth_anything_v2.depth_anything_v2_hf",
+        class_name="DepthAnythingV2HF",
+    ),
+    ("doctr", STRUCTURED_OCR_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.doctr.doctr_torch", class_name="DocTR"
+    ),
+    ("easy-ocr", STRUCTURED_OCR_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.easy_ocr.easy_ocr_torch",
+        class_name="EasyOCRTorch",
+    ),
+    ("tr-ocr", TEXT_ONLY_OCR_TASK, BackendType.HF): LazyClass(
+        module_name="inference_models.models.trocr.trocr_hf",
+        class_name="TROcrHF",
+    ),
+    (
+        "mediapipe-face-detector",
+        KEYPOINT_DETECTION_TASK,
+        BackendType.MEDIAPIPE,
+    ): LazyClass(
+        module_name="inference_models.models.mediapipe_face_detection.face_detection",
+        class_name="MediaPipeFaceDetector",
+    ),
+    ("l2cs-net", GAZE_DETECTION_TASK, BackendType.ONNX): LazyClass(
+        module_name="inference_models.models.l2cs.l2cs_onnx",
+        class_name="L2CSNetOnnx",
+    ),
+    (
+        "grounding-dino",
+        OPEN_VOCABULARY_OBJECT_DETECTION_TASK,
+        BackendType.TORCH,
+    ): LazyClass(
+        module_name="inference_models.models.grounding_dino.grounding_dino_torch",
+        class_name="GroundingDinoForObjectDetectionTorch",
+    ),
+    (
+        "dinov3_probe",
+        MULTI_LABEL_CLASSIFICATION_TASK,
+        BackendType.ONNX,
+    ): LazyClass(
+        module_name="inference_models.models.dinov3.dinov3_classification_onnx",
+        class_name="DinoV3ForMultiLabelClassificationOnnx",
+    ),
+    (
+        "dinov3_probe",
+        CLASSIFICATION_TASK,
+        BackendType.ONNX,
+    ): LazyClass(
+        module_name="inference_models.models.dinov3.dinov3_classification_onnx",
+        class_name="DinoV3ForClassificationOnnx",
+    ),
+    (
+        "dinov3_probe",
+        MULTI_LABEL_CLASSIFICATION_TASK,
+        BackendType.TORCH,
+    ): LazyClass(
+        module_name="inference_models.models.dinov3.dinov3_classification_torch",
+        class_name="DinoV3ForMultiLabelClassificationTorch",
+    ),
+    (
+        "dinov3_probe",
+        CLASSIFICATION_TASK,
+        BackendType.TORCH,
+    ): LazyClass(
+        module_name="inference_models.models.dinov3.dinov3_classification_torch",
+        class_name="DinoV3ForClassificationTorch",
+    ),
+    (
+        "owlv2",
+        OPEN_VOCABULARY_OBJECT_DETECTION_TASK,
+        BackendType.HF,
+    ): LazyClass(
+        module_name="inference_models.models.owlv2.owlv2_hf",
+        class_name="OWLv2HF",
+    ),
+    (
+        "roboflow-instant",
+        OBJECT_DETECTION_TASK,
+        BackendType.HF,
+    ): LazyClass(
+        module_name="inference_models.models.roboflow_instant.roboflow_instant_hf",
+        class_name="RoboflowInstantHF",
+    ),
+    ("sam", INTERACTIVE_INSTANCE_SEGMENTATION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.sam.sam_torch",
+        class_name="SAMTorch",
+    ),
+    ("sam2", INTERACTIVE_INSTANCE_SEGMENTATION_TASK, BackendType.TORCH): LazyClass(
+        module_name="inference_models.models.sam2.sam2_torch",
+        class_name="SAM2Torch",
+    ),
+}
+def resolve_model_class(
+    model_architecture: ModelArchitecture,
+    task_type: TaskType,
+    backend: BackendType,
+    model_features: Optional[Set[str]] = None,
+) -> type:
+    if not model_implementation_exists(
+        model_architecture=model_architecture,
+        task_type=task_type,
+        backend=backend,
+        model_features=model_features,
+    ):
+        raise ModelImplementationLoaderError(
+            message=f"Did not find implementation for model with architecture: {model_architecture}, "
+            f"task type: {task_type} backend: {backend} and model features: {model_features}",
+            help_url="https://todo",
+        )
+    matched_model = REGISTERED_MODELS[(model_architecture, task_type, backend)]
+    if isinstance(matched_model, RegistryEntry):
+        return matched_model.model_class.resolve()
+    return matched_model.resolve()
+def model_implementation_exists(
+    model_architecture: ModelArchitecture,
+    task_type: TaskType,
+    backend: BackendType,
+    model_features: Optional[Set[str]] = None,
+) -> bool:
+    lookup_key = (model_architecture, task_type, backend)
+    if lookup_key not in REGISTERED_MODELS:
+        return False
+    if not model_features:
+        return True
+    matched_model = REGISTERED_MODELS[(model_architecture, task_type, backend)]
+    if not isinstance(matched_model, RegistryEntry):
+        # features requested, but no supported features manifested
+        return False
+    return all(f in matched_model.supported_model_features for f in model_features)