PyPI - inference-models - Versions diffs - 0.18.3__py3-none-any.whl - Mend

inference-models 0.18.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (195) hide show

inference_models/__init__.py +36 -0
inference_models/configuration.py +72 -0
inference_models/constants.py +2 -0
inference_models/entities.py +5 -0
inference_models/errors.py +137 -0
inference_models/logger.py +52 -0
inference_models/model_pipelines/__init__.py +0 -0
inference_models/model_pipelines/auto_loaders/__init__.py +0 -0
inference_models/model_pipelines/auto_loaders/core.py +120 -0
inference_models/model_pipelines/auto_loaders/pipelines_registry.py +36 -0
inference_models/model_pipelines/face_and_gaze_detection/__init__.py +0 -0
inference_models/model_pipelines/face_and_gaze_detection/mediapipe_l2cs.py +200 -0
inference_models/models/__init__.py +0 -0
inference_models/models/auto_loaders/__init__.py +0 -0
inference_models/models/auto_loaders/access_manager.py +168 -0
inference_models/models/auto_loaders/auto_negotiation.py +1329 -0
inference_models/models/auto_loaders/auto_resolution_cache.py +129 -0
inference_models/models/auto_loaders/constants.py +7 -0
inference_models/models/auto_loaders/core.py +1341 -0
inference_models/models/auto_loaders/dependency_models.py +52 -0
inference_models/models/auto_loaders/entities.py +57 -0
inference_models/models/auto_loaders/models_registry.py +497 -0
inference_models/models/auto_loaders/presentation_utils.py +333 -0
inference_models/models/auto_loaders/ranking.py +413 -0
inference_models/models/auto_loaders/utils.py +31 -0
inference_models/models/base/__init__.py +0 -0
inference_models/models/base/classification.py +123 -0
inference_models/models/base/depth_estimation.py +62 -0
inference_models/models/base/documents_parsing.py +111 -0
inference_models/models/base/embeddings.py +66 -0
inference_models/models/base/instance_segmentation.py +87 -0
inference_models/models/base/keypoints_detection.py +93 -0
inference_models/models/base/object_detection.py +143 -0
inference_models/models/base/semantic_segmentation.py +74 -0
inference_models/models/base/types.py +5 -0
inference_models/models/clip/__init__.py +0 -0
inference_models/models/clip/clip_onnx.py +148 -0
inference_models/models/clip/clip_pytorch.py +104 -0
inference_models/models/clip/preprocessing.py +162 -0
inference_models/models/common/__init__.py +0 -0
inference_models/models/common/cuda.py +30 -0
inference_models/models/common/model_packages.py +25 -0
inference_models/models/common/onnx.py +379 -0
inference_models/models/common/roboflow/__init__.py +0 -0
inference_models/models/common/roboflow/model_packages.py +361 -0
inference_models/models/common/roboflow/post_processing.py +436 -0
inference_models/models/common/roboflow/pre_processing.py +1332 -0
inference_models/models/common/torch.py +20 -0
inference_models/models/common/trt.py +266 -0
inference_models/models/deep_lab_v3_plus/__init__.py +0 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_onnx.py +282 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_torch.py +264 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_trt.py +313 -0
inference_models/models/depth_anything_v2/__init__.py +0 -0
inference_models/models/depth_anything_v2/depth_anything_v2_hf.py +77 -0
inference_models/models/dinov3/__init__.py +0 -0
inference_models/models/dinov3/dinov3_classification_onnx.py +348 -0
inference_models/models/dinov3/dinov3_classification_torch.py +323 -0
inference_models/models/doctr/__init__.py +0 -0
inference_models/models/doctr/doctr_torch.py +304 -0
inference_models/models/easy_ocr/__init__.py +0 -0
inference_models/models/easy_ocr/easy_ocr_torch.py +222 -0
inference_models/models/florence2/__init__.py +0 -0
inference_models/models/florence2/florence2_hf.py +897 -0
inference_models/models/grounding_dino/__init__.py +0 -0
inference_models/models/grounding_dino/grounding_dino_torch.py +227 -0
inference_models/models/l2cs/__init__.py +0 -0
inference_models/models/l2cs/l2cs_onnx.py +216 -0
inference_models/models/mediapipe_face_detection/__init__.py +0 -0
inference_models/models/mediapipe_face_detection/face_detection.py +203 -0
inference_models/models/moondream2/__init__.py +0 -0
inference_models/models/moondream2/moondream2_hf.py +281 -0
inference_models/models/owlv2/__init__.py +0 -0
inference_models/models/owlv2/cache.py +182 -0
inference_models/models/owlv2/entities.py +112 -0
inference_models/models/owlv2/owlv2_hf.py +695 -0
inference_models/models/owlv2/reference_dataset.py +291 -0
inference_models/models/paligemma/__init__.py +0 -0
inference_models/models/paligemma/paligemma_hf.py +209 -0
inference_models/models/perception_encoder/__init__.py +0 -0
inference_models/models/perception_encoder/perception_encoder_pytorch.py +197 -0
inference_models/models/perception_encoder/vision_encoder/__init__.py +0 -0
inference_models/models/perception_encoder/vision_encoder/config.py +160 -0
inference_models/models/perception_encoder/vision_encoder/pe.py +742 -0
inference_models/models/perception_encoder/vision_encoder/rope.py +344 -0
inference_models/models/perception_encoder/vision_encoder/tokenizer.py +342 -0
inference_models/models/perception_encoder/vision_encoder/transforms.py +33 -0
inference_models/models/qwen25vl/__init__.py +1 -0
inference_models/models/qwen25vl/qwen25vl_hf.py +285 -0
inference_models/models/resnet/__init__.py +0 -0
inference_models/models/resnet/resnet_classification_onnx.py +330 -0
inference_models/models/resnet/resnet_classification_torch.py +305 -0
inference_models/models/resnet/resnet_classification_trt.py +369 -0
inference_models/models/rfdetr/__init__.py +0 -0
inference_models/models/rfdetr/backbone_builder.py +101 -0
inference_models/models/rfdetr/class_remapping.py +41 -0
inference_models/models/rfdetr/common.py +115 -0
inference_models/models/rfdetr/default_labels.py +108 -0
inference_models/models/rfdetr/dinov2_with_windowed_attn.py +1330 -0
inference_models/models/rfdetr/misc.py +26 -0
inference_models/models/rfdetr/ms_deform_attn.py +180 -0
inference_models/models/rfdetr/ms_deform_attn_func.py +60 -0
inference_models/models/rfdetr/position_encoding.py +166 -0
inference_models/models/rfdetr/post_processor.py +83 -0
inference_models/models/rfdetr/projector.py +373 -0
inference_models/models/rfdetr/rfdetr_backbone_pytorch.py +394 -0
inference_models/models/rfdetr/rfdetr_base_pytorch.py +807 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_onnx.py +206 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_pytorch.py +373 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_trt.py +227 -0
inference_models/models/rfdetr/rfdetr_object_detection_onnx.py +244 -0
inference_models/models/rfdetr/rfdetr_object_detection_pytorch.py +470 -0
inference_models/models/rfdetr/rfdetr_object_detection_trt.py +270 -0
inference_models/models/rfdetr/segmentation_head.py +273 -0
inference_models/models/rfdetr/transformer.py +767 -0
inference_models/models/roboflow_instant/__init__.py +0 -0
inference_models/models/roboflow_instant/roboflow_instant_hf.py +141 -0
inference_models/models/sam/__init__.py +0 -0
inference_models/models/sam/cache.py +147 -0
inference_models/models/sam/entities.py +25 -0
inference_models/models/sam/sam_torch.py +675 -0
inference_models/models/sam2/__init__.py +0 -0
inference_models/models/sam2/cache.py +162 -0
inference_models/models/sam2/entities.py +43 -0
inference_models/models/sam2/sam2_torch.py +905 -0
inference_models/models/sam2_rt/__init__.py +0 -0
inference_models/models/sam2_rt/sam2_pytorch.py +119 -0
inference_models/models/smolvlm/__init__.py +0 -0
inference_models/models/smolvlm/smolvlm_hf.py +245 -0
inference_models/models/trocr/__init__.py +0 -0
inference_models/models/trocr/trocr_hf.py +53 -0
inference_models/models/vit/__init__.py +0 -0
inference_models/models/vit/vit_classification_huggingface.py +319 -0
inference_models/models/vit/vit_classification_onnx.py +326 -0
inference_models/models/vit/vit_classification_trt.py +365 -0
inference_models/models/yolact/__init__.py +1 -0
inference_models/models/yolact/yolact_instance_segmentation_onnx.py +336 -0
inference_models/models/yolact/yolact_instance_segmentation_trt.py +361 -0
inference_models/models/yolo_world/__init__.py +1 -0
inference_models/models/yolonas/__init__.py +0 -0
inference_models/models/yolonas/nms.py +44 -0
inference_models/models/yolonas/yolonas_object_detection_onnx.py +204 -0
inference_models/models/yolonas/yolonas_object_detection_trt.py +230 -0
inference_models/models/yolov10/__init__.py +0 -0
inference_models/models/yolov10/yolov10_object_detection_onnx.py +187 -0
inference_models/models/yolov10/yolov10_object_detection_trt.py +215 -0
inference_models/models/yolov11/__init__.py +0 -0
inference_models/models/yolov11/yolov11_onnx.py +28 -0
inference_models/models/yolov11/yolov11_torch_script.py +25 -0
inference_models/models/yolov11/yolov11_trt.py +21 -0
inference_models/models/yolov12/__init__.py +0 -0
inference_models/models/yolov12/yolov12_onnx.py +7 -0
inference_models/models/yolov12/yolov12_torch_script.py +7 -0
inference_models/models/yolov12/yolov12_trt.py +7 -0
inference_models/models/yolov5/__init__.py +0 -0
inference_models/models/yolov5/nms.py +99 -0
inference_models/models/yolov5/yolov5_instance_segmentation_onnx.py +225 -0
inference_models/models/yolov5/yolov5_instance_segmentation_trt.py +255 -0
inference_models/models/yolov5/yolov5_object_detection_onnx.py +192 -0
inference_models/models/yolov5/yolov5_object_detection_trt.py +218 -0
inference_models/models/yolov7/__init__.py +0 -0
inference_models/models/yolov7/yolov7_instance_segmentation_onnx.py +226 -0
inference_models/models/yolov7/yolov7_instance_segmentation_trt.py +253 -0
inference_models/models/yolov8/__init__.py +0 -0
inference_models/models/yolov8/yolov8_classification_onnx.py +181 -0
inference_models/models/yolov8/yolov8_instance_segmentation_onnx.py +239 -0
inference_models/models/yolov8/yolov8_instance_segmentation_torch_script.py +201 -0
inference_models/models/yolov8/yolov8_instance_segmentation_trt.py +268 -0
inference_models/models/yolov8/yolov8_key_points_detection_onnx.py +263 -0
inference_models/models/yolov8/yolov8_key_points_detection_torch_script.py +218 -0
inference_models/models/yolov8/yolov8_key_points_detection_trt.py +287 -0
inference_models/models/yolov8/yolov8_object_detection_onnx.py +213 -0
inference_models/models/yolov8/yolov8_object_detection_torch_script.py +166 -0
inference_models/models/yolov8/yolov8_object_detection_trt.py +231 -0
inference_models/models/yolov9/__init__.py +0 -0
inference_models/models/yolov9/yolov9_onnx.py +7 -0
inference_models/models/yolov9/yolov9_torch_script.py +7 -0
inference_models/models/yolov9/yolov9_trt.py +7 -0
inference_models/runtime_introspection/__init__.py +0 -0
inference_models/runtime_introspection/core.py +410 -0
inference_models/utils/__init__.py +0 -0
inference_models/utils/download.py +608 -0
inference_models/utils/environment.py +28 -0
inference_models/utils/file_system.py +51 -0
inference_models/utils/hashing.py +7 -0
inference_models/utils/imports.py +48 -0
inference_models/utils/onnx_introspection.py +17 -0
inference_models/weights_providers/__init__.py +0 -0
inference_models/weights_providers/core.py +20 -0
inference_models/weights_providers/entities.py +159 -0
inference_models/weights_providers/roboflow.py +601 -0
inference_models-0.18.3.dist-info/METADATA +466 -0
inference_models-0.18.3.dist-info/RECORD +195 -0
inference_models-0.18.3.dist-info/WHEEL +5 -0
inference_models-0.18.3.dist-info/top_level.txt +1 -0

inference_models/models/base/documents_parsing.py ADDED Viewed

@@ -0,0 +1,111 @@
+from abc import ABC, abstractmethod
+from typing import Generic, List, Tuple, Union
+import numpy as np
+import torch
+from inference_models.models.base.object_detection import Detections
+from inference_models.models.base.types import (
+    PreprocessedInputs,
+    PreprocessingMetadata,
+    RawPrediction,
+)
+class StructuredOCRModel(
+    ABC, Generic[PreprocessedInputs, PreprocessingMetadata, RawPrediction]
+):
+    """Abstract base for OCR models whose result pairs text with `Detections`.
+    Subclasses supply `pre_process`, `forward` and `post_process`; `infer`
+    (also reachable by calling the instance) chains them in that order.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(cls, model_name_or_path: str, **kwargs) -> "StructuredOCRModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+    @property
+    @abstractmethod
+    def class_names(self) -> List[str]:
+        """List of class names exposed by the model (subclass-defined)."""
+    def infer(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[List[str], List[Detections]]:
+        """Run pre-processing, the forward pass and post-processing on `images`.
+        The same `kwargs` are handed to every stage.
+        """
+        inputs, metadata = self.pre_process(images, **kwargs)
+        raw_output = self.forward(inputs, **kwargs)
+        return self.post_process(raw_output, metadata, **kwargs)
+    @abstractmethod
+    def pre_process(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[PreprocessedInputs, PreprocessingMetadata]:
+        """Turn `images` into model inputs plus the metadata `post_process` needs."""
+    @abstractmethod
+    def forward(
+        self, pre_processed_images: PreprocessedInputs, **kwargs
+    ) -> RawPrediction:
+        """Execute the model on already pre-processed inputs."""
+    @abstractmethod
+    def post_process(
+        self,
+        model_results: RawPrediction,
+        pre_processing_meta: PreprocessingMetadata,
+        **kwargs,
+    ) -> Tuple[List[str], List[Detections]]:
+        """Convert raw model output into a (texts, detections) pair."""
+    def __call__(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[List[str], List[Detections]]:
+        """Alias for `infer`."""
+        return self.infer(images, **kwargs)
+class TextOnlyOCRModel(ABC, Generic[PreprocessedInputs, RawPrediction]):
+    """Abstract base for OCR models that return text only.
+    Unlike the structured variant, `pre_process` yields inputs without separate
+    metadata, and `post_process` works from the raw prediction alone.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(cls, model_name_or_path: str, **kwargs) -> "TextOnlyOCRModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+    def infer(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[str]:
+        """Chain `pre_process`, `forward` and `post_process`, sharing `kwargs`."""
+        inputs = self.pre_process(images, **kwargs)
+        raw_output = self.forward(inputs, **kwargs)
+        return self.post_process(raw_output, **kwargs)
+    @abstractmethod
+    def pre_process(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> PreprocessedInputs:
+        """Turn `images` into the inputs expected by `forward`."""
+    @abstractmethod
+    def forward(
+        self, pre_processed_images: PreprocessedInputs, **kwargs
+    ) -> RawPrediction:
+        """Execute the model on already pre-processed inputs."""
+    @abstractmethod
+    def post_process(
+        self,
+        model_results: RawPrediction,
+        **kwargs,
+    ) -> List[str]:
+        """Convert raw model output into a list of strings."""
+    def __call__(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[str]:
+        """Alias for `infer`."""
+        return self.infer(images, **kwargs)

inference_models/models/base/embeddings.py ADDED Viewed

@@ -0,0 +1,66 @@
+from abc import ABC, abstractmethod
+from typing import List, Literal, Union
+import numpy as np
+import torch
+import torch.nn.functional as F
+class TextImageEmbeddingModel(ABC):
+    """Abstract base for models that embed both images and text.
+    Subclasses implement `embed_images` and `embed_text`; `compare_embeddings`
+    builds on them to score every item of `x` against every item of `y`.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(
+        cls, model_name_or_path: str, **kwargs
+    ) -> "TextImageEmbeddingModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+    def compare_embeddings(
+        self,
+        x: Union[
+            torch.Tensor,
+            List[torch.Tensor],
+            np.ndarray,
+            List[np.ndarray],
+            str,
+            List[str],
+        ],
+        y: Union[
+            torch.Tensor,
+            List[torch.Tensor],
+            np.ndarray,
+            List[np.ndarray],
+            str,
+            List[str],
+        ],
+        x_type: Literal["image", "text"] = "image",
+        y_type: Literal["image", "text"] = "text",
+        **kwargs,
+    ) -> torch.Tensor:
+        """Return the matrix of dot products between L2-normalised embeddings.
+        `x_type` / `y_type` pick the embedder: "image" uses `embed_images`, any
+        other value uses `embed_text`. `kwargs` go to both embedding calls.
+        Rows of the result follow `x`, columns follow `y`.
+        """
+        # x is embedded before y, matching the argument order.
+        left = (
+            self.embed_images(images=x, **kwargs)
+            if x_type == "image"
+            else self.embed_text(texts=x, **kwargs)
+        )
+        right = (
+            self.embed_images(images=y, **kwargs)
+            if y_type == "image"
+            else self.embed_text(texts=y, **kwargs)
+        )
+        left_unit = F.normalize(left, p=2, dim=1)
+        right_unit = F.normalize(right, p=2, dim=1)
+        return left_unit @ right_unit.T
+    @abstractmethod
+    def embed_images(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> torch.Tensor:
+        """Embed `images` into a tensor (subclass-defined)."""
+    @abstractmethod
+    def embed_text(
+        self,
+        texts: Union[str, List[str]],
+        **kwargs,
+    ) -> torch.Tensor:
+        """Embed `texts` into a tensor (subclass-defined)."""

inference_models/models/base/instance_segmentation.py ADDED Viewed

@@ -0,0 +1,87 @@
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import Generic, List, Optional, Tuple, Union
+import numpy as np
+import supervision as sv
+import torch
+from inference_models.models.base.types import (
+    PreprocessedInputs,
+    PreprocessingMetadata,
+    RawPrediction,
+)
+@dataclass
+class InstanceDetections:
+    """Instance segmentation predictions stored as torch tensors."""
+    xyxy: torch.Tensor  # (n_boxes, 4)
+    class_id: torch.Tensor  # (n_boxes, )
+    confidence: torch.Tensor  # (n_boxes, )
+    mask: torch.Tensor  # (n_boxes, mask_height, mask_width)
+    image_metadata: Optional[dict] = None
+    # if given, list of size equal to # of bboxes
+    bboxes_metadata: Optional[List[dict]] = None
+    def to_supervision(self) -> sv.Detections:
+        """Convert to `sv.Detections`, moving each tensor to CPU as a numpy array.
+        `image_metadata` and `bboxes_metadata` are not passed on.
+        """
+        boxes = self.xyxy.cpu().numpy()
+        class_ids = self.class_id.cpu().numpy()
+        scores = self.confidence.cpu().numpy()
+        masks = self.mask.cpu().numpy()
+        return sv.Detections(
+            xyxy=boxes, class_id=class_ids, confidence=scores, mask=masks
+        )
+class InstanceSegmentationModel(
+    ABC, Generic[PreprocessedInputs, PreprocessingMetadata, RawPrediction]
+):
+    """Abstract base for instance segmentation models.
+    Subclasses supply `pre_process`, `forward` and `post_process`; `infer`
+    (also reachable by calling the instance) chains them in that order.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(
+        cls, model_name_or_path: str, **kwargs
+    ) -> "InstanceSegmentationModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+        pass
+    @property
+    @abstractmethod
+    def class_names(self) -> List[str]:
+        """List of class names exposed by the model (subclass-defined)."""
+        pass
+    def infer(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[InstanceDetections]:
+        """Run pre-processing, the forward pass and post-processing on `images`.
+        The same `kwargs` are handed to every stage.
+        """
+        pre_processed_images, pre_processing_meta = self.pre_process(images, **kwargs)
+        model_results = self.forward(pre_processed_images, **kwargs)
+        return self.post_process(model_results, pre_processing_meta, **kwargs)
+    @abstractmethod
+    def pre_process(
+        self,
+        # numpy inputs are listed because `infer` forwards them here unchanged
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[PreprocessedInputs, PreprocessingMetadata]:
+        """Turn `images` into model inputs plus the metadata `post_process` needs."""
+        pass
+    @abstractmethod
+    def forward(
+        self, pre_processed_images: PreprocessedInputs, **kwargs
+    ) -> RawPrediction:
+        """Execute the model on already pre-processed inputs."""
+        pass
+    @abstractmethod
+    def post_process(
+        self,
+        model_results: RawPrediction,
+        # second element of the tuple returned by `pre_process`
+        pre_processing_meta: PreprocessingMetadata,
+        **kwargs,
+    ) -> List[InstanceDetections]:
+        """Convert raw model output into a list of `InstanceDetections`."""
+        pass
+    def __call__(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[InstanceDetections]:
+        """Alias for `infer`."""
+        return self.infer(images, **kwargs)

inference_models/models/base/keypoints_detection.py ADDED Viewed

@@ -0,0 +1,93 @@
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import Generic, List, Optional, Tuple, Union
+import numpy as np
+import supervision as sv
+import torch
+from inference_models.models.base.object_detection import Detections
+from inference_models.models.base.types import (
+    PreprocessedInputs,
+    PreprocessingMetadata,
+    RawPrediction,
+)
+@dataclass
+class KeyPoints:
+    """Key point predictions stored as torch tensors."""
+    xy: torch.Tensor  # (instances, instance_key_points, 2)
+    class_id: torch.Tensor  # (instances, )
+    confidence: torch.Tensor  # (instances, instance_key_points)
+    image_metadata: Optional[dict] = None
+    # if given, list of size equal to # of instances
+    key_points_metadata: Optional[List[dict]] = None
+    def to_supervision(self) -> sv.KeyPoints:
+        """Convert to `sv.KeyPoints`, moving each tensor to CPU as a numpy array.
+        `image_metadata` and `key_points_metadata` are not passed on.
+        """
+        points = self.xy.cpu().numpy()
+        class_ids = self.class_id.cpu().numpy()
+        scores = self.confidence.cpu().numpy()
+        return sv.KeyPoints(xy=points, class_id=class_ids, confidence=scores)
+class KeyPointsDetectionModel(
+    ABC, Generic[PreprocessedInputs, PreprocessingMetadata, RawPrediction]
+):
+    """Abstract base for key point detection models.
+    Subclasses supply `pre_process`, `forward` and `post_process`; `infer`
+    (also reachable by calling the instance) chains them in that order.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(
+        cls, model_name_or_path: str, **kwargs
+    ) -> "KeyPointsDetectionModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+    @property
+    @abstractmethod
+    def class_names(self) -> List[str]:
+        """List of class names exposed by the model (subclass-defined)."""
+    @property
+    @abstractmethod
+    def skeletons(self) -> List[List[Tuple[int, int]]]:
+        """Lists of integer pairs describing skeletons (subclass-defined)."""
+    def infer(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[List[KeyPoints], Optional[List[Detections]]]:
+        """Run pre-processing, the forward pass and post-processing on `images`.
+        The same `kwargs` are handed to every stage.
+        """
+        inputs, metadata = self.pre_process(images, **kwargs)
+        raw_output = self.forward(inputs, **kwargs)
+        return self.post_process(raw_output, metadata, **kwargs)
+    @abstractmethod
+    def pre_process(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[PreprocessedInputs, PreprocessingMetadata]:
+        """Turn `images` into model inputs plus the metadata `post_process` needs."""
+    @abstractmethod
+    def forward(
+        self, pre_processed_images: PreprocessedInputs, **kwargs
+    ) -> RawPrediction:
+        """Execute the model on already pre-processed inputs."""
+    @abstractmethod
+    def post_process(
+        self,
+        model_results: RawPrediction,
+        pre_processing_meta: PreprocessingMetadata,
+        **kwargs,
+    ) -> Tuple[List[KeyPoints], Optional[List[Detections]]]:
+        """Convert raw model output into key points and, optionally, detections."""
+    def __call__(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[List[KeyPoints], Optional[List[Detections]]]:
+        """Alias for `infer`."""
+        return self.infer(images, **kwargs)

inference_models/models/base/object_detection.py ADDED Viewed

@@ -0,0 +1,143 @@
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import Generic, List, Optional, Tuple, Union
+import numpy as np
+import supervision as sv
+import torch
+from inference_models.models.base.types import (
+    PreprocessedInputs,
+    PreprocessingMetadata,
+    RawPrediction,
+)
+@dataclass
+class Detections:
+    """Bounding-box predictions stored as torch tensors."""
+    xyxy: torch.Tensor  # (n_boxes, 4)
+    class_id: torch.Tensor  # (n_boxes, )
+    confidence: torch.Tensor  # (n_boxes, )
+    image_metadata: Optional[dict] = None
+    # if given, list of size equal to # of bboxes
+    bboxes_metadata: Optional[List[dict]] = None
+    def to_supervision(self) -> sv.Detections:
+        """Convert to `sv.Detections`, moving each tensor to CPU as a numpy array.
+        `image_metadata` and `bboxes_metadata` are not passed on.
+        """
+        boxes = self.xyxy.cpu().numpy()
+        class_ids = self.class_id.cpu().numpy()
+        scores = self.confidence.cpu().numpy()
+        return sv.Detections(xyxy=boxes, class_id=class_ids, confidence=scores)
+class ObjectDetectionModel(
+    ABC, Generic[PreprocessedInputs, PreprocessingMetadata, RawPrediction]
+):
+    """Abstract base for object detection models.
+    Subclasses supply `pre_process`, `forward` and `post_process`; `infer`
+    (also reachable by calling the instance) chains them in that order.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(
+        cls, model_name_or_path: str, **kwargs
+    ) -> "ObjectDetectionModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+    @property
+    @abstractmethod
+    def class_names(self) -> List[str]:
+        """List of class names exposed by the model (subclass-defined)."""
+    def infer(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[Detections]:
+        """Run pre-processing, the forward pass and post-processing on `images`.
+        The same `kwargs` are handed to every stage.
+        """
+        inputs, metadata = self.pre_process(images, **kwargs)
+        raw_output = self.forward(inputs, **kwargs)
+        return self.post_process(raw_output, metadata, **kwargs)
+    @abstractmethod
+    def pre_process(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[PreprocessedInputs, PreprocessingMetadata]:
+        """Turn `images` into model inputs plus the metadata `post_process` needs."""
+    @abstractmethod
+    def forward(
+        self, pre_processed_images: PreprocessedInputs, **kwargs
+    ) -> RawPrediction:
+        """Execute the model on already pre-processed inputs."""
+    @abstractmethod
+    def post_process(
+        self,
+        model_results: RawPrediction,
+        pre_processing_meta: PreprocessingMetadata,
+        **kwargs,
+    ) -> List[Detections]:
+        """Convert raw model output into a list of `Detections`."""
+    def __call__(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[Detections]:
+        """Alias for `infer`."""
+        return self.infer(images, **kwargs)
+class OpenVocabularyObjectDetectionModel(
+    ABC, Generic[PreprocessedInputs, PreprocessingMetadata, RawPrediction]
+):
+    """Abstract base for object detectors that take the class list at call time.
+    Subclasses supply `pre_process`, `forward` and `post_process`; `infer`
+    (also reachable by calling the instance) chains them in that order and
+    hands `classes` to `forward` only.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(
+        cls, model_name_or_path: str, **kwargs
+    ) -> "OpenVocabularyObjectDetectionModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+        pass
+    def infer(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        classes: Union[str, List[str]],
+        **kwargs,
+    ) -> List[Detections]:
+        """Run pre-processing, the forward pass and post-processing on `images`.
+        `classes` may be a single string or a list of strings; a single string
+        is wrapped in a one-element list before `forward` is called. The same
+        `kwargs` are handed to every stage.
+        """
+        # `forward` is declared to take List[str]; a bare string could otherwise
+        # be treated as a sequence of characters by list-oriented implementations.
+        if isinstance(classes, str):
+            classes = [classes]
+        pre_processed_images, pre_processing_meta = self.pre_process(images, **kwargs)
+        model_results = self.forward(pre_processed_images, classes, **kwargs)
+        return self.post_process(model_results, pre_processing_meta, **kwargs)
+    @abstractmethod
+    def pre_process(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> Tuple[PreprocessedInputs, PreprocessingMetadata]:
+        """Turn `images` into model inputs plus the metadata `post_process` needs."""
+        pass
+    @abstractmethod
+    def forward(
+        self,
+        pre_processed_images: PreprocessedInputs,
+        classes: List[str],
+        **kwargs,
+    ) -> RawPrediction:
+        """Execute the model on pre-processed inputs for the given `classes`."""
+        pass
+    @abstractmethod
+    def post_process(
+        self,
+        model_results: RawPrediction,
+        pre_processing_meta: PreprocessingMetadata,
+        **kwargs,
+    ) -> List[Detections]:
+        """Convert raw model output into a list of `Detections`."""
+        pass
+    def __call__(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        # same accepted types as `infer`, which this method delegates to
+        classes: Union[str, List[str]],
+        **kwargs,
+    ) -> List[Detections]:
+        """Alias for `infer`."""
+        return self.infer(images=images, classes=classes, **kwargs)

inference_models/models/base/semantic_segmentation.py ADDED Viewed

@@ -0,0 +1,74 @@
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import Generic, List, Optional, Tuple, Union
+import numpy as np
+import supervision as sv
+import torch
+from inference_models.models.base.types import (
+    PreprocessedInputs,
+    PreprocessingMetadata,
+    RawPrediction,
+)
+@dataclass
+class SemanticSegmentationResult:
+    """Container for a semantic segmentation prediction held as torch tensors."""
+    # NOTE(review): shape is not visible here — presumably a per-pixel class map; confirm
+    segmentation_map: torch.Tensor
+    # NOTE(review): presumably confidence values aligned with `segmentation_map`; confirm
+    confidence: torch.Tensor
+    # optional metadata dictionary; defaults to None
+    image_metadata: Optional[dict] = None
+class SemanticSegmentationModel(
+    ABC, Generic[PreprocessedInputs, PreprocessingMetadata, RawPrediction]
+):
+    """Abstract base for semantic segmentation models.
+    Subclasses supply `pre_process`, `forward` and `post_process`; `infer`
+    (also reachable by calling the instance) chains them in that order.
+    """
+    @classmethod
+    @abstractmethod
+    def from_pretrained(
+        cls, model_name_or_path: str, **kwargs
+    ) -> "SemanticSegmentationModel":
+        """Create a model instance from `model_name_or_path` (subclass-defined)."""
+        pass
+    @property
+    @abstractmethod
+    def class_names(self) -> List[str]:
+        """List of class names exposed by the model (subclass-defined)."""
+        pass
+    def infer(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[SemanticSegmentationResult]:
+        """Run pre-processing, the forward pass and post-processing on `images`.
+        The same `kwargs` are handed to every stage.
+        """
+        pre_processed_images, pre_processing_meta = self.pre_process(images, **kwargs)
+        model_results = self.forward(pre_processed_images, **kwargs)
+        return self.post_process(model_results, pre_processing_meta, **kwargs)
+    @abstractmethod
+    def pre_process(
+        self,
+        # numpy inputs are listed because `infer` forwards them here unchanged
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+        # `infer` unpacks two values from this call, hence the tuple return type
+    ) -> Tuple[PreprocessedInputs, PreprocessingMetadata]:
+        """Turn `images` into model inputs plus the metadata `post_process` needs."""
+        pass
+    @abstractmethod
+    def forward(
+        self, pre_processed_images: PreprocessedInputs, **kwargs
+    ) -> RawPrediction:
+        """Execute the model on already pre-processed inputs."""
+        pass
+    @abstractmethod
+    def post_process(
+        self,
+        model_results: RawPrediction,
+        # second element of the tuple returned by `pre_process`
+        pre_processing_meta: PreprocessingMetadata,
+        **kwargs,
+    ) -> List[SemanticSegmentationResult]:
+        """Convert raw model output into a list of `SemanticSegmentationResult`."""
+        pass
+    def __call__(
+        self,
+        images: Union[torch.Tensor, List[torch.Tensor], np.ndarray, List[np.ndarray]],
+        **kwargs,
+    ) -> List[SemanticSegmentationResult]:
+        """Alias for `infer`."""
+        return self.infer(images, **kwargs)

inference_models/models/base/types.py ADDED Viewed

@@ -0,0 +1,5 @@
+from typing import TypeVar
+# Type variables used as `Generic[...]` parameters by the abstract model base classes.
+# Type returned by a model's `pre_process` and consumed by its `forward`.
+PreprocessedInputs = TypeVar("PreprocessedInputs")
+# Type of the metadata returned alongside the inputs by `pre_process` and passed to `post_process`.
+PreprocessingMetadata = TypeVar("PreprocessingMetadata")
+# Type returned by `forward` and consumed by `post_process`.
+RawPrediction = TypeVar("RawPrediction")

inference_models/models/clip/__init__.py ADDED Viewed

File without changes