PyPI - inference-models - Versions diffs - 0.18.3__py3-none-any.whl - Mend

inference-models 0.18.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (195) hide show

inference_models/__init__.py +36 -0
inference_models/configuration.py +72 -0
inference_models/constants.py +2 -0
inference_models/entities.py +5 -0
inference_models/errors.py +137 -0
inference_models/logger.py +52 -0
inference_models/model_pipelines/__init__.py +0 -0
inference_models/model_pipelines/auto_loaders/__init__.py +0 -0
inference_models/model_pipelines/auto_loaders/core.py +120 -0
inference_models/model_pipelines/auto_loaders/pipelines_registry.py +36 -0
inference_models/model_pipelines/face_and_gaze_detection/__init__.py +0 -0
inference_models/model_pipelines/face_and_gaze_detection/mediapipe_l2cs.py +200 -0
inference_models/models/__init__.py +0 -0
inference_models/models/auto_loaders/__init__.py +0 -0
inference_models/models/auto_loaders/access_manager.py +168 -0
inference_models/models/auto_loaders/auto_negotiation.py +1329 -0
inference_models/models/auto_loaders/auto_resolution_cache.py +129 -0
inference_models/models/auto_loaders/constants.py +7 -0
inference_models/models/auto_loaders/core.py +1341 -0
inference_models/models/auto_loaders/dependency_models.py +52 -0
inference_models/models/auto_loaders/entities.py +57 -0
inference_models/models/auto_loaders/models_registry.py +497 -0
inference_models/models/auto_loaders/presentation_utils.py +333 -0
inference_models/models/auto_loaders/ranking.py +413 -0
inference_models/models/auto_loaders/utils.py +31 -0
inference_models/models/base/__init__.py +0 -0
inference_models/models/base/classification.py +123 -0
inference_models/models/base/depth_estimation.py +62 -0
inference_models/models/base/documents_parsing.py +111 -0
inference_models/models/base/embeddings.py +66 -0
inference_models/models/base/instance_segmentation.py +87 -0
inference_models/models/base/keypoints_detection.py +93 -0
inference_models/models/base/object_detection.py +143 -0
inference_models/models/base/semantic_segmentation.py +74 -0
inference_models/models/base/types.py +5 -0
inference_models/models/clip/__init__.py +0 -0
inference_models/models/clip/clip_onnx.py +148 -0
inference_models/models/clip/clip_pytorch.py +104 -0
inference_models/models/clip/preprocessing.py +162 -0
inference_models/models/common/__init__.py +0 -0
inference_models/models/common/cuda.py +30 -0
inference_models/models/common/model_packages.py +25 -0
inference_models/models/common/onnx.py +379 -0
inference_models/models/common/roboflow/__init__.py +0 -0
inference_models/models/common/roboflow/model_packages.py +361 -0
inference_models/models/common/roboflow/post_processing.py +436 -0
inference_models/models/common/roboflow/pre_processing.py +1332 -0
inference_models/models/common/torch.py +20 -0
inference_models/models/common/trt.py +266 -0
inference_models/models/deep_lab_v3_plus/__init__.py +0 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_onnx.py +282 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_torch.py +264 -0
inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_trt.py +313 -0
inference_models/models/depth_anything_v2/__init__.py +0 -0
inference_models/models/depth_anything_v2/depth_anything_v2_hf.py +77 -0
inference_models/models/dinov3/__init__.py +0 -0
inference_models/models/dinov3/dinov3_classification_onnx.py +348 -0
inference_models/models/dinov3/dinov3_classification_torch.py +323 -0
inference_models/models/doctr/__init__.py +0 -0
inference_models/models/doctr/doctr_torch.py +304 -0
inference_models/models/easy_ocr/__init__.py +0 -0
inference_models/models/easy_ocr/easy_ocr_torch.py +222 -0
inference_models/models/florence2/__init__.py +0 -0
inference_models/models/florence2/florence2_hf.py +897 -0
inference_models/models/grounding_dino/__init__.py +0 -0
inference_models/models/grounding_dino/grounding_dino_torch.py +227 -0
inference_models/models/l2cs/__init__.py +0 -0
inference_models/models/l2cs/l2cs_onnx.py +216 -0
inference_models/models/mediapipe_face_detection/__init__.py +0 -0
inference_models/models/mediapipe_face_detection/face_detection.py +203 -0
inference_models/models/moondream2/__init__.py +0 -0
inference_models/models/moondream2/moondream2_hf.py +281 -0
inference_models/models/owlv2/__init__.py +0 -0
inference_models/models/owlv2/cache.py +182 -0
inference_models/models/owlv2/entities.py +112 -0
inference_models/models/owlv2/owlv2_hf.py +695 -0
inference_models/models/owlv2/reference_dataset.py +291 -0
inference_models/models/paligemma/__init__.py +0 -0
inference_models/models/paligemma/paligemma_hf.py +209 -0
inference_models/models/perception_encoder/__init__.py +0 -0
inference_models/models/perception_encoder/perception_encoder_pytorch.py +197 -0
inference_models/models/perception_encoder/vision_encoder/__init__.py +0 -0
inference_models/models/perception_encoder/vision_encoder/config.py +160 -0
inference_models/models/perception_encoder/vision_encoder/pe.py +742 -0
inference_models/models/perception_encoder/vision_encoder/rope.py +344 -0
inference_models/models/perception_encoder/vision_encoder/tokenizer.py +342 -0
inference_models/models/perception_encoder/vision_encoder/transforms.py +33 -0
inference_models/models/qwen25vl/__init__.py +1 -0
inference_models/models/qwen25vl/qwen25vl_hf.py +285 -0
inference_models/models/resnet/__init__.py +0 -0
inference_models/models/resnet/resnet_classification_onnx.py +330 -0
inference_models/models/resnet/resnet_classification_torch.py +305 -0
inference_models/models/resnet/resnet_classification_trt.py +369 -0
inference_models/models/rfdetr/__init__.py +0 -0
inference_models/models/rfdetr/backbone_builder.py +101 -0
inference_models/models/rfdetr/class_remapping.py +41 -0
inference_models/models/rfdetr/common.py +115 -0
inference_models/models/rfdetr/default_labels.py +108 -0
inference_models/models/rfdetr/dinov2_with_windowed_attn.py +1330 -0
inference_models/models/rfdetr/misc.py +26 -0
inference_models/models/rfdetr/ms_deform_attn.py +180 -0
inference_models/models/rfdetr/ms_deform_attn_func.py +60 -0
inference_models/models/rfdetr/position_encoding.py +166 -0
inference_models/models/rfdetr/post_processor.py +83 -0
inference_models/models/rfdetr/projector.py +373 -0
inference_models/models/rfdetr/rfdetr_backbone_pytorch.py +394 -0
inference_models/models/rfdetr/rfdetr_base_pytorch.py +807 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_onnx.py +206 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_pytorch.py +373 -0
inference_models/models/rfdetr/rfdetr_instance_segmentation_trt.py +227 -0
inference_models/models/rfdetr/rfdetr_object_detection_onnx.py +244 -0
inference_models/models/rfdetr/rfdetr_object_detection_pytorch.py +470 -0
inference_models/models/rfdetr/rfdetr_object_detection_trt.py +270 -0
inference_models/models/rfdetr/segmentation_head.py +273 -0
inference_models/models/rfdetr/transformer.py +767 -0
inference_models/models/roboflow_instant/__init__.py +0 -0
inference_models/models/roboflow_instant/roboflow_instant_hf.py +141 -0
inference_models/models/sam/__init__.py +0 -0
inference_models/models/sam/cache.py +147 -0
inference_models/models/sam/entities.py +25 -0
inference_models/models/sam/sam_torch.py +675 -0
inference_models/models/sam2/__init__.py +0 -0
inference_models/models/sam2/cache.py +162 -0
inference_models/models/sam2/entities.py +43 -0
inference_models/models/sam2/sam2_torch.py +905 -0
inference_models/models/sam2_rt/__init__.py +0 -0
inference_models/models/sam2_rt/sam2_pytorch.py +119 -0
inference_models/models/smolvlm/__init__.py +0 -0
inference_models/models/smolvlm/smolvlm_hf.py +245 -0
inference_models/models/trocr/__init__.py +0 -0
inference_models/models/trocr/trocr_hf.py +53 -0
inference_models/models/vit/__init__.py +0 -0
inference_models/models/vit/vit_classification_huggingface.py +319 -0
inference_models/models/vit/vit_classification_onnx.py +326 -0
inference_models/models/vit/vit_classification_trt.py +365 -0
inference_models/models/yolact/__init__.py +1 -0
inference_models/models/yolact/yolact_instance_segmentation_onnx.py +336 -0
inference_models/models/yolact/yolact_instance_segmentation_trt.py +361 -0
inference_models/models/yolo_world/__init__.py +1 -0
inference_models/models/yolonas/__init__.py +0 -0
inference_models/models/yolonas/nms.py +44 -0
inference_models/models/yolonas/yolonas_object_detection_onnx.py +204 -0
inference_models/models/yolonas/yolonas_object_detection_trt.py +230 -0
inference_models/models/yolov10/__init__.py +0 -0
inference_models/models/yolov10/yolov10_object_detection_onnx.py +187 -0
inference_models/models/yolov10/yolov10_object_detection_trt.py +215 -0
inference_models/models/yolov11/__init__.py +0 -0
inference_models/models/yolov11/yolov11_onnx.py +28 -0
inference_models/models/yolov11/yolov11_torch_script.py +25 -0
inference_models/models/yolov11/yolov11_trt.py +21 -0
inference_models/models/yolov12/__init__.py +0 -0
inference_models/models/yolov12/yolov12_onnx.py +7 -0
inference_models/models/yolov12/yolov12_torch_script.py +7 -0
inference_models/models/yolov12/yolov12_trt.py +7 -0
inference_models/models/yolov5/__init__.py +0 -0
inference_models/models/yolov5/nms.py +99 -0
inference_models/models/yolov5/yolov5_instance_segmentation_onnx.py +225 -0
inference_models/models/yolov5/yolov5_instance_segmentation_trt.py +255 -0
inference_models/models/yolov5/yolov5_object_detection_onnx.py +192 -0
inference_models/models/yolov5/yolov5_object_detection_trt.py +218 -0
inference_models/models/yolov7/__init__.py +0 -0
inference_models/models/yolov7/yolov7_instance_segmentation_onnx.py +226 -0
inference_models/models/yolov7/yolov7_instance_segmentation_trt.py +253 -0
inference_models/models/yolov8/__init__.py +0 -0
inference_models/models/yolov8/yolov8_classification_onnx.py +181 -0
inference_models/models/yolov8/yolov8_instance_segmentation_onnx.py +239 -0
inference_models/models/yolov8/yolov8_instance_segmentation_torch_script.py +201 -0
inference_models/models/yolov8/yolov8_instance_segmentation_trt.py +268 -0
inference_models/models/yolov8/yolov8_key_points_detection_onnx.py +263 -0
inference_models/models/yolov8/yolov8_key_points_detection_torch_script.py +218 -0
inference_models/models/yolov8/yolov8_key_points_detection_trt.py +287 -0
inference_models/models/yolov8/yolov8_object_detection_onnx.py +213 -0
inference_models/models/yolov8/yolov8_object_detection_torch_script.py +166 -0
inference_models/models/yolov8/yolov8_object_detection_trt.py +231 -0
inference_models/models/yolov9/__init__.py +0 -0
inference_models/models/yolov9/yolov9_onnx.py +7 -0
inference_models/models/yolov9/yolov9_torch_script.py +7 -0
inference_models/models/yolov9/yolov9_trt.py +7 -0
inference_models/runtime_introspection/__init__.py +0 -0
inference_models/runtime_introspection/core.py +410 -0
inference_models/utils/__init__.py +0 -0
inference_models/utils/download.py +608 -0
inference_models/utils/environment.py +28 -0
inference_models/utils/file_system.py +51 -0
inference_models/utils/hashing.py +7 -0
inference_models/utils/imports.py +48 -0
inference_models/utils/onnx_introspection.py +17 -0
inference_models/weights_providers/__init__.py +0 -0
inference_models/weights_providers/core.py +20 -0
inference_models/weights_providers/entities.py +159 -0
inference_models/weights_providers/roboflow.py +601 -0
inference_models-0.18.3.dist-info/METADATA +466 -0
inference_models-0.18.3.dist-info/RECORD +195 -0
inference_models-0.18.3.dist-info/WHEEL +5 -0
inference_models-0.18.3.dist-info/top_level.txt +1 -0

inference_models/models/auto_loaders/core.py ADDED Viewed

@@ -0,0 +1,1341 @@
+import hashlib
+import importlib
+import importlib.util
+import os.path
+import re
+from datetime import datetime
+from functools import partial
+from typing import Any, Callable, Dict, List, Optional, Set, Tuple, Union
+import torch
+from argon2 import PasswordHasher
+from filelock import FileLock
+from rich.console import Console
+from rich.text import Text
+from inference_models.configuration import DEFAULT_DEVICE, INFERENCE_HOME
+from inference_models.errors import (
+    CorruptedModelPackageError,
+    DirectLocalStorageAccessError,
+    InsecureModelIdentifierError,
+    ModelLoadingError,
+    NoModelPackagesAvailableError,
+    UnauthorizedModelAccessError,
+)
+from inference_models.logger import LOGGER, verbose_info
+from inference_models.models.auto_loaders.access_manager import (
+    AccessIdentifiers,
+    LiberalModelAccessManager,
+    ModelAccessManager,
+)
+from inference_models.models.auto_loaders.auto_negotiation import (
+    negotiate_model_packages,
+    parse_backend_type,
+)
+from inference_models.models.auto_loaders.auto_resolution_cache import (
+    AutoResolutionCache,
+    AutoResolutionCacheEntry,
+    BaseAutoLoadMetadataCache,
+)
+from inference_models.models.auto_loaders.constants import (
+    MODEL_DEPENDENCIES_KEY,
+    MODEL_DEPENDENCIES_SUB_DIR,
+)
+from inference_models.models.auto_loaders.dependency_models import (
+    prepare_dependency_model_parameters,
+)
+from inference_models.models.auto_loaders.entities import (
+    MODEL_CONFIG_FILE_NAME,
+    AnyModel,
+    BackendType,
+    InferenceModelConfig,
+    ModelArchitecture,
+    TaskType,
+)
+from inference_models.models.auto_loaders.models_registry import (
+    INSTANCE_SEGMENTATION_TASK,
+    OBJECT_DETECTION_TASK,
+    resolve_model_class,
+)
+from inference_models.models.auto_loaders.presentation_utils import (
+    calculate_artefacts_size,
+    calculate_size_of_all_model_packages_artefacts,
+    render_model_package_details_table,
+    render_runtime_x_ray,
+    render_table_with_model_overview,
+    render_table_with_model_packages,
+)
+from inference_models.runtime_introspection.core import x_ray_runtime_environment
+from inference_models.utils.download import FileHandle, download_files_to_directory
+from inference_models.utils.file_system import dump_json, read_json
+from inference_models.utils.hashing import hash_dict_content
+from inference_models.weights_providers.core import get_model_from_provider
+from inference_models.weights_providers.entities import (
+    ModelDependency,
+    ModelPackageMetadata,
+    Quantization,
+)
+MODEL_TYPES_TO_LOAD_FROM_CHECKPOINT = {
+    "rfdetr-base",
+    "rfdetr-small",
+    "rfdetr-medium",
+    "rfdetr-nano",
+    "rfdetr-large",
+    "rfdetr-seg-preview",
+}
+DEFAULT_KWARGS_PARAMS_TO_BE_FORWARDED_TO_DEPENDENT_MODELS = [
+    "owlv2_enforce_model_compilation",
+    "owlv2_class_embeddings_cache",
+    "owlv2_images_embeddings_cache",
+]
+class AutoModel:
+    @classmethod
+    def describe_model(
+        cls,
+        model_id: str,
+        weights_provider: str = "roboflow",
+        api_key: Optional[str] = None,
+        pull_artefacts_size: bool = False,
+    ) -> None:
+        model_metadata = get_model_from_provider(
+            provider=weights_provider,
+            model_id=model_id,
+            api_key=api_key,
+        )
+        model_packages_size = None
+        if pull_artefacts_size:
+            model_packages_size = calculate_size_of_all_model_packages_artefacts(
+                model_packages=model_metadata.model_packages
+            )
+        console = Console()
+        model_overview_table = render_table_with_model_overview(
+            model_id=model_metadata.model_id,
+            requested_model_id=model_id,
+            model_architecture=model_metadata.model_architecture,
+            model_variant=model_metadata.model_variant,
+            task_type=model_metadata.task_type,
+            weights_provider=weights_provider,
+            registered_packages=len(model_metadata.model_packages),
+            model_dependencies=model_metadata.model_dependencies,
+        )
+        console.print(model_overview_table)
+        console.print("\n")
+        packages_overview_table = render_table_with_model_packages(
+            model_packages=model_metadata.model_packages,
+            model_packages_size=model_packages_size,
+        )
+        console.print(packages_overview_table)
+        text = Text.assemble(
+            ("\nWant to check more details about specific package?", "bold"),
+            "\nUse AutoModel.describe_model_package('model_id', 'package_id').",
+        )
+        console.print(text)
+        if not pull_artefacts_size:
+            text = Text.assemble(
+                ("\nWant to verify the size of model package?", "bold"),
+                "\nUse AutoModel.describe_model('model_id', pull_artefacts_size=True) - the execution will be "
+                "slightly longer, as we must collect the size of all elements of model package.",
+            )
+            console.print(text)
+    @classmethod
+    def describe_model_package(
+        cls,
+        model_id: str,
+        package_id: str,
+        weights_provider: str = "roboflow",
+        api_key: Optional[str] = None,
+        pull_artefacts_size: bool = True,
+    ) -> None:
+        model_metadata = get_model_from_provider(
+            provider=weights_provider,
+            model_id=model_id,
+            api_key=api_key,
+        )
+        selected_package = None
+        for package in model_metadata.model_packages:
+            if package.package_id == package_id:
+                selected_package = package
+        if selected_package is None:
+            raise NoModelPackagesAvailableError(
+                message=f"Selected model package {package_id} does not exist for model {model_id}. Make sure provided "
+                f"value is valid.",
+                help_url="https://todo",
+            )
+        artefacts_size = None
+        if pull_artefacts_size:
+            artefacts_size = calculate_artefacts_size(
+                package_artefacts=selected_package.package_artefacts
+            )
+        table = render_model_package_details_table(
+            model_id=model_metadata.model_id,
+            requested_model_id=model_id,
+            artefacts_size=artefacts_size,
+            model_package=selected_package,
+        )
+        console = Console()
+        console.print(table)
+        if not pull_artefacts_size:
+            text = Text.assemble(
+                ("\nWant to verify the size of model package?", "bold"),
+                "\nUse AutoModel.describe_model_package('model_id', 'package_id', pull_artefacts_size=True)"
+                "- the execution will be slightly longer, as we must collect the size of all elements of model package.",
+            )
+            console.print(text)
+    @classmethod
+    def describe_compute_environment(cls) -> None:
+        runtime_x_ray = x_ray_runtime_environment()
+        table = render_runtime_x_ray(runtime_x_ray=runtime_x_ray)
+        console = Console()
+        console.print(table)
+    @classmethod
+    def from_pretrained(
+        cls,
+        model_id_or_path: str,
+        weights_provider: str = "roboflow",
+        api_key: Optional[str] = None,
+        model_package_id: Optional[str] = None,
+        backend: Optional[
+            Union[str, BackendType, List[Union[str, BackendType]]]
+        ] = None,
+        batch_size: Optional[Union[int, Tuple[int, int]]] = None,
+        quantization: Optional[
+            Union[str, Quantization, List[Union[str, Quantization]]]
+        ] = None,
+        onnx_execution_providers: Optional[List[Union[str, tuple]]] = None,
+        device: torch.device = DEFAULT_DEVICE,
+        default_onnx_trt_options: bool = True,
+        max_package_loading_attempts: Optional[int] = None,
+        verbose: bool = False,
+        model_download_file_lock_acquire_timeout: int = 10,
+        allow_untrusted_packages: bool = False,
+        trt_engine_host_code_allowed: bool = True,
+        allow_local_code_packages: bool = True,
+        verify_hash_while_download: bool = True,
+        download_files_without_hash: bool = False,
+        use_auto_resolution_cache: bool = True,
+        auto_resolution_cache: Optional[AutoResolutionCache] = None,
+        allow_direct_local_storage_loading: bool = True,
+        model_access_manager: Optional[ModelAccessManager] = None,
+        nms_fusion_preferences: Optional[Union[bool, dict]] = None,
+        model_type: Optional[str] = None,
+        task_type: Optional[str] = None,
+        allow_loading_dependency_models: bool = True,
+        dependency_models_params: Optional[dict] = None,
+        point_model_directory: Optional[Callable[[str], None]] = None,
+        forwarded_kwargs: Optional[List[str]] = None,
+        **kwargs,
+    ) -> AnyModel:
+        if model_access_manager is None:
+            model_access_manager = LiberalModelAccessManager()
+        if model_access_manager.is_model_access_forbidden(
+            model_id=model_id_or_path, api_key=api_key
+        ):
+            raise UnauthorizedModelAccessError(
+                message=f"Unauthorized not access model with ID: {model_package_id}. Are you sure you use valid "
+                f"API key? The default weights provider is Roboflow - see Roboflow authentication details: "
+                f"https://docs.roboflow.com/api-reference/authentication "
+                f"and export key to `ROBOFLOW_API_KEY` environment variable. If you use custom weights "
+                f"provider - verify access constraints relevant for the provider.",
+                help_url="https://todo",
+            )
+        if auto_resolution_cache is None:
+            def register_file_created_for_model_package(
+                file_path: str, model_id: str, package_id: str
+            ) -> None:
+                access_identifiers = AccessIdentifiers(
+                    model_id=model_id,
+                    package_id=package_id,
+                    api_key=api_key,
+                )
+                model_access_manager.on_file_created(
+                    file_path=file_path,
+                    access_identifiers=access_identifiers,
+                )
+            auto_resolution_cache = BaseAutoLoadMetadataCache(
+                file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+                verbose=verbose,
+                on_file_created=register_file_created_for_model_package,
+                on_file_deleted=model_access_manager.on_file_deleted,
+            )
+        model_init_kwargs = {
+            "onnx_execution_providers": onnx_execution_providers,
+            "device": device,
+            "default_onnx_trt_options": default_onnx_trt_options,
+            "engine_host_code_allowed": trt_engine_host_code_allowed,
+        }
+        model_init_kwargs.update(kwargs)
+        if not os.path.exists(model_id_or_path):
+            # QUESTION: is it enough to assume presence of local dir as the intent to load
+            # model from disc drive? What if we have clash of model id / model alias with
+            # contents of someone's local drive - shall we then try to load from both sources?
+            # that still may end up with ambiguous behaviour - probably the solution would be
+            # to require prefix like file://... to denote the intent of loading model from local
+            # drive?
+            if api_key is not None:
+                password_hashed = PasswordHasher()
+                api_key_hash = password_hashed.hash(api_key)
+            else:
+                api_key_hash = api_key
+            auto_negotiation_hash = hash_dict_content(
+                content={
+                    "provider": weights_provider,
+                    "model_id": model_id_or_path,
+                    "api_key": api_key_hash,
+                    "requested_model_package_id": model_package_id,
+                    "requested_backends": backend,
+                    "requested_batch_size": batch_size,
+                    "requested_quantization": quantization,
+                    "device": str(device),
+                    "onnx_execution_providers": onnx_execution_providers,
+                    "allow_untrusted_packages": allow_untrusted_packages,
+                    "trt_engine_host_code_allowed": trt_engine_host_code_allowed,
+                    "nms_fusion_preferences": nms_fusion_preferences,
+                }
+            )
+            model_from_access_manager = model_access_manager.retrieve_model_instance(
+                model_id=model_id_or_path,
+                package_id=model_package_id,
+                api_key=api_key,
+                loading_parameter_digest=auto_negotiation_hash,
+            )
+            if model_from_access_manager:
+                return model_from_access_manager
+            if forwarded_kwargs is None:
+                forwarded_kwargs = (
+                    DEFAULT_KWARGS_PARAMS_TO_BE_FORWARDED_TO_DEPENDENT_MODELS
+                )
+            forwarded_kwargs_values = {
+                name: kwargs[name] for name in forwarded_kwargs if name in kwargs
+            }
+            model_from_cache = attempt_loading_model_with_auto_load_cache(
+                use_auto_resolution_cache=use_auto_resolution_cache,
+                auto_resolution_cache=auto_resolution_cache,
+                auto_negotiation_hash=auto_negotiation_hash,
+                model_access_manager=model_access_manager,
+                model_name_or_path=model_id_or_path,
+                model_init_kwargs=model_init_kwargs,
+                api_key=api_key,
+                allow_loading_dependency_models=allow_loading_dependency_models,
+                forwarded_kwargs_values=forwarded_kwargs_values,
+                verbose=verbose,
+                weights_provider=weights_provider,
+                max_package_loading_attempts=max_package_loading_attempts,
+                model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+                allow_untrusted_packages=allow_untrusted_packages,
+                trt_engine_host_code_allowed=trt_engine_host_code_allowed,
+                allow_local_code_packages=allow_local_code_packages,
+                verify_hash_while_download=verify_hash_while_download,
+                download_files_without_hash=download_files_without_hash,
+                allow_direct_local_storage_loading=allow_direct_local_storage_loading,
+                dependency_models_params=dependency_models_params,
+            )
+            if model_from_cache:
+                return model_from_cache
+            try:
+                model_metadata = get_model_from_provider(
+                    provider=weights_provider,
+                    model_id=model_id_or_path,
+                    api_key=api_key,
+                )
+                if (
+                    model_metadata.model_dependencies
+                    and not allow_loading_dependency_models
+                ):
+                    raise CorruptedModelPackageError(
+                        message=f"Could not load model {model_id_or_path} as it defines another models which are "
+                        f"it's dependency, but the auto-loader prevents loading dependencies at certain "
+                        f"nesting depth to avoid excessive resolution procedure. This is a limitation of "
+                        f"current implementation. Provide us the context of your use-case to get help.",
+                        help_url="https://todo",
+                    )
+                if model_metadata.model_id != model_id_or_path:
+                    model_access_manager.on_model_alias_discovered(
+                        alias=model_id_or_path,
+                        model_id=model_metadata.model_id,
+                    )
+                model_dependencies = model_metadata.model_dependencies or []
+                for model_dependency in model_dependencies:
+                    model_access_manager.on_model_dependency_discovered(
+                        base_model_id=model_dependency.model_id,
+                        base_model_package_id=model_dependency.model_package_id,
+                        dependent_model_id=model_metadata.model_id,
+                    )
+                for model_package in model_metadata.model_packages:
+                    package_access_identifiers = AccessIdentifiers(
+                        model_id=model_metadata.model_id,
+                        package_id=model_package.package_id,
+                        api_key=api_key,
+                    )
+                    model_access_manager.on_model_package_access_granted(
+                        package_access_identifiers
+                    )
+            except UnauthorizedModelAccessError as error:
+                model_access_manager.on_model_access_forbidden(
+                    model_id=model_id_or_path, api_key=api_key
+                )
+                raise error
+            # here we verify if de-aliasing or access confirmation from auth master changed something
+            model_from_access_manager = model_access_manager.retrieve_model_instance(
+                model_id=model_id_or_path,
+                package_id=model_package_id,
+                api_key=api_key,
+                loading_parameter_digest=auto_negotiation_hash,
+            )
+            if model_from_access_manager:
+                return model_from_access_manager
+            matching_model_packages = negotiate_model_packages(
+                model_architecture=model_metadata.model_architecture,
+                task_type=model_metadata.task_type,
+                model_packages=model_metadata.model_packages,
+                requested_model_package_id=model_package_id,
+                requested_backends=backend,
+                requested_batch_size=batch_size,
+                requested_quantization=quantization,
+                device=device,
+                onnx_execution_providers=onnx_execution_providers,
+                allow_untrusted_packages=allow_untrusted_packages,
+                trt_engine_host_code_allowed=trt_engine_host_code_allowed,
+                nms_fusion_preferences=nms_fusion_preferences,
+                verbose=verbose,
+            )
+            model_dependencies_instances = {}
+            model_dependencies_directories = {}
+            dependency_models_params = dependency_models_params or {}
+            for model_dependency in model_dependencies:
+                dependency_params = dependency_models_params.get(
+                    model_dependency.name, {}
+                )
+                dependency_params["model_id_or_path"] = model_dependency.model_id
+                dependency_params["model_package_id"] = (
+                    model_dependency.model_package_id
+                )
+                resolved_model_parameters = prepare_dependency_model_parameters(
+                    model_parameters=dependency_params
+                )
+                verbose_info(
+                    message=f"Initialising dependent model: {model_dependency.model_id}",
+                    verbose_requested=verbose,
+                )
+                def model_directory_pointer(model_dir: str) -> None:
+                    model_dependencies_directories[model_dependency.name] = model_dir
+                for name, value in forwarded_kwargs_values.items():
+                    if name not in resolved_model_parameters.model_extra:
+                        resolved_model_parameters.model_extra[name] = value
+                dependency_instance = AutoModel.from_pretrained(
+                    model_id_or_path=resolved_model_parameters.model_id_or_path,
+                    weights_provider=weights_provider,
+                    api_key=api_key,
+                    model_package_id=resolved_model_parameters.model_package_id,
+                    backend=resolved_model_parameters.backend,
+                    batch_size=resolved_model_parameters.batch_size,
+                    quantization=resolved_model_parameters.quantization,
+                    onnx_execution_providers=resolved_model_parameters.onnx_execution_providers,
+                    device=resolved_model_parameters.device,
+                    default_onnx_trt_options=resolved_model_parameters.default_onnx_trt_options,
+                    max_package_loading_attempts=max_package_loading_attempts,
+                    verbose=verbose,
+                    model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+                    allow_untrusted_packages=allow_untrusted_packages,
+                    trt_engine_host_code_allowed=trt_engine_host_code_allowed,
+                    allow_local_code_packages=allow_local_code_packages,
+                    verify_hash_while_download=verify_hash_while_download,
+                    download_files_without_hash=download_files_without_hash,
+                    use_auto_resolution_cache=use_auto_resolution_cache,
+                    auto_resolution_cache=auto_resolution_cache,
+                    allow_direct_local_storage_loading=allow_direct_local_storage_loading,
+                    model_access_manager=model_access_manager,
+                    nms_fusion_preferences=resolved_model_parameters.nms_fusion_preferences,
+                    model_type=resolved_model_parameters.model_type,
+                    task_type=resolved_model_parameters.task_type,
+                    allow_loading_dependency_models=False,
+                    dependency_models_params=None,
+                    point_model_directory=model_directory_pointer,
+                    **resolved_model_parameters.kwargs,
+                )
+                model_dependencies_instances[model_dependency.name] = (
+                    dependency_instance
+                )
+            return attempt_loading_matching_model_packages(
+                model_id=model_id_or_path,
+                model_architecture=model_metadata.model_architecture,
+                task_type=model_metadata.task_type,
+                matching_model_packages=matching_model_packages,
+                model_init_kwargs=model_init_kwargs,
+                model_access_manager=model_access_manager,
+                auto_negotiation_hash=auto_negotiation_hash,
+                api_key=api_key,
+                model_dependencies=model_metadata.model_dependencies,
+                model_dependencies_instances=model_dependencies_instances,
+                model_dependencies_directories=model_dependencies_directories,
+                max_package_loading_attempts=max_package_loading_attempts,
+                model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+                verify_hash_while_download=verify_hash_while_download,
+                download_files_without_hash=download_files_without_hash,
+                auto_resolution_cache=auto_resolution_cache,
+                use_auto_resolution_cache=use_auto_resolution_cache,
+                point_model_directory=point_model_directory,
+                verbose=verbose,
+            )
+        if not allow_direct_local_storage_loading:
+            raise DirectLocalStorageAccessError(
+                message="Attempted to load model directly pointing local path, rather than model ID. This "
+                "operation is forbidden as AutoModel.from_pretrained(...) was used with "
+                "`allow_direct_local_storage_loading=False`. If you are running `inference-models` outside Roboflow "
+                "hosted solutions - verify your setup. If you see this error on Roboflow platform - this "
+                "feature was disabled for security reason. In rare cases when you use valid model ID, the "
+                "clash of ID with local path may cause this error - we ask you to report the issue here: "
+                "https://github.com/roboflow/inference/issues.",
+                help_url="https://todo",
+            )
+        return attempt_loading_model_from_local_storage(
+            model_dir_or_weights_path=model_id_or_path,
+            allow_local_code_packages=allow_local_code_packages,
+            model_init_kwargs=model_init_kwargs,
+            model_type=model_type,
+            task_type=task_type,
+            backend_type=backend,
+        )
+def attempt_loading_model_with_auto_load_cache(
+    use_auto_resolution_cache: bool,
+    auto_resolution_cache: AutoResolutionCache,
+    auto_negotiation_hash: str,
+    model_access_manager: ModelAccessManager,
+    model_name_or_path: str,
+    model_init_kwargs: dict,
+    api_key: Optional[str],
+    allow_loading_dependency_models: bool,
+    forwarded_kwargs_values: Dict[str, Any],
+    verbose: bool = False,
+    weights_provider: str = "roboflow",
+    max_package_loading_attempts: Optional[int] = None,
+    model_download_file_lock_acquire_timeout: int = 10,
+    allow_untrusted_packages: bool = False,
+    trt_engine_host_code_allowed: bool = True,
+    allow_local_code_packages: bool = True,
+    verify_hash_while_download: bool = True,
+    download_files_without_hash: bool = False,
+    allow_direct_local_storage_loading: bool = True,
+    dependency_models_params: Optional[dict] = None,
+) -> Optional[AnyModel]:
+    if not use_auto_resolution_cache:
+        return None
+    verbose_info(
+        message=f"Attempt to load model {model_name_or_path} using auto-load cache.",
+        verbose_requested=verbose,
+    )
+    cache_entry = auto_resolution_cache.retrieve(
+        auto_negotiation_hash=auto_negotiation_hash
+    )
+    if cache_entry is None:
+        verbose_info(
+            message=f"Could not find auto-load cache for model {model_name_or_path}.",
+            verbose_requested=verbose,
+        )
+        return None
+    if not model_access_manager.is_model_package_access_granted(
+        model_id=cache_entry.model_id,
+        package_id=cache_entry.model_package_id,
+        api_key=api_key,
+    ):
+        return None
+    if not all_files_exist(files=cache_entry.resolved_files):
+        verbose_info(
+            message=f"Could not find all required files denoted in auto-load cache for model {model_name_or_path}.",
+            verbose_requested=verbose,
+        )
+        return None
+    try:
+        model_dependencies = cache_entry.model_dependencies or []
+        if model_dependencies and not allow_loading_dependency_models:
+            raise CorruptedModelPackageError(
+                message=f"Could not load model {cache_entry.model_id} as it defines another models which are "
+                f"it's dependency, but the auto-loader prevents loading dependencies at certain "
+                f"nesting depth to avoid excessive resolution procedure. This is a limitation of "
+                f"current implementation. Provide us the context of your use-case to get help.",
+                help_url="https://todo",
+            )
+        model_dependencies_instances = {}
+        dependency_models_params = dependency_models_params or {}
+        for model_dependency in model_dependencies:
+            dependency_params = dependency_models_params.get(model_dependency.name, {})
+            dependency_params["model_id_or_path"] = model_dependency.model_id
+            dependency_params["model_package_id"] = model_dependency.model_package_id
+            resolved_model_parameters = prepare_dependency_model_parameters(
+                model_parameters=dependency_params
+            )
+            for name, value in forwarded_kwargs_values.items():
+                if name not in resolved_model_parameters.model_extra:
+                    resolved_model_parameters.model_extra[name] = value
+            verbose_info(
+                message=f"Initialising dependent model: {model_dependency.model_id}",
+                verbose_requested=verbose,
+            )
+            dependency_instance = AutoModel.from_pretrained(
+                model_id_or_path=resolved_model_parameters.model_id_or_path,
+                weights_provider=weights_provider,
+                api_key=api_key,
+                model_package_id=resolved_model_parameters.model_package_id,
+                backend=resolved_model_parameters.backend,
+                batch_size=resolved_model_parameters.batch_size,
+                quantization=resolved_model_parameters.quantization,
+                onnx_execution_providers=resolved_model_parameters.onnx_execution_providers,
+                device=resolved_model_parameters.device,
+                default_onnx_trt_options=resolved_model_parameters.default_onnx_trt_options,
+                max_package_loading_attempts=max_package_loading_attempts,
+                verbose=verbose,
+                model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+                allow_untrusted_packages=allow_untrusted_packages,
+                trt_engine_host_code_allowed=trt_engine_host_code_allowed,
+                allow_local_code_packages=allow_local_code_packages,
+                verify_hash_while_download=verify_hash_while_download,
+                download_files_without_hash=download_files_without_hash,
+                use_auto_resolution_cache=use_auto_resolution_cache,
+                auto_resolution_cache=auto_resolution_cache,
+                allow_direct_local_storage_loading=allow_direct_local_storage_loading,
+                model_access_manager=model_access_manager,
+                nms_fusion_preferences=resolved_model_parameters.nms_fusion_preferences,
+                model_type=resolved_model_parameters.model_type,
+                task_type=resolved_model_parameters.task_type,
+                allow_loading_dependency_models=False,
+                dependency_models_params=None,
+                **resolved_model_parameters.kwargs,
+            )
+            model_dependencies_instances[model_dependency.name] = dependency_instance
+        model_class = resolve_model_class(
+            model_architecture=cache_entry.model_architecture,
+            task_type=cache_entry.task_type,
+            backend=cache_entry.backend_type,
+        )
+        model_package_cache_dir = generate_model_package_cache_path(
+            model_id=cache_entry.model_id,
+            package_id=cache_entry.model_package_id,
+        )
+        model_init_kwargs[MODEL_DEPENDENCIES_KEY] = model_dependencies_instances
+        model = model_class.from_pretrained(
+            model_package_cache_dir, **model_init_kwargs
+        )
+        verbose_info(
+            message=f"Successfully loaded model {model_name_or_path} using auto-loading cache.",
+            verbose_requested=verbose,
+        )
+        return model
+    except Exception as error:
+        LOGGER.warning(
+            f"Encountered error {error} of type {type(error)} when attempted to load model using "
+            f"auto-load cache. This may indicate corrupted cache of inference bug. Contact Roboflow submitting "
+            f"issue under: https://github.com/roboflow/inference/issues/"
+        )
+        auto_resolution_cache.invalidate(auto_negotiation_hash=auto_negotiation_hash)
+        return None
+def all_files_exist(files: List[str]) -> bool:
+    return all(os.path.exists(f) for f in files)
+def attempt_loading_matching_model_packages(
+    model_id: str,
+    model_architecture: ModelArchitecture,
+    task_type: Optional[TaskType],
+    matching_model_packages: List[ModelPackageMetadata],
+    model_init_kwargs: dict,
+    model_access_manager: ModelAccessManager,
+    auto_resolution_cache: AutoResolutionCache,
+    auto_negotiation_hash: str,
+    api_key: Optional[str],
+    model_dependencies: Optional[List[ModelDependency]],
+    model_dependencies_instances: Dict[str, AnyModel],
+    model_dependencies_directories: Dict[str, str],
+    max_package_loading_attempts: Optional[int] = None,
+    model_download_file_lock_acquire_timeout: int = 10,
+    verbose: bool = True,
+    verify_hash_while_download: bool = True,
+    download_files_without_hash: bool = False,
+    use_auto_resolution_cache: bool = True,
+    point_model_directory: Optional[Callable[[str], None]] = None,
+) -> AnyModel:
+    if max_package_loading_attempts is not None:
+        matching_model_packages = matching_model_packages[:max_package_loading_attempts]
+    if not matching_model_packages:
+        raise ModelLoadingError(
+            message=f"Cannot load model {model_id} - no matching model package candidates for given model "
+            f"running in this environment.",
+            help_url="https://todo",
+        )
+    failed_load_attempts: List[Tuple[str, Exception]] = []
+    for model_package in matching_model_packages:
+        access_identifiers = AccessIdentifiers(
+            model_id=model_id,
+            package_id=model_package.package_id,
+            api_key=api_key,
+        )
+        verbose_info(
+            message=f"Attempt to load model package: {model_package.get_summary()}",
+            verbose_requested=verbose,
+        )
+        try:
+            model, model_package_cache_dir = initialize_model(
+                model_id=model_id,
+                model_architecture=model_architecture,
+                task_type=task_type,
+                model_package=model_package,
+                model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+                model_init_kwargs=model_init_kwargs,
+                auto_resolution_cache=auto_resolution_cache,
+                auto_negotiation_hash=auto_negotiation_hash,
+                model_dependencies=model_dependencies,
+                model_dependencies_instances=model_dependencies_instances,
+                model_dependencies_directories=model_dependencies_directories,
+                verify_hash_while_download=verify_hash_while_download,
+                download_files_without_hash=download_files_without_hash,
+                on_file_created=partial(
+                    model_access_manager.on_file_created,
+                    access_identifiers=access_identifiers,
+                ),
+                on_file_renamed=partial(
+                    model_access_manager.on_file_renamed,
+                    access_identifiers=access_identifiers,
+                ),
+                on_symlink_created=partial(
+                    model_access_manager.on_symlink_created,
+                    access_identifiers=access_identifiers,
+                ),
+                on_symlink_deleted=model_access_manager.on_symlink_deleted,
+                use_auto_resolution_cache=use_auto_resolution_cache,
+            )
+            model_access_manager.on_model_loaded(
+                model=model,
+                access_identifiers=access_identifiers,
+                model_storage_path=model_package_cache_dir,
+            )
+            if point_model_directory:
+                point_model_directory(model_package_cache_dir)
+            return model
+        except Exception as error:
+            LOGGER.warning(
+                f"Model package with id {model_package.package_id} that was selected to be loaded "
+                f"failed to load with error: {error} of type {error.__class__.__name__}. This may "
+                f"be caused several issues. If you see this warning after manually specifying model "
+                f"package to be loaded - make sure that all required dependencies are installed. If "
+                f"that warning is displayed when the model package was auto-selected - there is most "
+                f"likely a bug in `inference-models` and you should raise an issue providing full context of "
+                f"the event. https://github.com/roboflow/inference/issues"
+            )
+            failed_load_attempts.append((model_package.package_id, error))
+    summary_of_errors = "\n".join(
+        f"\t* model_package_id={model_package_id} error={error} error_type={error.__class__.__name__}"
+        for model_package_id, error in failed_load_attempts
+    )
+    raise ModelLoadingError(
+        message=f"Could not load any of model package candidate for model {model_id}. This may "
+        f"be caused several issues. If you see this warning after manually specifying model "
+        f"package to be loaded - make sure that all required dependencies are installed. If "
+        f"that warning is displayed when the model package was auto-selected - there is most "
+        f"likely a bug in `inference-models` and you should raise an issue providing full context of "
+        f"the event. https://github.com/roboflow/inference/issues\n\n"
+        f"Here is the summary of errors for specific model packages:\n{summary_of_errors}\n\n",
+        help_url="https://todo",
+    )
+def initialize_model(
+    model_id: str,
+    model_architecture: ModelArchitecture,
+    task_type: Optional[TaskType],
+    model_package: ModelPackageMetadata,
+    model_init_kwargs: dict,
+    auto_resolution_cache: AutoResolutionCache,
+    auto_negotiation_hash: str,
+    model_dependencies: Optional[List[ModelDependency]],
+    model_dependencies_instances: Dict[str, AnyModel],
+    model_dependencies_directories: Dict[str, str],
+    model_download_file_lock_acquire_timeout: int = 10,
+    verify_hash_while_download: bool = True,
+    download_files_without_hash: bool = False,
+    on_file_created: Optional[Callable[[str], None]] = None,
+    on_file_renamed: Optional[Callable[[str, str], None]] = None,
+    on_symlink_created: Optional[Callable[[str, str], None]] = None,
+    on_symlink_deleted: Optional[Callable[[str], None]] = None,
+    use_auto_resolution_cache: bool = True,
+) -> Tuple[AnyModel, str]:
+    model_class = resolve_model_class(
+        model_architecture=model_architecture,
+        task_type=task_type,
+        backend=model_package.backend,
+    )
+    for artefact in model_package.package_artefacts:
+        if artefact.file_handle == MODEL_CONFIG_FILE_NAME:
+            raise CorruptedModelPackageError(
+                message=f"For model with id=`{model_id}` and package={model_package.package_id} discovered "
+                f"artefact named `{MODEL_CONFIG_FILE_NAME}` which collides with the config file that "
+                f"inference is supposed to create for a model in order for compatibility with offline "
+                f"loaders. This problem indicate a violation of model package contract and requires change in "
+                f"model package structure. If you experience this issue using hosted Roboflow solution, contact "
+                f"us to solve the problem.",
+                help_url="https://todo",
+            )
+    files_specs = [
+        (a.file_handle, a.download_url, a.md5_hash)
+        for a in model_package.package_artefacts
+    ]
+    file_specs_with_hash = [f for f in files_specs if f[2] is not None]
+    file_specs_without_hash = [f for f in files_specs if f[2] is None]
+    shared_blobs_dir = generate_shared_blobs_path()
+    model_package_cache_dir = generate_model_package_cache_path(
+        model_id=model_id,
+        package_id=model_package.package_id,
+    )
+    os.makedirs(model_package_cache_dir, exist_ok=True)
+    shared_files_mapping = download_files_to_directory(
+        target_dir=shared_blobs_dir,
+        files_specs=file_specs_with_hash,
+        file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+        verify_hash_while_download=verify_hash_while_download,
+        download_files_without_hash=download_files_without_hash,
+        name_after="md5_hash",
+        on_file_created=on_file_created,
+        on_file_renamed=on_file_renamed,
+    )
+    model_specific_files_mapping = download_files_to_directory(
+        target_dir=model_package_cache_dir,
+        files_specs=file_specs_without_hash,
+        file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+        verify_hash_while_download=verify_hash_while_download,
+        download_files_without_hash=download_files_without_hash,
+        on_file_created=on_file_created,
+        on_file_renamed=on_file_renamed,
+    )
+    symlinks_mapping = create_symlinks_to_shared_blobs(
+        model_dir=model_package_cache_dir,
+        shared_files_mapping=shared_files_mapping,
+        model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+        on_symlink_created=on_symlink_created,
+        on_symlink_deleted=on_symlink_deleted,
+    )
+    config_path = os.path.join(model_package_cache_dir, MODEL_CONFIG_FILE_NAME)
+    dump_model_config_for_offline_use(
+        config_path=config_path,
+        model_architecture=model_architecture,
+        task_type=task_type,
+        backend_type=model_package.backend,
+        file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+        on_file_created=on_file_created,
+    )
+    resolved_files = set(shared_files_mapping.values())
+    resolved_files.update(model_specific_files_mapping.values())
+    resolved_files.update(symlinks_mapping.values())
+    resolved_files.add(config_path)
+    dependencies_resolved_files = handle_dependencies_directories_creation(
+        model_package_cache_dir=model_package_cache_dir,
+        model_dependencies_directories=model_dependencies_directories,
+        model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+        on_symlink_created=on_symlink_created,
+        on_symlink_deleted=on_symlink_deleted,
+    )
+    resolved_files.update(dependencies_resolved_files)
+    model_init_kwargs[MODEL_DEPENDENCIES_KEY] = model_dependencies_instances
+    model = model_class.from_pretrained(model_package_cache_dir, **model_init_kwargs)
+    dump_auto_resolution_cache(
+        use_auto_resolution_cache=use_auto_resolution_cache,
+        auto_resolution_cache=auto_resolution_cache,
+        auto_negotiation_hash=auto_negotiation_hash,
+        model_id=model_id,
+        model_package_id=model_package.package_id,
+        model_architecture=model_architecture,
+        task_type=task_type,
+        backend_type=model_package.backend,
+        resolved_files=resolved_files,
+        model_dependencies=model_dependencies,
+    )
+    return model, model_package_cache_dir
+def create_symlinks_to_shared_blobs(
+    model_dir: str,
+    shared_files_mapping: Dict[FileHandle, str],
+    model_download_file_lock_acquire_timeout: int = 10,
+    on_symlink_created: Optional[Callable[[str, str], None]] = None,
+    on_symlink_deleted: Optional[Callable[[str], None]] = None,
+) -> Dict[str, str]:
+    # this function will not override existing files
+    os.makedirs(model_dir, exist_ok=True)
+    result = {}
+    for file_handle, source_path in shared_files_mapping.items():
+        link_name = os.path.join(model_dir, file_handle)
+        target_path = shared_files_mapping[file_handle]
+        result[file_handle] = link_name
+        if os.path.exists(link_name) and (
+            not os.path.islink(link_name) or os.path.realpath(link_name) == target_path
+        ):
+            continue
+        handle_symlink_creation(
+            target_path=target_path,
+            link_name=link_name,
+            model_download_file_lock_acquire_timeout=model_download_file_lock_acquire_timeout,
+            on_symlink_created=on_symlink_created,
+            on_symlink_deleted=on_symlink_deleted,
+        )
+    return result
+def handle_symlink_creation(
+    target_path: str,
+    link_name: str,
+    model_download_file_lock_acquire_timeout: int = 10,
+    on_symlink_created: Optional[Callable[[str, str], None]] = None,
+    on_symlink_deleted: Optional[Callable[[str], None]] = None,
+) -> None:
+    link_dir, link_file_name = os.path.split(os.path.abspath(link_name))
+    os.makedirs(link_dir, exist_ok=True)
+    lock_path = os.path.join(link_dir, f".{link_file_name}.lock")
+    with FileLock(lock_path, timeout=model_download_file_lock_acquire_timeout):
+        if os.path.islink(link_name):
+            # file does not exist, but is link = broken symlink - we should purge
+            os.remove(link_name)
+            if on_symlink_deleted:
+                on_symlink_deleted(link_name)
+        os.symlink(target_path, link_name)
+        if on_symlink_created:
+            on_symlink_created(target_path, link_name)
+def dump_model_config_for_offline_use(
+    config_path: str,
+    model_architecture: Optional[ModelArchitecture],
+    task_type: TaskType,
+    backend_type: Optional[BackendType],
+    file_lock_acquire_timeout: int,
+    on_file_created: Optional[Callable[[str], None]] = None,
+) -> None:
+    if os.path.exists(config_path):
+        # we kinda trust that what we did previously is right - in case when the file
+        # gets corrupted we may end up in problem - to be verified empirically
+        return None
+    target_file_dir, target_file_name = os.path.split(config_path)
+    lock_path = os.path.join(target_file_dir, f".{target_file_name}.lock")
+    with FileLock(lock_path, timeout=file_lock_acquire_timeout):
+        dump_json(
+            path=config_path,
+            content={
+                "model_architecture": model_architecture,
+                "task_type": task_type,
+                "backend_type": backend_type,
+            },
+        )
+        if on_file_created:
+            on_file_created(config_path)
+def handle_dependencies_directories_creation(
+    model_package_cache_dir: str,
+    model_dependencies_directories: Dict[str, str],
+    model_download_file_lock_acquire_timeout: int = 10,
+    on_symlink_created: Optional[Callable[[str, str], None]] = None,
+    on_symlink_deleted: Optional[Callable[[str], None]] = None,
+) -> Set[str]:
+    resolved_files = set()
+    if not model_dependencies_directories:
+        return resolved_files
+    for dependency_name, dependency_directory in model_dependencies_directories.items():
+        dependency_files = scan_dependency_directory_for_resolved_files(
+            dependency_directory=dependency_directory
+        )
+        resolved_files.update(dependency_files)
+        dependencies_sub_dir = os.path.join(
+            model_package_cache_dir, MODEL_DEPENDENCIES_SUB_DIR
+        )
+        target_dependency_dir = os.path.join(dependencies_sub_dir, dependency_name)
+        os.makedirs(dependencies_sub_dir, exist_ok=True)
+        dependency_lock_path = os.path.join(
+            dependencies_sub_dir, f".{dependency_name}.lock"
+        )
+        with FileLock(
+            dependency_lock_path, timeout=model_download_file_lock_acquire_timeout
+        ):
+            if os.path.exists(target_dependency_dir) and os.path.islink(
+                target_dependency_dir
+            ):
+                os.remove(target_dependency_dir)
+                if on_symlink_deleted:
+                    on_symlink_deleted(target_dependency_dir)
+            if not os.path.exists(target_dependency_dir):
+                # Question: is it ok to only try to remove symlink and avoid doing anything else
+                # if we encounter actual file / dir there?
+                os.symlink(dependency_directory, target_dependency_dir)
+                if on_symlink_created:
+                    on_symlink_created(dependency_directory, target_dependency_dir)
+    return resolved_files
+def scan_dependency_directory_for_resolved_files(
+    dependency_directory: str,
+) -> List[str]:
+    # we do not follow symlinks here, as the assumption is that we only support one level of nesting
+    # for packages, wo when we have dependency - this model must not have dependencies, so
+    # we will not encounter directories which are symlinks to be followed.
+    results = []
+    for current_dir, _, files in os.walk(dependency_directory):
+        for file in files:
+            if file.startswith(".") and file.endswith(".lock"):
+                continue
+            full_path = os.path.abspath(os.path.join(current_dir, file))
+            results.append(full_path)
+            if os.path.islink(full_path):
+                results.append(os.readlink(full_path))
+    return results
+def dump_auto_resolution_cache(
+    use_auto_resolution_cache: bool,
+    auto_resolution_cache: AutoResolutionCache,
+    auto_negotiation_hash: str,
+    model_id: str,
+    model_package_id: str,
+    model_architecture: Optional[ModelArchitecture],
+    task_type: TaskType,
+    backend_type: Optional[BackendType],
+    resolved_files: Set[str],
+    model_dependencies: Optional[List[ModelDependency]],
+) -> None:
+    if not use_auto_resolution_cache:
+        return None
+    cache_content = AutoResolutionCacheEntry(
+        model_id=model_id,
+        model_package_id=model_package_id,
+        resolved_files=resolved_files,
+        model_architecture=model_architecture,
+        task_type=task_type,
+        backend_type=backend_type,
+        created_at=datetime.now(),
+        model_dependencies=model_dependencies,
+    )
+    auto_resolution_cache.register(
+        auto_negotiation_hash=auto_negotiation_hash, cache_entry=cache_content
+    )
+def generate_shared_blobs_path() -> str:
+    return os.path.join(INFERENCE_HOME, "shared-blobs")
+def generate_model_package_cache_path(model_id: str, package_id: str) -> str:
+    ensure_package_id_is_os_safe(model_id=model_id, package_id=package_id)
+    model_id_slug = slugify_model_id_to_os_safe_format(model_id=model_id)
+    return os.path.join(INFERENCE_HOME, "models-cache", model_id_slug, package_id)
+def ensure_package_id_is_os_safe(model_id: str, package_id: str) -> None:
+    if re.search(r"[^A-Za-z0-9]", package_id):
+        raise InsecureModelIdentifierError(
+            message=f"Attempted to load model: {model_id} using package ID: {package_id} which "
+            f"has invalid format. ID is expected to contain only ASCII characters and numbers to "
+            f"ensure safety of local cache. If you see this error running your model on Roboflow platform, "
+            f"raise the issue: https://github.com/roboflow/inference/issues. If you are running `inference` "
+            f"outside of the platform, verify that your weights provider keeps the model packages identifiers "
+            f"in the expected format.",
+            help_url="https://TODO",
+        )
+def slugify_model_id_to_os_safe_format(model_id: str) -> str:
+    # Only ASCII
+    model_id_slug = re.sub(r"[^A-Za-z0-9_-]+", "-", model_id)
+    # Collapse multiple underscores/dashes
+    model_id_slug = re.sub(r"[_-]{2,}", "-", model_id_slug)
+    if not model_id_slug:
+        model_id_slug = "special-char-only-model-id"
+    if len(model_id_slug) > 48:
+        model_id_slug = model_id_slug[:48]
+    digest = hashlib.blake2s(model_id.encode("utf-8"), digest_size=4).hexdigest()
+    return f"{model_id_slug}-{digest}"
+def attempt_loading_model_from_local_storage(
+    model_dir_or_weights_path: str,
+    allow_local_code_packages: bool,
+    model_init_kwargs: dict,
+    model_type: Optional[str] = None,
+    task_type: Optional[str] = None,
+    backend_type: Optional[
+        Union[str, BackendType, List[Union[str, BackendType]]]
+    ] = None,
+) -> AnyModel:
+    if os.path.isfile(model_dir_or_weights_path):
+        return attempt_loading_model_from_checkpoint(
+            checkpoint_path=model_dir_or_weights_path,
+            model_init_kwargs=model_init_kwargs,
+            model_type=model_type,
+            task_type=task_type,
+            backend_type=backend_type,
+        )
+    config_path = os.path.join(model_dir_or_weights_path, MODEL_CONFIG_FILE_NAME)
+    model_config = parse_model_config(config_path=config_path)
+    if model_config.is_library_model():
+        return load_library_model_from_local_dir(
+            model_dir=model_dir_or_weights_path,
+            model_config=model_config,
+            model_init_kwargs=model_init_kwargs,
+        )
+    if not allow_local_code_packages:
+        raise ModelLoadingError(
+            message=f"Attempted to load model from local package with arbitrary code. This is not allowed in "
+            f"this environment. To let inference loading such models, use `allow_local_code_packages=True` "
+            f"parameter of `AutoModel.from_pretrained(...)`. If you see this error while using one of Roboflow "
+            f"hosted solution - contact us to solve the problem.",
+            help_url="https://todo",
+        )
+    return load_model_from_local_package_with_arbitrary_code(
+        model_dir=model_dir_or_weights_path,
+        model_config=model_config,
+        model_init_kwargs=model_init_kwargs,
+    )
+def attempt_loading_model_from_checkpoint(
+    checkpoint_path: str,
+    model_init_kwargs: dict,
+    model_type: Optional[str] = None,
+    task_type: Optional[str] = None,
+    backend_type: Optional[
+        Union[str, BackendType, List[Union[str, BackendType]]]
+    ] = None,
+) -> AnyModel:
+    model_architecture, task_type, backend_type = resolve_models_registry_entry(
+        model_type=model_type,
+        task_type=task_type,
+        backend_type=backend_type,
+    )
+    model_init_kwargs["model_type"] = model_type
+    model_class = resolve_model_class(
+        model_architecture=model_architecture,
+        task_type=task_type,
+        backend=backend_type,
+    )
+    return model_class.from_pretrained(checkpoint_path, **model_init_kwargs)
+def resolve_models_registry_entry(
+    model_type: Optional[str],
+    task_type: Optional[str] = None,
+    backend_type: Optional[
+        Union[str, BackendType, List[Union[str, BackendType]]]
+    ] = None,
+) -> Tuple[str, str, BackendType]:
+    #  TODO: in the future this check will grow in size
+    if not model_type:
+        raise ModelLoadingError(
+            message="When loading model directly from checkpoint path, `model_type` parameter must be specified. "
+            "Use one of the supported value, for example `rfdetr-nano` in case you refer checkpoint of "
+            "RFDetr Nano model.",
+            help_url="https://todo",
+        )
+    if model_type not in MODEL_TYPES_TO_LOAD_FROM_CHECKPOINT:
+        raise ModelLoadingError(
+            message="When loading model directly from checkpoint path, `model_type` parameter must define "
+            "one of the type of model that support loading directly from the checkpoints. "
+            f"Models supported in current version: {MODEL_TYPES_TO_LOAD_FROM_CHECKPOINT}",
+            help_url="https://todo",
+        )
+    # a bit of hard coding here, over time we must maintain
+    model_architecture = "rfdetr"
+    if task_type is None:
+        if model_type == "rfdetr-seg-preview":
+            task_type = INSTANCE_SEGMENTATION_TASK
+        else:
+            task_type = OBJECT_DETECTION_TASK
+    if task_type not in {OBJECT_DETECTION_TASK, INSTANCE_SEGMENTATION_TASK}:
+        raise ModelLoadingError(
+            message=f"When loading model directly from checkpoint path, set `model_type` as {model_type} and "
+            f"`task_type` as {task_type}, whereas selected model do only support `{OBJECT_DETECTION_TASK}` "
+            f"task while loading from checkpoint file.",
+            help_url="https://todo",
+        )
+    if backend_type is None:
+        backend_type = BackendType.TORCH
+    if isinstance(backend_type, list) and len(backend_type) != 1:
+        if len(backend_type) != 1:
+            raise ModelLoadingError(
+                message=f"When loading model directly from checkpoint path, set `backend` parameter to be {backend_type}, "
+                f"whereas it is only supported to pass a single value.",
+                help_url="https://todo",
+            )
+        backend_type = backend_type[0]
+    if isinstance(backend_type, str):
+        backend_type = parse_backend_type(value=backend_type)
+    if backend_type is not BackendType.TORCH:
+        raise ModelLoadingError(
+            message=f"When loading model directly from checkpoint path, selected the following backend {backend_type}, "
+            f"but the backend supported for model {model_type} is {BackendType.TORCH}",
+            help_url="https://todo",
+        )
+    return model_architecture, task_type, backend_type
+def parse_model_config(config_path: str) -> InferenceModelConfig:
+    if not os.path.isfile(config_path):
+        raise ModelLoadingError(
+            message=f"Could not find model config while attempting to load model from "
+            f"local directory. This error may be caused by misconfiguration of model package (lack of config "
+            f"file), as well as by clash between model_id or model alias and contents of local disc drive which "
+            f"is possible when you have local directory in current dir which has the name colliding with the "
+            f"model you attempt to load. If your intent was to load model from remote backend (not local "
+            f"storage) - verify the contents of $PWD. If you see this problem while using one of Roboflow "
+            f"hosted solutions - contact us to get help.",
+            help_url="https://todo",
+        )
+    try:
+        raw_config = read_json(path=config_path)
+    except ValueError as error:
+        raise CorruptedModelPackageError(
+            message=f"Could not decode model config while attempting to load model from "
+            f"local directory. This error may be caused by corrupted config file. Validate the content of your "
+            f"model package and check in documentation the required format of model config file. "
+            f"If you see this problem while using one of Roboflow hosted solutions - contact us to get help.",
+            help_url="https://todo",
+        ) from error
+    if not isinstance(raw_config, dict):
+        raise CorruptedModelPackageError(
+            message=f"While loading the model from local directory encountered corrupted model config file - config is "
+            f"supposed to be a dictionary, instead decoded object of type: "
+            f"{type(raw_config)}. If you see this problem while using one of Roboflow hosted solutions - "
+            f"contact us to get help. Otherwise - verify the content of your model config.",
+            help_url="https://todo",
+        )
+    backend_type = None
+    if "backend_type" in raw_config:
+        raw_backend_type = raw_config["backend_type"]
+        try:
+            backend_type = BackendType(raw_backend_type)
+        except ValueError as e:
+            raise CorruptedModelPackageError(
+                message=f"While loading the model from local directory encountered corrupted model config "
+                "- declared `backend_type` ({raw_backend_type}) is not supported by inference. "
+                f"Supported values: {list(t.value for t in BackendType)}. If you see this problem while using "
+                f"one of Roboflow hosted solutions - contact us to get help. Otherwise - verify the content "
+                f"of your model config.",
+                help_url="https://todo",
+            ) from e
+    return InferenceModelConfig(
+        model_architecture=raw_config.get("model_architecture"),
+        task_type=raw_config.get("task_type"),
+        backend_type=backend_type,
+        model_module=raw_config.get("model_module"),
+        model_class=raw_config.get("model_class"),
+    )
+def load_library_model_from_local_dir(
+    model_dir: str,
+    model_config: InferenceModelConfig,
+    model_init_kwargs: dict,
+) -> AnyModel:
+    model_class = resolve_model_class(
+        model_architecture=model_config.model_architecture,
+        task_type=model_config.task_type,
+        backend=model_config.backend_type,
+    )
+    return model_class.from_pretrained(model_dir, **model_init_kwargs)
+def load_model_from_local_package_with_arbitrary_code(
+    model_dir: str,
+    model_config: InferenceModelConfig,
+    model_init_kwargs: dict,
+) -> AnyModel:
+    if model_config.model_module is None or model_config.model_class is None:
+        raise CorruptedModelPackageError(
+            message=f"While loading the model from local directory encountered corrupted model config file. "
+            f"Config does not specify neither `model_module` name nor `model_class`, which are both  "
+            f"required to load models provided with arbitrary code. If you see this problem while using "
+            f"one of Roboflow hosted solutions - contact us to get help. Otherwise - verify the content "
+            f"of your model config.",
+            help_url="https://todo",
+        )
+    model_module_path = os.path.join(model_dir, model_config.model_module)
+    if not os.path.isfile(model_module_path):
+        raise CorruptedModelPackageError(
+            message=f"While loading the model from local directory encountered corrupted model config file. "
+            f"Config pointed module {model_config.model_module}, but there is no file under "
+            f"{model_module_path}. If you see this problem while using "
+            f"one of Roboflow hosted solutions - contact us to get help. Otherwise - verify the content "
+            f"of your model config.",
+            help_url="https://todo",
+        )
+    model_class = load_class_from_path(
+        module_path=model_module_path, class_name=model_config.model_class
+    )
+    return model_class.from_pretrained(model_dir, **model_init_kwargs)
+def load_class_from_path(module_path: str, class_name: str) -> AnyModel:
+    if not os.path.exists(module_path):
+        raise CorruptedModelPackageError(
+            message=f"When loading local model with arbitrary code, encountered issue with loading the module. "
+            "Could find the module under the path specified in model config. If you see this problem "
+            f"while using one of Roboflow hosted solutions - contact us to get help. Otherwise - verify your "
+            f"model package checking if you can load the module with model implementation within your "
+            f"python environment.",
+            help_url="https://todo",
+        )
+    module_name = os.path.splitext(os.path.basename(module_path))[0]
+    spec = importlib.util.spec_from_file_location(module_name, module_path)
+    if spec is None:
+        raise CorruptedModelPackageError(
+            message=f"When loading local model with arbitrary code, encountered issue with loading the module. "
+            "Could not build module specification. If you see this problem while using "
+            f"one of Roboflow hosted solutions - contact us to get help. Otherwise - verify your "
+            f"model package checking if you can load the module with model implementation within your "
+            f"python environment.",
+            help_url="https://todo",
+        )
+    module = importlib.util.module_from_spec(spec)
+    loader = spec.loader
+    if loader is None or not hasattr(loader, "exec_module"):
+        raise CorruptedModelPackageError(
+            message=f"When loading local model with arbitrary code, encountered issue with loading the module. "
+            "Could not execute module loader. If you see this problem while using "
+            f"one of Roboflow hosted solutions - contact us to get help. Otherwise - verify your "
+            f"model package checking if you can load the module with model implementation within your "
+            f"python environment.",
+            help_url="https://todo",
+        )
+    try:
+        loader.exec_module(module)
+    except Exception as error:
+        raise CorruptedModelPackageError(
+            message=f"When loading local model with arbitrary code, encountered issue executing the module code "
+            f"to retrieve model class. Details of the error: {error}. If you see this problem while using "
+            f"one of Roboflow hosted solutions - contact us to get help. Otherwise - verify your "
+            f"model package checking if you can load the module with model implementation within your "
+            f"python environment.",
+            help_url="https://todo",
+        )
+    if not hasattr(module, class_name):
+        raise CorruptedModelPackageError(
+            message=f"When loading local model with arbitrary code, encountered issue with loading the module. "
+            f"Module `{module_name}` has no class `{class_name}`. If you see this problem while using "
+            f"one of Roboflow hosted solutions - contact us to get help. Otherwise - verify your "
+            f"model package checking if you can load the module with model implementation within your "
+            f"python environment. It may also be the case that configuration file of the model points "
+            f"to invalid class name.",
+            help_url="https://todo",
+        )
+    return getattr(module, class_name)