inference-models 0.18.3 (inference_models-0.18.3-py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (195)
  1. inference_models/__init__.py +36 -0
  2. inference_models/configuration.py +72 -0
  3. inference_models/constants.py +2 -0
  4. inference_models/entities.py +5 -0
  5. inference_models/errors.py +137 -0
  6. inference_models/logger.py +52 -0
  7. inference_models/model_pipelines/__init__.py +0 -0
  8. inference_models/model_pipelines/auto_loaders/__init__.py +0 -0
  9. inference_models/model_pipelines/auto_loaders/core.py +120 -0
  10. inference_models/model_pipelines/auto_loaders/pipelines_registry.py +36 -0
  11. inference_models/model_pipelines/face_and_gaze_detection/__init__.py +0 -0
  12. inference_models/model_pipelines/face_and_gaze_detection/mediapipe_l2cs.py +200 -0
  13. inference_models/models/__init__.py +0 -0
  14. inference_models/models/auto_loaders/__init__.py +0 -0
  15. inference_models/models/auto_loaders/access_manager.py +168 -0
  16. inference_models/models/auto_loaders/auto_negotiation.py +1329 -0
  17. inference_models/models/auto_loaders/auto_resolution_cache.py +129 -0
  18. inference_models/models/auto_loaders/constants.py +7 -0
  19. inference_models/models/auto_loaders/core.py +1341 -0
  20. inference_models/models/auto_loaders/dependency_models.py +52 -0
  21. inference_models/models/auto_loaders/entities.py +57 -0
  22. inference_models/models/auto_loaders/models_registry.py +497 -0
  23. inference_models/models/auto_loaders/presentation_utils.py +333 -0
  24. inference_models/models/auto_loaders/ranking.py +413 -0
  25. inference_models/models/auto_loaders/utils.py +31 -0
  26. inference_models/models/base/__init__.py +0 -0
  27. inference_models/models/base/classification.py +123 -0
  28. inference_models/models/base/depth_estimation.py +62 -0
  29. inference_models/models/base/documents_parsing.py +111 -0
  30. inference_models/models/base/embeddings.py +66 -0
  31. inference_models/models/base/instance_segmentation.py +87 -0
  32. inference_models/models/base/keypoints_detection.py +93 -0
  33. inference_models/models/base/object_detection.py +143 -0
  34. inference_models/models/base/semantic_segmentation.py +74 -0
  35. inference_models/models/base/types.py +5 -0
  36. inference_models/models/clip/__init__.py +0 -0
  37. inference_models/models/clip/clip_onnx.py +148 -0
  38. inference_models/models/clip/clip_pytorch.py +104 -0
  39. inference_models/models/clip/preprocessing.py +162 -0
  40. inference_models/models/common/__init__.py +0 -0
  41. inference_models/models/common/cuda.py +30 -0
  42. inference_models/models/common/model_packages.py +25 -0
  43. inference_models/models/common/onnx.py +379 -0
  44. inference_models/models/common/roboflow/__init__.py +0 -0
  45. inference_models/models/common/roboflow/model_packages.py +361 -0
  46. inference_models/models/common/roboflow/post_processing.py +436 -0
  47. inference_models/models/common/roboflow/pre_processing.py +1332 -0
  48. inference_models/models/common/torch.py +20 -0
  49. inference_models/models/common/trt.py +266 -0
  50. inference_models/models/deep_lab_v3_plus/__init__.py +0 -0
  51. inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_onnx.py +282 -0
  52. inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_torch.py +264 -0
  53. inference_models/models/deep_lab_v3_plus/deep_lab_v3_plus_segmentation_trt.py +313 -0
  54. inference_models/models/depth_anything_v2/__init__.py +0 -0
  55. inference_models/models/depth_anything_v2/depth_anything_v2_hf.py +77 -0
  56. inference_models/models/dinov3/__init__.py +0 -0
  57. inference_models/models/dinov3/dinov3_classification_onnx.py +348 -0
  58. inference_models/models/dinov3/dinov3_classification_torch.py +323 -0
  59. inference_models/models/doctr/__init__.py +0 -0
  60. inference_models/models/doctr/doctr_torch.py +304 -0
  61. inference_models/models/easy_ocr/__init__.py +0 -0
  62. inference_models/models/easy_ocr/easy_ocr_torch.py +222 -0
  63. inference_models/models/florence2/__init__.py +0 -0
  64. inference_models/models/florence2/florence2_hf.py +897 -0
  65. inference_models/models/grounding_dino/__init__.py +0 -0
  66. inference_models/models/grounding_dino/grounding_dino_torch.py +227 -0
  67. inference_models/models/l2cs/__init__.py +0 -0
  68. inference_models/models/l2cs/l2cs_onnx.py +216 -0
  69. inference_models/models/mediapipe_face_detection/__init__.py +0 -0
  70. inference_models/models/mediapipe_face_detection/face_detection.py +203 -0
  71. inference_models/models/moondream2/__init__.py +0 -0
  72. inference_models/models/moondream2/moondream2_hf.py +281 -0
  73. inference_models/models/owlv2/__init__.py +0 -0
  74. inference_models/models/owlv2/cache.py +182 -0
  75. inference_models/models/owlv2/entities.py +112 -0
  76. inference_models/models/owlv2/owlv2_hf.py +695 -0
  77. inference_models/models/owlv2/reference_dataset.py +291 -0
  78. inference_models/models/paligemma/__init__.py +0 -0
  79. inference_models/models/paligemma/paligemma_hf.py +209 -0
  80. inference_models/models/perception_encoder/__init__.py +0 -0
  81. inference_models/models/perception_encoder/perception_encoder_pytorch.py +197 -0
  82. inference_models/models/perception_encoder/vision_encoder/__init__.py +0 -0
  83. inference_models/models/perception_encoder/vision_encoder/config.py +160 -0
  84. inference_models/models/perception_encoder/vision_encoder/pe.py +742 -0
  85. inference_models/models/perception_encoder/vision_encoder/rope.py +344 -0
  86. inference_models/models/perception_encoder/vision_encoder/tokenizer.py +342 -0
  87. inference_models/models/perception_encoder/vision_encoder/transforms.py +33 -0
  88. inference_models/models/qwen25vl/__init__.py +1 -0
  89. inference_models/models/qwen25vl/qwen25vl_hf.py +285 -0
  90. inference_models/models/resnet/__init__.py +0 -0
  91. inference_models/models/resnet/resnet_classification_onnx.py +330 -0
  92. inference_models/models/resnet/resnet_classification_torch.py +305 -0
  93. inference_models/models/resnet/resnet_classification_trt.py +369 -0
  94. inference_models/models/rfdetr/__init__.py +0 -0
  95. inference_models/models/rfdetr/backbone_builder.py +101 -0
  96. inference_models/models/rfdetr/class_remapping.py +41 -0
  97. inference_models/models/rfdetr/common.py +115 -0
  98. inference_models/models/rfdetr/default_labels.py +108 -0
  99. inference_models/models/rfdetr/dinov2_with_windowed_attn.py +1330 -0
  100. inference_models/models/rfdetr/misc.py +26 -0
  101. inference_models/models/rfdetr/ms_deform_attn.py +180 -0
  102. inference_models/models/rfdetr/ms_deform_attn_func.py +60 -0
  103. inference_models/models/rfdetr/position_encoding.py +166 -0
  104. inference_models/models/rfdetr/post_processor.py +83 -0
  105. inference_models/models/rfdetr/projector.py +373 -0
  106. inference_models/models/rfdetr/rfdetr_backbone_pytorch.py +394 -0
  107. inference_models/models/rfdetr/rfdetr_base_pytorch.py +807 -0
  108. inference_models/models/rfdetr/rfdetr_instance_segmentation_onnx.py +206 -0
  109. inference_models/models/rfdetr/rfdetr_instance_segmentation_pytorch.py +373 -0
  110. inference_models/models/rfdetr/rfdetr_instance_segmentation_trt.py +227 -0
  111. inference_models/models/rfdetr/rfdetr_object_detection_onnx.py +244 -0
  112. inference_models/models/rfdetr/rfdetr_object_detection_pytorch.py +470 -0
  113. inference_models/models/rfdetr/rfdetr_object_detection_trt.py +270 -0
  114. inference_models/models/rfdetr/segmentation_head.py +273 -0
  115. inference_models/models/rfdetr/transformer.py +767 -0
  116. inference_models/models/roboflow_instant/__init__.py +0 -0
  117. inference_models/models/roboflow_instant/roboflow_instant_hf.py +141 -0
  118. inference_models/models/sam/__init__.py +0 -0
  119. inference_models/models/sam/cache.py +147 -0
  120. inference_models/models/sam/entities.py +25 -0
  121. inference_models/models/sam/sam_torch.py +675 -0
  122. inference_models/models/sam2/__init__.py +0 -0
  123. inference_models/models/sam2/cache.py +162 -0
  124. inference_models/models/sam2/entities.py +43 -0
  125. inference_models/models/sam2/sam2_torch.py +905 -0
  126. inference_models/models/sam2_rt/__init__.py +0 -0
  127. inference_models/models/sam2_rt/sam2_pytorch.py +119 -0
  128. inference_models/models/smolvlm/__init__.py +0 -0
  129. inference_models/models/smolvlm/smolvlm_hf.py +245 -0
  130. inference_models/models/trocr/__init__.py +0 -0
  131. inference_models/models/trocr/trocr_hf.py +53 -0
  132. inference_models/models/vit/__init__.py +0 -0
  133. inference_models/models/vit/vit_classification_huggingface.py +319 -0
  134. inference_models/models/vit/vit_classification_onnx.py +326 -0
  135. inference_models/models/vit/vit_classification_trt.py +365 -0
  136. inference_models/models/yolact/__init__.py +1 -0
  137. inference_models/models/yolact/yolact_instance_segmentation_onnx.py +336 -0
  138. inference_models/models/yolact/yolact_instance_segmentation_trt.py +361 -0
  139. inference_models/models/yolo_world/__init__.py +1 -0
  140. inference_models/models/yolonas/__init__.py +0 -0
  141. inference_models/models/yolonas/nms.py +44 -0
  142. inference_models/models/yolonas/yolonas_object_detection_onnx.py +204 -0
  143. inference_models/models/yolonas/yolonas_object_detection_trt.py +230 -0
  144. inference_models/models/yolov10/__init__.py +0 -0
  145. inference_models/models/yolov10/yolov10_object_detection_onnx.py +187 -0
  146. inference_models/models/yolov10/yolov10_object_detection_trt.py +215 -0
  147. inference_models/models/yolov11/__init__.py +0 -0
  148. inference_models/models/yolov11/yolov11_onnx.py +28 -0
  149. inference_models/models/yolov11/yolov11_torch_script.py +25 -0
  150. inference_models/models/yolov11/yolov11_trt.py +21 -0
  151. inference_models/models/yolov12/__init__.py +0 -0
  152. inference_models/models/yolov12/yolov12_onnx.py +7 -0
  153. inference_models/models/yolov12/yolov12_torch_script.py +7 -0
  154. inference_models/models/yolov12/yolov12_trt.py +7 -0
  155. inference_models/models/yolov5/__init__.py +0 -0
  156. inference_models/models/yolov5/nms.py +99 -0
  157. inference_models/models/yolov5/yolov5_instance_segmentation_onnx.py +225 -0
  158. inference_models/models/yolov5/yolov5_instance_segmentation_trt.py +255 -0
  159. inference_models/models/yolov5/yolov5_object_detection_onnx.py +192 -0
  160. inference_models/models/yolov5/yolov5_object_detection_trt.py +218 -0
  161. inference_models/models/yolov7/__init__.py +0 -0
  162. inference_models/models/yolov7/yolov7_instance_segmentation_onnx.py +226 -0
  163. inference_models/models/yolov7/yolov7_instance_segmentation_trt.py +253 -0
  164. inference_models/models/yolov8/__init__.py +0 -0
  165. inference_models/models/yolov8/yolov8_classification_onnx.py +181 -0
  166. inference_models/models/yolov8/yolov8_instance_segmentation_onnx.py +239 -0
  167. inference_models/models/yolov8/yolov8_instance_segmentation_torch_script.py +201 -0
  168. inference_models/models/yolov8/yolov8_instance_segmentation_trt.py +268 -0
  169. inference_models/models/yolov8/yolov8_key_points_detection_onnx.py +263 -0
  170. inference_models/models/yolov8/yolov8_key_points_detection_torch_script.py +218 -0
  171. inference_models/models/yolov8/yolov8_key_points_detection_trt.py +287 -0
  172. inference_models/models/yolov8/yolov8_object_detection_onnx.py +213 -0
  173. inference_models/models/yolov8/yolov8_object_detection_torch_script.py +166 -0
  174. inference_models/models/yolov8/yolov8_object_detection_trt.py +231 -0
  175. inference_models/models/yolov9/__init__.py +0 -0
  176. inference_models/models/yolov9/yolov9_onnx.py +7 -0
  177. inference_models/models/yolov9/yolov9_torch_script.py +7 -0
  178. inference_models/models/yolov9/yolov9_trt.py +7 -0
  179. inference_models/runtime_introspection/__init__.py +0 -0
  180. inference_models/runtime_introspection/core.py +410 -0
  181. inference_models/utils/__init__.py +0 -0
  182. inference_models/utils/download.py +608 -0
  183. inference_models/utils/environment.py +28 -0
  184. inference_models/utils/file_system.py +51 -0
  185. inference_models/utils/hashing.py +7 -0
  186. inference_models/utils/imports.py +48 -0
  187. inference_models/utils/onnx_introspection.py +17 -0
  188. inference_models/weights_providers/__init__.py +0 -0
  189. inference_models/weights_providers/core.py +20 -0
  190. inference_models/weights_providers/entities.py +159 -0
  191. inference_models/weights_providers/roboflow.py +601 -0
  192. inference_models-0.18.3.dist-info/METADATA +466 -0
  193. inference_models-0.18.3.dist-info/RECORD +195 -0
  194. inference_models-0.18.3.dist-info/WHEEL +5 -0
  195. inference_models-0.18.3.dist-info/top_level.txt +1 -0
inference_models/utils/download.py
@@ -0,0 +1,608 @@
+ import hashlib
+ import math
+ import os
+ from concurrent.futures import FIRST_EXCEPTION, ThreadPoolExecutor, wait
+ from threading import Lock
+ from typing import Callable, Dict, List, Literal, Optional, Set, Tuple, Union
+ from uuid import uuid4
+
+ import backoff
+ import requests
+ from filelock import FileLock
+ from requests import Response, Timeout
+ from rich.progress import (
+     BarColumn,
+     DownloadColumn,
+     Progress,
+     TimeRemainingColumn,
+     TransferSpeedColumn,
+ )
+
+ from inference_models.configuration import (
+     API_CALLS_MAX_TRIES,
+     API_CALLS_TIMEOUT,
+     DISABLE_INTERACTIVE_PROGRESS_BARS,
+     IDEMPOTENT_API_REQUEST_CODES_TO_RETRY,
+ )
+ from inference_models.errors import (
+     FileHashSumMissmatch,
+     InvalidParameterError,
+     RetryError,
+     UntrustedFileError,
+ )
+ from inference_models.logger import LOGGER
+ from inference_models.utils.file_system import (
+     ensure_parent_dir_exists,
+     pre_allocate_file,
+     remove_file_if_exists,
+     stream_file_bytes,
+ )
+
+ FileHandle = str
+ DownloadUrl = str
+ MD5Hash = Optional[str]
+
+ MIN_SIZE_FOR_THREADED_DOWNLOAD = 32 * 1024 * 1024  # 32MB
+ MIN_THREAD_CHUNK_SIZE = 16 * 1024 * 1024  # 16MB
+ DEFAULT_STREAM_DOWNLOAD_CHUNK = 1 * 1024 * 1024  # 1MB
+
+
+ class HashNullObject:
+
+     def update(self, *args, **kwargs) -> None:
+         pass
+
+     def hexdigest(self) -> None:
+         return None
+
+
+ def download_files_to_directory(
+     target_dir: str,
+     files_specs: List[Tuple[FileHandle, DownloadUrl, MD5Hash]],
+     verbose: bool = True,
+     response_codes_to_retry: Optional[Set[int]] = None,
+     request_timeout: Optional[int] = None,
+     max_parallel_downloads: int = 8,
+     max_threads_per_download: int = 8,
+     file_lock_acquire_timeout: int = 10,
+     verify_hash_while_download: bool = True,
+     download_files_without_hash: bool = False,
+     name_after: Literal["file_handle", "md5_hash"] = "file_handle",
+     on_file_created: Optional[Callable[[str], None]] = None,
+     on_file_renamed: Optional[Callable[[str, str], None]] = None,
+ ) -> Dict[str, str]:
+     if name_after not in {"file_handle", "md5_hash"}:
+         raise InvalidParameterError(
+             message="Function download_files_to_directory(...) was called with "
+             f"an invalid value of parameter `name_after` - received value `{name_after}`. "
+             f"This is a bug in `inference-models` - submit a new issue at "
+             f"https://github.com/roboflow/inference/issues/",
+             help_url="https://todo",
+         )
+     if DISABLE_INTERACTIVE_PROGRESS_BARS:
+         verbose = False
+     files_mapping = construct_files_path_mapping(
+         target_dir=target_dir,
+         files_specs=files_specs,
+         name_after=name_after,
+     )
+     files_specs = exclude_existing_files(
+         files_specs=files_specs,
+         files_mapping=files_mapping,
+     )
+     if not files_specs:
+         return files_mapping
+     if response_codes_to_retry is None:
+         response_codes_to_retry = IDEMPOTENT_API_REQUEST_CODES_TO_RETRY
+     if request_timeout is None:
+         request_timeout = API_CALLS_TIMEOUT
+     if not download_files_without_hash:
+         untrusted_files = [f[1] for f in files_specs if f[2] is None]
+         if len(untrusted_files) > 0:
+             raise UntrustedFileError(
+                 message=f"Detected {len(untrusted_files)} untrusted file(s): {untrusted_files} "
+                 f"without an MD5 hash sum to verify the downloaded content. The download method was used with "
+                 f"`download_files_without_hash=False`, which prevents such files from being downloaded. If you see "
+                 f"this error while using the hosted Roboflow serving option, contact us for support.",
+                 help_url="https://todo",
+             )
+     os.makedirs(target_dir, exist_ok=True)
+     progress = Progress(
+         "[progress.description]{task.description}",
+         BarColumn(),
+         DownloadColumn(),
+         TransferSpeedColumn(),
+         TimeRemainingColumn(),
+         disable=not verbose,
+     )
+     download_id = str(uuid4())
+     with progress:
+         with ThreadPoolExecutor(max_workers=max_parallel_downloads) as executor:
+             futures = []
+             for file_handle, download_url, md5_hash in files_specs:
+                 future = executor.submit(
+                     safe_download_file,
+                     target_file_path=files_mapping[file_handle],
+                     download_url=download_url,
+                     md5_hash=md5_hash,
+                     verify_hash_while_download=verify_hash_while_download,
+                     download_id=download_id,
+                     progress=progress,
+                     response_codes_to_retry=response_codes_to_retry,
+                     request_timeout=request_timeout,
+                     max_threads_per_download=max_threads_per_download,
+                     file_lock_acquire_timeout=file_lock_acquire_timeout,
+                     on_file_created=on_file_created,
+                     on_file_renamed=on_file_renamed,
+                 )
+                 futures.append(future)
+             done_futures, pending_futures = wait(futures, return_when=FIRST_EXCEPTION)
+             for pending_future in pending_futures:
+                 pending_future.cancel()
+             _ = wait(pending_futures)
+             for future in done_futures:
+                 future_exception = future.exception()
+                 if future_exception:
+                     raise future_exception
+     return files_mapping
+
+
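A minimal usage sketch of the API above (the directory, file handle, URL, and MD5 value are hypothetical placeholders; only the `download_files_to_directory` signature comes from the code in this diff):

    from inference_models.utils.download import download_files_to_directory

    # each spec is (file_handle, download_url, md5_hash), per the type aliases above;
    # md5_hash may be None only when download_files_without_hash=True
    files_mapping = download_files_to_directory(
        target_dir="/tmp/model-cache",
        files_specs=[
            ("weights.onnx", "https://example.com/weights.onnx", "0123456789abcdef0123456789abcdef"),
        ],
        max_parallel_downloads=4,
    )
    print(files_mapping)  # {'weights.onnx': '/tmp/model-cache/weights.onnx'}

Files already present under their target paths are skipped via `exclude_existing_files`, so the call is idempotent across restarts.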
+ def construct_files_path_mapping(
+     target_dir: str,
+     files_specs: List[Tuple[FileHandle, DownloadUrl, MD5Hash]],
+     name_after: Literal["file_handle", "md5_hash"] = "file_handle",
+ ) -> Dict[FileHandle, str]:
+     result = {}
+     for file_handle, download_url, content_hash in files_specs:
+         if name_after == "md5_hash" and content_hash is None:
+             raise UntrustedFileError(
+                 message="Attempted to download a file without a declared hash sum when "
+                 "`name_after='md5_hash'` - this indicates either a misconfiguration "
+                 "of the download procedure in `inference-models` or a bug in the codebase. "
+                 "If you see this error using the hosted Roboflow solution, contact us for "
+                 "help. If running locally, verify the download code and raise an issue if you find "
+                 "a bug: https://github.com/roboflow/inference/issues/",
+                 help_url="https://todo",
+             )
+         if name_after == "md5_hash":
+             target_path = os.path.join(target_dir, content_hash)
+         else:
+             target_path = os.path.join(target_dir, file_handle)
+         result[file_handle] = target_path
+     return result
+
+
+ def exclude_existing_files(
+     files_specs: List[Tuple[FileHandle, DownloadUrl, MD5Hash]],
+     files_mapping: Dict[FileHandle, str],
+ ) -> List[Tuple[FileHandle, DownloadUrl, MD5Hash]]:
+     result = []
+     for file_specs in files_specs:
+         target_path = files_mapping[file_specs[0]]
+         if not os.path.isfile(target_path):
+             result.append(file_specs)
+     return result
+
+
+ def safe_download_file(
+     target_file_path: str,
+     download_url: str,
+     download_id: str,
+     md5_hash: MD5Hash,
+     verify_hash_while_download: bool,
+     progress: Progress,
+     response_codes_to_retry: Set[int],
+     request_timeout: int,
+     max_threads_per_download: int,
+     file_lock_acquire_timeout: int,
+     on_file_created: Optional[Callable[[str], None]] = None,
+     on_file_renamed: Optional[Callable[[str, str], None]] = None,
+ ) -> None:
+     ensure_parent_dir_exists(path=target_file_path)
+     target_file_dir, target_file_name = os.path.split(target_file_path)
+     lock_path = os.path.join(target_file_dir, f".{target_file_name}.lock")
+     tmp_download_file = os.path.abspath(
+         os.path.join(target_file_dir, f"{target_file_name}.{download_id}")
+     )
+     try:
+         with FileLock(lock_path, timeout=file_lock_acquire_timeout):
+             safe_execute_download(
+                 download_url=download_url,
+                 tmp_download_file=tmp_download_file,
+                 target_file_path=target_file_path,
+                 md5_hash=md5_hash,
+                 verify_hash_while_download=verify_hash_while_download,
+                 progress=progress,
+                 response_codes_to_retry=response_codes_to_retry,
+                 request_timeout=request_timeout,
+                 max_threads_per_download=max_threads_per_download,
+                 original_file_name=target_file_name,
+                 on_file_created=on_file_created,
+                 on_file_renamed=on_file_renamed,
+             )
+     finally:
+         remove_file_if_exists(path=tmp_download_file)
+
+
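The temporary-file-plus-`FileLock` dance above is what makes concurrent callers safe: only one process downloads a given target at a time, and a partially written file never sits at the final path. A minimal sketch of the locking behavior, assuming only the `filelock` package already imported at the top of this module (the lock path is a hypothetical example):

    from filelock import FileLock, Timeout

    lock = FileLock("/tmp/model-cache/.weights.onnx.lock", timeout=10)
    try:
        with lock:
            pass  # the holder downloads here; other processes block for up to 10s
    except Timeout:
        print("another process held the lock for more than 10 seconds")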
+ def safe_execute_download(
+     download_url: str,
+     tmp_download_file: str,
+     target_file_path: str,
+     md5_hash: MD5Hash,
+     verify_hash_while_download: bool,
+     progress: Progress,
+     response_codes_to_retry: Set[int],
+     request_timeout: int,
+     max_threads_per_download: int,
+     original_file_name: str,
+     on_file_created: Optional[Callable[[str], None]] = None,
+     on_file_renamed: Optional[Callable[[str, str], None]] = None,
+ ) -> None:
+     expected_file_size = safe_check_range_download_option(
+         url=download_url,
+         timeout=request_timeout,
+         response_codes_to_retry=response_codes_to_retry,
+     )
+     download_task = progress.add_task(
+         description=f"{original_file_name}: Download",
+         total=expected_file_size,
+         start=True,
+         visible=True,
+     )
+     # a list used as a mutable closure cell, so the hash-verification task can be
+     # registered lazily at runtime by the callback below
+     hash_calculation_task = []
+
+     progress_task_lock = Lock()
+
+     def on_chunk_downloaded(bytes_num: int) -> None:
+         with progress_task_lock:
+             progress.advance(download_task, bytes_num)
+
+     def on_hash_calculation_started() -> None:
+         if len(hash_calculation_task) > 0:
+             return None
+         progress.remove_task(download_task)
+         new_hash_calculation_task = progress.add_task(
+             description=f"{original_file_name}: Verify hash",
+             total=expected_file_size,
+             start=True,
+             visible=True,
+         )
+         hash_calculation_task.append(new_hash_calculation_task)
+
+     def on_hash_chunk_calculated(bytes_num: int) -> None:
+         if len(hash_calculation_task) != 1:
+             return None
+         progress.advance(hash_calculation_task[0], bytes_num)
+
+     if (
+         expected_file_size is None
+         or expected_file_size < MIN_SIZE_FOR_THREADED_DOWNLOAD
+         or max_threads_per_download <= 1
+     ):
+         stream_download(
+             url=download_url,
+             target_path=tmp_download_file,
+             timeout=request_timeout,
+             md5_hash=md5_hash,
+             verify_hash_while_download=verify_hash_while_download,
+             response_codes_to_retry=response_codes_to_retry,
+             on_chunk_downloaded=on_chunk_downloaded,
+             on_file_created=on_file_created,
+         )
+     else:
+         threaded_download_file(
+             url=download_url,
+             target_path=tmp_download_file,
+             file_size=expected_file_size,
+             response_codes_to_retry=response_codes_to_retry,
+             request_timeout=request_timeout,
+             md5_hash=md5_hash,
+             verify_hash_while_download=verify_hash_while_download,
+             max_threads_per_download=max_threads_per_download,
+             on_chunk_downloaded=on_chunk_downloaded,
+             on_file_created=on_file_created,
+             on_hash_calculation_started=on_hash_calculation_started,
+             on_hash_chunk_calculated=on_hash_chunk_calculated,
+         )
+     os.rename(tmp_download_file, target_file_path)
+     if on_file_renamed:
+         on_file_renamed(tmp_download_file, target_file_path)
+
+
+ def safe_check_range_download_option(
+     url: str, timeout: int, response_codes_to_retry: Set[int]
+ ) -> Optional[int]:
+     try:
+         return check_range_download_option(
+             url=url, timeout=timeout, response_codes_to_retry=response_codes_to_retry
+         )
+     except Exception:
+         LOGGER.warning(f"Cannot use range requests for {url}")
+         return None
+
+
+ @backoff.on_exception(
+     backoff.constant,
+     exception=RetryError,
+     max_tries=API_CALLS_MAX_TRIES,
+     interval=1,
+ )
+ def check_range_download_option(
+     url: str, timeout: int, response_codes_to_retry: Set[int]
+ ) -> Optional[int]:
+     try:
+         response = requests.head(url, timeout=timeout)
+     except (OSError, Timeout, requests.exceptions.ConnectionError):
+         raise RetryError(
+             message=f"Connectivity error for URL: {url}", help_url="https://todo"
+         )
+     if response.status_code in response_codes_to_retry:
+         raise RetryError(
+             message=f"Remote server returned response code {response.status_code} for URL {url}",
+             help_url="https://todo",
+         )
+     response.raise_for_status()
+     accept_ranges = response.headers.get("accept-ranges", "none")
+     content_length = response.headers.get("content-length")
+     if "bytes" not in accept_ranges.lower():
+         return None
+     if not content_length:
+         return None
+     return int(content_length)
+
+
+ @backoff.on_exception(
+     backoff.constant,
+     exception=RetryError,
+     max_tries=API_CALLS_MAX_TRIES,
+     interval=1,
+ )
+ def get_content_length(
+     url: str,
+     timeout: Optional[int] = None,
+     response_codes_to_retry: Optional[Set[int]] = None,
+ ) -> Optional[int]:
+     if response_codes_to_retry is None:
+         response_codes_to_retry = IDEMPOTENT_API_REQUEST_CODES_TO_RETRY
+     if timeout is None:
+         timeout = API_CALLS_TIMEOUT
+     try:
+         response = requests.head(url, timeout=timeout)
+     except (OSError, Timeout, requests.exceptions.ConnectionError):
+         raise RetryError(
+             message=f"Connectivity error for URL: {url}", help_url="https://todo"
+         )
+     if response.status_code in response_codes_to_retry:
+         raise RetryError(
+             message=f"Remote server returned response code {response.status_code} for URL {url}",
+             help_url="https://todo",
+         )
+     response.raise_for_status()
+     content_length = response.headers.get("content-length")
+     if content_length is None:
+         return None
+     return int(content_length)
+
+
+ def threaded_download_file(
+     url: str,
+     target_path: str,
+     file_size: int,
+     response_codes_to_retry: Set[int],
+     request_timeout: int,
+     max_threads_per_download: int,
+     md5_hash: MD5Hash,
+     verify_hash_while_download: bool,
+     on_chunk_downloaded: Optional[Callable[[int], None]] = None,
+     on_file_created: Optional[Callable[[str], None]] = None,
+     on_hash_calculation_started: Optional[Callable[[], None]] = None,
+     on_hash_chunk_calculated: Optional[Callable[[int], None]] = None,
+ ) -> None:
+     chunks_boundaries = generate_chunks_boundaries(
+         file_size=file_size,
+         max_threads=max_threads_per_download,
+         min_chunk_size=MIN_THREAD_CHUNK_SIZE,
+     )
+     pre_allocate_file(
+         path=target_path, file_size=file_size, on_file_created=on_file_created
+     )
+     futures = []
+     max_workers = min(len(chunks_boundaries), max_threads_per_download)
+     with ThreadPoolExecutor(max_workers=max_workers) as executor:
+         for start, end in chunks_boundaries:
+             future = executor.submit(
+                 download_chunk,
+                 url=url,
+                 start=start,
+                 end=end,
+                 target_path=target_path,
+                 timeout=request_timeout,
+                 response_codes_to_retry=response_codes_to_retry,
+                 on_chunk_downloaded=on_chunk_downloaded,
+             )
+             futures.append(future)
+         done_futures, pending_futures = wait(futures, return_when=FIRST_EXCEPTION)
+         for pending_future in pending_futures:
+             pending_future.cancel()
+         _ = wait(pending_futures)
+         for future in done_futures:
+             future_exception = future.exception()
+             if future_exception:
+                 raise future_exception
+     if not verify_hash_while_download:
+         return None
+     if on_hash_calculation_started:
+         on_hash_calculation_started()
+     verify_hash_sum_of_local_file(
+         url=url,
+         file_path=target_path,
+         expected_md5_hash=md5_hash,
+         on_hash_chunk_calculated=on_hash_chunk_calculated,
+     )
+
+
+ def verify_hash_sum_of_local_file(
+     url: str,
+     file_path: str,
+     expected_md5_hash: MD5Hash,
+     on_hash_chunk_calculated: Optional[Callable[[int], None]] = None,
+ ) -> None:
+     computed_hash = hashlib.md5()
+     for file_chunk in stream_file_bytes(
+         path=file_path, chunk_size=MIN_THREAD_CHUNK_SIZE
+     ):
+         computed_hash.update(file_chunk)
+         if on_hash_chunk_calculated:
+             on_hash_chunk_calculated(len(file_chunk))
+     if computed_hash.hexdigest() != expected_md5_hash:
+         raise FileHashSumMissmatch(
+             f"Could not confirm the validity of file content for url: {url}. "
+             f"Expected MD5: {expected_md5_hash}, calculated hash: {computed_hash.hexdigest()}",
+             help_url="https://todo",
+         )
+
+
+ def generate_chunks_boundaries(
+     file_size: int,
+     max_threads: int,
+     min_chunk_size: int,
+ ) -> List[Tuple[int, int]]:
+     if file_size <= 0:
+         return []
+     chunk_size = math.ceil(file_size / max_threads)
+     if chunk_size < min_chunk_size:
+         chunk_size = min_chunk_size
+     ranges = []
+     accumulated_size = 0
+     while accumulated_size < file_size:
+         ranges.append((accumulated_size, accumulated_size + chunk_size - 1))
+         accumulated_size += chunk_size
+     ranges[-1] = (ranges[-1][0], file_size - 1)
+     return ranges
+
+
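A quick worked example of the boundary math above (deterministic, no assumptions beyond the function itself): a 100 MB file split across 8 threads gives a raw chunk of ceil(104857600 / 8) = 13107200 bytes, below the 16 MB floor, so the chunk size is bumped to 16777216 bytes and 7 inclusive byte ranges come out, with the final range clipped to the file end:

    >>> generate_chunks_boundaries(
    ...     file_size=100 * 1024 * 1024, max_threads=8, min_chunk_size=16 * 1024 * 1024
    ... )
    [(0, 16777215), (16777216, 33554431), (33554432, 50331647),
     (50331648, 67108863), (67108864, 83886079), (83886080, 100663295),
     (100663296, 104857599)]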
+ @backoff.on_exception(
+     backoff.constant,
+     exception=RetryError,
+     max_tries=API_CALLS_MAX_TRIES,
+     interval=1,
+ )
+ def download_chunk(
+     url: str,
+     start: int,
+     end: int,
+     target_path: str,
+     timeout: int,
+     response_codes_to_retry: Set[int],
+     file_chunk: int = DEFAULT_STREAM_DOWNLOAD_CHUNK,
+     on_chunk_downloaded: Optional[Callable[[int], None]] = None,
+ ) -> None:
+     headers = {"Range": f"bytes={start}-{end}"}
+     try:
+         with requests.get(
+             url, headers=headers, stream=True, timeout=timeout
+         ) as response:
+             if response.status_code in response_codes_to_retry:
+                 raise RetryError(
+                     message=f"File hosting returned {response.status_code}",
+                     help_url="https://todo",
+                 )
+             response.raise_for_status()
+             if response.status_code != 206:
+                 raise RetryError(
+                     message=f"Server does not support range requests (returned {response.status_code} instead of 206)",
+                     help_url="https://todo",
+                 )
+             _handle_stream_download(
+                 response=response,
+                 target_path=target_path,
+                 file_chunk=file_chunk,
+                 on_chunk_downloaded=on_chunk_downloaded,
+                 file_open_mode="r+b",
+                 offset=start,
+             )
+     except (ConnectionError, Timeout, requests.exceptions.ConnectionError):
+         raise RetryError(
+             message="Connectivity error",
+             help_url="https://todo",
+         )
+
+
+ @backoff.on_exception(
+     backoff.constant,
+     exception=RetryError,
+     max_tries=API_CALLS_MAX_TRIES,
+     interval=1,
+ )
+ def stream_download(
+     url: str,
+     target_path: str,
+     timeout: int,
+     response_codes_to_retry: Set[int],
+     md5_hash: MD5Hash,
+     verify_hash_while_download: bool,
+     file_chunk: int = DEFAULT_STREAM_DOWNLOAD_CHUNK,
+     on_chunk_downloaded: Optional[Callable[[int], None]] = None,
+     on_file_created: Optional[Callable[[str], None]] = None,
+ ) -> None:
+     ensure_parent_dir_exists(path=target_path)
+     computed_hash = (
+         HashNullObject()
+         if md5_hash is None or not verify_hash_while_download
+         else hashlib.md5()
+     )
+     try:
+         with requests.get(url, stream=True, timeout=timeout) as response:
+             if response.status_code in response_codes_to_retry:
+                 raise RetryError(
+                     message=f"File hosting returned {response.status_code}",
+                     help_url="https://todo",
+                 )
+             response.raise_for_status()
+             _handle_stream_download(
+                 response=response,
+                 target_path=target_path,
+                 file_chunk=file_chunk,
+                 on_chunk_downloaded=on_chunk_downloaded,
+                 content_storage=computed_hash,
+                 on_file_created=on_file_created,
+             )
+     except (ConnectionError, Timeout, requests.exceptions.ConnectionError):
+         raise RetryError(
+             message="Connectivity error",
+             help_url="https://todo",
+         )
+     if not verify_hash_while_download:
+         return None
+     if computed_hash.hexdigest() != md5_hash:
+         raise FileHashSumMissmatch(
+             f"Could not confirm the validity of file content for url: {url}. Expected MD5: {md5_hash}, "
+             f"calculated hash: {computed_hash.hexdigest()}",
+             help_url="https://todo",
+         )
+     return None
+
+
+ def _handle_stream_download(
+     response: Response,
+     target_path: str,
+     file_chunk: int,
+     on_chunk_downloaded: Optional[Callable[[int], None]] = None,
+     file_open_mode: str = "wb",
+     offset: Optional[int] = None,
+     content_storage: Optional[Union[hashlib.md5, HashNullObject]] = None,
+     on_file_created: Optional[Callable[[str], None]] = None,
+ ) -> None:
+     with open(target_path, file_open_mode) as file:
+         if on_file_created:
+             on_file_created(target_path)
+         if offset is not None:
+             file.seek(offset)
+         for chunk in response.iter_content(file_chunk):
+             file.write(chunk)
+             if content_storage is not None:
+                 content_storage.update(chunk)
+             if on_chunk_downloaded:
+                 on_chunk_downloaded(len(chunk))
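The chunked hashing used throughout this module leans on a property of `hashlib` worth seeing once: feeding data through `update()` in pieces yields the same digest as hashing everything in one call. A self-contained check (standard library only; the file is a throwaway temp file):

    import hashlib
    import tempfile

    with tempfile.NamedTemporaryFile(delete=False) as f:
        f.write(b"0123456789" * 1_000)

    with open(f.name, "rb") as fh:
        whole = hashlib.md5(fh.read()).hexdigest()

    chunked = hashlib.md5()
    with open(f.name, "rb") as fh:
        while block := fh.read(4096):  # same pattern as stream_file_bytes(...)
            chunked.update(block)

    assert whole == chunked.hexdigest()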
inference_models/utils/environment.py
@@ -0,0 +1,28 @@
+ from typing import Any, List
+
+ from inference_models.errors import InvalidEnvVariable
+
+
+ def parse_comma_separated_values(values: str) -> List[str]:
+     if not values:
+         return []
+     return [v.strip() for v in values.split(",") if v.strip()]
+
+
+ def str2bool(value: Any) -> bool:
+     if isinstance(value, bool):
+         return value
+     if not isinstance(value, str):
+         raise InvalidEnvVariable(
+             message=f"Expected a boolean environment variable (true or false) but got '{value}'",
+             help_url="https://todo",
+         )
+     if value.lower() == "true":
+         return True
+     elif value.lower() == "false":
+         return False
+     else:
+         raise InvalidEnvVariable(
+             message=f"Expected a boolean environment variable (true or false) but got '{value}'",
+             help_url="https://todo",
+         )
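A usage sketch for these helpers (the environment variable names are hypothetical; any variable read through `os.getenv` works the same way):

    import os

    models = parse_comma_separated_values(os.getenv("ENABLED_MODELS", "yolov8, rfdetr ,"))
    # -> ["yolov8", "rfdetr"]  (whitespace is trimmed, empty segments are dropped)

    verbose = str2bool(os.getenv("VERBOSE", "false"))
    # -> False; "TRUE" / "False" parse too, anything else raises InvalidEnvVariable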
inference_models/utils/file_system.py
@@ -0,0 +1,51 @@
+ import json
+ import os
+ from typing import Callable, Generator, Optional, Union
+
+
+ def stream_file_lines(path: str) -> Generator[str, None, None]:
+     with open(path, "r") as f:
+         for line in f:
+             stripped_line = line.strip()
+             if stripped_line:
+                 yield stripped_line
+
+
+ def stream_file_bytes(path: str, chunk_size: int) -> Generator[bytes, None, None]:
+     chunk_size = max(chunk_size, 1)
+     with open(path, "rb") as f:
+         chunk = f.read(chunk_size)
+         while chunk:
+             yield chunk
+             chunk = f.read(chunk_size)
+
+
+ def read_json(path: str) -> Optional[Union[dict, list]]:
+     with open(path) as f:
+         return json.load(f)
+
+
+ def dump_json(path: str, content: Union[dict, list]) -> None:
+     ensure_parent_dir_exists(path=path)
+     with open(path, "w") as f:
+         json.dump(content, f)
+
+
+ def pre_allocate_file(
+     path: str, file_size: int, on_file_created: Optional[Callable[[str], None]] = None
+ ) -> None:
+     ensure_parent_dir_exists(path=path)
+     with open(path, "wb") as f:
+         if on_file_created:
+             on_file_created(path)
+         f.truncate(file_size)
+
+
+ def ensure_parent_dir_exists(path: str) -> None:
+     parent_dir = os.path.dirname(os.path.abspath(path))
+     os.makedirs(parent_dir, exist_ok=True)
+
+
+ def remove_file_if_exists(path: str) -> None:
+     if os.path.isfile(path):
+         os.remove(path)
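A round-trip sketch tying `pre_allocate_file` and `stream_file_bytes` together (temp directory chosen at runtime; the 10 MB size is arbitrary):

    import os
    import tempfile

    path = os.path.join(tempfile.mkdtemp(), "weights.bin")
    pre_allocate_file(path=path, file_size=10 * 1024 * 1024)
    assert os.path.getsize(path) == 10 * 1024 * 1024  # zero-filled, sparse where the OS allows

    total = sum(len(chunk) for chunk in stream_file_bytes(path=path, chunk_size=1024 * 1024))
    assert total == 10 * 1024 * 1024

This is exactly the pattern `threaded_download_file` relies on: the file is sized up front so each worker can seek to its own byte offset and write independently.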
inference_models/utils/hashing.py
@@ -0,0 +1,7 @@
+ import hashlib
+ import json
+
+
+ def hash_dict_content(content: dict) -> str:
+     content_string = json.dumps(content, sort_keys=True)
+     return hashlib.sha256(content_string.encode()).hexdigest()
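Because `json.dumps(..., sort_keys=True)` canonicalizes key order, the digest is stable across dicts that differ only in insertion order - a one-line check:

    assert hash_dict_content({"a": 1, "b": 2}) == hash_dict_content({"b": 2, "a": 1})

The flip side: values must be JSON-serializable, so passing e.g. a set raises TypeError.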