PyPI - deepdoctection - Versions diffs - 0.32__py3-none-any.whl → 0.34__py3-none-any.whl - Mend

deepdoctection 0.32__py3-none-any.whl → 0.34__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of deepdoctection might be problematic. Click here for more details.

Files changed (111) hide show

deepdoctection/__init__.py +8 -25
deepdoctection/analyzer/dd.py +84 -71
deepdoctection/dataflow/common.py +9 -5
deepdoctection/dataflow/custom.py +5 -5
deepdoctection/dataflow/custom_serialize.py +75 -18
deepdoctection/dataflow/parallel_map.py +3 -3
deepdoctection/dataflow/serialize.py +4 -4
deepdoctection/dataflow/stats.py +3 -3
deepdoctection/datapoint/annotation.py +78 -56
deepdoctection/datapoint/box.py +7 -7
deepdoctection/datapoint/convert.py +6 -6
deepdoctection/datapoint/image.py +157 -75
deepdoctection/datapoint/view.py +175 -151
deepdoctection/datasets/adapter.py +30 -24
deepdoctection/datasets/base.py +10 -10
deepdoctection/datasets/dataflow_builder.py +3 -3
deepdoctection/datasets/info.py +23 -25
deepdoctection/datasets/instances/doclaynet.py +48 -49
deepdoctection/datasets/instances/fintabnet.py +44 -45
deepdoctection/datasets/instances/funsd.py +23 -23
deepdoctection/datasets/instances/iiitar13k.py +8 -8
deepdoctection/datasets/instances/layouttest.py +2 -2
deepdoctection/datasets/instances/publaynet.py +3 -3
deepdoctection/datasets/instances/pubtables1m.py +18 -18
deepdoctection/datasets/instances/pubtabnet.py +30 -29
deepdoctection/datasets/instances/rvlcdip.py +28 -29
deepdoctection/datasets/instances/xfund.py +51 -30
deepdoctection/datasets/save.py +6 -6
deepdoctection/eval/accmetric.py +32 -33
deepdoctection/eval/base.py +8 -9
deepdoctection/eval/cocometric.py +13 -12
deepdoctection/eval/eval.py +32 -26
deepdoctection/eval/tedsmetric.py +16 -12
deepdoctection/eval/tp_eval_callback.py +7 -16
deepdoctection/extern/base.py +339 -134
deepdoctection/extern/d2detect.py +69 -89
deepdoctection/extern/deskew.py +11 -10
deepdoctection/extern/doctrocr.py +81 -64
deepdoctection/extern/fastlang.py +23 -16
deepdoctection/extern/hfdetr.py +53 -38
deepdoctection/extern/hflayoutlm.py +216 -155
deepdoctection/extern/hflm.py +35 -30
deepdoctection/extern/model.py +433 -255
deepdoctection/extern/pdftext.py +15 -15
deepdoctection/extern/pt/ptutils.py +4 -2
deepdoctection/extern/tessocr.py +39 -38
deepdoctection/extern/texocr.py +14 -16
deepdoctection/extern/tp/tfutils.py +16 -2
deepdoctection/extern/tp/tpcompat.py +11 -7
deepdoctection/extern/tp/tpfrcnn/config/config.py +4 -4
deepdoctection/extern/tp/tpfrcnn/modeling/backbone.py +1 -1
deepdoctection/extern/tp/tpfrcnn/modeling/model_box.py +5 -5
deepdoctection/extern/tp/tpfrcnn/modeling/model_fpn.py +6 -6
deepdoctection/extern/tp/tpfrcnn/modeling/model_frcnn.py +4 -4
deepdoctection/extern/tp/tpfrcnn/modeling/model_mrcnn.py +5 -3
deepdoctection/extern/tp/tpfrcnn/preproc.py +5 -5
deepdoctection/extern/tpdetect.py +40 -45
deepdoctection/mapper/cats.py +36 -40
deepdoctection/mapper/cocostruct.py +16 -12
deepdoctection/mapper/d2struct.py +22 -22
deepdoctection/mapper/hfstruct.py +7 -7
deepdoctection/mapper/laylmstruct.py +22 -24
deepdoctection/mapper/maputils.py +9 -10
deepdoctection/mapper/match.py +33 -2
deepdoctection/mapper/misc.py +6 -7
deepdoctection/mapper/pascalstruct.py +4 -4
deepdoctection/mapper/prodigystruct.py +6 -6
deepdoctection/mapper/pubstruct.py +84 -92
deepdoctection/mapper/tpstruct.py +3 -3
deepdoctection/mapper/xfundstruct.py +33 -33
deepdoctection/pipe/anngen.py +39 -14
deepdoctection/pipe/base.py +68 -99
deepdoctection/pipe/common.py +181 -85
deepdoctection/pipe/concurrency.py +14 -10
deepdoctection/pipe/doctectionpipe.py +24 -21
deepdoctection/pipe/language.py +20 -25
deepdoctection/pipe/layout.py +18 -16
deepdoctection/pipe/lm.py +49 -47
deepdoctection/pipe/order.py +63 -65
deepdoctection/pipe/refine.py +102 -109
deepdoctection/pipe/segment.py +157 -162
deepdoctection/pipe/sub_layout.py +50 -40
deepdoctection/pipe/text.py +37 -36
deepdoctection/pipe/transform.py +19 -16
deepdoctection/train/d2_frcnn_train.py +27 -25
deepdoctection/train/hf_detr_train.py +22 -18
deepdoctection/train/hf_layoutlm_train.py +49 -48
deepdoctection/train/tp_frcnn_train.py +10 -11
deepdoctection/utils/concurrency.py +1 -1
deepdoctection/utils/context.py +13 -6
deepdoctection/utils/develop.py +4 -4
deepdoctection/utils/env_info.py +52 -14
deepdoctection/utils/file_utils.py +6 -11
deepdoctection/utils/fs.py +41 -14
deepdoctection/utils/identifier.py +2 -2
deepdoctection/utils/logger.py +15 -15
deepdoctection/utils/metacfg.py +7 -7
deepdoctection/utils/pdf_utils.py +39 -14
deepdoctection/utils/settings.py +188 -182
deepdoctection/utils/tqdm.py +1 -1
deepdoctection/utils/transform.py +14 -9
deepdoctection/utils/types.py +104 -0
deepdoctection/utils/utils.py +7 -7
deepdoctection/utils/viz.py +70 -69
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/METADATA +7 -4
deepdoctection-0.34.dist-info/RECORD +146 -0
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/WHEEL +1 -1
deepdoctection/utils/detection_types.py +0 -68
deepdoctection-0.32.dist-info/RECORD +0 -146
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/LICENSE +0 -0
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/top_level.txt +0 -0

deepdoctection/extern/doctrocr.py CHANGED Viewed

@@ -23,25 +23,24 @@ from __future__ import annotations
 import os
 from abc import ABC
 from pathlib import Path
-from typing import Any, List, Literal, Mapping, Optional, Tuple, Union
+from typing import Any, Literal, Mapping, Optional, Union
 from zipfile import ZipFile
 from lazy_imports import try_import
-from ..utils.detection_types import ImageType, Requirement
+from ..utils.env_info import ENV_VARS_TRUE
 from ..utils.error import DependencyError
 from ..utils.file_utils import (
     get_doctr_requirement,
     get_pytorch_requirement,
     get_tensorflow_requirement,
     get_tf_addons_requirements,
-    pytorch_available,
-    tf_available,
 )
 from ..utils.fs import load_json
 from ..utils.settings import LayoutType, ObjectTypes, PageType, TypeOrStr
+from ..utils.types import PathLikeOrStr, PixelValues, Requirement
 from ..utils.viz import viz_handler
-from .base import DetectionResult, ImageTransformer, ObjectDetector, PredictorBase, TextRecognizer
+from .base import DetectionResult, ImageTransformer, ModelCategories, ObjectDetector, TextRecognizer
 from .pt.ptutils import get_torch_device
 from .tp.tfutils import get_tf_device
@@ -60,13 +59,24 @@ with try_import() as doctr_import_guard:
     from doctr.models.recognition.zoo import ARCHS, recognition
+def _get_doctr_requirements() -> list[Requirement]:
+    if os.environ.get("DD_USE_TF", "0") in ENV_VARS_TRUE:
+        return [get_tensorflow_requirement(), get_doctr_requirement(), get_tf_addons_requirements()]
+    if os.environ.get("DD_USE_TORCH", "0") in ENV_VARS_TRUE:
+        return [get_pytorch_requirement(), get_doctr_requirement()]
+    raise ModuleNotFoundError("Neither Tensorflow nor PyTorch has been installed. Cannot use DoctrTextRecognizer")
 def _load_model(
-    path_weights: str, doctr_predictor: Any, device: Union[torch.device, tf.device], lib: Literal["PT", "TF"]
+    path_weights: PathLikeOrStr,
+    doctr_predictor: Union[DetectionPredictor, RecognitionPredictor],
+    device: Union[torch.device, tf.device],
+    lib: Literal["PT", "TF"],
 ) -> None:
     """Loading a model either in TF or PT. We only shift the model to the device when using PyTorch. The shift of
     the model to the device in Tensorflow is done in the predict function."""
     if lib == "PT":
-        state_dict = torch.load(path_weights, map_location=device)
+        state_dict = torch.load(os.fspath(path_weights), map_location=device)
         for key in list(state_dict.keys()):
             state_dict["model." + key] = state_dict.pop(key)
         doctr_predictor.load_state_dict(state_dict)
@@ -74,27 +84,27 @@ def _load_model(
     elif lib == "TF":
         # Unzip the archive
         params_path = Path(path_weights).parent
-        is_zip_path = path_weights.endswith(".zip")
+        is_zip_path = os.fspath(path_weights).endswith(".zip")
         if is_zip_path:
             with ZipFile(path_weights, "r") as file:
                 file.extractall(path=params_path)
                 doctr_predictor.model.load_weights(params_path / "weights")
         else:
-            doctr_predictor.model.load_weights(path_weights)
+            doctr_predictor.model.load_weights(os.fspath(path_weights))
 def auto_select_lib_for_doctr() -> Literal["PT", "TF"]:
     """Auto select the DL library from environment variables"""
-    if os.environ.get("USE_TORCH"):
+    if os.environ.get("USE_TORCH", "0") in ENV_VARS_TRUE:
         return "PT"
-    if os.environ.get("USE_TF"):
+    if os.environ.get("USE_TF", "0") in ENV_VARS_TRUE:
         return "TF"
     raise DependencyError("At least one of the env variables USE_TORCH or USE_TF must be set.")
 def doctr_predict_text_lines(
-    np_img: ImageType, predictor: DetectionPredictor, device: Union[torch.device, tf.device], lib: Literal["TF", "PT"]
-) -> List[DetectionResult]:
+    np_img: PixelValues, predictor: DetectionPredictor, device: Union[torch.device, tf.device], lib: Literal["TF", "PT"]
+) -> list[DetectionResult]:
     """
     Generating text line DetectionResult based on Doctr DetectionPredictor.
@@ -113,7 +123,7 @@ def doctr_predict_text_lines(
         raise DependencyError("Tensorflow or PyTorch must be installed.")
     detection_results = [
         DetectionResult(
-            box=box[:4].tolist(), class_id=1, score=box[4], absolute_coords=False, class_name=LayoutType.word
+            box=box[:4].tolist(), class_id=1, score=box[4], absolute_coords=False, class_name=LayoutType.WORD
         )
         for box in raw_output[0]["words"]
     ]
@@ -121,11 +131,11 @@ def doctr_predict_text_lines(
 def doctr_predict_text(
-    inputs: List[Tuple[str, ImageType]],
+    inputs: list[tuple[str, PixelValues]],
     predictor: RecognitionPredictor,
     device: Union[torch.device, tf.device],
     lib: Literal["TF", "PT"],
-) -> List[DetectionResult]:
+) -> list[DetectionResult]:
     """
     Calls Doctr text recognition model on a batch of numpy arrays (text lines predicted from a text line detector) and
     returns the recognized text as DetectionResult
@@ -155,15 +165,15 @@ def doctr_predict_text(
 class DoctrTextlineDetectorMixin(ObjectDetector, ABC):
     """Base class for Doctr textline detector. This class only implements the basic wrapper functions"""
-    def __init__(self, categories: Mapping[str, TypeOrStr], lib: Optional[Literal["PT", "TF"]] = None):
-        self.categories = categories  # type: ignore
+    def __init__(self, categories: Mapping[int, TypeOrStr], lib: Optional[Literal["PT", "TF"]] = None):
+        self.categories = ModelCategories(init_categories=categories)
         self.lib = lib if lib is not None else self.auto_select_lib()
-    def possible_categories(self) -> List[ObjectTypes]:
-        return [LayoutType.word]
+    def get_category_names(self) -> tuple[ObjectTypes, ...]:
+        return self.categories.get_categories(as_dict=False)
     @staticmethod
-    def get_name(path_weights: str, architecture: str) -> str:
+    def get_name(path_weights: PathLikeOrStr, architecture: str) -> str:
         """Returns the name of the model"""
         return f"doctr_{architecture}" + "_".join(Path(path_weights).parts[-2:])
@@ -211,8 +221,8 @@ class DoctrTextlineDetector(DoctrTextlineDetectorMixin):
     def __init__(
         self,
         architecture: str,
-        path_weights: str,
-        categories: Mapping[str, TypeOrStr],
+        path_weights: PathLikeOrStr,
+        categories: Mapping[int, TypeOrStr],
         device: Optional[Union[Literal["cpu", "cuda"], torch.device, tf.device]] = None,
         lib: Optional[Literal["PT", "TF"]] = None,
     ) -> None:
@@ -227,7 +237,7 @@ class DoctrTextlineDetector(DoctrTextlineDetectorMixin):
         """
         super().__init__(categories, lib)
         self.architecture = architecture
-        self.path_weights = path_weights
+        self.path_weights = Path(path_weights)
         self.name = self.get_name(self.path_weights, self.architecture)
         self.model_id = self.get_model_id()
@@ -239,37 +249,37 @@ class DoctrTextlineDetector(DoctrTextlineDetectorMixin):
         self.doctr_predictor = self.get_wrapped_model(self.architecture, self.path_weights, self.device, self.lib)
-    def predict(self, np_img: ImageType) -> List[DetectionResult]:
+    def predict(self, np_img: PixelValues) -> list[DetectionResult]:
         """
         Prediction per image.
         :param np_img: image as numpy array
         :return: A list of DetectionResult
         """
-        detection_results = doctr_predict_text_lines(np_img, self.doctr_predictor, self.device, self.lib)
-        return detection_results
+        return doctr_predict_text_lines(np_img, self.doctr_predictor, self.device, self.lib)
     @classmethod
-    def get_requirements(cls) -> List[Requirement]:
-        if os.environ.get("DD_USE_TF"):
-            return [get_tensorflow_requirement(), get_doctr_requirement(), get_tf_addons_requirements()]
-        if os.environ.get("DD_USE_TORCH"):
-            return [get_pytorch_requirement(), get_doctr_requirement()]
-        raise ModuleNotFoundError("Neither Tensorflow nor PyTorch has been installed. Cannot use DoctrTextlineDetector")
+    def get_requirements(cls) -> list[Requirement]:
+        return _get_doctr_requirements()
-    def clone(self) -> PredictorBase:
-        return self.__class__(self.architecture, self.path_weights, self.categories, self.device, self.lib)
+    def clone(self) -> DoctrTextlineDetector:
+        return self.__class__(
+            self.architecture, self.path_weights, self.categories.get_categories(), self.device, self.lib
+        )
     @staticmethod
     def load_model(
-        path_weights: str, doctr_predictor: Any, device: Union[torch.device, tf.device], lib: Literal["PT", "TF"]
+        path_weights: PathLikeOrStr,
+        doctr_predictor: DetectionPredictor,
+        device: Union[torch.device, tf.device],
+        lib: Literal["PT", "TF"],
     ) -> None:
         """Loading model weights"""
         _load_model(path_weights, doctr_predictor, device, lib)
     @staticmethod
     def get_wrapped_model(
-        architecture: str, path_weights: str, device: Union[torch.device, tf.device], lib: Literal["PT", "TF"]
+        architecture: str, path_weights: PathLikeOrStr, device: Union[torch.device, tf.device], lib: Literal["PT", "TF"]
     ) -> Any:
         """
         Get the inner (wrapped) model.
@@ -290,6 +300,9 @@ class DoctrTextlineDetector(DoctrTextlineDetectorMixin):
         DoctrTextlineDetector.load_model(path_weights, doctr_predictor, device, lib)
         return doctr_predictor
+    def clear_model(self) -> None:
+        self.doctr_predictor = None
 class DoctrTextRecognizer(TextRecognizer):
     """
@@ -330,10 +343,10 @@ class DoctrTextRecognizer(TextRecognizer):
     def __init__(
         self,
         architecture: str,
-        path_weights: str,
+        path_weights: PathLikeOrStr,
         device: Optional[Union[Literal["cpu", "cuda"], torch.device, tf.device]] = None,
         lib: Optional[Literal["PT", "TF"]] = None,
-        path_config_json: Optional[str] = None,
+        path_config_json: Optional[PathLikeOrStr] = None,
     ) -> None:
         """
         :param architecture: DocTR supports various text recognition models, e.g. "crnn_vgg16_bn",
@@ -349,7 +362,7 @@ class DoctrTextRecognizer(TextRecognizer):
         self.lib = lib if lib is not None else self.auto_select_lib()
         self.architecture = architecture
-        self.path_weights = path_weights
+        self.path_weights = Path(path_weights)
         self.name = self.get_name(self.path_weights, self.architecture)
         self.model_id = self.get_model_id()
@@ -360,13 +373,13 @@ class DoctrTextRecognizer(TextRecognizer):
             self.device = get_torch_device(device)
         self.path_config_json = path_config_json
-        self.doctr_predictor = self.build_model(self.architecture, self.path_config_json)
+        self.doctr_predictor = self.build_model(self.architecture, self.lib, self.path_config_json)
         self.load_model(self.path_weights, self.doctr_predictor, self.device, self.lib)
         self.doctr_predictor = self.get_wrapped_model(
             self.architecture, self.path_weights, self.device, self.lib, self.path_config_json
         )
-    def predict(self, images: List[Tuple[str, ImageType]]) -> List[DetectionResult]:
+    def predict(self, images: list[tuple[str, PixelValues]]) -> list[DetectionResult]:
         """
         Prediction on a batch of text lines
@@ -378,25 +391,26 @@ class DoctrTextRecognizer(TextRecognizer):
         return []
     @classmethod
-    def get_requirements(cls) -> List[Requirement]:
-        if tf_available():
-            return [get_tensorflow_requirement(), get_doctr_requirement(), get_tf_addons_requirements()]
-        if pytorch_available():
-            return [get_pytorch_requirement(), get_doctr_requirement()]
-        raise ModuleNotFoundError("Neither Tensorflow nor PyTorch has been installed. Cannot use DoctrTextRecognizer")
-    def clone(self) -> PredictorBase:
+    def get_requirements(cls) -> list[Requirement]:
+        return _get_doctr_requirements()
+    def clone(self) -> DoctrTextRecognizer:
         return self.__class__(self.architecture, self.path_weights, self.device, self.lib)
     @staticmethod
     def load_model(
-        path_weights: str, doctr_predictor: Any, device: Union[torch.device, tf.device], lib: Literal["PT", "TF"]
+        path_weights: PathLikeOrStr,
+        doctr_predictor: RecognitionPredictor,
+        device: Union[torch.device, tf.device],
+        lib: Literal["PT", "TF"],
     ) -> None:
         """Loading model weights"""
         _load_model(path_weights, doctr_predictor, device, lib)
     @staticmethod
-    def build_model(architecture: str, path_config_json: Optional[str] = None) -> "RecognitionPredictor":
+    def build_model(
+        architecture: str, lib: Literal["TF", "PT"], path_config_json: Optional[PathLikeOrStr] = None
+    ) -> RecognitionPredictor:
         """Building the model"""
         # inspired and adapted from https://github.com/mindee/doctr/blob/main/doctr/models/recognition/zoo.py
@@ -419,6 +433,7 @@ class DoctrTextRecognizer(TextRecognizer):
             model = recognition.__dict__[architecture](pretrained=True, pretrained_backbone=True, **custom_configs)
         else:
+            # This is not documented, but you can also directly pass the model class to architecture
             if not isinstance(
                 architecture,
                 (recognition.CRNN, recognition.SAR, recognition.MASTER, recognition.ViTSTR, recognition.PARSeq),
@@ -426,16 +441,16 @@ class DoctrTextRecognizer(TextRecognizer):
                 raise ValueError(f"unknown architecture: {type(architecture)}")
             model = architecture
-        input_shape = model.cfg["input_shape"][:2] if tf_available() else model.cfg["input_shape"][-2:]
+        input_shape = model.cfg["input_shape"][:2] if lib == "TF" else model.cfg["input_shape"][-2:]
         return RecognitionPredictor(PreProcessor(input_shape, preserve_aspect_ratio=True, **recognition_configs), model)
     @staticmethod
     def get_wrapped_model(
         architecture: str,
-        path_weights: str,
+        path_weights: PathLikeOrStr,
         device: Union[torch.device, tf.device],
         lib: Literal["PT", "TF"],
-        path_config_json: Optional[str] = None,
+        path_config_json: Optional[PathLikeOrStr] = None,
     ) -> Any:
         """
         Get the inner (wrapped) model.
@@ -450,12 +465,12 @@ class DoctrTextRecognizer(TextRecognizer):
         a model trained on custom vocab.
         :return: Inner model which is a "nn.Module" in PyTorch or a "tf.keras.Model" in Tensorflow
         """
-        doctr_predictor = DoctrTextRecognizer.build_model(architecture, path_config_json)
+        doctr_predictor = DoctrTextRecognizer.build_model(architecture, lib, path_config_json)
         DoctrTextRecognizer.load_model(path_weights, doctr_predictor, device, lib)
         return doctr_predictor
     @staticmethod
-    def get_name(path_weights: str, architecture: str) -> str:
+    def get_name(path_weights: PathLikeOrStr, architecture: str) -> str:
         """Returns the name of the model"""
         return f"doctr_{architecture}" + "_".join(Path(path_weights).parts[-2:])
@@ -464,6 +479,9 @@ class DoctrTextRecognizer(TextRecognizer):
         """Auto select the DL library from the installed and from environment variables"""
         return auto_select_lib_for_doctr()
+    def clear_model(self) -> None:
+        self.doctr_predictor = None
 class DocTrRotationTransformer(ImageTransformer):
     """
@@ -497,7 +515,7 @@ class DocTrRotationTransformer(ImageTransformer):
         self.ratio_threshold_for_lines = ratio_threshold_for_lines
         self.name = "doctr_rotation_transformer"
-    def transform(self, np_img: ImageType, specification: DetectionResult) -> ImageType:
+    def transform(self, np_img: PixelValues, specification: DetectionResult) -> PixelValues:
         """
         Applies the predicted rotation to the image, effectively rotating the image backwards.
         This method uses either the Pillow library or OpenCV for the rotation operation, depending on the configuration.
@@ -508,19 +526,18 @@ class DocTrRotationTransformer(ImageTransformer):
         """
         return viz_handler.rotate_image(np_img, specification.angle)  # type: ignore
-    def predict(self, np_img: ImageType) -> DetectionResult:
+    def predict(self, np_img: PixelValues) -> DetectionResult:
         angle = estimate_orientation(np_img, self.number_contours, self.ratio_threshold_for_lines)
         if angle < 0:
             angle += 360
         return DetectionResult(angle=round(angle, 2))
     @classmethod
-    def get_requirements(cls) -> List[Requirement]:
+    def get_requirements(cls) -> list[Requirement]:
         return [get_doctr_requirement()]
-    def clone(self) -> PredictorBase:
+    def clone(self) -> DocTrRotationTransformer:
         return self.__class__(self.number_contours, self.ratio_threshold_for_lines)
-    @staticmethod
-    def possible_category() -> PageType:
-        return PageType.angle
+    def get_category_names(self) -> tuple[ObjectTypes, ...]:
+        return (PageType.ANGLE,)

deepdoctection/extern/fastlang.py CHANGED Viewed

@@ -18,16 +18,20 @@
 """
 Deepdoctection wrappers for fasttext language detection models
 """
+from __future__ import annotations
+import os
 from abc import ABC
-from copy import copy
 from pathlib import Path
-from typing import Any, List, Mapping, Tuple, Union
+from types import MappingProxyType
+from typing import Any, Mapping, Union
 from lazy_imports import try_import
 from ..utils.file_utils import Requirement, get_fasttext_requirement
 from ..utils.settings import TypeOrStr, get_type
-from .base import DetectionResult, LanguageDetector, PredictorBase
+from ..utils.types import PathLikeOrStr
+from .base import DetectionResult, LanguageDetector, ModelCategories
 with try_import() as import_guard:
     from fasttext import load_model  # type: ignore
@@ -38,22 +42,23 @@ class FasttextLangDetectorMixin(LanguageDetector, ABC):
     Base class for Fasttext language detection implementation. This class only implements the basic wrapper functions.
     """
-    def __init__(self, categories: Mapping[str, TypeOrStr]) -> None:
+    def __init__(self, categories: Mapping[int, TypeOrStr], categories_orig: Mapping[str, TypeOrStr]) -> None:
         """
         :param categories: A dict with the model output label and value. We use as convention the ISO 639-2 language
         """
-        self.categories = copy({idx: get_type(cat) for idx, cat in categories.items()})
+        self.categories = ModelCategories(init_categories=categories)
+        self.categories_orig = MappingProxyType({cat_orig: get_type(cat) for cat_orig, cat in categories_orig.items()})
-    def output_to_detection_result(self, output: Union[Tuple[Any, Any]]) -> DetectionResult:
+    def output_to_detection_result(self, output: Union[tuple[Any, Any]]) -> DetectionResult:
         """
         Generating `DetectionResult` from model output
         :param output: FastText model output
         :return: `DetectionResult` filled with `text` and `score`
         """
-        return DetectionResult(text=self.categories[output[0][0]], score=output[1][0])
+        return DetectionResult(text=self.categories_orig[output[0][0]], score=output[1][0])
     @staticmethod
-    def get_name(path_weights: str) -> str:
+    def get_name(path_weights: PathLikeOrStr) -> str:
         """Returns the name of the model"""
         return "fasttext_" + "_".join(Path(path_weights).parts[-2:])
@@ -80,15 +85,17 @@ class FasttextLangDetector(FasttextLangDetectorMixin):
     """
-    def __init__(self, path_weights: str, categories: Mapping[str, TypeOrStr]):
+    def __init__(
+        self, path_weights: PathLikeOrStr, categories: Mapping[int, TypeOrStr], categories_orig: Mapping[str, TypeOrStr]
+    ):
         """
         :param path_weights: path to model weights
         :param categories: A dict with the model output label and value. We use as convention the ISO 639-2 language
                            code.
         """
-        super().__init__(categories)
+        super().__init__(categories, categories_orig)
-        self.path_weights = path_weights
+        self.path_weights = Path(path_weights)
         self.name = self.get_name(self.path_weights)
         self.model_id = self.get_model_id()
@@ -100,16 +107,16 @@ class FasttextLangDetector(FasttextLangDetectorMixin):
         return self.output_to_detection_result(output)
     @classmethod
-    def get_requirements(cls) -> List[Requirement]:
+    def get_requirements(cls) -> list[Requirement]:
         return [get_fasttext_requirement()]
-    def clone(self) -> PredictorBase:
-        return self.__class__(self.path_weights, self.categories)
+    def clone(self) -> FasttextLangDetector:
+        return self.__class__(self.path_weights, self.categories.get_categories(), self.categories_orig)
     @staticmethod
-    def get_wrapped_model(path_weights: str) -> Any:
+    def get_wrapped_model(path_weights: PathLikeOrStr) -> Any:
         """
         Get the wrapped model
         :param path_weights: path to model weights
         """
-        return load_model(path_weights)
+        return load_model(os.fspath(path_weights))

deepdoctection 0.32__py3-none-any.whl → 0.34__py3-none-any.whl

Potentially problematic release.

deepdoctection 0.32__py3-none-any.whl → 0.34__py3-none-any.whl