PyPI - deepdoctection - Versions diffs - 0.31__py3-none-any.whl → 0.33__py3-none-any.whl - Mend

deepdoctection 0.31__py3-none-any.whl → 0.33__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of deepdoctection might be problematic. Click here for more details.

Files changed (131)

deepdoctection/__init__.py +16 -29
deepdoctection/analyzer/dd.py +70 -59
deepdoctection/configs/conf_dd_one.yaml +34 -31
deepdoctection/dataflow/common.py +9 -5
deepdoctection/dataflow/custom.py +5 -5
deepdoctection/dataflow/custom_serialize.py +75 -18
deepdoctection/dataflow/parallel_map.py +3 -3
deepdoctection/dataflow/serialize.py +4 -4
deepdoctection/dataflow/stats.py +3 -3
deepdoctection/datapoint/annotation.py +41 -56
deepdoctection/datapoint/box.py +9 -8
deepdoctection/datapoint/convert.py +6 -6
deepdoctection/datapoint/image.py +56 -44
deepdoctection/datapoint/view.py +245 -150
deepdoctection/datasets/__init__.py +1 -4
deepdoctection/datasets/adapter.py +35 -26
deepdoctection/datasets/base.py +14 -12
deepdoctection/datasets/dataflow_builder.py +3 -3
deepdoctection/datasets/info.py +24 -26
deepdoctection/datasets/instances/doclaynet.py +51 -51
deepdoctection/datasets/instances/fintabnet.py +46 -46
deepdoctection/datasets/instances/funsd.py +25 -24
deepdoctection/datasets/instances/iiitar13k.py +13 -10
deepdoctection/datasets/instances/layouttest.py +4 -3
deepdoctection/datasets/instances/publaynet.py +5 -5
deepdoctection/datasets/instances/pubtables1m.py +24 -21
deepdoctection/datasets/instances/pubtabnet.py +32 -30
deepdoctection/datasets/instances/rvlcdip.py +30 -30
deepdoctection/datasets/instances/xfund.py +26 -26
deepdoctection/datasets/save.py +6 -6
deepdoctection/eval/__init__.py +1 -4
deepdoctection/eval/accmetric.py +32 -33
deepdoctection/eval/base.py +8 -9
deepdoctection/eval/cocometric.py +15 -13
deepdoctection/eval/eval.py +41 -37
deepdoctection/eval/tedsmetric.py +30 -23
deepdoctection/eval/tp_eval_callback.py +16 -19
deepdoctection/extern/__init__.py +2 -7
deepdoctection/extern/base.py +339 -134
deepdoctection/extern/d2detect.py +85 -113
deepdoctection/extern/deskew.py +14 -11
deepdoctection/extern/doctrocr.py +141 -130
deepdoctection/extern/fastlang.py +27 -18
deepdoctection/extern/hfdetr.py +71 -62
deepdoctection/extern/hflayoutlm.py +504 -211
deepdoctection/extern/hflm.py +230 -0
deepdoctection/extern/model.py +488 -302
deepdoctection/extern/pdftext.py +23 -19
deepdoctection/extern/pt/__init__.py +1 -3
deepdoctection/extern/pt/nms.py +6 -2
deepdoctection/extern/pt/ptutils.py +29 -19
deepdoctection/extern/tessocr.py +39 -38
deepdoctection/extern/texocr.py +18 -18
deepdoctection/extern/tp/tfutils.py +57 -9
deepdoctection/extern/tp/tpcompat.py +21 -14
deepdoctection/extern/tp/tpfrcnn/__init__.py +20 -0
deepdoctection/extern/tp/tpfrcnn/common.py +7 -3
deepdoctection/extern/tp/tpfrcnn/config/__init__.py +20 -0
deepdoctection/extern/tp/tpfrcnn/config/config.py +13 -10
deepdoctection/extern/tp/tpfrcnn/modeling/__init__.py +20 -0
deepdoctection/extern/tp/tpfrcnn/modeling/backbone.py +18 -8
deepdoctection/extern/tp/tpfrcnn/modeling/generalized_rcnn.py +12 -6
deepdoctection/extern/tp/tpfrcnn/modeling/model_box.py +14 -9
deepdoctection/extern/tp/tpfrcnn/modeling/model_cascade.py +8 -5
deepdoctection/extern/tp/tpfrcnn/modeling/model_fpn.py +22 -17
deepdoctection/extern/tp/tpfrcnn/modeling/model_frcnn.py +21 -14
deepdoctection/extern/tp/tpfrcnn/modeling/model_mrcnn.py +19 -11
deepdoctection/extern/tp/tpfrcnn/modeling/model_rpn.py +15 -10
deepdoctection/extern/tp/tpfrcnn/predict.py +9 -4
deepdoctection/extern/tp/tpfrcnn/preproc.py +12 -8
deepdoctection/extern/tp/tpfrcnn/utils/__init__.py +20 -0
deepdoctection/extern/tp/tpfrcnn/utils/box_ops.py +10 -2
deepdoctection/extern/tpdetect.py +45 -53
deepdoctection/mapper/__init__.py +3 -8
deepdoctection/mapper/cats.py +27 -29
deepdoctection/mapper/cocostruct.py +10 -10
deepdoctection/mapper/d2struct.py +27 -26
deepdoctection/mapper/hfstruct.py +13 -8
deepdoctection/mapper/laylmstruct.py +178 -37
deepdoctection/mapper/maputils.py +12 -11
deepdoctection/mapper/match.py +2 -2
deepdoctection/mapper/misc.py +11 -9
deepdoctection/mapper/pascalstruct.py +4 -4
deepdoctection/mapper/prodigystruct.py +5 -5
deepdoctection/mapper/pubstruct.py +84 -92
deepdoctection/mapper/tpstruct.py +5 -5
deepdoctection/mapper/xfundstruct.py +33 -33
deepdoctection/pipe/__init__.py +1 -1
deepdoctection/pipe/anngen.py +12 -14
deepdoctection/pipe/base.py +52 -106
deepdoctection/pipe/common.py +72 -59
deepdoctection/pipe/concurrency.py +16 -11
deepdoctection/pipe/doctectionpipe.py +24 -21
deepdoctection/pipe/language.py +20 -25
deepdoctection/pipe/layout.py +20 -16
deepdoctection/pipe/lm.py +75 -105
deepdoctection/pipe/order.py +194 -89
deepdoctection/pipe/refine.py +111 -124
deepdoctection/pipe/segment.py +156 -161
deepdoctection/pipe/{cell.py → sub_layout.py} +50 -40
deepdoctection/pipe/text.py +37 -36
deepdoctection/pipe/transform.py +19 -16
deepdoctection/train/__init__.py +6 -12
deepdoctection/train/d2_frcnn_train.py +48 -41
deepdoctection/train/hf_detr_train.py +41 -30
deepdoctection/train/hf_layoutlm_train.py +153 -135
deepdoctection/train/tp_frcnn_train.py +32 -31
deepdoctection/utils/concurrency.py +1 -1
deepdoctection/utils/context.py +13 -6
deepdoctection/utils/develop.py +4 -4
deepdoctection/utils/env_info.py +87 -125
deepdoctection/utils/file_utils.py +6 -11
deepdoctection/utils/fs.py +22 -18
deepdoctection/utils/identifier.py +2 -2
deepdoctection/utils/logger.py +16 -15
deepdoctection/utils/metacfg.py +7 -7
deepdoctection/utils/mocks.py +93 -0
deepdoctection/utils/pdf_utils.py +11 -11
deepdoctection/utils/settings.py +185 -181
deepdoctection/utils/tqdm.py +1 -1
deepdoctection/utils/transform.py +14 -9
deepdoctection/utils/types.py +104 -0
deepdoctection/utils/utils.py +7 -7
deepdoctection/utils/viz.py +74 -72
{deepdoctection-0.31.dist-info → deepdoctection-0.33.dist-info}/METADATA +30 -21
deepdoctection-0.33.dist-info/RECORD +146 -0
{deepdoctection-0.31.dist-info → deepdoctection-0.33.dist-info}/WHEEL +1 -1
deepdoctection/utils/detection_types.py +0 -68
deepdoctection-0.31.dist-info/RECORD +0 -144
{deepdoctection-0.31.dist-info → deepdoctection-0.33.dist-info}/LICENSE +0 -0
{deepdoctection-0.31.dist-info → deepdoctection-0.33.dist-info}/top_level.txt +0 -0

deepdoctection/extern/base.py CHANGED Viewed

@@ -19,14 +19,211 @@
 """
 Abstract classes for unifying external base- and Doctection predictors
 """
+from __future__ import annotations
 from abc import ABC, abstractmethod
-from dataclasses import dataclass
-from typing import Any, Dict, List, Mapping, Optional, Tuple, Union
+from dataclasses import dataclass, field
+from types import MappingProxyType
+from typing import TYPE_CHECKING, Any, Literal, Mapping, Optional, Sequence, Union, overload
+from lazy_imports import try_import
-from ..utils.detection_types import ImageType, JsonDict, Requirement
 from ..utils.identifier import get_uuid_from_str
-from ..utils.settings import DefaultType, ObjectTypes, TypeOrStr, get_type
+from ..utils.logger import logger
+from ..utils.settings import (
+    DefaultType,
+    ObjectTypes,
+    TypeOrStr,
+    get_type,
+    token_class_tag_to_token_class_with_tag,
+    token_class_with_tag_to_token_class_and_tag,
+)
+from ..utils.types import JsonDict, PixelValues, Requirement
+if TYPE_CHECKING:
+    with try_import() as import_guard:
+        import torch
+@dataclass
+class ModelCategories:
+    """
+    Categories for models (except models for NER tasks) are managed in this class. Different to DatasetCategories,
+    these members are immutable.
+    **Example**:
+        categories = ModelCategories(init_categories={1: "text", 2: "title"})
+        cats = categories.get_categories(as_dict=True)  # {1: LayoutType.text, 2: LayoutType.title}
+        categories.filter_categories = [LayoutType.text]  # filter out text
+        cats = categories.get_categories(as_dict=True)  # {2: LayoutType.title}
+    """
+    init_categories: Optional[Mapping[int, TypeOrStr]] = field(repr=False)
+    _init_categories: MappingProxyType[int, ObjectTypes] = field(init=False, repr=False)
+    _filter_categories: Sequence[ObjectTypes] = field(init=False, repr=False, default_factory=tuple)
+    categories: MappingProxyType[int, ObjectTypes] = field(init=False)
+    def __post_init__(self) -> None:
+        """post init method"""
+        if self.init_categories:
+            self._init_categories = MappingProxyType({key: get_type(val) for key, val in self.init_categories.items()})
+        else:
+            if self._init_categories is None:
+                self._init_categories = MappingProxyType({})
+        self.categories = self._init_categories
+    @overload
+    def get_categories(self, as_dict: Literal[False]) -> tuple[ObjectTypes, ...]:
+        ...
+    @overload
+    def get_categories(
+        self, as_dict: Literal[True] = ..., name_as_key: Literal[False] = False
+    ) -> MappingProxyType[int, ObjectTypes]:
+        ...
+    @overload
+    def get_categories(self, as_dict: Literal[True], name_as_key: Literal[True]) -> MappingProxyType[ObjectTypes, int]:
+        ...
+    def get_categories(
+        self, as_dict: bool = True, name_as_key: bool = False
+    ) -> Union[MappingProxyType[int, ObjectTypes], MappingProxyType[ObjectTypes, int], tuple[ObjectTypes, ...]]:
+        """
+        Get the categories
+        :param as_dict: return as dict
+        :param name_as_key: if as_dict=`True` and name_as_key=`True` will swap key and value
+        :return: categories dict
+        """
+        if as_dict:
+            if name_as_key:
+                return MappingProxyType(
+                    {value: key for key, value in self._init_categories.items() if value not in self.filter_categories}
+                )
+            return MappingProxyType(
+                {key: value for key, value in self._init_categories.items() if value not in self.filter_categories}
+            )
+        return tuple(val for val in self._init_categories.values() if val not in self.filter_categories)
+    @property
+    def filter_categories(self) -> Sequence[ObjectTypes]:
+        """filter_categories"""
+        return self._filter_categories
+    @filter_categories.setter
+    def filter_categories(self, categories: Sequence[ObjectTypes]) -> None:
+        """categories setter"""
+        self._filter_categories = categories
+        self.categories = self.get_categories()
+    def shift_category_ids(self, shift_by: int) -> MappingProxyType[int, ObjectTypes]:
+        """
+        Shift category ids
+         **Example**:
+            categories = ModelCategories(init_categories={"1": "text", "2": "title"})
+            cats = categories.shift_category_ids(1) # {"2": LayoutType.text, "3": LayoutType.title}
+        :param shift_by: The value to shift the category id to the left or to the right
+        :return: shifted categories
+        """
+        return MappingProxyType({k + shift_by: v for k, v in self.get_categories().items()})
+@dataclass
+class NerModelCategories(ModelCategories):
+    """
+    Categories for models for NER tasks. It can handle the merging of token classes and bio tags to build a new set
+    of categories.
+    **Example**:
+        categories = NerModelCategories(categories_semantics=["question", "answer"], categories_bio=["B", "I"])
+        cats = categories.get_categories(as_dict=True)  # {"1": TokenClassWithTag.b_question,
+                                                           "2": TokenClassWithTag.i_question,
+                                                           "3": TokenClassWithTag.b_answer,
+                                                           "4": TokenClassWithTag.i_answer}
+    You can also leave the categories unchanged:
+    **Example**:
+        categories = NerModelCategories(init_categories={"1": "question", "2": "answer"})
+        cats = categories.get_categories(as_dict=True)  # {"1": TokenClasses.question,
+                                                           "2": TokenClasses.answer}
+    """
+    categories_semantics: Optional[Sequence[TypeOrStr]] = field(default=None)
+    categories_bio: Optional[Sequence[TypeOrStr]] = field(default=None)
+    _categories_semantics: tuple[ObjectTypes, ...] = field(init=False, repr=False)
+    _categories_bio: tuple[ObjectTypes, ...] = field(init=False, repr=False)
+    def __post_init__(self) -> None:
+        if not self.init_categories:
+            if not self.categories_semantics:
+                raise ValueError("If categories is None then categories_semantics cannot be None")
+            if not self.categories_bio:
+                raise ValueError("If categories is None then categories_bio cannot be None")
+        else:
+            self._init_categories = MappingProxyType({key: get_type(val) for key, val in self.init_categories.items()})
+        if self.categories_bio:
+            self._categories_bio = tuple((get_type(cat) for cat in self.categories_bio))
+        if self.categories_semantics:
+            self._categories_semantics = tuple((get_type(cat) for cat in self.categories_semantics))
+        if self.categories_bio and self.categories_semantics and self.init_categories:
+            logger.info("Will disregard categories_bio and categories_semantics")
+        if self.categories_bio and self.categories_semantics:
+            self._init_categories = self.merge_bio_semantics_categories(
+                self._categories_semantics, self._categories_bio
+            )
+        super().__post_init__()
+    @staticmethod
+    def merge_bio_semantics_categories(
+        categories_semantics: tuple[ObjectTypes, ...], categories_bio: tuple[ObjectTypes, ...]
+    ) -> MappingProxyType[int, ObjectTypes]:
+        """
+        Merge bio and semantics categories
+        **Example**:
+            categories = NerModelCategories(categories_semantics=["question", "answer"], categories_bio=["B", "I"])
+            cats = categories.get_categories(as_dict=True)  # {"1": TokenClassWithTag.b_question,
+                                                               "2": TokenClassWithTag.i_question,
+                                                               "3": TokenClassWithTag.b_answer,
+                                                               "4": TokenClassWithTag.i_answer}
+        :param categories_semantics: semantic categories (without tags)
+        :param categories_bio: bio tags
+        :return: A mapping of categories with tags
+        """
+        categories_list = sorted(
+            {
+                token_class_tag_to_token_class_with_tag(token, tag)
+                for token in categories_semantics
+                for tag in categories_bio
+            }
+        )
+        return MappingProxyType(dict(enumerate(categories_list, 1)))
+    @staticmethod
+    def disentangle_token_class_and_tag(category_name: ObjectTypes) -> Optional[tuple[ObjectTypes, ObjectTypes]]:
+        """
+        Disentangle token class and tag. It will return separate ObjectTypes for token class and tag.
+        **Example**:
+             NerModelCategories.disentangle_token_class_and_tag(TokenClassWithTag.b_question)
+             # (TokenClasses.question, TokenTags.begin)
+        :param category_name: A category name with token class and tag
+        :return: Tuple of disentangled token class and tag
+        """
+        return token_class_with_tag_to_token_class_and_tag(category_name)
 class PredictorBase(ABC):
@@ -51,14 +248,14 @@ class PredictorBase(ABC):
     @classmethod
     @abstractmethod
-    def get_requirements(cls) -> List[Requirement]:
+    def get_requirements(cls) -> list[Requirement]:
         """
         Get a list of requirements for running the detector
         """
         raise NotImplementedError()
     @abstractmethod
-    def clone(self) -> "PredictorBase":
+    def clone(self) -> PredictorBase:
         """
         Clone an instance
         """
@@ -72,6 +269,16 @@ class PredictorBase(ABC):
             return get_uuid_from_str(self.name)[:8]
         raise ValueError("name must be set before calling get_model_id")
+    def clear_model(self) -> None:
+        """
+        Clear the inner model of the model wrapper if it has one. Needed for model updates during training.
+        """
+        raise NotImplementedError(
+            "Maybe you forgot to implement this method in your pipeline component. This might "
+            "be the case when you run evaluation during training and need to update the "
+            "trained model in your pipeline component."
+        )
 @dataclass
 class DetectionResult:
@@ -101,24 +308,24 @@ class DetectionResult:
     """
-    box: Optional[List[float]] = None
+    box: Optional[list[float]] = None
     class_id: Optional[int] = None
     score: Optional[float] = None
-    mask: Optional[List[float]] = None
+    mask: Optional[list[float]] = None
     absolute_coords: bool = True
-    class_name: ObjectTypes = DefaultType.default_type
+    class_name: ObjectTypes = DefaultType.DEFAULT_TYPE
     text: Optional[Union[str, ObjectTypes]] = None
     block: Optional[str] = None
     line: Optional[str] = None
     uuid: Optional[str] = None
-    relationships: Optional[Dict[str, Any]] = None
+    relationships: Optional[dict[str, Any]] = None
     angle: Optional[float] = None
-class ObjectDetector(PredictorBase):
+class ObjectDetector(PredictorBase, ABC):
     """
     Abstract base class for object detection. This can be anything ranging from layout detection to OCR.
-    Use this to connect external detectors with Deep-Doctection predictors on images.
+    Use this to connect external detectors with deepdoctection predictors on images.
     **Example:**
@@ -127,20 +334,10 @@ class ObjectDetector(PredictorBase):
     and implement the `predict`.
     """
-    _categories: Mapping[str, ObjectTypes]
-    @property
-    def categories(self) -> Mapping[str, ObjectTypes]:
-        """categories"""
-        return self._categories
-    @categories.setter
-    def categories(self, categories: Mapping[str, TypeOrStr]) -> None:
-        """categories setter"""
-        self._categories = {key: get_type(value) for key, value in categories.items()}
+    categories: ModelCategories
     @abstractmethod
-    def predict(self, np_img: ImageType) -> List[DetectionResult]:
+    def predict(self, np_img: PixelValues) -> list[DetectionResult]:
         """
         Abstract method predict
         """
@@ -153,48 +350,45 @@ class ObjectDetector(PredictorBase):
         """
         return False
-    def possible_categories(self) -> List[ObjectTypes]:
+    @abstractmethod
+    def get_category_names(self) -> tuple[ObjectTypes, ...]:
+        """
+        Abstract method get_category_names
         """
-        Abstract method possible_categories. Must implement a method that returns a list of possible detectable
-        categories
+        raise NotImplementedError()
+    @abstractmethod
+    def clone(self) -> ObjectDetector:
+        """
+        Clone an instance
         """
-        return list(self.categories.values())
+        raise NotImplementedError()
-class PdfMiner(PredictorBase):
+class PdfMiner(PredictorBase, ABC):
     """
     Abstract base class for mining information from PDF documents. Reads in a bytes stream from a PDF document page.
     Use this to connect external pdf miners and wrap them into Deep-Doctection predictors.
     """
-    _categories: Mapping[str, ObjectTypes]
+    categories: ModelCategories
     _pdf_bytes: Optional[bytes] = None
-    _page: Any = None
-    @property
-    def categories(self) -> Mapping[str, ObjectTypes]:
-        """categories"""
-        return self._categories
-    @categories.setter
-    def categories(self, categories: Mapping[str, TypeOrStr]) -> None:
-        self._categories = {key: get_type(value) for key, value in categories.items()}
     @abstractmethod
-    def predict(self, pdf_bytes: bytes) -> List[DetectionResult]:
+    def predict(self, pdf_bytes: bytes) -> list[DetectionResult]:
         """
         Abstract method predict
         """
         raise NotImplementedError()
     @abstractmethod
-    def get_width_height(self, pdf_bytes: bytes) -> Tuple[float, float]:
+    def get_width_height(self, pdf_bytes: bytes) -> tuple[float, float]:
         """
         Abstract method get_width_height
         """
         raise NotImplementedError()
-    def clone(self) -> PredictorBase:
+    def clone(self) -> PdfMiner:
         return self.__class__()
     @property
@@ -204,14 +398,15 @@ class PdfMiner(PredictorBase):
         """
         return False
-    def possible_categories(self) -> List[ObjectTypes]:
+    @abstractmethod
+    def get_category_names(self) -> tuple[ObjectTypes, ...]:
         """
-        Returns a list of possible detectable categories
+        Abstract method get_category_names
         """
-        return list(self.categories.values())
+        raise NotImplementedError()
-class TextRecognizer(PredictorBase):
+class TextRecognizer(PredictorBase, ABC):
     """
     Abstract base class for text recognition. In contrast to ObjectDetector one assumes that `predict` accepts
     batches of numpy arrays. More precisely, when using `predict` pass a list of tuples with uuids (e.g. image_id,
@@ -219,7 +414,7 @@ class TextRecognizer(PredictorBase):
     """
     @abstractmethod
-    def predict(self, images: List[Tuple[str, ImageType]]) -> List[DetectionResult]:
+    def predict(self, images: list[tuple[str, PixelValues]]) -> list[DetectionResult]:
         """
         Abstract method predict
         """
@@ -232,6 +427,11 @@ class TextRecognizer(PredictorBase):
         """
         return True
+    @staticmethod
+    def get_category_names() -> tuple[ObjectTypes, ...]:
+        """return category names"""
+        return ()
 @dataclass
 class TokenClassResult:
@@ -258,9 +458,9 @@ class TokenClassResult:
     uuid: str
     token: str
     class_id: int
-    class_name: ObjectTypes = DefaultType.default_type
-    semantic_name: ObjectTypes = DefaultType.default_type
-    bio_tag: ObjectTypes = DefaultType.default_type
+    class_name: ObjectTypes = DefaultType.DEFAULT_TYPE
+    semantic_name: ObjectTypes = DefaultType.DEFAULT_TYPE
+    bio_tag: ObjectTypes = DefaultType.DEFAULT_TYPE
     score: Optional[float] = None
     token_id: Optional[int] = None
@@ -277,123 +477,137 @@ class SequenceClassResult:
     """
     class_id: int
-    class_name: ObjectTypes = DefaultType.default_type
+    class_name: ObjectTypes = DefaultType.DEFAULT_TYPE
     score: Optional[float] = None
     class_name_orig: Optional[str] = None
-class LMTokenClassifier(PredictorBase):
+class LMTokenClassifier(PredictorBase, ABC):
     """
     Abstract base class for token classifiers. If you want to connect external token classifiers with Deepdoctection
     predictors wrap them into a class derived from this class. Note, that this class is still DL library agnostic.
     """
-    _categories: Mapping[str, ObjectTypes]
-    @property
-    def categories(self) -> Mapping[str, ObjectTypes]:
-        """categories"""
-        return self._categories
-    @categories.setter
-    def categories(self, categories: Mapping[str, TypeOrStr]) -> None:
-        """categories setter"""
-        self._categories = {key: get_type(value) for key, value in categories.items()}
     @abstractmethod
-    def predict(self, **encodings: Union[List[List[str]], "torch.Tensor"]) -> List[TokenClassResult]:  # type: ignore
+    def predict(self, **encodings: Union[list[list[str]], torch.Tensor]) -> list[TokenClassResult]:
         """
         Abstract method predict
         """
         raise NotImplementedError()
-    def possible_tokens(self) -> List[ObjectTypes]:
-        """
-        Returns a list of possible detectable tokens
+    @staticmethod
+    def default_kwargs_for_image_to_features_mapping() -> JsonDict:
         """
-        return list(self.categories.values())
+        Some models require that their inputs must be pre-processed in a specific way. Responsible for converting
+        an `Image` datapoint into the input format in inference mode is a mapper function which is called
+        in a pipeline component. The mapper function's name, which has to be used must be specified in the returned
+        value of `image_to_features_mapping`.
+        This mapper function is often implemented for various models and can therefore have various parameters.
+        Some parameters can be inferred from the config file of the model parametrization. Some other might not be
+        in the parametrization and therefore have to be specified here.
-    @abstractmethod
-    def clone(self) -> "LMTokenClassifier":
-        """
-        Clone an instance
+        This method therefore returns a dictionary that contains as keys some arguments of the function
+        `image_to_features_mapping` and as values the values necessary for providing the model with the required input.
         """
-        raise NotImplementedError()
+        return {}
     @staticmethod
-    def default_kwargs_for_input_mapping() -> JsonDict:
+    def image_to_raw_features_mapping() -> str:
+        """Converting image into model features must often be divided into several steps. This is because the process
+        method during training and serving might differ: For training there might be additional augmentation steps
+        required or one might add some data batching. For this reason we have added two methods
+        `image_to_raw_features_mapping`, `image_to_features_mapping` that return a mapping function name for either for
+        training or inference purposes:
+        `image_to_raw_features_mapping` is used for training and transforms an image into raw features that can be
+        further processed through augmentation or batching. It should not be used when running inference, i.e. when
+        running the model in a pipeline component.
         """
-        Add some default arguments that might be necessary when preparing a sample. Overwrite this method
-        for some custom setting. `default_arguments_for_input_mapping` in `LMTokenClassifierService`.
+        return ""
+    @staticmethod
+    def image_to_features_mapping() -> str:
+        """Converting image into model features must often be divided into several steps. This is because the process
+        method during training and serving might differ: For training there might be additional augmentation steps
+        required or one might add some data batching. For this reason we have added two methods
+        `image_to_raw_features_mapping`, `image_to_features_mapping` that return a mapping function name for either for
+        training or inference purposes:
+        `image_to_features_mapping` is a mapping function that converts a single image into ready features that can
+        be directly fed into the model. We use this function to determine the input format of the model in a pipeline
+        component. Note that this function will also require specific parameters, which can be specified in
+        `default_kwargs_for_image_to_features_mapping`.
         """
-        return {}
+        return ""
-class LMSequenceClassifier(PredictorBase):
+class LMSequenceClassifier(PredictorBase, ABC):
     """
     Abstract base class for sequence classification. If you want to connect external sequence classifiers with
     deepdoctection predictors, wrap them into a class derived from this class.
     """
-    _categories: Mapping[str, ObjectTypes]
-    @property
-    def categories(self) -> Mapping[str, ObjectTypes]:
-        """categories"""
-        return self._categories
-    @categories.setter
-    def categories(self, categories: Mapping[str, TypeOrStr]) -> None:
-        """categories setter"""
-        self._categories = {key: get_type(value) for key, value in categories.items()}
     @abstractmethod
-    def predict(self, **encodings: Union[List[List[str]], "torch.Tensor"]) -> SequenceClassResult:  # type: ignore
+    def predict(self, **encodings: Union[list[list[str]], torch.Tensor]) -> SequenceClassResult:
         """
         Abstract method predict
         """
         raise NotImplementedError()
-    def possible_categories(self) -> List[ObjectTypes]:
-        """
-        Returns a list of possible detectable categories for a sequence
+    @staticmethod
+    def default_kwargs_for_image_to_features_mapping() -> JsonDict:
         """
-        return list(self.categories.values())
+        Some models require that their inputs must be pre-processed in a specific way. Responsible for converting
+        an `Image` datapoint into the input format in inference mode is a mapper function which is called
+        in a pipeline component. The mapper function's name, which has to be used must be specified in the returned
+        value of `image_to_features_mapping`.
+        This mapper function is often implemented for various models and can therefore have various parameters.
+        Some parameters can be inferred from the config file of the model parametrization. Some other might not be
+        in the parametrization and therefore have to be specified here.
-    @abstractmethod
-    def clone(self) -> "LMSequenceClassifier":
-        """
-        Clone an instance
+        This method therefore returns a dictionary that contains as keys some arguments of the function
+        `image_to_features_mapping` and as values the values necessary for providing the model with the required input.
         """
-        raise NotImplementedError()
+        return {}
     @staticmethod
-    def default_kwargs_for_input_mapping() -> JsonDict:
+    def image_to_raw_features_mapping() -> str:
+        """Converting image into model features must often be divided into several steps. This is because the process
+        method during training and serving might differ: For training there might be additional augmentation steps
+        required or one might add some data batching. For this reason we have added two methods
+        `image_to_raw_features_mapping`, `image_to_features_mapping` that return a mapping function name for either for
+        training or inference purposes:
+        `image_to_raw_features_mapping` is used for training and transforms an image into raw features that can be
+        further processed through augmentation or batching. It should not be used when running inference, i.e. when
+        running the model in a pipeline component.
         """
-        Add some default arguments that might be necessary when preparing a sample. Overwrite this method
-        for some custom setting. `default_arguments_for_input_mapping` in `LMTokenClassifierService`.
+        return ""
+    @staticmethod
+    def image_to_features_mapping() -> str:
+        """Converting image into model features must often be divided into several steps. This is because the process
+        method during training and serving might differ: For training there might be additional augmentation steps
+        required or one might add some data batching. For this reason we have added two methods
+        `image_to_raw_features_mapping`, `image_to_features_mapping` that return a mapping function name for either for
+        training or inference purposes:
+        `image_to_features_mapping` is a mapping function that converts a single image into ready features that can
+        be directly fed into the model. We use this function to determine the input format of the model in a pipeline
+        component. Note that this function will also require specific parameters, which can be specified in
+        `default_kwargs_for_image_to_features_mapping`.
         """
-        return {}
+        return ""
-class LanguageDetector(PredictorBase):
+class LanguageDetector(PredictorBase, ABC):
     """
     Abstract base class for language detectors. The `predict` accepts a string of arbitrary length and returns an
     ISO-639 code for the detected language.
     """
-    _categories: Mapping[str, ObjectTypes]
-    @property
-    def categories(self) -> Mapping[str, ObjectTypes]:
-        """categories"""
-        return self._categories
-    @categories.setter
-    def categories(self, categories: Mapping[str, TypeOrStr]) -> None:
-        """categories setter"""
-        self._categories = {key: get_type(value) for key, value in categories.items()}
     @abstractmethod
     def predict(self, text_string: str) -> DetectionResult:
         """
@@ -401,39 +615,30 @@ class LanguageDetector(PredictorBase):
         """
         raise NotImplementedError()
-    def possible_languages(self) -> List[ObjectTypes]:
-        """
-        Returns a list of possible detectable languages
-        """
-        return list(self.categories.values())
-class ImageTransformer(PredictorBase):
+class ImageTransformer(PredictorBase, ABC):
     """
     Abstract base class for transforming an image. The `transform` accepts and returns a numpy array
     """
     @abstractmethod
-    def transform(self, np_img: ImageType, specification: DetectionResult) -> ImageType:
+    def transform(self, np_img: PixelValues, specification: DetectionResult) -> PixelValues:
         """
         Abstract method transform
         """
         raise NotImplementedError()
     @abstractmethod
-    def predict(self, np_img: ImageType) -> DetectionResult:
+    def predict(self, np_img: PixelValues) -> DetectionResult:
         """
         Abstract method predict
         """
         raise NotImplementedError()
-    def clone(self) -> PredictorBase:
+    def clone(self) -> ImageTransformer:
         return self.__class__()
-    @staticmethod
     @abstractmethod
-    def possible_category() -> ObjectTypes:
-        """
-        Returns a (single) category the `ImageTransformer` can predict
-        """
+    def get_category_names(self) -> tuple[ObjectTypes, ...]:
+        """returns category names"""
         raise NotImplementedError()

deepdoctection 0.31__py3-none-any.whl → 0.33__py3-none-any.whl

Potentially problematic release.

deepdoctection 0.31__py3-none-any.whl → 0.33__py3-none-any.whl