PyPI - deepdoctection - Versions diffs - 0.42.0__py3-none-any.whl → 0.43__py3-none-any.whl - Mend

deepdoctection 0.42.0__py3-none-any.whl → 0.43__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of deepdoctection might be problematic. Click here for more details.

Files changed (124) hide show

deepdoctection/__init__.py +2 -1
deepdoctection/analyzer/__init__.py +2 -1
deepdoctection/analyzer/config.py +904 -0
deepdoctection/analyzer/dd.py +36 -62
deepdoctection/analyzer/factory.py +311 -141
deepdoctection/configs/conf_dd_one.yaml +100 -44
deepdoctection/configs/profiles.jsonl +32 -0
deepdoctection/dataflow/__init__.py +9 -6
deepdoctection/dataflow/base.py +33 -15
deepdoctection/dataflow/common.py +96 -75
deepdoctection/dataflow/custom.py +36 -29
deepdoctection/dataflow/custom_serialize.py +135 -91
deepdoctection/dataflow/parallel_map.py +33 -31
deepdoctection/dataflow/serialize.py +15 -10
deepdoctection/dataflow/stats.py +41 -28
deepdoctection/datapoint/__init__.py +4 -6
deepdoctection/datapoint/annotation.py +104 -66
deepdoctection/datapoint/box.py +190 -130
deepdoctection/datapoint/convert.py +66 -39
deepdoctection/datapoint/image.py +151 -95
deepdoctection/datapoint/view.py +383 -236
deepdoctection/datasets/__init__.py +2 -6
deepdoctection/datasets/adapter.py +11 -11
deepdoctection/datasets/base.py +118 -81
deepdoctection/datasets/dataflow_builder.py +18 -12
deepdoctection/datasets/info.py +76 -57
deepdoctection/datasets/instances/__init__.py +6 -2
deepdoctection/datasets/instances/doclaynet.py +17 -14
deepdoctection/datasets/instances/fintabnet.py +16 -22
deepdoctection/datasets/instances/funsd.py +11 -6
deepdoctection/datasets/instances/iiitar13k.py +9 -9
deepdoctection/datasets/instances/layouttest.py +9 -9
deepdoctection/datasets/instances/publaynet.py +9 -9
deepdoctection/datasets/instances/pubtables1m.py +13 -13
deepdoctection/datasets/instances/pubtabnet.py +13 -15
deepdoctection/datasets/instances/rvlcdip.py +8 -8
deepdoctection/datasets/instances/xfund.py +11 -9
deepdoctection/datasets/registry.py +18 -11
deepdoctection/datasets/save.py +12 -11
deepdoctection/eval/__init__.py +3 -2
deepdoctection/eval/accmetric.py +72 -52
deepdoctection/eval/base.py +29 -10
deepdoctection/eval/cocometric.py +14 -12
deepdoctection/eval/eval.py +56 -41
deepdoctection/eval/registry.py +6 -3
deepdoctection/eval/tedsmetric.py +24 -9
deepdoctection/eval/tp_eval_callback.py +13 -12
deepdoctection/extern/__init__.py +1 -1
deepdoctection/extern/base.py +176 -97
deepdoctection/extern/d2detect.py +127 -92
deepdoctection/extern/deskew.py +19 -10
deepdoctection/extern/doctrocr.py +157 -106
deepdoctection/extern/fastlang.py +25 -17
deepdoctection/extern/hfdetr.py +137 -60
deepdoctection/extern/hflayoutlm.py +329 -248
deepdoctection/extern/hflm.py +67 -33
deepdoctection/extern/model.py +108 -762
deepdoctection/extern/pdftext.py +37 -12
deepdoctection/extern/pt/nms.py +15 -1
deepdoctection/extern/pt/ptutils.py +13 -9
deepdoctection/extern/tessocr.py +87 -54
deepdoctection/extern/texocr.py +29 -14
deepdoctection/extern/tp/tfutils.py +36 -8
deepdoctection/extern/tp/tpcompat.py +54 -16
deepdoctection/extern/tp/tpfrcnn/config/config.py +20 -4
deepdoctection/extern/tpdetect.py +4 -2
deepdoctection/mapper/__init__.py +1 -1
deepdoctection/mapper/cats.py +117 -76
deepdoctection/mapper/cocostruct.py +35 -17
deepdoctection/mapper/d2struct.py +56 -29
deepdoctection/mapper/hfstruct.py +32 -19
deepdoctection/mapper/laylmstruct.py +221 -185
deepdoctection/mapper/maputils.py +71 -35
deepdoctection/mapper/match.py +76 -62
deepdoctection/mapper/misc.py +68 -44
deepdoctection/mapper/pascalstruct.py +13 -12
deepdoctection/mapper/prodigystruct.py +33 -19
deepdoctection/mapper/pubstruct.py +42 -32
deepdoctection/mapper/tpstruct.py +39 -19
deepdoctection/mapper/xfundstruct.py +20 -13
deepdoctection/pipe/__init__.py +1 -2
deepdoctection/pipe/anngen.py +104 -62
deepdoctection/pipe/base.py +226 -107
deepdoctection/pipe/common.py +206 -123
deepdoctection/pipe/concurrency.py +74 -47
deepdoctection/pipe/doctectionpipe.py +108 -47
deepdoctection/pipe/language.py +41 -24
deepdoctection/pipe/layout.py +45 -18
deepdoctection/pipe/lm.py +146 -78
deepdoctection/pipe/order.py +196 -113
deepdoctection/pipe/refine.py +111 -63
deepdoctection/pipe/registry.py +1 -1
deepdoctection/pipe/segment.py +213 -142
deepdoctection/pipe/sub_layout.py +76 -46
deepdoctection/pipe/text.py +52 -33
deepdoctection/pipe/transform.py +8 -6
deepdoctection/train/d2_frcnn_train.py +87 -69
deepdoctection/train/hf_detr_train.py +72 -40
deepdoctection/train/hf_layoutlm_train.py +85 -46
deepdoctection/train/tp_frcnn_train.py +56 -28
deepdoctection/utils/concurrency.py +59 -16
deepdoctection/utils/context.py +40 -19
deepdoctection/utils/develop.py +25 -17
deepdoctection/utils/env_info.py +85 -36
deepdoctection/utils/error.py +16 -10
deepdoctection/utils/file_utils.py +246 -62
deepdoctection/utils/fs.py +162 -43
deepdoctection/utils/identifier.py +29 -16
deepdoctection/utils/logger.py +49 -32
deepdoctection/utils/metacfg.py +83 -21
deepdoctection/utils/pdf_utils.py +119 -62
deepdoctection/utils/settings.py +24 -10
deepdoctection/utils/tqdm.py +10 -5
deepdoctection/utils/transform.py +182 -46
deepdoctection/utils/utils.py +61 -28
deepdoctection/utils/viz.py +150 -104
deepdoctection-0.43.dist-info/METADATA +376 -0
deepdoctection-0.43.dist-info/RECORD +149 -0
{deepdoctection-0.42.0.dist-info → deepdoctection-0.43.dist-info}/WHEEL +1 -1
deepdoctection/analyzer/_config.py +0 -146
deepdoctection-0.42.0.dist-info/METADATA +0 -431
deepdoctection-0.42.0.dist-info/RECORD +0 -148
{deepdoctection-0.42.0.dist-info → deepdoctection-0.43.dist-info}/licenses/LICENSE +0 -0
{deepdoctection-0.42.0.dist-info → deepdoctection-0.43.dist-info}/top_level.txt +0 -0

deepdoctection/extern/hfdetr.py CHANGED Viewed

@@ -16,14 +16,15 @@
 # limitations under the License.
 """
-HF Detr model for object detection.
+HF Detr and DeformableDetr models.
 """
 from __future__ import annotations
 import os
 from abc import ABC
 from pathlib import Path
-from typing import Literal, Mapping, Optional, Sequence, Union
+from typing import TYPE_CHECKING, Literal, Mapping, Optional, Sequence, Union
 from lazy_imports import try_import
@@ -39,13 +40,17 @@ with try_import() as pt_import_guard:
 with try_import() as tr_import_guard:
     from transformers import (  # pylint: disable=W0611
-        AutoFeatureExtractor,
-        DetrFeatureExtractor,
-        DetrImageProcessor,
+        DeformableDetrForObjectDetection,
+        DeformableDetrImageProcessorFast,
+        DetrImageProcessorFast,
         PretrainedConfig,
         TableTransformerForObjectDetection,
     )
+    if TYPE_CHECKING:
+        EligibleDetrModel = Union[TableTransformerForObjectDetection, DeformableDetrForObjectDetection]
+        DetrImageProcessor = Union[DetrImageProcessorFast, DeformableDetrImageProcessorFast]
 def _detr_post_processing(
     boxes: torch.Tensor, scores: torch.Tensor, labels: torch.Tensor, nms_thresh: float
@@ -55,24 +60,27 @@ def _detr_post_processing(
 def detr_predict_image(
     np_img: PixelValues,
-    predictor: TableTransformerForObjectDetection,
+    predictor: EligibleDetrModel,
     feature_extractor: DetrImageProcessor,
     device: torch.device,
     threshold: float,
     nms_threshold: float,
 ) -> list[DetectionResult]:
     """
-    Calling predictor. Before doing that, tensors must be transferred to the device where the model is loaded. After
-    running prediction it will present prediction in DetectionResult format-
-    :param np_img: image as numpy array
-    :param predictor: TableTransformerForObjectDetection
-    :param feature_extractor: feature extractor
-    :param device: device where the model is loaded
-    :param threshold: Will filter all predictions with confidence score less threshold
-    :param nms_threshold: Threshold to perform NMS on prediction outputs. (Note, that NMS does not belong to canonical
-                          Detr inference processing)
+    Calling predictor. Before, tensors must be transferred to the device where the model is loaded.
+    Args:
+        np_img: Image as `np.array`.
+        predictor: `TableTransformerForObjectDetection` instance.
+        feature_extractor: Feature extractor instance.
+        device: Device where the model is loaded.
+        threshold: Will filter all predictions with confidence score less threshold.
+        nms_threshold: Threshold to perform NMS on prediction outputs.
+                       Note:
+                           NMS does not belong to canonical Detr inference processing.
+    Returns:
+        List of `DetectionResult` after running prediction.
     """
     target_sizes = [np_img.shape[:2]]
     inputs = feature_extractor(images=np_img, return_tensors="pt")
@@ -101,10 +109,10 @@ class HFDetrDerivedDetectorMixin(ObjectDetector, ABC):
     def __init__(self, categories: Mapping[int, TypeOrStr], filter_categories: Optional[Sequence[TypeOrStr]] = None):
         """
-        :param categories: A dict with key (indices) and values (category names).
-        :param filter_categories: The model might return objects that are not supposed to be predicted and that should
-                                  be filtered. Pass a list of category names that must not be returned
+        Args:
+            categories: A dict with key (indices) and values (category names).
+            filter_categories: The model might return objects that are not supposed to be predicted and that should
+                               be filtered. Pass a list of category names that must not be returned.
         """
         self.categories = ModelCategories(init_categories=categories)
         if filter_categories:
@@ -112,10 +120,13 @@ class HFDetrDerivedDetectorMixin(ObjectDetector, ABC):
     def _map_category_names(self, detection_results: list[DetectionResult]) -> list[DetectionResult]:
         """
-        Populating category names to detection results. Will also filter categories
+        Populating category names to `DetectionResult`. Will also filter categories.
+        Args:
+            detection_results: List of `DetectionResult`s.
-        :param detection_results: list of detection results
-        :return: List of detection results with attribute class_name populated
+        Returns:
+            List of `DetectionResult`s with `class_name`.
         """
         filtered_detection_result: list[DetectionResult] = []
         shifted_categories = self.categories.shift_category_ids(shift_by=-1)
@@ -132,24 +143,39 @@ class HFDetrDerivedDetectorMixin(ObjectDetector, ABC):
     @staticmethod
     def get_name(path_weights: PathLikeOrStr) -> str:
-        """Returns the name of the model"""
+        """
+        Returns the name of the model.
+        Args:
+            path_weights: Path to the model weights.
+        Returns:
+            Model name string.
+        """
         return "Transformers_Tatr_" + "_".join(Path(path_weights).parts[-2:])
     def get_category_names(self) -> tuple[ObjectTypes, ...]:
+        """
+        Returns:
+            Tuple of `category_name`s.
+        """
         return self.categories.get_categories(as_dict=False)
 class HFDetrDerivedDetector(HFDetrDerivedDetectorMixin):
     """
-    Model wrapper for TableTransformerForObjectDetection that again is based on
-    https://github.com/microsoft/table-transformer .
+    Model wrapper for `TableTransformerForObjectDetection` that again is based on
+    <https://github.com/microsoft/table-transformer>.
     The wrapper can be used to load pre-trained models for table detection and table structure recognition. Running Detr
-    models trained from scratch on custom datasets is possible as well. Note, that this wrapper will load
-    `TableTransformerForObjectDetection` that is slightly different compared to `DetrForObjectDetection` that can be
-    found in the transformer library as well.
+    models trained from scratch on custom datasets is possible as well.
+    Note:
+        This wrapper will load `TableTransformerForObjectDetection` that is slightly different compared to
+        `DetrForObjectDetection` that can be found in the transformer library as well.
+    Example:
+        ```python
         config_path = ModelCatalog.
         get_full_path_configs("microsoft/table-transformer-structure-recognition/pytorch_model.bin")
         weights_path = ModelDownloadManager.
@@ -162,6 +188,7 @@ class HFDetrDerivedDetector(HFDetrDerivedDetectorMixin):
         detr_predictor = HFDetrDerivedDetector(config_path,weights_path,feature_extractor_config_path,categories)
         detection_result = detr_predictor.predict(bgr_image_np_array)
+        ```
     """
     def __init__(
@@ -175,13 +202,15 @@ class HFDetrDerivedDetector(HFDetrDerivedDetectorMixin):
     ):
         """
         Set up the predictor.
-        :param path_config_json: The path to the json config.
-        :param path_weights: The path to the model checkpoint.
-        :param path_feature_extractor_config_json: The path to the feature extractor config.
-        :param categories: A dict with key (indices) and values (category names).
-        :param device: "cpu" or "cuda". If not specified will auto select depending on what is available
-        :param filter_categories: The model might return objects that are not supposed to be predicted and that should
-                                  be filtered. Pass a list of category names that must not be returned
+        Args:
+            path_config_json: The path to the json config.
+            path_weights: The path to the model checkpoint.
+            path_feature_extractor_config_json: The path to the feature extractor config.
+            categories: A dict with key (indices) and values (category names).
+            device: "cpu" or "cuda". If not specified will auto select depending on what is available.
+            filter_categories: The model might return objects that are not supposed to be predicted and that should
+                              be filtered. Pass a list of category names that must not be returned.
         """
         super().__init__(categories, filter_categories)
@@ -195,12 +224,21 @@ class HFDetrDerivedDetector(HFDetrDerivedDetectorMixin):
         self.config = self.get_config(path_config_json)
         self.hf_detr_predictor = self.get_model(self.path_weights, self.config)
-        self.feature_extractor = self.get_pre_processor(self.path_feature_extractor_config)
+        self.feature_extractor = self.get_pre_processor(self.path_feature_extractor_config, self.config)
         self.device = get_torch_device(device)
         self.hf_detr_predictor.to(self.device)
     def predict(self, np_img: PixelValues) -> list[DetectionResult]:
+        """
+        Predicts objects in an image.
+        Args:
+            np_img: Image as `np.array`.
+        Returns:
+            List of `DetectionResult`.
+        """
         results = detr_predict_image(
             np_img,
             self.hf_detr_predictor,
@@ -212,36 +250,71 @@ class HFDetrDerivedDetector(HFDetrDerivedDetectorMixin):
         return self._map_category_names(results)
     @staticmethod
-    def get_model(path_weights: PathLikeOrStr, config: PretrainedConfig) -> TableTransformerForObjectDetection:
+    def get_model(path_weights: PathLikeOrStr, config: PretrainedConfig) -> EligibleDetrModel:
         """
-        Builds the Detr model
+        Builds the Detr model.
-        :param path_weights: The path to the model checkpoint.
-        :param config: `PretrainedConfig`
-        :return: TableTransformerForObjectDetection instance
+        Args:
+            path_weights: The path to the model checkpoint.
+            config: `PretrainedConfig` instance.
+        Returns:
+            `TableTransformerForObjectDetection` instance.
+        Raises:
+            ValueError: If model architecture is not eligible.
         """
-        return TableTransformerForObjectDetection.from_pretrained(
-            pretrained_model_name_or_path=os.fspath(path_weights), config=config
+        if "TableTransformerForObjectDetection" in config.architectures:
+            return TableTransformerForObjectDetection.from_pretrained(
+                pretrained_model_name_or_path=os.fspath(path_weights), config=config
+            )
+        if "DeformableDetrForObjectDetection" in config.architectures:
+            return DeformableDetrForObjectDetection.from_pretrained(
+                pretrained_model_name_or_path=os.fspath(path_weights), config=config
+            )
+        raise ValueError(
+            f"Model architecture {config.architectures} not eligible. Please use either "
+            "TableTransformerForObjectDetection or DeformableDetrForObjectDetection."
         )
     @staticmethod
-    def get_pre_processor(path_feature_extractor_config: PathLikeOrStr) -> DetrImageProcessor:
+    def get_pre_processor(path_feature_extractor_config: PathLikeOrStr, config: PretrainedConfig) -> DetrImageProcessor:
         """
-        Builds the feature extractor
+        Builds the feature extractor.
+        Args:
+            path_feature_extractor_config: Path to feature extractor config.
+            config: Model configuration.
-        :return: DetrFeatureExtractor
+        Returns:
+            `DetrImageProcessor` instance.
+        Raises:
+            ValueError: If model architecture is not eligible.
         """
-        return DetrImageProcessor.from_pretrained(
-            pretrained_model_name_or_path=os.fspath(path_feature_extractor_config)
+        if "TableTransformerForObjectDetection" in config.architectures:
+            return DetrImageProcessorFast.from_pretrained(
+                pretrained_model_name_or_path=os.fspath(path_feature_extractor_config),
+            )
+        if "DeformableDetrForObjectDetection" in config.architectures:
+            return DeformableDetrImageProcessorFast.from_pretrained(
+                pretrained_model_name_or_path=os.fspath(path_feature_extractor_config),
+            )
+        raise ValueError(
+            f"Model architecture {config.architectures} not eligible. Please use either "
+            "TableTransformerForObjectDetection or DeformableDetrForObjectDetection."
         )
     @staticmethod
     def get_config(path_config: PathLikeOrStr) -> PretrainedConfig:
         """
-        Builds the config
+        Builds the config.
+        Args:
+            path_config: The path to the config.
-        :param path_config: The path to the json config.
-        :return: PretrainedConfig instance
+        Returns:
+            `PretrainedConfig` instance.
         """
         config = PretrainedConfig.from_pretrained(pretrained_model_name_or_path=os.fspath(path_config))
         config.use_timm_backbone = True
@@ -270,17 +343,21 @@ class HFDetrDerivedDetector(HFDetrDerivedDetectorMixin):
         device: Optional[Union[Literal["cpu", "cuda"], torch.device]] = None,
     ) -> TableTransformerForObjectDetection:
         """
-        Get the wrapped model
+        Get the wrapped model.
+        Args:
+            path_config_json: The path to the json config.
+            path_weights: The path to the model checkpoint.
+            device: "cpu" or "cuda". If not specified will auto select depending on what is available.
-        :param path_config_json: The path to the json config.
-        :param path_weights: The path to the model checkpoint.
-        :param device: "cpu" or "cuda". If not specified will auto select depending on what is available
-        :return: TableTransformerForObjectDetection instance
+        Returns:
+            `TableTransformerForObjectDetection` instance.
         """
         config = HFDetrDerivedDetector.get_config(path_config_json)
         hf_detr_predictor = HFDetrDerivedDetector.get_model(path_weights, config)
         device = get_torch_device(device)
-        return hf_detr_predictor.to(device)
+        hf_detr_predictor.to(device)
+        return hf_detr_predictor
     def clear_model(self) -> None:
         self.hf_detr_predictor = None

deepdoctection 0.42.0__py3-none-any.whl → 0.43__py3-none-any.whl

Potentially problematic release.

deepdoctection 0.42.0__py3-none-any.whl → 0.43__py3-none-any.whl