deepdoctection 0.30-py3-none-any.whl → 0.32-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

Files changed (120)
  1. deepdoctection/__init__.py +38 -29
  2. deepdoctection/analyzer/dd.py +36 -29
  3. deepdoctection/configs/conf_dd_one.yaml +34 -31
  4. deepdoctection/dataflow/base.py +0 -19
  5. deepdoctection/dataflow/custom.py +4 -3
  6. deepdoctection/dataflow/custom_serialize.py +14 -5
  7. deepdoctection/dataflow/parallel_map.py +12 -11
  8. deepdoctection/dataflow/serialize.py +5 -4
  9. deepdoctection/datapoint/annotation.py +35 -13
  10. deepdoctection/datapoint/box.py +3 -5
  11. deepdoctection/datapoint/convert.py +3 -1
  12. deepdoctection/datapoint/image.py +79 -36
  13. deepdoctection/datapoint/view.py +152 -49
  14. deepdoctection/datasets/__init__.py +1 -4
  15. deepdoctection/datasets/adapter.py +6 -3
  16. deepdoctection/datasets/base.py +86 -11
  17. deepdoctection/datasets/dataflow_builder.py +1 -1
  18. deepdoctection/datasets/info.py +4 -4
  19. deepdoctection/datasets/instances/doclaynet.py +3 -2
  20. deepdoctection/datasets/instances/fintabnet.py +2 -1
  21. deepdoctection/datasets/instances/funsd.py +2 -1
  22. deepdoctection/datasets/instances/iiitar13k.py +5 -2
  23. deepdoctection/datasets/instances/layouttest.py +4 -8
  24. deepdoctection/datasets/instances/publaynet.py +2 -2
  25. deepdoctection/datasets/instances/pubtables1m.py +6 -3
  26. deepdoctection/datasets/instances/pubtabnet.py +2 -1
  27. deepdoctection/datasets/instances/rvlcdip.py +2 -1
  28. deepdoctection/datasets/instances/xfund.py +2 -1
  29. deepdoctection/eval/__init__.py +1 -4
  30. deepdoctection/eval/accmetric.py +1 -1
  31. deepdoctection/eval/base.py +5 -4
  32. deepdoctection/eval/cocometric.py +2 -1
  33. deepdoctection/eval/eval.py +19 -15
  34. deepdoctection/eval/tedsmetric.py +14 -11
  35. deepdoctection/eval/tp_eval_callback.py +14 -7
  36. deepdoctection/extern/__init__.py +2 -7
  37. deepdoctection/extern/base.py +39 -13
  38. deepdoctection/extern/d2detect.py +182 -90
  39. deepdoctection/extern/deskew.py +36 -9
  40. deepdoctection/extern/doctrocr.py +265 -83
  41. deepdoctection/extern/fastlang.py +49 -9
  42. deepdoctection/extern/hfdetr.py +106 -55
  43. deepdoctection/extern/hflayoutlm.py +441 -122
  44. deepdoctection/extern/hflm.py +225 -0
  45. deepdoctection/extern/model.py +56 -47
  46. deepdoctection/extern/pdftext.py +10 -5
  47. deepdoctection/extern/pt/__init__.py +1 -3
  48. deepdoctection/extern/pt/nms.py +6 -2
  49. deepdoctection/extern/pt/ptutils.py +27 -18
  50. deepdoctection/extern/tessocr.py +134 -22
  51. deepdoctection/extern/texocr.py +6 -2
  52. deepdoctection/extern/tp/tfutils.py +43 -9
  53. deepdoctection/extern/tp/tpcompat.py +14 -11
  54. deepdoctection/extern/tp/tpfrcnn/__init__.py +20 -0
  55. deepdoctection/extern/tp/tpfrcnn/common.py +7 -3
  56. deepdoctection/extern/tp/tpfrcnn/config/__init__.py +20 -0
  57. deepdoctection/extern/tp/tpfrcnn/config/config.py +9 -6
  58. deepdoctection/extern/tp/tpfrcnn/modeling/__init__.py +20 -0
  59. deepdoctection/extern/tp/tpfrcnn/modeling/backbone.py +17 -7
  60. deepdoctection/extern/tp/tpfrcnn/modeling/generalized_rcnn.py +12 -6
  61. deepdoctection/extern/tp/tpfrcnn/modeling/model_box.py +9 -4
  62. deepdoctection/extern/tp/tpfrcnn/modeling/model_cascade.py +8 -5
  63. deepdoctection/extern/tp/tpfrcnn/modeling/model_fpn.py +16 -11
  64. deepdoctection/extern/tp/tpfrcnn/modeling/model_frcnn.py +17 -10
  65. deepdoctection/extern/tp/tpfrcnn/modeling/model_mrcnn.py +14 -8
  66. deepdoctection/extern/tp/tpfrcnn/modeling/model_rpn.py +15 -10
  67. deepdoctection/extern/tp/tpfrcnn/predict.py +9 -4
  68. deepdoctection/extern/tp/tpfrcnn/preproc.py +8 -9
  69. deepdoctection/extern/tp/tpfrcnn/utils/__init__.py +20 -0
  70. deepdoctection/extern/tp/tpfrcnn/utils/box_ops.py +10 -2
  71. deepdoctection/extern/tpdetect.py +54 -30
  72. deepdoctection/mapper/__init__.py +3 -8
  73. deepdoctection/mapper/d2struct.py +9 -7
  74. deepdoctection/mapper/hfstruct.py +7 -2
  75. deepdoctection/mapper/laylmstruct.py +164 -21
  76. deepdoctection/mapper/maputils.py +16 -3
  77. deepdoctection/mapper/misc.py +6 -3
  78. deepdoctection/mapper/prodigystruct.py +1 -1
  79. deepdoctection/mapper/pubstruct.py +10 -10
  80. deepdoctection/mapper/tpstruct.py +3 -3
  81. deepdoctection/pipe/__init__.py +1 -1
  82. deepdoctection/pipe/anngen.py +35 -8
  83. deepdoctection/pipe/base.py +53 -19
  84. deepdoctection/pipe/common.py +23 -13
  85. deepdoctection/pipe/concurrency.py +2 -1
  86. deepdoctection/pipe/doctectionpipe.py +2 -2
  87. deepdoctection/pipe/language.py +3 -2
  88. deepdoctection/pipe/layout.py +6 -3
  89. deepdoctection/pipe/lm.py +34 -66
  90. deepdoctection/pipe/order.py +142 -35
  91. deepdoctection/pipe/refine.py +26 -24
  92. deepdoctection/pipe/segment.py +21 -16
  93. deepdoctection/pipe/{cell.py → sub_layout.py} +30 -9
  94. deepdoctection/pipe/text.py +14 -8
  95. deepdoctection/pipe/transform.py +16 -9
  96. deepdoctection/train/__init__.py +6 -12
  97. deepdoctection/train/d2_frcnn_train.py +36 -28
  98. deepdoctection/train/hf_detr_train.py +26 -17
  99. deepdoctection/train/hf_layoutlm_train.py +133 -111
  100. deepdoctection/train/tp_frcnn_train.py +21 -19
  101. deepdoctection/utils/__init__.py +3 -0
  102. deepdoctection/utils/concurrency.py +1 -1
  103. deepdoctection/utils/context.py +2 -2
  104. deepdoctection/utils/env_info.py +41 -84
  105. deepdoctection/utils/error.py +84 -0
  106. deepdoctection/utils/file_utils.py +4 -15
  107. deepdoctection/utils/fs.py +7 -7
  108. deepdoctection/utils/logger.py +1 -0
  109. deepdoctection/utils/mocks.py +93 -0
  110. deepdoctection/utils/pdf_utils.py +5 -4
  111. deepdoctection/utils/settings.py +6 -1
  112. deepdoctection/utils/transform.py +1 -1
  113. deepdoctection/utils/utils.py +0 -6
  114. deepdoctection/utils/viz.py +48 -5
  115. {deepdoctection-0.30.dist-info → deepdoctection-0.32.dist-info}/METADATA +57 -73
  116. deepdoctection-0.32.dist-info/RECORD +146 -0
  117. {deepdoctection-0.30.dist-info → deepdoctection-0.32.dist-info}/WHEEL +1 -1
  118. deepdoctection-0.30.dist-info/RECORD +0 -143
  119. {deepdoctection-0.30.dist-info → deepdoctection-0.32.dist-info}/LICENSE +0 -0
  120. {deepdoctection-0.30.dist-info → deepdoctection-0.32.dist-info}/top_level.txt +0 -0
deepdoctection/extern/d2detect.py

@@ -18,42 +18,39 @@
 """
 D2 GeneralizedRCNN model as predictor for deepdoctection pipeline
 """
+from __future__ import annotations
+
 import io
+from abc import ABC
 from copy import copy
 from pathlib import Path
-from typing import Any, Dict, List, Literal, Mapping, Optional, Sequence
+from typing import Any, Dict, List, Literal, Mapping, Optional, Sequence, Union

 import numpy as np
+from lazy_imports import try_import

 from ..utils.detection_types import ImageType, Requirement
-from ..utils.file_utils import (
-    detectron2_available,
-    get_detectron2_requirement,
-    get_pytorch_requirement,
-    pytorch_available,
-)
-from ..utils.metacfg import set_config_by_yaml
+from ..utils.file_utils import get_detectron2_requirement, get_pytorch_requirement
+from ..utils.metacfg import AttrDict, set_config_by_yaml
 from ..utils.settings import ObjectTypes, TypeOrStr, get_type
 from ..utils.transform import InferenceResize, ResizeTransform
 from .base import DetectionResult, ObjectDetector, PredictorBase
 from .pt.nms import batched_nms
-from .pt.ptutils import set_torch_auto_device
+from .pt.ptutils import get_torch_device

-if pytorch_available():
+with try_import() as pt_import_guard:
     import torch
     import torch.cuda
     from torch import nn  # pylint: disable=W0611

-if detectron2_available():
+with try_import() as d2_import_guard:
     from detectron2.checkpoint import DetectionCheckpointer
     from detectron2.config import CfgNode, get_cfg  # pylint: disable=W0611
     from detectron2.modeling import GeneralizedRCNN, build_model  # pylint: disable=W0611
     from detectron2.structures import Instances  # pylint: disable=W0611


-def _d2_post_processing(
-    predictions: Dict[str, "Instances"], nms_thresh_class_agnostic: float
-) -> Dict[str, "Instances"]:
+def _d2_post_processing(predictions: Dict[str, Instances], nms_thresh_class_agnostic: float) -> Dict[str, Instances]:
     """
     D2 postprocessing steps, so that detection outputs are aligned with outputs of other packages (e.g. Tensorpack).
     Apply a class agnostic NMS.
@@ -71,7 +68,7 @@ def _d2_post_processing(

 def d2_predict_image(
     np_img: ImageType,
-    predictor: "nn.Module",
+    predictor: nn.Module,
     resizer: InferenceResize,
     nms_thresh_class_agnostic: float,
 ) -> List[DetectionResult]:
@@ -106,7 +103,7 @@ def d2_predict_image(


 def d2_jit_predict_image(
-    np_img: ImageType, d2_predictor: "nn.Module", resizer: InferenceResize, nms_thresh_class_agnostic: float
+    np_img: ImageType, d2_predictor: nn.Module, resizer: InferenceResize, nms_thresh_class_agnostic: float
 ) -> List[DetectionResult]:
     """
     Run detection on an image using torchscript. It will also handle the preprocessing internally which
@@ -144,7 +141,72 @@ def d2_jit_predict_image(
     return detect_result_list


-class D2FrcnnDetector(ObjectDetector):
+class D2FrcnnDetectorMixin(ObjectDetector, ABC):
+    """
+    Base class for D2 Faster-RCNN implementation. This class only implements the basic wrapper functions
+    """
+
+    def __init__(
+        self,
+        categories: Mapping[str, TypeOrStr],
+        filter_categories: Optional[Sequence[TypeOrStr]] = None,
+    ):
+        """
+        :param categories: A dict with key (indices) and values (category names). Index 0 must be reserved for a
+                           dummy 'BG' category. Note, that this convention is different from the builtin D2 framework,
+                           where models in the model zoo are trained with 'BG' class having the highest index.
+        :param filter_categories: The model might return objects that are not supposed to be predicted and that should
+                                  be filtered. Pass a list of category names that must not be returned
+        """
+
+        if filter_categories:
+            filter_categories = [get_type(cat) for cat in filter_categories]
+        self.filter_categories = filter_categories
+        self._categories_d2 = self._map_to_d2_categories(copy(categories))
+        self.categories = {idx: get_type(cat) for idx, cat in categories.items()}
+
+    def _map_category_names(self, detection_results: List[DetectionResult]) -> List[DetectionResult]:
+        """
+        Populating category names to detection results
+
+        :param detection_results: list of detection results. Will also filter categories
+        :return: List of detection results with attribute class_name populated
+        """
+        filtered_detection_result: List[DetectionResult] = []
+        for result in detection_results:
+            result.class_name = self._categories_d2[str(result.class_id)]
+            if isinstance(result.class_id, int):
+                result.class_id += 1
+            if self.filter_categories:
+                if result.class_name not in self.filter_categories:
+                    filtered_detection_result.append(result)
+            else:
+                filtered_detection_result.append(result)
+        return filtered_detection_result
+
+    @classmethod
+    def _map_to_d2_categories(cls, categories: Mapping[str, TypeOrStr]) -> Dict[str, ObjectTypes]:
+        return {str(int(k) - 1): get_type(v) for k, v in categories.items()}
+
+    def possible_categories(self) -> List[ObjectTypes]:
+        return list(self.categories.values())
+
+    @staticmethod
+    def get_inference_resizer(min_size_test: int, max_size_test: int) -> InferenceResize:
+        """Returns the resizer for the inference
+
+        :param min_size_test: minimum size of the resized image
+        :param max_size_test: maximum size of the resized image
+        """
+        return InferenceResize(min_size_test, max_size_test)
+
+    @staticmethod
+    def get_name(path_weights: str, architecture: str) -> str:
+        """Returns the name of the model"""
+        return f"detectron2_{architecture}" + "_".join(Path(path_weights).parts[-2:])
+
+
+class D2FrcnnDetector(D2FrcnnDetectorMixin):
     """
     D2 Faster-RCNN implementation with all the available backbones, normalizations throughout the model
     as well as FPN, optional Cascade-RCNN and many more.
@@ -155,6 +217,7 @@ class D2FrcnnDetector(ObjectDetector):
     the standard D2 output that takes into account of the situation that detected objects are disjoint. For more infos
     on this topic, see <https://github.com/facebookresearch/detectron2/issues/978> .

+    ```python
     config_path = ModelCatalog.get_full_path_configs("dd/d2/item/CASCADE_RCNN_R_50_FPN_GN.yaml")
     weights_path = ModelDownloadManager.maybe_download_weights_and_configs("item/d2_model-800000-layout.pkl")
     categories = ModelCatalog.get_profile("item/d2_model-800000-layout.pkl").categories
@@ -162,6 +225,7 @@ class D2FrcnnDetector(ObjectDetector):
     d2_predictor = D2FrcnnDetector(config_path,weights_path,categories,device="cpu")

     detection_results = d2_predictor.predict(bgr_image_np_array)
+    ```
     """

     def __init__(
@@ -170,7 +234,7 @@ class D2FrcnnDetector(ObjectDetector):
         path_weights: str,
         categories: Mapping[str, TypeOrStr],
         config_overwrite: Optional[List[str]] = None,
-        device: Optional[Literal["cpu", "cuda"]] = None,
+        device: Optional[Union[Literal["cpu", "cuda"], torch.device]] = None,
         filter_categories: Optional[Sequence[TypeOrStr]] = None,
     ):
         """
@@ -191,47 +255,38 @@ class D2FrcnnDetector(ObjectDetector):
         :param filter_categories: The model might return objects that are not supposed to be predicted and that should
                                   be filtered. Pass a list of category names that must not be returned
         """
+        super().__init__(categories, filter_categories)

-        self.name = "_".join(Path(path_weights).parts[-3:])
-        self._categories_d2 = self._map_to_d2_categories(copy(categories))
         self.path_weights = path_weights
-        d2_conf_list = ["MODEL.WEIGHTS", path_weights]
-        config_overwrite = config_overwrite if config_overwrite else []
-        for conf in config_overwrite:
-            key, val = conf.split("=", maxsplit=1)
-            d2_conf_list.extend([key, val])
-
         self.path_yaml = path_yaml
-        self.categories = copy(categories)  # type: ignore
+
+        config_overwrite = config_overwrite if config_overwrite else []
         self.config_overwrite = config_overwrite
-        if device is not None:
-            self.device = device
-        else:
-            self.device = set_torch_auto_device()
-        if filter_categories:
-            filter_categories = [get_type(cat) for cat in filter_categories]
-        self.filter_categories = filter_categories
-        self.cfg = self._set_config(path_yaml, d2_conf_list, device)
-        self.d2_predictor = D2FrcnnDetector.set_model(self.cfg)
-        self.resizer = InferenceResize(self.cfg.INPUT.MIN_SIZE_TEST, self.cfg.INPUT.MAX_SIZE_TEST)
-        self._instantiate_d2_predictor()
+        self.device = get_torch_device(device)
+
+        d2_conf_list = self._get_d2_config_list(path_weights, config_overwrite)
+        self.cfg = self._set_config(path_yaml, d2_conf_list, self.device)
+
+        self.name = self.get_name(path_weights, self.cfg.MODEL.META_ARCHITECTURE)
+        self.model_id = self.get_model_id()
+
+        self.d2_predictor = self._set_model(self.cfg)
+        self._instantiate_d2_predictor(self.d2_predictor, path_weights)
+        self.resizer = self.get_inference_resizer(self.cfg.INPUT.MIN_SIZE_TEST, self.cfg.INPUT.MAX_SIZE_TEST)

     @staticmethod
-    def _set_config(
-        path_yaml: str, d2_conf_list: List[str], device: Optional[Literal["cpu", "cuda"]] = None
-    ) -> "CfgNode":
+    def _set_config(path_yaml: str, d2_conf_list: List[str], device: torch.device) -> CfgNode:
         cfg = get_cfg()
         # additional attribute with default value, so that the true value can be loaded from the configs
         cfg.NMS_THRESH_CLASS_AGNOSTIC = 0.1
         cfg.merge_from_file(path_yaml)
         cfg.merge_from_list(d2_conf_list)
-        if not torch.cuda.is_available() or device == "cpu":
-            cfg.MODEL.DEVICE = "cpu"
+        cfg.MODEL.DEVICE = str(device)
         cfg.freeze()
         return cfg

     @staticmethod
-    def set_model(config: "CfgNode") -> "GeneralizedRCNN":
+    def _set_model(config: CfgNode) -> GeneralizedRCNN:
         """
         Build the D2 model. It uses the available builtin tools of D2

@@ -240,9 +295,10 @@ class D2FrcnnDetector(ObjectDetector):
         """
         return build_model(config.clone()).eval()

-    def _instantiate_d2_predictor(self) -> None:
-        checkpointer = DetectionCheckpointer(self.d2_predictor)
-        checkpointer.load(self.cfg.MODEL.WEIGHTS)
+    @staticmethod
+    def _instantiate_d2_predictor(wrapped_model: GeneralizedRCNN, path_weights: str) -> None:
+        checkpointer = DetectionCheckpointer(wrapped_model)
+        checkpointer.load(path_weights)

     def predict(self, np_img: ImageType) -> List[DetectionResult]:
         """
@@ -259,33 +315,10 @@ class D2FrcnnDetector(ObjectDetector):
         )
         return self._map_category_names(detection_results)

-    def _map_category_names(self, detection_results: List[DetectionResult]) -> List[DetectionResult]:
-        """
-        Populating category names to detection results
-
-        :param detection_results: list of detection results. Will also filter categories
-        :return: List of detection results with attribute class_name populated
-        """
-        filtered_detection_result: List[DetectionResult] = []
-        for result in detection_results:
-            result.class_name = self._categories_d2[str(result.class_id)]
-            if isinstance(result.class_id, int):
-                result.class_id += 1
-            if self.filter_categories:
-                if result.class_name not in self.filter_categories:
-                    filtered_detection_result.append(result)
-            else:
-                filtered_detection_result.append(result)
-        return filtered_detection_result
-
     @classmethod
     def get_requirements(cls) -> List[Requirement]:
         return [get_pytorch_requirement(), get_detectron2_requirement()]

-    @classmethod
-    def _map_to_d2_categories(cls, categories: Mapping[str, TypeOrStr]) -> Dict[str, ObjectTypes]:
-        return {str(int(k) - 1): get_type(v) for k, v in categories.items()}
-
     def clone(self) -> PredictorBase:
         return self.__class__(
             self.path_yaml,
@@ -296,11 +329,53 @@ class D2FrcnnDetector(ObjectDetector):
             self.filter_categories,
         )

-    def possible_categories(self) -> List[ObjectTypes]:
-        return list(self.categories.values())
+    @staticmethod
+    def get_wrapped_model(
+        path_yaml: str,
+        path_weights: str,
+        config_overwrite: List[str],
+        device: Optional[Union[Literal["cpu", "cuda"], torch.device]] = None,
+    ) -> GeneralizedRCNN:
+        """
+        Get the wrapped model. Useful if one do not want to build the wrapper but only needs the instantiated model.
+
+        Example:
+            ```python
+
+            path_yaml = ModelCatalog.get_full_path_configs("dd/d2/item/CASCADE_RCNN_R_50_FPN_GN.yaml")
+            weights_path = ModelDownloadManager.maybe_download_weights_and_configs("item/d2_model-800000-layout.pkl")
+            model = D2FrcnnDetector.get_wrapped_model(path_yaml,weights_path,["OUTPUT.FRCNN_NMS_THRESH=0.3",
+                                                                              "OUTPUT.RESULT_SCORE_THRESH=0.6"],
+                                                      "cpu")
+            detect_result_list = d2_predict_image(np_img,model,InferenceResize(800,1333),0.3)
+            ```
+        :param path_yaml: The path to the yaml config. If the model is built using several config files, always use
+                          the highest level .yaml file.
+        :param path_weights: The path to the model checkpoint.
+        :param config_overwrite: Overwrite some hyperparameters defined by the yaml file with some new values. E.g.
+                                 ["OUTPUT.FRCNN_NMS_THRESH=0.3","OUTPUT.RESULT_SCORE_THRESH=0.6"].
+        :param device: "cpu" or "cuda". If not specified will auto select depending on what is available
+        :return: Detectron2 GeneralizedRCNN model
+        """
+
+        device = get_torch_device(device)
+        d2_conf_list = D2FrcnnDetector._get_d2_config_list(path_weights, config_overwrite)
+        cfg = D2FrcnnDetector._set_config(path_yaml, d2_conf_list, device)
+        model = D2FrcnnDetector._set_model(cfg)
+        D2FrcnnDetector._instantiate_d2_predictor(model, path_weights)
+        return model
+
+    @staticmethod
+    def _get_d2_config_list(path_weights: str, config_overwrite: List[str]) -> List[str]:
+        d2_conf_list = ["MODEL.WEIGHTS", path_weights]
+        config_overwrite = config_overwrite if config_overwrite else []
+        for conf in config_overwrite:
+            key, val = conf.split("=", maxsplit=1)
+            d2_conf_list.extend([key, val])
+        return d2_conf_list


-class D2FrcnnTracingDetector(ObjectDetector):
+class D2FrcnnTracingDetector(D2FrcnnDetectorMixin):
     """
     D2 Faster-RCNN exported torchscript model. Using this predictor has the advantage that Detectron2 does not have to
     be installed. The associated config setting only contains parameters that are involved in pre-and post-processing.
@@ -312,6 +387,8 @@ class D2FrcnnTracingDetector(ObjectDetector):
     the standard D2 output that takes into account of the situation that detected objects are disjoint. For more infos
     on this topic, see <https://github.com/facebookresearch/detectron2/issues/978> .

+    Example:
+        ```python
     config_path = ModelCatalog.get_full_path_configs("dd/d2/item/CASCADE_RCNN_R_50_FPN_GN.yaml")
     weights_path = ModelDownloadManager.maybe_download_weights_and_configs("item/d2_model-800000-layout.pkl")
     categories = ModelCatalog.get_profile("item/d2_model-800000-layout.pkl").categories
@@ -319,6 +396,7 @@ class D2FrcnnTracingDetector(ObjectDetector):
     d2_predictor = D2FrcnnDetector(config_path,weights_path,categories)

     detection_results = d2_predictor.predict(bgr_image_np_array)
+        ```
     """

     def __init__(
@@ -343,27 +421,28 @@ class D2FrcnnTracingDetector(ObjectDetector):
         :param filter_categories: The model might return objects that are not supposed to be predicted and that should
                                   be filtered. Pass a list of category names that must not be returned
         """
-        self.name = "_".join(Path(path_weights).parts[-2:])
-        self._categories_d2 = self._map_to_d2_categories(copy(categories))
+
+        super().__init__(categories, filter_categories)
+
         self.path_weights = path_weights
         self.path_yaml = path_yaml
-        self.categories = copy(categories)  # type: ignore
-        self.config_overwrite = config_overwrite
-        if filter_categories:
-            filter_categories = [get_type(cat) for cat in filter_categories]
-        self.filter_categories = filter_categories
-        self.cfg = set_config_by_yaml(self.path_yaml)
+
+        self.config_overwrite = copy(config_overwrite)
+        self.cfg = self._set_config(self.path_yaml, self.path_weights, self.config_overwrite)
+
+        self.name = self.get_name(path_weights, self.cfg.MODEL.META_ARCHITECTURE)
+        self.model_id = self.get_model_id()
+
+        self.resizer = self.get_inference_resizer(self.cfg.INPUT.MIN_SIZE_TEST, self.cfg.INPUT.MAX_SIZE_TEST)
+        self.d2_predictor = self.get_wrapped_model(self.path_weights)
+
+    @staticmethod
+    def _set_config(path_yaml: str, path_weights: str, config_overwrite: Optional[List[str]]) -> AttrDict:
+        cfg = set_config_by_yaml(path_yaml)
         config_overwrite = config_overwrite if config_overwrite else []
         config_overwrite.extend([f"MODEL.WEIGHTS={path_weights}"])
-        self.cfg.update_args(config_overwrite)
-        self.resizer = InferenceResize(self.cfg.INPUT.MIN_SIZE_TEST, self.cfg.INPUT.MAX_SIZE_TEST)
-        self.d2_predictor = self._instantiate_d2_predictor()
-
-    def _instantiate_d2_predictor(self) -> Any:
-        with open(self.path_weights, "rb") as file:
-            buffer = io.BytesIO(file.read())
-        # Load all tensors to the original device
-        return torch.jit.load(buffer)
+        cfg.update_args(config_overwrite)
+        return cfg

     def predict(self, np_img: ImageType) -> List[DetectionResult]:
         """
@@ -418,3 +497,16 @@ class D2FrcnnTracingDetector(ObjectDetector):

     def possible_categories(self) -> List[ObjectTypes]:
         return list(self.categories.values())
+
+    @staticmethod
+    def get_wrapped_model(path_weights: str) -> Any:
+        """
+        Get the wrapped model. Useful if one do not want to build the wrapper but only needs the instantiated model.
+
+        :param path_weights:
+        :return:
+        """
+        with open(path_weights, "rb") as file:
+            buffer = io.BytesIO(file.read())
+        # Load all tensors to the original device
+        return torch.jit.load(buffer)
deepdoctection/extern/deskew.py

@@ -21,13 +21,16 @@ jdeskew estimator and rotator to deskew images: <https://github.com/phamquiluan/

 from typing import List

+from lazy_imports import try_import
+
 from ..utils.detection_types import ImageType, Requirement
-from ..utils.file_utils import get_jdeskew_requirement, jdeskew_available
-from .base import ImageTransformer
+from ..utils.file_utils import get_jdeskew_requirement
+from ..utils.settings import PageType
+from ..utils.viz import viz_handler
+from .base import DetectionResult, ImageTransformer

-if jdeskew_available():
+with try_import() as import_guard:
     from jdeskew.estimator import get_angle
-    from jdeskew.utility import rotate


 class Jdeskewer(ImageTransformer):
@@ -37,19 +40,43 @@ class Jdeskewer(ImageTransformer):
     """

     def __init__(self, min_angle_rotation: float = 2.0):
-        self.name = "jdeskew_transform"
+        self.name = "jdeskewer"
+        self.model_id = self.get_model_id()
         self.min_angle_rotation = min_angle_rotation

-    def transform(self, np_img: ImageType) -> ImageType:
-        angle = get_angle(np_img)
+    def transform(self, np_img: ImageType, specification: DetectionResult) -> ImageType:
+        """
+        Rotation of the image according to the angle determined by the jdeskew estimator.
+
+        **Example**:
+            jdeskew_predictor = Jdeskewer()
+            detection_result = jdeskew_predictor.predict(np_image)
+            jdeskew_predictor.transform(np_image, DetectionResult(angle=5.0))

-        if angle > self.min_angle_rotation:
-            return rotate(np_img, angle)
+        :param np_img: image as numpy array
+        :param specification: DetectionResult with angle value
+        :return: image rotated by the angle
+        """
+        if abs(specification.angle) > self.min_angle_rotation:  # type: ignore
+            return viz_handler.rotate_image(np_img, specification.angle)  # type: ignore
         return np_img

+    def predict(self, np_img: ImageType) -> DetectionResult:
+        """
+        Predict the angle of the image to deskew it.
+
+        :param np_img: image as numpy array
+        :return: DetectionResult with angle value
+        """
+        return DetectionResult(angle=round(float(get_angle(np_img)), 4))
+
     @classmethod
     def get_requirements(cls) -> List[Requirement]:
         """
         Get a list of requirements for running the detector
         """
         return [get_jdeskew_requirement()]
+
+    @staticmethod
+    def possible_category() -> PageType:
+        return PageType.angle