PyPI - deepdoctection - Versions diffs - 0.42.1__py3-none-any.whl → 0.43__py3-none-any.whl - Mend

deepdoctection 0.42.1__py3-none-any.whl → 0.43__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of deepdoctection might be problematic. Click here for more details.

Files changed (124) hide show

deepdoctection/__init__.py +2 -1
deepdoctection/analyzer/__init__.py +2 -1
deepdoctection/analyzer/config.py +904 -0
deepdoctection/analyzer/dd.py +36 -62
deepdoctection/analyzer/factory.py +311 -141
deepdoctection/configs/conf_dd_one.yaml +100 -44
deepdoctection/configs/profiles.jsonl +32 -0
deepdoctection/dataflow/__init__.py +9 -6
deepdoctection/dataflow/base.py +33 -15
deepdoctection/dataflow/common.py +96 -75
deepdoctection/dataflow/custom.py +36 -29
deepdoctection/dataflow/custom_serialize.py +135 -91
deepdoctection/dataflow/parallel_map.py +33 -31
deepdoctection/dataflow/serialize.py +15 -10
deepdoctection/dataflow/stats.py +41 -28
deepdoctection/datapoint/__init__.py +4 -6
deepdoctection/datapoint/annotation.py +104 -66
deepdoctection/datapoint/box.py +190 -130
deepdoctection/datapoint/convert.py +66 -39
deepdoctection/datapoint/image.py +151 -95
deepdoctection/datapoint/view.py +383 -236
deepdoctection/datasets/__init__.py +2 -6
deepdoctection/datasets/adapter.py +11 -11
deepdoctection/datasets/base.py +118 -81
deepdoctection/datasets/dataflow_builder.py +18 -12
deepdoctection/datasets/info.py +76 -57
deepdoctection/datasets/instances/__init__.py +6 -2
deepdoctection/datasets/instances/doclaynet.py +17 -14
deepdoctection/datasets/instances/fintabnet.py +16 -22
deepdoctection/datasets/instances/funsd.py +11 -6
deepdoctection/datasets/instances/iiitar13k.py +9 -9
deepdoctection/datasets/instances/layouttest.py +9 -9
deepdoctection/datasets/instances/publaynet.py +9 -9
deepdoctection/datasets/instances/pubtables1m.py +13 -13
deepdoctection/datasets/instances/pubtabnet.py +13 -15
deepdoctection/datasets/instances/rvlcdip.py +8 -8
deepdoctection/datasets/instances/xfund.py +11 -9
deepdoctection/datasets/registry.py +18 -11
deepdoctection/datasets/save.py +12 -11
deepdoctection/eval/__init__.py +3 -2
deepdoctection/eval/accmetric.py +72 -52
deepdoctection/eval/base.py +29 -10
deepdoctection/eval/cocometric.py +14 -12
deepdoctection/eval/eval.py +56 -41
deepdoctection/eval/registry.py +6 -3
deepdoctection/eval/tedsmetric.py +24 -9
deepdoctection/eval/tp_eval_callback.py +13 -12
deepdoctection/extern/__init__.py +1 -1
deepdoctection/extern/base.py +176 -97
deepdoctection/extern/d2detect.py +127 -92
deepdoctection/extern/deskew.py +19 -10
deepdoctection/extern/doctrocr.py +157 -106
deepdoctection/extern/fastlang.py +25 -17
deepdoctection/extern/hfdetr.py +137 -60
deepdoctection/extern/hflayoutlm.py +329 -248
deepdoctection/extern/hflm.py +67 -33
deepdoctection/extern/model.py +108 -762
deepdoctection/extern/pdftext.py +37 -12
deepdoctection/extern/pt/nms.py +15 -1
deepdoctection/extern/pt/ptutils.py +13 -9
deepdoctection/extern/tessocr.py +87 -54
deepdoctection/extern/texocr.py +29 -14
deepdoctection/extern/tp/tfutils.py +36 -8
deepdoctection/extern/tp/tpcompat.py +54 -16
deepdoctection/extern/tp/tpfrcnn/config/config.py +20 -4
deepdoctection/extern/tpdetect.py +4 -2
deepdoctection/mapper/__init__.py +1 -1
deepdoctection/mapper/cats.py +117 -76
deepdoctection/mapper/cocostruct.py +35 -17
deepdoctection/mapper/d2struct.py +56 -29
deepdoctection/mapper/hfstruct.py +32 -19
deepdoctection/mapper/laylmstruct.py +221 -185
deepdoctection/mapper/maputils.py +71 -35
deepdoctection/mapper/match.py +76 -62
deepdoctection/mapper/misc.py +68 -44
deepdoctection/mapper/pascalstruct.py +13 -12
deepdoctection/mapper/prodigystruct.py +33 -19
deepdoctection/mapper/pubstruct.py +42 -32
deepdoctection/mapper/tpstruct.py +39 -19
deepdoctection/mapper/xfundstruct.py +20 -13
deepdoctection/pipe/__init__.py +1 -2
deepdoctection/pipe/anngen.py +104 -62
deepdoctection/pipe/base.py +226 -107
deepdoctection/pipe/common.py +206 -123
deepdoctection/pipe/concurrency.py +74 -47
deepdoctection/pipe/doctectionpipe.py +108 -47
deepdoctection/pipe/language.py +41 -24
deepdoctection/pipe/layout.py +45 -18
deepdoctection/pipe/lm.py +146 -78
deepdoctection/pipe/order.py +196 -113
deepdoctection/pipe/refine.py +111 -63
deepdoctection/pipe/registry.py +1 -1
deepdoctection/pipe/segment.py +213 -142
deepdoctection/pipe/sub_layout.py +76 -46
deepdoctection/pipe/text.py +52 -33
deepdoctection/pipe/transform.py +8 -6
deepdoctection/train/d2_frcnn_train.py +87 -69
deepdoctection/train/hf_detr_train.py +72 -40
deepdoctection/train/hf_layoutlm_train.py +85 -46
deepdoctection/train/tp_frcnn_train.py +56 -28
deepdoctection/utils/concurrency.py +59 -16
deepdoctection/utils/context.py +40 -19
deepdoctection/utils/develop.py +25 -17
deepdoctection/utils/env_info.py +85 -36
deepdoctection/utils/error.py +16 -10
deepdoctection/utils/file_utils.py +246 -62
deepdoctection/utils/fs.py +162 -43
deepdoctection/utils/identifier.py +29 -16
deepdoctection/utils/logger.py +49 -32
deepdoctection/utils/metacfg.py +83 -21
deepdoctection/utils/pdf_utils.py +119 -62
deepdoctection/utils/settings.py +24 -10
deepdoctection/utils/tqdm.py +10 -5
deepdoctection/utils/transform.py +182 -46
deepdoctection/utils/utils.py +61 -28
deepdoctection/utils/viz.py +150 -104
deepdoctection-0.43.dist-info/METADATA +376 -0
deepdoctection-0.43.dist-info/RECORD +149 -0
deepdoctection/analyzer/_config.py +0 -146
deepdoctection-0.42.1.dist-info/METADATA +0 -431
deepdoctection-0.42.1.dist-info/RECORD +0 -148
{deepdoctection-0.42.1.dist-info → deepdoctection-0.43.dist-info}/WHEEL +0 -0
{deepdoctection-0.42.1.dist-info → deepdoctection-0.43.dist-info}/licenses/LICENSE +0 -0
{deepdoctection-0.42.1.dist-info → deepdoctection-0.43.dist-info}/top_level.txt +0 -0

deepdoctection/pipe/order.py CHANGED Viewed

@@ -16,7 +16,7 @@
 # limitations under the License.
 """
-Module for ordering text and layout segments pipeline components
+Ordering text and layout segments
 """
 from __future__ import annotations
@@ -43,22 +43,22 @@ from ..utils.settings import LayoutType, ObjectTypes, Relationships, TypeOrStr,
 class OrderGenerator:
     """
-    Class for implementing text ordering logic and tasks that have preparational character. This includes logic for
-    grouping word type `ImageAnnotation` into text lines, splitting text lines into sub-lines (by detecting gaps
-    between words) as well as ordering text blocks (e.g. titles, tables, etc.).
+    Class for implementing text ordering logic and tasks that have preparational character.
+    This includes logic for grouping word type `ImageAnnotation` into text lines, splitting text lines into sub-lines
+    (by detecting gaps between words), as well as ordering text blocks (e.g., titles, tables, etc.).
     """
     def __init__(self, starting_point_tolerance: float, broken_line_tolerance: float, height_tolerance: float):
         """
-        Parameters for steering grouping and ordering on word level as well as on text block level.
-        :param starting_point_tolerance: Threshold to identify if two text blocks belong to one column: To check if two
-                                         text blocks belong to the same column, one condition says, that
-                                         x-coordinates of vertices should not differ more than this threshold
-        :param broken_line_tolerance: Threshold to identify if two consecutive words belonging to one line should be
-                                      in two different sub lines (because they belong to two different text columns).
-        :param height_tolerance: Threshold to identify if two columns lying over each other belong together or need to
-                                 be separated. Scaling factor of relative text block height.
+        Args:
+            starting_point_tolerance: Threshold to identify if two text blocks belong to one column. To check if two
+                                      text blocks belong to the same column, one condition says that x-coordinates of
+                                      vertices should not differ more than this threshold.
+            broken_line_tolerance: Threshold to identify if two consecutive words belonging to one line should be in two
+                                   different sub-lines (because they belong to two different text columns).
+            height_tolerance: Threshold to identify if two columns lying over each other belong together or need to be
+                              separated. Scaling factor of relative text block height.
         """
         self.starting_point_tolerance = starting_point_tolerance
         self.broken_line_tolerance = broken_line_tolerance
@@ -70,11 +70,27 @@ class OrderGenerator:
     def group_words_into_lines(
         word_anns: Sequence[ImageAnnotation], image_id: Optional[str] = None
     ) -> list[tuple[int, int, str]]:
-        """Arranging words into horizontal text lines and sorting text lines vertically in order to give
-        an enumeration of words that is used for establishing the reading order. Using this reading order arragement
-        makes only sense for words within a rectangle and needs to be revised in more complex appearances.
-        Function returns triplets for every word ann `(word reading order position, text line position, word annotation
-        id)`.
+        """
+        Arranges words into horizontal text lines and sorts text lines vertically to provide an enumeration of words
+        used for establishing the reading order.
+        Using this reading order arrangement makes sense only for words within a rectangle and needs to be revised in
+        more complex appearances.
+        Example:
+            ```python
+            group_words_into_lines(word_anns, image_id)
+            ```
+        Args:
+            word_anns: Sequence of `ImageAnnotation` representing words.
+            image_id: Optional image ID.
+        Returns:
+            List of triplets for every word annotation: (word reading order position, text line position, word
+            annotation id).
         """
         reading_lines = []
         rows: list[dict[str, float]] = []
@@ -118,11 +134,22 @@ class OrderGenerator:
         line_anns: Sequence[ImageAnnotation], image_id: Optional[str] = None
     ) -> list[tuple[int, int, str]]:
         """
-        Sorting reading lines. Returns for a list of `ImageAnnotation` an list of tuples (each tuple containing the
-        reading order and the `annotation_id` for each list element.
-        :param line_anns: text line `ImageAnnotation`
-        :param image_id: image_id of underyling image (to find get the bounding boxes)
-        :return: `list[(reading_order, reading_order,annotation_id)]`
+        Sorts reading lines.
+        Returns for a list of `ImageAnnotation` a list of tuples, each tuple containing the reading order and the
+        `annotation_id` for each list element.
+        Args:
+            line_anns: Sequence of text line `ImageAnnotation`.
+            image_id: Image ID of underlying image (to get the bounding boxes).
+        Returns:
+            List of tuples (reading_order, reading_order, annotation_id).
+        Example:
+            ```python
+            group_lines_into_lines(line_anns, image_id)
+            ```
         """
         reading_lines = []
         for ann in line_anns:
@@ -173,17 +200,27 @@ class OrderGenerator:
         self, anns: list[ImageAnnotation], image_width: float, image_height: float, image_id: Optional[str] = None
     ) -> Sequence[tuple[int, str]]:
         """
-        Determining a text ordering of text blocks. These text blocks should be larger sections than barely words.
-        It will first try to detect columns, then try to consolidate columns and finally try to detecting connected
-        components of columns. A connected component of columns is a group of columns that lie next to each other.
-        Having to connected components lying over each other will infer a reading order where the upper block of
-        connected component will be read first followed by text blocks of columns of the second.
-        :param anns: list of `ImageAnnotation` with all list element to sort.
-        :param image_width: image width (to re-calculate bounding boxes into relative coords)
-        :param image_height: image height (to re-calculate bounding boxes into relative coords)
-        :param image_id: image id
-        :return: list of tuples with reading order position and `annotation_id`
+        Determines a text ordering of text blocks.
+        These text blocks should be larger sections than just words. It will first try to detect columns, then try to
+        consolidate columns, and finally try to detect connected components of columns. A connected component of columns
+        is a group of columns that lie next to each other. If two connected components lie one above the other, the
+        text blocks of the upper component are read first, followed by the text blocks of the columns of the lower
+        component.
+        Example:
+            ```python
+            order_blocks(anns, image_width, image_height, image_id)
+            ```
+        Args:
+            anns: List of `ImageAnnotation` with all elements to sort.
+            image_width: Image width (to re-calculate bounding boxes into relative coordinates).
+            image_height: Image height (to re-calculate bounding boxes into relative coordinates).
+            image_id: Image ID.
+        Returns:
+            List of tuples with reading order position and `annotation_id`.
         """
         if not anns:
             return []
@@ -343,16 +380,24 @@ class OrderGenerator:
 class TextLineGenerator:
     """
-    Class for generating synthetic text lines from words. Possible to break text lines into sub lines by using
-    a paragraph break threshold. This allows to detect a multi column structure just by observing sub lines.
+    Class for generating synthetic text lines from words.
+    Possible to break text lines into sub-lines by using a paragraph break threshold. This allows detection of a
+    multi-column structure just by observing sub-lines.
     """
     def __init__(self, make_sub_lines: bool, paragraph_break: Optional[float] = None):
         """
-        :param make_sub_lines: Whether to build sub lines from lines.
-        :param paragraph_break: threshold of two consecutive words. If distance is larger than threshold, two sub-lines
-                                will be built. We use relative coordinates to calculate the distance between two
-                                consecutive words. A reasonable value is 0.035
+        Args:
+            make_sub_lines: Whether to build sub-lines from lines.
+            paragraph_break: Threshold of two consecutive words. If distance is larger than threshold, two sub-lines
+                will be built. Relative coordinates are used to calculate the distance between two consecutive words.
+                A reasonable value is `0.035`.
+        Raises:
+            ValueError: If `make_sub_lines` is `True` and `paragraph_break` is `None`.
         """
         if make_sub_lines and paragraph_break is None:
             raise ValueError("You must specify paragraph_break when setting make_sub_lines to True")
@@ -376,13 +421,22 @@ class TextLineGenerator:
         highest_level: bool = True,
     ) -> Sequence[DetectionResult]:
         """
-        Creating detecting result of lines (or sub lines) from given word type `ImageAnnotation`.
-        :param word_anns: list og given word type `ImageAnnotation`
-        :param image_width: image width
-        :param image_height: image height
-        :param image_id: image id
-        :return:
+        Creates detection result of lines (or sub-lines) from given word type `ImageAnnotation`.
+        Example:
+            ```python
+            create_detection_result(word_anns, image_width, image_height, image_id)
+            ```
+        Args:
+            word_anns: List of given word type `ImageAnnotation`.
+            image_width: Image width.
+            image_height: Image height.
+            image_id: Image ID.
+            highest_level: Whether this is the highest level of line creation.
+        Returns:
+            Sequence of `DetectionResult`.
         """
         if not word_anns:
             return []
@@ -462,9 +516,12 @@ class TextLineGenerator:
 class TextLineServiceMixin(PipelineComponent, ABC):
     """
-    This class is used to create text lines similar to TextOrderService.
-    It uses the logic of the TextOrderService but modifies it to suit its needs.
-    It specifically uses the _create_lines_for_words method and modifies the serve method.
+    This class is used to create text lines similar to `TextOrderService`.
+    It uses the logic of the `TextOrderService` but modifies it to suit its needs. It specifically uses the
+    `_create_lines_for_words` method and modifies the `serve` method.
     """
     def __init__(
@@ -474,7 +531,10 @@ class TextLineServiceMixin(PipelineComponent, ABC):
         paragraph_break: Optional[float] = None,
     ):
         """
-        Initialize the TextLineServiceMixin with a TextLineGenerator instance.
+        Args:
+            name: Name of the service.
+            include_residual_text_container: Whether to include residual text containers.
+            paragraph_break: Paragraph break threshold.
         """
         self.include_residual_text_container = include_residual_text_container
         self.text_line_generator = TextLineGenerator(self.include_residual_text_container, paragraph_break)
@@ -482,7 +542,13 @@ class TextLineServiceMixin(PipelineComponent, ABC):
     def _create_lines_for_words(self, word_anns: Sequence[ImageAnnotation]) -> Sequence[ImageAnnotation]:
         """
-        This method creates lines for words using the TextLineGenerator instance.
+        Creates lines for words using the `TextLineGenerator` instance.
+        Args:
+            word_anns: Sequence of `ImageAnnotation`.
+        Returns:
+            Sequence of `ImageAnnotation`.
         """
         detection_result_list = self.text_line_generator.create_detection_result(
             word_anns,
@@ -504,22 +570,24 @@ class TextLineServiceMixin(PipelineComponent, ABC):
 class TextLineService(TextLineServiceMixin):
     """
-    Some OCR systems do not identify lines of text but only provide text boxes for words. This is not sufficient
-    for certain applications. This service determines rule-based text lines based on word boxes. One difficulty is
-    that text lines are not continuous but are interrupted, for example in multi-column layouts.
-    These interruptions are taken into account insofar as the gap between two words on almost the same page height
-    must not be too large.
-    The service constructs new ImageAnnotation of the category `LayoutType.line` and forms relations between the
-    text lines and the words contained in the text lines. The reading order is not arranged.
+    Some OCR systems do not identify lines of text but only provide text boxes for words.
+    This is not sufficient for certain applications. This service determines rule-based text lines based on word boxes.
+    One difficulty is that text lines are not continuous but are interrupted, for example, in multi-column layouts.
+    These interruptions are taken into account insofar as the gap between two words on almost the same page height must
+    not be too large.
+    The service constructs new `ImageAnnotation` of the category `LayoutType.line` and forms relations between the text
+    lines and the words contained in the text lines. The reading order is not arranged.
     """
     def __init__(self, paragraph_break: Optional[float] = None):
         """
-        Initialize `TextLineService`
-        :param paragraph_break: threshold of two consecutive words. If distance is larger than threshold, two sublines
-                                will be built
+        Args:
+            paragraph_break: Threshold of two consecutive words. If distance is larger than threshold, two
+                             sub-lines will be built.
         """
         super().__init__(
             name="text_line",
@@ -553,24 +621,24 @@ class TextLineService(TextLineServiceMixin):
 class TextOrderService(TextLineServiceMixin):
     """
     Reading order of words within floating text blocks as well as reading order of blocks within simple text blocks.
-    To understand the difference between floating text blocks and simple text blocks consider a page containing an
-    article and a table. Table cells are text blocks that contain words which must be sorted.
-    However, they do not belong to floating text that encircle a table. They are rather an element that is supposed to
-    be read independently.
-    A heuristic argument for its ordering is used where the underlying assumption is the reading order from left to
-    right.
+    To understand the difference between floating text blocks and simple text blocks, consider a page containing an
+    article and a table. Table cells are text blocks that contain words which must be sorted. However, they do not
+    belong to floating text encircling a table. They are rather an element that is supposed to be read independently.
-        - For the reading order within a text block, text containers (i.e. image annotations that contain character
-          sub annotations) are sorted based on their bounding box center and then lines are formed: Each word induces a
-          new line, provided that its center is not in a line that has already
-          been created by an already processed word. The entire block width is defined as the line width
-          and the upper or lower line limit of the word bounding box as the upper or lower line limit. The reading order
-          of the words is from left to right within a line. The reading order of the lines is from top to bottom.
+    A heuristic argument for its ordering is used where the underlying assumption is the reading order from left
+    to right.
-        - For the reading order of text blocks within a page, the blocks are sorted using a similar procedure, with the
-          difference that columns are formed instead of lines. Column lengths are defined as the length of the entire
-          page and the left and right text block boundaries as the left and right column boundaries.
+    - For the reading order within a text block, text containers (i.e., image annotations that contain character
+      sub-annotations) are sorted based on their bounding box center and then lines are formed: Each word induces a new
+      line, provided that its center is not in a line that has already been created by an already processed word. The
+      entire block width is defined as the line width and the upper or lower line limit of the word bounding box as the
+      upper or lower line limit. The reading order of the words is from left to right within a line. The reading order
+      of the lines is from top to bottom.
+    - For the reading order of text blocks within a page, the blocks are sorted using a similar procedure, with the
+      difference that columns are formed instead of lines. Column lengths are defined as the length of the entire page
+      and the left and right text block boundaries as the left and right column boundaries.
     A category annotation per word is generated, which fixes the order per word in the block, as well as a category
     annotation per block, which saves the reading order of the block per page.
@@ -578,10 +646,19 @@ class TextOrderService(TextLineServiceMixin):
     The blocks are defined in `text_block_categories` and text blocks that should be considered when generating
     narrative text must be added in `floating_text_block_categories`.
-        order = TextOrderService(text_container="word",
-                                 text_block_categories=["title", "text", "list", "cell",
-                                                        "head", "body"],
-                                 floating_text_block_categories=["title", "text", "list"])
+    Example:
+        ```python
+        order = TextOrderService(
+            text_container="word",
+            text_block_categories=["title", "text", "list", "cell", "head", "body"],
+            floating_text_block_categories=["title", "text", "list"]
+        )
+        ```
+    Note:
+        The blocks are defined in `text_block_categories` and text blocks that should be considered when generating
+        narrative text must be added in `floating_text_block_categories`.
     """
     def __init__(
@@ -596,40 +673,42 @@ class TextOrderService(TextLineServiceMixin):
         paragraph_break: Optional[float] = 0.035,
     ):
         """
-        :param text_container: name of an image annotation that has a CHARS sub category. These annotations will be
-                               ordered within all text blocks.
-        :param text_block_categories: name of image annotation that have a relation with text containers and where
-                                      text containers need to be sorted. It will default to
-                                      `..datapoint.view.IMAGE_DEFAULTS["text_block_categories"]`
-        :param floating_text_block_categories: name of image annotation that belong to floating text. These annotations
-                               form the highest hierarchy of text blocks that will be ordered to generate a narrative
-                               output of text. It will default to
-                               `..datapoint.view.IMAGE_DEFAULTS["floating_text_block_categories"]`
-        :param include_residual_text_container: Text containers with no parent text block (e.g. not matched with any
-                                                parent annotation in `MatchingService`) will not be assigned with a
-                                                reading. (Reading order will only be assigned to image annotations that
-                                                are floating_text_block_categories or text containers matched with
-                                                text block annotations.) Setting `include_residual_text_container=True`
-                                                will build synthetic text lines from text containers and regard these
-                                                text lines as floating text blocks.
-        :param starting_point_tolerance: Threshold to identify if two text blocks belong to one column: To check if two
-                                         text blocks belong to the same column, one condition says, that
-                                         x-coordinates of vertices should not differ more than this threshold
-        :param broken_line_tolerance: Threshold to identify if two consecutive words belonging to one line should be
-                                      in two different sub-lines (because they belong to two different text columns).
-        :param height_tolerance: Threshold to identify if two columns lying over each other belong together or need to
-                                 be separated. Scaling factor of relative text block height.
+        Args:
+            text_container: `Name` of an image annotation that has a CHARS sub-category. These annotations will be
+                            ordered within all text blocks.
+            text_block_categories: Names of image annotations that have a relation with text containers and where text
+                                   containers need to be sorted. Defaults to `IMAGE_DEFAULTS["text_block_categories"]`.
+            floating_text_block_categories: Names of image annotations that belong to floating text. These annotations
+                                            form the highest hierarchy of text blocks that will be ordered to generate a
+                                            narrative output of text. Defaults to
+                                            `IMAGE_DEFAULTS["floating_text_block_categories"]`.
+            include_residual_text_container: Text containers with no parent text block (e.g., not matched with any
+                                             parent annotation in `MatchingService`) will not be assigned a reading
+                                             order. (Reading order will only be assigned to image annotations that are
+                                             `floating_text_block_categories` or text containers matched with text block
+                                             annotations.) Setting `include_residual_text_container=True` will build
+                                             synthetic text lines from text containers and regard these text lines as
+                                             floating text blocks.
+            starting_point_tolerance: Threshold to identify if two text blocks belong to one column. To check if two
+                                      text blocks belong to the same column, one condition says that x-coordinates of
+                                      vertices should not differ more than this threshold.
+            broken_line_tolerance: Threshold to identify if two consecutive words belonging to one line should be in two
+                                   different sub-lines (because they belong to two different text columns).
+            height_tolerance: Threshold to identify if two columns lying over each other belong together or need to be
+                              separated. Scaling factor of relative text block height.
+            paragraph_break: Threshold for the distance between two consecutive words. If the distance is larger
+                             than the threshold, two sub-lines will be built.
         """
         self.text_container = get_type(text_container)
         if isinstance(text_block_categories, (str, ObjectTypes)):
             text_block_categories = (get_type(text_block_categories),)
         if text_block_categories is None:
-            text_block_categories = IMAGE_DEFAULTS["text_block_categories"]
+            text_block_categories = IMAGE_DEFAULTS.TEXT_BLOCK_CATEGORIES
         self.text_block_categories = tuple((get_type(category) for category in text_block_categories))
         if isinstance(floating_text_block_categories, (str, ObjectTypes)):
             floating_text_block_categories = (get_type(floating_text_block_categories),)
         if floating_text_block_categories is None:
-            floating_text_block_categories = IMAGE_DEFAULTS["floating_text_block_categories"]
+            floating_text_block_categories = IMAGE_DEFAULTS.FLOATING_TEXT_BLOCK_CATEGORIES
         self.floating_text_block_categories = tuple((get_type(category) for category in floating_text_block_categories))
         if include_residual_text_container:
             self.floating_text_block_categories = self.floating_text_block_categories + (LayoutType.LINE,)
@@ -676,10 +755,13 @@ class TextOrderService(TextLineServiceMixin):
     def order_text_in_text_block(self, text_block_ann: ImageAnnotation) -> None:
         """
-        Order text within a text block. It will take all child-like text containers (determined by a
-        `MatchingOrderService`)  from a block and going to order all items line-wise.
+        Orders text within a text block.
+        It will take all child-like text containers (determined by a `MatchingService`) from a block and order
+        all items line-wise.
-        :param text_block_ann: text block annotation (category one of `text_block_categories`).
+        Args:
+            text_block_ann: Text block annotation (category one of `text_block_categories`).
         """
         text_container_ids = text_block_ann.get_relationship(Relationships.CHILD)
         text_container_ann = self.dp_manager.datapoint.get_annotation(
@@ -700,9 +782,10 @@ class TextOrderService(TextLineServiceMixin):
     def order_blocks(self, text_block_anns: list[ImageAnnotation]) -> None:
         """
-        Ordering of text blocks. Will use the internal order generator.
+        Orders text blocks using the internal order generator.
-        :param text_block_anns: list of `ImageAnnotation`.
+        Args:
+            text_block_anns: List of `ImageAnnotation`.
         """
         block_order_list = self.order_generator.order_blocks(
             text_block_anns, self.dp_manager.datapoint.width, self.dp_manager.datapoint.height

deepdoctection 0.42.1__py3-none-any.whl → 0.43__py3-none-any.whl

Potentially problematic release.

deepdoctection 0.42.1__py3-none-any.whl → 0.43__py3-none-any.whl