PyPI - deepdoctection - Versions diffs - 0.32__py3-none-any.whl → 0.34__py3-none-any.whl - Mend

deepdoctection 0.32__py3-none-any.whl → 0.34__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of deepdoctection might be problematic. Click here for more details.

Files changed (111)

deepdoctection/__init__.py +8 -25
deepdoctection/analyzer/dd.py +84 -71
deepdoctection/dataflow/common.py +9 -5
deepdoctection/dataflow/custom.py +5 -5
deepdoctection/dataflow/custom_serialize.py +75 -18
deepdoctection/dataflow/parallel_map.py +3 -3
deepdoctection/dataflow/serialize.py +4 -4
deepdoctection/dataflow/stats.py +3 -3
deepdoctection/datapoint/annotation.py +78 -56
deepdoctection/datapoint/box.py +7 -7
deepdoctection/datapoint/convert.py +6 -6
deepdoctection/datapoint/image.py +157 -75
deepdoctection/datapoint/view.py +175 -151
deepdoctection/datasets/adapter.py +30 -24
deepdoctection/datasets/base.py +10 -10
deepdoctection/datasets/dataflow_builder.py +3 -3
deepdoctection/datasets/info.py +23 -25
deepdoctection/datasets/instances/doclaynet.py +48 -49
deepdoctection/datasets/instances/fintabnet.py +44 -45
deepdoctection/datasets/instances/funsd.py +23 -23
deepdoctection/datasets/instances/iiitar13k.py +8 -8
deepdoctection/datasets/instances/layouttest.py +2 -2
deepdoctection/datasets/instances/publaynet.py +3 -3
deepdoctection/datasets/instances/pubtables1m.py +18 -18
deepdoctection/datasets/instances/pubtabnet.py +30 -29
deepdoctection/datasets/instances/rvlcdip.py +28 -29
deepdoctection/datasets/instances/xfund.py +51 -30
deepdoctection/datasets/save.py +6 -6
deepdoctection/eval/accmetric.py +32 -33
deepdoctection/eval/base.py +8 -9
deepdoctection/eval/cocometric.py +13 -12
deepdoctection/eval/eval.py +32 -26
deepdoctection/eval/tedsmetric.py +16 -12
deepdoctection/eval/tp_eval_callback.py +7 -16
deepdoctection/extern/base.py +339 -134
deepdoctection/extern/d2detect.py +69 -89
deepdoctection/extern/deskew.py +11 -10
deepdoctection/extern/doctrocr.py +81 -64
deepdoctection/extern/fastlang.py +23 -16
deepdoctection/extern/hfdetr.py +53 -38
deepdoctection/extern/hflayoutlm.py +216 -155
deepdoctection/extern/hflm.py +35 -30
deepdoctection/extern/model.py +433 -255
deepdoctection/extern/pdftext.py +15 -15
deepdoctection/extern/pt/ptutils.py +4 -2
deepdoctection/extern/tessocr.py +39 -38
deepdoctection/extern/texocr.py +14 -16
deepdoctection/extern/tp/tfutils.py +16 -2
deepdoctection/extern/tp/tpcompat.py +11 -7
deepdoctection/extern/tp/tpfrcnn/config/config.py +4 -4
deepdoctection/extern/tp/tpfrcnn/modeling/backbone.py +1 -1
deepdoctection/extern/tp/tpfrcnn/modeling/model_box.py +5 -5
deepdoctection/extern/tp/tpfrcnn/modeling/model_fpn.py +6 -6
deepdoctection/extern/tp/tpfrcnn/modeling/model_frcnn.py +4 -4
deepdoctection/extern/tp/tpfrcnn/modeling/model_mrcnn.py +5 -3
deepdoctection/extern/tp/tpfrcnn/preproc.py +5 -5
deepdoctection/extern/tpdetect.py +40 -45
deepdoctection/mapper/cats.py +36 -40
deepdoctection/mapper/cocostruct.py +16 -12
deepdoctection/mapper/d2struct.py +22 -22
deepdoctection/mapper/hfstruct.py +7 -7
deepdoctection/mapper/laylmstruct.py +22 -24
deepdoctection/mapper/maputils.py +9 -10
deepdoctection/mapper/match.py +33 -2
deepdoctection/mapper/misc.py +6 -7
deepdoctection/mapper/pascalstruct.py +4 -4
deepdoctection/mapper/prodigystruct.py +6 -6
deepdoctection/mapper/pubstruct.py +84 -92
deepdoctection/mapper/tpstruct.py +3 -3
deepdoctection/mapper/xfundstruct.py +33 -33
deepdoctection/pipe/anngen.py +39 -14
deepdoctection/pipe/base.py +68 -99
deepdoctection/pipe/common.py +181 -85
deepdoctection/pipe/concurrency.py +14 -10
deepdoctection/pipe/doctectionpipe.py +24 -21
deepdoctection/pipe/language.py +20 -25
deepdoctection/pipe/layout.py +18 -16
deepdoctection/pipe/lm.py +49 -47
deepdoctection/pipe/order.py +63 -65
deepdoctection/pipe/refine.py +102 -109
deepdoctection/pipe/segment.py +157 -162
deepdoctection/pipe/sub_layout.py +50 -40
deepdoctection/pipe/text.py +37 -36
deepdoctection/pipe/transform.py +19 -16
deepdoctection/train/d2_frcnn_train.py +27 -25
deepdoctection/train/hf_detr_train.py +22 -18
deepdoctection/train/hf_layoutlm_train.py +49 -48
deepdoctection/train/tp_frcnn_train.py +10 -11
deepdoctection/utils/concurrency.py +1 -1
deepdoctection/utils/context.py +13 -6
deepdoctection/utils/develop.py +4 -4
deepdoctection/utils/env_info.py +52 -14
deepdoctection/utils/file_utils.py +6 -11
deepdoctection/utils/fs.py +41 -14
deepdoctection/utils/identifier.py +2 -2
deepdoctection/utils/logger.py +15 -15
deepdoctection/utils/metacfg.py +7 -7
deepdoctection/utils/pdf_utils.py +39 -14
deepdoctection/utils/settings.py +188 -182
deepdoctection/utils/tqdm.py +1 -1
deepdoctection/utils/transform.py +14 -9
deepdoctection/utils/types.py +104 -0
deepdoctection/utils/utils.py +7 -7
deepdoctection/utils/viz.py +70 -69
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/METADATA +7 -4
deepdoctection-0.34.dist-info/RECORD +146 -0
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/WHEEL +1 -1
deepdoctection/utils/detection_types.py +0 -68
deepdoctection-0.32.dist-info/RECORD +0 -146
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/LICENSE +0 -0
{deepdoctection-0.32.dist-info → deepdoctection-0.34.dist-info}/top_level.txt +0 -0

deepdoctection/datapoint/view.py CHANGED Viewed

@@ -22,11 +22,10 @@ simplify consumption
 from __future__ import annotations
 from copy import copy
-from typing import Any, Dict, List, Mapping, Optional, Sequence, Set, Tuple, Type, Union, no_type_check
+from typing import Any, Mapping, Optional, Sequence, Type, TypedDict, Union, no_type_check
 import numpy as np
-from ..utils.detection_types import ImageType, JsonDict, Pathlike
 from ..utils.error import AnnotationError, ImageError
 from ..utils.logger import LoggingRecord, logger
 from ..utils.settings import (
@@ -35,13 +34,15 @@ from ..utils.settings import (
     ObjectTypes,
     PageType,
     Relationships,
+    SummaryType,
     TableType,
     TokenClasses,
     WordType,
     get_type,
 )
+from ..utils.types import HTML, AnnotationDict, Chunks, ImageDict, PathLikeOrStr, PixelValues, Text_, csv
 from ..utils.viz import draw_boxes, interactive_imshow, viz_handler
-from .annotation import ContainerAnnotation, ImageAnnotation, SummaryAnnotation, ann_from_dict
+from .annotation import CategoryAnnotation, ContainerAnnotation, ImageAnnotation, ann_from_dict
 from .box import BoundingBox, crop_box_from_image
 from .image import Image
@@ -68,7 +69,7 @@ class ImageAnnotationBaseView(ImageAnnotation):
     base_page: Page
     @property
-    def bbox(self) -> List[float]:
+    def bbox(self) -> list[float]:
         """
         Get the bounding box as list and in absolute coordinates of the base page.
         """
@@ -79,7 +80,7 @@ class ImageAnnotationBaseView(ImageAnnotation):
             bounding_box = bounding_box.transform(self.base_page.width, self.base_page.height, absolute_coords=True)
         return bounding_box.to_list(mode="xyxy")
-    def viz(self, interactive: bool = False) -> Optional[ImageType]:
+    def viz(self, interactive: bool = False) -> Optional[PixelValues]:
         """
         Display the annotation (without any sub-layout elements).
@@ -100,7 +101,7 @@ class ImageAnnotationBaseView(ImageAnnotation):
             return np_image
         raise AnnotationError(f"base_page.image is None for {self.annotation_id}")
-    def __getattr__(self, item: str) -> Optional[Union[str, int, List[str]]]:
+    def __getattr__(self, item: str) -> Optional[Union[str, int, list[str]]]:
         """
         Get attributes defined by registered `self.get_attribute_names()` in a multi step process:
@@ -124,19 +125,18 @@ class ImageAnnotationBaseView(ImageAnnotation):
                 return sub_cat.category_name
             if isinstance(sub_cat, ContainerAnnotation):
                 return sub_cat.value
-            return int(sub_cat.category_id)
+            return sub_cat.category_id
         if self.image is not None:
-            if self.image.summary is not None:
-                if item in self.image.summary.sub_categories:
-                    sub_cat = self.get_summary(get_type(item))
-                    if item != sub_cat.category_name:
-                        return sub_cat.category_name
-                    if isinstance(sub_cat, ContainerAnnotation):
-                        return sub_cat.value
-                    return int(sub_cat.category_id)
+            if item in self.image.summary.sub_categories:
+                sub_cat = self.get_summary(get_type(item))
+                if item != sub_cat.category_name:
+                    return sub_cat.category_name
+                if isinstance(sub_cat, ContainerAnnotation):
+                    return sub_cat.value
+                return sub_cat.category_id
         return None
-    def get_attribute_names(self) -> Set[str]:
+    def get_attribute_names(self) -> set[str]:
         """
         :return: A set of registered attributes. When sub classing modify this method accordingly.
         """
@@ -144,12 +144,11 @@ class ImageAnnotationBaseView(ImageAnnotation):
         # sub categories and summary sub categories are valid attribute names
         attribute_names = {"bbox", "np_image"}.union({cat.value for cat in self.sub_categories})
         if self.image:
-            if self.image.summary:
-                attribute_names = attribute_names.union({cat.value for cat in self.image.summary.sub_categories.keys()})
+            attribute_names = attribute_names.union({cat.value for cat in self.image.summary.sub_categories.keys()})
         return attribute_names
     @classmethod
-    def from_dict(cls, **kwargs: JsonDict) -> ImageAnnotationBaseView:
+    def from_dict(cls, **kwargs: AnnotationDict) -> ImageAnnotationBaseView:
         """
         Identical to its base class method for having correct return types. If the base class changes, please
         change this method as well.
@@ -165,8 +164,8 @@ class Word(ImageAnnotationBaseView):
     Word specific subclass of `ImageAnnotationBaseView` modelled by `WordType`.
     """
-    def get_attribute_names(self) -> Set[str]:
-        return set(WordType).union(super().get_attribute_names()).union({Relationships.reading_order})
+    def get_attribute_names(self) -> set[str]:
+        return set(WordType).union(super().get_attribute_names()).union({Relationships.READING_ORDER})
 class Layout(ImageAnnotationBaseView):
@@ -181,13 +180,13 @@ class Layout(ImageAnnotationBaseView):
     text_container: Optional[ObjectTypes] = None
     @property
-    def words(self) -> List[ImageAnnotationBaseView]:
+    def words(self) -> list[ImageAnnotationBaseView]:
         """
         Get a list of `ImageAnnotationBaseView` objects with `LayoutType` defined by `text_container`.
         It will only select those among all annotations that have an entry in `Relationships.child` .
         """
         if self.category_name != self.text_container:
-            text_ids = self.get_relationship(Relationships.child)
+            text_ids = self.get_relationship(Relationships.CHILD)
             return self.base_page.get_annotation(annotation_ids=text_ids, category_names=self.text_container)
         return [self]
@@ -199,17 +198,25 @@ class Layout(ImageAnnotationBaseView):
         words = self.get_ordered_words()
         return " ".join([word.characters for word in words])  # type: ignore
-    def get_ordered_words(self) -> List[ImageAnnotationBaseView]:
+    def get_ordered_words(self) -> list[ImageAnnotationBaseView]:
         """Returns a list of words order by reading order. Words with no reading order will not be returned"""
         words_with_reading_order = [word for word in self.words if word.reading_order is not None]
         words_with_reading_order.sort(key=lambda x: x.reading_order)  # type: ignore
         return words_with_reading_order
     @property
-    def text_(self) -> JsonDict:
-        """Returns a dict `{"text": text string,
-        "text_list": list of single words,
-        "annotation_ids": word annotation ids`"""
+    def text_(self) -> Text_:
+        """Returns a dict
+        `{"text": text string,
+          "text_list": list of single words,
+          "ann_ids": word annotation ids`,
+          "token_classes": token classes,
+          "token_tags": token tags,
+          "token_class_ids": token class ids,
+          "token_tag_ids": token tag ids}`
+        """
         words = self.get_ordered_words()
         characters, ann_ids, token_classes, token_tags, token_classes_ids, token_tag_ids = zip(
             *[
@@ -218,13 +225,11 @@ class Layout(ImageAnnotationBaseView):
                     word.annotation_id,
                     word.token_class,
                     word.token_tag,
-                    (
-                        word.get_sub_category(WordType.token_class).category_id
-                        if WordType.token_class in word.sub_categories
-                        else None
-                    ),
-                    (word.get_sub_category(WordType.token_tag).category_id)
-                    if WordType.token_tag in word.sub_categories
+                    word.get_sub_category(WordType.TOKEN_CLASS).category_id
+                    if WordType.TOKEN_CLASS in word.sub_categories
+                    else None,
+                    word.get_sub_category(WordType.TOKEN_TAG).category_id
+                    if WordType.TOKEN_TAG in word.sub_categories
                     else None,
                 )
                 for word in words
@@ -240,8 +245,8 @@ class Layout(ImageAnnotationBaseView):
             "token_tag_ids": token_tag_ids,
         }
-    def get_attribute_names(self) -> Set[str]:
-        return {"words", "text"}.union(super().get_attribute_names()).union({Relationships.reading_order})
+    def get_attribute_names(self) -> set[str]:
+        return {"words", "text"}.union(super().get_attribute_names()).union({Relationships.READING_ORDER})
     def __len__(self) -> int:
         """len of text counted by number of characters"""
@@ -253,7 +258,7 @@ class Cell(Layout):
     Cell specific subclass of `ImageAnnotationBaseView` modelled by `CellType`.
     """
-    def get_attribute_names(self) -> Set[str]:
+    def get_attribute_names(self) -> set[str]:
         return set(CellType).union(super().get_attribute_names())
@@ -263,52 +268,52 @@ class Table(Layout):
     """
     @property
-    def cells(self) -> List[ImageAnnotationBaseView]:
+    def cells(self) -> list[ImageAnnotationBaseView]:
         """
         A list of a table cells.
         """
-        all_relation_ids = self.get_relationship(Relationships.child)
+        all_relation_ids = self.get_relationship(Relationships.CHILD)
         cell_anns = self.base_page.get_annotation(
             annotation_ids=all_relation_ids,
             category_names=[
-                LayoutType.cell,
-                CellType.header,
-                CellType.body,
-                CellType.projected_row_header,
-                CellType.spanning,
-                CellType.row_header,
-                CellType.column_header,
+                LayoutType.CELL,
+                CellType.HEADER,
+                CellType.BODY,
+                CellType.PROJECTED_ROW_HEADER,
+                CellType.SPANNING,
+                CellType.ROW_HEADER,
+                CellType.COLUMN_HEADER,
             ],
         )
         return cell_anns
     @property
-    def rows(self) -> List[ImageAnnotationBaseView]:
+    def rows(self) -> list[ImageAnnotationBaseView]:
         """
         A list of a table rows.
         """
-        all_relation_ids = self.get_relationship(Relationships.child)
-        row_anns = self.base_page.get_annotation(annotation_ids=all_relation_ids, category_names=[LayoutType.row])
+        all_relation_ids = self.get_relationship(Relationships.CHILD)
+        row_anns = self.base_page.get_annotation(annotation_ids=all_relation_ids, category_names=[LayoutType.ROW])
         return row_anns
     @property
-    def columns(self) -> List[ImageAnnotationBaseView]:
+    def columns(self) -> list[ImageAnnotationBaseView]:
         """
         A list of a table columns.
         """
-        all_relation_ids = self.get_relationship(Relationships.child)
-        col_anns = self.base_page.get_annotation(annotation_ids=all_relation_ids, category_names=[LayoutType.column])
+        all_relation_ids = self.get_relationship(Relationships.CHILD)
+        col_anns = self.base_page.get_annotation(annotation_ids=all_relation_ids, category_names=[LayoutType.COLUMN])
         return col_anns
     @property
-    def html(self) -> str:
+    def html(self) -> HTML:
         """
         The html representation of the table
         """
         html_list = []
-        if TableType.html in self.sub_categories:
-            ann = self.get_sub_category(TableType.html)
+        if TableType.HTML in self.sub_categories:
+            ann = self.get_sub_category(TableType.HTML)
             if isinstance(ann, ContainerAnnotation):
                 if isinstance(ann.value, list):
                     html_list = copy(ann.value)
@@ -322,7 +327,7 @@ class Table(Layout):
         return "".join(html_list)
-    def get_attribute_names(self) -> Set[str]:
+    def get_attribute_names(self) -> set[str]:
         return (
             set(TableType)
             .union(super().get_attribute_names())
@@ -330,7 +335,7 @@ class Table(Layout):
         )
     @property
-    def csv(self) -> List[List[str]]:
+    def csv(self) -> csv:
         """Returns a csv-style representation of a table as list of lists of string. Cell content of cell with higher
         row or column spans will be shown at the upper left cell tile. All other tiles covered by the cell will be left
         as blank
@@ -355,17 +360,17 @@ class Table(Layout):
             return super().text
     @property
-    def text_(self) -> JsonDict:
+    def text_(self) -> Text_:
         cells = self.cells
         if not cells:
             return super().text_
-        text: List[str] = []
-        words: List[str] = []
-        ann_ids: List[str] = []
-        token_classes: List[str] = []
-        token_tags: List[str] = []
-        token_class_ids: List[str] = []
-        token_tag_ids: List[str] = []
+        text: list[str] = []
+        words: list[str] = []
+        ann_ids: list[str] = []
+        token_classes: list[str] = []
+        token_tags: list[str] = []
+        token_class_ids: list[str] = []
+        token_tag_ids: list[str] = []
         for cell in cells:
             text.extend(cell.text_["text"])  # type: ignore
             words.extend(cell.text_["words"])  # type: ignore
@@ -385,12 +390,12 @@ class Table(Layout):
         }
     @property
-    def words(self) -> List[ImageAnnotationBaseView]:
+    def words(self) -> list[ImageAnnotationBaseView]:
         """
         Get a list of `ImageAnnotationBaseView` objects with `LayoutType` defined by `text_container`.
         It will only select those among all annotations that have an entry in `Relationships.child` .
         """
-        all_words: List[ImageAnnotationBaseView] = []
+        all_words: list[ImageAnnotationBaseView] = []
         cells = self.cells
         if not cells:
             return super().words
@@ -398,12 +403,12 @@ class Table(Layout):
             all_words.extend(cell.words)  # type: ignore
         return all_words
-    def get_ordered_words(self) -> List[ImageAnnotationBaseView]:
+    def get_ordered_words(self) -> list[ImageAnnotationBaseView]:
         """Returns a list of words order by reading order. Words with no reading order will not be returned"""
         try:
             cells = self.cells
             all_words = []
-            cells.sort(key=lambda x: (x.row_number, x.column_number))
+            cells.sort(key=lambda x: (x.ROW_NUMBER, x.COLUMN_NUMBER))
             for cell in cells:
                 all_words.extend(cell.get_ordered_words())  # type: ignore
             return all_words
@@ -411,27 +416,42 @@ class Table(Layout):
             return super().get_ordered_words()
-IMAGE_ANNOTATION_TO_LAYOUTS: Dict[ObjectTypes, Type[Union[Layout, Table, Word]]] = {
-    **{i: Layout for i in LayoutType if (i not in {LayoutType.table, LayoutType.word, LayoutType.cell})},
-    LayoutType.table: Table,
-    LayoutType.table_rotated: Table,
-    LayoutType.word: Word,
-    LayoutType.cell: Cell,
-    CellType.projected_row_header: Cell,
-    CellType.spanning: Cell,
-    CellType.row_header: Cell,
-    CellType.column_header: Cell,
+IMAGE_ANNOTATION_TO_LAYOUTS: dict[ObjectTypes, Type[Union[Layout, Table, Word]]] = {
+    **{i: Layout for i in LayoutType if (i not in {LayoutType.TABLE, LayoutType.WORD, LayoutType.CELL})},
+    LayoutType.TABLE: Table,
+    LayoutType.TABLE_ROTATED: Table,
+    LayoutType.WORD: Word,
+    LayoutType.CELL: Cell,
+    CellType.PROJECTED_ROW_HEADER: Cell,
+    CellType.SPANNING: Cell,
+    CellType.ROW_HEADER: Cell,
+    CellType.COLUMN_HEADER: Cell,
 }
-IMAGE_DEFAULTS: Dict[str, Union[LayoutType, Sequence[ObjectTypes]]] = {
-    "text_container": LayoutType.word,
-    "floating_text_block_categories": [
-        LayoutType.text,
-        LayoutType.title,
-        LayoutType.figure,
-        LayoutType.list,
-    ],
-    "text_block_categories": [LayoutType.text, LayoutType.title, LayoutType.figure, LayoutType.list, LayoutType.cell],
+class ImageDefaults(TypedDict):
+    """ImageDefaults"""
+    text_container: LayoutType
+    floating_text_block_categories: tuple[LayoutType, ...]
+    text_block_categories: tuple[LayoutType, ...]
+IMAGE_DEFAULTS: ImageDefaults = {
+    "text_container": LayoutType.WORD,
+    "floating_text_block_categories": (
+        LayoutType.TEXT,
+        LayoutType.TITLE,
+        LayoutType.FIGURE,
+        LayoutType.LIST,
+    ),
+    "text_block_categories": (
+        LayoutType.TEXT,
+        LayoutType.TITLE,
+        LayoutType.FIGURE,
+        LayoutType.LIST,
+        LayoutType.CELL,
+    ),
 }
@@ -448,7 +468,7 @@ def ann_obj_view_factory(annotation: ImageAnnotation, text_container: ObjectType
     # We need to handle annotations that are text containers like words
     if annotation.category_name == text_container:
-        layout_class = IMAGE_ANNOTATION_TO_LAYOUTS[LayoutType.word]
+        layout_class = IMAGE_ANNOTATION_TO_LAYOUTS[LayoutType.WORD]
     else:
         layout_class = IMAGE_ANNOTATION_TO_LAYOUTS[annotation.category_name]
     ann_dict = annotation.as_dict()
@@ -477,9 +497,9 @@ class Page(Image):
     """
     text_container: ObjectTypes
-    floating_text_block_categories: List[ObjectTypes]
+    floating_text_block_categories: list[ObjectTypes]
     image_orig: Image
-    _attribute_names: Set[str] = {
+    _attribute_names: set[str] = {
         "text",
         "chunks",
         "tables",
@@ -500,7 +520,7 @@ class Page(Image):
         model_id: Optional[Union[str, Sequence[str]]] = None,
         session_ids: Optional[Union[str, Sequence[str]]] = None,
         ignore_inactive: bool = True,
-    ) -> List[ImageAnnotationBaseView]:
+    ) -> list[ImageAnnotationBaseView]:
         """
         Selection of annotations from the annotation container. Filter conditions can be defined by specifying
         the annotation_id or the category name. (Since only image annotations are currently allowed in the container,
@@ -523,9 +543,9 @@ class Page(Image):
         if category_names is not None:
             category_names = (
-                [get_type(cat_name) for cat_name in category_names]
-                if isinstance(category_names, list)
-                else [get_type(category_names)]  # type:ignore
+                (get_type(category_names),)
+                if isinstance(category_names, str)
+                else tuple(get_type(cat_name) for cat_name in category_names)
             )
         ann_ids = [annotation_ids] if isinstance(annotation_ids, str) else annotation_ids
         service_id = [service_id] if isinstance(service_id, str) else service_id
@@ -533,60 +553,59 @@ class Page(Image):
         session_id = [session_ids] if isinstance(session_ids, str) else session_ids
         if ignore_inactive:
-            anns = filter(lambda x: x.active, self.annotations)
+            anns: Union[list[ImageAnnotation], filter[ImageAnnotation]] = filter(lambda x: x.active, self.annotations)
         else:
-            anns = self.annotations  # type:ignore
+            anns = self.annotations
         if category_names is not None:
-            anns = filter(lambda x: x.category_name in category_names, anns)  # type:ignore
+            anns = filter(lambda x: x.category_name in category_names, anns)
         if ann_ids is not None:
-            anns = filter(lambda x: x.annotation_id in ann_ids, anns)  # type:ignore
+            anns = filter(lambda x: x.annotation_id in ann_ids, anns)
         if service_id is not None:
-            anns = filter(lambda x: x.generating_service in service_id, anns)  # type:ignore
+            anns = filter(lambda x: x.generating_service in service_id, anns)
         if model_id is not None:
-            anns = filter(lambda x: x.generating_model in model_id, anns)  # type:ignore
+            anns = filter(lambda x: x.generating_model in model_id, anns)
         if session_id is not None:
-            anns = filter(lambda x: x.session_id in session_id, anns)  # type:ignore
+            anns = filter(lambda x: x.session_id in session_id, anns)
-        return list(anns)  # type:ignore
+        return list(anns)  # type: ignore
     def __getattr__(self, item: str) -> Any:
         if item not in self.get_attribute_names():
             raise ImageError(f"Attribute {item} is not supported for {type(self)}")
-        if self.summary is not None:
-            if item in self.summary.sub_categories:
-                sub_cat = self.summary.get_sub_category(get_type(item))
-                if item != sub_cat.category_name:
-                    return sub_cat.category_name
-                if isinstance(sub_cat, ContainerAnnotation):
-                    return sub_cat.value
-                return int(sub_cat.category_id)
+        if item in self.summary.sub_categories:
+            sub_cat = self.summary.get_sub_category(get_type(item))
+            if item != sub_cat.category_name:
+                return sub_cat.category_name
+            if isinstance(sub_cat, ContainerAnnotation):
+                return sub_cat.value
+            return sub_cat.category_id
         return None
     @property
-    def layouts(self) -> List[ImageAnnotationBaseView]:
+    def layouts(self) -> list[ImageAnnotationBaseView]:
         """
         A list of a layouts. Layouts are all exactly all floating text block categories
         """
         return self.get_annotation(category_names=self.floating_text_block_categories)
     @property
-    def words(self) -> List[ImageAnnotationBaseView]:
+    def words(self) -> list[ImageAnnotationBaseView]:
         """
         A list of a words. Word are all text containers
         """
         return self.get_annotation(category_names=self.text_container)
     @property
-    def tables(self) -> List[ImageAnnotationBaseView]:
+    def tables(self) -> list[ImageAnnotationBaseView]:
         """
         A list of a tables.
         """
-        return self.get_annotation(category_names=LayoutType.table)
+        return self.get_annotation(category_names=LayoutType.TABLE)
     @classmethod
     def from_image(
@@ -612,13 +631,13 @@ class Page(Image):
         """
         if text_container is None:
-            text_container = IMAGE_DEFAULTS["text_container"]  # type: ignore
+            text_container = IMAGE_DEFAULTS["text_container"]
         if not floating_text_block_categories:
-            floating_text_block_categories = copy(IMAGE_DEFAULTS["floating_text_block_categories"])  # type: ignore
+            floating_text_block_categories = IMAGE_DEFAULTS["floating_text_block_categories"]
-        if include_residual_text_container and LayoutType.line not in floating_text_block_categories:  # type: ignore
-            floating_text_block_categories.append(LayoutType.line)  # type: ignore
+        if include_residual_text_container and LayoutType.LINE not in floating_text_block_categories:
+            floating_text_block_categories = tuple(floating_text_block_categories) + (LayoutType.LINE,)
         img_kwargs = image_orig.as_dict()
         page = cls(
@@ -646,18 +665,23 @@ class Page(Image):
                 if image_dict:
                     image = Image.from_dict(**image_dict)
                     layout_ann.image = cls.from_image(
-                        image, text_container, floating_text_block_categories, base_page=page
+                        image_orig=image,
+                        text_container=text_container,
+                        floating_text_block_categories=floating_text_block_categories,
+                        include_residual_text_container=include_residual_text_container,
+                        base_page=page,
                     )
             layout_ann.base_page = base_page if base_page is not None else page
             page.dump(layout_ann)
         if summary_dict := img_kwargs.get("_summary"):
-            page.summary = SummaryAnnotation.from_dict(**summary_dict)
+            page.summary = CategoryAnnotation.from_dict(**summary_dict)
+            page.summary.category_name = SummaryType.SUMMARY
         page.floating_text_block_categories = floating_text_block_categories  # type: ignore
-        page.text_container = text_container  # type: ignore
+        page.text_container = text_container
         page.include_residual_text_container = include_residual_text_container
         return page
-    def _order(self, block: str) -> List[ImageAnnotationBaseView]:
+    def _order(self, block: str) -> list[ImageAnnotationBaseView]:
         blocks_with_order = [layout for layout in getattr(self, block) if layout.reading_order is not None]
         blocks_with_order.sort(key=lambda x: x.reading_order)
         return blocks_with_order
@@ -678,18 +702,18 @@ class Page(Image):
         return self._make_text()
     @property
-    def text_(self) -> JsonDict:
+    def text_(self) -> Text_:
         """Returns a dict `{"text": text string,
         "text_list": list of single words,
         "annotation_ids": word annotation ids`"""
         block_with_order = self._order("layouts")
-        text: List[str] = []
-        words: List[str] = []
-        ann_ids: List[str] = []
-        token_classes: List[str] = []
-        token_tags: List[str] = []
-        token_class_ids: List[str] = []
-        token_tag_ids: List[str] = []
+        text: list[str] = []
+        words: list[str] = []
+        ann_ids: list[str] = []
+        token_classes: list[str] = []
+        token_tags: list[str] = []
+        token_class_ids: list[str] = []
+        token_tag_ids: list[str] = []
         for block in block_with_order:
             text.append(block.text_["text"])  # type: ignore
             words.extend(block.text_["words"])  # type: ignore
@@ -708,7 +732,7 @@ class Page(Image):
             "token_tag_ids": token_tag_ids,
         }
-    def get_layout_context(self, annotation_id: str, context_size: int = 3) -> List[ImageAnnotationBaseView]:
+    def get_layout_context(self, annotation_id: str, context_size: int = 3) -> list[ImageAnnotationBaseView]:
         """For a given `annotation_id` get a list of `ImageAnnotation` that are nearby in terms of reading order.
         For a given context_size it will return all layouts with reading_order between
         reading_order(annoation_id)-context_size and  reading_order(annoation_id)-context_size.
@@ -731,7 +755,7 @@ class Page(Image):
         ]
     @property
-    def chunks(self) -> List[Tuple[str, str, int, str, str, str, str]]:
+    def chunks(self) -> Chunks:
         """
         :return: Returns a "chunk" of a layout element or a table as a 7-tuple containing
@@ -783,7 +807,7 @@ class Page(Image):
         ignore_default_token_class: bool = False,
         interactive: bool = False,
         **debug_kwargs: str,
-    ) -> Optional[ImageType]:
+    ) -> Optional[PixelValues]:
         """
         Display a page with detected bounding boxes of various types.
@@ -813,7 +837,7 @@ class Page(Image):
         :return: If `interactive=False` will return a numpy array.
         """
-        category_names_list: List[Union[str, None]] = []
+        category_names_list: list[Union[str, None]] = []
         box_stack = []
         cells_found = False
@@ -836,15 +860,15 @@ class Page(Image):
         if show_tables and not debug_kwargs:
             for table in self.tables:
                 box_stack.append(table.bbox)
-                category_names_list.append(LayoutType.table.value)
+                category_names_list.append(LayoutType.TABLE.value)
                 if show_cells:
                     for cell in table.cells:
                         if cell.category_name in {
-                            LayoutType.cell,
-                            CellType.projected_row_header,
-                            CellType.spanning,
-                            CellType.row_header,
-                            CellType.column_header,
+                            LayoutType.CELL,
+                            CellType.PROJECTED_ROW_HEADER,
+                            CellType.SPANNING,
+                            CellType.ROW_HEADER,
+                            CellType.COLUMN_HEADER,
                         }:
                             cells_found = True
                             box_stack.append(cell.bbox)
@@ -872,7 +896,7 @@ class Page(Image):
             for table in self.tables:
                 all_words.extend(table.words)
             if not all_words:
-                all_words = self.get_annotation(category_names=LayoutType.word)
+                all_words = self.get_annotation(category_names=LayoutType.WORD)
             if not ignore_default_token_class:
                 for word in all_words:
                     box_stack.append(word.bbox)
@@ -882,7 +906,7 @@ class Page(Image):
                         category_names_list.append(word.token_tag.value if word.token_tag is not None else None)
             else:
                 for word in all_words:
-                    if word.token_class is not None and word.token_class != TokenClasses.other:
+                    if word.token_class is not None and word.token_class != TokenClasses.OTHER:
                         box_stack.append(word.bbox)
                         if show_token_class:
                             category_names_list.append(word.token_class.value if word.token_class is not None else None)
@@ -915,7 +939,7 @@ class Page(Image):
         return None
     @classmethod
-    def get_attribute_names(cls) -> Set[str]:
+    def get_attribute_names(cls) -> set[str]:
         """
         :return: A set of registered attributes.
         """
@@ -945,9 +969,9 @@ class Page(Image):
         self,
         image_to_json: bool = True,
         highest_hierarchy_only: bool = False,
-        path: Optional[Pathlike] = None,
+        path: Optional[PathLikeOrStr] = None,
         dry: bool = False,
-    ) -> Optional[JsonDict]:
+    ) -> Optional[Union[ImageDict, str]]:
         """
         Export image as dictionary. As numpy array cannot be serialized `image` values will be converted into
         base64 encodings.
@@ -967,7 +991,7 @@ class Page(Image):
         cls,
         file_path: str,
         text_container: Optional[ObjectTypes] = None,
-        floating_text_block_categories: Optional[List[ObjectTypes]] = None,
+        floating_text_block_categories: Optional[list[ObjectTypes]] = None,
         include_residual_text_container: bool = True,
     ) -> Page:
         """Reading JSON file and building a `Page` object with given config.
@@ -981,16 +1005,16 @@ class Page(Image):
         image = Image.from_file(file_path)
         return cls.from_image(image, text_container, floating_text_block_categories, include_residual_text_container)
-    def get_token(self) -> List[Mapping[str, str]]:
+    def get_token(self) -> list[Mapping[str, str]]:
         """Return a list of dicts, each holding a word and its non-default token tag"""
         block_with_order = self._order("layouts")
         all_words = []
         for block in block_with_order:
             all_words.extend(block.get_ordered_words())  # type: ignore
         return [
-            {"word": word.characters, "entity": word.token_tag}
+            {"word": word.CHARACTERS, "entity": word.TOKEN_TAG}
             for word in all_words
-            if word.token_tag not in (TokenClasses.other, None)
+            if word.TOKEN_TAG not in (TokenClasses.OTHER, None)
         ]
     def __copy__(self) -> Page:

deepdoctection 0.32__py3-none-any.whl → 0.34__py3-none-any.whl

Potentially problematic release.

deepdoctection 0.32py3-none-any.whl → 0.34py3-none-any.whl