deepdoctection 0.39.3__tar.gz → 0.39.5__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of deepdoctection might be problematic. Click here for more details.
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/PKG-INFO +3 -3
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/__init__.py +1 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datapoint/image.py +6 -6
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datapoint/view.py +4 -2
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/base.py +11 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/info.py +1 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/doclaynet.py +10 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/fintabnet.py +10 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/funsd.py +10 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/iiitar13k.py +10 -2
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/layouttest.py +8 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/publaynet.py +10 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/pubtables1m.py +10 -2
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/pubtabnet.py +10 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/rvlcdip.py +10 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/xfund.py +10 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/registry.py +18 -3
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/doctrocr.py +9 -7
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/cats.py +1 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection.egg-info/PKG-INFO +3 -3
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection.egg-info/requires.txt +2 -2
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/setup.py +1 -1
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/LICENSE +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/README.md +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/analyzer/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/analyzer/_config.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/analyzer/dd.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/analyzer/factory.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/configs/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/configs/conf_dd_one.yaml +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/configs/conf_tesseract.yaml +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/base.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/common.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/custom.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/custom_serialize.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/parallel_map.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/serialize.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/dataflow/stats.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datapoint/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datapoint/annotation.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datapoint/box.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datapoint/convert.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/adapter.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/dataflow_builder.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/xsl/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/xsl/pascal_voc.xsl +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/save.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/accmetric.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/base.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/cocometric.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/eval.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/registry.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/tedsmetric.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/eval/tp_eval_callback.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/base.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/d2detect.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/deskew.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/fastlang.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/hfdetr.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/hflayoutlm.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/hflm.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/model.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/pdftext.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/pt/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/pt/nms.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/pt/ptutils.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tessocr.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/texocr.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tfutils.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpcompat.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/common.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/config/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/config/config.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/backbone.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/generalized_rcnn.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/model_box.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/model_cascade.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/model_fpn.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/model_frcnn.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/model_mrcnn.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/modeling/model_rpn.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/predict.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/preproc.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/utils/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/utils/box_ops.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/utils/np_box_ops.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tpdetect.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/cocostruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/d2struct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/hfstruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/laylmstruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/maputils.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/match.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/misc.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/pascalstruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/prodigystruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/pubstruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/tpstruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/mapper/xfundstruct.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/anngen.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/base.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/common.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/concurrency.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/doctectionpipe.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/language.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/layout.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/lm.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/order.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/refine.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/registry.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/segment.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/sub_layout.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/text.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/pipe/transform.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/py.typed +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/train/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/train/d2_frcnn_train.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/train/hf_detr_train.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/train/hf_layoutlm_train.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/train/tp_frcnn_train.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/__init__.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/concurrency.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/context.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/develop.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/env_info.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/error.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/file_utils.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/fs.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/identifier.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/logger.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/metacfg.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/mocks.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/pdf_utils.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/settings.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/tqdm.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/transform.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/types.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/utils.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/utils/viz.py +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection.egg-info/SOURCES.txt +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection.egg-info/dependency_links.txt +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection.egg-info/top_level.txt +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/setup.cfg +0 -0
- {deepdoctection-0.39.3 → deepdoctection-0.39.5}/tests/test_utils.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.2
|
|
2
2
|
Name: deepdoctection
|
|
3
|
-
Version: 0.39.3
|
|
3
|
+
Version: 0.39.5
|
|
4
4
|
Summary: Repository for Document AI
|
|
5
5
|
Home-page: https://github.com/deepdoctection/deepdoctection
|
|
6
6
|
Author: Dr. Janis Meyer
|
|
@@ -57,7 +57,7 @@ Requires-Dist: tensorpack==0.11; extra == "tf"
|
|
|
57
57
|
Requires-Dist: protobuf==3.20.1; extra == "tf"
|
|
58
58
|
Requires-Dist: tensorflow-addons>=0.17.1; extra == "tf"
|
|
59
59
|
Requires-Dist: tf2onnx>=1.9.2; extra == "tf"
|
|
60
|
-
Requires-Dist: python-doctr==0.
|
|
60
|
+
Requires-Dist: python-doctr==0.9.0; extra == "tf"
|
|
61
61
|
Requires-Dist: pycocotools>=2.0.2; extra == "tf"
|
|
62
62
|
Requires-Dist: boto3==1.34.102; extra == "tf"
|
|
63
63
|
Requires-Dist: pdfplumber>=0.11.0; extra == "tf"
|
|
@@ -88,7 +88,7 @@ Requires-Dist: tqdm==4.64.0; extra == "pt"
|
|
|
88
88
|
Requires-Dist: timm>=0.9.16; extra == "pt"
|
|
89
89
|
Requires-Dist: transformers>=4.48.0; extra == "pt"
|
|
90
90
|
Requires-Dist: accelerate>=0.29.1; extra == "pt"
|
|
91
|
-
Requires-Dist: python-doctr==0.
|
|
91
|
+
Requires-Dist: python-doctr==0.9.0; extra == "pt"
|
|
92
92
|
Requires-Dist: boto3==1.34.102; extra == "pt"
|
|
93
93
|
Requires-Dist: pdfplumber>=0.11.0; extra == "pt"
|
|
94
94
|
Requires-Dist: fasttext-wheel; extra == "pt"
|
|
@@ -702,11 +702,11 @@ class Image:
|
|
|
702
702
|
return get_uuid(self.image_id, *container_ids)
|
|
703
703
|
|
|
704
704
|
def save(
|
|
705
|
-
|
|
706
|
-
|
|
707
|
-
|
|
708
|
-
|
|
709
|
-
|
|
705
|
+
self,
|
|
706
|
+
image_to_json: bool = True,
|
|
707
|
+
highest_hierarchy_only: bool = False,
|
|
708
|
+
path: Optional[PathLikeOrStr] = None,
|
|
709
|
+
dry: bool = False,
|
|
710
710
|
) -> Optional[Union[ImageDict, str]]:
|
|
711
711
|
"""
|
|
712
712
|
Export image as dictionary. As numpy array cannot be serialized `image` values will be converted into
|
|
@@ -723,7 +723,7 @@ class Image:
|
|
|
723
723
|
def set_image_keys_to_none(d): # type: ignore
|
|
724
724
|
if isinstance(d, dict):
|
|
725
725
|
for key, value in d.items():
|
|
726
|
-
if key ==
|
|
726
|
+
if key == "_image":
|
|
727
727
|
d[key] = None
|
|
728
728
|
else:
|
|
729
729
|
set_image_keys_to_none(value)
|
|
@@ -430,8 +430,10 @@ class Table(Layout):
|
|
|
430
430
|
category_names=[LayoutType.CELL, CellType.SPANNING], annotation_ids=all_relation_ids
|
|
431
431
|
)
|
|
432
432
|
column_cells = list(
|
|
433
|
-
filter(
|
|
434
|
-
|
|
433
|
+
filter(
|
|
434
|
+
lambda c: column_number in (c.column_number, c.column_number + c.column_span - 1), # type: ignore
|
|
435
|
+
all_cells,
|
|
436
|
+
) # type: ignore
|
|
435
437
|
)
|
|
436
438
|
column_cells.sort(key=lambda c: c.row_number) # type: ignore
|
|
437
439
|
return column_cells # type: ignore
|
|
@@ -394,6 +394,7 @@ class CustomDataset(DatasetBase):
|
|
|
394
394
|
dataflow_builder: Type[DataFlowBaseBuilder],
|
|
395
395
|
init_sub_categories: Optional[Mapping[ObjectTypes, Mapping[ObjectTypes, Sequence[ObjectTypes]]]] = None,
|
|
396
396
|
annotation_files: Optional[Mapping[str, Union[str, Sequence[str]]]] = None,
|
|
397
|
+
description: Optional[str] = None,
|
|
397
398
|
):
|
|
398
399
|
"""
|
|
399
400
|
:param name: Name of the dataset. It will not be used in the code, however it might be helpful, if several
|
|
@@ -422,6 +423,7 @@ class CustomDataset(DatasetBase):
|
|
|
422
423
|
:param annotation_files: A mapping to one or more annotation files, e.g.
|
|
423
424
|
|
|
424
425
|
annotation_file = {"train": "train_file.json", "test": "test_file.json"}
|
|
426
|
+
:param description: A description of the dataset.
|
|
425
427
|
"""
|
|
426
428
|
|
|
427
429
|
self.name = name
|
|
@@ -439,10 +441,18 @@ class CustomDataset(DatasetBase):
|
|
|
439
441
|
"annotation_files: Optional[Mapping[str, Union[str, Sequence[str]]]] = None):`"
|
|
440
442
|
)
|
|
441
443
|
self.dataflow_builder = dataflow_builder(self.location, self.annotation_files)
|
|
444
|
+
self.description = description
|
|
442
445
|
super().__init__()
|
|
443
446
|
|
|
444
447
|
def _info(self) -> DatasetInfo: # type: ignore # pylint: disable=W0221
|
|
445
|
-
return DatasetInfo(
|
|
448
|
+
return DatasetInfo(
|
|
449
|
+
name=self.name,
|
|
450
|
+
type=self.type,
|
|
451
|
+
description=self.description if self.description is not None else "",
|
|
452
|
+
license="",
|
|
453
|
+
url="",
|
|
454
|
+
splits={},
|
|
455
|
+
)
|
|
446
456
|
|
|
447
457
|
def _categories(self) -> DatasetCategories:
|
|
448
458
|
return DatasetCategories(init_categories=self.init_categories, init_sub_categories=self.init_sub_categories)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/doclaynet.py
RENAMED
|
@@ -45,6 +45,7 @@ from ..info import DatasetCategories, DatasetInfo
|
|
|
45
45
|
from ..registry import dataset_registry
|
|
46
46
|
|
|
47
47
|
_NAME = "doclaynet"
|
|
48
|
+
_SHORT_DESCRIPTION = "DocLayNet is a human-annotated document layout segmentation dataset containing 80863 pages."
|
|
48
49
|
_DESCRIPTION = (
|
|
49
50
|
"DocLayNet is a human-annotated document layout segmentation dataset containing 80863 pages from a broad "
|
|
50
51
|
"variety of document sources. \n"
|
|
@@ -105,7 +106,15 @@ class DocLayNet(DatasetBase):
|
|
|
105
106
|
|
|
106
107
|
@classmethod
|
|
107
108
|
def _info(cls) -> DatasetInfo:
|
|
108
|
-
return DatasetInfo(
|
|
109
|
+
return DatasetInfo(
|
|
110
|
+
name=_NAME,
|
|
111
|
+
short_description=_SHORT_DESCRIPTION,
|
|
112
|
+
description=_DESCRIPTION,
|
|
113
|
+
license=_LICENSE,
|
|
114
|
+
splits=_SPLITS,
|
|
115
|
+
type=_TYPE,
|
|
116
|
+
url=_URL,
|
|
117
|
+
)
|
|
109
118
|
|
|
110
119
|
def _categories(self) -> DatasetCategories:
|
|
111
120
|
return DatasetCategories(init_categories=_INIT_CATEGORIES, init_sub_categories=_SUB_CATEGORIES)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/fintabnet.py
RENAMED
|
@@ -54,6 +54,7 @@ from ..info import DatasetCategories, DatasetInfo
|
|
|
54
54
|
from ..registry import dataset_registry
|
|
55
55
|
|
|
56
56
|
_NAME = "fintabnet"
|
|
57
|
+
_SHORT_DESCRIPTION = "FinTabNet dataset contains complex tables from the annual reports of S&P 500 companies."
|
|
57
58
|
_DESCRIPTION = (
|
|
58
59
|
"FinTabNet dataset contains complex tables from the annual reports of S&P 500 companies with detailed \n"
|
|
59
60
|
" table structure annotations to help train and test structure recognition. \n"
|
|
@@ -129,7 +130,15 @@ class Fintabnet(_BuiltInDataset):
|
|
|
129
130
|
|
|
130
131
|
@classmethod
|
|
131
132
|
def _info(cls) -> DatasetInfo:
|
|
132
|
-
return DatasetInfo(
|
|
133
|
+
return DatasetInfo(
|
|
134
|
+
name=_NAME,
|
|
135
|
+
short_description=_SHORT_DESCRIPTION,
|
|
136
|
+
description=_DESCRIPTION,
|
|
137
|
+
license=_LICENSE,
|
|
138
|
+
url=_URL,
|
|
139
|
+
splits=_SPLITS,
|
|
140
|
+
type=_TYPE,
|
|
141
|
+
)
|
|
133
142
|
|
|
134
143
|
def _categories(self) -> DatasetCategories:
|
|
135
144
|
return DatasetCategories(init_categories=_INIT_CATEGORIES, init_sub_categories=_SUB_CATEGORIES)
|
|
@@ -66,6 +66,7 @@ def load_file(path_ann: PathLikeOrStr) -> FunsdDict:
|
|
|
66
66
|
|
|
67
67
|
|
|
68
68
|
_NAME = "funsd"
|
|
69
|
+
_SHORT_DESCRIPTION = "FUNSD: Form Understanding in Noisy Scanned Documents."
|
|
69
70
|
_DESCRIPTION = (
|
|
70
71
|
"FUNSD: Form Understanding in Noisy Scanned Documents. A dataset for Text Detection, Optical Character \n"
|
|
71
72
|
" Recognition, Spatial Layout Analysis and Form Understanding."
|
|
@@ -116,7 +117,15 @@ class Funsd(_BuiltInDataset):
|
|
|
116
117
|
|
|
117
118
|
@classmethod
|
|
118
119
|
def _info(cls) -> DatasetInfo:
|
|
119
|
-
return DatasetInfo(
|
|
120
|
+
return DatasetInfo(
|
|
121
|
+
name=_NAME,
|
|
122
|
+
short_description=_SHORT_DESCRIPTION,
|
|
123
|
+
description=_DESCRIPTION,
|
|
124
|
+
license=_LICENSE,
|
|
125
|
+
url=_URL,
|
|
126
|
+
splits=_SPLITS,
|
|
127
|
+
type=_TYPE,
|
|
128
|
+
)
|
|
120
129
|
|
|
121
130
|
def _categories(self) -> DatasetCategories:
|
|
122
131
|
return DatasetCategories(init_categories=_INIT_CATEGORIES, init_sub_categories=_SUB_CATEGORIES)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/iiitar13k.py
RENAMED
|
@@ -60,7 +60,7 @@ with try_import() as import_guard:
|
|
|
60
60
|
from lxml import etree
|
|
61
61
|
|
|
62
62
|
_NAME = "iiitar13k"
|
|
63
|
-
|
|
63
|
+
_SHORT_DESCRIPTION = "IIIT-AR-13K: A New Dataset for Graphical Object Detection in Documents"
|
|
64
64
|
_DESCRIPTION = (
|
|
65
65
|
"[excerpt from Ajoy Mondal et. all. IIIT-AR-13K: A New Dataset for Graphical Object Detection in \n"
|
|
66
66
|
"Documents] ...This dataset, IIIT-AR-13K, is created by manually annotating the bounding boxes of \n"
|
|
@@ -97,7 +97,15 @@ class IIITar13K(_BuiltInDataset):
|
|
|
97
97
|
|
|
98
98
|
@classmethod
|
|
99
99
|
def _info(cls) -> DatasetInfo:
|
|
100
|
-
return DatasetInfo(
|
|
100
|
+
return DatasetInfo(
|
|
101
|
+
name=_NAME,
|
|
102
|
+
short_description=_SHORT_DESCRIPTION,
|
|
103
|
+
description=_DESCRIPTION,
|
|
104
|
+
license=_LICENSE,
|
|
105
|
+
url=_URL,
|
|
106
|
+
splits=_SPLITS,
|
|
107
|
+
type=_TYPE,
|
|
108
|
+
)
|
|
101
109
|
|
|
102
110
|
def _categories(self) -> DatasetCategories:
|
|
103
111
|
return DatasetCategories(init_categories=_INIT_CATEGORIES)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/layouttest.py
RENAMED
|
@@ -73,7 +73,14 @@ class LayoutTest(_BuiltInDataset):
|
|
|
73
73
|
|
|
74
74
|
@classmethod
|
|
75
75
|
def _info(cls) -> DatasetInfo:
|
|
76
|
-
return DatasetInfo(
|
|
76
|
+
return DatasetInfo(
|
|
77
|
+
name=_NAME,
|
|
78
|
+
short_description=_DESCRIPTION,
|
|
79
|
+
description=_DESCRIPTION,
|
|
80
|
+
license=_LICENSE,
|
|
81
|
+
splits=_SPLITS,
|
|
82
|
+
type=_TYPE,
|
|
83
|
+
)
|
|
77
84
|
|
|
78
85
|
def _categories(self) -> DatasetCategories:
|
|
79
86
|
return DatasetCategories(init_categories=_INIT_CATEGORIES)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/publaynet.py
RENAMED
|
@@ -43,6 +43,7 @@ from ..info import DatasetCategories, DatasetInfo
|
|
|
43
43
|
from ..registry import dataset_registry
|
|
44
44
|
|
|
45
45
|
_NAME = "publaynet"
|
|
46
|
+
_SHORT_DESCRIPTION = "PubLayNet is a dataset for document layout analysis."
|
|
46
47
|
_DESCRIPTION = (
|
|
47
48
|
"PubLayNet is a dataset for document layout analysis. It contains images of research papers and "
|
|
48
49
|
"articles \n"
|
|
@@ -79,7 +80,15 @@ class Publaynet(_BuiltInDataset):
|
|
|
79
80
|
|
|
80
81
|
@classmethod
|
|
81
82
|
def _info(cls) -> DatasetInfo:
|
|
82
|
-
return DatasetInfo(
|
|
83
|
+
return DatasetInfo(
|
|
84
|
+
name=_NAME,
|
|
85
|
+
short_description=_SHORT_DESCRIPTION,
|
|
86
|
+
description=_DESCRIPTION,
|
|
87
|
+
license=_LICENSE,
|
|
88
|
+
url=_URL,
|
|
89
|
+
splits=_SPLITS,
|
|
90
|
+
type=_TYPE,
|
|
91
|
+
)
|
|
83
92
|
|
|
84
93
|
def _categories(self) -> DatasetCategories:
|
|
85
94
|
return DatasetCategories(init_categories=_INIT_CATEGORIES)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/pubtables1m.py
RENAMED
|
@@ -63,7 +63,7 @@ with try_import() as import_guard:
|
|
|
63
63
|
from lxml import etree
|
|
64
64
|
|
|
65
65
|
_NAME = "pubtables1m_det"
|
|
66
|
-
|
|
66
|
+
_SHORT_DESCRIPTION = "PubTables1M is a dataset for table detection and structure recognition."
|
|
67
67
|
_DESCRIPTION = (
|
|
68
68
|
"[excerpt from Brandon Smock et. all. PubTables-1M: Towards Comprehensive Table Extraction From Unstructured \n"
|
|
69
69
|
"Documents] '...we release PubTables1M, a dataset of nearly one million tables from PubMed Central Open Access \n"
|
|
@@ -100,7 +100,15 @@ class Pubtables1MDet(_BuiltInDataset):
|
|
|
100
100
|
|
|
101
101
|
@classmethod
|
|
102
102
|
def _info(cls) -> DatasetInfo:
|
|
103
|
-
return DatasetInfo(
|
|
103
|
+
return DatasetInfo(
|
|
104
|
+
name=_NAME,
|
|
105
|
+
short_description=_SHORT_DESCRIPTION,
|
|
106
|
+
description=_DESCRIPTION,
|
|
107
|
+
license=_LICENSE,
|
|
108
|
+
url=_URL,
|
|
109
|
+
splits=_SPLITS,
|
|
110
|
+
type=_TYPE,
|
|
111
|
+
)
|
|
104
112
|
|
|
105
113
|
def _categories(self) -> DatasetCategories:
|
|
106
114
|
return DatasetCategories(init_categories=_INIT_CATEGORIES_DET)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/pubtabnet.py
RENAMED
|
@@ -45,6 +45,7 @@ from ..info import DatasetCategories
|
|
|
45
45
|
from ..registry import dataset_registry
|
|
46
46
|
|
|
47
47
|
_NAME = "pubtabnet"
|
|
48
|
+
_SHORT_DESCRIPTION = "PubTabNet is a dataset for image-based table recognition."
|
|
48
49
|
_DESCRIPTION = (
|
|
49
50
|
"PubTabNet is a large dataset for image-based table recognition, containing 568k+ images of \n"
|
|
50
51
|
"tabular data annotated with the corresponding HTML representation of the tables. The table images \n"
|
|
@@ -115,7 +116,15 @@ class Pubtabnet(_BuiltInDataset):
|
|
|
115
116
|
|
|
116
117
|
@classmethod
|
|
117
118
|
def _info(cls) -> DatasetInfo:
|
|
118
|
-
return DatasetInfo(
|
|
119
|
+
return DatasetInfo(
|
|
120
|
+
name=_NAME,
|
|
121
|
+
short_description=_SHORT_DESCRIPTION,
|
|
122
|
+
description=_DESCRIPTION,
|
|
123
|
+
license=_LICENSE,
|
|
124
|
+
url=_URL,
|
|
125
|
+
splits=_SPLITS,
|
|
126
|
+
type=_TYPE,
|
|
127
|
+
)
|
|
119
128
|
|
|
120
129
|
def _categories(self) -> DatasetCategories:
|
|
121
130
|
return DatasetCategories(init_categories=_INIT_CATEGORIES, init_sub_categories=_SUB_CATEGORIES)
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/rvlcdip.py
RENAMED
|
@@ -48,6 +48,7 @@ from ..info import DatasetCategories, DatasetInfo
|
|
|
48
48
|
from ..registry import dataset_registry
|
|
49
49
|
|
|
50
50
|
_NAME = "rvl-cdip"
|
|
51
|
+
_SHORT_DESCRIPTION = "RVL-CDIP is a dataset for document classification."
|
|
51
52
|
_DESCRIPTION = (
|
|
52
53
|
"The RVL-CDIP (Ryerson Vision Lab Complex Document Information Processing) dataset consists of 400, 000 gray- \n"
|
|
53
54
|
"scale images in 16 classes, with 25, 000 images per class . There are 320, 000 training images, 40, 000 \n"
|
|
@@ -98,7 +99,15 @@ class Rvlcdip(_BuiltInDataset):
|
|
|
98
99
|
|
|
99
100
|
@classmethod
|
|
100
101
|
def _info(cls) -> DatasetInfo:
|
|
101
|
-
return DatasetInfo(
|
|
102
|
+
return DatasetInfo(
|
|
103
|
+
name=_NAME,
|
|
104
|
+
short_description=_SHORT_DESCRIPTION,
|
|
105
|
+
description=_DESCRIPTION,
|
|
106
|
+
license=_LICENSE,
|
|
107
|
+
url=_URL,
|
|
108
|
+
splits=_SPLITS,
|
|
109
|
+
type=_TYPE,
|
|
110
|
+
)
|
|
102
111
|
|
|
103
112
|
def _categories(self) -> DatasetCategories:
|
|
104
113
|
return DatasetCategories(init_categories=_INIT_CATEGORIES)
|
|
@@ -45,6 +45,7 @@ from ..info import DatasetCategories
|
|
|
45
45
|
from ..registry import dataset_registry
|
|
46
46
|
|
|
47
47
|
_NAME = "xfund"
|
|
48
|
+
_SHORT_DESCRIPTION = "XFUND is a multilingual form understanding benchmark dataset."
|
|
48
49
|
_DESCRIPTION = (
|
|
49
50
|
"XFUND is a multilingual form understanding benchmark dataset that includes human-labeled forms with \n"
|
|
50
51
|
"key-value pairs in 7 languages (Chinese, Japanese, Spanish, French, Italian, German, Portuguese)."
|
|
@@ -103,7 +104,15 @@ class Xfund(_BuiltInDataset):
|
|
|
103
104
|
|
|
104
105
|
@classmethod
|
|
105
106
|
def _info(cls) -> DatasetInfo:
|
|
106
|
-
return DatasetInfo(
|
|
107
|
+
return DatasetInfo(
|
|
108
|
+
name=_NAME,
|
|
109
|
+
short_description=_SHORT_DESCRIPTION,
|
|
110
|
+
description=_DESCRIPTION,
|
|
111
|
+
license=_LICENSE,
|
|
112
|
+
url=_URL,
|
|
113
|
+
splits=_SPLITS,
|
|
114
|
+
type=_TYPE,
|
|
115
|
+
)
|
|
107
116
|
|
|
108
117
|
def _categories(self) -> DatasetCategories:
|
|
109
118
|
return DatasetCategories(init_categories=_INIT_CATEGORIES, init_sub_categories=_SUB_CATEGORIES)
|
|
@@ -65,18 +65,33 @@ def print_dataset_infos(add_license: bool = True, add_info: bool = True) -> None
|
|
|
65
65
|
data = dataset_registry.get_all()
|
|
66
66
|
num_columns = min(6, len(data))
|
|
67
67
|
infos = []
|
|
68
|
+
|
|
68
69
|
for dataset in data.items():
|
|
69
70
|
info = [dataset[0]]
|
|
71
|
+
ds = dataset[1]()
|
|
72
|
+
info.append(ds.dataset_info.type)
|
|
70
73
|
if add_license:
|
|
71
|
-
info.append(
|
|
74
|
+
info.append(ds.dataset_info.license) # pylint: disable=W0212
|
|
72
75
|
if add_info:
|
|
73
|
-
info.append(
|
|
76
|
+
info.append(ds.dataset_info.short_description) # pylint: disable=W0212
|
|
77
|
+
if ds.dataflow.categories is not None: # pylint: disable=W0212
|
|
78
|
+
categories = "\n".join(ds.dataflow.categories.init_categories) # Format categories as multi-line string
|
|
79
|
+
sub_categories = "\n".join(
|
|
80
|
+
f"{key}: {', '.join(values)}" for key, values in ds.dataflow.categories.init_sub_categories.items()
|
|
81
|
+
) # Format sub-categories as multi-line string
|
|
82
|
+
info.append(categories)
|
|
83
|
+
info.append(sub_categories)
|
|
84
|
+
else:
|
|
85
|
+
info.append("")
|
|
86
|
+
info.append("")
|
|
74
87
|
infos.append(info)
|
|
75
|
-
|
|
88
|
+
|
|
89
|
+
header = ["dataset", "type"]
|
|
76
90
|
if add_license:
|
|
77
91
|
header.append("license")
|
|
78
92
|
if add_info:
|
|
79
93
|
header.append("description")
|
|
94
|
+
header.append("categories")
|
|
80
95
|
table = tabulate(
|
|
81
96
|
infos, headers=header * (num_columns // 2), tablefmt="fancy_grid", stralign="left", numalign="left"
|
|
82
97
|
)
|
|
@@ -79,8 +79,8 @@ def _load_model(
|
|
|
79
79
|
state_dict = torch.load(os.fspath(path_weights), map_location=device)
|
|
80
80
|
for key in list(state_dict.keys()):
|
|
81
81
|
state_dict["model." + key] = state_dict.pop(key)
|
|
82
|
-
doctr_predictor.load_state_dict(state_dict)
|
|
83
|
-
doctr_predictor.to(device)
|
|
82
|
+
doctr_predictor.load_state_dict(state_dict) # type: ignore
|
|
83
|
+
doctr_predictor.to(device) # type: ignore
|
|
84
84
|
elif lib == "TF":
|
|
85
85
|
# Unzip the archive
|
|
86
86
|
params_path = Path(path_weights).parent
|
|
@@ -88,9 +88,9 @@ def _load_model(
|
|
|
88
88
|
if is_zip_path:
|
|
89
89
|
with ZipFile(path_weights, "r") as file:
|
|
90
90
|
file.extractall(path=params_path)
|
|
91
|
-
doctr_predictor.model.load_weights(params_path / "weights")
|
|
91
|
+
doctr_predictor.model.load_weights(params_path / "weights") # type: ignore
|
|
92
92
|
else:
|
|
93
|
-
doctr_predictor.model.load_weights(os.fspath(path_weights))
|
|
93
|
+
doctr_predictor.model.load_weights(os.fspath(path_weights)) # type: ignore
|
|
94
94
|
|
|
95
95
|
|
|
96
96
|
def auto_select_lib_for_doctr() -> Literal["PT", "TF"]:
|
|
@@ -125,7 +125,7 @@ def doctr_predict_text_lines(
|
|
|
125
125
|
DetectionResult(
|
|
126
126
|
box=box[:4].tolist(), class_id=1, score=box[4], absolute_coords=False, class_name=LayoutType.WORD
|
|
127
127
|
)
|
|
128
|
-
for box in raw_output[0]["words"]
|
|
128
|
+
for box in raw_output[0]["words"] # type: ignore
|
|
129
129
|
]
|
|
130
130
|
return detection_results
|
|
131
131
|
|
|
@@ -480,7 +480,7 @@ class DoctrTextRecognizer(TextRecognizer):
|
|
|
480
480
|
return auto_select_lib_for_doctr()
|
|
481
481
|
|
|
482
482
|
def clear_model(self) -> None:
|
|
483
|
-
self.doctr_predictor = None
|
|
483
|
+
self.doctr_predictor = None # type: ignore
|
|
484
484
|
|
|
485
485
|
|
|
486
486
|
class DocTrRotationTransformer(ImageTransformer):
|
|
@@ -527,7 +527,9 @@ class DocTrRotationTransformer(ImageTransformer):
|
|
|
527
527
|
return viz_handler.rotate_image(np_img, specification.angle) # type: ignore
|
|
528
528
|
|
|
529
529
|
def predict(self, np_img: PixelValues) -> DetectionResult:
|
|
530
|
-
angle = estimate_orientation(
|
|
530
|
+
angle = estimate_orientation(
|
|
531
|
+
np_img, n_ct=self.number_contours, ratio_threshold_for_lines=self.ratio_threshold_for_lines
|
|
532
|
+
)
|
|
531
533
|
if angle < 0:
|
|
532
534
|
angle += 360
|
|
533
535
|
return DetectionResult(angle=round(angle, 2))
|
|
@@ -55,7 +55,7 @@ def cat_to_sub_cat(
|
|
|
55
55
|
sub_cat = ann.get_sub_category(sub_cat_type)
|
|
56
56
|
if sub_cat:
|
|
57
57
|
ann.category_name = sub_cat.category_name
|
|
58
|
-
ann.category_id = categories_dict_names_as_key.get(ann.category_name,DEFAULT_CATEGORY_ID)
|
|
58
|
+
ann.category_id = categories_dict_names_as_key.get(ann.category_name, DEFAULT_CATEGORY_ID)
|
|
59
59
|
|
|
60
60
|
return dp
|
|
61
61
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.2
|
|
2
2
|
Name: deepdoctection
|
|
3
|
-
Version: 0.39.3
|
|
3
|
+
Version: 0.39.5
|
|
4
4
|
Summary: Repository for Document AI
|
|
5
5
|
Home-page: https://github.com/deepdoctection/deepdoctection
|
|
6
6
|
Author: Dr. Janis Meyer
|
|
@@ -57,7 +57,7 @@ Requires-Dist: tensorpack==0.11; extra == "tf"
|
|
|
57
57
|
Requires-Dist: protobuf==3.20.1; extra == "tf"
|
|
58
58
|
Requires-Dist: tensorflow-addons>=0.17.1; extra == "tf"
|
|
59
59
|
Requires-Dist: tf2onnx>=1.9.2; extra == "tf"
|
|
60
|
-
Requires-Dist: python-doctr==0.
|
|
60
|
+
Requires-Dist: python-doctr==0.9.0; extra == "tf"
|
|
61
61
|
Requires-Dist: pycocotools>=2.0.2; extra == "tf"
|
|
62
62
|
Requires-Dist: boto3==1.34.102; extra == "tf"
|
|
63
63
|
Requires-Dist: pdfplumber>=0.11.0; extra == "tf"
|
|
@@ -88,7 +88,7 @@ Requires-Dist: tqdm==4.64.0; extra == "pt"
|
|
|
88
88
|
Requires-Dist: timm>=0.9.16; extra == "pt"
|
|
89
89
|
Requires-Dist: transformers>=4.48.0; extra == "pt"
|
|
90
90
|
Requires-Dist: accelerate>=0.29.1; extra == "pt"
|
|
91
|
-
Requires-Dist: python-doctr==0.
|
|
91
|
+
Requires-Dist: python-doctr==0.9.0; extra == "pt"
|
|
92
92
|
Requires-Dist: boto3==1.34.102; extra == "pt"
|
|
93
93
|
Requires-Dist: pdfplumber>=0.11.0; extra == "pt"
|
|
94
94
|
Requires-Dist: fasttext-wheel; extra == "pt"
|
|
@@ -69,7 +69,7 @@ tqdm==4.64.0
|
|
|
69
69
|
timm>=0.9.16
|
|
70
70
|
transformers>=4.48.0
|
|
71
71
|
accelerate>=0.29.1
|
|
72
|
-
python-doctr==0.
|
|
72
|
+
python-doctr==0.9.0
|
|
73
73
|
boto3==1.34.102
|
|
74
74
|
pdfplumber>=0.11.0
|
|
75
75
|
fasttext-wheel
|
|
@@ -105,7 +105,7 @@ tensorpack==0.11
|
|
|
105
105
|
protobuf==3.20.1
|
|
106
106
|
tensorflow-addons>=0.17.1
|
|
107
107
|
tf2onnx>=1.9.2
|
|
108
|
-
python-doctr==0.
|
|
108
|
+
python-doctr==0.9.0
|
|
109
109
|
pycocotools>=2.0.2
|
|
110
110
|
boto3==1.34.102
|
|
111
111
|
pdfplumber>=0.11.0
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/__init__.py
RENAMED
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/xsl/__init__.py
RENAMED
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/datasets/instances/xsl/pascal_voc.xsl
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/config/__init__.py
RENAMED
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/config/config.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/utils/__init__.py
RENAMED
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/utils/box_ops.py
RENAMED
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection/extern/tp/tpfrcnn/utils/np_box_ops.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{deepdoctection-0.39.3 → deepdoctection-0.39.5}/deepdoctection.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|