docling-ibm-models 0.2.0__py3-none-any.whl → 1.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -118,7 +118,7 @@ class LayoutPredictor:
118
118
  }
119
119
  return info
120
120
 
121
- def predict(self, orig_img: Union[Image, np.array]) -> Iterable[dict]:
121
+ def predict(self, orig_img: Union[Image.Image, np.ndarray]) -> Iterable[dict]:
122
122
  r"""
123
123
  Predict bounding boxes for a given image.
124
124
  The origin (0, 0) is the top-left corner and the predicted bbox coords are provided as:
@@ -177,7 +177,7 @@ class TFPredictor:
177
177
  self._model_type = self._config["model"]["type"]
178
178
  # Added import here to avoid loading turbotransformer library unnecessarily
179
179
  if self._model_type == "TableModel04_rs":
180
- from docling_ibm_models.tableformer.models.table04_rs.tablemodel04_rs import ( # noqa: F401
180
+ from docling_ibm_models.tableformer.models.table04_rs.tablemodel04_rs import ( # noqa
181
181
  TableModel04_rs,
182
182
  )
183
183
  for candidate in BaseModel.__subclasses__():
@@ -437,10 +437,10 @@ class TFPredictor:
437
437
  for pdf_cell in pdf_cells:
438
438
  if pdf_cell["id"] == docling_item["cell_id"]:
439
439
  text_cell_bbox = {
440
- "b": pdf_cell["bbox"][1],
440
+ "b": pdf_cell["bbox"][3],
441
441
  "l": pdf_cell["bbox"][0],
442
442
  "r": pdf_cell["bbox"][2],
443
- "t": pdf_cell["bbox"][3],
443
+ "t": pdf_cell["bbox"][1],
444
444
  "token": pdf_cell["text"],
445
445
  }
446
446
  tf_cells_map[cell_key]["text_cell_bboxes"].append(
@@ -468,10 +468,10 @@ class TFPredictor:
468
468
  for pdf_cell in pdf_cells:
469
469
  if pdf_cell["id"] == docling_item["cell_id"]:
470
470
  text_cell_bbox = {
471
- "b": pdf_cell["bbox"][1],
471
+ "b": pdf_cell["bbox"][3],
472
472
  "l": pdf_cell["bbox"][0],
473
473
  "r": pdf_cell["bbox"][2],
474
- "t": pdf_cell["bbox"][3],
474
+ "t": pdf_cell["bbox"][1],
475
475
  "token": pdf_cell["text"],
476
476
  }
477
477
  tf_cells_map[cell_key]["text_cell_bboxes"].append(
@@ -1,12 +1,12 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: docling-ibm-models
3
- Version: 0.2.0
3
+ Version: 1.1.0
4
4
  Summary: This package contains the AI models used by the Docling PDF conversion package
5
5
  License: MIT
6
6
  Keywords: docling,convert,document,pdf,layout model,segmentation,table structure,table former
7
7
  Author: Nikos Livathinos
8
8
  Author-email: nli@zurich.ibm.com
9
- Requires-Python: >=3.11,<4.0
9
+ Requires-Python: >=3.10,<4.0
10
10
  Classifier: Development Status :: 5 - Production/Stable
11
11
  Classifier: Intended Audience :: Developers
12
12
  Classifier: Intended Audience :: Science/Research
@@ -14,6 +14,7 @@ Classifier: License :: OSI Approved :: MIT License
14
14
  Classifier: Operating System :: MacOS :: MacOS X
15
15
  Classifier: Operating System :: POSIX :: Linux
16
16
  Classifier: Programming Language :: Python :: 3
17
+ Classifier: Programming Language :: Python :: 3.10
17
18
  Classifier: Programming Language :: Python :: 3.11
18
19
  Classifier: Programming Language :: Python :: 3.12
19
20
  Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
@@ -32,7 +33,16 @@ Requires-Dist: torchvision (==0.17.2)
32
33
  Requires-Dist: tqdm (>=4.64.0,<5.0.0)
33
34
  Description-Content-Type: text/markdown
34
35
 
35
- # Docling-models
36
+ [![PyPI version](https://img.shields.io/pypi/v/docling-ibm-models)](https://pypi.org/project/docling-ibm-models/)
37
+ ![Python](https://img.shields.io/badge/python-3.10%20|%203.11%20|%203.12-blue)
38
+ [![Poetry](https://img.shields.io/endpoint?url=https://python-poetry.org/badge/v0.json)](https://python-poetry.org/)
39
+ [![Code style: black](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)
40
+ [![Imports: isort](https://img.shields.io/badge/%20imports-isort-%231674b1?style=flat&labelColor=ef8336)](https://pycqa.github.io/isort/)
41
+ [![pre-commit](https://img.shields.io/badge/pre--commit-enabled-brightgreen?logo=pre-commit&logoColor=white)](https://github.com/pre-commit/pre-commit)
42
+ [![Models on Hugging Face](https://img.shields.io/badge/%F0%9F%A4%97%20Hugging%20Face-Model-blue)](https://huggingface.co/ds4sd/docling-models/)
43
+ [![License MIT](https://img.shields.io/github/license/ds4sd/deepsearch-toolkit)](https://opensource.org/licenses/MIT)
44
+
45
+ # Docling IBM models
36
46
 
37
47
  AI modules to support the Docling PDF document conversion project.
38
48
 
@@ -41,7 +51,7 @@ AI modules to support the Docling PDF document conversion project.
41
51
 
42
52
 
43
53
  ## Installation Instructions
44
-
54
+
45
55
  ### MacOS / Linux
46
56
 
47
57
  To install `poetry` locally, use either `pip` or `homebrew`.
@@ -49,8 +59,8 @@ To install `poetry` locally, use either `pip` or `homebrew`.
49
59
  To install `poetry` on a docker container, do the following:
50
60
  ```
51
61
  ENV POETRY_NO_INTERACTION=1 \
52
- POETRY_VIRTUALENVS_CREATE=false
53
-
62
+ POETRY_VIRTUALENVS_CREATE=false
63
+
54
64
  # Install poetry
55
65
  RUN curl -sSL 'https://install.python-poetry.org' > install-poetry.py \
56
66
  && python install-poetry.py \
@@ -58,10 +68,10 @@ RUN curl -sSL 'https://install.python-poetry.org' > install-poetry.py \
58
68
  && rm install-poetry.py
59
69
  ```
60
70
 
61
- To install and run the package, simply set up a poetry environment
71
+ To install and run the package, simply set up a poetry environment
62
72
 
63
73
  ```
64
- poetry env use $(which python3.11)
74
+ poetry env use $(which python3.10)
65
75
  poetry shell
66
76
  ```
67
77
 
@@ -105,7 +115,7 @@ Example configuration can be seen inside test `tests/test_tf_predictor.py`
105
115
  These are the main sections of the configuration file:
106
116
 
107
117
  - `dataset`: The directory for prepared data and the parameters used during the data loading.
108
- - `model`: The type, name and hyperparameters of the model. Also the directory to save/load the
118
+ - `model`: The type, name and hyperparameters of the model. Also the directory to save/load the
109
119
  trained checkpoint files.
110
120
  - `train`: Parameters for the training of the model.
111
121
  - `predict`: Parameters for the evaluation of the model.
@@ -131,7 +141,7 @@ First download the model weights (see above), then run:
131
141
  ./devtools/check_code.sh
132
142
  ```
133
143
 
134
- This will also generate prediction and matching visualizations that can be found here:
144
+ This will also generate prediction and matching visualizations that can be found here:
135
145
  `tests\test_data\viz\`
136
146
 
137
147
  Visualization outlines:
@@ -1,4 +1,4 @@
1
- docling_ibm_models/layoutmodel/layout_predictor.py,sha256=SdEsqlsb9zq2sCEzgim4geuCXlcno6eEu2PmYopGzOU,5557
1
+ docling_ibm_models/layoutmodel/layout_predictor.py,sha256=y1Z51hUKju8SCvejCWWr04xbV_CmJrJ32FgA56tkgNU,5565
2
2
  docling_ibm_models/tableformer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
3
3
  docling_ibm_models/tableformer/common.py,sha256=RV2ptqgkfz1OIoN-WqiSeln0pkZ_7zTO9DhOcbvPS5k,6023
4
4
  docling_ibm_models/tableformer/data_management/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -7,7 +7,7 @@ docling_ibm_models/tableformer/data_management/functional.py,sha256=UrXsEm4DSc1Q
7
7
  docling_ibm_models/tableformer/data_management/matching_post_processor.py,sha256=HYG-wx5PQC38hTQfyXr3zUnZ6--aSs55x8g9PdsROGU,54207
8
8
  docling_ibm_models/tableformer/data_management/tf_cell_matcher.py,sha256=DFu428Cr84maT9WehdoZkpkJKeahwe5JlclvTC6fuVY,20870
9
9
  docling_ibm_models/tableformer/data_management/tf_dataset.py,sha256=6_qSsYt6qoE2JBzUNrJfCDX3Kgg7tyrv3kimGLdEQ5o,49890
10
- docling_ibm_models/tableformer/data_management/tf_predictor.py,sha256=I317-qMK13eqUvT4Ix2Q02uzkKQDCoKcf9GqIGVBy70,38508
10
+ docling_ibm_models/tableformer/data_management/tf_predictor.py,sha256=3e7ICgs3r9YclOLWuoOvqSveQHcERvZYmOBMtmslJqU,38502
11
11
  docling_ibm_models/tableformer/data_management/transforms.py,sha256=_i1HXkX8LAuHbeGRrg8kF9yFNJRQZOKmWzxKt559ABQ,13268
12
12
  docling_ibm_models/tableformer/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
13
13
  docling_ibm_models/tableformer/models/common/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -26,7 +26,7 @@ docling_ibm_models/tableformer/utils/app_profiler.py,sha256=13dvwo5byzfP2ejqGBFw
26
26
  docling_ibm_models/tableformer/utils/torch_utils.py,sha256=uN0rK9mSXy1ewBnBnILrWebJhhVU4N-XJZBqNiLJwlQ,8893
27
27
  docling_ibm_models/tableformer/utils/utils.py,sha256=8Bxf1rEn977lFbY9NX0r5xh9PvxIRipQZX_EZW92XfA,10980
28
28
  docling_ibm_models/tableformer/utils/variance.py,sha256=USjRwaMsCmzvc6PeWskaAJnUjbliRVd_MqNKLjMDQw8,4675
29
- docling_ibm_models-0.2.0.dist-info/LICENSE,sha256=ACwmltkrXIz5VsEQcrqljq-fat6ZXAMepjXGoe40KtE,1069
30
- docling_ibm_models-0.2.0.dist-info/METADATA,sha256=Sp-I-WgmqMBo4G5kvBwQsVTIjwHpWpa6i0aGevNzG3I,6003
31
- docling_ibm_models-0.2.0.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
32
- docling_ibm_models-0.2.0.dist-info/RECORD,,
29
+ docling_ibm_models-1.1.0.dist-info/LICENSE,sha256=ACwmltkrXIz5VsEQcrqljq-fat6ZXAMepjXGoe40KtE,1069
30
+ docling_ibm_models-1.1.0.dist-info/METADATA,sha256=4kkqQ-JbpWLfyyhrBD6YzzVqEep12DzKRUx-7OqsXqk,7028
31
+ docling_ibm_models-1.1.0.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
32
+ docling_ibm_models-1.1.0.dist-info/RECORD,,