deepdoctection 0.43.4__py3-none-any.whl → 0.43.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of deepdoctection might be problematic. Click here for more details.

@@ -25,7 +25,7 @@ from .utils.logger import LoggingRecord, logger
25
25
 
26
26
  # pylint: enable=wrong-import-position
27
27
 
28
- __version__ = "0.43.4"
28
+ __version__ = "0.43.5"
29
29
 
30
30
  _IMPORT_STRUCTURE = {
31
31
  "analyzer": ["config_sanity_checks", "get_dd_analyzer", "ServiceFactory"],
@@ -484,7 +484,7 @@ class CustomDataset(DatasetBase):
484
484
  return DatasetInfo(
485
485
  name=self.name,
486
486
  type=self.type,
487
- description=self.description if self.description is not None else "",
487
+ short_description=self.description if self.description is not None else "",
488
488
  license="",
489
489
  url="",
490
490
  splits={},
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: deepdoctection
3
- Version: 0.43.4
3
+ Version: 0.43.5
4
4
  Summary: Repository for Document AI
5
5
  Home-page: https://github.com/deepdoctection/deepdoctection
6
6
  Author: Dr. Janis Meyer
@@ -168,13 +168,9 @@ Version `v.0.43` includes a significant redesign of the Analyzer's default confi
168
168
  </p>
169
169
 
170
170
 
171
-
172
171
  **deep**doctection is a Python library that orchestrates Scan and PDF document layout analysis and extraction for RAG.
173
172
  It also provides a framework for training, evaluating and inferencing Document AI models.
174
173
 
175
- Check the demo of a document layout analysis pipeline with OCR on 🤗
176
- [**Hugging Face spaces**](https://huggingface.co/spaces/deepdoctection/deepdoctection).
177
-
178
174
  # Overview
179
175
 
180
176
  - Document layout analysis and table recognition in PyTorch with
@@ -197,6 +193,54 @@ for an easy start.
197
193
 
198
194
  Check the [**release notes**](https://github.com/deepdoctection/deepdoctection/releases) for recent updates.
199
195
 
196
+
197
+ ----------------------------------------------------------------------------------------
198
+
199
+ # Hugging Face Space Demo
200
+
201
+ Check the demo of a document layout analysis pipeline with OCR on 🤗
202
+ [**Hugging Face spaces**](https://huggingface.co/spaces/deepdoctection/deepdoctection) or use the gradio client.
203
+
204
+ ```
205
+ pip install gradio_client # requires Python >= 3.10
206
+ ```
207
+
208
+ To process a single image:
209
+
210
+ ```python
211
+ from gradio_client import Client, handle_file
212
+
213
+ if __name__ == "__main__":
214
+
215
+ client = Client("deepdoctection/deepdoctection")
216
+ result = client.predict(
217
+ img=handle_file('/local_path/to/dir/file_name.jpeg'), # accepts image files, e.g. JPEG, PNG
218
+ pdf=None,
219
+ max_datapoints = 2,
220
+ api_name = "/analyze_image"
221
+ )
222
+ print(result)
223
+ ```
224
+
225
+ To process a PDF document:
226
+
227
+ ```python
228
+ from gradio_client import Client, handle_file
229
+
230
+ if __name__ == "__main__":
231
+
232
+ client = Client("deepdoctection/deepdoctection")
233
+ result = client.predict(
234
+ img=None,
235
+ pdf=handle_file("/local_path/to/dir/your_doc.pdf"),
236
+ max_datapoints = 2, # increase to process up to 9 pages
237
+ api_name = "/analyze_image"
238
+ )
239
+ print(result)
240
+ ```
241
+
242
+ --------------------------------------------------------------------------------------------------------
243
+
200
244
  # Example
201
245
 
202
246
  ```python
@@ -242,8 +286,9 @@ alt="text" width="40%">
242
286
  </p>
243
287
 
244
288
 
289
+ -----------------------------------------------------------------------------------------
245
290
 
246
- ## Requirements
291
+ # Requirements
247
292
 
248
293
  ![requirements](https://github.com/deepdoctection/deepdoctection/raw/master/docs/tutorials/_imgs/install_01.png)
249
294
 
@@ -262,11 +307,13 @@ alt="text" width="40%">
262
307
  | DocTr | ✅ | ❌ | ✅ |
263
308
  | LayoutLM (v1, v2, v3, XLM) via Transformers | ✅ | ❌ | ❌ |
264
309
 
265
- ## Installation
310
+ ------------------------------------------------------------------------------------------
311
+
312
+ # Installation
266
313
 
267
314
  We recommend using a virtual environment.
268
315
 
269
- #### Get started installation
316
+ ## Get started installation
270
317
 
271
318
  For a simple setup which is enough to parse documents with the default setting, install the following:
272
319
 
@@ -288,7 +335,7 @@ pip install deepdoctection
288
335
 
289
336
  Both setups are sufficient to run the [**introduction notebook**](https://github.com/deepdoctection/notebooks/blob/main/Get_Started.ipynb).
290
337
 
291
- #### Full installation
338
+ ### Full installation
292
339
 
293
340
  The following installation will give you ALL models available within the Deep Learning framework as well as all models
294
341
  that are independent of Tensorflow/PyTorch.
@@ -318,7 +365,7 @@ pip install deepdoctection[tf]
318
365
  For further information, please consult the [**full installation instructions**](https://deepdoctection.readthedocs.io/en/latest/install/).
319
366
 
320
367
 
321
- ### Installation from source
368
+ ## Installation from source
322
369
 
323
370
  Download the repository or clone via
324
371
 
@@ -341,8 +388,7 @@ pip install ".[tf]" # or "pip install -e .[tf]"
341
388
  ```
342
389
 
343
390
 
344
-
345
- ### Running a Docker container from Docker hub
391
+ ## Running a Docker container from Docker hub
346
392
 
347
393
  Pre-existing Docker images can be downloaded from the [Docker hub](https://hub.docker.com/r/deepdoctection/deepdoctection).
348
394
 
@@ -360,16 +406,18 @@ docker compose up -d
360
406
 
361
407
  will start the container. There is no endpoint exposed, though.
362
408
 
363
- ## Credits
409
+ -----------------------------------------------------------------------------------------------
410
+
411
+ # Credits
364
412
 
365
413
  We thank all libraries that provide high-quality code and pre-trained models. Without them, it would have been impossible
366
414
  to develop this framework.
367
415
 
368
416
 
369
- ## If you like **deep**doctection ...
417
+ # If you like **deep**doctection ...
370
418
 
371
419
  ...you can easily support the project by making it more visible. Leaving a star or a recommendation will help.
372
420
 
373
- ## License
421
+ # License
374
422
 
375
423
  Distributed under the Apache 2.0 License. Check [LICENSE](https://github.com/deepdoctection/deepdoctection/blob/master/LICENSE) for additional information.
@@ -1,4 +1,4 @@
1
- deepdoctection/__init__.py,sha256=UftLKUS4Z03F_LCcON51Gx0XEKfCLp7VAw9MKysFLxQ,12964
1
+ deepdoctection/__init__.py,sha256=ackdlzoLcoHJAmWtxrkE2PnYgG-3q9bL2c1d3kqFgTY,12964
2
2
  deepdoctection/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
3
3
  deepdoctection/analyzer/__init__.py,sha256=wg0BcFwdCeREwzZfa--Yx8HUJ9LPv5z5PmLwtkZdPH8,772
4
4
  deepdoctection/analyzer/config.py,sha256=DToaXs59w7SpEi2vkeBEyrBwyyGiXUST_N99wL9nHoI,41762
@@ -24,7 +24,7 @@ deepdoctection/datapoint/image.py,sha256=kqwCz8DSc19hQpkl_4L1_Ek7_2KrH5KsV9e0S-R
24
24
  deepdoctection/datapoint/view.py,sha256=YtoqafStrHqbfyD628-W1HOA2Gb0kUI2oaEiteBHjbA,57902
25
25
  deepdoctection/datasets/__init__.py,sha256=4ifjIwWCPYiS31GzUlVDScrkNOrb1eo5xHlRXNyg_58,994
26
26
  deepdoctection/datasets/adapter.py,sha256=VSLM_980aHi4TpgOxfxiBHiF_fUXyh348PXet6zTo-4,7779
27
- deepdoctection/datasets/base.py,sha256=HTIquJir2BZRTLl1HSQM0ICfvjIaWAjJeyz3BEHgdb0,23175
27
+ deepdoctection/datasets/base.py,sha256=Qfh52aVtBd2df2ZY0hjLz4D1jrExnPuu_8uYpolVNks,23181
28
28
  deepdoctection/datasets/dataflow_builder.py,sha256=0vwkItr0wVbKPtTXoS6uJLO9QQNWbS0Ri7CySuywWxU,4186
29
29
  deepdoctection/datasets/info.py,sha256=DLRYq3cHp3L34CcSXPUJ8j8wguJp2aVdoH-AhODNLBA,20814
30
30
  deepdoctection/datasets/registry.py,sha256=qYRVycNYFeAzWB7jENGYzokgyzIEvTRb49he2UmPUe8,3451
@@ -142,8 +142,8 @@ deepdoctection/utils/transform.py,sha256=jgeCyQWLN9q79jCGW7jysyKUKcJ1AVMk8OslF-3
142
142
  deepdoctection/utils/types.py,sha256=ti4WdtIJSg3TGK_YPkkoY9PYGMnR2tTX6Xfik8U1pNk,2986
143
143
  deepdoctection/utils/utils.py,sha256=NBUb1qbx8Jm-AvYN1Sdbk0huXhbAKxZ-ZtOcMespsMM,7064
144
144
  deepdoctection/utils/viz.py,sha256=bujRIujvX317rPz4jBrj0yd3WP8wPjDUiI5GUrw9MzQ,27339
145
- deepdoctection-0.43.4.dist-info/licenses/LICENSE,sha256=GQ0rUvuGdrMNEI3iHK5UQx6dIMU1QwAuyXsxUHn5MEQ,11351
146
- deepdoctection-0.43.4.dist-info/METADATA,sha256=Rq3g8AYO5ClbhHXAHJVh7YkpeP22PBwpB_TN57TbSOI,13389
147
- deepdoctection-0.43.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
148
- deepdoctection-0.43.4.dist-info/top_level.txt,sha256=hs2DdoOL9h4mnHhmO82BT4pz4QATIoOZ20PZmlnxFI8,15
149
- deepdoctection-0.43.4.dist-info/RECORD,,
145
+ deepdoctection-0.43.5.dist-info/licenses/LICENSE,sha256=GQ0rUvuGdrMNEI3iHK5UQx6dIMU1QwAuyXsxUHn5MEQ,11351
146
+ deepdoctection-0.43.5.dist-info/METADATA,sha256=EeIEGN2SrcUzSny93poDmEM7Fogqqiep_XDHOs--XpM,14782
147
+ deepdoctection-0.43.5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
148
+ deepdoctection-0.43.5.dist-info/top_level.txt,sha256=hs2DdoOL9h4mnHhmO82BT4pz4QATIoOZ20PZmlnxFI8,15
149
+ deepdoctection-0.43.5.dist-info/RECORD,,