docling 2.30.0__py3-none-any.whl → 2.31.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- docling/backend/asciidoc_backend.py +7 -15
- docling/backend/csv_backend.py +1 -1
- docling/backend/docling_parse_backend.py +2 -2
- docling/backend/docling_parse_v2_backend.py +2 -2
- docling/backend/docling_parse_v4_backend.py +3 -4
- docling/backend/docx/latex/latex_dict.py +0 -5
- docling/backend/docx/latex/omml.py +4 -7
- docling/backend/html_backend.py +26 -9
- docling/backend/md_backend.py +5 -7
- docling/backend/msexcel_backend.py +1 -7
- docling/backend/mspowerpoint_backend.py +4 -7
- docling/backend/msword_backend.py +4 -4
- docling/backend/pdf_backend.py +2 -1
- docling/backend/pypdfium2_backend.py +3 -3
- docling/backend/xml/jats_backend.py +10 -13
- docling/backend/xml/uspto_backend.py +15 -19
- docling/cli/main.py +7 -7
- docling/cli/models.py +2 -3
- docling/datamodel/base_models.py +7 -5
- docling/datamodel/document.py +11 -10
- docling/datamodel/pipeline_options.py +0 -1
- docling/document_converter.py +5 -5
- docling/models/api_vlm_model.py +1 -2
- docling/models/base_model.py +2 -4
- docling/models/base_ocr_model.py +2 -2
- docling/models/code_formula_model.py +2 -1
- docling/models/document_picture_classifier.py +2 -1
- docling/models/easyocr_model.py +10 -11
- docling/models/factories/__init__.py +2 -2
- docling/models/factories/base_factory.py +1 -1
- docling/models/hf_mlx_model.py +4 -6
- docling/models/hf_vlm_model.py +7 -5
- docling/models/layout_model.py +2 -2
- docling/models/ocr_mac_model.py +3 -4
- docling/models/page_assemble_model.py +7 -12
- docling/models/page_preprocessing_model.py +2 -1
- docling/models/picture_description_api_model.py +2 -1
- docling/models/picture_description_base_model.py +2 -3
- docling/models/picture_description_vlm_model.py +2 -3
- docling/models/rapid_ocr_model.py +2 -3
- docling/models/readingorder_model.py +8 -23
- docling/models/table_structure_model.py +2 -6
- docling/models/tesseract_ocr_cli_model.py +17 -16
- docling/models/tesseract_ocr_model.py +8 -6
- docling/pipeline/base_pipeline.py +4 -8
- docling/pipeline/simple_pipeline.py +0 -1
- docling/pipeline/standard_pdf_pipeline.py +0 -1
- docling/pipeline/vlm_pipeline.py +0 -3
- docling/utils/export.py +2 -4
- docling/utils/glm_utils.py +2 -2
- docling/utils/layout_postprocessor.py +4 -2
- docling/utils/model_downloader.py +7 -7
- docling/utils/utils.py +1 -1
- {docling-2.30.0.dist-info → docling-2.31.0.dist-info}/METADATA +2 -1
- docling-2.31.0.dist-info/RECORD +86 -0
- docling-2.30.0.dist-info/RECORD +0 -86
- {docling-2.30.0.dist-info → docling-2.31.0.dist-info}/LICENSE +0 -0
- {docling-2.30.0.dist-info → docling-2.31.0.dist-info}/WHEEL +0 -0
- {docling-2.30.0.dist-info → docling-2.31.0.dist-info}/entry_points.txt +0 -0
docling/pipeline/vlm_pipeline.py
CHANGED
@@ -1,5 +1,4 @@
|
|
1
1
|
import logging
|
2
|
-
import warnings
|
3
2
|
from io import BytesIO
|
4
3
|
from pathlib import Path
|
5
4
|
from typing import List, Optional, Union, cast
|
@@ -32,7 +31,6 @@ _log = logging.getLogger(__name__)
|
|
32
31
|
|
33
32
|
|
34
33
|
class VlmPipeline(PaginatedPipeline):
|
35
|
-
|
36
34
|
def __init__(self, pipeline_options: VlmPipelineOptions):
|
37
35
|
super().__init__(pipeline_options)
|
38
36
|
self.keep_backend = True
|
@@ -114,7 +112,6 @@ class VlmPipeline(PaginatedPipeline):
|
|
114
112
|
|
115
113
|
def _assemble_document(self, conv_res: ConversionResult) -> ConversionResult:
|
116
114
|
with TimeRecorder(conv_res, "doc_assemble", scope=ProfilingScope.DOCUMENT):
|
117
|
-
|
118
115
|
if (
|
119
116
|
self.pipeline_options.vlm_options.response_format
|
120
117
|
== ResponseFormat.DOCTAGS
|
docling/utils/export.py
CHANGED
@@ -1,8 +1,8 @@
|
|
1
1
|
import logging
|
2
|
-
from typing import Any, Dict, Iterable, List, Tuple, Union
|
2
|
+
from collections.abc import Iterable
|
3
|
+
from typing import Any, Dict, List, Tuple, Union
|
3
4
|
|
4
5
|
from docling_core.types.doc import BoundingBox, CoordOrigin
|
5
|
-
from docling_core.types.doc.page import TextCell
|
6
6
|
from docling_core.types.legacy_doc.base import BaseCell, BaseText, Ref, Table
|
7
7
|
|
8
8
|
from docling.datamodel.document import ConversionResult, Page
|
@@ -13,7 +13,6 @@ _log = logging.getLogger(__name__)
|
|
13
13
|
def generate_multimodal_pages(
|
14
14
|
doc_result: ConversionResult,
|
15
15
|
) -> Iterable[Tuple[str, str, List[Dict[str, Any]], List[Dict[str, Any]], Page]]:
|
16
|
-
|
17
16
|
label_to_doclaynet = {
|
18
17
|
"title": "title",
|
19
18
|
"table-of-contents": "document_index",
|
@@ -122,7 +121,6 @@ def generate_multimodal_pages(
|
|
122
121
|
if doc.main_text is None:
|
123
122
|
return
|
124
123
|
for ix, orig_item in enumerate(doc.main_text):
|
125
|
-
|
126
124
|
item = doc._resolve_ref(orig_item) if isinstance(orig_item, Ref) else orig_item
|
127
125
|
if item is None or item.prov is None or len(item.prov) == 0:
|
128
126
|
_log.debug(f"Skipping item {orig_item}")
|
docling/utils/glm_utils.py
CHANGED
@@ -29,7 +29,7 @@ def resolve_item(paths, obj):
|
|
29
29
|
|
30
30
|
try:
|
31
31
|
key = int(paths[0])
|
32
|
-
except:
|
32
|
+
except Exception:
|
33
33
|
key = paths[0]
|
34
34
|
|
35
35
|
if len(paths) == 1:
|
@@ -67,7 +67,7 @@ def _flatten_table_grid(grid: List[List[dict]]) -> List[dict]:
|
|
67
67
|
return unique_objects
|
68
68
|
|
69
69
|
|
70
|
-
def to_docling_document(doc_glm, update_name_label=False) -> DoclingDocument:
|
70
|
+
def to_docling_document(doc_glm, update_name_label=False) -> DoclingDocument: # noqa: C901
|
71
71
|
origin = DocumentOrigin(
|
72
72
|
mimetype="application/pdf",
|
73
73
|
filename=doc_glm["file-info"]["filename"],
|
docling/utils/layout_postprocessor.py
CHANGED
@@ -18,7 +18,7 @@ class UnionFind:
|
|
18
18
|
|
19
19
|
def __init__(self, elements):
|
20
20
|
self.parent = {elem: elem for elem in elements}
|
21
|
-
self.rank = {elem: 0 for elem in elements}
|
21
|
+
self.rank = dict.fromkeys(elements, 0)
|
22
22
|
|
23
23
|
def find(self, x):
|
24
24
|
if self.parent[x] != x:
|
@@ -484,7 +484,9 @@ class LayoutPostprocessor:
|
|
484
484
|
spatial_index = (
|
485
485
|
self.regular_index
|
486
486
|
if cluster_type == "regular"
|
487
|
-
else self.picture_index if cluster_type == "picture" else self.wrapper_index
|
487
|
+
else self.picture_index
|
488
|
+
if cluster_type == "picture"
|
489
|
+
else self.wrapper_index
|
488
490
|
)
|
489
491
|
|
490
492
|
# Map of currently valid clusters
|
docling/utils/model_downloader.py
CHANGED
@@ -37,7 +37,7 @@ def download_models(
|
|
37
37
|
output_dir.mkdir(exist_ok=True, parents=True)
|
38
38
|
|
39
39
|
if with_layout:
|
40
|
-
_log.info(f"Downloading layout model...")
|
40
|
+
_log.info("Downloading layout model...")
|
41
41
|
LayoutModel.download_models(
|
42
42
|
local_dir=output_dir / LayoutModel._model_repo_folder,
|
43
43
|
force=force,
|
@@ -45,7 +45,7 @@ def download_models(
|
|
45
45
|
)
|
46
46
|
|
47
47
|
if with_tableformer:
|
48
|
-
_log.info(f"Downloading tableformer model...")
|
48
|
+
_log.info("Downloading tableformer model...")
|
49
49
|
TableStructureModel.download_models(
|
50
50
|
local_dir=output_dir / TableStructureModel._model_repo_folder,
|
51
51
|
force=force,
|
@@ -53,7 +53,7 @@ def download_models(
|
|
53
53
|
)
|
54
54
|
|
55
55
|
if with_picture_classifier:
|
56
|
-
_log.info(f"Downloading picture classifier model...")
|
56
|
+
_log.info("Downloading picture classifier model...")
|
57
57
|
DocumentPictureClassifier.download_models(
|
58
58
|
local_dir=output_dir / DocumentPictureClassifier._model_repo_folder,
|
59
59
|
force=force,
|
@@ -61,7 +61,7 @@ def download_models(
|
|
61
61
|
)
|
62
62
|
|
63
63
|
if with_code_formula:
|
64
|
-
_log.info(f"Downloading code formula model...")
|
64
|
+
_log.info("Downloading code formula model...")
|
65
65
|
CodeFormulaModel.download_models(
|
66
66
|
local_dir=output_dir / CodeFormulaModel._model_repo_folder,
|
67
67
|
force=force,
|
@@ -69,7 +69,7 @@ def download_models(
|
|
69
69
|
)
|
70
70
|
|
71
71
|
if with_smolvlm:
|
72
|
-
_log.info(f"Downloading SmolVlm model...")
|
72
|
+
_log.info("Downloading SmolVlm model...")
|
73
73
|
PictureDescriptionVlmModel.download_models(
|
74
74
|
repo_id=smolvlm_picture_description.repo_id,
|
75
75
|
local_dir=output_dir / smolvlm_picture_description.repo_cache_folder,
|
@@ -78,7 +78,7 @@ def download_models(
|
|
78
78
|
)
|
79
79
|
|
80
80
|
if with_granite_vision:
|
81
|
-
_log.info(f"Downloading Granite Vision model...")
|
81
|
+
_log.info("Downloading Granite Vision model...")
|
82
82
|
PictureDescriptionVlmModel.download_models(
|
83
83
|
repo_id=granite_picture_description.repo_id,
|
84
84
|
local_dir=output_dir / granite_picture_description.repo_cache_folder,
|
@@ -87,7 +87,7 @@ def download_models(
|
|
87
87
|
)
|
88
88
|
|
89
89
|
if with_easyocr:
|
90
|
-
_log.info(f"Downloading easyocr models...")
|
90
|
+
_log.info("Downloading easyocr models...")
|
91
91
|
EasyOcrModel.download_models(
|
92
92
|
local_dir=output_dir / EasyOcrModel._model_repo_folder,
|
93
93
|
force=force,
|
docling/utils/utils.py
CHANGED
@@ -13,7 +13,7 @@ def chunkify(iterator, chunk_size):
|
|
13
13
|
if isinstance(iterator, List):
|
14
14
|
iterator = iter(iterator)
|
15
15
|
for first in iterator: # Take the first element from the iterator
|
16
|
-
yield [first] + list(islice(iterator, chunk_size - 1))
|
16
|
+
yield [first, *list(islice(iterator, chunk_size - 1))]
|
17
17
|
|
18
18
|
|
19
19
|
def create_file_hash(path_or_stream: Union[BytesIO, Path]) -> str:
|
{docling-2.30.0.dist-info → docling-2.31.0.dist-info}/METADATA
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: docling
|
3
|
-
Version: 2.30.0
|
3
|
+
Version: 2.31.0
|
4
4
|
Summary: SDK and CLI for parsing PDF, DOCX, HTML, and more, to a unified document representation for powering downstream workflows such as gen AI applications.
|
5
5
|
Home-page: https://github.com/docling-project/docling
|
6
6
|
License: MIT
|
@@ -86,6 +86,7 @@ Description-Content-Type: text/markdown
|
|
86
86
|
[](https://opensource.org/licenses/MIT)
|
87
87
|
[](https://pepy.tech/projects/docling)
|
88
88
|
[](https://apify.com/vancura/docling)
|
89
|
+
[](https://www.bestpractices.dev/projects/10101)
|
89
90
|
[](https://lfaidata.foundation/projects/)
|
90
91
|
|
91
92
|
Docling simplifies document processing, parsing diverse formats — including advanced PDF understanding — and providing seamless integrations with the gen AI ecosystem.
|
docling-2.31.0.dist-info/RECORD
ADDED
@@ -0,0 +1,86 @@
|
|
1
|
+
docling/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
+
docling/backend/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
3
|
+
docling/backend/abstract_backend.py,sha256=1lNxzwDTn303aXduPDVmTyXn-5ZIoWMLYqNxANGWmQQ,1658
|
4
|
+
docling/backend/asciidoc_backend.py,sha256=VZ8Xk1VHGHRqBo_TdtMzRAu1NFaFaJ8dk4CaEcBaEm0,14038
|
5
|
+
docling/backend/csv_backend.py,sha256=2g9famYG2W-ID9jEdZPxc6O8QGv1vWQfjN8pL-QMBE0,4536
|
6
|
+
docling/backend/docling_parse_backend.py,sha256=V_CsUdN5RkGQBBq7A_ReAiUW4CQVh0-1Ur157Ozurdg,8017
|
7
|
+
docling/backend/docling_parse_v2_backend.py,sha256=6fokgqb1hMbZua33gL46EFamrwPTC7ms6ZuEHw-Dv28,9395
|
8
|
+
docling/backend/docling_parse_v4_backend.py,sha256=-WJZs0IsdN6blhkvTS1eh_qhujYLyJ3XcOMqS6AaXxg,6282
|
9
|
+
docling/backend/docx/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
10
|
+
docling/backend/docx/latex/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
11
|
+
docling/backend/docx/latex/latex_dict.py,sha256=tFJp4ScT_AkY2ON7nLEa560p601Jq2glcZvMKxxjn7w,6593
|
12
|
+
docling/backend/docx/latex/omml.py,sha256=nEpcfyyrOucJyj6cD7wfThrIa-q0CQCoqMb3dkrhCRg,12094
|
13
|
+
docling/backend/html_backend.py,sha256=TBiMAp3s_QbQTRymFA7wScXECyHn_w-Kb8MbqRibTmE,20099
|
14
|
+
docling/backend/json/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
15
|
+
docling/backend/json/docling_json_backend.py,sha256=LlFMVoZrrCfVwbDuRbNN4Xg96Lujh4xxrTBt9jGhY9I,1984
|
16
|
+
docling/backend/md_backend.py,sha256=EdGBXe0n8zniO1LSF3VIjviKs1VRUujpF8aFUpJ5D1k,17209
|
17
|
+
docling/backend/msexcel_backend.py,sha256=3j0WQfqDpgPXdPMCguefdv7arcNVDedPD6gl54cmLn8,18110
|
18
|
+
docling/backend/mspowerpoint_backend.py,sha256=RwqfvvzrtM56L9uf7PR9lvlHJ-LyYGpkS1iVxkTl72Q,17203
|
19
|
+
docling/backend/msword_backend.py,sha256=Xdrs_k160-tDUmhcFGZ7MBbpiYkwPLT3wl3FUO2Ui1A,32476
|
20
|
+
docling/backend/pdf_backend.py,sha256=KE9TMuFO5WX-o5A_DAd4tEaLi4HMZ4XjKdpllItVkWM,2238
|
21
|
+
docling/backend/pypdfium2_backend.py,sha256=pX8f0WbUb0KTDTKyQuLzP_lgHHubyGXWD33vmpefPy8,10805
|
22
|
+
docling/backend/xml/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
23
|
+
docling/backend/xml/jats_backend.py,sha256=g9YNSS8kqhVL7ceZF2jR7Aaqbh1F1Zn6jmte0HyEH20,24926
|
24
|
+
docling/backend/xml/uspto_backend.py,sha256=iE1PSAgXqtHkqcsC1RUJiwuyKNlf2elucCV1V2sk0kQ,70926
|
25
|
+
docling/chunking/__init__.py,sha256=h83TDs0AuOV6oEPLAPrn9dpGKiU-2Vg6IRNo4cv6GDA,346
|
26
|
+
docling/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
27
|
+
docling/cli/main.py,sha256=Z6EdrwESOKUBHF6yJlzuwnznScBtdrlbU_xB0AT9cA4,26137
|
28
|
+
docling/cli/models.py,sha256=Cyv7d_c8J62luGWsYvbcC9_3UpPp_TVsFo5vJAyr4kI,3940
|
29
|
+
docling/cli/tools.py,sha256=QhtRxQG0TVrfsMqdv5i7J0_qQy1ZZyWYnHPwJl7b5oY,322
|
30
|
+
docling/datamodel/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
31
|
+
docling/datamodel/base_models.py,sha256=DRE_XoldtCreWF4ucO0iK0l8uOnfvnhQaYjV0z1Qe0M,7921
|
32
|
+
docling/datamodel/document.py,sha256=02QybqtnQ0genFU7UF9pVL3fIwguu9br0JbdtcUvu4o,14998
|
33
|
+
docling/datamodel/pipeline_options.py,sha256=-1QG8dY0RZkTJb66lXErEAnPq4F_1vgnk_5AcIr3cgU,13350
|
34
|
+
docling/datamodel/settings.py,sha256=bNMdowIKv7RUchabQTo4rFNEsxfB6pGg2LoZSY634zo,1869
|
35
|
+
docling/document_converter.py,sha256=zSaGp2zx73kiE1KHmEHwnG-wxJvcMiyyn2fCAM2vdYk,13804
|
36
|
+
docling/exceptions.py,sha256=K1WnCS1leK2JtMB5ewZWKkb0EaijFgl-tRzrO9ntgPM,134
|
37
|
+
docling/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
38
|
+
docling/models/api_vlm_model.py,sha256=w1SzdG3Ypz_0iZGiX-skMwV1E1JnOHH2BJiNkcEEIAA,2478
|
39
|
+
docling/models/base_model.py,sha256=Zx_nByGYkubTvvYiQxwiB6P8lc7wOD4ZTC2QIw6vCEg,2950
|
40
|
+
docling/models/base_ocr_model.py,sha256=_iD8QCKQdv2VWrIuSRPyGP4oCz94h84WriHg9F2k-Z0,7172
|
41
|
+
docling/models/code_formula_model.py,sha256=9cplJFvP7jcJGz-p-MmL8_lqUhmaXZu7wKyX2aOTujs,11504
|
42
|
+
docling/models/document_picture_classifier.py,sha256=tyOnyM0vh8-pjh9PiHa_67YpK-3pc_vGQKlnfAyraBs,6255
|
43
|
+
docling/models/easyocr_model.py,sha256=3rgXMeB7LbMjevCAVDMG3voe3PQhQ7B-RyYrXzefUlQ,7365
|
44
|
+
docling/models/factories/__init__.py,sha256=x_EM5dDg_A3HBcBYzOoqwmA2AFLtJ1IzYDPX-R1A-Sg,868
|
45
|
+
docling/models/factories/base_factory.py,sha256=MfWIljMETi5aaVR-6qLTelW8u1gwDAQsOwg3fu7O4Qc,4028
|
46
|
+
docling/models/factories/ocr_factory.py,sha256=G5RkmkKvkl-ihpo6qSj8WC77VdlVSQ1s0ekwUX2ILts,316
|
47
|
+
docling/models/factories/picture_description_factory.py,sha256=Ru3-TnVVEKf5O07C_UpGf2HCOHc7j20AJzfficw3agM,385
|
48
|
+
docling/models/hf_mlx_model.py,sha256=B_B4hFU-jU0g_DQtQD8w4Ejorn10mkDuFI93wR_WhGk,4897
|
49
|
+
docling/models/hf_vlm_model.py,sha256=SiPMTLghMUjJ66dA2yN4UujpLO6PiOhLEPInWtXV_5s,6912
|
50
|
+
docling/models/layout_model.py,sha256=0fiJXJ4aPmcMsYY7rbN9LJ2mZ0_8G0ODY9kyNTAN3Ws,7823
|
51
|
+
docling/models/ocr_mac_model.py,sha256=A3TlEbvvwhkWiq9YARos3Y9yNcpPYQ7JGc_4hFtAK-8,5370
|
52
|
+
docling/models/page_assemble_model.py,sha256=GO7JI1D6T6EkSW94cLQobPGNQUahkxQqTPRwj5CnmFE,6304
|
53
|
+
docling/models/page_preprocessing_model.py,sha256=6pOGXiFQ-oz06UmJdcaYMdVyfZ0YVLWS6efGcx7Mxws,3105
|
54
|
+
docling/models/picture_description_api_model.py,sha256=qs3n0smC9DXhzwJeK_iQG08Y6ZFHInKtdGPVhzgvxgU,2091
|
55
|
+
docling/models/picture_description_base_model.py,sha256=FbBVXzAOB87xpJN28tuGCxoAdcf6mZNUOqJR7ljUg5g,2946
|
56
|
+
docling/models/picture_description_vlm_model.py,sha256=nS68qbJQCP94-gbgFfAzMLaEC-wquSLEwuDix287c9c,4067
|
57
|
+
docling/models/plugins/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
58
|
+
docling/models/plugins/defaults.py,sha256=qslXGnRX07Z3GGttNriqaox0v0vXp4zs4KLurHCZjp4,858
|
59
|
+
docling/models/rapid_ocr_model.py,sha256=Tq_1Egu5Hjx7Y69Vox17QTtRXztSyflB1fhN08CWQwY,5894
|
60
|
+
docling/models/readingorder_model.py,sha256=BxACJ-aIl2aUlyLcyl-uDtuSZH_mCLJgbkDG4Sx_www,14564
|
61
|
+
docling/models/table_structure_model.py,sha256=dR3JkiPkdbScaNy6dia4_ZXPYESSiMDZztD-lLHE1uY,12591
|
62
|
+
docling/models/tesseract_ocr_cli_model.py,sha256=iFdOud5ymoW9WV8bWLCDpd3LJBo9M5bTT5vc635zEDY,10229
|
63
|
+
docling/models/tesseract_ocr_model.py,sha256=oPKOoTTcpYUTDNRteBG-MFcxB9SDC6dk4HuKjIODwMk,9310
|
64
|
+
docling/pipeline/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
65
|
+
docling/pipeline/base_pipeline.py,sha256=DnuxAf7EQusdSRae0QUVth-0f2mSff8JZjX-2vazk00,8751
|
66
|
+
docling/pipeline/simple_pipeline.py,sha256=TXZOwR7hZRji462ZTIpte0VJjzbxvNVE8dbLFANDhSU,2253
|
67
|
+
docling/pipeline/standard_pdf_pipeline.py,sha256=iNZMMGiHTwV6I4u_jjqXhVJ_DiPn_O9qnnee3PQxidc,10773
|
68
|
+
docling/pipeline/vlm_pipeline.py,sha256=g3bxPEqxK8x-B5S6pOpNNo5GxCMCRDZgPJUFqsBA1eg,9720
|
69
|
+
docling/py.typed,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
|
70
|
+
docling/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
71
|
+
docling/utils/accelerator_utils.py,sha256=ONNRrC8fH-8E93WUCNhfOq1t7WrQ1T7-YsmExTOY5f0,2292
|
72
|
+
docling/utils/api_image_request.py,sha256=_CgdzmPqdsyXmyYUFGLZcXcoH586qC6A1p5vsNbj1Q0,1416
|
73
|
+
docling/utils/export.py,sha256=VwVUnYDk3mhGmISDbVm306fwpGNnoojouStBD4UajXI,4673
|
74
|
+
docling/utils/glm_utils.py,sha256=TKOWQqWAHsX_w4fvoAA7_2xCi_urhnp1DsmjY8_sk5w,12274
|
75
|
+
docling/utils/layout_postprocessor.py,sha256=x7exVG3HYzV9M_O78FfyoG43Y2L7PPMMydvSNwjqh8s,24528
|
76
|
+
docling/utils/locks.py,sha256=RzqQtD5UispgV71pGN_nU6GYfeN11BN0Sh_Dq9ycqGo,52
|
77
|
+
docling/utils/model_downloader.py,sha256=AMqfHTmZzzsPrlcHFdX7hhW-a3Ki6ndjnTjQQYrDSxU,3206
|
78
|
+
docling/utils/ocr_utils.py,sha256=F7iOOjqolUcImUzir4qjDQd4QWSO3s6JC4WRn3U7uY4,263
|
79
|
+
docling/utils/profiling.py,sha256=YaMGoB9MMZpagF9mb5ndoHj8Lpb9aIdb7El-Pl7IcFs,1753
|
80
|
+
docling/utils/utils.py,sha256=xxmVMhQWr7oVBy93IGGpr2x8FBVRHNDwD31kwAF5xK4,1866
|
81
|
+
docling/utils/visualization.py,sha256=tY2ylE2aiQKkmzlSLnFW-HTfFyqUUMguW18ldd1PLfo,2868
|
82
|
+
docling-2.31.0.dist-info/LICENSE,sha256=mBb7ErEcM8VS9OhiGHnQ2kk75HwPhr54W1Oiz3965MY,1088
|
83
|
+
docling-2.31.0.dist-info/METADATA,sha256=tScsMgyfrwtIaCKPl-ygViccYxnRADeUNuHKDGjw7ww,10108
|
84
|
+
docling-2.31.0.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
|
85
|
+
docling-2.31.0.dist-info/entry_points.txt,sha256=pIxel-UeVo1S7FhoNG5xgEfPjLZfBLi_N9TsGPtJSLo,144
|
86
|
+
docling-2.31.0.dist-info/RECORD,,
|
docling-2.30.0.dist-info/RECORD
DELETED
@@ -1,86 +0,0 @@
|
|
1
|
-
docling/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
-
docling/backend/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
3
|
-
docling/backend/abstract_backend.py,sha256=1lNxzwDTn303aXduPDVmTyXn-5ZIoWMLYqNxANGWmQQ,1658
|
4
|
-
docling/backend/asciidoc_backend.py,sha256=xBtmYkRkPICIfMbB8AFIw_or4IZGB17mP_LhXorvZ1k,14060
|
5
|
-
docling/backend/csv_backend.py,sha256=lCNSkgB55IbAig7w4IyXRkX23aM3Nojj6GdXNoaNjY4,4536
|
6
|
-
docling/backend/docling_parse_backend.py,sha256=tcy4cPD_dtGD37CjivbFvwzwXVcrb3HVmofyasxLum8,7991
|
7
|
-
docling/backend/docling_parse_v2_backend.py,sha256=70kXqYhht-A8zb9z5emMe_1i0l9dyQGrM8lg1cmAvqc,9369
|
8
|
-
docling/backend/docling_parse_v4_backend.py,sha256=IECMJQWEvYqQv043_1Ho6dLkCbuaK8cMUsqcxwqruXo,6287
|
9
|
-
docling/backend/docx/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
10
|
-
docling/backend/docx/latex/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
11
|
-
docling/backend/docx/latex/latex_dict.py,sha256=5pOMY_KyxYmgBZ40IrA4q0t5L6JvXOCx5cVwoQE1lls,6690
|
12
|
-
docling/backend/docx/latex/omml.py,sha256=5zuXYOQ10e9nSTKFURBjoU-XSQZVHsVyIiCsGYGVAk8,12127
|
13
|
-
docling/backend/html_backend.py,sha256=ghPLZfdBEPBzLIO9IWzzx0t1Os9B9r4VyGyEZtMsZVI,19468
|
14
|
-
docling/backend/json/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
15
|
-
docling/backend/json/docling_json_backend.py,sha256=LlFMVoZrrCfVwbDuRbNN4Xg96Lujh4xxrTBt9jGhY9I,1984
|
16
|
-
docling/backend/md_backend.py,sha256=lqDiKIBHGsA0u-H1n9oVpPlrcpVT4gYRuNXXcyGlftM,17219
|
17
|
-
docling/backend/msexcel_backend.py,sha256=KRPoHRDv-mqko9RUHGQCzdRrvDo7g7zSU2Z5zoL_Hzo,18106
|
18
|
-
docling/backend/mspowerpoint_backend.py,sha256=X55-1anXm562wxAuYn5uwQkqKjirmgrn1KfbeaKUbXw,17273
|
19
|
-
docling/backend/msword_backend.py,sha256=CgNPjU8SQ7rkAYH_BGiUyv568MGhoH3R0M39WBT8gkc,32468
|
20
|
-
docling/backend/pdf_backend.py,sha256=odWb1rxk3WCUIEJMhq-dYFNUQ1pSDuNHbU9wlTZIRAs,2211
|
21
|
-
docling/backend/pypdfium2_backend.py,sha256=wRwhA5XHRqL7vyNhCAHM6P-ONkwtyjKG9LgC4NJ-4i8,10784
|
22
|
-
docling/backend/xml/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
23
|
-
docling/backend/xml/jats_backend.py,sha256=HXailrDjiwu4swwFnXy3lNfRtLZmkBBp4yqafCvdr7s,24945
|
24
|
-
docling/backend/xml/uspto_backend.py,sha256=H0jwIt2skOke_yEUk0wfXCtodrB-hrj2ygLtB3jMWaI,71056
|
25
|
-
docling/chunking/__init__.py,sha256=h83TDs0AuOV6oEPLAPrn9dpGKiU-2Vg6IRNo4cv6GDA,346
|
26
|
-
docling/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
27
|
-
docling/cli/main.py,sha256=TD-cEf4giuk1O5NPoB-heXHHteUqKoLsj4Rg4xsBUrs,26119
|
28
|
-
docling/cli/models.py,sha256=tM_qbMM3YOPxFU7JlME96MLbtd1CX_bOAK7FS-NhJvY,3979
|
29
|
-
docling/cli/tools.py,sha256=QhtRxQG0TVrfsMqdv5i7J0_qQy1ZZyWYnHPwJl7b5oY,322
|
30
|
-
docling/datamodel/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
31
|
-
docling/datamodel/base_models.py,sha256=fJfFMaHXc-CUrAVfhPF8lKrdb-gaXr2tohx6dHldvRU,7926
|
32
|
-
docling/datamodel/document.py,sha256=V0iK1MYOkPIzd4eQa-G8unp-t01fktlG9wwQ1IwE6Zg,15109
|
33
|
-
docling/datamodel/pipeline_options.py,sha256=iGLijZR-YOtmg0RQs59pqoG_1uGsDYbg5wMDD0FWYx4,13351
|
34
|
-
docling/datamodel/settings.py,sha256=bNMdowIKv7RUchabQTo4rFNEsxfB6pGg2LoZSY634zo,1869
|
35
|
-
docling/document_converter.py,sha256=LCX92FzgmXNJLFVSQfjqH9SGe3zA7FGwARedSigFIpY,13798
|
36
|
-
docling/exceptions.py,sha256=K1WnCS1leK2JtMB5ewZWKkb0EaijFgl-tRzrO9ntgPM,134
|
37
|
-
docling/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
38
|
-
docling/models/api_vlm_model.py,sha256=6SxMsFPf0SbT365P67KspdpF3TXZSeu5kmPE3lXAhW4,2470
|
39
|
-
docling/models/base_model.py,sha256=9xJ0VIlpR2BzqoEWMC8LYp5Y96QAEKip4b_HCwCDltY,2931
|
40
|
-
docling/models/base_ocr_model.py,sha256=xvKMhE4ZOGkL2GAhpDvrAHLLFps3ZUfxXZ5ctL1lXUw,7226
|
41
|
-
docling/models/code_formula_model.py,sha256=mOu5luYMzyrCCr8MRGOciNcSvULpQysDd_FXn96WPc8,11477
|
42
|
-
docling/models/document_picture_classifier.py,sha256=fz77RsTdlnA_yC47O-KUq2xVWMKX0_9jm_EGcHliw-E,6235
|
43
|
-
docling/models/easyocr_model.py,sha256=ezq3yv5lORe7T1bbSoTZALck2oHqyEHq57cRfhMYCCQ,7401
|
44
|
-
docling/models/factories/__init__.py,sha256=e4lFmRfmW5hWqvJjY5xaVFbvCQhDBCrVeSq85Q2K_aM,872
|
45
|
-
docling/models/factories/base_factory.py,sha256=pNR9-B_BKs2sYNyHnp2ON2l3r6Dy9lcof4qmwHlAryI,4032
|
46
|
-
docling/models/factories/ocr_factory.py,sha256=G5RkmkKvkl-ihpo6qSj8WC77VdlVSQ1s0ekwUX2ILts,316
|
47
|
-
docling/models/factories/picture_description_factory.py,sha256=Ru3-TnVVEKf5O07C_UpGf2HCOHc7j20AJzfficw3agM,385
|
48
|
-
docling/models/hf_mlx_model.py,sha256=2eSHphJm5LAfiSA24blVMc2znJlKMYrtmmzq8ffc-rU,4924
|
49
|
-
docling/models/hf_vlm_model.py,sha256=NUtLEuG-kNGJeDHWmQKAAOZG4WF0a5hn-KXUUM1mHBQ,6820
|
50
|
-
docling/models/layout_model.py,sha256=7fQWipGV1HDrvbP4uOKa9QAicQl89jp7lailQmbFL3w,7804
|
51
|
-
docling/models/ocr_mac_model.py,sha256=2pZaUWg19go_u88mKWr5y_52PAYEN__GsbyUYLdY4zo,5353
|
52
|
-
docling/models/page_assemble_model.py,sha256=ivkCdbZJpFcGl7CazLegcP1tLK8ZixDfVhQXqsdW_UA,6359
|
53
|
-
docling/models/page_preprocessing_model.py,sha256=Ja7RE1K-2fWxWrxOzNm6QDSGqFf-MY6_uY5OAZ7AQSo,3078
|
54
|
-
docling/models/picture_description_api_model.py,sha256=DowWOU93MXAjj3N1A9ex88Sa3Nic2c3dfoOYir5jZEA,2064
|
55
|
-
docling/models/picture_description_base_model.py,sha256=khuhQZDAZemZMe4BsrBMpjEwkY3nhMFXuczjQpSQrVY,2971
|
56
|
-
docling/models/picture_description_vlm_model.py,sha256=I2Un3vfhQVeWEyZ3Sd3Kygw9la2QSZCwDfl_7XVlMm4,4042
|
57
|
-
docling/models/plugins/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
58
|
-
docling/models/plugins/defaults.py,sha256=qslXGnRX07Z3GGttNriqaox0v0vXp4zs4KLurHCZjp4,858
|
59
|
-
docling/models/rapid_ocr_model.py,sha256=C_I0Ek9mAPIyTFRHuNbqtXg1c15rLNDE1tJ6_hPIi4c,5869
|
60
|
-
docling/models/readingorder_model.py,sha256=hNWbBX3uZv1FxMwKNKn2JFQuQqTspBLsJBVEidXr6Wk,14869
|
61
|
-
docling/models/table_structure_model.py,sha256=pvTsqUa5QIANBUfot0XXG1UUeku-eaUi04EPE-Yh2g0,12597
|
62
|
-
docling/models/tesseract_ocr_cli_model.py,sha256=CZ1W0QbvveIpXO0qSXmXFqz71P4PfLfJBQIqU_Wlg_E,10072
|
63
|
-
docling/models/tesseract_ocr_model.py,sha256=UpLAgKgJtBgbKtJELmKBNMcejJJKBCyFK0q-WgZN1Eg,9256
|
64
|
-
docling/pipeline/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
65
|
-
docling/pipeline/base_pipeline.py,sha256=9ABK-Cr235bxE5vweoIA5rgBZV_EF8qFxAqLI27H_Pg,8749
|
66
|
-
docling/pipeline/simple_pipeline.py,sha256=mZqANqUtAOFAyqQEShErQnAUz6tJFOl6zVoazEDJ_wE,2254
|
67
|
-
docling/pipeline/standard_pdf_pipeline.py,sha256=gPNqUparhIONG4AyMekW9OfZ7t8YMs0odhtbE6Z-Hxw,10784
|
68
|
-
docling/pipeline/vlm_pipeline.py,sha256=dqQYAd3viW577TVSZltnB4P-f-ZUWQh0J8SSFDuQN6Q,9738
|
69
|
-
docling/py.typed,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
|
70
|
-
docling/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
71
|
-
docling/utils/accelerator_utils.py,sha256=ONNRrC8fH-8E93WUCNhfOq1t7WrQ1T7-YsmExTOY5f0,2292
|
72
|
-
docling/utils/api_image_request.py,sha256=_CgdzmPqdsyXmyYUFGLZcXcoH586qC6A1p5vsNbj1Q0,1416
|
73
|
-
docling/utils/export.py,sha256=4W-ptI1fLdVrtoqHdHY1RF9Xn2Yescs-hunITqxJ7Is,4697
|
74
|
-
docling/utils/glm_utils.py,sha256=W4JRoP0xQ6SJmhhIoAfcKxm5dr1CFvLHp8pqI1kdhxs,12250
|
75
|
-
docling/utils/layout_postprocessor.py,sha256=Q36DfcIYMuMfC6LzCBIrYtHK7pBE-Xyvjepz660s9UM,24508
|
76
|
-
docling/utils/locks.py,sha256=RzqQtD5UispgV71pGN_nU6GYfeN11BN0Sh_Dq9ycqGo,52
|
77
|
-
docling/utils/model_downloader.py,sha256=sxAQvjiIu9m2Ur5Ot5C5SATmgWJAHi0xSjzxj8QXYJk,3213
|
78
|
-
docling/utils/ocr_utils.py,sha256=F7iOOjqolUcImUzir4qjDQd4QWSO3s6JC4WRn3U7uY4,263
|
79
|
-
docling/utils/profiling.py,sha256=YaMGoB9MMZpagF9mb5ndoHj8Lpb9aIdb7El-Pl7IcFs,1753
|
80
|
-
docling/utils/utils.py,sha256=0ozCk7zUkYzxRVmYoIB2zA1lqjQOuaQzxfGuf1wmKW4,1866
|
81
|
-
docling/utils/visualization.py,sha256=tY2ylE2aiQKkmzlSLnFW-HTfFyqUUMguW18ldd1PLfo,2868
|
82
|
-
docling-2.30.0.dist-info/LICENSE,sha256=mBb7ErEcM8VS9OhiGHnQ2kk75HwPhr54W1Oiz3965MY,1088
|
83
|
-
docling-2.30.0.dist-info/METADATA,sha256=HSI154YUnSDJE8BMMjOuu-U3EXQg0ksFuyuyzv7-UdU,9982
|
84
|
-
docling-2.30.0.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
|
85
|
-
docling-2.30.0.dist-info/entry_points.txt,sha256=pIxel-UeVo1S7FhoNG5xgEfPjLZfBLi_N9TsGPtJSLo,144
|
86
|
-
docling-2.30.0.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|