docling-core 2.12.0__tar.gz → 2.12.1__tar.gz
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of docling-core (2.12.1) might be problematic. Click here for more details.
- {docling_core-2.12.0 → docling_core-2.12.1}/PKG-INFO +1 -1
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/legacy_doc/document.py +13 -8
- {docling_core-2.12.0 → docling_core-2.12.1}/pyproject.toml +1 -1
- {docling_core-2.12.0 → docling_core-2.12.1}/LICENSE +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/README.md +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/cli/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/cli/view.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/py.typed +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/doc/ANN.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/doc/DOC.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/doc/OCR-output.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/doc/RAW.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/generated/ccs_document_schema.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/generated/minimal_document_schema_flat.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/search/search_doc_mapping.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/search/search_doc_mapping_v2.json +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/search/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/search/json_schema_to_search_mapper.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/search/mapping.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/search/meta.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/search/package.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/transforms/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/transforms/chunker/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/transforms/chunker/base.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/transforms/chunker/hierarchical_chunker.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/transforms/chunker/hybrid_chunker.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/base.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/doc/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/doc/base.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/doc/document.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/doc/labels.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/doc/tokens.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/doc/utils.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/gen/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/gen/generic.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/io/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/legacy_doc/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/legacy_doc/base.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/legacy_doc/doc_ann.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/legacy_doc/doc_ocr.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/legacy_doc/doc_raw.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/legacy_doc/tokens.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/nlp/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/nlp/qa.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/nlp/qa_labels.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/rec/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/rec/attribute.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/rec/base.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/rec/predicate.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/rec/record.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/rec/statement.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/types/rec/subject.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/__init__.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/alias.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/file.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/generate_docs.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/generate_jsonschema.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/legacy.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/validate.py +0 -0
- {docling_core-2.12.0 → docling_core-2.12.1}/docling_core/utils/validators.py +0 -0
|
@@ -550,17 +550,18 @@ class ExportedCCSDocument(
|
|
|
550
550
|
|
|
551
551
|
elif (
|
|
552
552
|
isinstance(item, Table)
|
|
553
|
-
and item.data
|
|
553
|
+
and (item.data or item.text)
|
|
554
554
|
and item_type in main_text_labels
|
|
555
555
|
):
|
|
556
556
|
|
|
557
557
|
md_table = ""
|
|
558
558
|
table = []
|
|
559
|
-
|
|
560
|
-
|
|
561
|
-
|
|
562
|
-
|
|
563
|
-
|
|
559
|
+
if item.data is not None:
|
|
560
|
+
for row in item.data:
|
|
561
|
+
tmp = []
|
|
562
|
+
for col in row:
|
|
563
|
+
tmp.append(col.text)
|
|
564
|
+
table.append(tmp)
|
|
564
565
|
|
|
565
566
|
if len(table) > 1 and len(table[0]) > 0:
|
|
566
567
|
try:
|
|
@@ -579,7 +580,9 @@ class ExportedCCSDocument(
|
|
|
579
580
|
if item.text:
|
|
580
581
|
markdown_text = item.text
|
|
581
582
|
if not strict_text:
|
|
582
|
-
markdown_text +=
|
|
583
|
+
markdown_text += (
|
|
584
|
+
"\n\n" if len(markdown_text) > 0 else ""
|
|
585
|
+
) + md_table
|
|
583
586
|
|
|
584
587
|
elif isinstance(item, Figure) and item_type in main_text_labels:
|
|
585
588
|
|
|
@@ -587,7 +590,9 @@ class ExportedCCSDocument(
|
|
|
587
590
|
if item.text:
|
|
588
591
|
markdown_text = item.text
|
|
589
592
|
if not strict_text:
|
|
590
|
-
markdown_text +=
|
|
593
|
+
markdown_text += (
|
|
594
|
+
"\n" if len(markdown_text) > 0 else ""
|
|
595
|
+
) + image_placeholder
|
|
591
596
|
|
|
592
597
|
if markdown_text:
|
|
593
598
|
md_texts.append(markdown_text)
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{docling_core-2.12.0 → docling_core-2.12.1}/docling_core/resources/schemas/doc/OCR-output.json
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{docling_core-2.12.0 → docling_core-2.12.1}/docling_core/search/json_schema_to_search_mapper.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{docling_core-2.12.0 → docling_core-2.12.1}/docling_core/transforms/chunker/hierarchical_chunker.py
RENAMED
|
File without changes
|
{docling_core-2.12.0 → docling_core-2.12.1}/docling_core/transforms/chunker/hybrid_chunker.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|