docling-core 2.3.0__tar.gz → 2.3.1__tar.gz

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Potentially problematic release.


This version of docling-core might be problematic. Click here for more details.

Files changed (55) hide show
  1. {docling_core-2.3.0 → docling_core-2.3.1}/PKG-INFO +1 -1
  2. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/transforms/chunker/hierarchical_chunker.py +7 -6
  3. {docling_core-2.3.0 → docling_core-2.3.1}/pyproject.toml +1 -1
  4. {docling_core-2.3.0 → docling_core-2.3.1}/LICENSE +0 -0
  5. {docling_core-2.3.0 → docling_core-2.3.1}/README.md +0 -0
  6. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/__init__.py +0 -0
  7. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/py.typed +0 -0
  8. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/doc/ANN.json +0 -0
  9. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/doc/DOC.json +0 -0
  10. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/doc/OCR-output.json +0 -0
  11. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/doc/RAW.json +0 -0
  12. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/generated/ccs_document_schema.json +0 -0
  13. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/generated/minimal_document_schema_flat.json +0 -0
  14. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/search/search_doc_mapping.json +0 -0
  15. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/resources/schemas/search/search_doc_mapping_v2.json +0 -0
  16. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/search/__init__.py +0 -0
  17. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/search/json_schema_to_search_mapper.py +0 -0
  18. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/search/mapping.py +0 -0
  19. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/search/meta.py +0 -0
  20. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/search/package.py +0 -0
  21. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/transforms/__init__.py +0 -0
  22. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/transforms/chunker/__init__.py +0 -0
  23. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/transforms/chunker/base.py +0 -0
  24. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/__init__.py +0 -0
  25. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/base.py +0 -0
  26. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/doc/__init__.py +0 -0
  27. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/doc/base.py +0 -0
  28. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/doc/document.py +0 -0
  29. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/doc/labels.py +0 -0
  30. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/gen/__init__.py +0 -0
  31. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/gen/generic.py +0 -0
  32. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/legacy_doc/__init__.py +0 -0
  33. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/legacy_doc/base.py +0 -0
  34. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/legacy_doc/doc_ann.py +0 -0
  35. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/legacy_doc/doc_ocr.py +0 -0
  36. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/legacy_doc/doc_raw.py +0 -0
  37. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/legacy_doc/document.py +0 -0
  38. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/legacy_doc/tokens.py +0 -0
  39. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/nlp/__init__.py +0 -0
  40. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/nlp/qa.py +0 -0
  41. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/nlp/qa_labels.py +0 -0
  42. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/rec/__init__.py +0 -0
  43. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/rec/attribute.py +0 -0
  44. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/rec/base.py +0 -0
  45. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/rec/predicate.py +0 -0
  46. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/rec/record.py +0 -0
  47. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/rec/statement.py +0 -0
  48. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/types/rec/subject.py +0 -0
  49. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/utils/__init__.py +0 -0
  50. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/utils/alias.py +0 -0
  51. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/utils/file.py +0 -0
  52. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/utils/generate_docs.py +0 -0
  53. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/utils/generate_jsonschema.py +0 -0
  54. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/utils/validate.py +0 -0
  55. {docling_core-2.3.0 → docling_core-2.3.1}/docling_core/utils/validators.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: docling-core
3
- Version: 2.3.0
3
+ Version: 2.3.1
4
4
  Summary: A python library to define and validate data types in Docling.
5
5
  Home-page: https://ds4sd.github.io/
6
6
  License: MIT
@@ -183,14 +183,15 @@ class HierarchicalChunker(BaseChunker):
183
183
  )
184
184
  list_items = [] # reset
185
185
 
186
- if isinstance(
187
- item, SectionHeaderItem
188
- ) or ( # TODO remove when all captured as SectionHeaderItem:
186
+ if isinstance(item, SectionHeaderItem) or (
189
187
  isinstance(item, TextItem)
190
- and item.label == DocItemLabel.SECTION_HEADER
188
+ and item.label in [DocItemLabel.SECTION_HEADER, DocItemLabel.TITLE]
191
189
  ):
192
- # TODO second branch not needed once cleanup above complete:
193
- level = item.level if isinstance(item, SectionHeaderItem) else 1
190
+ level = (
191
+ item.level
192
+ if isinstance(item, SectionHeaderItem)
193
+ else (0 if item.label == DocItemLabel.TITLE else 1)
194
+ )
194
195
  heading_by_level[level] = item.text
195
196
 
196
197
  # remove headings of higher level as they just went out of scope
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "docling-core"
3
- version = "2.3.0"
3
+ version = "2.3.1"
4
4
  description = "A python library to define and validate data types in Docling."
5
5
  license = "MIT"
6
6
  authors = [
File without changes
File without changes