docling-core 2.24.0__tar.gz → 2.24.1__tar.gz

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Potentially problematic release.


This version of docling-core might be problematic. Click here for more details.

Files changed (69)
  1. {docling_core-2.24.0 → docling_core-2.24.1}/PKG-INFO +1 -1
  2. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/doc/page.py +10 -3
  3. {docling_core-2.24.0 → docling_core-2.24.1}/pyproject.toml +1 -1
  4. {docling_core-2.24.0 → docling_core-2.24.1}/LICENSE +0 -0
  5. {docling_core-2.24.0 → docling_core-2.24.1}/README.md +0 -0
  6. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/__init__.py +0 -0
  7. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/cli/__init__.py +0 -0
  8. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/cli/view.py +0 -0
  9. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/experimental/__init__.py +0 -0
  10. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/experimental/serializer/__init__.py +0 -0
  11. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/experimental/serializer/base.py +0 -0
  12. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/experimental/serializer/common.py +0 -0
  13. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/experimental/serializer/doctags.py +0 -0
  14. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/experimental/serializer/markdown.py +0 -0
  15. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/py.typed +0 -0
  16. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/doc/ANN.json +0 -0
  17. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/doc/DOC.json +0 -0
  18. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/doc/OCR-output.json +0 -0
  19. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/doc/RAW.json +0 -0
  20. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/generated/ccs_document_schema.json +0 -0
  21. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/generated/minimal_document_schema_flat.json +0 -0
  22. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/search/search_doc_mapping.json +0 -0
  23. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/resources/schemas/search/search_doc_mapping_v2.json +0 -0
  24. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/search/__init__.py +0 -0
  25. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/search/json_schema_to_search_mapper.py +0 -0
  26. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/search/mapping.py +0 -0
  27. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/search/meta.py +0 -0
  28. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/search/package.py +0 -0
  29. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/transforms/__init__.py +0 -0
  30. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/transforms/chunker/__init__.py +0 -0
  31. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/transforms/chunker/base.py +0 -0
  32. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/transforms/chunker/hierarchical_chunker.py +0 -0
  33. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/transforms/chunker/hybrid_chunker.py +0 -0
  34. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/__init__.py +0 -0
  35. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/base.py +0 -0
  36. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/doc/__init__.py +0 -0
  37. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/doc/base.py +0 -0
  38. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/doc/document.py +0 -0
  39. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/doc/labels.py +0 -0
  40. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/doc/tokens.py +0 -0
  41. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/doc/utils.py +0 -0
  42. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/gen/__init__.py +0 -0
  43. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/gen/generic.py +0 -0
  44. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/io/__init__.py +0 -0
  45. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/legacy_doc/__init__.py +0 -0
  46. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/legacy_doc/base.py +0 -0
  47. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/legacy_doc/doc_ann.py +0 -0
  48. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/legacy_doc/doc_ocr.py +0 -0
  49. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/legacy_doc/doc_raw.py +0 -0
  50. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/legacy_doc/document.py +0 -0
  51. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/legacy_doc/tokens.py +0 -0
  52. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/nlp/__init__.py +0 -0
  53. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/nlp/qa.py +0 -0
  54. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/nlp/qa_labels.py +0 -0
  55. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/rec/__init__.py +0 -0
  56. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/rec/attribute.py +0 -0
  57. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/rec/base.py +0 -0
  58. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/rec/predicate.py +0 -0
  59. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/rec/record.py +0 -0
  60. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/rec/statement.py +0 -0
  61. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/types/rec/subject.py +0 -0
  62. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/__init__.py +0 -0
  63. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/alias.py +0 -0
  64. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/file.py +0 -0
  65. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/generate_docs.py +0 -0
  66. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/generate_jsonschema.py +0 -0
  67. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/legacy.py +0 -0
  68. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/validate.py +0 -0
  69. {docling_core-2.24.0 → docling_core-2.24.1}/docling_core/utils/validators.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: docling-core
3
- Version: 2.24.0
3
+ Version: 2.24.1
4
4
  Summary: A python library to define and validate data types in Docling.
5
5
  Home-page: https://github.com/docling-project
6
6
  License: MIT
@@ -1,5 +1,6 @@
1
1
  """Datastructures for PaginatedDocument."""
2
2
 
3
+ import copy
3
4
  import json
4
5
  import logging
5
6
  import math
@@ -530,10 +531,16 @@ class SegmentedPdfPage(SegmentedPage):
530
531
  """
531
532
  cells = []
532
533
  for page_cell in self.iterate_cells(cell_unit):
533
- cell_bbox = page_cell.to_bounding_box()
534
+ pc = copy.deepcopy(page_cell)
535
+ # Bring cell_bbox coord origin to the same as input bbox.coord_origin:
536
+ if page_cell.rect.coord_origin != bbox.coord_origin:
537
+ if bbox.coord_origin == CoordOrigin.TOPLEFT:
538
+ pc.rect = pc.rect.to_top_left_origin(self.dimension.height)
539
+ elif bbox.coord_origin == CoordOrigin.BOTTOMLEFT:
540
+ pc.rect = pc.rect.to_bottom_left_origin(self.dimension.height)
541
+ cell_bbox = pc.to_bounding_box()
534
542
  if cell_bbox.intersection_over_self(bbox) > ios:
535
- cells.append(page_cell)
536
-
543
+ cells.append(pc)
537
544
  return cells
538
545
 
539
546
  def export_to_dict(self) -> Dict:
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "docling-core"
3
- version = "2.24.0"
3
+ version = "2.24.1"
4
4
  description = "A python library to define and validate data types in Docling."
5
5
  license = "MIT"
6
6
  authors = [
File without changes
File without changes