docling-jobkit 1.9.1__py3-none-any.whl → 1.10.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -208,6 +208,7 @@ class DoclingConverterManager:
208
208
  do_code_enrichment=request.do_code_enrichment,
209
209
  do_formula_enrichment=request.do_formula_enrichment,
210
210
  do_picture_classification=request.do_picture_classification,
211
+ do_chart_extraction=request.do_chart_extraction,
211
212
  do_picture_description=request.do_picture_description,
212
213
  )
213
214
  pipeline_options.table_structure_options = TableStructureOptions(
@@ -454,6 +454,17 @@ class ConvertDocumentsOptions(BaseModel):
454
454
  ),
455
455
  ] = False
456
456
 
457
+ do_chart_extraction: Annotated[
458
+ bool,
459
+ Field(
460
+ description=(
461
+ "If enabled, extract numeric data from charts. "
462
+ "Boolean. Optional, defaults to false."
463
+ ),
464
+ examples=[False],
465
+ ),
466
+ ] = False
467
+
457
468
  do_picture_description: Annotated[
458
469
  bool,
459
470
  Field(
@@ -255,4 +255,6 @@ class RQOrchestrator(BaseOrchestrator):
255
255
  raise RuntimeError("No connection to Redis")
256
256
 
257
257
  async def clear_converters(self):
258
- pass
258
+ self._rq_queue.enqueue(
259
+ "docling_jobkit.orchestrators.rq.worker.clear_cache_task",
260
+ )
@@ -187,6 +187,16 @@ def docling_task(
187
187
  return result_key
188
188
 
189
189
 
190
+ def clear_cache_task(conversion_manager: DoclingConverterManager, **_):
191
+ """RQ job that clears the converter cache on the worker."""
192
+ _log.info("Clearing converter cache on worker")
193
+ conversion_manager.clear_cache()
194
+ import gc
195
+
196
+ gc.collect()
197
+ _log.info("Converter cache cleared")
198
+
199
+
190
200
  def run_worker(
191
201
  rq_config: Optional[RQOrchestratorConfig] = None,
192
202
  cm_config: Optional[DoclingConverterManagerConfig] = None,
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: docling-jobkit
3
- Version: 1.9.1
3
+ Version: 1.10.1
4
4
  Summary: Running a distributed job processing documents with Docling.
5
5
  Project-URL: Homepage, https://github.com/docling-project/docling-jobkit
6
6
  Project-URL: Documentation, https://docling-project.github.io/docling/usage/jobkit/
@@ -27,7 +27,7 @@ Classifier: Topic :: Software Development :: Libraries :: Python Modules
27
27
  Classifier: Typing :: Typed
28
28
  Requires-Python: >=3.10
29
29
  Requires-Dist: boto3~=1.35
30
- Requires-Dist: docling~=2.60
30
+ Requires-Dist: docling~=2.72
31
31
  Requires-Dist: httpx<1,>=0.28
32
32
  Requires-Dist: pandas~=2.2
33
33
  Requires-Dist: pydantic-settings~=2.4
@@ -19,13 +19,13 @@ docling_jobkit/connectors/target_processor.py,sha256=2iIJE7Ip_-1dxJGt02_ALwDC2BP
19
19
  docling_jobkit/connectors/target_processor_factory.py,sha256=A-ZuwQiuYK6HVNHTZomIVBZ3tC9D6femv3-7PSNQkEA,901
20
20
  docling_jobkit/convert/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
21
21
  docling_jobkit/convert/chunking.py,sha256=vvdrvg66JB8Snwnbo7yzYXox6b2rRFDS9R4UyTXvq58,12014
22
- docling_jobkit/convert/manager.py,sha256=SPsPGf600vXL1H0tcXyQ7L7CCJlQcAz9gsetX4XWSPo,15938
22
+ docling_jobkit/convert/manager.py,sha256=-FAmtQf4j4pl49r7WRsd_yejTZ44Art_uyUhIUDCdp8,15999
23
23
  docling_jobkit/convert/results.py,sha256=vQvOuXIdlmPskHwUJlXX2zyJSb2k20ip5TfzuyPH5mU,9053
24
24
  docling_jobkit/convert/results_processor.py,sha256=obwFclxHEmAO_9wsJD6qqd2F0OfQy6ysO-ZJbc3MPF4,16559
25
25
  docling_jobkit/datamodel/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
26
26
  docling_jobkit/datamodel/callback.py,sha256=telxud7vFVxXxuP3iZn59ArrnRoUr0XZu5tQfCnMG0U,1157
27
27
  docling_jobkit/datamodel/chunking.py,sha256=ju_5BkCadPJnv_iKpnxFHkD8ermOOBrWSElz78mn7W8,2216
28
- docling_jobkit/datamodel/convert.py,sha256=pJdXlCQrXDYPpp9ZxgFmc3OlJsHmLhk1n-KA1g3c6Do,19285
28
+ docling_jobkit/datamodel/convert.py,sha256=6wR1hm-zQt17DiMcFgaCK63AjbYElyhwxTFQpgq4v5o,19568
29
29
  docling_jobkit/datamodel/google_drive_coords.py,sha256=Gb_V0qY0YIMXpMRhKMKyr3Yqbpt7IPQ1qHmhnJfM07M,3596
30
30
  docling_jobkit/datamodel/http_inputs.py,sha256=jQF7fD_lbq1bI1z5snHe4q9wuWhEi8p1_tnNt47xVOk,1182
31
31
  docling_jobkit/datamodel/result.py,sha256=WaasDSc_aAyuN3wfGlWqt1ZksC_5tIDHcafgeVpzKeQ,3369
@@ -50,12 +50,12 @@ docling_jobkit/orchestrators/local/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQe
50
50
  docling_jobkit/orchestrators/local/orchestrator.py,sha256=swMw3a-Lm4a13poLV2JE33uF_EeBDyM3VZ71Dhbt-_o,4921
51
51
  docling_jobkit/orchestrators/local/worker.py,sha256=v4YNAZsSIcnNzsLDXot_3jdiy_lfIlH4h6E1hLRixS0,5818
52
52
  docling_jobkit/orchestrators/rq/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
53
- docling_jobkit/orchestrators/rq/orchestrator.py,sha256=sP0EzjhKST8R6tPW3cVyaAzGWNDd-7AdaWhWMUi7QY8,9259
54
- docling_jobkit/orchestrators/rq/worker.py,sha256=tSGQCMFgHZTUqmIVkhVq8bYFdVl0eyhcm7NT22vmsHk,6719
53
+ docling_jobkit/orchestrators/rq/orchestrator.py,sha256=HglKgoEWOgFzeF_EooIWJw12TDUjJ9YEADUkl-a1pw8,9359
54
+ docling_jobkit/orchestrators/rq/worker.py,sha256=TR2kurNQK9aBFZqAV1nFALm2B7qmPRQDDgZAzhIQpDM,7019
55
55
  docling_jobkit/ray_job/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
56
56
  docling_jobkit/ray_job/main.py,sha256=6VyAsn9wk3v09qH4uQb4u1YnesX_-1DJrEg2MkDXy2k,13648
57
- docling_jobkit-1.9.1.dist-info/METADATA,sha256=1yNU0nhZJp9vLnBg03KKRDKa7edkBtnmXOZbfpOZbRM,10475
58
- docling_jobkit-1.9.1.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
59
- docling_jobkit-1.9.1.dist-info/entry_points.txt,sha256=-tTX7hZPMCPZ2zVSUhI2BTPFglsds_A6PbCpPR7gUVM,181
60
- docling_jobkit-1.9.1.dist-info/licenses/LICENSE,sha256=mBb7ErEcM8VS9OhiGHnQ2kk75HwPhr54W1Oiz3965MY,1088
61
- docling_jobkit-1.9.1.dist-info/RECORD,,
57
+ docling_jobkit-1.10.1.dist-info/METADATA,sha256=aGgZYN1vtI7Ag1UkNwbg7XpJ8FZHn9Wyk_PQDLaBunk,10476
58
+ docling_jobkit-1.10.1.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
59
+ docling_jobkit-1.10.1.dist-info/entry_points.txt,sha256=-tTX7hZPMCPZ2zVSUhI2BTPFglsds_A6PbCpPR7gUVM,181
60
+ docling_jobkit-1.10.1.dist-info/licenses/LICENSE,sha256=mBb7ErEcM8VS9OhiGHnQ2kk75HwPhr54W1Oiz3965MY,1088
61
+ docling_jobkit-1.10.1.dist-info/RECORD,,