sparrow-parse 1.0.1__tar.gz → 1.0.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (27)
  1. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/PKG-INFO +1 -1
  2. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/setup.py +1 -1
  3. sparrow-parse-1.0.2/sparrow_parse/__init__.py +1 -0
  4. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/extractors/vllm_extractor.py +8 -0
  5. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse.egg-info/PKG-INFO +1 -1
  6. sparrow-parse-1.0.1/sparrow_parse/__init__.py +0 -1
  7. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/README.md +0 -0
  8. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/setup.cfg +0 -0
  9. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/__main__.py +0 -0
  10. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/extractors/__init__.py +0 -0
  11. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/helpers/__init__.py +0 -0
  12. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/helpers/image_optimizer.py +0 -0
  13. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/helpers/pdf_optimizer.py +0 -0
  14. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/processors/__init__.py +0 -0
  15. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/processors/table_structure_processor.py +0 -0
  16. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/text_extraction.py +0 -0
  17. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/vllm/__init__.py +0 -0
  18. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/vllm/huggingface_inference.py +0 -0
  19. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/vllm/inference_base.py +0 -0
  20. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/vllm/inference_factory.py +0 -0
  21. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/vllm/local_gpu_inference.py +0 -0
  22. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse/vllm/mlx_inference.py +0 -0
  23. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse.egg-info/SOURCES.txt +0 -0
  24. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse.egg-info/dependency_links.txt +0 -0
  25. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse.egg-info/entry_points.txt +0 -0
  26. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse.egg-info/requires.txt +0 -0
  27. {sparrow-parse-1.0.1 → sparrow-parse-1.0.2}/sparrow_parse.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: sparrow-parse
3
- Version: 1.0.1
3
+ Version: 1.0.2
4
4
  Summary: Sparrow Parse is a Python package (part of Sparrow) for parsing and extracting information from documents.
5
5
  Home-page: https://github.com/katanaml/sparrow/tree/main/sparrow-data/parse
6
6
  Author: Andrej Baranovskij
@@ -8,7 +8,7 @@ with open("requirements.txt", "r", encoding="utf-8") as fh:
8
8
 
9
9
  setup(
10
10
  name="sparrow-parse",
11
- version="1.0.1",
11
+ version="1.0.2",
12
12
  author="Andrej Baranovskij",
13
13
  author_email="andrejus.baranovskis@gmail.com",
14
14
  description="Sparrow Parse is a Python package (part of Sparrow) for parsing and extracting information from documents.",
@@ -0,0 +1 @@
1
+ __version__ = '1.0.2'
@@ -147,6 +147,14 @@ class VLLMExtractor(object):
147
147
  table_detector = TableDetector()
148
148
  cropped_tables = table_detector.detect_tables(file_path, local=False, debug_dir=debug_dir, debug=debug)
149
149
  results_array = []
150
+
151
+ # Check if no tables were found
152
+ if cropped_tables is None:
153
+ if debug:
154
+ print(f"No tables detected in {file_path}")
155
+ # Return a structured no-tables-found response instead of failing
156
+ return [json.dumps({"message": "No tables detected in the document", "status": "empty"})]
157
+
150
158
  temp_dir = tempfile.mkdtemp()
151
159
 
152
160
  for i, table in enumerate(cropped_tables):
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: sparrow-parse
3
- Version: 1.0.1
3
+ Version: 1.0.2
4
4
  Summary: Sparrow Parse is a Python package (part of Sparrow) for parsing and extracting information from documents.
5
5
  Home-page: https://github.com/katanaml/sparrow/tree/main/sparrow-data/parse
6
6
  Author: Andrej Baranovskij
@@ -1 +0,0 @@
1
- __version__ = '1.0.1'
File without changes
File without changes