PyPI - chunkr-ai - Versions diffs - 0.0.35__tar.gz → 0.0.36__tar.gz - Mend

chunkr-ai 0.0.35.tar.gz → 0.0.36.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (22) hide show

{chunkr_ai-0.0.35/src/chunkr_ai.egg-info → chunkr_ai-0.0.36}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: chunkr-ai
-Version: 0.0.35
+Version: 0.0.36
 Summary: Python client for Chunkr: open source document intelligence
 Author-email: Ishaan Kapoor <ishaan@lumina.sh>
 License: MIT License

{chunkr_ai-0.0.35 → chunkr_ai-0.0.36}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "chunkr-ai"
-version = "0.0.35"
+version = "0.0.36"
 authors = [{"name" = "Ishaan Kapoor", "email" = "ishaan@lumina.sh"}]
 description = "Python client for Chunkr: open source document intelligence"
 readme = "README.md"

{chunkr_ai-0.0.35 → chunkr_ai-0.0.36}/src/chunkr_ai/api/task_response.py RENAMED Viewed

@@ -103,6 +103,29 @@ class TaskResponse(BaseModel, Generic[T]):
         r.raise_for_status()
         return await self.poll()
+    def _write_to_file(self, content: str | dict, output_file: str, is_json: bool = False) -> None:
+        """Helper method to write content to a file
+        Args:
+            content: Content to write (string or dict for JSON)
+            output_file: Path to save the content
+            is_json: Whether the content should be written as JSON
+        """
+        class DateTimeEncoder(json.JSONEncoder):
+            def default(self, obj):
+                if isinstance(obj, datetime):
+                    return obj.isoformat()
+                return super().default(obj)
+        if output_file:
+            directory = os.path.dirname(output_file)
+            if directory:
+                os.makedirs(directory, exist_ok=True)
+            with open(output_file, "w", encoding="utf-8") as f:
+                if is_json:
+                    json.dump(content, f, cls=DateTimeEncoder, indent=2)
+                else:
+                    f.write(content)
     def html(self, output_file: str = None) -> str:
         """Get the full HTML of the task
@@ -110,10 +133,7 @@ class TaskResponse(BaseModel, Generic[T]):
             output_file (str, optional): Path to save the HTML content. Defaults to None.
         """
         content = self._get_content("html")
-        if output_file:
-            os.makedirs(os.path.dirname(output_file), exist_ok=True)
-            with open(output_file, "w", encoding="utf-8") as f:
-                f.write(content)
+        self._write_to_file(content, output_file)
         return content
     def markdown(self, output_file: str = None) -> str:
@@ -123,10 +143,7 @@ class TaskResponse(BaseModel, Generic[T]):
             output_file (str, optional): Path to save the markdown content. Defaults to None.
         """
         content = self._get_content("markdown")
-        if output_file:
-            os.makedirs(os.path.dirname(output_file), exist_ok=True)
-            with open(output_file, "w", encoding="utf-8") as f:
-                f.write(content)
+        self._write_to_file(content, output_file)
         return content
     def content(self, output_file: str = None) -> str:
@@ -136,10 +153,7 @@ class TaskResponse(BaseModel, Generic[T]):
             output_file (str, optional): Path to save the content. Defaults to None.
         """
         content = self._get_content("content")
-        if output_file:
-            os.makedirs(os.path.dirname(output_file), exist_ok=True)
-            with open(output_file, "w", encoding="utf-8") as f:
-                f.write(content)
+        self._write_to_file(content, output_file)
         return content
     def json(self, output_file: str = None) -> dict:
@@ -148,17 +162,8 @@ class TaskResponse(BaseModel, Generic[T]):
         Args:
             output_file (str, optional): Path to save the task data as JSON. Defaults to None.
         """
-        class DateTimeEncoder(json.JSONEncoder):
-            def default(self, obj):
-                if isinstance(obj, datetime):
-                    return obj.isoformat()
-                return super().default(obj)
         data = self.model_dump()
-        if output_file:
-            os.makedirs(os.path.dirname(output_file), exist_ok=True)
-            with open(output_file, "w", encoding="utf-8") as f:
-                json.dump(data, f, cls=DateTimeEncoder, indent=2)
+        self._write_to_file(data, output_file, is_json=True)
         return data
     def _get_content(self, t: str) -> str:

{chunkr_ai-0.0.35 → chunkr_ai-0.0.36/src/chunkr_ai.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: chunkr-ai
-Version: 0.0.35
+Version: 0.0.36
 Summary: Python client for Chunkr: open source document intelligence
 Author-email: Ishaan Kapoor <ishaan@lumina.sh>
 License: MIT License

{chunkr_ai-0.0.35 → chunkr_ai-0.0.36}/tests/test_chunkr.py RENAMED Viewed

@@ -67,6 +67,7 @@ async def test_send_pil_image(client, sample_image):
     response = await client.upload(sample_image)
     assert response.task_id is not None
     assert response.status == "Succeeded"
+    assert response.output is not None
 @pytest.mark.asyncio
 async def test_ocr_auto(client, sample_path):
@@ -220,3 +221,32 @@ async def test_task_operations_after_client_close(client, sample_path):
     await client.close()
     result = await task.poll()
     assert result.status == "Succeeded"
+@pytest.mark.asyncio
+async def test_output_files_no_dir(client, sample_path, tmp_path):
+    await client.upload(sample_path)
+    html_file = tmp_path / "output.html"
+    md_file = tmp_path / "output.md"
+    content_file = tmp_path / "output.txt"
+    json_file = tmp_path / "output.json"
+    assert html_file.exists()
+    assert md_file.exists()
+    assert content_file.exists()
+    assert json_file.exists()
+@pytest.mark.asyncio
+async def test_output_files_with_dirs(client, sample_path, tmp_path):
+    await client.upload(sample_path)
+    nested_dir = tmp_path / "nested" / "output" / "dir"
+    html_file = nested_dir / "output.html"
+    md_file = nested_dir / "output.md"
+    content_file = nested_dir / "output.txt"
+    json_file = nested_dir / "output.json"
+    assert html_file.exists()
+    assert md_file.exists()
+    assert content_file.exists()
+    assert json_file.exists()