firecrawl 2.9.0.tar.gz → 2.10.0.tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of firecrawl has been flagged as possibly problematic by the registry diff service.
- {firecrawl-2.9.0 → firecrawl-2.10.0}/LICENSE +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/PKG-INFO +1 -1
- {firecrawl-2.9.0 → firecrawl-2.10.0}/README.md +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl/__init__.py +1 -1
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl/__tests__/e2e_withAuth/__init__.py +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl/__tests__/e2e_withAuth/test.py +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl/__tests__/v1/e2e_withAuth/__init__.py +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl/__tests__/v1/e2e_withAuth/test.py +25 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl/firecrawl.py +7 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl.egg-info/PKG-INFO +1 -1
- {firecrawl-2.9.0 → firecrawl-2.10.0}/tests/test_change_tracking.py +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl.egg-info/SOURCES.txt +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl.egg-info/dependency_links.txt +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl.egg-info/requires.txt +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/firecrawl.egg-info/top_level.txt +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/pyproject.toml +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/setup.cfg +0 -0
- {firecrawl-2.9.0 → firecrawl-2.10.0}/setup.py +0 -0
firecrawl/__init__.py

@@ -13,7 +13,7 @@ import os
 
 from .firecrawl import FirecrawlApp, AsyncFirecrawlApp, JsonConfig, ScrapeOptions, ChangeTrackingOptions # noqa
 
-__version__ = "2.9.0"
+__version__ = "2.10.0"
 
 # Define the logger for the Firecrawl project
 logger: logging.Logger = logging.getLogger("firecrawl")
firecrawl/__tests__/v1/e2e_withAuth/test.py

@@ -437,4 +437,29 @@ def test_search_with_invalid_params():
         app.search("test query", {"invalid_param": "value"})
     assert "ValidationError" in str(e.value)
 
+# def test_scrape_url_with_parse_pdf_true():
+#     if TEST_API_KEY:
+#         app = FirecrawlApp(api_url=API_URL, api_key=TEST_API_KEY)
+#         response = app.scrape_url('https://arxiv.org/pdf/astro-ph/9301001.pdf', parse_pdf=True)
+#         assert response is not None
+#         assert 'markdown' in response
+#         assert len(response['markdown']) > 100
+
+# def test_scrape_url_with_parse_pdf_false():
+#     if TEST_API_KEY:
+#         app = FirecrawlApp(api_url=API_URL, api_key=TEST_API_KEY)
+#         response = app.scrape_url('https://arxiv.org/pdf/astro-ph/9301001.pdf', parse_pdf=False)
+#         assert response is not None
+#         assert 'markdown' in response
+#         assert 'h7uKu14adDL6yGfnGf2qycY5uq8kC3OKCWkPxm' in response['markdown']
+
+# def test_scrape_options_with_parse_pdf():
+#     if TEST_API_KEY:
+#         from firecrawl.firecrawl import ScrapeOptions
+#         app = FirecrawlApp(api_url=API_URL, api_key=TEST_API_KEY)
+#         scrape_options = ScrapeOptions(parsePDF=False, formats=['markdown'])
+#         response = app.search("firecrawl", limit=1, scrape_options=scrape_options)
+#         assert response is not None
+#         assert 'data' in response
+
 
firecrawl/firecrawl.py

@@ -160,6 +160,7 @@ class ScrapeOptions(pydantic.BaseModel):
     changeTrackingOptions: Optional[ChangeTrackingOptions] = None
     maxAge: Optional[int] = None
     storeInCache: Optional[bool] = None
+    parsePDF: Optional[bool] = None
 
 class WaitAction(pydantic.BaseModel):
     """Wait action to perform during scraping."""
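The new parsePDF field mirrors the commented-out test_scrape_options_with_parse_pdf above. A minimal sketch of how it would be passed through search(), assuming a valid API key; the key below is a placeholder, and the return shape is not asserted here since the tests ship commented out:

from firecrawl import FirecrawlApp, ScrapeOptions

app = FirecrawlApp(api_key="fc-YOUR-API-KEY")  # placeholder key, not part of this release

# parsePDF=False asks the service to skip PDF-to-markdown conversion for scraped results.
options = ScrapeOptions(parsePDF=False, formats=["markdown"])
results = app.search("firecrawl", limit=1, scrape_options=options)
print(results)

The remaining hunks in firecrawl/firecrawl.py thread the same flag through the synchronous and asynchronous scrape_url methods.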
@@ -465,6 +466,7 @@ class FirecrawlApp:
         remove_base64_images: Optional[bool] = None,
         block_ads: Optional[bool] = None,
         proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
+        parse_pdf: Optional[bool] = None,
         extract: Optional[JsonConfig] = None,
         json_options: Optional[JsonConfig] = None,
         actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,

@@ -538,6 +540,8 @@ class FirecrawlApp:
             scrape_params['blockAds'] = block_ads
         if proxy:
             scrape_params['proxy'] = proxy
+        if parse_pdf is not None:
+            scrape_params['parsePDF'] = parse_pdf
         if extract is not None:
             extract = self._ensure_schema_dict(extract)
             if isinstance(extract, dict) and "schema" in extract:
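The two hunks above add a matching parse_pdf keyword to FirecrawlApp.scrape_url and forward it to the request body as parsePDF only when it is explicitly set: both True and False are sent, while leaving it unset keeps the server default. A minimal synchronous sketch, reusing the arXiv PDF URL from the commented-out tests and a placeholder key:

from firecrawl import FirecrawlApp

app = FirecrawlApp(api_key="fc-YOUR-API-KEY")  # placeholder key

# parse_pdf=True requests PDF parsing; the SDK maps it to 'parsePDF' in the payload.
doc = app.scrape_url("https://arxiv.org/pdf/astro-ph/9301001.pdf", parse_pdf=True)
print(doc)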
@@ -2904,6 +2908,7 @@ class AsyncFirecrawlApp(FirecrawlApp):
         remove_base64_images: Optional[bool] = None,
         block_ads: Optional[bool] = None,
         proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
+        parse_pdf: Optional[bool] = None,
         extract: Optional[JsonConfig] = None,
         json_options: Optional[JsonConfig] = None,
         actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,

@@ -2981,6 +2986,8 @@ class AsyncFirecrawlApp(FirecrawlApp):
             scrape_params['blockAds'] = block_ads
         if proxy:
             scrape_params['proxy'] = proxy
+        if parse_pdf is not None:
+            scrape_params['parsePDF'] = parse_pdf
         if extract is not None:
             extract = self._ensure_schema_dict(extract)
             if isinstance(extract, dict) and "schema" in extract:
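AsyncFirecrawlApp receives the identical parameter and mapping. A sketch of the asynchronous equivalent, assuming scrape_url is awaited on the async client as its class name suggests (same placeholder key and test URL):

import asyncio

from firecrawl import AsyncFirecrawlApp

async def main():
    app = AsyncFirecrawlApp(api_key="fc-YOUR-API-KEY")  # placeholder key
    # Same mapping as the sync client: parse_pdf -> 'parsePDF' in the request body.
    doc = await app.scrape_url("https://arxiv.org/pdf/astro-ph/9301001.pdf", parse_pdf=False)
    print(doc)

asyncio.run(main())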