firecrawl-py 2.7.0__tar.gz → 2.8.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of firecrawl-py might be problematic. Click here for more details.
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/PKG-INFO +1 -1
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl/__init__.py +1 -1
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl/firecrawl.py +24 -11
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl_py.egg-info/PKG-INFO +1 -1
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/LICENSE +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/README.md +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl/__tests__/e2e_withAuth/__init__.py +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl/__tests__/e2e_withAuth/test.py +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl/__tests__/v1/e2e_withAuth/__init__.py +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl/__tests__/v1/e2e_withAuth/test.py +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl_py.egg-info/SOURCES.txt +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl_py.egg-info/dependency_links.txt +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl_py.egg-info/requires.txt +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/firecrawl_py.egg-info/top_level.txt +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/pyproject.toml +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/setup.cfg +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/setup.py +0 -0
- {firecrawl_py-2.7.0 → firecrawl_py-2.8.0}/tests/test_change_tracking.py +0 -0
|
@@ -13,7 +13,7 @@ import os
|
|
|
13
13
|
|
|
14
14
|
from .firecrawl import FirecrawlApp, AsyncFirecrawlApp, JsonConfig, ScrapeOptions, ChangeTrackingOptions # noqa
|
|
15
15
|
|
|
16
|
-
__version__ = "2.7.0"
|
|
16
|
+
__version__ = "2.8.0"
|
|
17
17
|
|
|
18
18
|
# Define the logger for the Firecrawl project
|
|
19
19
|
logger: logging.Logger = logging.getLogger("firecrawl")
|
|
@@ -140,6 +140,7 @@ class ChangeTrackingOptions(pydantic.BaseModel):
|
|
|
140
140
|
modes: Optional[List[Literal["git-diff", "json"]]] = None
|
|
141
141
|
schema: Optional[Any] = None
|
|
142
142
|
prompt: Optional[str] = None
|
|
143
|
+
tag: Optional[str] = None
|
|
143
144
|
|
|
144
145
|
class ScrapeOptions(pydantic.BaseModel):
|
|
145
146
|
"""Parameters for scraping operations."""
|
|
@@ -155,8 +156,10 @@ class ScrapeOptions(pydantic.BaseModel):
|
|
|
155
156
|
skipTlsVerification: Optional[bool] = None
|
|
156
157
|
removeBase64Images: Optional[bool] = None
|
|
157
158
|
blockAds: Optional[bool] = None
|
|
158
|
-
proxy: Optional[Literal["basic", "stealth"]] = None
|
|
159
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None
|
|
159
160
|
changeTrackingOptions: Optional[ChangeTrackingOptions] = None
|
|
161
|
+
maxAge: Optional[int] = None
|
|
162
|
+
storeInCache: Optional[bool] = None
|
|
160
163
|
|
|
161
164
|
class WaitAction(pydantic.BaseModel):
|
|
162
165
|
"""Wait action to perform during scraping."""
|
|
@@ -292,6 +295,7 @@ class MapParams(pydantic.BaseModel):
|
|
|
292
295
|
sitemapOnly: Optional[bool] = None
|
|
293
296
|
limit: Optional[int] = None
|
|
294
297
|
timeout: Optional[int] = None
|
|
298
|
+
useIndex: Optional[bool] = None
|
|
295
299
|
|
|
296
300
|
class MapResponse(pydantic.BaseModel):
|
|
297
301
|
"""Response from mapping operations."""
|
|
@@ -459,11 +463,13 @@ class FirecrawlApp:
|
|
|
459
463
|
skip_tls_verification: Optional[bool] = None,
|
|
460
464
|
remove_base64_images: Optional[bool] = None,
|
|
461
465
|
block_ads: Optional[bool] = None,
|
|
462
|
-
proxy: Optional[Literal["basic", "stealth"]] = None,
|
|
466
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
|
|
463
467
|
extract: Optional[JsonConfig] = None,
|
|
464
468
|
json_options: Optional[JsonConfig] = None,
|
|
465
469
|
actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,
|
|
466
470
|
change_tracking_options: Optional[ChangeTrackingOptions] = None,
|
|
471
|
+
max_age: Optional[int] = None,
|
|
472
|
+
store_in_cache: Optional[bool] = None,
|
|
467
473
|
**kwargs) -> ScrapeResponse[Any]:
|
|
468
474
|
"""
|
|
469
475
|
Scrape and extract content from a URL.
|
|
@@ -481,7 +487,7 @@ class FirecrawlApp:
|
|
|
481
487
|
skip_tls_verification (Optional[bool]): Skip TLS verification
|
|
482
488
|
remove_base64_images (Optional[bool]): Remove base64 images
|
|
483
489
|
block_ads (Optional[bool]): Block ads
|
|
484
|
-
proxy (Optional[Literal["basic", "stealth"]]): Proxy type (basic/stealth)
|
|
490
|
+
proxy (Optional[Literal["basic", "stealth", "auto"]]): Proxy type (basic/stealth)
|
|
485
491
|
extract (Optional[JsonConfig]): Content extraction settings
|
|
486
492
|
json_options (Optional[JsonConfig]): JSON extraction settings
|
|
487
493
|
actions (Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]]): Actions to perform
|
|
@@ -545,6 +551,10 @@ class FirecrawlApp:
|
|
|
545
551
|
scrape_params['actions'] = [action if isinstance(action, dict) else action.dict(exclude_none=True) for action in actions]
|
|
546
552
|
if change_tracking_options:
|
|
547
553
|
scrape_params['changeTrackingOptions'] = change_tracking_options if isinstance(change_tracking_options, dict) else change_tracking_options.dict(exclude_none=True)
|
|
554
|
+
if max_age is not None:
|
|
555
|
+
scrape_params['maxAge'] = max_age
|
|
556
|
+
if store_in_cache is not None:
|
|
557
|
+
scrape_params['storeInCache'] = store_in_cache
|
|
548
558
|
|
|
549
559
|
scrape_params.update(kwargs)
|
|
550
560
|
|
|
@@ -1102,6 +1112,7 @@ class FirecrawlApp:
|
|
|
1102
1112
|
sitemap_only: Optional[bool] = None,
|
|
1103
1113
|
limit: Optional[int] = None,
|
|
1104
1114
|
timeout: Optional[int] = None,
|
|
1115
|
+
use_index: Optional[bool] = None,
|
|
1105
1116
|
**kwargs) -> MapResponse:
|
|
1106
1117
|
"""
|
|
1107
1118
|
Map and discover links from a URL.
|
|
@@ -1144,7 +1155,9 @@ class FirecrawlApp:
|
|
|
1144
1155
|
map_params['limit'] = limit
|
|
1145
1156
|
if timeout is not None:
|
|
1146
1157
|
map_params['timeout'] = timeout
|
|
1147
|
-
|
|
1158
|
+
if use_index is not None:
|
|
1159
|
+
map_params['useIndex'] = use_index
|
|
1160
|
+
|
|
1148
1161
|
# Add any additional kwargs
|
|
1149
1162
|
map_params.update(kwargs)
|
|
1150
1163
|
|
|
@@ -1191,7 +1204,7 @@ class FirecrawlApp:
|
|
|
1191
1204
|
skip_tls_verification: Optional[bool] = None,
|
|
1192
1205
|
remove_base64_images: Optional[bool] = None,
|
|
1193
1206
|
block_ads: Optional[bool] = None,
|
|
1194
|
-
proxy: Optional[Literal["basic", "stealth"]] = None,
|
|
1207
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
|
|
1195
1208
|
extract: Optional[JsonConfig] = None,
|
|
1196
1209
|
json_options: Optional[JsonConfig] = None,
|
|
1197
1210
|
actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,
|
|
@@ -1325,7 +1338,7 @@ class FirecrawlApp:
|
|
|
1325
1338
|
skip_tls_verification: Optional[bool] = None,
|
|
1326
1339
|
remove_base64_images: Optional[bool] = None,
|
|
1327
1340
|
block_ads: Optional[bool] = None,
|
|
1328
|
-
proxy: Optional[Literal["basic", "stealth"]] = None,
|
|
1341
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
|
|
1329
1342
|
extract: Optional[JsonConfig] = None,
|
|
1330
1343
|
json_options: Optional[JsonConfig] = None,
|
|
1331
1344
|
actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,
|
|
@@ -1457,7 +1470,7 @@ class FirecrawlApp:
|
|
|
1457
1470
|
skip_tls_verification: Optional[bool] = None,
|
|
1458
1471
|
remove_base64_images: Optional[bool] = None,
|
|
1459
1472
|
block_ads: Optional[bool] = None,
|
|
1460
|
-
proxy: Optional[Literal["basic", "stealth"]] = None,
|
|
1473
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
|
|
1461
1474
|
extract: Optional[JsonConfig] = None,
|
|
1462
1475
|
json_options: Optional[JsonConfig] = None,
|
|
1463
1476
|
actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,
|
|
@@ -2852,7 +2865,7 @@ class AsyncFirecrawlApp(FirecrawlApp):
|
|
|
2852
2865
|
skip_tls_verification: Optional[bool] = None,
|
|
2853
2866
|
remove_base64_images: Optional[bool] = None,
|
|
2854
2867
|
block_ads: Optional[bool] = None,
|
|
2855
|
-
proxy: Optional[Literal["basic", "stealth"]] = None,
|
|
2868
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
|
|
2856
2869
|
extract: Optional[JsonConfig] = None,
|
|
2857
2870
|
json_options: Optional[JsonConfig] = None,
|
|
2858
2871
|
actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,
|
|
@@ -2873,7 +2886,7 @@ class AsyncFirecrawlApp(FirecrawlApp):
|
|
|
2873
2886
|
skip_tls_verification (Optional[bool]): Skip TLS verification
|
|
2874
2887
|
remove_base64_images (Optional[bool]): Remove base64 images
|
|
2875
2888
|
block_ads (Optional[bool]): Block ads
|
|
2876
|
-
proxy (Optional[Literal["basic", "stealth"]]): Proxy type (basic/stealth)
|
|
2889
|
+
proxy (Optional[Literal["basic", "stealth", "auto"]]): Proxy type (basic/stealth)
|
|
2877
2890
|
extract (Optional[JsonConfig]): Content extraction settings
|
|
2878
2891
|
json_options (Optional[JsonConfig]): JSON extraction settings
|
|
2879
2892
|
actions (Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]]): Actions to perform
|
|
@@ -2981,7 +2994,7 @@ class AsyncFirecrawlApp(FirecrawlApp):
|
|
|
2981
2994
|
skip_tls_verification: Optional[bool] = None,
|
|
2982
2995
|
remove_base64_images: Optional[bool] = None,
|
|
2983
2996
|
block_ads: Optional[bool] = None,
|
|
2984
|
-
proxy: Optional[Literal["basic", "stealth"]] = None,
|
|
2997
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
|
|
2985
2998
|
extract: Optional[JsonConfig] = None,
|
|
2986
2999
|
json_options: Optional[JsonConfig] = None,
|
|
2987
3000
|
actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,
|
|
@@ -3120,7 +3133,7 @@ class AsyncFirecrawlApp(FirecrawlApp):
|
|
|
3120
3133
|
skip_tls_verification: Optional[bool] = None,
|
|
3121
3134
|
remove_base64_images: Optional[bool] = None,
|
|
3122
3135
|
block_ads: Optional[bool] = None,
|
|
3123
|
-
proxy: Optional[Literal["basic", "stealth"]] = None,
|
|
3136
|
+
proxy: Optional[Literal["basic", "stealth", "auto"]] = None,
|
|
3124
3137
|
extract: Optional[JsonConfig] = None,
|
|
3125
3138
|
json_options: Optional[JsonConfig] = None,
|
|
3126
3139
|
actions: Optional[List[Union[WaitAction, ScreenshotAction, ClickAction, WriteAction, PressAction, ScrollAction, ScrapeAction, ExecuteJavascriptAction]]] = None,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|