firecrawl 1.2.0__tar.gz → 1.2.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of firecrawl might be problematic. Click here for more details.
- {firecrawl-1.2.0 → firecrawl-1.2.2}/PKG-INFO +1 -1
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl/__init__.py +1 -1
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl/firecrawl.py +17 -25
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl.egg-info/PKG-INFO +1 -1
- {firecrawl-1.2.0 → firecrawl-1.2.2}/LICENSE +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/README.md +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl/__tests__/e2e_withAuth/__init__.py +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl/__tests__/e2e_withAuth/test.py +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl/__tests__/v1/e2e_withAuth/__init__.py +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl/__tests__/v1/e2e_withAuth/test.py +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl.egg-info/SOURCES.txt +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl.egg-info/dependency_links.txt +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl.egg-info/requires.txt +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/firecrawl.egg-info/top_level.txt +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/pyproject.toml +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/setup.cfg +0 -0
- {firecrawl-1.2.0 → firecrawl-1.2.2}/setup.py +0 -0
|
@@ -59,31 +59,17 @@ class FirecrawlApp:
|
|
|
59
59
|
|
|
60
60
|
# If there are additional params, process them
|
|
61
61
|
if params:
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
if
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
if key not in ['extractorOptions']:
|
|
74
|
-
scrape_params[key] = value
|
|
75
|
-
elif self.version == 'v1':
|
|
76
|
-
# Handle extract (for v1)
|
|
77
|
-
extract = params.get('extract', {})
|
|
78
|
-
if extract:
|
|
79
|
-
if 'schema' in extract and hasattr(extract['schema'], 'schema'):
|
|
80
|
-
extract['schema'] = extract['schema'].schema()
|
|
81
|
-
scrape_params['extract'] = extract
|
|
82
|
-
|
|
83
|
-
# Include any other params directly at the top level of scrape_params
|
|
84
|
-
for key, value in params.items():
|
|
85
|
-
if key not in ['extract']:
|
|
86
|
-
scrape_params[key] = value
|
|
62
|
+
# Handle extract (for v1)
|
|
63
|
+
extract = params.get('extract', {})
|
|
64
|
+
if extract:
|
|
65
|
+
if 'schema' in extract and hasattr(extract['schema'], 'schema'):
|
|
66
|
+
extract['schema'] = extract['schema'].schema()
|
|
67
|
+
scrape_params['extract'] = extract
|
|
68
|
+
|
|
69
|
+
# Include any other params directly at the top level of scrape_params
|
|
70
|
+
for key, value in params.items():
|
|
71
|
+
if key not in ['extract']:
|
|
72
|
+
scrape_params[key] = value
|
|
87
73
|
|
|
88
74
|
endpoint = f'/v1/scrape'
|
|
89
75
|
# Make the POST request with the prepared headers and JSON data
|
|
@@ -360,6 +346,12 @@ class FirecrawlApp:
 status_data = status_response.json()
 if status_data['status'] == 'completed':
     if 'data' in status_data:
+        data = status_data['data']
+        while 'next' in status_data:
+            status_response = self._get_request(status_data['next'], headers)
+            status_data = status_response.json()
+            data.extend(status_data['data'])
+        status_data['data'] = data
         return status_data
     else:
         raise Exception('Crawl job completed but no data was returned')
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|