spiderforce4ai 2.6.4__tar.gz → 2.6.6__tar.gz
Sign up to get free protection for your applications and to get access to all the features.
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/PKG-INFO +1 -1
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/pyproject.toml +1 -1
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/setup.py +1 -1
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai/post_extraction_agent.py +21 -5
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai.egg-info/PKG-INFO +1 -1
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/README.md +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/setup.cfg +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai/__init__.py +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai.egg-info/SOURCES.txt +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai.egg-info/dependency_links.txt +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai.egg-info/entry_points.txt +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai.egg-info/not-zip-safe +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai.egg-info/requires.txt +0 -0
- {spiderforce4ai-2.6.4 → spiderforce4ai-2.6.6}/spiderforce4ai.egg-info/top_level.txt +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "spiderforce4ai"
|
7
|
-
version = "2.6.4"
|
7
|
+
version = "2.6.6"
|
8
8
|
description = "Python wrapper for SpiderForce4AI HTML-to-Markdown conversion service with LLM post-processing"
|
9
9
|
readme = "README.md"
|
10
10
|
authors = [
|
@@ -7,7 +7,7 @@ with open("README.md", encoding="utf-8") as f:
|
|
7
7
|
|
8
8
|
setup(
|
9
9
|
name="spiderforce4ai",
|
10
|
-
version="2.6.4",
|
10
|
+
version="2.6.6",
|
11
11
|
author="Piotr Tamulewicz",
|
12
12
|
author_email="pt@petertam.pro",
|
13
13
|
description="Python wrapper for SpiderForce4AI HTML-to-Markdown conversion service with LLM post-processing",
|
@@ -285,11 +285,16 @@ class PostExtractionAgent:
|
|
285
285
|
try:
|
286
286
|
with open(self.config.output_file, 'r', encoding='utf-8') as f:
|
287
287
|
current_results = json.load(f)
|
288
|
+
# Convert to list if it's a dict, or initialize new list
|
289
|
+
if isinstance(current_results, dict):
|
290
|
+
current_results = list(current_results.values())
|
291
|
+
elif not isinstance(current_results, list):
|
292
|
+
current_results = []
|
288
293
|
except (json.JSONDecodeError, FileNotFoundError):
|
289
|
-
current_results =
|
294
|
+
current_results = []
|
290
295
|
|
291
|
-
#
|
292
|
-
current_results
|
296
|
+
# Add new result to list
|
297
|
+
current_results.append(result)
|
293
298
|
|
294
299
|
# Save atomically using temporary file
|
295
300
|
temp_file = self.config.output_file.with_suffix('.tmp')
|
@@ -341,15 +346,26 @@ class PostExtractionAgent:
|
|
341
346
|
# Add URL to result before transformation
|
342
347
|
result['url'] = url
|
343
348
|
|
344
|
-
logger.info(f"Executing
|
349
|
+
logger.info(f"Executing transformer function for {url}")
|
345
350
|
transformed_result = self.config.custom_transform_function(result)
|
346
351
|
logger.info(f"Successfully applied custom transformation for {url}")
|
352
|
+
|
353
|
+
# Save the transformed result to combined output
|
354
|
+
if self.config.output_file:
|
355
|
+
self._save_result_sync(url, transformed_result)
|
356
|
+
logger.info(f"Saved transformed result to combined output for {url}")
|
357
|
+
|
347
358
|
logger.info(f"Webhook response sent for {url}")
|
348
|
-
return transformed_result
|
359
|
+
return transformed_result
|
349
360
|
except Exception as e:
|
350
361
|
error_msg = f"Warning: Issue in custom transform for {url}: {str(e)}"
|
351
362
|
logger.warning(error_msg)
|
352
363
|
console.print(f"[yellow]{error_msg}[/yellow]")
|
364
|
+
|
365
|
+
# Save original result if transformation fails
|
366
|
+
if self.config.output_file:
|
367
|
+
self._save_result_sync(url, result)
|
368
|
+
logger.info(f"Saved original result to combined output for {url}")
|
353
369
|
|
354
370
|
# Save result synchronously
|
355
371
|
try:
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|