spiderforce4ai 2.4.9__py3-none-any.whl → 2.5__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
@@ -5,6 +5,9 @@ import asyncio
5
5
  import aiohttp
6
6
  import json
7
7
  import logging
8
+
9
+ logger = logging.getLogger(__name__)
10
+ import logging
8
11
  from typing import List, Dict, Union, Optional, Tuple, Callable, Any
9
12
  from dataclasses import dataclass, asdict
10
13
  from urllib.parse import urljoin, urlparse
@@ -877,7 +880,20 @@ class SpiderForce4AI:
877
880
 
878
881
  for result in successful_results:
879
882
  try:
880
- result.extraction_result = asyncio.run(agent.process_content(result.url, result.markdown))
883
+ # Get LLM response
884
+ llm_response = agent.process_content(result.url, result.markdown)
885
+ if llm_response:
886
+ # Add URL to the response before transformation
887
+ llm_response['url'] = result.url
888
+ # Apply transformation if provided
889
+ if config.post_agent_transformer_function:
890
+ try:
891
+ result.extraction_result = config.post_agent_transformer_function(llm_response)
892
+ except Exception as e:
893
+ logger.error(f"Transformer error for {result.url}: {str(e)}")
894
+ result.extraction_result = llm_response # Use original response if transform fails
895
+ else:
896
+ result.extraction_result = llm_response
881
897
  progress.update(llm_task, advance=1)
882
898
  except Exception as e:
883
899
  console.print(f"[red]Error in post-extraction processing for {result.url}: {str(e)}[/red]")
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: spiderforce4ai
3
- Version: 2.4.9
3
+ Version: 2.5
4
4
  Summary: Python wrapper for SpiderForce4AI HTML-to-Markdown conversion service with LLM post-processing
5
5
  Home-page: https://petertam.pro
6
6
  Author: Piotr Tamulewicz
@@ -0,0 +1,7 @@
1
+ spiderforce4ai/__init__.py,sha256=T0H2nqzhvXuxYMKgWAVoRrSIUV72H7yZ8SHIsbG9I4g,43327
2
+ spiderforce4ai/post_extraction_agent.py,sha256=so5Ze7Vz3konpQ0iT7ZxDGE9kIYeTwPTFyzezRc5oys,15392
3
+ spiderforce4ai-2.5.dist-info/METADATA,sha256=4iP462Pmx5GikzNhhPFHhm89BdkGqTzFDTeiPN1Xp4U,9010
4
+ spiderforce4ai-2.5.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
5
+ spiderforce4ai-2.5.dist-info/entry_points.txt,sha256=ibARQxOlDiL1ho12zbDZt4Uq5RKSIk_qk159ZlZ46hc,59
6
+ spiderforce4ai-2.5.dist-info/top_level.txt,sha256=Kth7A21Js7DCp0j5XBBi-FE45SCLouZkeNZU__Yr9Yk,15
7
+ spiderforce4ai-2.5.dist-info/RECORD,,
@@ -1,7 +0,0 @@
1
- spiderforce4ai/__init__.py,sha256=DUPOKF7-vCVQi7JimsStU1qjk5x3yVUoMnUVOJxOrGk,42360
2
- spiderforce4ai/post_extraction_agent.py,sha256=so5Ze7Vz3konpQ0iT7ZxDGE9kIYeTwPTFyzezRc5oys,15392
3
- spiderforce4ai-2.4.9.dist-info/METADATA,sha256=kEq3anAkoe_wpPVzpgaJlsSuAzTQHDgXiDFpirXvUQc,9012
4
- spiderforce4ai-2.4.9.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
5
- spiderforce4ai-2.4.9.dist-info/entry_points.txt,sha256=ibARQxOlDiL1ho12zbDZt4Uq5RKSIk_qk159ZlZ46hc,59
6
- spiderforce4ai-2.4.9.dist-info/top_level.txt,sha256=Kth7A21Js7DCp0j5XBBi-FE45SCLouZkeNZU__Yr9Yk,15
7
- spiderforce4ai-2.4.9.dist-info/RECORD,,