spiderforce4ai 2.4.9__py3-none-any.whl → 2.5__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
@@ -5,6 +5,9 @@ import asyncio
5
5
  import aiohttp
6
6
  import json
7
7
  import logging
8
+
9
+ logger = logging.getLogger(__name__)
10
+ import logging
8
11
  from typing import List, Dict, Union, Optional, Tuple, Callable, Any
9
12
  from dataclasses import dataclass, asdict
10
13
  from urllib.parse import urljoin, urlparse
@@ -877,7 +880,20 @@ class SpiderForce4AI:
877
880
 
878
881
  for result in successful_results:
879
882
  try:
880
- result.extraction_result = asyncio.run(agent.process_content(result.url, result.markdown))
883
+ # Get LLM response
884
+ llm_response = agent.process_content(result.url, result.markdown)
885
+ if llm_response:
886
+ # Add URL to the response before transformation
887
+ llm_response['url'] = result.url
888
+ # Apply transformation if provided
889
+ if config.post_agent_transformer_function:
890
+ try:
891
+ result.extraction_result = config.post_agent_transformer_function(llm_response)
892
+ except Exception as e:
893
+ logger.error(f"Transformer error for {result.url}: {str(e)}")
894
+ result.extraction_result = llm_response # Use original response if transform fails
895
+ else:
896
+ result.extraction_result = llm_response
881
897
  progress.update(llm_task, advance=1)
882
898
  except Exception as e:
883
899
  console.print(f"[red]Error in post-extraction processing for {result.url}: {str(e)}[/red]")
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: spiderforce4ai
3
- Version: 2.4.9
3
+ Version: 2.5
4
4
  Summary: Python wrapper for SpiderForce4AI HTML-to-Markdown conversion service with LLM post-processing
5
5
  Home-page: https://petertam.pro
6
6
  Author: Piotr Tamulewicz
@@ -0,0 +1,7 @@
1
+ spiderforce4ai/__init__.py,sha256=T0H2nqzhvXuxYMKgWAVoRrSIUV72H7yZ8SHIsbG9I4g,43327
2
+ spiderforce4ai/post_extraction_agent.py,sha256=so5Ze7Vz3konpQ0iT7ZxDGE9kIYeTwPTFyzezRc5oys,15392
3
+ spiderforce4ai-2.5.dist-info/METADATA,sha256=4iP462Pmx5GikzNhhPFHhm89BdkGqTzFDTeiPN1Xp4U,9010
4
+ spiderforce4ai-2.5.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
5
+ spiderforce4ai-2.5.dist-info/entry_points.txt,sha256=ibARQxOlDiL1ho12zbDZt4Uq5RKSIk_qk159ZlZ46hc,59
6
+ spiderforce4ai-2.5.dist-info/top_level.txt,sha256=Kth7A21Js7DCp0j5XBBi-FE45SCLouZkeNZU__Yr9Yk,15
7
+ spiderforce4ai-2.5.dist-info/RECORD,,
@@ -1,7 +0,0 @@
1
- spiderforce4ai/__init__.py,sha256=DUPOKF7-vCVQi7JimsStU1qjk5x3yVUoMnUVOJxOrGk,42360
2
- spiderforce4ai/post_extraction_agent.py,sha256=so5Ze7Vz3konpQ0iT7ZxDGE9kIYeTwPTFyzezRc5oys,15392
3
- spiderforce4ai-2.4.9.dist-info/METADATA,sha256=kEq3anAkoe_wpPVzpgaJlsSuAzTQHDgXiDFpirXvUQc,9012
4
- spiderforce4ai-2.4.9.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
5
- spiderforce4ai-2.4.9.dist-info/entry_points.txt,sha256=ibARQxOlDiL1ho12zbDZt4Uq5RKSIk_qk159ZlZ46hc,59
6
- spiderforce4ai-2.4.9.dist-info/top_level.txt,sha256=Kth7A21Js7DCp0j5XBBi-FE45SCLouZkeNZU__Yr9Yk,15
7
- spiderforce4ai-2.4.9.dist-info/RECORD,,