aiecs 1.0.8__py3-none-any.whl → 1.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of aiecs might be problematic.

Files changed (81)
  1. aiecs/__init__.py +1 -1
  2. aiecs/aiecs_client.py +159 -1
  3. aiecs/config/config.py +6 -0
  4. aiecs/domain/__init__.py +95 -0
  5. aiecs/domain/community/__init__.py +159 -0
  6. aiecs/domain/community/agent_adapter.py +516 -0
  7. aiecs/domain/community/analytics.py +465 -0
  8. aiecs/domain/community/collaborative_workflow.py +99 -7
  9. aiecs/domain/community/communication_hub.py +649 -0
  10. aiecs/domain/community/community_builder.py +322 -0
  11. aiecs/domain/community/community_integration.py +365 -12
  12. aiecs/domain/community/community_manager.py +481 -5
  13. aiecs/domain/community/decision_engine.py +459 -13
  14. aiecs/domain/community/exceptions.py +238 -0
  15. aiecs/domain/community/models/__init__.py +36 -0
  16. aiecs/domain/community/resource_manager.py +1 -1
  17. aiecs/domain/community/shared_context_manager.py +621 -0
  18. aiecs/domain/context/__init__.py +24 -0
  19. aiecs/domain/context/context_engine.py +37 -33
  20. aiecs/main.py +20 -2
  21. aiecs/scripts/aid/VERSION_MANAGEMENT.md +97 -0
  22. aiecs/scripts/aid/__init__.py +15 -0
  23. aiecs/scripts/aid/version_manager.py +224 -0
  24. aiecs/scripts/dependance_check/__init__.py +18 -0
  25. aiecs/scripts/{download_nlp_data.py → dependance_check/download_nlp_data.py} +51 -8
  26. aiecs/scripts/dependance_patch/__init__.py +8 -0
  27. aiecs/scripts/dependance_patch/fix_weasel/__init__.py +12 -0
  28. aiecs/scripts/tools_develop/README.md +340 -0
  29. aiecs/scripts/tools_develop/__init__.py +16 -0
  30. aiecs/scripts/tools_develop/check_type_annotations.py +263 -0
  31. aiecs/scripts/tools_develop/validate_tool_schemas.py +346 -0
  32. aiecs/tools/__init__.py +53 -34
  33. aiecs/tools/docs/__init__.py +106 -0
  34. aiecs/tools/docs/ai_document_orchestrator.py +556 -0
  35. aiecs/tools/docs/ai_document_writer_orchestrator.py +2222 -0
  36. aiecs/tools/docs/content_insertion_tool.py +1234 -0
  37. aiecs/tools/docs/document_creator_tool.py +1179 -0
  38. aiecs/tools/docs/document_layout_tool.py +1105 -0
  39. aiecs/tools/docs/document_parser_tool.py +924 -0
  40. aiecs/tools/docs/document_writer_tool.py +1636 -0
  41. aiecs/tools/langchain_adapter.py +102 -51
  42. aiecs/tools/schema_generator.py +265 -0
  43. aiecs/tools/statistics/__init__.py +82 -0
  44. aiecs/tools/statistics/ai_data_analysis_orchestrator.py +581 -0
  45. aiecs/tools/statistics/ai_insight_generator_tool.py +473 -0
  46. aiecs/tools/statistics/ai_report_orchestrator_tool.py +629 -0
  47. aiecs/tools/statistics/data_loader_tool.py +518 -0
  48. aiecs/tools/statistics/data_profiler_tool.py +599 -0
  49. aiecs/tools/statistics/data_transformer_tool.py +531 -0
  50. aiecs/tools/statistics/data_visualizer_tool.py +460 -0
  51. aiecs/tools/statistics/model_trainer_tool.py +470 -0
  52. aiecs/tools/statistics/statistical_analyzer_tool.py +426 -0
  53. aiecs/tools/task_tools/chart_tool.py +2 -1
  54. aiecs/tools/task_tools/image_tool.py +43 -43
  55. aiecs/tools/task_tools/office_tool.py +48 -36
  56. aiecs/tools/task_tools/pandas_tool.py +37 -33
  57. aiecs/tools/task_tools/report_tool.py +67 -56
  58. aiecs/tools/task_tools/research_tool.py +32 -31
  59. aiecs/tools/task_tools/scraper_tool.py +53 -46
  60. aiecs/tools/task_tools/search_tool.py +1123 -0
  61. aiecs/tools/task_tools/stats_tool.py +20 -15
  62. {aiecs-1.0.8.dist-info → aiecs-1.2.0.dist-info}/METADATA +5 -1
  63. aiecs-1.2.0.dist-info/RECORD +135 -0
  64. aiecs-1.2.0.dist-info/entry_points.txt +10 -0
  65. aiecs/tools/task_tools/search_api.py +0 -7
  66. aiecs-1.0.8.dist-info/RECORD +0 -98
  67. aiecs-1.0.8.dist-info/entry_points.txt +0 -7
  68. /aiecs/scripts/{DEPENDENCY_SYSTEM_SUMMARY.md → dependance_check/DEPENDENCY_SYSTEM_SUMMARY.md} +0 -0
  69. /aiecs/scripts/{README_DEPENDENCY_CHECKER.md → dependance_check/README_DEPENDENCY_CHECKER.md} +0 -0
  70. /aiecs/scripts/{dependency_checker.py → dependance_check/dependency_checker.py} +0 -0
  71. /aiecs/scripts/{dependency_fixer.py → dependance_check/dependency_fixer.py} +0 -0
  72. /aiecs/scripts/{quick_dependency_check.py → dependance_check/quick_dependency_check.py} +0 -0
  73. /aiecs/scripts/{setup_nlp_data.sh → dependance_check/setup_nlp_data.sh} +0 -0
  74. /aiecs/scripts/{README_WEASEL_PATCH.md → dependance_patch/fix_weasel/README_WEASEL_PATCH.md} +0 -0
  75. /aiecs/scripts/{fix_weasel_validator.py → dependance_patch/fix_weasel/fix_weasel_validator.py} +0 -0
  76. /aiecs/scripts/{fix_weasel_validator.sh → dependance_patch/fix_weasel/fix_weasel_validator.sh} +0 -0
  77. /aiecs/scripts/{patch_weasel_library.sh → dependance_patch/fix_weasel/patch_weasel_library.sh} +0 -0
  78. /aiecs/scripts/{run_weasel_patch.sh → dependance_patch/fix_weasel/run_weasel_patch.sh} +0 -0
  79. {aiecs-1.0.8.dist-info → aiecs-1.2.0.dist-info}/WHEEL +0 -0
  80. {aiecs-1.0.8.dist-info → aiecs-1.2.0.dist-info}/licenses/LICENSE +0 -0
  81. {aiecs-1.0.8.dist-info → aiecs-1.2.0.dist-info}/top_level.txt +0 -0
@@ -12,8 +12,7 @@ from urllib.parse import urlparse, urljoin
 import httpx
 from bs4 import BeautifulSoup
 from urllib import request as urllib_request
-from pydantic import BaseModel, ValidationError, ConfigDict
-from pydantic_settings import BaseSettings
+from pydantic import BaseModel, ValidationError, ConfigDict, Field
 
 from aiecs.tools.base_tool import BaseTool
 from aiecs.tools import register_tool
@@ -45,31 +44,6 @@ class RenderEngine(str, Enum):
     NONE = "none"
     PLAYWRIGHT = "playwright"
 
-# Global settings
-class ScraperSettings(BaseSettings):
-    """
-    Configuration for ScraperTool.
-
-    Attributes:
-        user_agent (str): User agent for HTTP requests.
-        max_content_length (int): Maximum content length in bytes.
-        output_dir (str): Directory for output files.
-        scrapy_command (str): Command to run Scrapy.
-        allowed_domains (List[str]): Allowed domains for scraping.
-        blocked_domains (List[str]): Blocked domains for scraping.
-        playwright_available (bool): Whether Playwright is available.
-        env_prefix (str): Environment variable prefix.
-    """
-    user_agent: str = "PythonMiddlewareScraper/2.0"
-    max_content_length: int = 10 * 1024 * 1024  # 10MB
-    output_dir: str = os.path.join(tempfile.gettempdir(), 'scraper_outputs')
-    scrapy_command: str = "scrapy"
-    allowed_domains: List[str] = []
-    blocked_domains: List[str] = []
-    playwright_available: bool = False
-    env_prefix: str = "SCRAPER_TOOL_"
-
-    model_config = ConfigDict(env_prefix="SCRAPER_TOOL_")
 
 # Exceptions
 class ScraperToolError(Exception):
@@ -117,39 +91,72 @@ class ScraperTool(BaseTool):
     - Scrapy integration for advanced crawling
     - Output in various formats: text, JSON, HTML, Markdown, CSV
     """
+
+    # Configuration schema
+    class Config(BaseModel):
+        """Configuration for the scraper tool"""
+        model_config = ConfigDict(env_prefix="SCRAPER_TOOL_")
+
+        user_agent: str = Field(
+            default="PythonMiddlewareScraper/2.0",
+            description="User agent for HTTP requests"
+        )
+        max_content_length: int = Field(
+            default=10 * 1024 * 1024,
+            description="Maximum content length in bytes"
+        )
+        output_dir: str = Field(
+            default=os.path.join(tempfile.gettempdir(), 'scraper_outputs'),
+            description="Directory for output files"
+        )
+        scrapy_command: str = Field(
+            default="scrapy",
+            description="Command to run Scrapy"
+        )
+        allowed_domains: List[str] = Field(
+            default=[],
+            description="Allowed domains for scraping"
+        )
+        blocked_domains: List[str] = Field(
+            default=[],
+            description="Blocked domains for scraping"
+        )
+        playwright_available: bool = Field(
+            default=False,
+            description="Whether Playwright is available (auto-detected)"
+        )
+
     def __init__(self, config: Optional[Dict] = None):
         """
         Initialize ScraperTool with settings and resources.
 
         Args:
-            config (Dict, optional): Configuration overrides for ScraperSettings.
+            config (Dict, optional): Configuration overrides for ScraperTool.
 
         Raises:
             ValueError: If config contains invalid settings.
         """
         super().__init__(config)
-        self.settings = ScraperSettings()
-        if config:
-            try:
-                self.settings = self.settings.model_validate({**self.settings.model_dump(), **config})
-            except ValidationError as e:
-                raise ValueError(f"Invalid settings: {e}")
+
+        # Parse configuration
+        self.config = self.Config(**(config or {}))
+
         self.logger = logging.getLogger(__name__)
         if not self.logger.handlers:
             handler = logging.StreamHandler()
             handler.setFormatter(logging.Formatter('%(asctime)s %(levelname)s %(message)s'))
             self.logger.addHandler(handler)
             self.logger.setLevel(logging.INFO)
-        os.makedirs(self.settings.output_dir, exist_ok=True)
+        os.makedirs(self.config.output_dir, exist_ok=True)
         self._check_external_tools()
 
     def _check_external_tools(self):
         """Check if external tools are available."""
         try:
             import playwright
-            self.settings.playwright_available = True
+            self.config.playwright_available = True
         except ImportError:
-            self.settings.playwright_available = False
+            self.config.playwright_available = False
 
 
     async def _save_output(self, content: Any, path: str, format: OutputFormat) -> None:
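Taken together, the two hunks above replace the module-level pydantic-settings ScraperSettings class with a Config model nested inside ScraperTool. Below is a minimal sketch of how the new pattern behaves, assuming pydantic v2; ScraperToolSketch and its reduced field set are illustrative, not the actual class. One caveat worth noting: a plain BaseModel does not read environment variables, so the SCRAPER_TOOL_ prefix recorded in model_config is only honored if something else in the framework applies it.

    # Sketch of the new nested-Config pattern (assumes pydantic v2).
    import os
    import tempfile
    from typing import Dict, Optional

    from pydantic import BaseModel, ConfigDict, Field

    class ScraperToolSketch:
        """Illustrative stand-in for ScraperTool, config handling only."""

        class Config(BaseModel):
            # On a plain BaseModel, env_prefix is informational: reading
            # SCRAPER_TOOL_* environment variables is pydantic-settings
            # behavior, and this release drops pydantic_settings.
            model_config = ConfigDict(env_prefix="SCRAPER_TOOL_")

            user_agent: str = Field(default="PythonMiddlewareScraper/2.0")
            max_content_length: int = Field(default=10 * 1024 * 1024)  # 10 MB
            output_dir: str = Field(
                default=os.path.join(tempfile.gettempdir(), "scraper_outputs")
            )

        def __init__(self, config: Optional[Dict] = None):
            # Bad values raise pydantic.ValidationError, which subclasses
            # ValueError, so "Raises: ValueError" in the docstring still holds.
            self.config = self.Config(**(config or {}))

    tool = ScraperToolSketch({"user_agent": "MyBot/1.0"})
    print(tool.config.user_agent)          # MyBot/1.0
    print(tool.config.max_content_length)  # 10485760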
@@ -232,7 +239,7 @@ class ScraperTool(BaseTool):
         try:
             headers = headers or {}
             if 'User-Agent' not in headers:
-                headers['User-Agent'] = self.settings.user_agent
+                headers['User-Agent'] = self.config.user_agent
             kwargs = {
                 'params': params,
                 'headers': headers,
@@ -261,7 +268,7 @@ class ScraperTool(BaseTool):
         except httpx.HTTPStatusError as e:
             raise HttpError(f"HTTP {e.response.status_code}: {e.response.reason_phrase} for {url}")
 
-        if len(resp.content) > self.settings.max_content_length:
+        if len(resp.content) > self.config.max_content_length:
             raise HttpError(f"Response content too large: {len(resp.content)} bytes")
 
         if content_type == ContentType.JSON:
@@ -308,7 +315,7 @@ class ScraperTool(BaseTool):
 
         headers = headers or {}
         if 'User-Agent' not in headers:
-            headers['User-Agent'] = self.settings.user_agent
+            headers['User-Agent'] = self.config.user_agent
         data_bytes = None
         if data:
             data_bytes = urllib.parse.urlencode(data).encode()
@@ -320,7 +327,7 @@ class ScraperTool(BaseTool):
         )
         with urllib_request.urlopen(req) as resp:
             content_length = resp.getheader('Content-Length')
-            if content_length and int(content_length) > self.settings.max_content_length:
+            if content_length and int(content_length) > self.config.max_content_length:
                 raise HttpError(f"Response content too large: {content_length} bytes")
             content = resp.read()
             charset = resp.headers.get_content_charset() or 'utf-8'
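Both fetch paths enforce the same size cap: the httpx path checks len(resp.content) after download, while the urllib path above pre-checks the Content-Length header. A self-contained sketch of the urllib guard follows; fetch_guarded, HttpError, and the 10 MB constant are illustrative stand-ins for the tool's own names.

    # Sketch of the Content-Length guard on the urllib path.
    from urllib import request as urllib_request

    MAX_CONTENT_LENGTH = 10 * 1024 * 1024  # mirrors the default above

    class HttpError(Exception):
        pass

    def fetch_guarded(url: str) -> str:
        req = urllib_request.Request(
            url, headers={"User-Agent": "PythonMiddlewareScraper/2.0"}
        )
        with urllib_request.urlopen(req) as resp:
            # Content-Length is advisory; a server may omit or misreport it,
            # so this pre-check rejects oversized responses before reading.
            content_length = resp.getheader("Content-Length")
            if content_length and int(content_length) > MAX_CONTENT_LENGTH:
                raise HttpError(f"Response content too large: {content_length} bytes")
            content = resp.read()
            charset = resp.headers.get_content_charset() or "utf-8"
            return content.decode(charset, errors="replace")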
@@ -375,7 +382,7 @@ class ScraperTool(BaseTool):
         """
         try:
             if engine == RenderEngine.PLAYWRIGHT:
-                if not self.settings.playwright_available:
+                if not self.config.playwright_available:
                     raise RenderingError("Playwright is not available. Install with 'pip install playwright'")
                 result = await self._render_with_playwright(url, wait_time, wait_selector, scroll_to_bottom, screenshot, screenshot_path)
             else:
@@ -393,7 +400,7 @@ class ScraperTool(BaseTool):
         async with async_playwright() as p:
             browser = await p.chromium.launch()
             page = await browser.new_page(
-                user_agent=self.settings.user_agent,
+                user_agent=self.config.user_agent,
                 viewport={'width': 1280, 'height': 800}
             )
             try:
@@ -407,7 +414,7 @@ class ScraperTool(BaseTool):
             await page.wait_for_timeout(1000)
             screenshot_result = None
             if screenshot:
-                screenshot_path = screenshot_path or os.path.join(self.settings.output_dir, f"screenshot_{int(time.time())}.png")
+                screenshot_path = screenshot_path or os.path.join(self.config.output_dir, f"screenshot_{int(time.time())}.png")
                 os.makedirs(os.path.dirname(os.path.abspath(screenshot_path)), exist_ok=True)
                 await page.screenshot(path=screenshot_path)
                 screenshot_result = screenshot_path
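The rendering hunks only swap self.settings for self.config, but together they outline the whole Playwright flow. A minimal standalone sketch of that flow, assuming playwright is installed (pip install playwright, then playwright install chromium); the render coroutine and its simplified wait and screenshot handling are illustrative.

    # Sketch of the Playwright render flow shown above, as one coroutine.
    import asyncio
    import os
    import tempfile
    import time

    from playwright.async_api import async_playwright

    async def render(url: str, screenshot: bool = False) -> dict:
        async with async_playwright() as p:
            browser = await p.chromium.launch()
            page = await browser.new_page(
                user_agent="PythonMiddlewareScraper/2.0",
                viewport={"width": 1280, "height": 800},
            )
            try:
                await page.goto(url)
                await page.wait_for_timeout(1000)  # the diff's settle wait
                shot_path = None
                if screenshot:
                    shot_path = os.path.join(
                        tempfile.gettempdir(), f"screenshot_{int(time.time())}.png"
                    )
                    await page.screenshot(path=shot_path)
                html = await page.content()
                return {"html": html, "screenshot": shot_path}
            finally:
                await browser.close()

    # asyncio.run(render("https://example.com", screenshot=True))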
@@ -447,10 +454,10 @@ class ScraperTool(BaseTool):
         start_time = time.time()
         os.makedirs(os.path.dirname(os.path.abspath(output_path)), exist_ok=True)
         cmd = [
-            self.settings.scrapy_command,
+            self.config.scrapy_command,
             'crawl', spider_name,
             '-o', output_path,
-            '-s', f'USER_AGENT={self.settings.user_agent}',
+            '-s', f'USER_AGENT={self.config.user_agent}',
             '-s', 'LOG_LEVEL=INFO'
         ]
         if spider_args:
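This last hunk only assembles the Scrapy command line; how it is executed is outside the diff. A hedged sketch of running an equivalent command with the standard library: run_spider is illustrative, and subprocess.run is an assumption about how the tool invokes Scrapy, not the package's confirmed runner. The crawl, -o, and -s flags come straight from the hunk and are standard Scrapy CLI options.

    # Sketch: executing the assembled Scrapy command (execution method assumed).
    import subprocess

    def run_spider(spider_name: str, output_path: str, user_agent: str,
                   scrapy_command: str = "scrapy") -> subprocess.CompletedProcess:
        cmd = [
            scrapy_command,
            "crawl", spider_name,
            "-o", output_path,
            "-s", f"USER_AGENT={user_agent}",
            "-s", "LOG_LEVEL=INFO",
        ]
        # check=True surfaces a non-zero exit as CalledProcessError.
        return subprocess.run(cmd, capture_output=True, text=True, check=True)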