PyPI - entari-plugin-hyw - Versions diffs - 0.3.5__py3-none-any.whl → 4.0.0rc14__py3-none-any.whl - Mend

entari-plugin-hyw 0.3.5__py3-none-any.whl → 4.0.0rc14__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of entari-plugin-hyw might be problematic. Click here for more details.

Files changed (78) hide show

entari_plugin_hyw/Untitled-1 +1865 -0
entari_plugin_hyw/__init__.py +979 -116
entari_plugin_hyw/filters.py +83 -0
entari_plugin_hyw/history.py +251 -0
entari_plugin_hyw/misc.py +214 -0
entari_plugin_hyw/search_cache.py +154 -0
entari_plugin_hyw-4.0.0rc14.dist-info/METADATA +118 -0
entari_plugin_hyw-4.0.0rc14.dist-info/RECORD +72 -0
{entari_plugin_hyw-0.3.5.dist-info → entari_plugin_hyw-4.0.0rc14.dist-info}/WHEEL +1 -1
{entari_plugin_hyw-0.3.5.dist-info → entari_plugin_hyw-4.0.0rc14.dist-info}/top_level.txt +1 -0
hyw_core/__init__.py +94 -0
hyw_core/agent.py +768 -0
hyw_core/browser_control/__init__.py +63 -0
hyw_core/browser_control/assets/card-dist/index.html +425 -0
hyw_core/browser_control/assets/card-dist/logos/anthropic.svg +1 -0
hyw_core/browser_control/assets/card-dist/logos/cerebras.svg +9 -0
hyw_core/browser_control/assets/card-dist/logos/deepseek.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/gemini.svg +1 -0
hyw_core/browser_control/assets/card-dist/logos/google.svg +1 -0
hyw_core/browser_control/assets/card-dist/logos/grok.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/huggingface.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/microsoft.svg +15 -0
hyw_core/browser_control/assets/card-dist/logos/minimax.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/mistral.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/nvida.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/openai.svg +1 -0
hyw_core/browser_control/assets/card-dist/logos/openrouter.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/perplexity.svg +24 -0
hyw_core/browser_control/assets/card-dist/logos/qwen.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/xai.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/xiaomi.png +0 -0
hyw_core/browser_control/assets/card-dist/logos/zai.png +0 -0
hyw_core/browser_control/assets/card-dist/vite.svg +1 -0
hyw_core/browser_control/assets/index.html +5691 -0
hyw_core/browser_control/assets/logos/anthropic.svg +1 -0
hyw_core/browser_control/assets/logos/cerebras.svg +9 -0
hyw_core/browser_control/assets/logos/deepseek.png +0 -0
hyw_core/browser_control/assets/logos/gemini.svg +1 -0
hyw_core/browser_control/assets/logos/google.svg +1 -0
hyw_core/browser_control/assets/logos/grok.png +0 -0
hyw_core/browser_control/assets/logos/huggingface.png +0 -0
hyw_core/browser_control/assets/logos/microsoft.svg +15 -0
hyw_core/browser_control/assets/logos/minimax.png +0 -0
hyw_core/browser_control/assets/logos/mistral.png +0 -0
hyw_core/browser_control/assets/logos/nvida.png +0 -0
hyw_core/browser_control/assets/logos/openai.svg +1 -0
hyw_core/browser_control/assets/logos/openrouter.png +0 -0
hyw_core/browser_control/assets/logos/perplexity.svg +24 -0
hyw_core/browser_control/assets/logos/qwen.png +0 -0
hyw_core/browser_control/assets/logos/xai.png +0 -0
hyw_core/browser_control/assets/logos/xiaomi.png +0 -0
hyw_core/browser_control/assets/logos/zai.png +0 -0
hyw_core/browser_control/engines/__init__.py +15 -0
hyw_core/browser_control/engines/base.py +13 -0
hyw_core/browser_control/engines/default.py +166 -0
hyw_core/browser_control/engines/duckduckgo.py +171 -0
hyw_core/browser_control/landing.html +172 -0
hyw_core/browser_control/manager.py +173 -0
hyw_core/browser_control/renderer.py +446 -0
hyw_core/browser_control/service.py +940 -0
hyw_core/config.py +154 -0
hyw_core/core.py +462 -0
hyw_core/crawling/__init__.py +18 -0
hyw_core/crawling/completeness.py +437 -0
hyw_core/crawling/models.py +88 -0
hyw_core/definitions.py +104 -0
hyw_core/image_cache.py +274 -0
hyw_core/pipeline.py +502 -0
hyw_core/search.py +171 -0
hyw_core/stages/__init__.py +21 -0
hyw_core/stages/base.py +95 -0
hyw_core/stages/summary.py +191 -0
entari_plugin_hyw/agent.py +0 -419
entari_plugin_hyw/compressor.py +0 -59
entari_plugin_hyw/tools.py +0 -236
entari_plugin_hyw/vision.py +0 -35
entari_plugin_hyw-0.3.5.dist-info/METADATA +0 -112
entari_plugin_hyw-0.3.5.dist-info/RECORD +0 -9

hyw_core/stages/__init__.py ADDED Viewed

@@ -0,0 +1,21 @@
+"""
+hyw_core.stages - Pipeline Stages
+This subpackage provides the pipeline stage implementations:
+- BaseStage: Abstract base class for all stages
+- StageContext: Shared context between stages
+- StageResult: Stage execution result
+- SummaryStage: Final response generation
+NOTE(review): an "InstructStage" (initial task planning and search execution)
+used to be listed here, but this module neither imports nor exports it -
+confirm where it lives before relying on it.
+"""
+# Re-export the stage API so callers can import it from hyw_core.stages directly.
+from .base import BaseStage, StageContext, StageResult
+from .summary import SummaryStage
+# Names exposed by "from hyw_core.stages import *".
+__all__ = [
+    "BaseStage",
+    "StageContext",
+    "StageResult",
+    "SummaryStage",
+]

hyw_core/stages/base.py ADDED Viewed

@@ -0,0 +1,95 @@
+"""
+Stage Base Classes
+Abstract base classes for pipeline stages.
+Each stage is a self-contained unit of work.
+"""
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from typing import Any, Dict, List, Optional
+from openai import AsyncOpenAI
+@dataclass
+class StageContext:
+    """Mutable state handed from one pipeline stage to the next."""
+    # --- Request payload ---
+    user_input: str
+    images: List[str] = field(default_factory=list)
+    conversation_history: List[Dict] = field(default_factory=list)
+    # Per-round history kept for the Instruct stage
+    instruct_history: List[Dict] = field(default_factory=list)
+    # --- Data gathered while the pipeline runs ---
+    web_results: List[Dict] = field(default_factory=list)
+    agent_context: str = ""
+    # Hand-off text from the Instruct stage to the Review stage
+    review_context: str = ""
+    # --- Planning output (filled in by the Instruct stage) ---
+    task_list: List[str] = field(default_factory=list)
+    # --- Control flags ---
+    should_refuse: bool = False
+    refuse_reason: str = ""
+    # Either "fast" or "deepsearch"
+    selected_mode: str = "fast"
+    # Running counter behind next_id(), used for unified referencing
+    global_id_counter: int = 0
+    # Model capability: whether image input is supported
+    image_input_supported: bool = True
+    # Search timing
+    search_time: float = 0.0
+    def next_id(self) -> int:
+        """Advance the shared counter by one and return the new value."""
+        fresh_id = self.global_id_counter + 1
+        self.global_id_counter = fresh_id
+        return fresh_id
+@dataclass
+class StageResult:
+    """Outcome reported by a single stage execution."""
+    # Success flag set by the stage
+    success: bool
+    # Stage payload
+    data: Dict[str, Any] = field(default_factory=dict)
+    # Token accounting; every instance starts with its own zeroed counters
+    usage: Dict[str, int] = field(default_factory=lambda: dict(input_tokens=0, output_tokens=0))
+    # Diagnostic details recorded for tracing
+    trace: Dict[str, Any] = field(default_factory=dict)
+    # Error message, or None when no error was recorded
+    error: Optional[str] = None
+class BaseStage(ABC):
+    """
+    Abstract base class for pipeline stages.
+    Subclasses supply ``name`` and ``execute``; the constructor only stores the
+    shared config, search service and default OpenAI client.
+    """
+    def __init__(self, config: Any, search_service: Any, client: AsyncOpenAI):
+        self.config = config
+        self.search_service = search_service
+        self.client = client
+    @property
+    @abstractmethod
+    def name(self) -> str:
+        """Stage name for logging and tracing."""
+        pass
+    @abstractmethod
+    async def execute(self, context: StageContext) -> StageResult:
+        """
+        Execute the stage.
+        Args:
+            context: Shared context with accumulated data
+        Returns:
+            StageResult with success status, data, usage, and trace info
+        """
+        pass
+    def _client_for(self, api_key: Optional[str], base_url: Optional[str]) -> AsyncOpenAI:
+        """
+        Get or create a client for custom credentials.
+        Args:
+            api_key: Override API key; falls back to ``config.api_key`` when empty.
+            base_url: Override base URL; falls back to ``config.base_url`` when empty.
+        Returns:
+            The default client when neither override is given, otherwise a
+            client for the resolved credentials. One client is kept per
+            (base_url, api_key) pair so repeated calls reuse it instead of
+            building a new client each time.
+        """
+        if not (api_key or base_url):
+            return self.client
+        resolved_url = base_url or self.config.base_url
+        resolved_key = api_key or self.config.api_key
+        # Created lazily so subclasses whose __init__ skips super().__init__() still work.
+        cache = getattr(self, "_client_cache", None)
+        if cache is None:
+            cache = {}
+            self._client_cache = cache
+        cache_key = (resolved_url, resolved_key)
+        cached = cache.get(cache_key)
+        if cached is None:
+            cached = AsyncOpenAI(base_url=resolved_url, api_key=resolved_key)
+            cache[cache_key] = cached
+        return cached

hyw_core/stages/summary.py ADDED Viewed

@@ -0,0 +1,191 @@
+"""
+Summary Stage
+Generates final response based on gathered information.
+Different output formats for different modes.
+"""
+import time
+import re
+from typing import Any, Dict, List, Optional
+from loguru import logger
+from openai import AsyncOpenAI
+from .base import BaseStage, StageContext, StageResult
+from ..definitions import SUMMARY_REPORT_SP, get_refuse_answer_tool
+class SummaryStage(BaseStage):
+    """
+    Summary Stage: Generate final response.
+    Builds a prompt from the accumulated agent context and web results, asks
+    the "main" model for the answer, and reports a refusal when the model
+    calls the ``refuse_answer`` tool.
+    """
+    # Markdown link "[text](url)"; group 1 captures the link text
+    _MD_LINK_RE = re.compile(r'\[([^\]]+)\]\([^\)]+\)')
+    # Bare http/https URL, up to the next whitespace
+    _BARE_URL_RE = re.compile(r'https?://\S+')
+    # Result types that _format_web_content actually renders
+    _RENDERED_TYPES = ("page", "search")
+    @property
+    def name(self) -> str:
+        """Stage name for logging and tracing."""
+        return "Summary"
+    async def execute(
+        self,
+        context: StageContext,
+        images: Optional[List[str]] = None
+    ) -> StageResult:
+        """
+        Generate the final summary.
+        Args:
+            context: Shared context. ``agent_context``, ``web_results`` and
+                ``user_input`` are read; ``should_refuse`` and
+                ``refuse_reason`` are set when the model refuses.
+            images: Optional images, given as base64 payloads or ``data:`` URLs.
+        Returns:
+            StageResult whose ``data["content"]`` holds the answer, a
+            "Refused: ..." message, or an error description. ``success`` is
+            False when the LLM call fails or returns no choices.
+        """
+        # Monotonic clock: only the elapsed duration is reported in the trace
+        start_time = time.perf_counter()
+        # Format context from web results
+        web_content = self._format_web_content(context)
+        # Tools
+        refuse_tool = get_refuse_answer_tool()
+        full_context = f"{context.agent_context}\n\n{web_content}"
+        # Select prompt
+        language = getattr(self.config, "language", "Simplified Chinese")
+        system_prompt = SUMMARY_REPORT_SP + f"\n\n用户要求的语言: {language}"
+        # Build Context Message
+        context_message = f"## Web Search & Page Content\n\n```context\n{full_context}\n```"
+        messages = [
+            {"role": "system", "content": system_prompt},
+            {"role": "user", "content": context_message},
+            {"role": "user", "content": self._build_user_content(context.user_input, images)}
+        ]
+        # Get model config
+        model_cfg = self.config.get_model_config("main")
+        client = self._client_for(
+            api_key=model_cfg.api_key,
+            base_url=model_cfg.base_url
+        )
+        model = model_cfg.model_name or self.config.model_name
+        try:
+            response = await client.chat.completions.create(
+                model=model,
+                messages=messages,
+                temperature=self.config.temperature,
+                extra_body=getattr(self.config, "summary_extra_body", None),
+                tools=[refuse_tool],
+                tool_choice="auto",
+            )
+        except Exception as e:
+            # Boundary with the remote API: report any failure as a failed stage
+            logger.error(f"SummaryStage LLM error: {e}")
+            return StageResult(
+                success=False,
+                error=str(e),
+                data={"content": f"Error generating summary: {e}"}
+            )
+        usage = self._extract_usage(response)
+        choices = getattr(response, "choices", None)
+        if not choices:
+            # Guard against an empty choices list instead of raising IndexError
+            error = "LLM response contained no choices"
+            logger.error(f"SummaryStage LLM error: {error}")
+            return StageResult(
+                success=False,
+                error=error,
+                data={"content": f"Error generating summary: {error}"},
+                usage=usage
+            )
+        message = choices[0].message
+        # Handle Tool Calls (Refusal)
+        reason = self._refusal_reason(message.tool_calls)
+        if reason is not None:
+            context.should_refuse = True
+            context.refuse_reason = reason
+            return StageResult(
+                success=True,
+                data={"content": f"Refused: {reason}"},
+                usage=usage,
+                trace={"skipped": True, "reason": reason}
+            )
+        content = (message.content or "").strip()
+        return StageResult(
+            success=True,
+            data={"content": content},
+            usage=usage,
+            trace={
+                "model": model,
+                "provider": model_cfg.model_provider or "Unknown",
+                "usage": usage,
+                "system_prompt": system_prompt,
+                "context_message": context_message,  # Agent context + formatted web results
+                "output": content,
+                "time": time.perf_counter() - start_time,
+                "images_count": len(images) if images else 0,
+            }
+        )
+    @staticmethod
+    def _build_user_content(user_input: str, images: Optional[List[str]]) -> Any:
+        """Return plain text, or a multimodal part list when images are given."""
+        user_text = user_input or "..."
+        if not images:
+            return user_text
+        # Add image context message for multimodal input
+        image_context = f"[System: The user has provided {len(images)} image(s). Please analyze these images together with the text query to provide a comprehensive response.]"
+        user_content: List[Dict[str, Any]] = [{"type": "text", "text": f"{image_context}\n\n{user_text}"}]
+        for img_b64 in images:
+            # Payloads that are not already data: URLs are wrapped as JPEG data URLs
+            url = img_b64 if img_b64.startswith("data:") else f"data:image/jpeg;base64,{img_b64}"
+            user_content.append({"type": "image_url", "image_url": {"url": url}})
+        return user_content
+    @staticmethod
+    def _extract_usage(response: Any) -> Dict[str, int]:
+        """Read prompt/completion token counts from the response, defaulting to 0."""
+        usage = {"input_tokens": 0, "output_tokens": 0}
+        reported = getattr(response, "usage", None)
+        if reported:
+            usage["input_tokens"] = getattr(reported, "prompt_tokens", 0) or 0
+            usage["output_tokens"] = getattr(reported, "completion_tokens", 0) or 0
+        return usage
+    @staticmethod
+    def _refusal_reason(tool_calls: Any) -> Optional[str]:
+        """Return the reason if ``refuse_answer`` was called, otherwise None."""
+        import json
+        for tc in tool_calls or []:
+            if tc.function.name != "refuse_answer":
+                continue
+            try:
+                args = json.loads(tc.function.arguments)
+            except (TypeError, ValueError) as e:
+                # The model did ask to refuse; honour it with the default reason
+                logger.warning(f"SummaryStage: malformed refuse_answer arguments: {e}")
+                return "Refused"
+            if isinstance(args, dict):
+                return args.get("reason", "Refused")
+            return "Refused"
+        return None
+    def _strip_links(self, text: str) -> str:
+        """Strip markdown links [text](url) -> text and remove bare URLs."""
+        # Replace [text](url) with text
+        text = self._MD_LINK_RE.sub(r'\1', text)
+        # Remove bare http/https URLs; surrounding text is left untouched
+        return self._BARE_URL_RE.sub('', text)
+    def _format_web_content(self, context: StageContext) -> str:
+        """
+        Format web results for the summary prompt.
+        Only "page" and "search" items are rendered. Pages come first, and
+        when several rendered items share a URL only the first (highest
+        priority) one is kept. Returns "" when there are no web results.
+        """
+        if not context.web_results:
+            return ""
+        # Sort results: pages first, then raw searches, then snippets
+        priority = {"page": 0, "search_raw_page": 1}
+        sorted_results = sorted(
+            context.web_results,
+            key=lambda res: priority.get(res.get("_type"), 2)
+        )
+        lines = []
+        seen_urls = set()
+        for res in sorted_results:
+            type_ = res.get("_type")
+            if type_ not in self._RENDERED_TYPES:
+                # Never rendered, so it must not claim its URL and hide a renderable duplicate
+                continue
+            url = res.get("url", "")
+            # Deduplicate items by URL (keep higher priority item only)
+            if url:
+                if url in seen_urls:
+                    continue
+                seen_urls.add(url)
+            idx = res.get("_id")
+            title = (res.get("title", "") or "").strip()
+            body = self._strip_links((res.get("content", "") or "").strip())
+            if type_ == "page":
+                lines.append(f"[{idx}] Title: {title}\nContent:\n{body}\n")
+            else:
+                lines.append(f"[{idx}] Title: {title}\nSnippet: {body}\n")
+        return "\n".join(lines)

entari-plugin-hyw 0.3.5__py3-none-any.whl → 4.0.0rc14__py3-none-any.whl

Potentially problematic release.

entari-plugin-hyw 0.3.5__py3-none-any.whl → 4.0.0rc14__py3-none-any.whl