PyPI - hdsp-jupyter-extension - Versions diffs - 2.0.5__py3-none-any.whl → 2.0.7__py3-none-any.whl - Mend

hdsp-jupyter-extension 2.0.5__py3-none-any.whl → 2.0.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (90) hide show

agent_server/langchain/middleware/code_search_middleware.py DELETED Viewed

@@ -1,278 +0,0 @@
-"""
-Code Search Middleware
-Automatically searches workspace and notebook cells for relevant code
-before model calls. Helps the agent understand existing code context.
-"""
-import logging
-import re
-from typing import Any, Dict, List, Optional
-from agent_server.langchain.executors.notebook_searcher import (
-    NotebookSearcher,
-    get_notebook_searcher,
-)
-from agent_server.langchain.state import AgentRuntime, AgentState, SearchResult
-logger = logging.getLogger(__name__)
-class CodeSearchMiddleware:
-    """
-    Middleware that searches for relevant code before model calls.
-    This middleware:
-    1. Extracts search terms from the user request
-    2. Searches workspace files and notebook cells
-    3. Injects relevant code context into the state
-    Uses @before_model hook pattern from LangChain middleware.
-    """
-    def __init__(
-        self,
-        notebook_searcher: Optional[NotebookSearcher] = None,
-        workspace_root: str = ".",
-        max_results: int = 10,
-        auto_search: bool = True,
-        search_patterns: Optional[List[str]] = None,
-        enabled: bool = True,
-    ):
-        """
-        Initialize code search middleware.
-        Args:
-            notebook_searcher: NotebookSearcher instance
-            workspace_root: Root directory for searches
-            max_results: Maximum search results to include
-            auto_search: Automatically extract and search patterns
-            search_patterns: Additional patterns to always search
-            enabled: Whether the middleware is enabled
-        """
-        self._searcher = notebook_searcher
-        self._workspace_root = workspace_root
-        self._max_results = max_results
-        self._auto_search = auto_search
-        self._search_patterns = search_patterns or []
-        self._enabled = enabled
-    @property
-    def name(self) -> str:
-        return "CodeSearchMiddleware"
-    def _get_searcher(self) -> NotebookSearcher:
-        """Get or create notebook searcher"""
-        if self._searcher is None:
-            self._searcher = get_notebook_searcher(self._workspace_root)
-        return self._searcher
-    def _extract_search_terms(self, request: str) -> List[str]:
-        """
-        Extract potential search terms from user request.
-        Looks for:
-        - Variable names (snake_case, camelCase)
-        - Function calls (func_name(), methodName())
-        - Class names (PascalCase)
-        - File references (*.py, *.ipynb)
-        - Quoted strings
-        """
-        terms = set()
-        # Extract quoted strings
-        quoted = re.findall(r'["\']([^"\']+)["\']', request)
-        terms.update(quoted)
-        # Extract potential identifiers (excluding common words)
-        common_words = {
-            "the", "a", "an", "is", "are", "was", "were", "be", "been",
-            "have", "has", "had", "do", "does", "did", "will", "would",
-            "could", "should", "may", "might", "must", "shall", "can",
-            "for", "and", "or", "but", "in", "on", "at", "to", "from",
-            "with", "by", "about", "into", "through", "during", "before",
-            "after", "above", "below", "between", "under", "again",
-            "further", "then", "once", "here", "there", "when", "where",
-            "why", "how", "all", "each", "every", "both", "few", "more",
-            "most", "other", "some", "such", "no", "nor", "not", "only",
-            "own", "same", "so", "than", "too", "very", "just", "also",
-            "now", "please", "help", "want", "need", "make", "create",
-            "use", "using", "show", "display", "get", "set", "add",
-            "remove", "delete", "update", "change", "modify", "fix",
-        }
-        # Look for identifiers (snake_case, camelCase, PascalCase)
-        identifiers = re.findall(r'\b([a-zA-Z_][a-zA-Z0-9_]*)\b', request)
-        for ident in identifiers:
-            if ident.lower() not in common_words and len(ident) > 2:
-                terms.add(ident)
-        # Look for file patterns
-        file_patterns = re.findall(r'\b(\w+\.(?:py|ipynb|csv|json|txt))\b', request)
-        terms.update(file_patterns)
-        # Look for function/method calls
-        func_calls = re.findall(r'\b(\w+)\s*\(', request)
-        for func in func_calls:
-            if func.lower() not in common_words:
-                terms.add(func)
-        return list(terms)[:10]  # Limit to top 10 terms
-    async def before_model(
-        self,
-        state: AgentState,
-        runtime: AgentRuntime,
-    ) -> Optional[Dict[str, Any]]:
-        """
-        Hook called before each model invocation.
-        Searches for relevant code and injects into state.
-        Args:
-            state: Current agent state
-            runtime: Agent runtime context
-        Returns:
-            Updated state fields or None
-        """
-        # Skip if middleware is disabled
-        if not self._enabled:
-            return None
-        # Skip if search results already present
-        if state.get("search_results"):
-            return None
-        user_request = state.get("user_request", "")
-        if not user_request:
-            return None
-        search_results: List[SearchResult] = []
-        searcher = self._get_searcher()
-        # Get current notebook path
-        notebook_context = state.get("notebook_context", {})
-        current_notebook = notebook_context.get("notebook_path", "")
-        # Auto-extract search terms
-        if self._auto_search:
-            terms = self._extract_search_terms(user_request)
-            terms.extend(self._search_patterns)
-        else:
-            terms = self._search_patterns
-        if not terms:
-            return None
-        logger.info(f"Searching for terms: {terms}")
-        # Search current notebook first
-        if current_notebook:
-            for term in terms[:5]:  # Limit terms for current notebook
-                try:
-                    results = searcher.search_notebook(
-                        current_notebook,
-                        term,
-                        max_results=3,
-                    )
-                    for match in results.matches:
-                        search_results.append(SearchResult(
-                            file_path=match.file_path,
-                            cell_index=match.cell_index,
-                            line_number=match.line_number,
-                            content=match.content,
-                            match_type="cell",
-                        ))
-                except Exception as e:
-                    logger.warning(f"Notebook search failed: {e}")
-        # Search workspace for remaining capacity
-        remaining = self._max_results - len(search_results)
-        if remaining > 0:
-            for term in terms[:3]:  # Limit workspace searches
-                try:
-                    results = searcher.search_workspace(
-                        term,
-                        max_results=remaining,
-                    )
-                    for match in results.matches:
-                        # Avoid duplicates
-                        if not any(
-                            r["file_path"] == match.file_path and
-                            r.get("line_number") == match.line_number
-                            for r in search_results
-                        ):
-                            search_results.append(SearchResult(
-                                file_path=match.file_path,
-                                cell_index=match.cell_index,
-                                line_number=match.line_number,
-                                content=match.content,
-                                match_type=match.match_type,
-                            ))
-                except Exception as e:
-                    logger.warning(f"Workspace search failed: {e}")
-        if search_results:
-            logger.info(f"Found {len(search_results)} relevant code snippets")
-            return {"search_results": search_results[:self._max_results]}
-        return None
-    def format_search_results_for_prompt(
-        self,
-        search_results: List[SearchResult],
-    ) -> str:
-        """
-        Format search results for inclusion in the prompt.
-        Args:
-            search_results: List of search results
-        Returns:
-            Formatted context string
-        """
-        if not search_results:
-            return ""
-        lines = ["## Relevant Code from Workspace"]
-        for i, result in enumerate(search_results[:self._max_results], 1):
-            file_path = result.get("file_path", "unknown")
-            cell_idx = result.get("cell_index")
-            line_num = result.get("line_number")
-            content = result.get("content", "")
-            location = f"{file_path}"
-            if cell_idx is not None:
-                location += f" [Cell {cell_idx}]"
-            if line_num is not None:
-                location += f":L{line_num}"
-            lines.append(f"\n### {i}. {location}")
-            lines.append(f"```\n{content}\n```")
-        return "\n".join(lines)
-def create_code_search_middleware(
-    workspace_root: str = ".",
-    max_results: int = 10,
-    auto_search: bool = True,
-) -> CodeSearchMiddleware:
-    """
-    Factory function to create code search middleware.
-    Args:
-        workspace_root: Root directory for searches
-        max_results: Maximum results to include
-        auto_search: Auto-extract search terms from request
-    Returns:
-        Configured CodeSearchMiddleware instance
-    """
-    return CodeSearchMiddleware(
-        workspace_root=workspace_root,
-        max_results=max_results,
-        auto_search=auto_search,
-    )

agent_server/langchain/middleware/error_handling_middleware.py DELETED Viewed

@@ -1,338 +0,0 @@
-"""
-Error Handling Middleware
-Classifies errors and decides on recovery strategies after tool execution.
-Implements self-healing and adaptive replanning logic.
-"""
-import logging
-from typing import Any, Dict, List, Optional
-from agent_server.langchain.state import AgentRuntime, AgentState
-logger = logging.getLogger(__name__)
-class ErrorHandlingMiddleware:
-    """
-    Middleware that handles errors after tool execution.
-    This middleware:
-    1. Classifies errors using ErrorClassifier
-    2. Decides on recovery strategy (refine, insert_steps, replan)
-    3. Updates state with recovery information
-    4. Tracks retry attempts
-    Uses @after_tool_call hook pattern from LangChain middleware.
-    """
-    def __init__(
-        self,
-        error_classifier: Any = None,
-        max_retries: int = 3,
-        use_llm_fallback: bool = True,
-        enabled: bool = True,
-    ):
-        """
-        Initialize error handling middleware.
-        Args:
-            error_classifier: ErrorClassifier instance
-            max_retries: Maximum retry attempts per error
-            use_llm_fallback: Use LLM for complex error analysis
-            enabled: Whether error handling is enabled
-        """
-        self._classifier = error_classifier
-        self._max_retries = max_retries
-        self._use_llm_fallback = use_llm_fallback
-        self._enabled = enabled
-    @property
-    def name(self) -> str:
-        return "ErrorHandlingMiddleware"
-    def _get_classifier(self):
-        """Lazy load error classifier"""
-        if self._classifier is None:
-            try:
-                from agent_server.core.error_classifier import get_error_classifier
-                self._classifier = get_error_classifier()
-            except ImportError:
-                logger.warning("ErrorClassifier not available")
-                return None
-        return self._classifier
-    def _classify_error(
-        self,
-        error_type: str,
-        error_message: str,
-        traceback: Optional[List[str]] = None,
-        previous_attempts: int = 0,
-    ) -> Dict[str, Any]:
-        """Classify error using ErrorClassifier"""
-        classifier = self._get_classifier()
-        if classifier is None:
-            # Fallback classification
-            return self._fallback_classify(error_type, error_message)
-        try:
-            traceback_str = "\n".join(traceback) if traceback else ""
-            # Check if LLM fallback should be used
-            should_use_llm, reason = classifier.should_use_llm_fallback(
-                error_type=error_type,
-                traceback=traceback_str,
-                previous_attempts=previous_attempts,
-            )
-            # Classify using pattern matching
-            analysis = classifier.classify(
-                error_type=error_type,
-                error_message=error_message,
-                traceback=traceback_str,
-            )
-            result = analysis.to_dict()
-            result["should_use_llm"] = should_use_llm
-            result["llm_reason"] = reason
-            return result
-        except Exception as e:
-            logger.error(f"Error classification failed: {e}")
-            return self._fallback_classify(error_type, error_message)
-    def _fallback_classify(
-        self,
-        error_type: str,
-        error_message: str,
-    ) -> Dict[str, Any]:
-        """Fallback error classification without ErrorClassifier"""
-        # Simple heuristic-based classification
-        # Module not found -> need to install
-        if error_type in ("ModuleNotFoundError", "ImportError"):
-            module_name = self._extract_module_name(error_message)
-            return {
-                "decision": "insert_steps",
-                "analysis": {
-                    "root_cause": f"Missing module: {module_name}",
-                    "is_approach_problem": False,
-                },
-                "reasoning": "Package installation required",
-                "changes": {
-                    "new_steps": [{
-                        "description": f"Install {module_name}",
-                        "toolCalls": [{
-                            "tool": "jupyter_cell",
-                            "parameters": {
-                                "code": f"!pip install {module_name}"
-                            }
-                        }]
-                    }]
-                },
-                "confidence": 0.9,
-            }
-        # Syntax/Type/Value errors -> refine code
-        if error_type in ("SyntaxError", "TypeError", "ValueError", "KeyError", "IndexError"):
-            return {
-                "decision": "refine",
-                "analysis": {
-                    "root_cause": f"{error_type}: {error_message}",
-                    "is_approach_problem": False,
-                },
-                "reasoning": "Code can be fixed with refinement",
-                "changes": {},
-                "confidence": 0.8,
-            }
-        # Name errors -> might be missing definition
-        if error_type == "NameError":
-            return {
-                "decision": "refine",
-                "analysis": {
-                    "root_cause": f"Undefined variable: {error_message}",
-                    "is_approach_problem": False,
-                },
-                "reasoning": "Variable not defined, need to fix code",
-                "changes": {},
-                "confidence": 0.7,
-            }
-        # Default -> try refinement first
-        return {
-            "decision": "refine",
-            "analysis": {
-                "root_cause": f"{error_type}: {error_message}",
-                "is_approach_problem": False,
-            },
-            "reasoning": "Attempting code refinement",
-            "changes": {},
-            "confidence": 0.5,
-        }
-    def _extract_module_name(self, error_message: str) -> str:
-        """Extract module name from import error message"""
-        import re
-        # Match "No module named 'xxx'" or "No module named 'xxx.yyy'"
-        match = re.search(r"No module named ['\"]([^'\"]+)['\"]", error_message)
-        if match:
-            module = match.group(1).split(".")[0]
-            # Handle common aliases
-            aliases = {
-                "sklearn": "scikit-learn",
-                "cv2": "opencv-python",
-                "PIL": "pillow",
-            }
-            return aliases.get(module, module)
-        return "unknown-package"
-    async def after_tool_call(
-        self,
-        tool_name: str,
-        tool_input: Dict[str, Any],
-        tool_result: Dict[str, Any],
-        state: AgentState,
-        runtime: AgentRuntime,
-    ) -> Optional[Dict[str, Any]]:
-        """
-        Hook called after each tool execution.
-        Handles errors and updates recovery strategy.
-        Args:
-            tool_name: Name of the tool that was called
-            tool_input: Tool input parameters
-            tool_result: Result from tool execution
-            state: Current agent state
-            runtime: Agent runtime context
-        Returns:
-            Modified result or None
-        """
-        if not self._enabled:
-            return None
-        # Only handle jupyter_cell errors
-        if tool_name != "jupyter_cell_tool":
-            return None
-        # Check if execution succeeded
-        if tool_result.get("success", True):
-            # Reset error count on success
-            state["error_count"] = 0
-            state["last_error"] = None
-            state["recovery_strategy"] = None
-            return None
-        # Handle execution error
-        error_type = tool_result.get("error_type", "UnknownError")
-        error_message = tool_result.get("error", "Unknown error")
-        traceback = tool_result.get("traceback", [])
-        error_count = state.get("error_count", 0)
-        logger.info(f"Handling error: {error_type} (attempt {error_count})")
-        # Classify error and get recovery strategy
-        classification = self._classify_error(
-            error_type=error_type,
-            error_message=error_message,
-            traceback=traceback,
-            previous_attempts=error_count,
-        )
-        # Check retry limit
-        if error_count >= self._max_retries:
-            classification["decision"] = "replan_remaining"
-            classification["reasoning"] = f"Max retries ({self._max_retries}) exceeded"
-        # Update state with recovery information
-        state["recovery_strategy"] = classification["decision"]
-        state["last_error"] = {
-            "error_type": error_type,
-            "error_message": error_message,
-            "traceback": traceback,
-            "classification": classification,
-        }
-        # Enrich tool result with classification
-        tool_result["error_classification"] = classification
-        tool_result["recovery_strategy"] = classification["decision"]
-        tool_result["recovery_changes"] = classification.get("changes", {})
-        logger.info(
-            f"Error classified: decision={classification['decision']}, "
-            f"confidence={classification.get('confidence', 0)}"
-        )
-        return tool_result
-    def format_error_feedback(
-        self,
-        last_error: Dict[str, Any],
-    ) -> str:
-        """
-        Format error information for feedback to the model.
-        Args:
-            last_error: Last error information from state
-        Returns:
-            Formatted feedback string
-        """
-        if not last_error:
-            return ""
-        lines = ["## Execution Error"]
-        error_type = last_error.get("error_type", "UnknownError")
-        error_message = last_error.get("error_message", "")
-        lines.append(f"**Type**: {error_type}")
-        lines.append(f"**Message**: {error_message}")
-        classification = last_error.get("classification", {})
-        if classification:
-            decision = classification.get("decision", "unknown")
-            reasoning = classification.get("reasoning", "")
-            lines.append(f"\n**Recovery Strategy**: {decision}")
-            lines.append(f"**Reasoning**: {reasoning}")
-            changes = classification.get("changes", {})
-            if changes:
-                lines.append("\n**Suggested Changes**:")
-                if "new_steps" in changes:
-                    for step in changes["new_steps"]:
-                        lines.append(f"- {step.get('description', 'New step')}")
-        return "\n".join(lines)
-def create_error_handling_middleware(
-    max_retries: int = 3,
-    use_llm_fallback: bool = True,
-    enabled: bool = True,
-) -> ErrorHandlingMiddleware:
-    """
-    Factory function to create error handling middleware.
-    Args:
-        max_retries: Maximum retry attempts
-        use_llm_fallback: Use LLM for complex errors
-        enabled: Whether to enable error handling
-    Returns:
-        Configured ErrorHandlingMiddleware instance
-    """
-    return ErrorHandlingMiddleware(
-        max_retries=max_retries,
-        use_llm_fallback=use_llm_fallback,
-        enabled=enabled,
-    )

hdsp-jupyter-extension 2.0.5__py3-none-any.whl → 2.0.7__py3-none-any.whl

hdsp-jupyter-extension 2.0.5__py3-none-any.whl → 2.0.7__py3-none-any.whl