hdsp-jupyter-extension 2.0.6__py3-none-any.whl → 2.0.8__py3-none-any.whl

This diff compares the contents of two publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
Files changed (88)
  1. agent_server/core/embedding_service.py +67 -46
  2. agent_server/core/rag_manager.py +31 -17
  3. agent_server/core/reflection_engine.py +0 -1
  4. agent_server/core/retriever.py +13 -8
  5. agent_server/core/vllm_embedding_service.py +243 -0
  6. agent_server/knowledge/watchdog_service.py +1 -1
  7. agent_server/langchain/ARCHITECTURE.md +1193 -0
  8. agent_server/langchain/agent.py +82 -588
  9. agent_server/langchain/custom_middleware.py +663 -0
  10. agent_server/langchain/executors/__init__.py +2 -7
  11. agent_server/langchain/executors/notebook_searcher.py +46 -38
  12. agent_server/langchain/hitl_config.py +71 -0
  13. agent_server/langchain/llm_factory.py +166 -0
  14. agent_server/langchain/logging_utils.py +223 -0
  15. agent_server/langchain/prompts.py +150 -0
  16. agent_server/langchain/state.py +16 -6
  17. agent_server/langchain/tools/__init__.py +19 -0
  18. agent_server/langchain/tools/file_tools.py +354 -114
  19. agent_server/langchain/tools/file_utils.py +334 -0
  20. agent_server/langchain/tools/jupyter_tools.py +18 -18
  21. agent_server/langchain/tools/lsp_tools.py +264 -0
  22. agent_server/langchain/tools/resource_tools.py +161 -0
  23. agent_server/langchain/tools/search_tools.py +198 -216
  24. agent_server/langchain/tools/shell_tools.py +54 -0
  25. agent_server/main.py +11 -1
  26. agent_server/routers/health.py +1 -1
  27. agent_server/routers/langchain_agent.py +1040 -289
  28. agent_server/routers/rag.py +8 -3
  29. hdsp_agent_core/models/rag.py +15 -1
  30. hdsp_agent_core/prompts/auto_agent_prompts.py +3 -3
  31. hdsp_agent_core/services/rag_service.py +6 -1
  32. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/build_log.json +1 -1
  33. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/package.json +3 -2
  34. hdsp_jupyter_extension-2.0.6.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.02d346171474a0fb2dc1.js → hdsp_jupyter_extension-2.0.8.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.8740a527757068814573.js +470 -7
  35. hdsp_jupyter_extension-2.0.8.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.8740a527757068814573.js.map +1 -0
  36. hdsp_jupyter_extension-2.0.6.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.a223ea20056954479ae9.js → hdsp_jupyter_extension-2.0.8.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.e4ff4b5779b5e049f84c.js +3196 -441
  37. hdsp_jupyter_extension-2.0.8.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.e4ff4b5779b5e049f84c.js.map +1 -0
  38. hdsp_jupyter_extension-2.0.6.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.addf2fa038fa60304aa2.js → hdsp_jupyter_extension-2.0.8.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.020cdb0b864cfaa4e41e.js +9 -7
  39. hdsp_jupyter_extension-2.0.8.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.020cdb0b864cfaa4e41e.js.map +1 -0
  40. {hdsp_jupyter_extension-2.0.6.dist-info → hdsp_jupyter_extension-2.0.8.dist-info}/METADATA +2 -1
  41. {hdsp_jupyter_extension-2.0.6.dist-info → hdsp_jupyter_extension-2.0.8.dist-info}/RECORD +75 -69
  42. jupyter_ext/__init__.py +18 -0
  43. jupyter_ext/_version.py +1 -1
  44. jupyter_ext/handlers.py +1351 -58
  45. jupyter_ext/labextension/build_log.json +1 -1
  46. jupyter_ext/labextension/package.json +3 -2
  47. jupyter_ext/labextension/static/{frontend_styles_index_js.02d346171474a0fb2dc1.js → frontend_styles_index_js.8740a527757068814573.js} +470 -7
  48. jupyter_ext/labextension/static/frontend_styles_index_js.8740a527757068814573.js.map +1 -0
  49. jupyter_ext/labextension/static/{lib_index_js.a223ea20056954479ae9.js → lib_index_js.e4ff4b5779b5e049f84c.js} +3196 -441
  50. jupyter_ext/labextension/static/lib_index_js.e4ff4b5779b5e049f84c.js.map +1 -0
  51. jupyter_ext/labextension/static/{remoteEntry.addf2fa038fa60304aa2.js → remoteEntry.020cdb0b864cfaa4e41e.js} +9 -7
  52. jupyter_ext/labextension/static/remoteEntry.020cdb0b864cfaa4e41e.js.map +1 -0
  53. jupyter_ext/resource_usage.py +180 -0
  54. jupyter_ext/tests/test_handlers.py +58 -0
  55. agent_server/langchain/executors/jupyter_executor.py +0 -429
  56. agent_server/langchain/middleware/__init__.py +0 -36
  57. agent_server/langchain/middleware/code_search_middleware.py +0 -278
  58. agent_server/langchain/middleware/error_handling_middleware.py +0 -338
  59. agent_server/langchain/middleware/jupyter_execution_middleware.py +0 -301
  60. agent_server/langchain/middleware/rag_middleware.py +0 -227
  61. agent_server/langchain/middleware/validation_middleware.py +0 -240
  62. hdsp_jupyter_extension-2.0.6.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.02d346171474a0fb2dc1.js.map +0 -1
  63. hdsp_jupyter_extension-2.0.6.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.a223ea20056954479ae9.js.map +0 -1
  64. hdsp_jupyter_extension-2.0.6.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.addf2fa038fa60304aa2.js.map +0 -1
  65. jupyter_ext/labextension/static/frontend_styles_index_js.02d346171474a0fb2dc1.js.map +0 -1
  66. jupyter_ext/labextension/static/lib_index_js.a223ea20056954479ae9.js.map +0 -1
  67. jupyter_ext/labextension/static/remoteEntry.addf2fa038fa60304aa2.js.map +0 -1
  68. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/etc/jupyter/jupyter_server_config.d/hdsp_jupyter_extension.json +0 -0
  69. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/install.json +0 -0
  70. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b80.c095373419d05e6f141a.js +0 -0
  71. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b80.c095373419d05e6f141a.js.map +0 -0
  72. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b81.61e75fb98ecff46cf836.js +0 -0
  73. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b81.61e75fb98ecff46cf836.js.map +0 -0
  74. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/style.js +0 -0
  75. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_babel_runtime_helpers_esm_extends_js-node_modules_emotion_serialize_dist-051195.e2553aab0c3963b83dd7.js +0 -0
  76. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_babel_runtime_helpers_esm_extends_js-node_modules_emotion_serialize_dist-051195.e2553aab0c3963b83dd7.js.map +0 -0
  77. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js.24edcc52a1c014a8a5f0.js +0 -0
  78. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js.24edcc52a1c014a8a5f0.js.map +0 -0
  79. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.19ecf6babe00caff6b8a.js +0 -0
  80. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.19ecf6babe00caff6b8a.js.map +0 -0
  81. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_styled_dist_emotion-styled_browser_development_esm_js.661fb5836f4978a7c6e1.js +0 -0
  82. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_styled_dist_emotion-styled_browser_development_esm_js.661fb5836f4978a7c6e1.js.map +0 -0
  83. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_index_js.985697e0162d8d088ca2.js +0 -0
  84. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_index_js.985697e0162d8d088ca2.js.map +0 -0
  85. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.1f5038488cdfd8b3a85d.js +0 -0
  86. {hdsp_jupyter_extension-2.0.6.data → hdsp_jupyter_extension-2.0.8.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.1f5038488cdfd8b3a85d.js.map +0 -0
  87. {hdsp_jupyter_extension-2.0.6.dist-info → hdsp_jupyter_extension-2.0.8.dist-info}/WHEEL +0 -0
  88. {hdsp_jupyter_extension-2.0.6.dist-info → hdsp_jupyter_extension-2.0.8.dist-info}/licenses/LICENSE +0 -0
agent_server/langchain/custom_middleware.py (new file)
@@ -0,0 +1,663 @@
+ """
+ Custom middleware for LangChain agent.
+
+ Provides middleware for handling empty responses, limiting tool calls,
+ injecting continuation prompts, and patching dangling tool calls.
+ """
+
+ import json
+ import logging
+ import re
+ import uuid
+ from typing import Any, Dict, Optional
+
+ from langchain_core.messages import AIMessage, HumanMessage
+
+ from agent_server.langchain.logging_utils import (
+     _format_middleware_marker,
+     _with_middleware_logging,
+ )
+ from agent_server.langchain.prompts import JSON_TOOL_SCHEMA, NON_HITL_TOOLS
+
+ logger = logging.getLogger(__name__)
+
+
+ def parse_json_tool_call(text) -> Optional[Dict[str, Any]]:
+     """Parse JSON tool call from text response.
+
+     Args:
+         text: Raw text that may contain a JSON tool call (str or list)
+
+     Returns:
+         Parsed dictionary with 'tool' and 'arguments' keys, or None
+     """
+     if not text:
+         return None
+
+     # Handle list content (multimodal responses from Gemini)
+     if isinstance(text, list):
+         text_parts = []
+         for part in text:
+             if isinstance(part, str):
+                 text_parts.append(part)
+             elif isinstance(part, dict) and part.get("type") == "text":
+                 text_parts.append(part.get("text", ""))
+         text = "\n".join(text_parts)
+
+     if not isinstance(text, str) or not text:
+         return None
+
+     # Clean up response
+     text = text.strip()
+     if text.startswith("```json"):
+         text = text[7:]
+     elif text.startswith("```"):
+         text = text[3:]
+     if text.endswith("```"):
+         text = text[:-3]
+     text = text.strip()
+
+     # Try direct JSON parse
+     try:
+         data = json.loads(text)
+         if "tool" in data:
+             return data
+     except json.JSONDecodeError:
+         pass
+
+     # Try to find JSON object in response
+     json_match = re.search(r"\{[\s\S]*\}", text)
+     if json_match:
+         try:
+             data = json.loads(json_match.group())
+             if "tool" in data:
+                 return data
+         except json.JSONDecodeError:
+             pass
+
+     return None
+
+
+ def normalize_tool_name(tool_name: str) -> str:
+     """Normalize tool name to match registered tool names.
+
+     Rules:
+     - write_todos_tool → write_todos (TodoListMiddleware exception)
+     - other tools without _tool suffix → add _tool suffix
+     """
+     if tool_name == "write_todos_tool":
+         return "write_todos"
+     if not tool_name.endswith("_tool") and tool_name != "write_todos":
+         return f"{tool_name}_tool"
+     return tool_name
+
+
+ def create_tool_call_message(tool_name: str, arguments: Dict[str, Any]) -> AIMessage:
+     """Create AIMessage with tool_calls from parsed JSON.
+
+     Args:
+         tool_name: Name of the tool to call
+         arguments: Tool arguments dictionary
+
+     Returns:
+         AIMessage with properly formatted tool_calls
+     """
+     tool_name = normalize_tool_name(tool_name)
+
+     return AIMessage(
+         content="",
+         tool_calls=[
+             {
+                 "name": tool_name,
+                 "args": arguments,
+                 "id": str(uuid.uuid4()),
+                 "type": "tool_call",
+             }
+         ],
+     )
+
+
+ def create_handle_empty_response_middleware(wrap_model_call):
+     """Create middleware to detect and handle empty LLM responses with JSON fallback.
+
+     For models that don't support native tool calling well (e.g., Gemini 2.5 Flash),
+     this middleware:
+     1. Detects empty or text-only responses (no tool_calls)
+     2. Retries with JSON schema prompt to force structured output
+     3. Parses JSON response and injects tool_calls into AIMessage
+     4. Falls back to synthetic final_answer if all else fails
+
+     Args:
+         wrap_model_call: LangChain's wrap_model_call decorator
+
+     Returns:
+         Middleware function
+     """
+
+     @wrap_model_call
+     @_with_middleware_logging("handle_empty_response")
+     def handle_empty_response(request, handler):
+         max_retries = 2
+
+         # Check if last message is final_answer_tool result - if so, don't retry/synthesize
+         # This allows agent to naturally terminate after final_answer_tool
+         messages = request.messages
+         if messages:
+             last_msg = messages[-1]
+             if getattr(last_msg, "type", "") == "tool":
+                 tool_name = getattr(last_msg, "name", "") or ""
+                 if not tool_name:
+                     try:
+                         content_json = json.loads(last_msg.content)
+                         tool_name = content_json.get("tool", "")
+                     except (json.JSONDecodeError, TypeError, AttributeError):
+                         pass
+                 if tool_name in ("final_answer_tool", "final_answer"):
+                     logger.info(
+                         "Last message is final_answer_tool result - allowing natural termination"
+                     )
+                     # Just call handler and return response as-is (no retry/synthesize)
+                     return handler(request)
+
+         for attempt in range(max_retries + 1):
+             response = handler(request)
+
+             # Extract AIMessage from response
+             response_message = _extract_ai_message(response)
+
+             has_content = (
+                 bool(getattr(response_message, "content", None))
+                 if response_message
+                 else False
+             )
+             has_tool_calls = (
+                 bool(getattr(response_message, "tool_calls", None))
+                 if response_message
+                 else False
+             )
+
+             logger.info(
+                 "handle_empty_response: attempt=%d, type=%s, content=%s, tool_calls=%s",
+                 attempt + 1,
+                 type(response_message).__name__ if response_message else None,
+                 has_content,
+                 has_tool_calls,
+             )
+
+             # Valid response with tool_calls
+             if has_tool_calls:
+                 return response
+
+             # Try to parse JSON from content
+             if has_content and response_message:
+                 parsed = parse_json_tool_call(response_message.content)
+                 if parsed:
+                     tool_name = parsed.get("tool", "")
+                     arguments = parsed.get("arguments", {})
+                     logger.info(
+                         "Parsed JSON tool call from content: tool=%s",
+                         tool_name,
+                     )
+
+                     new_message = create_tool_call_message(tool_name, arguments)
+                     response = _replace_ai_message_in_response(response, new_message)
+                     return response
+
+             # Invalid response - retry with JSON schema prompt
+             if response_message and attempt < max_retries:
+                 reason = "text-only" if has_content else "empty"
+                 logger.warning(
+                     "Invalid AIMessage (%s) detected (attempt %d/%d). "
+                     "Retrying with JSON schema prompt...",
+                     reason,
+                     attempt + 1,
+                     max_retries + 1,
+                 )
+
+                 json_prompt = _build_json_prompt(request, response_message, has_content)
+                 request = request.override(
+                     messages=request.messages + [HumanMessage(content=json_prompt)]
+                 )
+                 continue
+
+             # Max retries exhausted - synthesize final_answer
+             if response_message:
+                 logger.warning(
+                     "Max retries exhausted. Synthesizing final_answer response."
+                 )
+                 synthetic_message = _create_synthetic_final_answer(
+                     request, response_message, has_content
+                 )
+                 response = _replace_ai_message_in_response(response, synthetic_message)
+                 return response
+
+             return response
+
+         return response
+
+     return handle_empty_response
+
+
+ def _extract_ai_message(response):
+     """Extract AIMessage from various response formats."""
+     if hasattr(response, "result"):
+         result = response.result
+         if isinstance(result, list):
+             for msg in reversed(result):
+                 if isinstance(msg, AIMessage):
+                     return msg
+         elif isinstance(result, AIMessage):
+             return result
+     elif hasattr(response, "message"):
+         return response.message
+     elif hasattr(response, "messages") and response.messages:
+         return response.messages[-1]
+     elif isinstance(response, AIMessage):
+         return response
+     return None
+
+
+ def _replace_ai_message_in_response(response, new_message):
+     """Replace AIMessage in response with a new one."""
+     if hasattr(response, "result"):
+         if isinstance(response.result, list):
+             new_result = [
+                 new_message if isinstance(m, AIMessage) else m for m in response.result
+             ]
+             response.result = new_result
+         else:
+             response.result = new_message
+     return response
+
+
+ def _build_json_prompt(request, response_message, has_content):
+     """Build JSON-forcing prompt based on context."""
+     todos = request.state.get("todos", [])
+     pending_todos = [t for t in todos if t.get("status") in ("pending", "in_progress")]
+
+     if has_content:
+         content_preview = response_message.content[:300]
+         return (
+             f"{JSON_TOOL_SCHEMA}\n\n"
+             f"Your previous response was text, not JSON. "
+             f"Wrap your answer in final_answer_tool:\n"
+             f'{{"tool": "final_answer_tool", "arguments": {{"answer": "{content_preview}..."}}}}'
+         )
+     elif pending_todos:
+         todo_list = ", ".join(t.get("content", "")[:20] for t in pending_todos[:3])
+         example_json = '{"tool": "jupyter_cell_tool", "arguments": {"code": "import pandas as pd\\ndf = pd.read_csv(\'titanic.csv\')\\nprint(df.head())"}}'
+         return (
+             f"{JSON_TOOL_SCHEMA}\n\n"
+             f"Pending tasks: {todo_list}\n"
+             f"Call jupyter_cell_tool with Python code to complete the next task.\n"
+             f"Example: {example_json}"
+         )
+     else:
+         return (
+             f"{JSON_TOOL_SCHEMA}\n\n"
+             f"All tasks completed. Call final_answer_tool:\n"
+             f'{{"tool": "final_answer_tool", "arguments": {{"answer": "작업이 완료되었습니다."}}}}'
+         )
+
+
+ def _create_synthetic_final_answer(request, response_message, has_content):
+     """Create synthetic final_answer message."""
+     if has_content and response_message.content:
+         summary = response_message.content
+         logger.info(
+             "Using LLM's text content as final answer (length=%d)",
+             len(summary),
+         )
+     else:
+         todos = request.state.get("todos", [])
+         completed_todos = [
+             t.get("content", "") for t in todos if t.get("status") == "completed"
+         ]
+         summary = (
+             f"작업이 완료되었습니다. 완료된 항목: {', '.join(completed_todos[:5])}"
+             if completed_todos
+             else "작업이 완료되었습니다."
+         )
+
+     return AIMessage(
+         content="",
+         tool_calls=[
+             {
+                 "name": "final_answer_tool",
+                 "args": {"answer": summary},
+                 "id": str(uuid.uuid4()),
+                 "type": "tool_call",
+             }
+         ],
+     )
+
+
+ def create_limit_tool_calls_middleware(wrap_model_call):
+     """Create middleware to limit model to one tool call at a time.
+
+     Some models (like vLLM GPT) return multiple tool calls in a single response.
+     This causes conflicts with TodoListMiddleware when processing multiple decisions.
+     By limiting to one tool call, we ensure the agent processes actions sequentially.
+
+     Args:
+         wrap_model_call: LangChain's wrap_model_call decorator
+
+     Returns:
+         Middleware function
+     """
+
+     @wrap_model_call
+     @_with_middleware_logging("limit_tool_calls_to_one")
+     def limit_tool_calls_to_one(request, handler):
+         response = handler(request)
+
+         if hasattr(response, "result"):
+             result = response.result
+             messages = result if isinstance(result, list) else [result]
+
+             for msg in messages:
+                 if isinstance(msg, AIMessage) and hasattr(msg, "tool_calls"):
+                     tool_calls = msg.tool_calls
+                     if tool_calls and len(tool_calls) > 1:
+                         logger.info(
+                             "Limiting tool calls from %d to 1 (keeping first: %s)",
+                             len(tool_calls),
+                             tool_calls[0].get("name", "unknown")
+                             if tool_calls
+                             else "none",
+                         )
+                         msg.tool_calls = [tool_calls[0]]
+
+         return response
+
+     return limit_tool_calls_to_one
+
+
+ def _get_string_params_from_tools(tools) -> Dict[str, set]:
+     """Extract string parameter names from tool schemas.
+
+     Analyzes each tool's Pydantic args_schema to determine which parameters
+     should be strings (not arrays).
+
+     Args:
+         tools: List of LangChain tools
+
+     Returns:
+         Dict mapping tool names to sets of string parameter names
+     """
+     from typing import get_args, get_origin
+
+     tool_string_params: Dict[str, set] = {}
+
+     for tool in tools:
+         tool_name = getattr(tool, "name", None)
+         if not tool_name:
+             continue
+
+         args_schema = getattr(tool, "args_schema", None)
+         if not args_schema:
+             continue
+
+         string_params = set()
+
+         # Get field annotations from Pydantic model
+         try:
+             annotations = getattr(args_schema, "__annotations__", {})
+             for field_name, field_type in annotations.items():
+                 origin = get_origin(field_type)
+
+                 # Check if it's a simple str type
+                 if field_type is str:
+                     string_params.add(field_name)
+                 # Check if it's Optional[str] (Union[str, None])
+                 elif origin is type(None) or str(origin) == "typing.Union":
+                     args = get_args(field_type)
+                     if str in args:
+                         string_params.add(field_name)
+         except Exception as e:
+             logger.debug("Failed to analyze schema for tool %s: %s", tool_name, e)
+
+         if string_params:
+             tool_string_params[tool_name] = string_params
+             logger.debug("Tool %s string params: %s", tool_name, string_params)
+
+     return tool_string_params
+
+
+ def create_normalize_tool_args_middleware(wrap_model_call, tools=None):
+     """Create middleware to normalize tool call arguments.
+
+     Gemini sometimes returns tool call arguments with list values instead of strings.
+     This middleware converts list arguments to strings ONLY for parameters that
+     are defined as str in the tool's Pydantic schema.
+
+     Args:
+         wrap_model_call: LangChain's wrap_model_call decorator
+         tools: Optional list of tools to analyze for type information
+
+     Returns:
+         Middleware function
+     """
+
+     # Build tool -> string params mapping from tool schemas
+     tool_string_params: Dict[str, set] = {}
+     if tools:
+         tool_string_params = _get_string_params_from_tools(tools)
+         logger.info(
+             "Initialized normalize_tool_args with %d tools: %s",
+             len(tool_string_params),
+             {k: list(v) for k, v in tool_string_params.items()},
+         )
+
+     @wrap_model_call
+     @_with_middleware_logging("normalize_tool_args")
+     def normalize_tool_args(request, handler):
+         response = handler(request)
+
+         if hasattr(response, "result"):
+             result = response.result
+             messages = result if isinstance(result, list) else [result]
+
+             for msg in messages:
+                 if isinstance(msg, AIMessage) and hasattr(msg, "tool_calls"):
+                     tool_calls = msg.tool_calls
+                     if tool_calls:
+                         for tool_call in tool_calls:
+                             tool_name = tool_call.get("name", "")
+                             # Normalize tool name (e.g., write_todos_tool → write_todos)
+                             normalized_name = normalize_tool_name(tool_name)
+                             if normalized_name != tool_name:
+                                 logger.info(
+                                     "Normalized tool name: %s → %s",
+                                     tool_name,
+                                     normalized_name,
+                                 )
+                                 tool_call["name"] = normalized_name
+                                 tool_name = normalized_name
+                             string_params = tool_string_params.get(tool_name, set())
+
+                             if "args" in tool_call and isinstance(
+                                 tool_call["args"], dict
+                             ):
+                                 args = tool_call["args"]
+                                 # Normalize list arguments to strings for str-typed params
+                                 for key, value in args.items():
+                                     if key in string_params and isinstance(value, list):
+                                         # Join list items into a single string
+                                         text_parts = []
+                                         for part in value:
+                                             if isinstance(part, str):
+                                                 text_parts.append(part)
+                                             elif (
+                                                 isinstance(part, dict)
+                                                 and part.get("type") == "text"
+                                             ):
+                                                 text_parts.append(part.get("text", ""))
+
+                                         if text_parts:
+                                             normalized_value = "\n".join(text_parts)
+                                             logger.info(
+                                                 "Normalized list argument '%s' to string (length=%d) for tool '%s'",
+                                                 key,
+                                                 len(normalized_value),
+                                                 tool_name,
+                                             )
+                                             args[key] = normalized_value
+
+         return response
+
+     return normalize_tool_args
+
+
+ def create_inject_continuation_middleware(wrap_model_call):
+     """Create middleware to inject continuation prompt after non-HITL tool execution.
+
+     Non-HITL tools execute immediately without user approval, which can cause
+     Gemini to produce empty responses. This middleware injects a system message
+     to remind the LLM to continue with the next action.
+
+     Args:
+         wrap_model_call: LangChain's wrap_model_call decorator
+
+     Returns:
+         Middleware function
+     """
+
+     @wrap_model_call
+     @_with_middleware_logging("inject_continuation_after_non_hitl_tool")
+     def inject_continuation_after_non_hitl_tool(request, handler):
+         messages = request.messages
+         if not messages:
+             return handler(request)
+
+         last_msg = messages[-1]
+         if getattr(last_msg, "type", "") == "tool":
+             tool_name = getattr(last_msg, "name", "") or ""
+
+             # Try to extract tool name from content
+             if not tool_name:
+                 try:
+                     content_json = json.loads(last_msg.content)
+                     tool_name = content_json.get("tool", "")
+                 except (json.JSONDecodeError, TypeError, AttributeError):
+                     pass
+
+             if tool_name in NON_HITL_TOOLS:
+                 logger.info(
+                     "Injecting continuation prompt after non-HITL tool: %s",
+                     tool_name,
+                 )
+
+                 todos = request.state.get("todos", [])
+                 pending_todos = [
+                     t for t in todos if t.get("status") in ("pending", "in_progress")
+                 ]
+
+                 if pending_todos:
+                     pending_list = ", ".join(
+                         t.get("content", "")[:30] for t in pending_todos[:3]
+                     )
+                     continuation = (
+                         f"Tool '{tool_name}' completed. "
+                         f"Continue with pending tasks: {pending_list}. "
+                         f"Call jupyter_cell_tool or the next appropriate tool."
+                     )
+                 else:
+                     continuation = (
+                         f"Tool '{tool_name}' completed. All tasks done. "
+                         f"Call final_answer_tool with a summary NOW."
+                     )
+
+                 new_messages = list(messages) + [
+                     HumanMessage(content=f"[SYSTEM] {continuation}")
+                 ]
+                 request = request.override(messages=new_messages)
+
+         return handler(request)
+
+     return inject_continuation_after_non_hitl_tool
+
+
+ def create_patch_tool_calls_middleware(AgentMiddleware, ToolMessage, Overwrite):
+     """Create middleware to patch dangling tool calls.
+
+     When a new user message arrives before a tool call completes, we need to
+     add synthetic ToolMessage responses for those dangling calls so the
+     conversation can continue properly.
+
+     Args:
+         AgentMiddleware: LangChain's AgentMiddleware base class
+         ToolMessage: LangChain's ToolMessage class
+         Overwrite: LangGraph's Overwrite type
+
+     Returns:
+         PatchToolCallsMiddleware class instance
+     """
+
+     class PatchToolCallsMiddleware(AgentMiddleware):
+         """Patch dangling tool calls so the agent can continue."""
+
+         def before_agent(self, state, runtime):
+             logger.info(
+                 "%s",
+                 _format_middleware_marker(
+                     "PatchToolCallsMiddleware.before_agent", "START"
+                 ),
+             )
+             messages = state.get("messages", [])
+             if not messages:
+                 logger.info(
+                     "%s",
+                     _format_middleware_marker(
+                         "PatchToolCallsMiddleware.before_agent", "NOOP"
+                     ),
+                 )
+                 return None
+
+             patched = []
+             for i, msg in enumerate(messages):
+                 patched.append(msg)
+                 if getattr(msg, "type", "") == "ai" and getattr(
+                     msg, "tool_calls", None
+                 ):
+                     for tool_call in msg.tool_calls:
+                         tool_call_id = tool_call.get("id")
+                         if not tool_call_id:
+                             continue
+                         has_tool_msg = any(
+                             (
+                                 getattr(m, "type", "") == "tool"
+                                 and getattr(m, "tool_call_id", None) == tool_call_id
+                             )
+                             for m in messages[i:]
+                         )
+                         if not has_tool_msg:
+                             tool_msg = (
+                                 f"Tool call {tool_call.get('name', 'unknown')} with id {tool_call_id} "
+                                 "was cancelled - another message came in before it could be completed."
+                             )
+                             patched.append(
+                                 ToolMessage(
+                                     content=tool_msg,
+                                     name=tool_call.get("name", "unknown"),
+                                     tool_call_id=tool_call_id,
+                                 )
+                             )
+
+             if patched == messages:
+                 logger.info(
+                     "%s",
+                     _format_middleware_marker(
+                         "PatchToolCallsMiddleware.before_agent", "NOOP"
+                     ),
+                 )
+                 return None
+             logger.info(
+                 "%s",
+                 _format_middleware_marker(
+                     "PatchToolCallsMiddleware.before_agent", "PATCHED"
+                 ),
+             )
+             return {"messages": Overwrite(patched)}
+
+     return PatchToolCallsMiddleware()
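
Each factory above receives the LangChain/LangGraph primitives it depends on (wrap_model_call, AgentMiddleware, ToolMessage, Overwrite) as parameters rather than importing them, so assembly happens in the caller. A minimal sketch of how a caller might build the full stack, using only the factory signatures shown in this diff (the build_middleware_stack helper, its argument names, and the list ordering are illustrative assumptions, not part of the package):

    # Hypothetical assembly helper (not part of hdsp-jupyter-extension).
    # wrap_model_call, AgentMiddleware, ToolMessage and Overwrite are whatever
    # objects the installed LangChain/LangGraph version provides for these roles.
    from agent_server.langchain.custom_middleware import (
        create_handle_empty_response_middleware,
        create_inject_continuation_middleware,
        create_limit_tool_calls_middleware,
        create_normalize_tool_args_middleware,
        create_patch_tool_calls_middleware,
    )

    def build_middleware_stack(wrap_model_call, AgentMiddleware, ToolMessage, Overwrite, tools):
        return [
            # Runs in before_agent: backfills ToolMessages for dangling tool calls.
            create_patch_tool_calls_middleware(AgentMiddleware, ToolMessage, Overwrite),
            # These wrap each model call: nudge the LLM after non-HITL tools,
            # coerce list-valued string arguments, keep one tool call per turn,
            # and fall back to a JSON-forced retry or synthetic final_answer.
            create_inject_continuation_middleware(wrap_model_call),
            create_normalize_tool_args_middleware(wrap_model_call, tools=tools),
            create_limit_tool_calls_middleware(wrap_model_call),
            create_handle_empty_response_middleware(wrap_model_call),
        ]
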
agent_server/langchain/executors/__init__.py
@@ -1,15 +1,10 @@
  """
- Jupyter Executors (Embedded Mode)
-
- Provides direct access to Jupyter kernel for code execution
- when running inside JupyterLab server.
+ Jupyter Executors

  Components:
- - JupyterExecutor: Execute code in Jupyter kernel
  - NotebookSearcher: Search notebooks and cells
  """

- from agent_server.langchain.executors.jupyter_executor import JupyterExecutor
  from agent_server.langchain.executors.notebook_searcher import NotebookSearcher

- __all__ = ["JupyterExecutor", "NotebookSearcher"]
+ __all__ = ["NotebookSearcher"]
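
One practical consequence of this __init__.py change, together with the removal of agent_server/langchain/executors/jupyter_executor.py listed above: downstream imports of JupyterExecutor from the executors package now fail, while NotebookSearcher imports keep working. For example:

    # Still valid in 2.0.8:
    from agent_server.langchain.executors import NotebookSearcher

    # Raises ImportError in 2.0.8; JupyterExecutor and its module were removed:
    from agent_server.langchain.executors import JupyterExecutor
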