hdsp-jupyter-extension 2.0.1__py3-none-any.whl → 2.0.2__py3-none-any.whl
This diff shows the changes between publicly released package versions as they appear in their respective public registries; it is provided for informational purposes only.
- agent_server/langchain/__init__.py +18 -0
- agent_server/langchain/agent.py +694 -0
- agent_server/langchain/executors/__init__.py +15 -0
- agent_server/langchain/executors/jupyter_executor.py +429 -0
- agent_server/langchain/executors/notebook_searcher.py +477 -0
- agent_server/langchain/middleware/__init__.py +36 -0
- agent_server/langchain/middleware/code_search_middleware.py +278 -0
- agent_server/langchain/middleware/error_handling_middleware.py +338 -0
- agent_server/langchain/middleware/jupyter_execution_middleware.py +301 -0
- agent_server/langchain/middleware/rag_middleware.py +227 -0
- agent_server/langchain/middleware/validation_middleware.py +240 -0
- agent_server/langchain/state.py +159 -0
- agent_server/langchain/tools/__init__.py +39 -0
- agent_server/langchain/tools/file_tools.py +279 -0
- agent_server/langchain/tools/jupyter_tools.py +143 -0
- agent_server/langchain/tools/search_tools.py +309 -0
- agent_server/main.py +13 -0
- agent_server/routers/health.py +14 -0
- agent_server/routers/langchain_agent.py +1368 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/build_log.json +1 -1
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/package.json +2 -2
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.2607ff74c74acfa83158.js → hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.634cf0ae0f3592d0882f.js +408 -4
- hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.634cf0ae0f3592d0882f.js.map +1 -0
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.622c1a5918b3aafb2315.js → hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.1366019c413f1d68467f.js +753 -65
- hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.1366019c413f1d68467f.js.map +1 -0
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.729f933de01ad5620730.js → hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.3379c4b222c042de2b01.js +8 -8
- hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.3379c4b222c042de2b01.js.map +1 -0
- jupyter_ext/labextension/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js-node_modules-782ee5.d9ed8645ef1d311657d8.js → hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js.24edcc52a1c014a8a5f0.js +2 -209
- hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js.24edcc52a1c014a8a5f0.js.map +1 -0
- jupyter_ext/labextension/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.36b49c71871f98d4f549.js → hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.19ecf6babe00caff6b8a.js +209 -2
- hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.19ecf6babe00caff6b8a.js.map +1 -0
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.2e13df4ea61496e95d45.js → hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.1f5038488cdfd8b3a85d.js +212 -3
- hdsp_jupyter_extension-2.0.2.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.1f5038488cdfd8b3a85d.js.map +1 -0
- {hdsp_jupyter_extension-2.0.1.dist-info → hdsp_jupyter_extension-2.0.2.dist-info}/METADATA +1 -1
- {hdsp_jupyter_extension-2.0.1.dist-info → hdsp_jupyter_extension-2.0.2.dist-info}/RECORD +66 -49
- jupyter_ext/_version.py +1 -1
- jupyter_ext/handlers.py +126 -1
- jupyter_ext/labextension/build_log.json +1 -1
- jupyter_ext/labextension/package.json +2 -2
- jupyter_ext/labextension/static/{frontend_styles_index_js.2607ff74c74acfa83158.js → frontend_styles_index_js.634cf0ae0f3592d0882f.js} +408 -4
- jupyter_ext/labextension/static/frontend_styles_index_js.634cf0ae0f3592d0882f.js.map +1 -0
- jupyter_ext/labextension/static/{lib_index_js.622c1a5918b3aafb2315.js → lib_index_js.1366019c413f1d68467f.js} +753 -65
- jupyter_ext/labextension/static/lib_index_js.1366019c413f1d68467f.js.map +1 -0
- jupyter_ext/labextension/static/{remoteEntry.729f933de01ad5620730.js → remoteEntry.3379c4b222c042de2b01.js} +8 -8
- jupyter_ext/labextension/static/remoteEntry.3379c4b222c042de2b01.js.map +1 -0
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js-node_modules-782ee5.d9ed8645ef1d311657d8.js → jupyter_ext/labextension/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js.24edcc52a1c014a8a5f0.js +2 -209
- jupyter_ext/labextension/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js.24edcc52a1c014a8a5f0.js.map +1 -0
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.36b49c71871f98d4f549.js → jupyter_ext/labextension/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.19ecf6babe00caff6b8a.js +209 -2
- jupyter_ext/labextension/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.19ecf6babe00caff6b8a.js.map +1 -0
- jupyter_ext/labextension/static/{vendors-node_modules_mui_material_utils_createSvgIcon_js.2e13df4ea61496e95d45.js → vendors-node_modules_mui_material_utils_createSvgIcon_js.1f5038488cdfd8b3a85d.js} +212 -3
- jupyter_ext/labextension/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.1f5038488cdfd8b3a85d.js.map +1 -0
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/frontend_styles_index_js.2607ff74c74acfa83158.js.map +0 -1
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/lib_index_js.622c1a5918b3aafb2315.js.map +0 -1
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/remoteEntry.729f933de01ad5620730.js.map +0 -1
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js-node_modules-782ee5.d9ed8645ef1d311657d8.js.map +0 -1
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.36b49c71871f98d4f549.js.map +0 -1
- hdsp_jupyter_extension-2.0.1.data/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.2e13df4ea61496e95d45.js.map +0 -1
- jupyter_ext/labextension/static/frontend_styles_index_js.2607ff74c74acfa83158.js.map +0 -1
- jupyter_ext/labextension/static/lib_index_js.622c1a5918b3aafb2315.js.map +0 -1
- jupyter_ext/labextension/static/remoteEntry.729f933de01ad5620730.js.map +0 -1
- jupyter_ext/labextension/static/vendors-node_modules_emotion_cache_dist_emotion-cache_browser_development_esm_js-node_modules-782ee5.d9ed8645ef1d311657d8.js.map +0 -1
- jupyter_ext/labextension/static/vendors-node_modules_emotion_react_dist_emotion-react_browser_development_esm_js.36b49c71871f98d4f549.js.map +0 -1
- jupyter_ext/labextension/static/vendors-node_modules_mui_material_utils_createSvgIcon_js.2e13df4ea61496e95d45.js.map +0 -1
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/etc/jupyter/jupyter_server_config.d/hdsp_jupyter_extension.json +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/install.json +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b80.c095373419d05e6f141a.js +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b80.c095373419d05e6f141a.js.map +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b81.61e75fb98ecff46cf836.js +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/node_modules_emotion_use-insertion-effect-with-fallbacks_dist_emotion-use-insertion-effect-wi-3ba6b81.61e75fb98ecff46cf836.js.map +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/style.js +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_babel_runtime_helpers_esm_extends_js-node_modules_emotion_serialize_dist-051195.e2553aab0c3963b83dd7.js +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_babel_runtime_helpers_esm_extends_js-node_modules_emotion_serialize_dist-051195.e2553aab0c3963b83dd7.js.map +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_styled_dist_emotion-styled_browser_development_esm_js.661fb5836f4978a7c6e1.js +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_emotion_styled_dist_emotion-styled_browser_development_esm_js.661fb5836f4978a7c6e1.js.map +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_index_js.985697e0162d8d088ca2.js +0 -0
- {hdsp_jupyter_extension-2.0.1.data → hdsp_jupyter_extension-2.0.2.data}/data/share/jupyter/labextensions/hdsp-agent/static/vendors-node_modules_mui_material_index_js.985697e0162d8d088ca2.js.map +0 -0
- {hdsp_jupyter_extension-2.0.1.dist-info → hdsp_jupyter_extension-2.0.2.dist-info}/WHEEL +0 -0
- {hdsp_jupyter_extension-2.0.1.dist-info → hdsp_jupyter_extension-2.0.2.dist-info}/licenses/LICENSE +0 -0
agent_server/langchain/agent.py
@@ -0,0 +1,694 @@
+"""
+LangChain Agent
+
+Main agent creation module for tool-driven chat execution.
+"""
+
+import logging
+from typing import Any, Dict, Optional
+
+from agent_server.langchain.tools import (
+    final_answer_tool,
+    jupyter_cell_tool,
+    list_files_tool,
+    markdown_tool,
+    read_file_tool,
+    search_notebook_cells_tool,
+    search_workspace_tool,
+    write_file_tool,
+)
+
+logger = logging.getLogger(__name__)
+
+
+def _create_llm(llm_config: Dict[str, Any]):
+    """Create LangChain LLM from config"""
+    provider = llm_config.get("provider", "gemini")
+
+    if provider == "gemini":
+        from langchain_google_genai import ChatGoogleGenerativeAI
+
+        gemini_config = llm_config.get("gemini", {})
+        api_key = gemini_config.get("apiKey")
+        model = gemini_config.get("model", "gemini-2.5-pro")
+
+        if not api_key:
+            raise ValueError("Gemini API key not configured")
+
+        logger.info(f"Creating Gemini LLM with model: {model}")
+
+        # Gemini 2.5 Flash has issues with tool calling in LangChain
+        # Use convert_system_message_to_human for better compatibility
+        llm = ChatGoogleGenerativeAI(
+            model=model,
+            google_api_key=api_key,
+            temperature=0.0,
+            max_output_tokens=8192,
+            convert_system_message_to_human=True,  # Better tool calling support
+        )
+        return llm
+
+    elif provider == "openai":
+        from langchain_openai import ChatOpenAI
+
+        openai_config = llm_config.get("openai", {})
+        api_key = openai_config.get("apiKey")
+        model = openai_config.get("model", "gpt-4")
+
+        if not api_key:
+            raise ValueError("OpenAI API key not configured")
+
+        llm = ChatOpenAI(
+            model=model,
+            api_key=api_key,
+            temperature=0.0,
+            max_tokens=4096,
+        )
+        return llm
+
+    elif provider == "vllm":
+        from langchain_openai import ChatOpenAI
+
+        vllm_config = llm_config.get("vllm", {})
+        endpoint = vllm_config.get("endpoint", "http://localhost:8000")
+        model = vllm_config.get("model", "default")
+        api_key = vllm_config.get("apiKey", "dummy")
+
+        llm = ChatOpenAI(
+            model=model,
+            api_key=api_key,
+            base_url=f"{endpoint}/v1",
+            temperature=0.0,
+            max_tokens=4096,
+        )
+        return llm
+
+    else:
+        raise ValueError(f"Unsupported LLM provider: {provider}")
+
+
+def _get_all_tools():
+    """Get all available tools for the agent"""
+    return [
+        jupyter_cell_tool,
+        markdown_tool,
+        final_answer_tool,
+        read_file_tool,
+        write_file_tool,
+        list_files_tool,
+        search_workspace_tool,
+        search_notebook_cells_tool,
+    ]
+
+
+def create_simple_chat_agent(
+    llm_config: Dict[str, Any],
+    workspace_root: str = ".",
+    enable_hitl: bool = True,
+    enable_todo_list: bool = True,
+    checkpointer: Optional[object] = None,
+):
+    """
+    Create a simple chat agent using LangChain's create_agent with Human-in-the-Loop.
+
+    This is a simplified version for chat mode that uses LangChain's built-in
+    HumanInTheLoopMiddleware and TodoListMiddleware.
+
+    Args:
+        llm_config: LLM configuration
+        workspace_root: Root directory
+        enable_hitl: Enable Human-in-the-Loop for code execution
+        enable_todo_list: Enable TodoListMiddleware for task planning
+
+    Returns:
+        Configured agent with HITL and TodoList middleware
+    """
+    try:
+        from langchain.agents import create_agent
+        from langchain.agents.middleware import (
+            AgentMiddleware,
+            HumanInTheLoopMiddleware,
+            ModelCallLimitMiddleware,
+            ModelRequest,
+            ModelResponse,
+            TodoListMiddleware,
+            ToolCallLimitMiddleware,
+            wrap_model_call,
+        )
+        from langchain_core.messages import AIMessage, ToolMessage as LCToolMessage
+        from langgraph.checkpoint.memory import InMemorySaver
+        from langgraph.types import Overwrite
+    except ImportError as e:
+        logger.error(f"Failed to import LangChain agent components: {e}")
+        raise ImportError(
+            "LangChain agent components not available. "
+            "Install with: pip install langchain langgraph"
+        ) from e
+
+    # Create LLM
+    llm = _create_llm(llm_config)
+
+    # Get tools
+    tools = _get_all_tools()
+
+    # Configure middleware
+    middleware = []
+
+    # JSON Schema for fallback tool calling
+    JSON_TOOL_SCHEMA = """You MUST respond with ONLY valid JSON matching this schema:
+{
+  "tool": "<tool_name>",
+  "arguments": {"arg1": "value1", ...}
+}
+
+Available tools:
+- jupyter_cell_tool: Execute Python code. Arguments: {"code": "<python_code>"}
+- markdown_tool: Add markdown cell. Arguments: {"content": "<markdown>"}
+- final_answer_tool: Complete task. Arguments: {"answer": "<summary>"}
+- write_todos: Update task list. Arguments: {"todos": [{"content": "...", "status": "pending|in_progress|completed"}]}
+- read_file_tool: Read file. Arguments: {"path": "<file_path>"}
+- list_files_tool: List directory. Arguments: {"path": "."}
+
+Output ONLY the JSON object, no markdown, no explanation."""
+
+    def _parse_json_tool_call(text: str) -> Optional[Dict[str, Any]]:
+        """Parse JSON tool call from text response."""
+        import json
+        import re
+
+        if not text:
+            return None
+
+        # Clean up response
+        text = text.strip()
+        if text.startswith("```json"):
+            text = text[7:]
+        elif text.startswith("```"):
+            text = text[3:]
+        if text.endswith("```"):
+            text = text[:-3]
+        text = text.strip()
+
+        # Try direct JSON parse
+        try:
+            data = json.loads(text)
+            if "tool" in data:
+                return data
+        except json.JSONDecodeError:
+            pass
+
+        # Try to find JSON object in response
+        json_match = re.search(r'\{[\s\S]*\}', text)
+        if json_match:
+            try:
+                data = json.loads(json_match.group())
+                if "tool" in data:
+                    return data
+            except json.JSONDecodeError:
+                pass
+
+        return None
+
+    def _create_tool_call_message(tool_name: str, arguments: Dict[str, Any]) -> AIMessage:
+        """Create AIMessage with tool_calls from parsed JSON."""
+        import uuid
+
+        # Normalize tool name
+        if not tool_name.endswith("_tool"):
+            tool_name = f"{tool_name}_tool"
+
+        return AIMessage(
+            content="",
+            tool_calls=[
+                {
+                    "name": tool_name,
+                    "args": arguments,
+                    "id": str(uuid.uuid4()),
+                    "type": "tool_call",
+                }
+            ],
+        )
+
+    # Middleware to detect and handle empty LLM responses with JSON fallback
+    @wrap_model_call
+    def handle_empty_response(
+        request: ModelRequest,
+        handler,
+    ) -> ModelResponse:
+        """
+        Detect empty/invalid AIMessage responses and retry with JSON schema fallback.
+
+        For models that don't support native tool calling well (e.g., Gemini 2.5 Flash),
+        this middleware:
+        1. Detects empty or text-only responses (no tool_calls)
+        2. Retries with JSON schema prompt to force structured output
+        3. Parses JSON response and injects tool_calls into AIMessage
+        4. Falls back to synthetic final_answer if all else fails
+        """
+        import json
+        import uuid
+        from langchain_core.messages import HumanMessage
+
+        max_retries = 2  # Allow more retries for JSON fallback
+
+        for attempt in range(max_retries + 1):
+            response = handler(request)
+
+            # Extract AIMessage from response
+            response_message = None
+            if hasattr(response, 'result'):
+                result = response.result
+                if isinstance(result, list):
+                    for msg in reversed(result):
+                        if isinstance(msg, AIMessage):
+                            response_message = msg
+                            break
+                elif isinstance(result, AIMessage):
+                    response_message = result
+            elif hasattr(response, 'message'):
+                response_message = response.message
+            elif hasattr(response, 'messages') and response.messages:
+                response_message = response.messages[-1]
+            elif isinstance(response, AIMessage):
+                response_message = response
+
+            has_content = bool(getattr(response_message, 'content', None)) if response_message else False
+            has_tool_calls = bool(getattr(response_message, 'tool_calls', None)) if response_message else False
+
+            logger.info(
+                "handle_empty_response: attempt=%d, type=%s, content=%s, tool_calls=%s",
+                attempt + 1,
+                type(response_message).__name__ if response_message else None,
+                has_content,
+                has_tool_calls,
+            )
+
+            # Valid response with tool_calls
+            if has_tool_calls:
+                return response
+
+            # Try to parse JSON from content (model might have output JSON without tool_calls)
+            if has_content and response_message:
+                parsed = _parse_json_tool_call(response_message.content)
+                if parsed:
+                    tool_name = parsed.get("tool", "")
+                    arguments = parsed.get("arguments", {})
+                    logger.info(
+                        "Parsed JSON tool call from content: tool=%s",
+                        tool_name,
+                    )
+
+                    # Create new AIMessage with tool_calls
+                    new_message = _create_tool_call_message(tool_name, arguments)
+
+                    # Replace in response
+                    if hasattr(response, 'result'):
+                        if isinstance(response.result, list):
+                            new_result = [
+                                new_message if isinstance(m, AIMessage) else m
+                                for m in response.result
+                            ]
+                            response.result = new_result
+                        else:
+                            response.result = new_message
+                    return response
+
+            # Invalid response - retry with JSON schema prompt
+            if response_message and attempt < max_retries:
+                reason = "text-only" if has_content else "empty"
+                logger.warning(
+                    "Invalid AIMessage (%s) detected (attempt %d/%d). "
+                    "Retrying with JSON schema prompt...",
+                    reason,
+                    attempt + 1,
+                    max_retries + 1,
+                )
+
+                # Get context for prompt
+                todos = request.state.get("todos", [])
+                pending_todos = [
+                    t for t in todos
+                    if t.get("status") in ("pending", "in_progress")
+                ]
+
+                # Build JSON-forcing prompt
+                if has_content:
+                    # LLM wrote text - ask to wrap in final_answer
+                    content_preview = response_message.content[:300]
+                    json_prompt = (
+                        f"{JSON_TOOL_SCHEMA}\n\n"
+                        f"Your previous response was text, not JSON. "
+                        f"Wrap your answer in final_answer_tool:\n"
+                        f'{{"tool": "final_answer_tool", "arguments": {{"answer": "{content_preview}..."}}}}'
+                    )
+                elif pending_todos:
+                    todo_list = ", ".join(t.get("content", "")[:20] for t in pending_todos[:3])
+                    example_json = '{"tool": "jupyter_cell_tool", "arguments": {"code": "import pandas as pd\\ndf = pd.read_csv(\'titanic.csv\')\\nprint(df.head())"}}'
+                    json_prompt = (
+                        f"{JSON_TOOL_SCHEMA}\n\n"
+                        f"Pending tasks: {todo_list}\n"
+                        f"Call jupyter_cell_tool with Python code to complete the next task.\n"
+                        f"Example: {example_json}"
+                    )
+                else:
+                    json_prompt = (
+                        f"{JSON_TOOL_SCHEMA}\n\n"
+                        f"All tasks completed. Call final_answer_tool:\n"
+                        f'{{"tool": "final_answer_tool", "arguments": {{"answer": "작업이 완료되었습니다."}}}}'
+                    )
+
+                # Add JSON prompt and retry
+                request = request.override(
+                    messages=request.messages + [
+                        HumanMessage(content=json_prompt)
+                    ]
+                )
+                continue
+
+            # Max retries exhausted - synthesize final_answer
+            if response_message:
+                logger.warning(
+                    "Max retries exhausted. Synthesizing final_answer response."
+                )
+
+                # Use LLM's text content if available
+                if has_content and response_message.content:
+                    summary = response_message.content
+                    logger.info(
+                        "Using LLM's text content as final answer (length=%d)",
+                        len(summary),
+                    )
+                else:
+                    todos = request.state.get("todos", [])
+                    completed_todos = [
+                        t.get("content", "") for t in todos
+                        if t.get("status") == "completed"
+                    ]
+                    summary = (
+                        f"작업이 완료되었습니다. 완료된 항목: {', '.join(completed_todos[:5])}"
+                        if completed_todos
+                        else "작업이 완료되었습니다."
+                    )
+
+                # Create synthetic final_answer
+                synthetic_message = AIMessage(
+                    content="",
+                    tool_calls=[
+                        {
+                            "name": "final_answer_tool",
+                            "args": {"answer": summary},
+                            "id": str(uuid.uuid4()),
+                            "type": "tool_call",
+                        }
+                    ],
+                )
+
+                # Replace in response
+                if hasattr(response, 'result'):
+                    if isinstance(response.result, list):
+                        new_result = []
+                        replaced = False
+                        for msg in response.result:
+                            if isinstance(msg, AIMessage) and not replaced:
+                                new_result.append(synthetic_message)
+                                replaced = True
+                            else:
+                                new_result.append(msg)
+                        if not replaced:
+                            new_result.append(synthetic_message)
+                        response.result = new_result
+                    else:
+                        response.result = synthetic_message
+
+                return response
+
+            # Return response (either valid or after max retries)
+            return response
+
+        return response
+
+    middleware.append(handle_empty_response)
+
+    # Non-HITL tools that execute immediately without user approval
+    NON_HITL_TOOLS = {
+        "markdown_tool", "markdown",
+        "read_file_tool", "read_file",
+        "list_files_tool", "list_files",
+        "search_workspace_tool", "search_workspace",
+        "search_notebook_cells_tool", "search_notebook_cells",
+        "write_todos",
+    }
+
+    # Middleware to inject continuation prompt after non-HITL tool execution
+    @wrap_model_call
+    def inject_continuation_after_non_hitl_tool(
+        request: ModelRequest,
+        handler,
+    ) -> ModelResponse:
+        """
+        Inject a continuation prompt when the last message is from a non-HITL tool.
+
+        Non-HITL tools execute immediately without user approval, which can cause
+        Gemini to produce empty responses. This middleware injects a system message
+        to remind the LLM to continue with the next action.
+        """
+        messages = request.messages
+        if not messages:
+            return handler(request)
+
+        # Check if the last message is a ToolMessage from a non-HITL tool
+        last_msg = messages[-1]
+        if getattr(last_msg, "type", "") == "tool":
+            tool_name = getattr(last_msg, "name", "") or ""
+
+            # Also try to extract tool name from content
+            if not tool_name:
+                try:
+                    import json
+                    content_json = json.loads(last_msg.content)
+                    tool_name = content_json.get("tool", "")
+                except (json.JSONDecodeError, TypeError, AttributeError):
+                    pass
+
+            if tool_name in NON_HITL_TOOLS:
+                logger.info(
+                    "Injecting continuation prompt after non-HITL tool: %s",
+                    tool_name,
+                )
+
+                # Get todos context
+                todos = request.state.get("todos", [])
+                pending_todos = [
+                    t for t in todos
+                    if t.get("status") in ("pending", "in_progress")
+                ]
+
+                if pending_todos:
+                    pending_list = ", ".join(
+                        t.get("content", "")[:30] for t in pending_todos[:3]
+                    )
+                    continuation = (
+                        f"Tool '{tool_name}' completed. "
+                        f"Continue with pending tasks: {pending_list}. "
+                        f"Call jupyter_cell_tool or the next appropriate tool."
+                    )
+                else:
+                    continuation = (
+                        f"Tool '{tool_name}' completed. All tasks done. "
+                        f"Call final_answer_tool with a summary NOW."
+                    )
+
+                # Inject as a system-like user message
+                from langchain_core.messages import HumanMessage
+                new_messages = list(messages) + [
+                    HumanMessage(content=f"[SYSTEM] {continuation}")
+                ]
+                request = request.override(messages=new_messages)
+
+        return handler(request)
+
+    middleware.append(inject_continuation_after_non_hitl_tool)
+
+    class PatchToolCallsMiddleware(AgentMiddleware):
+        """Patch dangling tool calls so the agent can continue."""
+
+        def before_agent(self, state, runtime):
+            messages = state.get("messages", [])
+            if not messages:
+                return None
+
+            patched = []
+            for i, msg in enumerate(messages):
+                patched.append(msg)
+                if getattr(msg, "type", "") == "ai" and getattr(
+                    msg, "tool_calls", None
+                ):
+                    for tool_call in msg.tool_calls:
+                        tool_call_id = tool_call.get("id")
+                        if not tool_call_id:
+                            continue
+                        has_tool_msg = any(
+                            (
+                                getattr(m, "type", "") == "tool"
+                                and getattr(m, "tool_call_id", None) == tool_call_id
+                            )
+                            for m in messages[i:]
+                        )
+                        if not has_tool_msg:
+                            tool_msg = (
+                                f"Tool call {tool_call.get('name', 'unknown')} with id {tool_call_id} "
+                                "was cancelled - another message came in before it could be completed."
+                            )
+                            patched.append(
+                                LCToolMessage(
+                                    content=tool_msg,
+                                    name=tool_call.get("name", "unknown"),
+                                    tool_call_id=tool_call_id,
+                                )
+                            )
+
+            if patched == messages:
+                return None
+            return {"messages": Overwrite(patched)}
+
+    middleware.append(PatchToolCallsMiddleware())
+
+    # Add TodoListMiddleware for task planning
+    if enable_todo_list:
+        todo_middleware = TodoListMiddleware(
+            system_prompt="""
+## CRITICAL WORKFLOW RULES - MUST FOLLOW:
+1. NEVER stop after calling write_todos - ALWAYS make another tool call immediately
+2. write_todos is ONLY for tracking progress - it does NOT complete any work
+3. After EVERY write_todos call, you MUST call another tool (jupyter_cell_tool, markdown_tool, or final_answer_tool)
+
+## Todo List Management:
+- Before complex tasks, use write_todos to create a task list
+- Update todos as you complete each step (mark 'in_progress' → 'completed')
+- Each todo item should be specific and descriptive (10-50 characters)
+- All todo items must be written in Korean
+- ALWAYS include "다음 단계 제시" as the LAST item
+
+## Task Completion Flow:
+1. When current task is done → mark it 'completed' with write_todos
+2. IMMEDIATELY call the next tool (jupyter_cell_tool for code, markdown_tool for text)
+3. For "다음 단계 제시" → mark completed, then call final_answer_tool with suggestions
+4. NEVER end your turn after write_todos - you MUST continue with actual work
+
+## FORBIDDEN PATTERNS:
+❌ Calling write_todos and then stopping
+❌ Updating todo status without doing the actual work
+❌ Ending turn without calling final_answer_tool when all tasks are done
+""",
+            tool_description="""Update the task list for tracking progress.
+⚠️ CRITICAL: This tool is ONLY for tracking - it does NOT do any actual work.
+After calling this tool, you MUST IMMEDIATELY call another tool (jupyter_cell_tool, markdown_tool, or final_answer_tool).
+NEVER end your response after calling write_todos - always continue with the next action tool.""",
+        )
+        middleware.append(todo_middleware)
+
+    if enable_hitl:
+        # Add Human-in-the-Loop middleware for code execution
+        hitl_middleware = HumanInTheLoopMiddleware(
+            interrupt_on={
+                # Require approval before executing code
+                "jupyter_cell_tool": {
+                    "allowed_decisions": ["approve", "edit", "reject"],
+                    "description": "🔍 Code execution requires approval",
+                },
+                # Safe operations - no approval needed
+                "markdown_tool": False,
+                "read_file_tool": False,
+                "list_files_tool": False,
+                "search_workspace_tool": False,
+                "search_notebook_cells_tool": False,
+                "write_todos": False,  # Todo updates don't need approval
+                # File write requires approval
+                "write_file_tool": {
+                    "allowed_decisions": ["approve", "edit", "reject"],
+                    "description": "⚠️ File write requires approval",
+                },
+                # Final answer doesn't need approval
+                "final_answer_tool": False,
+            },
+            description_prefix="Tool execution pending approval",
+        )
+        middleware.append(hitl_middleware)
+
+    # Add loop prevention middleware
+    # ModelCallLimitMiddleware: Prevent infinite LLM calls
+    model_limit_middleware = ModelCallLimitMiddleware(
+        run_limit=30,  # Max 30 LLM calls per user message
+        exit_behavior="end",  # Gracefully end when limit reached
+    )
+    middleware.append(model_limit_middleware)
+    logger.info("Added ModelCallLimitMiddleware with run_limit=30")
+
+    # ToolCallLimitMiddleware: Prevent specific tools from being called too many times
+    # Limit write_todos to prevent the loop we observed
+    write_todos_limit = ToolCallLimitMiddleware(
+        tool_name="write_todos",
+        run_limit=5,  # Max 5 write_todos calls per user message
+        exit_behavior="continue",  # Let agent continue with other tools
+    )
+    middleware.append(write_todos_limit)
+
+    # Limit list_files_tool to prevent excessive directory listing
+    list_files_limit = ToolCallLimitMiddleware(
+        tool_name="list_files_tool",
+        run_limit=5,  # Max 5 list_files calls per user message
+        exit_behavior="continue",
+    )
+    middleware.append(list_files_limit)
+    logger.info("Added ToolCallLimitMiddleware for write_todos and list_files_tool")
+
+    # System prompt for the agent
+    system_prompt = """You are an expert Python data scientist and Jupyter notebook assistant.
+Your role is to help users with data analysis, visualization, and Python coding tasks in Jupyter notebooks.
+
+## ⚠️ CRITICAL RULE: NEVER produce an empty response
+
+You MUST ALWAYS call a tool in every response. After any tool result, you MUST:
+1. Check your todo list - are there pending or in_progress items?
+2. If YES → call the next appropriate tool (jupyter_cell_tool, markdown_tool, etc.)
+3. If ALL todos are completed → call final_answer_tool with a summary
+
+NEVER end your turn without calling a tool. NEVER produce an empty response.
+
+## Available Tools
+1. **jupyter_cell_tool**: Execute Python code in a new notebook cell
+2. **markdown_tool**: Add a markdown explanation cell
+3. **final_answer_tool**: Complete the task with a summary - REQUIRED when done
+4. **read_file_tool**: Read file contents
+5. **write_file_tool**: Write file contents
+6. **list_files_tool**: List directory contents
+7. **search_workspace_tool**: Search for patterns in workspace files
+8. **search_notebook_cells_tool**: Search for patterns in notebook cells
+9. **write_todos**: Create and update task list for complex multi-step tasks
+
+## Mandatory Workflow
+1. After EVERY tool result, immediately call the next tool
+2. Continue until ALL todos show status: "completed"
+3. ONLY THEN call final_answer_tool to summarize
+4. If `!pip install` fails, use `!pip3 install` instead
+5. For plots and charts, use English text only
+
+## ❌ FORBIDDEN (will break the workflow)
+- Producing an empty response (no tool call, no content)
+- Stopping after any tool without calling the next tool
+- Ending without calling final_answer_tool
+- Leaving todos in "in_progress" or "pending" state without continuing
+"""
+
+    logger.info("SimpleChatAgent system_prompt: %s", system_prompt)
+
+    # Create agent with checkpointer (required for HITL)
+    agent = create_agent(
+        model=llm,
+        tools=tools,
+        middleware=middleware,
+        checkpointer=checkpointer or InMemorySaver(),  # Required for interrupt/resume
+        system_prompt=system_prompt,  # Tell the agent to use tools
+    )
+
+    return agent
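
For orientation, a minimal usage sketch of the new create_simple_chat_agent entry point follows. The sketch is not part of the package: the llm_config keys mirror what _create_llm reads above, the invoke()/thread_id call follows the standard LangGraph convention for checkpointed graphs, and the API key, thread id, and question are placeholders.

# Hypothetical usage sketch; not shipped in the package. The llm_config keys
# mirror what _create_llm reads; the invoke()/thread_id pattern is the standard
# LangGraph convention for checkpointed graphs. Key, thread id, and question
# are placeholders.
from agent_server.langchain.agent import create_simple_chat_agent

llm_config = {
    "provider": "gemini",  # "openai" and "vllm" are also handled by _create_llm
    "gemini": {"apiKey": "YOUR_API_KEY", "model": "gemini-2.5-pro"},
}

agent = create_simple_chat_agent(
    llm_config,
    enable_hitl=False,      # True pauses jupyter_cell_tool/write_file_tool for approval
    enable_todo_list=True,  # exposes write_todos for multi-step planning
)

# The agent is a checkpointed LangGraph graph, so each conversation is keyed
# by a thread_id in the run config.
result = agent.invoke(
    {"messages": [{"role": "user", "content": "Load titanic.csv and show df.head()"}]},
    config={"configurable": {"thread_id": "demo-thread"}},
)
print(result["messages"][-1].content)

With enable_hitl=True the run instead stops at an interrupt before jupyter_cell_tool or write_file_tool executes and must be resumed with an approve, edit, or reject decision, which is why create_agent is always given a checkpointer (InMemorySaver by default).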