PyPI - gobby - Versions diffs - 0.2.8__py3-none-any.whl → 0.2.11__py3-none-any.whl - Mend

gobby 0.2.8__py3-none-any.whl → 0.2.11__py3-none-any.whl

This diff shows the changes between the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (168) hide show

gobby/__init__.py +1 -1
gobby/adapters/__init__.py +6 -0
gobby/adapters/base.py +11 -2
gobby/adapters/claude_code.py +5 -28
gobby/adapters/codex_impl/adapter.py +38 -43
gobby/adapters/copilot.py +324 -0
gobby/adapters/cursor.py +373 -0
gobby/adapters/gemini.py +2 -26
gobby/adapters/windsurf.py +359 -0
gobby/agents/definitions.py +162 -2
gobby/agents/isolation.py +33 -1
gobby/agents/pty_reader.py +192 -0
gobby/agents/registry.py +10 -1
gobby/agents/runner.py +24 -8
gobby/agents/sandbox.py +8 -3
gobby/agents/session.py +4 -0
gobby/agents/spawn.py +9 -2
gobby/agents/spawn_executor.py +49 -61
gobby/agents/spawners/command_builder.py +4 -4
gobby/app_context.py +64 -0
gobby/cli/__init__.py +4 -0
gobby/cli/install.py +259 -4
gobby/cli/installers/__init__.py +12 -0
gobby/cli/installers/copilot.py +242 -0
gobby/cli/installers/cursor.py +244 -0
gobby/cli/installers/shared.py +3 -0
gobby/cli/installers/windsurf.py +242 -0
gobby/cli/pipelines.py +639 -0
gobby/cli/sessions.py +3 -1
gobby/cli/skills.py +209 -0
gobby/cli/tasks/crud.py +6 -5
gobby/cli/tasks/search.py +1 -1
gobby/cli/ui.py +116 -0
gobby/cli/utils.py +5 -17
gobby/cli/workflows.py +38 -17
gobby/config/app.py +5 -0
gobby/config/features.py +0 -20
gobby/config/skills.py +23 -2
gobby/config/tasks.py +4 -0
gobby/hooks/broadcaster.py +9 -0
gobby/hooks/event_handlers/__init__.py +155 -0
gobby/hooks/event_handlers/_agent.py +175 -0
gobby/hooks/event_handlers/_base.py +92 -0
gobby/hooks/event_handlers/_misc.py +66 -0
gobby/hooks/event_handlers/_session.py +487 -0
gobby/hooks/event_handlers/_tool.py +196 -0
gobby/hooks/events.py +48 -0
gobby/hooks/hook_manager.py +27 -3
gobby/install/copilot/hooks/hook_dispatcher.py +203 -0
gobby/install/cursor/hooks/hook_dispatcher.py +203 -0
gobby/install/gemini/hooks/hook_dispatcher.py +8 -0
gobby/install/windsurf/hooks/hook_dispatcher.py +205 -0
gobby/llm/__init__.py +14 -1
gobby/llm/claude.py +594 -43
gobby/llm/service.py +149 -0
gobby/mcp_proxy/importer.py +4 -41
gobby/mcp_proxy/instructions.py +9 -27
gobby/mcp_proxy/manager.py +13 -3
gobby/mcp_proxy/models.py +1 -0
gobby/mcp_proxy/registries.py +66 -5
gobby/mcp_proxy/server.py +6 -2
gobby/mcp_proxy/services/recommendation.py +2 -28
gobby/mcp_proxy/services/tool_filter.py +7 -0
gobby/mcp_proxy/services/tool_proxy.py +19 -1
gobby/mcp_proxy/stdio.py +37 -21
gobby/mcp_proxy/tools/agents.py +7 -0
gobby/mcp_proxy/tools/artifacts.py +3 -3
gobby/mcp_proxy/tools/hub.py +30 -1
gobby/mcp_proxy/tools/orchestration/cleanup.py +5 -5
gobby/mcp_proxy/tools/orchestration/monitor.py +1 -1
gobby/mcp_proxy/tools/orchestration/orchestrate.py +8 -3
gobby/mcp_proxy/tools/orchestration/review.py +17 -4
gobby/mcp_proxy/tools/orchestration/wait.py +7 -7
gobby/mcp_proxy/tools/pipelines/__init__.py +254 -0
gobby/mcp_proxy/tools/pipelines/_discovery.py +67 -0
gobby/mcp_proxy/tools/pipelines/_execution.py +281 -0
gobby/mcp_proxy/tools/sessions/_crud.py +4 -4
gobby/mcp_proxy/tools/sessions/_handoff.py +1 -1
gobby/mcp_proxy/tools/skills/__init__.py +184 -30
gobby/mcp_proxy/tools/spawn_agent.py +229 -14
gobby/mcp_proxy/tools/task_readiness.py +27 -4
gobby/mcp_proxy/tools/tasks/_context.py +8 -0
gobby/mcp_proxy/tools/tasks/_crud.py +27 -1
gobby/mcp_proxy/tools/tasks/_helpers.py +1 -1
gobby/mcp_proxy/tools/tasks/_lifecycle.py +125 -8
gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +2 -1
gobby/mcp_proxy/tools/tasks/_search.py +1 -1
gobby/mcp_proxy/tools/workflows/__init__.py +273 -0
gobby/mcp_proxy/tools/workflows/_artifacts.py +225 -0
gobby/mcp_proxy/tools/workflows/_import.py +112 -0
gobby/mcp_proxy/tools/workflows/_lifecycle.py +332 -0
gobby/mcp_proxy/tools/workflows/_query.py +226 -0
gobby/mcp_proxy/tools/workflows/_resolution.py +78 -0
gobby/mcp_proxy/tools/workflows/_terminal.py +175 -0
gobby/mcp_proxy/tools/worktrees.py +54 -15
gobby/memory/components/__init__.py +0 -0
gobby/memory/components/ingestion.py +98 -0
gobby/memory/components/search.py +108 -0
gobby/memory/context.py +5 -5
gobby/memory/manager.py +16 -25
gobby/paths.py +51 -0
gobby/prompts/loader.py +1 -35
gobby/runner.py +131 -16
gobby/servers/http.py +193 -150
gobby/servers/routes/__init__.py +2 -0
gobby/servers/routes/admin.py +56 -0
gobby/servers/routes/mcp/endpoints/execution.py +33 -32
gobby/servers/routes/mcp/endpoints/registry.py +8 -8
gobby/servers/routes/mcp/hooks.py +10 -1
gobby/servers/routes/pipelines.py +227 -0
gobby/servers/websocket.py +314 -1
gobby/sessions/analyzer.py +89 -3
gobby/sessions/manager.py +5 -5
gobby/sessions/transcripts/__init__.py +3 -0
gobby/sessions/transcripts/claude.py +5 -0
gobby/sessions/transcripts/codex.py +5 -0
gobby/sessions/transcripts/gemini.py +5 -0
gobby/skills/hubs/__init__.py +25 -0
gobby/skills/hubs/base.py +234 -0
gobby/skills/hubs/claude_plugins.py +328 -0
gobby/skills/hubs/clawdhub.py +289 -0
gobby/skills/hubs/github_collection.py +465 -0
gobby/skills/hubs/manager.py +263 -0
gobby/skills/hubs/skillhub.py +342 -0
gobby/skills/parser.py +23 -0
gobby/skills/sync.py +5 -4
gobby/storage/artifacts.py +19 -0
gobby/storage/memories.py +4 -4
gobby/storage/migrations.py +118 -3
gobby/storage/pipelines.py +367 -0
gobby/storage/sessions.py +23 -4
gobby/storage/skills.py +48 -8
gobby/storage/tasks/_aggregates.py +2 -2
gobby/storage/tasks/_lifecycle.py +4 -4
gobby/storage/tasks/_models.py +7 -1
gobby/storage/tasks/_queries.py +3 -3
gobby/sync/memories.py +4 -3
gobby/tasks/commits.py +48 -17
gobby/tasks/external_validator.py +4 -17
gobby/tasks/validation.py +13 -87
gobby/tools/summarizer.py +18 -51
gobby/utils/status.py +13 -0
gobby/workflows/actions.py +80 -0
gobby/workflows/context_actions.py +265 -27
gobby/workflows/definitions.py +119 -1
gobby/workflows/detection_helpers.py +23 -11
gobby/workflows/enforcement/__init__.py +11 -1
gobby/workflows/enforcement/blocking.py +96 -0
gobby/workflows/enforcement/handlers.py +35 -1
gobby/workflows/enforcement/task_policy.py +18 -0
gobby/workflows/engine.py +26 -4
gobby/workflows/evaluator.py +8 -5
gobby/workflows/lifecycle_evaluator.py +59 -27
gobby/workflows/loader.py +567 -30
gobby/workflows/lobster_compat.py +147 -0
gobby/workflows/pipeline_executor.py +801 -0
gobby/workflows/pipeline_state.py +172 -0
gobby/workflows/pipeline_webhooks.py +206 -0
gobby/workflows/premature_stop.py +5 -0
gobby/worktrees/git.py +135 -20
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/METADATA +56 -22
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/RECORD +166 -122
gobby/hooks/event_handlers.py +0 -1008
gobby/mcp_proxy/tools/workflows.py +0 -1023
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/WHEEL +0 -0
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/entry_points.txt +0 -0
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/licenses/LICENSE.md +0 -0
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/top_level.txt +0 -0

gobby/llm/claude.py CHANGED Viewed

@@ -1,5 +1,9 @@
 """
 Claude implementation of LLMProvider.
+Supports two authentication modes:
+- subscription: Uses Claude Agent SDK via Claude CLI (requires CLI installed)
+- api_key: Uses LiteLLM with anthropic/ prefix (BYOK, no CLI needed)
 """
 import asyncio
@@ -8,8 +12,9 @@ import logging
 import os
 import shutil
 import time
+from collections.abc import AsyncIterator
 from dataclasses import dataclass, field
-from typing import Any
+from typing import Any, Literal, cast
 from claude_agent_sdk import (
     AssistantMessage,
@@ -26,6 +31,9 @@ from claude_agent_sdk import (
 from gobby.config.app import DaemonConfig
 from gobby.llm.base import LLMProvider
+# Type alias for auth mode
+AuthMode = Literal["subscription", "api_key"]
 @dataclass
 class ToolCall:
@@ -55,14 +63,82 @@ class MCPToolResult:
     """List of tool calls made during generation."""
+# Streaming event types for stream_with_mcp_tools
+@dataclass
+class TextChunk:
+    """A chunk of text from the streaming response."""
+    content: str
+    """The text content."""
+@dataclass
+class ToolCallEvent:
+    """Event when a tool is being called."""
+    tool_call_id: str
+    """Unique ID for this tool call."""
+    tool_name: str
+    """Full tool name (e.g., mcp__gobby-tasks__create_task)."""
+    server_name: str
+    """Extracted server name (e.g., gobby-tasks)."""
+    arguments: dict[str, Any]
+    """Arguments passed to the tool."""
+@dataclass
+class ToolResultEvent:
+    """Event when a tool call completes."""
+    tool_call_id: str
+    """ID matching the original ToolCallEvent."""
+    success: bool
+    """Whether the tool call succeeded."""
+    result: Any = None
+    """Result data if successful."""
+    error: str | None = None
+    """Error message if failed."""
+@dataclass
+class DoneEvent:
+    """Event when streaming is complete."""
+    tool_calls_count: int
+    """Total number of tool calls made."""
+    cost_usd: float | None = None
+    """Cost in USD if available."""
+    duration_ms: float | None = None
+    """Duration in milliseconds if available."""
+# Union type for all streaming events
+ChatEvent = TextChunk | ToolCallEvent | ToolResultEvent | DoneEvent
 logger = logging.getLogger(__name__)
 class ClaudeLLMProvider(LLMProvider):
     """
-    Claude implementation of LLMProvider using claude_agent_sdk.
+    Claude implementation of LLMProvider.
+    Supports two authentication modes:
+    - subscription (default): Uses Claude Agent SDK via Claude CLI
+    - api_key: Uses LiteLLM with anthropic/ prefix (BYOK, no CLI needed)
-    Uses subscription-based authentication through Claude CLI.
+    The auth_mode is determined by:
+    1. Constructor parameter (highest priority)
+    2. Config file: llm_providers.claude.auth_mode
+    3. Default: "subscription"
     """
     @property
@@ -70,16 +146,40 @@ class ClaudeLLMProvider(LLMProvider):
         """Return provider name."""
         return "claude"
-    def __init__(self, config: DaemonConfig):
+    @property
+    def auth_mode(self) -> AuthMode:
+        """Return current authentication mode."""
+        return self._auth_mode
+    def __init__(
+        self,
+        config: DaemonConfig,
+        auth_mode: AuthMode | None = None,
+    ):
         """
         Initialize ClaudeLLMProvider.
         Args:
             config: Client configuration.
+            auth_mode: Authentication mode override. If None, uses config or default.
         """
         self.config = config
         self.logger = logger
-        self._claude_cli_path = self._find_cli_path()
+        self._litellm: Any = None
+        # Determine auth mode from param -> config -> default
+        self._auth_mode: AuthMode = "subscription"
+        if auth_mode:
+            self._auth_mode = auth_mode
+        elif config.llm_providers and config.llm_providers.claude:
+            self._auth_mode = config.llm_providers.claude.auth_mode  # type: ignore[assignment]
+        # Set up based on auth mode
+        if self._auth_mode == "subscription":
+            self._claude_cli_path = self._find_cli_path()
+        else:  # api_key
+            self._claude_cli_path = None
+            self._setup_litellm()
     def _find_cli_path(self) -> str | None:
         """
@@ -147,17 +247,37 @@ class ClaudeLLMProvider(LLMProvider):
         return cli_path
-    async def generate_summary(
-        self, context: dict[str, Any], prompt_template: str | None = None
-    ) -> str:
+    def _setup_litellm(self) -> None:
         """
-        Generate session summary using Claude.
+        Initialize LiteLLM for api_key mode.
+        LiteLLM reads ANTHROPIC_API_KEY from the environment automatically.
         """
-        cli_path = self._verify_cli_path()
-        if not cli_path:
-            return "Session summary unavailable (Claude CLI not found)"
+        try:
+            import litellm
-        # Build formatted context for prompt template
+            self._litellm = litellm
+            self.logger.debug("LiteLLM initialized for Claude api_key mode")
+        except ImportError:
+            self.logger.error("litellm package required for api_key mode")
+    def _format_summary_context(self, context: dict[str, Any], prompt_template: str | None) -> str:
+        """
+        Format context and validate prompt template for summary generation.
+        Transforms list/dict values to strings for template substitution
+        and validates that a prompt template is provided.
+        Args:
+            context: Raw context dict with transcript_summary, last_messages, etc.
+            prompt_template: Template string with placeholders for context values.
+        Returns:
+            Formatted prompt string ready for LLM consumption.
+        Raises:
+            ValueError: If prompt_template is None.
+        """
         # Transform list/dict values to strings for template substitution
         formatted_context = {
             "transcript_summary": context.get("transcript_summary", ""),
@@ -171,13 +291,68 @@ class ClaudeLLMProvider(LLMProvider):
             },
         }
-        # Build prompt - prompt_template is required
+        # Validate prompt_template is provided
         if not prompt_template:
             raise ValueError(
                 "prompt_template is required for generate_summary. "
                 "Configure 'session_summary.prompt' in ~/.gobby/config.yaml"
             )
-        prompt = prompt_template.format(**formatted_context)
+        return prompt_template.format(**formatted_context)
+    async def _retry_async(
+        self,
+        operation: Any,
+        max_retries: int = 3,
+        delay: float = 1.0,
+        on_retry: Any | None = None,
+    ) -> Any:
+        """
+        Execute an async operation with retry logic.
+        Args:
+            operation: Callable that returns an awaitable (coroutine factory).
+            max_retries: Maximum number of attempts (default: 3).
+            delay: Delay in seconds between retries (default: 1.0).
+            on_retry: Optional callback(attempt: int, error: Exception) called on retry.
+        Returns:
+            Result of the operation if successful.
+        Raises:
+            Exception: The last exception if all retries fail.
+        """
+        for attempt in range(max_retries):
+            try:
+                return await operation()
+            except Exception as e:
+                if attempt < max_retries - 1:
+                    if on_retry:
+                        on_retry(attempt, e)
+                    await asyncio.sleep(delay)
+                else:
+                    raise
+    async def generate_summary(
+        self, context: dict[str, Any], prompt_template: str | None = None
+    ) -> str:
+        """
+        Generate session summary using Claude.
+        """
+        if self._auth_mode == "subscription":
+            return await self._generate_summary_sdk(context, prompt_template)
+        else:
+            return await self._generate_summary_litellm(context, prompt_template)
+    async def _generate_summary_sdk(
+        self, context: dict[str, Any], prompt_template: str | None = None
+    ) -> str:
+        """Generate session summary using Claude Agent SDK (subscription mode)."""
+        cli_path = self._verify_cli_path()
+        if not cli_path:
+            return "Session summary unavailable (Claude CLI not found)"
+        prompt = self._format_summary_context(context, prompt_template)
         # Configure Claude Agent SDK
         options = ClaudeAgentOptions(
@@ -205,8 +380,45 @@ class ClaudeLLMProvider(LLMProvider):
             self.logger.error(f"Failed to generate summary with Claude: {e}")
             return f"Session summary generation failed: {e}"
+    async def _generate_summary_litellm(
+        self, context: dict[str, Any], prompt_template: str | None = None
+    ) -> str:
+        """Generate session summary using LiteLLM (api_key mode)."""
+        if not self._litellm:
+            return "Session summary unavailable (LiteLLM not initialized)"
+        prompt = self._format_summary_context(context, prompt_template)
+        try:
+            response = await self._litellm.acompletion(
+                model=f"anthropic/{self.config.session_summary.model}",
+                messages=[
+                    {
+                        "role": "system",
+                        "content": "You are a session summary generator. Create comprehensive, actionable summaries.",
+                    },
+                    {"role": "user", "content": prompt},
+                ],
+                max_tokens=4000,
+            )
+            return response.choices[0].message.content or ""
+        except Exception as e:
+            self.logger.error(f"Failed to generate summary with LiteLLM: {e}")
+            return f"Session summary generation failed: {e}"
     async def synthesize_title(
         self, user_prompt: str, prompt_template: str | None = None
+    ) -> str | None:
+        """
+        Synthesize session title using Claude.
+        """
+        if self._auth_mode == "subscription":
+            return await self._synthesize_title_sdk(user_prompt, prompt_template)
+        else:
+            return await self._synthesize_title_litellm(user_prompt, prompt_template)
+    async def _synthesize_title_sdk(
+        self, user_prompt: str, prompt_template: str | None = None
     ) -> str | None:
         """
         Synthesize session title using Claude.
@@ -243,26 +455,63 @@ class ClaudeLLMProvider(LLMProvider):
                             title_text = block.text
             return title_text.strip()
+        def _on_retry(attempt: int, error: Exception) -> None:
+            self.logger.warning(
+                f"Title synthesis failed (attempt {attempt + 1}), retrying: {error}"
+            )
         try:
-            # Retry logic for title synthesis
-            max_retries = 3
-            for attempt in range(max_retries):
-                try:
-                    return await _run_query()
-                except Exception as e:
-                    if attempt < max_retries - 1:
-                        self.logger.warning(
-                            f"Title synthesis failed (attempt {attempt + 1}), retrying: {e}"
-                        )
-                        await asyncio.sleep(1)
-                    else:
-                        raise e
-            # This should be unreachable, but mypy can't prove it
-            return None  # pragma: no cover
+            result = await self._retry_async(
+                _run_query, max_retries=3, delay=1.0, on_retry=_on_retry
+            )
+            return cast(str, result)
         except Exception as e:
             self.logger.error(f"Failed to synthesize title with Claude: {e}")
             return None
+    async def _synthesize_title_litellm(
+        self, user_prompt: str, prompt_template: str | None = None
+    ) -> str | None:
+        """Synthesize session title using LiteLLM (api_key mode)."""
+        if not self._litellm:
+            return None
+        # Build prompt - prompt_template is required
+        if not prompt_template:
+            raise ValueError(
+                "prompt_template is required for synthesize_title. "
+                "Configure 'title_synthesis.prompt' in ~/.gobby/config.yaml"
+            )
+        prompt = prompt_template.format(user_prompt=user_prompt)
+        async def _run_query() -> str:
+            response = await self._litellm.acompletion(
+                model=f"anthropic/{self.config.title_synthesis.model}",
+                messages=[
+                    {
+                        "role": "system",
+                        "content": "You are a session title generator. Create concise, descriptive titles.",
+                    },
+                    {"role": "user", "content": prompt},
+                ],
+                max_tokens=100,
+            )
+            return (response.choices[0].message.content or "").strip()
+        def _on_retry(attempt: int, error: Exception) -> None:
+            self.logger.warning(
+                f"Title synthesis failed (attempt {attempt + 1}), retrying: {error}"
+            )
+        try:
+            result = await self._retry_async(
+                _run_query, max_retries=3, delay=1.0, on_retry=_on_retry
+            )
+            return cast(str, result)
+        except Exception as e:
+            self.logger.error(f"Failed to synthesize title with LiteLLM: {e}")
+            return None
     async def generate_text(
         self,
         prompt: str,
@@ -272,6 +521,18 @@ class ClaudeLLMProvider(LLMProvider):
         """
         Generate text using Claude.
         """
+        if self._auth_mode == "subscription":
+            return await self._generate_text_sdk(prompt, system_prompt, model)
+        else:
+            return await self._generate_text_litellm(prompt, system_prompt, model)
+    async def _generate_text_sdk(
+        self,
+        prompt: str,
+        system_prompt: str | None = None,
+        model: str | None = None,
+    ) -> str:
+        """Generate text using Claude Agent SDK (subscription mode)."""
         cli_path = self._verify_cli_path()
         if not cli_path:
             return "Generation unavailable (Claude CLI not found)"
@@ -323,6 +584,36 @@ class ClaudeLLMProvider(LLMProvider):
             self.logger.error(f"Failed to generate text with Claude: {e}", exc_info=True)
             return f"Generation failed: {e}"
+    async def _generate_text_litellm(
+        self,
+        prompt: str,
+        system_prompt: str | None = None,
+        model: str | None = None,
+    ) -> str:
+        """Generate text using LiteLLM (api_key mode)."""
+        if not self._litellm:
+            return "Generation unavailable (LiteLLM not initialized)"
+        model = model or "claude-haiku-4-5"
+        litellm_model = f"anthropic/{model}"
+        try:
+            response = await self._litellm.acompletion(
+                model=litellm_model,
+                messages=[
+                    {
+                        "role": "system",
+                        "content": system_prompt or "You are a helpful assistant.",
+                    },
+                    {"role": "user", "content": prompt},
+                ],
+                max_tokens=4000,
+            )
+            return response.choices[0].message.content or ""
+        except Exception as e:
+            self.logger.error(f"Failed to generate text with LiteLLM: {e}", exc_info=True)
+            return f"Generation failed: {e}"
     async def generate_with_mcp_tools(
         self,
         prompt: str,
@@ -338,6 +629,9 @@ class ClaudeLLMProvider(LLMProvider):
         This method enables the agent to call MCP tools during generation,
         tracking all tool calls made and returning them alongside the final text.
+        Note: This method requires subscription mode (Claude Agent SDK).
+        In api_key mode, returns an error message.
         Args:
             prompt: User prompt to process.
             allowed_tools: List of allowed MCP tool patterns.
@@ -364,6 +658,14 @@ class ClaudeLLMProvider(LLMProvider):
             >>> for call in result.tool_calls:
             ...     print(f"Called {call.tool_name} with {call.arguments}")
         """
+        # MCP tools require subscription mode (Claude Agent SDK)
+        if self._auth_mode == "api_key":
+            return MCPToolResult(
+                text="MCP tools require subscription mode. "
+                "Set auth_mode: subscription in llm_providers.claude config.",
+                tool_calls=[],
+            )
         cli_path = self._verify_cli_path()
         if not cli_path:
             return MCPToolResult(
@@ -421,7 +723,7 @@ class ClaudeLLMProvider(LLMProvider):
                 parts = full_tool_name.split("__")
                 if len(parts) >= 2:
                     return parts[1]
-            return "unknown"
+            return "builtin"
         # Run async query
         async def _run_query() -> str:
@@ -487,6 +789,160 @@ class ClaudeLLMProvider(LLMProvider):
                 tool_calls=tool_calls,
             )
+    async def stream_with_mcp_tools(
+        self,
+        prompt: str,
+        allowed_tools: list[str],
+        system_prompt: str | None = None,
+        model: str | None = None,
+        max_turns: int = 10,
+    ) -> AsyncIterator[ChatEvent]:
+        """
+        Stream generation with MCP tools, yielding events as they occur.
+        This method enables real-time streaming of text and tool call events
+        during multi-turn agent conversations. Unlike generate_with_mcp_tools(),
+        this yields events incrementally rather than waiting for completion.
+        Note: This method requires subscription mode (Claude Agent SDK).
+        Args:
+            prompt: User prompt to process.
+            allowed_tools: List of allowed MCP tool patterns.
+                Tools should be in format "mcp__{server}__{tool}" or patterns
+                like "mcp__gobby-tasks__*" for all tools from a server.
+            system_prompt: Optional system prompt.
+            model: Optional model override (default: claude-sonnet-4-5).
+            max_turns: Maximum number of agentic turns (default: 10).
+        Yields:
+            ChatEvent: One of TextChunk, ToolCallEvent, ToolResultEvent, or DoneEvent.
+        Example:
+            >>> async for event in provider.stream_with_mcp_tools(
+            ...     prompt="Create a task called 'Fix bug'",
+            ...     allowed_tools=["mcp__gobby-tasks__*"],
+            ... ):
+            ...     if isinstance(event, TextChunk):
+            ...         print(event.content, end="")
+            ...     elif isinstance(event, ToolCallEvent):
+            ...         print(f"Calling {event.tool_name}...")
+        """
+        # MCP tools require subscription mode (Claude Agent SDK)
+        if self._auth_mode == "api_key":
+            yield TextChunk(
+                content="MCP tools require subscription mode. "
+                "Set auth_mode: subscription in llm_providers.claude config."
+            )
+            yield DoneEvent(tool_calls_count=0)
+            return
+        cli_path = self._verify_cli_path()
+        if not cli_path:
+            yield TextChunk(content="Generation unavailable (Claude CLI not found)")
+            yield DoneEvent(tool_calls_count=0)
+            return
+        # Build mcp_servers config - use .mcp.json if gobby tools requested
+        from pathlib import Path
+        mcp_servers_config: dict[str, Any] | str | None = None
+        if any("gobby" in t for t in allowed_tools):
+            cwd_config = Path.cwd() / ".mcp.json"
+            if cwd_config.exists():
+                mcp_servers_config = str(cwd_config)
+            else:
+                gobby_root = Path(__file__).parent.parent.parent.parent
+                gobby_config = gobby_root / ".mcp.json"
+                if gobby_config.exists():
+                    mcp_servers_config = str(gobby_config)
+        # Configure Claude Agent SDK with MCP tools
+        options = ClaudeAgentOptions(
+            system_prompt=system_prompt
+            or "You are Gobby, a helpful assistant with access to tools.",
+            max_turns=max_turns,
+            model=model or "claude-sonnet-4-5",
+            allowed_tools=allowed_tools,
+            permission_mode="bypassPermissions",
+            cli_path=cli_path,
+            mcp_servers=mcp_servers_config if mcp_servers_config is not None else {},
+        )
+        def _parse_server_name(full_tool_name: str) -> str:
+            """Extract server name from mcp__{server}__{tool} format."""
+            if full_tool_name.startswith("mcp__"):
+                parts = full_tool_name.split("__")
+                if len(parts) >= 2:
+                    return parts[1]
+            return "builtin"
+        tool_calls_count = 0
+        pending_tool_calls: dict[str, str] = {}  # Map tool_use_id -> tool_name
+        needs_spacing_before_text = False  # Track if we need spacing before text
+        try:
+            async for message in query(prompt=prompt, options=options):
+                if isinstance(message, ResultMessage):
+                    # Final result - extract metadata
+                    cost_usd = getattr(message, "total_cost_usd", None)
+                    duration_ms = getattr(message, "duration_ms", None)
+                    yield DoneEvent(
+                        tool_calls_count=tool_calls_count,
+                        cost_usd=cost_usd,
+                        duration_ms=duration_ms,
+                    )
+                elif isinstance(message, AssistantMessage):
+                    for block in message.content:
+                        if isinstance(block, TextBlock):
+                            # Add spacing before text that follows tool calls/results
+                            # This ensures proper paragraph separation in the UI
+                            text = block.text
+                            if needs_spacing_before_text and text:
+                                # Ensure we have a proper paragraph break (double newline)
+                                # even if the text starts with a single newline
+                                text = text.lstrip("\n")
+                                if text:
+                                    text = "\n\n" + text
+                            yield TextChunk(content=text)
+                            needs_spacing_before_text = False
+                        elif isinstance(block, ToolUseBlock):
+                            tool_calls_count += 1
+                            server_name = _parse_server_name(block.name)
+                            pending_tool_calls[block.id] = block.name
+                            yield ToolCallEvent(
+                                tool_call_id=block.id,
+                                tool_name=block.name,
+                                server_name=server_name,
+                                arguments=block.input if isinstance(block.input, dict) else {},
+                            )
+                elif isinstance(message, UserMessage):
+                    # UserMessage may contain tool results
+                    if isinstance(message.content, list):
+                        for block in message.content:
+                            if isinstance(block, ToolResultBlock):
+                                # Determine success based on is_error attribute
+                                is_error = getattr(block, "is_error", False)
+                                yield ToolResultEvent(
+                                    tool_call_id=block.tool_use_id,
+                                    success=not is_error,
+                                    result=block.content if not is_error else None,
+                                    error=str(block.content) if is_error else None,
+                                )
+                                needs_spacing_before_text = True
+        except ExceptionGroup as eg:
+            errors = [f"{type(exc).__name__}: {exc}" for exc in eg.exceptions]
+            yield TextChunk(content=f"Generation failed: {'; '.join(errors)}")
+            yield DoneEvent(tool_calls_count=tool_calls_count)
+        except Exception as e:
+            self.logger.error(f"Failed to stream with MCP tools: {e}", exc_info=True)
+            yield TextChunk(content=f"Generation failed: {e}")
+            yield DoneEvent(tool_calls_count=tool_calls_count)
     async def describe_image(
         self,
         image_path: str,
@@ -495,7 +951,8 @@ class ClaudeLLMProvider(LLMProvider):
         """
         Generate a text description of an image using Claude's vision capabilities.
-        Uses LiteLLM for unified cost tracking with anthropic/claude-haiku-4-5 model.
+        In subscription mode, uses Claude Agent SDK.
+        In api_key mode, uses LiteLLM with anthropic/ prefix.
         Args:
             image_path: Path to the image file to describe
@@ -504,6 +961,21 @@ class ClaudeLLMProvider(LLMProvider):
         Returns:
             Text description of the image
         """
+        if self._auth_mode == "subscription":
+            return await self._describe_image_sdk(image_path, context)
+        else:
+            return await self._describe_image_litellm(image_path, context)
+    def _prepare_image_data(self, image_path: str) -> tuple[str, str] | str:
+        """
+        Validate and prepare image data for API calls.
+        Args:
+            image_path: Path to the image file.
+        Returns:
+            Tuple of (image_base64, mime_type) on success, or error string on failure.
+        """
         import base64
         import mimetypes
         from pathlib import Path
@@ -524,21 +996,103 @@ class ClaudeLLMProvider(LLMProvider):
         # Determine media type
         mime_type, _ = mimetypes.guess_type(str(path))
         if mime_type not in ["image/jpeg", "image/png", "image/gif", "image/webp"]:
-            # Default to png for unknown types
             mime_type = "image/png"
+        return (image_base64, mime_type)
+    async def _describe_image_sdk(
+        self,
+        image_path: str,
+        context: str | None = None,  # optional text placed ahead of the default description prompt
+    ) -> str:  # always a string: the description, or a human-readable failure message
+        """Describe image using Claude Agent SDK (subscription mode)."""
+        cli_path = self._verify_cli_path()
+        if not cli_path:
+            return "Image description unavailable (Claude CLI not found)"  # reported as text, not raised
+        # Prepare image data; per the helper's docstring it returns an error string instead of a tuple on failure
+        result = self._prepare_image_data(image_path)
+        if isinstance(result, str):
+            return result  # hand the helper's error message straight back to the caller
+        image_base64, mime_type = result
+        # Build prompt with image; caller-supplied context goes first, separated by a blank line
+        text_prompt = "Please describe this image in detail, focusing on the key visual elements and any text visible."
+        if context:
+            text_prompt = f"{context}\n\n{text_prompt}"
+        # Configure Claude Agent SDK: a single turn with empty tool lists
+        options = ClaudeAgentOptions(
+            system_prompt="You are a vision assistant that describes images in detail.",
+            max_turns=1,
+            model="claude-haiku-4-5",  # the LiteLLM path uses the same model name behind an anthropic/ prefix
+            tools=[],
+            allowed_tools=[],
+            permission_mode="default",
+            cli_path=cli_path,
+        )
+        # Build async generator yielding structured message with image content
+        # The SDK accepts AsyncIterable[dict] for multimodal input. NOTE(review): the SDK's streaming-input examples wrap messages as {"type": "user", "message": {...}} — confirm this bare role/content dict is accepted
+        async def _message_generator() -> Any:
+            yield {  # exactly one user message: the text prompt followed by the base64 image
+                "role": "user",
+                "content": [
+                    {"type": "text", "text": text_prompt},
+                    {
+                        "type": "image",
+                        "source": {
+                            "type": "base64",
+                            "media_type": mime_type,
+                            "data": image_base64,
+                        },
+                    },
+                ],
+            }
+        async def _run_query() -> str:
+            result_text = ""
+            async for message in query(prompt=_message_generator(), options=options):
+                if isinstance(message, AssistantMessage):
+                    for block in message.content:
+                        if isinstance(block, TextBlock):
+                            result_text += block.text  # accumulate text across assistant text blocks
+                elif isinstance(message, ResultMessage):
+                    if message.result:
+                        result_text = message.result  # a non-empty final result replaces the accumulated text
+            return result_text  # stays "" if no text block or result arrived
+        try:
+            return await _run_query()
+        except Exception as e:  # any failure is logged and returned as text rather than raised
+            self.logger.error(f"Failed to describe image with Claude SDK: {e}")
+            return f"Image description failed: {e}"
+    async def _describe_image_litellm(
+        self,
+        image_path: str,
+        context: str | None = None,
+    ) -> str:
+        """Describe image using LiteLLM (api_key mode)."""
+        if not self._litellm:
+            return "Image description unavailable (LiteLLM not initialized)"
+        # Prepare image data
+        result = self._prepare_image_data(image_path)
+        if isinstance(result, str):
+            return result
+        image_base64, mime_type = result
         # Build prompt
         prompt = "Please describe this image in detail, focusing on the key visual elements and any text visible."
         if context:
             prompt = f"{context}\n\n{prompt}"
-        # Use LiteLLM for unified cost tracking
         try:
-            import litellm
-            # Route through LiteLLM with anthropic prefix for cost tracking
-            response = await litellm.acompletion(
-                model="anthropic/claude-haiku-4-5-20251001",  # Use haiku for cost efficiency
+            # Route through LiteLLM with anthropic prefix
+            # Use same model as SDK path for consistency
+            response = await self._litellm.acompletion(
+                model="anthropic/claude-haiku-4-5",
                 messages=[
                     {
                         "role": "user",
@@ -558,9 +1112,6 @@ class ClaudeLLMProvider(LLMProvider):
                 return "No description generated"
             return response.choices[0].message.content or "No description generated"
-        except ImportError:
-            self.logger.error("LiteLLM not installed, falling back to unavailable")
-            return "Image description unavailable (LiteLLM not installed)"
         except Exception as e:
-            self.logger.error(f"Failed to describe image with Claude via LiteLLM: {e}")
+            self.logger.error(f"Failed to describe image with LiteLLM: {e}")
             return f"Image description failed: {e}"

gobby 0.2.8__py3-none-any.whl → 0.2.11__py3-none-any.whl

gobby 0.2.8__py3-none-any.whl → 0.2.11__py3-none-any.whl