PyPI - gobby - Versions diffs - 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl - Mend

gobby 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (148) hide show

gobby/adapters/claude_code.py +13 -4
gobby/adapters/codex.py +43 -3
gobby/agents/runner.py +8 -0
gobby/cli/__init__.py +6 -0
gobby/cli/clones.py +419 -0
gobby/cli/conductor.py +266 -0
gobby/cli/installers/antigravity.py +3 -9
gobby/cli/installers/claude.py +9 -9
gobby/cli/installers/codex.py +2 -8
gobby/cli/installers/gemini.py +2 -8
gobby/cli/installers/shared.py +71 -8
gobby/cli/skills.py +858 -0
gobby/cli/tasks/ai.py +0 -440
gobby/cli/tasks/crud.py +44 -6
gobby/cli/tasks/main.py +0 -4
gobby/cli/tui.py +2 -2
gobby/cli/utils.py +3 -3
gobby/clones/__init__.py +13 -0
gobby/clones/git.py +547 -0
gobby/conductor/__init__.py +16 -0
gobby/conductor/alerts.py +135 -0
gobby/conductor/loop.py +164 -0
gobby/conductor/monitors/__init__.py +11 -0
gobby/conductor/monitors/agents.py +116 -0
gobby/conductor/monitors/tasks.py +155 -0
gobby/conductor/pricing.py +234 -0
gobby/conductor/token_tracker.py +160 -0
gobby/config/app.py +63 -1
gobby/config/search.py +110 -0
gobby/config/servers.py +1 -1
gobby/config/skills.py +43 -0
gobby/config/tasks.py +6 -14
gobby/hooks/event_handlers.py +145 -2
gobby/hooks/hook_manager.py +48 -2
gobby/hooks/skill_manager.py +130 -0
gobby/install/claude/hooks/hook_dispatcher.py +4 -4
gobby/install/codex/hooks/hook_dispatcher.py +1 -1
gobby/install/gemini/hooks/hook_dispatcher.py +87 -12
gobby/llm/claude.py +22 -34
gobby/llm/claude_executor.py +46 -256
gobby/llm/codex_executor.py +59 -291
gobby/llm/executor.py +21 -0
gobby/llm/gemini.py +134 -110
gobby/llm/litellm_executor.py +143 -6
gobby/llm/resolver.py +95 -33
gobby/mcp_proxy/instructions.py +54 -0
gobby/mcp_proxy/models.py +15 -0
gobby/mcp_proxy/registries.py +68 -5
gobby/mcp_proxy/server.py +33 -3
gobby/mcp_proxy/services/tool_proxy.py +81 -1
gobby/mcp_proxy/stdio.py +2 -1
gobby/mcp_proxy/tools/__init__.py +0 -2
gobby/mcp_proxy/tools/agent_messaging.py +317 -0
gobby/mcp_proxy/tools/clones.py +903 -0
gobby/mcp_proxy/tools/memory.py +1 -24
gobby/mcp_proxy/tools/metrics.py +65 -1
gobby/mcp_proxy/tools/orchestration/__init__.py +3 -0
gobby/mcp_proxy/tools/orchestration/cleanup.py +151 -0
gobby/mcp_proxy/tools/orchestration/wait.py +467 -0
gobby/mcp_proxy/tools/session_messages.py +1 -2
gobby/mcp_proxy/tools/skills/__init__.py +631 -0
gobby/mcp_proxy/tools/task_orchestration.py +7 -0
gobby/mcp_proxy/tools/task_readiness.py +14 -0
gobby/mcp_proxy/tools/task_sync.py +1 -1
gobby/mcp_proxy/tools/tasks/_context.py +0 -20
gobby/mcp_proxy/tools/tasks/_crud.py +91 -4
gobby/mcp_proxy/tools/tasks/_expansion.py +348 -0
gobby/mcp_proxy/tools/tasks/_factory.py +6 -16
gobby/mcp_proxy/tools/tasks/_lifecycle.py +60 -29
gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +18 -29
gobby/mcp_proxy/tools/workflows.py +1 -1
gobby/mcp_proxy/tools/worktrees.py +5 -0
gobby/memory/backends/__init__.py +6 -1
gobby/memory/backends/mem0.py +6 -1
gobby/memory/extractor.py +477 -0
gobby/memory/manager.py +11 -2
gobby/prompts/defaults/handoff/compact.md +63 -0
gobby/prompts/defaults/handoff/session_end.md +57 -0
gobby/prompts/defaults/memory/extract.md +61 -0
gobby/runner.py +37 -16
gobby/search/__init__.py +48 -6
gobby/search/backends/__init__.py +159 -0
gobby/search/backends/embedding.py +225 -0
gobby/search/embeddings.py +238 -0
gobby/search/models.py +148 -0
gobby/search/unified.py +496 -0
gobby/servers/http.py +23 -8
gobby/servers/routes/admin.py +280 -0
gobby/servers/routes/mcp/tools.py +241 -52
gobby/servers/websocket.py +2 -2
gobby/sessions/analyzer.py +2 -0
gobby/sessions/transcripts/base.py +1 -0
gobby/sessions/transcripts/claude.py +64 -5
gobby/skills/__init__.py +91 -0
gobby/skills/loader.py +685 -0
gobby/skills/manager.py +384 -0
gobby/skills/parser.py +258 -0
gobby/skills/search.py +463 -0
gobby/skills/sync.py +119 -0
gobby/skills/updater.py +385 -0
gobby/skills/validator.py +368 -0
gobby/storage/clones.py +378 -0
gobby/storage/database.py +1 -1
gobby/storage/memories.py +43 -13
gobby/storage/migrations.py +180 -6
gobby/storage/sessions.py +73 -0
gobby/storage/skills.py +749 -0
gobby/storage/tasks/_crud.py +4 -4
gobby/storage/tasks/_lifecycle.py +41 -6
gobby/storage/tasks/_manager.py +14 -5
gobby/storage/tasks/_models.py +8 -3
gobby/sync/memories.py +39 -4
gobby/sync/tasks.py +83 -6
gobby/tasks/__init__.py +1 -2
gobby/tasks/validation.py +24 -15
gobby/tui/api_client.py +4 -7
gobby/tui/app.py +5 -3
gobby/tui/screens/orchestrator.py +1 -2
gobby/tui/screens/tasks.py +2 -4
gobby/tui/ws_client.py +1 -1
gobby/utils/daemon_client.py +2 -2
gobby/workflows/actions.py +84 -2
gobby/workflows/context_actions.py +43 -0
gobby/workflows/detection_helpers.py +115 -31
gobby/workflows/engine.py +13 -2
gobby/workflows/lifecycle_evaluator.py +29 -1
gobby/workflows/loader.py +19 -6
gobby/workflows/memory_actions.py +74 -0
gobby/workflows/summary_actions.py +17 -0
gobby/workflows/task_enforcement_actions.py +448 -6
{gobby-0.2.5.dist-info → gobby-0.2.6.dist-info}/METADATA +82 -21
{gobby-0.2.5.dist-info → gobby-0.2.6.dist-info}/RECORD +136 -107
gobby/install/codex/prompts/forget.md +0 -7
gobby/install/codex/prompts/memories.md +0 -7
gobby/install/codex/prompts/recall.md +0 -7
gobby/install/codex/prompts/remember.md +0 -13
gobby/llm/gemini_executor.py +0 -339
gobby/mcp_proxy/tools/task_expansion.py +0 -591
gobby/tasks/context.py +0 -747
gobby/tasks/criteria.py +0 -342
gobby/tasks/expansion.py +0 -626
gobby/tasks/prompts/expand.py +0 -327
gobby/tasks/research.py +0 -421
gobby/tasks/tdd.py +0 -352
{gobby-0.2.5.dist-info → gobby-0.2.6.dist-info}/WHEEL +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.6.dist-info}/entry_points.txt +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.6.dist-info}/licenses/LICENSE.md +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.6.dist-info}/top_level.txt +0 -0

gobby/llm/claude.py CHANGED Viewed

@@ -495,7 +495,7 @@ class ClaudeLLMProvider(LLMProvider):
         """
         Generate a text description of an image using Claude's vision capabilities.
-        Uses the Anthropic API directly for vision support.
+        Uses LiteLLM for unified cost tracking with anthropic/claude-haiku-4-5 model.
         Args:
             image_path: Path to the image file to describe
@@ -508,8 +508,6 @@ class ClaudeLLMProvider(LLMProvider):
         import mimetypes
         from pathlib import Path
-        import anthropic
         # Validate image exists
         path = Path(image_path)
         if not path.exists():
@@ -534,45 +532,35 @@ class ClaudeLLMProvider(LLMProvider):
         if context:
             prompt = f"{context}\n\n{prompt}"
-        # Use Anthropic API for vision
-        api_key = os.environ.get("ANTHROPIC_API_KEY")
-        if not api_key:
-            return "Image description unavailable (ANTHROPIC_API_KEY not set)"
+        # Use LiteLLM for unified cost tracking
         try:
-            client = anthropic.AsyncAnthropic(api_key=api_key)
-            # Type annotation to satisfy mypy
-            image_block: anthropic.types.ImageBlockParam = {
-                "type": "image",
-                "source": {
-                    "type": "base64",
-                    "media_type": mime_type,  # type: ignore[typeddict-item]
-                    "data": image_base64,
-                },
-            }
-            text_block: anthropic.types.TextBlockParam = {
-                "type": "text",
-                "text": prompt,
-            }
-            message = await client.messages.create(
-                model="claude-haiku-4-5-latest",  # Use haiku for cost efficiency
-                max_tokens=1024,
+            import litellm
+            # Route through LiteLLM with anthropic prefix for cost tracking
+            response = await litellm.acompletion(
+                model="anthropic/claude-haiku-4-5-20251001",  # Use haiku for cost efficiency
                 messages=[
                     {
                         "role": "user",
-                        "content": [image_block, text_block],
+                        "content": [
+                            {"type": "text", "text": prompt},
+                            {
+                                "type": "image_url",
+                                "image_url": {"url": f"data:{mime_type};base64,{image_base64}"},
+                            },
+                        ],
                     }
                 ],
+                max_tokens=1024,
             )
-            # Extract text from response
-            result = ""
-            for block in message.content:
-                if hasattr(block, "text"):
-                    result += block.text
-            return result if result else "No description generated"
+            if not response or not getattr(response, "choices", None):
+                return "No description generated"
+            return response.choices[0].message.content or "No description generated"
+        except ImportError:
+            self.logger.error("LiteLLM not installed, falling back to unavailable")
+            return "Image description unavailable (LiteLLM not installed)"
         except Exception as e:
-            self.logger.error(f"Failed to describe image with Claude: {e}")
+            self.logger.error(f"Failed to describe image with Claude via LiteLLM: {e}")
             return f"Image description failed: {e}"

gobby/llm/claude_executor.py CHANGED Viewed

@@ -1,22 +1,20 @@
 """
-Claude implementation of AgentExecutor.
+Claude implementation of AgentExecutor for subscription mode only.
-Supports multiple auth modes:
-- api_key: Direct Anthropic API with API key
-- subscription: Claude Agent SDK with CLI (Pro/Team subscriptions)
+This executor uses the Claude Agent SDK with CLI for Pro/Team subscriptions.
+Note: api_key mode is now routed through LiteLLMExecutor for unified cost tracking.
+Use the resolver.create_executor() function which handles routing automatically.
 """
 import asyncio
 import concurrent.futures
 import json
 import logging
-import os
 import shutil
 from collections.abc import Callable
 from typing import Any, Literal
-import anthropic
 from gobby.llm.executor import (
     AgentExecutor,
     AgentResult,
@@ -28,26 +26,28 @@ from gobby.llm.executor import (
 logger = logging.getLogger(__name__)
-# Auth mode type
-ClaudeAuthMode = Literal["api_key", "subscription"]
+# Auth mode type - subscription only, api_key routes through LiteLLM
+ClaudeAuthMode = Literal["subscription"]
 class ClaudeExecutor(AgentExecutor):
     """
-    Claude implementation of AgentExecutor.
+    Claude implementation of AgentExecutor for subscription mode only.
+    Uses Claude Agent SDK with CLI for Pro/Team subscriptions. This executor
+    is for subscription-based authentication only.
-    Supports two authentication modes:
-    - api_key: Uses the Anthropic API directly with an API key
-    - subscription: Uses Claude Agent SDK with CLI for Pro/Team subscriptions
+    For api_key mode, use LiteLLMExecutor with provider="claude" which routes
+    through anthropic/model-name for unified cost tracking.
     The executor implements a proper agentic loop:
-    1. Send prompt to Claude with tool schemas
+    1. Send prompt to Claude with tool schemas via SDK
     2. When Claude requests a tool, call tool_handler
     3. Send tool result back to Claude
     4. Repeat until Claude stops requesting tools or limits are reached
     Example:
-        >>> executor = ClaudeExecutor(auth_mode="api_key", api_key="sk-ant-...")
+        >>> executor = ClaudeExecutor(auth_mode="subscription")
         >>> result = await executor.run(
         ...     prompt="Create a task",
         ...     tools=[ToolSchema(name="create_task", ...)],
@@ -55,71 +55,47 @@ class ClaudeExecutor(AgentExecutor):
         ... )
     """
-    _client: anthropic.AsyncAnthropic | None
     _cli_path: str
     def __init__(
         self,
-        auth_mode: ClaudeAuthMode = "api_key",
-        api_key: str | None = None,
+        auth_mode: ClaudeAuthMode = "subscription",
         default_model: str = "claude-sonnet-4-20250514",
     ):
         """
-        Initialize ClaudeExecutor.
+        Initialize ClaudeExecutor for subscription mode.
         Args:
-            auth_mode: Authentication mode ("api_key" or "subscription").
-            api_key: Anthropic API key (required for api_key mode).
+            auth_mode: Must be "subscription". API key mode is handled by LiteLLMExecutor.
             default_model: Default model to use if not specified in run().
+        Raises:
+            ValueError: If auth_mode is not "subscription" or Claude CLI not found.
         """
+        if auth_mode != "subscription":
+            raise ValueError(
+                "ClaudeExecutor only supports subscription mode. "
+                "For api_key mode, use LiteLLMExecutor with provider='claude'."
+            )
         self.auth_mode = auth_mode
         self.default_model = default_model
         self.logger = logger
-        self._client = None
         self._cli_path = ""
-        if auth_mode == "api_key":
-            # Use provided key or fall back to environment variable
-            key = api_key or os.environ.get("ANTHROPIC_API_KEY")
-            if not key:
-                raise ValueError(
-                    "API key required for api_key mode. "
-                    "Provide api_key parameter or set ANTHROPIC_API_KEY env var."
-                )
-            self._client = anthropic.AsyncAnthropic(api_key=key)
-        elif auth_mode == "subscription":
-            # Verify Claude CLI is available for subscription mode
-            cli_path = shutil.which("claude")
-            if not cli_path:
-                raise ValueError(
-                    "Claude CLI not found in PATH. Install Claude Code for subscription mode."
-                )
-            self._cli_path = cli_path
-        else:
-            raise ValueError(f"Unknown auth_mode: {auth_mode}")
+        # Verify Claude CLI is available for subscription mode
+        cli_path = shutil.which("claude")
+        if not cli_path:
+            raise ValueError(
+                "Claude CLI not found in PATH. Install Claude Code for subscription mode."
+            )
+        self._cli_path = cli_path
     @property
     def provider_name(self) -> str:
         """Return the provider name."""
         return "claude"
-    def _convert_tools_to_anthropic_format(
-        self, tools: list[ToolSchema]
-    ) -> list[anthropic.types.ToolParam]:
-        """Convert ToolSchema list to Anthropic API format."""
-        anthropic_tools: list[anthropic.types.ToolParam] = []
-        for tool in tools:
-            # input_schema must have "type": "object" at minimum
-            input_schema: dict[str, Any] = {"type": "object", **tool.input_schema}
-            anthropic_tools.append(
-                {
-                    "name": tool.name,
-                    "description": tool.description,
-                    "input_schema": input_schema,
-                }
-            )
-        return anthropic_tools
     async def run(
         self,
         prompt: str,
@@ -131,10 +107,10 @@ class ClaudeExecutor(AgentExecutor):
         timeout: float = 120.0,
     ) -> AgentResult:
         """
-        Execute an agentic loop with tool calling.
+        Execute an agentic loop with tool calling via Claude Agent SDK.
-        Runs Claude with the given prompt, calling tools via tool_handler
-        until completion, max_turns, or timeout.
+        Runs Claude with the given prompt using subscription-based authentication,
+        calling tools via tool_handler until completion, max_turns, or timeout.
         Args:
             prompt: The user prompt to process.
@@ -148,201 +124,15 @@ class ClaudeExecutor(AgentExecutor):
         Returns:
             AgentResult with output, status, and tool call records.
         """
-        if self.auth_mode == "api_key":
-            return await self._run_with_api(
-                prompt=prompt,
-                tools=tools,
-                tool_handler=tool_handler,
-                system_prompt=system_prompt,
-                model=model or self.default_model,
-                max_turns=max_turns,
-                timeout=timeout,
-            )
-        else:
-            return await self._run_with_sdk(
-                prompt=prompt,
-                tools=tools,
-                tool_handler=tool_handler,
-                system_prompt=system_prompt,
-                model=model or self.default_model,
-                max_turns=max_turns,
-                timeout=timeout,
-            )
-    async def _run_with_api(
-        self,
-        prompt: str,
-        tools: list[ToolSchema],
-        tool_handler: ToolHandler,
-        system_prompt: str | None,
-        model: str,
-        max_turns: int,
-        timeout: float,
-    ) -> AgentResult:
-        """Run using direct Anthropic API."""
-        if self._client is None:
-            return AgentResult(
-                output="",
-                status="error",
-                error="Anthropic client not initialized",
-                turns_used=0,
-            )
-        tool_calls: list[ToolCallRecord] = []
-        anthropic_tools = self._convert_tools_to_anthropic_format(tools)
-        # Build initial messages
-        messages: list[anthropic.types.MessageParam] = [{"role": "user", "content": prompt}]
-        # Track turns in outer scope so timeout handler can access the count
-        turns_counter = [0]
-        async def _run_loop() -> AgentResult:
-            nonlocal messages
-            turns_used = 0
-            final_output = ""
-            client = self._client
-            if client is None:
-                raise RuntimeError("ClaudeExecutor client not initialized")
-            while turns_used < max_turns:
-                turns_used += 1
-                turns_counter[0] = turns_used
-                # Call Claude
-                try:
-                    response = await client.messages.create(
-                        model=model,
-                        max_tokens=8192,
-                        system=system_prompt or "You are a helpful assistant.",
-                        messages=messages,
-                        tools=anthropic_tools if anthropic_tools else [],
-                    )
-                except anthropic.APIError as e:
-                    return AgentResult(
-                        output="",
-                        status="error",
-                        tool_calls=tool_calls,
-                        error=f"Anthropic API error: {e}",
-                        turns_used=turns_used,
-                    )
-                # Process response
-                assistant_content: list[anthropic.types.ContentBlockParam] = []
-                tool_use_blocks: list[dict[str, Any]] = []
-                for block in response.content:
-                    if block.type == "text":
-                        final_output = block.text
-                        assistant_content.append({"type": "text", "text": block.text})
-                    elif block.type == "tool_use":
-                        tool_use_blocks.append(
-                            {
-                                "id": block.id,
-                                "name": block.name,
-                                "input": block.input,
-                            }
-                        )
-                        assistant_content.append(
-                            {
-                                "type": "tool_use",
-                                "id": block.id,
-                                "name": block.name,
-                                "input": dict(block.input) if block.input else {},
-                            }
-                        )
-                # Add assistant message to history
-                messages.append({"role": "assistant", "content": assistant_content})
-                # If no tool use, we're done
-                if not tool_use_blocks:
-                    return AgentResult(
-                        output=final_output,
-                        status="success",
-                        tool_calls=tool_calls,
-                        turns_used=turns_used,
-                    )
-                # Handle tool calls
-                tool_results: list[anthropic.types.ToolResultBlockParam] = []
-                for tool_use in tool_use_blocks:
-                    tool_name = tool_use["name"]
-                    arguments = tool_use["input"] if isinstance(tool_use["input"], dict) else {}
-                    # Record the tool call
-                    record = ToolCallRecord(
-                        tool_name=tool_name,
-                        arguments=arguments,
-                    )
-                    tool_calls.append(record)
-                    # Execute via handler
-                    try:
-                        result = await tool_handler(tool_name, arguments)
-                        record.result = result
-                        # Format result for Claude
-                        if result.success:
-                            content = json.dumps(result.result) if result.result else "Success"
-                        else:
-                            content = f"Error: {result.error}"
-                        tool_results.append(
-                            {
-                                "type": "tool_result",
-                                "tool_use_id": tool_use["id"],
-                                "content": content,
-                            }
-                        )
-                    except Exception as e:
-                        self.logger.error(f"Tool handler error for {tool_name}: {e}")
-                        record.result = ToolResult(
-                            tool_name=tool_name,
-                            success=False,
-                            error=str(e),
-                        )
-                        tool_results.append(
-                            {
-                                "type": "tool_result",
-                                "tool_use_id": tool_use["id"],
-                                "content": f"Error: {e}",
-                                "is_error": True,
-                            }
-                        )
-                # Add tool results to messages
-                messages.append({"role": "user", "content": tool_results})
-                # Check stop reason
-                if response.stop_reason == "end_turn":
-                    return AgentResult(
-                        output=final_output,
-                        status="success",
-                        tool_calls=tool_calls,
-                        turns_used=turns_used,
-                    )
-            # Max turns reached
-            return AgentResult(
-                output=final_output,
-                status="partial",
-                tool_calls=tool_calls,
-                turns_used=turns_used,
-            )
-        # Run with timeout
-        try:
-            return await asyncio.wait_for(_run_loop(), timeout=timeout)
-        except TimeoutError:
-            return AgentResult(
-                output="",
-                status="timeout",
-                tool_calls=tool_calls,
-                error=f"Execution timed out after {timeout}s",
-                turns_used=turns_counter[0],
-            )
+        return await self._run_with_sdk(
+            prompt=prompt,
+            tools=tools,
+            tool_handler=tool_handler,
+            system_prompt=system_prompt,
+            model=model or self.default_model,
+            max_turns=max_turns,
+            timeout=timeout,
+        )
     async def _run_with_sdk(
         self,

gobby 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl

gobby 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl