PyPI - gobby - Versions diffs - 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl - Mend

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (244) hide show

gobby/__init__.py +1 -1
gobby/adapters/__init__.py +2 -1
gobby/adapters/claude_code.py +13 -4
gobby/adapters/codex_impl/__init__.py +28 -0
gobby/adapters/codex_impl/adapter.py +722 -0
gobby/adapters/codex_impl/client.py +679 -0
gobby/adapters/codex_impl/protocol.py +20 -0
gobby/adapters/codex_impl/types.py +68 -0
gobby/agents/definitions.py +11 -1
gobby/agents/isolation.py +395 -0
gobby/agents/runner.py +8 -0
gobby/agents/sandbox.py +261 -0
gobby/agents/spawn.py +42 -287
gobby/agents/spawn_executor.py +385 -0
gobby/agents/spawners/__init__.py +24 -0
gobby/agents/spawners/command_builder.py +189 -0
gobby/agents/spawners/embedded.py +21 -2
gobby/agents/spawners/headless.py +21 -2
gobby/agents/spawners/prompt_manager.py +125 -0
gobby/cli/__init__.py +6 -0
gobby/cli/clones.py +419 -0
gobby/cli/conductor.py +266 -0
gobby/cli/install.py +4 -4
gobby/cli/installers/antigravity.py +3 -9
gobby/cli/installers/claude.py +15 -9
gobby/cli/installers/codex.py +2 -8
gobby/cli/installers/gemini.py +8 -8
gobby/cli/installers/shared.py +175 -13
gobby/cli/sessions.py +1 -1
gobby/cli/skills.py +858 -0
gobby/cli/tasks/ai.py +0 -440
gobby/cli/tasks/crud.py +44 -6
gobby/cli/tasks/main.py +0 -4
gobby/cli/tui.py +2 -2
gobby/cli/utils.py +12 -5
gobby/clones/__init__.py +13 -0
gobby/clones/git.py +547 -0
gobby/conductor/__init__.py +16 -0
gobby/conductor/alerts.py +135 -0
gobby/conductor/loop.py +164 -0
gobby/conductor/monitors/__init__.py +11 -0
gobby/conductor/monitors/agents.py +116 -0
gobby/conductor/monitors/tasks.py +155 -0
gobby/conductor/pricing.py +234 -0
gobby/conductor/token_tracker.py +160 -0
gobby/config/__init__.py +12 -97
gobby/config/app.py +69 -91
gobby/config/extensions.py +2 -2
gobby/config/features.py +7 -130
gobby/config/search.py +110 -0
gobby/config/servers.py +1 -1
gobby/config/skills.py +43 -0
gobby/config/tasks.py +9 -41
gobby/hooks/__init__.py +0 -13
gobby/hooks/event_handlers.py +188 -2
gobby/hooks/hook_manager.py +50 -4
gobby/hooks/plugins.py +1 -1
gobby/hooks/skill_manager.py +130 -0
gobby/hooks/webhooks.py +1 -1
gobby/install/claude/hooks/hook_dispatcher.py +4 -4
gobby/install/codex/hooks/hook_dispatcher.py +1 -1
gobby/install/gemini/hooks/hook_dispatcher.py +87 -12
gobby/llm/claude.py +22 -34
gobby/llm/claude_executor.py +46 -256
gobby/llm/codex_executor.py +59 -291
gobby/llm/executor.py +21 -0
gobby/llm/gemini.py +134 -110
gobby/llm/litellm_executor.py +143 -6
gobby/llm/resolver.py +98 -35
gobby/mcp_proxy/importer.py +62 -4
gobby/mcp_proxy/instructions.py +56 -0
gobby/mcp_proxy/models.py +15 -0
gobby/mcp_proxy/registries.py +68 -8
gobby/mcp_proxy/server.py +33 -3
gobby/mcp_proxy/services/recommendation.py +43 -11
gobby/mcp_proxy/services/tool_proxy.py +81 -1
gobby/mcp_proxy/stdio.py +2 -1
gobby/mcp_proxy/tools/__init__.py +0 -2
gobby/mcp_proxy/tools/agent_messaging.py +317 -0
gobby/mcp_proxy/tools/agents.py +31 -731
gobby/mcp_proxy/tools/clones.py +518 -0
gobby/mcp_proxy/tools/memory.py +3 -26
gobby/mcp_proxy/tools/metrics.py +65 -1
gobby/mcp_proxy/tools/orchestration/__init__.py +3 -0
gobby/mcp_proxy/tools/orchestration/cleanup.py +151 -0
gobby/mcp_proxy/tools/orchestration/wait.py +467 -0
gobby/mcp_proxy/tools/sessions/__init__.py +14 -0
gobby/mcp_proxy/tools/sessions/_commits.py +232 -0
gobby/mcp_proxy/tools/sessions/_crud.py +253 -0
gobby/mcp_proxy/tools/sessions/_factory.py +63 -0
gobby/mcp_proxy/tools/sessions/_handoff.py +499 -0
gobby/mcp_proxy/tools/sessions/_messages.py +138 -0
gobby/mcp_proxy/tools/skills/__init__.py +616 -0
gobby/mcp_proxy/tools/spawn_agent.py +417 -0
gobby/mcp_proxy/tools/task_orchestration.py +7 -0
gobby/mcp_proxy/tools/task_readiness.py +14 -0
gobby/mcp_proxy/tools/task_sync.py +1 -1
gobby/mcp_proxy/tools/tasks/_context.py +0 -20
gobby/mcp_proxy/tools/tasks/_crud.py +91 -4
gobby/mcp_proxy/tools/tasks/_expansion.py +348 -0
gobby/mcp_proxy/tools/tasks/_factory.py +6 -16
gobby/mcp_proxy/tools/tasks/_lifecycle.py +110 -45
gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +18 -29
gobby/mcp_proxy/tools/workflows.py +1 -1
gobby/mcp_proxy/tools/worktrees.py +0 -338
gobby/memory/backends/__init__.py +6 -1
gobby/memory/backends/mem0.py +6 -1
gobby/memory/extractor.py +477 -0
gobby/memory/ingestion/__init__.py +5 -0
gobby/memory/ingestion/multimodal.py +221 -0
gobby/memory/manager.py +73 -285
gobby/memory/search/__init__.py +10 -0
gobby/memory/search/coordinator.py +248 -0
gobby/memory/services/__init__.py +5 -0
gobby/memory/services/crossref.py +142 -0
gobby/prompts/loader.py +5 -2
gobby/runner.py +37 -16
gobby/search/__init__.py +48 -6
gobby/search/backends/__init__.py +159 -0
gobby/search/backends/embedding.py +225 -0
gobby/search/embeddings.py +238 -0
gobby/search/models.py +148 -0
gobby/search/unified.py +496 -0
gobby/servers/http.py +24 -12
gobby/servers/routes/admin.py +294 -0
gobby/servers/routes/mcp/endpoints/__init__.py +61 -0
gobby/servers/routes/mcp/endpoints/discovery.py +405 -0
gobby/servers/routes/mcp/endpoints/execution.py +568 -0
gobby/servers/routes/mcp/endpoints/registry.py +378 -0
gobby/servers/routes/mcp/endpoints/server.py +304 -0
gobby/servers/routes/mcp/hooks.py +1 -1
gobby/servers/routes/mcp/tools.py +48 -1317
gobby/servers/websocket.py +2 -2
gobby/sessions/analyzer.py +2 -0
gobby/sessions/lifecycle.py +1 -1
gobby/sessions/processor.py +10 -0
gobby/sessions/transcripts/base.py +2 -0
gobby/sessions/transcripts/claude.py +79 -10
gobby/skills/__init__.py +91 -0
gobby/skills/loader.py +685 -0
gobby/skills/manager.py +384 -0
gobby/skills/parser.py +286 -0
gobby/skills/search.py +463 -0
gobby/skills/sync.py +119 -0
gobby/skills/updater.py +385 -0
gobby/skills/validator.py +368 -0
gobby/storage/clones.py +378 -0
gobby/storage/database.py +1 -1
gobby/storage/memories.py +43 -13
gobby/storage/migrations.py +162 -201
gobby/storage/sessions.py +116 -7
gobby/storage/skills.py +782 -0
gobby/storage/tasks/_crud.py +4 -4
gobby/storage/tasks/_lifecycle.py +57 -7
gobby/storage/tasks/_manager.py +14 -5
gobby/storage/tasks/_models.py +8 -3
gobby/sync/memories.py +40 -5
gobby/sync/tasks.py +83 -6
gobby/tasks/__init__.py +1 -2
gobby/tasks/external_validator.py +1 -1
gobby/tasks/validation.py +46 -35
gobby/tools/summarizer.py +91 -10
gobby/tui/api_client.py +4 -7
gobby/tui/app.py +5 -3
gobby/tui/screens/orchestrator.py +1 -2
gobby/tui/screens/tasks.py +2 -4
gobby/tui/ws_client.py +1 -1
gobby/utils/daemon_client.py +2 -2
gobby/utils/project_context.py +2 -3
gobby/utils/status.py +13 -0
gobby/workflows/actions.py +221 -1135
gobby/workflows/artifact_actions.py +31 -0
gobby/workflows/autonomous_actions.py +11 -0
gobby/workflows/context_actions.py +93 -1
gobby/workflows/detection_helpers.py +115 -31
gobby/workflows/enforcement/__init__.py +47 -0
gobby/workflows/enforcement/blocking.py +269 -0
gobby/workflows/enforcement/commit_policy.py +283 -0
gobby/workflows/enforcement/handlers.py +269 -0
gobby/workflows/{task_enforcement_actions.py → enforcement/task_policy.py} +29 -388
gobby/workflows/engine.py +13 -2
gobby/workflows/git_utils.py +106 -0
gobby/workflows/lifecycle_evaluator.py +29 -1
gobby/workflows/llm_actions.py +30 -0
gobby/workflows/loader.py +19 -6
gobby/workflows/mcp_actions.py +20 -1
gobby/workflows/memory_actions.py +154 -0
gobby/workflows/safe_evaluator.py +183 -0
gobby/workflows/session_actions.py +44 -0
gobby/workflows/state_actions.py +60 -1
gobby/workflows/stop_signal_actions.py +55 -0
gobby/workflows/summary_actions.py +111 -1
gobby/workflows/task_sync_actions.py +347 -0
gobby/workflows/todo_actions.py +34 -1
gobby/workflows/webhook_actions.py +185 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/METADATA +87 -21
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/RECORD +201 -172
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/WHEEL +1 -1
gobby/adapters/codex.py +0 -1292
gobby/install/claude/commands/gobby/bug.md +0 -51
gobby/install/claude/commands/gobby/chore.md +0 -51
gobby/install/claude/commands/gobby/epic.md +0 -52
gobby/install/claude/commands/gobby/eval.md +0 -235
gobby/install/claude/commands/gobby/feat.md +0 -49
gobby/install/claude/commands/gobby/nit.md +0 -52
gobby/install/claude/commands/gobby/ref.md +0 -52
gobby/install/codex/prompts/forget.md +0 -7
gobby/install/codex/prompts/memories.md +0 -7
gobby/install/codex/prompts/recall.md +0 -7
gobby/install/codex/prompts/remember.md +0 -13
gobby/llm/gemini_executor.py +0 -339
gobby/mcp_proxy/tools/session_messages.py +0 -1056
gobby/mcp_proxy/tools/task_expansion.py +0 -591
gobby/prompts/defaults/expansion/system.md +0 -119
gobby/prompts/defaults/expansion/user.md +0 -48
gobby/prompts/defaults/external_validation/agent.md +0 -72
gobby/prompts/defaults/external_validation/external.md +0 -63
gobby/prompts/defaults/external_validation/spawn.md +0 -83
gobby/prompts/defaults/external_validation/system.md +0 -6
gobby/prompts/defaults/features/import_mcp.md +0 -22
gobby/prompts/defaults/features/import_mcp_github.md +0 -17
gobby/prompts/defaults/features/import_mcp_search.md +0 -16
gobby/prompts/defaults/features/recommend_tools.md +0 -32
gobby/prompts/defaults/features/recommend_tools_hybrid.md +0 -35
gobby/prompts/defaults/features/recommend_tools_llm.md +0 -30
gobby/prompts/defaults/features/server_description.md +0 -20
gobby/prompts/defaults/features/server_description_system.md +0 -6
gobby/prompts/defaults/features/task_description.md +0 -31
gobby/prompts/defaults/features/task_description_system.md +0 -6
gobby/prompts/defaults/features/tool_summary.md +0 -17
gobby/prompts/defaults/features/tool_summary_system.md +0 -6
gobby/prompts/defaults/research/step.md +0 -58
gobby/prompts/defaults/validation/criteria.md +0 -47
gobby/prompts/defaults/validation/validate.md +0 -38
gobby/storage/migrations_legacy.py +0 -1359
gobby/tasks/context.py +0 -747
gobby/tasks/criteria.py +0 -342
gobby/tasks/expansion.py +0 -626
gobby/tasks/prompts/expand.py +0 -327
gobby/tasks/research.py +0 -421
gobby/tasks/tdd.py +0 -352
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/entry_points.txt +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/licenses/LICENSE.md +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/top_level.txt +0 -0

gobby/llm/codex_executor.py CHANGED Viewed

@@ -1,30 +1,19 @@
 """
-Codex (OpenAI) implementation of AgentExecutor.
+Codex (OpenAI) implementation of AgentExecutor for CLI/subscription mode only.
-Supports two authentication modes with different capabilities:
+This executor spawns `codex exec --json` CLI and parses JSONL events.
+It uses Codex's built-in tools (bash, file operations, etc.) - NO custom tool
+injection is supported.
-1. api_key mode (OPENAI_API_KEY):
-   - Uses OpenAI API with function calling
-   - Full tool injection support
-   - Requires OPENAI_API_KEY environment variable
-2. subscription mode (ChatGPT Plus/Pro/Team/Enterprise):
-   - Spawns `codex exec --json` CLI and parses JSONL events
-   - Uses Codex's built-in tools (bash, file operations, etc.)
-   - NO custom tool injection - tools parameter is IGNORED
-   - Good for delegating complete autonomous tasks
-IMPORTANT: These modes have fundamentally different capabilities.
-Use api_key mode if you need custom MCP tool injection.
-Use subscription mode for delegating complete tasks to Codex.
+Note: api_key mode is now routed through LiteLLMExecutor for unified cost tracking.
+Use the resolver.create_executor() function which handles routing automatically.
 """
 import asyncio
 import json
 import logging
-import os
 import shutil
-from typing import Any, Literal
+from typing import Literal
 from gobby.llm.executor import (
     AgentExecutor,
@@ -36,39 +25,23 @@ from gobby.llm.executor import (
 logger = logging.getLogger(__name__)
-# Auth mode type
-CodexAuthMode = Literal["api_key", "subscription"]
+# Auth mode type - subscription/cli only, api_key routes through LiteLLM
+CodexAuthMode = Literal["subscription", "cli"]
 class CodexExecutor(AgentExecutor):
     """
-    Codex (OpenAI) implementation of AgentExecutor.
-    Supports two authentication modes with DIFFERENT CAPABILITIES:
-    api_key mode:
-        - Uses OpenAI API function calling (like GPT-4)
-        - Full tool injection support via tools parameter
-        - Requires OPENAI_API_KEY environment variable
-        - Standard agentic loop with custom tools
-    subscription mode:
-        - Spawns `codex exec --json` CLI process
-        - Parses JSONL events (thread.started, item.completed, turn.completed)
-        - Uses Codex's built-in tools ONLY (bash, file ops, web search, etc.)
-        - The `tools` parameter is IGNORED in this mode
-        - Cannot inject custom MCP tools
-        - Best for delegating complete autonomous tasks
-    Example (api_key mode):
-        >>> executor = CodexExecutor(auth_mode="api_key")
-        >>> result = await executor.run(
-        ...     prompt="Create a task",
-        ...     tools=[ToolSchema(name="create_task", ...)],
-        ...     tool_handler=my_handler,
-        ... )
+    Codex (OpenAI) implementation of AgentExecutor for CLI mode only.
+    Spawns `codex exec --json` CLI process and parses JSONL events.
+    Uses Codex's built-in tools ONLY (bash, file ops, web search, etc.).
+    The `tools` parameter is IGNORED - cannot inject custom MCP tools.
+    Best for delegating complete autonomous tasks.
+    For api_key mode with custom tool injection, use LiteLLMExecutor with
+    provider="codex" which routes through OpenAI API for unified cost tracking.
-    Example (subscription mode):
+    Example:
         >>> executor = CodexExecutor(auth_mode="subscription")
         >>> result = await executor.run(
         ...     prompt="Fix the bug in main.py and run the tests",
@@ -77,83 +50,49 @@ class CodexExecutor(AgentExecutor):
         ... )
     """
+    _cli_path: str
     def __init__(
         self,
-        auth_mode: CodexAuthMode = "api_key",
-        api_key: str | None = None,
+        auth_mode: CodexAuthMode = "subscription",
         default_model: str = "gpt-4o",
     ):
         """
-        Initialize CodexExecutor.
+        Initialize CodexExecutor for CLI/subscription mode.
         Args:
-            auth_mode: Authentication mode.
-                - "api_key": Use OpenAI API with function calling (requires OPENAI_API_KEY)
-                - "subscription": Use Codex CLI with ChatGPT subscription (requires `codex` in PATH)
-            api_key: OpenAI API key (optional for api_key mode, uses OPENAI_API_KEY env var).
-            default_model: Default model for api_key mode (default: gpt-4o).
+            auth_mode: Must be "subscription" or "cli". API key mode is handled by LiteLLMExecutor.
+            default_model: Default model (not used in CLI mode, kept for interface compatibility).
+        Raises:
+            ValueError: If auth_mode is not "subscription"/"cli" or Codex CLI not found.
         """
+        if auth_mode not in ("subscription", "cli"):
+            raise ValueError(
+                "CodexExecutor only supports subscription/cli mode. "
+                "For api_key mode with custom tools, use LiteLLMExecutor with provider='codex'."
+            )
         self.auth_mode = auth_mode
         self.default_model = default_model
         self.logger = logger
-        self._client: Any = None
-        self._cli_path: str = ""
-        if auth_mode == "api_key":
-            # Use provided key or fall back to environment variable
-            key = api_key or os.environ.get("OPENAI_API_KEY")
-            if not key:
-                raise ValueError(
-                    "API key required for api_key mode. "
-                    "Provide api_key parameter or set OPENAI_API_KEY env var."
-                )
-            try:
-                from openai import AsyncOpenAI
-                self._client = AsyncOpenAI(api_key=key)
-                self.logger.debug("CodexExecutor initialized with API key")
-            except ImportError as e:
-                raise ImportError(
-                    "openai package not found. Please install with `pip install openai`."
-                ) from e
-        elif auth_mode == "subscription":
-            # Verify Codex CLI is available
-            cli_path = shutil.which("codex")
-            if not cli_path:
-                raise ValueError(
-                    "Codex CLI not found in PATH. "
-                    "Install Codex CLI and run `codex login` for subscription mode."
-                )
-            self._cli_path = cli_path
-            self.logger.debug(f"CodexExecutor initialized with CLI at {cli_path}")
-        else:
-            raise ValueError(f"Unknown auth_mode: {auth_mode}")
+        self._cli_path = ""
+        # Verify Codex CLI is available
+        cli_path = shutil.which("codex")
+        if not cli_path:
+            raise ValueError(
+                "Codex CLI not found in PATH. "
+                "Install Codex CLI and run `codex login` for subscription mode."
+            )
+        self._cli_path = cli_path
+        self.logger.debug(f"CodexExecutor initialized with CLI at {cli_path}")
     @property
     def provider_name(self) -> str:
         """Return the provider name."""
         return "codex"
-    def _convert_tools_to_openai_format(self, tools: list[ToolSchema]) -> list[dict[str, Any]]:
-        """Convert ToolSchema list to OpenAI function calling format."""
-        openai_tools = []
-        for tool in tools:
-            # Ensure input_schema has "type": "object"
-            params = {"type": "object", **tool.input_schema}
-            openai_tools.append(
-                {
-                    "type": "function",
-                    "function": {
-                        "name": tool.name,
-                        "description": tool.description,
-                        "parameters": params,
-                    },
-                }
-            )
-        return openai_tools
     async def run(
         self,
         prompt: str,
@@ -165,200 +104,29 @@ class CodexExecutor(AgentExecutor):
         timeout: float = 120.0,
     ) -> AgentResult:
         """
-        Execute an agentic loop.
+        Execute Codex CLI and parse JSONL events.
+        Note: The tools and tool_handler parameters are IGNORED in CLI mode.
+        Codex uses its own built-in tools (bash, file operations, etc.).
-        For api_key mode: Uses OpenAI function calling with custom tools.
-        For subscription mode: Spawns Codex CLI (tools parameter is IGNORED).
+        For custom tool injection, use LiteLLMExecutor with provider="codex".
         Args:
             prompt: The user prompt to process.
-            tools: List of available tools (IGNORED in subscription mode).
-            tool_handler: Callback for tool calls (NOT CALLED in subscription mode).
-            system_prompt: Optional system prompt (api_key mode only).
-            model: Optional model override (api_key mode only).
-            max_turns: Maximum turns before stopping (api_key mode only).
+            tools: IGNORED - Codex uses its own tools.
+            tool_handler: IGNORED - not called in CLI mode.
+            system_prompt: IGNORED in CLI mode.
+            model: IGNORED in CLI mode.
+            max_turns: IGNORED in CLI mode.
             timeout: Maximum execution time in seconds.
         Returns:
             AgentResult with output, status, and tool call records.
         """
-        if self.auth_mode == "api_key":
-            return await self._run_with_api(
-                prompt=prompt,
-                tools=tools,
-                tool_handler=tool_handler,
-                system_prompt=system_prompt,
-                model=model or self.default_model,
-                max_turns=max_turns,
-                timeout=timeout,
-            )
-        else:
-            return await self._run_with_cli(
-                prompt=prompt,
-                timeout=timeout,
-            )
-    async def _run_with_api(
-        self,
-        prompt: str,
-        tools: list[ToolSchema],
-        tool_handler: ToolHandler,
-        system_prompt: str | None,
-        model: str,
-        max_turns: int,
-        timeout: float,
-    ) -> AgentResult:
-        """Run using OpenAI API with function calling."""
-        if self._client is None:
-            return AgentResult(
-                output="",
-                status="error",
-                error="OpenAI client not initialized",
-                turns_used=0,
-            )
-        tool_calls_list: list[ToolCallRecord] = []
-        openai_tools = self._convert_tools_to_openai_format(tools)
-        # Build initial messages
-        messages: list[dict[str, Any]] = []
-        if system_prompt:
-            messages.append({"role": "system", "content": system_prompt})
-        messages.append({"role": "user", "content": prompt})
-        # Track turns in outer scope so timeout handler can access the count
-        turns_counter = [0]
-        async def _run_loop() -> AgentResult:
-            nonlocal messages
-            turns_used = 0
-            final_output = ""
-            client = self._client
-            if client is None:
-                raise RuntimeError("CodexExecutor client not initialized")
-            while turns_used < max_turns:
-                turns_used += 1
-                turns_counter[0] = turns_used
-                # Call OpenAI
-                try:
-                    response = await client.chat.completions.create(
-                        model=model,
-                        messages=messages,
-                        tools=openai_tools if openai_tools else None,
-                        max_tokens=8192,
-                    )
-                except Exception as e:
-                    self.logger.error(f"OpenAI API error: {e}")
-                    return AgentResult(
-                        output="",
-                        status="error",
-                        tool_calls=tool_calls_list,
-                        error=f"OpenAI API error: {e}",
-                        turns_used=turns_used,
-                    )
-                # Get the assistant's message
-                choice = response.choices[0]
-                message = choice.message
-                # Extract text content
-                if message.content:
-                    final_output = message.content
-                # Add assistant message to history
-                messages.append(message.model_dump())
-                # Check if there are tool calls
-                if not message.tool_calls:
-                    # No tool calls - we're done
-                    return AgentResult(
-                        output=final_output,
-                        status="success",
-                        tool_calls=tool_calls_list,
-                        turns_used=turns_used,
-                    )
-                # Handle tool calls
-                for tool_call in message.tool_calls:
-                    tool_name = tool_call.function.name
-                    try:
-                        arguments = json.loads(tool_call.function.arguments)
-                    except json.JSONDecodeError as e:
-                        self.logger.warning(
-                            f"Failed to parse tool call arguments for '{tool_name}' "
-                            f"(id={getattr(tool_call, 'id', 'unknown')}): {e}. "
-                            f"Arguments: {tool_call.function.arguments!r}"
-                        )
-                        arguments = {}
-                    # Record the tool call
-                    record = ToolCallRecord(
-                        tool_name=tool_name,
-                        arguments=arguments,
-                    )
-                    tool_calls_list.append(record)
-                    # Execute via handler
-                    try:
-                        result = await tool_handler(tool_name, arguments)
-                        record.result = result
-                        # Format result for OpenAI
-                        if result.success:
-                            content = json.dumps(result.result) if result.result else "Success"
-                        else:
-                            content = f"Error: {result.error}"
-                    except Exception as e:
-                        self.logger.error(f"Tool handler error for {tool_name}: {e}")
-                        from gobby.llm.executor import ToolResult as TR
-                        record.result = TR(
-                            tool_name=tool_name,
-                            success=False,
-                            error=str(e),
-                        )
-                        content = f"Error: {e}"
-                    # Add tool result to messages
-                    messages.append(
-                        {
-                            "role": "tool",
-                            "tool_call_id": tool_call.id,
-                            "content": content,
-                        }
-                    )
-                # Check finish reason
-                if choice.finish_reason == "stop":
-                    return AgentResult(
-                        output=final_output,
-                        status="success",
-                        tool_calls=tool_calls_list,
-                        turns_used=turns_used,
-                    )
-            # Max turns reached
-            return AgentResult(
-                output=final_output,
-                status="partial",
-                tool_calls=tool_calls_list,
-                turns_used=turns_used,
-            )
-        # Run with timeout
-        try:
-            return await asyncio.wait_for(_run_loop(), timeout=timeout)
-        except TimeoutError:
-            return AgentResult(
-                output="",
-                status="timeout",
-                tool_calls=tool_calls_list,
-                error=f"Execution timed out after {timeout}s",
-                turns_used=turns_counter[0],
-            )
+        return await self._run_with_cli(
+            prompt=prompt,
+            timeout=timeout,
+        )
     async def _run_with_cli(
         self,

gobby/llm/executor.py CHANGED Viewed

@@ -59,6 +59,23 @@ class ToolCallRecord:
     """Result from the tool execution."""
+@dataclass
+class CostInfo:
+    """Cost information from an LLM call."""
+    prompt_tokens: int = 0
+    """Number of tokens in the prompt."""
+    completion_tokens: int = 0
+    """Number of tokens in the completion."""
+    total_cost: float = 0.0
+    """Total cost in USD for this call."""
+    model: str = ""
+    """Model used for this call (LiteLLM format with prefix)."""
 @dataclass
 class AgentResult:
     """Result from running an agent to completion."""
@@ -93,6 +110,9 @@ class AgentResult:
     child_session_id: str | None = None
     """ID of the child session created for this agent (set by AgentRunner)."""
+    cost_info: CostInfo | None = None
+    """Cost tracking information (populated by LiteLLM executor)."""
 # Type alias for the tool handler callback
 ToolHandler = Callable[[str, dict[str, Any]], Awaitable[ToolResult]]
@@ -310,6 +330,7 @@ class AgentExecutor(ABC):
         if completion_result is not None:
             completion_result.tool_calls = result.tool_calls
             completion_result.turns_used = result.turns_used
+            completion_result.cost_info = result.cost_info
             return completion_result
         # Otherwise, return the raw result (might be timeout or natural end)

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl