PyPI - gobby - Versions diffs - 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl - Mend

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (244) hide show

gobby/__init__.py +1 -1
gobby/adapters/__init__.py +2 -1
gobby/adapters/claude_code.py +13 -4
gobby/adapters/codex_impl/__init__.py +28 -0
gobby/adapters/codex_impl/adapter.py +722 -0
gobby/adapters/codex_impl/client.py +679 -0
gobby/adapters/codex_impl/protocol.py +20 -0
gobby/adapters/codex_impl/types.py +68 -0
gobby/agents/definitions.py +11 -1
gobby/agents/isolation.py +395 -0
gobby/agents/runner.py +8 -0
gobby/agents/sandbox.py +261 -0
gobby/agents/spawn.py +42 -287
gobby/agents/spawn_executor.py +385 -0
gobby/agents/spawners/__init__.py +24 -0
gobby/agents/spawners/command_builder.py +189 -0
gobby/agents/spawners/embedded.py +21 -2
gobby/agents/spawners/headless.py +21 -2
gobby/agents/spawners/prompt_manager.py +125 -0
gobby/cli/__init__.py +6 -0
gobby/cli/clones.py +419 -0
gobby/cli/conductor.py +266 -0
gobby/cli/install.py +4 -4
gobby/cli/installers/antigravity.py +3 -9
gobby/cli/installers/claude.py +15 -9
gobby/cli/installers/codex.py +2 -8
gobby/cli/installers/gemini.py +8 -8
gobby/cli/installers/shared.py +175 -13
gobby/cli/sessions.py +1 -1
gobby/cli/skills.py +858 -0
gobby/cli/tasks/ai.py +0 -440
gobby/cli/tasks/crud.py +44 -6
gobby/cli/tasks/main.py +0 -4
gobby/cli/tui.py +2 -2
gobby/cli/utils.py +12 -5
gobby/clones/__init__.py +13 -0
gobby/clones/git.py +547 -0
gobby/conductor/__init__.py +16 -0
gobby/conductor/alerts.py +135 -0
gobby/conductor/loop.py +164 -0
gobby/conductor/monitors/__init__.py +11 -0
gobby/conductor/monitors/agents.py +116 -0
gobby/conductor/monitors/tasks.py +155 -0
gobby/conductor/pricing.py +234 -0
gobby/conductor/token_tracker.py +160 -0
gobby/config/__init__.py +12 -97
gobby/config/app.py +69 -91
gobby/config/extensions.py +2 -2
gobby/config/features.py +7 -130
gobby/config/search.py +110 -0
gobby/config/servers.py +1 -1
gobby/config/skills.py +43 -0
gobby/config/tasks.py +9 -41
gobby/hooks/__init__.py +0 -13
gobby/hooks/event_handlers.py +188 -2
gobby/hooks/hook_manager.py +50 -4
gobby/hooks/plugins.py +1 -1
gobby/hooks/skill_manager.py +130 -0
gobby/hooks/webhooks.py +1 -1
gobby/install/claude/hooks/hook_dispatcher.py +4 -4
gobby/install/codex/hooks/hook_dispatcher.py +1 -1
gobby/install/gemini/hooks/hook_dispatcher.py +87 -12
gobby/llm/claude.py +22 -34
gobby/llm/claude_executor.py +46 -256
gobby/llm/codex_executor.py +59 -291
gobby/llm/executor.py +21 -0
gobby/llm/gemini.py +134 -110
gobby/llm/litellm_executor.py +143 -6
gobby/llm/resolver.py +98 -35
gobby/mcp_proxy/importer.py +62 -4
gobby/mcp_proxy/instructions.py +56 -0
gobby/mcp_proxy/models.py +15 -0
gobby/mcp_proxy/registries.py +68 -8
gobby/mcp_proxy/server.py +33 -3
gobby/mcp_proxy/services/recommendation.py +43 -11
gobby/mcp_proxy/services/tool_proxy.py +81 -1
gobby/mcp_proxy/stdio.py +2 -1
gobby/mcp_proxy/tools/__init__.py +0 -2
gobby/mcp_proxy/tools/agent_messaging.py +317 -0
gobby/mcp_proxy/tools/agents.py +31 -731
gobby/mcp_proxy/tools/clones.py +518 -0
gobby/mcp_proxy/tools/memory.py +3 -26
gobby/mcp_proxy/tools/metrics.py +65 -1
gobby/mcp_proxy/tools/orchestration/__init__.py +3 -0
gobby/mcp_proxy/tools/orchestration/cleanup.py +151 -0
gobby/mcp_proxy/tools/orchestration/wait.py +467 -0
gobby/mcp_proxy/tools/sessions/__init__.py +14 -0
gobby/mcp_proxy/tools/sessions/_commits.py +232 -0
gobby/mcp_proxy/tools/sessions/_crud.py +253 -0
gobby/mcp_proxy/tools/sessions/_factory.py +63 -0
gobby/mcp_proxy/tools/sessions/_handoff.py +499 -0
gobby/mcp_proxy/tools/sessions/_messages.py +138 -0
gobby/mcp_proxy/tools/skills/__init__.py +616 -0
gobby/mcp_proxy/tools/spawn_agent.py +417 -0
gobby/mcp_proxy/tools/task_orchestration.py +7 -0
gobby/mcp_proxy/tools/task_readiness.py +14 -0
gobby/mcp_proxy/tools/task_sync.py +1 -1
gobby/mcp_proxy/tools/tasks/_context.py +0 -20
gobby/mcp_proxy/tools/tasks/_crud.py +91 -4
gobby/mcp_proxy/tools/tasks/_expansion.py +348 -0
gobby/mcp_proxy/tools/tasks/_factory.py +6 -16
gobby/mcp_proxy/tools/tasks/_lifecycle.py +110 -45
gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +18 -29
gobby/mcp_proxy/tools/workflows.py +1 -1
gobby/mcp_proxy/tools/worktrees.py +0 -338
gobby/memory/backends/__init__.py +6 -1
gobby/memory/backends/mem0.py +6 -1
gobby/memory/extractor.py +477 -0
gobby/memory/ingestion/__init__.py +5 -0
gobby/memory/ingestion/multimodal.py +221 -0
gobby/memory/manager.py +73 -285
gobby/memory/search/__init__.py +10 -0
gobby/memory/search/coordinator.py +248 -0
gobby/memory/services/__init__.py +5 -0
gobby/memory/services/crossref.py +142 -0
gobby/prompts/loader.py +5 -2
gobby/runner.py +37 -16
gobby/search/__init__.py +48 -6
gobby/search/backends/__init__.py +159 -0
gobby/search/backends/embedding.py +225 -0
gobby/search/embeddings.py +238 -0
gobby/search/models.py +148 -0
gobby/search/unified.py +496 -0
gobby/servers/http.py +24 -12
gobby/servers/routes/admin.py +294 -0
gobby/servers/routes/mcp/endpoints/__init__.py +61 -0
gobby/servers/routes/mcp/endpoints/discovery.py +405 -0
gobby/servers/routes/mcp/endpoints/execution.py +568 -0
gobby/servers/routes/mcp/endpoints/registry.py +378 -0
gobby/servers/routes/mcp/endpoints/server.py +304 -0
gobby/servers/routes/mcp/hooks.py +1 -1
gobby/servers/routes/mcp/tools.py +48 -1317
gobby/servers/websocket.py +2 -2
gobby/sessions/analyzer.py +2 -0
gobby/sessions/lifecycle.py +1 -1
gobby/sessions/processor.py +10 -0
gobby/sessions/transcripts/base.py +2 -0
gobby/sessions/transcripts/claude.py +79 -10
gobby/skills/__init__.py +91 -0
gobby/skills/loader.py +685 -0
gobby/skills/manager.py +384 -0
gobby/skills/parser.py +286 -0
gobby/skills/search.py +463 -0
gobby/skills/sync.py +119 -0
gobby/skills/updater.py +385 -0
gobby/skills/validator.py +368 -0
gobby/storage/clones.py +378 -0
gobby/storage/database.py +1 -1
gobby/storage/memories.py +43 -13
gobby/storage/migrations.py +162 -201
gobby/storage/sessions.py +116 -7
gobby/storage/skills.py +782 -0
gobby/storage/tasks/_crud.py +4 -4
gobby/storage/tasks/_lifecycle.py +57 -7
gobby/storage/tasks/_manager.py +14 -5
gobby/storage/tasks/_models.py +8 -3
gobby/sync/memories.py +40 -5
gobby/sync/tasks.py +83 -6
gobby/tasks/__init__.py +1 -2
gobby/tasks/external_validator.py +1 -1
gobby/tasks/validation.py +46 -35
gobby/tools/summarizer.py +91 -10
gobby/tui/api_client.py +4 -7
gobby/tui/app.py +5 -3
gobby/tui/screens/orchestrator.py +1 -2
gobby/tui/screens/tasks.py +2 -4
gobby/tui/ws_client.py +1 -1
gobby/utils/daemon_client.py +2 -2
gobby/utils/project_context.py +2 -3
gobby/utils/status.py +13 -0
gobby/workflows/actions.py +221 -1135
gobby/workflows/artifact_actions.py +31 -0
gobby/workflows/autonomous_actions.py +11 -0
gobby/workflows/context_actions.py +93 -1
gobby/workflows/detection_helpers.py +115 -31
gobby/workflows/enforcement/__init__.py +47 -0
gobby/workflows/enforcement/blocking.py +269 -0
gobby/workflows/enforcement/commit_policy.py +283 -0
gobby/workflows/enforcement/handlers.py +269 -0
gobby/workflows/{task_enforcement_actions.py → enforcement/task_policy.py} +29 -388
gobby/workflows/engine.py +13 -2
gobby/workflows/git_utils.py +106 -0
gobby/workflows/lifecycle_evaluator.py +29 -1
gobby/workflows/llm_actions.py +30 -0
gobby/workflows/loader.py +19 -6
gobby/workflows/mcp_actions.py +20 -1
gobby/workflows/memory_actions.py +154 -0
gobby/workflows/safe_evaluator.py +183 -0
gobby/workflows/session_actions.py +44 -0
gobby/workflows/state_actions.py +60 -1
gobby/workflows/stop_signal_actions.py +55 -0
gobby/workflows/summary_actions.py +111 -1
gobby/workflows/task_sync_actions.py +347 -0
gobby/workflows/todo_actions.py +34 -1
gobby/workflows/webhook_actions.py +185 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/METADATA +87 -21
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/RECORD +201 -172
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/WHEEL +1 -1
gobby/adapters/codex.py +0 -1292
gobby/install/claude/commands/gobby/bug.md +0 -51
gobby/install/claude/commands/gobby/chore.md +0 -51
gobby/install/claude/commands/gobby/epic.md +0 -52
gobby/install/claude/commands/gobby/eval.md +0 -235
gobby/install/claude/commands/gobby/feat.md +0 -49
gobby/install/claude/commands/gobby/nit.md +0 -52
gobby/install/claude/commands/gobby/ref.md +0 -52
gobby/install/codex/prompts/forget.md +0 -7
gobby/install/codex/prompts/memories.md +0 -7
gobby/install/codex/prompts/recall.md +0 -7
gobby/install/codex/prompts/remember.md +0 -13
gobby/llm/gemini_executor.py +0 -339
gobby/mcp_proxy/tools/session_messages.py +0 -1056
gobby/mcp_proxy/tools/task_expansion.py +0 -591
gobby/prompts/defaults/expansion/system.md +0 -119
gobby/prompts/defaults/expansion/user.md +0 -48
gobby/prompts/defaults/external_validation/agent.md +0 -72
gobby/prompts/defaults/external_validation/external.md +0 -63
gobby/prompts/defaults/external_validation/spawn.md +0 -83
gobby/prompts/defaults/external_validation/system.md +0 -6
gobby/prompts/defaults/features/import_mcp.md +0 -22
gobby/prompts/defaults/features/import_mcp_github.md +0 -17
gobby/prompts/defaults/features/import_mcp_search.md +0 -16
gobby/prompts/defaults/features/recommend_tools.md +0 -32
gobby/prompts/defaults/features/recommend_tools_hybrid.md +0 -35
gobby/prompts/defaults/features/recommend_tools_llm.md +0 -30
gobby/prompts/defaults/features/server_description.md +0 -20
gobby/prompts/defaults/features/server_description_system.md +0 -6
gobby/prompts/defaults/features/task_description.md +0 -31
gobby/prompts/defaults/features/task_description_system.md +0 -6
gobby/prompts/defaults/features/tool_summary.md +0 -17
gobby/prompts/defaults/features/tool_summary_system.md +0 -6
gobby/prompts/defaults/research/step.md +0 -58
gobby/prompts/defaults/validation/criteria.md +0 -47
gobby/prompts/defaults/validation/validate.md +0 -38
gobby/storage/migrations_legacy.py +0 -1359
gobby/tasks/context.py +0 -747
gobby/tasks/criteria.py +0 -342
gobby/tasks/expansion.py +0 -626
gobby/tasks/prompts/expand.py +0 -327
gobby/tasks/research.py +0 -421
gobby/tasks/tdd.py +0 -352
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/entry_points.txt +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/licenses/LICENSE.md +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/top_level.txt +0 -0

gobby/workflows/artifact_actions.py CHANGED Viewed

@@ -4,6 +4,7 @@ Extracted from actions.py as part of strangler fig decomposition.
 These functions handle file artifact capture and reading.
 """
+import asyncio
 import glob
 import logging
 import os
@@ -101,3 +102,33 @@ def read_artifact(
     except Exception as e:
         logger.error(f"read_artifact: Failed to read {filepath}: {e}")
         return None
+# --- ActionHandler-compatible wrappers ---
+# These match the ActionHandler protocol: (context: ActionContext, **kwargs) -> dict | None
+if __name__ != "__main__":
+    from typing import TYPE_CHECKING
+    if TYPE_CHECKING:
+        from gobby.workflows.actions import ActionContext
+async def handle_capture_artifact(context: "ActionContext", **kwargs: Any) -> dict[str, Any] | None:
+    """ActionHandler wrapper for capture_artifact."""
+    return await asyncio.to_thread(
+        capture_artifact,
+        state=context.state,
+        pattern=kwargs.get("pattern"),
+        save_as=kwargs.get("as"),
+    )
+async def handle_read_artifact(context: "ActionContext", **kwargs: Any) -> dict[str, Any] | None:
+    """ActionHandler wrapper for read_artifact."""
+    return await asyncio.to_thread(
+        read_artifact,
+        state=context.state,
+        pattern=kwargs.get("pattern"),
+        variable_name=kwargs.get("as"),
+    )

gobby/workflows/autonomous_actions.py CHANGED Viewed

@@ -284,3 +284,14 @@ def get_progress_summary(
         "last_event_at": (summary.last_event_at.isoformat() if summary.last_event_at else None),
         "events_by_type": {k.value: v for k, v in summary.events_by_type.items()},
     }
+# --- ActionHandler-compatible wrappers ---
+# These match the ActionHandler protocol: (context: ActionContext, **kwargs) -> dict | None
+# Note: These handlers require executor access for progress_tracker and stuck_detector,
+# so they are created as closures inside ActionExecutor._register_defaults().
+# No wrapper functions are defined in this file. The actual handler implementations
+# are closures created in ActionExecutor._register_defaults() which capture the
+# executor's self.progress_tracker and self.stuck_detector references. See that
+# method for the actual implementations and where these components are hooked up.

gobby/workflows/context_actions.py CHANGED Viewed

@@ -6,10 +6,14 @@ These functions handle context injection, message injection, and handoff extract
 from __future__ import annotations
+import asyncio
 import json
 import logging
 from pathlib import Path
-from typing import Any
+from typing import TYPE_CHECKING, Any
+if TYPE_CHECKING:
+    from gobby.workflows.actions import ActionContext
 from gobby.workflows.git_utils import get_git_status, get_recent_git_commits
@@ -304,6 +308,17 @@ def extract_handoff_context(
         except Exception as wt_err:
             logger.debug(f"Failed to get worktree context: {wt_err}")
+        # Add active skills from HookSkillManager
+        try:
+            from gobby.hooks.skill_manager import HookSkillManager
+            skill_manager = HookSkillManager()
+            core_skills = skill_manager.discover_core_skills()
+            always_apply_skills = [s.name for s in core_skills if s.is_always_apply()]
+            handoff_ctx.active_skills = always_apply_skills
+        except Exception as skill_err:
+            logger.debug(f"Failed to get active skills: {skill_err}")
         # Format as markdown (like /clear stores formatted summary)
         markdown = format_handoff_as_markdown(handoff_ctx)
@@ -320,6 +335,32 @@ def extract_handoff_context(
         return {"error": str(e)}
+def recommend_skills_for_task(task: dict[str, Any] | None) -> list[str]:
+    """Recommend relevant skills based on task category.
+    Uses HookSkillManager to get skill recommendations based on the task's
+    category field. Returns always-apply skills if no category is set.
+    Args:
+        task: Task dict with optional 'category' field, or None.
+    Returns:
+        List of recommended skill names for this task.
+    """
+    if task is None:
+        return []
+    try:
+        from gobby.hooks.skill_manager import HookSkillManager
+        manager = HookSkillManager()
+        category = task.get("category")
+        return manager.recommend_skills(category=category)
+    except Exception as e:
+        logger.debug(f"Failed to recommend skills: {e}")
+        return []
 def format_handoff_as_markdown(ctx: Any, prompt_template: str | None = None) -> str:
     """Format HandoffContext as markdown for storage.
@@ -391,4 +432,55 @@ def format_handoff_as_markdown(ctx: Any, prompt_template: str | None = None) ->
             lines.append(f"- {activity}")
         sections.append("\n".join(lines))
+    # Active skills section
+    if hasattr(ctx, "active_skills") and ctx.active_skills:
+        lines = ["### Active Skills"]
+        lines.append(f"Skills available: {', '.join(ctx.active_skills)}")
+        sections.append("\n".join(lines))
     return "\n\n".join(sections)
+# --- ActionHandler-compatible wrappers ---
+# These match the ActionHandler protocol: (context: ActionContext, **kwargs) -> dict | None
+async def handle_inject_context(context: ActionContext, **kwargs: Any) -> dict[str, Any] | None:
+    """ActionHandler wrapper for inject_context."""
+    return await asyncio.to_thread(
+        inject_context,
+        session_manager=context.session_manager,
+        session_id=context.session_id,
+        state=context.state,
+        template_engine=context.template_engine,
+        source=kwargs.get("source"),
+        template=kwargs.get("template"),
+        require=kwargs.get("require", False),
+    )
+async def handle_inject_message(context: ActionContext, **kwargs: Any) -> dict[str, Any] | None:
+    """ActionHandler wrapper for inject_message."""
+    return await asyncio.to_thread(
+        inject_message,
+        session_manager=context.session_manager,
+        session_id=context.session_id,
+        state=context.state,
+        template_engine=context.template_engine,
+        content=kwargs.get("content"),
+        **{k: v for k, v in kwargs.items() if k != "content"},
+    )
+async def handle_extract_handoff_context(
+    context: ActionContext, **kwargs: Any
+) -> dict[str, Any] | None:
+    """ActionHandler wrapper for extract_handoff_context."""
+    return await asyncio.to_thread(
+        extract_handoff_context,
+        session_manager=context.session_manager,
+        session_id=context.session_id,
+        config=context.config,
+        db=context.db,
+        worktree_manager=kwargs.get("worktree_manager"),
+    )

gobby/workflows/detection_helpers.py CHANGED Viewed

@@ -11,6 +11,7 @@ from typing import TYPE_CHECKING
 if TYPE_CHECKING:
     from gobby.hooks.events import HookEvent
+    from gobby.storage.tasks import LocalTaskManager
     from gobby.tasks.session_tasks import SessionTaskManager
     from .definitions import WorkflowState
@@ -22,6 +23,7 @@ def detect_task_claim(
     event: "HookEvent",
     state: "WorkflowState",
     session_task_manager: "SessionTaskManager | None" = None,
+    task_manager: "LocalTaskManager | None" = None,
 ) -> None:
     """Detect gobby-tasks calls that claim or release a task for this session.
@@ -44,7 +46,8 @@ def detect_task_claim(
     tool_name = event.data.get("tool_name", "")
     tool_input = event.data.get("tool_input", {}) or {}
-    tool_output = event.data.get("tool_output", {}) or {}
+    # Claude Code sends "tool_result", but we also check "tool_output" for compatibility
+    tool_output = event.data.get("tool_result") or event.data.get("tool_output") or {}
     # Check if this is a gobby-tasks call via MCP proxy
     # Tool name could be "call_tool" (from legacy) or "mcp__gobby__call_tool" (direct)
@@ -58,7 +61,34 @@ def detect_task_claim(
     # Check inner tool name
     inner_tool_name = tool_input.get("tool_name", "")
-    if inner_tool_name not in ("create_task", "update_task", "close_task"):
+    # Handle close_task - clears task_claimed when task is closed
+    # Note: Claude Code doesn't include tool_result in post-tool-use hooks, so for CC
+    # the workflow state is updated directly in the MCP proxy's close_task function.
+    # This detection provides a fallback for CLIs that do report tool results (Gemini/Codex).
+    if inner_tool_name == "close_task":
+        tool_output = event.data.get("tool_result") or event.data.get("tool_output") or {}
+        # If no tool output, skip - can't verify success
+        # The MCP proxy's close_task handles state clearing for successful closes
+        if not tool_output:
+            return
+        # Check if close succeeded (not an error)
+        if isinstance(tool_output, dict):
+            if tool_output.get("error") or tool_output.get("status") == "error":
+                return
+            result = tool_output.get("result", {})
+            if isinstance(result, dict) and result.get("error"):
+                return
+        # Clear task_claimed on successful close
+        state.variables["task_claimed"] = False
+        state.variables["claimed_task_id"] = None
+        logger.info(f"Session {state.session_id}: task_claimed=False (detected close_task success)")
+        return
+    if inner_tool_name not in ("create_task", "update_task", "claim_task"):
         return
     # For update_task, only count if status is being set to in_progress
@@ -66,11 +96,9 @@ def detect_task_claim(
         arguments = tool_input.get("arguments", {}) or {}
         if arguments.get("status") != "in_progress":
             return
+    # claim_task always counts (it sets status to in_progress internally)
-    # For close_task, we'll clear task_claimed after success check
-    is_close_task = inner_tool_name == "close_task"
-    # Check if the call succeeded (not an error)
+    # Check if the call succeeded (not an error) - for non-close_task operations
     # tool_output structure varies, but errors typically have "error" key
     # or the MCP response has "status": "error"
     if isinstance(tool_output, dict):
@@ -81,35 +109,26 @@ def detect_task_claim(
         if isinstance(result, dict) and result.get("error"):
             return
-    # Handle close_task - clear the claim only if closing the claimed task
-    if is_close_task:
-        arguments = tool_input.get("arguments", {}) or {}
-        closed_task_id = arguments.get("task_id")
-        claimed_task_id = state.variables.get("claimed_task_id")
-        # Only clear task_claimed if we're closing the task that was claimed
-        if closed_task_id and claimed_task_id and closed_task_id == claimed_task_id:
-            state.variables["task_claimed"] = False
-            state.variables["claimed_task_id"] = None
-            logger.info(
-                f"Session {state.session_id}: task_claimed=False "
-                f"(claimed task {closed_task_id} closed via close_task)"
-            )
-        else:
-            logger.debug(
-                f"Session {state.session_id}: close_task for {closed_task_id} "
-                f"(claimed: {claimed_task_id}) - not clearing task_claimed"
-            )
-        return
     # Extract task_id based on tool type
     arguments = tool_input.get("arguments", {}) or {}
-    if inner_tool_name == "update_task":
+    if inner_tool_name in ("update_task", "claim_task"):
         task_id = arguments.get("task_id")
+        # Resolve to UUID for consistent comparison with close_task
+        if task_id and task_manager:
+            try:
+                task = task_manager.get_task(task_id)
+                if task:
+                    task_id = task.id  # Use UUID
+            except Exception:  # nosec B110 - best effort resolution, keep original if fails
+                pass
     elif inner_tool_name == "create_task":
         # For create_task, the id is in the result
         result = tool_output.get("result", {}) if isinstance(tool_output, dict) else {}
         task_id = result.get("id") if isinstance(result, dict) else None
+        # Skip if we can't get the task ID (e.g., Claude Code doesn't include tool results)
+        # The MCP tool itself handles state updates in this case via _crud.py
+        if not task_id:
+            return
     else:
         task_id = None
@@ -121,8 +140,8 @@ def detect_task_claim(
         f"(via {inner_tool_name})"
     )
-    # Auto-link task to session when status is set to in_progress
-    if inner_tool_name == "update_task":
+    # Auto-link task to session when claiming a task
+    if inner_tool_name in ("update_task", "claim_task"):
         arguments = tool_input.get("arguments", {}) or {}
         task_id = arguments.get("task_id")
         if task_id and session_task_manager:
@@ -159,6 +178,70 @@ def detect_plan_mode(event: "HookEvent", state: "WorkflowState") -> None:
         logger.info(f"Session {state.session_id}: plan_mode=False (exited plan mode)")
+def detect_plan_mode_from_context(event: "HookEvent", state: "WorkflowState") -> None:
+    """Detect plan mode from system reminders injected by Claude Code.
+    Claude Code injects system reminders like "Plan mode is active" when the user
+    enters plan mode via the UI (not via the EnterPlanMode tool). This function
+    detects those reminders and sets the plan_mode variable accordingly.
+    IMPORTANT: Only matches indicators within <system-reminder> tags to avoid
+    false positives from handoff context or user messages that mention plan mode.
+    This complements detect_plan_mode() which only catches programmatic tool calls.
+    Args:
+        event: The BEFORE_AGENT hook event (contains user prompt with system reminders)
+        state: Current workflow state (modified in place)
+    """
+    if not event.data:
+        return
+    # Check for plan mode system reminder in the prompt
+    prompt = event.data.get("prompt", "") or ""
+    # Extract only content within <system-reminder> tags to avoid false positives
+    # from handoff context or user messages mentioning plan mode
+    import re
+    system_reminders = re.findall(r"<system-reminder>(.*?)</system-reminder>", prompt, re.DOTALL)
+    reminder_text = " ".join(system_reminders)
+    # Claude Code injects these phrases in system reminders when plan mode is active
+    plan_mode_indicators = [
+        "Plan mode is active",
+        "Plan mode still active",
+        "You are in plan mode",
+    ]
+    # Check if plan mode is indicated in system reminders only
+    for indicator in plan_mode_indicators:
+        if indicator in reminder_text:
+            if not state.variables.get("plan_mode"):
+                state.variables["plan_mode"] = True
+                logger.info(
+                    f"Session {state.session_id}: plan_mode=True "
+                    f"(detected from system reminder: '{indicator}')"
+                )
+            return
+    # Detect exit from plan mode (also only in system reminders)
+    exit_indicators = [
+        "Exited Plan Mode",
+        "Plan mode exited",
+    ]
+    for indicator in exit_indicators:
+        if indicator in reminder_text:
+            if state.variables.get("plan_mode"):
+                state.variables["plan_mode"] = False
+                logger.info(
+                    f"Session {state.session_id}: plan_mode=False "
+                    f"(detected from system reminder: '{indicator}')"
+                )
+            return
 def detect_mcp_call(event: "HookEvent", state: "WorkflowState") -> None:
     """Track MCP tool calls by server/tool for workflow conditions.
@@ -180,7 +263,8 @@ def detect_mcp_call(event: "HookEvent", state: "WorkflowState") -> None:
     tool_name = event.data.get("tool_name", "")
     tool_input = event.data.get("tool_input", {}) or {}
-    tool_output = event.data.get("tool_output", {}) or {}
+    # Claude Code sends "tool_result", but we also check "tool_output" for compatibility
+    tool_output = event.data.get("tool_result") or event.data.get("tool_output") or {}
     # Check for MCP proxy call
     if tool_name not in ("call_tool", "mcp__gobby__call_tool"):

gobby/workflows/enforcement/__init__.py ADDED Viewed

@@ -0,0 +1,47 @@
+"""Task enforcement actions for workflow engine.
+This package provides actions that enforce task tracking before allowing
+certain tools, and enforce task completion before allowing agent to stop.
+"""
+from gobby.workflows.enforcement.blocking import block_tools
+from gobby.workflows.enforcement.commit_policy import (
+    capture_baseline_dirty_files,
+    require_commit_before_stop,
+    require_task_review_or_close_before_stop,
+)
+from gobby.workflows.enforcement.handlers import (
+    handle_block_tools,
+    handle_capture_baseline_dirty_files,
+    handle_require_active_task,
+    handle_require_commit_before_stop,
+    handle_require_task_complete,
+    handle_require_task_review_or_close_before_stop,
+    handle_validate_session_task_scope,
+)
+from gobby.workflows.enforcement.task_policy import (
+    require_active_task,
+    require_task_complete,
+    validate_session_task_scope,
+)
+__all__ = [
+    # Blocking
+    "block_tools",
+    # Commit policy
+    "capture_baseline_dirty_files",
+    "require_commit_before_stop",
+    "require_task_review_or_close_before_stop",
+    # Task policy
+    "require_active_task",
+    "require_task_complete",
+    "validate_session_task_scope",
+    # Handlers
+    "handle_block_tools",
+    "handle_capture_baseline_dirty_files",
+    "handle_require_active_task",
+    "handle_require_commit_before_stop",
+    "handle_require_task_complete",
+    "handle_require_task_review_or_close_before_stop",
+    "handle_validate_session_task_scope",
+]

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl