gobby 0.2.9__py3-none-any.whl → 0.2.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (134)
  1. gobby/__init__.py +1 -1
  2. gobby/adapters/__init__.py +6 -0
  3. gobby/adapters/base.py +11 -2
  4. gobby/adapters/claude_code.py +2 -2
  5. gobby/adapters/codex_impl/adapter.py +38 -43
  6. gobby/adapters/copilot.py +324 -0
  7. gobby/adapters/cursor.py +373 -0
  8. gobby/adapters/gemini.py +2 -26
  9. gobby/adapters/windsurf.py +359 -0
  10. gobby/agents/definitions.py +162 -2
  11. gobby/agents/isolation.py +33 -1
  12. gobby/agents/pty_reader.py +192 -0
  13. gobby/agents/registry.py +10 -1
  14. gobby/agents/runner.py +24 -8
  15. gobby/agents/sandbox.py +8 -3
  16. gobby/agents/session.py +4 -0
  17. gobby/agents/spawn.py +9 -2
  18. gobby/agents/spawn_executor.py +49 -61
  19. gobby/agents/spawners/command_builder.py +4 -4
  20. gobby/app_context.py +5 -0
  21. gobby/cli/__init__.py +4 -0
  22. gobby/cli/install.py +259 -4
  23. gobby/cli/installers/__init__.py +12 -0
  24. gobby/cli/installers/copilot.py +242 -0
  25. gobby/cli/installers/cursor.py +244 -0
  26. gobby/cli/installers/shared.py +3 -0
  27. gobby/cli/installers/windsurf.py +242 -0
  28. gobby/cli/pipelines.py +639 -0
  29. gobby/cli/sessions.py +3 -1
  30. gobby/cli/skills.py +209 -0
  31. gobby/cli/tasks/crud.py +6 -5
  32. gobby/cli/tasks/search.py +1 -1
  33. gobby/cli/ui.py +116 -0
  34. gobby/cli/workflows.py +38 -17
  35. gobby/config/app.py +5 -0
  36. gobby/config/skills.py +23 -2
  37. gobby/hooks/broadcaster.py +9 -0
  38. gobby/hooks/event_handlers/_base.py +6 -1
  39. gobby/hooks/event_handlers/_session.py +44 -130
  40. gobby/hooks/events.py +48 -0
  41. gobby/hooks/hook_manager.py +25 -3
  42. gobby/install/copilot/hooks/hook_dispatcher.py +203 -0
  43. gobby/install/cursor/hooks/hook_dispatcher.py +203 -0
  44. gobby/install/gemini/hooks/hook_dispatcher.py +8 -0
  45. gobby/install/windsurf/hooks/hook_dispatcher.py +205 -0
  46. gobby/llm/__init__.py +14 -1
  47. gobby/llm/claude.py +217 -1
  48. gobby/llm/service.py +149 -0
  49. gobby/mcp_proxy/instructions.py +9 -27
  50. gobby/mcp_proxy/models.py +1 -0
  51. gobby/mcp_proxy/registries.py +56 -9
  52. gobby/mcp_proxy/server.py +6 -2
  53. gobby/mcp_proxy/services/tool_filter.py +7 -0
  54. gobby/mcp_proxy/services/tool_proxy.py +19 -1
  55. gobby/mcp_proxy/stdio.py +37 -21
  56. gobby/mcp_proxy/tools/agents.py +7 -0
  57. gobby/mcp_proxy/tools/hub.py +30 -1
  58. gobby/mcp_proxy/tools/orchestration/cleanup.py +5 -5
  59. gobby/mcp_proxy/tools/orchestration/monitor.py +1 -1
  60. gobby/mcp_proxy/tools/orchestration/orchestrate.py +8 -3
  61. gobby/mcp_proxy/tools/orchestration/review.py +17 -4
  62. gobby/mcp_proxy/tools/orchestration/wait.py +7 -7
  63. gobby/mcp_proxy/tools/pipelines/__init__.py +254 -0
  64. gobby/mcp_proxy/tools/pipelines/_discovery.py +67 -0
  65. gobby/mcp_proxy/tools/pipelines/_execution.py +281 -0
  66. gobby/mcp_proxy/tools/sessions/_crud.py +4 -4
  67. gobby/mcp_proxy/tools/sessions/_handoff.py +1 -1
  68. gobby/mcp_proxy/tools/skills/__init__.py +184 -30
  69. gobby/mcp_proxy/tools/spawn_agent.py +229 -14
  70. gobby/mcp_proxy/tools/tasks/_context.py +8 -0
  71. gobby/mcp_proxy/tools/tasks/_crud.py +27 -1
  72. gobby/mcp_proxy/tools/tasks/_helpers.py +1 -1
  73. gobby/mcp_proxy/tools/tasks/_lifecycle.py +125 -8
  74. gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +2 -1
  75. gobby/mcp_proxy/tools/tasks/_search.py +1 -1
  76. gobby/mcp_proxy/tools/workflows/__init__.py +9 -2
  77. gobby/mcp_proxy/tools/workflows/_lifecycle.py +12 -1
  78. gobby/mcp_proxy/tools/workflows/_query.py +45 -26
  79. gobby/mcp_proxy/tools/workflows/_terminal.py +39 -3
  80. gobby/mcp_proxy/tools/worktrees.py +54 -15
  81. gobby/memory/context.py +5 -5
  82. gobby/runner.py +108 -6
  83. gobby/servers/http.py +7 -1
  84. gobby/servers/routes/__init__.py +2 -0
  85. gobby/servers/routes/admin.py +44 -0
  86. gobby/servers/routes/mcp/endpoints/execution.py +18 -25
  87. gobby/servers/routes/mcp/hooks.py +10 -1
  88. gobby/servers/routes/pipelines.py +227 -0
  89. gobby/servers/websocket.py +314 -1
  90. gobby/sessions/analyzer.py +87 -1
  91. gobby/sessions/manager.py +5 -5
  92. gobby/sessions/transcripts/__init__.py +3 -0
  93. gobby/sessions/transcripts/claude.py +5 -0
  94. gobby/sessions/transcripts/codex.py +5 -0
  95. gobby/sessions/transcripts/gemini.py +5 -0
  96. gobby/skills/hubs/__init__.py +25 -0
  97. gobby/skills/hubs/base.py +234 -0
  98. gobby/skills/hubs/claude_plugins.py +328 -0
  99. gobby/skills/hubs/clawdhub.py +289 -0
  100. gobby/skills/hubs/github_collection.py +465 -0
  101. gobby/skills/hubs/manager.py +263 -0
  102. gobby/skills/hubs/skillhub.py +342 -0
  103. gobby/storage/memories.py +4 -4
  104. gobby/storage/migrations.py +95 -3
  105. gobby/storage/pipelines.py +367 -0
  106. gobby/storage/sessions.py +23 -4
  107. gobby/storage/skills.py +1 -1
  108. gobby/storage/tasks/_aggregates.py +2 -2
  109. gobby/storage/tasks/_lifecycle.py +4 -4
  110. gobby/storage/tasks/_models.py +7 -1
  111. gobby/storage/tasks/_queries.py +3 -3
  112. gobby/sync/memories.py +4 -3
  113. gobby/tasks/commits.py +48 -17
  114. gobby/workflows/actions.py +75 -0
  115. gobby/workflows/context_actions.py +246 -5
  116. gobby/workflows/definitions.py +119 -1
  117. gobby/workflows/detection_helpers.py +23 -11
  118. gobby/workflows/enforcement/task_policy.py +18 -0
  119. gobby/workflows/engine.py +20 -1
  120. gobby/workflows/evaluator.py +8 -5
  121. gobby/workflows/lifecycle_evaluator.py +57 -26
  122. gobby/workflows/loader.py +567 -30
  123. gobby/workflows/lobster_compat.py +147 -0
  124. gobby/workflows/pipeline_executor.py +801 -0
  125. gobby/workflows/pipeline_state.py +172 -0
  126. gobby/workflows/pipeline_webhooks.py +206 -0
  127. gobby/workflows/premature_stop.py +5 -0
  128. gobby/worktrees/git.py +135 -20
  129. {gobby-0.2.9.dist-info → gobby-0.2.11.dist-info}/METADATA +56 -22
  130. {gobby-0.2.9.dist-info → gobby-0.2.11.dist-info}/RECORD +134 -106
  131. {gobby-0.2.9.dist-info → gobby-0.2.11.dist-info}/WHEEL +0 -0
  132. {gobby-0.2.9.dist-info → gobby-0.2.11.dist-info}/entry_points.txt +0 -0
  133. {gobby-0.2.9.dist-info → gobby-0.2.11.dist-info}/licenses/LICENSE.md +0 -0
  134. {gobby-0.2.9.dist-info → gobby-0.2.11.dist-info}/top_level.txt +0 -0
gobby/workflows/detection_helpers.py CHANGED
@@ -103,30 +103,42 @@ def detect_task_claim(
     if isinstance(result, dict) and result.get("error"):
         return
 
-    # Extract task_id based on tool type
+    # Extract task_id based on tool type - MUST resolve to UUID
+    # Refs like '#123' will fail comparison with task.id (UUID) in close_task logic
     arguments = tool_input.get("arguments", {}) or {}
+    task_id: str | None = None
+
     if inner_tool_name in ("update_task", "claim_task"):
-        task_id = arguments.get("task_id")
-        # Resolve to UUID for consistent comparison with close_task
-        if task_id and task_manager:
+        raw_task_id = arguments.get("task_id")
+        # MUST resolve to UUID - refs like '#123' break comparisons in close_task
+        if raw_task_id and task_manager:
             try:
-                task = task_manager.get_task(task_id)
+                task = task_manager.get_task(raw_task_id)
                 if task:
                     task_id = task.id  # Use UUID
-            except Exception:  # nosec B110 - best effort resolution, keep original if fails
-                pass
+                else:
+                    logger.warning(
+                        f"Cannot resolve task ref '{raw_task_id}' to UUID - task not found"
+                    )
+            except Exception as e:
+                logger.warning(f"Cannot resolve task ref '{raw_task_id}' to UUID: {e}")
+        elif raw_task_id and not task_manager:
+            logger.warning(f"Cannot resolve task ref '{raw_task_id}' to UUID - no task_manager")
     elif inner_tool_name == "create_task":
-        # For create_task, the id is in the result
+        # For create_task, the id is in the result (already a UUID)
         result = tool_output.get("result", {}) if isinstance(tool_output, dict) else {}
         task_id = result.get("id") if isinstance(result, dict) else None
         # Skip if we can't get the task ID (e.g., Claude Code doesn't include tool results)
         # The MCP tool itself handles state updates in this case via _crud.py
         if not task_id:
             return
-    else:
-        task_id = None
 
-    # All conditions met - set task_claimed and claimed_task_id
+    # Only set claimed_task_id if we have a valid UUID
+    if not task_id:
+        logger.debug(f"Skipping task claim state update - no valid UUID for {inner_tool_name}")
+        return
+
+    # All conditions met - set task_claimed and claimed_task_id (UUID)
     state.variables["task_claimed"] = True
     state.variables["claimed_task_id"] = task_id
     logger.info(
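The guard above exists because task refs and task IDs live in different namespaces. A minimal, self-contained sketch of the mismatch — the `Task` shape and the dict-based lookup are illustrative stand-ins for gobby's task manager, not its real API:

```python
import uuid
from dataclasses import dataclass, field


@dataclass
class Task:
    ref: str  # human-facing ref like '#123'
    id: str = field(default_factory=lambda: str(uuid.uuid4()))  # canonical UUID


task = Task(ref="#123")

# Storing the raw ref breaks the equality check close_task relies on:
claimed_task_id = task.ref
assert claimed_task_id != task.id  # '#123' can never equal a UUID string

# Resolving through a lookup (stand-in for task_manager.get_task) fixes it:
tasks_by_ref = {task.ref: task}
resolved = tasks_by_ref.get(claimed_task_id)
if resolved is not None:
    claimed_task_id = resolved.id  # store the UUID, as the new code does
assert claimed_task_id == task.id
```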
gobby/workflows/enforcement/task_policy.py CHANGED
@@ -6,6 +6,7 @@ Provides actions that enforce task tracking and scoping requirements.
 from __future__ import annotations
 
 import logging
+import uuid
 from typing import TYPE_CHECKING, Any
 
 from gobby.mcp_proxy.tools.task_readiness import is_descendant_of
@@ -21,6 +22,15 @@ if TYPE_CHECKING:
 logger = logging.getLogger(__name__)
 
 
+def _is_uuid(value: str) -> bool:
+    """Check if a string is a valid UUID (not a ref like #123)."""
+    try:
+        uuid.UUID(value)
+        return True
+    except (ValueError, TypeError):
+        return False
+
+
 async def require_task_complete(
     task_manager: LocalTaskManager | None,
     session_id: str,
@@ -84,6 +94,14 @@ async def require_task_complete(
     if workflow_state:
         has_claimed_task = workflow_state.variables.get("task_claimed", False)
         claimed_task_id = workflow_state.variables.get("claimed_task_id")
+        # Resolve claimed_task_id to UUID if it's a ref (backward compat)
+        if claimed_task_id and not _is_uuid(claimed_task_id):
+            try:
+                claimed_task = task_manager.get_task(claimed_task_id)
+                if claimed_task:
+                    claimed_task_id = claimed_task.id
+            except Exception:  # nosec B110 - keep original ID if resolution fails
+                claimed_task_id = claimed_task_id  # explicit no-op
 
     try:
         # Collect incomplete tasks across all specified task IDs
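The `_is_uuid` helper leans on `uuid.UUID`'s parser for validation. A standalone copy with example inputs (the sample values are illustrative):

```python
import uuid


def _is_uuid(value: str) -> bool:
    """Check if a string is a valid UUID (not a ref like #123)."""
    try:
        uuid.UUID(value)
        return True
    except (ValueError, TypeError):
        return False


print(_is_uuid("3f2a8c1e-5b7d-4e9a-8c6f-1d2e3f4a5b6c"))  # True - parses as a UUID
print(_is_uuid("#123"))                                   # False - ValueError is caught
print(_is_uuid(None))                                     # False - TypeError is caught
```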
gobby/workflows/engine.py CHANGED
@@ -116,7 +116,11 @@ class WorkflowEngine:
         if state.step != "reflect":
             project_path = Path(event.cwd) if event.cwd else None
             workflow = self.loader.load_workflow(state.workflow_name, project_path)
-            if workflow and workflow.get_step("reflect"):
+            if (
+                workflow
+                and isinstance(workflow, WorkflowDefinition)
+                and workflow.get_step("reflect")
+            ):
                 await self.transition_to(state, "reflect", workflow)
                 return HookResponse(
                     decision="modify",
@@ -145,6 +149,11 @@
             )
             return HookResponse(decision="allow")
 
+        # Step handling only applies to WorkflowDefinition, not PipelineDefinition
+        if not isinstance(workflow, WorkflowDefinition):
+            logger.debug(f"Workflow '{workflow.name}' is a pipeline, skipping step handling")
+            return HookResponse(decision="allow")
+
         # 4. Process event
         # Logic matches WORKFLOWS.md "Evaluation Flow"
 
@@ -344,6 +353,8 @@
             memory_sync_manager=self.action_executor.memory_sync_manager,
             task_sync_manager=self.action_executor.task_sync_manager,
             session_task_manager=self.action_executor.session_task_manager,
+            pipeline_executor=self.action_executor.pipeline_executor,
+            workflow_loader=self.action_executor.workflow_loader,
         )
 
         for action_def in actions:
@@ -530,6 +541,14 @@
                 "error": f"Workflow '{workflow_name}' is lifecycle type (auto-runs on events)",
             }
 
+        # Only WorkflowDefinition can be activated as step workflows
+        if not isinstance(definition, WorkflowDefinition):
+            logger.debug(f"Workflow '{workflow_name}' is a pipeline, not a step workflow")
+            return {
+                "success": False,
+                "error": f"'{workflow_name}' is a pipeline. Use pipeline execution instead.",
+            }
+
         # Check for existing step workflow
         existing = self.state_manager.get_state(session_id)
         if existing and existing.workflow_name != "__lifecycle__":
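All four engine hunks apply the same pattern: `isinstance` checks route `WorkflowDefinition` and the new `PipelineDefinition` onto separate paths. A reduced sketch of the activation guard — class bodies and the return shape are trimmed to the essentials, and the real definitions carry far more state:

```python
from dataclasses import dataclass


@dataclass
class WorkflowDefinition:
    name: str


@dataclass
class PipelineDefinition:
    name: str


def activate(definition: WorkflowDefinition | PipelineDefinition) -> dict:
    # Mirrors the guard added to WorkflowEngine: pipelines cannot be
    # activated as step workflows and are redirected to pipeline execution.
    if not isinstance(definition, WorkflowDefinition):
        return {
            "success": False,
            "error": f"'{definition.name}' is a pipeline. Use pipeline execution instead.",
        }
    return {"success": True}


print(activate(WorkflowDefinition("tdd")))      # {'success': True}
print(activate(PipelineDefinition("release")))  # {'success': False, 'error': ...}
```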
gobby/workflows/evaluator.py CHANGED
@@ -23,7 +23,7 @@ def is_task_complete(task: Any) -> bool:
 
     A task is complete if:
     - status is 'closed', OR
-    - status is 'review' AND requires_user_review is False
+    - status is 'needs_review' AND requires_user_review is False
       (agent marked for visibility but doesn't need user sign-off)
 
     Tasks in 'review' with requires_user_review=True are NOT complete
@@ -38,7 +38,7 @@ def is_task_complete(task: Any) -> bool:
     if task.status == "closed":
         return True
     requires_user_review = getattr(task, "requires_user_review", False)
-    if task.status == "review" and not requires_user_review:
+    if task.status == "needs_review" and not requires_user_review:
         return True
     return False
 
@@ -55,7 +55,7 @@ def task_needs_user_review(task_manager: Any, task_id: str | None) -> bool:
         task_id: Task ID to check
 
     Returns:
-        True if task is in 'review' status AND has requires_user_review=True.
+        True if task is in 'needs_review' status AND has requires_user_review=True.
         Returns False if task_id is None or task not found.
     """
     if not task_id or not task_manager:
@@ -65,7 +65,7 @@ def task_needs_user_review(task_manager: Any, task_id: str | None) -> bool:
     if not task:
         return False
 
-    return bool(task.status == "review" and getattr(task, "requires_user_review", False))
+    return bool(task.status == "needs_review" and getattr(task, "requires_user_review", False))
 
 
 def task_tree_complete(task_manager: Any, task_id: str | list[str] | None) -> bool:
@@ -74,7 +74,7 @@ def task_tree_complete(task_manager: Any, task_id: str | list[str] | None) -> bool:
 
     A task is complete if:
     - status is 'closed', OR
-    - status is 'review' AND requires_user_review is False
+    - status is 'needs_review' AND requires_user_review is False
 
     Used in workflow transition conditions like:
     when: "task_tree_complete(variables.session_task)"
@@ -283,6 +283,9 @@ class ConditionEvaluator:
             "None": None,
             "True": True,
             "False": False,
+            # YAML/JSON use lowercase booleans
+            "true": True,
+            "false": False,
         }
 
         # Add plugin conditions as callable functions
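The lowercase aliases matter because workflow conditions are expressions evaluated against this namespace, while workflow authors write YAML-style booleans. A sketch of the failure mode, assuming eval-style evaluation — the namespace here is a toy subset of what `ConditionEvaluator` actually builds:

```python
# Namespace a condition expression is evaluated against.
namespace = {
    "None": None,
    "True": True,
    "False": False,
    # YAML/JSON use lowercase booleans
    "true": True,
    "false": False,
    "task_claimed": True,  # example workflow variable
}

# Without the lowercase aliases this raises NameError: name 'true' is not defined.
print(eval("task_claimed == true", {"__builtins__": {}}, namespace))  # True
```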
gobby/workflows/lifecycle_evaluator.py CHANGED
@@ -10,10 +10,10 @@ from datetime import UTC, datetime
 from typing import TYPE_CHECKING, Any, Literal
 
 from gobby.hooks.events import HookEvent, HookEventType, HookResponse
+from gobby.workflows.definitions import WorkflowDefinition, WorkflowState
 
 if TYPE_CHECKING:
     from .actions import ActionExecutor
-    from .definitions import WorkflowDefinition, WorkflowState
     from .evaluator import ConditionEvaluator
     from .loader import WorkflowLoader
     from .state_manager import WorkflowStateManager
@@ -123,28 +123,30 @@ async def evaluate_workflow_triggers(
     session_id = event.metadata.get("_platform_session_id") or "global"
 
     # Try to load existing state, or create new one
-    state = state_manager.get_state(session_id)
-    if state is None:
-        state = WorkflowState(
-            session_id=session_id,
-            workflow_name=workflow.name,
-            step="global",
-            step_entered_at=datetime.now(UTC),
-            step_action_count=0,
-            total_action_count=0,
-            artifacts=event.data.get("artifacts", {}) if event.data else {},
-            observations=[],
-            reflection_pending=False,
-            context_injected=False,
-            variables={},
-            task_list=None,
-            current_task_index=0,
-            files_modified_this_task=0,
-        )
-
-    # Merge context_data into state variables (context_data has session vars from earlier load)
+    # Track whether we created a new state to determine save behavior later
+    existing_state = state_manager.get_state(session_id)
+    state_was_created = existing_state is None
+    state: WorkflowState = existing_state or WorkflowState(
+        session_id=session_id,
+        workflow_name=workflow.name,
+        step="global",
+        step_entered_at=datetime.now(UTC),
+        step_action_count=0,
+        total_action_count=0,
+        artifacts=event.data.get("artifacts", {}) if event.data else {},
+        observations=[],
+        reflection_pending=False,
+        context_injected=False,
+        variables={},
+        task_list=None,
+        current_task_index=0,
+        files_modified_this_task=0,
+    )
+
+    # Merge context_data (workflow defaults) into state variables
+    # Persisted state values take precedence over workflow defaults
     if context_data:
-        state.variables.update(context_data)
+        state.variables = {**context_data, **state.variables}
 
     action_ctx = ActionContext(
         session_id=session_id,
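The switch from `state.variables.update(context_data)` to dict unpacking reverses the precedence: persisted state now wins over workflow YAML defaults. A minimal demonstration with illustrative keys:

```python
context_data = {"max_retries": 3, "mode": "default"}  # workflow YAML defaults
state_variables = {"mode": "strict"}                  # persisted session state

# Old behavior: update() let the defaults clobber persisted state.
old = dict(state_variables)
old.update(context_data)
print(old["mode"])  # 'default' - persisted value lost

# New behavior: later unpacks win, so persisted state takes precedence.
new = {**context_data, **state_variables}
print(new["mode"])  # 'strict' - persisted value kept
```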
@@ -236,11 +238,28 @@ async def evaluate_workflow_triggers(
                 exc_info=True,
             )
 
-    # Persist state changes (e.g., _injected_memory_ids from memory_recall_relevant)
+    # Persist state changes (e.g., _injected_memory_ids from memory_recall_relevant,
+    # unlocked_tools from track_schema_lookup)
     # Only save if we have a real session ID (not "global" fallback)
     # The workflow_states table has a FK to sessions, so we can't save for non-existent sessions
     if session_id != "global":
-        state_manager.save_state(state)
+        if state_was_created:
+            # We created a new lifecycle state - check for existing step workflow
+            # to avoid overwriting it with our new lifecycle state.
+            # Step workflows (activated via activate_workflow) have their own workflow_name.
+            current_state = state_manager.get_state(session_id)
+            is_step_workflow = (
+                current_state is not None
+                and current_state.workflow_name != "__lifecycle__"
+                and current_state.workflow_name != workflow.name
+            )
+            if not is_step_workflow:
+                state_manager.save_state(state)
+        else:
+            # We fetched an existing state (possibly a step workflow) and updated
+            # its variables. Safe to save since we're just persisting variable
+            # changes (like unlocked_tools), not changing workflow_name or step.
+            state_manager.save_state(state)
 
     final_context = "\n\n".join(injected_context) if injected_context else None
     logger.debug(
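The save guard distinguishes freshly created lifecycle states from updates to existing ones, so a new lifecycle state never clobbers a step workflow saved for the same session in the meantime. A dict-backed sketch of that logic — names and shapes are illustrative, not gobby's state manager API:

```python
states: dict[str, dict] = {"sess-1": {"workflow_name": "tdd", "step": "red"}}


def save_lifecycle_state(session_id: str, state: dict, state_was_created: bool) -> None:
    if state_was_created:
        current = states.get(session_id)
        is_step_workflow = (
            current is not None
            and current["workflow_name"] != "__lifecycle__"
            and current["workflow_name"] != state["workflow_name"]
        )
        if is_step_workflow:
            return  # a step workflow owns this slot; don't overwrite it
    states[session_id] = state


# A newly created lifecycle state is dropped in favor of the step workflow:
save_lifecycle_state("sess-1", {"workflow_name": "session-naming", "step": "global"}, True)
print(states["sess-1"]["workflow_name"])  # 'tdd' - step workflow preserved
```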
@@ -290,6 +309,11 @@
         logger.warning(f"Workflow '{workflow_name}' not found in project_path={project_path}")
         return HookResponse(decision="allow")
 
+    # Lifecycle triggers only apply to WorkflowDefinition, not PipelineDefinition
+    if not isinstance(workflow, WorkflowDefinition):
+        logger.debug(f"Workflow '{workflow_name}' is not a WorkflowDefinition, skipping triggers")
+        return HookResponse(decision="allow")
+
     logger.debug(
         f"Workflow '{workflow_name}' loaded, triggers={list(workflow.triggers.keys()) if workflow.triggers else []}"
     )
@@ -533,6 +557,10 @@
     for discovered in workflows:
         workflow = discovered.definition
 
+        # Skip PipelineDefinition - lifecycle triggers only for WorkflowDefinition
+        if not isinstance(workflow, WorkflowDefinition):
+            continue
+
         # Skip if this workflow+trigger has already been processed
         key = (workflow.name, trigger_name)
         if key in processed_triggers:
@@ -540,10 +568,11 @@
 
         # Merge workflow definition's default variables (lower priority than session state)
         # Precedence: session state > workflow YAML defaults
-        workflow_context = {**workflow.variables, **context_data}
+        # Update context_data directly so workflow variables propagate to response metadata
+        context_data = {**workflow.variables, **context_data}
 
         response = await evaluate_workflow_triggers(
-            workflow, event, workflow_context, state_manager, action_executor, evaluator
+            workflow, event, context_data, state_manager, action_executor, evaluator
         )
 
         # Accumulate context
@@ -594,6 +623,7 @@
             )
             detect_task_claim_fn(event, state)
             detect_plan_mode_fn(event, state)
+            # Safe to save - we're updating variables on existing state, not changing workflow_name
             state_manager.save_state(state)
 
     # Detect plan mode from system reminders for BEFORE_AGENT events
@@ -609,6 +639,7 @@
                 step="",
             )
             detect_plan_mode_from_context_fn(event, state)
+            # Safe to save - we're updating variables on existing state, not changing workflow_name
            state_manager.save_state(state)
 
     # Check for premature stop in active step workflows on STOP events