PyPI - gobby - Versions diffs - 0.2.5__py3-none-any.whl - Mend

gobby 0.2.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (383) hide show

gobby/__init__.py +3 -0
gobby/adapters/__init__.py +30 -0
gobby/adapters/base.py +93 -0
gobby/adapters/claude_code.py +276 -0
gobby/adapters/codex.py +1292 -0
gobby/adapters/gemini.py +343 -0
gobby/agents/__init__.py +37 -0
gobby/agents/codex_session.py +120 -0
gobby/agents/constants.py +112 -0
gobby/agents/context.py +362 -0
gobby/agents/definitions.py +133 -0
gobby/agents/gemini_session.py +111 -0
gobby/agents/registry.py +618 -0
gobby/agents/runner.py +968 -0
gobby/agents/session.py +259 -0
gobby/agents/spawn.py +916 -0
gobby/agents/spawners/__init__.py +77 -0
gobby/agents/spawners/base.py +142 -0
gobby/agents/spawners/cross_platform.py +266 -0
gobby/agents/spawners/embedded.py +225 -0
gobby/agents/spawners/headless.py +226 -0
gobby/agents/spawners/linux.py +125 -0
gobby/agents/spawners/macos.py +277 -0
gobby/agents/spawners/windows.py +308 -0
gobby/agents/tty_config.py +319 -0
gobby/autonomous/__init__.py +32 -0
gobby/autonomous/progress_tracker.py +447 -0
gobby/autonomous/stop_registry.py +269 -0
gobby/autonomous/stuck_detector.py +383 -0
gobby/cli/__init__.py +67 -0
gobby/cli/__main__.py +8 -0
gobby/cli/agents.py +529 -0
gobby/cli/artifacts.py +266 -0
gobby/cli/daemon.py +329 -0
gobby/cli/extensions.py +526 -0
gobby/cli/github.py +263 -0
gobby/cli/init.py +53 -0
gobby/cli/install.py +614 -0
gobby/cli/installers/__init__.py +37 -0
gobby/cli/installers/antigravity.py +65 -0
gobby/cli/installers/claude.py +363 -0
gobby/cli/installers/codex.py +192 -0
gobby/cli/installers/gemini.py +294 -0
gobby/cli/installers/git_hooks.py +377 -0
gobby/cli/installers/shared.py +737 -0
gobby/cli/linear.py +250 -0
gobby/cli/mcp.py +30 -0
gobby/cli/mcp_proxy.py +698 -0
gobby/cli/memory.py +304 -0
gobby/cli/merge.py +384 -0
gobby/cli/projects.py +79 -0
gobby/cli/sessions.py +622 -0
gobby/cli/tasks/__init__.py +30 -0
gobby/cli/tasks/_utils.py +658 -0
gobby/cli/tasks/ai.py +1025 -0
gobby/cli/tasks/commits.py +169 -0
gobby/cli/tasks/crud.py +685 -0
gobby/cli/tasks/deps.py +135 -0
gobby/cli/tasks/labels.py +63 -0
gobby/cli/tasks/main.py +273 -0
gobby/cli/tasks/search.py +178 -0
gobby/cli/tui.py +34 -0
gobby/cli/utils.py +513 -0
gobby/cli/workflows.py +927 -0
gobby/cli/worktrees.py +481 -0
gobby/config/__init__.py +129 -0
gobby/config/app.py +551 -0
gobby/config/extensions.py +167 -0
gobby/config/features.py +472 -0
gobby/config/llm_providers.py +98 -0
gobby/config/logging.py +66 -0
gobby/config/mcp.py +346 -0
gobby/config/persistence.py +247 -0
gobby/config/servers.py +141 -0
gobby/config/sessions.py +250 -0
gobby/config/tasks.py +784 -0
gobby/hooks/__init__.py +104 -0
gobby/hooks/artifact_capture.py +213 -0
gobby/hooks/broadcaster.py +243 -0
gobby/hooks/event_handlers.py +723 -0
gobby/hooks/events.py +218 -0
gobby/hooks/git.py +169 -0
gobby/hooks/health_monitor.py +171 -0
gobby/hooks/hook_manager.py +856 -0
gobby/hooks/hook_types.py +575 -0
gobby/hooks/plugins.py +813 -0
gobby/hooks/session_coordinator.py +396 -0
gobby/hooks/verification_runner.py +268 -0
gobby/hooks/webhooks.py +339 -0
gobby/install/claude/commands/gobby/bug.md +51 -0
gobby/install/claude/commands/gobby/chore.md +51 -0
gobby/install/claude/commands/gobby/epic.md +52 -0
gobby/install/claude/commands/gobby/eval.md +235 -0
gobby/install/claude/commands/gobby/feat.md +49 -0
gobby/install/claude/commands/gobby/nit.md +52 -0
gobby/install/claude/commands/gobby/ref.md +52 -0
gobby/install/claude/hooks/HOOK_SCHEMAS.md +632 -0
gobby/install/claude/hooks/hook_dispatcher.py +364 -0
gobby/install/claude/hooks/validate_settings.py +102 -0
gobby/install/claude/hooks-template.json +118 -0
gobby/install/codex/hooks/hook_dispatcher.py +153 -0
gobby/install/codex/prompts/forget.md +7 -0
gobby/install/codex/prompts/memories.md +7 -0
gobby/install/codex/prompts/recall.md +7 -0
gobby/install/codex/prompts/remember.md +13 -0
gobby/install/gemini/hooks/hook_dispatcher.py +268 -0
gobby/install/gemini/hooks-template.json +138 -0
gobby/install/shared/plugins/code_guardian.py +456 -0
gobby/install/shared/plugins/example_notify.py +331 -0
gobby/integrations/__init__.py +10 -0
gobby/integrations/github.py +145 -0
gobby/integrations/linear.py +145 -0
gobby/llm/__init__.py +40 -0
gobby/llm/base.py +120 -0
gobby/llm/claude.py +578 -0
gobby/llm/claude_executor.py +503 -0
gobby/llm/codex.py +322 -0
gobby/llm/codex_executor.py +513 -0
gobby/llm/executor.py +316 -0
gobby/llm/factory.py +34 -0
gobby/llm/gemini.py +258 -0
gobby/llm/gemini_executor.py +339 -0
gobby/llm/litellm.py +287 -0
gobby/llm/litellm_executor.py +303 -0
gobby/llm/resolver.py +499 -0
gobby/llm/service.py +236 -0
gobby/mcp_proxy/__init__.py +29 -0
gobby/mcp_proxy/actions.py +175 -0
gobby/mcp_proxy/daemon_control.py +198 -0
gobby/mcp_proxy/importer.py +436 -0
gobby/mcp_proxy/lazy.py +325 -0
gobby/mcp_proxy/manager.py +798 -0
gobby/mcp_proxy/metrics.py +609 -0
gobby/mcp_proxy/models.py +139 -0
gobby/mcp_proxy/registries.py +215 -0
gobby/mcp_proxy/schema_hash.py +381 -0
gobby/mcp_proxy/semantic_search.py +706 -0
gobby/mcp_proxy/server.py +549 -0
gobby/mcp_proxy/services/__init__.py +0 -0
gobby/mcp_proxy/services/fallback.py +306 -0
gobby/mcp_proxy/services/recommendation.py +224 -0
gobby/mcp_proxy/services/server_mgmt.py +214 -0
gobby/mcp_proxy/services/system.py +72 -0
gobby/mcp_proxy/services/tool_filter.py +231 -0
gobby/mcp_proxy/services/tool_proxy.py +309 -0
gobby/mcp_proxy/stdio.py +565 -0
gobby/mcp_proxy/tools/__init__.py +27 -0
gobby/mcp_proxy/tools/agents.py +1103 -0
gobby/mcp_proxy/tools/artifacts.py +207 -0
gobby/mcp_proxy/tools/hub.py +335 -0
gobby/mcp_proxy/tools/internal.py +337 -0
gobby/mcp_proxy/tools/memory.py +543 -0
gobby/mcp_proxy/tools/merge.py +422 -0
gobby/mcp_proxy/tools/metrics.py +283 -0
gobby/mcp_proxy/tools/orchestration/__init__.py +23 -0
gobby/mcp_proxy/tools/orchestration/cleanup.py +619 -0
gobby/mcp_proxy/tools/orchestration/monitor.py +380 -0
gobby/mcp_proxy/tools/orchestration/orchestrate.py +746 -0
gobby/mcp_proxy/tools/orchestration/review.py +736 -0
gobby/mcp_proxy/tools/orchestration/utils.py +16 -0
gobby/mcp_proxy/tools/session_messages.py +1056 -0
gobby/mcp_proxy/tools/task_dependencies.py +219 -0
gobby/mcp_proxy/tools/task_expansion.py +591 -0
gobby/mcp_proxy/tools/task_github.py +393 -0
gobby/mcp_proxy/tools/task_linear.py +379 -0
gobby/mcp_proxy/tools/task_orchestration.py +77 -0
gobby/mcp_proxy/tools/task_readiness.py +522 -0
gobby/mcp_proxy/tools/task_sync.py +351 -0
gobby/mcp_proxy/tools/task_validation.py +843 -0
gobby/mcp_proxy/tools/tasks/__init__.py +25 -0
gobby/mcp_proxy/tools/tasks/_context.py +112 -0
gobby/mcp_proxy/tools/tasks/_crud.py +516 -0
gobby/mcp_proxy/tools/tasks/_factory.py +176 -0
gobby/mcp_proxy/tools/tasks/_helpers.py +129 -0
gobby/mcp_proxy/tools/tasks/_lifecycle.py +517 -0
gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +301 -0
gobby/mcp_proxy/tools/tasks/_resolution.py +55 -0
gobby/mcp_proxy/tools/tasks/_search.py +215 -0
gobby/mcp_proxy/tools/tasks/_session.py +125 -0
gobby/mcp_proxy/tools/workflows.py +973 -0
gobby/mcp_proxy/tools/worktrees.py +1264 -0
gobby/mcp_proxy/transports/__init__.py +0 -0
gobby/mcp_proxy/transports/base.py +95 -0
gobby/mcp_proxy/transports/factory.py +44 -0
gobby/mcp_proxy/transports/http.py +139 -0
gobby/mcp_proxy/transports/stdio.py +213 -0
gobby/mcp_proxy/transports/websocket.py +136 -0
gobby/memory/backends/__init__.py +116 -0
gobby/memory/backends/mem0.py +408 -0
gobby/memory/backends/memu.py +485 -0
gobby/memory/backends/null.py +111 -0
gobby/memory/backends/openmemory.py +537 -0
gobby/memory/backends/sqlite.py +304 -0
gobby/memory/context.py +87 -0
gobby/memory/manager.py +1001 -0
gobby/memory/protocol.py +451 -0
gobby/memory/search/__init__.py +66 -0
gobby/memory/search/text.py +127 -0
gobby/memory/viz.py +258 -0
gobby/prompts/__init__.py +13 -0
gobby/prompts/defaults/expansion/system.md +119 -0
gobby/prompts/defaults/expansion/user.md +48 -0
gobby/prompts/defaults/external_validation/agent.md +72 -0
gobby/prompts/defaults/external_validation/external.md +63 -0
gobby/prompts/defaults/external_validation/spawn.md +83 -0
gobby/prompts/defaults/external_validation/system.md +6 -0
gobby/prompts/defaults/features/import_mcp.md +22 -0
gobby/prompts/defaults/features/import_mcp_github.md +17 -0
gobby/prompts/defaults/features/import_mcp_search.md +16 -0
gobby/prompts/defaults/features/recommend_tools.md +32 -0
gobby/prompts/defaults/features/recommend_tools_hybrid.md +35 -0
gobby/prompts/defaults/features/recommend_tools_llm.md +30 -0
gobby/prompts/defaults/features/server_description.md +20 -0
gobby/prompts/defaults/features/server_description_system.md +6 -0
gobby/prompts/defaults/features/task_description.md +31 -0
gobby/prompts/defaults/features/task_description_system.md +6 -0
gobby/prompts/defaults/features/tool_summary.md +17 -0
gobby/prompts/defaults/features/tool_summary_system.md +6 -0
gobby/prompts/defaults/research/step.md +58 -0
gobby/prompts/defaults/validation/criteria.md +47 -0
gobby/prompts/defaults/validation/validate.md +38 -0
gobby/prompts/loader.py +346 -0
gobby/prompts/models.py +113 -0
gobby/py.typed +0 -0
gobby/runner.py +488 -0
gobby/search/__init__.py +23 -0
gobby/search/protocol.py +104 -0
gobby/search/tfidf.py +232 -0
gobby/servers/__init__.py +7 -0
gobby/servers/http.py +636 -0
gobby/servers/models.py +31 -0
gobby/servers/routes/__init__.py +23 -0
gobby/servers/routes/admin.py +416 -0
gobby/servers/routes/dependencies.py +118 -0
gobby/servers/routes/mcp/__init__.py +24 -0
gobby/servers/routes/mcp/hooks.py +135 -0
gobby/servers/routes/mcp/plugins.py +121 -0
gobby/servers/routes/mcp/tools.py +1337 -0
gobby/servers/routes/mcp/webhooks.py +159 -0
gobby/servers/routes/sessions.py +582 -0
gobby/servers/websocket.py +766 -0
gobby/sessions/__init__.py +13 -0
gobby/sessions/analyzer.py +322 -0
gobby/sessions/lifecycle.py +240 -0
gobby/sessions/manager.py +563 -0
gobby/sessions/processor.py +225 -0
gobby/sessions/summary.py +532 -0
gobby/sessions/transcripts/__init__.py +41 -0
gobby/sessions/transcripts/base.py +125 -0
gobby/sessions/transcripts/claude.py +386 -0
gobby/sessions/transcripts/codex.py +143 -0
gobby/sessions/transcripts/gemini.py +195 -0
gobby/storage/__init__.py +21 -0
gobby/storage/agents.py +409 -0
gobby/storage/artifact_classifier.py +341 -0
gobby/storage/artifacts.py +285 -0
gobby/storage/compaction.py +67 -0
gobby/storage/database.py +357 -0
gobby/storage/inter_session_messages.py +194 -0
gobby/storage/mcp.py +680 -0
gobby/storage/memories.py +562 -0
gobby/storage/merge_resolutions.py +550 -0
gobby/storage/migrations.py +860 -0
gobby/storage/migrations_legacy.py +1359 -0
gobby/storage/projects.py +166 -0
gobby/storage/session_messages.py +251 -0
gobby/storage/session_tasks.py +97 -0
gobby/storage/sessions.py +817 -0
gobby/storage/task_dependencies.py +223 -0
gobby/storage/tasks/__init__.py +42 -0
gobby/storage/tasks/_aggregates.py +180 -0
gobby/storage/tasks/_crud.py +449 -0
gobby/storage/tasks/_id.py +104 -0
gobby/storage/tasks/_lifecycle.py +311 -0
gobby/storage/tasks/_manager.py +889 -0
gobby/storage/tasks/_models.py +300 -0
gobby/storage/tasks/_ordering.py +119 -0
gobby/storage/tasks/_path_cache.py +110 -0
gobby/storage/tasks/_queries.py +343 -0
gobby/storage/tasks/_search.py +143 -0
gobby/storage/workflow_audit.py +393 -0
gobby/storage/worktrees.py +547 -0
gobby/sync/__init__.py +29 -0
gobby/sync/github.py +333 -0
gobby/sync/linear.py +304 -0
gobby/sync/memories.py +284 -0
gobby/sync/tasks.py +641 -0
gobby/tasks/__init__.py +8 -0
gobby/tasks/build_verification.py +193 -0
gobby/tasks/commits.py +633 -0
gobby/tasks/context.py +747 -0
gobby/tasks/criteria.py +342 -0
gobby/tasks/enhanced_validator.py +226 -0
gobby/tasks/escalation.py +263 -0
gobby/tasks/expansion.py +626 -0
gobby/tasks/external_validator.py +764 -0
gobby/tasks/issue_extraction.py +171 -0
gobby/tasks/prompts/expand.py +327 -0
gobby/tasks/research.py +421 -0
gobby/tasks/tdd.py +352 -0
gobby/tasks/tree_builder.py +263 -0
gobby/tasks/validation.py +712 -0
gobby/tasks/validation_history.py +357 -0
gobby/tasks/validation_models.py +89 -0
gobby/tools/__init__.py +0 -0
gobby/tools/summarizer.py +170 -0
gobby/tui/__init__.py +5 -0
gobby/tui/api_client.py +281 -0
gobby/tui/app.py +327 -0
gobby/tui/screens/__init__.py +25 -0
gobby/tui/screens/agents.py +333 -0
gobby/tui/screens/chat.py +450 -0
gobby/tui/screens/dashboard.py +377 -0
gobby/tui/screens/memory.py +305 -0
gobby/tui/screens/metrics.py +231 -0
gobby/tui/screens/orchestrator.py +904 -0
gobby/tui/screens/sessions.py +412 -0
gobby/tui/screens/tasks.py +442 -0
gobby/tui/screens/workflows.py +289 -0
gobby/tui/screens/worktrees.py +174 -0
gobby/tui/widgets/__init__.py +21 -0
gobby/tui/widgets/chat.py +210 -0
gobby/tui/widgets/conductor.py +104 -0
gobby/tui/widgets/menu.py +132 -0
gobby/tui/widgets/message_panel.py +160 -0
gobby/tui/widgets/review_gate.py +224 -0
gobby/tui/widgets/task_tree.py +99 -0
gobby/tui/widgets/token_budget.py +166 -0
gobby/tui/ws_client.py +258 -0
gobby/utils/__init__.py +3 -0
gobby/utils/daemon_client.py +235 -0
gobby/utils/git.py +222 -0
gobby/utils/id.py +38 -0
gobby/utils/json_helpers.py +161 -0
gobby/utils/logging.py +376 -0
gobby/utils/machine_id.py +135 -0
gobby/utils/metrics.py +589 -0
gobby/utils/project_context.py +182 -0
gobby/utils/project_init.py +263 -0
gobby/utils/status.py +256 -0
gobby/utils/validation.py +80 -0
gobby/utils/version.py +23 -0
gobby/workflows/__init__.py +4 -0
gobby/workflows/actions.py +1310 -0
gobby/workflows/approval_flow.py +138 -0
gobby/workflows/artifact_actions.py +103 -0
gobby/workflows/audit_helpers.py +110 -0
gobby/workflows/autonomous_actions.py +286 -0
gobby/workflows/context_actions.py +394 -0
gobby/workflows/definitions.py +130 -0
gobby/workflows/detection_helpers.py +208 -0
gobby/workflows/engine.py +485 -0
gobby/workflows/evaluator.py +669 -0
gobby/workflows/git_utils.py +96 -0
gobby/workflows/hooks.py +169 -0
gobby/workflows/lifecycle_evaluator.py +613 -0
gobby/workflows/llm_actions.py +70 -0
gobby/workflows/loader.py +333 -0
gobby/workflows/mcp_actions.py +60 -0
gobby/workflows/memory_actions.py +272 -0
gobby/workflows/premature_stop.py +164 -0
gobby/workflows/session_actions.py +139 -0
gobby/workflows/state_actions.py +123 -0
gobby/workflows/state_manager.py +104 -0
gobby/workflows/stop_signal_actions.py +163 -0
gobby/workflows/summary_actions.py +344 -0
gobby/workflows/task_actions.py +249 -0
gobby/workflows/task_enforcement_actions.py +901 -0
gobby/workflows/templates.py +52 -0
gobby/workflows/todo_actions.py +84 -0
gobby/workflows/webhook.py +223 -0
gobby/workflows/webhook_executor.py +399 -0
gobby/worktrees/__init__.py +5 -0
gobby/worktrees/git.py +690 -0
gobby/worktrees/merge/__init__.py +20 -0
gobby/worktrees/merge/conflict_parser.py +177 -0
gobby/worktrees/merge/resolver.py +485 -0
gobby-0.2.5.dist-info/METADATA +351 -0
gobby-0.2.5.dist-info/RECORD +383 -0
gobby-0.2.5.dist-info/WHEEL +5 -0
gobby-0.2.5.dist-info/entry_points.txt +2 -0
gobby-0.2.5.dist-info/licenses/LICENSE.md +193 -0
gobby-0.2.5.dist-info/top_level.txt +1 -0

gobby/mcp_proxy/tools/task_validation.py ADDED Viewed

@@ -0,0 +1,843 @@
+"""
+Validation MCP tools for Gobby Task System.
+Extracted from tasks.py using Strangler Fig pattern.
+Exposes functionality for:
+- Task validation (validate_task, generate_validation_criteria)
+- Validation status (get_validation_status, reset_validation_count)
+- Validation history (get_validation_history, get_recurring_issues, clear_validation_history)
+- De-escalation (de_escalate_task)
+- QA loop (validate_and_fix, run_fix_attempt)
+These tools are registered with the InternalToolRegistry and accessed
+via the downstream proxy pattern (call_tool, list_tools, get_tool_schema).
+"""
+import logging
+from typing import TYPE_CHECKING, Any
+from gobby.mcp_proxy.tools.internal import InternalToolRegistry
+from gobby.storage.tasks import LocalTaskManager, TaskNotFoundError
+from gobby.tasks.validation import TaskValidator
+from gobby.tasks.validation_history import ValidationHistoryManager
+if TYPE_CHECKING:
+    from gobby.agents.runner import AgentRunner
+    from gobby.storage.projects import LocalProjectManager
+logger = logging.getLogger(__name__)
+def create_validation_registry(
+    task_manager: LocalTaskManager,
+    task_validator: TaskValidator | None = None,
+    project_manager: "LocalProjectManager | None" = None,
+    get_project_repo_path: Any = None,
+    agent_runner: "AgentRunner | None" = None,
+) -> InternalToolRegistry:
+    """
+    Create a validation tool registry with all validation-related tools.
+    Args:
+        task_manager: LocalTaskManager instance
+        task_validator: TaskValidator instance (optional, enables LLM validation)
+        project_manager: LocalProjectManager instance (optional)
+        get_project_repo_path: Callable to get repo path from project ID (optional)
+        agent_runner: AgentRunner instance (optional, enables fix agent spawning)
+    Returns:
+        InternalToolRegistry with all validation tools registered
+    """
+    # Lazy import to avoid circular dependency
+    from gobby.mcp_proxy.tools.tasks import resolve_task_id_for_mcp
+    registry = InternalToolRegistry(
+        name="gobby-tasks-validation",
+        description="Task validation tools - validate, criteria, history",
+    )
+    # Create helper managers
+    validation_history_manager = ValidationHistoryManager(task_manager.db)
+    @registry.tool(
+        name="validate_task",
+        description="Validate if a task is completed. Auto-gathers context from recent commits and relevant files if changes_summary not provided.",
+    )
+    async def validate_task(
+        task_id: str,
+        changes_summary: str | None = None,
+        context_files: list[str] | None = None,
+    ) -> dict[str, Any]:
+        """
+        Validate task completion.
+        For parent tasks (tasks with children), validation checks if all children are closed.
+        For leaf tasks, uses LLM-based validation against criteria.
+        If changes_summary is not provided for leaf tasks, uses smart context gathering:
+        1. Current uncommitted changes (staged + unstaged)
+        2. Multi-commit window (last 10 commits)
+        3. File-based analysis (reads files mentioned in criteria)
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+            changes_summary: Summary of changes made (optional - auto-gathered if not provided)
+            context_files: List of file paths to read for context (optional)
+        Returns:
+            Dict with "is_valid", "feedback", "status" and "fail_count", or
+            {"error": ...} when the reference cannot be resolved or the task
+            does not exist.
+        Raises:
+            RuntimeError: Leaf task but no task_validator was supplied.
+            ValueError: Leaf task with no changes_summary and no auto-gathered context.
+        Side effects:
+            Records an iteration in the validation history, closes the task on
+            "valid", and on "invalid" either creates a fix subtask or sets the
+            task status to "failed" once MAX_RETRIES is reached; the task's
+            validation fields are then updated.
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            return {"error": f"Task not found: {task_id}"}
+        # Check if task has children (is a parent task)
+        # NOTE(review): limit=1000 presumably caps how many children are inspected;
+        # confirm list_tasks semantics for parents with more children than that.
+        children = task_manager.list_tasks(parent_task_id=task.id, limit=1000)
+        if children:
+            # Parent task: validate based on child completion
+            open_children = [c for c in children if c.status != "closed"]
+            all_closed = len(open_children) == 0
+            from gobby.tasks.validation import ValidationResult
+            if all_closed:
+                result = ValidationResult(
+                    status="valid",
+                    feedback=f"All {len(children)} child tasks are completed.",
+                )
+            else:
+                # List at most five open children by ID/title; `remaining` counts the rest.
+                open_titles = [f"- {c.id}: {c.title}" for c in open_children[:5]]
+                remaining = len(open_children) - 5 if len(open_children) > 5 else 0
+                feedback = f"{len(open_children)} of {len(children)} child tasks still open:\n"
+                feedback += "\n".join(open_titles)
+                if remaining > 0:
+                    feedback += f"\n... and {remaining} more"
+                result = ValidationResult(status="invalid", feedback=feedback)
+        else:
+            # Leaf task: use LLM-based validation
+            if not task_validator:
+                raise RuntimeError("Task validation is not enabled")
+            # Use provided changes_summary or auto-gather via smart context
+            validation_context = changes_summary
+            if not validation_context:
+                from gobby.tasks.validation import get_validation_context_smart
+                # Get project repo_path for git commands
+                # repo_path stays None when no resolver callable was supplied or the
+                # task has no project_id.
+                repo_path = None
+                if get_project_repo_path and task.project_id:
+                    repo_path = get_project_repo_path(task.project_id)
+                smart_context = get_validation_context_smart(
+                    task_title=task.title,
+                    validation_criteria=task.validation_criteria,
+                    task_description=task.description,
+                    cwd=repo_path,
+                )
+                if smart_context:
+                    validation_context = f"Validation context:\n\n{smart_context}"
+            # Still empty: neither the caller nor the smart gatherer produced anything.
+            if not validation_context:
+                raise ValueError(
+                    "No changes found for validation. Either provide changes_summary "
+                    "or ensure there are uncommitted changes or recent commits."
+                )
+            result = await task_validator.validate_task(
+                task_id=task.id,
+                title=task.title,
+                description=task.description,
+                changes_summary=validation_context,
+                validation_criteria=task.validation_criteria,
+                context_files=context_files,
+                category=task.category,
+            )
+        # Record validation iteration to history
+        # Calculate iteration number based on fail count (current fail count + 1 for this attempt)
+        current_fail_count = task.validation_fail_count or 0
+        iteration_number = current_fail_count + 1
+        # Determine validator type and context type
+        # NOTE(review): these labels depend only on whether the task has children, so a
+        # leaf task is recorded as "smart_context" / "Auto-gathered from git/files" even
+        # when the caller supplied changes_summary.
+        validator_type = "parent_completion" if children else "llm"
+        context_type = "child_status" if children else "smart_context"
+        context_summary = (
+            f"{len(children)} children checked" if children else "Auto-gathered from git/files"
+        )
+        validation_history_manager.record_iteration(
+            task_id=task.id,
+            iteration=iteration_number,
+            status=result.status,
+            feedback=result.feedback,
+            issues=None,  # ValidationResult from validation.py doesn't have issues
+            context_type=context_type,
+            context_summary=context_summary,
+            validator_type=validator_type,
+        )
+        # Update validation status
+        # These two fields are written for every outcome; the branches below may add more.
+        updates: dict[str, Any] = {
+            "validation_status": result.status,
+            "validation_feedback": result.feedback,
+        }
+        MAX_RETRIES = 3
+        if result.status == "valid":
+            # Success: Close task
+            # The update_task call at the end of this function still runs after closing.
+            task_manager.close_task(task.id, reason="Completed via validation")
+        elif result.status == "invalid":
+            # Failure: Increment fail count
+            # Recomputed here; `task` has not been reassigned, so this equals the value
+            # used for iteration_number above.
+            current_fail_count = task.validation_fail_count or 0
+            new_fail_count = current_fail_count + 1
+            updates["validation_fail_count"] = new_fail_count
+            feedback_str = result.feedback or "Validation failed (no feedback provided)."
+            if new_fail_count < MAX_RETRIES:
+                # Create subtask to fix issues
+                fix_task = task_manager.create_task(
+                    project_id=task.project_id,
+                    title=f"Fix validation failures for {task.title}",
+                    description=f"Validation failed with feedback:\n{feedback_str}\n\nPlease fix the issues and re-validate.",
+                    parent_task_id=task.id,
+                    priority=1,  # High priority fix
+                    task_type="bug",
+                )
+                updates["validation_feedback"] = (
+                    feedback_str + f"\n\nCreated fix task: {fix_task.id}"
+                )
+            else:
+                # Exceeded retries: Mark as failed
+                updates["status"] = "failed"
+                updates["validation_feedback"] = (
+                    feedback_str + f"\n\nExceeded max retries ({MAX_RETRIES}). Marked as failed."
+                )
+        # Any status other than "valid"/"invalid" only updates the two base fields.
+        task_manager.update_task(task.id, **updates)
+        # fail_count is the incremented value on "invalid", otherwise the count read
+        # from the task at the start of this call.
+        return {
+            "is_valid": result.status == "valid",
+            "feedback": result.feedback,
+            "status": result.status,
+            "fail_count": updates.get("validation_fail_count", task.validation_fail_count),
+        }
+    @registry.tool(
+        name="get_validation_status",
+        description="Get validation details for a task.",
+    )
+    def get_validation_status(task_id: str) -> dict[str, Any]:
+        """
+        Get validation details.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+        Returns:
+            Validation details
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            raise ValueError(f"Task not found: {task_id}")
+        return {
+            "task_id": task.id,
+            "validation_status": task.validation_status,
+            "validation_feedback": task.validation_feedback,
+            "validation_criteria": task.validation_criteria,
+            "validation_fail_count": task.validation_fail_count,
+            "use_external_validator": task.use_external_validator,
+        }
+    @registry.tool(
+        name="reset_validation_count",
+        description="Reset validation failure count for a task.",
+    )
+    def reset_validation_count(task_id: str) -> dict[str, Any]:
+        """
+        Reset validation failure count.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+        Returns:
+            Updated task details
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            raise ValueError(f"Task not found: {task_id}")
+        updated_task = task_manager.update_task(task.id, validation_fail_count=0)
+        return {
+            "task_id": updated_task.id,
+            "validation_fail_count": updated_task.validation_fail_count,
+            "message": "Validation failure count reset to 0",
+        }
+    @registry.tool(
+        name="get_validation_history",
+        description="Get full validation history for a task, including all iterations, feedback, and issues.",
+    )
+    def get_validation_history(task_id: str) -> dict[str, Any]:
+        """
+        Get validation history for a task.
+        Returns all validation iterations with their status, feedback, and issues.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+        Returns:
+            Validation history with all iterations
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            raise ValueError(f"Task {task_id} not found")
+        history = validation_history_manager.get_iteration_history(task.id)
+        # Convert iterations to serializable format
+        history_dicts = []
+        for iteration in history:
+            iter_dict: dict[str, Any] = {
+                "iteration": iteration.iteration,
+                "status": iteration.status,
+                "feedback": iteration.feedback,
+                "issues": [i.to_dict() for i in (iteration.issues or [])],
+                "context_type": iteration.context_type,
+                "context_summary": iteration.context_summary,
+                "validator_type": iteration.validator_type,
+                "created_at": iteration.created_at,
+            }
+            history_dicts.append(iter_dict)
+        return {
+            "task_id": task_id,
+            "history": history_dicts,
+            "total_iterations": len(history_dicts),
+        }
+    @registry.tool(
+        name="get_recurring_issues",
+        description="Analyze validation history for recurring issues that keep appearing across iterations.",
+    )
+    def get_recurring_issues(
+        task_id: str,
+        threshold: int = 2,
+    ) -> dict[str, Any]:
+        """
+        Get recurring issues analysis for a task.
+        Finds issues that appear multiple times across validation iterations.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+            threshold: Minimum occurrences to consider an issue recurring (default: 2)
+        Returns:
+            Recurring issues analysis with grouped issues and counts
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            return {"error": f"Task {task_id} not found"}
+        summary = validation_history_manager.get_recurring_issue_summary(
+            task.id, threshold=threshold
+        )
+        has_recurring = validation_history_manager.has_recurring_issues(
+            task.id, threshold=threshold
+        )
+        return {
+            "task_id": task.id,
+            "recurring_issues": summary["recurring_issues"],
+            "total_iterations": summary["total_iterations"],
+            "has_recurring": has_recurring,
+        }
+    @registry.tool(
+        name="clear_validation_history",
+        description="Clear all validation history for a task. Use after major changes that invalidate previous feedback.",
+    )
+    def clear_validation_history(
+        task_id: str,
+        reason: str | None = None,
+    ) -> dict[str, Any]:
+        """
+        Clear validation history for a fresh start.
+        Removes all validation iterations and resets the fail count.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+            reason: Optional reason for clearing history
+        Returns:
+            Confirmation of cleared history
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            return {"error": f"Task {task_id} not found"}
+        # Get count before clearing for response
+        history = validation_history_manager.get_iteration_history(task.id)
+        iterations_count = len(history)
+        # Clear history
+        validation_history_manager.clear_history(task.id)
+        # Also reset validation fail count
+        task_manager.update_task(task.id, validation_fail_count=0)
+        return {
+            "task_id": task.id,
+            "cleared": True,
+            "iterations_cleared": iterations_count,
+            "reason": reason,
+        }
+    @registry.tool(
+        name="de_escalate_task",
+        description="Return an escalated task to open status after human intervention resolves the issue.",
+    )
+    def de_escalate_task(
+        task_id: str,
+        reason: str,
+        reset_validation: bool = False,
+    ) -> dict[str, Any]:
+        """
+        De-escalate a task back to open status.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+            reason: Reason for de-escalation (required)
+            reset_validation: Also reset validation fail count (default: False)
+        Returns:
+            Updated task details
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            return {"error": f"Task {task_id} not found"}
+        if task.status != "escalated":
+            return {"error": f"Task {task_id} is not escalated (current status: {task.status})"}
+        # Build update kwargs
+        update_kwargs: dict[str, Any] = {
+            "status": "open",
+            "escalated_at": None,
+            "escalation_reason": None,
+        }
+        if reset_validation:
+            update_kwargs["validation_fail_count"] = 0
+        updated_task = task_manager.update_task(task.id, **update_kwargs)
+        return {
+            "task_id": updated_task.id,
+            "status": updated_task.status,
+            "escalated_at": updated_task.escalated_at,
+            "escalation_reason": updated_task.escalation_reason,
+            "de_escalation_reason": reason,
+            "validation_reset": reset_validation,
+        }
+    @registry.tool(
+        name="generate_validation_criteria",
+        description="Generate validation criteria for a task using AI. Updates the task with the generated criteria.",
+    )
+    async def generate_validation_criteria(task_id: str) -> dict[str, Any]:
+        """
+        Generate validation criteria for a task using AI.
+        For parent tasks (tasks with children), sets criteria to "All child tasks completed".
+        For leaf tasks, uses LLM to generate criteria from title/description.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+        Returns:
+            Generated criteria and updated task info
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            raise ValueError(f"Task not found: {task_id}")
+        if task.validation_criteria:
+            return {
+                "task_id": task.id,
+                "validation_criteria": task.validation_criteria,
+                "generated": False,
+                "message": "Task already has validation criteria",
+            }
+        # Check if task has children (is a parent task)
+        children = task_manager.list_tasks(parent_task_id=task.id, limit=1)
+        criteria: str | None
+        if children:
+            # Parent task: criteria is child completion
+            criteria = "All child tasks must be completed (status: closed)."
+        else:
+            # Leaf task: use LLM to generate criteria
+            if not task_validator:
+                raise RuntimeError("Task validation is not enabled")
+            criteria = await task_validator.generate_criteria(
+                title=task.title,
+                description=task.description,
+                labels=task.labels,
+            )
+            if not criteria:
+                return {
+                    "task_id": task.id,
+                    "validation_criteria": None,
+                    "generated": False,
+                    "error": "Failed to generate criteria",
+                }
+        # Update task with generated criteria
+        task_manager.update_task(task.id, validation_criteria=criteria)
+        return {
+            "task_id": task.id,
+            "validation_criteria": criteria,
+            "generated": True,
+            "is_parent_task": len(children) > 0,
+        }
+    @registry.tool(
+        name="run_fix_attempt",
+        description="Spawn a fix agent to address validation issues. Returns when the fix attempt completes.",
+    )
+    async def run_fix_attempt(
+        task_id: str,
+        issues: list[str] | None = None,
+        timeout: float = 120.0,
+        max_turns: int = 10,
+    ) -> dict[str, Any]:
+        """
+        Spawn an agent to fix validation issues for a task.
+        The fix agent is given the original task context plus validation
+        failure details to guide its fixes.
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+            issues: List of specific issues to fix (uses validation_feedback if not provided)
+            timeout: Max time for fix attempt in seconds (default: 120)
+            max_turns: Max agent turns (default: 10)
+        Returns:
+            Dict with success status and fix details
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        if not agent_runner:
+            return {
+                "success": False,
+                "error": "Agent runner not configured - cannot spawn fix agent",
+            }
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            return {"success": False, "error": f"Task not found: {task_id}"}
+        # Get issues from parameter or task validation feedback
+        issues_text = ""
+        if issues:
+            issues_text = "\n".join(f"- {issue}" for issue in issues)
+        elif task.validation_feedback:
+            issues_text = task.validation_feedback
+        else:
+            return {
+                "success": False,
+                "error": "No issues provided and no validation feedback on task",
+            }
+        # Get repo path for context
+        repo_path = None
+        if get_project_repo_path and task.project_id:
+            repo_path = get_project_repo_path(task.project_id)
+        # Build fix prompt
+        fix_prompt = f"""You are fixing validation failures for a task.
+## Original Task
+**Title:** {task.title}
+**Description:** {task.description or "No description provided."}
+## Validation Criteria
+{task.validation_criteria or "No specific criteria - use task description."}
+## Validation Failures
+{issues_text}
+## Instructions
+1. Read the relevant files to understand the current state
+2. Fix the issues listed above
+3. Ensure all validation criteria pass after your fixes
+4. Do NOT create new tasks - fix the issues directly
+Focus on fixing ONLY the listed issues. Do not make unrelated changes.
+"""
+        try:
+            from gobby.agents.runner import AgentConfig
+            config = AgentConfig(
+                prompt=fix_prompt,
+                parent_session_id=None,  # No parent session for fix agent
+                project_id=task.project_id,
+                machine_id=None,  # Will be inferred
+                source="claude",
+                workflow=None,  # No workflow - direct execution
+                task=None,  # Don't claim the task
+                mode="headless",
+                timeout=timeout,
+                max_turns=max_turns,
+                project_path=repo_path,
+            )
+            # Run the fix agent
+            result = await agent_runner.run(config)
+            # Record the fix attempt
+            iteration = (task.validation_fail_count or 0) + 1
+            validation_history_manager.record_iteration(
+                task_id=task.id,
+                iteration=iteration,
+                status="fix_attempted",
+                feedback=f"Fix agent completed with status: {result.status}",
+                issues=None,
+                context_type="fix_agent",
+                context_summary=f"Fix attempt {iteration}",
+                validator_type="fix_agent",
+            )
+            return {
+                "success": True,
+                "task_id": task_id,
+                "fix_status": result.status,
+                "agent_output": result.output,
+                "agent_turns": result.turns_used,
+            }
+        except Exception as e:
+            logger.exception(f"Fix attempt failed for task {task_id}")
+            return {
+                "success": False,
+                "error": f"Fix agent failed: {e!s}",
+            }
+    @registry.tool(
+        name="validate_and_fix",
+        description="Run validation loop with automatic fix attempts. Validates, spawns fix agent if needed, re-validates.",
+    )
+    async def validate_and_fix(
+        task_id: str,
+        max_retries: int = 3,
+        auto_fix: bool = True,
+        fix_timeout: float = 120.0,
+    ) -> dict[str, Any]:
+        """
+        Run validation loop with automatic fix attempts.
+        1. Validate task completion
+        2. If failed and auto_fix=True:
+           - Spawn fix agent to address issues
+           - Re-validate after fix
+           - Repeat up to max_retries
+        3. If still failing after retries:
+           - Create fix subtask with failure details
+           - Mark task status = 'failed'
+        Args:
+            task_id: Task reference: #N, N (seq_num), path (1.2.3), or UUID
+            max_retries: Maximum fix attempts before giving up (default: 3)
+            auto_fix: Whether to attempt automatic fixes (default: True)
+            fix_timeout: Timeout per fix attempt in seconds (default: 120)
+        Returns:
+            Validation result with loop history
+        """
+        # Resolve task reference
+        try:
+            resolved_task_id = resolve_task_id_for_mcp(task_manager, task_id)
+        except (TaskNotFoundError, ValueError) as e:
+            return {"error": f"Invalid task_id: {e}"}
+        task = task_manager.get_task(resolved_task_id)
+        if not task:
+            return {"success": False, "error": f"Task not found: {task_id}"}
+        # Check if task has children (parent tasks use child completion validation)
+        children = task_manager.list_tasks(parent_task_id=task.id, limit=1)
+        if children:
+            # For parent tasks, just run regular validation (no fix loop)
+            result = await validate_task(task.id)
+            return {
+                "success": True,
+                "task_id": task.id,
+                "is_parent_task": True,
+                "validation_result": result,
+            }
+        loop_history: list[dict[str, Any]] = []
+        current_retry = 0
+        while current_retry < max_retries:
+            # Run validation
+            validation_result = await validate_task(task.id)
+            loop_history.append(
+                {
+                    "iteration": current_retry + 1,
+                    "action": "validate",
+                    "result": validation_result,
+                }
+            )
+            if validation_result.get("is_valid"):
+                # Success! Task is closed by validate_task
+                return {
+                    "success": True,
+                    "task_id": task.id,
+                    "is_valid": True,
+                    "iterations": current_retry + 1,
+                    "loop_history": loop_history,
+                    "message": "Task validated successfully",
+                }
+            # Validation failed - attempt fix if enabled and agent runner available
+            if not auto_fix:
+                break
+            if not agent_runner:
+                loop_history.append(
+                    {
+                        "iteration": current_retry + 1,
+                        "action": "fix_skipped",
+                        "reason": "Agent runner not configured",
+                    }
+                )
+                break
+            # Spawn fix agent
+            fix_result = await run_fix_attempt(
+                task_id=task.id,
+                timeout=fix_timeout,
+            )
+            loop_history.append(
+                {
+                    "iteration": current_retry + 1,
+                    "action": "fix_attempt",
+                    "result": fix_result,
+                }
+            )
+            if not fix_result.get("success"):
+                # Fix agent failed to run
+                logger.warning(f"Fix attempt {current_retry + 1} failed: {fix_result.get('error')}")
+            current_retry += 1
+        # All retries exhausted - mark as failed
+        final_feedback = f"QA loop exhausted after {current_retry} fix attempts."
+        if loop_history:
+            last_validation = next(
+                (h for h in reversed(loop_history) if h.get("action") == "validate"),
+                None,
+            )
+            if last_validation and last_validation.get("result", {}).get("feedback"):
+                final_feedback += (
+                    f"\n\nLast validation feedback:\n{last_validation['result']['feedback']}"
+                )
+        # Create fix subtask for manual intervention
+        fix_task = task_manager.create_task(
+            project_id=task.project_id,
+            title=f"[Manual Fix] {task.title}",
+            description=f"Automatic fix attempts failed.\n\n{final_feedback}",
+            parent_task_id=task.id,
+            priority=1,
+            task_type="bug",
+        )
+        # Mark task as failed
+        task_manager.update_task(
+            task.id,
+            status="failed",
+            validation_feedback=final_feedback,
+        )
+        return {
+            "success": False,
+            "task_id": task.id,
+            "is_valid": False,
+            "iterations": current_retry,
+            "loop_history": loop_history,
+            "fix_subtask_id": fix_task.id,
+            "message": f"Validation failed after {current_retry} fix attempts. Created fix subtask: {fix_task.id}",
+        }
+    return registry