PyPI - gobby - Versions diffs - 0.2.8__py3-none-any.whl → 0.2.11__py3-none-any.whl - Mend

gobby 0.2.8-py3-none-any.whl → 0.2.11-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (168)

gobby/__init__.py +1 -1
gobby/adapters/__init__.py +6 -0
gobby/adapters/base.py +11 -2
gobby/adapters/claude_code.py +5 -28
gobby/adapters/codex_impl/adapter.py +38 -43
gobby/adapters/copilot.py +324 -0
gobby/adapters/cursor.py +373 -0
gobby/adapters/gemini.py +2 -26
gobby/adapters/windsurf.py +359 -0
gobby/agents/definitions.py +162 -2
gobby/agents/isolation.py +33 -1
gobby/agents/pty_reader.py +192 -0
gobby/agents/registry.py +10 -1
gobby/agents/runner.py +24 -8
gobby/agents/sandbox.py +8 -3
gobby/agents/session.py +4 -0
gobby/agents/spawn.py +9 -2
gobby/agents/spawn_executor.py +49 -61
gobby/agents/spawners/command_builder.py +4 -4
gobby/app_context.py +64 -0
gobby/cli/__init__.py +4 -0
gobby/cli/install.py +259 -4
gobby/cli/installers/__init__.py +12 -0
gobby/cli/installers/copilot.py +242 -0
gobby/cli/installers/cursor.py +244 -0
gobby/cli/installers/shared.py +3 -0
gobby/cli/installers/windsurf.py +242 -0
gobby/cli/pipelines.py +639 -0
gobby/cli/sessions.py +3 -1
gobby/cli/skills.py +209 -0
gobby/cli/tasks/crud.py +6 -5
gobby/cli/tasks/search.py +1 -1
gobby/cli/ui.py +116 -0
gobby/cli/utils.py +5 -17
gobby/cli/workflows.py +38 -17
gobby/config/app.py +5 -0
gobby/config/features.py +0 -20
gobby/config/skills.py +23 -2
gobby/config/tasks.py +4 -0
gobby/hooks/broadcaster.py +9 -0
gobby/hooks/event_handlers/__init__.py +155 -0
gobby/hooks/event_handlers/_agent.py +175 -0
gobby/hooks/event_handlers/_base.py +92 -0
gobby/hooks/event_handlers/_misc.py +66 -0
gobby/hooks/event_handlers/_session.py +487 -0
gobby/hooks/event_handlers/_tool.py +196 -0
gobby/hooks/events.py +48 -0
gobby/hooks/hook_manager.py +27 -3
gobby/install/copilot/hooks/hook_dispatcher.py +203 -0
gobby/install/cursor/hooks/hook_dispatcher.py +203 -0
gobby/install/gemini/hooks/hook_dispatcher.py +8 -0
gobby/install/windsurf/hooks/hook_dispatcher.py +205 -0
gobby/llm/__init__.py +14 -1
gobby/llm/claude.py +594 -43
gobby/llm/service.py +149 -0
gobby/mcp_proxy/importer.py +4 -41
gobby/mcp_proxy/instructions.py +9 -27
gobby/mcp_proxy/manager.py +13 -3
gobby/mcp_proxy/models.py +1 -0
gobby/mcp_proxy/registries.py +66 -5
gobby/mcp_proxy/server.py +6 -2
gobby/mcp_proxy/services/recommendation.py +2 -28
gobby/mcp_proxy/services/tool_filter.py +7 -0
gobby/mcp_proxy/services/tool_proxy.py +19 -1
gobby/mcp_proxy/stdio.py +37 -21
gobby/mcp_proxy/tools/agents.py +7 -0
gobby/mcp_proxy/tools/artifacts.py +3 -3
gobby/mcp_proxy/tools/hub.py +30 -1
gobby/mcp_proxy/tools/orchestration/cleanup.py +5 -5
gobby/mcp_proxy/tools/orchestration/monitor.py +1 -1
gobby/mcp_proxy/tools/orchestration/orchestrate.py +8 -3
gobby/mcp_proxy/tools/orchestration/review.py +17 -4
gobby/mcp_proxy/tools/orchestration/wait.py +7 -7
gobby/mcp_proxy/tools/pipelines/__init__.py +254 -0
gobby/mcp_proxy/tools/pipelines/_discovery.py +67 -0
gobby/mcp_proxy/tools/pipelines/_execution.py +281 -0
gobby/mcp_proxy/tools/sessions/_crud.py +4 -4
gobby/mcp_proxy/tools/sessions/_handoff.py +1 -1
gobby/mcp_proxy/tools/skills/__init__.py +184 -30
gobby/mcp_proxy/tools/spawn_agent.py +229 -14
gobby/mcp_proxy/tools/task_readiness.py +27 -4
gobby/mcp_proxy/tools/tasks/_context.py +8 -0
gobby/mcp_proxy/tools/tasks/_crud.py +27 -1
gobby/mcp_proxy/tools/tasks/_helpers.py +1 -1
gobby/mcp_proxy/tools/tasks/_lifecycle.py +125 -8
gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +2 -1
gobby/mcp_proxy/tools/tasks/_search.py +1 -1
gobby/mcp_proxy/tools/workflows/__init__.py +273 -0
gobby/mcp_proxy/tools/workflows/_artifacts.py +225 -0
gobby/mcp_proxy/tools/workflows/_import.py +112 -0
gobby/mcp_proxy/tools/workflows/_lifecycle.py +332 -0
gobby/mcp_proxy/tools/workflows/_query.py +226 -0
gobby/mcp_proxy/tools/workflows/_resolution.py +78 -0
gobby/mcp_proxy/tools/workflows/_terminal.py +175 -0
gobby/mcp_proxy/tools/worktrees.py +54 -15
gobby/memory/components/__init__.py +0 -0
gobby/memory/components/ingestion.py +98 -0
gobby/memory/components/search.py +108 -0
gobby/memory/context.py +5 -5
gobby/memory/manager.py +16 -25
gobby/paths.py +51 -0
gobby/prompts/loader.py +1 -35
gobby/runner.py +131 -16
gobby/servers/http.py +193 -150
gobby/servers/routes/__init__.py +2 -0
gobby/servers/routes/admin.py +56 -0
gobby/servers/routes/mcp/endpoints/execution.py +33 -32
gobby/servers/routes/mcp/endpoints/registry.py +8 -8
gobby/servers/routes/mcp/hooks.py +10 -1
gobby/servers/routes/pipelines.py +227 -0
gobby/servers/websocket.py +314 -1
gobby/sessions/analyzer.py +89 -3
gobby/sessions/manager.py +5 -5
gobby/sessions/transcripts/__init__.py +3 -0
gobby/sessions/transcripts/claude.py +5 -0
gobby/sessions/transcripts/codex.py +5 -0
gobby/sessions/transcripts/gemini.py +5 -0
gobby/skills/hubs/__init__.py +25 -0
gobby/skills/hubs/base.py +234 -0
gobby/skills/hubs/claude_plugins.py +328 -0
gobby/skills/hubs/clawdhub.py +289 -0
gobby/skills/hubs/github_collection.py +465 -0
gobby/skills/hubs/manager.py +263 -0
gobby/skills/hubs/skillhub.py +342 -0
gobby/skills/parser.py +23 -0
gobby/skills/sync.py +5 -4
gobby/storage/artifacts.py +19 -0
gobby/storage/memories.py +4 -4
gobby/storage/migrations.py +118 -3
gobby/storage/pipelines.py +367 -0
gobby/storage/sessions.py +23 -4
gobby/storage/skills.py +48 -8
gobby/storage/tasks/_aggregates.py +2 -2
gobby/storage/tasks/_lifecycle.py +4 -4
gobby/storage/tasks/_models.py +7 -1
gobby/storage/tasks/_queries.py +3 -3
gobby/sync/memories.py +4 -3
gobby/tasks/commits.py +48 -17
gobby/tasks/external_validator.py +4 -17
gobby/tasks/validation.py +13 -87
gobby/tools/summarizer.py +18 -51
gobby/utils/status.py +13 -0
gobby/workflows/actions.py +80 -0
gobby/workflows/context_actions.py +265 -27
gobby/workflows/definitions.py +119 -1
gobby/workflows/detection_helpers.py +23 -11
gobby/workflows/enforcement/__init__.py +11 -1
gobby/workflows/enforcement/blocking.py +96 -0
gobby/workflows/enforcement/handlers.py +35 -1
gobby/workflows/enforcement/task_policy.py +18 -0
gobby/workflows/engine.py +26 -4
gobby/workflows/evaluator.py +8 -5
gobby/workflows/lifecycle_evaluator.py +59 -27
gobby/workflows/loader.py +567 -30
gobby/workflows/lobster_compat.py +147 -0
gobby/workflows/pipeline_executor.py +801 -0
gobby/workflows/pipeline_state.py +172 -0
gobby/workflows/pipeline_webhooks.py +206 -0
gobby/workflows/premature_stop.py +5 -0
gobby/worktrees/git.py +135 -20
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/METADATA +56 -22
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/RECORD +166 -122
gobby/hooks/event_handlers.py +0 -1008
gobby/mcp_proxy/tools/workflows.py +0 -1023
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/WHEEL +0 -0
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/entry_points.txt +0 -0
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/licenses/LICENSE.md +0 -0
{gobby-0.2.8.dist-info → gobby-0.2.11.dist-info}/top_level.txt +0 -0

gobby/storage/skills.py CHANGED Viewed

@@ -23,7 +23,7 @@ logger = logging.getLogger(__name__)
 _UNSET: Any = object()
 # Valid source types for skills
-SkillSourceType = Literal["local", "github", "url", "zip", "filesystem"]
+SkillSourceType = Literal["local", "github", "url", "zip", "filesystem", "hub"]
 @dataclass
@@ -91,6 +91,8 @@ class Skill:
     # Gobby-specific
     enabled: bool = True
+    always_apply: bool = False
+    injection_format: str = "summary"  # "summary", "full", "content"
     project_id: str | None = None
     # Timestamps
@@ -131,6 +133,10 @@ class Skill:
             hub_slug=row["hub_slug"] if "hub_slug" in row.keys() else None,
             hub_version=row["hub_version"] if "hub_version" in row.keys() else None,
             enabled=bool(row["enabled"]),
+            always_apply=bool(row["always_apply"]) if "always_apply" in row.keys() else False,
+            injection_format=row["injection_format"]
+            if "injection_format" in row.keys()
+            else "summary",
             project_id=row["project_id"],
             created_at=row["created_at"],
             updated_at=row["updated_at"],
@@ -159,6 +165,8 @@ class Skill:
             "hub_slug": self.hub_slug,
             "hub_version": self.hub_version,
             "enabled": self.enabled,
+            "always_apply": self.always_apply,
+            "injection_format": self.injection_format,
             "project_id": self.project_id,
             "created_at": self.created_at,
             "updated_at": self.updated_at,
@@ -192,9 +200,13 @@ class Skill:
     def is_always_apply(self) -> bool:
         """Check if this is a core skill that should always be applied.
-        Supports both top-level alwaysApply and nested metadata.skillport.alwaysApply.
-        Top-level takes precedence.
+        Reads from the always_apply column first (set during sync from frontmatter).
+        Falls back to metadata for backwards compatibility with older records.
         """
+        # Primary: read from column (set during sync)
+        if self.always_apply:
+            return True
+        # Fallback: check metadata for backwards compatibility
         if not self.metadata:
             return False
         # Check top-level first
@@ -407,6 +419,8 @@ class LocalSkillManager:
         hub_slug: str | None = None,
         hub_version: str | None = None,
         enabled: bool = True,
+        always_apply: bool = False,
+        injection_format: str = "summary",
         project_id: str | None = None,
     ) -> Skill:
         """Create a new skill.
@@ -427,6 +441,8 @@ class LocalSkillManager:
             hub_slug: Optional hub slug
             hub_version: Optional hub version
             enabled: Whether skill is active
+            always_apply: Whether skill should always be injected at session start
+            injection_format: How to inject skill (summary, full, content)
             project_id: Project scope (None for global)
         Returns:
@@ -457,8 +473,9 @@ class LocalSkillManager:
                     id, name, description, content, version, license,
                     compatibility, allowed_tools, metadata, source_path,
                     source_type, source_ref, hub_name, hub_slug, hub_version,
-                    enabled, project_id, created_at, updated_at
-                ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                    enabled, always_apply, injection_format, project_id,
+                    created_at, updated_at
+                ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
                 """,
                 (
                     skill_id,
@@ -477,6 +494,8 @@ class LocalSkillManager:
                     hub_slug,
                     hub_version,
                     enabled,
+                    always_apply,
+                    injection_format,
                     project_id,
                     now,
                     now,
@@ -559,6 +578,8 @@ class LocalSkillManager:
         hub_slug: str | None = _UNSET,
         hub_version: str | None = _UNSET,
         enabled: bool | None = None,
+        always_apply: bool | None = None,
+        injection_format: str | None = None,
     ) -> Skill:
         """Update an existing skill.
@@ -579,6 +600,8 @@ class LocalSkillManager:
             hub_slug: New hub slug (use _UNSET to leave unchanged, None to clear)
             hub_version: New hub version (use _UNSET to leave unchanged, None to clear)
             enabled: New enabled state (optional)
+            always_apply: New always_apply state (optional)
+            injection_format: New injection format (optional)
         Returns:
             The updated Skill
@@ -634,6 +657,12 @@ class LocalSkillManager:
         if enabled is not None:
             updates.append("enabled = ?")
             params.append(enabled)
+        if always_apply is not None:
+            updates.append("always_apply = ?")
+            params.append(always_apply)
+        if injection_format is not None:
+            updates.append("injection_format = ?")
+            params.append(injection_format)
         if not updates:
             return self.get_skill(skill_id)
@@ -770,7 +799,7 @@ class LocalSkillManager:
         return [Skill.from_row(row) for row in rows]
     def list_core_skills(self, project_id: str | None = None) -> list[Skill]:
-        """List skills with alwaysApply=true.
+        """List skills with always_apply=true (efficiently via column query).
         Args:
             project_id: Optional project scope
@@ -778,8 +807,19 @@ class LocalSkillManager:
         Returns:
             List of core skills (always-apply skills)
         """
-        skills = self.list_skills(project_id=project_id, enabled=True, limit=1000)
-        return [s for s in skills if s.is_always_apply()]
+        query = "SELECT * FROM skills WHERE always_apply = 1 AND enabled = 1"
+        params: list[Any] = []
+        if project_id:
+            query += " AND (project_id = ? OR project_id IS NULL)"
+            params.append(project_id)
+        else:
+            query += " AND project_id IS NULL"
+        query += " ORDER BY name ASC"
+        rows = self.db.fetchall(query, tuple(params))
+        return [Skill.from_row(row) for row in rows]
     def skill_exists(self, skill_id: str) -> bool:
         """Check if a skill with the given ID exists.

gobby/storage/tasks/_aggregates.py CHANGED Viewed

@@ -97,7 +97,7 @@ def count_ready_tasks(
           -- Blocker is unresolved if not closed AND not in review without requiring user review
           AND NOT (
               blocker.status = 'closed'
-              OR (blocker.status = 'review' AND blocker.requires_user_review = 0)
+              OR (blocker.status = 'needs_review' AND blocker.requires_user_review = 0)
           )
           -- Exclude ancestor blocked by any descendant (completion block, not work block)
           -- Check if t.id appears anywhere in blocker's ancestor chain
@@ -153,7 +153,7 @@ def count_blocked_tasks(
           -- Blocker is unresolved if not closed AND not in review without requiring user review
           AND NOT (
               blocker.status = 'closed'
-              OR (blocker.status = 'review' AND blocker.requires_user_review = 0)
+              OR (blocker.status = 'needs_review' AND blocker.requires_user_review = 0)
           )
           -- Exclude ancestor blocked by any descendant (completion block, not work block)
           -- Check if t.id appears anywhere in blocker's ancestor chain

gobby/storage/tasks/_lifecycle.py CHANGED Viewed

@@ -57,9 +57,9 @@ def close_task(
                 f"Cannot close task {task_id}: has {len(open_children)} open child task(s): {child_list}"
             )
-    # Check if task is being closed from review state (user acceptance)
+    # Check if task is being closed from needs_review state (user acceptance)
     current_task = get_task(db, task_id)
-    accepted_by_user = current_task.status == "review" if current_task else False
+    accepted_by_user = current_task.status == "needs_review" if current_task else False
     now = datetime.now(UTC).isoformat()
     with db.transaction() as conn:
@@ -117,8 +117,8 @@ def reopen_task(
         ValueError: If task not found or not closed/review
     """
     task = get_task(db, task_id)
-    if task.status not in ("closed", "review"):
-        raise ValueError(f"Task {task_id} is not closed or in review (status: {task.status})")
+    if task.status not in ("closed", "needs_review"):
+        raise ValueError(f"Task {task_id} is not closed or in needs_review (status: {task.status})")
     now = datetime.now(UTC).isoformat()

gobby/storage/tasks/_models.py CHANGED Viewed

@@ -82,7 +82,13 @@ class Task:
     project_id: str
     title: str
     status: Literal[
-        "open", "in_progress", "review", "closed", "failed", "escalated", "needs_decomposition"
+        "open",
+        "in_progress",
+        "needs_review",
+        "closed",
+        "failed",
+        "escalated",
+        "needs_decomposition",
     ]
     priority: int
     task_type: str  # bug, feature, task, epic, chore

gobby/storage/tasks/_queries.py CHANGED Viewed

@@ -156,7 +156,7 @@ def list_ready_tasks(
               -- Blocker is unresolved if not closed AND not in review without requiring user review
               AND NOT (
                   blocker.status = 'closed'
-                  OR (blocker.status = 'review' AND blocker.requires_user_review = 0)
+                  OR (blocker.status = 'needs_review' AND blocker.requires_user_review = 0)
               )
               -- Exclude ancestor blocked by any descendant (completion block, not work block)
               AND NOT EXISTS (
@@ -186,7 +186,7 @@ def list_ready_tasks(
               -- Blocker is unresolved if not closed AND not in review without requiring user review
               AND NOT (
                   blocker.status = 'closed'
-                  OR (blocker.status = 'review' AND blocker.requires_user_review = 0)
+                  OR (blocker.status = 'needs_review' AND blocker.requires_user_review = 0)
               )
               -- Exclude ancestor blocked by any descendant (completion block, not work block)
               AND NOT EXISTS (
@@ -266,7 +266,7 @@ def list_blocked_tasks(
           -- Blocker is unresolved if not closed AND not in review without requiring user review
           AND NOT (
               blocker.status = 'closed'
-              OR (blocker.status = 'review' AND blocker.requires_user_review = 0)
+              OR (blocker.status = 'needs_review' AND blocker.requires_user_review = 0)
           )
           -- Exclude ancestor blocked by any descendant (completion block, not work block)
           AND NOT EXISTS (

gobby/sync/memories.py CHANGED Viewed

@@ -131,8 +131,8 @@ class MemoryBackupManager:
             from gobby.utils.project_context import get_project_context
             project_ctx = get_project_context()
-            if project_ctx and project_ctx.get("path"):
-                project_path = Path(project_ctx["path"]).expanduser().resolve()
+            if project_ctx and project_ctx.get("project_path"):
+                project_path = Path(project_ctx["project_path"]).expanduser().resolve()
                 return project_path / self.export_path
         except Exception:
             pass  # nosec B110 - fall back to cwd if project context unavailable
@@ -289,7 +289,8 @@ class MemoryBackupManager:
             return 0
         try:
-            memories = self.memory_manager.list_memories()
+            # Use high limit to export all memories for backup (default is 50)
+            memories = self.memory_manager.list_memories(limit=10000)
             # Deduplicate by content before export
             unique_memories = self._deduplicate_memories(memories)

gobby/tasks/commits.py CHANGED Viewed

@@ -487,30 +487,49 @@ def extract_mentioned_symbols(task: dict[str, Any]) -> list[str]:
 # Task ID patterns to search for in commit messages
-# Supports #N format (e.g., #1, #47) - human-friendly task references
+# Uses {project}-#N format to avoid GitHub auto-linking and match CLI display format
+# Patterns capture both project name and task number for validation
 TASK_ID_PATTERNS = [
-    # [#N] - bracket format
-    r"\[#(\d+)\]",
-    # #N: - hash-colon format (at start of line or after space)
-    r"(?:^|\s)#(\d+):",
-    # Implements/Fixes/Closes/Refs #N (supports multiple: #1, #2, #3)
-    r"(?:implements|fixes|closes|refs)\s+#(\d+)",
-    # Standalone #N after whitespace (with word boundary to avoid false positives)
-    r"(?:^|\s)#(\d+)\b(?![\d.])",
+    # [project-#N] - bracket format (primary)
+    r"\[(\w+)-#(\d+)\]",
+    # project-#N - standalone format (word boundary before, after digits)
+    r"(?:^|\s)(\w+)-#(\d+)\b",
+    # Implements/Fixes/Closes/Refs project-#N
+    r"(?:implements|fixes|closes|refs)\s+(\w+)-#(\d+)",
 ]
-def extract_task_ids_from_message(message: str) -> list[str]:
+def get_current_project_name() -> str | None:
+    """Get current project name from context.
+    Returns:
+        Project name or None if not in a project.
+    """
+    from gobby.utils.project_context import get_project_context
+    ctx = get_project_context()
+    if ctx and ctx.get("name"):
+        name: str = ctx["name"]
+        return name
+    return None
+def extract_task_ids_from_message(
+    message: str,
+    project_name: str | None = None,
+) -> list[str]:
     """Extract task IDs from a commit message.
     Supports patterns:
-    - [#N] - bracket format
-    - #N: - hash-colon format (at start of message)
-    - Implements/Fixes/Closes/Refs #N
-    - Multiple references: #1, #2, #3
+    - [project-#N] - bracket format (primary)
+    - project-#N - standalone format
+    - Implements/Fixes/Closes/Refs project-#N
     Args:
         message: Commit message to parse.
+        project_name: Optional project name to filter matches. If provided,
+            only returns task IDs from commits referencing this project.
+            If None, returns all task IDs found regardless of project.
     Returns:
         List of unique task references found (e.g., ["#1", "#42"]).
@@ -520,8 +539,13 @@ def extract_task_ids_from_message(message: str) -> list[str]:
     for pattern in TASK_ID_PATTERNS:
         matches = re.findall(pattern, message, re.IGNORECASE | re.MULTILINE)
         for match in matches:
+            # match is a tuple: (project, task_number)
+            found_project, task_num = match
+            # Filter by project name if specified
+            if project_name and found_project.lower() != project_name.lower():
+                continue
             # Format as #N
-            task_id = f"#{match}"
+            task_id = f"#{task_num}"
             task_ids.add(task_id)
     return list(task_ids)
@@ -547,6 +571,7 @@ def auto_link_commits(
     task_id: str | None = None,
     since: str | None = None,
     cwd: str | Path | None = None,
+    project_name: str | None = None,
 ) -> AutoLinkResult:
     """Auto-detect and link commits that mention task IDs.
@@ -558,12 +583,18 @@ def auto_link_commits(
         task_id: Optional specific task ID to filter for.
         since: Optional git --since parameter (e.g., "1 week ago", "2024-01-01").
         cwd: Working directory for git commands.
+        project_name: Optional project name to filter commits. If not provided,
+            auto-detects from current project context.
     Returns:
         AutoLinkResult with details of linked and skipped commits.
     """
     working_dir = Path(cwd) if cwd else Path.cwd()
+    # Get project name for filtering (auto-detect if not provided)
+    if project_name is None:
+        project_name = get_current_project_name()
     # Build git log command
     # Format: "sha|message" for easy parsing
     git_cmd = ["git", "log", "--pretty=format:%h|%s"]
@@ -590,8 +621,8 @@ def auto_link_commits(
         commit_sha, message = parts
-        # Extract task IDs from message
-        found_task_ids = extract_task_ids_from_message(message)
+        # Extract task IDs from message (filtered by project name)
+        found_task_ids = extract_task_ids_from_message(message, project_name)
         if not found_task_ids:
             continue

gobby/tasks/external_validator.py CHANGED Viewed

@@ -46,12 +46,7 @@ if TYPE_CHECKING:
 logger = logging.getLogger(__name__)
 # Default system prompt for external validators
-DEFAULT_EXTERNAL_SYSTEM_PROMPT = (
-    "You are an objective QA validator reviewing code changes. "
-    "You have no prior context about this task - evaluate purely based on "
-    "the acceptance criteria and the changes provided. "
-    "Be thorough but fair in your assessment."
-)
 # Module-level loader (initialized lazily)
 _loader: PromptLoader | None = None
@@ -62,10 +57,7 @@ def _get_loader(project_dir: Path | None = None) -> PromptLoader:
     global _loader
     if _loader is None:
         _loader = PromptLoader(project_dir=project_dir)
-        # Register fallbacks for strangler fig pattern
-        _loader.register_fallback(
-            "external_validation/system", lambda: DEFAULT_EXTERNAL_SYSTEM_PROMPT
-        )
     return _loader
@@ -218,13 +210,8 @@ async def _run_llm_validation(
     # Build the validation prompt
     prompt = _build_external_validation_prompt(task, changes_context)
-    # System prompt emphasizing objectivity
-    system_prompt = (
-        "You are an objective QA validator reviewing code changes. "
-        "You have no prior context about this task - evaluate purely based on "
-        "the acceptance criteria and the changes provided. "
-        "Be thorough but fair in your assessment."
-    )
+    # Render system prompt
+    system_prompt = _get_loader().render("external_validation/system", {})
     try:
         provider = llm_service.get_provider(config.provider)

gobby/tasks/validation.py CHANGED Viewed

@@ -27,51 +27,6 @@ from gobby.utils.json_helpers import extract_json_object
 logger = logging.getLogger(__name__)
-# Default prompts (fallbacks for strangler fig pattern)
-DEFAULT_VALIDATE_PROMPT = """Validate if the following changes satisfy the requirements.
-Task: {title}
-{category_section}{criteria_text}
-{changes_section}
-IMPORTANT: Return ONLY a JSON object, nothing else. No explanation, no preamble.
-Format: {{"status": "valid", "feedback": "..."}} or {{"status": "invalid", "feedback": "..."}}
-"""
-DEFAULT_CRITERIA_PROMPT = """Generate validation criteria for this task.
-Task: {title}
-Description: {description}
-CRITICAL RULES - You MUST follow these:
-1. **Only stated requirements** - Include ONLY requirements explicitly written in the title or description
-2. **No invented values** - Do NOT invent specific numbers, timeouts, thresholds, or limits unless they appear in the task
-3. **No invented edge cases** - Do NOT add edge cases, error scenarios, or boundary conditions beyond what's described
-4. **Proportional detail** - Vague tasks get vague criteria; detailed tasks get detailed criteria
-5. **When in doubt, leave it out** - If something isn't mentioned, don't include it
-For vague requirements like "fix X" or "add Y", use criteria like:
-- "X no longer produces the reported error/warning"
-- "Y functionality works as expected"
-- "Existing tests continue to pass"
-- "No regressions introduced"
-DO NOT generate criteria like:
-- "timeout defaults to 30 seconds" (unless 30 seconds is in the task description)
-- "handles edge case Z" (unless Z is mentioned in the task)
-- "logs with format X" (unless that format is specified)
-Format as markdown checkboxes:
-## Deliverable
-- [ ] What the task explicitly asks for
-## Functional Requirements
-- [ ] Only requirements stated in the description
-## Verification
-- [ ] Tests pass (if applicable)
-- [ ] No regressions
-"""
 # Default number of commits to look back when gathering context
 DEFAULT_COMMIT_WINDOW = 10
@@ -490,10 +445,6 @@ class TaskValidator:
         self.llm_service = llm_service
         self._loader = PromptLoader(project_dir=project_dir)
-        # Register fallbacks for strangler fig pattern
-        self._loader.register_fallback("validation/validate", lambda: DEFAULT_VALIDATE_PROMPT)
-        self._loader.register_fallback("validation/criteria", lambda: DEFAULT_CRITERIA_PROMPT)
     async def gather_validation_context(self, file_paths: list[str]) -> str:
         """
         Gather context for validation from files.
@@ -588,35 +539,16 @@ class TaskValidator:
             else:
                 category_section += "\n"
-        # Build prompt using PromptLoader or legacy config
-        if self.config.prompt_path:
-            prompt_path = self.config.prompt_path
-            template_context = {
-                "title": title,
-                "category_section": category_section,
-                "criteria_text": criteria_text,
-                "changes_section": changes_section,
-                "file_context": file_context[:50000] if file_context else "",
-            }
-            try:
-                prompt = self._loader.render(prompt_path, template_context)
-            except FileNotFoundError:
-                logger.debug(f"Prompt template '{prompt_path}' not found, using fallback")
-                prompt = DEFAULT_VALIDATE_PROMPT.format(**template_context)
-                if file_context:
-                    prompt += f"\nFile Context:\n{file_context[:50000]}\n"
-        else:
-            # Default behavior
-            template_context = {
-                "title": title,
-                "category_section": category_section,
-                "criteria_text": criteria_text,
-                "changes_section": changes_section,
-                "file_context": file_context[:50000] if file_context else "",
-            }
-            prompt = DEFAULT_VALIDATE_PROMPT.format(**template_context)
-            if file_context:
-                prompt += f"\nFile Context:\n{file_context[:50000]}\n"
+        # Build prompt using PromptLoader
+        prompt_path = self.config.prompt_path or "validation/validate"
+        template_context = {
+            "title": title,
+            "category_section": category_section,
+            "criteria_text": criteria_text,
+            "changes_section": changes_section,
+            "file_context": file_context[:50000] if file_context else "",
+        }
+        prompt = self._loader.render(prompt_path, template_context)
         try:
             provider = self.llm_service.get_provider(self.config.provider)
@@ -670,19 +602,13 @@ class TaskValidator:
         if not self.config.enabled:
             return None
-        # Build prompt using PromptLoader or legacy config
+        # Use PromptLoader
+        prompt_path = self.config.criteria_prompt_path or "validation/criteria"
         template_context = {
             "title": title,
             "description": description or "(no description)",
         }
-        # Use PromptLoader
-        prompt_path = self.config.criteria_prompt_path or "validation/criteria"
-        try:
-            prompt = self._loader.render(prompt_path, template_context)
-        except FileNotFoundError:
-            logger.debug(f"Prompt template '{prompt_path}' not found, using fallback")
-            prompt = DEFAULT_CRITERIA_PROMPT.format(**template_context)
+        prompt = self._loader.render(prompt_path, template_context)
         try:
             provider = self.llm_service.get_provider(self.config.provider)

gobby/tools/summarizer.py CHANGED Viewed

@@ -23,25 +23,6 @@ MAX_DESCRIPTION_LENGTH = 200
 _config: ToolSummarizerConfig | None = None
 _loader: PromptLoader | None = None
-DEFAULT_SUMMARY_PROMPT = """Summarize this MCP tool description in 180 characters or less.
-Keep it to three sentences or less. Be concise and preserve the key functionality.
-Do not add quotes, extra formatting, or code examples.
-Description: {description}
-Summary:"""
-DEFAULT_SUMMARY_SYSTEM_PROMPT = "You are a technical summarizer. Create concise tool descriptions."
-DEFAULT_SERVER_DESC_PROMPT = """Write a single concise sentence describing what the '{server_name}' MCP server does based on its tools.
-Tools:
-{tools_list}
-Description (1 sentence, try to keep under 100 characters):"""
-DEFAULT_SERVER_DESC_SYSTEM_PROMPT = "You write concise technical descriptions."
 def init_summarizer_config(config: ToolSummarizerConfig, project_dir: str | None = None) -> None:
     """Initialize the summarizer with configuration."""
@@ -50,13 +31,6 @@ def init_summarizer_config(config: ToolSummarizerConfig, project_dir: str | None
     global _config, _loader
     _config = config
     _loader = PromptLoader(project_dir=Path(project_dir) if project_dir else None)
-    # Register fallbacks
-    _loader.register_fallback("features/tool_summary", lambda: DEFAULT_SUMMARY_PROMPT)
-    _loader.register_fallback("features/tool_summary_system", lambda: DEFAULT_SUMMARY_SYSTEM_PROMPT)
-    _loader.register_fallback("features/server_description", lambda: DEFAULT_SERVER_DESC_PROMPT)
-    _loader.register_fallback(
-        "features/server_description_system", lambda: DEFAULT_SERVER_DESC_SYSTEM_PROMPT
-    )
 def _get_config() -> ToolSummarizerConfig:
@@ -96,9 +70,9 @@ async def _summarize_description_with_claude(description: str) -> str:
             if _loader is None:
                 raise RuntimeError("Summarizer not initialized")
             prompt = _loader.render(prompt_path, {"description": description})
-        except (FileNotFoundError, OSError, KeyError, ValueError, RuntimeError) as e:
-            logger.debug(f"Failed to load prompt from {prompt_path}: {e}, using default")
-            prompt = DEFAULT_SUMMARY_PROMPT.format(description=description)
+        except (OSError, KeyError, ValueError, RuntimeError) as e:
+            logger.debug(f"Failed to load prompt from {prompt_path}: {e}")
+            raise
         # Get system prompt
         sys_prompt_path = config.system_prompt_path or "features/tool_summary_system"
@@ -106,9 +80,9 @@ async def _summarize_description_with_claude(description: str) -> str:
             if _loader is None:
                 raise RuntimeError("Summarizer not initialized")
             system_prompt = _loader.render(sys_prompt_path, {})
-        except (FileNotFoundError, OSError, KeyError, ValueError, RuntimeError) as e:
-            logger.debug(f"Failed to load system prompt from {sys_prompt_path}: {e}, using default")
-            system_prompt = DEFAULT_SUMMARY_SYSTEM_PROMPT
+        except (OSError, KeyError, ValueError, RuntimeError) as e:
+            logger.debug(f"Failed to load system prompt from {sys_prompt_path}: {e}")
+            system_prompt = "You are a technical summarizer."
         # Configure for single-turn completion
         options = ClaudeAgentOptions(
@@ -198,30 +172,23 @@ async def generate_server_description(
             "server_name": server_name,
             "tools_list": tools_list,
         }
-        try:
-            if _loader is None:
-                _get_config()  # force init
-            if _loader is None:
-                # Still None after _get_config, use default
-                prompt = DEFAULT_SERVER_DESC_PROMPT.format(**context)
-            else:
-                prompt = _loader.render(prompt_path, context)
-        except (FileNotFoundError, OSError, KeyError, ValueError, RuntimeError) as e:
-            logger.debug(f"Failed to load prompt from {prompt_path}: {e}, using default")
-            prompt = DEFAULT_SERVER_DESC_PROMPT.format(**context)
+        if _loader is None:
+            _get_config()  # force init
+        if _loader is None:
+            # Still None after _get_config, use default
+            raise RuntimeError("Summarizer not initialized")
+        else:
+            prompt = _loader.render(prompt_path, context)
         # Get system prompt
         sys_prompt_path = (
             config.server_description_system_prompt_path or "features/server_description_system"
         )
-        try:
-            if _loader is None:
-                system_prompt = DEFAULT_SERVER_DESC_SYSTEM_PROMPT
-            else:
-                system_prompt = _loader.render(sys_prompt_path, {})
-        except (FileNotFoundError, OSError, KeyError, ValueError, RuntimeError) as e:
-            logger.debug(f"Failed to load system prompt from {sys_prompt_path}: {e}, using default")
-            system_prompt = DEFAULT_SERVER_DESC_SYSTEM_PROMPT
+        if _loader is None:
+            system_prompt = "You write concise technical descriptions."
+        else:
+            system_prompt = _loader.render(sys_prompt_path, {})
         # Configure for single-turn completion
         options = ClaudeAgentOptions(

gobby 0.2.8__py3-none-any.whl → 0.2.11__py3-none-any.whl

gobby 0.2.8__py3-none-any.whl → 0.2.11__py3-none-any.whl