PyPI - gobby - Versions diffs - 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl - Mend

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (244) hide show

gobby/__init__.py +1 -1
gobby/adapters/__init__.py +2 -1
gobby/adapters/claude_code.py +13 -4
gobby/adapters/codex_impl/__init__.py +28 -0
gobby/adapters/codex_impl/adapter.py +722 -0
gobby/adapters/codex_impl/client.py +679 -0
gobby/adapters/codex_impl/protocol.py +20 -0
gobby/adapters/codex_impl/types.py +68 -0
gobby/agents/definitions.py +11 -1
gobby/agents/isolation.py +395 -0
gobby/agents/runner.py +8 -0
gobby/agents/sandbox.py +261 -0
gobby/agents/spawn.py +42 -287
gobby/agents/spawn_executor.py +385 -0
gobby/agents/spawners/__init__.py +24 -0
gobby/agents/spawners/command_builder.py +189 -0
gobby/agents/spawners/embedded.py +21 -2
gobby/agents/spawners/headless.py +21 -2
gobby/agents/spawners/prompt_manager.py +125 -0
gobby/cli/__init__.py +6 -0
gobby/cli/clones.py +419 -0
gobby/cli/conductor.py +266 -0
gobby/cli/install.py +4 -4
gobby/cli/installers/antigravity.py +3 -9
gobby/cli/installers/claude.py +15 -9
gobby/cli/installers/codex.py +2 -8
gobby/cli/installers/gemini.py +8 -8
gobby/cli/installers/shared.py +175 -13
gobby/cli/sessions.py +1 -1
gobby/cli/skills.py +858 -0
gobby/cli/tasks/ai.py +0 -440
gobby/cli/tasks/crud.py +44 -6
gobby/cli/tasks/main.py +0 -4
gobby/cli/tui.py +2 -2
gobby/cli/utils.py +12 -5
gobby/clones/__init__.py +13 -0
gobby/clones/git.py +547 -0
gobby/conductor/__init__.py +16 -0
gobby/conductor/alerts.py +135 -0
gobby/conductor/loop.py +164 -0
gobby/conductor/monitors/__init__.py +11 -0
gobby/conductor/monitors/agents.py +116 -0
gobby/conductor/monitors/tasks.py +155 -0
gobby/conductor/pricing.py +234 -0
gobby/conductor/token_tracker.py +160 -0
gobby/config/__init__.py +12 -97
gobby/config/app.py +69 -91
gobby/config/extensions.py +2 -2
gobby/config/features.py +7 -130
gobby/config/search.py +110 -0
gobby/config/servers.py +1 -1
gobby/config/skills.py +43 -0
gobby/config/tasks.py +9 -41
gobby/hooks/__init__.py +0 -13
gobby/hooks/event_handlers.py +188 -2
gobby/hooks/hook_manager.py +50 -4
gobby/hooks/plugins.py +1 -1
gobby/hooks/skill_manager.py +130 -0
gobby/hooks/webhooks.py +1 -1
gobby/install/claude/hooks/hook_dispatcher.py +4 -4
gobby/install/codex/hooks/hook_dispatcher.py +1 -1
gobby/install/gemini/hooks/hook_dispatcher.py +87 -12
gobby/llm/claude.py +22 -34
gobby/llm/claude_executor.py +46 -256
gobby/llm/codex_executor.py +59 -291
gobby/llm/executor.py +21 -0
gobby/llm/gemini.py +134 -110
gobby/llm/litellm_executor.py +143 -6
gobby/llm/resolver.py +98 -35
gobby/mcp_proxy/importer.py +62 -4
gobby/mcp_proxy/instructions.py +56 -0
gobby/mcp_proxy/models.py +15 -0
gobby/mcp_proxy/registries.py +68 -8
gobby/mcp_proxy/server.py +33 -3
gobby/mcp_proxy/services/recommendation.py +43 -11
gobby/mcp_proxy/services/tool_proxy.py +81 -1
gobby/mcp_proxy/stdio.py +2 -1
gobby/mcp_proxy/tools/__init__.py +0 -2
gobby/mcp_proxy/tools/agent_messaging.py +317 -0
gobby/mcp_proxy/tools/agents.py +31 -731
gobby/mcp_proxy/tools/clones.py +518 -0
gobby/mcp_proxy/tools/memory.py +3 -26
gobby/mcp_proxy/tools/metrics.py +65 -1
gobby/mcp_proxy/tools/orchestration/__init__.py +3 -0
gobby/mcp_proxy/tools/orchestration/cleanup.py +151 -0
gobby/mcp_proxy/tools/orchestration/wait.py +467 -0
gobby/mcp_proxy/tools/sessions/__init__.py +14 -0
gobby/mcp_proxy/tools/sessions/_commits.py +232 -0
gobby/mcp_proxy/tools/sessions/_crud.py +253 -0
gobby/mcp_proxy/tools/sessions/_factory.py +63 -0
gobby/mcp_proxy/tools/sessions/_handoff.py +499 -0
gobby/mcp_proxy/tools/sessions/_messages.py +138 -0
gobby/mcp_proxy/tools/skills/__init__.py +616 -0
gobby/mcp_proxy/tools/spawn_agent.py +417 -0
gobby/mcp_proxy/tools/task_orchestration.py +7 -0
gobby/mcp_proxy/tools/task_readiness.py +14 -0
gobby/mcp_proxy/tools/task_sync.py +1 -1
gobby/mcp_proxy/tools/tasks/_context.py +0 -20
gobby/mcp_proxy/tools/tasks/_crud.py +91 -4
gobby/mcp_proxy/tools/tasks/_expansion.py +348 -0
gobby/mcp_proxy/tools/tasks/_factory.py +6 -16
gobby/mcp_proxy/tools/tasks/_lifecycle.py +110 -45
gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +18 -29
gobby/mcp_proxy/tools/workflows.py +1 -1
gobby/mcp_proxy/tools/worktrees.py +0 -338
gobby/memory/backends/__init__.py +6 -1
gobby/memory/backends/mem0.py +6 -1
gobby/memory/extractor.py +477 -0
gobby/memory/ingestion/__init__.py +5 -0
gobby/memory/ingestion/multimodal.py +221 -0
gobby/memory/manager.py +73 -285
gobby/memory/search/__init__.py +10 -0
gobby/memory/search/coordinator.py +248 -0
gobby/memory/services/__init__.py +5 -0
gobby/memory/services/crossref.py +142 -0
gobby/prompts/loader.py +5 -2
gobby/runner.py +37 -16
gobby/search/__init__.py +48 -6
gobby/search/backends/__init__.py +159 -0
gobby/search/backends/embedding.py +225 -0
gobby/search/embeddings.py +238 -0
gobby/search/models.py +148 -0
gobby/search/unified.py +496 -0
gobby/servers/http.py +24 -12
gobby/servers/routes/admin.py +294 -0
gobby/servers/routes/mcp/endpoints/__init__.py +61 -0
gobby/servers/routes/mcp/endpoints/discovery.py +405 -0
gobby/servers/routes/mcp/endpoints/execution.py +568 -0
gobby/servers/routes/mcp/endpoints/registry.py +378 -0
gobby/servers/routes/mcp/endpoints/server.py +304 -0
gobby/servers/routes/mcp/hooks.py +1 -1
gobby/servers/routes/mcp/tools.py +48 -1317
gobby/servers/websocket.py +2 -2
gobby/sessions/analyzer.py +2 -0
gobby/sessions/lifecycle.py +1 -1
gobby/sessions/processor.py +10 -0
gobby/sessions/transcripts/base.py +2 -0
gobby/sessions/transcripts/claude.py +79 -10
gobby/skills/__init__.py +91 -0
gobby/skills/loader.py +685 -0
gobby/skills/manager.py +384 -0
gobby/skills/parser.py +286 -0
gobby/skills/search.py +463 -0
gobby/skills/sync.py +119 -0
gobby/skills/updater.py +385 -0
gobby/skills/validator.py +368 -0
gobby/storage/clones.py +378 -0
gobby/storage/database.py +1 -1
gobby/storage/memories.py +43 -13
gobby/storage/migrations.py +162 -201
gobby/storage/sessions.py +116 -7
gobby/storage/skills.py +782 -0
gobby/storage/tasks/_crud.py +4 -4
gobby/storage/tasks/_lifecycle.py +57 -7
gobby/storage/tasks/_manager.py +14 -5
gobby/storage/tasks/_models.py +8 -3
gobby/sync/memories.py +40 -5
gobby/sync/tasks.py +83 -6
gobby/tasks/__init__.py +1 -2
gobby/tasks/external_validator.py +1 -1
gobby/tasks/validation.py +46 -35
gobby/tools/summarizer.py +91 -10
gobby/tui/api_client.py +4 -7
gobby/tui/app.py +5 -3
gobby/tui/screens/orchestrator.py +1 -2
gobby/tui/screens/tasks.py +2 -4
gobby/tui/ws_client.py +1 -1
gobby/utils/daemon_client.py +2 -2
gobby/utils/project_context.py +2 -3
gobby/utils/status.py +13 -0
gobby/workflows/actions.py +221 -1135
gobby/workflows/artifact_actions.py +31 -0
gobby/workflows/autonomous_actions.py +11 -0
gobby/workflows/context_actions.py +93 -1
gobby/workflows/detection_helpers.py +115 -31
gobby/workflows/enforcement/__init__.py +47 -0
gobby/workflows/enforcement/blocking.py +269 -0
gobby/workflows/enforcement/commit_policy.py +283 -0
gobby/workflows/enforcement/handlers.py +269 -0
gobby/workflows/{task_enforcement_actions.py → enforcement/task_policy.py} +29 -388
gobby/workflows/engine.py +13 -2
gobby/workflows/git_utils.py +106 -0
gobby/workflows/lifecycle_evaluator.py +29 -1
gobby/workflows/llm_actions.py +30 -0
gobby/workflows/loader.py +19 -6
gobby/workflows/mcp_actions.py +20 -1
gobby/workflows/memory_actions.py +154 -0
gobby/workflows/safe_evaluator.py +183 -0
gobby/workflows/session_actions.py +44 -0
gobby/workflows/state_actions.py +60 -1
gobby/workflows/stop_signal_actions.py +55 -0
gobby/workflows/summary_actions.py +111 -1
gobby/workflows/task_sync_actions.py +347 -0
gobby/workflows/todo_actions.py +34 -1
gobby/workflows/webhook_actions.py +185 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/METADATA +87 -21
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/RECORD +201 -172
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/WHEEL +1 -1
gobby/adapters/codex.py +0 -1292
gobby/install/claude/commands/gobby/bug.md +0 -51
gobby/install/claude/commands/gobby/chore.md +0 -51
gobby/install/claude/commands/gobby/epic.md +0 -52
gobby/install/claude/commands/gobby/eval.md +0 -235
gobby/install/claude/commands/gobby/feat.md +0 -49
gobby/install/claude/commands/gobby/nit.md +0 -52
gobby/install/claude/commands/gobby/ref.md +0 -52
gobby/install/codex/prompts/forget.md +0 -7
gobby/install/codex/prompts/memories.md +0 -7
gobby/install/codex/prompts/recall.md +0 -7
gobby/install/codex/prompts/remember.md +0 -13
gobby/llm/gemini_executor.py +0 -339
gobby/mcp_proxy/tools/session_messages.py +0 -1056
gobby/mcp_proxy/tools/task_expansion.py +0 -591
gobby/prompts/defaults/expansion/system.md +0 -119
gobby/prompts/defaults/expansion/user.md +0 -48
gobby/prompts/defaults/external_validation/agent.md +0 -72
gobby/prompts/defaults/external_validation/external.md +0 -63
gobby/prompts/defaults/external_validation/spawn.md +0 -83
gobby/prompts/defaults/external_validation/system.md +0 -6
gobby/prompts/defaults/features/import_mcp.md +0 -22
gobby/prompts/defaults/features/import_mcp_github.md +0 -17
gobby/prompts/defaults/features/import_mcp_search.md +0 -16
gobby/prompts/defaults/features/recommend_tools.md +0 -32
gobby/prompts/defaults/features/recommend_tools_hybrid.md +0 -35
gobby/prompts/defaults/features/recommend_tools_llm.md +0 -30
gobby/prompts/defaults/features/server_description.md +0 -20
gobby/prompts/defaults/features/server_description_system.md +0 -6
gobby/prompts/defaults/features/task_description.md +0 -31
gobby/prompts/defaults/features/task_description_system.md +0 -6
gobby/prompts/defaults/features/tool_summary.md +0 -17
gobby/prompts/defaults/features/tool_summary_system.md +0 -6
gobby/prompts/defaults/research/step.md +0 -58
gobby/prompts/defaults/validation/criteria.md +0 -47
gobby/prompts/defaults/validation/validate.md +0 -38
gobby/storage/migrations_legacy.py +0 -1359
gobby/tasks/context.py +0 -747
gobby/tasks/criteria.py +0 -342
gobby/tasks/expansion.py +0 -626
gobby/tasks/prompts/expand.py +0 -327
gobby/tasks/research.py +0 -421
gobby/tasks/tdd.py +0 -352
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/entry_points.txt +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/licenses/LICENSE.md +0 -0
{gobby-0.2.5.dist-info → gobby-0.2.7.dist-info}/top_level.txt +0 -0

gobby/tasks/expansion.py DELETED Viewed

@@ -1,626 +0,0 @@
-"""
-Task expansion module.
-Handles breaking down high-level tasks into smaller, actionable subtasks
-using LLM providers with structured JSON output.
-"""
-import asyncio
-import json
-import logging
-import re
-from dataclasses import dataclass
-from typing import Any
-from gobby.config.app import ProjectVerificationConfig, TaskExpansionConfig
-from gobby.llm import LLMService
-from gobby.storage.task_dependencies import TaskDependencyManager
-from gobby.storage.tasks import LocalTaskManager, Task
-from gobby.tasks.context import ExpansionContext, ExpansionContextGatherer
-from gobby.tasks.criteria import PatternCriteriaInjector
-from gobby.tasks.prompts.expand import ExpansionPromptBuilder
-from gobby.utils.json_helpers import extract_json_from_text
-from gobby.utils.project_context import get_verification_config
-logger = logging.getLogger(__name__)
-@dataclass
-class SubtaskSpec:
-    """Parsed subtask specification from LLM output."""
-    title: str
-    description: str | None = None
-    priority: int = 2
-    task_type: str = "task"
-    category: str | None = None
-    validation: str | None = None  # Acceptance criteria from LLM
-    depends_on: list[int] | None = None
-    def __post_init__(self) -> None:
-        """Validate and normalize category after initialization."""
-        if self.category:
-            from gobby.storage.tasks import validate_category
-            self.category = validate_category(self.category)
-class TaskExpander:
-    """Expands tasks into subtasks using LLM and context."""
-    def __init__(
-        self,
-        config: TaskExpansionConfig,
-        llm_service: LLMService,
-        task_manager: LocalTaskManager,
-        mcp_manager: Any | None = None,
-        verification_config: ProjectVerificationConfig | None = None,
-    ):
-        self.config = config
-        self.llm_service = llm_service
-        self.task_manager = task_manager
-        self.mcp_manager = mcp_manager
-        self.context_gatherer = ExpansionContextGatherer(
-            task_manager=task_manager,
-            llm_service=llm_service,
-            config=config,
-            mcp_manager=mcp_manager,
-        )
-        self.prompt_builder = ExpansionPromptBuilder(config)
-        # Initialize pattern criteria injector
-        # Try to get verification config from project if not provided
-        if verification_config is None:
-            verification_config = get_verification_config()
-        self.criteria_injector = PatternCriteriaInjector(
-            pattern_config=config.pattern_criteria,
-            verification_config=verification_config,
-        )
-    def _resolve_tdd_mode(self, session_id: str | None, task_type: str | None = None) -> bool:
-        """Resolve tdd_mode with cascading precedence.
-        Order: task_type override > step workflow > lifecycle workflow > config.yaml > pydantic default
-        Epic tasks never use TDD mode since their closing condition is
-        'all children are closed', not test-based verification.
-        Args:
-            session_id: Session ID to resolve TDD mode from workflow state
-            task_type: Task type - epics always disable TDD mode
-        Returns:
-            True if TDD mode is enabled, False otherwise
-        """
-        # Epics never use TDD mode
-        if task_type == "epic":
-            return False
-        if session_id:
-            try:
-                from gobby.workflows.state_manager import WorkflowStateManager
-                state_manager = WorkflowStateManager(self.task_manager.db)
-                state = state_manager.get_state(session_id)
-                if state and state.variables and "tdd_mode" in state.variables:
-                    return bool(state.variables["tdd_mode"])
-            except Exception as e:
-                logger.debug(f"Failed to resolve tdd_mode from workflow state: {e}")
-        # Fall back to config (includes pydantic default)
-        return self.config.tdd_mode
-    async def expand_task(
-        self,
-        task_id: str,
-        title: str,
-        description: str | None = None,
-        context: str | None = None,
-        enable_web_research: bool = False,
-        enable_code_context: bool = True,
-        session_id: str | None = None,
-    ) -> dict[str, Any]:
-        """
-        Expand a task into subtasks using structured JSON output.
-        The LLM returns a JSON object with subtask specifications, which are
-        then parsed and created as tasks with proper dependency wiring.
-        Note: This creates plain subtasks only. To apply TDD structure
-        (test/implement/refactor triplets), use the apply_tdd command
-        separately after expansion.
-        Args:
-            task_id: ID of the task to expand
-            title: Task title
-            description: Task description
-            context: Additional context for expansion
-            enable_web_research: Whether to enable web research (default: False)
-            enable_code_context: Whether to enable code context gathering (default: True)
-            session_id: Session ID for TDD mode resolution (optional)
-        Returns:
-            Dictionary with:
-            - subtask_ids: List of created subtask IDs
-            - subtask_count: Number of subtasks created
-            - raw_response: The raw LLM response (for debugging)
-        """
-        if not self.config.enabled:
-            logger.info("Task expansion disabled, skipping")
-            return {
-                "subtask_ids": [],
-                "subtask_count": 0,
-                "raw_response": "Expansion disabled",
-            }
-        logger.info(f"Expanding task {task_id}: {title}")
-        # Apply overall timeout for entire expansion
-        timeout_seconds = self.config.timeout
-        try:
-            async with asyncio.timeout(timeout_seconds):
-                return await self._expand_task_impl(
-                    task_id=task_id,
-                    title=title,
-                    description=description,
-                    context=context,
-                    enable_web_research=enable_web_research,
-                    enable_code_context=enable_code_context,
-                    session_id=session_id,
-                )
-        except TimeoutError:
-            error_msg = (
-                f"Task expansion timed out after {timeout_seconds} seconds. "
-                f"Consider increasing task_expansion.timeout in config or simplifying the task."
-            )
-            logger.error(f"Expansion timeout for {task_id}: {error_msg}")
-            return {
-                "error": error_msg,
-                "subtask_ids": [],
-                "subtask_count": 0,
-                "timeout": True,
-            }
-    async def _expand_task_impl(
-        self,
-        task_id: str,
-        title: str,
-        description: str | None = None,
-        context: str | None = None,
-        enable_web_research: bool = False,
-        enable_code_context: bool = True,
-        session_id: str | None = None,
-    ) -> dict[str, Any]:
-        """Internal implementation of expand_task (called within timeout context)."""
-        # Gather enhanced context
-        task_obj = self.task_manager.get_task(task_id)
-        if not task_obj:
-            logger.warning(f"Task {task_id} not found for context gathering, using basic info")
-            task_obj = Task(
-                id=task_id,
-                project_id="unknown",
-                title=title,
-                status="open",
-                priority=2,
-                task_type="task",
-                created_at="",
-                updated_at="",
-                description=description,
-            )
-        expansion_ctx = await self.context_gatherer.gather_context(
-            task_obj,
-            enable_web_research=enable_web_research,
-            enable_code_context=enable_code_context,
-        )
-        # Inject pattern-specific criteria based on task labels and description
-        pattern_criteria = self.criteria_injector.inject(
-            task=task_obj,
-            context=expansion_ctx,
-        )
-        # Combine user context with pattern criteria if detected
-        combined_instructions = context or ""
-        if pattern_criteria:
-            logger.info(f"Detected patterns for {task_id}, adding pattern-specific criteria")
-            if combined_instructions:
-                combined_instructions += f"\n\n{pattern_criteria}"
-            else:
-                combined_instructions = pattern_criteria
-        # Build prompt using builder
-        prompt = self.prompt_builder.build_user_prompt(
-            task=task_obj,
-            context=expansion_ctx,
-            user_instructions=combined_instructions if combined_instructions else None,
-        )
-        try:
-            # Get provider and generate text response
-            provider = self.llm_service.get_provider(self.config.provider)
-            # Resolve TDD mode from session workflow state or config
-            # Epics never use TDD mode
-            tdd_mode = self._resolve_tdd_mode(session_id, task_obj.task_type)
-            # Note: TDD transformation is applied separately via apply_tdd command.
-            # The expand_task only creates plain subtasks.
-            response = await provider.generate_text(
-                prompt=prompt,
-                system_prompt=self.prompt_builder.get_system_prompt(tdd_mode=tdd_mode),
-                model=self.config.model,
-            )
-            logger.debug(f"LLM response (first 500 chars): {response[:500]}")
-            # Parse JSON from response
-            subtask_specs = self._parse_subtasks(response)
-            logger.debug(f"Parsed {len(subtask_specs)} subtask specs")
-            if not subtask_specs:
-                logger.warning(f"No subtasks parsed from response for {task_id}")
-                return {
-                    "subtask_ids": [],
-                    "subtask_count": 0,
-                    "raw_response": response,
-                    "error": "No subtasks found in response",
-                }
-            # Create tasks with dependency wiring and precise criteria
-            # Note: TDD transformation is done separately via apply_tdd command
-            subtask_ids = await self._create_subtasks(
-                parent_task_id=task_id,
-                project_id=task_obj.project_id,
-                subtask_specs=subtask_specs,
-                expansion_context=expansion_ctx,
-                parent_labels=task_obj.labels or [],
-            )
-            # Save expansion context to the parent task for audit/reuse
-            self._save_expansion_context(task_id, expansion_ctx)
-            logger.info(f"Expansion complete for {task_id}: created {len(subtask_ids)} subtasks")
-            return {
-                "subtask_ids": subtask_ids,
-                "subtask_count": len(subtask_ids),
-                "raw_response": response,
-            }
-        except Exception as e:
-            error_msg = str(e) or f"{type(e).__name__}: (no message)"
-            logger.error(f"Failed to expand task {task_id}: {error_msg}", exc_info=True)
-            return {"error": error_msg, "subtask_ids": [], "subtask_count": 0}
-    # Patterns that indicate a test task (case-insensitive)
-    TEST_TASK_PATTERNS = (
-        r"^write\s+tests?\s+for",
-        r"^add\s+(?:unit\s+)?tests?\s+for",
-        r"^create\s+(?:unit\s+)?tests?",
-        r"^unit\s+tests?\s+for",
-        r"^integration\s+tests?\s+for",
-        r"^test\s+(?:the\s+)?",
-        r"^verify\s+with\s+tests?",
-        r"tests?\s+for\s+.*(?:class|function|method|module)",
-    )
-    def _is_test_task(self, title: str, category: str | None) -> bool:
-        """Check if a subtask is a test task that should be filtered out.
-        TDD sandwich pattern creates test tasks automatically. LLM-generated
-        test tasks would cause duplicates and should be filtered.
-        Args:
-            title: The subtask title
-            category: The subtask category (if provided)
-        Returns:
-            True if this is a test task that should be filtered
-        """
-        # Don't filter refactor tasks - they may legitimately update existing tests
-        if category and category.lower() == "refactor":
-            return False
-        # Filter by category=test
-        if category and category.lower() == "test":
-            return True
-        # Filter by title patterns (only when category is not explicitly set to refactor)
-        title_lower = title.lower().strip()
-        for pattern in self.TEST_TASK_PATTERNS:
-            if re.search(pattern, title_lower, re.IGNORECASE):
-                return True
-        return False
-    def _parse_subtasks(self, response: str) -> list[SubtaskSpec]:
-        """
-        Parse subtask specifications from LLM JSON response.
-        Filters out test tasks since TDD sandwich creates them automatically.
-        Args:
-            response: Raw LLM response text (should be JSON)
-        Returns:
-            List of SubtaskSpec objects parsed from the response
-        """
-        # Try to extract JSON from the response
-        json_str = self._extract_json(response)
-        if not json_str:
-            logger.warning("No JSON found in response")
-            return []
-        try:
-            data = json.loads(json_str)
-        except json.JSONDecodeError as e:
-            logger.error(f"Failed to parse JSON: {e}")
-            return []
-        # Extract subtasks array
-        subtasks_data = data.get("subtasks", [])
-        if not isinstance(subtasks_data, list):
-            logger.warning(f"Expected 'subtasks' to be a list, got {type(subtasks_data)}")
-            return []
-        # Parse each subtask, filtering out test tasks
-        subtask_specs = []
-        filtered_count = 0
-        for i, item in enumerate(subtasks_data):
-            if not isinstance(item, dict):
-                logger.warning(f"Subtask {i} is not a dict, skipping")
-                continue
-            if "title" not in item:
-                logger.warning(f"Subtask {i} missing title, skipping")
-                continue
-            title = item["title"]
-            category = item.get("category")
-            # Filter out test tasks - TDD sandwich creates them automatically
-            if self._is_test_task(title, category):
-                logger.debug(f"Filtered test task: '{title}' (category={category})")
-                filtered_count += 1
-                continue
-            spec = SubtaskSpec(
-                title=title,
-                description=item.get("description"),
-                priority=item.get("priority", 2),
-                task_type=item.get("task_type", "task"),
-                category=category,
-                validation=item.get("validation"),
-                depends_on=item.get("depends_on"),
-            )
-            subtask_specs.append(spec)
-        if filtered_count > 0:
-            logger.debug(f"Filtered {filtered_count} test tasks from LLM output")
-        return subtask_specs
-    def _extract_json(self, text: str) -> str | None:
-        """Extract JSON from text. Delegates to shared utility."""
-        return extract_json_from_text(text)
-    async def _create_subtasks(
-        self,
-        parent_task_id: str,
-        project_id: str,
-        subtask_specs: list[SubtaskSpec],
-        expansion_context: ExpansionContext | None = None,
-        parent_labels: list[str] | None = None,
-    ) -> list[str]:
-        """
-        Create tasks from parsed subtask specifications.
-        Handles dependency wiring by mapping depends_on indices to task IDs.
-        Generates precise validation criteria using expansion context.
-        Note: TDD transformation is NOT done here. Use apply_tdd separately
-        to transform code tasks into test/implement/refactor triplets.
-        Args:
-            parent_task_id: ID of the parent task
-            project_id: Project ID for the new tasks
-            subtask_specs: List of parsed subtask specifications
-            expansion_context: Context gathered during expansion (for criteria generation)
-            parent_labels: Labels from the parent task (for pattern detection)
-        Returns:
-            List of created task IDs
-        """
-        created_ids: list[str] = []
-        dep_manager = TaskDependencyManager(self.task_manager.db)
-        # Map subtask_spec index to task ID for dependency wiring
-        spec_index_to_id: dict[int, str] = {}
-        for i, spec in enumerate(subtask_specs):
-            # Build description
-            description = spec.description or ""
-            # Use validation from LLM output directly as validation_criteria
-            # This replaces the post-expansion generate_criteria() loop
-            validation_criteria = spec.validation
-            # If no validation from LLM and context available, generate precise criteria
-            if not validation_criteria and expansion_context:
-                precise_criteria = await self._generate_precise_criteria(
-                    spec=spec,
-                    context=expansion_context,
-                    parent_labels=parent_labels or [],
-                )
-                if precise_criteria:
-                    validation_criteria = precise_criteria
-            # Create the task with validation_criteria from LLM output
-            task = self.task_manager.create_task(
-                title=spec.title,
-                description=description if description else None,
-                project_id=project_id,
-                priority=spec.priority,
-                task_type=spec.task_type,
-                parent_task_id=parent_task_id,
-                category=spec.category,
-                validation_criteria=validation_criteria,
-            )
-            created_ids.append(task.id)
-            logger.debug(f"Created subtask {task.id}: {spec.title}")
-            spec_index_to_id[i] = task.id
-            # Add dependencies
-            if spec.depends_on:
-                for dep_idx in spec.depends_on:
-                    if dep_idx in spec_index_to_id:
-                        blocker_id = spec_index_to_id[dep_idx]
-                        try:
-                            dep_manager.add_dependency(task.id, blocker_id, "blocks")
-                            logger.debug(f"Added dependency: {task.id} blocked by {blocker_id}")
-                        except Exception as e:
-                            logger.warning(f"Failed to add dependency: {e}")
-                    else:
-                        logger.warning(
-                            f"Subtask {i} references invalid or forward index {dep_idx}, skipping dependency"
-                        )
-        return created_ids
-    def _save_expansion_context(
-        self,
-        task_id: str,
-        context: "ExpansionContext",
-    ) -> None:
-        """
-        Save expansion context to the task for audit and reuse.
-        Stores web research results and other context in the task's
-        expansion_context field as JSON.
-        Args:
-            task_id: ID of the task to update
-            context: The expansion context to save
-        """
-        try:
-            # Build a slim context dict focused on web research
-            context_data: dict[str, Any] = {}
-            if context.web_research:
-                context_data["web_research"] = context.web_research
-            if context.agent_findings:
-                context_data["agent_findings"] = context.agent_findings
-            if context.relevant_files:
-                context_data["relevant_files"] = context.relevant_files
-            if not context_data:
-                logger.debug(f"No expansion context to save for {task_id}")
-                return
-            # Serialize and update the task
-            context_json = json.dumps(context_data)
-            self.task_manager.update_task(task_id, expansion_context=context_json)
-            logger.debug(f"Saved expansion context for {task_id} ({len(context_json)} bytes)")
-        except Exception as e:
-            logger.warning(f"Failed to save expansion context for {task_id}: {e}")
-    async def _generate_precise_criteria(
-        self,
-        spec: SubtaskSpec,
-        context: ExpansionContext,
-        parent_labels: list[str],
-    ) -> str:
-        """
-        Generate precise validation criteria for a subtask using full expansion context.
-        Args:
-            spec: The subtask specification
-            context: Full expansion context with verification commands, signatures, etc.
-            parent_labels: Labels from the parent task (for pattern detection)
-        Returns:
-            Markdown-formatted validation criteria string
-        """
-        criteria_parts: list[str] = []
-        # 1. Start with pattern-specific criteria from parent labels
-        pattern_criteria = self.criteria_injector.inject_for_labels(
-            labels=parent_labels,
-            extra_placeholders=context.verification_commands,
-        )
-        if pattern_criteria:
-            criteria_parts.append(pattern_criteria)
-        # 2. Add base criteria from category if present
-        if spec.category:
-            # Substitute verification commands into category
-            strategy = spec.category
-            if context.verification_commands:
-                for name, cmd in context.verification_commands.items():
-                    strategy = strategy.replace(f"{{{name}}}", f"`{cmd}`")
-            criteria_parts.append(f"## Test Strategy\n\n- [ ] {strategy}")
-        # 3. Add file-specific criteria if relevant files are mentioned
-        if context.relevant_files and spec.description:
-            relevant_for_subtask = [
-                f
-                for f in context.relevant_files
-                if f.lower() in (spec.title + (spec.description or "")).lower()
-            ]
-            if relevant_for_subtask:
-                file_criteria = ["## File Requirements", ""]
-                for f in relevant_for_subtask:
-                    file_criteria.append(f"- [ ] `{f}` is correctly modified/created")
-                criteria_parts.append("\n".join(file_criteria))
-        # 4. Add function signature criteria if applicable
-        if context.function_signatures and spec.description:
-            desc_lower = (spec.description or "").lower()
-            for _file_path, signatures in context.function_signatures.items():
-                for sig in signatures:
-                    if not sig:
-                        continue
-                    # Extract function name robustly using regex
-                    # Handles: "def func_name(", "async def func_name(", "func_name("
-                    func_name = None
-                    # Try regex patterns first
-                    match = re.search(r"(?:async\s+)?def\s+(\w+)", sig)
-                    if match:
-                        func_name = match.group(1)
-                    else:
-                        # Fallback: try to get name before first paren
-                        match = re.search(r"(\w+)\s*\(", sig)
-                        if match:
-                            func_name = match.group(1)
-                        else:
-                            # Last resort: use existing split logic
-                            try:
-                                func_name = (
-                                    sig.split("(")[0].split()[-1] if "(" in sig else sig.split()[-1]
-                                )
-                            except (IndexError, AttributeError):
-                                continue
-                    if func_name and func_name.lower() in desc_lower:
-                        criteria_parts.append(
-                            f"## Function Integrity\n\n"
-                            f"- [ ] `{func_name}` signature preserved or updated as intended"
-                        )
-                        break
-        # 5. Add verification command criteria
-        if context.verification_commands:
-            verification_criteria = ["## Verification", ""]
-            for name, cmd in context.verification_commands.items():
-                if name in ["unit_tests", "type_check", "lint"]:
-                    verification_criteria.append(f"- [ ] `{cmd}` passes")
-            if len(verification_criteria) > 2:  # Has items beyond header
-                criteria_parts.append("\n".join(verification_criteria))
-        return "\n\n".join(criteria_parts) if criteria_parts else ""

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl

gobby 0.2.5__py3-none-any.whl → 0.2.7__py3-none-any.whl