gobby-0.2.5-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gobby/__init__.py +3 -0
- gobby/adapters/__init__.py +30 -0
- gobby/adapters/base.py +93 -0
- gobby/adapters/claude_code.py +276 -0
- gobby/adapters/codex.py +1292 -0
- gobby/adapters/gemini.py +343 -0
- gobby/agents/__init__.py +37 -0
- gobby/agents/codex_session.py +120 -0
- gobby/agents/constants.py +112 -0
- gobby/agents/context.py +362 -0
- gobby/agents/definitions.py +133 -0
- gobby/agents/gemini_session.py +111 -0
- gobby/agents/registry.py +618 -0
- gobby/agents/runner.py +968 -0
- gobby/agents/session.py +259 -0
- gobby/agents/spawn.py +916 -0
- gobby/agents/spawners/__init__.py +77 -0
- gobby/agents/spawners/base.py +142 -0
- gobby/agents/spawners/cross_platform.py +266 -0
- gobby/agents/spawners/embedded.py +225 -0
- gobby/agents/spawners/headless.py +226 -0
- gobby/agents/spawners/linux.py +125 -0
- gobby/agents/spawners/macos.py +277 -0
- gobby/agents/spawners/windows.py +308 -0
- gobby/agents/tty_config.py +319 -0
- gobby/autonomous/__init__.py +32 -0
- gobby/autonomous/progress_tracker.py +447 -0
- gobby/autonomous/stop_registry.py +269 -0
- gobby/autonomous/stuck_detector.py +383 -0
- gobby/cli/__init__.py +67 -0
- gobby/cli/__main__.py +8 -0
- gobby/cli/agents.py +529 -0
- gobby/cli/artifacts.py +266 -0
- gobby/cli/daemon.py +329 -0
- gobby/cli/extensions.py +526 -0
- gobby/cli/github.py +263 -0
- gobby/cli/init.py +53 -0
- gobby/cli/install.py +614 -0
- gobby/cli/installers/__init__.py +37 -0
- gobby/cli/installers/antigravity.py +65 -0
- gobby/cli/installers/claude.py +363 -0
- gobby/cli/installers/codex.py +192 -0
- gobby/cli/installers/gemini.py +294 -0
- gobby/cli/installers/git_hooks.py +377 -0
- gobby/cli/installers/shared.py +737 -0
- gobby/cli/linear.py +250 -0
- gobby/cli/mcp.py +30 -0
- gobby/cli/mcp_proxy.py +698 -0
- gobby/cli/memory.py +304 -0
- gobby/cli/merge.py +384 -0
- gobby/cli/projects.py +79 -0
- gobby/cli/sessions.py +622 -0
- gobby/cli/tasks/__init__.py +30 -0
- gobby/cli/tasks/_utils.py +658 -0
- gobby/cli/tasks/ai.py +1025 -0
- gobby/cli/tasks/commits.py +169 -0
- gobby/cli/tasks/crud.py +685 -0
- gobby/cli/tasks/deps.py +135 -0
- gobby/cli/tasks/labels.py +63 -0
- gobby/cli/tasks/main.py +273 -0
- gobby/cli/tasks/search.py +178 -0
- gobby/cli/tui.py +34 -0
- gobby/cli/utils.py +513 -0
- gobby/cli/workflows.py +927 -0
- gobby/cli/worktrees.py +481 -0
- gobby/config/__init__.py +129 -0
- gobby/config/app.py +551 -0
- gobby/config/extensions.py +167 -0
- gobby/config/features.py +472 -0
- gobby/config/llm_providers.py +98 -0
- gobby/config/logging.py +66 -0
- gobby/config/mcp.py +346 -0
- gobby/config/persistence.py +247 -0
- gobby/config/servers.py +141 -0
- gobby/config/sessions.py +250 -0
- gobby/config/tasks.py +784 -0
- gobby/hooks/__init__.py +104 -0
- gobby/hooks/artifact_capture.py +213 -0
- gobby/hooks/broadcaster.py +243 -0
- gobby/hooks/event_handlers.py +723 -0
- gobby/hooks/events.py +218 -0
- gobby/hooks/git.py +169 -0
- gobby/hooks/health_monitor.py +171 -0
- gobby/hooks/hook_manager.py +856 -0
- gobby/hooks/hook_types.py +575 -0
- gobby/hooks/plugins.py +813 -0
- gobby/hooks/session_coordinator.py +396 -0
- gobby/hooks/verification_runner.py +268 -0
- gobby/hooks/webhooks.py +339 -0
- gobby/install/claude/commands/gobby/bug.md +51 -0
- gobby/install/claude/commands/gobby/chore.md +51 -0
- gobby/install/claude/commands/gobby/epic.md +52 -0
- gobby/install/claude/commands/gobby/eval.md +235 -0
- gobby/install/claude/commands/gobby/feat.md +49 -0
- gobby/install/claude/commands/gobby/nit.md +52 -0
- gobby/install/claude/commands/gobby/ref.md +52 -0
- gobby/install/claude/hooks/HOOK_SCHEMAS.md +632 -0
- gobby/install/claude/hooks/hook_dispatcher.py +364 -0
- gobby/install/claude/hooks/validate_settings.py +102 -0
- gobby/install/claude/hooks-template.json +118 -0
- gobby/install/codex/hooks/hook_dispatcher.py +153 -0
- gobby/install/codex/prompts/forget.md +7 -0
- gobby/install/codex/prompts/memories.md +7 -0
- gobby/install/codex/prompts/recall.md +7 -0
- gobby/install/codex/prompts/remember.md +13 -0
- gobby/install/gemini/hooks/hook_dispatcher.py +268 -0
- gobby/install/gemini/hooks-template.json +138 -0
- gobby/install/shared/plugins/code_guardian.py +456 -0
- gobby/install/shared/plugins/example_notify.py +331 -0
- gobby/integrations/__init__.py +10 -0
- gobby/integrations/github.py +145 -0
- gobby/integrations/linear.py +145 -0
- gobby/llm/__init__.py +40 -0
- gobby/llm/base.py +120 -0
- gobby/llm/claude.py +578 -0
- gobby/llm/claude_executor.py +503 -0
- gobby/llm/codex.py +322 -0
- gobby/llm/codex_executor.py +513 -0
- gobby/llm/executor.py +316 -0
- gobby/llm/factory.py +34 -0
- gobby/llm/gemini.py +258 -0
- gobby/llm/gemini_executor.py +339 -0
- gobby/llm/litellm.py +287 -0
- gobby/llm/litellm_executor.py +303 -0
- gobby/llm/resolver.py +499 -0
- gobby/llm/service.py +236 -0
- gobby/mcp_proxy/__init__.py +29 -0
- gobby/mcp_proxy/actions.py +175 -0
- gobby/mcp_proxy/daemon_control.py +198 -0
- gobby/mcp_proxy/importer.py +436 -0
- gobby/mcp_proxy/lazy.py +325 -0
- gobby/mcp_proxy/manager.py +798 -0
- gobby/mcp_proxy/metrics.py +609 -0
- gobby/mcp_proxy/models.py +139 -0
- gobby/mcp_proxy/registries.py +215 -0
- gobby/mcp_proxy/schema_hash.py +381 -0
- gobby/mcp_proxy/semantic_search.py +706 -0
- gobby/mcp_proxy/server.py +549 -0
- gobby/mcp_proxy/services/__init__.py +0 -0
- gobby/mcp_proxy/services/fallback.py +306 -0
- gobby/mcp_proxy/services/recommendation.py +224 -0
- gobby/mcp_proxy/services/server_mgmt.py +214 -0
- gobby/mcp_proxy/services/system.py +72 -0
- gobby/mcp_proxy/services/tool_filter.py +231 -0
- gobby/mcp_proxy/services/tool_proxy.py +309 -0
- gobby/mcp_proxy/stdio.py +565 -0
- gobby/mcp_proxy/tools/__init__.py +27 -0
- gobby/mcp_proxy/tools/agents.py +1103 -0
- gobby/mcp_proxy/tools/artifacts.py +207 -0
- gobby/mcp_proxy/tools/hub.py +335 -0
- gobby/mcp_proxy/tools/internal.py +337 -0
- gobby/mcp_proxy/tools/memory.py +543 -0
- gobby/mcp_proxy/tools/merge.py +422 -0
- gobby/mcp_proxy/tools/metrics.py +283 -0
- gobby/mcp_proxy/tools/orchestration/__init__.py +23 -0
- gobby/mcp_proxy/tools/orchestration/cleanup.py +619 -0
- gobby/mcp_proxy/tools/orchestration/monitor.py +380 -0
- gobby/mcp_proxy/tools/orchestration/orchestrate.py +746 -0
- gobby/mcp_proxy/tools/orchestration/review.py +736 -0
- gobby/mcp_proxy/tools/orchestration/utils.py +16 -0
- gobby/mcp_proxy/tools/session_messages.py +1056 -0
- gobby/mcp_proxy/tools/task_dependencies.py +219 -0
- gobby/mcp_proxy/tools/task_expansion.py +591 -0
- gobby/mcp_proxy/tools/task_github.py +393 -0
- gobby/mcp_proxy/tools/task_linear.py +379 -0
- gobby/mcp_proxy/tools/task_orchestration.py +77 -0
- gobby/mcp_proxy/tools/task_readiness.py +522 -0
- gobby/mcp_proxy/tools/task_sync.py +351 -0
- gobby/mcp_proxy/tools/task_validation.py +843 -0
- gobby/mcp_proxy/tools/tasks/__init__.py +25 -0
- gobby/mcp_proxy/tools/tasks/_context.py +112 -0
- gobby/mcp_proxy/tools/tasks/_crud.py +516 -0
- gobby/mcp_proxy/tools/tasks/_factory.py +176 -0
- gobby/mcp_proxy/tools/tasks/_helpers.py +129 -0
- gobby/mcp_proxy/tools/tasks/_lifecycle.py +517 -0
- gobby/mcp_proxy/tools/tasks/_lifecycle_validation.py +301 -0
- gobby/mcp_proxy/tools/tasks/_resolution.py +55 -0
- gobby/mcp_proxy/tools/tasks/_search.py +215 -0
- gobby/mcp_proxy/tools/tasks/_session.py +125 -0
- gobby/mcp_proxy/tools/workflows.py +973 -0
- gobby/mcp_proxy/tools/worktrees.py +1264 -0
- gobby/mcp_proxy/transports/__init__.py +0 -0
- gobby/mcp_proxy/transports/base.py +95 -0
- gobby/mcp_proxy/transports/factory.py +44 -0
- gobby/mcp_proxy/transports/http.py +139 -0
- gobby/mcp_proxy/transports/stdio.py +213 -0
- gobby/mcp_proxy/transports/websocket.py +136 -0
- gobby/memory/backends/__init__.py +116 -0
- gobby/memory/backends/mem0.py +408 -0
- gobby/memory/backends/memu.py +485 -0
- gobby/memory/backends/null.py +111 -0
- gobby/memory/backends/openmemory.py +537 -0
- gobby/memory/backends/sqlite.py +304 -0
- gobby/memory/context.py +87 -0
- gobby/memory/manager.py +1001 -0
- gobby/memory/protocol.py +451 -0
- gobby/memory/search/__init__.py +66 -0
- gobby/memory/search/text.py +127 -0
- gobby/memory/viz.py +258 -0
- gobby/prompts/__init__.py +13 -0
- gobby/prompts/defaults/expansion/system.md +119 -0
- gobby/prompts/defaults/expansion/user.md +48 -0
- gobby/prompts/defaults/external_validation/agent.md +72 -0
- gobby/prompts/defaults/external_validation/external.md +63 -0
- gobby/prompts/defaults/external_validation/spawn.md +83 -0
- gobby/prompts/defaults/external_validation/system.md +6 -0
- gobby/prompts/defaults/features/import_mcp.md +22 -0
- gobby/prompts/defaults/features/import_mcp_github.md +17 -0
- gobby/prompts/defaults/features/import_mcp_search.md +16 -0
- gobby/prompts/defaults/features/recommend_tools.md +32 -0
- gobby/prompts/defaults/features/recommend_tools_hybrid.md +35 -0
- gobby/prompts/defaults/features/recommend_tools_llm.md +30 -0
- gobby/prompts/defaults/features/server_description.md +20 -0
- gobby/prompts/defaults/features/server_description_system.md +6 -0
- gobby/prompts/defaults/features/task_description.md +31 -0
- gobby/prompts/defaults/features/task_description_system.md +6 -0
- gobby/prompts/defaults/features/tool_summary.md +17 -0
- gobby/prompts/defaults/features/tool_summary_system.md +6 -0
- gobby/prompts/defaults/research/step.md +58 -0
- gobby/prompts/defaults/validation/criteria.md +47 -0
- gobby/prompts/defaults/validation/validate.md +38 -0
- gobby/prompts/loader.py +346 -0
- gobby/prompts/models.py +113 -0
- gobby/py.typed +0 -0
- gobby/runner.py +488 -0
- gobby/search/__init__.py +23 -0
- gobby/search/protocol.py +104 -0
- gobby/search/tfidf.py +232 -0
- gobby/servers/__init__.py +7 -0
- gobby/servers/http.py +636 -0
- gobby/servers/models.py +31 -0
- gobby/servers/routes/__init__.py +23 -0
- gobby/servers/routes/admin.py +416 -0
- gobby/servers/routes/dependencies.py +118 -0
- gobby/servers/routes/mcp/__init__.py +24 -0
- gobby/servers/routes/mcp/hooks.py +135 -0
- gobby/servers/routes/mcp/plugins.py +121 -0
- gobby/servers/routes/mcp/tools.py +1337 -0
- gobby/servers/routes/mcp/webhooks.py +159 -0
- gobby/servers/routes/sessions.py +582 -0
- gobby/servers/websocket.py +766 -0
- gobby/sessions/__init__.py +13 -0
- gobby/sessions/analyzer.py +322 -0
- gobby/sessions/lifecycle.py +240 -0
- gobby/sessions/manager.py +563 -0
- gobby/sessions/processor.py +225 -0
- gobby/sessions/summary.py +532 -0
- gobby/sessions/transcripts/__init__.py +41 -0
- gobby/sessions/transcripts/base.py +125 -0
- gobby/sessions/transcripts/claude.py +386 -0
- gobby/sessions/transcripts/codex.py +143 -0
- gobby/sessions/transcripts/gemini.py +195 -0
- gobby/storage/__init__.py +21 -0
- gobby/storage/agents.py +409 -0
- gobby/storage/artifact_classifier.py +341 -0
- gobby/storage/artifacts.py +285 -0
- gobby/storage/compaction.py +67 -0
- gobby/storage/database.py +357 -0
- gobby/storage/inter_session_messages.py +194 -0
- gobby/storage/mcp.py +680 -0
- gobby/storage/memories.py +562 -0
- gobby/storage/merge_resolutions.py +550 -0
- gobby/storage/migrations.py +860 -0
- gobby/storage/migrations_legacy.py +1359 -0
- gobby/storage/projects.py +166 -0
- gobby/storage/session_messages.py +251 -0
- gobby/storage/session_tasks.py +97 -0
- gobby/storage/sessions.py +817 -0
- gobby/storage/task_dependencies.py +223 -0
- gobby/storage/tasks/__init__.py +42 -0
- gobby/storage/tasks/_aggregates.py +180 -0
- gobby/storage/tasks/_crud.py +449 -0
- gobby/storage/tasks/_id.py +104 -0
- gobby/storage/tasks/_lifecycle.py +311 -0
- gobby/storage/tasks/_manager.py +889 -0
- gobby/storage/tasks/_models.py +300 -0
- gobby/storage/tasks/_ordering.py +119 -0
- gobby/storage/tasks/_path_cache.py +110 -0
- gobby/storage/tasks/_queries.py +343 -0
- gobby/storage/tasks/_search.py +143 -0
- gobby/storage/workflow_audit.py +393 -0
- gobby/storage/worktrees.py +547 -0
- gobby/sync/__init__.py +29 -0
- gobby/sync/github.py +333 -0
- gobby/sync/linear.py +304 -0
- gobby/sync/memories.py +284 -0
- gobby/sync/tasks.py +641 -0
- gobby/tasks/__init__.py +8 -0
- gobby/tasks/build_verification.py +193 -0
- gobby/tasks/commits.py +633 -0
- gobby/tasks/context.py +747 -0
- gobby/tasks/criteria.py +342 -0
- gobby/tasks/enhanced_validator.py +226 -0
- gobby/tasks/escalation.py +263 -0
- gobby/tasks/expansion.py +626 -0
- gobby/tasks/external_validator.py +764 -0
- gobby/tasks/issue_extraction.py +171 -0
- gobby/tasks/prompts/expand.py +327 -0
- gobby/tasks/research.py +421 -0
- gobby/tasks/tdd.py +352 -0
- gobby/tasks/tree_builder.py +263 -0
- gobby/tasks/validation.py +712 -0
- gobby/tasks/validation_history.py +357 -0
- gobby/tasks/validation_models.py +89 -0
- gobby/tools/__init__.py +0 -0
- gobby/tools/summarizer.py +170 -0
- gobby/tui/__init__.py +5 -0
- gobby/tui/api_client.py +281 -0
- gobby/tui/app.py +327 -0
- gobby/tui/screens/__init__.py +25 -0
- gobby/tui/screens/agents.py +333 -0
- gobby/tui/screens/chat.py +450 -0
- gobby/tui/screens/dashboard.py +377 -0
- gobby/tui/screens/memory.py +305 -0
- gobby/tui/screens/metrics.py +231 -0
- gobby/tui/screens/orchestrator.py +904 -0
- gobby/tui/screens/sessions.py +412 -0
- gobby/tui/screens/tasks.py +442 -0
- gobby/tui/screens/workflows.py +289 -0
- gobby/tui/screens/worktrees.py +174 -0
- gobby/tui/widgets/__init__.py +21 -0
- gobby/tui/widgets/chat.py +210 -0
- gobby/tui/widgets/conductor.py +104 -0
- gobby/tui/widgets/menu.py +132 -0
- gobby/tui/widgets/message_panel.py +160 -0
- gobby/tui/widgets/review_gate.py +224 -0
- gobby/tui/widgets/task_tree.py +99 -0
- gobby/tui/widgets/token_budget.py +166 -0
- gobby/tui/ws_client.py +258 -0
- gobby/utils/__init__.py +3 -0
- gobby/utils/daemon_client.py +235 -0
- gobby/utils/git.py +222 -0
- gobby/utils/id.py +38 -0
- gobby/utils/json_helpers.py +161 -0
- gobby/utils/logging.py +376 -0
- gobby/utils/machine_id.py +135 -0
- gobby/utils/metrics.py +589 -0
- gobby/utils/project_context.py +182 -0
- gobby/utils/project_init.py +263 -0
- gobby/utils/status.py +256 -0
- gobby/utils/validation.py +80 -0
- gobby/utils/version.py +23 -0
- gobby/workflows/__init__.py +4 -0
- gobby/workflows/actions.py +1310 -0
- gobby/workflows/approval_flow.py +138 -0
- gobby/workflows/artifact_actions.py +103 -0
- gobby/workflows/audit_helpers.py +110 -0
- gobby/workflows/autonomous_actions.py +286 -0
- gobby/workflows/context_actions.py +394 -0
- gobby/workflows/definitions.py +130 -0
- gobby/workflows/detection_helpers.py +208 -0
- gobby/workflows/engine.py +485 -0
- gobby/workflows/evaluator.py +669 -0
- gobby/workflows/git_utils.py +96 -0
- gobby/workflows/hooks.py +169 -0
- gobby/workflows/lifecycle_evaluator.py +613 -0
- gobby/workflows/llm_actions.py +70 -0
- gobby/workflows/loader.py +333 -0
- gobby/workflows/mcp_actions.py +60 -0
- gobby/workflows/memory_actions.py +272 -0
- gobby/workflows/premature_stop.py +164 -0
- gobby/workflows/session_actions.py +139 -0
- gobby/workflows/state_actions.py +123 -0
- gobby/workflows/state_manager.py +104 -0
- gobby/workflows/stop_signal_actions.py +163 -0
- gobby/workflows/summary_actions.py +344 -0
- gobby/workflows/task_actions.py +249 -0
- gobby/workflows/task_enforcement_actions.py +901 -0
- gobby/workflows/templates.py +52 -0
- gobby/workflows/todo_actions.py +84 -0
- gobby/workflows/webhook.py +223 -0
- gobby/workflows/webhook_executor.py +399 -0
- gobby/worktrees/__init__.py +5 -0
- gobby/worktrees/git.py +690 -0
- gobby/worktrees/merge/__init__.py +20 -0
- gobby/worktrees/merge/conflict_parser.py +177 -0
- gobby/worktrees/merge/resolver.py +485 -0
- gobby-0.2.5.dist-info/METADATA +351 -0
- gobby-0.2.5.dist-info/RECORD +383 -0
- gobby-0.2.5.dist-info/WHEEL +5 -0
- gobby-0.2.5.dist-info/entry_points.txt +2 -0
- gobby-0.2.5.dist-info/licenses/LICENSE.md +193 -0
- gobby-0.2.5.dist-info/top_level.txt +1 -0

gobby/storage/artifact_classifier.py
@@ -0,0 +1,341 @@

```python
"""Artifact type classifier.

Automatically classifies content into artifact types:
- code: Programming language code blocks
- file_path: File or directory paths
- error: Error messages and stack traces
- command_output: Terminal/shell command output
- structured_data: JSON, YAML, TOML, XML
- text: Plain text (default)

Also extracts relevant metadata for each type (language, extension, format, etc.)
"""

from __future__ import annotations

import json
import re
from dataclasses import dataclass, field
from enum import Enum
from typing import Any

__all__ = ["ArtifactType", "ClassificationResult", "classify_artifact"]


class ArtifactType(str, Enum):
    """Artifact type enumeration."""

    CODE = "code"
    FILE_PATH = "file_path"
    ERROR = "error"
    COMMAND_OUTPUT = "command_output"
    STRUCTURED_DATA = "structured_data"
    TEXT = "text"


@dataclass
class ClassificationResult:
    """Result of artifact classification."""

    artifact_type: ArtifactType
    metadata: dict[str, Any] = field(default_factory=dict)

    def to_dict(self) -> dict[str, Any]:
        """Convert to dictionary."""
        return {
            "artifact_type": self.artifact_type.value,
            "metadata": self.metadata,
        }


# Language detection patterns (more specific patterns first)
_LANGUAGE_PATTERNS: list[tuple[str, re.Pattern[str]]] = [
    # Python
    (
        "python",
        re.compile(
            r"^\s*(def\s+\w+|class\s+\w+|import\s+\w+|from\s+\w+\s+import|async\s+def\s+\w+|@\w+)",
            re.MULTILINE,
        ),
    ),
    # TypeScript (must be before JavaScript - has interface/type)
    (
        "typescript",
        re.compile(
            r"^\s*(interface\s+\w+|type\s+\w+\s*=|:\s*(string|number|boolean|any)\b)", re.MULTILINE
        ),
    ),
    # JavaScript
    (
        "javascript",
        re.compile(
            r"^\s*(function\s+\w+|const\s+\w+\s*=|let\s+\w+\s*=|var\s+\w+\s*=|=>\s*\{)",
            re.MULTILINE,
        ),
    ),
    # Rust
    (
        "rust",
        re.compile(
            r"^\s*(fn\s+\w+|impl\s+|struct\s+\w+|enum\s+\w+|use\s+\w+|pub\s+fn)", re.MULTILINE
        ),
    ),
    # Go
    ("go", re.compile(r"^\s*(func\s+\w+|func\s+\(\w+|package\s+\w+|import\s+\()", re.MULTILINE)),
    # SQL
    (
        "sql",
        re.compile(
            r"^\s*(SELECT\s+|INSERT\s+INTO|UPDATE\s+\w+\s+SET|DELETE\s+FROM|CREATE\s+TABLE|DROP\s+TABLE)",
            re.IGNORECASE | re.MULTILINE,
        ),
    ),
    # Shell/Bash
    (
        "bash",
        re.compile(
            r"(^#!/bin/(ba)?sh|^\s*for\s+\w+\s+in\s+|^\s*if\s+\[\[?\s+|^\s*while\s+|echo\s+[\"'])",
            re.MULTILINE,
        ),
    ),
]

# Markdown code fence pattern
_CODE_FENCE_PATTERN = re.compile(r"^```(\w*).*?\n(.*?)```", re.DOTALL | re.MULTILINE)

# File path patterns
_UNIX_PATH_PATTERN = re.compile(r"^(/[\w./\-_]+|\.{1,2}/[\w./\-_]+)$")
_WINDOWS_PATH_PATTERN = re.compile(r"^[A-Za-z]:\\[\w\\/.\-_]+$")
_RELATIVE_PATH_PATTERN = re.compile(r"^[\w\-_]+/[\w./\-_]+\.\w+$")

# Error patterns
_ERROR_PATTERNS = [
    re.compile(r"^Traceback \(most recent call last\):", re.MULTILINE),
    re.compile(r"^\w+Error:\s+", re.MULTILINE),
    re.compile(r"^TypeError:\s+", re.MULTILINE),
    re.compile(r"^Exception\s+", re.MULTILINE),
    re.compile(r"^Error:\s+", re.MULTILINE),
    re.compile(r"thread\s+'.*'\s+panicked\s+at", re.MULTILINE),
    re.compile(r"^\s+at\s+[\w.]+\([\w.]+:\d+\)$", re.MULTILINE),  # JS stack trace line
]

# Command output patterns
_COMMAND_OUTPUT_PATTERNS = [
    re.compile(r"^On branch\s+\w+", re.MULTILINE),  # git status
    re.compile(r"^\$ \w+", re.MULTILINE),  # shell prompt
    re.compile(r"^npm\s+(WARN|ERR!?|notice)", re.MULTILINE),  # npm
    re.compile(r"^={3,}\s+test session starts\s+={3,}$", re.MULTILINE),  # pytest
    re.compile(r"^total\s+\d+\s*$", re.MULTILINE),  # ls -l
    re.compile(r"^(d|-)rwx", re.MULTILINE),  # ls -l permissions
    re.compile(r"^added\s+\d+\s+packages?", re.MULTILINE),  # npm install
    re.compile(r"^collected\s+\d+\s+items?", re.MULTILINE),  # pytest
    re.compile(r"^\d+\s+passed", re.MULTILINE),  # pytest results
]


def _detect_language(content: str) -> str | None:
    """Detect programming language from content."""
    for lang, pattern in _LANGUAGE_PATTERNS:
        if pattern.search(content):
            return lang
    return None


def _is_file_path(content: str) -> tuple[bool, dict[str, Any]]:
    """Check if content is a file path and extract metadata."""
    content = content.strip()

    # Don't classify multi-line content as a file path
    if "\n" in content:
        return False, {}

    metadata: dict[str, Any] = {}

    # Check patterns
    if _UNIX_PATH_PATTERN.match(content):
        pass
    elif _WINDOWS_PATH_PATTERN.match(content):
        pass
    elif _RELATIVE_PATH_PATTERN.match(content):
        pass
    else:
        return False, {}

    # Extract filename and extension
    parts = content.replace("\\", "/").split("/")
    filename = parts[-1]
    metadata["filename"] = filename

    if "." in filename:
        ext = filename.rsplit(".", 1)[-1]
        metadata["extension"] = ext
    else:
        metadata["extension"] = None

    return True, metadata


def _is_error(content: str) -> bool:
    """Check if content is an error message or stack trace."""
    for pattern in _ERROR_PATTERNS:
        if pattern.search(content):
            return True
    return False


def _is_command_output(content: str) -> bool:
    """Check if content is command output."""
    for pattern in _COMMAND_OUTPUT_PATTERNS:
        if pattern.search(content):
            return True
    return False


def _is_json(content: str) -> bool:
    """Check if content is valid JSON."""
    content = content.strip()
    if not (content.startswith("{") or content.startswith("[")):
        return False
    try:
        json.loads(content)
        return True
    except (json.JSONDecodeError, ValueError):
        return False


def _is_yaml(content: str) -> bool:
    """Check if content looks like YAML (simple heuristic)."""
    content = content.strip()
    lines = content.split("\n")

    # YAML typically has key: value patterns
    # Must have actual values after the colon (not just colons in prose)
    yaml_kv_pattern = re.compile(r"^\s*[\w\-_]+:\s*\S")
    yaml_list_with_kv_pattern = re.compile(r"^\s*-\s+[\w\-_]+:\s*")

    yaml_kv_lines = 0
    total_non_empty = 0
    for line in lines:
        line = line.strip()
        if not line or line.startswith("#"):
            continue
        total_non_empty += 1
        # Count lines with key: value pattern (not just list items)
        if yaml_kv_pattern.match(line) or yaml_list_with_kv_pattern.match(line):
            yaml_kv_lines += 1

    # Need at least 2 key-value lines and they should be significant portion
    return yaml_kv_lines >= 2 and (yaml_kv_lines / max(total_non_empty, 1)) > 0.3


def _is_toml(content: str) -> bool:
    """Check if content looks like TOML."""
    content = content.strip()

    # TOML has [section] headers and key = value
    section_pattern = re.compile(r"^\s*\[[\w.\-]+\]\s*$", re.MULTILINE)
    kv_pattern = re.compile(r"^\s*[\w\-]+\s*=\s*", re.MULTILINE)

    has_section = section_pattern.search(content) is not None
    has_kv = kv_pattern.search(content) is not None

    return has_section and has_kv


def _is_xml(content: str) -> bool:
    """Check if content looks like XML."""
    content = content.strip()

    # XML starts with <?xml or <tag>
    if content.startswith("<?xml"):
        return True

    # Check for matching opening/closing tags
    tag_pattern = re.compile(r"^<(\w+)[^>]*>.*</\1>", re.DOTALL)
    return tag_pattern.match(content) is not None


def _is_code_block(content: str) -> tuple[bool, dict[str, Any]]:
    """Check if content is a markdown code block and extract language."""
    match = _CODE_FENCE_PATTERN.match(content.strip())
    if match:
        lang = match.group(1).lower() if match.group(1) else None
        return True, {"language": lang} if lang else {}
    return False, {}


def classify_artifact(content: str) -> ClassificationResult:
    """
    Classify content into an artifact type with metadata.

    Args:
        content: The content to classify

    Returns:
        ClassificationResult with artifact_type and extracted metadata
    """
    if not content or not content.strip():
        return ClassificationResult(artifact_type=ArtifactType.TEXT, metadata={})

    # Check for markdown code fence first
    is_code_fence, fence_metadata = _is_code_block(content)
    if is_code_fence:
        metadata = fence_metadata.copy()
        # If no language in fence, try to detect from content
        if "language" not in metadata or not metadata["language"]:
            inner_content = _CODE_FENCE_PATTERN.match(content.strip())
            if inner_content:
                detected_lang = _detect_language(inner_content.group(2))
                if detected_lang:
                    metadata["language"] = detected_lang
        return ClassificationResult(artifact_type=ArtifactType.CODE, metadata=metadata)

    # Check for file path (single line only)
    is_path, path_metadata = _is_file_path(content)
    if is_path:
        return ClassificationResult(artifact_type=ArtifactType.FILE_PATH, metadata=path_metadata)

    # Check for error messages/stack traces
    if _is_error(content):
        metadata = {}
        # Try to extract error type
        error_match = re.search(r"^(\w+Error):", content, re.MULTILINE)
        if error_match:
            metadata["error"] = error_match.group(1)
        return ClassificationResult(artifact_type=ArtifactType.ERROR, metadata=metadata)

    # Check for code patterns BEFORE structured data
    # (TypeScript interfaces look like YAML otherwise)
    detected_lang = _detect_language(content)
    if detected_lang:
        return ClassificationResult(
            artifact_type=ArtifactType.CODE, metadata={"language": detected_lang}
        )

    # Check for structured data formats
    if _is_json(content):
        return ClassificationResult(
            artifact_type=ArtifactType.STRUCTURED_DATA, metadata={"format": "json"}
        )

    if _is_xml(content):
        return ClassificationResult(
            artifact_type=ArtifactType.STRUCTURED_DATA, metadata={"format": "xml"}
        )

    if _is_toml(content):
        return ClassificationResult(
            artifact_type=ArtifactType.STRUCTURED_DATA, metadata={"format": "toml"}
        )

    if _is_yaml(content):
        return ClassificationResult(
            artifact_type=ArtifactType.STRUCTURED_DATA, metadata={"format": "yaml"}
        )

    # Check for command output
    if _is_command_output(content):
        return ClassificationResult(artifact_type=ArtifactType.COMMAND_OUTPUT, metadata={})

    # Default to text
    return ClassificationResult(artifact_type=ArtifactType.TEXT, metadata={})
```
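
A quick usage sketch (not part of the package) to make the classifier's priority order concrete: a fenced code block wins first, then file paths, errors, bare code, structured data, and command output, with plain text as the fallback. The sample inputs below are illustrative only.

```python
from gobby.storage.artifact_classifier import classify_artifact

fence = "`" * 3  # markdown code fence
samples = [
    f"{fence}python\nprint('hi')\n{fence}",                   # fenced block -> code (language: python)
    "src/gobby/storage/artifacts.py",                         # relative path -> file_path
    "Traceback (most recent call last):\nValueError: boom",   # stack trace -> error
    '{"ok": true, "count": 3}',                               # valid JSON -> structured_data
    "$ git status\nOn branch main",                           # shell prompt / git status -> command_output
    "just a sentence",                                        # fallback -> text
]

for content in samples:
    result = classify_artifact(content)
    print(result.artifact_type.value, result.metadata)
```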

gobby/storage/artifacts.py
@@ -0,0 +1,285 @@

```python
"""
Session artifacts storage module.

Stores code snippets, diffs, errors, and other artifacts from sessions
with optional FTS5 full-text search support.
"""

import json
import logging
import sqlite3
from collections.abc import Callable
from dataclasses import dataclass
from datetime import UTC, datetime
from typing import Any

from gobby.storage.database import DatabaseProtocol
from gobby.utils.id import generate_prefixed_id

logger = logging.getLogger(__name__)


@dataclass
class Artifact:
    """A session artifact representing code, diff, error, or other content."""

    id: str
    session_id: str
    artifact_type: str
    content: str
    created_at: str
    metadata: dict[str, Any] | None = None
    source_file: str | None = None
    line_start: int | None = None
    line_end: int | None = None

    @classmethod
    def from_row(cls, row: sqlite3.Row) -> "Artifact":
        """Create an Artifact from a database row."""
        metadata_json = row["metadata_json"]
        metadata = json.loads(metadata_json) if metadata_json else None

        return cls(
            id=row["id"],
            session_id=row["session_id"],
            artifact_type=row["artifact_type"],
            content=row["content"],
            created_at=row["created_at"],
            metadata=metadata,
            source_file=row["source_file"],
            line_start=row["line_start"],
            line_end=row["line_end"],
        )

    def to_dict(self) -> dict[str, Any]:
        """Convert artifact to dictionary for serialization."""
        return {
            "id": self.id,
            "session_id": self.session_id,
            "artifact_type": self.artifact_type,
            "content": self.content,
            "created_at": self.created_at,
            "metadata": self.metadata,
            "source_file": self.source_file,
            "line_start": self.line_start,
            "line_end": self.line_end,
        }


class LocalArtifactManager:
    """Manages session artifacts in local SQLite database."""

    def __init__(self, db: DatabaseProtocol):
        self.db = db
        self._change_listeners: list[Callable[[], Any]] = []

    def add_change_listener(self, listener: Callable[[], Any]) -> None:
        """Add a change listener that will be called on create/delete."""
        self._change_listeners.append(listener)

    def _notify_listeners(self) -> None:
        """Notify all change listeners."""
        for listener in self._change_listeners:
            try:
                listener()
            except Exception as e:
                logger.error(f"Error in artifact change listener: {e}")

    def create_artifact(
        self,
        session_id: str,
        artifact_type: str,
        content: str,
        metadata: dict[str, Any] | None = None,
        source_file: str | None = None,
        line_start: int | None = None,
        line_end: int | None = None,
    ) -> Artifact:
        """Create a new artifact.

        Args:
            session_id: ID of the session this artifact belongs to
            artifact_type: Type of artifact (code, diff, error, etc.)
            content: The artifact content
            metadata: Optional metadata dict
            source_file: Optional source file path
            line_start: Optional starting line number
            line_end: Optional ending line number

        Returns:
            The created Artifact
        """
        now = datetime.now(UTC).isoformat()
        artifact_id = generate_prefixed_id("art", content[:50] + session_id)

        metadata_json = json.dumps(metadata) if metadata else None

        with self.db.transaction() as conn:
            conn.execute(
                """
                INSERT INTO session_artifacts (
                    id, session_id, artifact_type, content, metadata_json,
                    source_file, line_start, line_end, created_at
                ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)
                """,
                (
                    artifact_id,
                    session_id,
                    artifact_type,
                    content,
                    metadata_json,
                    source_file,
                    line_start,
                    line_end,
                    now,
                ),
            )
            # Also insert into FTS5 table for full-text search
            conn.execute(
                "INSERT INTO session_artifacts_fts (id, content) VALUES (?, ?)",
                (artifact_id, content),
            )

        self._notify_listeners()
        return self.get_artifact(artifact_id)  # type: ignore[return-value]

    def get_artifact(self, artifact_id: str) -> Artifact | None:
        """Get an artifact by ID.

        Args:
            artifact_id: The artifact ID

        Returns:
            The Artifact if found, None otherwise
        """
        row = self.db.fetchone("SELECT * FROM session_artifacts WHERE id = ?", (artifact_id,))
        if not row:
            return None
        return Artifact.from_row(row)

    def list_artifacts(
        self,
        session_id: str | None = None,
        artifact_type: str | None = None,
        limit: int = 100,
        offset: int = 0,
    ) -> list[Artifact]:
        """List artifacts with optional filters.

        Args:
            session_id: Filter by session ID
            artifact_type: Filter by artifact type
            limit: Maximum number of results
            offset: Offset for pagination

        Returns:
            List of matching Artifacts
        """
        query = "SELECT * FROM session_artifacts WHERE 1=1"
        params: list[Any] = []

        if session_id:
            query += " AND session_id = ?"
            params.append(session_id)

        if artifact_type:
            query += " AND artifact_type = ?"
            params.append(artifact_type)

        query += " ORDER BY created_at DESC LIMIT ? OFFSET ?"
        params.extend([limit, offset])

        rows = self.db.fetchall(query, tuple(params))
        return [Artifact.from_row(row) for row in rows]

    def delete_artifact(self, artifact_id: str) -> bool:
        """Delete an artifact by ID.

        Args:
            artifact_id: The artifact ID to delete

        Returns:
            True if deleted, False if not found
        """
        with self.db.transaction() as conn:
            cursor = conn.execute("DELETE FROM session_artifacts WHERE id = ?", (artifact_id,))
            if cursor.rowcount == 0:
                return False
            # Also delete from FTS5 table
            conn.execute("DELETE FROM session_artifacts_fts WHERE id = ?", (artifact_id,))

        self._notify_listeners()
        return True

    def search_artifacts(
        self,
        query_text: str,
        session_id: str | None = None,
        artifact_type: str | None = None,
        limit: int = 50,
    ) -> list[Artifact]:
        """Search artifacts by content using FTS5 full-text search.

        Uses FTS5 MATCH query on session_artifacts_fts with bm25 ranking.
        Can optionally filter by session_id and/or artifact_type.

        Args:
            query_text: The search query text
            session_id: Optional session ID filter
            artifact_type: Optional artifact type filter
            limit: Maximum number of results (default: 50)

        Returns:
            List of matching Artifacts ordered by relevance (bm25 ranking)
        """
        # Empty query returns empty results
        if not query_text or not query_text.strip():
            return []

        # Escape FTS5 special characters and build query
        # Split into words and add prefix matching for each term
        words = query_text.strip().split()
        if not words:
            return []

        # Build FTS5 query: each word becomes a prefix search term
        # e.g., "calculate total" -> "calculate* total*"
        fts_terms = []
        for word in words:
            # Remove FTS5 special chars that would break syntax: * ^ " ( ) AND OR NOT
            # Keep only alphanumeric and safe punctuation
            sanitized = ""
            for char in word:
                if char.isalnum() or char in "-_":
                    sanitized += char
            if sanitized:
                fts_terms.append(f"{sanitized}*")

        if not fts_terms:
            return []

        fts_query = " ".join(fts_terms)

        # Use FTS5 MATCH query with JOIN to main table
        # Order by bm25() for relevance ranking (lower bm25 = more relevant)
        sql = """
            SELECT sa.*
            FROM session_artifacts sa
            INNER JOIN session_artifacts_fts fts ON sa.id = fts.id
            WHERE fts.content MATCH ?
        """
        params: list[Any] = [fts_query]

        if session_id:
            sql += " AND sa.session_id = ?"
            params.append(session_id)

        if artifact_type:
            sql += " AND sa.artifact_type = ?"
            params.append(artifact_type)

        sql += " ORDER BY bm25(session_artifacts_fts) LIMIT ?"
        params.append(limit)

        rows = self.db.fetchall(sql, tuple(params))
        return [Artifact.from_row(row) for row in rows]
```
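
A minimal, hypothetical usage sketch of `LocalArtifactManager` (not taken from the package): it assumes `db` is a `DatabaseProtocol` implementation whose schema already contains the `session_artifacts` table and the `session_artifacts_fts` FTS5 table, presumably created by gobby's own migrations.

```python
from gobby.storage.artifacts import LocalArtifactManager

def capture_traceback(db, session_id: str, traceback_text: str) -> None:
    # `db` is an assumption: any DatabaseProtocol object with the artifact tables migrated.
    manager = LocalArtifactManager(db)
    manager.add_change_listener(lambda: print("artifact store changed"))

    artifact = manager.create_artifact(
        session_id=session_id,
        artifact_type="error",              # free-form type string
        content=traceback_text,
        metadata={"captured_by": "hook"},   # persisted as metadata_json
    )

    # Prefix-matched FTS5 search ("zerodiv" becomes "zerodiv*"), bm25-ranked
    hits = manager.search_artifacts("zerodiv", session_id=session_id)
    print(artifact.id, [hit.id for hit in hits])
```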

gobby/storage/compaction.py
@@ -0,0 +1,67 @@

```python
"""Task compaction logic."""

from datetime import UTC, datetime, timedelta
from typing import Any

from gobby.storage.tasks import LocalTaskManager


class TaskCompactor:
    """Handles compaction of old closed tasks."""

    def __init__(self, task_manager: LocalTaskManager) -> None:
        self.task_manager = task_manager

    def find_candidates(self, days_closed: int = 30) -> list[dict[str, Any]]:
        """
        Find tasks that have been closed for longer than the specified days
        and haven't been compacted yet.
        """
        cutoff = datetime.now(UTC) - timedelta(days=days_closed)
        cutoff_str = cutoff.isoformat()

        # Query directly since we need custom filtering not exposed by list_tasks
        sql = """
            SELECT * FROM tasks
            WHERE status = 'closed'
            AND updated_at < ?
            AND compacted_at IS NULL
            ORDER BY updated_at ASC
        """
        rows = self.task_manager.db.fetchall(sql, (cutoff_str,))
        return [dict(row) for row in rows]

    def compact_task(self, task_id: str, summary: str) -> None:
        """
        Compact a task by replacing its description with a summary.
        """
        # Update database directly to set compacted_at
        now = datetime.now(UTC).isoformat()

        # We preserve the title but replace description with summary
        # and mark it as compacted.
        sql = """
            UPDATE tasks
            SET description = ?,
                summary = ?,
                compacted_at = ?,
                updated_at = ?
            WHERE id = ?
        """

        self.task_manager.db.execute(sql, (summary, summary, now, now, task_id))
        self.task_manager._notify_listeners()

    def get_stats(self) -> dict[str, Any]:
        """Get compaction statistics."""
        sql_total = "SELECT COUNT(*) as c FROM tasks WHERE status = 'closed'"
        sql_compacted = "SELECT COUNT(*) as c FROM tasks WHERE compacted_at IS NOT NULL"

        total = (self.task_manager.db.fetchone(sql_total) or {"c": 0})["c"]
        compacted = (self.task_manager.db.fetchone(sql_compacted) or {"c": 0})["c"]

        return {
            "total_closed": total,
            "compacted": compacted,
            "rate": round(compacted / total * 100, 1) if total > 0 else 0,
        }
```
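
And a hypothetical sketch of how `TaskCompactor` might be driven (not from the package): `task_manager` is assumed to be an initialized `LocalTaskManager`, and `summarize` stands in for whatever produces the summary text, a step gobby presumably wires to an LLM elsewhere.

```python
from gobby.storage.compaction import TaskCompactor

def compact_stale_tasks(task_manager, summarize) -> dict:
    compactor = TaskCompactor(task_manager)

    # Tasks closed for 30+ days that still carry their full description
    for task in compactor.find_candidates(days_closed=30):
        # "description" and "title" are assumed column names in the tasks table
        summary = summarize(task["description"] or task["title"])
        compactor.compact_task(task["id"], summary)

    # e.g. {"total_closed": 12, "compacted": 7, "rate": 58.3}
    return compactor.get_stats()
```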