claude-jacked 0.2.3__py3-none-any.whl → 0.2.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (33)
  1. claude_jacked-0.2.9.dist-info/METADATA +523 -0
  2. claude_jacked-0.2.9.dist-info/RECORD +33 -0
  3. jacked/cli.py +752 -47
  4. jacked/client.py +196 -29
  5. jacked/data/agents/code-simplicity-reviewer.md +87 -0
  6. jacked/data/agents/defensive-error-handler.md +93 -0
  7. jacked/data/agents/double-check-reviewer.md +214 -0
  8. jacked/data/agents/git-pr-workflow-manager.md +149 -0
  9. jacked/data/agents/issue-pr-coordinator.md +131 -0
  10. jacked/data/agents/pr-workflow-checker.md +199 -0
  11. jacked/data/agents/readme-maintainer.md +123 -0
  12. jacked/data/agents/test-coverage-engineer.md +155 -0
  13. jacked/data/agents/test-coverage-improver.md +139 -0
  14. jacked/data/agents/wiki-documentation-architect.md +580 -0
  15. jacked/data/commands/audit-rules.md +103 -0
  16. jacked/data/commands/dc.md +155 -0
  17. jacked/data/commands/learn.md +89 -0
  18. jacked/data/commands/pr.md +4 -0
  19. jacked/data/commands/redo.md +85 -0
  20. jacked/data/commands/techdebt.md +115 -0
  21. jacked/data/prompts/security_gatekeeper.txt +58 -0
  22. jacked/data/rules/jacked_behaviors.md +11 -0
  23. jacked/data/skills/jacked/SKILL.md +162 -0
  24. jacked/index_write_tracker.py +227 -0
  25. jacked/indexer.py +255 -129
  26. jacked/retriever.py +389 -137
  27. jacked/searcher.py +65 -13
  28. jacked/transcript.py +339 -0
  29. claude_jacked-0.2.3.dist-info/METADATA +0 -483
  30. claude_jacked-0.2.3.dist-info/RECORD +0 -13
  31. {claude_jacked-0.2.3.dist-info → claude_jacked-0.2.9.dist-info}/WHEEL +0 -0
  32. {claude_jacked-0.2.3.dist-info → claude_jacked-0.2.9.dist-info}/entry_points.txt +0 -0
  33. {claude_jacked-0.2.3.dist-info → claude_jacked-0.2.9.dist-info}/licenses/LICENSE +0 -0
jacked/searcher.py CHANGED
@@ -3,11 +3,18 @@ Session searching for Jacked.
3
3
 
4
4
  Handles semantic search across indexed sessions using Qdrant Cloud Inference.
5
5
  Implements multi-factor ranking: ownership, repo, recency, and semantic similarity.
6
+
7
+ Supports filtering by content_type:
8
+ - plan: Full implementation strategy (gold)
9
+ - subagent_summary: Rich summaries from agent outputs (gold)
10
+ - summary_label: Tiny chapter titles from compaction
11
+ - user_message: User messages for intent matching
12
+ - chunk: Full transcript chunks
6
13
  """
7
14
 
8
15
  import logging
9
16
  import math
10
- from dataclasses import dataclass
17
+ from dataclasses import dataclass, field
11
18
  from datetime import datetime, timezone
12
19
  from typing import Optional
13
20
  from collections import defaultdict
@@ -16,6 +23,15 @@ from jacked.config import SmartForkConfig, get_repo_id
16
23
  from jacked.client import QdrantSessionClient
17
24
 
18
25
 
26
+ # Default content types for search (high-value content)
27
+ DEFAULT_SEARCH_CONTENT_TYPES = [
28
+ "plan",
29
+ "subagent_summary",
30
+ "summary_label",
31
+ "user_message",
32
+ ]
33
+
34
+
19
35
  logger = logging.getLogger(__name__)
20
36
 
21
37
 
@@ -37,6 +53,9 @@ class SearchResult:
37
53
  is_current_repo: Whether this is from the current repo
38
54
  intent_preview: Preview of the matched intent text
39
55
  chunk_count: Number of transcript chunks stored
56
+ has_plan: Whether this session has a plan file indexed
57
+ has_agent_summaries: Whether this session has agent summaries
58
+ content_types_found: Set of content types found in this session
40
59
  """
41
60
  session_id: str
42
61
  repo_name: str
@@ -50,13 +69,23 @@ class SearchResult:
50
69
  is_current_repo: bool
51
70
  intent_preview: str
52
71
  chunk_count: int
72
+ has_plan: bool = False
73
+ has_agent_summaries: bool = False
74
+ content_types_found: set = field(default_factory=set)
53
75
 
54
76
  def __str__(self) -> str:
55
77
  """Format result for display."""
56
78
  ts_str = self.timestamp.strftime("%Y-%m-%d") if self.timestamp else "unknown"
57
79
  owner = "YOU" if self.is_own else f"@{self.user_name}"
80
+ # Add indicators for rich content
81
+ indicators = []
82
+ if self.has_plan:
83
+ indicators.append("📋")
84
+ if self.has_agent_summaries:
85
+ indicators.append("🤖")
86
+ indicator_str = " ".join(indicators)
58
87
  return (
59
- f"[{self.score:.0f}%] {owner} - {self.repo_name} - {ts_str}\n"
88
+ f"[{self.score:.0f}%] {owner} - {self.repo_name} - {ts_str} {indicator_str}\n"
60
89
  f" {self.intent_preview[:80]}..."
61
90
  )
62
91
 
@@ -96,6 +125,7 @@ class SessionSearcher:
96
125
  min_score: float = 0.3,
97
126
  mine_only: bool = False,
98
127
  user_filter: Optional[str] = None,
128
+ content_types: Optional[list[str]] = None,
99
129
  ) -> list[SearchResult]:
100
130
  """
101
131
  Search for sessions similar to the query with multi-factor ranking.
@@ -113,6 +143,8 @@ class SessionSearcher:
113
143
  min_score: Minimum cosine similarity score (0-1)
114
144
  mine_only: If True, only return current user's sessions
115
145
  user_filter: If set, only return sessions from this user
146
+ content_types: Content types to search (default: plan, subagent_summary,
147
+ summary_label, user_message). Use ["chunk"] for full-text search.
116
148
 
117
149
  Returns:
118
150
  List of SearchResult objects, sorted by multi-factor relevance
@@ -126,18 +158,31 @@ class SessionSearcher:
126
158
  current_repo_id = get_repo_id(repo_path) if repo_path else None
127
159
  current_user = self.config.user_name
128
160
 
129
- # Search for intent points using server-side embedding
161
+ # Default to high-value content types
162
+ if content_types is None:
163
+ content_types = DEFAULT_SEARCH_CONTENT_TYPES
164
+
165
+ # Build user filter for Qdrant (more efficient than post-filter)
166
+ qdrant_user_filter = None
167
+ if mine_only:
168
+ qdrant_user_filter = current_user
169
+ elif user_filter:
170
+ qdrant_user_filter = user_filter
171
+
172
+ # Search using content_types filter
130
173
  # Get more results than needed since we'll aggregate and re-rank
131
174
  raw_results = self.client.search(
132
175
  query_text=query,
133
176
  repo_id=None, # Don't filter in Qdrant, we'll boost instead
134
- point_type="intent",
177
+ content_types=content_types,
178
+ user_name=qdrant_user_filter,
135
179
  limit=limit * 10, # Get extra for aggregation and filtering
136
180
  )
137
181
 
138
- # Aggregate by session (multiple intent chunks per session)
182
+ # Aggregate by session (multiple points per session)
139
183
  session_scores: dict[str, list[float]] = defaultdict(list)
140
184
  session_data: dict[str, dict] = {}
185
+ session_content_types: dict[str, set] = defaultdict(set)
141
186
 
142
187
  for result in raw_results:
143
188
  if result.score < min_score:
@@ -146,17 +191,13 @@ class SessionSearcher:
146
191
  payload = result.payload or {}
147
192
  session_id = payload.get("session_id")
148
193
  session_user = payload.get("user_name", "unknown")
194
+ content_type = payload.get("content_type", payload.get("type", ""))
149
195
 
150
196
  if not session_id:
151
197
  continue
152
198
 
153
- # Apply filters
154
- if mine_only and session_user != current_user:
155
- continue
156
- if user_filter and session_user != user_filter:
157
- continue
158
-
159
199
  session_scores[session_id].append(result.score)
200
+ session_content_types[session_id].add(content_type)
160
201
 
161
202
  # Keep the best payload data (highest score)
162
203
  if session_id not in session_data or result.score > max(session_scores[session_id][:-1], default=0):
@@ -168,6 +209,7 @@ class SessionSearcher:
168
209
  # Use max score for semantic ranking (best match in session)
169
210
  semantic_score = max(scores)
170
211
  payload = session_data[session_id]
212
+ found_types = session_content_types[session_id]
171
213
 
172
214
  # Parse timestamp
173
215
  timestamp = None
@@ -192,6 +234,9 @@ class SessionSearcher:
192
234
  timestamp=timestamp,
193
235
  )
194
236
 
237
+ # Get preview text - prefer content field over intent_text
238
+ preview = payload.get("content", payload.get("intent_text", ""))[:200]
239
+
195
240
  results.append(
196
241
  SearchResult(
197
242
  session_id=session_id,
@@ -204,8 +249,11 @@ class SessionSearcher:
204
249
  semantic_score=semantic_score * 100,
205
250
  is_own=is_own,
206
251
  is_current_repo=is_current_repo,
207
- intent_preview=payload.get("intent_text", "")[:200],
208
- chunk_count=payload.get("transcript_chunk_count", 0),
252
+ intent_preview=preview,
253
+ chunk_count=payload.get("total_chunks", 0),
254
+ has_plan="plan" in found_types,
255
+ has_agent_summaries="subagent_summary" in found_types,
256
+ content_types_found=found_types,
209
257
  )
210
258
  )
211
259
 
@@ -285,9 +333,13 @@ class SessionSearcher:
285
333
  session_id=session.get("session_id", ""),
286
334
  repo_name=session.get("repo_name", "unknown"),
287
335
  repo_path=session.get("repo_path", ""),
336
+ user_name=session.get("user_name", "unknown"),
288
337
  machine=session.get("machine", "unknown"),
289
338
  timestamp=timestamp,
290
339
  score=100, # No relevance score for list
340
+ semantic_score=0.0, # Not applicable for list
341
+ is_own=session.get("user_name") == self.config.user_name,
342
+ is_current_repo=True, # We're filtering by repo
291
343
  intent_preview="", # Not available in list
292
344
  chunk_count=session.get("chunk_count", 0),
293
345
  )
jacked/transcript.py CHANGED
@@ -475,3 +475,342 @@ def _is_uuid_format(name: str) -> bool:
475
475
  """
476
476
  uuid_pattern = r"^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$"
477
477
  return bool(re.match(uuid_pattern, name.lower()))
478
+
479
+
480
+ # =============================================================================
481
+ # NEW: Extraction functions for subagent summaries, labels, and plans
482
+ # =============================================================================
483
+
484
+
485
@dataclass
class SummaryLabel:
    """A compaction summary label (tiny chapter title).

    Built from session records with ``type == "summary"`` (see
    ``extract_summary_labels``).

    Examples:
        >>> label = SummaryLabel("Implementing auth flow", "abc123", None)
        >>> label.label
        'Implementing auth flow'
    """
    # Short human-readable title taken from the record's "summary" field.
    label: str
    # UUID of the leaf message the summary points at ("leafUuid"), when present.
    leaf_uuid: Optional[str] = None
    # Timestamp parsed from the record, when present and parseable.
    timestamp: Optional[datetime] = None
497
+
498
+
499
@dataclass
class AgentSummary:
    """Summary extracted from a subagent's final output.

    Produced by ``extract_agent_summary`` from the text content of the
    last assistant message in an ``agent-*.jsonl`` file.

    Examples:
        >>> summary = AgentSummary("a4e75d5", "Explore", "## Summary\\n...", None)
        >>> summary.agent_id
        'a4e75d5'
    """
    # Short id taken from the agent filename: agent-<id>.jsonl -> <id>.
    agent_id: str
    # Agent type if known; currently always None (not inferred from content).
    agent_type: Optional[str]
    # Concatenated text blocks of the agent's final assistant message.
    summary_text: str
    # Timestamp taken from an assistant message in the file, when parseable.
    timestamp: Optional[datetime] = None
512
+
513
+
514
@dataclass
class PlanFile:
    """A plan file linked to a session via slug.

    Plans are stored as ``<slug>.md`` files and located by
    ``find_plan_file``; the slug recorded in the session JSONL connects
    the two.

    Examples:
        >>> plan = PlanFile("hidden-finding-goose", Path("..."), "# Plan content")
        >>> plan.slug
        'hidden-finding-goose'
    """
    # Session slug, e.g. "hidden-finding-goose".
    slug: str
    # Filesystem path the plan was read from.
    path: Path
    # Full text content of the plan file.
    content: str
526
+
527
+
528
def find_subagent_files(session_path: Path) -> list[Path]:
    """Find all subagent JSONL files for a session.

    Subagents are stored in {session-id}/subagents/agent-*.jsonl

    Args:
        session_path: Path to the main session JSONL file

    Returns:
        Sorted list of paths to subagent JSONL files (empty if none)

    Examples:
        >>> # files = find_subagent_files(Path('session.jsonl')) # doctest: +SKIP
    """
    # The session directory {session-id}/ sits beside {session-id}.jsonl.
    subagents_dir = session_path.parent / session_path.stem / "subagents"

    # sorted() gives a deterministic ordering regardless of filesystem.
    candidates = subagents_dir.glob("agent-*.jsonl") if subagents_dir.exists() else ()
    return sorted(candidates)
551
+
552
+
553
def extract_agent_summary(agent_file: Path, min_length: int = 200) -> Optional[AgentSummary]:
    """Extract the final summary text from an agent's session.

    The summary is the text content from the LAST assistant message.

    Args:
        agent_file: Path to an agent-*.jsonl file
        min_length: Minimum character count for a usable summary; shorter
            outputs are treated as noise and skipped (default 200)

    Returns:
        AgentSummary or None if no usable summary found

    Examples:
        >>> # summary = extract_agent_summary(Path('agent-abc.jsonl')) # doctest: +SKIP
    """
    # Extract agent_id from filename: agent-a4e75d5.jsonl -> a4e75d5
    agent_id = agent_file.stem.replace("agent-", "")

    last_assistant_msg = None

    try:
        with open(agent_file, "r", encoding="utf-8") as f:
            for line in f:
                line = line.strip()
                if not line:
                    continue
                try:
                    data = json.loads(line)
                except json.JSONDecodeError:
                    # Tolerate corrupt/partial lines in live session files.
                    continue

                if isinstance(data, dict) and data.get("type") == "assistant":
                    last_assistant_msg = data
    except (OSError, UnicodeDecodeError) as e:
        # UnicodeDecodeError: a binary/garbled agent file should be
        # skipped like an unreadable one, not crash the caller.
        logger.warning(f"Failed to read agent file {agent_file}: {e}")
        return None

    if not last_assistant_msg:
        return None

    # Parse the timestamp of the message the summary actually comes from.
    # (Previously the timestamp of an *earlier* assistant message could
    # leak through when the last one had no parseable timestamp.)
    timestamp = None
    ts_str = last_assistant_msg.get("timestamp")
    if ts_str:
        try:
            timestamp = datetime.fromisoformat(ts_str.replace("Z", "+00:00"))
        except ValueError:
            pass

    # Extract text content from the message; content may be a list of
    # typed blocks or a plain string.
    message = last_assistant_msg.get("message", {})
    content = message.get("content", [])

    text_parts = []
    if isinstance(content, list):
        for block in content:
            if isinstance(block, dict) and block.get("type") == "text":
                text = block.get("text", "")
                if text:
                    text_parts.append(text)
    elif isinstance(content, str):
        text_parts.append(content)

    summary_text = "\n".join(text_parts).strip()

    # Skip if too short (likely not a real summary)
    if len(summary_text) < min_length:
        logger.debug(f"Agent {agent_id} summary too short ({len(summary_text)} chars), skipping")
        return None

    # Agent type is hard to detect from the file itself.
    # Could infer from content patterns but skip for MVP.
    agent_type = None

    return AgentSummary(
        agent_id=agent_id,
        agent_type=agent_type,
        summary_text=summary_text,
        timestamp=timestamp,
    )
630
+
631
+
632
def extract_summary_labels(session_path: Path) -> list[SummaryLabel]:
    """Extract summary labels from a session JSONL file.

    These are the tiny "chapter titles" from compaction events
    (records with ``type == "summary"``).

    Args:
        session_path: Path to the main session JSONL file

    Returns:
        List of SummaryLabel objects (empty on read failure)

    Examples:
        >>> # labels = extract_summary_labels(Path('session.jsonl')) # doctest: +SKIP
    """
    labels: list[SummaryLabel] = []

    try:
        with open(session_path, "r", encoding="utf-8") as f:
            for line in f:
                line = line.strip()
                if not line:
                    continue
                try:
                    data = json.loads(line)
                except json.JSONDecodeError:
                    # Tolerate corrupt/partial lines in live session files.
                    continue

                # Guard: a valid JSON line may not be an object at all.
                if not isinstance(data, dict) or data.get("type") != "summary":
                    continue
                label_text = data.get("summary", "")
                if not label_text:
                    continue

                timestamp = None
                ts_str = data.get("timestamp")
                if ts_str:
                    try:
                        timestamp = datetime.fromisoformat(ts_str.replace("Z", "+00:00"))
                    except ValueError:
                        pass

                labels.append(SummaryLabel(
                    label=label_text,
                    leaf_uuid=data.get("leafUuid"),
                    timestamp=timestamp,
                ))
    except (OSError, UnicodeDecodeError) as e:
        # UnicodeDecodeError: skip undecodable session files instead of crashing.
        logger.warning(f"Failed to read session file {session_path}: {e}")

    return labels
679
+
680
+
681
def extract_session_slug(session_path: Path) -> Optional[str]:
    """Extract the slug from a session JSONL file.

    The slug links the session to its plan file in ~/.claude/plans/

    Args:
        session_path: Path to the main session JSONL file

    Returns:
        The slug string or None if not found

    Examples:
        >>> # slug = extract_session_slug(Path('session.jsonl')) # doctest: +SKIP
    """
    try:
        with open(session_path, "r", encoding="utf-8") as f:
            for line in f:
                line = line.strip()
                if not line:
                    continue
                try:
                    data = json.loads(line)
                except json.JSONDecodeError:
                    continue

                # Guard against non-object JSON lines (e.g. a bare number):
                # `"slug" in 42` would raise TypeError.
                if isinstance(data, dict) and "slug" in data:
                    # First record carrying a slug wins.
                    return data["slug"]
    except (OSError, UnicodeDecodeError) as e:
        # UnicodeDecodeError: treat undecodable session files as slug-less.
        logger.warning(f"Failed to read session file {session_path}: {e}")

    return None
712
+
713
+
714
def find_plan_file(
    slug: str,
    plans_dir: Optional[Path] = None,
    max_size: int = 100_000,
    min_size: int = 50,
) -> Optional[PlanFile]:
    """Find and read the plan file for a session slug.

    Args:
        slug: The session slug (e.g., "hidden-finding-goose")
        plans_dir: Path to plans directory (default: ~/.claude/plans/)
        max_size: Skip plan files larger than this many bytes (default 100KB)
        min_size: Skip plan files smaller than this many bytes (default 50)

    Returns:
        PlanFile or None if not found or invalid

    Examples:
        >>> # plan = find_plan_file("hidden-finding-goose") # doctest: +SKIP
    """
    if plans_dir is None:
        plans_dir = Path.home() / ".claude" / "plans"

    plan_path = plans_dir / f"{slug}.md"

    if not plan_path.exists():
        return None

    try:
        # Size validation - skip files outside the useful range.
        file_size = plan_path.stat().st_size
        if file_size > max_size:
            logger.warning(f"Plan file too large ({file_size} bytes), skipping: {plan_path}")
            return None

        if file_size < min_size:
            logger.debug(f"Plan file too small ({file_size} bytes), skipping: {plan_path}")
            return None

        content = plan_path.read_text(encoding="utf-8")

        return PlanFile(
            slug=slug,
            path=plan_path,
            content=content,
        )
    except (OSError, UnicodeDecodeError) as e:
        # UnicodeDecodeError: a non-UTF-8 plan file is unusable, not fatal.
        logger.warning(f"Failed to read plan file {plan_path}: {e}")
        return None
756
+
757
+
758
@dataclass
class EnrichedTranscript(ParsedTranscript):
    """ParsedTranscript with additional extracted data.

    Adds subagent summaries, summary labels, and plan file content.
    Built by ``parse_jsonl_file_enriched``.
    """
    # Compaction "chapter title" labels found in the session JSONL.
    summary_labels: list[SummaryLabel] = field(default_factory=list)
    # Final-output summaries from each subagent that produced a usable one.
    agent_summaries: list[AgentSummary] = field(default_factory=list)
    # Plan file linked via the session slug, if one was found on disk.
    plan: Optional[PlanFile] = None
    # The session slug itself (also the key used to locate the plan file).
    slug: Optional[str] = None
768
+
769
+
770
def parse_jsonl_file_enriched(filepath: Path) -> EnrichedTranscript:
    """Parse a Claude session with all enriched data.

    Extracts:
    - Messages (user, assistant)
    - Summary labels (compaction chapter titles)
    - Subagent summaries (gold context from agent outputs)
    - Plan file (if linked via slug)

    Args:
        filepath: Path to the .jsonl session file

    Returns:
        EnrichedTranscript with all extracted data

    Examples:
        >>> # transcript = parse_jsonl_file_enriched(Path('session.jsonl')) # doctest: +SKIP
    """
    # Start from the base parse, then layer the enrichments on top.
    base = parse_jsonl_file(filepath)

    # Subagent summaries: keep only files that yielded a usable summary.
    agent_summaries = [
        summary
        for agent_file in find_subagent_files(filepath)
        if (summary := extract_agent_summary(agent_file))
    ]

    # The plan file is reachable only through the slug recorded in the session.
    slug = extract_session_slug(filepath)

    return EnrichedTranscript(
        session_id=base.session_id,
        messages=base.messages,
        user_messages=base.user_messages,
        full_text=base.full_text,
        intent_text=base.intent_text,
        timestamp=base.timestamp,
        summary_labels=extract_summary_labels(filepath),
        agent_summaries=agent_summaries,
        plan=find_plan_file(slug) if slug else None,
        slug=slug,
    )