shotgun-sh 0.2.17__py3-none-any.whl → 0.3.3.dev1__py3-none-any.whl
This diff compares two publicly released versions of the package as published to a supported registry. It is provided for informational purposes only and reflects the package versions exactly as they appear in their respective public registries.
- shotgun/agents/agent_manager.py +28 -14
- shotgun/agents/common.py +1 -1
- shotgun/agents/config/README.md +89 -0
- shotgun/agents/config/__init__.py +10 -1
- shotgun/agents/config/manager.py +323 -53
- shotgun/agents/config/models.py +85 -21
- shotgun/agents/config/provider.py +51 -13
- shotgun/agents/config/streaming_test.py +119 -0
- shotgun/agents/context_analyzer/analyzer.py +6 -2
- shotgun/agents/conversation/__init__.py +18 -0
- shotgun/agents/conversation/filters.py +164 -0
- shotgun/agents/conversation/history/chunking.py +278 -0
- shotgun/agents/{history → conversation/history}/compaction.py +27 -1
- shotgun/agents/{history → conversation/history}/constants.py +5 -0
- shotgun/agents/conversation/history/file_content_deduplication.py +216 -0
- shotgun/agents/{history → conversation/history}/history_processors.py +267 -3
- shotgun/agents/{history → conversation/history}/token_counting/anthropic.py +8 -0
- shotgun/agents/{conversation_manager.py → conversation/manager.py} +1 -1
- shotgun/agents/{conversation_history.py → conversation/models.py} +8 -94
- shotgun/agents/error/__init__.py +11 -0
- shotgun/agents/error/models.py +19 -0
- shotgun/agents/runner.py +230 -0
- shotgun/agents/tools/web_search/openai.py +1 -1
- shotgun/build_constants.py +2 -2
- shotgun/cli/clear.py +1 -1
- shotgun/cli/compact.py +5 -3
- shotgun/cli/context.py +44 -1
- shotgun/cli/error_handler.py +24 -0
- shotgun/cli/export.py +34 -34
- shotgun/cli/plan.py +34 -34
- shotgun/cli/research.py +17 -9
- shotgun/cli/spec/__init__.py +5 -0
- shotgun/cli/spec/backup.py +81 -0
- shotgun/cli/spec/commands.py +132 -0
- shotgun/cli/spec/models.py +48 -0
- shotgun/cli/spec/pull_service.py +219 -0
- shotgun/cli/specify.py +20 -19
- shotgun/cli/tasks.py +34 -34
- shotgun/codebase/core/ingestor.py +153 -7
- shotgun/codebase/models.py +2 -0
- shotgun/exceptions.py +325 -0
- shotgun/llm_proxy/__init__.py +17 -0
- shotgun/llm_proxy/client.py +215 -0
- shotgun/llm_proxy/models.py +137 -0
- shotgun/logging_config.py +42 -0
- shotgun/main.py +4 -0
- shotgun/posthog_telemetry.py +1 -1
- shotgun/prompts/agents/partials/common_agent_system_prompt.j2 +28 -3
- shotgun/prompts/agents/partials/interactive_mode.j2 +3 -3
- shotgun/prompts/agents/plan.j2 +16 -0
- shotgun/prompts/agents/research.j2 +16 -3
- shotgun/prompts/agents/specify.j2 +54 -1
- shotgun/prompts/agents/state/system_state.j2 +0 -2
- shotgun/prompts/agents/tasks.j2 +16 -0
- shotgun/prompts/history/chunk_summarization.j2 +34 -0
- shotgun/prompts/history/combine_summaries.j2 +53 -0
- shotgun/sdk/codebase.py +14 -3
- shotgun/settings.py +5 -0
- shotgun/shotgun_web/__init__.py +67 -1
- shotgun/shotgun_web/client.py +42 -1
- shotgun/shotgun_web/constants.py +46 -0
- shotgun/shotgun_web/exceptions.py +29 -0
- shotgun/shotgun_web/models.py +390 -0
- shotgun/shotgun_web/shared_specs/__init__.py +32 -0
- shotgun/shotgun_web/shared_specs/file_scanner.py +175 -0
- shotgun/shotgun_web/shared_specs/hasher.py +83 -0
- shotgun/shotgun_web/shared_specs/models.py +71 -0
- shotgun/shotgun_web/shared_specs/upload_pipeline.py +329 -0
- shotgun/shotgun_web/shared_specs/utils.py +34 -0
- shotgun/shotgun_web/specs_client.py +703 -0
- shotgun/shotgun_web/supabase_client.py +31 -0
- shotgun/tui/app.py +73 -9
- shotgun/tui/containers.py +1 -1
- shotgun/tui/layout.py +5 -0
- shotgun/tui/screens/chat/chat_screen.py +372 -95
- shotgun/tui/screens/chat/codebase_index_prompt_screen.py +196 -17
- shotgun/tui/screens/chat_screen/command_providers.py +13 -2
- shotgun/tui/screens/chat_screen/hint_message.py +76 -1
- shotgun/tui/screens/confirmation_dialog.py +40 -0
- shotgun/tui/screens/directory_setup.py +45 -41
- shotgun/tui/screens/feedback.py +10 -3
- shotgun/tui/screens/github_issue.py +11 -2
- shotgun/tui/screens/model_picker.py +28 -8
- shotgun/tui/screens/onboarding.py +149 -0
- shotgun/tui/screens/pipx_migration.py +58 -6
- shotgun/tui/screens/provider_config.py +66 -8
- shotgun/tui/screens/shared_specs/__init__.py +21 -0
- shotgun/tui/screens/shared_specs/create_spec_dialog.py +273 -0
- shotgun/tui/screens/shared_specs/models.py +56 -0
- shotgun/tui/screens/shared_specs/share_specs_dialog.py +390 -0
- shotgun/tui/screens/shared_specs/upload_progress_screen.py +452 -0
- shotgun/tui/screens/shotgun_auth.py +110 -16
- shotgun/tui/screens/spec_pull.py +288 -0
- shotgun/tui/screens/welcome.py +123 -0
- shotgun/tui/services/conversation_service.py +5 -2
- shotgun/tui/widgets/widget_coordinator.py +1 -1
- {shotgun_sh-0.2.17.dist-info → shotgun_sh-0.3.3.dev1.dist-info}/METADATA +9 -2
- {shotgun_sh-0.2.17.dist-info → shotgun_sh-0.3.3.dev1.dist-info}/RECORD +112 -77
- {shotgun_sh-0.2.17.dist-info → shotgun_sh-0.3.3.dev1.dist-info}/WHEEL +1 -1
- /shotgun/agents/{history → conversation/history}/__init__.py +0 -0
- /shotgun/agents/{history → conversation/history}/context_extraction.py +0 -0
- /shotgun/agents/{history → conversation/history}/history_building.py +0 -0
- /shotgun/agents/{history → conversation/history}/message_utils.py +0 -0
- /shotgun/agents/{history → conversation/history}/token_counting/__init__.py +0 -0
- /shotgun/agents/{history → conversation/history}/token_counting/base.py +0 -0
- /shotgun/agents/{history → conversation/history}/token_counting/openai.py +0 -0
- /shotgun/agents/{history → conversation/history}/token_counting/sentencepiece_counter.py +0 -0
- /shotgun/agents/{history → conversation/history}/token_counting/tokenizer_cache.py +0 -0
- /shotgun/agents/{history → conversation/history}/token_counting/utils.py +0 -0
- /shotgun/agents/{history → conversation/history}/token_estimation.py +0 -0
- {shotgun_sh-0.2.17.dist-info → shotgun_sh-0.3.3.dev1.dist-info}/entry_points.txt +0 -0
- {shotgun_sh-0.2.17.dist-info → shotgun_sh-0.3.3.dev1.dist-info}/licenses/LICENSE +0 -0

shotgun/agents/{history → conversation/history}/history_processors.py

@@ -13,6 +13,7 @@ from pydantic_ai.messages import (
     UserPromptPart,
 )
 
+from shotgun.agents.conversation.filters import filter_orphaned_tool_responses
 from shotgun.agents.llm import shotgun_model_request
 from shotgun.agents.messages import AgentSystemPrompt, SystemStatusPrompt
 from shotgun.agents.models import AgentDeps
@@ -21,7 +22,7 @@ from shotgun.logging_config import get_logger
 from shotgun.posthog_telemetry import track_event
 from shotgun.prompts import PromptLoader
 
-from .constants import SUMMARY_MARKER, TOKEN_LIMIT_RATIO
+from .constants import CHUNK_SAFE_RATIO, SUMMARY_MARKER, TOKEN_LIMIT_RATIO
 from .context_extraction import extract_context_from_messages
 from .history_building import ensure_ends_with_model_request
 from .message_utils import (
@@ -38,7 +39,7 @@ from .token_estimation import (
 )
 
 if TYPE_CHECKING:
-
+    from . import chunking
 
 
 class ContextProtocol(Protocol):
@@ -416,6 +417,9 @@ async def token_limit_compactor(
         compacted_messages, messages
     )
 
+    # Filter out orphaned tool responses (tool responses without tool calls)
+    compacted_messages = filter_orphaned_tool_responses(compacted_messages)
+
     logger.debug(
         f"Incremental compaction complete: {len(messages)} -> {len(compacted_messages)} messages"
     )
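`filter_orphaned_tool_responses` comes from the new `shotgun/agents/conversation/filters.py` (+164 lines, not shown in this diff). Judging only by how the hunks in this file call it, a minimal sketch could look like the following; everything except the function name and its list-in/list-out signature is an assumption.

```python
# Hypothetical sketch of the new filter in shotgun/agents/conversation/filters.py.
# The real implementation is not part of this excerpt; this only illustrates the
# "drop tool responses whose tool call is gone" behaviour described in the comments.
from pydantic_ai.messages import (
    ModelMessage,
    ModelRequest,
    ModelResponse,
    ToolCallPart,
    ToolReturnPart,
)


def filter_orphaned_tool_responses(messages: list[ModelMessage]) -> list[ModelMessage]:
    """Remove tool return parts whose originating tool call is no longer in history."""
    # Tool calls that survived compaction/filtering.
    known_call_ids = {
        part.tool_call_id
        for message in messages
        if isinstance(message, ModelResponse)
        for part in message.parts
        if isinstance(part, ToolCallPart)
    }

    filtered: list[ModelMessage] = []
    for message in messages:
        if not isinstance(message, ModelRequest):
            filtered.append(message)
            continue
        # Keep only parts that are not orphaned tool returns.
        kept_parts = [
            part
            for part in message.parts
            if not isinstance(part, ToolReturnPart) or part.tool_call_id in known_call_ids
        ]
        if kept_parts:
            filtered.append(ModelRequest(parts=kept_parts))
    return filtered
```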
@@ -489,10 +493,32 @@ async def _full_compaction(
     deps: AgentDeps,
     messages: list[ModelMessage],
 ) -> list[ModelMessage]:
-    """Perform full compaction for first-time summarization."""
+    """Perform full compaction for first-time summarization.
+
+    If the conversation is too large for single-pass compaction, delegates
+    to chunked compaction which breaks the conversation into logical chunks.
+    """
     # Extract context from all messages
     context = extract_context_from_messages(messages)
 
+    # Check if context would exceed model limit for compaction request
+    # We use CHUNK_SAFE_RATIO (70%) to leave room for prompt overhead
+    max_safe_input = int(deps.llm_model.max_input_tokens * CHUNK_SAFE_RATIO)
+
+    # Estimate context tokens
+    context_request: list[ModelMessage] = [ModelRequest.user_text_prompt(context)]
+    context_tokens = await estimate_tokens_from_messages(
+        context_request, deps.llm_model
+    )
+
+    if context_tokens > max_safe_input:
+        # Context too large for single-pass compaction - use chunked approach
+        logger.info(
+            f"Context ({context_tokens:,} tokens) exceeds safe limit "
+            f"({max_safe_input:,} tokens), using chunked compaction"
+        )
+        return await _chunked_compaction(deps, messages)
+
     # Use regular summarization prompt
     summarization_prompt = prompt_loader.render("history/summarization.j2")
     request_messages: list[ModelMessage] = [
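To make the threshold concrete: for a model with a 200,000-token input limit (an illustrative figure, not taken from this diff), CHUNK_SAFE_RATIO = 0.7 gives max_safe_input = 140,000 tokens, so any extracted context estimated above 140,000 tokens is routed to `_chunked_compaction` instead of a single summarization request.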
@@ -565,6 +591,9 @@ async def _full_compaction(
     # Ensure history ends with ModelRequest for PydanticAI compatibility
     compacted_messages = ensure_ends_with_model_request(compacted_messages, messages)
 
+    # Filter out orphaned tool responses (tool responses without tool calls)
+    compacted_messages = filter_orphaned_tool_responses(compacted_messages)
+
     # Track full compaction event
     messages_before = len(messages)
     messages_after = len(compacted_messages)
@@ -592,3 +621,238 @@ async def _full_compaction(
     )
 
     return compacted_messages
+
+
+async def _chunked_compaction(
+    deps: AgentDeps,
+    messages: list[ModelMessage],
+) -> list[ModelMessage]:
+    """Perform chunked compaction for oversized conversations.
+
+    Breaks the conversation into logical chunks, summarizes each sequentially,
+    then combines the summaries into a master summary.
+    """
+    from .chunking import chunk_messages_for_compaction
+
+    # Split into chunks and retention window
+    chunks, retained_messages = await chunk_messages_for_compaction(
+        messages, deps.llm_model
+    )
+
+    if not chunks:
+        # No chunks to summarize (conversation too small), return retained messages
+        logger.debug("No chunks to summarize, returning retained messages")
+        return retained_messages
+
+    # Track chunked compaction
+    total_chunks = len(chunks)
+    logger.info(f"Starting chunked compaction: {total_chunks} chunks to process")
+
+    # Summarize each chunk sequentially
+    chunk_summaries: list[str] = []
+    for chunk in chunks:
+        try:
+            summary = await _summarize_chunk(chunk, total_chunks, deps)
+            chunk_summaries.append(summary)
+            logger.debug(
+                f"Chunk {chunk.chunk_index + 1}/{total_chunks} summarized successfully"
+            )
+        except Exception as e:
+            logger.warning(
+                f"Failed to summarize chunk {chunk.chunk_index + 1}/{total_chunks}: {e}"
+            )
+            # Continue with other chunks - we'll note the gap in fusion
+            chunk_summaries.append(
+                f"[Chunk {chunk.chunk_index + 1} summary unavailable]"
+            )
+
+    # Combine summaries into master summary
+    if len(chunk_summaries) == 1:
+        final_summary = chunk_summaries[0]
+    else:
+        final_summary = await _combine_chunk_summaries(chunk_summaries, deps)
+
+    # Build final compacted history
+    compacted = _build_chunked_compaction_result(
+        final_summary, messages, retained_messages, deps
+    )
+
+    # Track chunked compaction event
+    track_event(
+        "chunked_compaction_triggered",
+        {
+            "num_chunks": total_chunks,
+            "chunks_succeeded": sum(
+                1 for s in chunk_summaries if not s.startswith("[Chunk")
+            ),
+            "retention_window_size": len(retained_messages),
+            "model_name": deps.llm_model.name.value,
+            "provider": deps.llm_model.provider.value,
+        },
+    )
+
+    return compacted
+
+
+async def _summarize_chunk(
+    chunk: "chunking.Chunk",
+    total_chunks: int,
+    deps: AgentDeps,
+) -> str:
+    """Summarize a single chunk of messages."""
+    chunk_messages = chunk.get_all_messages()
+    context = extract_context_from_messages(chunk_messages)
+
+    # Use chunk summarization template
+    chunk_prompt = prompt_loader.render(
+        "history/chunk_summarization.j2",
+        chunk_index=chunk.chunk_index + 1,
+        total_chunks=total_chunks,
+        chunk_content=context,
+    )
+
+    request_messages: list[ModelMessage] = [
+        ModelRequest.user_text_prompt(context, instructions=chunk_prompt)
+    ]
+
+    max_tokens = await calculate_max_summarization_tokens(
+        deps.llm_model, request_messages
+    )
+
+    log_summarization_request(
+        deps.llm_model,
+        max_tokens,
+        chunk_prompt,
+        context[:500] + "..." if len(context) > 500 else context,
+        f"CHUNK_{chunk.chunk_index + 1}",
+    )
+
+    response = await shotgun_model_request(
+        model_config=deps.llm_model,
+        messages=request_messages,
+        model_settings=ModelSettings(max_tokens=max_tokens),
+    )
+
+    log_summarization_response(response, f"CHUNK_{chunk.chunk_index + 1}")
+
+    if response.parts and isinstance(response.parts[0], TextPart):
+        return response.parts[0].content
+    return ""
+
+
+async def _combine_chunk_summaries(
+    summaries: list[str],
+    deps: AgentDeps,
+) -> str:
+    """Combine multiple chunk summaries into a unified summary."""
+    # Check if combined summaries exceed limit (may need recursive combination)
+    combined_text = "\n\n".join(summaries)
+    combined_request: list[ModelMessage] = [
+        ModelRequest.user_text_prompt(combined_text)
+    ]
+    combined_tokens = await estimate_tokens_from_messages(
+        combined_request, deps.llm_model
+    )
+
+    max_safe_input = int(deps.llm_model.max_input_tokens * CHUNK_SAFE_RATIO)
+
+    if combined_tokens > max_safe_input:
+        # Recursive: split summaries in half and combine each half first
+        logger.warning(
+            f"Combined summaries too large ({combined_tokens:,} tokens), "
+            f"applying recursive combination"
+        )
+        mid = len(summaries) // 2
+        first_half = await _combine_chunk_summaries(summaries[:mid], deps)
+        second_half = await _combine_chunk_summaries(summaries[mid:], deps)
+        summaries = [first_half, second_half]
+
+    # Use combination template
+    combine_prompt = prompt_loader.render(
+        "history/combine_summaries.j2",
+        num_summaries=len(summaries),
+        chunk_summaries=summaries,
+    )
+
+    request_messages: list[ModelMessage] = [
+        ModelRequest.user_text_prompt(
+            "\n\n---\n\n".join(summaries), instructions=combine_prompt
+        )
+    ]
+
+    max_tokens = await calculate_max_summarization_tokens(
+        deps.llm_model, request_messages
+    )
+
+    log_summarization_request(
+        deps.llm_model,
+        max_tokens,
+        combine_prompt,
+        f"[{len(summaries)} summaries to combine]",
+        "COMBINE",
+    )
+
+    response = await shotgun_model_request(
+        model_config=deps.llm_model,
+        messages=request_messages,
+        model_settings=ModelSettings(max_tokens=max_tokens),
+    )
+
+    log_summarization_response(response, "COMBINE")
+
+    if response.parts and isinstance(response.parts[0], TextPart):
+        return response.parts[0].content
+    return ""
+
+
+def _build_chunked_compaction_result(
+    final_summary: str,
+    original_messages: list[ModelMessage],
+    retained_messages: list[ModelMessage],
+    deps: AgentDeps,
+) -> list[ModelMessage]:
+    """Build the final compacted history from chunked compaction."""
+    from pydantic_ai.messages import ModelRequestPart
+
+    # Extract system context from original messages
+    agent_prompt = get_agent_system_prompt(original_messages) or ""
+    system_status = get_latest_system_status(original_messages) or ""
+    first_user = get_first_user_request(original_messages) or ""
+
+    # Create marked summary
+    summary_part = TextPart(content=f"{SUMMARY_MARKER} {final_summary}")
+    summary_message = ModelResponse(parts=[summary_part])
+
+    # Build compacted structure
+    compacted: list[ModelMessage] = []
+
+    # Initial request with system context
+    parts: list[ModelRequestPart] = []
+    if agent_prompt:
+        parts.append(AgentSystemPrompt(content=agent_prompt))
+    if system_status:
+        parts.append(SystemStatusPrompt(content=system_status))
+    if first_user:
+        parts.append(UserPromptPart(content=first_user))
+
+    if parts:
+        compacted.append(ModelRequest(parts=parts))
+
+    # Add summary
+    compacted.append(summary_message)
+
+    # Add retained messages (recent context)
+    compacted.extend(retained_messages)
+
+    # Ensure ends with ModelRequest for PydanticAI compatibility
+    compacted = ensure_ends_with_model_request(compacted, original_messages)
+
+    # Filter orphaned tool responses
+    compacted = filter_orphaned_tool_responses(compacted)
+
+    logger.info(
+        f"Chunked compaction complete: {len(original_messages)} messages -> "
+        f"{len(compacted)} messages (retained {len(retained_messages)} recent)"
+    )
+
+    return compacted
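`chunk_messages_for_compaction` and `Chunk` live in the new `shotgun/agents/conversation/history/chunking.py` (+278 lines), which is not included in this excerpt. A rough sketch of the shape implied by the call sites above; the `retention_window` and fixed `chunk_size` defaults are assumptions, and the real code presumably sizes chunks by token budget using `CHUNK_SAFE_RATIO`:

```python
# Hypothetical shape of shotgun/agents/conversation/history/chunking.py, inferred only
# from how _chunked_compaction and _summarize_chunk use it in the hunk above.
from dataclasses import dataclass, field

from pydantic_ai.messages import ModelMessage


@dataclass
class Chunk:
    """One logical slice of the conversation, summarized independently."""

    chunk_index: int
    messages: list[ModelMessage] = field(default_factory=list)

    def get_all_messages(self) -> list[ModelMessage]:
        return self.messages


async def chunk_messages_for_compaction(
    messages: list[ModelMessage],
    llm_model,                   # model config; the real code likely uses it for token estimates
    retention_window: int = 10,  # assumed default: recent messages kept verbatim
    chunk_size: int = 40,        # naive fixed size; the real code likely sizes chunks by tokens
) -> tuple[list[Chunk], list[ModelMessage]]:
    """Split history into summarizable chunks plus a retention window of recent messages."""
    retained = messages[-retention_window:] if messages else []
    older = messages[:-retention_window] if len(messages) > retention_window else []
    chunks = [
        Chunk(chunk_index=i, messages=older[start : start + chunk_size])
        for i, start in enumerate(range(0, len(older), chunk_size))
    ]
    return chunks, retained
```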

shotgun/agents/{history → conversation/history}/token_counting/anthropic.py

@@ -1,6 +1,7 @@
 """Anthropic token counting using official client."""
 
 import logfire
+from anthropic import APIStatusError
 from pydantic_ai.messages import ModelMessage
 
 from shotgun.agents.config.models import KeyProvider
@@ -103,6 +104,13 @@ class AnthropicTokenCounter(TokenCounter):
                 exception_type=type(e).__name__,
                 exception_message=str(e),
             )
+
+            # Re-raise API errors directly so they can be classified by the runner
+            # This allows proper error classification for BYOK users (authentication, rate limits, etc.)
+            if isinstance(e, APIStatusError):
+                raise
+
+            # Only wrap library-level errors in RuntimeError
             raise RuntimeError(
                 f"Anthropic token counting API failed for {self.model_name}: {type(e).__name__}: {str(e)}"
             ) from e
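The re-raised `APIStatusError` is presumably what the new `shotgun/agents/runner.py` (+230 lines, not shown here) classifies for BYOK users. A hypothetical classifier, only to illustrate the intent of the comment; nothing here besides `APIStatusError` and its `status_code` attribute comes from the diff:

```python
# Illustrative error classification; the function name and category strings are invented.
from anthropic import APIStatusError


def classify_provider_error(exc: Exception) -> str:
    if isinstance(exc, APIStatusError):
        if exc.status_code == 401:
            return "authentication"
        if exc.status_code == 429:
            return "rate_limit"
        return "provider_error"
    # Library-level failures arrive wrapped in RuntimeError (see the hunk above).
    return "internal"
```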

shotgun/agents/{conversation_manager.py → conversation/manager.py}

@@ -11,7 +11,7 @@ from shotgun.logging_config import get_logger
 from shotgun.utils import get_shotgun_home
 from shotgun.utils.file_system_utils import async_copy_file
 
-from .
+from .models import ConversationHistory
 
 logger = get_logger(__name__)
 

shotgun/agents/{conversation_history.py → conversation/models.py}

@@ -1,7 +1,5 @@
-"""Models
+"""Models for persisting TUI conversation history."""
 
-import json
-import logging
 from datetime import datetime
 from typing import Any, cast
 
@@ -16,101 +14,15 @@ from pydantic_core import to_jsonable_python
 
 from shotgun.tui.screens.chat_screen.hint_message import HintMessage
 
-
-
-
+from .filters import (
+    filter_incomplete_messages,
+    filter_orphaned_tool_responses,
+    is_tool_call_complete,
+)
 
 SerializedMessage = dict[str, Any]
 
 
-def is_tool_call_complete(tool_call: ToolCallPart) -> bool:
-    """Check if a tool call has valid, complete JSON arguments.
-
-    Args:
-        tool_call: The tool call part to validate
-
-    Returns:
-        True if the tool call args are valid JSON, False otherwise
-    """
-    if tool_call.args is None:
-        return True  # No args is valid
-
-    if isinstance(tool_call.args, dict):
-        return True  # Already parsed dict is valid
-
-    if not isinstance(tool_call.args, str):
-        return False
-
-    # Try to parse the JSON string
-    try:
-        json.loads(tool_call.args)
-        return True
-    except (json.JSONDecodeError, ValueError) as e:
-        # Log incomplete tool call detection
-        args_preview = (
-            tool_call.args[:100] + "..."
-            if len(tool_call.args) > 100
-            else tool_call.args
-        )
-        logger.info(
-            "Detected incomplete tool call in validation",
-            extra={
-                "tool_name": tool_call.tool_name,
-                "tool_call_id": tool_call.tool_call_id,
-                "args_preview": args_preview,
-                "error": str(e),
-            },
-        )
-        return False
-
-
-def filter_incomplete_messages(messages: list[ModelMessage]) -> list[ModelMessage]:
-    """Filter out messages with incomplete tool calls.
-
-    Args:
-        messages: List of messages to filter
-
-    Returns:
-        List of messages with only complete tool calls
-    """
-    filtered: list[ModelMessage] = []
-    filtered_count = 0
-    filtered_tool_names: list[str] = []
-
-    for message in messages:
-        # Only check ModelResponse messages for tool calls
-        if not isinstance(message, ModelResponse):
-            filtered.append(message)
-            continue
-
-        # Check if any tool calls are incomplete
-        has_incomplete_tool_call = False
-        for part in message.parts:
-            if isinstance(part, ToolCallPart) and not is_tool_call_complete(part):
-                has_incomplete_tool_call = True
-                filtered_tool_names.append(part.tool_name)
-                break
-
-        # Only include messages without incomplete tool calls
-        if not has_incomplete_tool_call:
-            filtered.append(message)
-        else:
-            filtered_count += 1
-
-    # Log if any messages were filtered
-    if filtered_count > 0:
-        logger.info(
-            "Filtered incomplete messages before saving",
-            extra={
-                "filtered_count": filtered_count,
-                "total_messages": len(messages),
-                "filtered_tool_names": filtered_tool_names,
-            },
-        )
-
-    return filtered
-
-
 class ConversationState(BaseModel):
     """Represents the complete state of a conversation in memory."""
 
@@ -144,6 +56,8 @@ class ConversationHistory(BaseModel):
         """
         # Filter out messages with incomplete tool calls to prevent corruption
        filtered_messages = filter_incomplete_messages(messages)
+        # Filter out orphaned tool responses (tool responses without tool calls)
+        filtered_messages = filter_orphaned_tool_responses(filtered_messages)
 
         # Serialize ModelMessage list to JSON-serializable format
         self.agent_history = to_jsonable_python(

shotgun/agents/error/models.py (new file)

@@ -0,0 +1,19 @@
+"""Pydantic models for agent error handling."""
+
+from typing import Any
+
+from pydantic import BaseModel, ConfigDict, Field
+
+
+class AgentErrorContext(BaseModel):
+    """Context information needed to classify and handle agent errors.
+
+    Attributes:
+        exception: The exception that was raised
+        is_shotgun_account: Whether the user is using a Shotgun Account
+    """
+
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+
+    exception: Any = Field(...)
+    is_shotgun_account: bool