shotgun-sh 0.2.6.dev1__py3-none-any.whl → 0.2.17__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- shotgun/agents/agent_manager.py +694 -73
- shotgun/agents/common.py +69 -70
- shotgun/agents/config/constants.py +0 -6
- shotgun/agents/config/manager.py +70 -35
- shotgun/agents/config/models.py +41 -1
- shotgun/agents/config/provider.py +33 -5
- shotgun/agents/context_analyzer/__init__.py +28 -0
- shotgun/agents/context_analyzer/analyzer.py +471 -0
- shotgun/agents/context_analyzer/constants.py +9 -0
- shotgun/agents/context_analyzer/formatter.py +115 -0
- shotgun/agents/context_analyzer/models.py +212 -0
- shotgun/agents/conversation_history.py +125 -2
- shotgun/agents/conversation_manager.py +57 -19
- shotgun/agents/export.py +6 -7
- shotgun/agents/history/compaction.py +9 -4
- shotgun/agents/history/context_extraction.py +93 -6
- shotgun/agents/history/history_processors.py +113 -5
- shotgun/agents/history/token_counting/anthropic.py +39 -3
- shotgun/agents/history/token_counting/base.py +14 -3
- shotgun/agents/history/token_counting/openai.py +11 -1
- shotgun/agents/history/token_counting/sentencepiece_counter.py +8 -0
- shotgun/agents/history/token_counting/tokenizer_cache.py +3 -1
- shotgun/agents/history/token_counting/utils.py +0 -3
- shotgun/agents/models.py +50 -2
- shotgun/agents/plan.py +6 -7
- shotgun/agents/research.py +7 -8
- shotgun/agents/specify.py +6 -7
- shotgun/agents/tasks.py +6 -7
- shotgun/agents/tools/__init__.py +0 -2
- shotgun/agents/tools/codebase/codebase_shell.py +6 -0
- shotgun/agents/tools/codebase/directory_lister.py +6 -0
- shotgun/agents/tools/codebase/file_read.py +11 -2
- shotgun/agents/tools/codebase/query_graph.py +6 -0
- shotgun/agents/tools/codebase/retrieve_code.py +6 -0
- shotgun/agents/tools/file_management.py +82 -16
- shotgun/agents/tools/registry.py +217 -0
- shotgun/agents/tools/web_search/__init__.py +8 -8
- shotgun/agents/tools/web_search/anthropic.py +8 -2
- shotgun/agents/tools/web_search/gemini.py +7 -1
- shotgun/agents/tools/web_search/openai.py +7 -1
- shotgun/agents/tools/web_search/utils.py +2 -2
- shotgun/agents/usage_manager.py +16 -11
- shotgun/api_endpoints.py +7 -3
- shotgun/build_constants.py +3 -3
- shotgun/cli/clear.py +53 -0
- shotgun/cli/compact.py +186 -0
- shotgun/cli/config.py +8 -5
- shotgun/cli/context.py +111 -0
- shotgun/cli/export.py +1 -1
- shotgun/cli/feedback.py +4 -2
- shotgun/cli/models.py +1 -0
- shotgun/cli/plan.py +1 -1
- shotgun/cli/research.py +1 -1
- shotgun/cli/specify.py +1 -1
- shotgun/cli/tasks.py +1 -1
- shotgun/cli/update.py +16 -2
- shotgun/codebase/core/change_detector.py +5 -3
- shotgun/codebase/core/code_retrieval.py +4 -2
- shotgun/codebase/core/ingestor.py +10 -8
- shotgun/codebase/core/manager.py +13 -4
- shotgun/codebase/core/nl_query.py +1 -1
- shotgun/exceptions.py +32 -0
- shotgun/logging_config.py +18 -27
- shotgun/main.py +73 -11
- shotgun/posthog_telemetry.py +37 -28
- shotgun/prompts/agents/export.j2 +18 -1
- shotgun/prompts/agents/partials/common_agent_system_prompt.j2 +5 -1
- shotgun/prompts/agents/partials/interactive_mode.j2 +24 -7
- shotgun/prompts/agents/plan.j2 +1 -1
- shotgun/prompts/agents/research.j2 +1 -1
- shotgun/prompts/agents/specify.j2 +270 -3
- shotgun/prompts/agents/tasks.j2 +1 -1
- shotgun/sentry_telemetry.py +163 -16
- shotgun/settings.py +238 -0
- shotgun/telemetry.py +18 -33
- shotgun/tui/app.py +243 -43
- shotgun/tui/commands/__init__.py +1 -1
- shotgun/tui/components/context_indicator.py +179 -0
- shotgun/tui/components/mode_indicator.py +70 -0
- shotgun/tui/components/status_bar.py +48 -0
- shotgun/tui/containers.py +91 -0
- shotgun/tui/dependencies.py +39 -0
- shotgun/tui/protocols.py +45 -0
- shotgun/tui/screens/chat/__init__.py +5 -0
- shotgun/tui/screens/chat/chat.tcss +54 -0
- shotgun/tui/screens/chat/chat_screen.py +1254 -0
- shotgun/tui/screens/chat/codebase_index_prompt_screen.py +64 -0
- shotgun/tui/screens/chat/codebase_index_selection.py +12 -0
- shotgun/tui/screens/chat/help_text.py +40 -0
- shotgun/tui/screens/chat/prompt_history.py +48 -0
- shotgun/tui/screens/chat.tcss +11 -0
- shotgun/tui/screens/chat_screen/command_providers.py +78 -2
- shotgun/tui/screens/chat_screen/history/__init__.py +22 -0
- shotgun/tui/screens/chat_screen/history/agent_response.py +66 -0
- shotgun/tui/screens/chat_screen/history/chat_history.py +115 -0
- shotgun/tui/screens/chat_screen/history/formatters.py +115 -0
- shotgun/tui/screens/chat_screen/history/partial_response.py +43 -0
- shotgun/tui/screens/chat_screen/history/user_question.py +42 -0
- shotgun/tui/screens/confirmation_dialog.py +151 -0
- shotgun/tui/screens/feedback.py +4 -4
- shotgun/tui/screens/github_issue.py +102 -0
- shotgun/tui/screens/model_picker.py +49 -24
- shotgun/tui/screens/onboarding.py +431 -0
- shotgun/tui/screens/pipx_migration.py +153 -0
- shotgun/tui/screens/provider_config.py +50 -27
- shotgun/tui/screens/shotgun_auth.py +2 -2
- shotgun/tui/screens/welcome.py +23 -12
- shotgun/tui/services/__init__.py +5 -0
- shotgun/tui/services/conversation_service.py +184 -0
- shotgun/tui/state/__init__.py +7 -0
- shotgun/tui/state/processing_state.py +185 -0
- shotgun/tui/utils/mode_progress.py +14 -7
- shotgun/tui/widgets/__init__.py +5 -0
- shotgun/tui/widgets/widget_coordinator.py +263 -0
- shotgun/utils/file_system_utils.py +22 -2
- shotgun/utils/marketing.py +110 -0
- shotgun/utils/update_checker.py +69 -14
- shotgun_sh-0.2.17.dist-info/METADATA +465 -0
- shotgun_sh-0.2.17.dist-info/RECORD +194 -0
- {shotgun_sh-0.2.6.dev1.dist-info → shotgun_sh-0.2.17.dist-info}/entry_points.txt +1 -0
- {shotgun_sh-0.2.6.dev1.dist-info → shotgun_sh-0.2.17.dist-info}/licenses/LICENSE +1 -1
- shotgun/agents/tools/user_interaction.py +0 -37
- shotgun/tui/screens/chat.py +0 -804
- shotgun/tui/screens/chat_screen/history.py +0 -401
- shotgun_sh-0.2.6.dev1.dist-info/METADATA +0 -467
- shotgun_sh-0.2.6.dev1.dist-info/RECORD +0 -156
- {shotgun_sh-0.2.6.dev1.dist-info → shotgun_sh-0.2.17.dist-info}/WHEEL +0 -0
shotgun/agents/config/models.py
CHANGED
@@ -1,5 +1,6 @@
 """Pydantic models for configuration."""
 
+from datetime import datetime
 from enum import StrEnum
 
 from pydantic import BaseModel, Field, PrivateAttr, SecretStr
@@ -28,6 +29,7 @@ class ModelName(StrEnum):
     GPT_5_MINI = "gpt-5-mini"
     CLAUDE_OPUS_4_1 = "claude-opus-4-1"
     CLAUDE_SONNET_4_5 = "claude-sonnet-4-5"
+    CLAUDE_HAIKU_4_5 = "claude-haiku-4-5"
     GEMINI_2_5_PRO = "gemini-2.5-pro"
     GEMINI_2_5_FLASH = "gemini-2.5-flash"
 
@@ -42,6 +44,7 @@ class ModelSpec(BaseModel):
     litellm_proxy_model_name: (
         str  # LiteLLM format (e.g., "openai/gpt-5", "gemini/gemini-2-pro")
     )
+    short_name: str  # Display name for UI (e.g., "Sonnet 4.5", "GPT-5")
 
 
 class ModelConfig(BaseModel):
@@ -88,6 +91,7 @@ MODEL_SPECS: dict[ModelName, ModelSpec] = {
         max_input_tokens=400_000,
         max_output_tokens=128_000,
         litellm_proxy_model_name="openai/gpt-5",
+        short_name="GPT-5",
     ),
     ModelName.GPT_5_MINI: ModelSpec(
         name=ModelName.GPT_5_MINI,
@@ -95,6 +99,7 @@ MODEL_SPECS: dict[ModelName, ModelSpec] = {
         max_input_tokens=400_000,
         max_output_tokens=128_000,
         litellm_proxy_model_name="openai/gpt-5-mini",
+        short_name="GPT-5 Mini",
     ),
     ModelName.CLAUDE_OPUS_4_1: ModelSpec(
         name=ModelName.CLAUDE_OPUS_4_1,
@@ -102,6 +107,7 @@ MODEL_SPECS: dict[ModelName, ModelSpec] = {
         max_input_tokens=200_000,
         max_output_tokens=32_000,
         litellm_proxy_model_name="anthropic/claude-opus-4-1",
+        short_name="Opus 4.1",
     ),
     ModelName.CLAUDE_SONNET_4_5: ModelSpec(
         name=ModelName.CLAUDE_SONNET_4_5,
@@ -109,6 +115,15 @@ MODEL_SPECS: dict[ModelName, ModelSpec] = {
         max_input_tokens=200_000,
         max_output_tokens=16_000,
         litellm_proxy_model_name="anthropic/claude-sonnet-4-5",
+        short_name="Sonnet 4.5",
+    ),
+    ModelName.CLAUDE_HAIKU_4_5: ModelSpec(
+        name=ModelName.CLAUDE_HAIKU_4_5,
+        provider=ProviderType.ANTHROPIC,
+        max_input_tokens=200_000,
+        max_output_tokens=64_000,
+        litellm_proxy_model_name="anthropic/claude-haiku-4-5",
+        short_name="Haiku 4.5",
     ),
     ModelName.GEMINI_2_5_PRO: ModelSpec(
         name=ModelName.GEMINI_2_5_PRO,
@@ -116,6 +131,7 @@ MODEL_SPECS: dict[ModelName, ModelSpec] = {
         max_input_tokens=1_000_000,
         max_output_tokens=64_000,
         litellm_proxy_model_name="gemini/gemini-2.5-pro",
+        short_name="Gemini 2.5 Pro",
     ),
     ModelName.GEMINI_2_5_FLASH: ModelSpec(
         name=ModelName.GEMINI_2_5_FLASH,
@@ -123,6 +139,7 @@ MODEL_SPECS: dict[ModelName, ModelSpec] = {
         max_input_tokens=1_000_000,
         max_output_tokens=64_000,
         litellm_proxy_model_name="gemini/gemini-2.5-flash",
+        short_name="Gemini 2.5 Flash",
     ),
 }
 
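The new short_name field above gives every MODEL_SPECS entry a compact display label. A minimal sketch of how a UI component might consume it; the format_model_label helper is illustrative and not part of this diff:

from shotgun.agents.config.models import MODEL_SPECS, ModelName


def format_model_label(model: ModelName) -> str:
    # Hypothetical helper: combine the new short_name with the context window size.
    spec = MODEL_SPECS[model]
    return f"{spec.short_name} ({spec.max_input_tokens // 1000}k context)"


# e.g. "Haiku 4.5 (200k context)"
label = format_model_label(ModelName.CLAUDE_HAIKU_4_5)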
@@ -154,6 +171,21 @@ class ShotgunAccountConfig(BaseModel):
     )
 
 
+class MarketingMessageRecord(BaseModel):
+    """Record of when a marketing message was shown to the user."""
+
+    shown_at: datetime = Field(description="Timestamp when the message was shown")
+
+
+class MarketingConfig(BaseModel):
+    """Configuration for marketing messages shown to users."""
+
+    messages: dict[str, MarketingMessageRecord] = Field(
+        default_factory=dict,
+        description="Tracking which marketing messages have been shown. Key is message ID (e.g., 'github_star_v1')",
+    )
+
+
 class ShotgunConfig(BaseModel):
     """Main configuration for Shotgun CLI."""
 
@@ -168,8 +200,16 @@ class ShotgunConfig(BaseModel):
     shotgun_instance_id: str = Field(
         description="Unique shotgun instance identifier (also used for anonymous telemetry)",
     )
-    config_version: int = Field(default=
+    config_version: int = Field(default=4, description="Configuration schema version")
     shown_welcome_screen: bool = Field(
         default=False,
         description="Whether the welcome screen has been shown to the user",
     )
+    shown_onboarding_popup: datetime | None = Field(
+        default=None,
+        description="Timestamp when the onboarding popup was shown to the user (ISO8601 format)",
+    )
+    marketing: MarketingConfig = Field(
+        default_factory=MarketingConfig,
+        description="Marketing messages configuration and tracking",
+    )
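The marketing tracking added above is an ID-to-timestamp map. A minimal sketch of recording and checking a shown message; the message ID follows the 'github_star_v1' convention from the field description, and the surrounding code is illustrative:

from datetime import UTC, datetime

from shotgun.agents.config.models import MarketingConfig, MarketingMessageRecord

marketing = MarketingConfig()

# Record that the GitHub-star prompt was shown.
marketing.messages["github_star_v1"] = MarketingMessageRecord(shown_at=datetime.now(UTC))

# Later: only show messages that have not been recorded yet.
already_shown = "github_star_v1" in marketing.messages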
shotgun/agents/config/provider.py
CHANGED
@@ -32,6 +32,34 @@ logger = get_logger(__name__)
 _model_cache: dict[tuple[ProviderType, KeyProvider, ModelName, str], Model] = {}
 
 
+def get_default_model_for_provider(config: ShotgunConfig) -> ModelName:
+    """Get the default model based on which provider/account is configured.
+
+    Checks API keys in priority order and returns appropriate default model.
+    Treats Shotgun Account as a provider context.
+
+    Args:
+        config: Shotgun configuration containing API keys
+
+    Returns:
+        Default ModelName for the configured provider/account
+    """
+    # Priority 1: Shotgun Account
+    if _get_api_key(config.shotgun.api_key):
+        return ModelName.GPT_5
+
+    # Priority 2: Individual provider keys
+    if _get_api_key(config.anthropic.api_key):
+        return ModelName.CLAUDE_HAIKU_4_5
+    if _get_api_key(config.openai.api_key):
+        return ModelName.GPT_5
+    if _get_api_key(config.google.api_key):
+        return ModelName.GEMINI_2_5_PRO
+
+    # Fallback: system-wide default
+    return ModelName.CLAUDE_HAIKU_4_5
+
+
 def get_or_create_model(
     provider: ProviderType,
     key_provider: "KeyProvider",
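A minimal sketch of how this helper might be called; the config manager import path and its async load() are assumptions inferred from other hunks in this diff:

from shotgun.agents.config.manager import get_config_manager  # assumed import path
from shotgun.agents.config.provider import get_default_model_for_provider


async def pick_default_model():
    config = await get_config_manager().load(force_reload=False)
    # Shotgun account -> GPT-5; Anthropic key -> Haiku 4.5; OpenAI key -> GPT-5;
    # Google key -> Gemini 2.5 Pro; otherwise falls back to Haiku 4.5.
    return get_default_model_for_provider(config)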
@@ -142,7 +170,7 @@
     return _model_cache[cache_key]
 
 
-def get_provider_model(
+async def get_provider_model(
     provider_or_model: ProviderType | ModelName | None = None,
 ) -> ModelConfig:
     """Get a fully configured ModelConfig with API key and Model instance.
@@ -161,7 +189,7 @@
     """
     config_manager = get_config_manager()
     # Use cached config for read-only access (performance)
-    config = config_manager.load(force_reload=False)
+    config = await config_manager.load(force_reload=False)
 
     # Priority 1: Check if Shotgun key exists - if so, use it for ANY model
     shotgun_api_key = _get_api_key(config.shotgun.api_key)
@@ -172,7 +200,7 @@
         model_name = provider_or_model
     else:
         # No specific model requested - use selected or default
-        model_name = config.selected_model or ModelName.
+        model_name = config.selected_model or ModelName.GPT_5
 
     if model_name not in MODEL_SPECS:
         raise ValueError(f"Model '{model_name.value}' not found")
@@ -247,8 +275,8 @@
     if not api_key:
         raise ValueError("Anthropic API key not configured. Set via config.")
 
-    # Use requested model or default to claude-
-    model_name = requested_model if requested_model else ModelName.
+    # Use requested model or default to claude-haiku-4-5
+    model_name = requested_model if requested_model else ModelName.CLAUDE_HAIKU_4_5
     if model_name not in MODEL_SPECS:
         raise ValueError(f"Model '{model_name.value}' not found")
     spec = MODEL_SPECS[model_name]
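Since get_provider_model is now a coroutine, existing call sites need an await from async code; a minimal sketch of the updated call shape (the caller is illustrative):

from shotgun.agents.config.models import ModelName
from shotgun.agents.config.provider import get_provider_model


async def load_model_config():
    # Previously a plain call; now awaited because config loading is async.
    return await get_provider_model(ModelName.CLAUDE_HAIKU_4_5)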
shotgun/agents/context_analyzer/__init__.py
ADDED
@@ -0,0 +1,28 @@
+"""Context analysis module for conversation composition statistics.
+
+This module provides tools for analyzing conversation context usage, breaking down
+token consumption by message type and tool category.
+"""
+
+from .analyzer import ContextAnalyzer
+from .constants import ToolCategory, get_tool_category
+from .formatter import ContextFormatter
+from .models import (
+    ContextAnalysis,
+    ContextAnalysisOutput,
+    ContextCompositionTelemetry,
+    MessageTypeStats,
+    TokenAllocation,
+)
+
+__all__ = [
+    "ContextAnalyzer",
+    "ContextAnalysis",
+    "ContextAnalysisOutput",
+    "ContextCompositionTelemetry",
+    "ContextFormatter",
+    "MessageTypeStats",
+    "TokenAllocation",
+    "ToolCategory",
+    "get_tool_category",
+]
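The exports above are meant to be used together; a minimal sketch of driving the analyzer, assuming the model config and the two message histories come from an existing conversation:

from shotgun.agents.context_analyzer import ContextAnalyzer


async def summarize_context(model_config, message_history, ui_message_history):
    analyzer = ContextAnalyzer(model_config)
    analysis = await analyzer.analyze_conversation(message_history, ui_message_history)
    # ContextAnalysis carries per-category counts/tokens plus totals and free space.
    return analysis.total_tokens, analysis.free_space_tokens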
shotgun/agents/context_analyzer/analyzer.py
ADDED
@@ -0,0 +1,471 @@
+"""Core context analysis logic."""
+
+import json
+from collections.abc import Sequence
+
+from pydantic_ai.messages import (
+    ModelMessage,
+    ModelRequest,
+    ModelResponse,
+    SystemPromptPart,
+    TextPart,
+    ToolCallPart,
+    ToolReturnPart,
+    UserPromptPart,
+)
+
+from shotgun.agents.config.models import ModelConfig
+from shotgun.agents.history.token_counting.utils import count_tokens_from_messages
+from shotgun.agents.history.token_estimation import estimate_tokens_from_messages
+from shotgun.agents.messages import AgentSystemPrompt, SystemStatusPrompt
+from shotgun.logging_config import get_logger
+from shotgun.tui.screens.chat_screen.hint_message import HintMessage
+
+from .constants import ToolCategory, get_tool_category
+from .models import ContextAnalysis, MessageTypeStats, TokenAllocation
+
+logger = get_logger(__name__)
+
+
+class ContextAnalyzer:
+    """Analyzes conversation message history for context composition."""
+
+    def __init__(self, model_config: ModelConfig):
+        """Initialize the analyzer with model configuration for token counting.
+
+        Args:
+            model_config: Model configuration for accurate token counting
+        """
+        self.model_config = model_config
+
+    async def _allocate_tokens_from_usage(
+        self,
+        message_history: list[ModelMessage],
+    ) -> TokenAllocation:
+        """Allocate tokens from actual API usage data proportionally to parts.
+
+        This uses the ground truth token counts from ModelResponse.usage instead of
+        creating synthetic messages, which avoids inflating counts with message framing overhead.
+
+        IMPORTANT: usage.input_tokens is cumulative (includes all conversation history), so we:
+        1. Use the LAST response's input_tokens as the ground truth total
+        2. Calculate proportions based on content size across ALL requests
+        3. Allocate the ground truth total proportionally
+
+        If usage data is missing or zero (e.g., after compaction), falls back to token estimation.
+
+        Args:
+            message_history: List of actual messages from conversation
+
+        Returns:
+            TokenAllocation with token counts by message/tool type
+        """
+        # Step 1: Find the last response's usage data (ground truth for input tokens)
+        last_input_tokens = 0
+        total_output_tokens = 0
+
+        for msg in reversed(message_history):
+            if isinstance(msg, ModelResponse) and msg.usage:
+                last_input_tokens = msg.usage.input_tokens + msg.usage.cache_read_tokens
+                break
+
+        if last_input_tokens == 0:
+            # Fallback to token estimation (no logging to reduce verbosity)
+            last_input_tokens = await estimate_tokens_from_messages(
+                message_history, self.model_config
+            )
+
+        # Step 2: Calculate total output tokens (sum across all responses)
+        for msg in message_history:
+            if isinstance(msg, ModelResponse) and msg.usage:
+                total_output_tokens += msg.usage.output_tokens
+
+        # Step 3: Calculate content size proportions for each part type across ALL requests
+        # Initialize size accumulators
+        user_size = 0
+        system_prompts_size = 0
+        system_status_size = 0
+        codebase_understanding_input_size = 0
+        artifact_management_input_size = 0
+        web_research_input_size = 0
+        unknown_input_size = 0
+
+        for msg in message_history:
+            if isinstance(msg, ModelRequest):
+                for part in msg.parts:
+                    if isinstance(part, (SystemPromptPart, UserPromptPart)):
+                        size = len(part.content)
+                    elif isinstance(part, ToolReturnPart):
+                        # ToolReturnPart.content can be Any type
+                        try:
+                            content_str = (
+                                json.dumps(part.content)
+                                if part.content is not None
+                                else ""
+                            )
+                        except (TypeError, ValueError):
+                            content_str = (
+                                str(part.content) if part.content is not None else ""
+                            )
+                        size = len(content_str)
+                    else:
+                        size = 0
+
+                    # Categorize by part type
+                    # Note: Check subclasses first (AgentSystemPrompt, SystemStatusPrompt)
+                    # before checking base class (SystemPromptPart)
+                    if isinstance(part, SystemStatusPrompt):
+                        system_status_size += size
+                    elif isinstance(part, AgentSystemPrompt):
+                        system_prompts_size += size
+                    elif isinstance(part, SystemPromptPart):
+                        # Generic system prompt (not AgentSystemPrompt or SystemStatusPrompt)
+                        system_prompts_size += size
+                    elif isinstance(part, UserPromptPart):
+                        user_size += size
+                    elif isinstance(part, ToolReturnPart):
+                        # Categorize tool results by tool category
+                        category = get_tool_category(part.tool_name)
+                        if category == ToolCategory.CODEBASE_UNDERSTANDING:
+                            codebase_understanding_input_size += size
+                        elif category == ToolCategory.ARTIFACT_MANAGEMENT:
+                            artifact_management_input_size += size
+                        elif category == ToolCategory.WEB_RESEARCH:
+                            web_research_input_size += size
+                        elif category == ToolCategory.UNKNOWN:
+                            unknown_input_size += size
+
+        # Step 4: Calculate output proportions by tool category
+        codebase_understanding_size = 0
+        artifact_management_size = 0
+        web_research_size = 0
+        unknown_size = 0
+        agent_response_size = 0
+
+        for msg in message_history:
+            if isinstance(msg, ModelResponse):
+                for part in msg.parts:  # type: ignore[assignment]
+                    if isinstance(part, ToolCallPart):
+                        category = get_tool_category(part.tool_name)
+                        size = len(str(part.args))
+
+                        if category == ToolCategory.AGENT_RESPONSE:
+                            agent_response_size += size
+                        elif category == ToolCategory.CODEBASE_UNDERSTANDING:
+                            codebase_understanding_size += size
+                        elif category == ToolCategory.ARTIFACT_MANAGEMENT:
+                            artifact_management_size += size
+                        elif category == ToolCategory.WEB_RESEARCH:
+                            web_research_size += size
+                        elif category == ToolCategory.UNKNOWN:
+                            unknown_size += size
+                    elif isinstance(part, TextPart):
+                        agent_response_size += len(part.content)
+
+        # Step 5: Allocate input tokens proportionally
+        # Initialize TokenAllocation fields
+        user_tokens = 0
+        agent_response_tokens = 0
+        system_prompt_tokens = 0
+        system_status_tokens = 0
+        codebase_understanding_tokens = 0
+        artifact_management_tokens = 0
+        web_research_tokens = 0
+        unknown_tokens = 0
+
+        total_input_size = (
+            user_size
+            + system_prompts_size
+            + system_status_size
+            + codebase_understanding_input_size
+            + artifact_management_input_size
+            + web_research_input_size
+            + unknown_input_size
+        )
+
+        if total_input_size > 0 and last_input_tokens > 0:
+            user_tokens = int(last_input_tokens * (user_size / total_input_size))
+            system_prompt_tokens = int(
+                last_input_tokens * (system_prompts_size / total_input_size)
+            )
+            system_status_tokens = int(
+                last_input_tokens * (system_status_size / total_input_size)
+            )
+            codebase_understanding_tokens = int(
+                last_input_tokens
+                * (codebase_understanding_input_size / total_input_size)
+            )
+            artifact_management_tokens = int(
+                last_input_tokens * (artifact_management_input_size / total_input_size)
+            )
+            web_research_tokens = int(
+                last_input_tokens * (web_research_input_size / total_input_size)
+            )
+            unknown_tokens = int(
+                last_input_tokens * (unknown_input_size / total_input_size)
+            )
+
+        # Step 6: Allocate output tokens proportionally
+        total_output_size = (
+            codebase_understanding_size
+            + artifact_management_size
+            + web_research_size
+            + unknown_size
+            + agent_response_size
+        )
+
+        if total_output_size > 0 and total_output_tokens > 0:
+            codebase_understanding_tokens += int(
+                total_output_tokens * (codebase_understanding_size / total_output_size)
+            )
+            artifact_management_tokens += int(
+                total_output_tokens * (artifact_management_size / total_output_size)
+            )
+            web_research_tokens += int(
+                total_output_tokens * (web_research_size / total_output_size)
+            )
+            unknown_tokens += int(
+                total_output_tokens * (unknown_size / total_output_size)
+            )
+            agent_response_tokens += int(
+                total_output_tokens * (agent_response_size / total_output_size)
+            )
+        elif total_output_tokens > 0:
+            # If no content, put all in agent responses
+            agent_response_tokens = total_output_tokens
+
+        # Token allocation complete (no logging to reduce verbosity)
+
+        # Create TokenAllocation model
+        return TokenAllocation(
+            user=user_tokens,
+            agent_responses=agent_response_tokens,
+            system_prompts=system_prompt_tokens,
+            system_status=system_status_tokens,
+            codebase_understanding=codebase_understanding_tokens,
+            artifact_management=artifact_management_tokens,
+            web_research=web_research_tokens,
+            unknown=unknown_tokens,
+        )
+
+    async def analyze_conversation(
+        self,
+        message_history: list[ModelMessage],
+        ui_message_history: list[ModelMessage | HintMessage],
+    ) -> ContextAnalysis:
+        """Analyze the conversation to determine message type composition.
+
+        Args:
+            message_history: The agent message history (for token counting)
+            ui_message_history: The UI message history (includes hints)
+
+        Returns:
+            ContextAnalysis with statistics for each message type
+        """
+        # Track counts for each message type
+        user_count = 0
+        agent_responses_count = 0
+        system_prompts_count = 0
+        system_status_count = 0
+        codebase_understanding_count = 0
+        artifact_management_count = 0
+        web_research_count = 0
+        unknown_count = 0
+
+        # Analyze message_history to count message types
+        for msg in message_history:
+            if isinstance(msg, ModelRequest):
+                # Track what types are in this message for counting
+                has_user_prompt = False
+                has_system_prompt = False
+                has_system_status = False
+
+                # Check what part types this message contains
+                for part in msg.parts:
+                    if isinstance(part, AgentSystemPrompt):
+                        has_system_prompt = True
+                    elif isinstance(part, SystemStatusPrompt):
+                        has_system_status = True
+                    elif isinstance(part, SystemPromptPart):
+                        # Generic system prompt
+                        has_system_prompt = True
+                    elif isinstance(part, UserPromptPart):
+                        has_user_prompt = True
+                    elif isinstance(part, ToolReturnPart):
+                        # Categorize tool results by category
+                        category = get_tool_category(part.tool_name)
+                        if category == ToolCategory.CODEBASE_UNDERSTANDING:
+                            codebase_understanding_count += 1
+                        elif category == ToolCategory.ARTIFACT_MANAGEMENT:
+                            artifact_management_count += 1
+                        elif category == ToolCategory.WEB_RESEARCH:
+                            web_research_count += 1
+                        elif category == ToolCategory.UNKNOWN:
+                            unknown_count += 1
+
+                # Count the message types (only count once per message)
+                if has_system_prompt:
+                    system_prompts_count += 1
+                if has_system_status:
+                    system_status_count += 1
+                if has_user_prompt:
+                    user_count += 1
+
+            elif isinstance(msg, ModelResponse):
+                # Agent responses - count entire response as one
+                agent_responses_count += 1
+
+                # Check for tool calls in the response
+                for part in msg.parts:  # type: ignore[assignment]
+                    if isinstance(part, ToolCallPart):
+                        category = get_tool_category(part.tool_name)
+                        if category == ToolCategory.CODEBASE_UNDERSTANDING:
+                            codebase_understanding_count += 1
+                        elif category == ToolCategory.ARTIFACT_MANAGEMENT:
+                            artifact_management_count += 1
+                        elif category == ToolCategory.WEB_RESEARCH:
+                            web_research_count += 1
+                        elif category == ToolCategory.UNKNOWN:
+                            unknown_count += 1
+
+        # Count hints from ui_message_history
+        hint_count = sum(
+            1 for msg in ui_message_history if isinstance(msg, HintMessage)
+        )
+
+        # Use actual API usage data for accurate token counting (avoids synthetic message overhead)
+        usage_tokens = await self._allocate_tokens_from_usage(message_history)
+
+        user_tokens = usage_tokens.user
+        agent_response_tokens = usage_tokens.agent_responses
+        system_prompt_tokens = usage_tokens.system_prompts
+        system_status_tokens = usage_tokens.system_status
+        codebase_understanding_tokens = usage_tokens.codebase_understanding
+        artifact_management_tokens = usage_tokens.artifact_management
+        web_research_tokens = usage_tokens.web_research
+        unknown_tokens = usage_tokens.unknown
+
+        # Estimate hint tokens (rough estimate based on character count)
+        hint_tokens = 0
+        for msg in ui_message_history:  # type: ignore[assignment]
+            if isinstance(msg, HintMessage):
+                # Rough estimate: ~4 chars per token
+                hint_tokens += len(msg.message) // 4
+
+        # Calculate agent context tokens (excluding UI-only hints)
+        agent_context_tokens = (
+            user_tokens
+            + agent_response_tokens
+            + system_prompt_tokens
+            + system_status_tokens
+            + codebase_understanding_tokens
+            + artifact_management_tokens
+            + web_research_tokens
+            + unknown_tokens
+        )
+
+        # Total tokens includes hints for display purposes, but agent_context_tokens does not
+        total_tokens = agent_context_tokens + hint_tokens
+        total_messages = (
+            user_count
+            + agent_responses_count
+            + system_prompts_count
+            + system_status_count
+            + codebase_understanding_count
+            + artifact_management_count
+            + web_research_count
+            + unknown_count
+            + hint_count
+        )
+
+        # Calculate usable context limit (80% of max_input_tokens) and free space
+        # This matches the TOKEN_LIMIT_RATIO = 0.8 from history/constants.py
+        max_usable_tokens = int(self.model_config.max_input_tokens * 0.8)
+        free_space_tokens = max_usable_tokens - agent_context_tokens
+
+        return ContextAnalysis(
+            user_messages=MessageTypeStats(count=user_count, tokens=user_tokens),
+            agent_responses=MessageTypeStats(
+                count=agent_responses_count, tokens=agent_response_tokens
+            ),
+            system_prompts=MessageTypeStats(
+                count=system_prompts_count, tokens=system_prompt_tokens
+            ),
+            system_status=MessageTypeStats(
+                count=system_status_count, tokens=system_status_tokens
+            ),
+            codebase_understanding=MessageTypeStats(
+                count=codebase_understanding_count,
+                tokens=codebase_understanding_tokens,
+            ),
+            artifact_management=MessageTypeStats(
+                count=artifact_management_count, tokens=artifact_management_tokens
+            ),
+            web_research=MessageTypeStats(
+                count=web_research_count, tokens=web_research_tokens
+            ),
+            unknown=MessageTypeStats(count=unknown_count, tokens=unknown_tokens),
+            hint_messages=MessageTypeStats(count=hint_count, tokens=hint_tokens),
+            total_tokens=total_tokens,
+            total_messages=total_messages,
+            context_window=self.model_config.max_input_tokens,
+            agent_context_tokens=agent_context_tokens,
+            model_name=self.model_config.name.value,
+            max_usable_tokens=max_usable_tokens,
+            free_space_tokens=free_space_tokens,
+        )
+
+    async def _count_tokens_for_parts(
+        self,
+        parts: Sequence[
+            UserPromptPart | SystemPromptPart | ToolReturnPart | ToolCallPart
+        ],
+        part_type: str,
+    ) -> int:
+        """Count tokens for a list of parts by creating synthetic single-part messages.
+
+        This avoids double-counting when a message contains multiple part types.
+
+        Args:
+            parts: List of parts to count tokens for
+            part_type: Type of parts ("user", "system", "tool_return", "tool_call")
+
+        Returns:
+            Total token count for all parts
+        """
+        if not parts:
+            return 0
+
+        # Create synthetic messages with single parts for accurate token counting
+        synthetic_messages: list[ModelMessage] = []
+
+        for part in parts:
+            if part_type in ("user", "system", "tool_return"):
+                # These are request parts - wrap in ModelRequest
+                synthetic_messages.append(ModelRequest(parts=[part]))  # type: ignore[list-item]
+            elif part_type == "tool_call":
+                # Tool calls are in responses - wrap in ModelResponse
+                synthetic_messages.append(ModelResponse(parts=[part]))  # type: ignore[list-item]
+
+        # Count tokens for the synthetic messages
+        return await self._count_tokens_safe(synthetic_messages)
+
+    async def _count_tokens_safe(self, messages: Sequence[ModelMessage]) -> int:
+        """Count tokens for a list of messages, returning 0 on error.
+
+        Args:
+            messages: List of messages to count tokens for
+
+        Returns:
+            Token count or 0 if counting fails
+        """
+        if not messages:
+            return 0
+
+        try:
+            return await count_tokens_from_messages(list(messages), self.model_config)
+        except Exception as e:
+            logger.warning(f"Failed to count tokens: {e}")
+            # Fallback to rough estimate
+            total_chars = sum(len(str(msg)) for msg in messages)
+            return total_chars // 4  # Rough estimate: 4 chars per token