PyPI - code-puppy - Versions diffs - 0.0.214__py3-none-any.whl → 0.0.366__py3-none-any.whl - Mend

code-puppy 0.0.214-py3-none-any.whl → 0.0.366-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (231) hide show

code_puppy/__init__.py +7 -1
code_puppy/agents/__init__.py +2 -0
code_puppy/agents/agent_c_reviewer.py +59 -6
code_puppy/agents/agent_code_puppy.py +7 -1
code_puppy/agents/agent_code_reviewer.py +12 -2
code_puppy/agents/agent_cpp_reviewer.py +73 -6
code_puppy/agents/agent_creator_agent.py +45 -4
code_puppy/agents/agent_golang_reviewer.py +92 -3
code_puppy/agents/agent_javascript_reviewer.py +101 -8
code_puppy/agents/agent_manager.py +81 -4
code_puppy/agents/agent_pack_leader.py +383 -0
code_puppy/agents/agent_planning.py +163 -0
code_puppy/agents/agent_python_programmer.py +165 -0
code_puppy/agents/agent_python_reviewer.py +28 -6
code_puppy/agents/agent_qa_expert.py +98 -6
code_puppy/agents/agent_qa_kitten.py +12 -7
code_puppy/agents/agent_security_auditor.py +113 -3
code_puppy/agents/agent_terminal_qa.py +323 -0
code_puppy/agents/agent_typescript_reviewer.py +106 -7
code_puppy/agents/base_agent.py +802 -176
code_puppy/agents/event_stream_handler.py +350 -0
code_puppy/agents/pack/__init__.py +34 -0
code_puppy/agents/pack/bloodhound.py +304 -0
code_puppy/agents/pack/husky.py +321 -0
code_puppy/agents/pack/retriever.py +393 -0
code_puppy/agents/pack/shepherd.py +348 -0
code_puppy/agents/pack/terrier.py +287 -0
code_puppy/agents/pack/watchdog.py +367 -0
code_puppy/agents/prompt_reviewer.py +145 -0
code_puppy/agents/subagent_stream_handler.py +276 -0
code_puppy/api/__init__.py +13 -0
code_puppy/api/app.py +169 -0
code_puppy/api/main.py +21 -0
code_puppy/api/pty_manager.py +446 -0
code_puppy/api/routers/__init__.py +12 -0
code_puppy/api/routers/agents.py +36 -0
code_puppy/api/routers/commands.py +217 -0
code_puppy/api/routers/config.py +74 -0
code_puppy/api/routers/sessions.py +232 -0
code_puppy/api/templates/terminal.html +361 -0
code_puppy/api/websocket.py +154 -0
code_puppy/callbacks.py +142 -4
code_puppy/chatgpt_codex_client.py +283 -0
code_puppy/claude_cache_client.py +586 -0
code_puppy/cli_runner.py +916 -0
code_puppy/command_line/add_model_menu.py +1079 -0
code_puppy/command_line/agent_menu.py +395 -0
code_puppy/command_line/attachments.py +10 -5
code_puppy/command_line/autosave_menu.py +605 -0
code_puppy/command_line/clipboard.py +527 -0
code_puppy/command_line/colors_menu.py +520 -0
code_puppy/command_line/command_handler.py +176 -738
code_puppy/command_line/command_registry.py +150 -0
code_puppy/command_line/config_commands.py +715 -0
code_puppy/command_line/core_commands.py +792 -0
code_puppy/command_line/diff_menu.py +863 -0
code_puppy/command_line/load_context_completion.py +15 -22
code_puppy/command_line/mcp/base.py +0 -3
code_puppy/command_line/mcp/catalog_server_installer.py +175 -0
code_puppy/command_line/mcp/custom_server_form.py +688 -0
code_puppy/command_line/mcp/custom_server_installer.py +195 -0
code_puppy/command_line/mcp/edit_command.py +148 -0
code_puppy/command_line/mcp/handler.py +9 -4
code_puppy/command_line/mcp/help_command.py +6 -5
code_puppy/command_line/mcp/install_command.py +15 -26
code_puppy/command_line/mcp/install_menu.py +685 -0
code_puppy/command_line/mcp/list_command.py +2 -2
code_puppy/command_line/mcp/logs_command.py +174 -65
code_puppy/command_line/mcp/remove_command.py +2 -2
code_puppy/command_line/mcp/restart_command.py +12 -4
code_puppy/command_line/mcp/search_command.py +16 -10
code_puppy/command_line/mcp/start_all_command.py +18 -6
code_puppy/command_line/mcp/start_command.py +47 -25
code_puppy/command_line/mcp/status_command.py +4 -5
code_puppy/command_line/mcp/stop_all_command.py +7 -1
code_puppy/command_line/mcp/stop_command.py +8 -4
code_puppy/command_line/mcp/test_command.py +2 -2
code_puppy/command_line/mcp/wizard_utils.py +20 -16
code_puppy/command_line/mcp_completion.py +174 -0
code_puppy/command_line/model_picker_completion.py +75 -25
code_puppy/command_line/model_settings_menu.py +884 -0
code_puppy/command_line/motd.py +14 -8
code_puppy/command_line/onboarding_slides.py +179 -0
code_puppy/command_line/onboarding_wizard.py +340 -0
code_puppy/command_line/pin_command_completion.py +329 -0
code_puppy/command_line/prompt_toolkit_completion.py +463 -63
code_puppy/command_line/session_commands.py +296 -0
code_puppy/command_line/utils.py +54 -0
code_puppy/config.py +898 -112
code_puppy/error_logging.py +118 -0
code_puppy/gemini_code_assist.py +385 -0
code_puppy/gemini_model.py +602 -0
code_puppy/http_utils.py +210 -148
code_puppy/keymap.py +128 -0
code_puppy/main.py +5 -698
code_puppy/mcp_/__init__.py +17 -0
code_puppy/mcp_/async_lifecycle.py +35 -4
code_puppy/mcp_/blocking_startup.py +70 -43
code_puppy/mcp_/captured_stdio_server.py +2 -2
code_puppy/mcp_/config_wizard.py +4 -4
code_puppy/mcp_/dashboard.py +15 -6
code_puppy/mcp_/managed_server.py +65 -38
code_puppy/mcp_/manager.py +146 -52
code_puppy/mcp_/mcp_logs.py +224 -0
code_puppy/mcp_/registry.py +6 -6
code_puppy/mcp_/server_registry_catalog.py +24 -5
code_puppy/messaging/__init__.py +199 -2
code_puppy/messaging/bus.py +610 -0
code_puppy/messaging/commands.py +167 -0
code_puppy/messaging/markdown_patches.py +57 -0
code_puppy/messaging/message_queue.py +17 -48
code_puppy/messaging/messages.py +500 -0
code_puppy/messaging/queue_console.py +1 -24
code_puppy/messaging/renderers.py +43 -146
code_puppy/messaging/rich_renderer.py +1027 -0
code_puppy/messaging/spinner/__init__.py +21 -5
code_puppy/messaging/spinner/console_spinner.py +86 -51
code_puppy/messaging/subagent_console.py +461 -0
code_puppy/model_factory.py +634 -83
code_puppy/model_utils.py +167 -0
code_puppy/models.json +66 -68
code_puppy/models_dev_api.json +1 -0
code_puppy/models_dev_parser.py +592 -0
code_puppy/plugins/__init__.py +164 -10
code_puppy/plugins/antigravity_oauth/__init__.py +10 -0
code_puppy/plugins/antigravity_oauth/accounts.py +406 -0
code_puppy/plugins/antigravity_oauth/antigravity_model.py +704 -0
code_puppy/plugins/antigravity_oauth/config.py +42 -0
code_puppy/plugins/antigravity_oauth/constants.py +136 -0
code_puppy/plugins/antigravity_oauth/oauth.py +478 -0
code_puppy/plugins/antigravity_oauth/register_callbacks.py +406 -0
code_puppy/plugins/antigravity_oauth/storage.py +271 -0
code_puppy/plugins/antigravity_oauth/test_plugin.py +319 -0
code_puppy/plugins/antigravity_oauth/token.py +167 -0
code_puppy/plugins/antigravity_oauth/transport.py +767 -0
code_puppy/plugins/antigravity_oauth/utils.py +169 -0
code_puppy/plugins/chatgpt_oauth/__init__.py +8 -0
code_puppy/plugins/chatgpt_oauth/config.py +52 -0
code_puppy/plugins/chatgpt_oauth/oauth_flow.py +328 -0
code_puppy/plugins/chatgpt_oauth/register_callbacks.py +94 -0
code_puppy/plugins/chatgpt_oauth/test_plugin.py +293 -0
code_puppy/plugins/chatgpt_oauth/utils.py +489 -0
code_puppy/plugins/claude_code_oauth/README.md +167 -0
code_puppy/plugins/claude_code_oauth/SETUP.md +93 -0
code_puppy/plugins/claude_code_oauth/__init__.py +6 -0
code_puppy/plugins/claude_code_oauth/config.py +50 -0
code_puppy/plugins/claude_code_oauth/register_callbacks.py +308 -0
code_puppy/plugins/claude_code_oauth/test_plugin.py +283 -0
code_puppy/plugins/claude_code_oauth/utils.py +518 -0
code_puppy/plugins/customizable_commands/__init__.py +0 -0
code_puppy/plugins/customizable_commands/register_callbacks.py +169 -0
code_puppy/plugins/example_custom_command/README.md +280 -0
code_puppy/plugins/example_custom_command/register_callbacks.py +2 -2
code_puppy/plugins/file_permission_handler/__init__.py +4 -0
code_puppy/plugins/file_permission_handler/register_callbacks.py +523 -0
code_puppy/plugins/frontend_emitter/__init__.py +25 -0
code_puppy/plugins/frontend_emitter/emitter.py +121 -0
code_puppy/plugins/frontend_emitter/register_callbacks.py +261 -0
code_puppy/plugins/oauth_puppy_html.py +228 -0
code_puppy/plugins/shell_safety/__init__.py +6 -0
code_puppy/plugins/shell_safety/agent_shell_safety.py +69 -0
code_puppy/plugins/shell_safety/command_cache.py +156 -0
code_puppy/plugins/shell_safety/register_callbacks.py +202 -0
code_puppy/prompts/antigravity_system_prompt.md +1 -0
code_puppy/prompts/codex_system_prompt.md +310 -0
code_puppy/pydantic_patches.py +131 -0
code_puppy/reopenable_async_client.py +8 -8
code_puppy/round_robin_model.py +9 -12
code_puppy/session_storage.py +2 -1
code_puppy/status_display.py +21 -4
code_puppy/summarization_agent.py +41 -13
code_puppy/terminal_utils.py +418 -0
code_puppy/tools/__init__.py +37 -1
code_puppy/tools/agent_tools.py +536 -52
code_puppy/tools/browser/__init__.py +37 -0
code_puppy/tools/browser/browser_control.py +19 -23
code_puppy/tools/browser/browser_interactions.py +41 -48
code_puppy/tools/browser/browser_locators.py +36 -38
code_puppy/tools/browser/browser_manager.py +316 -0
code_puppy/tools/browser/browser_navigation.py +16 -16
code_puppy/tools/browser/browser_screenshot.py +79 -143
code_puppy/tools/browser/browser_scripts.py +32 -42
code_puppy/tools/browser/browser_workflows.py +44 -27
code_puppy/tools/browser/chromium_terminal_manager.py +259 -0
code_puppy/tools/browser/terminal_command_tools.py +521 -0
code_puppy/tools/browser/terminal_screenshot_tools.py +556 -0
code_puppy/tools/browser/terminal_tools.py +525 -0
code_puppy/tools/command_runner.py +930 -147
code_puppy/tools/common.py +1113 -5
code_puppy/tools/display.py +84 -0
code_puppy/tools/file_modifications.py +288 -89
code_puppy/tools/file_operations.py +226 -154
code_puppy/tools/subagent_context.py +158 -0
code_puppy/uvx_detection.py +242 -0
code_puppy/version_checker.py +30 -11
code_puppy-0.0.366.data/data/code_puppy/models.json +110 -0
code_puppy-0.0.366.data/data/code_puppy/models_dev_api.json +1 -0
{code_puppy-0.0.214.dist-info → code_puppy-0.0.366.dist-info}/METADATA +149 -75
code_puppy-0.0.366.dist-info/RECORD +217 -0
{code_puppy-0.0.214.dist-info → code_puppy-0.0.366.dist-info}/WHEEL +1 -1
code_puppy/command_line/mcp/add_command.py +0 -183
code_puppy/messaging/spinner/textual_spinner.py +0 -106
code_puppy/tools/browser/camoufox_manager.py +0 -216
code_puppy/tools/browser/vqa_agent.py +0 -70
code_puppy/tui/__init__.py +0 -10
code_puppy/tui/app.py +0 -1105
code_puppy/tui/components/__init__.py +0 -21
code_puppy/tui/components/chat_view.py +0 -551
code_puppy/tui/components/command_history_modal.py +0 -218
code_puppy/tui/components/copy_button.py +0 -139
code_puppy/tui/components/custom_widgets.py +0 -63
code_puppy/tui/components/human_input_modal.py +0 -175
code_puppy/tui/components/input_area.py +0 -167
code_puppy/tui/components/sidebar.py +0 -309
code_puppy/tui/components/status_bar.py +0 -185
code_puppy/tui/messages.py +0 -27
code_puppy/tui/models/__init__.py +0 -8
code_puppy/tui/models/chat_message.py +0 -25
code_puppy/tui/models/command_history.py +0 -89
code_puppy/tui/models/enums.py +0 -24
code_puppy/tui/screens/__init__.py +0 -17
code_puppy/tui/screens/autosave_picker.py +0 -175
code_puppy/tui/screens/help.py +0 -130
code_puppy/tui/screens/mcp_install_wizard.py +0 -803
code_puppy/tui/screens/settings.py +0 -306
code_puppy/tui/screens/tools.py +0 -74
code_puppy/tui_state.py +0 -55
code_puppy-0.0.214.data/data/code_puppy/models.json +0 -112
code_puppy-0.0.214.dist-info/RECORD +0 -131
{code_puppy-0.0.214.dist-info → code_puppy-0.0.366.dist-info}/entry_points.txt +0 -0
{code_puppy-0.0.214.dist-info → code_puppy-0.0.366.dist-info}/licenses/LICENSE +0 -0

code_puppy/model_factory.py CHANGED Viewed

@@ -4,33 +4,134 @@ import os
 import pathlib
 from typing import Any, Dict
-import httpx
 from anthropic import AsyncAnthropic
 from openai import AsyncAzureOpenAI
-from pydantic_ai.models.anthropic import AnthropicModel
-from pydantic_ai.models.google import GoogleModel
-from pydantic_ai.models.openai import OpenAIChatModel
+from pydantic_ai.models.anthropic import AnthropicModel, AnthropicModelSettings
+from pydantic_ai.models.openai import (
+    OpenAIChatModel,
+    OpenAIChatModelSettings,
+    OpenAIResponsesModel,
+)
+from pydantic_ai.profiles import ModelProfile
 from pydantic_ai.providers.anthropic import AnthropicProvider
 from pydantic_ai.providers.cerebras import CerebrasProvider
-from pydantic_ai.providers.google import GoogleProvider
 from pydantic_ai.providers.openai import OpenAIProvider
 from pydantic_ai.providers.openrouter import OpenRouterProvider
+from pydantic_ai.settings import ModelSettings
+from code_puppy.gemini_model import GeminiModel
 from code_puppy.messaging import emit_warning
 from . import callbacks
-from .config import EXTRA_MODELS_FILE
-from .http_utils import create_async_client
+from .claude_cache_client import ClaudeCacheAsyncClient, patch_anthropic_client_messages
+from .config import EXTRA_MODELS_FILE, get_value
+from .http_utils import create_async_client, get_cert_bundle_path, get_http2
 from .round_robin_model import RoundRobinModel
-# Environment variables used in this module:
-# - GEMINI_API_KEY: API key for Google's Gemini models. Required when using Gemini models.
-# - OPENAI_API_KEY: API key for OpenAI models. Required when using OpenAI models or custom_openai endpoints.
-# - TOGETHER_AI_KEY: API key for Together AI models. Required when using Together AI models.
-#
-# When using custom endpoints (type: "custom_openai" in models.json):
-# - Environment variables can be referenced in header values by prefixing with $ in models.json.
-#   Example: "X-Api-Key": "$OPENAI_API_KEY" will use the value from os.environ.get("OPENAI_API_KEY")
+logger = logging.getLogger(__name__)
+def get_api_key(env_var_name: str) -> str | None:
+    """Get an API key from config first, then fall back to environment variable.
+    This allows users to set API keys via `/set KIMI_API_KEY=xxx` in addition to
+    setting them as environment variables.
+    Args:
+        env_var_name: The name of the environment variable (e.g., "OPENAI_API_KEY")
+    Returns:
+        The API key value, or None if not found in either config or environment.
+    """
+    # First check config (case-insensitive key lookup)
+    config_value = get_value(env_var_name.lower())
+    if config_value:
+        return config_value
+    # Fall back to environment variable
+    return os.environ.get(env_var_name)
+def make_model_settings(
+    model_name: str, max_tokens: int | None = None
+) -> ModelSettings:
+    """Create appropriate ModelSettings for a given model.
+    This handles model-specific settings:
+    - GPT-5 models: reasoning_effort and verbosity (non-codex only)
+    - Claude/Anthropic models: extended_thinking and budget_tokens
+    - Automatic max_tokens calculation based on model context length
+    Args:
+        model_name: The name of the model to create settings for.
+        max_tokens: Optional max tokens limit. If None, automatically calculated
+            as: max(2048, min(15% of context_length, 65536))
+    Returns:
+        Appropriate ModelSettings subclass instance for the model.
+    """
+    from code_puppy.config import (
+        get_effective_model_settings,
+        get_openai_reasoning_effort,
+        get_openai_verbosity,
+    )
+    model_settings_dict: dict = {}
+    # Calculate max_tokens if not explicitly provided
+    if max_tokens is None:
+        # Load model config to get context length
+        try:
+            models_config = ModelFactory.load_config()
+            model_config = models_config.get(model_name, {})
+            context_length = model_config.get("context_length", 128000)
+        except Exception:
+            # Fallback if config loading fails (e.g., in CI environments)
+            context_length = 128000
+        # min 2048, 15% of context, max 65536
+        max_tokens = max(2048, min(int(0.15 * context_length), 65536))
+    model_settings_dict["max_tokens"] = max_tokens
+    effective_settings = get_effective_model_settings(model_name)
+    model_settings_dict.update(effective_settings)
+    # Default to clear_thinking=False for GLM-4.7 models (preserved thinking)
+    if "glm-4.7" in model_name.lower():
+        clear_thinking = effective_settings.get("clear_thinking", False)
+        model_settings_dict["thinking"] = {
+            "type": "enabled",
+            "clear_thinking": clear_thinking,
+        }
+    model_settings: ModelSettings = ModelSettings(**model_settings_dict)
+    if "gpt-5" in model_name:
+        model_settings_dict["openai_reasoning_effort"] = get_openai_reasoning_effort()
+        # Verbosity only applies to non-codex GPT-5 models (codex only supports "medium")
+        if "codex" not in model_name:
+            verbosity = get_openai_verbosity()
+            model_settings_dict["extra_body"] = {"verbosity": verbosity}
+        model_settings = OpenAIChatModelSettings(**model_settings_dict)
+    elif model_name.startswith("claude-") or model_name.startswith("anthropic-"):
+        # Handle Anthropic extended thinking settings
+        # Remove top_p as Anthropic doesn't support it with extended thinking
+        model_settings_dict.pop("top_p", None)
+        # Claude extended thinking requires temperature=1.0 (API restriction)
+        # Default to 1.0 if not explicitly set by user
+        if model_settings_dict.get("temperature") is None:
+            model_settings_dict["temperature"] = 1.0
+        extended_thinking = effective_settings.get("extended_thinking", True)
+        budget_tokens = effective_settings.get("budget_tokens", 10000)
+        if extended_thinking and budget_tokens:
+            model_settings_dict["anthropic_thinking"] = {
+                "type": "enabled",
+                "budget_tokens": budget_tokens,
+            }
+        model_settings = AnthropicModelSettings(**model_settings_dict)
+    return model_settings
 class ZaiChatModel(OpenAIChatModel):
@@ -52,10 +153,10 @@ def get_custom_config(model_config):
     for key, value in custom_config.get("headers", {}).items():
         if value.startswith("$"):
             env_var_name = value[1:]
-            resolved_value = os.environ.get(env_var_name)
+            resolved_value = get_api_key(env_var_name)
             if resolved_value is None:
                 emit_warning(
-                    f"Environment variable '{env_var_name}' is not set for custom endpoint header '{key}'. Proceeding with empty value."
+                    f"'{env_var_name}' is not set (check config or environment) for custom endpoint header '{key}'. Proceeding with empty value."
                 )
                 resolved_value = ""
             value = resolved_value
@@ -65,10 +166,10 @@ def get_custom_config(model_config):
             for token in tokens:
                 if token.startswith("$"):
                     env_var = token[1:]
-                    resolved_value = os.environ.get(env_var)
+                    resolved_value = get_api_key(env_var)
                     if resolved_value is None:
                         emit_warning(
-                            f"Environment variable '{env_var}' is not set for custom endpoint header '{key}'. Proceeding with empty value."
+                            f"'{env_var}' is not set (check config or environment) for custom endpoint header '{key}'. Proceeding with empty value."
                         )
                         resolved_values.append("")
                     else:
@@ -81,10 +182,10 @@ def get_custom_config(model_config):
     if "api_key" in custom_config:
         if custom_config["api_key"].startswith("$"):
             env_var_name = custom_config["api_key"][1:]
-            api_key = os.environ.get(env_var_name)
+            api_key = get_api_key(env_var_name)
             if api_key is None:
                 emit_warning(
-                    f"Environment variable '{env_var_name}' is not set for custom endpoint API key; proceeding without API key."
+                    f"API key '{env_var_name}' is not set (checked config and environment); proceeding without API key."
                 )
         else:
             api_key = custom_config["api_key"]
@@ -117,26 +218,63 @@ class ModelFactory:
             with open(MODELS_FILE, "r") as f:
                 config = json.load(f)
-        if pathlib.Path(EXTRA_MODELS_FILE).exists():
+        # Import OAuth model file paths from main config
+        from code_puppy.config import (
+            ANTIGRAVITY_MODELS_FILE,
+            CHATGPT_MODELS_FILE,
+            CLAUDE_MODELS_FILE,
+            GEMINI_MODELS_FILE,
+        )
+        # Build list of extra model sources
+        extra_sources: list[tuple[pathlib.Path, str, bool]] = [
+            (pathlib.Path(EXTRA_MODELS_FILE), "extra models", False),
+            (pathlib.Path(CHATGPT_MODELS_FILE), "ChatGPT OAuth models", False),
+            (pathlib.Path(CLAUDE_MODELS_FILE), "Claude Code OAuth models", True),
+            (pathlib.Path(GEMINI_MODELS_FILE), "Gemini OAuth models", False),
+            (pathlib.Path(ANTIGRAVITY_MODELS_FILE), "Antigravity OAuth models", False),
+        ]
+        for source_path, label, use_filtered in extra_sources:
+            if not source_path.exists():
+                continue
             try:
-                with open(EXTRA_MODELS_FILE, "r") as f:
-                    extra_config = json.load(f)
-                    config.update(extra_config)
-            except json.JSONDecodeError as e:
+                # Use filtered loading for Claude Code OAuth models to show only latest versions
+                if use_filtered:
+                    try:
+                        from code_puppy.plugins.claude_code_oauth.utils import (
+                            load_claude_models_filtered,
+                        )
+                        extra_config = load_claude_models_filtered()
+                    except ImportError:
+                        # Plugin not available, fall back to standard JSON loading
+                        logging.getLogger(__name__).debug(
+                            f"claude_code_oauth plugin not available, loading {label} as plain JSON"
+                        )
+                        with open(source_path, "r") as f:
+                            extra_config = json.load(f)
+                else:
+                    with open(source_path, "r") as f:
+                        extra_config = json.load(f)
+                config.update(extra_config)
+            except json.JSONDecodeError as exc:
                 logging.getLogger(__name__).warning(
-                    f"Failed to load extra models config from {EXTRA_MODELS_FILE}: Invalid JSON - {e}\n"
-                    f"Please check your extra_models.json file for syntax errors."
+                    f"Failed to load {label} config from {source_path}: Invalid JSON - {exc}"
                 )
-            except Exception as e:
+            except Exception as exc:
                 logging.getLogger(__name__).warning(
-                    f"Failed to load extra models config from {EXTRA_MODELS_FILE}: {e}\n"
-                    f"The extra models configuration will be ignored."
+                    f"Failed to load {label} config from {source_path}: {exc}"
                 )
         return config
     @staticmethod
     def get_model(model_name: str, config: Dict[str, Any]) -> Any:
-        """Returns a configured model instance based on the provided name and config."""
+        """Returns a configured model instance based on the provided name and config.
+        API key validation happens naturally within each model type's initialization,
+        which emits warnings and returns None if keys are missing.
+        """
         model_config = config.get(model_name)
         if not model_config:
             raise ValueError(f"Model '{model_name}' not found in configuration.")
@@ -144,41 +282,189 @@ class ModelFactory:
         model_type = model_config.get("type")
         if model_type == "gemini":
-            provider = GoogleProvider(api_key=os.environ.get("GEMINI_API_KEY", ""))
+            api_key = get_api_key("GEMINI_API_KEY")
+            if not api_key:
+                emit_warning(
+                    f"GEMINI_API_KEY is not set (check config or environment); skipping Gemini model '{model_config.get('name')}'."
+                )
+                return None
-            model = GoogleModel(model_name=model_config["name"], provider=provider)
-            setattr(model, "provider", provider)
+            model = GeminiModel(model_name=model_config["name"], api_key=api_key)
             return model
         elif model_type == "openai":
-            provider = OpenAIProvider(api_key=os.environ.get("OPENAI_API_KEY", ""))
+            api_key = get_api_key("OPENAI_API_KEY")
+            if not api_key:
+                emit_warning(
+                    f"OPENAI_API_KEY is not set (check config or environment); skipping OpenAI model '{model_config.get('name')}'."
+                )
+                return None
+            provider = OpenAIProvider(api_key=api_key)
             model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
+            if "codex" in model_name:
+                model = OpenAIResponsesModel(
+                    model_name=model_config["name"], provider=provider
+                )
             setattr(model, "provider", provider)
             return model
         elif model_type == "anthropic":
-            api_key = os.environ.get("ANTHROPIC_API_KEY", None)
+            api_key = get_api_key("ANTHROPIC_API_KEY")
             if not api_key:
                 emit_warning(
-                    f"ANTHROPIC_API_KEY is not set; skipping Anthropic model '{model_config.get('name')}'."
+                    f"ANTHROPIC_API_KEY is not set (check config or environment); skipping Anthropic model '{model_config.get('name')}'."
                 )
                 return None
-            anthropic_client = AsyncAnthropic(api_key=api_key)
+            # Use the same caching client as claude_code models
+            verify = get_cert_bundle_path()
+            http2_enabled = get_http2()
+            client = ClaudeCacheAsyncClient(
+                verify=verify,
+                timeout=180,
+                http2=http2_enabled,
+            )
+            # Check if interleaved thinking is enabled for this model
+            # Only applies to Claude 4 models (Opus 4.5, Opus 4.1, Opus 4, Sonnet 4)
+            from code_puppy.config import get_effective_model_settings
+            effective_settings = get_effective_model_settings(model_name)
+            interleaved_thinking = effective_settings.get("interleaved_thinking", False)
+            default_headers = {}
+            if interleaved_thinking:
+                default_headers["anthropic-beta"] = "interleaved-thinking-2025-05-14"
+            anthropic_client = AsyncAnthropic(
+                api_key=api_key,
+                http_client=client,
+                default_headers=default_headers if default_headers else None,
+            )
+            # Ensure cache_control is injected at the Anthropic SDK layer
+            patch_anthropic_client_messages(anthropic_client)
             provider = AnthropicProvider(anthropic_client=anthropic_client)
             return AnthropicModel(model_name=model_config["name"], provider=provider)
         elif model_type == "custom_anthropic":
             url, headers, verify, api_key = get_custom_config(model_config)
-            client = create_async_client(headers=headers, verify=verify)
+            if not api_key:
+                emit_warning(
+                    f"API key is not set for custom Anthropic endpoint; skipping model '{model_config.get('name')}'."
+                )
+                return None
+            # Use the same caching client as claude_code models
+            if verify is None:
+                verify = get_cert_bundle_path()
+            http2_enabled = get_http2()
+            client = ClaudeCacheAsyncClient(
+                headers=headers,
+                verify=verify,
+                timeout=180,
+                http2=http2_enabled,
+            )
+            # Check if interleaved thinking is enabled for this model
+            from code_puppy.config import get_effective_model_settings
+            effective_settings = get_effective_model_settings(model_name)
+            interleaved_thinking = effective_settings.get("interleaved_thinking", False)
+            default_headers = {}
+            if interleaved_thinking:
+                default_headers["anthropic-beta"] = "interleaved-thinking-2025-05-14"
             anthropic_client = AsyncAnthropic(
                 base_url=url,
                 http_client=client,
                 api_key=api_key,
+                default_headers=default_headers if default_headers else None,
             )
+            # Ensure cache_control is injected at the Anthropic SDK layer
+            patch_anthropic_client_messages(anthropic_client)
             provider = AnthropicProvider(anthropic_client=anthropic_client)
             return AnthropicModel(model_name=model_config["name"], provider=provider)
+        elif model_type == "claude_code":
+            url, headers, verify, api_key = get_custom_config(model_config)
+            if model_config.get("oauth_source") == "claude-code-plugin":
+                try:
+                    from code_puppy.plugins.claude_code_oauth.utils import (
+                        get_valid_access_token,
+                    )
+                    refreshed_token = get_valid_access_token()
+                    if refreshed_token:
+                        api_key = refreshed_token
+                        custom_endpoint = model_config.get("custom_endpoint")
+                        if isinstance(custom_endpoint, dict):
+                            custom_endpoint["api_key"] = refreshed_token
+                except ImportError:
+                    pass
+            if not api_key:
+                emit_warning(
+                    f"API key is not set for Claude Code endpoint; skipping model '{model_config.get('name')}'."
+                )
+                return None
+            # Check if interleaved thinking is enabled (defaults to True for OAuth models)
+            from code_puppy.config import get_effective_model_settings
+            effective_settings = get_effective_model_settings(model_name)
+            interleaved_thinking = effective_settings.get("interleaved_thinking", True)
+            # Handle anthropic-beta header based on interleaved_thinking setting
+            if "anthropic-beta" in headers:
+                beta_parts = [p.strip() for p in headers["anthropic-beta"].split(",")]
+                if interleaved_thinking:
+                    # Ensure interleaved-thinking is in the header
+                    if "interleaved-thinking-2025-05-14" not in beta_parts:
+                        beta_parts.append("interleaved-thinking-2025-05-14")
+                else:
+                    # Remove interleaved-thinking from the header
+                    beta_parts = [
+                        p for p in beta_parts if "interleaved-thinking" not in p
+                    ]
+                headers["anthropic-beta"] = ",".join(beta_parts) if beta_parts else None
+                if headers.get("anthropic-beta") is None:
+                    del headers["anthropic-beta"]
+            elif interleaved_thinking:
+                # No existing beta header, add one for interleaved thinking
+                headers["anthropic-beta"] = "interleaved-thinking-2025-05-14"
+            # Use a dedicated client wrapper that injects cache_control on /v1/messages
+            if verify is None:
+                verify = get_cert_bundle_path()
+            http2_enabled = get_http2()
+            client = ClaudeCacheAsyncClient(
+                headers=headers,
+                verify=verify,
+                timeout=180,
+                http2=http2_enabled,
+            )
+            anthropic_client = AsyncAnthropic(
+                base_url=url,
+                http_client=client,
+                auth_token=api_key,
+            )
+            # Ensure cache_control is injected at the Anthropic SDK layer too
+            # so we don't depend solely on httpx internals.
+            patch_anthropic_client_messages(anthropic_client)
+            anthropic_client.api_key = None
+            anthropic_client.auth_token = api_key
+            provider = AnthropicProvider(anthropic_client=anthropic_client)
+            return AnthropicModel(model_name=model_config["name"], provider=provider)
         elif model_type == "azure_openai":
             azure_endpoint_config = model_config.get("azure_endpoint")
             if not azure_endpoint_config:
@@ -187,10 +473,10 @@ class ModelFactory:
                 )
             azure_endpoint = azure_endpoint_config
             if azure_endpoint_config.startswith("$"):
-                azure_endpoint = os.environ.get(azure_endpoint_config[1:])
+                azure_endpoint = get_api_key(azure_endpoint_config[1:])
             if not azure_endpoint:
                 emit_warning(
-                    f"Azure OpenAI endpoint environment variable '{azure_endpoint_config[1:] if azure_endpoint_config.startswith('$') else azure_endpoint_config}' not found or is empty; skipping model '{model_config.get('name')}'."
+                    f"Azure OpenAI endpoint '{azure_endpoint_config[1:] if azure_endpoint_config.startswith('$') else azure_endpoint_config}' not found (check config or environment); skipping model '{model_config.get('name')}'."
                 )
                 return None
@@ -201,10 +487,10 @@ class ModelFactory:
                 )
             api_version = api_version_config
             if api_version_config.startswith("$"):
-                api_version = os.environ.get(api_version_config[1:])
+                api_version = get_api_key(api_version_config[1:])
             if not api_version:
                 emit_warning(
-                    f"Azure OpenAI API version environment variable '{api_version_config[1:] if api_version_config.startswith('$') else api_version_config}' not found or is empty; skipping model '{model_config.get('name')}'."
+                    f"Azure OpenAI API version '{api_version_config[1:] if api_version_config.startswith('$') else api_version_config}' not found (check config or environment); skipping model '{model_config.get('name')}'."
                 )
                 return None
@@ -215,10 +501,10 @@ class ModelFactory:
                 )
             api_key = api_key_config
             if api_key_config.startswith("$"):
-                api_key = os.environ.get(api_key_config[1:])
+                api_key = get_api_key(api_key_config[1:])
             if not api_key:
                 emit_warning(
-                    f"Azure OpenAI API key environment variable '{api_key_config[1:] if api_key_config.startswith('$') else api_key_config}' not found or is empty; skipping model '{model_config.get('name')}'."
+                    f"Azure OpenAI API key '{api_key_config[1:] if api_key_config.startswith('$') else api_key_config}' not found (check config or environment); skipping model '{model_config.get('name')}'."
                 )
                 return None
@@ -246,71 +532,193 @@ class ModelFactory:
             if api_key:
                 provider_args["api_key"] = api_key
             provider = OpenAIProvider(**provider_args)
             model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
+            if model_name == "chatgpt-gpt-5-codex":
+                model = OpenAIResponsesModel(model_config["name"], provider=provider)
             setattr(model, "provider", provider)
             return model
         elif model_type == "zai_coding":
-            api_key = os.getenv("ZAI_API_KEY")
+            api_key = get_api_key("ZAI_API_KEY")
             if not api_key:
                 emit_warning(
-                    f"ZAI_API_KEY is not set; skipping ZAI coding model '{model_config.get('name')}'."
+                    f"ZAI_API_KEY is not set (check config or environment); skipping ZAI coding model '{model_config.get('name')}'."
                 )
                 return None
+            provider = OpenAIProvider(
+                api_key=api_key,
+                base_url="https://api.z.ai/api/coding/paas/v4",
+            )
             zai_model = ZaiChatModel(
                 model_name=model_config["name"],
-                provider=OpenAIProvider(
-                    api_key=api_key,
-                    base_url="https://api.z.ai/api/coding/paas/v4",
-                ),
+                provider=provider,
             )
+            setattr(zai_model, "provider", provider)
             return zai_model
         elif model_type == "zai_api":
-            api_key = os.getenv("ZAI_API_KEY")
+            api_key = get_api_key("ZAI_API_KEY")
             if not api_key:
                 emit_warning(
-                    f"ZAI_API_KEY is not set; skipping ZAI API model '{model_config.get('name')}'."
+                    f"ZAI_API_KEY is not set (check config or environment); skipping ZAI API model '{model_config.get('name')}'."
                 )
                 return None
+            provider = OpenAIProvider(
+                api_key=api_key,
+                base_url="https://api.z.ai/api/paas/v4/",
+            )
             zai_model = ZaiChatModel(
                 model_name=model_config["name"],
-                provider=OpenAIProvider(
-                    api_key=api_key,
-                    base_url="https://api.z.ai/api/paas/v4/",
-                ),
+                provider=provider,
             )
+            setattr(zai_model, "provider", provider)
             return zai_model
         elif model_type == "custom_gemini":
             url, headers, verify, api_key = get_custom_config(model_config)
-            os.environ["GEMINI_API_KEY"] = api_key
+            if not api_key:
+                emit_warning(
+                    f"API key is not set for custom Gemini endpoint; skipping model '{model_config.get('name')}'."
+                )
+                return None
-            class CustomGoogleGLAProvider(GoogleProvider):
-                def __init__(self, *args, **kwargs):
-                    super().__init__(*args, **kwargs)
+            # Check if this is an Antigravity model
+            if model_config.get("antigravity"):
+                try:
+                    from code_puppy.plugins.antigravity_oauth.token import (
+                        is_token_expired,
+                        refresh_access_token,
+                    )
+                    from code_puppy.plugins.antigravity_oauth.transport import (
+                        create_antigravity_client,
+                    )
+                    from code_puppy.plugins.antigravity_oauth.utils import (
+                        load_stored_tokens,
+                        save_tokens,
+                    )
+                    # Try to import custom model for thinking signatures
+                    try:
+                        from code_puppy.plugins.antigravity_oauth.antigravity_model import (
+                            AntigravityModel,
+                        )
+                    except ImportError:
+                        AntigravityModel = None
-                @property
-                def base_url(self):
-                    return url
+                    # Get fresh access token (refresh if needed)
+                    tokens = load_stored_tokens()
+                    if not tokens:
+                        emit_warning(
+                            "Antigravity tokens not found; run /antigravity-auth first."
+                        )
+                        return None
+                    access_token = tokens.get("access_token", "")
+                    refresh_token = tokens.get("refresh_token", "")
+                    expires_at = tokens.get("expires_at")
+                    # Refresh if expired or about to expire (initial check)
+                    if is_token_expired(expires_at):
+                        new_tokens = refresh_access_token(refresh_token)
+                        if new_tokens:
+                            access_token = new_tokens.access_token
+                            refresh_token = new_tokens.refresh_token
+                            expires_at = new_tokens.expires_at
+                            tokens["access_token"] = new_tokens.access_token
+                            tokens["refresh_token"] = new_tokens.refresh_token
+                            tokens["expires_at"] = new_tokens.expires_at
+                            save_tokens(tokens)
+                        else:
+                            emit_warning(
+                                "Failed to refresh Antigravity token; run /antigravity-auth again."
+                            )
+                            return None
+                    # Callback to persist tokens when proactively refreshed during session
+                    def on_token_refreshed(new_tokens):
+                        """Persist new tokens when proactively refreshed."""
+                        # new_tokens is read through its .access_token, .refresh_token
+                        # and .expires_at attributes; its concrete type is not visible here.
+                        try:
+                            # Re-read the token store (falling back to an empty dict)
+                            # instead of reusing the enclosing `tokens`; only the three
+                            # fields below are overwritten, and any other keys in the
+                            # loaded dict are handed to save_tokens unchanged.
+                            updated_tokens = load_stored_tokens() or {}
+                            updated_tokens["access_token"] = new_tokens.access_token
+                            updated_tokens["refresh_token"] = new_tokens.refresh_token
+                            updated_tokens["expires_at"] = new_tokens.expires_at
+                            save_tokens(updated_tokens)
+                            logger.debug(
+                                "Persisted proactively refreshed Antigravity tokens"
+                            )
+                        except Exception as e:
+                            # Best-effort: any failure while loading or saving is logged
+                            # at warning level and not re-raised to the caller.
+                            logger.warning("Failed to persist refreshed tokens: %s", e)
+                    project_id = tokens.get(
+                        "project_id", model_config.get("project_id", "")
+                    )
+                    client = create_antigravity_client(
+                        access_token=access_token,
+                        project_id=project_id,
+                        model_name=model_config["name"],
+                        base_url=url,
+                        headers=headers,
+                        refresh_token=refresh_token,
+                        expires_at=expires_at,
+                        on_token_refreshed=on_token_refreshed,
+                    )
+                    # Use custom model with direct httpx client
+                    if AntigravityModel:
+                        model = AntigravityModel(
+                            model_name=model_config["name"],
+                            api_key=api_key
+                            or "",  # Antigravity uses OAuth, key may be empty
+                            base_url=url,
+                            http_client=client,
+                        )
+                    else:
+                        model = GeminiModel(
+                            model_name=model_config["name"],
+                            api_key=api_key or "",
+                            base_url=url,
+                            http_client=client,
+                        )
-                @property
-                def client(self) -> httpx.AsyncClient:
-                    _client = create_async_client(headers=headers, verify=verify)
-                    _client.base_url = self.base_url
-                    return _client
+                    return model
+                except ImportError:
+                    emit_warning(
+                        f"Antigravity transport not available; skipping model '{model_config.get('name')}'."
+                    )
+                    return None
+            else:
+                client = create_async_client(headers=headers, verify=verify)
-            google_gla = CustomGoogleGLAProvider(api_key=api_key)
-            model = GoogleModel(model_name=model_config["name"], provider=google_gla)
+            model = GeminiModel(
+                model_name=model_config["name"],
+                api_key=api_key,
+                base_url=url,
+                http_client=client,
+            )
             return model
         elif model_type == "cerebras":
+            # CerebrasProvider subclass that overrides model_profile so that model
+            # names starting with "zai" get the qwen-3-coder profile merged onto the
+            # base provider's profile; all other names use the base profile as-is.
+            class ZaiCerebrasProvider(CerebrasProvider):
+                def model_profile(self, model_name: str) -> ModelProfile | None:
+                    profile = super().model_profile(model_name)
+                    # Prefix match is case-sensitive (plain str.startswith).
+                    if model_name.startswith("zai"):
+                        # Imported lazily, only when a "zai" model is requested.
+                        from pydantic_ai.profiles.qwen import qwen_model_profile
+                        # NOTE(review): update() is called without a None check even
+                        # though the return annotation allows None - confirm the base
+                        # model_profile never returns None for these names.
+                        profile = profile.update(qwen_model_profile("qwen-3-coder"))
+                    return profile
             url, headers, verify, api_key = get_custom_config(model_config)
+            if not api_key:
+                emit_warning(
+                    f"API key is not set for Cerebras endpoint; skipping model '{model_config.get('name')}'."
+                )
+                return None
+            # Add Cerebras 3rd party integration header
+            headers["X-Cerebras-3rd-Party-Integration"] = "code-puppy"
             client = create_async_client(headers=headers, verify=verify)
             provider_args = dict(
                 api_key=api_key,
                 http_client=client,
             )
-            if api_key:
-                provider_args["api_key"] = api_key
-            provider = CerebrasProvider(**provider_args)
+            provider = ZaiCerebrasProvider(**provider_args)
             model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
             setattr(model, "provider", provider)
@@ -325,17 +733,23 @@ class ModelFactory:
                 if api_key_config.startswith("$"):
                     # It's an environment variable reference
                     env_var_name = api_key_config[1:]  # Remove the $ prefix
-                    api_key = os.environ.get(env_var_name)
+                    api_key = get_api_key(env_var_name)
                     if api_key is None:
                         emit_warning(
-                            f"OpenRouter API key environment variable '{env_var_name}' not found or is empty; proceeding without API key."
+                            f"OpenRouter API key '{env_var_name}' not found (check config or environment); skipping model '{model_config.get('name')}'."
                         )
-                    else:
-                        # It's a raw API key value
-                        api_key = api_key_config
+                        return None
+                else:
+                    # It's a raw API key value
+                    api_key = api_key_config
             else:
-                # No API key in config, try to get it from the default environment variable
-                api_key = os.environ.get("OPENROUTER_API_KEY")
+                # No API key in config, try to get it from config or the default environment variable
+                api_key = get_api_key("OPENROUTER_API_KEY")
+                if api_key is None:
+                    emit_warning(
+                        f"OPENROUTER_API_KEY is not set (check config or environment); skipping OpenRouter model '{model_config.get('name')}'."
+                    )
+                    return None
             provider = OpenRouterProvider(api_key=api_key)
@@ -343,6 +757,143 @@ class ModelFactory:
             setattr(model, "provider", provider)
             return model
+        elif model_type == "gemini_oauth":
+            # Gemini OAuth models use the Code Assist API (cloudcode-pa.googleapis.com)
+            # This is a different API than the standard Generative Language API
+            try:
+                # Try user plugin first, then built-in plugin
+                try:
+                    from gemini_oauth.config import GEMINI_OAUTH_CONFIG
+                    from gemini_oauth.utils import (
+                        get_project_id,
+                        get_valid_access_token,
+                    )
+                except ImportError:
+                    from code_puppy.plugins.gemini_oauth.config import (
+                        GEMINI_OAUTH_CONFIG,
+                    )
+                    from code_puppy.plugins.gemini_oauth.utils import (
+                        get_project_id,
+                        get_valid_access_token,
+                    )
+            except ImportError as exc:
+                emit_warning(
+                    f"Gemini OAuth plugin not available; skipping model '{model_config.get('name')}'. "
+                    f"Error: {exc}"
+                )
+                return None
+            # Get a valid access token (refreshing if needed)
+            access_token = get_valid_access_token()
+            if not access_token:
+                emit_warning(
+                    f"Failed to get valid Gemini OAuth token; skipping model '{model_config.get('name')}'. "
+                    "Run /gemini-auth to re-authenticate."
+                )
+                return None
+            # Get project ID from stored tokens
+            project_id = get_project_id()
+            if not project_id:
+                emit_warning(
+                    f"No Code Assist project ID found; skipping model '{model_config.get('name')}'. "
+                    "Run /gemini-auth to re-authenticate."
+                )
+                return None
+            # Import the Code Assist model wrapper
+            from code_puppy.gemini_code_assist import GeminiCodeAssistModel
+            # Create the Code Assist model
+            model = GeminiCodeAssistModel(
+                model_name=model_config["name"],
+                access_token=access_token,
+                project_id=project_id,
+                api_base_url=GEMINI_OAUTH_CONFIG["api_base_url"],
+                api_version=GEMINI_OAUTH_CONFIG["api_version"],
+            )
+            return model
+        elif model_type == "chatgpt_oauth":
+            # ChatGPT OAuth models use the Codex API at chatgpt.com
+            try:
+                try:
+                    from chatgpt_oauth.config import CHATGPT_OAUTH_CONFIG
+                    from chatgpt_oauth.utils import (
+                        get_valid_access_token,
+                        load_stored_tokens,
+                    )
+                except ImportError:
+                    from code_puppy.plugins.chatgpt_oauth.config import (
+                        CHATGPT_OAUTH_CONFIG,
+                    )
+                    from code_puppy.plugins.chatgpt_oauth.utils import (
+                        get_valid_access_token,
+                        load_stored_tokens,
+                    )
+            except ImportError as exc:
+                emit_warning(
+                    f"ChatGPT OAuth plugin not available; skipping model '{model_config.get('name')}'. "
+                    f"Error: {exc}"
+                )
+                return None
+            # Get a valid access token (refreshing if needed)
+            access_token = get_valid_access_token()
+            if not access_token:
+                emit_warning(
+                    f"Failed to get valid ChatGPT OAuth token; skipping model '{model_config.get('name')}'. "
+                    "Run /chatgpt-auth to authenticate."
+                )
+                return None
+            # Get account_id from stored tokens (required for ChatGPT-Account-Id header)
+            tokens = load_stored_tokens()
+            account_id = tokens.get("account_id", "") if tokens else ""
+            if not account_id:
+                emit_warning(
+                    f"No account_id found in ChatGPT OAuth tokens; skipping model '{model_config.get('name')}'. "
+                    "Run /chatgpt-auth to re-authenticate."
+                )
+                return None
+            # Build headers for ChatGPT Codex API
+            originator = CHATGPT_OAUTH_CONFIG.get("originator", "codex_cli_rs")
+            client_version = CHATGPT_OAUTH_CONFIG.get("client_version", "0.72.0")
+            headers = {
+                "ChatGPT-Account-Id": account_id,
+                "originator": originator,
+                "User-Agent": f"{originator}/{client_version}",
+            }
+            # Merge with any headers from model config
+            config_headers = model_config.get("custom_endpoint", {}).get("headers", {})
+            headers.update(config_headers)
+            # Get base URL - Codex API uses chatgpt.com, not api.openai.com
+            base_url = model_config.get("custom_endpoint", {}).get(
+                "url", CHATGPT_OAUTH_CONFIG["api_base_url"]
+            )
+            # Create HTTP client with Codex interceptor for store=false injection
+            from code_puppy.chatgpt_codex_client import create_codex_async_client
+            verify = get_cert_bundle_path()
+            client = create_codex_async_client(headers=headers, verify=verify)
+            provider = OpenAIProvider(
+                api_key=access_token,
+                base_url=base_url,
+                http_client=client,
+            )
+            # ChatGPT Codex API only supports Responses format
+            model = OpenAIResponsesModel(
+                model_name=model_config["name"], provider=provider
+            )
+            setattr(model, "provider", provider)
+            return model
         elif model_type == "round_robin":
             # Get the list of model names to use in the round-robin
             model_names = model_config.get("models")

code-puppy 0.0.214__py3-none-any.whl → 0.0.366__py3-none-any.whl

code-puppy 0.0.214py3-none-any.whl → 0.0.366py3-none-any.whl