codepp 0.0.437__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- code_puppy/__init__.py +10 -0
- code_puppy/__main__.py +10 -0
- code_puppy/agents/__init__.py +31 -0
- code_puppy/agents/agent_c_reviewer.py +155 -0
- code_puppy/agents/agent_code_puppy.py +117 -0
- code_puppy/agents/agent_code_reviewer.py +90 -0
- code_puppy/agents/agent_cpp_reviewer.py +132 -0
- code_puppy/agents/agent_creator_agent.py +638 -0
- code_puppy/agents/agent_golang_reviewer.py +151 -0
- code_puppy/agents/agent_helios.py +124 -0
- code_puppy/agents/agent_javascript_reviewer.py +160 -0
- code_puppy/agents/agent_manager.py +742 -0
- code_puppy/agents/agent_pack_leader.py +385 -0
- code_puppy/agents/agent_planning.py +165 -0
- code_puppy/agents/agent_python_programmer.py +169 -0
- code_puppy/agents/agent_python_reviewer.py +90 -0
- code_puppy/agents/agent_qa_expert.py +163 -0
- code_puppy/agents/agent_qa_kitten.py +208 -0
- code_puppy/agents/agent_scheduler.py +121 -0
- code_puppy/agents/agent_security_auditor.py +181 -0
- code_puppy/agents/agent_terminal_qa.py +323 -0
- code_puppy/agents/agent_typescript_reviewer.py +166 -0
- code_puppy/agents/base_agent.py +2156 -0
- code_puppy/agents/event_stream_handler.py +348 -0
- code_puppy/agents/json_agent.py +202 -0
- code_puppy/agents/pack/__init__.py +34 -0
- code_puppy/agents/pack/bloodhound.py +304 -0
- code_puppy/agents/pack/husky.py +327 -0
- code_puppy/agents/pack/retriever.py +393 -0
- code_puppy/agents/pack/shepherd.py +348 -0
- code_puppy/agents/pack/terrier.py +287 -0
- code_puppy/agents/pack/watchdog.py +367 -0
- code_puppy/agents/prompt_reviewer.py +145 -0
- code_puppy/agents/subagent_stream_handler.py +276 -0
- code_puppy/api/__init__.py +13 -0
- code_puppy/api/app.py +169 -0
- code_puppy/api/main.py +21 -0
- code_puppy/api/pty_manager.py +453 -0
- code_puppy/api/routers/__init__.py +12 -0
- code_puppy/api/routers/agents.py +36 -0
- code_puppy/api/routers/commands.py +217 -0
- code_puppy/api/routers/config.py +75 -0
- code_puppy/api/routers/sessions.py +234 -0
- code_puppy/api/templates/terminal.html +361 -0
- code_puppy/api/websocket.py +154 -0
- code_puppy/callbacks.py +692 -0
- code_puppy/chatgpt_codex_client.py +338 -0
- code_puppy/claude_cache_client.py +672 -0
- code_puppy/cli_runner.py +1073 -0
- code_puppy/command_line/__init__.py +1 -0
- code_puppy/command_line/add_model_menu.py +1092 -0
- code_puppy/command_line/agent_menu.py +662 -0
- code_puppy/command_line/attachments.py +395 -0
- code_puppy/command_line/autosave_menu.py +704 -0
- code_puppy/command_line/clipboard.py +527 -0
- code_puppy/command_line/colors_menu.py +532 -0
- code_puppy/command_line/command_handler.py +293 -0
- code_puppy/command_line/command_registry.py +150 -0
- code_puppy/command_line/config_commands.py +719 -0
- code_puppy/command_line/core_commands.py +867 -0
- code_puppy/command_line/diff_menu.py +865 -0
- code_puppy/command_line/file_path_completion.py +73 -0
- code_puppy/command_line/load_context_completion.py +52 -0
- code_puppy/command_line/mcp/__init__.py +10 -0
- code_puppy/command_line/mcp/base.py +32 -0
- code_puppy/command_line/mcp/catalog_server_installer.py +175 -0
- code_puppy/command_line/mcp/custom_server_form.py +688 -0
- code_puppy/command_line/mcp/custom_server_installer.py +195 -0
- code_puppy/command_line/mcp/edit_command.py +148 -0
- code_puppy/command_line/mcp/handler.py +138 -0
- code_puppy/command_line/mcp/help_command.py +147 -0
- code_puppy/command_line/mcp/install_command.py +214 -0
- code_puppy/command_line/mcp/install_menu.py +705 -0
- code_puppy/command_line/mcp/list_command.py +94 -0
- code_puppy/command_line/mcp/logs_command.py +235 -0
- code_puppy/command_line/mcp/remove_command.py +82 -0
- code_puppy/command_line/mcp/restart_command.py +100 -0
- code_puppy/command_line/mcp/search_command.py +123 -0
- code_puppy/command_line/mcp/start_all_command.py +135 -0
- code_puppy/command_line/mcp/start_command.py +117 -0
- code_puppy/command_line/mcp/status_command.py +184 -0
- code_puppy/command_line/mcp/stop_all_command.py +112 -0
- code_puppy/command_line/mcp/stop_command.py +80 -0
- code_puppy/command_line/mcp/test_command.py +107 -0
- code_puppy/command_line/mcp/utils.py +129 -0
- code_puppy/command_line/mcp/wizard_utils.py +334 -0
- code_puppy/command_line/mcp_completion.py +174 -0
- code_puppy/command_line/model_picker_completion.py +197 -0
- code_puppy/command_line/model_settings_menu.py +932 -0
- code_puppy/command_line/motd.py +96 -0
- code_puppy/command_line/onboarding_slides.py +179 -0
- code_puppy/command_line/onboarding_wizard.py +342 -0
- code_puppy/command_line/pin_command_completion.py +329 -0
- code_puppy/command_line/prompt_toolkit_completion.py +846 -0
- code_puppy/command_line/session_commands.py +302 -0
- code_puppy/command_line/shell_passthrough.py +145 -0
- code_puppy/command_line/skills_completion.py +160 -0
- code_puppy/command_line/uc_menu.py +893 -0
- code_puppy/command_line/utils.py +93 -0
- code_puppy/command_line/wiggum_state.py +78 -0
- code_puppy/config.py +1770 -0
- code_puppy/error_logging.py +134 -0
- code_puppy/gemini_code_assist.py +385 -0
- code_puppy/gemini_model.py +754 -0
- code_puppy/hook_engine/README.md +105 -0
- code_puppy/hook_engine/__init__.py +21 -0
- code_puppy/hook_engine/aliases.py +155 -0
- code_puppy/hook_engine/engine.py +221 -0
- code_puppy/hook_engine/executor.py +296 -0
- code_puppy/hook_engine/matcher.py +156 -0
- code_puppy/hook_engine/models.py +240 -0
- code_puppy/hook_engine/registry.py +106 -0
- code_puppy/hook_engine/validator.py +144 -0
- code_puppy/http_utils.py +361 -0
- code_puppy/keymap.py +128 -0
- code_puppy/main.py +10 -0
- code_puppy/mcp_/__init__.py +66 -0
- code_puppy/mcp_/async_lifecycle.py +286 -0
- code_puppy/mcp_/blocking_startup.py +469 -0
- code_puppy/mcp_/captured_stdio_server.py +275 -0
- code_puppy/mcp_/circuit_breaker.py +290 -0
- code_puppy/mcp_/config_wizard.py +507 -0
- code_puppy/mcp_/dashboard.py +308 -0
- code_puppy/mcp_/error_isolation.py +407 -0
- code_puppy/mcp_/examples/retry_example.py +226 -0
- code_puppy/mcp_/health_monitor.py +589 -0
- code_puppy/mcp_/managed_server.py +428 -0
- code_puppy/mcp_/manager.py +807 -0
- code_puppy/mcp_/mcp_logs.py +224 -0
- code_puppy/mcp_/registry.py +451 -0
- code_puppy/mcp_/retry_manager.py +337 -0
- code_puppy/mcp_/server_registry_catalog.py +1126 -0
- code_puppy/mcp_/status_tracker.py +355 -0
- code_puppy/mcp_/system_tools.py +209 -0
- code_puppy/mcp_prompts/__init__.py +1 -0
- code_puppy/mcp_prompts/hook_creator.py +103 -0
- code_puppy/messaging/__init__.py +255 -0
- code_puppy/messaging/bus.py +613 -0
- code_puppy/messaging/commands.py +167 -0
- code_puppy/messaging/markdown_patches.py +57 -0
- code_puppy/messaging/message_queue.py +361 -0
- code_puppy/messaging/messages.py +569 -0
- code_puppy/messaging/queue_console.py +271 -0
- code_puppy/messaging/renderers.py +311 -0
- code_puppy/messaging/rich_renderer.py +1158 -0
- code_puppy/messaging/spinner/__init__.py +83 -0
- code_puppy/messaging/spinner/console_spinner.py +240 -0
- code_puppy/messaging/spinner/spinner_base.py +95 -0
- code_puppy/messaging/subagent_console.py +460 -0
- code_puppy/model_factory.py +848 -0
- code_puppy/model_switching.py +63 -0
- code_puppy/model_utils.py +168 -0
- code_puppy/models.json +174 -0
- code_puppy/models_dev_api.json +1 -0
- code_puppy/models_dev_parser.py +592 -0
- code_puppy/plugins/__init__.py +186 -0
- code_puppy/plugins/agent_skills/__init__.py +22 -0
- code_puppy/plugins/agent_skills/config.py +175 -0
- code_puppy/plugins/agent_skills/discovery.py +136 -0
- code_puppy/plugins/agent_skills/downloader.py +392 -0
- code_puppy/plugins/agent_skills/installer.py +22 -0
- code_puppy/plugins/agent_skills/metadata.py +219 -0
- code_puppy/plugins/agent_skills/prompt_builder.py +60 -0
- code_puppy/plugins/agent_skills/register_callbacks.py +241 -0
- code_puppy/plugins/agent_skills/remote_catalog.py +322 -0
- code_puppy/plugins/agent_skills/skill_catalog.py +257 -0
- code_puppy/plugins/agent_skills/skills_install_menu.py +664 -0
- code_puppy/plugins/agent_skills/skills_menu.py +781 -0
- code_puppy/plugins/antigravity_oauth/__init__.py +10 -0
- code_puppy/plugins/antigravity_oauth/accounts.py +406 -0
- code_puppy/plugins/antigravity_oauth/antigravity_model.py +706 -0
- code_puppy/plugins/antigravity_oauth/config.py +42 -0
- code_puppy/plugins/antigravity_oauth/constants.py +133 -0
- code_puppy/plugins/antigravity_oauth/oauth.py +478 -0
- code_puppy/plugins/antigravity_oauth/register_callbacks.py +518 -0
- code_puppy/plugins/antigravity_oauth/storage.py +288 -0
- code_puppy/plugins/antigravity_oauth/test_plugin.py +319 -0
- code_puppy/plugins/antigravity_oauth/token.py +167 -0
- code_puppy/plugins/antigravity_oauth/transport.py +863 -0
- code_puppy/plugins/antigravity_oauth/utils.py +168 -0
- code_puppy/plugins/chatgpt_oauth/__init__.py +8 -0
- code_puppy/plugins/chatgpt_oauth/config.py +52 -0
- code_puppy/plugins/chatgpt_oauth/oauth_flow.py +329 -0
- code_puppy/plugins/chatgpt_oauth/register_callbacks.py +176 -0
- code_puppy/plugins/chatgpt_oauth/test_plugin.py +301 -0
- code_puppy/plugins/chatgpt_oauth/utils.py +523 -0
- code_puppy/plugins/claude_code_hooks/__init__.py +1 -0
- code_puppy/plugins/claude_code_hooks/config.py +137 -0
- code_puppy/plugins/claude_code_hooks/register_callbacks.py +175 -0
- code_puppy/plugins/claude_code_oauth/README.md +167 -0
- code_puppy/plugins/claude_code_oauth/SETUP.md +93 -0
- code_puppy/plugins/claude_code_oauth/__init__.py +25 -0
- code_puppy/plugins/claude_code_oauth/config.py +52 -0
- code_puppy/plugins/claude_code_oauth/register_callbacks.py +453 -0
- code_puppy/plugins/claude_code_oauth/test_plugin.py +283 -0
- code_puppy/plugins/claude_code_oauth/token_refresh_heartbeat.py +241 -0
- code_puppy/plugins/claude_code_oauth/utils.py +640 -0
- code_puppy/plugins/customizable_commands/__init__.py +0 -0
- code_puppy/plugins/customizable_commands/register_callbacks.py +152 -0
- code_puppy/plugins/example_custom_command/README.md +280 -0
- code_puppy/plugins/example_custom_command/register_callbacks.py +51 -0
- code_puppy/plugins/file_permission_handler/__init__.py +4 -0
- code_puppy/plugins/file_permission_handler/register_callbacks.py +470 -0
- code_puppy/plugins/frontend_emitter/__init__.py +25 -0
- code_puppy/plugins/frontend_emitter/emitter.py +121 -0
- code_puppy/plugins/frontend_emitter/register_callbacks.py +261 -0
- code_puppy/plugins/hook_creator/__init__.py +1 -0
- code_puppy/plugins/hook_creator/register_callbacks.py +33 -0
- code_puppy/plugins/hook_manager/__init__.py +1 -0
- code_puppy/plugins/hook_manager/config.py +290 -0
- code_puppy/plugins/hook_manager/hooks_menu.py +564 -0
- code_puppy/plugins/hook_manager/register_callbacks.py +227 -0
- code_puppy/plugins/oauth_puppy_html.py +228 -0
- code_puppy/plugins/scheduler/__init__.py +1 -0
- code_puppy/plugins/scheduler/register_callbacks.py +88 -0
- code_puppy/plugins/scheduler/scheduler_menu.py +522 -0
- code_puppy/plugins/scheduler/scheduler_wizard.py +341 -0
- code_puppy/plugins/shell_safety/__init__.py +6 -0
- code_puppy/plugins/shell_safety/agent_shell_safety.py +69 -0
- code_puppy/plugins/shell_safety/command_cache.py +156 -0
- code_puppy/plugins/shell_safety/register_callbacks.py +202 -0
- code_puppy/plugins/synthetic_status/__init__.py +1 -0
- code_puppy/plugins/synthetic_status/register_callbacks.py +132 -0
- code_puppy/plugins/synthetic_status/status_api.py +147 -0
- code_puppy/plugins/universal_constructor/__init__.py +13 -0
- code_puppy/plugins/universal_constructor/models.py +138 -0
- code_puppy/plugins/universal_constructor/register_callbacks.py +47 -0
- code_puppy/plugins/universal_constructor/registry.py +302 -0
- code_puppy/plugins/universal_constructor/sandbox.py +584 -0
- code_puppy/prompts/antigravity_system_prompt.md +1 -0
- code_puppy/pydantic_patches.py +356 -0
- code_puppy/reopenable_async_client.py +232 -0
- code_puppy/round_robin_model.py +150 -0
- code_puppy/scheduler/__init__.py +41 -0
- code_puppy/scheduler/__main__.py +9 -0
- code_puppy/scheduler/cli.py +118 -0
- code_puppy/scheduler/config.py +126 -0
- code_puppy/scheduler/daemon.py +280 -0
- code_puppy/scheduler/executor.py +155 -0
- code_puppy/scheduler/platform.py +19 -0
- code_puppy/scheduler/platform_unix.py +22 -0
- code_puppy/scheduler/platform_win.py +32 -0
- code_puppy/session_storage.py +338 -0
- code_puppy/status_display.py +257 -0
- code_puppy/summarization_agent.py +176 -0
- code_puppy/terminal_utils.py +418 -0
- code_puppy/tools/__init__.py +501 -0
- code_puppy/tools/agent_tools.py +603 -0
- code_puppy/tools/ask_user_question/__init__.py +26 -0
- code_puppy/tools/ask_user_question/constants.py +73 -0
- code_puppy/tools/ask_user_question/demo_tui.py +55 -0
- code_puppy/tools/ask_user_question/handler.py +232 -0
- code_puppy/tools/ask_user_question/models.py +304 -0
- code_puppy/tools/ask_user_question/registration.py +26 -0
- code_puppy/tools/ask_user_question/renderers.py +309 -0
- code_puppy/tools/ask_user_question/terminal_ui.py +329 -0
- code_puppy/tools/ask_user_question/theme.py +155 -0
- code_puppy/tools/ask_user_question/tui_loop.py +423 -0
- code_puppy/tools/browser/__init__.py +37 -0
- code_puppy/tools/browser/browser_control.py +289 -0
- code_puppy/tools/browser/browser_interactions.py +545 -0
- code_puppy/tools/browser/browser_locators.py +640 -0
- code_puppy/tools/browser/browser_manager.py +378 -0
- code_puppy/tools/browser/browser_navigation.py +251 -0
- code_puppy/tools/browser/browser_screenshot.py +179 -0
- code_puppy/tools/browser/browser_scripts.py +462 -0
- code_puppy/tools/browser/browser_workflows.py +221 -0
- code_puppy/tools/browser/chromium_terminal_manager.py +259 -0
- code_puppy/tools/browser/terminal_command_tools.py +534 -0
- code_puppy/tools/browser/terminal_screenshot_tools.py +552 -0
- code_puppy/tools/browser/terminal_tools.py +525 -0
- code_puppy/tools/command_runner.py +1346 -0
- code_puppy/tools/common.py +1409 -0
- code_puppy/tools/display.py +84 -0
- code_puppy/tools/file_modifications.py +886 -0
- code_puppy/tools/file_operations.py +802 -0
- code_puppy/tools/scheduler_tools.py +412 -0
- code_puppy/tools/skills_tools.py +244 -0
- code_puppy/tools/subagent_context.py +158 -0
- code_puppy/tools/tools_content.py +51 -0
- code_puppy/tools/universal_constructor.py +889 -0
- code_puppy/uvx_detection.py +242 -0
- code_puppy/version_checker.py +82 -0
- codepp-0.0.437.dist-info/METADATA +766 -0
- codepp-0.0.437.dist-info/RECORD +288 -0
- codepp-0.0.437.dist-info/WHEEL +4 -0
- codepp-0.0.437.dist-info/entry_points.txt +3 -0
- codepp-0.0.437.dist-info/licenses/LICENSE +21 -0
|
@@ -0,0 +1,848 @@
|
|
|
1
|
+
import json
|
|
2
|
+
import logging
|
|
3
|
+
import os
|
|
4
|
+
import pathlib
|
|
5
|
+
from typing import Any, Dict
|
|
6
|
+
|
|
7
|
+
from anthropic import AsyncAnthropic
|
|
8
|
+
from openai import AsyncAzureOpenAI
|
|
9
|
+
from pydantic_ai.models.anthropic import AnthropicModel, AnthropicModelSettings
|
|
10
|
+
from pydantic_ai.models.openai import (
|
|
11
|
+
OpenAIChatModel,
|
|
12
|
+
OpenAIChatModelSettings,
|
|
13
|
+
OpenAIResponsesModel,
|
|
14
|
+
)
|
|
15
|
+
from pydantic_ai.profiles import ModelProfile
|
|
16
|
+
from pydantic_ai.providers.anthropic import AnthropicProvider
|
|
17
|
+
from pydantic_ai.providers.cerebras import CerebrasProvider
|
|
18
|
+
from pydantic_ai.providers.openai import OpenAIProvider
|
|
19
|
+
from pydantic_ai.providers.openrouter import OpenRouterProvider
|
|
20
|
+
from pydantic_ai.settings import ModelSettings
|
|
21
|
+
|
|
22
|
+
from code_puppy.gemini_model import GeminiModel
|
|
23
|
+
from code_puppy.messaging import emit_warning
|
|
24
|
+
|
|
25
|
+
from . import callbacks
|
|
26
|
+
from .claude_cache_client import ClaudeCacheAsyncClient, patch_anthropic_client_messages
|
|
27
|
+
from .config import EXTRA_MODELS_FILE, get_value, get_yolo_mode
|
|
28
|
+
from .http_utils import create_async_client, get_cert_bundle_path, get_http2
|
|
29
|
+
from .round_robin_model import RoundRobinModel
|
|
30
|
+
|
|
31
|
+
logger = logging.getLogger(__name__)
|
|
32
|
+
|
|
33
|
+
# Registry for custom model provider classes from plugins
|
|
34
|
+
_CUSTOM_MODEL_PROVIDERS: Dict[str, type] = {}
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
def _load_plugin_model_providers():
|
|
38
|
+
"""Load custom model providers from plugins."""
|
|
39
|
+
global _CUSTOM_MODEL_PROVIDERS
|
|
40
|
+
try:
|
|
41
|
+
from code_puppy.callbacks import on_register_model_providers
|
|
42
|
+
|
|
43
|
+
results = on_register_model_providers()
|
|
44
|
+
for result in results:
|
|
45
|
+
if isinstance(result, dict):
|
|
46
|
+
_CUSTOM_MODEL_PROVIDERS.update(result)
|
|
47
|
+
except Exception as e:
|
|
48
|
+
logger.warning("Failed to load plugin model providers: %s", e)
|
|
49
|
+
|
|
50
|
+
|
|
51
|
+
# Load plugin model providers at module initialization
|
|
52
|
+
_load_plugin_model_providers()
|
|
53
|
+
|
|
54
|
+
|
|
55
|
+
# Anthropic beta header required for 1M context window support.
|
|
56
|
+
CONTEXT_1M_BETA = "context-1m-2025-08-07"
|
|
57
|
+
|
|
58
|
+
|
|
59
|
+
def _build_anthropic_beta_header(
|
|
60
|
+
model_config: Dict,
|
|
61
|
+
*,
|
|
62
|
+
interleaved_thinking: bool = False,
|
|
63
|
+
) -> str | None:
|
|
64
|
+
"""Build the anthropic-beta header value for an Anthropic model.
|
|
65
|
+
|
|
66
|
+
Combines beta flags based on model capabilities:
|
|
67
|
+
- interleaved-thinking-2025-05-14 (when interleaved_thinking is enabled)
|
|
68
|
+
- context-1m-2025-08-07 (when context_length >= 1_000_000)
|
|
69
|
+
|
|
70
|
+
Returns None if no beta flags are needed.
|
|
71
|
+
"""
|
|
72
|
+
parts: list[str] = []
|
|
73
|
+
if interleaved_thinking:
|
|
74
|
+
parts.append("interleaved-thinking-2025-05-14")
|
|
75
|
+
if model_config.get("context_length", 0) >= 1_000_000:
|
|
76
|
+
parts.append(CONTEXT_1M_BETA)
|
|
77
|
+
return ",".join(parts) if parts else None
|
|
78
|
+
|
|
79
|
+
|
|
80
|
+
def get_api_key(env_var_name: str) -> str | None:
    """Look up an API key, preferring the config store over the environment.

    Lets users provide keys via ``/set KIMI_API_KEY=xxx`` in addition to
    exporting them as environment variables.

    Args:
        env_var_name: Environment-variable-style name (e.g. "OPENAI_API_KEY");
            the config store is queried with its lowercased form.

    Returns:
        The key from config if present and non-empty, otherwise the value of
        the environment variable, otherwise None.
    """
    # A falsy config value (missing or empty) falls through to the
    # environment lookup.
    return get_value(env_var_name.lower()) or os.environ.get(env_var_name)
|
|
99
|
+
|
|
100
|
+
|
|
101
|
+
def make_model_settings(
    model_name: str, max_tokens: int | None = None
) -> ModelSettings:
    """Create appropriate ModelSettings for a given model.

    This handles model-specific settings:
    - GPT-5 models: reasoning_effort and verbosity (non-codex only)
    - Claude/Anthropic models: extended_thinking and budget_tokens
    - GLM-4.7 / GLM-5 models: "thinking" payload with clear_thinking default
    - Gemini thinking models: thinking_enabled / thinking_level defaults
    - Automatic max_tokens calculation based on model context length

    Args:
        model_name: The name of the model to create settings for.
        max_tokens: Optional max tokens limit. If None, automatically calculated
            as: max(2048, min(15% of context_length, 65536))

    Returns:
        Appropriate ModelSettings subclass instance for the model.
    """
    # Imported lazily to avoid an import cycle with code_puppy.config.
    from code_puppy.config import (
        get_effective_model_settings,
        get_openai_reasoning_effort,
        get_openai_verbosity,
        model_supports_setting,
    )

    # Accumulator for keyword args; mutated by each model-family branch below
    # and re-materialized into the right ModelSettings subclass at the end of
    # that branch. Statement order matters: user-effective settings must land
    # before the family-specific tweaks that read them.
    model_settings_dict: dict = {}

    # Calculate max_tokens if not explicitly provided
    if max_tokens is None:
        # Load model config to get context length
        try:
            models_config = ModelFactory.load_config()
            model_config = models_config.get(model_name, {})
            context_length = model_config.get("context_length", 128000)
        except Exception:
            # Fallback if config loading fails (e.g., in CI environments)
            context_length = 128000
        # min 2048, 15% of context, max 65536
        max_tokens = max(2048, min(int(0.15 * context_length), 65536))

    model_settings_dict["max_tokens"] = max_tokens
    # User-configured per-model settings override the computed defaults.
    effective_settings = get_effective_model_settings(model_name)
    model_settings_dict.update(effective_settings)

    # Disable parallel tool calls when yolo_mode is off (sequential so user can review each call)
    if not get_yolo_mode():
        model_settings_dict["parallel_tool_calls"] = False

    # Default to clear_thinking=False for GLM-4.7 and GLM-5 models (preserved thinking)
    if "glm-4.7" in model_name.lower() or "glm-5" in model_name.lower():
        clear_thinking = effective_settings.get("clear_thinking", False)
        model_settings_dict["thinking"] = {
            "type": "enabled",
            "clear_thinking": clear_thinking,
        }

    # Generic fallback; family branches below replace this with a subclass
    # built from the (further mutated) dict.
    model_settings: ModelSettings = ModelSettings(**model_settings_dict)

    if "gpt-5" in model_name:
        model_settings_dict["openai_reasoning_effort"] = get_openai_reasoning_effort()
        # Verbosity only applies to non-codex GPT-5 models (codex only supports "medium")
        if "codex" not in model_name:
            verbosity = get_openai_verbosity()
            model_settings_dict["extra_body"] = {"verbosity": verbosity}
        # NOTE(review): placed at the gpt-5 level so codex variants also get
        # OpenAIChatModelSettings (they still need reasoning_effort) — the
        # original indentation was ambiguous; confirm against upstream.
        model_settings = OpenAIChatModelSettings(**model_settings_dict)
    elif model_name.startswith("claude-") or model_name.startswith("anthropic-"):
        # Handle Anthropic extended thinking settings
        # Remove top_p as Anthropic doesn't support it with extended thinking
        model_settings_dict.pop("top_p", None)

        # Claude extended thinking requires temperature=1.0 (API restriction)
        # Default to 1.0 if not explicitly set by user
        if model_settings_dict.get("temperature") is None:
            model_settings_dict["temperature"] = 1.0

        from code_puppy.model_utils import get_default_extended_thinking

        default_thinking = get_default_extended_thinking(model_name)
        extended_thinking = effective_settings.get(
            "extended_thinking", default_thinking
        )
        # Backwards compat: handle legacy boolean values
        if extended_thinking is True:
            extended_thinking = "enabled"
        elif extended_thinking is False:
            extended_thinking = "off"

        budget_tokens = effective_settings.get("budget_tokens", 10000)
        if extended_thinking in ("enabled", "adaptive"):
            model_settings_dict["anthropic_thinking"] = {
                "type": extended_thinking,
            }
            # Only send budget_tokens for classic "enabled" mode
            if extended_thinking == "enabled" and budget_tokens:
                model_settings_dict["anthropic_thinking"]["budget_tokens"] = (
                    budget_tokens
                )

        # Opus 4-6 models support the `effort` setting via output_config.
        # pydantic-ai doesn't have a native field for output_config yet,
        # so we inject it through extra_body which gets merged into the
        # HTTP request body.
        if model_supports_setting(model_name, "effort"):
            effort = effective_settings.get("effort", "high")
            if "anthropic_thinking" in model_settings_dict:
                extra_body = model_settings_dict.get("extra_body") or {}
                extra_body["output_config"] = {"effort": effort}
                model_settings_dict["extra_body"] = extra_body

        model_settings = AnthropicModelSettings(**model_settings_dict)

    # Handle Gemini thinking models (Gemini-3)
    # Check if model supports thinking settings and apply defaults
    if model_supports_setting(model_name, "thinking_level"):
        # Apply defaults if not explicitly set by user
        # Default: thinking_enabled=True, thinking_level="low"
        if "thinking_enabled" not in model_settings_dict:
            model_settings_dict["thinking_enabled"] = True
        if "thinking_level" not in model_settings_dict:
            model_settings_dict["thinking_level"] = "low"
        # Recreate settings with Gemini thinking config
        model_settings = ModelSettings(**model_settings_dict)

    return model_settings
|
|
225
|
+
|
|
226
|
+
|
|
227
|
+
class ZaiChatModel(OpenAIChatModel):
    """OpenAI-compatible chat model with a response-normalization shim.

    NOTE(review): the override suggests the Z.ai endpoint returns a value
    other than "chat.completion" in the response's ``object`` field, which
    the upstream OpenAI response parsing would otherwise reject — confirm
    against the provider's actual API behavior.
    """

    def _process_response(self, response):
        # Force the standard discriminator before delegating to the base
        # class's parsing/validation.
        response.object = "chat.completion"
        return super()._process_response(response)
|
|
231
|
+
|
|
232
|
+
|
|
233
|
+
def _resolve_header_env_token(token: str, key: str) -> str:
    """Resolve a single ``$ENV_VAR`` header token via config/environment.

    Emits a warning and returns "" when the variable is not set, so a
    missing key degrades to an empty header value instead of crashing.
    *key* is only used for the warning message.
    """
    env_var_name = token[1:]
    resolved_value = get_api_key(env_var_name)
    if resolved_value is None:
        emit_warning(
            f"'{env_var_name}' is not set (check config or environment) for custom endpoint header '{key}'. Proceeding with empty value."
        )
        return ""
    return resolved_value


def get_custom_config(model_config):
    """Extract and validate the ``custom_endpoint`` section of a model config.

    Header values and the API key may reference environment variables (or
    config-store keys) with ``$NAME`` syntax — either as the whole value or
    as space-separated tokens (e.g. ``"Bearer $TOKEN"``).

    Args:
        model_config: A single model's configuration dict.

    Returns:
        Tuple ``(url, headers, verify, api_key)`` where ``verify`` is the
        optional CA bundle path and ``api_key`` may be None.

    Raises:
        ValueError: If ``custom_endpoint`` or its ``url`` field is missing.
    """
    custom_config = model_config.get("custom_endpoint", {})
    if not custom_config:
        raise ValueError("Custom model requires 'custom_endpoint' configuration")

    url = custom_config.get("url")
    if not url:
        raise ValueError("Custom endpoint requires 'url' field")

    headers = {}
    for key, value in custom_config.get("headers", {}).items():
        if value.startswith("$"):
            # Whole value is a single $VAR reference.
            value = _resolve_header_env_token(value, key)
        elif "$" in value:
            # Mixed value: resolve only the tokens that start with "$".
            # split/join on a single space preserves the original spacing.
            value = " ".join(
                _resolve_header_env_token(token, key)
                if token.startswith("$")
                else token
                for token in value.split(" ")
            )
        headers[key] = value

    api_key = None
    if "api_key" in custom_config:
        if custom_config["api_key"].startswith("$"):
            env_var_name = custom_config["api_key"][1:]
            api_key = get_api_key(env_var_name)
            if api_key is None:
                emit_warning(
                    f"API key '{env_var_name}' is not set (checked config and environment); proceeding without API key."
                )
        else:
            # Literal (non-$) API key value used as-is.
            api_key = custom_config["api_key"]

    if "ca_certs_path" in custom_config:
        verify = custom_config["ca_certs_path"]
    else:
        verify = None
    return url, headers, verify, api_key
|
|
287
|
+
|
|
288
|
+
|
|
289
|
+
class ModelFactory:
|
|
290
|
+
"""A factory for creating and managing different AI models."""
|
|
291
|
+
|
|
292
|
+
@staticmethod
|
|
293
|
+
def load_config() -> Dict[str, Any]:
|
|
294
|
+
load_model_config_callbacks = callbacks.get_callbacks("load_model_config")
|
|
295
|
+
if len(load_model_config_callbacks) > 0:
|
|
296
|
+
if len(load_model_config_callbacks) > 1:
|
|
297
|
+
logging.getLogger(__name__).warning(
|
|
298
|
+
"Multiple load_model_config callbacks registered, using the first"
|
|
299
|
+
)
|
|
300
|
+
config = callbacks.on_load_model_config()[0]
|
|
301
|
+
else:
|
|
302
|
+
# Always load from the bundled models.json so upstream
|
|
303
|
+
# updates propagate automatically. User additions belong
|
|
304
|
+
# in extra_models.json (overlay loaded below).
|
|
305
|
+
bundled_models = pathlib.Path(__file__).parent / "models.json"
|
|
306
|
+
with open(bundled_models, "r") as f:
|
|
307
|
+
config = json.load(f)
|
|
308
|
+
|
|
309
|
+
# Import OAuth model file paths from main config
|
|
310
|
+
from code_puppy.config import (
|
|
311
|
+
ANTIGRAVITY_MODELS_FILE,
|
|
312
|
+
CHATGPT_MODELS_FILE,
|
|
313
|
+
CLAUDE_MODELS_FILE,
|
|
314
|
+
GEMINI_MODELS_FILE,
|
|
315
|
+
)
|
|
316
|
+
|
|
317
|
+
# Build list of extra model sources
|
|
318
|
+
extra_sources: list[tuple[pathlib.Path, str, bool]] = [
|
|
319
|
+
(pathlib.Path(EXTRA_MODELS_FILE), "extra models", False),
|
|
320
|
+
(pathlib.Path(CHATGPT_MODELS_FILE), "ChatGPT OAuth models", False),
|
|
321
|
+
(pathlib.Path(CLAUDE_MODELS_FILE), "Claude Code OAuth models", True),
|
|
322
|
+
(pathlib.Path(GEMINI_MODELS_FILE), "Gemini OAuth models", False),
|
|
323
|
+
(pathlib.Path(ANTIGRAVITY_MODELS_FILE), "Antigravity OAuth models", False),
|
|
324
|
+
]
|
|
325
|
+
|
|
326
|
+
for source_path, label, use_filtered in extra_sources:
|
|
327
|
+
if not source_path.exists():
|
|
328
|
+
continue
|
|
329
|
+
try:
|
|
330
|
+
# Use filtered loading for Claude Code OAuth models to show only latest versions
|
|
331
|
+
if use_filtered:
|
|
332
|
+
try:
|
|
333
|
+
from code_puppy.plugins.claude_code_oauth.utils import (
|
|
334
|
+
load_claude_models_filtered,
|
|
335
|
+
)
|
|
336
|
+
|
|
337
|
+
extra_config = load_claude_models_filtered()
|
|
338
|
+
except ImportError:
|
|
339
|
+
# Plugin not available, fall back to standard JSON loading
|
|
340
|
+
logging.getLogger(__name__).debug(
|
|
341
|
+
f"claude_code_oauth plugin not available, loading {label} as plain JSON"
|
|
342
|
+
)
|
|
343
|
+
with open(source_path, "r") as f:
|
|
344
|
+
extra_config = json.load(f)
|
|
345
|
+
else:
|
|
346
|
+
with open(source_path, "r") as f:
|
|
347
|
+
extra_config = json.load(f)
|
|
348
|
+
config.update(extra_config)
|
|
349
|
+
except json.JSONDecodeError as exc:
|
|
350
|
+
logging.getLogger(__name__).warning(
|
|
351
|
+
f"Failed to load {label} config from {source_path}: Invalid JSON - {exc}"
|
|
352
|
+
)
|
|
353
|
+
except Exception as exc:
|
|
354
|
+
logging.getLogger(__name__).warning(
|
|
355
|
+
f"Failed to load {label} config from {source_path}: {exc}"
|
|
356
|
+
)
|
|
357
|
+
|
|
358
|
+
# Let plugins add/override models via load_models_config hook
|
|
359
|
+
try:
|
|
360
|
+
from code_puppy.callbacks import on_load_models_config
|
|
361
|
+
|
|
362
|
+
results = on_load_models_config()
|
|
363
|
+
for result in results:
|
|
364
|
+
if isinstance(result, dict):
|
|
365
|
+
config.update(result) # Plugin models override built-in
|
|
366
|
+
except Exception as exc:
|
|
367
|
+
logging.getLogger(__name__).debug(
|
|
368
|
+
f"Failed to load plugin models config: {exc}"
|
|
369
|
+
)
|
|
370
|
+
|
|
371
|
+
return config
|
|
372
|
+
|
|
373
|
+
@staticmethod
def get_model(model_name: str, config: Dict[str, Any]) -> Any:
    """Returns a configured model instance based on the provided name and config.

    API key validation happens naturally within each model type's initialization,
    which emits warnings and returns None if keys are missing.

    Dispatches on ``model_config["type"]`` to construct the appropriate
    provider/model pair. Plugin-registered provider classes (in
    ``_CUSTOM_MODEL_PROVIDERS``) take precedence over the built-in types.
    Model types handled entirely by plugins ('claude_code', 'antigravity',
    'chatgpt_oauth') fall through to the plugin-handler scan in the else branch.

    Args:
        model_name: Key into ``config`` identifying which model to build.
        config: Full models configuration mapping (name -> model config dict).

    Returns:
        A configured model instance, or None when a required credential is
        missing or a plugin handler fails (a warning/error is emitted first).

    Raises:
        ValueError: If ``model_name`` is absent from ``config``, if a
            required Azure setting is missing, if a round_robin config lacks
            a 'models' list, or if ``model_type`` is entirely unsupported.
    """
    model_config = config.get(model_name)
    if not model_config:
        raise ValueError(f"Model '{model_name}' not found in configuration.")

    model_type = model_config.get("type")

    # Check for plugin-registered model provider classes first
    # (these override built-in handling for the same type string).
    if model_type in _CUSTOM_MODEL_PROVIDERS:
        provider_class = _CUSTOM_MODEL_PROVIDERS[model_type]
        try:
            return provider_class(
                model_name=model_name, model_config=model_config, config=config
            )
        except Exception as e:
            # A broken plugin provider must not crash model resolution.
            logger.error(f"Custom model provider '{model_type}' failed: {e}")
            return None

    if model_type == "gemini":
        api_key = get_api_key("GEMINI_API_KEY")
        if not api_key:
            emit_warning(
                f"GEMINI_API_KEY is not set (check config or environment); skipping Gemini model '{model_config.get('name')}'."
            )
            return None

        model = GeminiModel(model_name=model_config["name"], api_key=api_key)
        return model

    elif model_type == "openai":
        api_key = get_api_key("OPENAI_API_KEY")
        if not api_key:
            emit_warning(
                f"OPENAI_API_KEY is not set (check config or environment); skipping OpenAI model '{model_config.get('name')}'."
            )
            return None

        provider = OpenAIProvider(api_key=api_key)
        model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
        # Codex-family models must go through the Responses API instead of
        # Chat Completions; the substring check matches e.g. "gpt-5-codex".
        if "codex" in model_name:
            model = OpenAIResponsesModel(
                model_name=model_config["name"], provider=provider
            )
        model.provider = provider
        return model

    elif model_type == "anthropic":
        api_key = get_api_key("ANTHROPIC_API_KEY")
        if not api_key:
            emit_warning(
                f"ANTHROPIC_API_KEY is not set (check config or environment); skipping Anthropic model '{model_config.get('name')}'."
            )
            return None

        # Use the same caching client as claude_code models
        verify = get_cert_bundle_path()
        http2_enabled = get_http2()

        client = ClaudeCacheAsyncClient(
            verify=verify,
            timeout=180,
            http2=http2_enabled,
        )

        # Check if interleaved thinking is enabled for this model
        # Only applies to Claude 4 models (Opus 4.5, Opus 4.1, Opus 4, Sonnet 4)
        # Local import here — presumably to avoid an import cycle with
        # code_puppy.config; TODO confirm.
        from code_puppy.config import get_effective_model_settings

        effective_settings = get_effective_model_settings(model_name)
        interleaved_thinking = effective_settings.get("interleaved_thinking", False)

        beta_header = _build_anthropic_beta_header(
            model_config, interleaved_thinking=interleaved_thinking
        )
        default_headers = {}
        if beta_header:
            default_headers["anthropic-beta"] = beta_header

        anthropic_client = AsyncAnthropic(
            api_key=api_key,
            http_client=client,
            # Pass None (not {}) when empty so the SDK keeps its own defaults.
            default_headers=default_headers if default_headers else None,
        )

        # Ensure cache_control is injected at the Anthropic SDK layer
        patch_anthropic_client_messages(anthropic_client)

        provider = AnthropicProvider(anthropic_client=anthropic_client)
        return AnthropicModel(model_name=model_config["name"], provider=provider)

    elif model_type == "custom_anthropic":
        url, headers, verify, api_key = get_custom_config(model_config)
        if not api_key:
            emit_warning(
                f"API key is not set for custom Anthropic endpoint; skipping model '{model_config.get('name')}'."
            )
            return None

        # Use the same caching client as claude_code models
        # Only fall back to the global cert bundle when the custom config
        # didn't specify its own `verify` value.
        if verify is None:
            verify = get_cert_bundle_path()

        http2_enabled = get_http2()

        client = ClaudeCacheAsyncClient(
            headers=headers,
            verify=verify,
            timeout=180,
            http2=http2_enabled,
        )

        # Check if interleaved thinking is enabled for this model
        from code_puppy.config import get_effective_model_settings

        effective_settings = get_effective_model_settings(model_name)
        interleaved_thinking = effective_settings.get("interleaved_thinking", False)

        beta_header = _build_anthropic_beta_header(
            model_config, interleaved_thinking=interleaved_thinking
        )
        default_headers = {}
        if beta_header:
            default_headers["anthropic-beta"] = beta_header

        anthropic_client = AsyncAnthropic(
            base_url=url,
            http_client=client,
            api_key=api_key,
            default_headers=default_headers if default_headers else None,
        )

        # Ensure cache_control is injected at the Anthropic SDK layer
        patch_anthropic_client_messages(anthropic_client)

        provider = AnthropicProvider(anthropic_client=anthropic_client)
        return AnthropicModel(model_name=model_config["name"], provider=provider)
    # NOTE: 'claude_code' model type is now handled by the claude_code_oauth plugin
    # via the register_model_type callback. See plugins/claude_code_oauth/register_callbacks.py

    elif model_type == "azure_openai":
        # Each of the three required Azure settings supports a "$ENV_VAR"
        # indirection: a leading '$' means "resolve via get_api_key".
        azure_endpoint_config = model_config.get("azure_endpoint")
        if not azure_endpoint_config:
            raise ValueError(
                "Azure OpenAI model type requires 'azure_endpoint' in its configuration."
            )
        azure_endpoint = azure_endpoint_config
        if azure_endpoint_config.startswith("$"):
            azure_endpoint = get_api_key(azure_endpoint_config[1:])
        if not azure_endpoint:
            emit_warning(
                f"Azure OpenAI endpoint '{azure_endpoint_config[1:] if azure_endpoint_config.startswith('$') else azure_endpoint_config}' not found (check config or environment); skipping model '{model_config.get('name')}'."
            )
            return None

        api_version_config = model_config.get("api_version")
        if not api_version_config:
            raise ValueError(
                "Azure OpenAI model type requires 'api_version' in its configuration."
            )
        api_version = api_version_config
        if api_version_config.startswith("$"):
            api_version = get_api_key(api_version_config[1:])
        if not api_version:
            emit_warning(
                f"Azure OpenAI API version '{api_version_config[1:] if api_version_config.startswith('$') else api_version_config}' not found (check config or environment); skipping model '{model_config.get('name')}'."
            )
            return None

        api_key_config = model_config.get("api_key")
        if not api_key_config:
            raise ValueError(
                "Azure OpenAI model type requires 'api_key' in its configuration."
            )
        api_key = api_key_config
        if api_key_config.startswith("$"):
            api_key = get_api_key(api_key_config[1:])
        if not api_key:
            emit_warning(
                f"Azure OpenAI API key '{api_key_config[1:] if api_key_config.startswith('$') else api_key_config}' not found (check config or environment); skipping model '{model_config.get('name')}'."
            )
            return None

        # Configure max_retries for the Azure client, defaulting if not specified in config
        azure_max_retries = model_config.get("max_retries", 2)

        azure_client = AsyncAzureOpenAI(
            azure_endpoint=azure_endpoint,
            api_version=api_version,
            api_key=api_key,
            max_retries=azure_max_retries,
        )
        provider = OpenAIProvider(openai_client=azure_client)
        model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
        model.provider = provider
        return model

    elif model_type == "custom_openai":
        url, headers, verify, api_key = get_custom_config(model_config)
        client = create_async_client(headers=headers, verify=verify)
        provider_args = dict(
            base_url=url,
            http_client=client,
        )
        # api_key is optional for custom endpoints (e.g. local servers);
        # only pass it through when present.
        if api_key:
            provider_args["api_key"] = api_key
        provider = OpenAIProvider(**provider_args)
        model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
        # NOTE(review): exact-name match here, unlike the substring match in
        # the "openai" branch — presumably intentional for this one model;
        # confirm before unifying.
        if model_name == "chatgpt-gpt-5-codex":
            model = OpenAIResponsesModel(model_config["name"], provider=provider)
        model.provider = provider
        return model
    elif model_type == "zai_coding":
        # ZAI "coding" plan endpoint (distinct base URL from zai_api below).
        api_key = get_api_key("ZAI_API_KEY")
        if not api_key:
            emit_warning(
                f"ZAI_API_KEY is not set (check config or environment); skipping ZAI coding model '{model_config.get('name')}'."
            )
            return None
        provider = OpenAIProvider(
            api_key=api_key,
            base_url="https://api.z.ai/api/coding/paas/v4",
        )
        zai_model = ZaiChatModel(
            model_name=model_config["name"],
            provider=provider,
        )
        zai_model.provider = provider
        return zai_model
    elif model_type == "zai_api":
        # ZAI general API endpoint; shares ZAI_API_KEY with zai_coding.
        api_key = get_api_key("ZAI_API_KEY")
        if not api_key:
            emit_warning(
                f"ZAI_API_KEY is not set (check config or environment); skipping ZAI API model '{model_config.get('name')}'."
            )
            return None
        provider = OpenAIProvider(
            api_key=api_key,
            base_url="https://api.z.ai/api/paas/v4/",
        )
        zai_model = ZaiChatModel(
            model_name=model_config["name"],
            provider=provider,
        )
        zai_model.provider = provider
        return zai_model
    # NOTE: 'antigravity' model type is now handled by the antigravity_oauth plugin
    # via the register_model_type callback. See plugins/antigravity_oauth/register_callbacks.py

    elif model_type == "custom_gemini":
        # Backwards compatibility: delegate to antigravity plugin if antigravity flag is set
        # New configs use type="antigravity" directly, but old configs may have
        # type="custom_gemini" with antigravity=True
        if model_config.get("antigravity"):
            # Find and call the antigravity handler from the plugin
            registered_handlers = callbacks.on_register_model_types()
            for handler_info in registered_handlers:
                # Each callback may return a single dict, a list of dicts,
                # or a falsy value — normalize to a list.
                handlers = (
                    handler_info
                    if isinstance(handler_info, list)
                    else [handler_info]
                    if handler_info
                    else []
                )
                for handler_entry in handlers:
                    if (
                        isinstance(handler_entry, dict)
                        and handler_entry.get("type") == "antigravity"
                    ):
                        handler = handler_entry.get("handler")
                        if callable(handler):
                            try:
                                return handler(model_name, model_config, config)
                            except Exception as e:
                                logger.error(f"Antigravity handler failed: {e}")
                                return None
            # If no antigravity handler found, warn and fall through
            emit_warning(
                f"Model '{model_config.get('name')}' has antigravity=True but antigravity plugin not loaded."
            )
            return None

        url, headers, verify, api_key = get_custom_config(model_config)
        if not api_key:
            emit_warning(
                f"API key is not set for custom Gemini endpoint; skipping model '{model_config.get('name')}'."
            )
            return None

        client = create_async_client(headers=headers, verify=verify)
        model = GeminiModel(
            model_name=model_config["name"],
            api_key=api_key,
            base_url=url,
            http_client=client,
        )
        return model
    elif model_type == "cerebras":

        # Local subclass so ZAI models served via Cerebras get a Qwen-style
        # model profile instead of the default Cerebras one.
        class ZaiCerebrasProvider(CerebrasProvider):
            def model_profile(self, model_name: str) -> ModelProfile | None:
                profile = super().model_profile(model_name)
                if model_name.startswith("zai"):
                    from pydantic_ai.profiles.qwen import qwen_model_profile

                    profile = profile.update(qwen_model_profile("qwen-3-coder"))
                return profile

        url, headers, verify, api_key = get_custom_config(model_config)
        if not api_key:
            emit_warning(
                f"API key is not set for Cerebras endpoint; skipping model '{model_config.get('name')}'."
            )
            return None
        # Add Cerebras 3rd party integration header
        headers["X-Cerebras-3rd-Party-Integration"] = "code-puppy"
        # Pass "cerebras" so RetryingAsyncClient knows to ignore Cerebras's
        # absurdly aggressive Retry-After headers (they send 60s!)
        # Note: model_config["name"] is "zai-glm-4.7", not "cerebras"
        client = create_async_client(
            headers=headers, verify=verify, model_name="cerebras"
        )
        provider_args = dict(
            api_key=api_key,
            http_client=client,
        )
        provider = ZaiCerebrasProvider(**provider_args)

        model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
        model.provider = provider
        return model

    elif model_type == "openrouter":
        # Get API key from config, which can be an environment variable reference or raw value
        api_key_config = model_config.get("api_key")
        api_key = None

        if api_key_config:
            if api_key_config.startswith("$"):
                # It's an environment variable reference
                env_var_name = api_key_config[1:]  # Remove the $ prefix
                api_key = get_api_key(env_var_name)
                if api_key is None:
                    emit_warning(
                        f"OpenRouter API key '{env_var_name}' not found (check config or environment); skipping model '{model_config.get('name')}'."
                    )
                    return None
            else:
                # It's a raw API key value
                api_key = api_key_config
        else:
            # No API key in config, try to get it from config or the default environment variable
            api_key = get_api_key("OPENROUTER_API_KEY")
            if api_key is None:
                emit_warning(
                    f"OPENROUTER_API_KEY is not set (check config or environment); skipping OpenRouter model '{model_config.get('name')}'."
                )
                return None

        provider = OpenRouterProvider(api_key=api_key)

        model = OpenAIChatModel(model_name=model_config["name"], provider=provider)
        model.provider = provider
        return model

    elif model_type == "gemini_oauth":
        # Gemini OAuth models use the Code Assist API (cloudcode-pa.googleapis.com)
        # This is a different API than the standard Generative Language API
        try:
            # Try user plugin first, then built-in plugin
            try:
                from gemini_oauth.config import GEMINI_OAUTH_CONFIG
                from gemini_oauth.utils import (
                    get_project_id,
                    get_valid_access_token,
                )
            except ImportError:
                from code_puppy.plugins.gemini_oauth.config import (
                    GEMINI_OAUTH_CONFIG,
                )
                from code_puppy.plugins.gemini_oauth.utils import (
                    get_project_id,
                    get_valid_access_token,
                )
        except ImportError as exc:
            emit_warning(
                f"Gemini OAuth plugin not available; skipping model '{model_config.get('name')}'. "
                f"Error: {exc}"
            )
            return None

        # Get a valid access token (refreshing if needed)
        access_token = get_valid_access_token()
        if not access_token:
            emit_warning(
                f"Failed to get valid Gemini OAuth token; skipping model '{model_config.get('name')}'. "
                "Run /gemini-auth to re-authenticate."
            )
            return None

        # Get project ID from stored tokens
        project_id = get_project_id()
        if not project_id:
            emit_warning(
                f"No Code Assist project ID found; skipping model '{model_config.get('name')}'. "
                "Run /gemini-auth to re-authenticate."
            )
            return None

        # Import the Code Assist model wrapper
        from code_puppy.gemini_code_assist import GeminiCodeAssistModel

        # Create the Code Assist model
        model = GeminiCodeAssistModel(
            model_name=model_config["name"],
            access_token=access_token,
            project_id=project_id,
            api_base_url=GEMINI_OAUTH_CONFIG["api_base_url"],
            api_version=GEMINI_OAUTH_CONFIG["api_version"],
        )
        return model

    # NOTE: 'chatgpt_oauth' model type is now handled by the chatgpt_oauth plugin
    # via the register_model_type callback. See plugins/chatgpt_oauth/register_callbacks.py

    elif model_type == "round_robin":
        # Get the list of model names to use in the round-robin
        model_names = model_config.get("models")
        if not model_names or not isinstance(model_names, list):
            raise ValueError(
                f"Round-robin model '{model_name}' requires a 'models' list in its configuration."
            )

        # Get the rotate_every parameter (default: 1)
        rotate_every = model_config.get("rotate_every", 1)

        # Resolve each model name to an actual model instance
        models = []
        for name in model_names:
            # Recursively get each model using the factory
            # NOTE(review): a member that fails to resolve appends None
            # here — presumably RoundRobinModel tolerates that; confirm.
            model = ModelFactory.get_model(name, config)
            models.append(model)

        # Create and return the round-robin model
        return RoundRobinModel(*models, rotate_every=rotate_every)

    else:
        # Check for plugin-registered model type handlers
        registered_handlers = callbacks.on_register_model_types()
        for handler_info in registered_handlers:
            # Handler info can be a list of dicts or a single dict
            if isinstance(handler_info, list):
                handlers = handler_info
            else:
                handlers = [handler_info] if handler_info else []

            for handler_entry in handlers:
                if not isinstance(handler_entry, dict):
                    continue
                if handler_entry.get("type") == model_type:
                    handler = handler_entry.get("handler")
                    if callable(handler):
                        try:
                            return handler(model_name, model_config, config)
                        except Exception as e:
                            logger.error(
                                f"Plugin handler for model type '{model_type}' failed: {e}"
                            )
                            return None

        raise ValueError(f"Unsupported model type: {model_type}")
|