klaude_code-2.3.0-py3-none-any.whl → klaude_code-2.4.1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (54)
  1. klaude_code/cli/list_model.py +3 -3
  2. klaude_code/cli/main.py +2 -2
  3. klaude_code/config/assets/builtin_config.yaml +165 -307
  4. klaude_code/config/config.py +17 -17
  5. klaude_code/config/{select_model.py → model_matcher.py} +7 -7
  6. klaude_code/config/sub_agent_model_helper.py +1 -10
  7. klaude_code/config/thinking.py +2 -2
  8. klaude_code/core/agent_profile.py +9 -23
  9. klaude_code/core/executor.py +72 -70
  10. klaude_code/core/tool/file/diff_builder.py +25 -18
  11. klaude_code/llm/anthropic/client.py +5 -5
  12. klaude_code/llm/client.py +1 -1
  13. klaude_code/llm/codex/client.py +2 -2
  14. klaude_code/llm/google/client.py +6 -6
  15. klaude_code/llm/input_common.py +2 -2
  16. klaude_code/llm/openai_compatible/client.py +3 -3
  17. klaude_code/llm/openai_compatible/stream.py +1 -1
  18. klaude_code/llm/openrouter/client.py +4 -4
  19. klaude_code/llm/openrouter/input.py +1 -3
  20. klaude_code/llm/responses/client.py +5 -5
  21. klaude_code/protocol/events/__init__.py +7 -1
  22. klaude_code/protocol/events/chat.py +10 -0
  23. klaude_code/protocol/llm_param.py +1 -1
  24. klaude_code/protocol/model.py +0 -26
  25. klaude_code/protocol/op.py +0 -5
  26. klaude_code/session/session.py +4 -2
  27. klaude_code/tui/command/clear_cmd.py +0 -1
  28. klaude_code/tui/command/command_abc.py +6 -4
  29. klaude_code/tui/command/copy_cmd.py +10 -10
  30. klaude_code/tui/command/debug_cmd.py +11 -10
  31. klaude_code/tui/command/export_online_cmd.py +18 -23
  32. klaude_code/tui/command/fork_session_cmd.py +39 -43
  33. klaude_code/tui/command/model_cmd.py +5 -7
  34. klaude_code/tui/command/{model_select.py → model_picker.py} +3 -5
  35. klaude_code/tui/command/refresh_cmd.py +0 -1
  36. klaude_code/tui/command/registry.py +15 -21
  37. klaude_code/tui/command/resume_cmd.py +10 -16
  38. klaude_code/tui/command/status_cmd.py +8 -12
  39. klaude_code/tui/command/sub_agent_model_cmd.py +11 -16
  40. klaude_code/tui/command/terminal_setup_cmd.py +8 -11
  41. klaude_code/tui/command/thinking_cmd.py +4 -6
  42. klaude_code/tui/commands.py +5 -0
  43. klaude_code/tui/components/command_output.py +96 -0
  44. klaude_code/tui/components/developer.py +3 -110
  45. klaude_code/tui/components/welcome.py +2 -2
  46. klaude_code/tui/input/prompt_toolkit.py +6 -8
  47. klaude_code/tui/machine.py +5 -0
  48. klaude_code/tui/renderer.py +5 -5
  49. klaude_code/tui/runner.py +0 -6
  50. klaude_code/tui/terminal/selector.py +7 -8
  51. {klaude_code-2.3.0.dist-info → klaude_code-2.4.1.dist-info}/METADATA +21 -74
  52. {klaude_code-2.3.0.dist-info → klaude_code-2.4.1.dist-info}/RECORD +54 -53
  53. {klaude_code-2.3.0.dist-info → klaude_code-2.4.1.dist-info}/WHEEL +0 -0
  54. {klaude_code-2.3.0.dist-info → klaude_code-2.4.1.dist-info}/entry_points.txt +0 -0
klaude_code/cli/list_model.py CHANGED
@@ -181,7 +181,7 @@ def format_env_var_display(value: str | None) -> Text:
 
 def _get_model_params_display(model: ModelConfig) -> list[Text]:
     """Get display elements for model parameters."""
-    param_strings = format_model_params(model.model_params)
+    param_strings = format_model_params(model)
     if param_strings:
         return [Text(s) for s in param_strings]
     return [Text("")]
@@ -286,7 +286,7 @@ def _build_models_table(
 
         if not provider_available:
             name = Text.assemble((prefix, ThemeKey.LINES), (model.model_name, "dim"))
-            model_id = Text(model.model_params.model or "", style="dim")
+            model_id = Text(model.model_id or "", style="dim")
             params = Text("(unavailable)", style="dim")
         else:
             # Build role tags for this model
@@ -305,7 +305,7 @@ def _build_models_table(
                 )
             else:
                 name = Text.assemble((prefix, ThemeKey.LINES), (model.model_name, ThemeKey.CONFIG_ITEM_NAME))
-                model_id = Text(model.model_params.model or "")
+                model_id = Text(model.model_id or "")
                 params = Text(" · ").join(_get_model_params_display(model))
 
         models_table.add_row(name, model_id, params)
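
The `list_model.py` hunks are a direct consequence of the `ModelConfig` flattening in `config.py` (see the config.py hunks below): display helpers now take the model object itself and read `model.model_id`, where 2.3.0 went through the nested `model.model_params.model`. A minimal sketch of the access-path change, using simplified stand-in classes rather than the real `klaude_code.protocol.llm_param` types:

```python
from pydantic import BaseModel, ConfigDict


class LLMConfigModelParameter(BaseModel):
    # Stand-in for klaude_code.protocol.llm_param.LLMConfigModelParameter.
    model_config = ConfigDict(protected_namespaces=())  # allow model_* field names
    model_id: str | None = None


class ModelConfig(LLMConfigModelParameter):
    # 2.4.1: the config entry inherits the flattened parameter fields directly.
    model_name: str


m = ModelConfig(model_name="sonnet", model_id="claude-sonnet-4-5-20250929")
print(m.model_id)  # 2.4.1 access path; 2.3.0 used m.model_params.model
```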
klaude_code/cli/main.py CHANGED
@@ -124,7 +124,7 @@ def main_callback(
         raise typer.Exit(2)
 
     from klaude_code.app.runtime import AppInitConfig
-    from klaude_code.tui.command.model_select import ModelSelectStatus, select_model_interactive
+    from klaude_code.tui.command.model_picker import ModelSelectStatus, select_model_interactive
     from klaude_code.tui.runner import run_interactive
 
     update_terminal_title()
@@ -193,7 +193,7 @@ def main_callback(
         matches = [
             m.selector
             for m in cfg.iter_model_entries()
-            if (m.model_params.model or "").strip().lower() == raw_model.lower()
+            if (m.model_id or "").strip().lower() == raw_model.lower()
         ]
         if len(matches) == 1:
             chosen_model = matches[0]
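
The second `main.py` hunk is the `--model` resolution rule: a raw value is compared case-insensitively against each configured entry's `model_id`, and is auto-resolved only when exactly one entry matches. A self-contained sketch of that rule (the `Entry` type and sample data below are illustrative, not the real `ModelEntry`):

```python
from dataclasses import dataclass


@dataclass
class Entry:
    selector: str          # e.g. "provider/model-name"
    model_id: str | None   # provider-side model identifier


def resolve(raw_model: str, entries: list[Entry]) -> str | None:
    # Case-insensitive match on model_id; None-safe via `or ""`.
    matches = [
        e.selector
        for e in entries
        if (e.model_id or "").strip().lower() == raw_model.lower()
    ]
    # Only an unambiguous match is auto-chosen; otherwise fall through.
    return matches[0] if len(matches) == 1 else None


entries = [
    Entry("openai/gpt-5.2", "gpt-5.2"),
    Entry("codex/gpt-5.2-codex", "gpt-5.2-codex"),
]
print(resolve("GPT-5.2", entries))  # -> "openai/gpt-5.2"
print(resolve("unknown", entries))  # -> None
```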
klaude_code/config/assets/builtin_config.yaml CHANGED
@@ -1,280 +1,176 @@
+---
 # Built-in provider and model configurations
 # Users can start using klaude by simply setting environment variables
 # (ANTHROPIC_API_KEY, OPENAI_API_KEY, etc.) without manual configuration.
-
 provider_list:
   - provider_name: anthropic
     protocol: anthropic
     api_key: ${ANTHROPIC_API_KEY}
     model_list:
       - model_name: sonnet
-        model_params:
-          model: claude-sonnet-4-5-20250929
-          context_limit: 200000
-          provider_routing:
-            sort: throughput
-          cost:
-            input: 3.0
-            output: 15.0
-            cache_read: 0.3
-            cache_write: 3.75
+        model_id: claude-sonnet-4-5-20250929
+        context_limit: 200000
+        provider_routing:
+          sort: throughput
+        cost: {input: 3, output: 15, cache_read: 0.3, cache_write: 3.75}
       - model_name: opus
-        model_params:
-          model: claude-opus-4-5-20251101
-          context_limit: 200000
-          verbosity: high
-          thinking:
-            type: enabled
-            budget_tokens: 2048
-          cost:
-            input: 5.0
-            output: 25.0
-            cache_read: 0.5
-            cache_write: 6.25
-
+        model_id: claude-opus-4-5-20251101
+        context_limit: 200000
+        verbosity: high
+        thinking:
+          type: enabled
+          budget_tokens: 2048
+        cost: {input: 5, output: 25, cache_read: 0.5, cache_write: 6.25}
   - provider_name: openai
     protocol: responses
     api_key: ${OPENAI_API_KEY}
     model_list:
       - model_name: gpt-5.2
-        model_params:
-          model: gpt-5.2
-          max_tokens: 128000
-          context_limit: 400000
-          verbosity: high
-          thinking:
-            reasoning_effort: high
-          cost:
-            input: 1.75
-            output: 14.0
-            cache_read: 0.17
-
+        model_id: gpt-5.2
+        max_tokens: 128000
+        context_limit: 400000
+        verbosity: high
+        thinking:
+          reasoning_effort: high
+        cost: {input: 1.75, output: 14, cache_read: 0.17}
   - provider_name: openrouter
     protocol: openrouter
     api_key: ${OPENROUTER_API_KEY}
     model_list:
-      - model_name: gpt-5-mini
-        model_params:
-          model: openai/gpt-5-mini
-          max_tokens: 128000
-          context_limit: 400000
-          thinking:
-            reasoning_effort: high
-          cost:
-            input: 0.25
-            output: 2.0
-            cache_read: 0.03
       - model_name: gpt-5.1-codex-max
-        model_params:
-          model: openai/gpt-5.1-codex-max
-          max_tokens: 128000
-          context_limit: 400000
-          thinking:
-            reasoning_effort: medium
-          cost:
-            input: 1.25
-            output: 10.0
-            cache_read: 0.13
+        model_id: openai/gpt-5.1-codex-max
+        max_tokens: 128000
+        context_limit: 400000
+        thinking:
+          reasoning_effort: medium
+        cost: {input: 1.25, output: 10, cache_read: 0.13}
       - model_name: gpt-5.2
-        model_params:
-          model: openai/gpt-5.2
-          max_tokens: 128000
-          context_limit: 400000
-          verbosity: high
-          thinking:
-            reasoning_effort: high
-          cost:
-            input: 1.75
-            output: 14.0
-            cache_read: 0.17
+        model_id: openai/gpt-5.2
+        max_tokens: 128000
+        context_limit: 400000
+        verbosity: high
+        thinking:
+          reasoning_effort: high
+        cost: {input: 1.75, output: 14, cache_read: 0.17}
       - model_name: gpt-5.2-medium
-        model_params:
-          model: openai/gpt-5.2
-          max_tokens: 128000
-          context_limit: 400000
-          verbosity: high
-          thinking:
-            reasoning_effort: medium
-          cost:
-            input: 1.75
-            output: 14.0
-            cache_read: 0.17
+        model_id: openai/gpt-5.2
+        max_tokens: 128000
+        context_limit: 400000
+        verbosity: high
+        thinking:
+          reasoning_effort: medium
+        cost: {input: 1.75, output: 14, cache_read: 0.17}
       - model_name: gpt-5.2-low
-        model_params:
-          model: openai/gpt-5.2
-          max_tokens: 128000
-          context_limit: 400000
-          verbosity: low
-          thinking:
-            reasoning_effort: low
-          cost:
-            input: 1.75
-            output: 14.0
-            cache_read: 0.17
+        model_id: openai/gpt-5.2
+        max_tokens: 128000
+        context_limit: 400000
+        verbosity: low
+        thinking:
+          reasoning_effort: low
+        cost: {input: 1.75, output: 14, cache_read: 0.17}
       - model_name: gpt-5.2-fast
-        model_params:
-          model: openai/gpt-5.2
-          max_tokens: 128000
-          context_limit: 400000
-          verbosity: low
-          thinking:
-            reasoning_effort: none
-          cost:
-            input: 1.75
-            output: 14.0
-            cache_read: 0.17
+        model_id: openai/gpt-5.2
+        max_tokens: 128000
+        context_limit: 400000
+        verbosity: low
+        thinking:
+          reasoning_effort: none
+        cost: {input: 1.75, output: 14, cache_read: 0.17}
       - model_name: kimi
-        model_params:
-          model: moonshotai/kimi-k2-thinking
-          context_limit: 262144
-          provider_routing:
-            only:
-              - moonshotai/turbo
-          cost:
-            input: 0.6
-            output: 2.5
-            cache_read: 0.15
+        model_id: moonshotai/kimi-k2-thinking
+        context_limit: 262144
+        provider_routing:
+          only:
+            - moonshotai/turbo
+        cost: {input: 0.6, output: 2.5, cache_read: 0.15}
       - model_name: haiku
-        model_params:
-          model: anthropic/claude-haiku-4.5
-          context_limit: 200000
-          cost:
-            input: 1.0
-            output: 5.0
-            cache_read: 0.1
-            cache_write: 1.25
+        model_id: anthropic/claude-haiku-4.5
+        context_limit: 200000
+        cost: {input: 1, output: 5, cache_read: 0.1, cache_write: 1.25}
       - model_name: sonnet
-        model_params:
-          model: anthropic/claude-4.5-sonnet
-          context_limit: 200000
-          provider_routing:
-            sort: throughput
-          cost:
-            input: 3.0
-            output: 15.0
-            cache_read: 0.3
-            cache_write: 3.75
+        model_id: anthropic/claude-4.5-sonnet
+        context_limit: 200000
+        provider_routing:
+          sort: throughput
+        cost: {input: 3, output: 15, cache_read: 0.3, cache_write: 3.75}
       - model_name: opus
-        model_params:
-          model: anthropic/claude-4.5-opus
-          context_limit: 200000
-          verbosity: high
-          thinking:
-            type: enabled
-            budget_tokens: 2048
-          cost:
-            input: 5.0
-            output: 25.0
-            cache_read: 0.5
-            cache_write: 6.25
+        model_id: anthropic/claude-4.5-opus
+        context_limit: 200000
+        verbosity: high
+        thinking:
+          type: enabled
+          budget_tokens: 2048
+        cost: {input: 5, output: 25, cache_read: 0.5, cache_write: 6.25}
       - model_name: gemini-pro
-        model_params:
-          model: google/gemini-3-pro-preview
-          context_limit: 1048576
-          thinking:
-            reasoning_effort: high
-          cost:
-            input: 2.0
-            output: 12.0
-            cache_read: 0.2
+        model_id: google/gemini-3-pro-preview
+        context_limit: 1048576
+        thinking:
+          reasoning_effort: high
+        cost: {input: 2, output: 12, cache_read: 0.2}
       - model_name: gemini-flash
-        model_params:
-          model: google/gemini-3-flash-preview
-          context_limit: 1048576
-          thinking:
-            reasoning_effort: medium
-          cost:
-            input: 0.5
-            output: 3.0
-            cache_read: 0.05
+        model_id: google/gemini-3-flash-preview
+        context_limit: 1048576
+        thinking:
+          reasoning_effort: medium
+        cost: {input: 0.5, output: 3, cache_read: 0.05}
       - model_name: nano-banana-pro
-        model_params:
-          model: google/gemini-3-pro-image-preview
-          context_limit: 66000
-          modalities:
-            - image
-            - text
-          cost:
-            input: 2
-            output: 12
-            cache_read: 0.2
-            image: 120
+        model_id: google/gemini-3-pro-image-preview
+        context_limit: 66000
+        modalities:
+          - image
+          - text
+        cost: {input: 2, output: 12, cache_read: 0.2, image: 120}
       - model_name: nano-banana
-        model_params:
-          model: google/gemini-2.5-flash-image
-          context_limit: 33000
-          modalities:
-            - image
-            - text
-          cost:
-            input: 0.3
-            output: 2.5
-            cache_read: 0.03
-            image: 30
+        model_id: google/gemini-2.5-flash-image
+        context_limit: 33000
+        modalities:
+          - image
+          - text
+        cost: {input: 0.3, output: 2.5, cache_read: 0.03, image: 30}
       - model_name: grok
-        model_params:
-          model: x-ai/grok-4.1-fast
-          context_limit: 2000000
-          thinking:
-            type: enabled
-            budget_tokens: 2048
-          cost:
-            input: 0.2
-            output: 0.5
-            cache_read: 0.05
+        model_id: x-ai/grok-4.1-fast
+        context_limit: 2000000
+        thinking:
+          type: enabled
+          budget_tokens: 2048
+        cost: {input: 0.2, output: 0.5, cache_read: 0.05}
       - model_name: minimax
-        model_params:
-          model: minimax/minimax-m2.1
-          context_limit: 204800
-          cost:
-            input: 0.3
-            output: 1.2
-            cache_read: 0.03
+        model_id: minimax/minimax-m2.1
+        context_limit: 204800
+        cost: {input: 0.3, output: 1.2, cache_read: 0.03}
       - model_name: glm
-        model_params:
-          model: z-ai/glm-4.7
-          context_limit: 200000
-          provider_routing:
-            only:
-              - z-ai
-          cost:
-            input: 0.44
-            output: 1.74
-            cache_read: 0.04
-
+        model_id: z-ai/glm-4.7
+        context_limit: 200000
+        provider_routing:
+          only:
+            - z-ai
+        cost: {input: 0.44, output: 1.74, cache_read: 0.04}
+      - model_name: seedream
+        model_id: bytedance-seed/seedream-4.5
+        context_limit: 4000
+        cost: {input: 0, output: 9.581, image: 9.581}
+        modalities:
+          - image
+          - text
   - provider_name: google
     protocol: google
     api_key: ${GOOGLE_API_KEY}
     model_list:
       - model_name: gemini-pro
-        model_params:
-          model: gemini-3-pro-preview
-          context_limit: 1048576
-          cost:
-            input: 2.0
-            output: 12.0
-            cache_read: 0.2
+        model_id: gemini-3-pro-preview
+        context_limit: 1048576
+        cost: {input: 2, output: 12, cache_read: 0.2}
       - model_name: gemini-flash
-        model_params:
-          model: gemini-3-flash-preview
-          context_limit: 1048576
-          cost:
-            input: 0.5
-            output: 3.0
-            cache_read: 0.05
+        model_id: gemini-3-flash-preview
+        context_limit: 1048576
+        cost: {input: 0.5, output: 3, cache_read: 0.05}
       - model_name: nano-banana-pro
-        model_params:
-          model: gemini-3-pro-image-preview
-          context_limit: 66000
-          modalities:
-            - image
-            - text
-          cost:
-            input: 2
-            output: 12
-            cache_read: 0.2
-            image: 120
-
+        model_id: gemini-3-pro-image-preview
+        context_limit: 66000
+        modalities:
+          - image
+          - text
+        cost: {input: 2, output: 12, cache_read: 0.2, image: 120}
   - provider_name: bedrock
     protocol: bedrock
     aws_access_key: ${AWS_ACCESS_KEY_ID}
@@ -282,97 +178,59 @@ provider_list:
     aws_region: ${AWS_REGION}
     model_list:
       - model_name: sonnet
-        model_params:
-          model: us.anthropic.claude-sonnet-4-5-20250929-v1:0
-          context_limit: 200000
-          cost:
-            input: 3.0
-            output: 15.0
-            cache_read: 0.3
-            cache_write: 3.75
-
+        model_id: us.anthropic.claude-sonnet-4-5-20250929-v1:0
+        context_limit: 200000
+        cost: {input: 3, output: 15, cache_read: 0.3, cache_write: 3.75}
   - provider_name: deepseek
     protocol: anthropic
     api_key: ${DEEPSEEK_API_KEY}
     base_url: https://api.deepseek.com/anthropic
     model_list:
       - model_name: deepseek
-        model_params:
-          model: deepseek-reasoner
-          context_limit: 128000
-          thinking:
-            type: enabled
-            budget_tokens: 2048
-          cost:
-            input: 2
-            output: 3
-            cache_read: 0.2
-            currency: CNY
-
+        model_id: deepseek-reasoner
+        context_limit: 128000
+        thinking:
+          type: enabled
+          budget_tokens: 2048
+        cost: {input: 2, output: 3, cache_read: 0.2, currency: CNY}
   - provider_name: moonshot
     protocol: anthropic
     api_key: ${MOONSHOT_API_KEY}
     base_url: https://api.moonshot.cn/anthropic
     model_list:
       - model_name: kimi
-        model_params:
-          model: kimi-k2-thinking
-          context_limit: 262144
-          thinking:
-            type: enabled
-            budget_tokens: 8192
-          cost:
-            input: 4.0
-            output: 16.0
-            cache_read: 1.0
-            currency: CNY
-
+        model_id: kimi-k2-thinking
+        context_limit: 262144
+        thinking:
+          type: enabled
+          budget_tokens: 8192
+        cost: {input: 4, output: 16, cache_read: 1, currency: CNY}
   - provider_name: claude-max
     protocol: claude_oauth
     model_list:
       - model_name: sonnet
-        model_params:
-          model: claude-sonnet-4-5-20250929
-          context_limit: 200000
-          cost:
-            input: 3.0
-            output: 15.0
-            cache_read: 0.3
-            cache_write: 3.75
+        model_id: claude-sonnet-4-5-20250929
+        context_limit: 200000
+        cost: {input: 3, output: 15, cache_read: 0.3, cache_write: 3.75}
       - model_name: opus
-        model_params:
-          model: claude-opus-4-5-20251101
-          context_limit: 200000
-          verbosity: high
-          thinking:
-            type: enabled
-            budget_tokens: 2048
-          cost:
-            input: 5.0
-            output: 25.0
-            cache_read: 0.5
-            cache_write: 6.25
+        model_id: claude-opus-4-5-20251101
+        context_limit: 200000
+        verbosity: high
+        thinking:
+          type: enabled
+          budget_tokens: 2048
+        cost: {input: 5, output: 25, cache_read: 0.5, cache_write: 6.25}
       - model_name: haiku
-        model_params:
-          model: claude-haiku-4-5-20251001
-          context_limit: 200000
-          cost:
-            input: 1.0
-            output: 5.0
-            cache_read: 0.1
-            cache_write: 1.25
-
+        model_id: claude-haiku-4-5-20251001
+        context_limit: 200000
+        cost: {input: 1, output: 5, cache_read: 0.1, cache_write: 1.25}
   - provider_name: codex
     protocol: codex_oauth
     model_list:
       - model_name: gpt-5.2-codex
-        model_params:
-          model: gpt-5.2-codex
-          thinking:
-            reasoning_effort: medium
-          context_limit: 400000
-          max_tokens: 128000
-          cost:
-            input: 1.75
-            output: 14.0
-            cache_read: 0.17
+        model_id: gpt-5.2-codex
+        thinking:
+          reasoning_effort: medium
+        context_limit: 400000
+        max_tokens: 128000
+        cost: {input: 1.75, output: 14, cache_read: 0.17}
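
For user configs written against the 2.3.0 schema, the same flattening applies: the nested `model_params` block moves up into the model entry, and its `model` key becomes `model_id`. A hypothetical migration helper (a sketch, not a shipped tool) that rewrites one loaded YAML entry:

```python
from typing import Any


def flatten_model_entry(entry: dict[str, Any]) -> dict[str, Any]:
    # Pull the 2.3.0 nested block out of the entry, if present.
    params = dict(entry.pop("model_params", {}) or {})
    # The old `model` key is called `model_id` in 2.4.1.
    if "model" in params:
        params["model_id"] = params.pop("model")
    # Merge the flattened params into the entry itself.
    return {**entry, **params}


old = {
    "model_name": "sonnet",
    "model_params": {"model": "claude-sonnet-4-5-20250929", "context_limit": 200000},
}
print(flatten_model_entry(old))
# {'model_name': 'sonnet', 'model_id': 'claude-sonnet-4-5-20250929', 'context_limit': 200000}
```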
klaude_code/config/config.py CHANGED
@@ -58,9 +58,10 @@ config_path = Path.home() / ".klaude" / "klaude-config.yaml"
 example_config_path = Path.home() / ".klaude" / "klaude-config.example.yaml"
 
 
-class ModelConfig(BaseModel):
+class ModelConfig(llm_param.LLMConfigModelParameter):
+    """Model configuration that flattens LLMConfigModelParameter fields."""
+
     model_name: str
-    model_params: llm_param.LLMConfigModelParameter
 
 
 class ProviderConfig(llm_param.LLMConfigProviderParameter):
@@ -135,10 +136,11 @@ class UserProviderConfig(BaseModel):
     model_list: list[ModelConfig] = Field(default_factory=lambda: [])
 
 
-class ModelEntry(BaseModel):
+class ModelEntry(llm_param.LLMConfigModelParameter):
+    """Model entry with provider info, flattens LLMConfigModelParameter fields."""
+
     model_name: str
     provider: str
-    model_params: llm_param.LLMConfigModelParameter
 
     @property
     def selector(self) -> str:
@@ -325,7 +327,7 @@ class Config(BaseModel):
                 provider_dump["api_key"] = api_key
                 return llm_param.LLMConfigParameter(
                     **provider_dump,
-                    **model.model_params.model_dump(),
+                    **model.model_dump(exclude={"model_name"}),
                 )
 
         raise ValueError(f"Unknown model: {model_name}")
@@ -340,7 +342,7 @@
             ModelEntry(
                 model_name=model.model_name,
                 provider=provider.provider_name,
-                model_params=model.model_params,
+                **model.model_dump(exclude={"model_name"}),
             )
             for provider in self.provider_list
             if not only_available or not provider.is_api_key_missing()
@@ -350,7 +352,7 @@
     def has_available_image_model(self) -> bool:
        """Check if any image generation model is available."""
        for entry in self.iter_model_entries(only_available=True):
-            if entry.model_params.modalities and "image" in entry.model_params.modalities:
+            if entry.modalities and "image" in entry.modalities:
                return True
        return False
 
@@ -364,7 +366,7 @@
     def get_first_available_image_model(self) -> str | None:
         """Get the first available image generation model, or None."""
         for entry in self.iter_model_entries(only_available=True):
-            if entry.model_params.modalities and "image" in entry.model_params.modalities:
+            if entry.modalities and "image" in entry.modalities:
                 return entry.model_name
         return None
 
@@ -409,15 +411,13 @@ def get_example_config() -> UserConfig:
         model_list=[
             ModelConfig(
                 model_name="my-model",
-                model_params=llm_param.LLMConfigModelParameter(
-                    model="model-id-from-provider",
-                    max_tokens=16000,
-                    context_limit=200000,
-                    cost=llm_param.Cost(
-                        input=1,
-                        output=10,
-                        cache_read=0.1,
-                    ),
+                model_id="model-id-from-provider",
+                max_tokens=16000,
+                context_limit=200000,
+                cost=llm_param.Cost(
+                    input=1,
+                    output=10,
+                    cache_read=0.1,
                 ),
             ),
         ],
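
The payoff of subclassing `LLMConfigModelParameter` shows up in the `get_llm_config`-style merging above: a single `model_dump(exclude={"model_name"})` yields exactly the keyword arguments the combined parameter object expects, with no nested unwrapping. A sketch with simplified stand-ins for the `llm_param` types (field names beyond `model_id`/`context_limit` are illustrative):

```python
from pydantic import BaseModel, ConfigDict


class LLMConfigModelParameter(BaseModel):
    # Stand-in for klaude_code.protocol.llm_param.LLMConfigModelParameter.
    model_config = ConfigDict(protected_namespaces=())  # allow model_* field names
    model_id: str | None = None
    context_limit: int | None = None


class ModelConfig(LLMConfigModelParameter):
    # 2.4.1: the config entry *is* a parameter object; only model_name is extra.
    model_name: str


class LLMConfigParameter(BaseModel):
    # Stand-in for the merged provider + model parameter object.
    model_config = ConfigDict(protected_namespaces=())
    api_key: str | None = None
    model_id: str | None = None
    context_limit: int | None = None


model = ModelConfig(
    model_name="sonnet",
    model_id="claude-sonnet-4-5-20250929",
    context_limit=200000,
)
provider_dump = {"api_key": "sk-..."}
cfg = LLMConfigParameter(**provider_dump, **model.model_dump(exclude={"model_name"}))
print(cfg.model_id, cfg.context_limit)  # claude-sonnet-4-5-20250929 200000
```

The same dump also feeds `ModelEntry(**model.model_dump(exclude={"model_name"}))` in `iter_model_entries`, which is why both classes share the flattened base.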