PyPI - klaude-code - Versions diffs - 1.8.0__py3-none-any.whl → 2.0.0__py3-none-any.whl - Mend

klaude-code 1.8.0__py3-none-any.whl → 2.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (142)

klaude_code/auth/base.py +97 -0
klaude_code/auth/claude/__init__.py +6 -0
klaude_code/auth/claude/exceptions.py +9 -0
klaude_code/auth/claude/oauth.py +172 -0
klaude_code/auth/claude/token_manager.py +26 -0
klaude_code/auth/codex/token_manager.py +10 -50
klaude_code/cli/auth_cmd.py +127 -46
klaude_code/cli/config_cmd.py +4 -2
klaude_code/cli/cost_cmd.py +14 -9
klaude_code/cli/list_model.py +248 -200
klaude_code/cli/main.py +1 -1
klaude_code/cli/runtime.py +7 -5
klaude_code/cli/self_update.py +1 -1
klaude_code/cli/session_cmd.py +1 -1
klaude_code/command/clear_cmd.py +6 -2
klaude_code/command/command_abc.py +2 -2
klaude_code/command/debug_cmd.py +4 -4
klaude_code/command/export_cmd.py +2 -2
klaude_code/command/export_online_cmd.py +12 -12
klaude_code/command/fork_session_cmd.py +29 -23
klaude_code/command/help_cmd.py +4 -4
klaude_code/command/model_cmd.py +4 -4
klaude_code/command/model_select.py +1 -1
klaude_code/command/prompt-commit.md +82 -0
klaude_code/command/prompt_command.py +3 -3
klaude_code/command/refresh_cmd.py +2 -2
klaude_code/command/registry.py +7 -5
klaude_code/command/release_notes_cmd.py +4 -4
klaude_code/command/resume_cmd.py +15 -11
klaude_code/command/status_cmd.py +4 -4
klaude_code/command/terminal_setup_cmd.py +8 -8
klaude_code/command/thinking_cmd.py +4 -4
klaude_code/config/assets/builtin_config.yaml +52 -3
klaude_code/config/builtin_config.py +16 -5
klaude_code/config/config.py +31 -7
klaude_code/config/thinking.py +4 -4
klaude_code/const.py +146 -91
klaude_code/core/agent.py +3 -12
klaude_code/core/executor.py +21 -13
klaude_code/core/manager/sub_agent_manager.py +71 -7
klaude_code/core/prompt.py +1 -1
klaude_code/core/prompts/prompt-sub-agent-image-gen.md +1 -0
klaude_code/core/prompts/prompt-sub-agent-web.md +27 -1
klaude_code/core/reminders.py +88 -69
klaude_code/core/task.py +44 -45
klaude_code/core/tool/file/apply_patch_tool.py +9 -9
klaude_code/core/tool/file/diff_builder.py +3 -5
klaude_code/core/tool/file/edit_tool.py +23 -23
klaude_code/core/tool/file/move_tool.py +43 -43
klaude_code/core/tool/file/read_tool.py +44 -39
klaude_code/core/tool/file/write_tool.py +14 -14
klaude_code/core/tool/report_back_tool.py +4 -4
klaude_code/core/tool/shell/bash_tool.py +23 -23
klaude_code/core/tool/skill/skill_tool.py +7 -7
klaude_code/core/tool/sub_agent_tool.py +38 -9
klaude_code/core/tool/todo/todo_write_tool.py +8 -8
klaude_code/core/tool/todo/update_plan_tool.py +6 -6
klaude_code/core/tool/tool_abc.py +2 -2
klaude_code/core/tool/tool_context.py +27 -0
klaude_code/core/tool/tool_runner.py +88 -42
klaude_code/core/tool/truncation.py +38 -20
klaude_code/core/tool/web/mermaid_tool.py +6 -7
klaude_code/core/tool/web/web_fetch_tool.py +68 -30
klaude_code/core/tool/web/web_search_tool.py +15 -17
klaude_code/core/turn.py +120 -73
klaude_code/llm/anthropic/client.py +104 -44
klaude_code/llm/anthropic/input.py +116 -108
klaude_code/llm/bedrock/client.py +8 -5
klaude_code/llm/claude/__init__.py +3 -0
klaude_code/llm/claude/client.py +105 -0
klaude_code/llm/client.py +4 -3
klaude_code/llm/codex/client.py +16 -10
klaude_code/llm/google/client.py +122 -60
klaude_code/llm/google/input.py +94 -108
klaude_code/llm/image.py +123 -0
klaude_code/llm/input_common.py +136 -189
klaude_code/llm/openai_compatible/client.py +17 -7
klaude_code/llm/openai_compatible/input.py +36 -66
klaude_code/llm/openai_compatible/stream.py +119 -67
klaude_code/llm/openai_compatible/tool_call_accumulator.py +23 -11
klaude_code/llm/openrouter/client.py +34 -9
klaude_code/llm/openrouter/input.py +63 -64
klaude_code/llm/openrouter/reasoning.py +22 -24
klaude_code/llm/registry.py +20 -15
klaude_code/llm/responses/client.py +107 -45
klaude_code/llm/responses/input.py +115 -98
klaude_code/llm/usage.py +52 -25
klaude_code/protocol/__init__.py +1 -0
klaude_code/protocol/events.py +16 -12
klaude_code/protocol/llm_param.py +22 -3
klaude_code/protocol/message.py +250 -0
klaude_code/protocol/model.py +94 -281
klaude_code/protocol/op.py +2 -2
klaude_code/protocol/sub_agent/__init__.py +2 -2
klaude_code/protocol/sub_agent/explore.py +10 -0
klaude_code/protocol/sub_agent/image_gen.py +119 -0
klaude_code/protocol/sub_agent/task.py +10 -0
klaude_code/protocol/sub_agent/web.py +10 -0
klaude_code/session/codec.py +6 -6
klaude_code/session/export.py +261 -62
klaude_code/session/selector.py +7 -24
klaude_code/session/session.py +125 -53
klaude_code/session/store.py +5 -32
klaude_code/session/templates/export_session.html +1 -1
klaude_code/session/templates/mermaid_viewer.html +1 -1
klaude_code/trace/log.py +11 -6
klaude_code/ui/core/input.py +1 -1
klaude_code/ui/core/stage_manager.py +1 -8
klaude_code/ui/modes/debug/display.py +2 -2
klaude_code/ui/modes/repl/clipboard.py +2 -2
klaude_code/ui/modes/repl/completers.py +18 -10
klaude_code/ui/modes/repl/event_handler.py +136 -127
klaude_code/ui/modes/repl/input_prompt_toolkit.py +1 -1
klaude_code/ui/modes/repl/key_bindings.py +1 -1
klaude_code/ui/modes/repl/renderer.py +107 -15
klaude_code/ui/renderers/assistant.py +2 -2
klaude_code/ui/renderers/common.py +65 -7
klaude_code/ui/renderers/developer.py +7 -6
klaude_code/ui/renderers/diffs.py +11 -11
klaude_code/ui/renderers/mermaid_viewer.py +49 -2
klaude_code/ui/renderers/metadata.py +39 -31
klaude_code/ui/renderers/sub_agent.py +57 -16
klaude_code/ui/renderers/thinking.py +37 -2
klaude_code/ui/renderers/tools.py +180 -165
klaude_code/ui/rich/live.py +3 -1
klaude_code/ui/rich/markdown.py +39 -7
klaude_code/ui/rich/quote.py +76 -1
klaude_code/ui/rich/status.py +14 -8
klaude_code/ui/rich/theme.py +13 -6
klaude_code/ui/terminal/image.py +34 -0
klaude_code/ui/terminal/notifier.py +2 -1
klaude_code/ui/terminal/progress_bar.py +4 -4
klaude_code/ui/terminal/selector.py +22 -4
klaude_code/ui/utils/common.py +55 -0
{klaude_code-1.8.0.dist-info → klaude_code-2.0.0.dist-info}/METADATA +28 -6
klaude_code-2.0.0.dist-info/RECORD +229 -0
klaude_code/command/prompt-jj-describe.md +0 -32
klaude_code/core/prompts/prompt-sub-agent-oracle.md +0 -22
klaude_code/protocol/sub_agent/oracle.py +0 -91
klaude_code-1.8.0.dist-info/RECORD +0 -219
{klaude_code-1.8.0.dist-info → klaude_code-2.0.0.dist-info}/WHEEL +0 -0
{klaude_code-1.8.0.dist-info → klaude_code-2.0.0.dist-info}/entry_points.txt +0 -0

klaude_code/llm/claude/client.py ADDED

@@ -0,0 +1,105 @@
+import json
+from collections.abc import AsyncGenerator
+from typing import override
+import anthropic
+import httpx
+from anthropic import APIError
+from klaude_code.auth.claude.exceptions import ClaudeNotLoggedInError
+from klaude_code.auth.claude.oauth import ClaudeOAuth
+from klaude_code.auth.claude.token_manager import ClaudeTokenManager
+from klaude_code.const import (
+    ANTHROPIC_BETA_FINE_GRAINED_TOOL_STREAMING,
+    ANTHROPIC_BETA_INTERLEAVED_THINKING,
+    ANTHROPIC_BETA_OAUTH,
+    LLM_HTTP_TIMEOUT_CONNECT,
+    LLM_HTTP_TIMEOUT_READ,
+    LLM_HTTP_TIMEOUT_TOTAL,
+)
+from klaude_code.llm.anthropic.client import build_payload, parse_anthropic_stream
+from klaude_code.llm.client import LLMClientABC
+from klaude_code.llm.input_common import apply_config_defaults
+from klaude_code.llm.registry import register
+from klaude_code.llm.usage import MetadataTracker, error_stream_items
+from klaude_code.protocol import llm_param, message
+from klaude_code.trace import DebugType, log_debug
+_CLAUDE_OAUTH_REQUIRED_BETAS: tuple[str, ...] = (
+    ANTHROPIC_BETA_OAUTH,
+    ANTHROPIC_BETA_FINE_GRAINED_TOOL_STREAMING,
+)
+@register(llm_param.LLMClientProtocol.CLAUDE_OAUTH)
+class ClaudeClient(LLMClientABC):
+    """Claude OAuth client using Anthropic messages API with Bearer auth token."""
+    def __init__(self, config: llm_param.LLMConfigParameter):
+        super().__init__(config)
+        if config.base_url:
+            raise ValueError("CLAUDE protocol does not support custom base_url")
+        self._token_manager = ClaudeTokenManager()
+        self._oauth = ClaudeOAuth(self._token_manager)
+        if not self._token_manager.is_logged_in():
+            raise ClaudeNotLoggedInError("Claude authentication required. Run 'klaude login claude' first.")
+        self.client = self._create_client()
+    def _create_client(self) -> anthropic.AsyncAnthropic:
+        token = self._oauth.ensure_valid_token()
+        return anthropic.AsyncAnthropic(
+            auth_token=token,
+            timeout=httpx.Timeout(LLM_HTTP_TIMEOUT_TOTAL, connect=LLM_HTTP_TIMEOUT_CONNECT, read=LLM_HTTP_TIMEOUT_READ),
+        )
+    def _ensure_valid_token(self) -> None:
+        state = self._token_manager.get_state()
+        if state is None:
+            raise ClaudeNotLoggedInError("Not logged in to Claude. Run 'klaude login claude' first.")
+        if state.is_expired():
+            self._oauth.refresh()
+            self.client = self._create_client()
+    @classmethod
+    @override
+    def create(cls, config: llm_param.LLMConfigParameter) -> "LLMClientABC":
+        return cls(config)
+    @override
+    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[message.LLMStreamItem]:
+        self._ensure_valid_token()
+        param = apply_config_defaults(param, self.get_llm_config())
+        metadata_tracker = MetadataTracker(cost_config=self.get_llm_config().cost)
+        # Anthropic OAuth requires the oauth beta flag
+        extra_betas = list(_CLAUDE_OAUTH_REQUIRED_BETAS)
+        payload = build_payload(param, extra_betas=extra_betas)
+        # Keep the interleaved-thinking beta in sync with configured thinking.
+        if not (param.thinking and param.thinking.type == "enabled"):
+            payload["betas"] = [b for b in payload.get("betas", []) if b != ANTHROPIC_BETA_INTERLEAVED_THINKING]
+        log_debug(
+            json.dumps(payload, ensure_ascii=False, default=str),
+            style="yellow",
+            debug_type=DebugType.LLM_PAYLOAD,
+        )
+        stream = self.client.beta.messages.create(
+            **payload,
+            extra_headers={"extra": json.dumps({"session_id": param.session_id}, sort_keys=True)},
+        )
+        try:
+            async for item in parse_anthropic_stream(stream, param, metadata_tracker):
+                yield item
+        except (APIError, httpx.HTTPError) as e:
+            error_message = f"{e.__class__.__name__} {e!s}"
+            for item in error_stream_items(metadata_tracker, error=error_message):
+                yield item

klaude_code/llm/client.py CHANGED

@@ -2,7 +2,7 @@ from abc import ABC, abstractmethod
 from collections.abc import AsyncGenerator
 from typing import ParamSpec, TypeVar, cast
-from klaude_code.protocol import llm_param, model
+from klaude_code.protocol import llm_param, message
 class LLMClientABC(ABC):
@@ -15,9 +15,10 @@ class LLMClientABC(ABC):
         pass
     @abstractmethod
-    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[model.ConversationItem]:
+    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[message.LLMStreamItem]:
+        if False:  # pragma: no cover
+            yield cast(message.LLMStreamItem, None)
         raise NotImplementedError
-        yield cast(model.ConversationItem, None)
     def get_llm_config(self) -> llm_param.LLMConfigParameter:
         return self._config

klaude_code/llm/codex/client.py CHANGED

@@ -12,13 +12,20 @@ from openai.types.responses.response_create_params import ResponseCreateParamsSt
 from klaude_code.auth.codex.exceptions import CodexNotLoggedInError
 from klaude_code.auth.codex.oauth import CodexOAuth
 from klaude_code.auth.codex.token_manager import CodexTokenManager
+from klaude_code.const import (
+    CODEX_BASE_URL,
+    CODEX_USER_AGENT,
+    LLM_HTTP_TIMEOUT_CONNECT,
+    LLM_HTTP_TIMEOUT_READ,
+    LLM_HTTP_TIMEOUT_TOTAL,
+)
 from klaude_code.llm.client import LLMClientABC
 from klaude_code.llm.input_common import apply_config_defaults
 from klaude_code.llm.registry import register
 from klaude_code.llm.responses.client import parse_responses_stream
 from klaude_code.llm.responses.input import convert_history_to_input, convert_tool_schema
-from klaude_code.llm.usage import MetadataTracker
-from klaude_code.protocol import llm_param, model
+from klaude_code.llm.usage import MetadataTracker, error_stream_items
+from klaude_code.protocol import llm_param, message
 from klaude_code.trace import DebugType, log_debug
@@ -57,17 +64,14 @@ def build_payload(param: llm_param.LLMCallParameter) -> ResponseCreateParamsStre
     return payload
-# Codex API configuration
-CODEX_BASE_URL = "https://chatgpt.com/backend-api/codex"
 CODEX_HEADERS = {
     "originator": "codex_cli_rs",
-    # Mocked Codex-style user agent string
-    "User-Agent": "codex_cli_rs/0.0.0-klaude",
+    "User-Agent": CODEX_USER_AGENT,
     "OpenAI-Beta": "responses=experimental",
 }
-@register(llm_param.LLMClientProtocol.CODEX)
+@register(llm_param.LLMClientProtocol.CODEX_OAUTH)
 class CodexClient(LLMClientABC):
     """LLM client for Codex API using ChatGPT subscription."""
@@ -90,7 +94,7 @@ class CodexClient(LLMClientABC):
         return AsyncOpenAI(
             api_key=state.access_token,
             base_url=CODEX_BASE_URL,
-            timeout=httpx.Timeout(300.0, connect=15.0, read=285.0),
+            timeout=httpx.Timeout(LLM_HTTP_TIMEOUT_TOTAL, connect=LLM_HTTP_TIMEOUT_CONNECT, read=LLM_HTTP_TIMEOUT_READ),
             default_headers={
                 **CODEX_HEADERS,
                 "chatgpt-account-id": state.account_id,
@@ -114,7 +118,7 @@ class CodexClient(LLMClientABC):
         return cls(config)
     @override
-    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[model.ConversationItem]:
+    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[message.LLMStreamItem]:
         # Ensure token is valid before API call
         self._ensure_valid_token()
@@ -142,7 +146,9 @@ class CodexClient(LLMClientABC):
                 extra_headers=extra_headers,
             )
         except (openai.OpenAIError, httpx.HTTPError) as e:
-            yield model.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
+            error_message = f"{e.__class__.__name__} {e!s}"
+            for item in error_stream_items(metadata_tracker, error=error_message):
+                yield item
             return
         async for item in parse_responses_stream(stream, param, metadata_tracker):

klaude_code/llm/google/client.py CHANGED

@@ -5,7 +5,7 @@
 import json
 from collections.abc import AsyncGenerator, AsyncIterator
-from typing import Any, cast, override
+from typing import Any, Literal, cast, override
 from uuid import uuid4
 import httpx
@@ -26,7 +26,7 @@ from klaude_code.llm.google.input import convert_history_to_contents, convert_to
 from klaude_code.llm.input_common import apply_config_defaults
 from klaude_code.llm.registry import register
 from klaude_code.llm.usage import MetadataTracker
-from klaude_code.protocol import llm_param, model
+from klaude_code.protocol import llm_param, message, model
 from klaude_code.trace import DebugType, log_debug
@@ -114,25 +114,74 @@ def _merge_partial_args(dst: dict[str, Any], partial_args: list[Any] | None) ->
         dst[key] = _partial_arg_value(partial)
+def _map_finish_reason(reason: str) -> model.StopReason | None:
+    normalized = reason.strip().lower()
+    mapping: dict[str, model.StopReason] = {
+        "stop": "stop",
+        "end_turn": "stop",
+        "max_tokens": "length",
+        "length": "length",
+        "tool_use": "tool_use",
+        "safety": "error",
+        "recitation": "error",
+        "other": "error",
+        "content_filter": "error",
+        "blocked": "error",
+        "blocklist": "error",
+        "cancelled": "aborted",
+        "canceled": "aborted",
+        "aborted": "aborted",
+    }
+    return mapping.get(normalized)
 async def parse_google_stream(
     stream: AsyncIterator[Any],
     param: llm_param.LLMCallParameter,
     metadata_tracker: MetadataTracker,
-) -> AsyncGenerator[model.ConversationItem]:
+) -> AsyncGenerator[message.LLMStreamItem]:
     response_id: str | None = None
-    started = False
+    stage: Literal["waiting", "thinking", "assistant", "tool"] = "waiting"
     accumulated_text: list[str] = []
     accumulated_thoughts: list[str] = []
     thought_signature: str | None = None
+    assistant_parts: list[message.Part] = []
     # Track tool calls where args arrive as partial updates.
     partial_args_by_call: dict[str, dict[str, Any]] = {}
     started_tool_calls: dict[str, str] = {}  # call_id -> name
     started_tool_items: set[str] = set()
-    emitted_tool_items: set[str] = set()
+    completed_tool_items: set[str] = set()
     last_usage_metadata: UsageMetadata | None = None
+    stop_reason: model.StopReason | None = None
+    def flush_thinking() -> None:
+        nonlocal thought_signature
+        if accumulated_thoughts:
+            assistant_parts.append(
+                message.ThinkingTextPart(
+                    text="".join(accumulated_thoughts),
+                    model_id=str(param.model),
+                )
+            )
+            accumulated_thoughts.clear()
+        if thought_signature:
+            assistant_parts.append(
+                message.ThinkingSignaturePart(
+                    signature=thought_signature,
+                    model_id=str(param.model),
+                    format="google_thought_signature",
+                )
+            )
+            thought_signature = None
+    def flush_text() -> None:
+        if not accumulated_text:
+            return
+        assistant_parts.append(message.TextPart(text="".join(accumulated_text)))
+        accumulated_text.clear()
     async for chunk in stream:
         log_debug(
@@ -143,33 +192,44 @@ async def parse_google_stream(
         if response_id is None:
             response_id = getattr(chunk, "response_id", None) or uuid4().hex
-        assert response_id is not None
-        if not started:
-            started = True
-            yield model.StartItem(response_id=response_id)
         if getattr(chunk, "usage_metadata", None) is not None:
             last_usage_metadata = chunk.usage_metadata
         candidates = getattr(chunk, "candidates", None) or []
         candidate0 = candidates[0] if candidates else None
+        finish_reason = getattr(candidate0, "finish_reason", None) if candidate0 else None
+        if finish_reason is not None:
+            if isinstance(finish_reason, str):
+                reason_value = finish_reason
+            else:
+                reason_value = getattr(finish_reason, "name", None) or str(finish_reason)
+            stop_reason = _map_finish_reason(reason_value)
         content = getattr(candidate0, "content", None) if candidate0 else None
-        parts = getattr(content, "parts", None) if content else None
-        if not parts:
+        content_parts = getattr(content, "parts", None) if content else None
+        if not content_parts:
             continue
-        for part in parts:
+        for part in content_parts:
             if getattr(part, "text", None) is not None:
-                metadata_tracker.record_token()
                 text = part.text
+                if not text:
+                    continue
+                metadata_tracker.record_token()
                 if getattr(part, "thought", False) is True:
+                    if stage == "assistant":
+                        flush_text()
+                    stage = "thinking"
                     accumulated_thoughts.append(text)
                     if getattr(part, "thought_signature", None):
                         thought_signature = part.thought_signature
-                    yield model.ReasoningTextDelta(content=text, response_id=response_id)
+                    yield message.ThinkingTextDelta(content=text, response_id=response_id)
                 else:
+                    if stage == "thinking":
+                        flush_thinking()
+                    stage = "assistant"
                     accumulated_text.append(text)
-                    yield model.AssistantMessageDelta(content=text, response_id=response_id)
+                    yield message.AssistantTextDelta(content=text, response_id=response_id)
             function_call = getattr(part, "function_call", None)
             if function_call is None:
@@ -182,17 +242,23 @@ async def parse_google_stream(
             if call_id not in started_tool_items:
                 started_tool_items.add(call_id)
-                yield model.ToolCallStartItem(response_id=response_id, call_id=call_id, name=name)
+                yield message.ToolCallStartItem(response_id=response_id, call_id=call_id, name=name)
             args_obj = getattr(function_call, "args", None)
             if args_obj is not None:
-                emitted_tool_items.add(call_id)
-                yield model.ToolCallItem(
-                    response_id=response_id,
-                    call_id=call_id,
-                    name=name,
-                    arguments=json.dumps(args_obj, ensure_ascii=False),
+                if stage == "thinking":
+                    flush_thinking()
+                if stage == "assistant":
+                    flush_text()
+                stage = "tool"
+                assistant_parts.append(
+                    message.ToolCallPart(
+                        call_id=call_id,
+                        tool_name=name,
+                        arguments_json=json.dumps(args_obj, ensure_ascii=False),
+                    )
                 )
+                completed_tool_items.add(call_id)
                 continue
             partial_args = getattr(function_call, "partial_args", None)
@@ -201,53 +267,49 @@ async def parse_google_stream(
                 _merge_partial_args(acc, partial_args)
             will_continue = getattr(function_call, "will_continue", None)
-            if will_continue is False and call_id in partial_args_by_call and call_id not in emitted_tool_items:
-                emitted_tool_items.add(call_id)
-                yield model.ToolCallItem(
-                    response_id=response_id,
-                    call_id=call_id,
-                    name=name,
-                    arguments=json.dumps(partial_args_by_call[call_id], ensure_ascii=False),
+            if will_continue is False and call_id in partial_args_by_call and call_id not in completed_tool_items:
+                if stage == "thinking":
+                    flush_thinking()
+                if stage == "assistant":
+                    flush_text()
+                stage = "tool"
+                assistant_parts.append(
+                    message.ToolCallPart(
+                        call_id=call_id,
+                        tool_name=name,
+                        arguments_json=json.dumps(partial_args_by_call[call_id], ensure_ascii=False),
+                    )
                 )
+                completed_tool_items.add(call_id)
     # Flush any pending tool calls that never produced args.
     for call_id, name in started_tool_calls.items():
-        if call_id in emitted_tool_items:
+        if call_id in completed_tool_items:
             continue
         args = partial_args_by_call.get(call_id, {})
-        emitted_tool_items.add(call_id)
-        yield model.ToolCallItem(
-            response_id=response_id,
-            call_id=call_id,
-            name=name,
-            arguments=json.dumps(args, ensure_ascii=False),
-        )
-    if accumulated_thoughts:
-        metadata_tracker.record_token()
-        yield model.ReasoningTextItem(
-            content="".join(accumulated_thoughts),
-            response_id=response_id,
-            model=str(param.model),
-        )
-        if thought_signature:
-            yield model.ReasoningEncryptedItem(
-                encrypted_content=thought_signature,
-                response_id=response_id,
-                model=str(param.model),
-                format="google_thought_signature",
+        assistant_parts.append(
+            message.ToolCallPart(
+                call_id=call_id,
+                tool_name=name,
+                arguments_json=json.dumps(args, ensure_ascii=False),
             )
+        )
-    if accumulated_text:
-        metadata_tracker.record_token()
-        yield model.AssistantMessageItem(content="".join(accumulated_text), response_id=response_id)
+    flush_thinking()
+    flush_text()
     usage = _usage_from_metadata(last_usage_metadata, context_limit=param.context_limit, max_tokens=param.max_tokens)
     if usage is not None:
         metadata_tracker.set_usage(usage)
     metadata_tracker.set_model_name(str(param.model))
     metadata_tracker.set_response_id(response_id)
-    yield metadata_tracker.finalize()
+    metadata = metadata_tracker.finalize()
+    yield message.AssistantMessage(
+        parts=assistant_parts,
+        response_id=response_id,
+        usage=metadata,
+        stop_reason=stop_reason,
+    )
 @register(llm_param.LLMClientProtocol.GOOGLE)
@@ -270,7 +332,7 @@ class GoogleClient(LLMClientABC):
         return cls(config)
     @override
-    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[model.ConversationItem]:
+    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[message.LLMStreamItem]:
         param = apply_config_defaults(param, self.get_llm_config())
         metadata_tracker = MetadataTracker(cost_config=self.get_llm_config().cost)
@@ -297,13 +359,13 @@ class GoogleClient(LLMClientABC):
                 config=config,
             )
         except (APIError, ClientError, ServerError, httpx.HTTPError) as e:
-            yield model.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
-            yield metadata_tracker.finalize()
+            yield message.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
+            yield message.AssistantMessage(parts=[], response_id=None, usage=metadata_tracker.finalize())
             return
         try:
             async for item in parse_google_stream(stream, param=param, metadata_tracker=metadata_tracker):
                 yield item
         except (APIError, ClientError, ServerError, httpx.HTTPError) as e:
-            yield model.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
-            yield metadata_tracker.finalize()
+            yield message.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
+            yield message.AssistantMessage(parts=[], response_id=None, usage=metadata_tracker.finalize())

klaude-code 1.8.0__py3-none-any.whl → 2.0.0__py3-none-any.whl

klaude-code 1.8.0__py3-none-any.whl → 2.0.0__py3-none-any.whl