klaude-code 1.8.0__py3-none-any.whl → 2.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (142)
  1. klaude_code/auth/base.py +97 -0
  2. klaude_code/auth/claude/__init__.py +6 -0
  3. klaude_code/auth/claude/exceptions.py +9 -0
  4. klaude_code/auth/claude/oauth.py +172 -0
  5. klaude_code/auth/claude/token_manager.py +26 -0
  6. klaude_code/auth/codex/token_manager.py +10 -50
  7. klaude_code/cli/auth_cmd.py +127 -46
  8. klaude_code/cli/config_cmd.py +4 -2
  9. klaude_code/cli/cost_cmd.py +14 -9
  10. klaude_code/cli/list_model.py +248 -200
  11. klaude_code/cli/main.py +1 -1
  12. klaude_code/cli/runtime.py +7 -5
  13. klaude_code/cli/self_update.py +1 -1
  14. klaude_code/cli/session_cmd.py +1 -1
  15. klaude_code/command/clear_cmd.py +6 -2
  16. klaude_code/command/command_abc.py +2 -2
  17. klaude_code/command/debug_cmd.py +4 -4
  18. klaude_code/command/export_cmd.py +2 -2
  19. klaude_code/command/export_online_cmd.py +12 -12
  20. klaude_code/command/fork_session_cmd.py +29 -23
  21. klaude_code/command/help_cmd.py +4 -4
  22. klaude_code/command/model_cmd.py +4 -4
  23. klaude_code/command/model_select.py +1 -1
  24. klaude_code/command/prompt-commit.md +82 -0
  25. klaude_code/command/prompt_command.py +3 -3
  26. klaude_code/command/refresh_cmd.py +2 -2
  27. klaude_code/command/registry.py +7 -5
  28. klaude_code/command/release_notes_cmd.py +4 -4
  29. klaude_code/command/resume_cmd.py +15 -11
  30. klaude_code/command/status_cmd.py +4 -4
  31. klaude_code/command/terminal_setup_cmd.py +8 -8
  32. klaude_code/command/thinking_cmd.py +4 -4
  33. klaude_code/config/assets/builtin_config.yaml +52 -3
  34. klaude_code/config/builtin_config.py +16 -5
  35. klaude_code/config/config.py +31 -7
  36. klaude_code/config/thinking.py +4 -4
  37. klaude_code/const.py +146 -91
  38. klaude_code/core/agent.py +3 -12
  39. klaude_code/core/executor.py +21 -13
  40. klaude_code/core/manager/sub_agent_manager.py +71 -7
  41. klaude_code/core/prompt.py +1 -1
  42. klaude_code/core/prompts/prompt-sub-agent-image-gen.md +1 -0
  43. klaude_code/core/prompts/prompt-sub-agent-web.md +27 -1
  44. klaude_code/core/reminders.py +88 -69
  45. klaude_code/core/task.py +44 -45
  46. klaude_code/core/tool/file/apply_patch_tool.py +9 -9
  47. klaude_code/core/tool/file/diff_builder.py +3 -5
  48. klaude_code/core/tool/file/edit_tool.py +23 -23
  49. klaude_code/core/tool/file/move_tool.py +43 -43
  50. klaude_code/core/tool/file/read_tool.py +44 -39
  51. klaude_code/core/tool/file/write_tool.py +14 -14
  52. klaude_code/core/tool/report_back_tool.py +4 -4
  53. klaude_code/core/tool/shell/bash_tool.py +23 -23
  54. klaude_code/core/tool/skill/skill_tool.py +7 -7
  55. klaude_code/core/tool/sub_agent_tool.py +38 -9
  56. klaude_code/core/tool/todo/todo_write_tool.py +8 -8
  57. klaude_code/core/tool/todo/update_plan_tool.py +6 -6
  58. klaude_code/core/tool/tool_abc.py +2 -2
  59. klaude_code/core/tool/tool_context.py +27 -0
  60. klaude_code/core/tool/tool_runner.py +88 -42
  61. klaude_code/core/tool/truncation.py +38 -20
  62. klaude_code/core/tool/web/mermaid_tool.py +6 -7
  63. klaude_code/core/tool/web/web_fetch_tool.py +68 -30
  64. klaude_code/core/tool/web/web_search_tool.py +15 -17
  65. klaude_code/core/turn.py +120 -73
  66. klaude_code/llm/anthropic/client.py +104 -44
  67. klaude_code/llm/anthropic/input.py +116 -108
  68. klaude_code/llm/bedrock/client.py +8 -5
  69. klaude_code/llm/claude/__init__.py +3 -0
  70. klaude_code/llm/claude/client.py +105 -0
  71. klaude_code/llm/client.py +4 -3
  72. klaude_code/llm/codex/client.py +16 -10
  73. klaude_code/llm/google/client.py +122 -60
  74. klaude_code/llm/google/input.py +94 -108
  75. klaude_code/llm/image.py +123 -0
  76. klaude_code/llm/input_common.py +136 -189
  77. klaude_code/llm/openai_compatible/client.py +17 -7
  78. klaude_code/llm/openai_compatible/input.py +36 -66
  79. klaude_code/llm/openai_compatible/stream.py +119 -67
  80. klaude_code/llm/openai_compatible/tool_call_accumulator.py +23 -11
  81. klaude_code/llm/openrouter/client.py +34 -9
  82. klaude_code/llm/openrouter/input.py +63 -64
  83. klaude_code/llm/openrouter/reasoning.py +22 -24
  84. klaude_code/llm/registry.py +20 -15
  85. klaude_code/llm/responses/client.py +107 -45
  86. klaude_code/llm/responses/input.py +115 -98
  87. klaude_code/llm/usage.py +52 -25
  88. klaude_code/protocol/__init__.py +1 -0
  89. klaude_code/protocol/events.py +16 -12
  90. klaude_code/protocol/llm_param.py +22 -3
  91. klaude_code/protocol/message.py +250 -0
  92. klaude_code/protocol/model.py +94 -281
  93. klaude_code/protocol/op.py +2 -2
  94. klaude_code/protocol/sub_agent/__init__.py +2 -2
  95. klaude_code/protocol/sub_agent/explore.py +10 -0
  96. klaude_code/protocol/sub_agent/image_gen.py +119 -0
  97. klaude_code/protocol/sub_agent/task.py +10 -0
  98. klaude_code/protocol/sub_agent/web.py +10 -0
  99. klaude_code/session/codec.py +6 -6
  100. klaude_code/session/export.py +261 -62
  101. klaude_code/session/selector.py +7 -24
  102. klaude_code/session/session.py +125 -53
  103. klaude_code/session/store.py +5 -32
  104. klaude_code/session/templates/export_session.html +1 -1
  105. klaude_code/session/templates/mermaid_viewer.html +1 -1
  106. klaude_code/trace/log.py +11 -6
  107. klaude_code/ui/core/input.py +1 -1
  108. klaude_code/ui/core/stage_manager.py +1 -8
  109. klaude_code/ui/modes/debug/display.py +2 -2
  110. klaude_code/ui/modes/repl/clipboard.py +2 -2
  111. klaude_code/ui/modes/repl/completers.py +18 -10
  112. klaude_code/ui/modes/repl/event_handler.py +136 -127
  113. klaude_code/ui/modes/repl/input_prompt_toolkit.py +1 -1
  114. klaude_code/ui/modes/repl/key_bindings.py +1 -1
  115. klaude_code/ui/modes/repl/renderer.py +107 -15
  116. klaude_code/ui/renderers/assistant.py +2 -2
  117. klaude_code/ui/renderers/common.py +65 -7
  118. klaude_code/ui/renderers/developer.py +7 -6
  119. klaude_code/ui/renderers/diffs.py +11 -11
  120. klaude_code/ui/renderers/mermaid_viewer.py +49 -2
  121. klaude_code/ui/renderers/metadata.py +39 -31
  122. klaude_code/ui/renderers/sub_agent.py +57 -16
  123. klaude_code/ui/renderers/thinking.py +37 -2
  124. klaude_code/ui/renderers/tools.py +180 -165
  125. klaude_code/ui/rich/live.py +3 -1
  126. klaude_code/ui/rich/markdown.py +39 -7
  127. klaude_code/ui/rich/quote.py +76 -1
  128. klaude_code/ui/rich/status.py +14 -8
  129. klaude_code/ui/rich/theme.py +13 -6
  130. klaude_code/ui/terminal/image.py +34 -0
  131. klaude_code/ui/terminal/notifier.py +2 -1
  132. klaude_code/ui/terminal/progress_bar.py +4 -4
  133. klaude_code/ui/terminal/selector.py +22 -4
  134. klaude_code/ui/utils/common.py +55 -0
  135. {klaude_code-1.8.0.dist-info → klaude_code-2.0.0.dist-info}/METADATA +28 -6
  136. klaude_code-2.0.0.dist-info/RECORD +229 -0
  137. klaude_code/command/prompt-jj-describe.md +0 -32
  138. klaude_code/core/prompts/prompt-sub-agent-oracle.md +0 -22
  139. klaude_code/protocol/sub_agent/oracle.py +0 -91
  140. klaude_code-1.8.0.dist-info/RECORD +0 -219
  141. {klaude_code-1.8.0.dist-info → klaude_code-2.0.0.dist-info}/WHEEL +0 -0
  142. {klaude_code-1.8.0.dist-info → klaude_code-2.0.0.dist-info}/entry_points.txt +0 -0
klaude_code/llm/openrouter/reasoning.py +22 -24

@@ -1,7 +1,7 @@
 from pydantic import BaseModel
 
 from klaude_code.llm.openai_compatible.stream import ReasoningDeltaResult, ReasoningHandlerABC
-from klaude_code.protocol import model
+from klaude_code.protocol import message
 from klaude_code.trace import log
 
 
@@ -42,7 +42,7 @@ class ReasoningStreamHandler(ReasoningHandlerABC):
         if not reasoning_details:
             return ReasoningDeltaResult(handled=False, outputs=[])
 
-        outputs: list[str | model.ConversationItem] = []
+        outputs: list[str | message.Part] = []
         for item in reasoning_details:
             try:
                 reasoning_detail = ReasoningDetail.model_validate(item)
@@ -56,16 +56,16 @@ class ReasoningStreamHandler(ReasoningHandlerABC):
 
         return ReasoningDeltaResult(handled=True, outputs=outputs)
 
-    def on_detail(self, detail: ReasoningDetail) -> list[model.ConversationItem]:
-        """Process a single reasoning detail and return streamable items."""
-        items: list[model.ConversationItem] = []
+    def on_detail(self, detail: ReasoningDetail) -> list[message.Part]:
+        """Process a single reasoning detail and return streamable parts."""
+        items: list[message.Part] = []
 
         if detail.type == "reasoning.encrypted":
             self._reasoning_id = detail.id
             # Flush accumulated text before encrypted content
             items.extend(self._flush_text())
-            if encrypted_item := self._build_encrypted_item(detail.data, detail):
-                items.append(encrypted_item)
+            if signature_part := self._build_signature_part(detail.data, detail):
+                items.append(signature_part)
             return items
 
         if detail.type in ("reasoning.text", "reasoning.summary"):
@@ -77,42 +77,40 @@ class ReasoningStreamHandler(ReasoningHandlerABC):
         # Flush on signature (encrypted content)
         if detail.signature:
             items.extend(self._flush_text())
-            if encrypted_item := self._build_encrypted_item(detail.signature, detail):
-                items.append(encrypted_item)
+            if signature_part := self._build_signature_part(detail.signature, detail):
+                items.append(signature_part)
 
         return items
 
-    def flush(self) -> list[model.ConversationItem]:
+    def flush(self) -> list[message.Part]:
         """Flush buffered reasoning text on finalize."""
         return self._flush_text()
 
-    def _flush_text(self) -> list[model.ConversationItem]:
-        """Flush accumulated reasoning text as a single item."""
+    def _flush_text(self) -> list[message.Part]:
+        """Flush accumulated reasoning text as a single part."""
         if not self._accumulated_reasoning:
             return []
-        item = self._build_text_item("".join(self._accumulated_reasoning))
+        item = self._build_text_part("".join(self._accumulated_reasoning))
         self._accumulated_reasoning = []
         return [item]
 
-    def _build_text_item(self, content: str) -> model.ReasoningTextItem:
-        return model.ReasoningTextItem(
+    def _build_text_part(self, content: str) -> message.ThinkingTextPart:
+        return message.ThinkingTextPart(
             id=self._reasoning_id,
-            content=content,
-            response_id=self._response_id,
-            model=self._param_model,
+            text=content,
+            model_id=self._param_model,
         )
 
-    def _build_encrypted_item(
+    def _build_signature_part(
         self,
         content: str | None,
         detail: ReasoningDetail,
-    ) -> model.ReasoningEncryptedItem | None:
+    ) -> message.ThinkingSignaturePart | None:
        if not content:
            return None
-        return model.ReasoningEncryptedItem(
+        return message.ThinkingSignaturePart(
            id=detail.id,
-            encrypted_content=content,
+            signature=content,
            format=detail.format,
-            response_id=self._response_id,
-            model=self._param_model,
+            model_id=self._param_model,
        )
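The handler now emits message.Part objects (ThinkingTextPart, ThinkingSignaturePart) in place of model.ReasoningTextItem / model.ReasoningEncryptedItem. Their definitions live in the new klaude_code/protocol/message.py, which this diff does not include; the minimal sketch below is reconstructed from the constructor calls above, so field names, types, and optionality are inferred rather than confirmed.

# Illustrative approximation only; the real classes are defined in
# klaude_code/protocol/message.py and may differ. Fields mirror the call sites above.
from pydantic import BaseModel


class ThinkingTextPart(BaseModel):
    """A chunk of model reasoning text."""

    id: str | None = None
    text: str
    model_id: str | None = None


class ThinkingSignaturePart(BaseModel):
    """An opaque signature / encrypted reasoning blob to be replayed verbatim."""

    id: str | None = None
    signature: str
    format: str | None = None
    model_id: str | None = None

Note that response_id no longer travels on the individual parts; in the new protocol it is carried by the enclosing AssistantMessage (see the responses client changes below).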
klaude_code/llm/registry.py +20 -15

@@ -12,29 +12,34 @@ _T = TypeVar("_T", bound=type["LLMClientABC"])
 # Track which protocols have been loaded
 _loaded_protocols: set[llm_param.LLMClientProtocol] = set()
 _REGISTRY: dict[llm_param.LLMClientProtocol, type["LLMClientABC"]] = {}
+_PROTOCOL_MODULES: dict[llm_param.LLMClientProtocol, str] = {
+    llm_param.LLMClientProtocol.ANTHROPIC: "klaude_code.llm.anthropic",
+    llm_param.LLMClientProtocol.CLAUDE_OAUTH: "klaude_code.llm.claude",
+    llm_param.LLMClientProtocol.BEDROCK: "klaude_code.llm.bedrock",
+    llm_param.LLMClientProtocol.CODEX_OAUTH: "klaude_code.llm.codex",
+    llm_param.LLMClientProtocol.OPENAI: "klaude_code.llm.openai_compatible",
+    llm_param.LLMClientProtocol.OPENROUTER: "klaude_code.llm.openrouter",
+    llm_param.LLMClientProtocol.RESPONSES: "klaude_code.llm.responses",
+    llm_param.LLMClientProtocol.GOOGLE: "klaude_code.llm.google",
+}
 
 
 def _load_protocol(protocol: llm_param.LLMClientProtocol) -> None:
     """Load the module for a specific protocol on demand."""
     if protocol in _loaded_protocols:
         return
-    _loaded_protocols.add(protocol)
+    module_path = _PROTOCOL_MODULES.get(protocol)
+    if module_path is None:
+        raise ValueError(f"Unknown LLMClient protocol: {protocol}")
 
     # Import only the needed module to trigger @register decorator
-    if protocol == llm_param.LLMClientProtocol.ANTHROPIC:
-        importlib.import_module("klaude_code.llm.anthropic")
-    elif protocol == llm_param.LLMClientProtocol.BEDROCK:
-        importlib.import_module("klaude_code.llm.bedrock")
-    elif protocol == llm_param.LLMClientProtocol.CODEX:
-        importlib.import_module("klaude_code.llm.codex")
-    elif protocol == llm_param.LLMClientProtocol.OPENAI:
-        importlib.import_module("klaude_code.llm.openai_compatible")
-    elif protocol == llm_param.LLMClientProtocol.OPENROUTER:
-        importlib.import_module("klaude_code.llm.openrouter")
-    elif protocol == llm_param.LLMClientProtocol.RESPONSES:
-        importlib.import_module("klaude_code.llm.responses")
-    elif protocol == llm_param.LLMClientProtocol.GOOGLE:
-        importlib.import_module("klaude_code.llm.google")
+    importlib.import_module(module_path)
+    _loaded_protocols.add(protocol)
+
+
+def load_protocol(protocol: llm_param.LLMClientProtocol) -> None:
+    """Load the module for a specific protocol on demand."""
+    _load_protocol(protocol)
 
 
 def register(name: llm_param.LLMClientProtocol) -> Callable[[_T], _T]:
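The per-protocol if/elif chain is replaced by a lookup table consumed by importlib.import_module, and a protocol is only marked as loaded after its module imports successfully, so a failed import can be retried. The same pattern in isolation, with hypothetical names rather than klaude_code's, looks like this:

# Table-driven lazy loading: importing a backend module triggers its @register
# decorator as a side effect. All names below are hypothetical.
import importlib
from enum import Enum


class Backend(str, Enum):
    FOO = "foo"
    BAR = "bar"


_MODULES: dict[Backend, str] = {
    Backend.FOO: "mypkg.backends.foo",
    Backend.BAR: "mypkg.backends.bar",
}
_loaded: set[Backend] = set()


def load_backend(backend: Backend) -> None:
    """Import the backend's module once so its registration side effects run."""
    if backend in _loaded:
        return
    module_path = _MODULES.get(backend)
    if module_path is None:
        raise ValueError(f"Unknown backend: {backend}")
    importlib.import_module(module_path)
    _loaded.add(backend)  # only mark loaded once the import has succeeded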
klaude_code/llm/responses/client.py +107 -45

@@ -1,6 +1,6 @@
 import json
 from collections.abc import AsyncGenerator
-from typing import TYPE_CHECKING, override
+from typing import TYPE_CHECKING, Literal, override
 
 import httpx
 import openai
@@ -8,12 +8,13 @@ from openai import AsyncAzureOpenAI, AsyncOpenAI
 from openai.types import responses
 from openai.types.responses.response_create_params import ResponseCreateParamsStreaming
 
+from klaude_code.const import LLM_HTTP_TIMEOUT_CONNECT, LLM_HTTP_TIMEOUT_READ, LLM_HTTP_TIMEOUT_TOTAL
 from klaude_code.llm.client import LLMClientABC
 from klaude_code.llm.input_common import apply_config_defaults
 from klaude_code.llm.registry import register
 from klaude_code.llm.responses.input import convert_history_to_input, convert_tool_schema
-from klaude_code.llm.usage import MetadataTracker
-from klaude_code.protocol import llm_param, model
+from klaude_code.llm.usage import MetadataTracker, error_stream_items
+from klaude_code.protocol import llm_param, message, model
 from klaude_code.trace import DebugType, log_debug
 
 if TYPE_CHECKING:
@@ -59,9 +60,57 @@ async def parse_responses_stream(
     stream: "AsyncStream[ResponseStreamEvent]",
     param: llm_param.LLMCallParameter,
     metadata_tracker: MetadataTracker,
-) -> AsyncGenerator[model.ConversationItem]:
-    """Parse OpenAI Responses API stream events into ConversationItems."""
+) -> AsyncGenerator[message.LLMStreamItem]:
+    """Parse OpenAI Responses API stream events into stream items."""
     response_id: str | None = None
+    stage: Literal["waiting", "thinking", "assistant", "tool"] = "waiting"
+
+    accumulated_thinking: list[str] = []
+    accumulated_text: list[str] = []
+    pending_signature: str | None = None
+    assistant_parts: list[message.Part] = []
+    stop_reason: model.StopReason | None = None
+
+    def flush_thinking() -> None:
+        nonlocal pending_signature
+        if accumulated_thinking:
+            assistant_parts.append(
+                message.ThinkingTextPart(
+                    text="".join(accumulated_thinking),
+                    model_id=str(param.model),
+                )
+            )
+            accumulated_thinking.clear()
+        if pending_signature:
+            assistant_parts.append(
+                message.ThinkingSignaturePart(
+                    signature=pending_signature,
+                    model_id=str(param.model),
+                    format="openai_reasoning",
+                )
+            )
+            pending_signature = None
+
+    def flush_text() -> None:
+        if not accumulated_text:
+            return
+        assistant_parts.append(message.TextPart(text="".join(accumulated_text)))
+        accumulated_text.clear()
+
+    def map_stop_reason(status: str | None, reason: str | None) -> model.StopReason | None:
+        if reason:
+            normalized = reason.strip().lower()
+            if normalized in {"max_output_tokens", "length", "max_tokens"}:
+                return "length"
+            if normalized in {"content_filter", "safety"}:
+                return "error"
+            if normalized in {"cancelled", "canceled", "aborted"}:
+                return "aborted"
+        if status == "completed":
+            return "stop"
+        if status in {"failed", "error"}:
+            return "error"
+        return None
 
     try:
         async for event in stream:
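The hunk above also introduces map_stop_reason, which folds the Responses API status and error/incomplete reason into the protocol's stop reasons. A standalone copy of that mapping, exercised on a few sample inputs (plain strings stand in for model.StopReason literals):

# Standalone copy of the mapping added above, for quick behavioural checks.
def map_stop_reason(status: str | None, reason: str | None) -> str | None:
    if reason:
        normalized = reason.strip().lower()
        if normalized in {"max_output_tokens", "length", "max_tokens"}:
            return "length"
        if normalized in {"content_filter", "safety"}:
            return "error"
        if normalized in {"cancelled", "canceled", "aborted"}:
            return "aborted"
    if status == "completed":
        return "stop"
    if status in {"failed", "error"}:
        return "error"
    return None


assert map_stop_reason("completed", None) == "stop"
assert map_stop_reason("incomplete", "max_output_tokens") == "length"
assert map_stop_reason("failed", "content_filter") == "error"
assert map_stop_reason("in_progress", None) is None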
@@ -74,29 +123,29 @@ async def parse_responses_stream(
             match event:
                 case responses.ResponseCreatedEvent() as event:
                     response_id = event.response.id
-                    yield model.StartItem(response_id=response_id)
                 case responses.ResponseReasoningSummaryTextDeltaEvent() as event:
                     if event.delta:
                         metadata_tracker.record_token()
-                        yield model.ReasoningTextDelta(
-                            content=event.delta,
-                            response_id=response_id,
-                        )
+                        if stage == "assistant":
+                            flush_text()
+                        stage = "thinking"
+                        accumulated_thinking.append(event.delta)
+                        yield message.ThinkingTextDelta(content=event.delta, response_id=response_id)
                 case responses.ResponseReasoningSummaryTextDoneEvent() as event:
-                    if event.text:
-                        yield model.ReasoningTextItem(
-                            content=event.text,
-                            response_id=response_id,
-                            model=str(param.model),
-                        )
+                    if event.text and not accumulated_thinking:
+                        accumulated_thinking.append(event.text)
                 case responses.ResponseTextDeltaEvent() as event:
                     if event.delta:
                         metadata_tracker.record_token()
-                        yield model.AssistantMessageDelta(content=event.delta, response_id=response_id)
+                        if stage == "thinking":
+                            flush_thinking()
+                        stage = "assistant"
+                        accumulated_text.append(event.delta)
+                        yield message.AssistantTextDelta(content=event.delta, response_id=response_id)
                 case responses.ResponseOutputItemAddedEvent() as event:
                     if isinstance(event.item, responses.ResponseFunctionToolCall):
                         metadata_tracker.record_token()
-                        yield model.ToolCallStartItem(
+                        yield message.ToolCallStartItem(
                             response_id=response_id,
                             call_id=event.item.call_id,
                             name=event.item.name,
@@ -105,34 +154,30 @@ async def parse_responses_stream(
                     match event.item:
                         case responses.ResponseReasoningItem() as item:
                             if item.encrypted_content:
-                                metadata_tracker.record_token()
-                                yield model.ReasoningEncryptedItem(
-                                    id=item.id,
-                                    encrypted_content=item.encrypted_content,
-                                    response_id=response_id,
-                                    model=str(param.model),
-                                )
+                                pending_signature = item.encrypted_content
                         case responses.ResponseOutputMessage() as item:
-                            metadata_tracker.record_token()
-                            yield model.AssistantMessageItem(
-                                content="\n".join(
+                            if not accumulated_text:
+                                text_content = "\n".join(
                                     [
                                         part.text
                                         for part in item.content
                                         if isinstance(part, responses.ResponseOutputText)
                                     ]
-                                ),
-                                id=item.id,
-                                response_id=response_id,
-                            )
+                                )
+                                if text_content:
+                                    accumulated_text.append(text_content)
                         case responses.ResponseFunctionToolCall() as item:
                             metadata_tracker.record_token()
-                            yield model.ToolCallItem(
-                                name=item.name,
-                                arguments=item.arguments.strip(),
-                                call_id=item.call_id,
-                                id=item.id,
-                                response_id=response_id,
+                            flush_thinking()
+                            flush_text()
+                            stage = "tool"
+                            assistant_parts.append(
+                                message.ToolCallPart(
+                                    call_id=item.call_id,
+                                    id=item.id,
+                                    tool_name=item.name,
+                                    arguments_json=item.arguments.strip(),
+                                )
                             )
                         case _:
                             pass
@@ -154,7 +199,7 @@ async def parse_responses_stream(
                     )
                     metadata_tracker.set_model_name(str(param.model))
                    metadata_tracker.set_response_id(response_id)
-                    yield metadata_tracker.finalize()
+                    stop_reason = map_stop_reason(event.response.status, error_reason)
                    if event.response.status != "completed":
                        error_message = f"LLM response finished with status '{event.response.status}'"
                        if error_reason:
@@ -165,7 +210,7 @@ async def parse_responses_stream(
                             style="red",
                             debug_type=DebugType.LLM_STREAM,
                         )
-                        yield model.StreamErrorItem(error=error_message)
+                        yield message.StreamErrorItem(error=error_message)
                 case _:
                     log_debug(
                         "[Unhandled stream event]",
@@ -174,7 +219,18 @@ async def parse_responses_stream(
                         debug_type=DebugType.LLM_STREAM,
                     )
     except (openai.OpenAIError, httpx.HTTPError) as e:
-        yield model.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
+        yield message.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
+
+    flush_thinking()
+    flush_text()
+    metadata_tracker.set_response_id(response_id)
+    metadata = metadata_tracker.finalize()
+    yield message.AssistantMessage(
+        parts=assistant_parts,
+        response_id=response_id,
+        usage=metadata,
+        stop_reason=stop_reason,
+    )
 
 
 @register(llm_param.LLMClientProtocol.RESPONSES)
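With this change the parser still yields deltas for live rendering, but complete content is accumulated into parts and emitted once, as a single AssistantMessage carrying usage and stop_reason, when the stream ends. A hypothetical consumer sketch (the print calls and history list are illustrative, not klaude_code APIs):

# Hypothetical consumer of parse_responses_stream; the isinstance checks reflect
# the item types yielded above.
async def consume(stream, param, metadata_tracker, history: list) -> None:
    async for item in parse_responses_stream(stream, param, metadata_tracker):
        if isinstance(item, message.ThinkingTextDelta):
            print(item.content, end="")           # live reasoning text
        elif isinstance(item, message.AssistantTextDelta):
            print(item.content, end="")           # live assistant text
        elif isinstance(item, message.ToolCallStartItem):
            print(f"\n[tool call: {item.name}]")  # tool call surfaces early
        elif isinstance(item, message.StreamErrorItem):
            print(f"\n[error: {item.error}]")
        elif isinstance(item, message.AssistantMessage):
            history.append(item)                  # final message: parts, usage, stop_reason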
@@ -188,13 +244,17 @@ class ResponsesClient(LLMClientABC):
                 api_key=config.api_key,
                 azure_endpoint=str(config.base_url),
                 api_version=config.azure_api_version,
-                timeout=httpx.Timeout(300.0, connect=15.0, read=285.0),
+                timeout=httpx.Timeout(
+                    LLM_HTTP_TIMEOUT_TOTAL, connect=LLM_HTTP_TIMEOUT_CONNECT, read=LLM_HTTP_TIMEOUT_READ
+                ),
             )
         else:
             client = AsyncOpenAI(
                 api_key=config.api_key,
                 base_url=config.base_url,
-                timeout=httpx.Timeout(300.0, connect=15.0, read=285.0),
+                timeout=httpx.Timeout(
+                    LLM_HTTP_TIMEOUT_TOTAL, connect=LLM_HTTP_TIMEOUT_CONNECT, read=LLM_HTTP_TIMEOUT_READ
+                ),
             )
         self.client: AsyncAzureOpenAI | AsyncOpenAI = client
 
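The hard-coded httpx timeouts are replaced by named constants imported from klaude_code.const. That file's diff is not reproduced here; the sketch below simply restates the previously hard-coded values (300 s total, 15 s connect, 285 s read) under the new names, so the actual constants may differ:

# Sketch only: the actual values live in klaude_code/const.py (changed in this
# release but not shown above). These mirror the old inline numbers.
import httpx

LLM_HTTP_TIMEOUT_TOTAL = 300.0    # overall per-request budget, seconds
LLM_HTTP_TIMEOUT_CONNECT = 15.0   # TCP/TLS connect
LLM_HTTP_TIMEOUT_READ = 285.0     # per-read while streaming

timeout = httpx.Timeout(
    LLM_HTTP_TIMEOUT_TOTAL,
    connect=LLM_HTTP_TIMEOUT_CONNECT,
    read=LLM_HTTP_TIMEOUT_READ,
)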
@@ -204,7 +264,7 @@ class ResponsesClient(LLMClientABC):
         return cls(config)
 
     @override
-    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[model.ConversationItem]:
+    async def call(self, param: llm_param.LLMCallParameter) -> AsyncGenerator[message.LLMStreamItem]:
         param = apply_config_defaults(param, self.get_llm_config())
 
         metadata_tracker = MetadataTracker(cost_config=self.get_llm_config().cost)
@@ -222,7 +282,9 @@ class ResponsesClient(LLMClientABC):
                 extra_headers={"extra": json.dumps({"session_id": param.session_id}, sort_keys=True)},
             )
         except (openai.OpenAIError, httpx.HTTPError) as e:
-            yield model.StreamErrorItem(error=f"{e.__class__.__name__} {e!s}")
+            error_message = f"{e.__class__.__name__} {e!s}"
+            for item in error_stream_items(metadata_tracker, error=error_message):
+                yield item
             return
 
         async for item in parse_responses_stream(stream, param, metadata_tracker):
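error_stream_items is imported from klaude_code.llm.usage, whose implementation is not shown in this diff. One plausible shape, purely a guess from the call site above, is a small generator that pairs the error with a terminal AssistantMessage so the caller still receives whatever usage the tracker accumulated:

# Hypothetical sketch of error_stream_items; the real implementation is in
# klaude_code/llm/usage.py and may behave differently.
def error_stream_items(metadata_tracker, error: str):
    yield message.StreamErrorItem(error=error)
    yield message.AssistantMessage(
        parts=[],
        response_id=None,
        usage=metadata_tracker.finalize(),
        stop_reason="error",
    )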