PyPI - illusion-code - Versions diffs - 0.1.0__py3-none-any.whl - Mend

illusion-code 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (214) hide show

illusion/__init__.py +24 -0
illusion/__main__.py +15 -0
illusion/_frontend/dist/index.mjs +39208 -0
illusion/_frontend/package.json +27 -0
illusion/_frontend/src/App.tsx +624 -0
illusion/_frontend/src/components/CommandPicker.tsx +98 -0
illusion/_frontend/src/components/Composer.tsx +55 -0
illusion/_frontend/src/components/ComposerController.tsx +128 -0
illusion/_frontend/src/components/ConversationView.tsx +750 -0
illusion/_frontend/src/components/Footer.tsx +25 -0
illusion/_frontend/src/components/MarkdownContent.tsx +537 -0
illusion/_frontend/src/components/MarkdownTable.tsx +245 -0
illusion/_frontend/src/components/ModalHost.tsx +425 -0
illusion/_frontend/src/components/MultilineTextInput.tsx +250 -0
illusion/_frontend/src/components/PromptInput.tsx +64 -0
illusion/_frontend/src/components/SelectModal.tsx +78 -0
illusion/_frontend/src/components/SidePanel.tsx +175 -0
illusion/_frontend/src/components/Spinner.tsx +77 -0
illusion/_frontend/src/components/StatusBar.tsx +142 -0
illusion/_frontend/src/components/SwarmPanel.tsx +141 -0
illusion/_frontend/src/components/TodoPanel.tsx +126 -0
illusion/_frontend/src/components/ToolCallDisplay.tsx +202 -0
illusion/_frontend/src/components/TranscriptPane.tsx +79 -0
illusion/_frontend/src/components/WelcomeBanner.tsx +37 -0
illusion/_frontend/src/hooks/useBackendSession.ts +468 -0
illusion/_frontend/src/hooks/useTerminalSize.ts +9 -0
illusion/_frontend/src/i18n.ts +78 -0
illusion/_frontend/src/index.tsx +42 -0
illusion/_frontend/src/theme/ThemeContext.tsx +19 -0
illusion/_frontend/src/theme/builtinThemes.ts +89 -0
illusion/_frontend/src/types.ts +110 -0
illusion/_frontend/src/utils/markdown.ts +33 -0
illusion/_frontend/src/utils/thinking.ts +191 -0
illusion/_frontend/tsconfig.json +13 -0
illusion/_web_dist/assets/index-BseIw-ik.css +10 -0
illusion/_web_dist/assets/index-C_0ZWMuW.js +82 -0
illusion/_web_dist/index.html +16 -0
illusion/api/__init__.py +36 -0
illusion/api/client.py +568 -0
illusion/api/codex_client.py +563 -0
illusion/api/compat.py +138 -0
illusion/api/effort.py +128 -0
illusion/api/errors.py +57 -0
illusion/api/openai_client.py +819 -0
illusion/api/provider.py +148 -0
illusion/api/registry.py +479 -0
illusion/api/usage.py +45 -0
illusion/auth/__init__.py +50 -0
illusion/auth/copilot.py +419 -0
illusion/auth/external.py +612 -0
illusion/auth/flows.py +58 -0
illusion/auth/manager.py +214 -0
illusion/auth/storage.py +372 -0
illusion/bridge/__init__.py +38 -0
illusion/bridge/manager.py +190 -0
illusion/bridge/session_runner.py +84 -0
illusion/bridge/types.py +113 -0
illusion/bridge/work_secret.py +131 -0
illusion/cli.py +1228 -0
illusion/commands/__init__.py +32 -0
illusion/commands/registry.py +1934 -0
illusion/config/__init__.py +39 -0
illusion/config/i18n.py +522 -0
illusion/config/paths.py +259 -0
illusion/config/settings.py +564 -0
illusion/coordinator/__init__.py +41 -0
illusion/coordinator/agent_definitions.py +1093 -0
illusion/coordinator/coordinator_mode.py +127 -0
illusion/engine/__init__.py +95 -0
illusion/engine/cost_tracker.py +55 -0
illusion/engine/messages.py +369 -0
illusion/engine/query.py +632 -0
illusion/engine/query_engine.py +343 -0
illusion/engine/stream_events.py +169 -0
illusion/hooks/__init__.py +67 -0
illusion/hooks/events.py +43 -0
illusion/hooks/executor.py +397 -0
illusion/hooks/hot_reload.py +74 -0
illusion/hooks/loader.py +133 -0
illusion/hooks/schemas.py +121 -0
illusion/hooks/types.py +86 -0
illusion/mcp/__init__.py +104 -0
illusion/mcp/client.py +377 -0
illusion/mcp/config.py +140 -0
illusion/mcp/types.py +175 -0
illusion/memory/__init__.py +36 -0
illusion/memory/manager.py +94 -0
illusion/memory/memdir.py +58 -0
illusion/memory/paths.py +57 -0
illusion/memory/scan.py +120 -0
illusion/memory/search.py +83 -0
illusion/memory/types.py +43 -0
illusion/output_styles/__init__.py +15 -0
illusion/output_styles/loader.py +64 -0
illusion/permissions/__init__.py +39 -0
illusion/permissions/checker.py +174 -0
illusion/permissions/modes.py +38 -0
illusion/platforms.py +148 -0
illusion/plugins/__init__.py +71 -0
illusion/plugins/bundled/__init__.py +0 -0
illusion/plugins/installer.py +59 -0
illusion/plugins/loader.py +301 -0
illusion/plugins/schemas.py +51 -0
illusion/plugins/types.py +56 -0
illusion/prompts/__init__.py +29 -0
illusion/prompts/claudemd.py +74 -0
illusion/prompts/context.py +187 -0
illusion/prompts/environment.py +189 -0
illusion/prompts/system_prompt.py +155 -0
illusion/py.typed +0 -0
illusion/sandbox/__init__.py +29 -0
illusion/sandbox/adapter.py +174 -0
illusion/services/__init__.py +59 -0
illusion/services/compact/__init__.py +1015 -0
illusion/services/cron.py +338 -0
illusion/services/cron_scheduler.py +715 -0
illusion/services/file_history.py +258 -0
illusion/services/lsp/__init__.py +455 -0
illusion/services/session_storage.py +237 -0
illusion/services/token_estimation.py +72 -0
illusion/skills/__init__.py +60 -0
illusion/skills/bundled/__init__.py +110 -0
illusion/skills/bundled/content/batch.md +86 -0
illusion/skills/bundled/content/coding-guidelines.md +70 -0
illusion/skills/bundled/content/debug.md +38 -0
illusion/skills/bundled/content/loop.md +82 -0
illusion/skills/bundled/content/remember.md +105 -0
illusion/skills/bundled/content/simplify.md +53 -0
illusion/skills/bundled/content/skillify.md +113 -0
illusion/skills/bundled/content/stuck.md +54 -0
illusion/skills/bundled/content/update-config.md +329 -0
illusion/skills/bundled/content/verify.md +74 -0
illusion/skills/loader.py +219 -0
illusion/skills/registry.py +40 -0
illusion/skills/types.py +24 -0
illusion/state/__init__.py +18 -0
illusion/state/app_state.py +67 -0
illusion/state/store.py +93 -0
illusion/swarm/__init__.py +71 -0
illusion/swarm/agent_executor.py +857 -0
illusion/swarm/in_process.py +259 -0
illusion/swarm/subprocess_backend.py +136 -0
illusion/swarm/team_helpers.py +123 -0
illusion/swarm/types.py +159 -0
illusion/swarm/worktree.py +347 -0
illusion/tasks/__init__.py +33 -0
illusion/tasks/local_agent_task.py +42 -0
illusion/tasks/local_shell_task.py +27 -0
illusion/tasks/manager.py +377 -0
illusion/tasks/stop_task.py +21 -0
illusion/tasks/types.py +88 -0
illusion/tools/__init__.py +126 -0
illusion/tools/agent_tool.py +388 -0
illusion/tools/ask_user_question_tool.py +186 -0
illusion/tools/base.py +149 -0
illusion/tools/bash_tool.py +413 -0
illusion/tools/config_tool.py +90 -0
illusion/tools/cron_tool.py +473 -0
illusion/tools/enter_plan_mode_tool.py +147 -0
illusion/tools/enter_worktree_tool.py +188 -0
illusion/tools/exit_plan_mode_tool.py +69 -0
illusion/tools/exit_worktree_tool.py +225 -0
illusion/tools/file_edit_tool.py +283 -0
illusion/tools/file_read_tool.py +294 -0
illusion/tools/file_write_tool.py +184 -0
illusion/tools/glob_tool.py +165 -0
illusion/tools/grep_tool.py +190 -0
illusion/tools/list_mcp_resources_tool.py +80 -0
illusion/tools/lsp_tool.py +333 -0
illusion/tools/mcp_auth_tool.py +100 -0
illusion/tools/mcp_tool.py +75 -0
illusion/tools/notebook_edit_tool.py +242 -0
illusion/tools/powershell_tool.py +334 -0
illusion/tools/read_mcp_resource_tool.py +63 -0
illusion/tools/repl_tool.py +100 -0
illusion/tools/send_message_tool.py +112 -0
illusion/tools/shell_common.py +187 -0
illusion/tools/skill_tool.py +86 -0
illusion/tools/sleep_tool.py +62 -0
illusion/tools/structured_output_tool.py +58 -0
illusion/tools/task_create_tool.py +98 -0
illusion/tools/task_get_tool.py +94 -0
illusion/tools/task_list_tool.py +94 -0
illusion/tools/task_output_tool.py +55 -0
illusion/tools/task_stop_tool.py +52 -0
illusion/tools/task_update_tool.py +224 -0
illusion/tools/team_create_tool.py +236 -0
illusion/tools/team_delete_tool.py +104 -0
illusion/tools/todo_write_tool.py +198 -0
illusion/tools/tool_search_tool.py +156 -0
illusion/tools/web_fetch_tool.py +264 -0
illusion/tools/web_search_tool.py +186 -0
illusion/ui/__init__.py +23 -0
illusion/ui/app.py +258 -0
illusion/ui/backend_host.py +1180 -0
illusion/ui/input.py +86 -0
illusion/ui/output.py +363 -0
illusion/ui/permission_dialog.py +47 -0
illusion/ui/permission_store.py +99 -0
illusion/ui/protocol.py +384 -0
illusion/ui/react_launcher.py +280 -0
illusion/ui/runtime.py +787 -0
illusion/ui/textual_app.py +603 -0
illusion/ui/web/__init__.py +10 -0
illusion/ui/web/server.py +87 -0
illusion/ui/web/ws_host.py +1197 -0
illusion/utils/__init__.py +0 -0
illusion/utils/ripgrep.py +299 -0
illusion/utils/shell.py +248 -0
illusion_code-0.1.0.dist-info/METADATA +1159 -0
illusion_code-0.1.0.dist-info/RECORD +214 -0
illusion_code-0.1.0.dist-info/WHEEL +4 -0
illusion_code-0.1.0.dist-info/entry_points.txt +2 -0
illusion_code-0.1.0.dist-info/licenses/LICENSE +21 -0

illusion/api/openai_client.py ADDED Viewed

@@ -0,0 +1,819 @@
+"""
+OpenAI 兼容 API 客户端模块
+=========================
+本模块提供 OpenAI 兼容 API 客户端封装，支持阿里巴巴 DashScope、GitHub Models 等提供商。
+主要功能：
+    - 流式文本增量生成
+    - Anthropic 工具格式到 OpenAI 格式转换
+    - 自动重试 transient 错误
+    - 支持思维模型（reasoning_content）
+类说明：
+    - OpenAICompatibleClient: OpenAI 兼容客户端类
+使用示例：
+    >>> from illusion.api.openai_client import OpenAICompatibleClient
+    >>> client = OpenAICompatibleClient(api_key="sk-...")
+    >>> request = ApiMessageRequest(model="qwen-plus", messages=[])
+    >>> async for event in client.stream_message(request):
+    >>>     print(event)
+"""
+from __future__ import annotations
+import asyncio
+import json
+import logging
+from typing import Any, AsyncIterator
+from openai import AsyncOpenAI
+from illusion.api.client import (
+    ApiMessageCompleteEvent,
+    ApiMessageRequest,
+    ApiStreamEvent,
+    ApiTextDeltaEvent,
+    ApiToolCallStartedEvent,
+)
+from illusion.api.compat import (
+    merge_reasoning_text,
+    parse_tool_arguments,
+    split_thinking_from_text,
+)
+from illusion.api.errors import (
+    AuthenticationFailure,
+    IllusionCodeApiError,
+    RateLimitFailure,
+    RequestFailure,
+)
+from illusion.api.usage import UsageSnapshot
+from illusion.engine.messages import (
+    ConversationMessage,
+    ContentBlock,
+    MediaBlock,
+    TextBlock,
+    ThinkingBlock,
+    ToolResultBlock,
+    ToolUseBlock,
+    _messages_have_media,
+    _strip_media_from_messages,
+)
+# Module-level logger
+log = logging.getLogger(__name__)
+# Retry configuration constants
+MAX_RETRIES = 3  # maximum number of retries
+BASE_DELAY = 1.0  # base backoff delay (seconds)
+MAX_DELAY = 30.0  # upper bound on the backoff delay (seconds)
+def _serialize_media_for_openai(block: MediaBlock) -> dict[str, Any]:
+    """Build the OpenAI ``image_url`` content part for an image MediaBlock.
+    The block's ``media_type`` and ``data`` are embedded in a base64 ``data:`` URL.
+    """
+    data_url = f"data:{block.media_type};base64,{block.data}"
+    return {"type": "image_url", "image_url": {"url": data_url}}
+def _convert_tools_to_openai(tools: list[dict[str, Any]]) -> list[dict[str, Any]]:
+    """Translate Anthropic tool schemas into OpenAI function-calling entries.
+    Anthropic shape:
+        {"name": "...", "description": "...", "input_schema": {...}}
+    OpenAI shape:
+        {"type": "function", "function": {"name": "...", "description": "...", "parameters": {...}}}
+    Args:
+        tools: Tool definitions in Anthropic format.
+    Returns:
+        list[dict[str, Any]]: The tools in OpenAI format, in input order.
+    """
+    # "name" is mandatory; description and schema fall back to empty values.
+    return [
+        {
+            "type": "function",
+            "function": {
+                "name": spec["name"],
+                "description": spec.get("description", ""),
+                "parameters": spec.get("input_schema", {}),
+            },
+        }
+        for spec in tools
+    ]
+def _convert_messages_to_openai(
+    messages: list[ConversationMessage],
+    system_prompt: str | None,
+) -> list[dict[str, Any]]:
+    """Convert Anthropic-style messages into OpenAI chat messages.
+    Main differences handled here:
+    - Anthropic: the system prompt is a separate parameter
+    - OpenAI: the system prompt is a message with role="system"
+    - Anthropic: tool_use / tool_result are content blocks
+    - OpenAI: tool_calls live on the assistant message, tool results are separate messages
+    Messages whose role is neither "assistant" nor "user" are skipped.
+    Args:
+        messages: Anthropic-style conversation messages.
+        system_prompt: System prompt; emitted first when non-empty.
+    Returns:
+        list[dict[str, Any]]: Messages in OpenAI chat format.
+    """
+    openai_messages: list[dict[str, Any]] = []
+    # The system prompt becomes the leading system message.
+    if system_prompt:
+        openai_messages.append({"role": "system", "content": system_prompt})
+    for msg in messages:
+        if msg.role == "assistant":
+            openai_messages.append(_convert_assistant_message(msg))
+        elif msg.role == "user":
+            # A user message may carry text, tool_result and media blocks.
+            tool_results = [b for b in msg.content if isinstance(b, ToolResultBlock)]
+            text_blocks = [b for b in msg.content if isinstance(b, TextBlock)]
+            media_blocks = [b for b in msg.content if isinstance(b, MediaBlock)]
+            # Each tool result becomes its own role="tool" message. OpenAI tool
+            # messages only accept string content, so media attached to a tool
+            # result travels in an extra user message. Those user messages are
+            # held back until every tool message of this turn has been emitted:
+            # a user message placed between tool messages would separate the
+            # later tool results from the assistant message holding their tool_calls.
+            deferred_media: list[dict[str, Any]] = []
+            for tr in tool_results:
+                if isinstance(tr.content, list):
+                    openai_messages.append({
+                        "role": "tool",
+                        "tool_call_id": tr.tool_use_id,
+                        "content": tr.text_content,
+                    })
+                    tr_media = [b for b in tr.content if isinstance(b, MediaBlock)]
+                    if tr_media:
+                        deferred_media.append({
+                            "role": "user",
+                            "content": [_serialize_media_for_openai(mb) for mb in tr_media],
+                        })
+                else:
+                    openai_messages.append({
+                        "role": "tool",
+                        "tool_call_id": tr.tool_use_id,
+                        "content": tr.content,
+                    })
+            openai_messages.extend(deferred_media)
+            if text_blocks or media_blocks:
+                text = "".join(b.text for b in text_blocks)
+                if media_blocks:
+                    # Multimodal user message: optional text part followed by the images.
+                    parts: list[dict[str, Any]] = []
+                    if text.strip():
+                        parts.append({"type": "text", "text": text})
+                    parts.extend(_serialize_media_for_openai(mb) for mb in media_blocks)
+                    openai_messages.append({"role": "user", "content": parts})
+                elif text.strip():
+                    openai_messages.append({"role": "user", "content": text})
+            if not tool_results and not text_blocks and not media_blocks:
+                # Empty user message (should not happen, but handle it gracefully).
+                openai_messages.append({"role": "user", "content": ""})
+    return openai_messages
+def _convert_assistant_message(msg: ConversationMessage) -> dict[str, Any]:
+    """Convert an assistant ConversationMessage into an OpenAI assistant message.
+    Providers serving thinking models (e.g. Kimi k2.5) require every assistant
+    message that contains tool calls to carry a ``reasoning_content`` field, so
+    reasoning is replayed here from the ThinkingBlocks plus any reasoning that
+    ``split_thinking_from_text`` extracts from the text.
+    Args:
+        msg: The assistant message to convert.
+    Returns:
+        dict[str, Any]: The message in OpenAI format.
+    """
+    texts: list[str] = []
+    calls: list[Any] = []
+    thoughts: list[Any] = []
+    for block in msg.content:
+        if isinstance(block, TextBlock):
+            texts.append(block.text)
+        if isinstance(block, ToolUseBlock):
+            calls.append(block)
+        if isinstance(block, ThinkingBlock):
+            thoughts.append(block)
+    visible, tagged_reasoning = split_thinking_from_text("".join(texts))
+    # content may only be None when tool_calls are present; otherwise DeepSeek-style
+    # APIs reject the message with
+    # "Invalid assistant message: content or tool_calls must be set".
+    if visible:
+        body = visible
+    elif calls:
+        body = None
+    else:
+        body = visible or ""
+    result: dict[str, Any] = {"role": "assistant", "content": body}
+    # Replay reasoning for thinking models.
+    reasoning = merge_reasoning_text(
+        *[t.thinking for t in thoughts],
+        tagged_reasoning,
+    )
+    if reasoning or calls:
+        # With tool calls the field is sent even when the reasoning is empty.
+        result["reasoning_content"] = reasoning if reasoning else ""
+    if calls:
+        result["tool_calls"] = [
+            {
+                "id": call.id,
+                "type": "function",
+                "function": {"name": call.name, "arguments": json.dumps(call.input)},
+            }
+            for call in calls
+        ]
+    return result
+def _parse_assistant_response(response: Any) -> ConversationMessage:
+    """Parse an OpenAI ChatCompletion response into a ConversationMessage.
+    Only the first choice is read. Reasoning found in the text and in the
+    message's ``reasoning_content`` attribute is merged into one leading
+    ThinkingBlock; tool calls are appended as ToolUseBlocks.
+    Args:
+        response: The OpenAI API response object.
+    Returns:
+        ConversationMessage: The parsed assistant message.
+    """
+    message = response.choices[0].message
+    blocks: list[ContentBlock] = []
+    raw_text = message.content
+    if raw_text:
+        plain_text, tagged_reasoning = split_thinking_from_text(str(raw_text))
+        if tagged_reasoning:
+            blocks.append(ThinkingBlock(thinking=tagged_reasoning))
+        if plain_text:
+            blocks.append(TextBlock(text=plain_text))
+    extra_reasoning = getattr(message, "reasoning_content", None)
+    if isinstance(extra_reasoning, str) and extra_reasoning.strip():
+        # Fold the reasoning taken from the text together with reasoning_content,
+        # then replace any ThinkingBlock with a single merged one at the front.
+        earlier = [b.thinking for b in blocks if isinstance(b, ThinkingBlock)]
+        merged = merge_reasoning_text(*earlier, extra_reasoning)
+        blocks = [b for b in blocks if not isinstance(b, ThinkingBlock)]
+        if merged:
+            blocks.insert(0, ThinkingBlock(thinking=merged))
+    for call in message.tool_calls or ():
+        parsed_args = parse_tool_arguments(getattr(call.function, "arguments", ""))
+        blocks.append(ToolUseBlock(id=call.id, name=call.function.name, input=parsed_args))
+    return ConversationMessage(role="assistant", content=blocks)
+class OpenAICompatibleClient:
+    """OpenAI 兼容 API 客户端
+    用于 DashScope、GitHub Models 等 OpenAI 兼容 API。
+    实现与 AnthropicApiClient 相同的 SupportsStreamingMessages 协议，
+    因此可以在 agent 循环中作为直接替代品使用。
+    Attributes:
+        _client: AsyncOpenAI 客户端实例
+    """
+    def __init__(self, api_key: str, *, base_url: str | None = None, extra_headers: dict[str, str] | None = None) -> None:
+        """Create the underlying AsyncOpenAI client.
+        Args:
+            api_key: API key passed to AsyncOpenAI.
+            base_url: Optional base URL; only forwarded when truthy.
+            extra_headers: Optional headers forwarded as ``default_headers`` when truthy.
+        """
+        options: dict[str, Any] = {"api_key": api_key}
+        optional = {"base_url": base_url, "default_headers": extra_headers}
+        # Falsy values (None, "", {}) are left out so the SDK defaults apply.
+        options.update({key: value for key, value in optional.items() if value})
+        self._client = AsyncOpenAI(**options)
+    async def stream_message(self, request: ApiMessageRequest) -> AsyncIterator[ApiStreamEvent]:
+        """Stream text deltas and the final message, matching the Anthropic client interface.
+        Failures that ``self._is_retryable`` accepts are retried with exponential
+        backoff, up to MAX_RETRIES retries. When the messages contain media and a
+        failure looks media-related, the request is rebuilt once with
+        ``_strip_media_from_messages`` applied and retried immediately; that
+        fallback does not consume a retry attempt.
+        Args:
+            request: The API message request.
+        Yields:
+            ApiStreamEvent: Streaming events produced by ``_stream_once``.
+        Raises:
+            IllusionCodeApiError: Re-raised unchanged when an attempt raises it and
+                the media fallback does not apply.
+            Exception: The result of ``self._translate_error`` for any other failure
+                that is not retryable or that exhausts the retries.
+        """
+        media_stripped = False
+        attempt = 0
+        # NOTE(review): a retry restarts _stream_once, so events already yielded by
+        # a failed attempt are yielded again - confirm consumers tolerate this.
+        while True:
+            try:
+                async for event in self._stream_once(request):
+                    yield event
+                return
+            except Exception as exc:
+                if (
+                    not media_stripped
+                    and _messages_have_media(request.messages)
+                    and self._is_media_related_error(exc)
+                ):
+                    log.warning(
+                        "Request failed, possibly due to unsupported image content. "
+                        "Retrying with text descriptions instead of images.",
+                    )
+                    # Carry every request field over, including effort, which
+                    # _stream_once reads when building the API parameters.
+                    request = ApiMessageRequest(
+                        model=request.model,
+                        messages=_strip_media_from_messages(request.messages),
+                        system_prompt=request.system_prompt,
+                        tools=request.tools,
+                        max_tokens=request.max_tokens,
+                        effort=request.effort,
+                    )
+                    media_stripped = True
+                    # Not counted as an attempt: the loop can never end without
+                    # either yielding a result or raising.
+                    continue
+                if isinstance(exc, IllusionCodeApiError):
+                    # Already a domain error: never retried, never re-translated.
+                    raise
+                if attempt >= MAX_RETRIES or not self._is_retryable(exc):
+                    raise self._translate_error(exc) from exc
+                delay = min(BASE_DELAY * (2 ** attempt), MAX_DELAY)
+                log.warning(
+                    "OpenAI API request failed (attempt %d/%d), retrying in %.1fs: %s",
+                    attempt + 1, MAX_RETRIES + 1, delay, exc,
+                )
+                await asyncio.sleep(delay)
+                attempt += 1
+    async def _stream_once(self, request: ApiMessageRequest) -> AsyncIterator[ApiStreamEvent]:
+        """Run a single attempt of a streaming OpenAI chat completion.
+        Text, reasoning and tool-call deltas are forwarded as they arrive and
+        accumulated; once the stream ends, one ApiMessageCompleteEvent carries the
+        assembled message, the usage and the finish reason.
+        Args:
+            request: The API message request.
+        Yields:
+            ApiStreamEvent: ApiTextDeltaEvent / ApiToolCallStartedEvent while
+                streaming, then a final ApiMessageCompleteEvent.
+        Raises:
+            RequestFailure: When creating the stream fails with an error that looks
+                like an unsupported reasoning effort and ``request.effort`` is set.
+            Exception: Any other error from creating the stream is re-raised, except
+                the chat-endpoint error, which falls back to the Responses API.
+        """
+        openai_messages = _convert_messages_to_openai(request.messages, request.system_prompt)
+        openai_tools = _convert_tools_to_openai(request.tools) if request.tools else None
+        params: dict[str, Any] = {
+            "model": request.model,
+            "messages": openai_messages,
+            "max_tokens": request.max_tokens,
+            "stream": True,
+            "stream_options": {"include_usage": True},
+        }
+        if openai_tools:
+            params["tools"] = openai_tools
+            # Some providers (e.g. Kimi) reject an empty reasoning_content on
+            # follow-up requests after a tool call. When tools are present the
+            # whole stream_options key is dropped to avoid triggering the
+            # model-side thinking mode that requires reasoning_content on every
+            # assistant message.
+            params.pop("stream_options", None)
+        # Forward the reasoning effort when one is requested.
+        if request.effort is not None:
+            params["reasoning_effort"] = request.effort.value
+        # Accumulators for the complete response while deltas are streamed.
+        collected_content = ""
+        collected_reasoning = ""
+        collected_tool_calls: dict[int, dict[str, Any]] = {}
+        finish_reason: str | None = None
+        usage_data: dict[str, int] = {}
+        try:
+            stream = await self._client.chat.completions.create(**params)
+        except Exception as exc:
+            # Unsupported effort: report it to the user directly, without downgrading.
+            if self._is_effort_unsupported_error(exc) and request.effort is not None:
+                raise RequestFailure(
+                    f"当前模型不支持推理强度 '{request.effort.value}'，请尝试使用其他推理强度级别（如 low/medium/high）"
+                ) from exc
+            # Some models (e.g. gpt-5.2-codex) do not support /chat/completions;
+            # fall back to /responses automatically.
+            if self._is_chat_endpoint_error(exc):
+                log.info("Model %s does not support chat/completions, falling back to responses API", request.model)
+                async for event in self._stream_via_responses_api(request, openai_messages, openai_tools):
+                    yield event
+                return
+            raise
+        async for chunk in stream:
+            if not chunk.choices:
+                # Usage-only chunk (some providers send it last).
+                if chunk.usage:
+                    usage_data = {
+                        "input_tokens": chunk.usage.prompt_tokens or 0,
+                        "output_tokens": chunk.usage.completion_tokens or 0,
+                    }
+                continue
+            delta = chunk.choices[0].delta
+            chunk_finish = chunk.choices[0].finish_reason
+            if chunk_finish:
+                finish_reason = chunk_finish
+            # Accumulate reasoning_content from thinking models; it is forwarded
+            # as a reasoning delta with empty text.
+            reasoning_piece = getattr(delta, "reasoning_content", None) or ""
+            if reasoning_piece:
+                collected_reasoning += reasoning_piece
+                yield ApiTextDeltaEvent(text="", reasoning=reasoning_piece)
+            # Stream visible text content.
+            if delta.content:
+                collected_content += delta.content
+                yield ApiTextDeltaEvent(text=delta.content)
+            # Accumulate tool calls, keyed by their index within the response.
+            if delta.tool_calls:
+                for tc_delta in delta.tool_calls:
+                    idx = tc_delta.index
+                    if idx not in collected_tool_calls:
+                        collected_tool_calls[idx] = {
+                            "id": tc_delta.id or "",
+                            "name": "",
+                            "arguments": "",
+                        }
+                    entry = collected_tool_calls[idx]
+                    if tc_delta.id:
+                        entry["id"] = tc_delta.id
+                    if tc_delta.function:
+                        if tc_delta.function.name:
+                            # Announce the tool call as soon as its name is known.
+                            # The accumulated id is used so the event still carries
+                            # it when the id arrived in an earlier delta.
+                            if not entry["name"]:
+                                yield ApiToolCallStartedEvent(
+                                    tool_name=tc_delta.function.name,
+                                    tool_use_id=entry["id"],
+                                )
+                            entry["name"] = tc_delta.function.name
+                        if tc_delta.function.arguments:
+                            entry["arguments"] += tc_delta.function.arguments
+            # Usage attached to a regular chunk (if the provider sends it).
+            if chunk.usage:
+                usage_data = {
+                    "input_tokens": chunk.usage.prompt_tokens or 0,
+                    "output_tokens": chunk.usage.completion_tokens or 0,
+                }
+        # Assemble the final ConversationMessage.
+        content: list[ContentBlock] = []
+        cleaned_text, tagged_reasoning = split_thinking_from_text(collected_content)
+        if cleaned_text:
+            content.append(TextBlock(text=cleaned_text))
+        for _idx in sorted(collected_tool_calls.keys()):
+            tc = collected_tool_calls[_idx]
+            # Skip empty/phantom tool calls that some providers send.
+            if not tc["name"]:
+                continue
+            args = parse_tool_arguments(tc["arguments"])
+            content.append(ToolUseBlock(
+                id=tc["id"],
+                name=tc["name"],
+                input=args,
+            ))
+        merged_reasoning = merge_reasoning_text(collected_reasoning, tagged_reasoning)
+        if merged_reasoning:
+            # The reasoning block always comes first in the message.
+            content.insert(0, ThinkingBlock(thinking=merged_reasoning))
+        final_message = ConversationMessage(
+            role="assistant",
+            content=content,
+        )
+        yield ApiMessageCompleteEvent(
+            message=final_message,
+            usage=UsageSnapshot(
+                input_tokens=usage_data.get("input_tokens", 0),
+                output_tokens=usage_data.get("output_tokens", 0),
+            ),
+            stop_reason=finish_reason,
+        )
+    @staticmethod
+    def _is_chat_endpoint_error(exc: Exception) -> bool:
+        """Tell whether the error means chat/completions is unavailable (fall back to the Responses API)."""
+        if getattr(exc, "status_code", None) != 400:
+            return False
+        # Prefer the exception's ``message`` attribute; fall back to str(exc).
+        text = str(getattr(exc, "message", "")) or str(exc)
+        if "chat/completions" not in text:
+            return False
+        return "not accessible" in text.lower()
+    @staticmethod
+    def _is_media_related_error(exc: Exception) -> bool:
+        """Heuristically decide whether an error may be caused by image content.
+        Used to decide on graceful degradation. Matches JSON parse errors
+        ("expecting value", e.g. an empty response to an image_url) and 400/404
+        errors whose message mentions image/content related keywords.
+        The error may already have been translated into an IllusionCodeApiError,
+        in which case the ``status_code`` attribute is gone and the status is
+        recovered from the message text instead.
+        """
+        text = str(exc).lower()
+        # JSON parse error: the model returned an empty response.
+        if "expecting value" in text:
+            return True
+        status = getattr(exc, "status_code", None)
+        if status is None:
+            # Recover the status from the message of an already-translated exception.
+            status = next(
+                (code for code in (404, 400) if f"error code: {code}" in text),
+                None,
+            )
+        if status not in {400, 404}:
+            return False
+        keywords = ("image", "media", "content", "param", "unsupported")
+        return any(kw in text for kw in keywords)
+    @staticmethod
+    def _is_effort_unsupported_error(exc: Exception) -> bool:
+        """Detect errors caused by an unsupported reasoning-effort field.
+        Args:
+            exc: The exception to inspect.
+        Returns:
+            bool: True when the message mentions effort together with an
+                "unsupported"-style keyword, or reports an unknown variant naming
+                one of the effort levels.
+        """
+        text = str(exc).lower()
+        def mentions(words: tuple[str, ...]) -> bool:
+            return any(word in text for word in words)
+        # Specific pattern: unknown variant `max` / `xhigh` and so on.
+        if "unknown variant" in text and mentions(("max", "xhigh", "low", "medium", "high")):
+            return True
+        # Generic pattern: an effort keyword plus an "unsupported" keyword.
+        return mentions(("effort", "reasoning_effort", "reasoning effort")) and mentions(
+            ("not supported", "unsupported", "invalid", "unknown")
+        )
+    def _convert_messages_to_responses(
+        self,
+        messages: list[dict[str, Any]],
+        system_prompt: str | None,
+    ) -> list[dict[str, Any]]:
+        """Convert OpenAI chat-format messages into Responses API input items.
+        Conversion rules:
+        - system messages pass through as {"role": "system", "content": ...}
+        - assistant messages with tool_calls become an optional text message
+          followed by one ``function_call`` item per call
+        - tool messages become ``function_call_output`` items
+        - other messages become ``message`` items; multimodal list content is
+          mapped part by part (text -> input_text/output_text, user image_url ->
+          input_image) instead of being dumped into a single JSON string
+        Args:
+            messages: Messages in OpenAI chat format.
+            system_prompt: Not used by this method; only system messages already
+                present in ``messages`` are emitted.
+        Returns:
+            list[dict[str, Any]]: Input items for the Responses API.
+        """
+        items: list[dict[str, Any]] = []
+        for msg in messages:
+            role = msg.get("role", "user")
+            content = msg.get("content", "")
+            if role == "system":
+                items.append({"role": "system", "content": content})
+            elif role == "assistant" and msg.get("tool_calls"):
+                # Assistant message with tool_calls: split into message + function_call items.
+                text_parts = []
+                if isinstance(content, str) and content:
+                    text_parts.append({"type": "output_text", "text": content})
+                elif isinstance(content, list):
+                    for part in content:
+                        if isinstance(part, dict) and part.get("type") == "text":
+                            text_parts.append({"type": "output_text", "text": part.get("text", "")})
+                if text_parts:
+                    items.append({"type": "message", "role": "assistant", "content": text_parts})
+                for tc in msg["tool_calls"]:
+                    func = tc.get("function", {})
+                    items.append({
+                        "type": "function_call",
+                        "call_id": tc.get("id", ""),
+                        "name": func.get("name", ""),
+                        "arguments": func.get("arguments", "{}"),
+                    })
+            elif role == "tool":
+                # Tool result message -> function_call_output item.
+                if isinstance(content, list):
+                    text_parts = [
+                        p.get("text", "") for p in content
+                        if isinstance(p, dict) and p.get("type") == "text"
+                    ]
+                    output = " ".join(text_parts) if text_parts else json.dumps(content, ensure_ascii=False)
+                else:
+                    output = content if isinstance(content, str) else json.dumps(content, ensure_ascii=False)
+                items.append({
+                    "type": "function_call_output",
+                    "call_id": msg.get("tool_call_id", ""),
+                    "output": output,
+                })
+            else:
+                # Plain user / assistant message.
+                text_type = "input_text" if role == "user" else "output_text"
+                parts: list[dict[str, Any]] = []
+                if isinstance(content, list):
+                    for part in content:
+                        kind = part.get("type") if isinstance(part, dict) else None
+                        if kind == "text":
+                            parts.append({"type": text_type, "text": part.get("text", "")})
+                        elif kind == "image_url" and role == "user":
+                            # Chat format nests the URL as {"image_url": {"url": ...}};
+                            # the Responses API takes it as a plain string.
+                            image = part.get("image_url")
+                            url = image.get("url", "") if isinstance(image, dict) else image
+                            parts.append({"type": "input_image", "image_url": url})
+                        else:
+                            # Unknown part: keep its data as JSON text rather than dropping it.
+                            parts.append({"type": text_type, "text": json.dumps(part, ensure_ascii=False)})
+                elif isinstance(content, str):
+                    parts.append({"type": text_type, "text": content})
+                elif content is not None:
+                    parts.append({"type": text_type, "text": json.dumps(content, ensure_ascii=False)})
+                if not parts:
+                    # None or empty content: send an empty text part, not the literal "null"/"[]".
+                    parts.append({"type": text_type, "text": ""})
+                items.append({"type": "message", "role": role, "content": parts})
+        return items
+    @staticmethod
+    def _convert_tools_to_responses(tools: list[dict[str, Any]] | None) -> list[dict[str, Any]] | None:
+        """将 OpenAI function-calling 工具格式转换为 Responses API 格式"""
+        if not tools:
+            return None
+        result = []
+        for tool in tools:
+            func = tool.get("function", {})
+            result.append({
+                "type": "function",
+                "name": func.get("name", ""),
+                "description": func.get("description", ""),
+                "parameters": func.get("parameters", {}),
+            })
+        return result
+    async def _stream_via_responses_api(
+        self,
+        request: ApiMessageRequest,
+        openai_messages: list[dict[str, Any]],
+        openai_tools: list[dict[str, Any]] | None,
+    ) -> AsyncIterator[ApiStreamEvent]:
+        """通过 OpenAI Responses API 流式生成（chat/completions 不可用时的回退方案）"""
+        from openai.types.responses import (
+            ResponseCompletedEvent,
+            ResponseFunctionCallArgumentsDeltaEvent,
+            ResponseFunctionCallArgumentsDoneEvent,
+            ResponseOutputItemAddedEvent,
+            ResponseTextDeltaEvent,
+        )
+        input_items = self._convert_messages_to_responses(openai_messages, request.system_prompt)
+        resp_tools = self._convert_tools_to_responses(openai_tools)
+        params: dict[str, Any] = {
+            "model": request.model,
+            "input": input_items,
+        }
+        if request.system_prompt:
+            params["instructions"] = request.system_prompt
+        if request.max_tokens:
+            params["max_output_tokens"] = request.max_tokens
+        if resp_tools:
+            params["tools"] = resp_tools
+        # 添加 effort 字段
+        if request.effort is not None:
+            params["reasoning"] = {"effort": request.effort.value}
+        collected_content = ""
+        collected_reasoning = ""
+        collected_tool_calls: dict[int, dict[str, Any]] = {}
+        usage_data: dict[str, int] = {}
+        async with self._client.responses.stream(**params) as stream:
+            async for event in stream:
+                if isinstance(event, ResponseTextDeltaEvent):
+                    collected_content += event.delta
+                    yield ApiTextDeltaEvent(text=event.delta)
+                    continue
+                event_type = str(getattr(event, "type", "") or "")
+                if event_type in {
+                    "response.reasoning_summary_text.delta",
+                    "response.reasoning_text.delta",
+                    "response.output_text.reasoning.delta",
+                }:
+                    delta = getattr(event, "delta", "")
+                    if isinstance(delta, str) and delta:
+                        collected_reasoning += delta
+                        yield ApiTextDeltaEvent(text="", reasoning=delta)
+                    continue
+                if isinstance(event, ResponseOutputItemAddedEvent):
+                    item = event.item
+                    if getattr(item, "type", None) == "function_call":
+                        idx = event.output_index
+                        tool_name = getattr(item, "name", "")
+                        tool_use_id = getattr(item, "call_id", "") or getattr(item, "id", "")
+                        collected_tool_calls[idx] = {
+                            "id": tool_use_id,
+                            "name": tool_name,
+                            "arguments": "",
+                        }
+                        # 工具调用开始：模型刚开始生成工具调用时立即通知
+                        if tool_name:
+                            yield ApiToolCallStartedEvent(
+                                tool_name=tool_name,
+                                tool_use_id=tool_use_id,
+                            )
+                elif isinstance(event, ResponseFunctionCallArgumentsDeltaEvent):
+                    idx = event.output_index
+                    if idx in collected_tool_calls:
+                        collected_tool_calls[idx]["arguments"] += event.delta
+                elif isinstance(event, ResponseFunctionCallArgumentsDoneEvent):
+                    idx = event.output_index
+                    if idx in collected_tool_calls:
+                        collected_tool_calls[idx]["arguments"] = event.arguments
+                elif isinstance(event, ResponseCompletedEvent):
+                    resp = event.response
+                    if hasattr(resp, "usage") and resp.usage:
+                        usage_data = {
+                            "input_tokens": getattr(resp.usage, "input_tokens", 0) or 0,
+                            "output_tokens": getattr(resp.usage, "output_tokens", 0) or 0,
+                        }
+        # 构建最终消息
+        content: list[ContentBlock] = []
+        cleaned_text, tagged_reasoning = split_thinking_from_text(collected_content)
+        if cleaned_text:
+            content.append(TextBlock(text=cleaned_text))
+        for _idx in sorted(collected_tool_calls.keys()):
+            tc = collected_tool_calls[_idx]
+            if not tc["name"]:
+                continue
+            args = parse_tool_arguments(tc["arguments"])
+            content.append(ToolUseBlock(
+                id=tc["id"],
+                name=tc["name"],
+                input=args,
+            ))
+        merged_reasoning = merge_reasoning_text(collected_reasoning, tagged_reasoning)
+        if merged_reasoning:
+            content.insert(0, ThinkingBlock(thinking=merged_reasoning))
+        final_message = ConversationMessage(role="assistant", content=content)
+        yield ApiMessageCompleteEvent(
+            message=final_message,
+            usage=UsageSnapshot(
+                input_tokens=usage_data.get("input_tokens", 0),
+                output_tokens=usage_data.get("output_tokens", 0),
+            ),
+            stop_reason="stop",
+        )
+    @staticmethod
+    def _is_retryable(exc: Exception) -> bool:
+        """检查异常是否可重试
+        Args:
+            exc: 待检查的异常
+        Returns:
+            bool: 是否可重试
+        """
+        status = getattr(exc, "status_code", None)
+        if status and status in {429, 500, 502, 503}:
+            return True
+        if isinstance(exc, (ConnectionError, TimeoutError, OSError)):
+            return True
+        return False
+    @staticmethod
+    def _translate_error(exc: Exception) -> IllusionCodeApiError:
+        """转换错误为统一异常类型
+        Args:
+            exc: 原始异常
+        Returns:
+            IllusionCodeApiError: 统一异常类型
+        """
+        status = getattr(exc, "status_code", None)
+        msg = str(exc)
+        if status == 401 or status == 403:
+            return AuthenticationFailure(msg)
+        if status == 429:
+            return RateLimitFailure(msg)
+        return RequestFailure(msg)