npm - @zhin.js/ai - Versions diffs - 1.0.0 → 1.0.2 - Mend

@zhin.js/ai 1.0.0 → 1.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (94)

package/CHANGELOG.md +13 -0
package/README.md +131 -497
package/lib/agent.d.ts +54 -6
package/lib/agent.d.ts.map +1 -1
package/lib/agent.js +468 -116
package/lib/agent.js.map +1 -1
package/lib/compaction.d.ts +132 -0
package/lib/compaction.d.ts.map +1 -0
package/lib/compaction.js +370 -0
package/lib/compaction.js.map +1 -0
package/lib/context-manager.d.ts.map +1 -1
package/lib/context-manager.js +10 -3
package/lib/context-manager.js.map +1 -1
package/lib/conversation-memory.d.ts +192 -0
package/lib/conversation-memory.d.ts.map +1 -0
package/lib/conversation-memory.js +619 -0
package/lib/conversation-memory.js.map +1 -0
package/lib/index.d.ts +25 -163
package/lib/index.d.ts.map +1 -1
package/lib/index.js +24 -1122
package/lib/index.js.map +1 -1
package/lib/output.d.ts +93 -0
package/lib/output.d.ts.map +1 -0
package/lib/output.js +176 -0
package/lib/output.js.map +1 -0
package/lib/providers/anthropic.d.ts +7 -0
package/lib/providers/anthropic.d.ts.map +1 -1
package/lib/providers/anthropic.js +5 -0
package/lib/providers/anthropic.js.map +1 -1
package/lib/providers/ollama.d.ts +10 -0
package/lib/providers/ollama.d.ts.map +1 -1
package/lib/providers/ollama.js +19 -4
package/lib/providers/ollama.js.map +1 -1
package/lib/providers/openai.d.ts +7 -0
package/lib/providers/openai.d.ts.map +1 -1
package/lib/providers/openai.js +11 -0
package/lib/providers/openai.js.map +1 -1
package/lib/rate-limiter.d.ts +38 -0
package/lib/rate-limiter.d.ts.map +1 -0
package/lib/rate-limiter.js +86 -0
package/lib/rate-limiter.js.map +1 -0
package/lib/session.d.ts +7 -0
package/lib/session.d.ts.map +1 -1
package/lib/session.js +47 -18
package/lib/session.js.map +1 -1
package/lib/storage.d.ts +68 -0
package/lib/storage.d.ts.map +1 -0
package/lib/storage.js +105 -0
package/lib/storage.js.map +1 -0
package/lib/tone-detector.d.ts +19 -0
package/lib/tone-detector.d.ts.map +1 -0
package/lib/tone-detector.js +72 -0
package/lib/tone-detector.js.map +1 -0
package/lib/types.d.ts +84 -8
package/lib/types.d.ts.map +1 -1
package/package.json +13 -42
package/src/agent.ts +518 -135
package/src/compaction.ts +529 -0
package/src/context-manager.ts +10 -9
package/src/conversation-memory.ts +816 -0
package/src/index.ts +121 -1406
package/src/output.ts +261 -0
package/src/providers/anthropic.ts +4 -0
package/src/providers/ollama.ts +23 -4
package/src/providers/openai.ts +8 -1
package/src/rate-limiter.ts +129 -0
package/src/session.ts +47 -18
package/src/storage.ts +135 -0
package/src/tone-detector.ts +89 -0
package/src/types.ts +95 -6
package/tests/agent.test.ts +123 -70
package/tests/compaction.test.ts +310 -0
package/tests/context-manager.test.ts +73 -47
package/tests/conversation-memory.test.ts +128 -0
package/tests/output.test.ts +128 -0
package/tests/providers.test.ts +574 -0
package/tests/rate-limiter.test.ts +108 -0
package/tests/session.test.ts +139 -48
package/tests/setup.ts +82 -240
package/tests/storage.test.ts +224 -0
package/tests/tone-detector.test.ts +80 -0
package/tsconfig.json +4 -5
package/vitest.setup.ts +1 -0
package/TOOLS.md +0 -294
package/lib/tools.d.ts +0 -45
package/lib/tools.d.ts.map +0 -1
package/lib/tools.js +0 -194
package/lib/tools.js.map +0 -1
package/src/tools.ts +0 -205
package/tests/ai-trigger.test.ts +0 -369
package/tests/integration.test.ts +0 -596
package/tests/providers.integration.test.ts +0 -227
package/tests/tool.test.ts +0 -800
package/tests/tools-builtin.test.ts +0 -346

package/src/agent.ts CHANGED

@@ -1,22 +1,54 @@
 /**
- * @zhin.js/ai - Agent System
+ * @zhin.js/agent - Agent System
  * AI Agent 实现，支持工具调用和多轮对话
  */
-import { Logger } from '@zhin.js/core';
+import { Logger } from '@zhin.js/logger';
 import type {
   AIProvider,
   AgentConfig,
   AgentTool,
   AgentResult,
   ChatMessage,
-  ToolDefinition,
+  ToolDefinition as ChatToolDefinition,
   ToolCall,
+  ToolFilterOptions,
   Usage,
 } from './types.js';
 const logger = new Logger(null, 'Agent');
+/** Default time limit for a single tool execution, in milliseconds. */
+const DEFAULT_TOOL_TIMEOUT = 30_000;
+/** Separator pattern for mixed Chinese/English text: one or more whitespace, punctuation, bracket or quote characters. */
+const TOKENIZE_RE = /[\s,.:;!?，。：；！？、()（）【】\[\]"'"'「」『』]+/;
+/**
+ * Split `text` on TOKENIZE_RE and keep only the pieces that are at least two characters long.
+ */
+function tokenize(text: string): string[] {
+  const kept: string[] = [];
+  for (const piece of text.split(TOKENIZE_RE)) {
+    if (piece.length >= 2) {
+      kept.push(piece);
+    }
+  }
+  return kept;
+}
+/** Argument shown in the title of well-known tools, with an optional cap on its displayed length. */
+const TOOL_TITLE_FIELDS = new Map<string, { key: string; max?: number }>([
+  ['bash', { key: 'command', max: 60 }],
+  ['read_file', { key: 'file_path' }],
+  ['write_file', { key: 'file_path' }],
+  ['edit_file', { key: 'file_path' }],
+  ['list_dir', { key: 'path' }],
+  ['web_search', { key: 'query', max: 40 }],
+  ['web_fetch', { key: 'url', max: 50 }],
+]);
+/** Render an argument value as text; objects and arrays are JSON-encoded instead of printing as "[object Object]". */
+function describeToolArg(value: unknown, max?: number): string {
+  let text: string;
+  if (typeof value === 'object' && value !== null) {
+    try {
+      text = JSON.stringify(value) ?? String(value);
+    } catch {
+      // Circular or otherwise unserialisable value: fall back to the default string form.
+      text = String(value);
+    }
+  } else {
+    text = String(value);
+  }
+  return max === undefined ? text : text.slice(0, max);
+}
+/**
+ * Build a short title for a tool invocation from its name and arguments (for logs and similar listings).
+ *
+ * Well-known tools show one specific argument (e.g. `bash` shows `command`, truncated to 60
+ * characters); any other tool shows its first argument value, truncated to 50 characters.
+ * When there are no arguments, or the chosen argument is null/undefined, the bare name is returned.
+ *
+ * @param name  tool name
+ * @param args  tool arguments, if any
+ * @returns     `name` or `name: value`
+ */
+export function formatToolTitle(name: string, args?: Record<string, any>): string {
+  if (!args || Object.keys(args).length === 0) return name;
+  const known = TOOL_TITLE_FIELDS.get(name);
+  if (known) {
+    const value = args[known.key];
+    return value != null ? `${name}: ${describeToolArg(value, known.max)}` : name;
+  }
+  const first = Object.values(args)[0];
+  return first != null ? `${name}: ${describeToolArg(first, 50)}` : name;
+}
 /**
  * Agent 执行状态
  */
@@ -121,9 +153,9 @@ export class Agent {
   }
   /**
-   * 获取工具定义
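+   * Build the tool definitions passed to the provider; the visible code rebuilds the list from the registered tools on every call (no caching is shown).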
    */
-  private getToolDefinitions(): ToolDefinition[] {
+  private getToolDefinitions(): ChatToolDefinition[] {
     return Array.from(this.tools.values()).map(tool => ({
       type: 'function',
       function: {
@@ -135,32 +167,255 @@ export class Agent {
   }
   /**
-   * 执行工具调用
+   * Build the de-duplication key for a tool call.
+   *
+   * The argument string is parsed as JSON and re-serialised with object keys sorted at every
+   * nesting level, so "" vs "{}" or a different key order still map to the same key. Nested
+   * values are kept in full: passing the sorted top-level keys to JSON.stringify as a replacer
+   * array would also filter nested objects, making calls that differ only in nested arguments
+   * look identical. If the string is not valid JSON it is used as-is.
+   *
+   * @param name  tool name
+   * @param args  raw JSON argument string (may be empty)
+   * @returns     `name::canonicalArguments`
+   */
+  private static toolCallKey(name: string, args: string): string {
+    // Rebuild the parsed value with sorted keys; the null-prototype target keeps a literal "__proto__" key as data.
+    const canonical = (value: unknown): unknown => {
+      if (Array.isArray(value)) return value.map(item => canonical(item));
+      if (value !== null && typeof value === 'object') {
+        const source = value as Record<string, unknown>;
+        const sorted: Record<string, unknown> = Object.create(null);
+        for (const key of Object.keys(source).sort()) {
+          sorted[key] = canonical(source[key]);
+        }
+        return sorted;
+      }
+      return value;
+    };
+    let normalized: string;
+    try {
+      normalized = JSON.stringify(canonical(JSON.parse(args || '{}')));
+    } catch {
+      normalized = args || '';
+    }
+    return `${name}::${normalized}`;
+  }
+  /**
+   * Parse a string as JSON without throwing.
+   *
+   * @param str  text that may or may not be JSON
+   * @returns    the parsed value, or `str` itself when parsing fails
+   */
+  private static safeParse(str: string): any {
+    let value: any = str;
+    try {
+      value = JSON.parse(str);
+    } catch {
+      // Not JSON: keep the raw string.
+    }
+    return value;
+  }
+  /**
+   * Programmatic tool pre-filter: rank tools by IDF-weighted term overlap with the user message.
+   *
+   * Score contributions (base weight × IDF of the matched term):
+   * 1. keyword contained in the message:                         1.0
+   * 2. tag (longer than one character) contained in the message: 0.5
+   * 3. tool-name token (name split on `.`, `_`, `-`):            0.3
+   * 4. description token contained in the message:               0.15
+   * 5. message token contained in the description:               0.2
+   *
+   * IDF = max(0.1, ln(N / df)), where N is the number of candidate tools and df the number of
+   * tools whose keywords, tags, name tokens or description tokens include the term. A term found
+   * in no tool's term set (possible for message tokens) uses an IDF of 1.0. All matching is
+   * case-insensitive substring matching.
+   *
+   * Tools whose `permissionLevel` exceeds `options.callerPermissionLevel` are never returned,
+   * but they still count towards N and df.
+   *
+   * @param message  raw user message
+   * @param tools    candidate tools
+   * @param options  `maxTools` (default 10), `minScore` (default 0.1), `callerPermissionLevel` (default: no limit)
+   * @returns        at most `maxTools` tools scoring at least `minScore`, highest score first
+   */
+  static filterTools(
+    message: string,
+    tools: AgentTool[],
+    options?: ToolFilterOptions,
+  ): AgentTool[] {
+    if (tools.length === 0) return [];
+    const maxTools = options?.maxTools ?? 10;
+    const minScore = options?.minScore ?? 0.1;
+    const callerPerm = options?.callerPermissionLevel ?? Infinity;
+    const N = tools.length;
+    const msgLower = message.toLowerCase();
+    const msgTokens = tokenize(msgLower);
+    // Lower-case and tokenize every tool once; the same data feeds the IDF index and the scoring pass.
+    const profiles = tools.map(tool => {
+      const descLower = tool.description.toLowerCase();
+      return {
+        tool,
+        keywords: (tool.keywords ?? []).filter(kw => kw).map(kw => kw.toLowerCase()),
+        tags: (tool.tags ?? []).filter(tag => tag && tag.length > 1).map(tag => tag.toLowerCase()),
+        nameTokens: tool.name.toLowerCase().split(/[._\-]+/).filter(nt => nt.length > 1),
+        descLower,
+        descTokens: tokenize(descLower),
+      };
+    });
+    // Document frequency: in how many tools does each distinct term occur?
+    const df = new Map<string, number>();
+    for (const p of profiles) {
+      const terms = new Set<string>([...p.keywords, ...p.tags, ...p.nameTokens, ...p.descTokens]);
+      for (const term of terms) {
+        df.set(term, (df.get(term) ?? 0) + 1);
+      }
+    }
+    const idf = (term: string): number => {
+      const docFreq = df.get(term);
+      if (!docFreq) return 1.0;
+      // Floor at 0.1 so a term shared by every tool still contributes a little.
+      return Math.max(0.1, Math.log(N / docFreq));
+    };
+    // Scoring: contributions are summed in the order keywords, tags, name tokens, description, message.
+    const scored: { tool: AgentTool; score: number }[] = [];
+    for (const p of profiles) {
+      const { tool } = p;
+      if (tool.permissionLevel != null && tool.permissionLevel > callerPerm) {
+        continue;
+      }
+      let score = 0;
+      for (const kw of p.keywords) {
+        if (msgLower.includes(kw)) score += 1.0 * idf(kw);
+      }
+      for (const tag of p.tags) {
+        if (msgLower.includes(tag)) score += 0.5 * idf(tag);
+      }
+      for (const nt of p.nameTokens) {
+        if (msgLower.includes(nt)) score += 0.3 * idf(nt);
+      }
+      // Description matching runs in both directions: description tokens found in the message...
+      for (const dw of p.descTokens) {
+        if (msgLower.includes(dw)) score += 0.15 * idf(dw);
+      }
+      // ...and message tokens found in the description.
+      for (const mw of msgTokens) {
+        if (p.descLower.includes(mw)) score += 0.2 * idf(mw);
+      }
+      if (score >= minScore) {
+        scored.push({ tool, score });
+      }
+    }
+    scored.sort((a, b) => b.score - a.score);
+    return scored.slice(0, maxTools).map(s => s.tool);
+  }
+  /**
+   * Execute one tool call, waiting at most DEFAULT_TOOL_TIMEOUT for the tool to finish.
+   *
+   * Unknown tools, malformed argument JSON, tool errors and timeouts are reported as a JSON
+   * string containing `error` and `hint` (plus `tool` where known) instead of being thrown.
+   * An empty argument string is treated as `{}`, matching toolCallKey.
+   * The timeout only stops waiting; nothing here cancels the tool's own work.
+   *
+   * @param toolCall  the tool call to execute
+   * @returns         the tool result as a string (non-string results are JSON-encoded)
    */
   private async executeToolCall(toolCall: ToolCall): Promise<string> {
     const tool = this.tools.get(toolCall.function.name);
     if (!tool) {
-      return JSON.stringify({ error: `Unknown tool: ${toolCall.function.name}` });
+      return JSON.stringify({
+        error: `Unknown tool: ${toolCall.function.name}`,
+        hint: '该工具不存在，请尝试使用其他可用工具，或直接回答用户。',
+      });
+    }
+    let args: Record<string, unknown>;
+    try {
+      // An empty string means "no arguments"; parse it as an empty object rather than failing.
+      args = JSON.parse(toolCall.function.arguments || '{}');
+    } catch {
+      return JSON.stringify({
+        error: 'Invalid tool arguments JSON',
+        tool: toolCall.function.name,
+        hint: '请检查工具参数格式后重试。',
+      });
     }
+    logger.debug({ tool: toolCall.function.name, params: args }, 'Executing tool');
+    this.emit('tool_call', tool.name, args);
+    // Handle of the timeout timer so it can be cleared once the race settles.
+    let timer: ReturnType<typeof setTimeout> | undefined;
     try {
-      const args = JSON.parse(toolCall.function.arguments);
-      this.emit('tool_call', tool.name, args);
-      const result = await tool.execute(args);
+      // Race the tool against a timer that rejects after DEFAULT_TOOL_TIMEOUT.
+      const result = await Promise.race([
+        tool.execute(args),
+        new Promise<never>((_, reject) => {
+          timer = setTimeout(() => reject(new Error(`工具 ${tool.name} 执行超时`)), DEFAULT_TOOL_TIMEOUT);
+        }),
+      ]);
       this.emit('tool_result', tool.name, result);
       return typeof result === 'string' ? result : JSON.stringify(result);
     } catch (error) {
       const errorMsg = error instanceof Error ? error.message : String(error);
-      return JSON.stringify({ error: errorMsg });
+      logger.warn(`工具 ${toolCall.function.name} 执行失败: ${errorMsg}`);
+      logger.error({ tool: toolCall.function.name, params: args, err: error }, 'Tool execution failed');
+      // Give the model a structured error plus a recovery hint.
+      return JSON.stringify({
+        error: errorMsg,
+        tool: toolCall.function.name,
+        hint: '该工具执行失败。请尝试使用不同的参数重试，或换一个工具来完成任务。如果所有工具都无法使用，请直接用文字回答用户。',
+      });
+    } finally {
+      // Otherwise the timer stays pending for the full timeout after every call that finished early.
+      if (timer !== undefined) clearTimeout(timer);
+    }
+  }
+  /**
+   * Run a batch of tool calls concurrently, skipping calls whose key is already in `seenKeys`.
+   *
+   * Each executed call has its key added to `seenKeys` and a `{ tool, args, result }` record
+   * appended to `state.toolCalls` once it finishes. Skipped duplicates are only logged and
+   * have no entry in the returned list.
+   *
+   * @param toolCalls  tool calls to process
+   * @param seenKeys   de-duplication keys of calls executed earlier; updated in place
+   * @param state      agent state whose `toolCalls` history is appended to
+   * @returns          one entry per newly executed call, in request order; empty when every call was a duplicate
+   */
+  private async executeToolCalls(
+    toolCalls: ToolCall[],
+    seenKeys: Set<string>,
+    state: AgentState,
+  ): Promise<{ toolCall: ToolCall; result: string; args: Record<string, any> }[]> {
+    // Partition first: only calls whose key is not yet known get executed.
+    const pending: { call: ToolCall; key: string }[] = [];
+    for (const call of toolCalls) {
+      const key = Agent.toolCallKey(call.function.name, call.function.arguments);
+      if (!seenKeys.has(key)) {
+        pending.push({ call, key });
+        continue;
+      }
+      logger.debug(`跳过重复工具调用: ${call.function.name}`);
     }
+    if (pending.length === 0) return [];
+    // Start every pending call at once and wait for all of them.
+    return Promise.all(pending.map(async ({ call, key }) => {
+      const result = await this.executeToolCall(call);
+      const args = Agent.safeParse(call.function.arguments);
+      const parsedResult = Agent.safeParse(result);
+      // Record the call so a later repeat can be detected.
+      seenKeys.add(key);
+      state.toolCalls.push({
+        tool: call.function.name,
+        args: typeof args === 'object' ? args : { raw: args },
+        result: parsedResult,
+      });
+      return { toolCall: call, result, args };
+    }));
+  }
+  /**
+   * Add the token counts of `source` onto `target` in place; does nothing when `source` is missing.
+   *
+   * @param target  running totals, mutated
+   * @param source  usage reported for one response, if any
+   */
+  private static addUsage(target: Usage, source?: Usage): void {
+    if (source) {
+      for (const field of ['prompt_tokens', 'completion_tokens', 'total_tokens'] as const) {
+        target[field] += source[field];
+      }
+    }
   }
   /**
    * 运行 Agent
+   *
+   * @param userMessage    用户消息
+   * @param context        对话上下文
+   * @param filterOptions  工具过滤选项 —— 启用后在 AI 调用之前程序化筛选工具，省去额外的 AI 意图分析往返
    */
-  async run(userMessage: string, context?: ChatMessage[]): Promise<AgentResult> {
+  async run(userMessage: string, context?: ChatMessage[], filterOptions?: ToolFilterOptions): Promise<AgentResult> {
     const state: AgentState = {
       messages: [
         { role: 'system', content: this.config.systemPrompt },
@@ -172,94 +427,112 @@ export class Agent {
       iterations: 0,
     };
-    const toolDefinitions = this.getToolDefinitions();
+    // 程序化工具预过滤：只把相关工具传给 AI，减少 token 消耗和误选
+    let toolDefinitions: ChatToolDefinition[];
+    if (filterOptions) {
+      const allTools = Array.from(this.tools.values());
+      const filtered = Agent.filterTools(userMessage, allTools, filterOptions);
+      logger.info(`工具预过滤: ${allTools.length} -> ${filtered.length}`);
+      toolDefinitions = filtered.map(tool => ({
+        type: 'function' as const,
+        function: {
+          name: tool.name,
+          description: tool.description,
+          parameters: tool.parameters,
+        },
+      }));
+    } else {
+      toolDefinitions = this.getToolDefinitions();
+    }
+    const hasTools = toolDefinitions.length > 0;
+    // O(1) 去重集合
+    const seenToolKeys = new Set<string>();
+    // 连续全重复计数器
+    let consecutiveDuplicateRounds = 0;
     while (state.iterations < this.config.maxIterations) {
       state.iterations++;
+      // 强制文本回答的条件：
+      // 1. 检测到连续重复工具调用
+      // 2. 最后一轮迭代且已有工具结果 —— 保证 Agent 始终输出文本，不再需要额外的 summary 往返
+      const isLastIteration = state.iterations >= this.config.maxIterations;
+      const forceAnswer = consecutiveDuplicateRounds > 0 ||
+        (isLastIteration && state.toolCalls.length > 0);
       try {
+        // 工具调用轮次禁用思考（qwen3 等模型），大幅减少无效 token 生成
+        const isToolCallRound = hasTools && !forceAnswer;
         const response = await this.provider.chat({
           model: this.config.model,
           messages: state.messages,
-          tools: toolDefinitions.length > 0 ? toolDefinitions : undefined,
-          tool_choice: toolDefinitions.length > 0 ? 'auto' : undefined,
+          tools: isToolCallRound ? toolDefinitions : undefined,
+          tool_choice: isToolCallRound ? 'auto' : undefined,
           temperature: this.config.temperature,
+          think: isToolCallRound ? false : undefined,
         });
-        // 更新用量
-        if (response.usage) {
-          state.usage.prompt_tokens += response.usage.prompt_tokens;
-          state.usage.completion_tokens += response.usage.completion_tokens;
-          state.usage.total_tokens += response.usage.total_tokens;
-        }
+        Agent.addUsage(state.usage, response.usage);
+        logger.info(`token 用量: ${state.usage.prompt_tokens} -> ${state.usage.completion_tokens} -> ${state.usage.total_tokens}`);
+        logger.info(`response: `,response);
         const choice = response.choices[0];
         if (!choice) break;
-        // 如果包含工具调用，不立即将模型原始内容暴露给上层
+        // ── 分支 1: 模型想调用工具 ──
         if (choice.message.tool_calls?.length) {
+          const callSummary = choice.message.tool_calls.map(
+            (tc: any) => `${tc.function.name}(${tc.function.arguments})`
+          ).join(', ');
+          logger.info(`[第${state.iterations}轮] 工具调用: ${callSummary}`);
           this.emit('thinking', '正在执行工具调用...');
-          // 将 assistant 消息加入会话上下文，但避免直接展示纯 JSON 的工具调用原始内容
-          let assistantContent = '';
-          if (typeof choice.message.content === 'string' && choice.message.content) {
-            const rawContent = choice.message.content;
-            const trimmed = rawContent.trim();
-            // 如果内容整体看起来是 JSON（常见于模型将工具调用以 JSON 形式返回），则不暴露给上层
-            if (trimmed.startsWith('{') || trimmed.startsWith('[')) {
-              try {
-                JSON.parse(trimmed);
-                // 解析成功，说明是纯 JSON；保持 assistantContent 为空字符串
-              } catch {
-                // 解析失败，当作普通文本保留
-                assistantContent = rawContent;
-              }
-            } else {
-              // 非纯 JSON 内容，直接保留
-              assistantContent = rawContent;
-            }
-          }
+          // 当存在 tool_calls 时，content 通常是模型的内部思考或原始 JSON，
+          // 不需要暴露给最终用户，但需要保留在消息历史中以维持对话完整性
           state.messages.push({
-            role: 'assistant',
-            content: assistantContent,
+            role: 'tool_call',
+            content: typeof choice.message.content === 'string' ? choice.message.content : '',
             tool_calls: choice.message.tool_calls,
           });
-          // 检测重复工具调用
-          let hasDuplicateCall = false;
-          for (const toolCall of choice.message.tool_calls) {
-            const toolName = toolCall.function.name;
-            const toolArgs = toolCall.function.arguments;
-            // 检查是否重复调用相同工具（相同名称和参数）
-            const isDuplicate = state.toolCalls.some(
-              tc => tc.tool === toolName && JSON.stringify(tc.args) === toolArgs
-            );
-            if (isDuplicate) {
-              logger.debug(`重复工具调用: ${toolName}，跳过`);
-              hasDuplicateCall = true;
-              continue;
-            }
-            const result = await this.executeToolCall(toolCall);
-            // 尝试解析 JSON，如果失败则使用原始字符串
-            let parsedResult: any;
-            try {
-              parsedResult = JSON.parse(result);
-            } catch {
-              parsedResult = result;
+          // 并行执行所有新工具调用，自动跳过重复
+          const results = await this.executeToolCalls(
+            choice.message.tool_calls,
+            seenToolKeys,
+            state,
+          );
+          if (results.length === 0) {
+            consecutiveDuplicateRounds++;
+            logger.warn(`[第${state.iterations}轮] 检测到重复工具调用，已跳过执行，强制下轮文本回答`);
+            for (const tc of choice.message.tool_calls) {
+              const key = Agent.toolCallKey(tc.function.name, tc.function.arguments);
+              const previous = state.toolCalls.find(
+                stc => Agent.toolCallKey(stc.tool, JSON.stringify(stc.args)) === key ||
+                       Agent.toolCallKey(stc.tool, tc.function.arguments) === key,
+              );
+              state.messages.push({
+                role: 'tool',
+                content: previous ? JSON.stringify(previous.result) : '结果已获取',
+                tool_call_id: tc.id,
+              });
             }
-            state.toolCalls.push({
-              tool: toolName,
-              args: JSON.parse(toolArgs),
-              result: parsedResult,
+            state.messages.push({
+              role: 'system',
+              content: '你已经获取了所需的全部信息，请直接用自然语言回答用户，不要再调用工具。',
             });
-            // 添加工具结果消息（供模型下一步使用）
+            continue;
+          }
+          // 有新的工具调用被执行
+          consecutiveDuplicateRounds = 0;
+          // 将工具结果加入消息历史
+          for (const { toolCall, result } of results) {
+            const resultPreview = result.length > 200 ? result.slice(0, 200) + '...' : result;
+            logger.info(`[第${state.iterations}轮] 工具结果 ${toolCall.function.name}: ${resultPreview}`);
             state.messages.push({
               role: 'tool',
               content: result,
@@ -267,35 +540,23 @@ export class Agent {
             });
           }
-          // 如果所有调用都是重复的，强制模型生成最终回答
-          if (hasDuplicateCall && choice.message.tool_calls.every(tc =>
-            state.toolCalls.some(stc => stc.tool === tc.function.name && JSON.stringify(stc.args) === tc.function.arguments)
-          )) {
-            // 添加提示让模型总结结果
+          // 如果工具返回的是最终结果（非查询中间步骤），引导模型直接回复
+          const allSucceeded = results.every(r => !r.result.startsWith('{'));
+          if (allSucceeded && results.length > 0) {
             state.messages.push({
-              role: 'user',
-              content: '请根据已获取的工具结果，用中文总结回答我的问题。',
+              role: 'system',
+              content: '工具已返回结果。如果信息足够回答用户问题，请直接用自然语言回答，不要重复调用相同工具。',
             });
           }
-          // 继续循环，让模型处理工具结果并生成最终回答
           continue;
         }
-        // 没有工具调用，返回结果
-        let content = typeof choice.message.content === 'string'
+        // ── 分支 2: 模型返回文本回答 ──
+        const content = typeof choice.message.content === 'string'
           ? choice.message.content
           : '';
-        // 如果内容为空但有工具调用结果，生成基于工具结果的回复
-        if (!content.trim() && state.toolCalls.length > 0) {
-          const lastToolCall = state.toolCalls[state.toolCalls.length - 1];
-          const resultStr = typeof lastToolCall.result === 'string'
-            ? lastToolCall.result
-            : JSON.stringify(lastToolCall.result, null, 2);
-          content = `根据查询结果:\n\n${resultStr}`;
-        }
         const result: AgentResult = {
           content,
           toolCalls: state.toolCalls,
@@ -309,13 +570,52 @@ export class Agent {
       } catch (error) {
         const err = error instanceof Error ? error : new Error(String(error));
         this.emit('error', err);
-        throw err;
+        // ── 错误恢复策略 ──
+        // 如果已经有工具结果，注入恢复消息让 AI 基于已有数据回答
+        if (state.toolCalls.length > 0) {
+          logger.warn(`第 ${state.iterations} 轮 LLM 调用失败，尝试基于已有数据恢复: ${err.message}`);
+          const toolSummary = state.toolCalls.map(tc => {
+            const r = typeof tc.result === 'string' ? tc.result : JSON.stringify(tc.result);
+            return `【${tc.tool}】${r}`;
+          }).join('\n');
+          const fallbackResult: AgentResult = {
+            content: `以下是已获取的工具结果：\n${toolSummary}`,
+            toolCalls: state.toolCalls,
+            usage: state.usage,
+            iterations: state.iterations,
+          };
+          this.emit('complete', fallbackResult);
+          return fallbackResult;
+        }
+        // 没有任何工具结果，提供友好的错误消息
+        const fallbackResult: AgentResult = {
+          content: `抱歉，处理过程中遇到了问题：${err.message}。请稍后重试或换个方式提问。`,
+          toolCalls: [],
+          usage: state.usage,
+          iterations: state.iterations,
+        };
+        this.emit('complete', fallbackResult);
+        return fallbackResult;
       }
     }
-    // 达到最大迭代次数
+    // 达到最大迭代次数，基于已有工具结果生成兜底回复
+    let fallbackContent: string;
+    if (state.toolCalls.length > 0) {
+      // 尝试从工具结果中构建有意义的回复
+      const toolSummary = state.toolCalls.map(tc => {
+        const r = typeof tc.result === 'string' ? tc.result : JSON.stringify(tc.result);
+        return `【${tc.tool}】${r}`;
+      }).join('\n');
+      fallbackContent = `处理完成，以下是获取到的信息：\n${toolSummary}`;
+    } else {
+      fallbackContent = '达到最大处理轮次，任务可能未完全完成。请尝试简化问题后重试。';
+    }
     const result: AgentResult = {
-      content: '达到最大迭代次数，任务可能未完成。',
+      content: fallbackContent,
       toolCalls: state.toolCalls,
       usage: state.usage,
       iterations: state.iterations,
@@ -327,8 +627,12 @@ export class Agent {
   /**
    * 流式运行 Agent
+   *
+   * @param userMessage    用户消息
+   * @param context        对话上下文
+   * @param filterOptions  工具过滤选项 —— 启用后在 AI 调用之前程序化筛选工具
    */
-  async *runStream(userMessage: string, context?: ChatMessage[]): AsyncIterable<{
+  async *runStream(userMessage: string, context?: ChatMessage[], filterOptions?: ToolFilterOptions): AsyncIterable<{
     type: 'content' | 'tool_call' | 'tool_result' | 'done';
     data: any;
   }> {
@@ -338,10 +642,29 @@ export class Agent {
       { role: 'user', content: userMessage },
     ];
-    const toolDefinitions = this.getToolDefinitions();
+    // 程序化工具预过滤
+    let toolDefinitions: ChatToolDefinition[];
+    if (filterOptions) {
+      const allTools = Array.from(this.tools.values());
+      const filtered = Agent.filterTools(userMessage, allTools, filterOptions);
+      logger.debug(`流式工具预过滤: ${allTools.length} -> ${filtered.length}`);
+      toolDefinitions = filtered.map(tool => ({
+        type: 'function' as const,
+        function: {
+          name: tool.name,
+          description: tool.description,
+          parameters: tool.parameters,
+        },
+      }));
+    } else {
+      toolDefinitions = this.getToolDefinitions();
+    }
+    const hasTools = toolDefinitions.length > 0;
     let iterations = 0;
     const toolCallHistory: { tool: string; args: any; result: any }[] = [];
     const usage: Usage = { prompt_tokens: 0, completion_tokens: 0, total_tokens: 0 };
+    const seenToolKeys = new Set<string>();
+    let consecutiveDuplicateRounds = 0;
     while (iterations < this.config.maxIterations) {
       iterations++;
@@ -349,28 +672,33 @@ export class Agent {
       let content = '';
       const pendingToolCalls: ToolCall[] = [];
       let finishReason: string | null = null;
+      const isLastIteration = iterations >= this.config.maxIterations;
+      const forceAnswer = consecutiveDuplicateRounds > 0 ||
+        (isLastIteration && toolCallHistory.length > 0);
       // 流式获取响应
       for await (const chunk of this.provider.chatStream({
         model: this.config.model,
         messages,
-        tools: toolDefinitions.length > 0 ? toolDefinitions : undefined,
-        tool_choice: toolDefinitions.length > 0 ? 'auto' : undefined,
+        tools: hasTools && !forceAnswer ? toolDefinitions : undefined,
+        tool_choice: hasTools && !forceAnswer ? 'auto' : undefined,
         temperature: this.config.temperature,
       })) {
         const choice = chunk.choices[0];
         if (!choice) continue;
-        // 处理内容
+        // 处理内容片段
         if (choice.delta.content) {
           content += choice.delta.content;
-          yield { type: 'content', data: choice.delta.content };
+          // 仅在非工具调用阶段输出内容给消费者
+          if (pendingToolCalls.length === 0) {
+            yield { type: 'content', data: choice.delta.content };
+          }
         }
-        // 处理工具调用
+        // 合并工具调用片段
         if (choice.delta.tool_calls) {
           for (const tc of choice.delta.tool_calls) {
-            // 合并工具调用片段
             let existing = pendingToolCalls.find(p => p.id === tc.id);
             if (!existing && tc.id) {
               existing = {
@@ -387,42 +715,82 @@ export class Agent {
           }
         }
-        if (choice.finish_reason) {
-          finishReason = choice.finish_reason;
-        }
+        if (choice.finish_reason) finishReason = choice.finish_reason;
-        if (chunk.usage) {
-          usage.prompt_tokens += chunk.usage.prompt_tokens;
-          usage.completion_tokens += chunk.usage.completion_tokens;
-          usage.total_tokens += chunk.usage.total_tokens;
-        }
+        Agent.addUsage(usage, chunk.usage);
       }
-      // 添加 assistant 消息。若存在 pendingToolCalls，则不要在流式期间把模型原始包含工具调用的内容直接发送给消费者。
-      const assistantMessage: ChatMessage = {
-        role: 'assistant',
+      // 将 assistant 消息加入上下文
+      messages.push({
+        role: 'tool_call',
         content,
         tool_calls: pendingToolCalls.length > 0 ? pendingToolCalls : undefined,
-      };
-      messages.push(assistantMessage);
+      });
-      // 处理工具调用（流式模式）
+      // 处理工具调用
       if (pendingToolCalls.length > 0 && finishReason === 'tool_calls') {
-        for (const toolCall of pendingToolCalls) {
-          // 通知上层开始执行工具（上层可用于显示“正在执行工具”而非工具原始内容）
-          yield { type: 'tool_call', data: { name: toolCall.function.name, args: toolCall.function.arguments } };
+        // 分离新调用和重复调用
+        const freshCalls: ToolCall[] = [];
+        const duplicateCalls: ToolCall[] = [];
+        for (const tc of pendingToolCalls) {
+          const key = Agent.toolCallKey(tc.function.name, tc.function.arguments);
+          if (seenToolKeys.has(key)) {
+            duplicateCalls.push(tc);
+          } else {
+            freshCalls.push(tc);
+          }
+        }
-          const result = await this.executeToolCall(toolCall);
+        if (freshCalls.length === 0) {
+          // 全部重复
+          consecutiveDuplicateRounds++;
-          toolCallHistory.push({
-            tool: toolCall.function.name,
-            args: JSON.parse(toolCall.function.arguments),
-            result: JSON.parse(result),
-          });
+          // 补上 tool 消息保持协议完整
+          for (const tc of pendingToolCalls) {
+            const key = Agent.toolCallKey(tc.function.name, tc.function.arguments);
+            const previous = toolCallHistory.find(
+              h => Agent.toolCallKey(h.tool, JSON.stringify(h.args)) === key ||
+                   Agent.toolCallKey(h.tool, tc.function.arguments) === key,
+            );
+            messages.push({
+              role: 'tool_result',
+              content: previous ? JSON.stringify(previous.result) : '结果已获取',
+              tool_call_id: tc.id,
+            });
+          }
+          continue;
+        }
-          // 返回工具结果（上层可选择把工具执行过程隐藏，仅在最终完成时展示润色结果）
-          yield { type: 'tool_result', data: { name: toolCall.function.name, result } };
+        consecutiveDuplicateRounds = 0;
+        // 先通知上层所有工具调用开始
+        for (const tc of freshCalls) {
+          yield { type: 'tool_call', data: { name: tc.function.name, args: tc.function.arguments } };
+        }
+        // 并行执行所有新工具调用
+        const results = await Promise.all(
+          freshCalls.map(async (toolCall) => {
+            const result = await this.executeToolCall(toolCall);
+            const args = Agent.safeParse(toolCall.function.arguments);
+            const parsedResult = Agent.safeParse(result);
+            const key = Agent.toolCallKey(toolCall.function.name, toolCall.function.arguments);
+            seenToolKeys.add(key);
+            toolCallHistory.push({
+              tool: toolCall.function.name,
+              args: typeof args === 'object' ? args : { raw: args },
+              result: parsedResult,
+            });
+            return { toolCall, result };
+          }),
+        );
+        // yield 工具结果并加入消息历史
+        for (const { toolCall, result } of results) {
+          yield { type: 'tool_result', data: { name: toolCall.function.name, result } };
           messages.push({
             role: 'tool',
             content: result,
@@ -430,7 +798,20 @@ export class Agent {
           });
         }
-        // 继续循环，让模型以工具结果为上下文生成最终回答
+        // 为重复的调用也补上 tool 消息
+        for (const tc of duplicateCalls) {
+          const key = Agent.toolCallKey(tc.function.name, tc.function.arguments);
+          const previous = toolCallHistory.find(
+            h => Agent.toolCallKey(h.tool, JSON.stringify(h.args)) === key ||
+                 Agent.toolCallKey(h.tool, tc.function.arguments) === key,
+          );
+          messages.push({
+            role: 'tool',
+            content: previous ? JSON.stringify(previous.result) : '结果已获取',
+            tool_call_id: tc.id,
+          });
+        }
         continue;
       }
@@ -451,7 +832,9 @@ export class Agent {
     yield {
       type: 'done',
       data: {
-        content: '达到最大迭代次数',
+        content: toolCallHistory.length > 0
+          ? `处理完成，共执行了 ${toolCallHistory.length} 个工具调用。`
+          : '达到最大迭代次数',
         toolCalls: toolCallHistory,
         usage,
         iterations,