skyloom 1.13.6 → 1.13.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (193) hide show
  1. package/.github/workflows/ci.yml +36 -36
  2. package/README.md +220 -159
  3. package/config/providers.yaml +39 -39
  4. package/config/skills/api_integrator/SKILL.md +15 -15
  5. package/config/skills/arch_designer/SKILL.md +13 -13
  6. package/config/skills/ci_cd_manager/SKILL.md +14 -14
  7. package/config/skills/code_analysis/SKILL.md +13 -13
  8. package/config/skills/code_generator/SKILL.md +12 -12
  9. package/config/skills/code_reviewer/SKILL.md +13 -13
  10. package/config/skills/content_writer/SKILL.md +14 -14
  11. package/config/skills/data_transformer/SKILL.md +15 -15
  12. package/config/skills/document_analysis/SKILL.md +13 -13
  13. package/config/skills/emotional_companion/SKILL.md +15 -15
  14. package/config/skills/performance_checker/SKILL.md +14 -14
  15. package/config/skills/security_auditor/SKILL.md +14 -14
  16. package/config/skills/self_evolve/SKILL.md +13 -13
  17. package/config/skills/sys_operator/SKILL.md +15 -15
  18. package/config/skills/task_planner/SKILL.md +14 -14
  19. package/config/skills/web_research/SKILL.md +14 -14
  20. package/config/skills/workflow_designer/SKILL.md +13 -13
  21. package/dist/agents/dew.js +52 -52
  22. package/dist/agents/fair.js +84 -84
  23. package/dist/agents/fog.js +30 -30
  24. package/dist/agents/frost.js +32 -32
  25. package/dist/agents/rain.js +32 -32
  26. package/dist/agents/snow.js +68 -68
  27. package/dist/cli/commands_md.d.ts +41 -0
  28. package/dist/cli/commands_md.d.ts.map +1 -0
  29. package/dist/cli/commands_md.js +140 -0
  30. package/dist/cli/commands_md.js.map +1 -0
  31. package/dist/cli/input_macros.d.ts +28 -0
  32. package/dist/cli/input_macros.d.ts.map +1 -0
  33. package/dist/cli/input_macros.js +120 -0
  34. package/dist/cli/input_macros.js.map +1 -0
  35. package/dist/cli/loom.d.ts +220 -0
  36. package/dist/cli/loom.d.ts.map +1 -0
  37. package/dist/cli/loom.js +1094 -0
  38. package/dist/cli/loom.js.map +1 -0
  39. package/dist/cli/loom_chat.d.ts +20 -0
  40. package/dist/cli/loom_chat.d.ts.map +1 -0
  41. package/dist/cli/loom_chat.js +685 -0
  42. package/dist/cli/loom_chat.js.map +1 -0
  43. package/dist/cli/main.js +310 -14
  44. package/dist/cli/main.js.map +1 -1
  45. package/dist/cli/tui.d.ts.map +1 -1
  46. package/dist/cli/tui.js +7 -1
  47. package/dist/cli/tui.js.map +1 -1
  48. package/dist/core/agent.d.ts +20 -0
  49. package/dist/core/agent.d.ts.map +1 -1
  50. package/dist/core/agent.js +199 -16
  51. package/dist/core/agent.js.map +1 -1
  52. package/dist/core/factory.d.ts.map +1 -1
  53. package/dist/core/factory.js +34 -2
  54. package/dist/core/factory.js.map +1 -1
  55. package/dist/core/file_checkpoint.d.ts +57 -0
  56. package/dist/core/file_checkpoint.d.ts.map +1 -0
  57. package/dist/core/file_checkpoint.js +162 -0
  58. package/dist/core/file_checkpoint.js.map +1 -0
  59. package/dist/core/hooks.d.ts +43 -0
  60. package/dist/core/hooks.d.ts.map +1 -0
  61. package/dist/core/hooks.js +110 -0
  62. package/dist/core/hooks.js.map +1 -0
  63. package/dist/core/llm.d.ts.map +1 -1
  64. package/dist/core/llm.js +15 -9
  65. package/dist/core/llm.js.map +1 -1
  66. package/dist/core/longdoc.js +5 -5
  67. package/dist/core/mcp.d.ts +16 -0
  68. package/dist/core/mcp.d.ts.map +1 -1
  69. package/dist/core/mcp.js +55 -0
  70. package/dist/core/mcp.js.map +1 -1
  71. package/dist/core/model_config.d.ts +40 -0
  72. package/dist/core/model_config.d.ts.map +1 -0
  73. package/dist/core/model_config.js +191 -0
  74. package/dist/core/model_config.js.map +1 -0
  75. package/dist/core/skill.d.ts +7 -0
  76. package/dist/core/skill.d.ts.map +1 -1
  77. package/dist/core/skill.js +47 -0
  78. package/dist/core/skill.js.map +1 -1
  79. package/dist/core/skymd.d.ts +39 -0
  80. package/dist/core/skymd.d.ts.map +1 -0
  81. package/dist/core/skymd.js +177 -0
  82. package/dist/core/skymd.js.map +1 -0
  83. package/dist/core/tool.d.ts +12 -0
  84. package/dist/core/tool.d.ts.map +1 -1
  85. package/dist/core/tool.js +30 -0
  86. package/dist/core/tool.js.map +1 -1
  87. package/dist/core/verify.d.ts +27 -0
  88. package/dist/core/verify.d.ts.map +1 -0
  89. package/dist/core/verify.js +62 -0
  90. package/dist/core/verify.js.map +1 -0
  91. package/dist/skills/loader.d.ts +22 -2
  92. package/dist/skills/loader.d.ts.map +1 -1
  93. package/dist/skills/loader.js +45 -15
  94. package/dist/skills/loader.js.map +1 -1
  95. package/dist/tools/builtin.d.ts.map +1 -1
  96. package/dist/tools/builtin.js +13 -3
  97. package/dist/tools/builtin.js.map +1 -1
  98. package/dist/tools/model_tool.d.ts +11 -0
  99. package/dist/tools/model_tool.d.ts.map +1 -0
  100. package/dist/tools/model_tool.js +71 -0
  101. package/dist/tools/model_tool.js.map +1 -0
  102. package/dist/tools/todo.d.ts +30 -0
  103. package/dist/tools/todo.d.ts.map +1 -0
  104. package/dist/tools/todo.js +78 -0
  105. package/dist/tools/todo.js.map +1 -0
  106. package/docs/AESTHETIC_DESIGN.md +152 -144
  107. package/docs/OPTIMIZATION_PLAN.md +178 -178
  108. package/package.json +68 -68
  109. package/scripts/install.js +48 -48
  110. package/scripts/link.js +10 -10
  111. package/setup.bat +79 -79
  112. package/skill-test-ty2fOA/test.md +10 -10
  113. package/src/agents/dew.ts +70 -70
  114. package/src/agents/fair.ts +102 -102
  115. package/src/agents/fog.ts +48 -48
  116. package/src/agents/frost.ts +50 -50
  117. package/src/agents/rain.ts +50 -50
  118. package/src/agents/snow.ts +239 -239
  119. package/src/cli/commands_md.ts +112 -0
  120. package/src/cli/input_macros.ts +83 -0
  121. package/src/cli/loom.ts +982 -0
  122. package/src/cli/loom_chat.ts +598 -0
  123. package/src/cli/main.ts +255 -9
  124. package/src/cli/mode.ts +58 -58
  125. package/src/cli/tui.ts +228 -222
  126. package/src/core/agent/guard.ts +134 -134
  127. package/src/core/agent/task.ts +100 -100
  128. package/src/core/agent.ts +195 -16
  129. package/src/core/arbitrate.ts +162 -162
  130. package/src/core/catalog.ts +178 -178
  131. package/src/core/checkpoint.ts +94 -94
  132. package/src/core/estimate.ts +104 -104
  133. package/src/core/evolve.ts +191 -191
  134. package/src/core/factory.ts +31 -2
  135. package/src/core/file_checkpoint.ts +136 -0
  136. package/src/core/filter.ts +103 -103
  137. package/src/core/graph.ts +156 -156
  138. package/src/core/hooks.ts +126 -0
  139. package/src/core/icons.ts +53 -53
  140. package/src/core/index.ts +37 -37
  141. package/src/core/learn.ts +146 -146
  142. package/src/core/llm.ts +15 -9
  143. package/src/core/longdoc.ts +155 -155
  144. package/src/core/mcp.ts +48 -0
  145. package/src/core/mcp_server.ts +176 -176
  146. package/src/core/model_config.ts +157 -0
  147. package/src/core/profile.ts +255 -255
  148. package/src/core/router.ts +124 -124
  149. package/src/core/sandbox.ts +142 -142
  150. package/src/core/security.ts +243 -243
  151. package/src/core/skill.ts +42 -0
  152. package/src/core/skymd.ts +143 -0
  153. package/src/core/theme.ts +65 -65
  154. package/src/core/tool.ts +30 -0
  155. package/src/core/tool_router.ts +193 -193
  156. package/src/core/vector.ts +152 -152
  157. package/src/core/verify.ts +71 -0
  158. package/src/core/workspace.ts +150 -150
  159. package/src/plugins/loader.ts +66 -66
  160. package/src/skills/loader.ts +45 -16
  161. package/src/sql.js.d.ts +29 -29
  162. package/src/tools/builtin.ts +13 -3
  163. package/src/tools/computer.ts +269 -269
  164. package/src/tools/delegate.ts +49 -49
  165. package/src/tools/model_tool.ts +74 -0
  166. package/src/tools/todo.ts +76 -0
  167. package/src/web/tts.ts +93 -93
  168. package/tests/agent.test.ts +159 -159
  169. package/tests/agent_helpers.test.ts +48 -48
  170. package/tests/bus.test.ts +121 -121
  171. package/tests/catalog.test.ts +86 -86
  172. package/tests/checkpoint_commands.test.ts +124 -0
  173. package/tests/claude_compat.test.ts +110 -0
  174. package/tests/config.test.ts +41 -41
  175. package/tests/guard.test.ts +75 -75
  176. package/tests/icons.test.ts +45 -45
  177. package/tests/loom.test.ts +248 -0
  178. package/tests/memory.test.ts +170 -170
  179. package/tests/model_config.test.ts +109 -0
  180. package/tests/router.test.ts +86 -86
  181. package/tests/schemas.test.ts +51 -51
  182. package/tests/semantic.test.ts +83 -83
  183. package/tests/setup.ts +10 -10
  184. package/tests/skill.test.ts +172 -172
  185. package/tests/skymd.test.ts +146 -0
  186. package/tests/task.test.ts +60 -60
  187. package/tests/todo_toolstats.test.ts +94 -0
  188. package/tests/tool.test.ts +108 -108
  189. package/tests/tool_router.test.ts +71 -71
  190. package/tests/tui.test.ts +67 -67
  191. package/vitest.config.ts +17 -17
  192. package/=12 +0 -0
  193. package/=8 +0 -0
@@ -1,104 +1,104 @@
1
- /**
2
- * 资源估算模块 — Token & time budget estimation for task planning.
3
- *
4
- * Helps Snow and other planning agents estimate the cost of
5
- * proposed sub-tasks before committing to execution.
6
- */
7
-
8
- import type { Task } from "./agent";
9
-
10
- /* ═══════════════════════════════════════
11
- Token estimation
12
- ═══════════════════════════════════════ */
13
- const CJK_REGEX = /[一-鿿぀-ゟ가-힯㐀-䶿]/g;
14
-
15
- /** Estimate tokens for a given text (CJK ~2 each, ASCII ~4 chars each). */
16
- export function estimateTokens(text: string): number {
17
- const cjk = (text.match(CJK_REGEX) || []).length;
18
- return cjk * 2 + Math.ceil((text.length - cjk) / 4);
19
- }
20
-
21
- /* ═══════════════════════════════════════
22
- Per-task-type cost estimates
23
- ═══════════════════════════════════════ */
24
- const TASK_TYPE_PATTERNS: Array<[RegExp, number, number]> = [
25
- // [pattern, estimated tokens, estimated tools]
26
- [/read|read_file|grep|search|查|搜索|list/i, 2000, 2],
27
- [/write|write_file|生成|写|create|implement/i, 4000, 5],
28
- [/edit|edit_file|改|修改|fix|修复/i, 3000, 3],
29
- [/delete|delete_file|删|rm/i, 1500, 2],
30
- [/deploy|部署|publish|发布|release/i, 8000, 8],
31
- [/review|审查|audit|审计|scan|扫描/i, 5000, 4],
32
- [/test|测试|run_test|coverage/i, 3000, 3],
33
- [/research|研究|调研|analyze|分析/i, 6000, 4],
34
- [/orchestrate|编排|multi-step|多步/i, 12000, 10],
35
- ];
36
-
37
- /** Estimate cost for a single task description. */
38
- export function estimateTaskCost(description: string): { tokens: number; tools: number; timeSeconds: number } {
39
- let tokens = 2000; // base
40
- let tools = 2; // base
41
- for (const [pattern, t, tc] of TASK_TYPE_PATTERNS) {
42
- if (pattern.test(description)) { tokens = Math.max(tokens, t); tools = Math.max(tools, tc); }
43
- }
44
-
45
- // Time estimate: ~0.5s per tool call + 2s per 1k tokens
46
- const timeSeconds = (tokens / 1000) * 2 + tools * 0.5 + 2;
47
- return { tokens, tools, timeSeconds };
48
- }
49
-
50
- /* ═══════════════════════════════════════
51
- Task plan cost summary
52
- ═══════════════════════════════════════ */
53
- export interface PlanEstimate {
54
- totalTokens: number;
55
- totalTools: number;
56
- totalTimeSeconds: number;
57
- perTask: Array<{ id: string; tokens: number; tools: number; time: number }>;
58
- warnings: string[];
59
- }
60
-
61
- export function estimateTaskPlan(tasks: Task[]): PlanEstimate {
62
- const perTask: PlanEstimate["perTask"] = [];
63
- let totalTokens = 500; // system prompt overhead
64
- let totalTools = 0;
65
- let totalTime = 5; // init overhead
66
- const warnings: string[] = [];
67
-
68
- for (const t of tasks) {
69
- const est = estimateTaskCost(t.description);
70
- perTask.push({ id: t.id, tokens: est.tokens, tools: est.tools, time: est.timeSeconds });
71
- totalTokens += est.tokens;
72
- totalTools += est.tools;
73
- totalTime += est.timeSeconds;
74
-
75
- if (est.timeSeconds > 60) warnings.push(`Task ${t.id} may take >${Math.round(est.timeSeconds)}s`);
76
- if (est.tools > 10) warnings.push(`Task ${t.id} uses many tool calls (${est.tools})`);
77
- }
78
-
79
- if (totalTokens > 64000) warnings.push(`Total token estimate (${totalTokens}) exceeds typical context window`);
80
- if (totalTime > 120) warnings.push(`Estimated total time (${Math.round(totalTime)}s) is significant`);
81
- if (tasks.length > 6) warnings.push(`Large number of sub-tasks (${tasks.length}) — consider merging simpler ones`);
82
-
83
- return { totalTokens, totalTools, totalTimeSeconds: Math.round(totalTime), perTask, warnings };
84
- }
85
-
86
- /* ═══════════════════════════════════════
87
- Format estimate for display
88
- ═══════════════════════════════════════ */
89
- export function formatPlanEstimate(est: PlanEstimate): string {
90
- const lines: string[] = [
91
- `## Plan Estimate`,
92
- `| Task | Tokens | Tools | Time |`,
93
- `|------|--------|-------|------|`,
94
- ...est.perTask.map(t => `| ${t.id} | ${t.tokens} | ${t.tools} | ${t.time.toFixed(0)}s |`),
95
- `| **Total** | **${est.totalTokens}** | **${est.totalTools}** | **${est.totalTimeSeconds}s** |`,
96
- ];
97
-
98
- if (est.warnings.length > 0) {
99
- lines.push("", "### Warnings");
100
- for (const w of est.warnings) lines.push(`- ⚠ ${w}`);
101
- }
102
-
103
- return lines.join("\n");
104
- }
1
+ /**
2
+ * 资源估算模块 — Token & time budget estimation for task planning.
3
+ *
4
+ * Helps Snow and other planning agents estimate the cost of
5
+ * proposed sub-tasks before committing to execution.
6
+ */
7
+
8
+ import type { Task } from "./agent";
9
+
10
+ /* ═══════════════════════════════════════
11
+ Token estimation
12
+ ═══════════════════════════════════════ */
13
+ const CJK_REGEX = /[一-鿿぀-ゟ가-힯㐀-䶿]/g;
14
+
15
+ /** Estimate tokens for a given text (CJK ~2 each, ASCII ~4 chars each). */
16
+ export function estimateTokens(text: string): number {
17
+ const cjk = (text.match(CJK_REGEX) || []).length;
18
+ return cjk * 2 + Math.ceil((text.length - cjk) / 4);
19
+ }
20
+
21
+ /* ═══════════════════════════════════════
22
+ Per-task-type cost estimates
23
+ ═══════════════════════════════════════ */
24
+ const TASK_TYPE_PATTERNS: Array<[RegExp, number, number]> = [
25
+ // [pattern, estimated tokens, estimated tools]
26
+ [/read|read_file|grep|search|查|搜索|list/i, 2000, 2],
27
+ [/write|write_file|生成|写|create|implement/i, 4000, 5],
28
+ [/edit|edit_file|改|修改|fix|修复/i, 3000, 3],
29
+ [/delete|delete_file|删|rm/i, 1500, 2],
30
+ [/deploy|部署|publish|发布|release/i, 8000, 8],
31
+ [/review|审查|audit|审计|scan|扫描/i, 5000, 4],
32
+ [/test|测试|run_test|coverage/i, 3000, 3],
33
+ [/research|研究|调研|analyze|分析/i, 6000, 4],
34
+ [/orchestrate|编排|multi-step|多步/i, 12000, 10],
35
+ ];
36
+
37
+ /** Estimate cost for a single task description. */
38
+ export function estimateTaskCost(description: string): { tokens: number; tools: number; timeSeconds: number } {
39
+ let tokens = 2000; // base
40
+ let tools = 2; // base
41
+ for (const [pattern, t, tc] of TASK_TYPE_PATTERNS) {
42
+ if (pattern.test(description)) { tokens = Math.max(tokens, t); tools = Math.max(tools, tc); }
43
+ }
44
+
45
+ // Time estimate: ~0.5s per tool call + 2s per 1k tokens
46
+ const timeSeconds = (tokens / 1000) * 2 + tools * 0.5 + 2;
47
+ return { tokens, tools, timeSeconds };
48
+ }
49
+
50
+ /* ═══════════════════════════════════════
51
+ Task plan cost summary
52
+ ═══════════════════════════════════════ */
53
+ export interface PlanEstimate {
54
+ totalTokens: number;
55
+ totalTools: number;
56
+ totalTimeSeconds: number;
57
+ perTask: Array<{ id: string; tokens: number; tools: number; time: number }>;
58
+ warnings: string[];
59
+ }
60
+
61
+ export function estimateTaskPlan(tasks: Task[]): PlanEstimate {
62
+ const perTask: PlanEstimate["perTask"] = [];
63
+ let totalTokens = 500; // system prompt overhead
64
+ let totalTools = 0;
65
+ let totalTime = 5; // init overhead
66
+ const warnings: string[] = [];
67
+
68
+ for (const t of tasks) {
69
+ const est = estimateTaskCost(t.description);
70
+ perTask.push({ id: t.id, tokens: est.tokens, tools: est.tools, time: est.timeSeconds });
71
+ totalTokens += est.tokens;
72
+ totalTools += est.tools;
73
+ totalTime += est.timeSeconds;
74
+
75
+ if (est.timeSeconds > 60) warnings.push(`Task ${t.id} may take >${Math.round(est.timeSeconds)}s`);
76
+ if (est.tools > 10) warnings.push(`Task ${t.id} uses many tool calls (${est.tools})`);
77
+ }
78
+
79
+ if (totalTokens > 64000) warnings.push(`Total token estimate (${totalTokens}) exceeds typical context window`);
80
+ if (totalTime > 120) warnings.push(`Estimated total time (${Math.round(totalTime)}s) is significant`);
81
+ if (tasks.length > 6) warnings.push(`Large number of sub-tasks (${tasks.length}) — consider merging simpler ones`);
82
+
83
+ return { totalTokens, totalTools, totalTimeSeconds: Math.round(totalTime), perTask, warnings };
84
+ }
85
+
86
+ /* ═══════════════════════════════════════
87
+ Format estimate for display
88
+ ═══════════════════════════════════════ */
89
+ export function formatPlanEstimate(est: PlanEstimate): string {
90
+ const lines: string[] = [
91
+ `## Plan Estimate`,
92
+ `| Task | Tokens | Tools | Time |`,
93
+ `|------|--------|-------|------|`,
94
+ ...est.perTask.map(t => `| ${t.id} | ${t.tokens} | ${t.tools} | ${t.time.toFixed(0)}s |`),
95
+ `| **Total** | **${est.totalTokens}** | **${est.totalTools}** | **${est.totalTimeSeconds}s** |`,
96
+ ];
97
+
98
+ if (est.warnings.length > 0) {
99
+ lines.push("", "### Warnings");
100
+ for (const w of est.warnings) lines.push(`- ⚠ ${w}`);
101
+ }
102
+
103
+ return lines.join("\n");
104
+ }
@@ -1,191 +1,191 @@
1
- /**
2
- * 自我进化模块 — Prompt self-optimization via failure analysis.
3
- *
4
- * When an agent repeatedly fails at similar tasks, this module analyzes
5
- * the failure patterns and suggests targeted improvements to the agent's
6
- * System Prompt. The agent can then apply these suggestions to improve
7
- * future performance.
8
- *
9
- * Architecture:
10
- * Failure log → Pattern analysis → Prompt diff → Agent.applyDiff()
11
- */
12
-
13
- import * as fs from "fs";
14
- import * as path from "path";
15
- import { USER_CONFIG_DIR } from "./config";
16
- import { getLogger } from "./logger";
17
-
18
- const log = getLogger("evolve");
19
-
20
- /* ═══════════════════════════════════════
21
- Prompt diff — a suggested change
22
- ═══════════════════════════════════════ */
23
- export interface PromptDiff {
24
- id: string;
25
- ts: string;
26
- agent: string;
27
- reason: string; // Why this change is needed
28
- before: string; // Old prompt fragment
29
- after: string; // New prompt fragment
30
- applied: boolean;
31
- improvement?: string; // Measured improvement after applying
32
- }
33
-
34
- /* ═══════════════════════════════════════
35
- Failure analysis
36
- ═══════════════════════════════════════ */
37
- export interface FailureAnalysis {
38
- agent: string;
39
- period: string;
40
- totalCalls: number;
41
- failureCount: number;
42
- topFailures: Array<{ pattern: string; count: number }>;
43
- suggestedDiffs: PromptDiff[];
44
- }
45
-
46
- const evolveDir = path.join(USER_CONFIG_DIR, "evolve");
47
- function ensureDir() { if (!fs.existsSync(evolveDir)) fs.mkdirSync(evolveDir, { recursive: true }); }
48
-
49
- /** Analyze recent failures from the learning module and suggest prompt improvements. */
50
- export function analyzeFailures(
51
- agent: string,
52
- experiences: Array<{ pattern: string; solution: string; frequency: number; lastSeen: string }>,
53
- systemPrompt: string
54
- ): FailureAnalysis {
55
- const recent = experiences.filter(e => {
56
- try { return new Date(e.lastSeen).getTime() > Date.now() - 7 * 86400000; }
57
- catch { return false; }
58
- });
59
-
60
- const topFailures = recent
61
- .sort((a, b) => b.frequency - a.frequency)
62
- .slice(0, 5)
63
- .map(e => ({ pattern: e.pattern, count: e.frequency }));
64
-
65
- const suggestedDiffs: PromptDiff[] = [];
66
-
67
- // Rule-based suggestions from failure patterns
68
- for (const f of topFailures) {
69
- const lower = f.pattern.toLowerCase();
70
-
71
- // Search storm → add search budget rule
72
- if ((lower.includes("search") || lower.includes("web_search")) && f.count >= 3) {
73
- const rule = `- 搜索不超过 5 轮。5 轮后直接基于已有信息综合回答。`;
74
- if (!systemPrompt.includes("搜索不超过")) {
75
- suggestedDiffs.push({
76
- id: Math.random().toString(36).slice(2, 8),
77
- ts: new Date().toISOString(), agent,
78
- reason: `搜索风暴 (${f.count} 次重复搜索)`,
79
- before: "", after: rule, applied: false,
80
- });
81
- }
82
- }
83
-
84
- // Empty response → add deliverable checklist
85
- if ((lower.includes("empty") || lower.includes("placeholder") || lower.includes("完成了")) && f.count >= 2) {
86
- const rule = `- 完成任务后,必须输出实际产物(代码/文件路径/数据),禁止只说"完成了"而无产出。`;
87
- if (!systemPrompt.includes("必须输出实际产物")) {
88
- suggestedDiffs.push({
89
- id: Math.random().toString(36).slice(2, 8),
90
- ts: new Date().toISOString(), agent,
91
- reason: `空响应/占位 (${f.count} 次)`,
92
- before: "", after: rule, applied: false,
93
- });
94
- }
95
- }
96
-
97
- // Tool not found → add tool discovery to prompt
98
- if (lower.includes("does not exist") || lower.includes("tool") && lower.includes("not found")) {
99
- const rule = `- 使用不熟悉的工具前先调 list_skills 查看可用工具列表。`;
100
- if (!systemPrompt.includes("list_skills")) {
101
- suggestedDiffs.push({
102
- id: Math.random().toString(36).slice(2, 8),
103
- ts: new Date().toISOString(), agent,
104
- reason: `工具不存在 (${f.count} 次)`,
105
- before: "", after: rule, applied: false,
106
- });
107
- }
108
- }
109
-
110
- // File not found → add path verification rule
111
- if (lower.includes("file not found") || lower.includes("directory not found")) {
112
- const rule = `- 文件操作前先用 list_directory 或 read_file 确认路径存在。`;
113
- if (!systemPrompt.includes("确认路径存在")) {
114
- suggestedDiffs.push({
115
- id: Math.random().toString(36).slice(2, 8),
116
- ts: new Date().toISOString(), agent,
117
- reason: `文件路径错误 (${f.count} 次)`,
118
- before: "", after: rule, applied: false,
119
- });
120
- }
121
- }
122
- }
123
-
124
- // General rule: if failure rate > 20%, suggest self-review
125
- const recentExperiences = recent.filter(e => {
126
- try { return new Date(e.lastSeen).getTime() > Date.now() - 3 * 86400000; }
127
- catch { return false; }
128
- });
129
-
130
- // Deduplicate suggestions
131
- const seen = new Set<string>();
132
- const uniqueDiffs = suggestedDiffs.filter(d => {
133
- const key = d.after.slice(0, 30);
134
- if (seen.has(key)) return false;
135
- seen.add(key); return true;
136
- });
137
-
138
- // Max 3 suggestions per analysis
139
- return {
140
- agent, period: "last 7 days",
141
- totalCalls: 0, failureCount: 0,
142
- topFailures,
143
- suggestedDiffs: uniqueDiffs.slice(0, 3),
144
- };
145
- }
146
-
147
- /* ═══════════════════════════════════════
148
- Apply prompt diff to agent
149
- ═══════════════════════════════════════ */
150
- export function applyPromptDiff(agent: any, diff: PromptDiff): boolean {
151
- try {
152
- const currentPrompt = agent.systemPrompt;
153
- if (!diff.after || currentPrompt.includes(diff.after.slice(0, 20))) return false;
154
-
155
- // Append the new rule after "## 行为守则" or "## Behavior" section
156
- const marker = currentPrompt.includes("行为守则") ? "## 行为守则" : "## Behavior";
157
- const idx = currentPrompt.indexOf(marker);
158
- if (idx < 0) { agent.systemPrompt += "\n" + diff.after; }
159
- else {
160
- const insertPoint = currentPrompt.indexOf("\n", currentPrompt.indexOf("\n-", idx) + 1);
161
- agent.systemPrompt = currentPrompt.slice(0, insertPoint) + "\n" + diff.after + "\n" + currentPrompt.slice(insertPoint);
162
- }
163
-
164
- diff.applied = true;
165
- diff.improvement = "pending evaluation";
166
-
167
- // Persist the diff
168
- ensureDir();
169
- const file = path.join(evolveDir, `${diff.agent}_diffs.jsonl`);
170
- fs.appendFileSync(file, JSON.stringify(diff) + "\n");
171
-
172
- agent.rebuildSystemPrompt();
173
- return true;
174
- } catch (e) {
175
- log.warn("apply_prompt_diff_failed", { agent: diff.agent, error: String(e) });
176
- return false;
177
- }
178
- }
179
-
180
- /** Get all applied diffs for an agent. */
181
- export function getAppliedDiffs(agent: string): PromptDiff[] {
182
- const diffs: PromptDiff[] = [];
183
- try {
184
- const file = path.join(evolveDir, `${agent}_diffs.jsonl`);
185
- if (fs.existsSync(file)) {
186
- const lines = fs.readFileSync(file, "utf-8").split("\n").filter(Boolean);
187
- for (const line of lines) { try { diffs.push(JSON.parse(line)); } catch { } }
188
- }
189
- } catch { /* ignore */ }
190
- return diffs;
191
- }
1
+ /**
2
+ * 自我进化模块 — Prompt self-optimization via failure analysis.
3
+ *
4
+ * When an agent repeatedly fails at similar tasks, this module analyzes
5
+ * the failure patterns and suggests targeted improvements to the agent's
6
+ * System Prompt. The agent can then apply these suggestions to improve
7
+ * future performance.
8
+ *
9
+ * Architecture:
10
+ * Failure log → Pattern analysis → Prompt diff → Agent.applyDiff()
11
+ */
12
+
13
+ import * as fs from "fs";
14
+ import * as path from "path";
15
+ import { USER_CONFIG_DIR } from "./config";
16
+ import { getLogger } from "./logger";
17
+
18
+ const log = getLogger("evolve");
19
+
20
+ /* ═══════════════════════════════════════
21
+ Prompt diff — a suggested change
22
+ ═══════════════════════════════════════ */
23
+ export interface PromptDiff {
24
+ id: string;
25
+ ts: string;
26
+ agent: string;
27
+ reason: string; // Why this change is needed
28
+ before: string; // Old prompt fragment
29
+ after: string; // New prompt fragment
30
+ applied: boolean;
31
+ improvement?: string; // Measured improvement after applying
32
+ }
33
+
34
+ /* ═══════════════════════════════════════
35
+ Failure analysis
36
+ ═══════════════════════════════════════ */
37
+ export interface FailureAnalysis {
38
+ agent: string;
39
+ period: string;
40
+ totalCalls: number;
41
+ failureCount: number;
42
+ topFailures: Array<{ pattern: string; count: number }>;
43
+ suggestedDiffs: PromptDiff[];
44
+ }
45
+
46
+ const evolveDir = path.join(USER_CONFIG_DIR, "evolve");
47
+ function ensureDir() { if (!fs.existsSync(evolveDir)) fs.mkdirSync(evolveDir, { recursive: true }); }
48
+
49
+ /** Analyze recent failures from the learning module and suggest prompt improvements. */
50
+ export function analyzeFailures(
51
+ agent: string,
52
+ experiences: Array<{ pattern: string; solution: string; frequency: number; lastSeen: string }>,
53
+ systemPrompt: string
54
+ ): FailureAnalysis {
55
+ const recent = experiences.filter(e => {
56
+ try { return new Date(e.lastSeen).getTime() > Date.now() - 7 * 86400000; }
57
+ catch { return false; }
58
+ });
59
+
60
+ const topFailures = recent
61
+ .sort((a, b) => b.frequency - a.frequency)
62
+ .slice(0, 5)
63
+ .map(e => ({ pattern: e.pattern, count: e.frequency }));
64
+
65
+ const suggestedDiffs: PromptDiff[] = [];
66
+
67
+ // Rule-based suggestions from failure patterns
68
+ for (const f of topFailures) {
69
+ const lower = f.pattern.toLowerCase();
70
+
71
+ // Search storm → add search budget rule
72
+ if ((lower.includes("search") || lower.includes("web_search")) && f.count >= 3) {
73
+ const rule = `- 搜索不超过 5 轮。5 轮后直接基于已有信息综合回答。`;
74
+ if (!systemPrompt.includes("搜索不超过")) {
75
+ suggestedDiffs.push({
76
+ id: Math.random().toString(36).slice(2, 8),
77
+ ts: new Date().toISOString(), agent,
78
+ reason: `搜索风暴 (${f.count} 次重复搜索)`,
79
+ before: "", after: rule, applied: false,
80
+ });
81
+ }
82
+ }
83
+
84
+ // Empty response → add deliverable checklist
85
+ if ((lower.includes("empty") || lower.includes("placeholder") || lower.includes("完成了")) && f.count >= 2) {
86
+ const rule = `- 完成任务后,必须输出实际产物(代码/文件路径/数据),禁止只说"完成了"而无产出。`;
87
+ if (!systemPrompt.includes("必须输出实际产物")) {
88
+ suggestedDiffs.push({
89
+ id: Math.random().toString(36).slice(2, 8),
90
+ ts: new Date().toISOString(), agent,
91
+ reason: `空响应/占位 (${f.count} 次)`,
92
+ before: "", after: rule, applied: false,
93
+ });
94
+ }
95
+ }
96
+
97
+ // Tool not found → add tool discovery to prompt
98
+ if (lower.includes("does not exist") || lower.includes("tool") && lower.includes("not found")) {
99
+ const rule = `- 使用不熟悉的工具前先调 list_skills 查看可用工具列表。`;
100
+ if (!systemPrompt.includes("list_skills")) {
101
+ suggestedDiffs.push({
102
+ id: Math.random().toString(36).slice(2, 8),
103
+ ts: new Date().toISOString(), agent,
104
+ reason: `工具不存在 (${f.count} 次)`,
105
+ before: "", after: rule, applied: false,
106
+ });
107
+ }
108
+ }
109
+
110
+ // File not found → add path verification rule
111
+ if (lower.includes("file not found") || lower.includes("directory not found")) {
112
+ const rule = `- 文件操作前先用 list_directory 或 read_file 确认路径存在。`;
113
+ if (!systemPrompt.includes("确认路径存在")) {
114
+ suggestedDiffs.push({
115
+ id: Math.random().toString(36).slice(2, 8),
116
+ ts: new Date().toISOString(), agent,
117
+ reason: `文件路径错误 (${f.count} 次)`,
118
+ before: "", after: rule, applied: false,
119
+ });
120
+ }
121
+ }
122
+ }
123
+
124
+ // General rule: if failure rate > 20%, suggest self-review
125
+ const recentExperiences = recent.filter(e => {
126
+ try { return new Date(e.lastSeen).getTime() > Date.now() - 3 * 86400000; }
127
+ catch { return false; }
128
+ });
129
+
130
+ // Deduplicate suggestions
131
+ const seen = new Set<string>();
132
+ const uniqueDiffs = suggestedDiffs.filter(d => {
133
+ const key = d.after.slice(0, 30);
134
+ if (seen.has(key)) return false;
135
+ seen.add(key); return true;
136
+ });
137
+
138
+ // Max 3 suggestions per analysis
139
+ return {
140
+ agent, period: "last 7 days",
141
+ totalCalls: 0, failureCount: 0,
142
+ topFailures,
143
+ suggestedDiffs: uniqueDiffs.slice(0, 3),
144
+ };
145
+ }
146
+
147
+ /* ═══════════════════════════════════════
148
+ Apply prompt diff to agent
149
+ ═══════════════════════════════════════ */
150
+ export function applyPromptDiff(agent: any, diff: PromptDiff): boolean {
151
+ try {
152
+ const currentPrompt = agent.systemPrompt;
153
+ if (!diff.after || currentPrompt.includes(diff.after.slice(0, 20))) return false;
154
+
155
+ // Append the new rule after "## 行为守则" or "## Behavior" section
156
+ const marker = currentPrompt.includes("行为守则") ? "## 行为守则" : "## Behavior";
157
+ const idx = currentPrompt.indexOf(marker);
158
+ if (idx < 0) { agent.systemPrompt += "\n" + diff.after; }
159
+ else {
160
+ const insertPoint = currentPrompt.indexOf("\n", currentPrompt.indexOf("\n-", idx) + 1);
161
+ agent.systemPrompt = currentPrompt.slice(0, insertPoint) + "\n" + diff.after + "\n" + currentPrompt.slice(insertPoint);
162
+ }
163
+
164
+ diff.applied = true;
165
+ diff.improvement = "pending evaluation";
166
+
167
+ // Persist the diff
168
+ ensureDir();
169
+ const file = path.join(evolveDir, `${diff.agent}_diffs.jsonl`);
170
+ fs.appendFileSync(file, JSON.stringify(diff) + "\n");
171
+
172
+ agent.rebuildSystemPrompt();
173
+ return true;
174
+ } catch (e) {
175
+ log.warn("apply_prompt_diff_failed", { agent: diff.agent, error: String(e) });
176
+ return false;
177
+ }
178
+ }
179
+
180
+ /** Get all applied diffs for an agent. */
181
+ export function getAppliedDiffs(agent: string): PromptDiff[] {
182
+ const diffs: PromptDiff[] = [];
183
+ try {
184
+ const file = path.join(evolveDir, `${agent}_diffs.jsonl`);
185
+ if (fs.existsSync(file)) {
186
+ const lines = fs.readFileSync(file, "utf-8").split("\n").filter(Boolean);
187
+ for (const line of lines) { try { diffs.push(JSON.parse(line)); } catch { } }
188
+ }
189
+ } catch { /* ignore */ }
190
+ return diffs;
191
+ }
@@ -76,6 +76,13 @@ export class SystemContext {
76
76
  export function createSystemContext(): SystemContext {
77
77
  const config = loadConfig();
78
78
 
79
+ // session_start hooks — user-configured shell commands (see core/hooks)
80
+ try {
81
+ const { loadHooks, runSessionStartHooks } = require('./hooks');
82
+ const hooks = loadHooks(config);
83
+ if (hooks.sessionStart.length > 0) runSessionStartHooks(hooks);
84
+ } catch { /* hooks must never block startup */ }
85
+
79
86
  let workspacePath = '';
80
87
  try {
81
88
  const { resolveWorkspacePath, initWorkspace } = require('./workspace');
@@ -121,11 +128,17 @@ export function createSystemContext(): SystemContext {
121
128
  // Configure MCP manager
122
129
  let mcpManager: any = null;
123
130
  try {
124
- const { MCPManager, loadPersistedServers } = require('./mcp');
131
+ const { MCPManager, loadPersistedServers, loadProjectMcpJson } = require('./mcp');
125
132
  mcpManager = new MCPManager(baseToolRegistry);
126
133
  const persisted = loadPersistedServers();
127
134
  const mcpServers = (config as any).mcp?.servers || [];
128
- const allServers = [...mcpServers, ...persisted];
135
+ const projectServers = loadProjectMcpJson(); // Claude Code 标准 .mcp.json
136
+ // dedupe by name — project .mcp.json wins over runtime-added over config
137
+ const byName = new Map<string, any>();
138
+ for (const s of [...mcpServers, ...persisted, ...projectServers]) {
139
+ if (s?.name) byName.set(s.name, s);
140
+ }
141
+ const allServers = [...byName.values()];
129
142
  if (allServers.length > 0) {
130
143
  mcpManager.configure(allServers);
131
144
  }
@@ -182,6 +195,22 @@ export function createSystemContext(): SystemContext {
182
195
  log.warn('delegate_tool_not_available', { agent: name, error: String(e) });
183
196
  }
184
197
 
198
+ // Register model self-service tools (list_models / set_my_model)
199
+ try {
200
+ const { createModelTools } = require('../tools/model_tool');
201
+ for (const t of createModelTools(name, config)) agentRegistry.register(t);
202
+ } catch (e) {
203
+ log.warn('model_tools_not_available', { agent: name, error: String(e) });
204
+ }
205
+
206
+ // Register the task-checklist tool (todo_write)
207
+ try {
208
+ const { createTodoTool } = require('../tools/todo');
209
+ agentRegistry.register(createTodoTool(agent));
210
+ } catch (e) {
211
+ log.warn('todo_tool_not_available', { agent: name, error: String(e) });
212
+ }
213
+
185
214
  agents.set(name, agent);
186
215
  } catch (e) {
187
216
  log.warn('agent_creation_failed', { agent: name, error: String(e) });