skyloom 1.13.6 → 1.13.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.github/workflows/ci.yml +36 -36
- package/README.md +220 -159
- package/config/providers.yaml +39 -39
- package/config/skills/api_integrator/SKILL.md +15 -15
- package/config/skills/arch_designer/SKILL.md +13 -13
- package/config/skills/ci_cd_manager/SKILL.md +14 -14
- package/config/skills/code_analysis/SKILL.md +13 -13
- package/config/skills/code_generator/SKILL.md +12 -12
- package/config/skills/code_reviewer/SKILL.md +13 -13
- package/config/skills/content_writer/SKILL.md +14 -14
- package/config/skills/data_transformer/SKILL.md +15 -15
- package/config/skills/document_analysis/SKILL.md +13 -13
- package/config/skills/emotional_companion/SKILL.md +15 -15
- package/config/skills/performance_checker/SKILL.md +14 -14
- package/config/skills/security_auditor/SKILL.md +14 -14
- package/config/skills/self_evolve/SKILL.md +13 -13
- package/config/skills/sys_operator/SKILL.md +15 -15
- package/config/skills/task_planner/SKILL.md +14 -14
- package/config/skills/web_research/SKILL.md +14 -14
- package/config/skills/workflow_designer/SKILL.md +13 -13
- package/dist/agents/dew.js +52 -52
- package/dist/agents/fair.js +84 -84
- package/dist/agents/fog.js +30 -30
- package/dist/agents/frost.js +32 -32
- package/dist/agents/rain.js +32 -32
- package/dist/agents/snow.js +68 -68
- package/dist/cli/commands_md.d.ts +41 -0
- package/dist/cli/commands_md.d.ts.map +1 -0
- package/dist/cli/commands_md.js +140 -0
- package/dist/cli/commands_md.js.map +1 -0
- package/dist/cli/input_macros.d.ts +28 -0
- package/dist/cli/input_macros.d.ts.map +1 -0
- package/dist/cli/input_macros.js +120 -0
- package/dist/cli/input_macros.js.map +1 -0
- package/dist/cli/loom.d.ts +220 -0
- package/dist/cli/loom.d.ts.map +1 -0
- package/dist/cli/loom.js +1094 -0
- package/dist/cli/loom.js.map +1 -0
- package/dist/cli/loom_chat.d.ts +20 -0
- package/dist/cli/loom_chat.d.ts.map +1 -0
- package/dist/cli/loom_chat.js +685 -0
- package/dist/cli/loom_chat.js.map +1 -0
- package/dist/cli/main.js +310 -14
- package/dist/cli/main.js.map +1 -1
- package/dist/cli/tui.d.ts.map +1 -1
- package/dist/cli/tui.js +7 -1
- package/dist/cli/tui.js.map +1 -1
- package/dist/core/agent.d.ts +20 -0
- package/dist/core/agent.d.ts.map +1 -1
- package/dist/core/agent.js +199 -16
- package/dist/core/agent.js.map +1 -1
- package/dist/core/factory.d.ts.map +1 -1
- package/dist/core/factory.js +34 -2
- package/dist/core/factory.js.map +1 -1
- package/dist/core/file_checkpoint.d.ts +57 -0
- package/dist/core/file_checkpoint.d.ts.map +1 -0
- package/dist/core/file_checkpoint.js +162 -0
- package/dist/core/file_checkpoint.js.map +1 -0
- package/dist/core/hooks.d.ts +43 -0
- package/dist/core/hooks.d.ts.map +1 -0
- package/dist/core/hooks.js +110 -0
- package/dist/core/hooks.js.map +1 -0
- package/dist/core/llm.d.ts.map +1 -1
- package/dist/core/llm.js +15 -9
- package/dist/core/llm.js.map +1 -1
- package/dist/core/longdoc.js +5 -5
- package/dist/core/mcp.d.ts +16 -0
- package/dist/core/mcp.d.ts.map +1 -1
- package/dist/core/mcp.js +55 -0
- package/dist/core/mcp.js.map +1 -1
- package/dist/core/model_config.d.ts +40 -0
- package/dist/core/model_config.d.ts.map +1 -0
- package/dist/core/model_config.js +191 -0
- package/dist/core/model_config.js.map +1 -0
- package/dist/core/skill.d.ts +7 -0
- package/dist/core/skill.d.ts.map +1 -1
- package/dist/core/skill.js +47 -0
- package/dist/core/skill.js.map +1 -1
- package/dist/core/skymd.d.ts +39 -0
- package/dist/core/skymd.d.ts.map +1 -0
- package/dist/core/skymd.js +177 -0
- package/dist/core/skymd.js.map +1 -0
- package/dist/core/tool.d.ts +12 -0
- package/dist/core/tool.d.ts.map +1 -1
- package/dist/core/tool.js +30 -0
- package/dist/core/tool.js.map +1 -1
- package/dist/core/verify.d.ts +27 -0
- package/dist/core/verify.d.ts.map +1 -0
- package/dist/core/verify.js +62 -0
- package/dist/core/verify.js.map +1 -0
- package/dist/skills/loader.d.ts +22 -2
- package/dist/skills/loader.d.ts.map +1 -1
- package/dist/skills/loader.js +45 -15
- package/dist/skills/loader.js.map +1 -1
- package/dist/tools/builtin.d.ts.map +1 -1
- package/dist/tools/builtin.js +13 -3
- package/dist/tools/builtin.js.map +1 -1
- package/dist/tools/model_tool.d.ts +11 -0
- package/dist/tools/model_tool.d.ts.map +1 -0
- package/dist/tools/model_tool.js +71 -0
- package/dist/tools/model_tool.js.map +1 -0
- package/dist/tools/todo.d.ts +30 -0
- package/dist/tools/todo.d.ts.map +1 -0
- package/dist/tools/todo.js +78 -0
- package/dist/tools/todo.js.map +1 -0
- package/docs/AESTHETIC_DESIGN.md +152 -144
- package/docs/OPTIMIZATION_PLAN.md +178 -178
- package/package.json +68 -68
- package/scripts/install.js +48 -48
- package/scripts/link.js +10 -10
- package/setup.bat +79 -79
- package/skill-test-ty2fOA/test.md +10 -10
- package/src/agents/dew.ts +70 -70
- package/src/agents/fair.ts +102 -102
- package/src/agents/fog.ts +48 -48
- package/src/agents/frost.ts +50 -50
- package/src/agents/rain.ts +50 -50
- package/src/agents/snow.ts +239 -239
- package/src/cli/commands_md.ts +112 -0
- package/src/cli/input_macros.ts +83 -0
- package/src/cli/loom.ts +982 -0
- package/src/cli/loom_chat.ts +598 -0
- package/src/cli/main.ts +255 -9
- package/src/cli/mode.ts +58 -58
- package/src/cli/tui.ts +228 -222
- package/src/core/agent/guard.ts +134 -134
- package/src/core/agent/task.ts +100 -100
- package/src/core/agent.ts +195 -16
- package/src/core/arbitrate.ts +162 -162
- package/src/core/catalog.ts +178 -178
- package/src/core/checkpoint.ts +94 -94
- package/src/core/estimate.ts +104 -104
- package/src/core/evolve.ts +191 -191
- package/src/core/factory.ts +31 -2
- package/src/core/file_checkpoint.ts +136 -0
- package/src/core/filter.ts +103 -103
- package/src/core/graph.ts +156 -156
- package/src/core/hooks.ts +126 -0
- package/src/core/icons.ts +53 -53
- package/src/core/index.ts +37 -37
- package/src/core/learn.ts +146 -146
- package/src/core/llm.ts +15 -9
- package/src/core/longdoc.ts +155 -155
- package/src/core/mcp.ts +48 -0
- package/src/core/mcp_server.ts +176 -176
- package/src/core/model_config.ts +157 -0
- package/src/core/profile.ts +255 -255
- package/src/core/router.ts +124 -124
- package/src/core/sandbox.ts +142 -142
- package/src/core/security.ts +243 -243
- package/src/core/skill.ts +42 -0
- package/src/core/skymd.ts +143 -0
- package/src/core/theme.ts +65 -65
- package/src/core/tool.ts +30 -0
- package/src/core/tool_router.ts +193 -193
- package/src/core/vector.ts +152 -152
- package/src/core/verify.ts +71 -0
- package/src/core/workspace.ts +150 -150
- package/src/plugins/loader.ts +66 -66
- package/src/skills/loader.ts +45 -16
- package/src/sql.js.d.ts +29 -29
- package/src/tools/builtin.ts +13 -3
- package/src/tools/computer.ts +269 -269
- package/src/tools/delegate.ts +49 -49
- package/src/tools/model_tool.ts +74 -0
- package/src/tools/todo.ts +76 -0
- package/src/web/tts.ts +93 -93
- package/tests/agent.test.ts +159 -159
- package/tests/agent_helpers.test.ts +48 -48
- package/tests/bus.test.ts +121 -121
- package/tests/catalog.test.ts +86 -86
- package/tests/checkpoint_commands.test.ts +124 -0
- package/tests/claude_compat.test.ts +110 -0
- package/tests/config.test.ts +41 -41
- package/tests/guard.test.ts +75 -75
- package/tests/icons.test.ts +45 -45
- package/tests/loom.test.ts +248 -0
- package/tests/memory.test.ts +170 -170
- package/tests/model_config.test.ts +109 -0
- package/tests/router.test.ts +86 -86
- package/tests/schemas.test.ts +51 -51
- package/tests/semantic.test.ts +83 -83
- package/tests/setup.ts +10 -10
- package/tests/skill.test.ts +172 -172
- package/tests/skymd.test.ts +146 -0
- package/tests/task.test.ts +60 -60
- package/tests/todo_toolstats.test.ts +94 -0
- package/tests/tool.test.ts +108 -108
- package/tests/tool_router.test.ts +71 -71
- package/tests/tui.test.ts +67 -67
- package/vitest.config.ts +17 -17
- package/=12 +0 -0
- package/=8 +0 -0
package/src/core/agent/guard.ts
CHANGED
|
@@ -1,134 +1,134 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Anti-loop guard for the agent reasoning loop.
|
|
3
|
-
*
|
|
4
|
-
* Extracted from chatStreamImpl (Phase 3). Holds the per-turn heuristic state
|
|
5
|
-
* (recent response texts, tool-call signatures, tool outcomes + once-only hint
|
|
6
|
-
* flags) and, after each round, returns a decision: zero or more system
|
|
7
|
-
* "hints" to nudge the model, and optionally a hard `stop` (assistant note +
|
|
8
|
-
* a user-visible content line). The agent loop applies the decision — the guard
|
|
9
|
-
* itself has no side effects, which makes every branch unit-testable.
|
|
10
|
-
*
|
|
11
|
-
* A fresh LoopGuard is created per turn (state must not leak across turns).
|
|
12
|
-
*/
|
|
13
|
-
|
|
14
|
-
import type { ToolCall } from '../llm';
|
|
15
|
-
import {
|
|
16
|
-
toolCallSignature,
|
|
17
|
-
textSimilarity,
|
|
18
|
-
looksLikeFailedToolResult,
|
|
19
|
-
parseToolArgs,
|
|
20
|
-
SIG_WINDOW,
|
|
21
|
-
SIG_LOOP_HINT,
|
|
22
|
-
SIG_LOOP_HARDSTOP,
|
|
23
|
-
} from '../agent_helpers';
|
|
24
|
-
|
|
25
|
-
/** A hard stop: record `note` as an assistant message, then surface `contentLine`. */
|
|
26
|
-
export interface GuardStop {
|
|
27
|
-
note: string;
|
|
28
|
-
contentLine: string;
|
|
29
|
-
}
|
|
30
|
-
|
|
31
|
-
/** The guard's decision for one round. `hints` apply in order; `stop` ends the turn. */
|
|
32
|
-
export interface GuardDecision {
|
|
33
|
-
hints: string[];
|
|
34
|
-
stop?: GuardStop;
|
|
35
|
-
}
|
|
36
|
-
|
|
37
|
-
/** Minimal shape of a tool execution result the guard inspects. */
|
|
38
|
-
export interface GuardExecResult {
|
|
39
|
-
toolName: string;
|
|
40
|
-
success: boolean;
|
|
41
|
-
result: string;
|
|
42
|
-
}
|
|
43
|
-
|
|
44
|
-
export class LoopGuard {
|
|
45
|
-
private recentResponseTexts: string[] = [];
|
|
46
|
-
private recentToolSigs: string[] = [];
|
|
47
|
-
private recentToolOutcomes: boolean[] = [];
|
|
48
|
-
private searchCount = 0; // cumulative search/fetch calls this turn (not window-bounded)
|
|
49
|
-
private repetitionHintInjected = false;
|
|
50
|
-
private toolLoopHintInjected = false; // shared by tool-signature loop + search-storm
|
|
51
|
-
private stuckHintInjected = false;
|
|
52
|
-
|
|
53
|
-
/**
|
|
54
|
-
* Observe one completed round. Mutates internal state and returns the
|
|
55
|
-
* hints/stop decision. Evaluation order (and the shared hint flag) mirrors
|
|
56
|
-
* the original inline logic exactly.
|
|
57
|
-
*/
|
|
58
|
-
observe(
|
|
59
|
-
roundContent: string,
|
|
60
|
-
toolCallsReceived: ToolCall[],
|
|
61
|
-
execResults: Array<GuardExecResult | null>
|
|
62
|
-
): GuardDecision {
|
|
63
|
-
const hints: string[] = [];
|
|
64
|
-
|
|
65
|
-
// 1. Narration-loop: response too similar to a recent one.
|
|
66
|
-
const normalizedRound = (roundContent || '').trim();
|
|
67
|
-
if (normalizedRound && this.recentResponseTexts.length > 0) {
|
|
68
|
-
const highSim = this.recentResponseTexts.slice(-2).some(prev => textSimilarity(normalizedRound, prev) >= 0.7);
|
|
69
|
-
if (highSim && !this.repetitionHintInjected) {
|
|
70
|
-
hints.push('[Stop narrating] Your last response is highly similar to your previous one. Stop writing prose. Either: (1) emit ONLY the next tool call, or (2) output the final deliverable.');
|
|
71
|
-
this.repetitionHintInjected = true;
|
|
72
|
-
}
|
|
73
|
-
}
|
|
74
|
-
this.recentResponseTexts.push(normalizedRound);
|
|
75
|
-
if (this.recentResponseTexts.length > 3) this.recentResponseTexts.shift();
|
|
76
|
-
|
|
77
|
-
// 2. Tool-signature loop: same call repeated within the window.
|
|
78
|
-
for (const tc of toolCallsReceived) {
|
|
79
|
-
const tName = tc.function.name;
|
|
80
|
-
if (['task_done', 'list_skills', 'use_skill'].includes(tName)) continue;
|
|
81
|
-
if (['web_search', 'fetch_page', 'http_get'].includes(tName)) this.searchCount++;
|
|
82
|
-
const rawArgs = tc.function.arguments;
|
|
83
|
-
const tArgs = typeof rawArgs === 'string' ? parseToolArgs(rawArgs) : rawArgs;
|
|
84
|
-
const sig = toolCallSignature(tName, tArgs);
|
|
85
|
-
if (sig) this.recentToolSigs.push(sig);
|
|
86
|
-
}
|
|
87
|
-
if (this.recentToolSigs.length > SIG_WINDOW) {
|
|
88
|
-
this.recentToolSigs.splice(0, this.recentToolSigs.length - SIG_WINDOW);
|
|
89
|
-
}
|
|
90
|
-
if (this.recentToolSigs.length > 0) {
|
|
91
|
-
const counts = new Map<string, number>();
|
|
92
|
-
for (const s of this.recentToolSigs) counts.set(s, (counts.get(s) || 0) + 1);
|
|
93
|
-
let topSig = '';
|
|
94
|
-
let topCount = 0;
|
|
95
|
-
for (const [s, c] of counts) { if (c > topCount) { topSig = s; topCount = c; } }
|
|
96
|
-
if (topCount >= SIG_LOOP_HINT && !this.toolLoopHintInjected) {
|
|
97
|
-
hints.push(`[Tool loop] You have called \`${topSig}\` ${topCount}x in the last ${this.recentToolSigs.length} tool calls — you are iterating without converging. STOP repeating it.`);
|
|
98
|
-
this.toolLoopHintInjected = true;
|
|
99
|
-
}
|
|
100
|
-
if (topCount >= SIG_LOOP_HARDSTOP) {
|
|
101
|
-
return { hints, stop: { note: `I have repeated \`${topSig}\` ${topCount} times without converging. Stopping.`, contentLine: `\n\n[stuck] tool \`${topSig}\` repeated ${topCount}x — stopping.` } };
|
|
102
|
-
}
|
|
103
|
-
}
|
|
104
|
-
|
|
105
|
-
// 3. Stuck-loop: most/all recent tool calls failed.
|
|
106
|
-
for (const r of execResults) {
|
|
107
|
-
if (!r || r.toolName === 'task_done') continue;
|
|
108
|
-
const failed = !r.success || (typeof r.result === 'string' && looksLikeFailedToolResult(r.result));
|
|
109
|
-
this.recentToolOutcomes.push(!failed);
|
|
110
|
-
// Keep 8 so the "all recent calls failed" (>=8) hard-stop below is reachable.
|
|
111
|
-
if (this.recentToolOutcomes.length > 8) this.recentToolOutcomes.shift();
|
|
112
|
-
}
|
|
113
|
-
if (!this.stuckHintInjected && this.recentToolOutcomes.length >= 5 &&
|
|
114
|
-
this.recentToolOutcomes.filter(Boolean).length <= 1) {
|
|
115
|
-
hints.push('[Recovery hint] Your last several tool calls have mostly failed. Synthesize a partial answer from what worked or ask the user for guidance.');
|
|
116
|
-
this.stuckHintInjected = true;
|
|
117
|
-
}
|
|
118
|
-
if (this.recentToolOutcomes.length >= 8 && this.recentToolOutcomes.every(x => !x)) {
|
|
119
|
-
return { hints, stop: { note: 'Every recent tool call failed. Please give me more context.', contentLine: '\n\n[stuck] every recent tool call failed — stopping.\n' } };
|
|
120
|
-
}
|
|
121
|
-
|
|
122
|
-
// 4. Search-storm: cumulative search/fetch calls this turn (not bounded by
|
|
123
|
-
// SIG_WINDOW, so the >=12 hard-stop is actually reachable).
|
|
124
|
-
if (this.searchCount >= 8 && !this.toolLoopHintInjected) {
|
|
125
|
-
hints.push(`[Search storm] ${this.searchCount} search calls. STOP searching and synthesize.`);
|
|
126
|
-
this.toolLoopHintInjected = true;
|
|
127
|
-
}
|
|
128
|
-
if (this.searchCount >= 12) {
|
|
129
|
-
return { hints, stop: { note: 'Too many search requests. Synthesizing best answer.', contentLine: `\n\n[stuck] excessive web searching (${this.searchCount} calls) — stopping.\n` } };
|
|
130
|
-
}
|
|
131
|
-
|
|
132
|
-
return { hints };
|
|
133
|
-
}
|
|
134
|
-
}
|
|
1
|
+
/**
|
|
2
|
+
* Anti-loop guard for the agent reasoning loop.
|
|
3
|
+
*
|
|
4
|
+
* Extracted from chatStreamImpl (Phase 3). Holds the per-turn heuristic state
|
|
5
|
+
* (recent response texts, tool-call signatures, tool outcomes + once-only hint
|
|
6
|
+
* flags) and, after each round, returns a decision: zero or more system
|
|
7
|
+
* "hints" to nudge the model, and optionally a hard `stop` (assistant note +
|
|
8
|
+
* a user-visible content line). The agent loop applies the decision — the guard
|
|
9
|
+
* itself has no side effects, which makes every branch unit-testable.
|
|
10
|
+
*
|
|
11
|
+
* A fresh LoopGuard is created per turn (state must not leak across turns).
|
|
12
|
+
*/
|
|
13
|
+
|
|
14
|
+
import type { ToolCall } from '../llm';
|
|
15
|
+
import {
|
|
16
|
+
toolCallSignature,
|
|
17
|
+
textSimilarity,
|
|
18
|
+
looksLikeFailedToolResult,
|
|
19
|
+
parseToolArgs,
|
|
20
|
+
SIG_WINDOW,
|
|
21
|
+
SIG_LOOP_HINT,
|
|
22
|
+
SIG_LOOP_HARDSTOP,
|
|
23
|
+
} from '../agent_helpers';
|
|
24
|
+
|
|
25
|
+
/** A hard stop: record `note` as an assistant message, then surface `contentLine`. */
|
|
26
|
+
export interface GuardStop {
|
|
27
|
+
note: string;
|
|
28
|
+
contentLine: string;
|
|
29
|
+
}
|
|
30
|
+
|
|
31
|
+
/** The guard's decision for one round. `hints` apply in order; `stop` ends the turn. */
|
|
32
|
+
export interface GuardDecision {
|
|
33
|
+
hints: string[];
|
|
34
|
+
stop?: GuardStop;
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
/** Minimal shape of a tool execution result the guard inspects. */
|
|
38
|
+
export interface GuardExecResult {
|
|
39
|
+
toolName: string;
|
|
40
|
+
success: boolean;
|
|
41
|
+
result: string;
|
|
42
|
+
}
|
|
43
|
+
|
|
44
|
+
export class LoopGuard {
|
|
45
|
+
private recentResponseTexts: string[] = [];
|
|
46
|
+
private recentToolSigs: string[] = [];
|
|
47
|
+
private recentToolOutcomes: boolean[] = [];
|
|
48
|
+
private searchCount = 0; // cumulative search/fetch calls this turn (not window-bounded)
|
|
49
|
+
private repetitionHintInjected = false;
|
|
50
|
+
private toolLoopHintInjected = false; // shared by tool-signature loop + search-storm
|
|
51
|
+
private stuckHintInjected = false;
|
|
52
|
+
|
|
53
|
+
/**
|
|
54
|
+
* Observe one completed round. Mutates internal state and returns the
|
|
55
|
+
* hints/stop decision. Evaluation order (and the shared hint flag) mirrors
|
|
56
|
+
* the original inline logic exactly.
|
|
57
|
+
*/
|
|
58
|
+
observe(
|
|
59
|
+
roundContent: string,
|
|
60
|
+
toolCallsReceived: ToolCall[],
|
|
61
|
+
execResults: Array<GuardExecResult | null>
|
|
62
|
+
): GuardDecision {
|
|
63
|
+
const hints: string[] = [];
|
|
64
|
+
|
|
65
|
+
// 1. Narration-loop: response too similar to a recent one.
|
|
66
|
+
const normalizedRound = (roundContent || '').trim();
|
|
67
|
+
if (normalizedRound && this.recentResponseTexts.length > 0) {
|
|
68
|
+
const highSim = this.recentResponseTexts.slice(-2).some(prev => textSimilarity(normalizedRound, prev) >= 0.7);
|
|
69
|
+
if (highSim && !this.repetitionHintInjected) {
|
|
70
|
+
hints.push('[Stop narrating] Your last response is highly similar to your previous one. Stop writing prose. Either: (1) emit ONLY the next tool call, or (2) output the final deliverable.');
|
|
71
|
+
this.repetitionHintInjected = true;
|
|
72
|
+
}
|
|
73
|
+
}
|
|
74
|
+
this.recentResponseTexts.push(normalizedRound);
|
|
75
|
+
if (this.recentResponseTexts.length > 3) this.recentResponseTexts.shift();
|
|
76
|
+
|
|
77
|
+
// 2. Tool-signature loop: same call repeated within the window.
|
|
78
|
+
for (const tc of toolCallsReceived) {
|
|
79
|
+
const tName = tc.function.name;
|
|
80
|
+
if (['task_done', 'list_skills', 'use_skill'].includes(tName)) continue;
|
|
81
|
+
if (['web_search', 'fetch_page', 'http_get'].includes(tName)) this.searchCount++;
|
|
82
|
+
const rawArgs = tc.function.arguments;
|
|
83
|
+
const tArgs = typeof rawArgs === 'string' ? parseToolArgs(rawArgs) : rawArgs;
|
|
84
|
+
const sig = toolCallSignature(tName, tArgs);
|
|
85
|
+
if (sig) this.recentToolSigs.push(sig);
|
|
86
|
+
}
|
|
87
|
+
if (this.recentToolSigs.length > SIG_WINDOW) {
|
|
88
|
+
this.recentToolSigs.splice(0, this.recentToolSigs.length - SIG_WINDOW);
|
|
89
|
+
}
|
|
90
|
+
if (this.recentToolSigs.length > 0) {
|
|
91
|
+
const counts = new Map<string, number>();
|
|
92
|
+
for (const s of this.recentToolSigs) counts.set(s, (counts.get(s) || 0) + 1);
|
|
93
|
+
let topSig = '';
|
|
94
|
+
let topCount = 0;
|
|
95
|
+
for (const [s, c] of counts) { if (c > topCount) { topSig = s; topCount = c; } }
|
|
96
|
+
if (topCount >= SIG_LOOP_HINT && !this.toolLoopHintInjected) {
|
|
97
|
+
hints.push(`[Tool loop] You have called \`${topSig}\` ${topCount}x in the last ${this.recentToolSigs.length} tool calls — you are iterating without converging. STOP repeating it.`);
|
|
98
|
+
this.toolLoopHintInjected = true;
|
|
99
|
+
}
|
|
100
|
+
if (topCount >= SIG_LOOP_HARDSTOP) {
|
|
101
|
+
return { hints, stop: { note: `I have repeated \`${topSig}\` ${topCount} times without converging. Stopping.`, contentLine: `\n\n[stuck] tool \`${topSig}\` repeated ${topCount}x — stopping.` } };
|
|
102
|
+
}
|
|
103
|
+
}
|
|
104
|
+
|
|
105
|
+
// 3. Stuck-loop: most/all recent tool calls failed.
|
|
106
|
+
for (const r of execResults) {
|
|
107
|
+
if (!r || r.toolName === 'task_done') continue;
|
|
108
|
+
const failed = !r.success || (typeof r.result === 'string' && looksLikeFailedToolResult(r.result));
|
|
109
|
+
this.recentToolOutcomes.push(!failed);
|
|
110
|
+
// Keep 8 so the "all recent calls failed" (>=8) hard-stop below is reachable.
|
|
111
|
+
if (this.recentToolOutcomes.length > 8) this.recentToolOutcomes.shift();
|
|
112
|
+
}
|
|
113
|
+
if (!this.stuckHintInjected && this.recentToolOutcomes.length >= 5 &&
|
|
114
|
+
this.recentToolOutcomes.filter(Boolean).length <= 1) {
|
|
115
|
+
hints.push('[Recovery hint] Your last several tool calls have mostly failed. Synthesize a partial answer from what worked or ask the user for guidance.');
|
|
116
|
+
this.stuckHintInjected = true;
|
|
117
|
+
}
|
|
118
|
+
if (this.recentToolOutcomes.length >= 8 && this.recentToolOutcomes.every(x => !x)) {
|
|
119
|
+
return { hints, stop: { note: 'Every recent tool call failed. Please give me more context.', contentLine: '\n\n[stuck] every recent tool call failed — stopping.\n' } };
|
|
120
|
+
}
|
|
121
|
+
|
|
122
|
+
// 4. Search-storm: cumulative search/fetch calls this turn (not bounded by
|
|
123
|
+
// SIG_WINDOW, so the >=12 hard-stop is actually reachable).
|
|
124
|
+
if (this.searchCount >= 8 && !this.toolLoopHintInjected) {
|
|
125
|
+
hints.push(`[Search storm] ${this.searchCount} search calls. STOP searching and synthesize.`);
|
|
126
|
+
this.toolLoopHintInjected = true;
|
|
127
|
+
}
|
|
128
|
+
if (this.searchCount >= 12) {
|
|
129
|
+
return { hints, stop: { note: 'Too many search requests. Synthesizing best answer.', contentLine: `\n\n[stuck] excessive web searching (${this.searchCount} calls) — stopping.\n` } };
|
|
130
|
+
}
|
|
131
|
+
|
|
132
|
+
return { hints };
|
|
133
|
+
}
|
|
134
|
+
}
|
package/src/core/agent/task.ts
CHANGED
|
@@ -1,100 +1,100 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Agent domain model — states and the Task DAG node.
|
|
3
|
-
*
|
|
4
|
-
* Extracted from the monolithic agent.ts (Phase 3). Pure, dependency-free,
|
|
5
|
-
* and unit-testable in isolation. `agent.ts` re-exports these so external
|
|
6
|
-
* importers of `../core/agent` are unaffected.
|
|
7
|
-
*/
|
|
8
|
-
|
|
9
|
-
/** Lifecycle state of a running agent. */
|
|
10
|
-
export enum AgentState {
|
|
11
|
-
IDLE = 'idle',
|
|
12
|
-
THINKING = 'thinking',
|
|
13
|
-
ACTING = 'acting',
|
|
14
|
-
WAITING = 'waiting',
|
|
15
|
-
ERROR = 'error',
|
|
16
|
-
}
|
|
17
|
-
|
|
18
|
-
/** Lifecycle state of an orchestrated task. */
|
|
19
|
-
export enum TaskState {
|
|
20
|
-
PENDING = 'pending',
|
|
21
|
-
RUNNING = 'running',
|
|
22
|
-
COMPLETED = 'completed',
|
|
23
|
-
FAILED = 'failed',
|
|
24
|
-
SKIPPED = 'skipped',
|
|
25
|
-
}
|
|
26
|
-
|
|
27
|
-
/** Allowed task state transitions. A terminal state has no outgoing edges. */
|
|
28
|
-
export const VALID_TRANSITIONS: Record<TaskState, Set<TaskState>> = {
|
|
29
|
-
[TaskState.PENDING]: new Set([TaskState.RUNNING, TaskState.SKIPPED, TaskState.FAILED]),
|
|
30
|
-
[TaskState.RUNNING]: new Set([TaskState.RUNNING, TaskState.COMPLETED, TaskState.FAILED]),
|
|
31
|
-
[TaskState.FAILED]: new Set([TaskState.RUNNING, TaskState.SKIPPED]),
|
|
32
|
-
[TaskState.COMPLETED]: new Set(),
|
|
33
|
-
[TaskState.SKIPPED]: new Set(),
|
|
34
|
-
};
|
|
35
|
-
|
|
36
|
-
/** A node in the orchestration DAG. */
|
|
37
|
-
export class Task {
|
|
38
|
-
id: string;
|
|
39
|
-
description: string;
|
|
40
|
-
assignedTo: string | null = null;
|
|
41
|
-
parentId: string | null = null;
|
|
42
|
-
dependsOn: string[] = [];
|
|
43
|
-
status: TaskState = TaskState.PENDING;
|
|
44
|
-
priority: number = 0;
|
|
45
|
-
result: string | null = null;
|
|
46
|
-
metadata: Record<string, any> = {};
|
|
47
|
-
|
|
48
|
-
constructor(config: {
|
|
49
|
-
id: string;
|
|
50
|
-
description: string;
|
|
51
|
-
assignedTo?: string | null;
|
|
52
|
-
parentId?: string | null;
|
|
53
|
-
dependsOn?: string[];
|
|
54
|
-
status?: TaskState;
|
|
55
|
-
priority?: number;
|
|
56
|
-
result?: string | null;
|
|
57
|
-
metadata?: Record<string, any>;
|
|
58
|
-
}) {
|
|
59
|
-
this.id = config.id;
|
|
60
|
-
this.description = config.description;
|
|
61
|
-
this.assignedTo = config.assignedTo ?? null;
|
|
62
|
-
this.parentId = config.parentId ?? null;
|
|
63
|
-
this.dependsOn = config.dependsOn || [];
|
|
64
|
-
this.status = config.status ?? TaskState.PENDING;
|
|
65
|
-
this.priority = config.priority ?? 0;
|
|
66
|
-
this.result = config.result ?? null;
|
|
67
|
-
this.metadata = config.metadata || {};
|
|
68
|
-
}
|
|
69
|
-
|
|
70
|
-
transitionTo(newState: TaskState): void {
|
|
71
|
-
const allowed = VALID_TRANSITIONS[this.status] || new Set();
|
|
72
|
-
if (!allowed.has(newState)) {
|
|
73
|
-
throw new Error(
|
|
74
|
-
`Invalid task state transition: ${this.status} -> ${newState}`
|
|
75
|
-
);
|
|
76
|
-
}
|
|
77
|
-
this.status = newState;
|
|
78
|
-
}
|
|
79
|
-
|
|
80
|
-
get allDeps(): string[] {
|
|
81
|
-
const deps = [...this.dependsOn];
|
|
82
|
-
if (this.parentId && !deps.includes(this.parentId)) {
|
|
83
|
-
deps.push(this.parentId);
|
|
84
|
-
}
|
|
85
|
-
return deps;
|
|
86
|
-
}
|
|
87
|
-
}
|
|
88
|
-
|
|
89
|
-
/** Result of executing a single task. */
|
|
90
|
-
export class TaskResult {
|
|
91
|
-
success: boolean;
|
|
92
|
-
content: string;
|
|
93
|
-
data: Record<string, any> = {};
|
|
94
|
-
|
|
95
|
-
constructor(success: boolean, content: string, data?: Record<string, any>) {
|
|
96
|
-
this.success = success;
|
|
97
|
-
this.content = content;
|
|
98
|
-
this.data = data || {};
|
|
99
|
-
}
|
|
100
|
-
}
|
|
1
|
+
/**
|
|
2
|
+
* Agent domain model — states and the Task DAG node.
|
|
3
|
+
*
|
|
4
|
+
* Extracted from the monolithic agent.ts (Phase 3). Pure, dependency-free,
|
|
5
|
+
* and unit-testable in isolation. `agent.ts` re-exports these so external
|
|
6
|
+
* importers of `../core/agent` are unaffected.
|
|
7
|
+
*/
|
|
8
|
+
|
|
9
|
+
/** Lifecycle state of a running agent. */
|
|
10
|
+
export enum AgentState {
|
|
11
|
+
IDLE = 'idle',
|
|
12
|
+
THINKING = 'thinking',
|
|
13
|
+
ACTING = 'acting',
|
|
14
|
+
WAITING = 'waiting',
|
|
15
|
+
ERROR = 'error',
|
|
16
|
+
}
|
|
17
|
+
|
|
18
|
+
/** Lifecycle state of an orchestrated task. */
|
|
19
|
+
export enum TaskState {
|
|
20
|
+
PENDING = 'pending',
|
|
21
|
+
RUNNING = 'running',
|
|
22
|
+
COMPLETED = 'completed',
|
|
23
|
+
FAILED = 'failed',
|
|
24
|
+
SKIPPED = 'skipped',
|
|
25
|
+
}
|
|
26
|
+
|
|
27
|
+
/** Allowed task state transitions. A terminal state has no outgoing edges. */
|
|
28
|
+
export const VALID_TRANSITIONS: Record<TaskState, Set<TaskState>> = {
|
|
29
|
+
[TaskState.PENDING]: new Set([TaskState.RUNNING, TaskState.SKIPPED, TaskState.FAILED]),
|
|
30
|
+
[TaskState.RUNNING]: new Set([TaskState.RUNNING, TaskState.COMPLETED, TaskState.FAILED]),
|
|
31
|
+
[TaskState.FAILED]: new Set([TaskState.RUNNING, TaskState.SKIPPED]),
|
|
32
|
+
[TaskState.COMPLETED]: new Set(),
|
|
33
|
+
[TaskState.SKIPPED]: new Set(),
|
|
34
|
+
};
|
|
35
|
+
|
|
36
|
+
/** A node in the orchestration DAG. */
|
|
37
|
+
export class Task {
|
|
38
|
+
id: string;
|
|
39
|
+
description: string;
|
|
40
|
+
assignedTo: string | null = null;
|
|
41
|
+
parentId: string | null = null;
|
|
42
|
+
dependsOn: string[] = [];
|
|
43
|
+
status: TaskState = TaskState.PENDING;
|
|
44
|
+
priority: number = 0;
|
|
45
|
+
result: string | null = null;
|
|
46
|
+
metadata: Record<string, any> = {};
|
|
47
|
+
|
|
48
|
+
constructor(config: {
|
|
49
|
+
id: string;
|
|
50
|
+
description: string;
|
|
51
|
+
assignedTo?: string | null;
|
|
52
|
+
parentId?: string | null;
|
|
53
|
+
dependsOn?: string[];
|
|
54
|
+
status?: TaskState;
|
|
55
|
+
priority?: number;
|
|
56
|
+
result?: string | null;
|
|
57
|
+
metadata?: Record<string, any>;
|
|
58
|
+
}) {
|
|
59
|
+
this.id = config.id;
|
|
60
|
+
this.description = config.description;
|
|
61
|
+
this.assignedTo = config.assignedTo ?? null;
|
|
62
|
+
this.parentId = config.parentId ?? null;
|
|
63
|
+
this.dependsOn = config.dependsOn || [];
|
|
64
|
+
this.status = config.status ?? TaskState.PENDING;
|
|
65
|
+
this.priority = config.priority ?? 0;
|
|
66
|
+
this.result = config.result ?? null;
|
|
67
|
+
this.metadata = config.metadata || {};
|
|
68
|
+
}
|
|
69
|
+
|
|
70
|
+
transitionTo(newState: TaskState): void {
|
|
71
|
+
const allowed = VALID_TRANSITIONS[this.status] || new Set();
|
|
72
|
+
if (!allowed.has(newState)) {
|
|
73
|
+
throw new Error(
|
|
74
|
+
`Invalid task state transition: ${this.status} -> ${newState}`
|
|
75
|
+
);
|
|
76
|
+
}
|
|
77
|
+
this.status = newState;
|
|
78
|
+
}
|
|
79
|
+
|
|
80
|
+
get allDeps(): string[] {
|
|
81
|
+
const deps = [...this.dependsOn];
|
|
82
|
+
if (this.parentId && !deps.includes(this.parentId)) {
|
|
83
|
+
deps.push(this.parentId);
|
|
84
|
+
}
|
|
85
|
+
return deps;
|
|
86
|
+
}
|
|
87
|
+
}
|
|
88
|
+
|
|
89
|
+
/** Result of executing a single task. */
|
|
90
|
+
export class TaskResult {
|
|
91
|
+
success: boolean;
|
|
92
|
+
content: string;
|
|
93
|
+
data: Record<string, any> = {};
|
|
94
|
+
|
|
95
|
+
constructor(success: boolean, content: string, data?: Record<string, any>) {
|
|
96
|
+
this.success = success;
|
|
97
|
+
this.content = content;
|
|
98
|
+
this.data = data || {};
|
|
99
|
+
}
|
|
100
|
+
}
|