ultimate-pi 0.3.0 → 0.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.agents/skills/harness-decisions/SKILL.md +37 -0
- package/.agents/skills/harness-governor/SKILL.md +1 -1
- package/.agents/skills/harness-orchestration/SKILL.md +54 -0
- package/.agents/skills/harness-plan/SKILL.md +4 -3
- package/.agents/skills/harness-sentrux-setup/SKILL.md +57 -0
- package/.agents/skills/scrapling-web/SKILL.md +93 -0
- package/.pi/PACKAGING.md +2 -2
- package/.pi/SYSTEM.md +13 -15
- package/.pi/agents/harness/adversary.md +3 -0
- package/.pi/agents/harness/evaluator.md +3 -0
- package/.pi/agents/harness/executor.md +4 -1
- package/.pi/agents/harness/meta-optimizer.md +2 -1
- package/.pi/agents/harness/planner.md +22 -1
- package/.pi/agents/harness/sentrux-bootstrap.md +42 -0
- package/.pi/agents/harness/tie-breaker.md +2 -0
- package/.pi/extensions/harness-ask-user.ts +74 -0
- package/.pi/extensions/harness-subagents.ts +9 -0
- package/.pi/extensions/lib/ask-user/dialog.ts +260 -0
- package/.pi/extensions/lib/ask-user/fallback.ts +78 -0
- package/.pi/extensions/lib/ask-user/render.ts +66 -0
- package/.pi/extensions/lib/ask-user/schema.ts +69 -0
- package/.pi/extensions/lib/ask-user/types.ts +41 -0
- package/.pi/extensions/lib/ask-user/validate-core.mjs +79 -0
- package/.pi/extensions/lib/ask-user/validate.ts +92 -0
- package/.pi/extensions/lib/harness-subagents/agent-loader.ts +126 -0
- package/.pi/extensions/lib/harness-subagents/agent-manifest.ts +119 -0
- package/.pi/extensions/lib/harness-subagents/agent-parser.ts +87 -0
- package/.pi/extensions/lib/harness-subagents/blackboard-tool.ts +118 -0
- package/.pi/extensions/lib/harness-subagents/blackboard.ts +175 -0
- package/.pi/extensions/lib/harness-subagents/spawn-policy.ts +27 -0
- package/.pi/extensions/lib/harness-subagents/types-blackboard.ts +27 -0
- package/.pi/extensions/lib/harness-subagents/vendored/agent-manager.ts +553 -0
- package/.pi/extensions/lib/harness-subagents/vendored/agent-runner.ts +637 -0
- package/.pi/extensions/lib/harness-subagents/vendored/agent-types.ts +175 -0
- package/.pi/extensions/lib/harness-subagents/vendored/context.ts +59 -0
- package/.pi/extensions/lib/harness-subagents/vendored/cross-extension-rpc.ts +134 -0
- package/.pi/extensions/lib/harness-subagents/vendored/custom-agents.ts +5 -0
- package/.pi/extensions/lib/harness-subagents/vendored/default-agents.ts +123 -0
- package/.pi/extensions/lib/harness-subagents/vendored/env.ts +43 -0
- package/.pi/extensions/lib/harness-subagents/vendored/group-join.ts +144 -0
- package/.pi/extensions/lib/harness-subagents/vendored/index.ts +2447 -0
- package/.pi/extensions/lib/harness-subagents/vendored/invocation-config.ts +52 -0
- package/.pi/extensions/lib/harness-subagents/vendored/memory.ts +182 -0
- package/.pi/extensions/lib/harness-subagents/vendored/model-resolver.ts +92 -0
- package/.pi/extensions/lib/harness-subagents/vendored/output-file.ts +115 -0
- package/.pi/extensions/lib/harness-subagents/vendored/prompts.ts +103 -0
- package/.pi/extensions/lib/harness-subagents/vendored/schedule-store.ts +177 -0
- package/.pi/extensions/lib/harness-subagents/vendored/schedule.ts +416 -0
- package/.pi/extensions/lib/harness-subagents/vendored/settings.ts +210 -0
- package/.pi/extensions/lib/harness-subagents/vendored/skill-loader.ts +108 -0
- package/.pi/extensions/lib/harness-subagents/vendored/types.ts +187 -0
- package/.pi/extensions/lib/harness-subagents/vendored/ui/agent-widget.ts +637 -0
- package/.pi/extensions/lib/harness-subagents/vendored/ui/conversation-viewer.ts +324 -0
- package/.pi/extensions/lib/harness-subagents/vendored/ui/schedule-menu.ts +110 -0
- package/.pi/extensions/lib/harness-subagents/vendored/usage.ts +71 -0
- package/.pi/extensions/lib/harness-subagents/vendored/worktree.ts +195 -0
- package/.pi/extensions/policy-gate.ts +18 -0
- package/.pi/extensions/provider-payload-sanitize.ts +66 -0
- package/.pi/harness/README.md +2 -1
- package/.pi/harness/agents.manifest.json +80 -0
- package/.pi/harness/docs/adrs/0009-sentrux-rules-lifecycle.md +9 -5
- package/.pi/harness/env.harness.template +28 -0
- package/.pi/harness/sentrux/architecture.manifest.json +6 -1
- package/.pi/prompts/harness-auto.md +2 -2
- package/.pi/prompts/harness-plan.md +2 -2
- package/.pi/prompts/harness-router-tune.md +2 -2
- package/.pi/prompts/harness-run.md +1 -0
- package/.pi/prompts/harness-setup.md +182 -339
- package/.pi/scripts/README.md +6 -1
- package/.pi/scripts/harness-agents-manifest.mjs +123 -0
- package/.pi/scripts/harness-cli-verify.sh +60 -11
- package/.pi/scripts/harness-generate-model-router.mjs +242 -0
- package/.pi/scripts/harness-graphify-bootstrap.sh +1 -6
- package/.pi/scripts/harness-resolve-up-pkg.mjs +71 -0
- package/.pi/scripts/harness-seed-project-contracts.mjs +81 -0
- package/.pi/scripts/harness-sentrux-bootstrap.mjs +146 -0
- package/.pi/scripts/harness-sync-env.mjs +148 -0
- package/.pi/scripts/harness-verify.mjs +19 -0
- package/.pi/scripts/harness-web-search.md +33 -0
- package/.pi/scripts/harness-web.py +177 -0
- package/.pi/scripts/harness_web/__init__.py +1 -0
- package/.pi/scripts/harness_web/config.py +80 -0
- package/.pi/scripts/harness_web/output.py +55 -0
- package/.pi/scripts/harness_web/scrape.py +120 -0
- package/.pi/scripts/harness_web/search_ddg.py +106 -0
- package/.pi/scripts/release.sh +338 -0
- package/.pi/scripts/sentrux-rules-sync.mjs +29 -7
- package/.pi/settings.example.json +0 -1
- package/.sentrux/rules.toml +1 -1
- package/AGENTS.md +1 -1
- package/CHANGELOG.md +20 -0
- package/THIRD_PARTY_NOTICES.md +22 -0
- package/package.json +12 -9
- package/.agents/skills/firecrawl/SKILL.md +0 -150
- package/.agents/skills/firecrawl/rules/install.md +0 -82
- package/.agents/skills/firecrawl/rules/security.md +0 -26
- package/.agents/skills/firecrawl-agent/SKILL.md +0 -57
- package/.agents/skills/firecrawl-build-interact/SKILL.md +0 -67
- package/.agents/skills/firecrawl-build-onboarding/SKILL.md +0 -102
- package/.agents/skills/firecrawl-build-onboarding/references/auth-flow.md +0 -39
- package/.agents/skills/firecrawl-build-onboarding/references/project-setup.md +0 -20
- package/.agents/skills/firecrawl-build-onboarding/references/sdk-installation.md +0 -17
- package/.agents/skills/firecrawl-build-scrape/SKILL.md +0 -68
- package/.agents/skills/firecrawl-build-search/SKILL.md +0 -68
- package/.agents/skills/firecrawl-crawl/SKILL.md +0 -58
- package/.agents/skills/firecrawl-download/SKILL.md +0 -69
- package/.agents/skills/firecrawl-interact/SKILL.md +0 -83
- package/.agents/skills/firecrawl-map/SKILL.md +0 -50
- package/.agents/skills/firecrawl-parse/SKILL.md +0 -61
- package/.agents/skills/firecrawl-scrape/SKILL.md +0 -68
- package/.agents/skills/firecrawl-search/SKILL.md +0 -59
- package/firecrawl/.env.template +0 -62
- package/firecrawl/README.md +0 -49
- package/firecrawl/docker-compose.yaml +0 -201
- package/firecrawl/searxng/searxng.env +0 -3
- package/firecrawl/searxng/settings.yml +0 -85
|
@@ -0,0 +1,637 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* agent-runner.ts — Core execution engine: creates sessions, runs agents, collects results.
|
|
3
|
+
*/
|
|
4
|
+
|
|
5
|
+
import * as fs from "node:fs";
|
|
6
|
+
import * as os from "node:os";
|
|
7
|
+
import * as path from "node:path";
|
|
8
|
+
import type { Model } from "@mariozechner/pi-ai";
|
|
9
|
+
import type { ExtensionContext } from "@mariozechner/pi-coding-agent";
|
|
10
|
+
import {
|
|
11
|
+
type AgentSession,
|
|
12
|
+
type AgentSessionEvent,
|
|
13
|
+
createAgentSession,
|
|
14
|
+
DefaultResourceLoader,
|
|
15
|
+
type ExtensionAPI,
|
|
16
|
+
getAgentDir,
|
|
17
|
+
SessionManager,
|
|
18
|
+
SettingsManager,
|
|
19
|
+
} from "@mariozechner/pi-coding-agent";
|
|
20
|
+
import { evaluateSubagentToolCall } from "../spawn-policy.js";
|
|
21
|
+
import {
|
|
22
|
+
getAgentConfig,
|
|
23
|
+
getConfig,
|
|
24
|
+
getMemoryToolNames,
|
|
25
|
+
getReadOnlyMemoryToolNames,
|
|
26
|
+
getToolNamesForType,
|
|
27
|
+
} from "./agent-types.js";
|
|
28
|
+
import { buildParentContext, extractText } from "./context.js";
|
|
29
|
+
import { DEFAULT_AGENTS } from "./default-agents.js";
|
|
30
|
+
import { detectEnv } from "./env.js";
|
|
31
|
+
import { buildMemoryBlock, buildReadOnlyMemoryBlock } from "./memory.js";
|
|
32
|
+
import { buildAgentPrompt, type PromptExtras } from "./prompts.js";
|
|
33
|
+
import { preloadSkills } from "./skill-loader.js";
|
|
34
|
+
import type { SubagentType, ThinkingLevel } from "./types.js";
|
|
35
|
+
|
|
36
|
+
/** Names of tools registered by this extension that subagents must NOT inherit. */
|
|
37
|
+
const EXCLUDED_TOOL_NAMES = [
|
|
38
|
+
"Agent",
|
|
39
|
+
"get_subagent_result",
|
|
40
|
+
"steer_subagent",
|
|
41
|
+
"blackboard",
|
|
42
|
+
"ask_user",
|
|
43
|
+
];
|
|
44
|
+
|
|
45
|
+
/** Default max turns. undefined = unlimited (no turn limit). */
|
|
46
|
+
let defaultMaxTurns: number | undefined;
|
|
47
|
+
|
|
48
|
+
/** Normalize max turns. undefined or 0 = unlimited, otherwise minimum 1. */
|
|
49
|
+
export function normalizeMaxTurns(n: number | undefined): number | undefined {
|
|
50
|
+
if (n == null || n === 0) return undefined;
|
|
51
|
+
return Math.max(1, n);
|
|
52
|
+
}
|
|
53
|
+
|
|
54
|
+
/** Get the default max turns value. undefined = unlimited. */
|
|
55
|
+
export function getDefaultMaxTurns(): number | undefined {
|
|
56
|
+
return defaultMaxTurns;
|
|
57
|
+
}
|
|
58
|
+
/** Set the default max turns value. undefined or 0 = unlimited, otherwise minimum 1. */
|
|
59
|
+
export function setDefaultMaxTurns(n: number | undefined): void {
|
|
60
|
+
defaultMaxTurns = normalizeMaxTurns(n);
|
|
61
|
+
}
|
|
62
|
+
|
|
63
|
+
/** Additional turns allowed after the soft limit steer message. */
|
|
64
|
+
let graceTurns = 5;
|
|
65
|
+
|
|
66
|
+
/** Get the grace turns value. */
|
|
67
|
+
export function getGraceTurns(): number {
|
|
68
|
+
return graceTurns;
|
|
69
|
+
}
|
|
70
|
+
/** Set the grace turns value (minimum 1). */
|
|
71
|
+
export function setGraceTurns(n: number): void {
|
|
72
|
+
graceTurns = Math.max(1, n);
|
|
73
|
+
}
|
|
74
|
+
|
|
75
|
+
/**
|
|
76
|
+
* Try to find the right model for an agent type.
|
|
77
|
+
* Priority: explicit option > config.model > parent model.
|
|
78
|
+
*/
|
|
79
|
+
function resolveDefaultModel(
|
|
80
|
+
parentModel: Model<any> | undefined,
|
|
81
|
+
registry: {
|
|
82
|
+
find(provider: string, modelId: string): Model<any> | undefined;
|
|
83
|
+
getAvailable?(): Model<any>[];
|
|
84
|
+
},
|
|
85
|
+
configModel?: string,
|
|
86
|
+
): Model<any> | undefined {
|
|
87
|
+
if (configModel) {
|
|
88
|
+
const slashIdx = configModel.indexOf("/");
|
|
89
|
+
if (slashIdx !== -1) {
|
|
90
|
+
const provider = configModel.slice(0, slashIdx);
|
|
91
|
+
const modelId = configModel.slice(slashIdx + 1);
|
|
92
|
+
|
|
93
|
+
// Build a set of available model keys for fast lookup
|
|
94
|
+
const available = registry.getAvailable?.();
|
|
95
|
+
const availableKeys = available
|
|
96
|
+
? new Set(available.map((m: any) => `${m.provider}/${m.id}`))
|
|
97
|
+
: undefined;
|
|
98
|
+
const isAvailable = (p: string, id: string) =>
|
|
99
|
+
!availableKeys || availableKeys.has(`${p}/${id}`);
|
|
100
|
+
|
|
101
|
+
const found = registry.find(provider, modelId);
|
|
102
|
+
if (found && isAvailable(provider, modelId)) return found;
|
|
103
|
+
}
|
|
104
|
+
}
|
|
105
|
+
|
|
106
|
+
return parentModel;
|
|
107
|
+
}
|
|
108
|
+
|
|
109
|
+
/** Info about a tool event in the subagent. */
|
|
110
|
+
export interface ToolActivity {
|
|
111
|
+
type: "start" | "end";
|
|
112
|
+
toolName: string;
|
|
113
|
+
}
|
|
114
|
+
|
|
115
|
+
export interface RunOptions {
|
|
116
|
+
/** ExtensionAPI instance — used for pi.exec() instead of execSync. */
|
|
117
|
+
pi: ExtensionAPI;
|
|
118
|
+
/** Manager-assigned id; suffixes session name to disambiguate parallel spawns (e.g. `Explore#a1b2c3d4`). */
|
|
119
|
+
agentId?: string;
|
|
120
|
+
model?: Model<any>;
|
|
121
|
+
maxTurns?: number;
|
|
122
|
+
signal?: AbortSignal;
|
|
123
|
+
isolated?: boolean;
|
|
124
|
+
inheritContext?: boolean;
|
|
125
|
+
thinkingLevel?: ThinkingLevel;
|
|
126
|
+
/** Override working directory (e.g. for worktree isolation). */
|
|
127
|
+
cwd?: string;
|
|
128
|
+
/** Called on tool start/end with activity info. */
|
|
129
|
+
onToolActivity?: (activity: ToolActivity) => void;
|
|
130
|
+
/** Called on streaming text deltas from the assistant response. */
|
|
131
|
+
onTextDelta?: (delta: string, fullText: string) => void;
|
|
132
|
+
onSessionCreated?: (session: AgentSession) => void;
|
|
133
|
+
/** Called at the end of each agentic turn with the cumulative count. */
|
|
134
|
+
onTurnEnd?: (turnCount: number) => void;
|
|
135
|
+
/**
|
|
136
|
+
* Called once per assistant message_end with that message's usage delta.
|
|
137
|
+
* Lets callers maintain a lifetime accumulator that survives compaction
|
|
138
|
+
* (which replaces session.state.messages and resets stats-derived sums).
|
|
139
|
+
*/
|
|
140
|
+
onAssistantUsage?: (usage: {
|
|
141
|
+
input: number;
|
|
142
|
+
output: number;
|
|
143
|
+
cacheWrite: number;
|
|
144
|
+
}) => void;
|
|
145
|
+
/**
|
|
146
|
+
* Called when the session successfully compacts. `tokensBefore` is upstream's
|
|
147
|
+
* pre-compaction context size estimate. Aborted compactions don't fire.
|
|
148
|
+
*/
|
|
149
|
+
onCompaction?: (info: {
|
|
150
|
+
reason: "manual" | "threshold" | "overflow";
|
|
151
|
+
tokensBefore: number;
|
|
152
|
+
}) => void;
|
|
153
|
+
/** Blackboard or other spawn context appended to the subagent system prompt. */
|
|
154
|
+
systemPromptAppendix?: string;
|
|
155
|
+
}
|
|
156
|
+
|
|
157
|
+
export interface RunResult {
|
|
158
|
+
responseText: string;
|
|
159
|
+
session: AgentSession;
|
|
160
|
+
/** True if the agent was hard-aborted (max_turns + grace exceeded). */
|
|
161
|
+
aborted: boolean;
|
|
162
|
+
/** True if the agent was steered to wrap up (hit soft turn limit) but finished in time. */
|
|
163
|
+
steered: boolean;
|
|
164
|
+
}
|
|
165
|
+
|
|
166
|
+
/**
|
|
167
|
+
* Subscribe to a session and collect the last assistant message text.
|
|
168
|
+
* Returns an object with a `getText()` getter and an `unsubscribe` function.
|
|
169
|
+
*/
|
|
170
|
+
function collectResponseText(session: AgentSession) {
|
|
171
|
+
let text = "";
|
|
172
|
+
const unsubscribe = session.subscribe((event: AgentSessionEvent) => {
|
|
173
|
+
if (event.type === "message_start") {
|
|
174
|
+
text = "";
|
|
175
|
+
}
|
|
176
|
+
if (
|
|
177
|
+
event.type === "message_update" &&
|
|
178
|
+
event.assistantMessageEvent.type === "text_delta"
|
|
179
|
+
) {
|
|
180
|
+
text += event.assistantMessageEvent.delta;
|
|
181
|
+
}
|
|
182
|
+
});
|
|
183
|
+
return { getText: () => text, unsubscribe };
|
|
184
|
+
}
|
|
185
|
+
|
|
186
|
+
/** Get the last assistant text from the completed session history. */
|
|
187
|
+
function getLastAssistantText(session: AgentSession): string {
|
|
188
|
+
for (let i = session.messages.length - 1; i >= 0; i--) {
|
|
189
|
+
const msg = session.messages[i];
|
|
190
|
+
if (msg.role !== "assistant") continue;
|
|
191
|
+
const text = extractText(msg.content).trim();
|
|
192
|
+
if (text) return text;
|
|
193
|
+
}
|
|
194
|
+
return "";
|
|
195
|
+
}
|
|
196
|
+
|
|
197
|
+
/**
|
|
198
|
+
* Wire an AbortSignal to abort a session.
|
|
199
|
+
* Returns a cleanup function to remove the listener.
|
|
200
|
+
*/
|
|
201
|
+
function forwardAbortSignal(
|
|
202
|
+
session: AgentSession,
|
|
203
|
+
signal?: AbortSignal,
|
|
204
|
+
): () => void {
|
|
205
|
+
if (!signal) return () => {};
|
|
206
|
+
const onAbort = () => session.abort();
|
|
207
|
+
signal.addEventListener("abort", onAbort, { once: true });
|
|
208
|
+
return () => signal.removeEventListener("abort", onAbort);
|
|
209
|
+
}
|
|
210
|
+
|
|
211
|
+
export async function runAgent(
|
|
212
|
+
ctx: ExtensionContext,
|
|
213
|
+
type: SubagentType,
|
|
214
|
+
prompt: string,
|
|
215
|
+
options: RunOptions,
|
|
216
|
+
): Promise<RunResult> {
|
|
217
|
+
const config = getConfig(type);
|
|
218
|
+
const agentConfig = getAgentConfig(type);
|
|
219
|
+
|
|
220
|
+
// Resolve working directory: worktree override > parent cwd
|
|
221
|
+
const effectiveCwd = options.cwd ?? ctx.cwd;
|
|
222
|
+
|
|
223
|
+
const env = await detectEnv(options.pi, effectiveCwd);
|
|
224
|
+
|
|
225
|
+
// Get parent system prompt for append-mode agents
|
|
226
|
+
const parentSystemPrompt = ctx.getSystemPrompt();
|
|
227
|
+
|
|
228
|
+
// Build prompt extras (memory, skill preloading)
|
|
229
|
+
const extras: PromptExtras = {};
|
|
230
|
+
|
|
231
|
+
// Resolve extensions/skills: isolated overrides to false
|
|
232
|
+
const extensions = options.isolated ? false : config.extensions;
|
|
233
|
+
const skills = options.isolated ? false : config.skills;
|
|
234
|
+
|
|
235
|
+
// Skill preloading: when skills is string[], preload their content into prompt
|
|
236
|
+
if (Array.isArray(skills)) {
|
|
237
|
+
const loaded = preloadSkills(skills, effectiveCwd);
|
|
238
|
+
if (loaded.length > 0) {
|
|
239
|
+
extras.skillBlocks = loaded;
|
|
240
|
+
}
|
|
241
|
+
}
|
|
242
|
+
|
|
243
|
+
let toolNames = getToolNamesForType(type);
|
|
244
|
+
|
|
245
|
+
// Persistent memory: detect write capability and branch accordingly.
|
|
246
|
+
// Account for disallowedTools — a tool in the base set but on the denylist is not truly available.
|
|
247
|
+
if (agentConfig?.memory) {
|
|
248
|
+
const existingNames = new Set(toolNames);
|
|
249
|
+
const denied = agentConfig.disallowedTools
|
|
250
|
+
? new Set(agentConfig.disallowedTools)
|
|
251
|
+
: undefined;
|
|
252
|
+
const effectivelyHas = (name: string) =>
|
|
253
|
+
existingNames.has(name) && !denied?.has(name);
|
|
254
|
+
const hasWriteTools = effectivelyHas("write") || effectivelyHas("edit");
|
|
255
|
+
|
|
256
|
+
if (hasWriteTools) {
|
|
257
|
+
// Read-write memory: add any missing memory tool names (read/write/edit)
|
|
258
|
+
const extraNames = getMemoryToolNames(existingNames);
|
|
259
|
+
if (extraNames.length > 0) toolNames = [...toolNames, ...extraNames];
|
|
260
|
+
extras.memoryBlock = buildMemoryBlock(
|
|
261
|
+
agentConfig.name,
|
|
262
|
+
agentConfig.memory,
|
|
263
|
+
effectiveCwd,
|
|
264
|
+
);
|
|
265
|
+
} else {
|
|
266
|
+
// Read-only memory: only add read tool name, use read-only prompt
|
|
267
|
+
const extraNames = getReadOnlyMemoryToolNames(existingNames);
|
|
268
|
+
if (extraNames.length > 0) toolNames = [...toolNames, ...extraNames];
|
|
269
|
+
extras.memoryBlock = buildReadOnlyMemoryBlock(
|
|
270
|
+
agentConfig.name,
|
|
271
|
+
agentConfig.memory,
|
|
272
|
+
effectiveCwd,
|
|
273
|
+
);
|
|
274
|
+
}
|
|
275
|
+
}
|
|
276
|
+
|
|
277
|
+
// Build system prompt from agent config
|
|
278
|
+
let systemPrompt: string;
|
|
279
|
+
if (agentConfig) {
|
|
280
|
+
systemPrompt = buildAgentPrompt(
|
|
281
|
+
agentConfig,
|
|
282
|
+
effectiveCwd,
|
|
283
|
+
env,
|
|
284
|
+
parentSystemPrompt,
|
|
285
|
+
extras,
|
|
286
|
+
);
|
|
287
|
+
} else {
|
|
288
|
+
// Unknown type fallback: spread the canonical general-purpose config (defensive —
|
|
289
|
+
// unreachable in practice since index.ts resolves unknown types before calling runAgent).
|
|
290
|
+
const fallback = DEFAULT_AGENTS.get("general-purpose");
|
|
291
|
+
if (!fallback)
|
|
292
|
+
throw new Error(
|
|
293
|
+
`No fallback config available for unknown type "${type}"`,
|
|
294
|
+
);
|
|
295
|
+
systemPrompt = buildAgentPrompt(
|
|
296
|
+
{ ...fallback, name: type },
|
|
297
|
+
effectiveCwd,
|
|
298
|
+
env,
|
|
299
|
+
parentSystemPrompt,
|
|
300
|
+
extras,
|
|
301
|
+
);
|
|
302
|
+
}
|
|
303
|
+
|
|
304
|
+
// When skills is string[], we've already preloaded them into the prompt.
|
|
305
|
+
// Still pass noSkills: true since we don't need the skill loader to load them again.
|
|
306
|
+
const noSkills = skills === false || Array.isArray(skills);
|
|
307
|
+
|
|
308
|
+
const parentAgentDir = getAgentDir();
|
|
309
|
+
// Isolated temp agentDir — no parent extensions/ auto-discovery (subagent-v2 pattern).
|
|
310
|
+
const isolatedAgentDir = fs.mkdtempSync(
|
|
311
|
+
path.join(os.tmpdir(), "harness-subagent-"),
|
|
312
|
+
);
|
|
313
|
+
const sessionAgentDir = isolatedAgentDir;
|
|
314
|
+
let disposedIsolatedDir = false;
|
|
315
|
+
const disposeIsolatedDir = () => {
|
|
316
|
+
if (disposedIsolatedDir) return;
|
|
317
|
+
disposedIsolatedDir = true;
|
|
318
|
+
try {
|
|
319
|
+
fs.rmSync(isolatedAgentDir, { recursive: true, force: true });
|
|
320
|
+
} catch {
|
|
321
|
+
/* ignore */
|
|
322
|
+
}
|
|
323
|
+
};
|
|
324
|
+
|
|
325
|
+
const appendix = options.systemPromptAppendix?.trim();
|
|
326
|
+
const fullSystemPrompt =
|
|
327
|
+
appendix && appendix.length > 0
|
|
328
|
+
? `${systemPrompt}\n\n---\n\n## Spawn context\n\n${appendix}`
|
|
329
|
+
: systemPrompt;
|
|
330
|
+
|
|
331
|
+
const extensionFactories: Array<(pi: ExtensionAPI) => void> = [
|
|
332
|
+
(pi) => {
|
|
333
|
+
pi.on("tool_call", (event) => {
|
|
334
|
+
const decision = evaluateSubagentToolCall(event.toolName);
|
|
335
|
+
if (decision.action === "block") {
|
|
336
|
+
return { block: true, reason: decision.reason };
|
|
337
|
+
}
|
|
338
|
+
return undefined;
|
|
339
|
+
});
|
|
340
|
+
pi.on("before_agent_start", (event: { systemPrompt?: string }) => {
|
|
341
|
+
const base =
|
|
342
|
+
typeof event.systemPrompt === "string" ? event.systemPrompt : "";
|
|
343
|
+
return { systemPrompt: base };
|
|
344
|
+
});
|
|
345
|
+
},
|
|
346
|
+
];
|
|
347
|
+
|
|
348
|
+
const loader = new DefaultResourceLoader({
|
|
349
|
+
cwd: effectiveCwd,
|
|
350
|
+
agentDir: sessionAgentDir,
|
|
351
|
+
noExtensions: extensions === false,
|
|
352
|
+
noSkills,
|
|
353
|
+
noPromptTemplates: true,
|
|
354
|
+
noThemes: true,
|
|
355
|
+
noContextFiles: true,
|
|
356
|
+
systemPromptOverride: () => fullSystemPrompt,
|
|
357
|
+
appendSystemPromptOverride: () => [],
|
|
358
|
+
extensionFactories,
|
|
359
|
+
});
|
|
360
|
+
await loader.reload();
|
|
361
|
+
|
|
362
|
+
// Resolve model: explicit option > config.model > parent model
|
|
363
|
+
const model =
|
|
364
|
+
options.model ??
|
|
365
|
+
resolveDefaultModel(ctx.model, ctx.modelRegistry, agentConfig?.model);
|
|
366
|
+
|
|
367
|
+
// Resolve thinking level: explicit option > agent config > undefined (inherit)
|
|
368
|
+
const thinkingLevel = options.thinkingLevel ?? agentConfig?.thinking;
|
|
369
|
+
|
|
370
|
+
const sessionOpts: Parameters<typeof createAgentSession>[0] = {
|
|
371
|
+
cwd: effectiveCwd,
|
|
372
|
+
agentDir: parentAgentDir,
|
|
373
|
+
sessionManager: SessionManager.inMemory(effectiveCwd),
|
|
374
|
+
settingsManager: SettingsManager.create(effectiveCwd, parentAgentDir),
|
|
375
|
+
modelRegistry: ctx.modelRegistry,
|
|
376
|
+
model,
|
|
377
|
+
resourceLoader: loader,
|
|
378
|
+
};
|
|
379
|
+
if (thinkingLevel) {
|
|
380
|
+
sessionOpts.thinkingLevel = thinkingLevel;
|
|
381
|
+
}
|
|
382
|
+
|
|
383
|
+
const { session } = await createAgentSession(sessionOpts);
|
|
384
|
+
|
|
385
|
+
const baseSessionName = agentConfig?.name ?? type;
|
|
386
|
+
session.setSessionName(
|
|
387
|
+
options.agentId
|
|
388
|
+
? `${baseSessionName}#${options.agentId.slice(0, 8)}`
|
|
389
|
+
: baseSessionName,
|
|
390
|
+
);
|
|
391
|
+
|
|
392
|
+
// Build disallowed tools set from agent config
|
|
393
|
+
const disallowedSet = agentConfig?.disallowedTools
|
|
394
|
+
? new Set(agentConfig.disallowedTools)
|
|
395
|
+
: undefined;
|
|
396
|
+
|
|
397
|
+
// setActiveTools in before_agent_start (omit explicit tools: param — SDK quirk).
|
|
398
|
+
const builtinToolNameSet = new Set(toolNames);
|
|
399
|
+
const filterTools = (names: string[]) =>
|
|
400
|
+
names.filter((t) => {
|
|
401
|
+
if (EXCLUDED_TOOL_NAMES.includes(t)) return false;
|
|
402
|
+
if (disallowedSet?.has(t)) return false;
|
|
403
|
+
if (builtinToolNameSet.has(t)) return true;
|
|
404
|
+
if (extensions === false) return false;
|
|
405
|
+
if (Array.isArray(extensions)) {
|
|
406
|
+
return extensions.some((ext) => t.startsWith(ext) || t.includes(ext));
|
|
407
|
+
}
|
|
408
|
+
return true;
|
|
409
|
+
});
|
|
410
|
+
|
|
411
|
+
const activeTools = filterTools(session.getActiveToolNames());
|
|
412
|
+
if (activeTools.length > 0) {
|
|
413
|
+
session.setActiveToolsByName(activeTools);
|
|
414
|
+
} else {
|
|
415
|
+
session.setActiveToolsByName(
|
|
416
|
+
toolNames.filter((t) => !disallowedSet?.has(t)),
|
|
417
|
+
);
|
|
418
|
+
}
|
|
419
|
+
|
|
420
|
+
// Bind extensions so that session_start fires and extensions can initialize
|
|
421
|
+
// (e.g. loading credentials, setting up state). Placed after tool filtering
|
|
422
|
+
// so extension-provided skills/prompts from extendResourcesFromExtensions()
|
|
423
|
+
// respect the active tool set. All ExtensionBindings fields are optional.
|
|
424
|
+
await session.bindExtensions({
|
|
425
|
+
onError: (err) => {
|
|
426
|
+
options.onToolActivity?.({
|
|
427
|
+
type: "end",
|
|
428
|
+
toolName: `extension-error:${err.extensionPath}`,
|
|
429
|
+
});
|
|
430
|
+
},
|
|
431
|
+
});
|
|
432
|
+
|
|
433
|
+
options.onSessionCreated?.(session);
|
|
434
|
+
|
|
435
|
+
// Track turns for graceful max_turns enforcement
|
|
436
|
+
let turnCount = 0;
|
|
437
|
+
const maxTurns = normalizeMaxTurns(
|
|
438
|
+
options.maxTurns ?? agentConfig?.maxTurns ?? defaultMaxTurns,
|
|
439
|
+
);
|
|
440
|
+
let softLimitReached = false;
|
|
441
|
+
let aborted = false;
|
|
442
|
+
|
|
443
|
+
let currentMessageText = "";
|
|
444
|
+
const unsubTurns = session.subscribe((event: AgentSessionEvent) => {
|
|
445
|
+
if (event.type === "turn_end") {
|
|
446
|
+
turnCount++;
|
|
447
|
+
options.onTurnEnd?.(turnCount);
|
|
448
|
+
if (maxTurns != null) {
|
|
449
|
+
if (!softLimitReached && turnCount >= maxTurns) {
|
|
450
|
+
softLimitReached = true;
|
|
451
|
+
session.steer(
|
|
452
|
+
"You have reached your turn limit. Wrap up immediately — provide your final answer now.",
|
|
453
|
+
);
|
|
454
|
+
} else if (softLimitReached && turnCount >= maxTurns + graceTurns) {
|
|
455
|
+
aborted = true;
|
|
456
|
+
session.abort();
|
|
457
|
+
}
|
|
458
|
+
}
|
|
459
|
+
}
|
|
460
|
+
if (event.type === "message_start") {
|
|
461
|
+
currentMessageText = "";
|
|
462
|
+
}
|
|
463
|
+
if (
|
|
464
|
+
event.type === "message_update" &&
|
|
465
|
+
event.assistantMessageEvent.type === "text_delta"
|
|
466
|
+
) {
|
|
467
|
+
currentMessageText += event.assistantMessageEvent.delta;
|
|
468
|
+
options.onTextDelta?.(
|
|
469
|
+
event.assistantMessageEvent.delta,
|
|
470
|
+
currentMessageText,
|
|
471
|
+
);
|
|
472
|
+
}
|
|
473
|
+
if (event.type === "tool_execution_start") {
|
|
474
|
+
options.onToolActivity?.({ type: "start", toolName: event.toolName });
|
|
475
|
+
}
|
|
476
|
+
if (event.type === "tool_execution_end") {
|
|
477
|
+
options.onToolActivity?.({ type: "end", toolName: event.toolName });
|
|
478
|
+
}
|
|
479
|
+
if (event.type === "message_end" && event.message.role === "assistant") {
|
|
480
|
+
const u = (event.message as any).usage;
|
|
481
|
+
if (u)
|
|
482
|
+
options.onAssistantUsage?.({
|
|
483
|
+
input: u.input ?? 0,
|
|
484
|
+
output: u.output ?? 0,
|
|
485
|
+
cacheWrite: u.cacheWrite ?? 0,
|
|
486
|
+
});
|
|
487
|
+
}
|
|
488
|
+
if (event.type === "compaction_end" && !event.aborted && event.result) {
|
|
489
|
+
options.onCompaction?.({
|
|
490
|
+
reason: event.reason,
|
|
491
|
+
tokensBefore: event.result.tokensBefore,
|
|
492
|
+
});
|
|
493
|
+
}
|
|
494
|
+
});
|
|
495
|
+
|
|
496
|
+
const collector = collectResponseText(session);
|
|
497
|
+
const cleanupAbort = forwardAbortSignal(session, options.signal);
|
|
498
|
+
|
|
499
|
+
// Build the effective prompt: optionally prepend parent context
|
|
500
|
+
let effectivePrompt = prompt;
|
|
501
|
+
if (options.inheritContext) {
|
|
502
|
+
const parentContext = buildParentContext(ctx);
|
|
503
|
+
if (parentContext) {
|
|
504
|
+
effectivePrompt = parentContext + prompt;
|
|
505
|
+
}
|
|
506
|
+
}
|
|
507
|
+
|
|
508
|
+
try {
|
|
509
|
+
await session.prompt(effectivePrompt);
|
|
510
|
+
} finally {
|
|
511
|
+
unsubTurns();
|
|
512
|
+
collector.unsubscribe();
|
|
513
|
+
cleanupAbort();
|
|
514
|
+
disposeIsolatedDir();
|
|
515
|
+
}
|
|
516
|
+
|
|
517
|
+
const responseText =
|
|
518
|
+
collector.getText().trim() || getLastAssistantText(session);
|
|
519
|
+
return { responseText, session, aborted, steered: softLimitReached };
|
|
520
|
+
}
|
|
521
|
+
|
|
522
|
+
/**
|
|
523
|
+
* Send a new prompt to an existing session (resume).
|
|
524
|
+
*/
|
|
525
|
+
export async function resumeAgent(
|
|
526
|
+
session: AgentSession,
|
|
527
|
+
prompt: string,
|
|
528
|
+
options: {
|
|
529
|
+
onToolActivity?: (activity: ToolActivity) => void;
|
|
530
|
+
onAssistantUsage?: (usage: {
|
|
531
|
+
input: number;
|
|
532
|
+
output: number;
|
|
533
|
+
cacheWrite: number;
|
|
534
|
+
}) => void;
|
|
535
|
+
onCompaction?: (info: {
|
|
536
|
+
reason: "manual" | "threshold" | "overflow";
|
|
537
|
+
tokensBefore: number;
|
|
538
|
+
}) => void;
|
|
539
|
+
signal?: AbortSignal;
|
|
540
|
+
} = {},
|
|
541
|
+
): Promise<string> {
|
|
542
|
+
const collector = collectResponseText(session);
|
|
543
|
+
const cleanupAbort = forwardAbortSignal(session, options.signal);
|
|
544
|
+
|
|
545
|
+
const unsubEvents =
|
|
546
|
+
options.onToolActivity || options.onAssistantUsage || options.onCompaction
|
|
547
|
+
? session.subscribe((event: AgentSessionEvent) => {
|
|
548
|
+
if (event.type === "tool_execution_start")
|
|
549
|
+
options.onToolActivity?.({
|
|
550
|
+
type: "start",
|
|
551
|
+
toolName: event.toolName,
|
|
552
|
+
});
|
|
553
|
+
if (event.type === "tool_execution_end")
|
|
554
|
+
options.onToolActivity?.({ type: "end", toolName: event.toolName });
|
|
555
|
+
if (
|
|
556
|
+
event.type === "message_end" &&
|
|
557
|
+
event.message.role === "assistant"
|
|
558
|
+
) {
|
|
559
|
+
const u = (event.message as any).usage;
|
|
560
|
+
if (u)
|
|
561
|
+
options.onAssistantUsage?.({
|
|
562
|
+
input: u.input ?? 0,
|
|
563
|
+
output: u.output ?? 0,
|
|
564
|
+
cacheWrite: u.cacheWrite ?? 0,
|
|
565
|
+
});
|
|
566
|
+
}
|
|
567
|
+
if (
|
|
568
|
+
event.type === "compaction_end" &&
|
|
569
|
+
!event.aborted &&
|
|
570
|
+
event.result
|
|
571
|
+
) {
|
|
572
|
+
options.onCompaction?.({
|
|
573
|
+
reason: event.reason,
|
|
574
|
+
tokensBefore: event.result.tokensBefore,
|
|
575
|
+
});
|
|
576
|
+
}
|
|
577
|
+
})
|
|
578
|
+
: () => {};
|
|
579
|
+
|
|
580
|
+
try {
|
|
581
|
+
await session.prompt(prompt);
|
|
582
|
+
} finally {
|
|
583
|
+
collector.unsubscribe();
|
|
584
|
+
unsubEvents();
|
|
585
|
+
cleanupAbort();
|
|
586
|
+
}
|
|
587
|
+
|
|
588
|
+
return collector.getText().trim() || getLastAssistantText(session);
|
|
589
|
+
}
|
|
590
|
+
|
|
591
|
+
/**
|
|
592
|
+
* Send a steering message to a running subagent.
|
|
593
|
+
* The message will interrupt the agent after its current tool execution.
|
|
594
|
+
*/
|
|
595
|
+
export async function steerAgent(
|
|
596
|
+
session: AgentSession,
|
|
597
|
+
message: string,
|
|
598
|
+
): Promise<void> {
|
|
599
|
+
await session.steer(message);
|
|
600
|
+
}
|
|
601
|
+
|
|
602
|
+
/**
|
|
603
|
+
* Get the subagent's conversation messages as formatted text.
|
|
604
|
+
*/
|
|
605
|
+
export function getAgentConversation(session: AgentSession): string {
|
|
606
|
+
const parts: string[] = [];
|
|
607
|
+
|
|
608
|
+
for (const msg of session.messages) {
|
|
609
|
+
if (msg.role === "user") {
|
|
610
|
+
const text =
|
|
611
|
+
typeof msg.content === "string"
|
|
612
|
+
? msg.content
|
|
613
|
+
: extractText(msg.content);
|
|
614
|
+
if (text.trim()) parts.push(`[User]: ${text.trim()}`);
|
|
615
|
+
} else if (msg.role === "assistant") {
|
|
616
|
+
const textParts: string[] = [];
|
|
617
|
+
const toolCalls: string[] = [];
|
|
618
|
+
for (const c of msg.content) {
|
|
619
|
+
if (c.type === "text" && c.text) textParts.push(c.text);
|
|
620
|
+
else if (c.type === "toolCall")
|
|
621
|
+
toolCalls.push(
|
|
622
|
+
` Tool: ${(c as any).name ?? (c as any).toolName ?? "unknown"}`,
|
|
623
|
+
);
|
|
624
|
+
}
|
|
625
|
+
if (textParts.length > 0)
|
|
626
|
+
parts.push(`[Assistant]: ${textParts.join("\n")}`);
|
|
627
|
+
if (toolCalls.length > 0)
|
|
628
|
+
parts.push(`[Tool Calls]:\n${toolCalls.join("\n")}`);
|
|
629
|
+
} else if (msg.role === "toolResult") {
|
|
630
|
+
const text = extractText(msg.content);
|
|
631
|
+
const truncated = text.length > 200 ? `${text.slice(0, 200)}...` : text;
|
|
632
|
+
parts.push(`[Tool Result (${msg.toolName})]: ${truncated}`);
|
|
633
|
+
}
|
|
634
|
+
}
|
|
635
|
+
|
|
636
|
+
return parts.join("\n\n");
|
|
637
|
+
}
|