sentinelayer-cli 0.1.1 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +996 -996
- package/bin/create-sentinelayer.js +5 -5
- package/bin/sentinelayer-cli.js +4 -4
- package/bin/sl.js +5 -5
- package/package.json +62 -54
- package/src/agents/jules/config/definition.js +209 -209
- package/src/agents/jules/config/system-prompt.js +175 -175
- package/src/agents/jules/error-intake.js +51 -51
- package/src/agents/jules/fix-cycle.js +377 -377
- package/src/agents/jules/loop.js +367 -367
- package/src/agents/jules/pulse.js +319 -319
- package/src/agents/jules/stream.js +186 -186
- package/src/agents/jules/swarm/file-scanner.js +74 -74
- package/src/agents/jules/swarm/index.js +11 -11
- package/src/agents/jules/swarm/orchestrator.js +362 -362
- package/src/agents/jules/swarm/pattern-hunter.js +123 -123
- package/src/agents/jules/swarm/sub-agent.js +308 -308
- package/src/agents/jules/tools/auth-audit.js +226 -222
- package/src/agents/jules/tools/dispatch.js +327 -327
- package/src/agents/jules/tools/file-edit.js +180 -180
- package/src/agents/jules/tools/file-read.js +100 -100
- package/src/agents/jules/tools/frontend-analyze.js +570 -570
- package/src/agents/jules/tools/glob.js +168 -168
- package/src/agents/jules/tools/grep.js +228 -228
- package/src/agents/jules/tools/index.js +29 -29
- package/src/agents/jules/tools/path-guards.js +161 -161
- package/src/agents/jules/tools/runtime-audit.js +493 -493
- package/src/agents/jules/tools/shell.js +383 -383
- package/src/ai/aidenid.js +972 -945
- package/src/ai/client.js +508 -508
- package/src/ai/domain-target-store.js +268 -268
- package/src/ai/identity-store.js +270 -270
- package/src/ai/site-store.js +145 -145
- package/src/audit/agents/architecture.js +180 -180
- package/src/audit/agents/compliance.js +179 -179
- package/src/audit/agents/documentation.js +165 -165
- package/src/audit/agents/performance.js +145 -145
- package/src/audit/agents/security.js +215 -215
- package/src/audit/agents/testing.js +172 -172
- package/src/audit/orchestrator.js +557 -557
- package/src/audit/package.js +204 -204
- package/src/audit/registry.js +284 -284
- package/src/audit/replay.js +103 -103
- package/src/auth/http.js +113 -113
- package/src/auth/service.js +891 -848
- package/src/auth/session-store.js +359 -345
- package/src/cli.js +252 -252
- package/src/commands/ai/identity-lifecycle.js +1338 -1337
- package/src/commands/ai/provision-governance.js +1272 -1246
- package/src/commands/ai/shared.js +147 -147
- package/src/commands/ai.js +11 -11
- package/src/commands/apply.js +12 -12
- package/src/commands/audit.js +1166 -1147
- package/src/commands/auth.js +375 -366
- package/src/commands/chat.js +191 -191
- package/src/commands/config.js +184 -184
- package/src/commands/cost.js +311 -311
- package/src/commands/daemon/core.js +850 -850
- package/src/commands/daemon/extended.js +1048 -1048
- package/src/commands/daemon/shared.js +213 -213
- package/src/commands/daemon.js +11 -11
- package/src/commands/guide.js +174 -174
- package/src/commands/ingest.js +58 -58
- package/src/commands/init.js +55 -55
- package/src/commands/legacy-args.js +10 -10
- package/src/commands/mcp.js +461 -404
- package/src/commands/omargate.js +15 -15
- package/src/commands/persona.js +20 -20
- package/src/commands/plugin.js +260 -260
- package/src/commands/policy.js +132 -132
- package/src/commands/prompt.js +238 -238
- package/src/commands/review.js +704 -704
- package/src/commands/scan.js +866 -788
- package/src/commands/spec.js +716 -716
- package/src/commands/swarm.js +651 -651
- package/src/commands/telemetry.js +202 -202
- package/src/commands/watch.js +510 -510
- package/src/config/agent-dictionary.js +182 -182
- package/src/config/io.js +56 -56
- package/src/config/paths.js +18 -18
- package/src/config/schema.js +55 -55
- package/src/config/service.js +184 -184
- package/src/cost/budget.js +235 -235
- package/src/cost/history.js +188 -188
- package/src/cost/tracker.js +171 -171
- package/src/daemon/artifact-lineage.js +534 -534
- package/src/daemon/assignment-ledger.js +770 -770
- package/src/daemon/ast-parser-layer.js +258 -258
- package/src/daemon/budget-governor.js +633 -633
- package/src/daemon/callgraph-overlay.js +646 -646
- package/src/daemon/error-worker.js +626 -626
- package/src/daemon/hybrid-mapper.js +929 -929
- package/src/daemon/ingest-refresh.js +195 -0
- package/src/daemon/jira-lifecycle.js +632 -632
- package/src/daemon/operator-control.js +657 -657
- package/src/daemon/reliability-lane.js +471 -471
- package/src/daemon/watchdog.js +971 -971
- package/src/guide/generator.js +316 -316
- package/src/ingest/engine.js +918 -918
- package/src/interactive/action-menu.js +132 -0
- package/src/interactive/auto-ingest.js +111 -0
- package/src/interactive/index.js +95 -0
- package/src/interactive/workspace.js +92 -0
- package/src/legacy-cli.js +2548 -2435
- package/src/mcp/registry.js +695 -695
- package/src/memory/blackboard.js +301 -301
- package/src/memory/retrieval.js +581 -581
- package/src/plugin/manifest.js +553 -553
- package/src/policy/packs.js +144 -144
- package/src/prompt/generator.js +118 -106
- package/src/review/ai-review.js +669 -669
- package/src/review/local-review.js +1284 -1284
- package/src/review/replay.js +235 -235
- package/src/review/report.js +664 -664
- package/src/review/spec-binding.js +487 -487
- package/src/scaffold/generator.js +67 -0
- package/src/scaffold/templates.js +150 -0
- package/src/scan/generator.js +418 -351
- package/src/scan/gh-secrets.js +107 -0
- package/src/spec/generator.js +519 -519
- package/src/spec/regenerate.js +237 -237
- package/src/spec/templates.js +91 -91
- package/src/swarm/dashboard.js +247 -247
- package/src/swarm/factory.js +363 -363
- package/src/swarm/pentest.js +934 -934
- package/src/swarm/registry.js +419 -419
- package/src/swarm/report.js +158 -158
- package/src/swarm/runtime.js +576 -576
- package/src/swarm/scenario-dsl.js +272 -272
- package/src/telemetry/ledger.js +302 -302
- package/src/telemetry/session-tracker.js +118 -0
- package/src/telemetry/sync.js +190 -0
- package/src/ui/markdown.js +220 -220
package/src/agents/jules/loop.js
CHANGED
|
@@ -1,367 +1,367 @@
|
|
|
1
|
-
import { randomUUID } from "node:crypto";
|
|
2
|
-
import { createMultiProviderApiClient } from "../../ai/client.js";
|
|
3
|
-
import { evaluateBudget } from "../../cost/budget.js";
|
|
4
|
-
import { dispatchTool, createAgentContext, BudgetExhaustedError } from "./tools/dispatch.js";
|
|
5
|
-
import { JULES_DEFINITION } from "./config/definition.js";
|
|
6
|
-
import { shouldSpawnSubAgents, runJulesSwarm } from "./swarm/orchestrator.js";
|
|
7
|
-
import { frontendAnalyze } from "./tools/frontend-analyze.js";
|
|
8
|
-
|
|
9
|
-
/**
|
|
10
|
-
* Jules Tanaka — Agentic Loop
|
|
11
|
-
*
|
|
12
|
-
* Core state machine: LLM → tool_use → execute → result → LLM → repeat
|
|
13
|
-
* With sub-agent swarm integration for large codebases.
|
|
14
|
-
*
|
|
15
|
-
* This loop is self-contained: it uses the existing ai/client.js for LLM calls,
|
|
16
|
-
* the existing cost/budget.js for budget enforcement, and the Jules tool
|
|
17
|
-
* dispatch for tool execution. No dependency on Batches O-Q.
|
|
18
|
-
*/
|
|
19
|
-
|
|
20
|
-
// Default cap on LLM turns for one audit run; used when config.maxTurns is not supplied.
const DEFAULT_MAX_TURNS = 25;
|
|
21
|
-
// A "heartbeat" event is emitted whenever the turn counter is a multiple of this value.
const HEARTBEAT_INTERVAL_TURNS = 5;
|
|
22
|
-
|
|
23
|
-
/**
 * Run Jules' agentic audit loop.
 *
 * Phases, in order:
 *   0. Framework detection via `frontendAnalyze` (best effort).
 *   1. Optional sub-agent swarm, only when `shouldSpawnSubAgents` says so AND a
 *      blackboard is supplied. The swarm is given 60% of the cost cap.
 *   2. LLM loop: invoke the model, run any ```tool_use blocks it emits, feed the
 *      results back, and repeat until the model answers without tool calls,
 *      the turn cap is hit, the budget blocks, the run is aborted, or the LLM
 *      call fails.
 *   3. Build the final report and emit `agent_complete`.
 *
 * Every event is both yielded and, when `config.onEvent` is set, passed to that
 * callback. The final report object is the generator's return value (the
 * `value` of the `{ done: true }` result), not a yielded event.
 *
 * @param {object} config
 * @param {string} config.systemPrompt - Jules' full system prompt
 * @param {object} config.scopeMap - { primary, secondary, tertiary } file lists
 * @param {string} config.rootPath - Codebase root
 * @param {object} [config.omarBaseline] - Deterministic baseline findings (if available)
 * @param {object} [config.blackboard] - Shared blackboard for cross-agent findings
 * @param {object} [config.memory] - Memory index for cross-run recall
 * @param {object} [config.budget] - Budget overrides (merged over JULES_DEFINITION.budget)
 * @param {object} [config.provider] - LLM provider overrides
 * @param {string} [config.mode] - "primary" | "secondary" | "tertiary"
 * @param {number} [config.maxTurns] - Max loop iterations
 * @param {AbortController} [config.abortController]
 * @param {function} [config.onEvent] - Streaming event callback
 * @returns {AsyncGenerator<JulesEvent>} Yields events as they occur; returns the report
 */
export async function* julesAuditLoop(config) {
  const {
    systemPrompt,
    scopeMap,
    rootPath,
    omarBaseline,
    blackboard,
    memory,
    provider,
    mode = "primary",
    maxTurns = DEFAULT_MAX_TURNS,
    abortController,
    onEvent,
  } = config;

  const budget = { ...JULES_DEFINITION.budget, ...config.budget };
  const runId = `jules-${Date.now()}-${randomUUID().slice(0, 8)}`;
  const startedAt = Date.now();
  const client = createMultiProviderApiClient(provider || {});

  const ctx = createAgentContext({
    agentIdentity: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona },
    budget,
    runId,
    onEvent,
  });

  // Build an event envelope with a usage snapshot, push it to onEvent, and
  // return it so the caller can `yield` the very same object.
  const emit = (event, payload) => {
    const evt = {
      stream: "sl_event",
      event,
      agent: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona, color: JULES_DEFINITION.color, avatar: JULES_DEFINITION.avatar },
      payload,
      usage: {
        costUsd: ctx.usage.costUsd,
        outputTokens: ctx.usage.outputTokens,
        toolCalls: ctx.usage.toolCalls,
        durationMs: Date.now() - startedAt,
      },
    };
    if (onEvent) onEvent(evt);
    return evt;
  };

  yield emit("agent_start", { mode, runId, maxTurns, budget });

  // ── Phase 0: Prerequisites ────────────────────────────────────────

  yield emit("progress", { phase: "prerequisites", message: "Detecting framework..." });

  let framework = {};
  try {
    // Fall back to {} so a null/undefined result cannot break the property
    // reads further down, which sit outside this try block.
    framework = frontendAnalyze({ operation: "detect_framework", path: rootPath }) || {};
    ctx.usage.toolCalls++;
    yield emit("tool_result", { tool: "FrontendAnalyze", operation: "detect_framework", result: { framework: framework.framework, componentCount: framework.componentCount } });
  } catch { /* proceed without */ }

  // ── Phase 1: Swarm or direct? ─────────────────────────────────────

  const spawnDecision = shouldSpawnSubAgents(scopeMap);
  let swarmFindings = [];

  if (spawnDecision.spawn && blackboard) {
    yield emit("progress", { phase: "swarm", message: `Large frontend (${spawnDecision.reason}). Spawning sub-agents...` });

    const swarmResult = await runJulesSwarm({
      scopeMap,
      rootPath,
      blackboard,
      budget: { ...budget, maxCostUsd: budget.maxCostUsd * 0.6 }, // 60% for swarm
      provider,
      parentAbort: abortController,
      onEvent,
    });

    // An agent result without a findings array contributes nothing, rather
    // than an `undefined` entry that would crash the consumers below.
    swarmFindings = swarmResult.agentResults.flatMap((r) => r?.findings ?? []);
    ctx.usage.costUsd += swarmResult.usage.totalCostUsd;
    ctx.usage.toolCalls += swarmResult.usage.totalToolCalls;

    yield emit("swarm_complete", {
      totalFindings: swarmFindings.length,
      totalAgents: swarmResult.usage.totalAgents,
      totalCostUsd: swarmResult.usage.totalCostUsd,
    });
  }

  // ── Phase 2: Jules primary deep analysis (agentic LLM loop) ──────

  yield emit("progress", { phase: "deep_analysis", message: "Starting deep analysis..." });

  // Build context for LLM
  const contextParts = [];
  contextParts.push(`Framework: ${framework.framework || "unknown"}`);
  contextParts.push(`Mode: ${mode}`);
  contextParts.push(`Components: ${framework.componentCount || "unknown"}`);
  contextParts.push(`Scope: ${(scopeMap.primary || []).length} primary files`);

  if (swarmFindings.length > 0) {
    contextParts.push(`\nSub-agent findings (${swarmFindings.length} total):`);
    // Only the first 30 are shown to the model to bound prompt size.
    for (const f of swarmFindings.slice(0, 30)) {
      contextParts.push(`- [${f.severity || "P3"}] ${f.file || ""}:${f.line || ""} ${f.title || f.type || ""}`);
    }
  }

  if (omarBaseline) {
    const baselineFindings = omarBaseline.findings || omarBaseline.summary || [];
    if (Array.isArray(baselineFindings) && baselineFindings.length > 0) {
      contextParts.push(`\nOmar baseline findings (${baselineFindings.length}):`);
      for (const f of baselineFindings.slice(0, 20)) {
        contextParts.push(`- [${f.severity || ""}] ${f.file || ""}:${f.line || ""} ${f.message || f.title || ""}`);
      }
    }
  }

  if (memory) {
    try {
      // `await` is a no-op for a synchronous query and resolves the result of
      // an async one; without it a Promise has no `.length` and recall is lost.
      const recalled = memory.query
        ? await memory.query({
          files: (scopeMap.primary || []).map((f) => f.path || f),
          limit: 10,
        })
        : [];
      if (recalled?.length > 0) {
        contextParts.push(`\nPrevious findings recalled from memory (${recalled.length}):`);
        for (const r of recalled) {
          contextParts.push(`- ${r.content || r.text || JSON.stringify(r).slice(0, 100)}`);
        }
      }
    } catch { /* memory recall failure is non-blocking */ }
  }

  const messages = [
    { role: "user", content: contextParts.join("\n") +
      "\n\nPerform your deep analysis now. Use FileRead, Grep, Glob, and FrontendAnalyze tools as needed. " +
      "Return your findings in a ```json code block as an array of { severity, file, line, title, evidence, rootCause, recommendedFix, trafficLight }." },
  ];

  const allFindings = [...swarmFindings];
  let turnCount = 0;

  while (turnCount < maxTurns) {
    if (abortController?.signal.aborted) {
      yield emit("agent_abort", { reason: "user_cancelled" });
      break;
    }

    // Budget check before LLM call
    const preCheck = evaluateBudget({
      sessionSummary: {
        costUsd: ctx.usage.costUsd,
        outputTokens: ctx.usage.outputTokens,
        durationMs: Date.now() - startedAt,
        toolCalls: ctx.usage.toolCalls,
      },
      ...budget,
    });

    if (preCheck.blocking) {
      yield emit("budget_stop", { reasons: preCheck.reasons });
      break;
    }

    if (preCheck.warnings.length > 0) {
      yield emit("budget_warning", { warnings: preCheck.warnings });
    }

    turnCount++;

    // Heartbeat
    if (turnCount % HEARTBEAT_INTERVAL_TURNS === 0) {
      // Without a finite cost cap there is no meaningful "remaining" figure;
      // report null instead of NaN.
      const cap = budget.maxCostUsd;
      const hasCap = typeof cap === "number" && Number.isFinite(cap);
      yield emit("heartbeat", {
        turnsCompleted: turnCount,
        turnsMax: maxTurns,
        findingsSoFar: allFindings.length,
        budgetRemaining: {
          costUsd: hasCap ? Math.max(0, cap - ctx.usage.costUsd) : null,
          pct: hasCap
            ? (cap > 0 ? Math.max(0, 100 - (ctx.usage.costUsd / cap) * 100) : 0)
            : null,
        },
      });
    }

    // Call LLM
    let response;
    try {
      response = await client.invoke({
        systemPrompt,
        messages,
      });
    } catch (err) {
      yield emit("llm_error", { error: err.message, turn: turnCount });
      break;
    }

    // Treat a missing or non-string body as an empty answer.
    const responseText = typeof response?.text === "string" ? response.text : "";

    // Usage is estimated, not metered: ~4 characters per token, charged at
    // 15 USD per million tokens.
    const estimatedTokens = Math.ceil(responseText.length / 4);
    ctx.usage.outputTokens += estimatedTokens;
    ctx.usage.costUsd += (estimatedTokens / 1_000_000) * 15;

    yield emit("reasoning", {
      phase: "deep_analysis",
      turn: turnCount,
      summary: responseText.slice(0, 200),
    });

    // Parse tool_use blocks
    const toolCalls = parseToolUseBlocks(responseText);

    if (toolCalls.length === 0) {
      // No tools — extract findings from response
      const parsed = extractJsonFindings(responseText);
      for (const finding of parsed) {
        allFindings.push(finding);
        yield emit("finding", { ...finding });
        if (blackboard) {
          try {
            await blackboard.appendEntry({
              agentId: JULES_DEFINITION.id,
              source: "jules-primary",
              ...finding,
            });
          } catch { /* blackboard write failure non-blocking */ }
        }
      }
      messages.push({ role: "assistant", content: responseText });
      break; // LLM is done
    }

    // Execute tool calls
    const results = [];
    let budgetExhausted = false;
    for (const call of toolCalls) {
      try {
        const result = await dispatchTool(call.tool, call.input, ctx);
        results.push({ tool: call.tool, result });
        yield emit("tool_call", { tool: call.tool, input: sanitizeForEvent(call.input) });
      } catch (err) {
        if (err instanceof BudgetExhaustedError) {
          yield emit("budget_stop", { reason: err.message });
          budgetExhausted = true;
          break;
        }
        results.push({ tool: call.tool, error: err.message });
      }
    }

    // A budget stop must end the whole run, not only the tool batch; otherwise
    // the loop would go on to issue another LLM call after "budget_stop".
    if (budgetExhausted) break;

    // Feed results back
    messages.push({ role: "assistant", content: responseText });
    messages.push({
      role: "user",
      content: results.map((r) =>
        r.error
          ? `Tool ${r.tool} failed: ${r.error}`
          : `Tool ${r.tool} result:\n${JSON.stringify(r.result).slice(0, 3000)}`,
      ).join("\n\n") + "\n\nContinue your analysis. If done, return findings in a ```json code block.",
    });
  }

  // ── Phase 3: Build final report ───────────────────────────────────

  const durationMs = Date.now() - startedAt;
  const severityCounts = { P0: 0, P1: 0, P2: 0, P3: 0 };
  for (const f of allFindings) {
    // Findings come from LLM output, so tolerate null entries and non-string
    // severities; anything unrecognised is counted as P3.
    const sev = String(f?.severity || "P3").toUpperCase();
    if (severityCounts[sev] !== undefined) severityCounts[sev]++;
    else severityCounts.P3++;
  }

  const report = {
    runId,
    persona: JULES_DEFINITION.persona,
    mode,
    framework: framework.framework || "unknown",
    status: "completed",
    findings: allFindings,
    summary: {
      total: allFindings.length,
      ...severityCounts,
      blocking: severityCounts.P0 > 0 || severityCounts.P1 > 0,
    },
    usage: {
      turns: turnCount,
      costUsd: ctx.usage.costUsd,
      outputTokens: ctx.usage.outputTokens,
      toolCalls: ctx.usage.toolCalls,
      durationMs,
    },
    signature: JULES_DEFINITION.signature,
  };

  yield emit("agent_complete", {
    ...report.summary,
    costUsd: ctx.usage.costUsd,
    durationMs,
    turns: turnCount,
  });

  return report;
}
|
|
334
|
-
|
|
335
|
-
// ── Helpers ──────────────────────────────────────────────────────────
|
|
336
|
-
|
|
337
|
-
/**
 * Extract tool invocations from the ```tool_use fenced blocks of an LLM response.
 *
 * Each fence body must be JSON of the form `{ "tool": "<name>", "input": { ... } }`.
 * Blocks that are not valid JSON, or whose `tool` is not a non-empty string or
 * whose `input` is not a plain (non-array) object, are skipped silently so one
 * bad block cannot abort the turn or hand a malformed call to the dispatcher.
 *
 * @param {string} text - Raw LLM response text
 * @returns {Array<{tool: string, input: object}>} Parsed calls, in order of appearance
 */
function parseToolUseBlocks(text) {
  const calls = [];
  if (typeof text !== "string") return calls;

  // Fresh regex per call: a /g regex is stateful, so it must not be shared.
  const fencePattern = /```tool_use\s*\n([\s\S]*?)```/g;

  for (const [, body] of text.matchAll(fencePattern)) {
    let parsed;
    try {
      parsed = JSON.parse(body.trim());
    } catch {
      continue; // skip malformed JSON
    }

    const isRecord = parsed !== null && typeof parsed === "object";
    const hasToolName = isRecord && typeof parsed.tool === "string" && parsed.tool !== "";
    const hasObjectInput =
      isRecord &&
      parsed.input !== null &&
      typeof parsed.input === "object" &&
      !Array.isArray(parsed.input);

    if (hasToolName && hasObjectInput) calls.push(parsed);
  }

  return calls;
}
|
|
349
|
-
|
|
350
|
-
/**
 * Pull the findings array out of an LLM response.
 *
 * Scans the ```json fenced blocks in order and uses the first one that parses
 * to either an array or an object with a `findings` array. Blocks that fail to
 * parse, or parse to something else, are skipped so an earlier malformed or
 * unrelated block does not hide a later valid one.
 *
 * Entries that are not plain objects (null, strings, numbers, arrays) are
 * dropped: callers read properties such as `severity` from every finding.
 *
 * @param {string} text - Raw LLM response text
 * @returns {object[]} Finding objects; empty when none could be extracted
 */
function extractJsonFindings(text) {
  if (typeof text !== "string") return [];

  // Fresh regex per call: a /g regex is stateful, so it must not be shared.
  const fencePattern = /```json\s*\n([\s\S]*?)```/g;

  for (const [, body] of text.matchAll(fencePattern)) {
    let parsed;
    try {
      parsed = JSON.parse(body.trim());
    } catch {
      continue; // skip malformed JSON and try the next block
    }

    const candidates = Array.isArray(parsed) ? parsed : parsed?.findings;
    if (Array.isArray(candidates)) {
      return candidates.filter(
        (entry) => entry !== null && typeof entry === "object" && !Array.isArray(entry),
      );
    }
  }

  return [];
}
|
|
360
|
-
|
|
361
|
-
/**
 * Produce a shallow copy of a tool input that is safe to attach to an event.
 *
 * A string `content` field longer than `maxContentLength` is replaced with a
 * `[N chars]` placeholder so large payloads are not streamed to event
 * consumers. All other fields are copied unchanged and the original object is
 * never mutated.
 *
 * @param {object} input - Tool input as supplied by the LLM
 * @param {number} [maxContentLength=200] - Longest `content` passed through verbatim
 * @returns {object} Shallow copy with an oversized `content` summarised
 */
function sanitizeForEvent(input, maxContentLength = 200) {
  const sanitized = { ...input };
  const { content } = sanitized;
  if (typeof content === "string" && content.length > maxContentLength) {
    sanitized.content = `[${content.length} chars]`;
  }
  return sanitized;
}
|
|
1
|
+
import { randomUUID } from "node:crypto";
|
|
2
|
+
import { createMultiProviderApiClient } from "../../ai/client.js";
|
|
3
|
+
import { evaluateBudget } from "../../cost/budget.js";
|
|
4
|
+
import { dispatchTool, createAgentContext, BudgetExhaustedError } from "./tools/dispatch.js";
|
|
5
|
+
import { JULES_DEFINITION } from "./config/definition.js";
|
|
6
|
+
import { shouldSpawnSubAgents, runJulesSwarm } from "./swarm/orchestrator.js";
|
|
7
|
+
import { frontendAnalyze } from "./tools/frontend-analyze.js";
|
|
8
|
+
|
|
9
|
+
/**
|
|
10
|
+
* Jules Tanaka — Agentic Loop
|
|
11
|
+
*
|
|
12
|
+
* Core state machine: LLM → tool_use → execute → result → LLM → repeat
|
|
13
|
+
* With sub-agent swarm integration for large codebases.
|
|
14
|
+
*
|
|
15
|
+
* This loop is self-contained: it uses the existing ai/client.js for LLM calls,
|
|
16
|
+
* the existing cost/budget.js for budget enforcement, and the Jules tool
|
|
17
|
+
* dispatch for tool execution. No dependency on Batches O-Q.
|
|
18
|
+
*/
|
|
19
|
+
|
|
20
|
+
const DEFAULT_MAX_TURNS = 25;
|
|
21
|
+
const HEARTBEAT_INTERVAL_TURNS = 5;
|
|
22
|
+
|
|
23
|
+
/**
|
|
24
|
+
* Run Jules' agentic audit loop.
|
|
25
|
+
*
|
|
26
|
+
* @param {object} config
|
|
27
|
+
* @param {string} config.systemPrompt - Jules' full system prompt
|
|
28
|
+
* @param {object} config.scopeMap - { primary, secondary, tertiary } file lists
|
|
29
|
+
* @param {string} config.rootPath - Codebase root
|
|
30
|
+
* @param {object} [config.omarBaseline] - Deterministic baseline findings (if available)
|
|
31
|
+
* @param {object} [config.blackboard] - Shared blackboard for cross-agent findings
|
|
32
|
+
* @param {object} [config.memory] - Memory index for cross-run recall
|
|
33
|
+
* @param {object} [config.budget] - Budget overrides
|
|
34
|
+
* @param {object} [config.provider] - LLM provider overrides
|
|
35
|
+
* @param {string} [config.mode] - "primary" | "secondary" | "tertiary"
|
|
36
|
+
* @param {number} [config.maxTurns] - Max loop iterations
|
|
37
|
+
* @param {AbortController} [config.abortController]
|
|
38
|
+
* @param {function} [config.onEvent] - Streaming event callback
|
|
39
|
+
* @returns {AsyncGenerator<JulesEvent>} Yields events as they occur
|
|
40
|
+
*/
|
|
41
|
+
export async function* julesAuditLoop(config) {
|
|
42
|
+
const {
|
|
43
|
+
systemPrompt,
|
|
44
|
+
scopeMap,
|
|
45
|
+
rootPath,
|
|
46
|
+
omarBaseline,
|
|
47
|
+
blackboard,
|
|
48
|
+
memory,
|
|
49
|
+
provider,
|
|
50
|
+
mode = "primary",
|
|
51
|
+
maxTurns = DEFAULT_MAX_TURNS,
|
|
52
|
+
abortController,
|
|
53
|
+
onEvent,
|
|
54
|
+
} = config;
|
|
55
|
+
|
|
56
|
+
const budget = { ...JULES_DEFINITION.budget, ...config.budget };
|
|
57
|
+
const runId = `jules-${Date.now()}-${randomUUID().slice(0, 8)}`;
|
|
58
|
+
const startedAt = Date.now();
|
|
59
|
+
const client = createMultiProviderApiClient(provider || {});
|
|
60
|
+
|
|
61
|
+
const ctx = createAgentContext({
|
|
62
|
+
agentIdentity: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona },
|
|
63
|
+
budget,
|
|
64
|
+
runId,
|
|
65
|
+
onEvent,
|
|
66
|
+
});
|
|
67
|
+
|
|
68
|
+
const emit = (event, payload) => {
|
|
69
|
+
const evt = {
|
|
70
|
+
stream: "sl_event",
|
|
71
|
+
event,
|
|
72
|
+
agent: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona, color: JULES_DEFINITION.color, avatar: JULES_DEFINITION.avatar },
|
|
73
|
+
payload,
|
|
74
|
+
usage: {
|
|
75
|
+
costUsd: ctx.usage.costUsd,
|
|
76
|
+
outputTokens: ctx.usage.outputTokens,
|
|
77
|
+
toolCalls: ctx.usage.toolCalls,
|
|
78
|
+
durationMs: Date.now() - startedAt,
|
|
79
|
+
},
|
|
80
|
+
};
|
|
81
|
+
if (onEvent) onEvent(evt);
|
|
82
|
+
return evt;
|
|
83
|
+
};
|
|
84
|
+
|
|
85
|
+
yield emit("agent_start", { mode, runId, maxTurns, budget });
|
|
86
|
+
|
|
87
|
+
// ── Phase 0: Prerequisites ────────────────────────────────────────
|
|
88
|
+
|
|
89
|
+
yield emit("progress", { phase: "prerequisites", message: "Detecting framework..." });
|
|
90
|
+
|
|
91
|
+
let framework = {};
|
|
92
|
+
try {
|
|
93
|
+
framework = frontendAnalyze({ operation: "detect_framework", path: rootPath });
|
|
94
|
+
ctx.usage.toolCalls++;
|
|
95
|
+
yield emit("tool_result", { tool: "FrontendAnalyze", operation: "detect_framework", result: { framework: framework.framework, componentCount: framework.componentCount } });
|
|
96
|
+
} catch { /* proceed without */ }
|
|
97
|
+
|
|
98
|
+
// ── Phase 1: Swarm or direct? ─────────────────────────────────────
|
|
99
|
+
|
|
100
|
+
const spawnDecision = shouldSpawnSubAgents(scopeMap);
|
|
101
|
+
let swarmFindings = [];
|
|
102
|
+
|
|
103
|
+
if (spawnDecision.spawn && blackboard) {
|
|
104
|
+
yield emit("progress", { phase: "swarm", message: `Large frontend (${spawnDecision.reason}). Spawning sub-agents...` });
|
|
105
|
+
|
|
106
|
+
const swarmResult = await runJulesSwarm({
|
|
107
|
+
scopeMap,
|
|
108
|
+
rootPath,
|
|
109
|
+
blackboard,
|
|
110
|
+
budget: { ...budget, maxCostUsd: budget.maxCostUsd * 0.6 }, // 60% for swarm
|
|
111
|
+
provider,
|
|
112
|
+
parentAbort: abortController,
|
|
113
|
+
onEvent,
|
|
114
|
+
});
|
|
115
|
+
|
|
116
|
+
swarmFindings = swarmResult.agentResults.flatMap(r => r.findings);
|
|
117
|
+
ctx.usage.costUsd += swarmResult.usage.totalCostUsd;
|
|
118
|
+
ctx.usage.toolCalls += swarmResult.usage.totalToolCalls;
|
|
119
|
+
|
|
120
|
+
yield emit("swarm_complete", {
|
|
121
|
+
totalFindings: swarmFindings.length,
|
|
122
|
+
totalAgents: swarmResult.usage.totalAgents,
|
|
123
|
+
totalCostUsd: swarmResult.usage.totalCostUsd,
|
|
124
|
+
});
|
|
125
|
+
}
|
|
126
|
+
|
|
127
|
+
// ── Phase 2: Jules primary deep analysis (agentic LLM loop) ──────
|
|
128
|
+
|
|
129
|
+
yield emit("progress", { phase: "deep_analysis", message: "Starting deep analysis..." });
|
|
130
|
+
|
|
131
|
+
// Build context for LLM
|
|
132
|
+
const contextParts = [];
|
|
133
|
+
contextParts.push(`Framework: ${framework.framework || "unknown"}`);
|
|
134
|
+
contextParts.push(`Mode: ${mode}`);
|
|
135
|
+
contextParts.push(`Components: ${framework.componentCount || "unknown"}`);
|
|
136
|
+
contextParts.push(`Scope: ${(scopeMap.primary || []).length} primary files`);
|
|
137
|
+
|
|
138
|
+
if (swarmFindings.length > 0) {
|
|
139
|
+
contextParts.push(`\nSub-agent findings (${swarmFindings.length} total):`);
|
|
140
|
+
for (const f of swarmFindings.slice(0, 30)) {
|
|
141
|
+
contextParts.push(`- [${f.severity || "P3"}] ${f.file || ""}:${f.line || ""} ${f.title || f.type || ""}`);
|
|
142
|
+
}
|
|
143
|
+
}
|
|
144
|
+
|
|
145
|
+
if (omarBaseline) {
|
|
146
|
+
const baselineFindings = omarBaseline.findings || omarBaseline.summary || [];
|
|
147
|
+
if (Array.isArray(baselineFindings) && baselineFindings.length > 0) {
|
|
148
|
+
contextParts.push(`\nOmar baseline findings (${baselineFindings.length}):`);
|
|
149
|
+
for (const f of baselineFindings.slice(0, 20)) {
|
|
150
|
+
contextParts.push(`- [${f.severity || ""}] ${f.file || ""}:${f.line || ""} ${f.message || f.title || ""}`);
|
|
151
|
+
}
|
|
152
|
+
}
|
|
153
|
+
}
|
|
154
|
+
|
|
155
|
+
if (memory) {
|
|
156
|
+
try {
|
|
157
|
+
const recalled = memory.query ? memory.query({
|
|
158
|
+
files: (scopeMap.primary || []).map(f => f.path || f),
|
|
159
|
+
limit: 10,
|
|
160
|
+
}) : [];
|
|
161
|
+
if (recalled.length > 0) {
|
|
162
|
+
contextParts.push(`\nPrevious findings recalled from memory (${recalled.length}):`);
|
|
163
|
+
for (const r of recalled) {
|
|
164
|
+
contextParts.push(`- ${r.content || r.text || JSON.stringify(r).slice(0, 100)}`);
|
|
165
|
+
}
|
|
166
|
+
}
|
|
167
|
+
} catch { /* memory recall failure is non-blocking */ }
|
|
168
|
+
}
|
|
169
|
+
|
|
170
|
+
const messages = [
|
|
171
|
+
{ role: "user", content: contextParts.join("\n") +
|
|
172
|
+
"\n\nPerform your deep analysis now. Use FileRead, Grep, Glob, and FrontendAnalyze tools as needed. " +
|
|
173
|
+
"Return your findings in a ```json code block as an array of { severity, file, line, title, evidence, rootCause, recommendedFix, trafficLight }." },
|
|
174
|
+
];
|
|
175
|
+
|
|
176
|
+
const allFindings = [...swarmFindings];
|
|
177
|
+
let turnCount = 0;
|
|
178
|
+
|
|
179
|
+
while (turnCount < maxTurns) {
|
|
180
|
+
if (abortController?.signal.aborted) {
|
|
181
|
+
yield emit("agent_abort", { reason: "user_cancelled" });
|
|
182
|
+
break;
|
|
183
|
+
}
|
|
184
|
+
|
|
185
|
+
// Budget check before LLM call
|
|
186
|
+
const preCheck = evaluateBudget({
|
|
187
|
+
sessionSummary: {
|
|
188
|
+
costUsd: ctx.usage.costUsd,
|
|
189
|
+
outputTokens: ctx.usage.outputTokens,
|
|
190
|
+
durationMs: Date.now() - startedAt,
|
|
191
|
+
toolCalls: ctx.usage.toolCalls,
|
|
192
|
+
},
|
|
193
|
+
...budget,
|
|
194
|
+
});
|
|
195
|
+
|
|
196
|
+
if (preCheck.blocking) {
|
|
197
|
+
yield emit("budget_stop", { reasons: preCheck.reasons });
|
|
198
|
+
break;
|
|
199
|
+
}
|
|
200
|
+
|
|
201
|
+
if (preCheck.warnings.length > 0) {
|
|
202
|
+
yield emit("budget_warning", { warnings: preCheck.warnings });
|
|
203
|
+
}
|
|
204
|
+
|
|
205
|
+
turnCount++;
|
|
206
|
+
|
|
207
|
+
// Heartbeat
|
|
208
|
+
if (turnCount % HEARTBEAT_INTERVAL_TURNS === 0) {
|
|
209
|
+
yield emit("heartbeat", {
|
|
210
|
+
turnsCompleted: turnCount,
|
|
211
|
+
turnsMax: maxTurns,
|
|
212
|
+
findingsSoFar: allFindings.length,
|
|
213
|
+
budgetRemaining: {
|
|
214
|
+
costUsd: Math.max(0, budget.maxCostUsd - ctx.usage.costUsd),
|
|
215
|
+
pct: Math.max(0, 100 - (ctx.usage.costUsd / budget.maxCostUsd * 100)),
|
|
216
|
+
},
|
|
217
|
+
});
|
|
218
|
+
}
|
|
219
|
+
|
|
220
|
+
// Call LLM
|
|
221
|
+
let response;
|
|
222
|
+
try {
|
|
223
|
+
response = await client.invoke({
|
|
224
|
+
systemPrompt,
|
|
225
|
+
messages,
|
|
226
|
+
});
|
|
227
|
+
} catch (err) {
|
|
228
|
+
yield emit("llm_error", { error: err.message, turn: turnCount });
|
|
229
|
+
break;
|
|
230
|
+
}
|
|
231
|
+
|
|
232
|
+
const responseText = response.text || "";
|
|
233
|
+
ctx.usage.outputTokens += Math.ceil(responseText.length / 4);
|
|
234
|
+
ctx.usage.costUsd += (Math.ceil(responseText.length / 4) / 1_000_000) * 15;
|
|
235
|
+
|
|
236
|
+
yield emit("reasoning", {
|
|
237
|
+
phase: "deep_analysis",
|
|
238
|
+
turn: turnCount,
|
|
239
|
+
summary: responseText.slice(0, 200),
|
|
240
|
+
});
|
|
241
|
+
|
|
242
|
+
// Parse tool_use blocks
|
|
243
|
+
const toolCalls = parseToolUseBlocks(responseText);
|
|
244
|
+
|
|
245
|
+
if (toolCalls.length === 0) {
|
|
246
|
+
// No tools — extract findings from response
|
|
247
|
+
const parsed = extractJsonFindings(responseText);
|
|
248
|
+
for (const finding of parsed) {
|
|
249
|
+
allFindings.push(finding);
|
|
250
|
+
yield emit("finding", { ...finding });
|
|
251
|
+
if (blackboard) {
|
|
252
|
+
try {
|
|
253
|
+
await blackboard.appendEntry({
|
|
254
|
+
agentId: JULES_DEFINITION.id,
|
|
255
|
+
source: "jules-primary",
|
|
256
|
+
...finding,
|
|
257
|
+
});
|
|
258
|
+
} catch { /* blackboard write failure non-blocking */ }
|
|
259
|
+
}
|
|
260
|
+
}
|
|
261
|
+
messages.push({ role: "assistant", content: responseText });
|
|
262
|
+
break; // LLM is done
|
|
263
|
+
}
|
|
264
|
+
|
|
265
|
+
// Execute tool calls
|
|
266
|
+
const results = [];
|
|
267
|
+
for (const call of toolCalls) {
|
|
268
|
+
try {
|
|
269
|
+
const result = await dispatchTool(call.tool, call.input, ctx);
|
|
270
|
+
results.push({ tool: call.tool, result });
|
|
271
|
+
yield emit("tool_call", { tool: call.tool, input: sanitizeForEvent(call.input) });
|
|
272
|
+
} catch (err) {
|
|
273
|
+
if (err instanceof BudgetExhaustedError) {
|
|
274
|
+
yield emit("budget_stop", { reason: err.message });
|
|
275
|
+
break;
|
|
276
|
+
}
|
|
277
|
+
results.push({ tool: call.tool, error: err.message });
|
|
278
|
+
}
|
|
279
|
+
}
|
|
280
|
+
|
|
281
|
+
// Feed results back
|
|
282
|
+
messages.push({ role: "assistant", content: responseText });
|
|
283
|
+
messages.push({
|
|
284
|
+
role: "user",
|
|
285
|
+
content: results.map(r =>
|
|
286
|
+
r.error
|
|
287
|
+
? `Tool ${r.tool} failed: ${r.error}`
|
|
288
|
+
: `Tool ${r.tool} result:\n${JSON.stringify(r.result).slice(0, 3000)}`,
|
|
289
|
+
).join("\n\n") + "\n\nContinue your analysis. If done, return findings in a ```json code block.",
|
|
290
|
+
});
|
|
291
|
+
}
|
|
292
|
+
|
|
293
|
+
// ── Phase 3: Build final report ───────────────────────────────────
|
|
294
|
+
|
|
295
|
+
const durationMs = Date.now() - startedAt;
|
|
296
|
+
const severityCounts = { P0: 0, P1: 0, P2: 0, P3: 0 };
|
|
297
|
+
for (const f of allFindings) {
|
|
298
|
+
const sev = (f.severity || "P3").toUpperCase();
|
|
299
|
+
if (severityCounts[sev] !== undefined) severityCounts[sev]++;
|
|
300
|
+
else severityCounts.P3++;
|
|
301
|
+
}
|
|
302
|
+
|
|
303
|
+
const report = {
|
|
304
|
+
runId,
|
|
305
|
+
persona: JULES_DEFINITION.persona,
|
|
306
|
+
mode,
|
|
307
|
+
framework: framework.framework || "unknown",
|
|
308
|
+
status: "completed",
|
|
309
|
+
findings: allFindings,
|
|
310
|
+
summary: {
|
|
311
|
+
total: allFindings.length,
|
|
312
|
+
...severityCounts,
|
|
313
|
+
blocking: severityCounts.P0 > 0 || severityCounts.P1 > 0,
|
|
314
|
+
},
|
|
315
|
+
usage: {
|
|
316
|
+
turns: turnCount,
|
|
317
|
+
costUsd: ctx.usage.costUsd,
|
|
318
|
+
outputTokens: ctx.usage.outputTokens,
|
|
319
|
+
toolCalls: ctx.usage.toolCalls,
|
|
320
|
+
durationMs,
|
|
321
|
+
},
|
|
322
|
+
signature: JULES_DEFINITION.signature,
|
|
323
|
+
};
|
|
324
|
+
|
|
325
|
+
yield emit("agent_complete", {
|
|
326
|
+
...report.summary,
|
|
327
|
+
costUsd: ctx.usage.costUsd,
|
|
328
|
+
durationMs,
|
|
329
|
+
turns: turnCount,
|
|
330
|
+
});
|
|
331
|
+
|
|
332
|
+
return report;
|
|
333
|
+
}
|
|
334
|
+
|
|
335
|
+
// ── Helpers ──────────────────────────────────────────────────────────
|
|
336
|
+
|
|
337
|
+
/**
 * Extract tool invocations from fenced "tool_use" code blocks in an LLM response.
 *
 * Each fenced block is expected to contain a JSON object shaped like
 * `{ "tool": "<name>", "input": { ... } }`. Blocks that are not valid JSON or
 * that do not match that shape are skipped rather than reported.
 *
 * @param {string} text - Raw response text from the model.
 * @returns {Array<{tool: string, input: object}>} Well-formed calls, in the
 *   order they appear in the text. Empty when `text` is not a string or
 *   contains no usable block.
 */
function parseToolUseBlocks(text) {
  if (typeof text !== "string" || text.length === 0) return [];

  const isRecord = (value) =>
    value !== null && typeof value === "object" && !Array.isArray(value);

  const calls = [];
  // matchAll works on a fresh iterator, so there is no lastIndex state to manage.
  for (const [, body] of text.matchAll(/```tool_use\s*\n([\s\S]*?)```/g)) {
    let parsed;
    try {
      parsed = JSON.parse(body.trim());
    } catch {
      continue; // malformed JSON inside the fence — ignore this block only
    }

    // Validate the shape instead of relying on truthiness: a string/array
    // `input` or a non-string `tool` must not be handed to the caller.
    if (!isRecord(parsed)) continue;
    if (typeof parsed.tool !== "string" || parsed.tool.length === 0) continue;
    if (!isRecord(parsed.input)) continue;

    calls.push(parsed);
  }
  return calls;
}
|
|
349
|
+
|
|
350
|
+
/**
 * Pull a findings list out of fenced "json" code blocks in an LLM response.
 *
 * Fenced blocks are examined in order. The first one whose JSON payload is
 * either an array or an object with an array-valued `findings` property
 * supplies the result; blocks that fail to parse or have another shape are
 * skipped so that a stray or malformed block does not hide a later valid one.
 *
 * Entries that are not plain objects (null, primitives, nested arrays) are
 * dropped, because callers read properties such as `severity` from each
 * finding and spread it into event payloads.
 *
 * @param {string} text - Raw response text from the model.
 * @returns {object[]} Finding objects; empty when none could be extracted.
 */
function extractJsonFindings(text) {
  if (typeof text !== "string") return [];

  for (const [, body] of text.matchAll(/```json\s*\n([\s\S]*?)```/g)) {
    let parsed;
    try {
      parsed = JSON.parse(body.trim());
    } catch {
      continue; // malformed JSON — try the next fenced block
    }

    let candidates = null;
    if (Array.isArray(parsed)) {
      candidates = parsed;
    } else if (Array.isArray(parsed?.findings)) {
      candidates = parsed.findings;
    }
    if (candidates === null) continue;

    return candidates.filter(
      (entry) => entry !== null && typeof entry === "object" && !Array.isArray(entry),
    );
  }
  return [];
}
|
|
360
|
+
|
|
361
|
+
/**
 * Produce a copy of a tool input that is safe to embed in an emitted event.
 *
 * The copy is shallow. A string `content` property longer than 200 characters
 * is replaced by a `[<length> chars]` placeholder so large payloads are not
 * echoed into the event stream. The caller's object is never modified.
 *
 * @param {object} input - Tool input as parsed from the model's tool call.
 * @returns {object} Shallow copy with oversized `content` redacted; an empty
 *   object when `input` is not an object.
 */
function sanitizeForEvent(input) {
  const maxContentChars = 200;

  // Spreading a string would explode it into per-character keys and leak the
  // whole payload, defeating the redaction below; treat every non-object the
  // same way null/number/boolean inputs already behaved.
  if (input === null || typeof input !== "object") return {};

  const sanitized = { ...input };
  const { content } = sanitized;
  if (typeof content === "string" && content.length > maxContentChars) {
    sanitized.content = `[${content.length} chars]`;
  }
  return sanitized;
}
|