sentinelayer-cli 0.1.2 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (127)
  1. package/README.md +996 -996
  2. package/bin/create-sentinelayer.js +5 -5
  3. package/bin/sentinelayer-cli.js +4 -4
  4. package/bin/sl.js +5 -5
  5. package/package.json +62 -54
  6. package/src/agents/jules/config/definition.js +209 -209
  7. package/src/agents/jules/config/system-prompt.js +175 -175
  8. package/src/agents/jules/error-intake.js +51 -51
  9. package/src/agents/jules/fix-cycle.js +377 -377
  10. package/src/agents/jules/loop.js +367 -367
  11. package/src/agents/jules/pulse.js +319 -319
  12. package/src/agents/jules/stream.js +186 -186
  13. package/src/agents/jules/swarm/file-scanner.js +74 -74
  14. package/src/agents/jules/swarm/index.js +11 -11
  15. package/src/agents/jules/swarm/orchestrator.js +362 -362
  16. package/src/agents/jules/swarm/pattern-hunter.js +123 -123
  17. package/src/agents/jules/swarm/sub-agent.js +308 -308
  18. package/src/agents/jules/tools/auth-audit.js +226 -222
  19. package/src/agents/jules/tools/dispatch.js +327 -327
  20. package/src/agents/jules/tools/file-edit.js +180 -180
  21. package/src/agents/jules/tools/file-read.js +100 -100
  22. package/src/agents/jules/tools/frontend-analyze.js +570 -570
  23. package/src/agents/jules/tools/glob.js +168 -168
  24. package/src/agents/jules/tools/grep.js +228 -228
  25. package/src/agents/jules/tools/index.js +29 -29
  26. package/src/agents/jules/tools/path-guards.js +161 -161
  27. package/src/agents/jules/tools/runtime-audit.js +493 -493
  28. package/src/agents/jules/tools/shell.js +383 -383
  29. package/src/ai/aidenid.js +972 -945
  30. package/src/ai/client.js +508 -508
  31. package/src/ai/domain-target-store.js +268 -268
  32. package/src/ai/identity-store.js +270 -270
  33. package/src/ai/site-store.js +145 -145
  34. package/src/audit/agents/architecture.js +180 -180
  35. package/src/audit/agents/compliance.js +179 -179
  36. package/src/audit/agents/documentation.js +165 -165
  37. package/src/audit/agents/performance.js +145 -145
  38. package/src/audit/agents/security.js +215 -215
  39. package/src/audit/agents/testing.js +172 -172
  40. package/src/audit/orchestrator.js +557 -557
  41. package/src/audit/package.js +204 -204
  42. package/src/audit/registry.js +284 -284
  43. package/src/audit/replay.js +103 -103
  44. package/src/auth/http.js +113 -113
  45. package/src/auth/service.js +891 -848
  46. package/src/auth/session-store.js +359 -345
  47. package/src/cli.js +252 -252
  48. package/src/commands/ai/identity-lifecycle.js +1338 -1337
  49. package/src/commands/ai/provision-governance.js +1272 -1246
  50. package/src/commands/ai/shared.js +147 -147
  51. package/src/commands/ai.js +11 -11
  52. package/src/commands/apply.js +12 -12
  53. package/src/commands/audit.js +1166 -1166
  54. package/src/commands/auth.js +375 -366
  55. package/src/commands/chat.js +191 -191
  56. package/src/commands/config.js +184 -184
  57. package/src/commands/cost.js +311 -311
  58. package/src/commands/daemon/core.js +850 -850
  59. package/src/commands/daemon/extended.js +1048 -1048
  60. package/src/commands/daemon/shared.js +213 -213
  61. package/src/commands/daemon.js +11 -11
  62. package/src/commands/guide.js +174 -174
  63. package/src/commands/ingest.js +58 -58
  64. package/src/commands/init.js +55 -55
  65. package/src/commands/legacy-args.js +10 -10
  66. package/src/commands/mcp.js +461 -404
  67. package/src/commands/omargate.js +15 -15
  68. package/src/commands/persona.js +20 -20
  69. package/src/commands/plugin.js +260 -260
  70. package/src/commands/policy.js +132 -132
  71. package/src/commands/prompt.js +238 -238
  72. package/src/commands/review.js +704 -704
  73. package/src/commands/scan.js +866 -788
  74. package/src/commands/spec.js +716 -716
  75. package/src/commands/swarm.js +651 -651
  76. package/src/commands/telemetry.js +202 -202
  77. package/src/commands/watch.js +510 -510
  78. package/src/config/agent-dictionary.js +182 -182
  79. package/src/config/io.js +56 -56
  80. package/src/config/paths.js +18 -18
  81. package/src/config/schema.js +55 -55
  82. package/src/config/service.js +184 -184
  83. package/src/cost/budget.js +235 -235
  84. package/src/cost/history.js +188 -188
  85. package/src/cost/tracker.js +171 -171
  86. package/src/daemon/artifact-lineage.js +534 -534
  87. package/src/daemon/assignment-ledger.js +770 -770
  88. package/src/daemon/ast-parser-layer.js +258 -258
  89. package/src/daemon/budget-governor.js +633 -633
  90. package/src/daemon/callgraph-overlay.js +646 -646
  91. package/src/daemon/error-worker.js +626 -626
  92. package/src/daemon/hybrid-mapper.js +929 -929
  93. package/src/daemon/jira-lifecycle.js +632 -632
  94. package/src/daemon/operator-control.js +657 -657
  95. package/src/daemon/reliability-lane.js +471 -471
  96. package/src/daemon/watchdog.js +971 -971
  97. package/src/guide/generator.js +316 -316
  98. package/src/ingest/engine.js +918 -918
  99. package/src/legacy-cli.js +2548 -2435
  100. package/src/mcp/registry.js +695 -695
  101. package/src/memory/blackboard.js +301 -301
  102. package/src/memory/retrieval.js +581 -581
  103. package/src/plugin/manifest.js +553 -553
  104. package/src/policy/packs.js +144 -144
  105. package/src/prompt/generator.js +118 -106
  106. package/src/review/ai-review.js +669 -669
  107. package/src/review/local-review.js +1284 -1284
  108. package/src/review/replay.js +235 -235
  109. package/src/review/report.js +664 -664
  110. package/src/review/spec-binding.js +487 -487
  111. package/src/scaffold/generator.js +67 -0
  112. package/src/scaffold/templates.js +150 -0
  113. package/src/scan/generator.js +418 -351
  114. package/src/scan/gh-secrets.js +107 -0
  115. package/src/spec/generator.js +519 -519
  116. package/src/spec/regenerate.js +237 -237
  117. package/src/spec/templates.js +91 -91
  118. package/src/swarm/dashboard.js +247 -247
  119. package/src/swarm/factory.js +363 -363
  120. package/src/swarm/pentest.js +934 -934
  121. package/src/swarm/registry.js +419 -419
  122. package/src/swarm/report.js +158 -158
  123. package/src/swarm/runtime.js +576 -576
  124. package/src/swarm/scenario-dsl.js +272 -272
  125. package/src/telemetry/ledger.js +302 -302
  126. package/src/telemetry/sync.js +96 -59
  127. package/src/ui/markdown.js +220 -220
@@ -1,367 +1,367 @@
1
- import { randomUUID } from "node:crypto";
2
- import { createMultiProviderApiClient } from "../../ai/client.js";
3
- import { evaluateBudget } from "../../cost/budget.js";
4
- import { dispatchTool, createAgentContext, BudgetExhaustedError } from "./tools/dispatch.js";
5
- import { JULES_DEFINITION } from "./config/definition.js";
6
- import { shouldSpawnSubAgents, runJulesSwarm } from "./swarm/orchestrator.js";
7
- import { frontendAnalyze } from "./tools/frontend-analyze.js";
8
-
9
- /**
10
- * Jules Tanaka — Agentic Loop
11
- *
12
- * Core state machine: LLM → tool_use → execute → result → LLM → repeat
13
- * With sub-agent swarm integration for large codebases.
14
- *
15
- * This loop is self-contained: it uses the existing ai/client.js for LLM calls,
16
- * the existing cost/budget.js for budget enforcement, and the Jules tool
17
- * dispatch for tool execution. No dependency on Batches O-Q.
18
- */
19
-
20
- const DEFAULT_MAX_TURNS = 25;
21
- const HEARTBEAT_INTERVAL_TURNS = 5;
22
-
23
- /**
24
- * Run Jules' agentic audit loop.
25
- *
26
- * @param {object} config
27
- * @param {string} config.systemPrompt - Jules' full system prompt
28
- * @param {object} config.scopeMap - { primary, secondary, tertiary } file lists
29
- * @param {string} config.rootPath - Codebase root
30
- * @param {object} [config.omarBaseline] - Deterministic baseline findings (if available)
31
- * @param {object} [config.blackboard] - Shared blackboard for cross-agent findings
32
- * @param {object} [config.memory] - Memory index for cross-run recall
33
- * @param {object} [config.budget] - Budget overrides
34
- * @param {object} [config.provider] - LLM provider overrides
35
- * @param {string} [config.mode] - "primary" | "secondary" | "tertiary"
36
- * @param {number} [config.maxTurns] - Max loop iterations
37
- * @param {AbortController} [config.abortController]
38
- * @param {function} [config.onEvent] - Streaming event callback
39
- * @returns {AsyncGenerator<JulesEvent>} Yields events as they occur
40
- */
41
- export async function* julesAuditLoop(config) {
42
- const {
43
- systemPrompt,
44
- scopeMap,
45
- rootPath,
46
- omarBaseline,
47
- blackboard,
48
- memory,
49
- provider,
50
- mode = "primary",
51
- maxTurns = DEFAULT_MAX_TURNS,
52
- abortController,
53
- onEvent,
54
- } = config;
55
-
56
- const budget = { ...JULES_DEFINITION.budget, ...config.budget };
57
- const runId = `jules-${Date.now()}-${randomUUID().slice(0, 8)}`;
58
- const startedAt = Date.now();
59
- const client = createMultiProviderApiClient(provider || {});
60
-
61
- const ctx = createAgentContext({
62
- agentIdentity: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona },
63
- budget,
64
- runId,
65
- onEvent,
66
- });
67
-
68
- const emit = (event, payload) => {
69
- const evt = {
70
- stream: "sl_event",
71
- event,
72
- agent: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona, color: JULES_DEFINITION.color, avatar: JULES_DEFINITION.avatar },
73
- payload,
74
- usage: {
75
- costUsd: ctx.usage.costUsd,
76
- outputTokens: ctx.usage.outputTokens,
77
- toolCalls: ctx.usage.toolCalls,
78
- durationMs: Date.now() - startedAt,
79
- },
80
- };
81
- if (onEvent) onEvent(evt);
82
- return evt;
83
- };
84
-
85
- yield emit("agent_start", { mode, runId, maxTurns, budget });
86
-
87
- // ── Phase 0: Prerequisites ────────────────────────────────────────
88
-
89
- yield emit("progress", { phase: "prerequisites", message: "Detecting framework..." });
90
-
91
- let framework = {};
92
- try {
93
- framework = frontendAnalyze({ operation: "detect_framework", path: rootPath });
94
- ctx.usage.toolCalls++;
95
- yield emit("tool_result", { tool: "FrontendAnalyze", operation: "detect_framework", result: { framework: framework.framework, componentCount: framework.componentCount } });
96
- } catch { /* proceed without */ }
97
-
98
- // ── Phase 1: Swarm or direct? ─────────────────────────────────────
99
-
100
- const spawnDecision = shouldSpawnSubAgents(scopeMap);
101
- let swarmFindings = [];
102
-
103
- if (spawnDecision.spawn && blackboard) {
104
- yield emit("progress", { phase: "swarm", message: `Large frontend (${spawnDecision.reason}). Spawning sub-agents...` });
105
-
106
- const swarmResult = await runJulesSwarm({
107
- scopeMap,
108
- rootPath,
109
- blackboard,
110
- budget: { ...budget, maxCostUsd: budget.maxCostUsd * 0.6 }, // 60% for swarm
111
- provider,
112
- parentAbort: abortController,
113
- onEvent,
114
- });
115
-
116
- swarmFindings = swarmResult.agentResults.flatMap(r => r.findings);
117
- ctx.usage.costUsd += swarmResult.usage.totalCostUsd;
118
- ctx.usage.toolCalls += swarmResult.usage.totalToolCalls;
119
-
120
- yield emit("swarm_complete", {
121
- totalFindings: swarmFindings.length,
122
- totalAgents: swarmResult.usage.totalAgents,
123
- totalCostUsd: swarmResult.usage.totalCostUsd,
124
- });
125
- }
126
-
127
- // ── Phase 2: Jules primary deep analysis (agentic LLM loop) ──────
128
-
129
- yield emit("progress", { phase: "deep_analysis", message: "Starting deep analysis..." });
130
-
131
- // Build context for LLM
132
- const contextParts = [];
133
- contextParts.push(`Framework: ${framework.framework || "unknown"}`);
134
- contextParts.push(`Mode: ${mode}`);
135
- contextParts.push(`Components: ${framework.componentCount || "unknown"}`);
136
- contextParts.push(`Scope: ${(scopeMap.primary || []).length} primary files`);
137
-
138
- if (swarmFindings.length > 0) {
139
- contextParts.push(`\nSub-agent findings (${swarmFindings.length} total):`);
140
- for (const f of swarmFindings.slice(0, 30)) {
141
- contextParts.push(`- [${f.severity || "P3"}] ${f.file || ""}:${f.line || ""} ${f.title || f.type || ""}`);
142
- }
143
- }
144
-
145
- if (omarBaseline) {
146
- const baselineFindings = omarBaseline.findings || omarBaseline.summary || [];
147
- if (Array.isArray(baselineFindings) && baselineFindings.length > 0) {
148
- contextParts.push(`\nOmar baseline findings (${baselineFindings.length}):`);
149
- for (const f of baselineFindings.slice(0, 20)) {
150
- contextParts.push(`- [${f.severity || ""}] ${f.file || ""}:${f.line || ""} ${f.message || f.title || ""}`);
151
- }
152
- }
153
- }
154
-
155
- if (memory) {
156
- try {
157
- const recalled = memory.query ? memory.query({
158
- files: (scopeMap.primary || []).map(f => f.path || f),
159
- limit: 10,
160
- }) : [];
161
- if (recalled.length > 0) {
162
- contextParts.push(`\nPrevious findings recalled from memory (${recalled.length}):`);
163
- for (const r of recalled) {
164
- contextParts.push(`- ${r.content || r.text || JSON.stringify(r).slice(0, 100)}`);
165
- }
166
- }
167
- } catch { /* memory recall failure is non-blocking */ }
168
- }
169
-
170
- const messages = [
171
- { role: "user", content: contextParts.join("\n") +
172
- "\n\nPerform your deep analysis now. Use FileRead, Grep, Glob, and FrontendAnalyze tools as needed. " +
173
- "Return your findings in a ```json code block as an array of { severity, file, line, title, evidence, rootCause, recommendedFix, trafficLight }." },
174
- ];
175
-
176
- const allFindings = [...swarmFindings];
177
- let turnCount = 0;
178
-
179
- while (turnCount < maxTurns) {
180
- if (abortController?.signal.aborted) {
181
- yield emit("agent_abort", { reason: "user_cancelled" });
182
- break;
183
- }
184
-
185
- // Budget check before LLM call
186
- const preCheck = evaluateBudget({
187
- sessionSummary: {
188
- costUsd: ctx.usage.costUsd,
189
- outputTokens: ctx.usage.outputTokens,
190
- durationMs: Date.now() - startedAt,
191
- toolCalls: ctx.usage.toolCalls,
192
- },
193
- ...budget,
194
- });
195
-
196
- if (preCheck.blocking) {
197
- yield emit("budget_stop", { reasons: preCheck.reasons });
198
- break;
199
- }
200
-
201
- if (preCheck.warnings.length > 0) {
202
- yield emit("budget_warning", { warnings: preCheck.warnings });
203
- }
204
-
205
- turnCount++;
206
-
207
- // Heartbeat
208
- if (turnCount % HEARTBEAT_INTERVAL_TURNS === 0) {
209
- yield emit("heartbeat", {
210
- turnsCompleted: turnCount,
211
- turnsMax: maxTurns,
212
- findingsSoFar: allFindings.length,
213
- budgetRemaining: {
214
- costUsd: Math.max(0, budget.maxCostUsd - ctx.usage.costUsd),
215
- pct: Math.max(0, 100 - (ctx.usage.costUsd / budget.maxCostUsd * 100)),
216
- },
217
- });
218
- }
219
-
220
- // Call LLM
221
- let response;
222
- try {
223
- response = await client.invoke({
224
- systemPrompt,
225
- messages,
226
- });
227
- } catch (err) {
228
- yield emit("llm_error", { error: err.message, turn: turnCount });
229
- break;
230
- }
231
-
232
- const responseText = response.text || "";
233
- ctx.usage.outputTokens += Math.ceil(responseText.length / 4);
234
- ctx.usage.costUsd += (Math.ceil(responseText.length / 4) / 1_000_000) * 15;
235
-
236
- yield emit("reasoning", {
237
- phase: "deep_analysis",
238
- turn: turnCount,
239
- summary: responseText.slice(0, 200),
240
- });
241
-
242
- // Parse tool_use blocks
243
- const toolCalls = parseToolUseBlocks(responseText);
244
-
245
- if (toolCalls.length === 0) {
246
- // No tools — extract findings from response
247
- const parsed = extractJsonFindings(responseText);
248
- for (const finding of parsed) {
249
- allFindings.push(finding);
250
- yield emit("finding", { ...finding });
251
- if (blackboard) {
252
- try {
253
- await blackboard.appendEntry({
254
- agentId: JULES_DEFINITION.id,
255
- source: "jules-primary",
256
- ...finding,
257
- });
258
- } catch { /* blackboard write failure non-blocking */ }
259
- }
260
- }
261
- messages.push({ role: "assistant", content: responseText });
262
- break; // LLM is done
263
- }
264
-
265
- // Execute tool calls
266
- const results = [];
267
- for (const call of toolCalls) {
268
- try {
269
- const result = await dispatchTool(call.tool, call.input, ctx);
270
- results.push({ tool: call.tool, result });
271
- yield emit("tool_call", { tool: call.tool, input: sanitizeForEvent(call.input) });
272
- } catch (err) {
273
- if (err instanceof BudgetExhaustedError) {
274
- yield emit("budget_stop", { reason: err.message });
275
- break;
276
- }
277
- results.push({ tool: call.tool, error: err.message });
278
- }
279
- }
280
-
281
- // Feed results back
282
- messages.push({ role: "assistant", content: responseText });
283
- messages.push({
284
- role: "user",
285
- content: results.map(r =>
286
- r.error
287
- ? `Tool ${r.tool} failed: ${r.error}`
288
- : `Tool ${r.tool} result:\n${JSON.stringify(r.result).slice(0, 3000)}`,
289
- ).join("\n\n") + "\n\nContinue your analysis. If done, return findings in a ```json code block.",
290
- });
291
- }
292
-
293
- // ── Phase 3: Build final report ───────────────────────────────────
294
-
295
- const durationMs = Date.now() - startedAt;
296
- const severityCounts = { P0: 0, P1: 0, P2: 0, P3: 0 };
297
- for (const f of allFindings) {
298
- const sev = (f.severity || "P3").toUpperCase();
299
- if (severityCounts[sev] !== undefined) severityCounts[sev]++;
300
- else severityCounts.P3++;
301
- }
302
-
303
- const report = {
304
- runId,
305
- persona: JULES_DEFINITION.persona,
306
- mode,
307
- framework: framework.framework || "unknown",
308
- status: "completed",
309
- findings: allFindings,
310
- summary: {
311
- total: allFindings.length,
312
- ...severityCounts,
313
- blocking: severityCounts.P0 > 0 || severityCounts.P1 > 0,
314
- },
315
- usage: {
316
- turns: turnCount,
317
- costUsd: ctx.usage.costUsd,
318
- outputTokens: ctx.usage.outputTokens,
319
- toolCalls: ctx.usage.toolCalls,
320
- durationMs,
321
- },
322
- signature: JULES_DEFINITION.signature,
323
- };
324
-
325
- yield emit("agent_complete", {
326
- ...report.summary,
327
- costUsd: ctx.usage.costUsd,
328
- durationMs,
329
- turns: turnCount,
330
- });
331
-
332
- return report;
333
- }
334
-
335
- // ── Helpers ──────────────────────────────────────────────────────────
336
-
337
- function parseToolUseBlocks(text) {
338
- const calls = [];
339
- const regex = /```tool_use\s*\n([\s\S]*?)```/g;
340
- let match;
341
- while ((match = regex.exec(text)) !== null) {
342
- try {
343
- const parsed = JSON.parse(match[1].trim());
344
- if (parsed.tool && parsed.input) calls.push(parsed);
345
- } catch { /* skip malformed */ }
346
- }
347
- return calls;
348
- }
349
-
350
- function extractJsonFindings(text) {
351
- const jsonMatch = text.match(/```json\s*\n([\s\S]*?)```/);
352
- if (!jsonMatch) return [];
353
- try {
354
- const parsed = JSON.parse(jsonMatch[1].trim());
355
- if (Array.isArray(parsed)) return parsed;
356
- if (parsed.findings && Array.isArray(parsed.findings)) return parsed.findings;
357
- } catch { /* skip malformed */ }
358
- return [];
359
- }
360
-
361
- function sanitizeForEvent(input) {
362
- const sanitized = { ...input };
363
- if (typeof sanitized.content === "string" && sanitized.content.length > 200) {
364
- sanitized.content = `[${sanitized.content.length} chars]`;
365
- }
366
- return sanitized;
367
- }
1
+ import { randomUUID } from "node:crypto";
2
+ import { createMultiProviderApiClient } from "../../ai/client.js";
3
+ import { evaluateBudget } from "../../cost/budget.js";
4
+ import { dispatchTool, createAgentContext, BudgetExhaustedError } from "./tools/dispatch.js";
5
+ import { JULES_DEFINITION } from "./config/definition.js";
6
+ import { shouldSpawnSubAgents, runJulesSwarm } from "./swarm/orchestrator.js";
7
+ import { frontendAnalyze } from "./tools/frontend-analyze.js";
8
+
9
+ /**
10
+ * Jules Tanaka — Agentic Loop
11
+ *
12
+ * Core state machine: LLM → tool_use → execute → result → LLM → repeat
13
+ * With sub-agent swarm integration for large codebases.
14
+ *
15
+ * This loop is self-contained: it uses the existing ai/client.js for LLM calls,
16
+ * the existing cost/budget.js for budget enforcement, and the Jules tool
17
+ * dispatch for tool execution. No dependency on Batches O-Q.
18
+ */
19
+
// Default cap on LLM turns when config.maxTurns is not supplied.
const DEFAULT_MAX_TURNS = 25;
// A "heartbeat" event is emitted on every N-th turn.
const HEARTBEAT_INTERVAL_TURNS = 5;

/**
 * Run Jules' agentic audit loop.
 *
 * Phases, in order: framework detection, optional sub-agent swarm, the
 * LLM → tool_use → result loop, and final report assembly. Every event is
 * both passed to `config.onEvent` (when provided) and yielded.
 *
 * @param {object} config
 * @param {string} config.systemPrompt - Jules' full system prompt
 * @param {object} config.scopeMap - { primary, secondary, tertiary } file lists
 * @param {string} config.rootPath - Codebase root
 * @param {object} [config.omarBaseline] - Deterministic baseline findings (if available)
 * @param {object} [config.blackboard] - Shared blackboard for cross-agent findings
 * @param {object} [config.memory] - Memory index for cross-run recall
 * @param {object} [config.budget] - Budget overrides (merged over JULES_DEFINITION.budget)
 * @param {object} [config.provider] - LLM provider overrides
 * @param {string} [config.mode] - "primary" | "secondary" | "tertiary"
 * @param {number} [config.maxTurns] - Max loop iterations
 * @param {AbortController} [config.abortController]
 * @param {function} [config.onEvent] - Streaming event callback
 * @returns {AsyncGenerator<JulesEvent>} Yields events as they occur; the
 *   generator's return value is the final report object. `report.stopReason`
 *   tells why the LLM loop ended: "llm_done", "user_cancelled",
 *   "budget_exhausted", "llm_error" or "max_turns".
 */
export async function* julesAuditLoop(config) {
  const {
    systemPrompt,
    scopeMap,
    rootPath,
    omarBaseline,
    blackboard,
    memory,
    provider,
    mode = "primary",
    maxTurns = DEFAULT_MAX_TURNS,
    abortController,
    onEvent,
  } = config;

  const budget = { ...JULES_DEFINITION.budget, ...config.budget };
  const runId = `jules-${Date.now()}-${randomUUID().slice(0, 8)}`;
  const startedAt = Date.now();
  const client = createMultiProviderApiClient(provider || {});

  const ctx = createAgentContext({
    agentIdentity: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona },
    budget,
    runId,
    onEvent,
  });

  // Builds an event envelope with a usage snapshot, forwards it to onEvent,
  // and returns it so the caller can also yield it.
  const emit = (event, payload) => {
    const evt = {
      stream: "sl_event",
      event,
      agent: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona, color: JULES_DEFINITION.color, avatar: JULES_DEFINITION.avatar },
      payload,
      usage: {
        costUsd: ctx.usage.costUsd,
        outputTokens: ctx.usage.outputTokens,
        toolCalls: ctx.usage.toolCalls,
        durationMs: Date.now() - startedAt,
      },
    };
    if (onEvent) onEvent(evt);
    return evt;
  };

  yield emit("agent_start", { mode, runId, maxTurns, budget });

  // ── Phase 0: Prerequisites ────────────────────────────────────────

  yield emit("progress", { phase: "prerequisites", message: "Detecting framework..." });

  let framework = {};
  try {
    framework = frontendAnalyze({ operation: "detect_framework", path: rootPath });
    ctx.usage.toolCalls++;
    yield emit("tool_result", { tool: "FrontendAnalyze", operation: "detect_framework", result: { framework: framework.framework, componentCount: framework.componentCount } });
  } catch { /* proceed without */ }

  // ── Phase 1: Swarm or direct? ─────────────────────────────────────

  const spawnDecision = shouldSpawnSubAgents(scopeMap);
  let swarmFindings = [];

  if (spawnDecision.spawn && blackboard) {
    yield emit("progress", { phase: "swarm", message: `Large frontend (${spawnDecision.reason}). Spawning sub-agents...` });

    const swarmResult = await runJulesSwarm({
      scopeMap,
      rootPath,
      blackboard,
      budget: { ...budget, maxCostUsd: budget.maxCostUsd * 0.6 }, // 60% for swarm
      provider,
      parentAbort: abortController,
      onEvent,
    });

    // An agent result without a findings array must not inject `undefined`
    // entries; they would crash the severity tally in Phase 3.
    swarmFindings = swarmResult.agentResults.flatMap((r) => r.findings || []);
    ctx.usage.costUsd += swarmResult.usage.totalCostUsd;
    ctx.usage.toolCalls += swarmResult.usage.totalToolCalls;

    yield emit("swarm_complete", {
      totalFindings: swarmFindings.length,
      totalAgents: swarmResult.usage.totalAgents,
      totalCostUsd: swarmResult.usage.totalCostUsd,
    });
  }

  // ── Phase 2: Jules primary deep analysis (agentic LLM loop) ──────

  yield emit("progress", { phase: "deep_analysis", message: "Starting deep analysis..." });

  // Build context for LLM
  const contextParts = [];
  contextParts.push(`Framework: ${framework.framework || "unknown"}`);
  contextParts.push(`Mode: ${mode}`);
  contextParts.push(`Components: ${framework.componentCount || "unknown"}`);
  contextParts.push(`Scope: ${(scopeMap.primary || []).length} primary files`);

  if (swarmFindings.length > 0) {
    contextParts.push(`\nSub-agent findings (${swarmFindings.length} total):`);
    for (const f of swarmFindings.slice(0, 30)) {
      contextParts.push(`- [${f.severity || "P3"}] ${f.file || ""}:${f.line || ""} ${f.title || f.type || ""}`);
    }
  }

  if (omarBaseline) {
    const baselineFindings = omarBaseline.findings || omarBaseline.summary || [];
    if (Array.isArray(baselineFindings) && baselineFindings.length > 0) {
      contextParts.push(`\nOmar baseline findings (${baselineFindings.length}):`);
      for (const f of baselineFindings.slice(0, 20)) {
        contextParts.push(`- [${f.severity || ""}] ${f.file || ""}:${f.line || ""} ${f.message || f.title || ""}`);
      }
    }
  }

  if (memory) {
    try {
      // `await` is a no-op for a synchronous result and also supports a
      // promise-returning store, which previously was silently ignored
      // because a Promise has no `length`.
      const recalled = memory.query ? await memory.query({
        files: (scopeMap.primary || []).map((f) => f.path || f),
        limit: 10,
      }) : [];
      if (recalled.length > 0) {
        contextParts.push(`\nPrevious findings recalled from memory (${recalled.length}):`);
        for (const r of recalled) {
          contextParts.push(`- ${r.content || r.text || JSON.stringify(r).slice(0, 100)}`);
        }
      }
    } catch { /* memory recall failure is non-blocking */ }
  }

  const messages = [
    { role: "user", content: contextParts.join("\n") +
      "\n\nPerform your deep analysis now. Use FileRead, Grep, Glob, and FrontendAnalyze tools as needed. " +
      "Return your findings in a ```json code block as an array of { severity, file, line, title, evidence, rootCause, recommendedFix, trafficLight }." },
  ];

  const allFindings = [...swarmFindings];
  let turnCount = 0;
  // Stays "max_turns" when the while condition itself ends the loop.
  let stopReason = "max_turns";

  while (turnCount < maxTurns) {
    if (abortController?.signal.aborted) {
      yield emit("agent_abort", { reason: "user_cancelled" });
      stopReason = "user_cancelled";
      break;
    }

    // Budget check before LLM call
    const preCheck = evaluateBudget({
      sessionSummary: {
        costUsd: ctx.usage.costUsd,
        outputTokens: ctx.usage.outputTokens,
        durationMs: Date.now() - startedAt,
        toolCalls: ctx.usage.toolCalls,
      },
      ...budget,
    });

    if (preCheck.blocking) {
      yield emit("budget_stop", { reasons: preCheck.reasons });
      stopReason = "budget_exhausted";
      break;
    }

    if (preCheck.warnings.length > 0) {
      yield emit("budget_warning", { warnings: preCheck.warnings });
    }

    turnCount++;

    // Heartbeat
    if (turnCount % HEARTBEAT_INTERVAL_TURNS === 0) {
      yield emit("heartbeat", {
        turnsCompleted: turnCount,
        turnsMax: maxTurns,
        findingsSoFar: allFindings.length,
        budgetRemaining: describeRemainingCost(budget.maxCostUsd, ctx.usage.costUsd),
      });
    }

    // Call LLM
    let response;
    try {
      response = await client.invoke({
        systemPrompt,
        messages,
      });
    } catch (err) {
      yield emit("llm_error", { error: err?.message ?? String(err), turn: turnCount });
      stopReason = "llm_error";
      break;
    }

    const responseText = response?.text || "";
    // Usage is estimated, not metered: ~4 characters per token, charged at a
    // flat 15 USD per million estimated tokens.
    const estimatedTokens = Math.ceil(responseText.length / 4);
    ctx.usage.outputTokens += estimatedTokens;
    ctx.usage.costUsd += (estimatedTokens / 1_000_000) * 15;

    yield emit("reasoning", {
      phase: "deep_analysis",
      turn: turnCount,
      summary: responseText.slice(0, 200),
    });

    // Parse tool_use blocks
    const toolCalls = parseToolUseBlocks(responseText);

    if (toolCalls.length === 0) {
      // No tools — extract findings from response
      const parsed = extractJsonFindings(responseText);
      for (const finding of parsed) {
        allFindings.push(finding);
        yield emit("finding", { ...finding });
        if (blackboard) {
          try {
            await blackboard.appendEntry({
              agentId: JULES_DEFINITION.id,
              source: "jules-primary",
              ...finding,
            });
          } catch { /* blackboard write failure non-blocking */ }
        }
      }
      messages.push({ role: "assistant", content: responseText });
      stopReason = "llm_done";
      break; // LLM is done
    }

    // Execute tool calls
    const results = [];
    let budgetExhausted = false;
    for (const call of toolCalls) {
      try {
        const result = await dispatchTool(call.tool, call.input, ctx);
        results.push({ tool: call.tool, result });
        yield emit("tool_call", { tool: call.tool, input: sanitizeForEvent(call.input) });
      } catch (err) {
        if (err instanceof BudgetExhaustedError) {
          yield emit("budget_stop", { reason: err?.message });
          budgetExhausted = true;
          break;
        }
        results.push({ tool: call.tool, error: err?.message ?? String(err) });
      }
    }

    // The `break` above only leaves the tool loop; without this check the
    // turn loop would carry on and could issue another LLM call even though
    // the budget is already spent.
    if (budgetExhausted) {
      stopReason = "budget_exhausted";
      break;
    }

    // Feed results back
    messages.push({ role: "assistant", content: responseText });
    messages.push({
      role: "user",
      content: results.map((r) =>
        // Test key presence, not truthiness: a failure with an empty
        // message is still a failure.
        "error" in r
          ? `Tool ${r.tool} failed: ${r.error}`
          : `Tool ${r.tool} result:\n${stringifyToolResult(r.result)}`,
      ).join("\n\n") + "\n\nContinue your analysis. If done, return findings in a ```json code block.",
    });
  }

  // ── Phase 3: Build final report ───────────────────────────────────

  const durationMs = Date.now() - startedAt;
  const severityCounts = { P0: 0, P1: 0, P2: 0, P3: 0 };
  for (const f of allFindings) {
    // Findings come from LLM output and sub-agents, so severity may be
    // missing or not a string; coerce instead of throwing on toUpperCase().
    const sev = String(f?.severity || "P3").toUpperCase();
    if (severityCounts[sev] !== undefined) severityCounts[sev]++;
    else severityCounts.P3++;
  }

  const report = {
    runId,
    persona: JULES_DEFINITION.persona,
    mode,
    framework: framework.framework || "unknown",
    status: "completed",
    stopReason,
    findings: allFindings,
    summary: {
      total: allFindings.length,
      ...severityCounts,
      blocking: severityCounts.P0 > 0 || severityCounts.P1 > 0,
    },
    usage: {
      turns: turnCount,
      costUsd: ctx.usage.costUsd,
      outputTokens: ctx.usage.outputTokens,
      toolCalls: ctx.usage.toolCalls,
      durationMs,
    },
    signature: JULES_DEFINITION.signature,
  };

  yield emit("agent_complete", {
    ...report.summary,
    costUsd: ctx.usage.costUsd,
    durationMs,
    turns: turnCount,
  });

  return report;
}

// Remaining cost budget for heartbeat events. Reports nulls when no finite
// cap is configured, and never divides by a zero or negative cap.
function describeRemainingCost(maxCostUsd, spentUsd) {
  if (typeof maxCostUsd !== "number" || !Number.isFinite(maxCostUsd)) {
    return { costUsd: null, pct: null };
  }
  return {
    costUsd: Math.max(0, maxCostUsd - spentUsd),
    pct: maxCostUsd > 0 ? Math.max(0, 100 - (spentUsd / maxCostUsd) * 100) : 0,
  };
}

// Serializes a tool result for the follow-up prompt, capped at 3000 chars.
// JSON.stringify returns undefined for `undefined`/functions and throws on
// cycles; both cases fall back to String(value).
function stringifyToolResult(value) {
  let text;
  try {
    text = JSON.stringify(value);
  } catch {
    text = undefined;
  }
  return (text ?? String(value)).slice(0, 3000);
}
334
+
335
+ // ── Helpers ──────────────────────────────────────────────────────────
336
+
/**
 * Extract tool invocations from fenced ```tool_use blocks in an LLM response.
 *
 * Each fence body is parsed as JSON. A call is accepted when `tool` is a
 * non-empty string and `input` is either a plain object or absent. An absent
 * or null `input` is normalized to `{}` so argument-less tool calls are not
 * silently dropped (dropping them made the caller treat the turn as a final
 * answer). Malformed JSON and non-object inputs are skipped.
 *
 * @param {string} text - Raw LLM response text
 * @returns {Array<{tool: string, input: object}>} Calls in order of appearance
 */
function parseToolUseBlocks(text) {
  const calls = [];
  const regex = /```tool_use\s*\n([\s\S]*?)```/g;
  let match;
  while ((match = regex.exec(text)) !== null) {
    let parsed;
    try {
      parsed = JSON.parse(match[1].trim());
    } catch {
      continue; // skip malformed
    }
    if (parsed === null || typeof parsed !== "object") continue;
    if (typeof parsed.tool !== "string" || parsed.tool === "") continue;

    const input = parsed.input ?? {};
    if (typeof input !== "object" || Array.isArray(input)) continue;

    calls.push({ ...parsed, input });
  }
  return calls;
}
349
+
/**
 * Pull the findings array out of an LLM response.
 *
 * Scans every fenced ```json block in order and returns the findings from
 * the first one that parses to either an array or an object with a
 * `findings` array. Earlier fences that are malformed or hold something else
 * no longer hide a later valid one. Entries that are not plain objects
 * (null, strings, numbers, arrays) are removed because callers read
 * properties such as `severity` from each finding.
 *
 * @param {string} text - Raw LLM response text
 * @returns {object[]} Finding objects, or [] when none can be extracted
 */
function extractJsonFindings(text) {
  if (typeof text !== "string") return [];

  const isFinding = (entry) =>
    entry !== null && typeof entry === "object" && !Array.isArray(entry);

  for (const fenced of text.matchAll(/```json\s*\n([\s\S]*?)```/g)) {
    let parsed;
    try {
      parsed = JSON.parse(fenced[1].trim());
    } catch {
      continue; // skip malformed
    }
    if (Array.isArray(parsed)) return parsed.filter(isFinding);
    if (parsed && Array.isArray(parsed.findings)) return parsed.findings.filter(isFinding);
  }
  return [];
}
360
+
/**
 * Produce a shallow copy of a tool input that is safe to put in an event.
 *
 * A string `content` field longer than `maxLength` characters is replaced by
 * a "[N chars]" placeholder. Every other field is copied as-is, and the
 * caller's object is never mutated.
 *
 * @param {object} input - Tool input as parsed from the LLM response
 * @param {number} [maxLength=200] - Longest `content` string passed through verbatim
 * @returns {object} Shallow copy with an oversized `content` summarized
 */
function sanitizeForEvent(input, maxLength = 200) {
  const { content } = input ?? {};
  if (typeof content === "string" && content.length > maxLength) {
    return { ...input, content: `[${content.length} chars]` };
  }
  return { ...input };
}