sentinelayer-cli 0.6.2 → 0.8.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (280) hide show
  1. package/README.md +1009 -996
  2. package/bin/create-sentinelayer.js +5 -5
  3. package/bin/sentinelayer-cli.js +4 -4
  4. package/bin/sl.js +5 -5
  5. package/package.json +64 -63
  6. package/src/agents/ai-governance/index.js +12 -0
  7. package/src/agents/ai-governance/tools/base.js +171 -0
  8. package/src/agents/ai-governance/tools/eval-regression.js +47 -0
  9. package/src/agents/ai-governance/tools/hitl-audit.js +81 -0
  10. package/src/agents/ai-governance/tools/index.js +52 -0
  11. package/src/agents/ai-governance/tools/prompt-drift.js +42 -0
  12. package/src/agents/ai-governance/tools/provenance-check.js +69 -0
  13. package/src/agents/backend/index.js +12 -0
  14. package/src/agents/backend/tools/base.js +189 -0
  15. package/src/agents/backend/tools/circuit-breaker-check.js +123 -0
  16. package/src/agents/backend/tools/idempotency-audit.js +105 -0
  17. package/src/agents/backend/tools/index.js +87 -0
  18. package/src/agents/backend/tools/retry-audit.js +132 -0
  19. package/src/agents/backend/tools/timeout-audit.js +144 -0
  20. package/src/agents/code-quality/index.js +12 -0
  21. package/src/agents/code-quality/tools/base.js +159 -0
  22. package/src/agents/code-quality/tools/complexity-measure.js +197 -0
  23. package/src/agents/code-quality/tools/coupling-analysis.js +81 -0
  24. package/src/agents/code-quality/tools/cycle-detect.js +49 -0
  25. package/src/agents/code-quality/tools/dep-graph.js +196 -0
  26. package/src/agents/code-quality/tools/index.js +89 -0
  27. package/src/agents/data-layer/index.js +12 -0
  28. package/src/agents/data-layer/tools/base.js +181 -0
  29. package/src/agents/data-layer/tools/index-audit.js +165 -0
  30. package/src/agents/data-layer/tools/index.js +83 -0
  31. package/src/agents/data-layer/tools/migration-scan.js +135 -0
  32. package/src/agents/data-layer/tools/query-explain.js +120 -0
  33. package/src/agents/data-layer/tools/tenancy-scan.js +166 -0
  34. package/src/agents/documentation/index.js +12 -0
  35. package/src/agents/documentation/tools/api-diff.js +91 -0
  36. package/src/agents/documentation/tools/base.js +151 -0
  37. package/src/agents/documentation/tools/dead-link-check.js +58 -0
  38. package/src/agents/documentation/tools/docstring-coverage.js +78 -0
  39. package/src/agents/documentation/tools/index.js +52 -0
  40. package/src/agents/documentation/tools/readme-freshness.js +61 -0
  41. package/src/agents/envelope/fix-cycle.js +45 -0
  42. package/src/agents/envelope/index.js +31 -0
  43. package/src/agents/envelope/loop.js +150 -0
  44. package/src/agents/envelope/pulse.js +18 -0
  45. package/src/agents/envelope/stream.js +40 -0
  46. package/src/agents/infrastructure/index.js +12 -0
  47. package/src/agents/infrastructure/tools/base.js +171 -0
  48. package/src/agents/infrastructure/tools/checkov-run.js +32 -0
  49. package/src/agents/infrastructure/tools/drift-detect.js +59 -0
  50. package/src/agents/infrastructure/tools/iam-least-priv-check.js +78 -0
  51. package/src/agents/infrastructure/tools/index.js +52 -0
  52. package/src/agents/infrastructure/tools/tflint-run.js +31 -0
  53. package/src/agents/jules/config/definition.js +160 -160
  54. package/src/agents/jules/config/system-prompt.js +182 -182
  55. package/src/agents/jules/error-intake.js +51 -51
  56. package/src/agents/jules/fix-cycle.js +17 -17
  57. package/src/agents/jules/loop.js +460 -450
  58. package/src/agents/jules/pulse.js +10 -10
  59. package/src/agents/jules/stream.js +187 -186
  60. package/src/agents/jules/swarm/file-scanner.js +74 -74
  61. package/src/agents/jules/swarm/index.js +11 -11
  62. package/src/agents/jules/swarm/orchestrator.js +362 -362
  63. package/src/agents/jules/swarm/pattern-hunter.js +123 -123
  64. package/src/agents/jules/swarm/sub-agent.js +315 -309
  65. package/src/agents/jules/tools/aidenid-email.js +189 -189
  66. package/src/agents/jules/tools/auth-audit.js +1708 -1691
  67. package/src/agents/jules/tools/dispatch.js +340 -335
  68. package/src/agents/jules/tools/file-edit.js +2 -2
  69. package/src/agents/jules/tools/file-read.js +2 -2
  70. package/src/agents/jules/tools/frontend-analyze.js +570 -570
  71. package/src/agents/jules/tools/glob.js +2 -2
  72. package/src/agents/jules/tools/grep.js +2 -2
  73. package/src/agents/jules/tools/index.js +29 -29
  74. package/src/agents/jules/tools/path-guards.js +2 -2
  75. package/src/agents/jules/tools/runtime-audit.js +507 -507
  76. package/src/agents/jules/tools/shell.js +2 -2
  77. package/src/agents/jules/tools/url-policy.js +100 -100
  78. package/src/agents/mode.js +113 -0
  79. package/src/agents/observability/index.js +12 -0
  80. package/src/agents/observability/tools/alert-audit.js +39 -0
  81. package/src/agents/observability/tools/base.js +181 -0
  82. package/src/agents/observability/tools/dashboard-gap.js +42 -0
  83. package/src/agents/observability/tools/index.js +54 -0
  84. package/src/agents/observability/tools/log-schema-check.js +74 -0
  85. package/src/agents/observability/tools/span-coverage.js +74 -0
  86. package/src/agents/persona-visuals.js +102 -61
  87. package/src/agents/release/index.js +12 -0
  88. package/src/agents/release/tools/base.js +181 -0
  89. package/src/agents/release/tools/changelog-diff.js +86 -0
  90. package/src/agents/release/tools/feature-flag-audit.js +126 -0
  91. package/src/agents/release/tools/index.js +61 -0
  92. package/src/agents/release/tools/rollback-verify.js +129 -0
  93. package/src/agents/release/tools/semver-check.js +109 -0
  94. package/src/agents/reliability/index.js +12 -0
  95. package/src/agents/reliability/tools/backpressure-check.js +129 -0
  96. package/src/agents/reliability/tools/base.js +181 -0
  97. package/src/agents/reliability/tools/chaos-probe.js +109 -0
  98. package/src/agents/reliability/tools/graceful-degradation-check.js +114 -0
  99. package/src/agents/reliability/tools/health-check-audit.js +111 -0
  100. package/src/agents/reliability/tools/index.js +87 -0
  101. package/src/agents/run-persona.js +109 -0
  102. package/src/agents/security/index.js +12 -0
  103. package/src/agents/security/tools/authz-audit.js +134 -0
  104. package/src/agents/security/tools/base.js +190 -0
  105. package/src/agents/security/tools/crypto-review.js +175 -0
  106. package/src/agents/security/tools/index.js +97 -0
  107. package/src/agents/security/tools/sast-scan.js +175 -0
  108. package/src/agents/security/tools/secrets-scan.js +216 -0
  109. package/src/agents/shared-tools/dispatch-core.js +320 -315
  110. package/src/agents/shared-tools/file-edit.js +180 -180
  111. package/src/agents/shared-tools/file-read.js +100 -100
  112. package/src/agents/shared-tools/glob.js +168 -168
  113. package/src/agents/shared-tools/grep.js +228 -228
  114. package/src/agents/shared-tools/index.js +46 -46
  115. package/src/agents/shared-tools/path-guards.js +161 -161
  116. package/src/agents/shared-tools/shell.js +383 -383
  117. package/src/agents/supply-chain/index.js +12 -0
  118. package/src/agents/supply-chain/tools/attestation-check.js +42 -0
  119. package/src/agents/supply-chain/tools/base.js +151 -0
  120. package/src/agents/supply-chain/tools/index.js +52 -0
  121. package/src/agents/supply-chain/tools/lockfile-integrity.js +73 -0
  122. package/src/agents/supply-chain/tools/package-verify.js +56 -0
  123. package/src/agents/supply-chain/tools/sbom-diff.js +34 -0
  124. package/src/agents/testing/index.js +12 -0
  125. package/src/agents/testing/tools/base.js +202 -0
  126. package/src/agents/testing/tools/coverage-gap.js +144 -0
  127. package/src/agents/testing/tools/flake-detect.js +125 -0
  128. package/src/agents/testing/tools/index.js +85 -0
  129. package/src/agents/testing/tools/mutation-test.js +143 -0
  130. package/src/agents/testing/tools/snapshot-diff.js +103 -0
  131. package/src/ai/aidenid.js +1021 -1009
  132. package/src/ai/client.js +553 -553
  133. package/src/ai/domain-target-store.js +268 -268
  134. package/src/ai/identity-store.js +270 -270
  135. package/src/ai/proxy.js +137 -137
  136. package/src/ai/site-store.js +145 -145
  137. package/src/audit/agents/architecture.js +180 -180
  138. package/src/audit/agents/compliance.js +179 -179
  139. package/src/audit/agents/documentation.js +165 -165
  140. package/src/audit/agents/performance.js +145 -145
  141. package/src/audit/agents/security.js +215 -215
  142. package/src/audit/agents/testing.js +172 -172
  143. package/src/audit/orchestrator.js +557 -557
  144. package/src/audit/package.js +204 -204
  145. package/src/audit/registry.js +284 -284
  146. package/src/audit/replay.js +103 -103
  147. package/src/auth/gate.js +428 -371
  148. package/src/auth/http.js +681 -611
  149. package/src/auth/service.js +1106 -1106
  150. package/src/auth/session-store.js +813 -813
  151. package/src/cli.js +257 -252
  152. package/src/commands/ai/identity-lifecycle.js +1338 -1338
  153. package/src/commands/ai/provision-governance.js +1272 -1272
  154. package/src/commands/ai/shared.js +147 -147
  155. package/src/commands/ai.js +11 -11
  156. package/src/commands/apply.js +12 -12
  157. package/src/commands/audit.js +1171 -1166
  158. package/src/commands/auth.js +419 -419
  159. package/src/commands/chat.js +184 -191
  160. package/src/commands/config.js +184 -184
  161. package/src/commands/cost.js +311 -311
  162. package/src/commands/daemon/core.js +850 -850
  163. package/src/commands/daemon/extended.js +1048 -1048
  164. package/src/commands/daemon/shared.js +213 -213
  165. package/src/commands/daemon.js +11 -11
  166. package/src/commands/guide.js +174 -174
  167. package/src/commands/ingest.js +58 -58
  168. package/src/commands/init.js +55 -55
  169. package/src/commands/legacy-args.js +20 -10
  170. package/src/commands/mcp.js +461 -461
  171. package/src/commands/omargate.js +63 -29
  172. package/src/commands/persona.js +65 -20
  173. package/src/commands/plugin.js +260 -260
  174. package/src/commands/policy.js +132 -132
  175. package/src/commands/prompt.js +238 -238
  176. package/src/commands/review.js +704 -704
  177. package/src/commands/scan.js +865 -872
  178. package/src/commands/session.js +1238 -0
  179. package/src/commands/spec.js +771 -716
  180. package/src/commands/swarm.js +651 -651
  181. package/src/commands/telemetry.js +202 -202
  182. package/src/commands/watch.js +511 -511
  183. package/src/config/agent-dictionary.js +182 -182
  184. package/src/config/io.js +56 -56
  185. package/src/config/paths.js +18 -18
  186. package/src/config/schema.js +55 -55
  187. package/src/config/service.js +184 -184
  188. package/src/coord/events-log.js +141 -0
  189. package/src/coord/handshake.js +719 -0
  190. package/src/coord/index.js +35 -0
  191. package/src/coord/paths.js +84 -0
  192. package/src/coord/priority.js +62 -0
  193. package/src/coord/tarjan.js +157 -0
  194. package/src/cost/budget.js +235 -235
  195. package/src/cost/history.js +188 -188
  196. package/src/cost/tokenizer.js +160 -0
  197. package/src/cost/tracker.js +232 -171
  198. package/src/daemon/artifact-lineage.js +896 -534
  199. package/src/daemon/assignment-ledger.js +1083 -770
  200. package/src/daemon/ast-drift.js +496 -0
  201. package/src/daemon/ast-parser-layer.js +258 -258
  202. package/src/daemon/budget-governor.js +633 -633
  203. package/src/daemon/callgraph-overlay.js +646 -646
  204. package/src/daemon/error-worker.js +1209 -626
  205. package/src/daemon/fix-cycle.js +384 -377
  206. package/src/daemon/hybrid-mapper.js +929 -929
  207. package/src/daemon/ingest-refresh.js +79 -11
  208. package/src/daemon/jira-lifecycle.js +767 -632
  209. package/src/daemon/operator-control.js +657 -657
  210. package/src/daemon/pulse.js +327 -327
  211. package/src/daemon/reliability-lane.js +471 -471
  212. package/src/daemon/scope-engine.js +1068 -0
  213. package/src/daemon/watchdog.js +971 -971
  214. package/src/events/schema.js +190 -0
  215. package/src/guide/generator.js +316 -316
  216. package/src/ingest/engine.js +933 -918
  217. package/src/ingest/ownership.js +380 -0
  218. package/src/interactive/index.js +97 -97
  219. package/src/legacy-cli.js +3228 -2994
  220. package/src/mcp/registry.js +695 -695
  221. package/src/memory/blackboard.js +301 -301
  222. package/src/memory/retrieval.js +581 -581
  223. package/src/orchestrator/kai-chen.js +126 -0
  224. package/src/plugin/manifest.js +553 -553
  225. package/src/policy/packs.js +144 -144
  226. package/src/prompt/generator.js +136 -118
  227. package/src/review/ai-review.js +672 -679
  228. package/src/review/compliance-pack.js +389 -0
  229. package/src/review/investor-dd-config.js +54 -0
  230. package/src/review/investor-dd-file-loop.js +303 -0
  231. package/src/review/investor-dd-file-router.js +406 -0
  232. package/src/review/investor-dd-html-report.js +233 -0
  233. package/src/review/investor-dd-notification.js +120 -0
  234. package/src/review/investor-dd-orchestrator.js +405 -0
  235. package/src/review/investor-dd-persona-runner.js +275 -0
  236. package/src/review/live-validator.js +253 -0
  237. package/src/review/local-review.js +1351 -1305
  238. package/src/review/omargate-interactive.js +68 -68
  239. package/src/review/omargate-orchestrator.js +492 -300
  240. package/src/review/persona-prompts.js +484 -296
  241. package/src/review/reconciliation-rules.js +329 -0
  242. package/src/review/replay.js +235 -235
  243. package/src/review/report.js +664 -664
  244. package/src/review/reproducibility-chain.js +136 -0
  245. package/src/review/scan-modes.js +147 -42
  246. package/src/review/spec-binding.js +487 -487
  247. package/src/scaffold/generator.js +67 -67
  248. package/src/scaffold/templates.js +150 -150
  249. package/src/scan/generator.js +418 -418
  250. package/src/scan/gh-secrets.js +107 -107
  251. package/src/session/agent-registry.js +359 -0
  252. package/src/session/analytics.js +479 -0
  253. package/src/session/daemon.js +1396 -0
  254. package/src/session/file-locks.js +666 -0
  255. package/src/session/paths.js +37 -0
  256. package/src/session/recap.js +567 -0
  257. package/src/session/redact.js +82 -0
  258. package/src/session/runtime-bridge.js +762 -0
  259. package/src/session/scoring.js +406 -0
  260. package/src/session/setup-guides.js +304 -0
  261. package/src/session/store.js +704 -0
  262. package/src/session/stream.js +333 -0
  263. package/src/session/sync.js +753 -0
  264. package/src/session/tasks.js +1054 -0
  265. package/src/session/templates.js +188 -0
  266. package/src/spec/generator.js +619 -519
  267. package/src/spec/regenerate.js +237 -237
  268. package/src/spec/templates.js +91 -91
  269. package/src/swarm/dashboard.js +247 -247
  270. package/src/swarm/factory.js +363 -363
  271. package/src/swarm/pentest.js +934 -934
  272. package/src/swarm/registry.js +419 -419
  273. package/src/swarm/report.js +158 -158
  274. package/src/swarm/runtime.js +569 -576
  275. package/src/swarm/scenario-dsl.js +272 -272
  276. package/src/telemetry/ledger.js +302 -302
  277. package/src/telemetry/session-tracker.js +234 -234
  278. package/src/telemetry/sync.js +203 -203
  279. package/src/ui/command-hints.js +13 -13
  280. package/src/ui/markdown.js +220 -220
@@ -1,450 +1,460 @@
1
- import { randomUUID } from "node:crypto";
2
- import { createMultiProviderApiClient } from "../../ai/client.js";
3
- import { evaluateBudget } from "../../cost/budget.js";
4
- import { dispatchTool, createAgentContext, BudgetExhaustedError } from "./tools/dispatch.js";
5
- import { JULES_DEFINITION } from "./config/definition.js";
6
- import { shouldSpawnSubAgents, runJulesSwarm } from "./swarm/orchestrator.js";
7
- import { frontendAnalyze } from "./tools/frontend-analyze.js";
8
-
9
- /**
10
- * Jules Tanaka — Agentic Loop
11
- *
12
- * Core state machine: LLM → tool_use → execute → result → LLM → repeat
13
- * With sub-agent swarm integration for large codebases.
14
- *
15
- * This loop is self-contained: it uses the existing ai/client.js for LLM calls,
16
- * the existing cost/budget.js for budget enforcement, and the Jules tool
17
- * dispatch for tool execution. No dependency on Batches O-Q.
18
- */
19
-
20
- const DEFAULT_MAX_TURNS = 25; // Default for config.maxTurns: upper bound on iterations of the LLM/tool loop.
21
- const HEARTBEAT_INTERVAL_TURNS = 5; // A "heartbeat" event is emitted whenever the turn count is a multiple of this value.
22
-
23
/**
 * Run Jules' agentic audit loop.
 *
 * Phases, in order: framework detection, optional sub-agent swarm, the
 * blind-first LLM/tool loop, one reconciliation turn against swarm and
 * baseline findings, and final report assembly. Every event is yielded and,
 * when `config.onEvent` is provided, also passed to that callback.
 *
 * @param {object} config
 * @param {string} config.systemPrompt - Jules' full system prompt
 * @param {object} config.scopeMap - { primary, secondary, tertiary } file lists
 * @param {string} config.rootPath - Codebase root
 * @param {object} [config.omarBaseline] - Deterministic baseline findings (if available)
 * @param {object} [config.blackboard] - Shared blackboard for cross-agent findings
 * @param {object} [config.memory] - Memory index for cross-run recall
 * @param {object} [config.budget] - Budget overrides (merged over JULES_DEFINITION.budget)
 * @param {object} [config.provider] - LLM provider overrides
 * @param {string} [config.mode] - "primary" | "secondary" | "tertiary"
 * @param {number} [config.maxTurns] - Max loop iterations
 * @param {AbortController} [config.abortController]
 * @param {function} [config.onEvent] - Streaming event callback
 * @returns {AsyncGenerator<JulesEvent>} Yields events as they occur; the
 *   generator's return value is the final report object.
 */
export async function* julesAuditLoop(config) {
  const {
    systemPrompt,
    scopeMap,
    rootPath,
    omarBaseline,
    blackboard,
    memory,
    provider,
    mode = "primary",
    maxTurns = DEFAULT_MAX_TURNS,
    abortController,
    onEvent,
  } = config;

  const budget = { ...JULES_DEFINITION.budget, ...config.budget };
  const runId = `jules-${Date.now()}-${randomUUID().slice(0, 8)}`;
  const startedAt = Date.now();
  const client = createMultiProviderApiClient(provider || {});

  const ctx = createAgentContext({
    agentIdentity: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona },
    budget,
    runId,
    onEvent,
  });

  // Build an event envelope with a usage snapshot, push it to onEvent, and
  // return it so the caller can also yield it.
  const emit = (event, payload) => {
    const evt = {
      stream: "sl_event",
      event,
      agent: {
        id: JULES_DEFINITION.id,
        persona: JULES_DEFINITION.persona,
        color: JULES_DEFINITION.color,
        avatar: JULES_DEFINITION.avatar,
      },
      payload,
      usage: {
        costUsd: ctx.usage.costUsd,
        outputTokens: ctx.usage.outputTokens,
        toolCalls: ctx.usage.toolCalls,
        durationMs: Date.now() - startedAt,
      },
    };
    if (onEvent) onEvent(evt);
    return evt;
  };

  // Evaluate the budget against the current usage counters.
  const checkBudget = () => evaluateBudget({
    sessionSummary: {
      costUsd: ctx.usage.costUsd,
      outputTokens: ctx.usage.outputTokens,
      durationMs: Date.now() - startedAt,
      toolCalls: ctx.usage.toolCalls,
    },
    ...budget,
  });

  // Account for one LLM response: ~4 chars per token, 15 USD per million
  // output tokens. The estimate is computed once and reused for both counters.
  const recordOutputUsage = (text) => {
    const estimatedTokens = Math.ceil(text.length / 4);
    ctx.usage.outputTokens += estimatedTokens;
    ctx.usage.costUsd += (estimatedTokens / 1_000_000) * 15;
  };

  // Best-effort blackboard write; a failure must never interrupt the audit.
  const writeToBlackboard = async (finding, source) => {
    if (!blackboard) return;
    try {
      await blackboard.appendEntry({
        agentId: JULES_DEFINITION.id,
        source,
        ...finding,
      });
    } catch { /* blackboard write failure non-blocking */ }
  };

  yield emit("agent_start", { mode, runId, maxTurns, budget });

  // ── Phase 0: Prerequisites ────────────────────────────────────────

  yield emit("progress", { phase: "prerequisites", message: "Detecting framework..." });

  let framework = {};
  try {
    framework = frontendAnalyze({ operation: "detect_framework", path: rootPath });
    ctx.usage.toolCalls++;
    yield emit("tool_result", {
      tool: "FrontendAnalyze",
      operation: "detect_framework",
      result: { framework: framework.framework, componentCount: framework.componentCount },
    });
  } catch { /* proceed without */ }

  // ── Phase 1: Swarm or direct? ─────────────────────────────────────

  const spawnDecision = shouldSpawnSubAgents(scopeMap);
  let swarmFindings = [];

  if (spawnDecision.spawn && blackboard) {
    yield emit("progress", { phase: "swarm", message: `Large frontend (${spawnDecision.reason}). Spawning sub-agents...` });

    const swarmResult = await runJulesSwarm({
      scopeMap,
      rootPath,
      blackboard,
      budget: { ...budget, maxCostUsd: budget.maxCostUsd * 0.6 }, // 60% for swarm
      provider,
      parentAbort: abortController,
      onEvent,
    });

    // A sub-agent result without `findings` contributes nothing, rather than
    // injecting `undefined` into the findings list.
    swarmFindings = swarmResult.agentResults.flatMap((r) => r.findings || []);
    ctx.usage.costUsd += swarmResult.usage.totalCostUsd;
    ctx.usage.toolCalls += swarmResult.usage.totalToolCalls;

    yield emit("swarm_complete", {
      totalFindings: swarmFindings.length,
      totalAgents: swarmResult.usage.totalAgents,
      totalCostUsd: swarmResult.usage.totalCostUsd,
    });
  }

  // ── Phase 2: Jules primary deep analysis (agentic LLM loop) ──────

  yield emit("progress", { phase: "deep_analysis", message: "Starting deep analysis..." });

  // BLIND-FIRST: the initial context holds only codebase metadata and memory
  // recall from past runs. Swarm and baseline findings are introduced only in
  // the reconciliation turn, after the independent analysis has finished.
  const contextParts = [];
  contextParts.push(`Framework: ${framework.framework || "unknown"}`);
  contextParts.push(`Mode: ${mode}`);
  contextParts.push(`Components: ${framework.componentCount || "unknown"}`);
  contextParts.push(`Scope: ${(scopeMap.primary || []).length} primary files`);

  if (memory) {
    try {
      const recalled = memory.query ? memory.query({
        files: (scopeMap.primary || []).map((f) => f.path || f),
        limit: 10,
      }) : [];
      if (recalled.length > 0) {
        contextParts.push(`\nPrevious findings recalled from memory (${recalled.length}):`);
        for (const r of recalled) {
          contextParts.push(`- ${r.content || r.text || JSON.stringify(r).slice(0, 100)}`);
        }
      }
    } catch { /* memory recall failure is non-blocking */ }
  }

  const messages = [
    { role: "user", content: contextParts.join("\n") +
      "\n\nPerform your deep analysis now. Use FileRead, Grep, Glob, and FrontendAnalyze tools as needed. " +
      "Return your findings in a ```json code block as an array of { severity, file, line, title, evidence, rootCause, recommendedFix, trafficLight, reproduction, user_impact, confidence }." },
  ];

  const allFindings = [...swarmFindings];
  let turnCount = 0;

  while (turnCount < maxTurns) {
    if (abortController?.signal.aborted) {
      yield emit("agent_abort", { reason: "user_cancelled" });
      break;
    }

    // Budget check before LLM call
    const preCheck = checkBudget();

    if (preCheck.blocking) {
      yield emit("budget_stop", { reasons: preCheck.reasons });
      break;
    }

    if (preCheck.warnings.length > 0) {
      yield emit("budget_warning", { warnings: preCheck.warnings });
    }

    turnCount++;

    // Heartbeat
    if (turnCount % HEARTBEAT_INTERVAL_TURNS === 0) {
      yield emit("heartbeat", {
        turnsCompleted: turnCount,
        turnsMax: maxTurns,
        findingsSoFar: allFindings.length,
        budgetRemaining: {
          costUsd: Math.max(0, budget.maxCostUsd - ctx.usage.costUsd),
          pct: Math.max(0, 100 - (ctx.usage.costUsd / budget.maxCostUsd * 100)),
        },
      });
    }

    // The client takes a single prompt string, so the system prompt and the
    // message history are flattened on every turn.
    let response;
    try {
      response = await client.invoke({
        prompt: formatPromptForClient(systemPrompt, messages),
      });
    } catch (err) {
      yield emit("llm_error", { error: err.message, turn: turnCount });
      break;
    }

    const responseText = response.text || "";
    recordOutputUsage(responseText);

    yield emit("reasoning", {
      phase: "deep_analysis",
      turn: turnCount,
      summary: responseText.slice(0, 200),
    });

    // Parse tool_use blocks
    const toolCalls = parseToolUseBlocks(responseText);

    if (toolCalls.length === 0) {
      // No tools requested: treat the reply as final and collect its findings.
      for (const finding of extractJsonFindings(responseText)) {
        allFindings.push(finding);
        yield emit("finding", { ...finding });
        await writeToBlackboard(finding, "jules-primary");
      }
      messages.push({ role: "assistant", content: responseText });
      break; // LLM is done
    }

    // Execute tool calls
    const results = [];
    let budgetExhausted = false;
    for (const call of toolCalls) {
      try {
        const result = await dispatchTool(call.tool, call.input, ctx);
        results.push({ tool: call.tool, result });
        yield emit("tool_call", { tool: call.tool, input: sanitizeForEvent(call.input) });
      } catch (err) {
        if (err instanceof BudgetExhaustedError) {
          // `reason` is kept for existing consumers; `reasons` matches the
          // shape of the other budget_stop events.
          yield emit("budget_stop", { reason: err.message, reasons: [err.message] });
          budgetExhausted = true;
          break;
        }
        results.push({ tool: call.tool, error: err.message });
      }
    }

    messages.push({ role: "assistant", content: responseText });

    // Budget exhaustion ends the whole analysis loop, not just this batch of
    // tool calls; otherwise another LLM call could follow the stop event.
    if (budgetExhausted) break;

    // Feed results back. JSON.stringify yields undefined for a tool that
    // returned undefined, so fall back to "null" before slicing.
    const toolFeedback = results
      .map((r) => (r.error
        ? `Tool ${r.tool} failed: ${r.error}`
        : `Tool ${r.tool} result:\n${(JSON.stringify(r.result) ?? "null").slice(0, 3000)}`))
      .join("\n\n");
    messages.push({
      role: "user",
      content: toolFeedback + "\n\nContinue your analysis. If done, return findings in a ```json code block.",
    });
  }

  // ── Phase 2b: Reconciliation (post-blind-pass) ─────────────────────
  // With the independent analysis finished, cross-reference swarm findings
  // and the Omar baseline. The persona formed its own opinion first.

  const hasSwarmContext = swarmFindings.length > 0;
  const baselineFindings = omarBaseline
    ? (omarBaseline.findings || omarBaseline.summary || [])
    : [];
  const hasBaselineContext = Array.isArray(baselineFindings) && baselineFindings.length > 0;
  // A cancelled run must not trigger another LLM call.
  const cancelled = Boolean(abortController?.signal.aborted);

  if ((hasSwarmContext || hasBaselineContext) && !cancelled) {
    yield emit("progress", { phase: "reconciliation", message: "Cross-referencing with sub-agent and baseline findings..." });

    const reconcileParts = [];
    reconcileParts.push("Your independent analysis is complete. Now cross-reference with the following prior findings.");
    reconcileParts.push("For each prior finding: confirm if your analysis agrees, dispute with evidence if you disagree, or flag as missed if you did not cover it.");

    if (hasSwarmContext) {
      reconcileParts.push(`\nYour sub-agents found ${swarmFindings.length} findings:`);
      for (const f of swarmFindings.slice(0, 30)) {
        reconcileParts.push(`- [${f.severity || "P3"}] ${f.file || ""}:${f.line || ""} ${f.title || f.type || ""}`);
      }
    }

    if (hasBaselineContext) {
      reconcileParts.push(`\nOmar baseline reported ${baselineFindings.length} findings:`);
      for (const f of baselineFindings.slice(0, 20)) {
        reconcileParts.push(`- [${f.severity || ""}] ${f.file || ""}:${f.line || ""} ${f.message || f.title || ""}`);
      }
    }

    reconcileParts.push("\nReturn any additional or revised findings as a JSON array in a ```json code block. If no changes, return an empty array [].");

    messages.push({ role: "user", content: reconcileParts.join("\n") });

    // Budget check before reconciliation turn
    const reconcilePreCheck = checkBudget();

    if (!reconcilePreCheck.blocking) {
      try {
        const reconcileResponse = await client.invoke({
          prompt: formatPromptForClient(systemPrompt, messages),
        });

        const reconcileText = reconcileResponse.text || "";
        recordOutputUsage(reconcileText);

        yield emit("reasoning", { phase: "reconciliation", summary: reconcileText.slice(0, 200) });

        for (const finding of extractJsonFindings(reconcileText)) {
          allFindings.push(finding);
          yield emit("finding", { ...finding, source: "reconciliation" });
          await writeToBlackboard(finding, "jules-reconciliation");
        }

        messages.push({ role: "assistant", content: reconcileText });
      } catch (err) {
        yield emit("llm_error", { error: err.message, phase: "reconciliation" });
      }
    } else {
      yield emit("budget_stop", { reasons: reconcilePreCheck.reasons, phase: "reconciliation" });
    }
  }

  // ── Phase 3: Build final report ───────────────────────────────────

  const durationMs = Date.now() - startedAt;
  const severityCounts = { P0: 0, P1: 0, P2: 0, P3: 0 };
  for (const f of allFindings) {
    // Findings come from LLM output: coerce severity to a string so a numeric
    // or missing value is counted as P3 instead of throwing.
    const sev = String(f?.severity || "P3").toUpperCase();
    if (severityCounts[sev] !== undefined) severityCounts[sev]++;
    else severityCounts.P3++;
  }

  const report = {
    runId,
    persona: JULES_DEFINITION.persona,
    mode,
    framework: framework.framework || "unknown",
    status: "completed",
    findings: allFindings,
    summary: {
      total: allFindings.length,
      ...severityCounts,
      blocking: severityCounts.P0 > 0 || severityCounts.P1 > 0,
    },
    usage: {
      turns: turnCount,
      costUsd: ctx.usage.costUsd,
      outputTokens: ctx.usage.outputTokens,
      toolCalls: ctx.usage.toolCalls,
      durationMs,
    },
    signature: JULES_DEFINITION.signature,
  };

  yield emit("agent_complete", {
    ...report.summary,
    costUsd: ctx.usage.costUsd,
    durationMs,
    turns: turnCount,
  });

  return report;
}
403
-
404
- // ── Helpers ──────────────────────────────────────────────────────────
405
-
406
/**
 * Collect tool invocations from ```tool_use fenced blocks in an LLM reply.
 *
 * Each fence body is parsed as JSON. Only values with a truthy `tool` and a
 * truthy `input` are kept; malformed bodies are skipped silently.
 *
 * @param {string} text - Raw LLM response text
 * @returns {Array<object>} Parsed tool-call objects, in order of appearance
 */
function parseToolUseBlocks(text) {
  const fencePattern = /```tool_use\s*\n([\s\S]*?)```/g;

  // Decode one fence body; null stands for "unparseable".
  const decode = (body) => {
    try {
      return JSON.parse(body.trim());
    } catch {
      return null;
    }
  };

  return Array.from(String(text).matchAll(fencePattern), ([, body]) => decode(body))
    .filter((candidate) => Boolean(candidate && candidate.tool && candidate.input));
}
418
-
419
/**
 * Extract findings from the first ```json fenced block in an LLM reply.
 *
 * Accepts either a top-level JSON array or an object with a `findings` array.
 * Because the content is model output, anything that is not a plain object
 * (null, strings, numbers, nested arrays) is dropped so that callers can read
 * properties such as `severity` and spread each finding safely.
 *
 * @param {string} text - Raw LLM response text
 * @returns {Array<object>} Finding objects; empty when there is no block, the
 *   JSON is malformed, or no findings array is present
 */
function extractJsonFindings(text) {
  if (typeof text !== "string") return [];

  const jsonMatch = text.match(/```json\s*\n([\s\S]*?)```/);
  if (!jsonMatch) return [];

  let parsed;
  try {
    parsed = JSON.parse(jsonMatch[1].trim());
  } catch {
    // Malformed JSON from the model is treated as "no findings".
    return [];
  }

  const candidates = Array.isArray(parsed) ? parsed : parsed?.findings;
  if (!Array.isArray(candidates)) return [];

  return candidates.filter(
    (entry) => entry !== null && typeof entry === "object" && !Array.isArray(entry),
  );
}
429
-
430
/**
 * Produce a shallow copy of a tool input that is safe to attach to an event.
 *
 * A string `content` field longer than 200 characters is replaced by a
 * "[N chars]" placeholder; every other field is copied unchanged. The caller's
 * object is never mutated.
 *
 * @param {object} input - Tool input as requested by the LLM
 * @returns {object} Shallow copy with oversized `content` summarized
 */
function sanitizeForEvent(input) {
  const MAX_INLINE_CHARS = 200;
  const snapshot = { ...input };
  const { content } = snapshot;

  if (typeof content !== "string" || content.length <= MAX_INLINE_CHARS) {
    return snapshot;
  }
  return { ...snapshot, content: `[${content.length} chars]` };
}
437
-
438
/**
 * Flatten a system prompt and a chat history into one prompt string, since
 * MultiProviderApiClient exposes a completions-style API.
 *
 * Each message becomes "\nROLE:\ncontent", where ROLE is ASSISTANT for
 * assistant messages and USER for everything else. Segments are joined with
 * a newline; a falsy system prompt is omitted.
 *
 * @param {string} systemPrompt - Leading instructions (may be empty)
 * @param {Array<{role: string, content: string}>} messages - Conversation so far
 * @returns {string} The combined prompt
 */
function formatPromptForClient(systemPrompt, messages) {
  const speakerLabel = (role) => (role === "assistant" ? "ASSISTANT" : "USER");
  const renderedTurns = [...messages].map(
    (turn) => `\n${speakerLabel(turn.role)}:\n${turn.content}`,
  );
  const preamble = systemPrompt ? [systemPrompt] : [];
  return preamble.concat(renderedTurns).join("\n");
}
1
+ import { randomUUID } from "node:crypto";
2
+ import { createMultiProviderApiClient } from "../../ai/client.js";
3
+ import { evaluateBudget } from "../../cost/budget.js";
4
+ import { estimateTokens } from "../../cost/tokenizer.js";
5
+ import { dispatchTool, createAgentContext, BudgetExhaustedError } from "./tools/dispatch.js";
6
+ import { JULES_DEFINITION } from "./config/definition.js";
7
+ import { shouldSpawnSubAgents, runJulesSwarm } from "./swarm/orchestrator.js";
8
+ import { frontendAnalyze } from "./tools/frontend-analyze.js";
9
+ import { createAgentEvent } from "../../events/schema.js";
10
+
11
+ /**
12
+ * Jules Tanaka Agentic Loop
13
+ *
14
+ * Core state machine: LLM → tool_use → execute → result → LLM → repeat
15
+ * With sub-agent swarm integration for large codebases.
16
+ *
17
+ * This loop is self-contained: it uses the existing ai/client.js for LLM calls,
18
+ * the existing cost/budget.js for budget enforcement, and the Jules tool
19
+ * dispatch for tool execution. No dependency on Batches O-Q.
20
+ */
21
+
22
// Default for `config.maxTurns`: the analysis loop stops after this many iterations.
const DEFAULT_MAX_TURNS = 25;
// A "heartbeat" progress event is emitted whenever the turn count is a multiple of this.
const HEARTBEAT_INTERVAL_TURNS = 5;
24
+
25
/**
 * Run Jules' agentic audit loop.
 *
 * Phases, in order:
 *   0. Framework detection via `frontendAnalyze` (best effort).
 *   1. Optional sub-agent swarm when `shouldSpawnSubAgents` says so and a
 *      blackboard is available.
 *   2. Blind-first LLM loop: call the model, execute any `tool_use` blocks,
 *      feed the results back, repeat until the model answers without tools,
 *      the turn limit is hit, the budget blocks, or the run is aborted.
 *   2b. One reconciliation turn against swarm / Omar baseline findings.
 *   3. Build and return the final report.
 *
 * Every event is both passed to `config.onEvent` (when provided) and yielded.
 *
 * @param {object} config
 * @param {string} config.systemPrompt - Jules' full system prompt
 * @param {object} config.scopeMap - { primary, secondary, tertiary } file lists
 * @param {string} config.rootPath - Codebase root
 * @param {object} [config.omarBaseline] - Deterministic baseline findings (if available)
 * @param {object} [config.blackboard] - Shared blackboard for cross-agent findings
 * @param {object} [config.memory] - Memory index for cross-run recall
 * @param {object} [config.budget] - Budget overrides (merged over JULES_DEFINITION.budget)
 * @param {object} [config.provider] - LLM provider overrides
 * @param {string} [config.mode] - "primary" | "secondary" | "tertiary"
 * @param {number} [config.maxTurns] - Max loop iterations
 * @param {AbortController} [config.abortController]
 * @param {function} [config.onEvent] - Streaming event callback
 * @returns {AsyncGenerator<JulesEvent>} Yields events as they occur; the
 *   generator's return value is the final report object.
 */
export async function* julesAuditLoop(config) {
  const {
    systemPrompt,
    scopeMap,
    rootPath,
    omarBaseline,
    blackboard,
    memory,
    provider,
    mode = "primary",
    maxTurns = DEFAULT_MAX_TURNS,
    abortController,
    onEvent,
  } = config;

  const budget = { ...JULES_DEFINITION.budget, ...config.budget };
  const runId = `jules-${Date.now()}-${randomUUID().slice(0, 8)}`;
  const startedAt = Date.now();
  const client = createMultiProviderApiClient(provider || {});

  const ctx = createAgentContext({
    agentIdentity: { id: JULES_DEFINITION.id, persona: JULES_DEFINITION.persona },
    budget,
    runId,
    onEvent,
  });

  // Build an event, push it to the callback (if any) and hand it back so the
  // caller can also `yield` it.
  const emit = (event, payload) => {
    const evt = createAgentEvent({
      event,
      agent: {
        id: JULES_DEFINITION.id,
        persona: JULES_DEFINITION.persona,
        color: JULES_DEFINITION.color,
        avatar: JULES_DEFINITION.avatar,
      },
      payload,
      usage: {
        costUsd: ctx.usage.costUsd,
        outputTokens: ctx.usage.outputTokens,
        toolCalls: ctx.usage.toolCalls,
        durationMs: Date.now() - startedAt,
      },
      runId,
      sessionId: ctx.sessionId,
    });
    if (onEvent) onEvent(evt);
    return evt;
  };

  // Evaluate the budget against the usage accumulated so far.
  const checkBudget = () =>
    evaluateBudget({
      sessionSummary: {
        costUsd: ctx.usage.costUsd,
        outputTokens: ctx.usage.outputTokens,
        durationMs: Date.now() - startedAt,
        toolCalls: ctx.usage.toolCalls,
      },
      ...budget,
    });

  // Account for one LLM reply. Cost is an estimate derived from output tokens
  // only, at a hard-coded 15 USD per million tokens.
  const recordLlmOutput = (text) => {
    const tokens = estimateTokens(text, { provider: "anthropic" });
    ctx.usage.outputTokens += tokens;
    ctx.usage.costUsd += (tokens / 1_000_000) * 15;
  };

  // Best-effort blackboard write; a failure must never interrupt the audit.
  const writeToBlackboard = async (source, finding) => {
    if (!blackboard) return;
    try {
      await blackboard.appendEntry({
        agentId: JULES_DEFINITION.id,
        source,
        ...finding,
      });
    } catch { /* blackboard write failure non-blocking */ }
  };

  // The model's JSON may contain nulls or scalars; only objects are findings.
  const isFindingObject = (value) => value !== null && typeof value === "object";

  // JSON.stringify returns undefined for `undefined` and throws on cycles;
  // neither may take down the loop, so degrade to a placeholder string.
  const serializeToolResult = (value) => {
    let json;
    try {
      json = JSON.stringify(value);
    } catch (err) {
      return `[unserializable result: ${err.message}]`;
    }
    return (json ?? "null").slice(0, 3000);
  };

  yield emit("agent_start", { mode, runId, maxTurns, budget });

  // ── Phase 0: Prerequisites ────────────────────────────────────────

  yield emit("progress", { phase: "prerequisites", message: "Detecting framework..." });

  let framework = {};
  try {
    framework = frontendAnalyze({ operation: "detect_framework", path: rootPath });
    ctx.usage.toolCalls++;
    yield emit("tool_result", { tool: "FrontendAnalyze", operation: "detect_framework", result: { framework: framework.framework, componentCount: framework.componentCount } });
  } catch { /* proceed without */ }

  // ── Phase 1: Swarm or direct? ─────────────────────────────────────

  const spawnDecision = shouldSpawnSubAgents(scopeMap);
  let swarmFindings = [];

  if (spawnDecision.spawn && blackboard) {
    yield emit("progress", { phase: "swarm", message: `Large frontend (${spawnDecision.reason}). Spawning sub-agents...` });

    const swarmResult = await runJulesSwarm({
      scopeMap,
      rootPath,
      blackboard,
      budget: { ...budget, maxCostUsd: budget.maxCostUsd * 0.6 }, // 60% for swarm
      provider,
      parentAbort: abortController,
      onEvent,
    });

    // A sub-agent result without a findings array contributes nothing,
    // instead of injecting `undefined` into the list.
    swarmFindings = swarmResult.agentResults.flatMap((r) => r.findings || []);
    ctx.usage.costUsd += swarmResult.usage.totalCostUsd;
    ctx.usage.toolCalls += swarmResult.usage.totalToolCalls;

    yield emit("swarm_complete", {
      totalFindings: swarmFindings.length,
      totalAgents: swarmResult.usage.totalAgents,
      totalCostUsd: swarmResult.usage.totalCostUsd,
    });
  }

  // ── Phase 2: Jules primary deep analysis (agentic LLM loop) ──────

  yield emit("progress", { phase: "deep_analysis", message: "Starting deep analysis..." });

  // Build context for LLM — BLIND-FIRST: no Omar baseline or swarm findings
  // in the initial context. Only codebase metadata and memory recall (past runs,
  // not current-run findings). Swarm/baseline reconciliation happens AFTER the
  // independent deep analysis completes.
  const contextParts = [];
  contextParts.push(`Framework: ${framework.framework || "unknown"}`);
  contextParts.push(`Mode: ${mode}`);
  contextParts.push(`Components: ${framework.componentCount || "unknown"}`);
  contextParts.push(`Scope: ${(scopeMap.primary || []).length} primary files`);

  if (memory) {
    try {
      // `await` is a no-op for a synchronous query and makes a promise-returning
      // one work instead of being silently ignored.
      const recalled = memory.query ? await memory.query({
        files: (scopeMap.primary || []).map((f) => f.path || f),
        limit: 10,
      }) : [];
      if (recalled.length > 0) {
        contextParts.push(`\nPrevious findings recalled from memory (${recalled.length}):`);
        for (const r of recalled) {
          contextParts.push(`- ${r.content || r.text || JSON.stringify(r).slice(0, 100)}`);
        }
      }
    } catch { /* memory recall failure is non-blocking */ }
  }

  const messages = [
    { role: "user", content: contextParts.join("\n") +
      "\n\nPerform your deep analysis now. Use FileRead, Grep, Glob, and FrontendAnalyze tools as needed. " +
      "Return your findings in a ```json code block as an array of { severity, file, line, title, evidence, rootCause, recommendedFix, trafficLight, reproduction, user_impact, confidence }." },
  ];

  const allFindings = [...swarmFindings];
  let turnCount = 0;

  while (turnCount < maxTurns) {
    if (abortController?.signal.aborted) {
      yield emit("agent_abort", { reason: "user_cancelled" });
      break;
    }

    // Budget check before LLM call
    const preCheck = checkBudget();

    if (preCheck.blocking) {
      yield emit("budget_stop", { reasons: preCheck.reasons });
      break;
    }

    if (preCheck.warnings.length > 0) {
      yield emit("budget_warning", { warnings: preCheck.warnings });
    }

    turnCount++;

    // Heartbeat
    if (turnCount % HEARTBEAT_INTERVAL_TURNS === 0) {
      const maxCost = budget.maxCostUsd;
      // Without a positive cost cap the remaining budget is reported as 0
      // rather than NaN.
      const hasCostCap = Number.isFinite(maxCost) && maxCost > 0;
      yield emit("heartbeat", {
        turnsCompleted: turnCount,
        turnsMax: maxTurns,
        findingsSoFar: allFindings.length,
        budgetRemaining: {
          costUsd: hasCostCap ? Math.max(0, maxCost - ctx.usage.costUsd) : 0,
          pct: hasCostCap ? Math.max(0, 100 - (ctx.usage.costUsd / maxCost) * 100) : 0,
        },
      });
    }

    // Call LLM — format system prompt + messages into a single prompt
    // for the MultiProviderApiClient which uses a completions-style API
    let response;
    try {
      response = await client.invoke({
        prompt: formatPromptForClient(systemPrompt, messages),
      });
    } catch (err) {
      yield emit("llm_error", { error: err.message, turn: turnCount });
      break;
    }

    const responseText = response.text || "";
    recordLlmOutput(responseText);

    yield emit("reasoning", {
      phase: "deep_analysis",
      turn: turnCount,
      summary: responseText.slice(0, 200),
    });

    // Parse tool_use blocks
    const toolCalls = parseToolUseBlocks(responseText);

    if (toolCalls.length === 0) {
      // No tools — extract findings from response
      for (const finding of extractJsonFindings(responseText)) {
        if (!isFindingObject(finding)) continue;
        allFindings.push(finding);
        yield emit("finding", { ...finding });
        await writeToBlackboard("jules-primary", finding);
      }
      messages.push({ role: "assistant", content: responseText });
      break; // LLM is done
    }

    // Execute tool calls
    const results = [];
    let budgetExhausted = false;
    for (const call of toolCalls) {
      try {
        const result = await dispatchTool(call.tool, call.input, ctx);
        results.push({ tool: call.tool, result });
        yield emit("tool_call", { tool: call.tool, input: sanitizeForEvent(call.input) });
      } catch (err) {
        if (err instanceof BudgetExhaustedError) {
          yield emit("budget_stop", { reason: err.message });
          budgetExhausted = true;
          break;
        }
        results.push({ tool: call.tool, error: err.message });
      }
    }

    // Feed results back
    messages.push({ role: "assistant", content: responseText });
    messages.push({
      role: "user",
      content: results.map((r) =>
        r.error
          ? `Tool ${r.tool} failed: ${r.error}`
          : `Tool ${r.tool} result:\n${serializeToolResult(r.result)}`,
      ).join("\n\n") + "\n\nContinue your analysis. If done, return findings in a ```json code block.",
    });

    // The tool layer reported an exhausted budget: end the analysis loop too,
    // not only the tool batch.
    if (budgetExhausted) break;
  }

  // ── Phase 2b: Reconciliation (post-blind-pass) ─────────────────────
  // Now that the independent analysis is complete, cross-reference with
  // swarm findings and Omar baseline. This preserves blind-first: the
  // persona formed its own opinion before seeing prior conclusions.

  const hasSwarmContext = swarmFindings.length > 0;
  const baselineFindings = omarBaseline
    ? (omarBaseline.findings || omarBaseline.summary || [])
    : [];
  const hasBaselineContext = Array.isArray(baselineFindings) && baselineFindings.length > 0;

  if (hasSwarmContext || hasBaselineContext) {
    yield emit("progress", { phase: "reconciliation", message: "Cross-referencing with sub-agent and baseline findings..." });

    const reconcileParts = [];
    reconcileParts.push("Your independent analysis is complete. Now cross-reference with the following prior findings.");
    reconcileParts.push("For each prior finding: confirm if your analysis agrees, dispute with evidence if you disagree, or flag as missed if you did not cover it.");

    if (hasSwarmContext) {
      reconcileParts.push(`\nYour sub-agents found ${swarmFindings.length} findings:`);
      for (const f of swarmFindings.slice(0, 30)) {
        reconcileParts.push(`- [${f.severity || "P3"}] ${f.file || ""}:${f.line || ""} ${f.title || f.type || ""}`);
      }
    }

    if (hasBaselineContext) {
      reconcileParts.push(`\nOmar baseline reported ${baselineFindings.length} findings:`);
      for (const f of baselineFindings.slice(0, 20)) {
        reconcileParts.push(`- [${f.severity || ""}] ${f.file || ""}:${f.line || ""} ${f.message || f.title || ""}`);
      }
    }

    reconcileParts.push("\nReturn any additional or revised findings as a JSON array in a ```json code block. If no changes, return an empty array [].");

    messages.push({ role: "user", content: reconcileParts.join("\n") });

    // Budget check before reconciliation turn
    const reconcilePreCheck = checkBudget();

    if (!reconcilePreCheck.blocking) {
      try {
        const reconcileResponse = await client.invoke({
          prompt: formatPromptForClient(systemPrompt, messages),
        });

        const reconcileText = reconcileResponse.text || "";
        recordLlmOutput(reconcileText);

        yield emit("reasoning", { phase: "reconciliation", summary: reconcileText.slice(0, 200) });

        for (const finding of extractJsonFindings(reconcileText)) {
          if (!isFindingObject(finding)) continue;
          allFindings.push(finding);
          yield emit("finding", { ...finding, source: "reconciliation" });
          await writeToBlackboard("jules-reconciliation", finding);
        }

        messages.push({ role: "assistant", content: reconcileText });
      } catch (err) {
        yield emit("llm_error", { error: err.message, phase: "reconciliation" });
      }
    } else {
      yield emit("budget_stop", { reasons: reconcilePreCheck.reasons, phase: "reconciliation" });
    }
  }

  // ── Phase 3: Build final report ───────────────────────────────────

  const durationMs = Date.now() - startedAt;
  const severityCounts = { P0: 0, P1: 0, P2: 0, P3: 0 };
  for (const f of allFindings) {
    // Severity comes from LLM / sub-agent output: tolerate missing entries and
    // non-string values; anything unrecognised is counted as P3.
    const sev = String(f?.severity || "P3").toUpperCase();
    if (Object.hasOwn(severityCounts, sev)) severityCounts[sev]++;
    else severityCounts.P3++;
  }

  const report = {
    runId,
    persona: JULES_DEFINITION.persona,
    mode,
    framework: framework.framework || "unknown",
    status: "completed",
    findings: allFindings,
    summary: {
      total: allFindings.length,
      ...severityCounts,
      blocking: severityCounts.P0 > 0 || severityCounts.P1 > 0,
    },
    usage: {
      turns: turnCount,
      costUsd: ctx.usage.costUsd,
      outputTokens: ctx.usage.outputTokens,
      toolCalls: ctx.usage.toolCalls,
      durationMs,
    },
    signature: JULES_DEFINITION.signature,
  };

  yield emit("agent_complete", {
    ...report.summary,
    costUsd: ctx.usage.costUsd,
    durationMs,
    turns: turnCount,
  });

  return report;
}
413
+
414
+ // ── Helpers ──────────────────────────────────────────────────────────
415
+
416
/**
 * Pull tool invocations out of an LLM reply.
 *
 * Scans for fenced blocks tagged `tool_use`, parses each body as JSON and
 * keeps those that have both a truthy `tool` and a truthy `input`. Bodies
 * that are not valid JSON are skipped.
 *
 * @param {string} text - Raw LLM response text.
 * @returns {object[]} Parsed tool calls, in document order.
 */
function parseToolUseBlocks(text) {
  const fencePattern = /```tool_use\s*\n([\s\S]*?)```/g;
  const toolCalls = [];

  for (const [, body] of String(text).matchAll(fencePattern)) {
    try {
      const candidate = JSON.parse(body.trim());
      const usable = Boolean(candidate.tool) && Boolean(candidate.input);
      if (usable) {
        toolCalls.push(candidate);
      }
    } catch {
      // skip malformed
    }
  }

  return toolCalls;
}
428
+
429
/**
 * Read findings from the first fenced `json` block of an LLM reply.
 *
 * The block may hold a JSON array (returned as-is) or an object whose
 * `findings` property is an array (that array is returned). A missing
 * block, invalid JSON or any other shape gives `[]`.
 *
 * @param {string} text - Raw LLM response text.
 * @returns {Array} Extracted findings, possibly empty.
 */
function extractJsonFindings(text) {
  const NONE = [];
  const located = text.match(/```json\s*\n([\s\S]*?)```/);
  if (located === null) return NONE;

  const [, rawJson] = located;
  try {
    const decoded = JSON.parse(rawJson.trim());
    if (Array.isArray(decoded)) {
      return decoded;
    }
    const nested = decoded.findings;
    if (nested && Array.isArray(nested)) {
      return nested;
    }
  } catch {
    // skip malformed
  }
  return NONE;
}
439
+
440
/**
 * Shallow-copy a tool input for inclusion in an event payload.
 *
 * When the copy has a string `content` longer than 200 characters, that
 * value is swapped for a `[<length> chars]` marker. The original object is
 * left untouched.
 *
 * @param {object} input - Tool input to copy.
 * @returns {object} The trimmed copy.
 */
function sanitizeForEvent(input) {
  const MAX_INLINE_CHARS = 200;
  const trimmed = { ...input };
  const { content } = trimmed;

  if (typeof content !== "string") return trimmed;
  if (content.length <= MAX_INLINE_CHARS) return trimmed;

  trimmed.content = `[${content.length} chars]`;
  return trimmed;
}
447
+
448
/**
 * Render a system prompt plus chat messages as a single prompt string.
 *
 * Every message is written as "\nROLE:\ncontent", with ROLE being
 * "ASSISTANT" for `role === "assistant"` and "USER" otherwise. The pieces
 * are joined by newlines, led by the system prompt when it is truthy.
 *
 * @param {string} systemPrompt - Optional system prompt placed first.
 * @param {Array<{role: string, content: string}>} messages - Conversation so far.
 * @returns {string} The flattened prompt.
 */
function formatPromptForClient(systemPrompt, messages) {
  const turns = [...messages].map((msg) => {
    const speaker = msg.role === "assistant" ? "ASSISTANT" : "USER";
    return `\n${speaker}:\n${msg.content}`;
  });
  const sections = systemPrompt ? [systemPrompt, ...turns] : turns;
  return sections.join("\n");
}