scai 0.1.178 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (770)
  1. package/README.md +162 -267
  2. package/dist/__tests__/CommitSuggesterCmd.test.js +112 -0
  3. package/dist/__tests__/CommitSuggesterCmd.test.js.map +1 -0
  4. package/dist/__tests__/EvalReportCmd.test.js +645 -0
  5. package/dist/__tests__/EvalReportCmd.test.js.map +1 -0
  6. package/dist/__tests__/ModelCmd.test.js +64 -0
  7. package/dist/__tests__/ModelCmd.test.js.map +1 -0
  8. package/dist/__tests__/agents/agentActions.test.js +345 -0
  9. package/dist/__tests__/agents/agentActions.test.js.map +1 -0
  10. package/dist/__tests__/agents/agentFeedback.test.js +118 -0
  11. package/dist/__tests__/agents/agentFeedback.test.js.map +1 -0
  12. package/dist/__tests__/agents/agentGeneralScope.test.js +74 -0
  13. package/dist/__tests__/agents/agentGeneralScope.test.js.map +1 -0
  14. package/dist/__tests__/agents/agentLoop.test.js +1723 -0
  15. package/dist/__tests__/agents/agentLoop.test.js.map +1 -0
  16. package/dist/__tests__/agents/agentPolicyState.test.js +948 -0
  17. package/dist/__tests__/agents/agentPolicyState.test.js.map +1 -0
  18. package/dist/__tests__/agents/agentReadEvidence.test.js +170 -0
  19. package/dist/__tests__/agents/agentReadEvidence.test.js.map +1 -0
  20. package/dist/__tests__/agents/agentReadPersistence.test.js +129 -0
  21. package/dist/__tests__/agents/agentReadPersistence.test.js.map +1 -0
  22. package/dist/__tests__/agents/agentResumeCheckpoint.test.js +90 -0
  23. package/dist/__tests__/agents/agentResumeCheckpoint.test.js.map +1 -0
  24. package/dist/__tests__/agents/agentSearchBatchPlanner.test.js +289 -0
  25. package/dist/__tests__/agents/agentSearchBatchPlanner.test.js.map +1 -0
  26. package/dist/__tests__/agents/agentSearchOwnership.test.js +166 -0
  27. package/dist/__tests__/agents/agentSearchOwnership.test.js.map +1 -0
  28. package/dist/__tests__/agents/agentSearchRanking.test.js +139 -0
  29. package/dist/__tests__/agents/agentSearchRanking.test.js.map +1 -0
  30. package/dist/__tests__/agents/agentSearchRouting.test.js +584 -0
  31. package/dist/__tests__/agents/agentSearchRouting.test.js.map +1 -0
  32. package/dist/__tests__/agents/agentSearchScoring.test.js +23 -0
  33. package/dist/__tests__/agents/agentSearchScoring.test.js.map +1 -0
  34. package/dist/__tests__/agents/agentSearchShared.test.js +78 -0
  35. package/dist/__tests__/agents/agentSearchShared.test.js.map +1 -0
  36. package/dist/__tests__/agents/agentStateMachine.test.js +58 -0
  37. package/dist/__tests__/agents/agentStateMachine.test.js.map +1 -0
  38. package/dist/__tests__/agents/agentTaskPersistence.test.js +156 -0
  39. package/dist/__tests__/agents/agentTaskPersistence.test.js.map +1 -0
  40. package/dist/__tests__/agents/agentTools.test.js +69 -0
  41. package/dist/__tests__/agents/agentTools.test.js.map +1 -0
  42. package/dist/__tests__/agents/agentTransform.test.js +779 -0
  43. package/dist/__tests__/agents/agentTransform.test.js.map +1 -0
  44. package/dist/__tests__/agents/analysisPlanGenStep.test.js +157 -0
  45. package/dist/__tests__/agents/analysisPlanGenStep.test.js.map +1 -0
  46. package/dist/__tests__/agents/answerOnlyCompletion.test.js +75 -0
  47. package/dist/__tests__/agents/answerOnlyCompletion.test.js.map +1 -0
  48. package/dist/__tests__/agents/decideNextAction.test.js +1662 -0
  49. package/dist/__tests__/agents/decideNextAction.test.js.map +1 -0
  50. package/dist/__tests__/agents/deriveFocusFromSearchStep.test.js +258 -0
  51. package/dist/__tests__/agents/deriveFocusFromSearchStep.test.js.map +1 -0
  52. package/dist/__tests__/agents/evidenceVerifierStep.test.js +113 -0
  53. package/dist/__tests__/agents/evidenceVerifierStep.test.js.map +1 -0
  54. package/dist/__tests__/agents/executionPolicyResolver.test.js +208 -0
  55. package/dist/__tests__/agents/executionPolicyResolver.test.js.map +1 -0
  56. package/dist/__tests__/agents/fileCheckStep.test.js +299 -0
  57. package/dist/__tests__/agents/fileCheckStep.test.js.map +1 -0
  58. package/dist/__tests__/agents/giveUpEvaluatorStep.test.js +35 -0
  59. package/dist/__tests__/agents/giveUpEvaluatorStep.test.js.map +1 -0
  60. package/dist/__tests__/agents/guardState.test.js +297 -0
  61. package/dist/__tests__/agents/guardState.test.js.map +1 -0
  62. package/dist/__tests__/agents/mainAgentHeuristics.test.js +72 -0
  63. package/dist/__tests__/agents/mainAgentHeuristics.test.js.map +1 -0
  64. package/dist/__tests__/agents/objectiveEvaluatorStep.test.js +60 -0
  65. package/dist/__tests__/agents/objectiveEvaluatorStep.test.js.map +1 -0
  66. package/dist/__tests__/agents/outerLoopRecoveryEvaluator.test.js +207 -0
  67. package/dist/__tests__/agents/outerLoopRecoveryEvaluator.test.js.map +1 -0
  68. package/dist/__tests__/agents/prompting.test.js +363 -0
  69. package/dist/__tests__/agents/prompting.test.js.map +1 -0
  70. package/dist/__tests__/agents/readinessGateStep.test.js +180 -0
  71. package/dist/__tests__/agents/readinessGateStep.test.js.map +1 -0
  72. package/dist/__tests__/agents/reasonNextStep.test.js +56 -0
  73. package/dist/__tests__/agents/reasonNextStep.test.js.map +1 -0
  74. package/dist/__tests__/agents/reasonNextTaskStep.test.js +284 -0
  75. package/dist/__tests__/agents/reasonNextTaskStep.test.js.map +1 -0
  76. package/dist/__tests__/agents/resolveAgentTargetClassification.test.js +170 -0
  77. package/dist/__tests__/agents/resolveAgentTargetClassification.test.js.map +1 -0
  78. package/dist/__tests__/agents/resolveProgressState.test.js +526 -0
  79. package/dist/__tests__/agents/resolveProgressState.test.js.map +1 -0
  80. package/dist/__tests__/agents/resumeCheckpoint.test.js +50 -0
  81. package/dist/__tests__/agents/resumeCheckpoint.test.js.map +1 -0
  82. package/dist/__tests__/agents/routingDecisionStep.test.js +134 -0
  83. package/dist/__tests__/agents/routingDecisionStep.test.js.map +1 -0
  84. package/dist/__tests__/agents/scopeClassificationStep.test.js +118 -0
  85. package/dist/__tests__/agents/scopeClassificationStep.test.js.map +1 -0
  86. package/dist/__tests__/agents/searchContext.test.js +97 -0
  87. package/dist/__tests__/agents/searchContext.test.js.map +1 -0
  88. package/dist/__tests__/agents/selectRelevantSourcesStep.test.js +73 -0
  89. package/dist/__tests__/agents/selectRelevantSourcesStep.test.js.map +1 -0
  90. package/dist/__tests__/agents/structuredOutput.test.js +45 -0
  91. package/dist/__tests__/agents/structuredOutput.test.js.map +1 -0
  92. package/dist/__tests__/agents/transformPlanGenStep.fallback.test.js +59 -0
  93. package/dist/__tests__/agents/transformPlanGenStep.fallback.test.js.map +1 -0
  94. package/dist/__tests__/agents/transformPlanGenStep.test.js +92 -0
  95. package/dist/__tests__/agents/transformPlanGenStep.test.js.map +1 -0
  96. package/dist/__tests__/agents/understandIntentStep.test.js +237 -0
  97. package/dist/__tests__/agents/understandIntentStep.test.js.map +1 -0
  98. package/dist/__tests__/agents/understandResumeContext.test.js +65 -0
  99. package/dist/__tests__/agents/understandResumeContext.test.js.map +1 -0
  100. package/dist/__tests__/agents/understandScope.test.js +227 -0
  101. package/dist/__tests__/agents/understandScope.test.js.map +1 -0
  102. package/dist/__tests__/agents/validateChangesStep.test.js +52 -0
  103. package/dist/__tests__/agents/validateChangesStep.test.js.map +1 -0
  104. package/dist/__tests__/askCommandTaskBinding.test.js +176 -0
  105. package/dist/__tests__/askCommandTaskBinding.test.js.map +1 -0
  106. package/dist/__tests__/commandVisibility.test.js +25 -0
  107. package/dist/__tests__/commandVisibility.test.js.map +1 -0
  108. package/dist/__tests__/config.devOutput.test.js +82 -0
  109. package/dist/__tests__/config.devOutput.test.js.map +1 -0
  110. package/dist/__tests__/currentContext.test.js +43 -0
  111. package/dist/__tests__/currentContext.test.js.map +1 -0
  112. package/dist/__tests__/daemonWorker.test.js +51 -0
  113. package/dist/__tests__/daemonWorker.test.js.map +1 -0
  114. package/dist/__tests__/dialogState.test.js +113 -0
  115. package/dist/__tests__/dialogState.test.js.map +1 -0
  116. package/dist/__tests__/evalCommands.test.js +506 -0
  117. package/dist/__tests__/evalCommands.test.js.map +1 -0
  118. package/dist/__tests__/evalCommandsSummary.test.js +68 -0
  119. package/dist/__tests__/evalCommandsSummary.test.js.map +1 -0
  120. package/dist/__tests__/example.test.js +1 -0
  121. package/dist/__tests__/example.test.js.map +1 -0
  122. package/dist/__tests__/factory.commitCommand.test.js +45 -0
  123. package/dist/__tests__/factory.commitCommand.test.js.map +1 -0
  124. package/dist/__tests__/factory.devOutputCommand.test.js +122 -0
  125. package/dist/__tests__/factory.devOutputCommand.test.js.map +1 -0
  126. package/dist/__tests__/factory.evalCommands.test.js +38 -0
  127. package/dist/__tests__/factory.evalCommands.test.js.map +1 -0
  128. package/dist/__tests__/factory.planCommand.test.js +35 -0
  129. package/dist/__tests__/factory.planCommand.test.js.map +1 -0
  130. package/dist/__tests__/factory.setupCommand.test.js +34 -0
  131. package/dist/__tests__/factory.setupCommand.test.js.map +1 -0
  132. package/dist/__tests__/factory.statusCommand.test.js +54 -0
  133. package/dist/__tests__/factory.statusCommand.test.js.map +1 -0
  134. package/dist/__tests__/fileRules/queryTokenRules.test.js +35 -0
  135. package/dist/__tests__/fileRules/queryTokenRules.test.js.map +1 -0
  136. package/dist/__tests__/fileRules/searchPathClassification.test.js +57 -0
  137. package/dist/__tests__/fileRules/searchPathClassification.test.js.map +1 -0
  138. package/dist/__tests__/generate.ollamaRecovery.test.js +344 -0
  139. package/dist/__tests__/generate.ollamaRecovery.test.js.map +1 -0
  140. package/dist/__tests__/index.modelStartup.test.js +24 -0
  141. package/dist/__tests__/index.modelStartup.test.js.map +1 -0
  142. package/dist/__tests__/indexCmd.test.js +85 -0
  143. package/dist/__tests__/indexCmd.test.js.map +1 -0
  144. package/dist/__tests__/indexSlashCommand.test.js +50 -0
  145. package/dist/__tests__/indexSlashCommand.test.js.map +1 -0
  146. package/dist/__tests__/ollamaService.test.js +103 -0
  147. package/dist/__tests__/ollamaService.test.js.map +1 -0
  148. package/dist/__tests__/pipeline/modules/codeTransformModule.small-file.test.js +68 -0
  149. package/dist/__tests__/pipeline/modules/codeTransformModule.small-file.test.js.map +1 -0
  150. package/dist/__tests__/pipeline/modules/commitSuggesterModule.test.js +68 -0
  151. package/dist/__tests__/pipeline/modules/commitSuggesterModule.test.js.map +1 -0
  152. package/dist/__tests__/pipeline/modules/fileSearchModule.test.js +284 -0
  153. package/dist/__tests__/pipeline/modules/fileSearchModule.test.js.map +1 -0
  154. package/dist/__tests__/pipeline/modules/finalAnswerModule.test.js +1139 -0
  155. package/dist/__tests__/pipeline/modules/finalAnswerModule.test.js.map +1 -0
  156. package/dist/__tests__/pipeline/modules/readFileModule.test.js +146 -0
  157. package/dist/__tests__/pipeline/modules/readFileModule.test.js.map +1 -0
  158. package/dist/__tests__/pipeline/modules/semanticAnalysisModule.test.js +192 -0
  159. package/dist/__tests__/pipeline/modules/semanticAnalysisModule.test.js.map +1 -0
  160. package/dist/__tests__/repoIdentity.test.js +31 -0
  161. package/dist/__tests__/repoIdentity.test.js.map +1 -0
  162. package/dist/__tests__/resumeContext.test.js +87 -0
  163. package/dist/__tests__/resumeContext.test.js.map +1 -0
  164. package/dist/__tests__/resumeState.test.js +239 -0
  165. package/dist/__tests__/resumeState.test.js.map +1 -0
  166. package/dist/__tests__/search/SearchOrchestrator.test.js +836 -0
  167. package/dist/__tests__/search/SearchOrchestrator.test.js.map +1 -0
  168. package/dist/__tests__/shellDialogUi.test.js +52 -0
  169. package/dist/__tests__/shellDialogUi.test.js.map +1 -0
  170. package/dist/__tests__/shellSession.test.js +102 -0
  171. package/dist/__tests__/shellSession.test.js.map +1 -0
  172. package/dist/__tests__/statusOwner.test.js +215 -0
  173. package/dist/__tests__/statusOwner.test.js.map +1 -0
  174. package/dist/__tests__/testing/contextEval.test.js +244 -0
  175. package/dist/__tests__/testing/contextEval.test.js.map +1 -0
  176. package/dist/__tests__/testing/harnessArtifacts.test.js +124 -0
  177. package/dist/__tests__/testing/harnessArtifacts.test.js.map +1 -0
  178. package/dist/__tests__/testing/llmTraceSession.test.js +67 -0
  179. package/dist/__tests__/testing/llmTraceSession.test.js.map +1 -0
  180. package/dist/__tests__/testing/registerDevCliCommands.test.js +35 -0
  181. package/dist/__tests__/testing/registerDevCliCommands.test.js.map +1 -0
  182. package/dist/__tests__/testing/runDiagnosis.test.js +159 -0
  183. package/dist/__tests__/testing/runDiagnosis.test.js.map +1 -0
  184. package/dist/__tests__/testing/runtimeLogReader.test.js +66 -0
  185. package/dist/__tests__/testing/runtimeLogReader.test.js.map +1 -0
  186. package/dist/__tests__/testing/testCommands.test.js +53 -0
  187. package/dist/__tests__/testing/testCommands.test.js.map +1 -0
  188. package/dist/__tests__/utils/compileSearchQuery.test.js +38 -0
  189. package/dist/__tests__/utils/compileSearchQuery.test.js.map +1 -0
  190. package/dist/__tests__/utils/consolePresentation.test.js +105 -0
  191. package/dist/__tests__/utils/consolePresentation.test.js.map +1 -0
  192. package/dist/__tests__/utils/extractFileReferences.test.js +41 -0
  193. package/dist/__tests__/utils/extractFileReferences.test.js.map +1 -0
  194. package/dist/__tests__/utils/log.test.js +34 -0
  195. package/dist/__tests__/utils/log.test.js.map +1 -0
  196. package/dist/__tests__/utils/runtimeLogger.test.js +200 -0
  197. package/dist/__tests__/utils/runtimeLogger.test.js.map +1 -0
  198. package/dist/__tests__/utils/spinner.test.js +31 -0
  199. package/dist/__tests__/utils/spinner.test.js.map +1 -0
  200. package/dist/__tests__/utils/verifyFocusPreference.test.js +41 -0
  201. package/dist/__tests__/utils/verifyFocusPreference.test.js.map +1 -0
  202. package/dist/agent/actions/index.js +301 -0
  203. package/dist/agent/actions/index.js.map +1 -0
  204. package/dist/agent/actions/normalize.js +360 -0
  205. package/dist/agent/actions/normalize.js.map +1 -0
  206. package/dist/agent/actions/schemas.js +129 -0
  207. package/dist/agent/actions/schemas.js.map +1 -0
  208. package/dist/agent/evidence/index.js +320 -0
  209. package/dist/agent/evidence/index.js.map +1 -0
  210. package/dist/agent/feedback/index.js +187 -0
  211. package/dist/agent/feedback/index.js.map +1 -0
  212. package/dist/agent/finalization/index.js +35 -0
  213. package/dist/agent/finalization/index.js.map +1 -0
  214. package/dist/agent/index.js +126 -0
  215. package/dist/agent/index.js.map +1 -0
  216. package/dist/agent/logging/index.js +350 -0
  217. package/dist/agent/logging/index.js.map +1 -0
  218. package/dist/agent/persistence/boot.js +58 -0
  219. package/dist/agent/persistence/boot.js.map +1 -0
  220. package/dist/agent/persistence/currentTask.js +36 -0
  221. package/dist/agent/persistence/currentTask.js.map +1 -0
  222. package/dist/agent/persistence/hydrate.js +42 -0
  223. package/dist/agent/persistence/hydrate.js.map +1 -0
  224. package/dist/agent/persistence/index.js +15 -0
  225. package/dist/agent/persistence/index.js.map +1 -0
  226. package/dist/agent/persistence/snapshots.js +97 -0
  227. package/dist/agent/persistence/snapshots.js.map +1 -0
  228. package/dist/agent/persistence/steps.js +95 -0
  229. package/dist/agent/persistence/steps.js.map +1 -0
  230. package/dist/agent/persistence/tasks.js +195 -0
  231. package/dist/agent/persistence/tasks.js.map +1 -0
  232. package/dist/agent/persistence/turns.js +92 -0
  233. package/dist/agent/persistence/turns.js.map +1 -0
  234. package/dist/agent/policy/ambiguityResolution.js +226 -0
  235. package/dist/agent/policy/ambiguityResolution.js.map +1 -0
  236. package/dist/agent/policy/contracts.js +2 -0
  237. package/dist/agent/policy/contracts.js.map +1 -0
  238. package/dist/agent/policy/coveragePolicy.js +309 -0
  239. package/dist/agent/policy/coveragePolicy.js.map +1 -0
  240. package/dist/agent/policy/endDecisionPolicy.js +31 -0
  241. package/dist/agent/policy/endDecisionPolicy.js.map +1 -0
  242. package/dist/agent/policy/index.js +344 -0
  243. package/dist/agent/policy/index.js.map +1 -0
  244. package/dist/agent/policy/loopReview.js +778 -0
  245. package/dist/agent/policy/loopReview.js.map +1 -0
  246. package/dist/agent/policy/readinessPolicy.js +108 -0
  247. package/dist/agent/policy/readinessPolicy.js.map +1 -0
  248. package/dist/agent/policy/resolutionPipeline.js +356 -0
  249. package/dist/agent/policy/resolutionPipeline.js.map +1 -0
  250. package/dist/agent/policy/targetClassification.js +33 -0
  251. package/dist/agent/policy/targetClassification.js.map +1 -0
  252. package/dist/agent/prompting/actionChoice.js +90 -0
  253. package/dist/agent/prompting/actionChoice.js.map +1 -0
  254. package/dist/agent/prompting/finalAnswer.js +38 -0
  255. package/dist/agent/prompting/finalAnswer.js.map +1 -0
  256. package/dist/agent/prompting/index.js +14 -0
  257. package/dist/agent/prompting/index.js.map +1 -0
  258. package/dist/agent/prompting/plan.js +59 -0
  259. package/dist/agent/prompting/plan.js.map +1 -0
  260. package/dist/agent/prompting/transform.js +175 -0
  261. package/dist/agent/prompting/transform.js.map +1 -0
  262. package/dist/agent/prompting/understand.js +70 -0
  263. package/dist/agent/prompting/understand.js.map +1 -0
  264. package/dist/agent/read/freshness.js +29 -0
  265. package/dist/agent/read/freshness.js.map +1 -0
  266. package/dist/agent/read/fullReadPrompt.js +43 -0
  267. package/dist/agent/read/fullReadPrompt.js.map +1 -0
  268. package/dist/agent/read/index.js +140 -0
  269. package/dist/agent/read/index.js.map +1 -0
  270. package/dist/agent/read/persistence.js +88 -0
  271. package/dist/agent/read/persistence.js.map +1 -0
  272. package/dist/agent/read/summarizeReadEvidence.js +733 -0
  273. package/dist/agent/read/summarizeReadEvidence.js.map +1 -0
  274. package/dist/agent/read/targetResolution.js +126 -0
  275. package/dist/agent/read/targetResolution.js.map +1 -0
  276. package/dist/agent/resume/checkpoint.js +41 -0
  277. package/dist/agent/resume/checkpoint.js.map +1 -0
  278. package/dist/agent/runtime/lifecycle.js +67 -0
  279. package/dist/agent/runtime/lifecycle.js.map +1 -0
  280. package/dist/agent/runtime/progress.js +178 -0
  281. package/dist/agent/runtime/progress.js.map +1 -0
  282. package/dist/agent/runtime/runAgentLoop.js +402 -0
  283. package/dist/agent/runtime/runAgentLoop.js.map +1 -0
  284. package/dist/agent/runtime/runAgentPlanOnly.js +127 -0
  285. package/dist/agent/runtime/runAgentPlanOnly.js.map +1 -0
  286. package/dist/agent/runtime/understand.js +336 -0
  287. package/dist/agent/runtime/understand.js.map +1 -0
  288. package/dist/agent/search/batchPlanner.js +274 -0
  289. package/dist/agent/search/batchPlanner.js.map +1 -0
  290. package/dist/agent/search/candidateRetentionPolicy.js +184 -0
  291. package/dist/agent/search/candidateRetentionPolicy.js.map +1 -0
  292. package/dist/agent/search/directory.js +51 -0
  293. package/dist/agent/search/directory.js.map +1 -0
  294. package/dist/agent/search/exactTarget.js +151 -0
  295. package/dist/agent/search/exactTarget.js.map +1 -0
  296. package/dist/agent/search/fragment.js +110 -0
  297. package/dist/agent/search/fragment.js.map +1 -0
  298. package/dist/agent/search/index.js +166 -0
  299. package/dist/agent/search/index.js.map +1 -0
  300. package/dist/agent/search/laneClassifier.js +119 -0
  301. package/dist/agent/search/laneClassifier.js.map +1 -0
  302. package/dist/agent/search/limits.js +10 -0
  303. package/dist/agent/search/limits.js.map +1 -0
  304. package/dist/agent/search/ranking.js +22 -0
  305. package/dist/agent/search/ranking.js.map +1 -0
  306. package/dist/agent/search/regex.js +83 -0
  307. package/dist/agent/search/regex.js.map +1 -0
  308. package/dist/agent/search/routePolicy.js +11 -0
  309. package/dist/agent/search/routePolicy.js.map +1 -0
  310. package/dist/agent/search/searchContext.js +128 -0
  311. package/dist/agent/search/searchContext.js.map +1 -0
  312. package/dist/agent/search/semantic.js +113 -0
  313. package/dist/agent/search/semantic.js.map +1 -0
  314. package/dist/agent/search/semanticIndexSearch.js +202 -0
  315. package/dist/agent/search/semanticIndexSearch.js.map +1 -0
  316. package/dist/agent/search/shared.js +283 -0
  317. package/dist/agent/search/shared.js.map +1 -0
  318. package/dist/agent/search/shell.js +202 -0
  319. package/dist/agent/search/shell.js.map +1 -0
  320. package/dist/agent/search/snippetEvidence.js +57 -0
  321. package/dist/agent/search/snippetEvidence.js.map +1 -0
  322. package/dist/agent/search/types.js +2 -0
  323. package/dist/agent/search/types.js.map +1 -0
  324. package/dist/agent/state/index.js +99 -0
  325. package/dist/agent/state/index.js.map +1 -0
  326. package/dist/agent/state/memory.js +56 -0
  327. package/dist/agent/state/memory.js.map +1 -0
  328. package/dist/agent/structuredOutput/index.js +28 -0
  329. package/dist/agent/structuredOutput/index.js.map +1 -0
  330. package/dist/agent/tools/index.js +199 -0
  331. package/dist/agent/tools/index.js.map +1 -0
  332. package/dist/agent/transform/index.js +519 -0
  333. package/dist/agent/transform/index.js.map +1 -0
  334. package/dist/agent/transform/syntax.js +49 -0
  335. package/dist/agent/transform/syntax.js.map +1 -0
  336. package/dist/agent/types.js +20 -0
  337. package/dist/agent/types.js.map +1 -0
  338. package/dist/agents/actionRegistry.js +114 -0
  339. package/dist/agents/actionRegistry.js.map +1 -0
  340. package/dist/agents/agent.js +5 -0
  341. package/dist/agents/agent.js.map +1 -0
  342. package/dist/agents/agentActions.js +5 -0
  343. package/dist/agents/agentActions.js.map +1 -0
  344. package/dist/agents/agentEvidence.js +5 -0
  345. package/dist/agents/agentEvidence.js.map +1 -0
  346. package/dist/agents/agentFeedback.js +5 -0
  347. package/dist/agents/agentFeedback.js.map +1 -0
  348. package/dist/agents/agentLogging.js +5 -0
  349. package/dist/agents/agentLogging.js.map +1 -0
  350. package/dist/agents/agentLoop.js +5 -0
  351. package/dist/agents/agentLoop.js.map +1 -0
  352. package/dist/agents/agentMemory.js +5 -0
  353. package/dist/agents/agentMemory.js.map +1 -0
  354. package/dist/agents/agentPlanMode.js +5 -0
  355. package/dist/agents/agentPlanMode.js.map +1 -0
  356. package/dist/agents/agentPolicyState.js +5 -0
  357. package/dist/agents/agentPolicyState.js.map +1 -0
  358. package/dist/agents/agentProgress.js +93 -0
  359. package/dist/agents/agentProgress.js.map +1 -0
  360. package/dist/agents/agentSchemas.js +5 -0
  361. package/dist/agents/agentSchemas.js.map +1 -0
  362. package/dist/agents/agentSearchScoring.js +5 -0
  363. package/dist/agents/agentSearchScoring.js.map +1 -0
  364. package/dist/agents/agentStateMachine.js +5 -0
  365. package/dist/agents/agentStateMachine.js.map +1 -0
  366. package/dist/agents/agentTools.js +5 -0
  367. package/dist/agents/agentTools.js.map +1 -0
  368. package/dist/agents/agentTypes.js +5 -0
  369. package/dist/agents/agentTypes.js.map +1 -0
  370. package/dist/agents/agentUnderstand.js +5 -0
  371. package/dist/agents/agentUnderstand.js.map +1 -0
  372. package/dist/agents/analysisPlanGenStep.js +194 -17
  373. package/dist/agents/analysisPlanGenStep.js.map +1 -0
  374. package/dist/agents/answerOnlyCompletion.js +32 -0
  375. package/dist/agents/answerOnlyCompletion.js.map +1 -0
  376. package/dist/agents/collaboratorStep.js +1 -0
  377. package/dist/agents/collaboratorStep.js.map +1 -0
  378. package/dist/agents/decideNextAction.js +444 -0
  379. package/dist/agents/decideNextAction.js.map +1 -0
  380. package/dist/agents/deriveFocusFromSearchStep.js +83 -0
  381. package/dist/agents/deriveFocusFromSearchStep.js.map +1 -0
  382. package/dist/agents/evidenceVerifierStep.js +104 -13
  383. package/dist/agents/evidenceVerifierStep.js.map +1 -0
  384. package/dist/agents/fileCheckStep.js +381 -12
  385. package/dist/agents/fileCheckStep.js.map +1 -0
  386. package/dist/agents/giveUpEvaluatorStep.js +63 -0
  387. package/dist/agents/giveUpEvaluatorStep.js.map +1 -0
  388. package/dist/agents/guardPolicy.js +20 -0
  389. package/dist/agents/guardPolicy.js.map +1 -0
  390. package/dist/agents/guards/executionPolicyResolver.js +165 -0
  391. package/dist/agents/guards/executionPolicyResolver.js.map +1 -0
  392. package/dist/agents/guards/guardState.js +195 -0
  393. package/dist/agents/guards/guardState.js.map +1 -0
  394. package/dist/agents/guards/resolveProgressState.js +403 -0
  395. package/dist/agents/guards/resolveProgressState.js.map +1 -0
  396. package/dist/agents/infoPlanGenStep.js +66 -8
  397. package/dist/agents/infoPlanGenStep.js.map +1 -0
  398. package/dist/agents/integrateFeedbackStep.js +1 -0
  399. package/dist/agents/integrateFeedbackStep.js.map +1 -0
  400. package/dist/agents/iterationFileSelector.js +8 -7
  401. package/dist/agents/iterationFileSelector.js.map +1 -0
  402. package/dist/agents/mainAgentActivityLog.js +85 -0
  403. package/dist/agents/mainAgentActivityLog.js.map +1 -0
  404. package/dist/agents/mainAgentHeuristics.js +173 -0
  405. package/dist/agents/mainAgentHeuristics.js.map +1 -0
  406. package/dist/agents/mainAgentVerify.js +159 -0
  407. package/dist/agents/mainAgentVerify.js.map +1 -0
  408. package/dist/agents/objectiveEvaluatorStep.js +103 -0
  409. package/dist/agents/objectiveEvaluatorStep.js.map +1 -0
  410. package/dist/agents/outerLoopRecoveryEvaluator.js +108 -0
  411. package/dist/agents/outerLoopRecoveryEvaluator.js.map +1 -0
  412. package/dist/agents/readinessGateStep.js +95 -9
  413. package/dist/agents/readinessGateStep.js.map +1 -0
  414. package/dist/agents/reasonNextStep.js +9 -8
  415. package/dist/agents/reasonNextStep.js.map +1 -0
  416. package/dist/agents/reasonNextTaskStep.js +267 -144
  417. package/dist/agents/reasonNextTaskStep.js.map +1 -0
  418. package/dist/agents/researchPlanGenStep.js +61 -25
  419. package/dist/agents/researchPlanGenStep.js.map +1 -0
  420. package/dist/agents/resolveAgentTargetClassification.js +5 -0
  421. package/dist/agents/resolveAgentTargetClassification.js.map +1 -0
  422. package/dist/agents/resolveExecutionModeStep.js +1 -0
  423. package/dist/agents/resolveExecutionModeStep.js.map +1 -0
  424. package/dist/agents/resolveExplicitTargetsStep.js +74 -0
  425. package/dist/agents/resolveExplicitTargetsStep.js.map +1 -0
  426. package/dist/agents/routingDecisionStep.js +58 -11
  427. package/dist/agents/routingDecisionStep.js.map +1 -0
  428. package/dist/agents/scopeClassificationStep.js +66 -3
  429. package/dist/agents/scopeClassificationStep.js.map +1 -0
  430. package/dist/agents/selectRelevantSourcesStep.js +13 -5
  431. package/dist/agents/selectRelevantSourcesStep.js.map +1 -0
  432. package/dist/agents/structuralPreloadStep.js +3 -4
  433. package/dist/agents/structuralPreloadStep.js.map +1 -0
  434. package/dist/agents/transformPlanGenStep.js +105 -18
  435. package/dist/agents/transformPlanGenStep.js.map +1 -0
  436. package/dist/agents/understandIntentStep.js +237 -17
  437. package/dist/agents/understandIntentStep.js.map +1 -0
  438. package/dist/agents/validateChangesStep.js +16 -2
  439. package/dist/agents/validateChangesStep.js.map +1 -0
  440. package/dist/agents/writeFileStep.js +1 -0
  441. package/dist/agents/writeFileStep.js.map +1 -0
  442. package/dist/commands/AskCmd.js +139 -44
  443. package/dist/commands/AskCmd.js.map +1 -0
  444. package/dist/commands/BackupCmd.js +1 -0
  445. package/dist/commands/BackupCmd.js.map +1 -0
  446. package/dist/commands/ChangeLogUpdateCmd.js +1 -0
  447. package/dist/commands/ChangeLogUpdateCmd.js.map +1 -0
  448. package/dist/commands/CommitSuggesterCmd.js +55 -13
  449. package/dist/commands/CommitSuggesterCmd.js.map +1 -0
  450. package/dist/commands/DaemonCmd.js +52 -14
  451. package/dist/commands/DaemonCmd.js.map +1 -0
  452. package/dist/commands/DeleteIndex.js +1 -0
  453. package/dist/commands/DeleteIndex.js.map +1 -0
  454. package/dist/commands/EvalReportCmd.js +374 -0
  455. package/dist/commands/EvalReportCmd.js.map +1 -0
  456. package/dist/commands/FindCmd.js +1 -0
  457. package/dist/commands/FindCmd.js.map +1 -0
  458. package/dist/commands/GitCmd.js +1 -0
  459. package/dist/commands/GitCmd.js.map +1 -0
  460. package/dist/commands/IndexCmd.js +11 -79
  461. package/dist/commands/IndexCmd.js.map +1 -0
  462. package/dist/commands/InspectCmd.js +1 -0
  463. package/dist/commands/InspectCmd.js.map +1 -0
  464. package/dist/commands/ModelCmd.js +24 -0
  465. package/dist/commands/ModelCmd.js.map +1 -0
  466. package/dist/commands/ReadlineSingleton.js +1 -0
  467. package/dist/commands/ReadlineSingleton.js.map +1 -0
  468. package/dist/commands/ResetDbCmd.js +18 -1
  469. package/dist/commands/ResetDbCmd.js.map +1 -0
  470. package/dist/commands/ReviewCmd.js +1 -0
  471. package/dist/commands/ReviewCmd.js.map +1 -0
  472. package/dist/commands/StatusCmd.js +22 -0
  473. package/dist/commands/StatusCmd.js.map +1 -0
  474. package/dist/commands/StopDaemonCmd.js +1 -0
  475. package/dist/commands/StopDaemonCmd.js.map +1 -0
  476. package/dist/commands/SummaryCmd.js +1 -0
  477. package/dist/commands/SummaryCmd.js.map +1 -0
  478. package/dist/commands/SwitchCmd.js +9 -15
  479. package/dist/commands/SwitchCmd.js.map +1 -0
  480. package/dist/commands/TasksCmd.js +142 -57
  481. package/dist/commands/TasksCmd.js.map +1 -0
  482. package/dist/commands/TestCmd.js +66 -0
  483. package/dist/commands/TestCmd.js.map +1 -0
  484. package/dist/commands/WorkflowCmd.js +1 -0
  485. package/dist/commands/WorkflowCmd.js.map +1 -0
  486. package/dist/commands/commandVisibility.js +27 -0
  487. package/dist/commands/commandVisibility.js.map +1 -0
  488. package/dist/commands/evalCommands.js +1337 -0
  489. package/dist/commands/evalCommands.js.map +1 -0
  490. package/dist/commands/factory.js +206 -38
  491. package/dist/commands/factory.js.map +1 -0
  492. package/dist/config.js +62 -11
  493. package/dist/config.js.map +1 -0
  494. package/dist/constants.js +21 -3
  495. package/dist/constants.js.map +1 -0
  496. package/dist/context.js +33 -32
  497. package/dist/context.js.map +1 -0
  498. package/dist/daemon/daemonQueues.js +1 -20
  499. package/dist/daemon/daemonQueues.js.map +1 -0
  500. package/dist/daemon/daemonWorker.js +26 -37
  501. package/dist/daemon/daemonWorker.js.map +1 -0
  502. package/dist/daemon/generateSummaries.js +1 -0
  503. package/dist/daemon/generateSummaries.js.map +1 -0
  504. package/dist/daemon/runFolderCapsuleBatch.js +1 -0
  505. package/dist/daemon/runFolderCapsuleBatch.js.map +1 -0
  506. package/dist/daemon/runIndexingBatch.js +1 -0
  507. package/dist/daemon/runIndexingBatch.js.map +1 -0
  508. package/dist/daemon/runKgBatch.js +9 -1
  509. package/dist/daemon/runKgBatch.js.map +1 -0
  510. package/dist/db/backup.js +1 -0
  511. package/dist/db/backup.js.map +1 -0
  512. package/dist/db/client.js +18 -3
  513. package/dist/db/client.js.map +1 -0
  514. package/dist/db/fileIndex.js +110 -152
  515. package/dist/db/fileIndex.js.map +1 -0
  516. package/dist/db/functionExtractors/extractFromJava.js +1 -0
  517. package/dist/db/functionExtractors/extractFromJava.js.map +1 -0
  518. package/dist/db/functionExtractors/extractFromJs.js +1 -0
  519. package/dist/db/functionExtractors/extractFromJs.js.map +1 -0
  520. package/dist/db/functionExtractors/extractFromTs.js +1 -0
  521. package/dist/db/functionExtractors/extractFromTs.js.map +1 -0
  522. package/dist/db/functionExtractors/extractFromXML.js +1 -0
  523. package/dist/db/functionExtractors/extractFromXML.js.map +1 -0
  524. package/dist/db/functionExtractors/index.js +1 -0
  525. package/dist/db/functionExtractors/index.js.map +1 -0
  526. package/dist/db/functionIndex.js +9 -0
  527. package/dist/db/functionIndex.js.map +1 -0
  528. package/dist/db/schema.js +314 -99
  529. package/dist/db/schema.js.map +1 -0
  530. package/dist/db/sqlTemplates.js +1 -0
  531. package/dist/db/sqlTemplates.js.map +1 -0
  532. package/dist/fileRules/builtins.js +1 -0
  533. package/dist/fileRules/builtins.js.map +1 -0
  534. package/dist/fileRules/classifyFile.js +1 -0
  535. package/dist/fileRules/classifyFile.js.map +1 -0
  536. package/dist/fileRules/codeAllowedExtensions.js +1 -0
  537. package/dist/fileRules/codeAllowedExtensions.js.map +1 -0
  538. package/dist/fileRules/detectFileType.js +1 -0
  539. package/dist/fileRules/detectFileType.js.map +1 -0
  540. package/dist/fileRules/fileClassifier.js +1 -0
  541. package/dist/fileRules/fileClassifier.js.map +1 -0
  542. package/dist/fileRules/fileExceptions.js +1 -0
  543. package/dist/fileRules/fileExceptions.js.map +1 -0
  544. package/dist/fileRules/ignoredExtensions.js +1 -0
  545. package/dist/fileRules/ignoredExtensions.js.map +1 -0
  546. package/dist/fileRules/ignoredPaths.js +48 -5
  547. package/dist/fileRules/ignoredPaths.js.map +1 -0
  548. package/dist/fileRules/queryTokenRules.js +176 -0
  549. package/dist/fileRules/queryTokenRules.js.map +1 -0
  550. package/dist/fileRules/searchPathClassification.js +58 -0
  551. package/dist/fileRules/searchPathClassification.js.map +1 -0
  552. package/dist/fileRules/shouldIgnoreFiles.js +1 -0
  553. package/dist/fileRules/shouldIgnoreFiles.js.map +1 -0
  554. package/dist/fileRules/stopWords.js +9 -0
  555. package/dist/fileRules/stopWords.js.map +1 -0
  556. package/dist/fileRules/wellKnownRepoFiles.js +1 -0
  557. package/dist/fileRules/wellKnownRepoFiles.js.map +1 -0
  558. package/dist/git/commitSummary.js +227 -0
  559. package/dist/git/commitSummary.js.map +1 -0
  560. package/dist/github/api.js +1 -0
  561. package/dist/github/api.js.map +1 -0
  562. package/dist/github/auth.js +1 -0
  563. package/dist/github/auth.js.map +1 -0
  564. package/dist/github/github.js +1 -0
  565. package/dist/github/github.js.map +1 -0
  566. package/dist/github/githubAuthCheck.js +1 -0
  567. package/dist/github/githubAuthCheck.js.map +1 -0
  568. package/dist/github/postComments.js +1 -0
  569. package/dist/github/postComments.js.map +1 -0
  570. package/dist/github/repo.js +15 -24
  571. package/dist/github/repo.js.map +1 -0
  572. package/dist/github/token.js +1 -0
  573. package/dist/github/token.js.map +1 -0
  574. package/dist/github/types.js +1 -0
  575. package/dist/github/types.js.map +1 -0
  576. package/dist/index.js +318 -37
  577. package/dist/index.js.map +1 -0
  578. package/dist/lib/generate.js +264 -20
  579. package/dist/lib/generate.js.map +1 -0
  580. package/dist/lib/generateFolderCapsules.js +1 -0
  581. package/dist/lib/generateFolderCapsules.js.map +1 -0
  582. package/dist/lib/ollamaModelPolicy.js +59 -0
  583. package/dist/lib/ollamaModelPolicy.js.map +1 -0
  584. package/dist/lib/spinner.js +29 -9
  585. package/dist/lib/spinner.js.map +1 -0
  586. package/dist/modelSetup.js +25 -78
  587. package/dist/modelSetup.js.map +1 -0
  588. package/dist/pipeline/modules/changeLogModule.js +10 -1
  589. package/dist/pipeline/modules/changeLogModule.js.map +1 -0
  590. package/dist/pipeline/modules/cleanupModule.js +1 -0
  591. package/dist/pipeline/modules/cleanupModule.js.map +1 -0
  592. package/dist/pipeline/modules/codeTransformModule.js +10 -16
  593. package/dist/pipeline/modules/codeTransformModule.js.map +1 -0
  594. package/dist/pipeline/modules/commentModule.js +12 -0
  595. package/dist/pipeline/modules/commentModule.js.map +1 -0
  596. package/dist/pipeline/modules/commitSuggesterModule.js +82 -12
  597. package/dist/pipeline/modules/commitSuggesterModule.js.map +1 -0
  598. package/dist/pipeline/modules/contextReviewModule.js +12 -1
  599. package/dist/pipeline/modules/contextReviewModule.js.map +1 -0
  600. package/dist/pipeline/modules/dialogAnswerModule.js +58 -0
  601. package/dist/pipeline/modules/dialogAnswerModule.js.map +1 -0
  602. package/dist/pipeline/modules/fileSearchModule.js +5 -143
  603. package/dist/pipeline/modules/fileSearchModule.js.map +1 -0
  604. package/dist/pipeline/modules/finalAnswerModule.js +1176 -151
  605. package/dist/pipeline/modules/finalAnswerModule.js.map +1 -0
  606. package/dist/pipeline/modules/kgModule.js +18 -1
  607. package/dist/pipeline/modules/kgModule.js.map +1 -0
  608. package/dist/pipeline/modules/planAnswerModule.js +99 -0
  609. package/dist/pipeline/modules/planAnswerModule.js.map +1 -0
  610. package/dist/pipeline/modules/readFileModule.js +300 -0
  611. package/dist/pipeline/modules/readFileModule.js.map +1 -0
  612. package/dist/pipeline/modules/reviewModule.js +10 -1
  613. package/dist/pipeline/modules/reviewModule.js.map +1 -0
  614. package/dist/pipeline/modules/searchDbModule.js +159 -0
  615. package/dist/pipeline/modules/searchDbModule.js.map +1 -0
  616. package/dist/pipeline/modules/searchListDirectoryModule.js +62 -0
  617. package/dist/pipeline/modules/searchListDirectoryModule.js.map +1 -0
  618. package/dist/pipeline/modules/searchModuleShared.js +71 -0
  619. package/dist/pipeline/modules/searchModuleShared.js.map +1 -0
  620. package/dist/pipeline/modules/searchRegexModule.js +59 -0
  621. package/dist/pipeline/modules/searchRegexModule.js.map +1 -0
  622. package/dist/pipeline/modules/semanticAnalysisModule.js +185 -28
  623. package/dist/pipeline/modules/semanticAnalysisModule.js.map +1 -0
  624. package/dist/pipeline/modules/summaryModule.js +11 -1
  625. package/dist/pipeline/modules/summaryModule.js.map +1 -0
  626. package/dist/pipeline/registry/moduleRegistry.js +9 -0
  627. package/dist/pipeline/registry/moduleRegistry.js.map +1 -0
  628. package/dist/pipeline/runModulePipeline.js +1 -0
  629. package/dist/pipeline/runModulePipeline.js.map +1 -0
  630. package/dist/scripts/dbScriptSupport.js +172 -0
  631. package/dist/scripts/dbScriptSupport.js.map +1 -0
  632. package/dist/scripts/dbcheck.js +173 -267
  633. package/dist/scripts/dbcheck.js.map +1 -0
  634. package/dist/scripts/dboverview.js +161 -0
  635. package/dist/scripts/dboverview.js.map +1 -0
  636. package/dist/scripts/migrateDb.js +1 -0
  637. package/dist/scripts/migrateDb.js.map +1 -0
  638. package/dist/search/SearchOrchestrator.js +928 -0
  639. package/dist/search/SearchOrchestrator.js.map +1 -0
  640. package/dist/search/sharedRankingPolicy.js +283 -0
  641. package/dist/search/sharedRankingPolicy.js.map +1 -0
  642. package/dist/setup/reindexOwner.js +97 -0
  643. package/dist/setup/reindexOwner.js.map +1 -0
  644. package/dist/setup/setupOwner.js +100 -0
  645. package/dist/setup/setupOwner.js.map +1 -0
  646. package/dist/shell/dialogUi.js +81 -0
  647. package/dist/shell/dialogUi.js.map +1 -0
  648. package/dist/shellSession.js +126 -0
  649. package/dist/shellSession.js.map +1 -0
  650. package/dist/status/statusOwner.js +239 -0
  651. package/dist/status/statusOwner.js.map +1 -0
  652. package/dist/testing/contextEval.js +514 -0
  653. package/dist/testing/contextEval.js.map +1 -0
  654. package/dist/testing/fixtures/transform/small-file.input.js +5 -0
  655. package/dist/testing/fixtures/transform/small-file.input.js.map +1 -0
  656. package/dist/testing/harnessArtifacts.js +112 -0
  657. package/dist/testing/harnessArtifacts.js.map +1 -0
  658. package/dist/testing/llmTraceSession.js +67 -0
  659. package/dist/testing/llmTraceSession.js.map +1 -0
  660. package/dist/testing/registerDevCliCommands.js +43 -0
  661. package/dist/testing/registerDevCliCommands.js.map +1 -0
  662. package/dist/testing/runDiagnosis.js +248 -0
  663. package/dist/testing/runDiagnosis.js.map +1 -0
  664. package/dist/testing/runtimeLogReader.js +144 -0
  665. package/dist/testing/runtimeLogReader.js.map +1 -0
  666. package/dist/testing/testCommands.js +35 -303
  667. package/dist/testing/testCommands.js.map +1 -0
  668. package/dist/testing/testRegistry.js +233 -0
  669. package/dist/testing/testRegistry.js.map +1 -0
  670. package/dist/types.js +1 -0
  671. package/dist/types.js.map +1 -0
  672. package/dist/utils/buildContextualPrompt.js +26 -75
  673. package/dist/utils/buildContextualPrompt.js.map +1 -0
  674. package/dist/utils/changeLogPrompt.js +1 -0
  675. package/dist/utils/changeLogPrompt.js.map +1 -0
  676. package/dist/utils/checkModel.js +17 -92
  677. package/dist/utils/checkModel.js.map +1 -0
  678. package/dist/utils/commentMap.js +1 -0
  679. package/dist/utils/commentMap.js.map +1 -0
  680. package/dist/utils/compileSearchQuery.js +23 -9
  681. package/dist/utils/compileSearchQuery.js.map +1 -0
  682. package/dist/utils/consolePresentation.js +208 -0
  683. package/dist/utils/consolePresentation.js.map +1 -0
  684. package/dist/utils/contentUtils.js +17 -2
  685. package/dist/utils/contentUtils.js.map +1 -0
  686. package/dist/utils/debugContext.js +1 -0
  687. package/dist/utils/debugContext.js.map +1 -0
  688. package/dist/utils/dialogState.js +201 -0
  689. package/dist/utils/dialogState.js.map +1 -0
  690. package/dist/utils/editor.js +1 -0
  691. package/dist/utils/editor.js.map +1 -0
  692. package/dist/utils/executionEvidence.js +50 -0
  693. package/dist/utils/executionEvidence.js.map +1 -0
  694. package/dist/utils/extractFileReferences.js +140 -6
  695. package/dist/utils/extractFileReferences.js.map +1 -0
  696. package/dist/utils/fileEvidenceCache.js +50 -0
  697. package/dist/utils/fileEvidenceCache.js.map +1 -0
  698. package/dist/utils/fileTree.js +1 -0
  699. package/dist/utils/fileTree.js.map +1 -0
  700. package/dist/utils/loadRelevantFolderCapsules.js +35 -5
  701. package/dist/utils/loadRelevantFolderCapsules.js.map +1 -0
  702. package/dist/utils/log.js +10 -1
  703. package/dist/utils/log.js.map +1 -0
  704. package/dist/utils/normalizeData.js +1 -0
  705. package/dist/utils/normalizeData.js.map +1 -0
  706. package/dist/utils/ollamaModelStatus.js +28 -0
  707. package/dist/utils/ollamaModelStatus.js.map +1 -0
  708. package/dist/utils/ollamaService.js +294 -0
  709. package/dist/utils/ollamaService.js.map +1 -0
  710. package/dist/utils/outputFormatter.js +1 -0
  711. package/dist/utils/outputFormatter.js.map +1 -0
  712. package/dist/utils/parseTaggedContent.js +1 -0
  713. package/dist/utils/parseTaggedContent.js.map +1 -0
  714. package/dist/utils/planActions.js +27 -46
  715. package/dist/utils/planActions.js.map +1 -0
  716. package/dist/utils/promptBuilderHelper.js +1 -0
  717. package/dist/utils/promptBuilderHelper.js.map +1 -0
  718. package/dist/utils/promptLogHelper.js +29 -13
  719. package/dist/utils/promptLogHelper.js.map +1 -0
  720. package/dist/utils/queryAnchors.js +71 -0
  721. package/dist/utils/queryAnchors.js.map +1 -0
  722. package/dist/utils/repoIdentity.js +82 -0
  723. package/dist/utils/repoIdentity.js.map +1 -0
  724. package/dist/utils/repoKey.js +1 -0
  725. package/dist/utils/repoKey.js.map +1 -0
  726. package/dist/utils/resolveTargetsToFiles.js +1 -0
  727. package/dist/utils/resolveTargetsToFiles.js.map +1 -0
  728. package/dist/utils/resumeContext.js +219 -0
  729. package/dist/utils/resumeContext.js.map +1 -0
  730. package/dist/utils/resumeState.js +310 -0
  731. package/dist/utils/resumeState.js.map +1 -0
  732. package/dist/utils/rollingPlan.js +118 -0
  733. package/dist/utils/rollingPlan.js.map +1 -0
  734. package/dist/utils/runQueryWithDaemonControl.js +11 -3
  735. package/dist/utils/runQueryWithDaemonControl.js.map +1 -0
  736. package/dist/utils/runtimeLogger.js +252 -0
  737. package/dist/utils/runtimeLogger.js.map +1 -0
  738. package/dist/utils/sanitizeQuery.js +1 -0
  739. package/dist/utils/sanitizeQuery.js.map +1 -0
  740. package/dist/utils/sharedUtils.js +1 -0
  741. package/dist/utils/sharedUtils.js.map +1 -0
  742. package/dist/utils/sleep.js +1 -0
  743. package/dist/utils/sleep.js.map +1 -0
  744. package/dist/utils/splitCodeIntoChunk.js +1 -0
  745. package/dist/utils/splitCodeIntoChunk.js.map +1 -0
  746. package/dist/utils/time.js +66 -0
  747. package/dist/utils/time.js.map +1 -0
  748. package/dist/utils/verifyFocusPreference.js +107 -0
  749. package/dist/utils/verifyFocusPreference.js.map +1 -0
  750. package/dist/utils/vscode.js +1 -0
  751. package/dist/utils/vscode.js.map +1 -0
  752. package/dist/workflow/workflowResolver.js +1 -0
  753. package/dist/workflow/workflowResolver.js.map +1 -0
  754. package/dist/workflow/workflowRunner.js +1 -0
  755. package/dist/workflow/workflowRunner.js.map +1 -0
  756. package/package.json +3 -3
  757. package/dist/agents/MainAgent.js +0 -1886
  758. package/dist/agents/contextReviewStep.js +0 -101
  759. package/dist/agents/finalPlanGenStep.js +0 -107
  760. package/dist/agents/structuralAnalysisStep.js +0 -46
  761. package/dist/agents/validationAnalysisStep.js +0 -87
  762. package/dist/pipeline/modules/chunkManagerModule.js +0 -24
  763. package/dist/pipeline/modules/cleanGeneratedTestsModule.js +0 -33
  764. package/dist/pipeline/modules/fileReaderModule.js +0 -72
  765. package/dist/pipeline/modules/gatherInfoModule.js +0 -181
  766. package/dist/pipeline/modules/generateTestsModule.js +0 -68
  767. package/dist/pipeline/modules/preserveCodeModule.js +0 -195
  768. package/dist/pipeline/modules/refactorModule.js +0 -40
  769. package/dist/pipeline/modules/repairTestsModule.js +0 -48
  770. package/dist/pipeline/modules/runTestsModule.js +0 -37
@@ -0,0 +1,244 @@
1
+ /**
2
+ * Verifies that context eval flags repeated planner prompts, prompt bloat, and missing decomposition.
3
+ *
4
+ * Why this exists:
5
+ * - context audit rules should stay deterministic across saved trace shapes
6
+ * - planner retries and final-answer prompt growth are easy to reintroduce during routing work
7
+ * - multi-question queries need explicit regression coverage so they do not collapse silently
8
+ */
9
+ import { beforeEach, describe, expect, it, vi } from "vitest";
10
+ const state = vi.hoisted(() => ({
11
+ dirEntries: new Map(),
12
+ fileContents: new Map(),
13
+ }));
14
+ vi.mock("fs", () => ({
15
+ default: {
16
+ existsSync: vi.fn((filePath) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),
17
+ readFileSync: vi.fn((filePath) => state.fileContents.get(filePath) ?? ""),
18
+ readdirSync: vi.fn((dirPath, options) => {
19
+ const entries = state.dirEntries.get(dirPath) ?? [];
20
+ if (options?.withFileTypes) {
21
+ return entries.map((name) => ({
22
+ name,
23
+ isDirectory: () => true,
24
+ }));
25
+ }
26
+ return entries;
27
+ }),
28
+ },
29
+ existsSync: vi.fn((filePath) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),
30
+ readFileSync: vi.fn((filePath) => state.fileContents.get(filePath) ?? ""),
31
+ readdirSync: vi.fn((dirPath, options) => {
32
+ const entries = state.dirEntries.get(dirPath) ?? [];
33
+ if (options?.withFileTypes) {
34
+ return entries.map((name) => ({
35
+ name,
36
+ isDirectory: () => true,
37
+ }));
38
+ }
39
+ return entries;
40
+ }),
41
+ }));
42
+ vi.mock("../../utils/repoIdentity.js", () => ({
43
+ resolveCanonicalRepoIdentity: vi.fn(() => ({
44
+ repoRootPath: "/repo",
45
+ })),
46
+ }));
47
+ import { buildContextEval } from "../../testing/contextEval.js";
48
+ describe("contextEval", () => {
49
+ beforeEach(() => {
50
+ state.dirEntries = new Map();
51
+ state.fileContents = new Map();
52
+ });
53
+ it("warns when planner retries reuse identical prompts", () => {
54
+ state.dirEntries.set("/artifact/llm_calls", [
55
+ "0006_analysisPlanGenStep.json",
56
+ "0007_analysisPlanGenStep.json",
57
+ ]);
58
+ const promptText = "User query:\nsummarize architecture\nAllowed actions:\n[semanticAnalysis]";
59
+ for (const fileName of ["0006_analysisPlanGenStep.json", "0007_analysisPlanGenStep.json"]) {
60
+ state.fileContents.set(`/artifact/llm_calls/${fileName}`, JSON.stringify({
61
+ callId: `llm-${fileName.slice(0, 4)}-analysisPlanGenStep`,
62
+ caller: "analysisPlanGenStep",
63
+ query: "summarize architecture",
64
+ promptText,
65
+ inputContext: {},
66
+ }, null, 2));
67
+ }
68
+ const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
69
+ const duplicateCheck = result.checks.find((check) => check.name === "duplicate-replan-calls");
70
+ expect(duplicateCheck?.ok).toBe(false);
71
+ expect(duplicateCheck?.finding?.actualContext).toContain("2 identical analysisPlanGenStep prompts");
72
+ });
73
+ it("warns when progress state records stalled planner retries", () => {
74
+ state.dirEntries.set("/artifact/llm_calls", ["0001_analysisPlanGenStep.json"]);
75
+ state.fileContents.set("/artifact/llm_calls/0001_analysisPlanGenStep.json", JSON.stringify({
76
+ callId: "llm-0001-analysisPlanGenStep",
77
+ caller: "analysisPlanGenStep",
78
+ query: "Explain how tests run",
79
+ promptText: "Prompt",
80
+ inputContext: {},
81
+ }, null, 2));
82
+ const divider = "=".repeat(68);
83
+ const runLog = [
84
+ "📂 OUTPUT | progressState",
85
+ divider,
86
+ JSON.stringify({
87
+ research: {
88
+ status: "optional",
89
+ pendingSteps: [],
90
+ noNewInfoCount: 0,
91
+ reason: "No research is currently required. Planner retried the same target without frontier change (3 identical attempt(s)).",
92
+ plannerRetry: {
93
+ targetFile: "/repo/cli/src/testing/testCommands.ts",
94
+ signature: "sig:testCommands",
95
+ count: 3,
96
+ stalled: true,
97
+ reason: "Planner retried the same target without frontier change (3 identical attempt(s)).",
98
+ },
99
+ },
100
+ }, null, 2),
101
+ divider,
102
+ "",
103
+ ].join("\n");
104
+ const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog });
105
+ const stalledCheck = result.checks.find((check) => check.name === "stalled-planner-progress");
106
+ expect(stalledCheck?.ok).toBe(false);
107
+ expect(stalledCheck?.finding?.actualContext).toContain("target=/repo/cli/src/testing/testCommands.ts");
108
+ expect(stalledCheck?.finding?.actualContext).toContain("count=3");
109
+ });
110
+ it("warns when a continuity query carries a large resumed capsule", () => {
111
+ state.dirEntries.set("/artifact/llm_calls", ["0008_scopeClassificationStep.json"]);
112
+ state.fileContents.set("/artifact/llm_calls/0008_scopeClassificationStep.json", JSON.stringify({
113
+ callId: "llm-0008-scopeClassificationStep",
114
+ caller: "scopeClassificationStep",
115
+ query: "where were we?",
116
+ promptText: "User query:\nwhere were we?",
117
+ inputContext: {
118
+ resumedContextCapsule: "Original task:\n" + "x".repeat(400),
119
+ },
120
+ }, null, 2));
121
+ const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
122
+ const continuityCheck = result.checks.find((check) => check.name === "continuity-overprompting");
123
+ expect(continuityCheck?.ok).toBe(false);
124
+ expect(continuityCheck?.finding?.details).toContain("short continuity query");
125
+ });
126
+ it("warns when final grounding carries oversized supporting excerpts", () => {
127
+ state.dirEntries.set("/artifact/llm_calls", ["0010_finalAnswerModule.json"]);
128
+ state.fileContents.set("/artifact/llm_calls/0010_finalAnswerModule.json", JSON.stringify({
129
+ callId: "llm-0010-finalAnswerModule",
130
+ caller: "finalAnswerModule",
131
+ query: "Where are SQLite queries defined?",
132
+ promptText: "User query:\nWhere are SQLite queries defined?",
133
+ inputContext: {
134
+ supportingExcerpts: [
135
+ {
136
+ filePath: "/repo/cli/src/db/fileIndex.ts",
137
+ excerpts: ["a".repeat(1600)],
138
+ },
139
+ {
140
+ filePath: "/repo/cli/src/db/client.ts",
141
+ excerpts: ["b".repeat(700)],
142
+ },
143
+ ],
144
+ },
145
+ }, null, 2));
146
+ const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
147
+ const sizeCheck = result.checks.find((check) => check.name === "oversized-final-grounding-context");
148
+ expect(sizeCheck?.ok).toBe(false);
149
+ expect(sizeCheck?.finding?.actualContext).toContain("supporting excerpts chars=2300");
150
+ });
151
+ it("warns when adjacent planner retries reuse the same rationale but change other prompt sections", () => {
152
+ state.dirEntries.set("/artifact/llm_calls", [
153
+ "0006_analysisPlanGenStep.json",
154
+ "0007_analysisPlanGenStep.json",
155
+ ]);
156
+ state.fileContents.set("/artifact/llm_calls/0006_analysisPlanGenStep.json", JSON.stringify({
157
+ callId: "llm-0006-analysisPlanGenStep",
158
+ caller: "analysisPlanGenStep",
159
+ query: "Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?",
160
+ promptText: "Prompt A",
161
+ inputContext: {
162
+ targetFile: "/repo/cli/src/db/fileIndex.ts",
163
+ rationaleText: "Both files are relevant to the SQLite query definitions.",
164
+ allowedActions: [
165
+ { actionId: "semanticAnalysis" },
166
+ { actionId: "read-file" },
167
+ { actionId: "research-impact-map" },
168
+ { actionId: "research-symbol-trace" },
169
+ { actionId: "research-risk-check" },
170
+ { actionId: "research-architecture-synthesis" },
171
+ ],
172
+ },
173
+ }, null, 2));
174
+ state.fileContents.set("/artifact/llm_calls/0007_analysisPlanGenStep.json", JSON.stringify({
175
+ callId: "llm-0007-analysisPlanGenStep",
176
+ caller: "analysisPlanGenStep",
177
+ query: "Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?",
178
+ promptText: "Prompt B",
179
+ inputContext: {
180
+ targetFile: "/repo/cli/src/db/fileIndex.ts",
181
+ rationaleText: "Both files are relevant to the SQLite query definitions.",
182
+ allowedActions: [
183
+ { actionId: "semanticAnalysis" },
184
+ { actionId: "read-file" },
185
+ { actionId: "research-impact-map" },
186
+ { actionId: "research-symbol-trace" },
187
+ { actionId: "research-risk-check" },
188
+ { actionId: "research-architecture-synthesis" },
189
+ ],
190
+ },
191
+ }, null, 2));
192
+ const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
193
+ const rationaleCheck = result.checks.find((check) => check.name === "stale-planner-rationale");
194
+ const catalogCheck = result.checks.find((check) => check.name === "repeated-planner-action-catalog");
195
+ expect(rationaleCheck?.ok).toBe(false);
196
+ expect(rationaleCheck?.finding?.details).toContain("same focus rationale");
197
+ expect(catalogCheck?.ok).toBe(false);
198
+ expect(catalogCheck?.finding?.actualContext).toContain("6 actions repeated");
199
+ });
200
+ it("warns when a multi-part query never becomes ordered question parts", () => {
201
+ state.dirEntries.set("/artifact/llm_calls", [
202
+ "0001_understandIntentStep.json",
203
+ "0002_scopeClassificationStep.json",
204
+ "0006_analysisPlanGenStep.json",
205
+ ]);
206
+ state.fileContents.set("/artifact/llm_calls/0001_understandIntentStep.json", JSON.stringify({
207
+ callId: "llm-0001-understandIntentStep",
208
+ caller: "understandIntentStep",
209
+ query: "Where is search routed? How is verify triggered?",
210
+ promptText: "User query:\nWhere is search routed? How is verify triggered?",
211
+ inputContext: {
212
+ userQuery: "Where is search routed? How is verify triggered?",
213
+ },
214
+ }, null, 2));
215
+ state.fileContents.set("/artifact/llm_calls/0002_scopeClassificationStep.json", JSON.stringify({
216
+ callId: "llm-0002-scopeClassificationStep",
217
+ caller: "scopeClassificationStep",
218
+ query: "Where is search routed? How is verify triggered?",
219
+ promptText: "User query:\nWhere is search routed? How is verify triggered?",
220
+ inputContext: {
221
+ query: "Where is search routed? How is verify triggered?",
222
+ },
223
+ }, null, 2));
224
+ state.fileContents.set("/artifact/llm_calls/0006_analysisPlanGenStep.json", JSON.stringify({
225
+ callId: "llm-0006-analysisPlanGenStep",
226
+ caller: "analysisPlanGenStep",
227
+ query: "Where is search routed? How is verify triggered?",
228
+ promptText: "Prompt",
229
+ inputContext: {
230
+ orderedQuestions: [
231
+ {
232
+ id: "q1",
233
+ text: "Where is search routed? How is verify triggered?",
234
+ },
235
+ ],
236
+ },
237
+ }, null, 2));
238
+ const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
239
+ const questionCheck = result.checks.find((check) => check.name === "missing-question-decomposition");
240
+ expect(questionCheck?.ok).toBe(false);
241
+ expect(questionCheck?.finding?.actualContext).toContain("max orderedQuestions=1");
242
+ });
243
+ });
244
+ //# sourceMappingURL=contextEval.test.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"contextEval.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/contextEval.test.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AACH,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,KAAK,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IAC9B,UAAU,EAAE,IAAI,GAAG,EAAoB;IACvC,YAAY,EAAE,IAAI,GAAG,EAAkB;CACxC,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,IAAI,EAAE,GAAG,EAAE,CAAC,CAAC;IACnB,OAAO,EAAE;QACP,UAAU,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;QAC3G,YAAY,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAC;QACjF,WAAW,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,OAAe,EAAE,OAAqC,EAAE,EAAE;YAC5E,MAAM,OAAO,GAAG,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;YACpD,IAAI,OAAO,EAAE,aAAa,EAAE,CAAC;gBAC3B,OAAO,OAAO,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC;oBAC5B,IAAI;oBACJ,WAAW,EAAE,GAAG,EAAE,CAAC,IAAI;iBACxB,CAAC,CAAC,CAAC;YACN,CAAC;YACD,OAAO,OAAO,CAAC;QACjB,CAAC,CAAC;KACH;IACD,UAAU,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;IAC3G,YAAY,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAC;IACjF,WAAW,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,OAAe,EAAE,OAAqC,EAAE,EAAE;QAC5E,MAAM,OAAO,GAAG,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;QACpD,IAAI,OAAO,EAAE,aAAa,EAAE,CAAC;YAC3B,OAAO,OAAO,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC;gBAC5B,IAAI;gBACJ,WAAW,EAAE,GAAG,EAAE,CAAC,IAAI;aACxB,CAAC,CAAC,CAAC;QACN,CAAC;QACD,OAAO,OAAO,CAAC;IACjB,CAAC,CAAC;CACH,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,6BAA6B,EAAE,GAAG,EAAE,CAAC,CAAC;IAC5C,4BAA4B,EAAE,EAAE,CAAC,EAAE,CAAC,GAAG,EAAE,CAAC,CAAC;QACzC,YAAY,EAAE,OAAO;KACtB,CAAC,CAAC;CACJ,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,gBAAgB,EAAE,MAAM,8BAA8B,CAAC;AAEhE,QAAQ,CAAC,aAAa,EAAE,GAAG,EAAE;IAC3B,UAAU,CAA
C,GAAG,EAAE;QACd,KAAK,CAAC,UAAU,GAAG,IAAI,GAAG,EAAE,CAAC;QAC7B,KAAK,CAAC,YAAY,GAAG,IAAI,GAAG,EAAE,CAAC;IACjC,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,oDAAoD,EAAE,GAAG,EAAE;QAC5D,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE;YAC1C,+BAA+B;YAC/B,+BAA+B;SAChC,CAAC,CAAC;QACH,MAAM,UAAU,GAAG,2EAA2E,CAAC;QAC/F,KAAK,MAAM,QAAQ,IAAI,CAAC,+BAA+B,EAAE,+BAA+B,CAAC,EAAE,CAAC;YAC1F,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,uBAAuB,QAAQ,EAAE,EACjC,IAAI,CAAC,SAAS,CACZ;gBACE,MAAM,EAAE,OAAO,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,sBAAsB;gBACzD,MAAM,EAAE,qBAAqB;gBAC7B,KAAK,EAAE,wBAAwB;gBAC/B,UAAU;gBACV,YAAY,EAAE,EAAE;aACjB,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACJ,CAAC;QAED,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,cAAc,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,wBAAwB,CAAC,CAAC;QAE9F,MAAM,CAAC,cAAc,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACvC,MAAM,CAAC,cAAc,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,yCAAyC,CAAC,CAAC;IACtG,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,2DAA2D,EAAE,GAAG,EAAE;QACnE,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE,CAAC,+BAA+B,CAAC,CAAC,CAAC;QAC/E,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,uBAAuB;YAC9B,UAAU,EAAE,QAAQ;YACpB,YAAY,EAAE,EAAE;SACjB,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,MAAM,OAAO,GAAG,GAAG,CAAC,MAAM,CAAC,EAAE,CAAC,CAAC;QAC/B,MAAM,MAAM,GAAG;YACb,2BAA2B;YAC3B,OAAO;YACP,IAAI,CAAC,SAAS,CACZ;gBACE,QAAQ,EAAE;oBACR,MAAM,EAAE,UAAU;oBAClB,YAAY,EAAE,EAAE;oBAChB,cAAc,EAAE,CAAC;oBACjB,MAAM,EAAE,sHAAsH;oBAC9H,YAAY,EAAE;wBACZ,UAAU,EAAE,uCAAuC;wBACnD,SAAS,EAAE,kBAAkB;wBAC7B,KAAK,EAAE,CAAC;wBACR,OAAO,EAAE,IAAI;wBACb,MAAM,EAAE,mFAAmF;qBAC5F;iBACF;aACF,EACD,IAAI,EACJ,CAAC,CACF;YACD,OAAO;YACP,EAAE;SACH,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAEb,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,CAAC,CAAC;QACjF,MAAM,YAAY,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,0BAA
0B,CAAC,CAAC;QAE9F,MAAM,CAAC,YAAY,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACrC,MAAM,CAAC,YAAY,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,8CAA8C,CAAC,CAAC;QACvG,MAAM,CAAC,YAAY,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,SAAS,CAAC,CAAC;IACpE,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,+DAA+D,EAAE,GAAG,EAAE;QACvE,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE,CAAC,mCAAmC,CAAC,CAAC,CAAC;QACnF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,uDAAuD,EACvD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,kCAAkC;YAC1C,MAAM,EAAE,yBAAyB;YACjC,KAAK,EAAE,gBAAgB;YACvB,UAAU,EAAE,6BAA6B;YACzC,YAAY,EAAE;gBACZ,qBAAqB,EAAE,kBAAkB,GAAG,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC;aAC5D;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,eAAe,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,0BAA0B,CAAC,CAAC;QAEjG,MAAM,CAAC,eAAe,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACxC,MAAM,CAAC,eAAe,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,wBAAwB,CAAC,CAAC;IAChF,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,kEAAkE,EAAE,GAAG,EAAE;QAC1E,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE,CAAC,6BAA6B,CAAC,CAAC,CAAC;QAC7E,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,iDAAiD,EACjD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,4BAA4B;YACpC,MAAM,EAAE,mBAAmB;YAC3B,KAAK,EAAE,mCAAmC;YAC1C,UAAU,EAAE,gDAAgD;YAC5D,YAAY,EAAE;gBACZ,kBAAkB,EAAE;oBAClB;wBACE,QAAQ,EAAE,+BAA+B;wBACzC,QAAQ,EAAE,CAAC,GAAG,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;qBAC7B;oBACD;wBACE,QAAQ,EAAE,4BAA4B;wBACtC,QAAQ,EAAE,CAAC,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC;qBAC5B;iBACF;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,SAAS,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,mCAAmC,CAAC,CAAC;QAEpG,MAAM,CAAC,SAAS,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAClC,MAAM,CAAC,SAAS,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,gCAAgC,CAAC,CAAC;IACxF,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,+FAA+F,EAAE,GAAG,EAAE
;QACvG,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE;YAC1C,+BAA+B;YAC/B,+BAA+B;SAChC,CAAC,CAAC;QACH,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,uEAAuE;YAC9E,UAAU,EAAE,UAAU;YACtB,YAAY,EAAE;gBACZ,UAAU,EAAE,+BAA+B;gBAC3C,aAAa,EAAE,0DAA0D;gBACzE,cAAc,EAAE;oBACd,EAAE,QAAQ,EAAE,kBAAkB,EAAE;oBAChC,EAAE,QAAQ,EAAE,WAAW,EAAE;oBACzB,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,uBAAuB,EAAE;oBACrC,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,iCAAiC,EAAE;iBAChD;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,uEAAuE;YAC9E,UAAU,EAAE,UAAU;YACtB,YAAY,EAAE;gBACZ,UAAU,EAAE,+BAA+B;gBAC3C,aAAa,EAAE,0DAA0D;gBACzE,cAAc,EAAE;oBACd,EAAE,QAAQ,EAAE,kBAAkB,EAAE;oBAChC,EAAE,QAAQ,EAAE,WAAW,EAAE;oBACzB,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,uBAAuB,EAAE;oBACrC,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,iCAAiC,EAAE;iBAChD;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,cAAc,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,yBAAyB,CAAC,CAAC;QAC/F,MAAM,YAAY,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,iCAAiC,CAAC,CAAC;QAErG,MAAM,CAAC,cAAc,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACvC,MAAM,CAAC,cAAc,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,sBAAsB,CAAC,CAAC;QAC3E,MAAM,CAAC,YAAY,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACrC,MAAM,CAAC,YAAY,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,oBAAoB,CAAC,CAAC;IAC/E,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,oEAAoE,EAAE,GAAG,EAAE;QAC5E,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE;YAC1C,gCAAgC;YAChC,mCAAmC;YACnC,+BAA+B;SAChC,CAAC,CAAC;QACH,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,oDAAoD,EACpD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,+BAA+B;YACvC,MAAM,EAAE,sBAAsB;YAC9B,KAAK,EAAE,kDAAkD;YACzD,UA
AU,EAAE,+DAA+D;YAC3E,YAAY,EAAE;gBACZ,SAAS,EAAE,kDAAkD;aAC9D;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,uDAAuD,EACvD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,kCAAkC;YAC1C,MAAM,EAAE,yBAAyB;YACjC,KAAK,EAAE,kDAAkD;YACzD,UAAU,EAAE,+DAA+D;YAC3E,YAAY,EAAE;gBACZ,KAAK,EAAE,kDAAkD;aAC1D;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,kDAAkD;YACzD,UAAU,EAAE,QAAQ;YACpB,YAAY,EAAE;gBACZ,gBAAgB,EAAE;oBAChB;wBACE,EAAE,EAAE,IAAI;wBACR,IAAI,EAAE,kDAAkD;qBACzD;iBACF;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,aAAa,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,gCAAgC,CAAC,CAAC;QAErG,MAAM,CAAC,aAAa,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACtC,MAAM,CAAC,aAAa,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,wBAAwB,CAAC,CAAC;IACpF,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n * Verifies that context eval flags repeated planner prompts, prompt bloat, and missing decomposition.\n *\n * Why this exists:\n * - context audit rules should stay deterministic across saved trace shapes\n * - planner retries and final-answer prompt growth are easy to reintroduce during routing work\n * - multi-question queries need explicit regression coverage so they do not collapse silently\n */\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst state = vi.hoisted(() => ({\n dirEntries: new Map<string, string[]>(),\n fileContents: new Map<string, string>(),\n}));\n\nvi.mock(\"fs\", () => ({\n default: {\n existsSync: vi.fn((filePath: string) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),\n readFileSync: vi.fn((filePath: string) => state.fileContents.get(filePath) ?? 
\"\"),\n readdirSync: vi.fn((dirPath: string, options?: { withFileTypes?: boolean }) => {\n const entries = state.dirEntries.get(dirPath) ?? [];\n if (options?.withFileTypes) {\n return entries.map((name) => ({\n name,\n isDirectory: () => true,\n }));\n }\n return entries;\n }),\n },\n existsSync: vi.fn((filePath: string) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),\n readFileSync: vi.fn((filePath: string) => state.fileContents.get(filePath) ?? \"\"),\n readdirSync: vi.fn((dirPath: string, options?: { withFileTypes?: boolean }) => {\n const entries = state.dirEntries.get(dirPath) ?? [];\n if (options?.withFileTypes) {\n return entries.map((name) => ({\n name,\n isDirectory: () => true,\n }));\n }\n return entries;\n }),\n}));\n\nvi.mock(\"../../utils/repoIdentity.js\", () => ({\n resolveCanonicalRepoIdentity: vi.fn(() => ({\n repoRootPath: \"/repo\",\n })),\n}));\n\nimport { buildContextEval } from \"../../testing/contextEval.js\";\n\ndescribe(\"contextEval\", () => {\n beforeEach(() => {\n state.dirEntries = new Map();\n state.fileContents = new Map();\n });\n\n it(\"warns when planner retries reuse identical prompts\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\n \"0006_analysisPlanGenStep.json\",\n \"0007_analysisPlanGenStep.json\",\n ]);\n const promptText = \"User query:\\nsummarize architecture\\nAllowed actions:\\n[semanticAnalysis]\";\n for (const fileName of [\"0006_analysisPlanGenStep.json\", \"0007_analysisPlanGenStep.json\"]) {\n state.fileContents.set(\n `/artifact/llm_calls/${fileName}`,\n JSON.stringify(\n {\n callId: `llm-${fileName.slice(0, 4)}-analysisPlanGenStep`,\n caller: \"analysisPlanGenStep\",\n query: \"summarize architecture\",\n promptText,\n inputContext: {},\n },\n null,\n 2\n )\n );\n }\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const duplicateCheck = result.checks.find((check) => check.name === \"duplicate-replan-calls\");\n\n 
expect(duplicateCheck?.ok).toBe(false);\n expect(duplicateCheck?.finding?.actualContext).toContain(\"2 identical analysisPlanGenStep prompts\");\n });\n\n it(\"warns when progress state records stalled planner retries\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\"0001_analysisPlanGenStep.json\"]);\n state.fileContents.set(\n \"/artifact/llm_calls/0001_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0001-analysisPlanGenStep\",\n caller: \"analysisPlanGenStep\",\n query: \"Explain how tests run\",\n promptText: \"Prompt\",\n inputContext: {},\n },\n null,\n 2\n )\n );\n const divider = \"=\".repeat(68);\n const runLog = [\n \"📂 OUTPUT | progressState\",\n divider,\n JSON.stringify(\n {\n research: {\n status: \"optional\",\n pendingSteps: [],\n noNewInfoCount: 0,\n reason: \"No research is currently required. Planner retried the same target without frontier change (3 identical attempt(s)).\",\n plannerRetry: {\n targetFile: \"/repo/cli/src/testing/testCommands.ts\",\n signature: \"sig:testCommands\",\n count: 3,\n stalled: true,\n reason: \"Planner retried the same target without frontier change (3 identical attempt(s)).\",\n },\n },\n },\n null,\n 2\n ),\n divider,\n \"\",\n ].join(\"\\n\");\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog });\n const stalledCheck = result.checks.find((check) => check.name === \"stalled-planner-progress\");\n\n expect(stalledCheck?.ok).toBe(false);\n expect(stalledCheck?.finding?.actualContext).toContain(\"target=/repo/cli/src/testing/testCommands.ts\");\n expect(stalledCheck?.finding?.actualContext).toContain(\"count=3\");\n });\n\n it(\"warns when a continuity query carries a large resumed capsule\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\"0008_scopeClassificationStep.json\"]);\n state.fileContents.set(\n \"/artifact/llm_calls/0008_scopeClassificationStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0008-scopeClassificationStep\",\n caller: 
\"scopeClassificationStep\",\n query: \"where were we?\",\n promptText: \"User query:\\nwhere were we?\",\n inputContext: {\n resumedContextCapsule: \"Original task:\\n\" + \"x\".repeat(400),\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const continuityCheck = result.checks.find((check) => check.name === \"continuity-overprompting\");\n\n expect(continuityCheck?.ok).toBe(false);\n expect(continuityCheck?.finding?.details).toContain(\"short continuity query\");\n });\n\n it(\"warns when final grounding carries oversized supporting excerpts\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\"0010_finalAnswerModule.json\"]);\n state.fileContents.set(\n \"/artifact/llm_calls/0010_finalAnswerModule.json\",\n JSON.stringify(\n {\n callId: \"llm-0010-finalAnswerModule\",\n caller: \"finalAnswerModule\",\n query: \"Where are SQLite queries defined?\",\n promptText: \"User query:\\nWhere are SQLite queries defined?\",\n inputContext: {\n supportingExcerpts: [\n {\n filePath: \"/repo/cli/src/db/fileIndex.ts\",\n excerpts: [\"a\".repeat(1600)],\n },\n {\n filePath: \"/repo/cli/src/db/client.ts\",\n excerpts: [\"b\".repeat(700)],\n },\n ],\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const sizeCheck = result.checks.find((check) => check.name === \"oversized-final-grounding-context\");\n\n expect(sizeCheck?.ok).toBe(false);\n expect(sizeCheck?.finding?.actualContext).toContain(\"supporting excerpts chars=2300\");\n });\n\n it(\"warns when adjacent planner retries reuse the same rationale but change other prompt sections\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\n \"0006_analysisPlanGenStep.json\",\n \"0007_analysisPlanGenStep.json\",\n ]);\n state.fileContents.set(\n \"/artifact/llm_calls/0006_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0006-analysisPlanGenStep\",\n 
caller: \"analysisPlanGenStep\",\n query: \"Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?\",\n promptText: \"Prompt A\",\n inputContext: {\n targetFile: \"/repo/cli/src/db/fileIndex.ts\",\n rationaleText: \"Both files are relevant to the SQLite query definitions.\",\n allowedActions: [\n { actionId: \"semanticAnalysis\" },\n { actionId: \"read-file\" },\n { actionId: \"research-impact-map\" },\n { actionId: \"research-symbol-trace\" },\n { actionId: \"research-risk-check\" },\n { actionId: \"research-architecture-synthesis\" },\n ],\n },\n },\n null,\n 2\n )\n );\n state.fileContents.set(\n \"/artifact/llm_calls/0007_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0007-analysisPlanGenStep\",\n caller: \"analysisPlanGenStep\",\n query: \"Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?\",\n promptText: \"Prompt B\",\n inputContext: {\n targetFile: \"/repo/cli/src/db/fileIndex.ts\",\n rationaleText: \"Both files are relevant to the SQLite query definitions.\",\n allowedActions: [\n { actionId: \"semanticAnalysis\" },\n { actionId: \"read-file\" },\n { actionId: \"research-impact-map\" },\n { actionId: \"research-symbol-trace\" },\n { actionId: \"research-risk-check\" },\n { actionId: \"research-architecture-synthesis\" },\n ],\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const rationaleCheck = result.checks.find((check) => check.name === \"stale-planner-rationale\");\n const catalogCheck = result.checks.find((check) => check.name === \"repeated-planner-action-catalog\");\n\n expect(rationaleCheck?.ok).toBe(false);\n expect(rationaleCheck?.finding?.details).toContain(\"same focus rationale\");\n expect(catalogCheck?.ok).toBe(false);\n expect(catalogCheck?.finding?.actualContext).toContain(\"6 actions repeated\");\n });\n\n it(\"warns when a multi-part query never becomes ordered question parts\", () => {\n 
state.dirEntries.set(\"/artifact/llm_calls\", [\n \"0001_understandIntentStep.json\",\n \"0002_scopeClassificationStep.json\",\n \"0006_analysisPlanGenStep.json\",\n ]);\n state.fileContents.set(\n \"/artifact/llm_calls/0001_understandIntentStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0001-understandIntentStep\",\n caller: \"understandIntentStep\",\n query: \"Where is search routed? How is verify triggered?\",\n promptText: \"User query:\\nWhere is search routed? How is verify triggered?\",\n inputContext: {\n userQuery: \"Where is search routed? How is verify triggered?\",\n },\n },\n null,\n 2\n )\n );\n state.fileContents.set(\n \"/artifact/llm_calls/0002_scopeClassificationStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0002-scopeClassificationStep\",\n caller: \"scopeClassificationStep\",\n query: \"Where is search routed? How is verify triggered?\",\n promptText: \"User query:\\nWhere is search routed? How is verify triggered?\",\n inputContext: {\n query: \"Where is search routed? How is verify triggered?\",\n },\n },\n null,\n 2\n )\n );\n state.fileContents.set(\n \"/artifact/llm_calls/0006_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0006-analysisPlanGenStep\",\n caller: \"analysisPlanGenStep\",\n query: \"Where is search routed? How is verify triggered?\",\n promptText: \"Prompt\",\n inputContext: {\n orderedQuestions: [\n {\n id: \"q1\",\n text: \"Where is search routed? How is verify triggered?\",\n },\n ],\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const questionCheck = result.checks.find((check) => check.name === \"missing-question-decomposition\");\n\n expect(questionCheck?.ok).toBe(false);\n expect(questionCheck?.finding?.actualContext).toContain(\"max orderedQuestions=1\");\n });\n});\n"]}
@@ -0,0 +1,124 @@
1
+ /**
2
+ * Verifies that saved harness artifacts include diagnosis data and Markdown reports.
3
+ *
4
+ * Why this exists:
5
+ * - artifact folders should be reviewable without rerunning the agent
6
+ * - diagnosis.json is the quick pointer to the likely subsystem
7
+ * - report.md should preserve Mermaid blocks for artifact viewers
8
+ * - artifact folder timestamps should stay in local time with offset, not UTC `Z`
9
+ * - the writer should persist both files for saved runs
10
+ */
11
+ import { beforeEach, describe, expect, it, vi } from "vitest";
12
+ const state = vi.hoisted(() => ({
13
+ task: {
14
+ id: 7,
15
+ status: "deferred",
16
+ initial_query: "Explain cli/src/agents/MainAgent.ts",
17
+ summary: "answer",
18
+ routing_decision_json: JSON.stringify({
19
+ allowSearch: false,
20
+ allowResearch: false,
21
+ allowTransform: false,
22
+ rationale: "route=explicit-target",
23
+ }),
24
+ },
25
+ steps: [],
26
+ writes: [],
27
+ }));
28
+ vi.mock("fs", () => ({
29
+ default: {
30
+ mkdirSync: vi.fn(),
31
+ writeFileSync: vi.fn((filePath, content) => {
32
+ state.writes.push({ path: filePath, content: String(content) });
33
+ }),
34
+ },
35
+ mkdirSync: vi.fn(),
36
+ writeFileSync: vi.fn((filePath, content) => {
37
+ state.writes.push({ path: filePath, content: String(content) });
38
+ }),
39
+ }));
40
+ vi.mock("../../db/client.js", () => ({
41
+ getDbForRepo: vi.fn(() => ({
42
+ prepare: vi.fn((sql) => ({
43
+ get: () => (sql.includes("FROM tasks") ? state.task : undefined),
44
+ all: () => (sql.includes("FROM steps") ? state.steps : []),
45
+ })),
46
+ })),
47
+ }));
48
+ vi.mock("../../utils/repoIdentity.js", () => ({
49
+ resolveCanonicalRepoIdentity: vi.fn(() => ({
50
+ repoRootPath: "/repo",
51
+ })),
52
+ }));
53
+ import { writeHarnessArtifacts } from "../../testing/harnessArtifacts.js";
54
+ describe("harnessArtifacts", () => {
55
+ beforeEach(() => {
56
+ state.writes = [];
57
+ });
58
+ it("writes diagnosis.json for saved runs", () => {
59
+ writeHarnessArtifacts({
60
+ kind: "evals",
61
+ caseId: "diagnosis_case",
62
+ query: "Explain cli/src/agents/MainAgent.ts",
63
+ taskId: 7,
64
+ runLog: [
65
+ "",
66
+ "====================================================================",
67
+ "📂 OUTPUT | finalAnswerModule",
68
+ "====================================================================",
69
+ JSON.stringify({ data: "answer" }, null, 2),
70
+ "====================================================================",
71
+ "",
72
+ ].join("\n"),
73
+ finalAnswerText: "answer",
74
+ result: {
75
+ id: "diagnosis_case",
76
+ passed: false,
77
+ failures: [],
78
+ },
79
+ });
80
+ const diagnosisWrite = state.writes.find((entry) => entry.path.endsWith("/diagnosis.json"));
81
+ expect(diagnosisWrite).toBeDefined();
82
+ expect(diagnosisWrite?.content).toContain("\"primaryCategory\": \"persistence\"");
83
+ });
84
+ it("writes report.md when report text is provided", () => {
85
+ writeHarnessArtifacts({
86
+ kind: "integration",
87
+ caseId: "markdown_report",
88
+ query: "summarize repo architecture",
89
+ taskId: 7,
90
+ runLog: "",
91
+ finalAnswerText: "answer",
92
+ reportText: "# Integration Report | 7\n\n```mermaid\nflowchart TD\n```",
93
+ result: {
94
+ id: "markdown_report",
95
+ passed: true,
96
+ failures: [],
97
+ },
98
+ });
99
+ const reportWrite = state.writes.find((entry) => entry.path.endsWith("/report.md"));
100
+ expect(reportWrite).toBeDefined();
101
+ expect(reportWrite?.content).toContain("```mermaid");
102
+ });
103
+ it("uses a local-time offset timestamp in generated artifact paths", () => {
104
+ writeHarnessArtifacts({
105
+ kind: "evals",
106
+ caseId: "timestamp_case",
107
+ query: "Explain cli/src/agents/MainAgent.ts",
108
+ taskId: 7,
109
+ runLog: "",
110
+ finalAnswerText: "answer",
111
+ result: {
112
+ id: "timestamp_case",
113
+ passed: true,
114
+ failures: [],
115
+ },
116
+ });
117
+ const caseWrite = state.writes.find((entry) => entry.path.endsWith("/case.json"));
118
+ expect(caseWrite).toBeDefined();
119
+ expect(caseWrite?.path).toContain("/repo/artifacts/evals/");
120
+ expect(caseWrite?.path).not.toContain("Z_timestamp_case");
121
+ expect(caseWrite?.path).toMatch(/[+-]\d{4}_timestamp_case\/case\.json$/);
122
+ });
123
+ });
124
+ //# sourceMappingURL=harnessArtifacts.test.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"harnessArtifacts.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/harnessArtifacts.test.ts"],"names":[],"mappings":"AAAA;;;;;;;;;GASG;AACH,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,KAAK,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IAC9B,IAAI,EAAE;QACJ,EAAE,EAAE,CAAC;QACL,MAAM,EAAE,UAAU;QAClB,aAAa,EAAE,qCAAqC;QACpD,OAAO,EAAE,QAAQ;QACjB,qBAAqB,EAAE,IAAI,CAAC,SAAS,CAAC;YACpC,WAAW,EAAE,KAAK;YAClB,aAAa,EAAE,KAAK;YACpB,cAAc,EAAE,KAAK;YACrB,SAAS,EAAE,uBAAuB;SACnC,CAAC;KACH;IACD,KAAK,EAAE,EAA+B;IACtC,MAAM,EAAE,EAA8C;CACvD,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,IAAI,EAAE,GAAG,EAAE,CAAC,CAAC;IACnB,OAAO,EAAE;QACP,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;QAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;YACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;QAClE,CAAC,CAAC;KACH;IACD,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;IAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;QACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;IAClE,CAAC,CAAC;CACH,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,oBAAoB,EAAE,GAAG,EAAE,CAAC,CAAC;IACnC,YAAY,EAAE,EAAE,CAAC,EAAE,CAAC,GAAG,EAAE,CAAC,CAAC;QACzB,OAAO,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,GAAW,EAAE,EAAE,CAAC,CAAC;YAC/B,GAAG,EAAE,GAAG,EAAE,CAAC,CAAC,GAAG,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,SAAS,CAAC;YAChE,GAAG,EAAE,GAAG,EAAE,CAAC,CAAC,GAAG,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC;SAC3D,CAAC,CAAC;KACJ,CAAC,CAAC;CACJ,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,6BAA6B,EAAE,GAAG,EAAE,CAAC,CAAC;IAC5C,4BAA4B,EAAE,EAAE,CAAC,EAAE,CAAC,GAAG,EAAE,CAAC,CAAC;QACzC,YAAY,EAAE,OAAO;KACtB,CAAC,CAAC;CACJ,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,qBAAqB,EAAE,MAAM,mCAAmC,CAAC;AAE1E,QAAQ,CAAC,kBAAkB,EAAE,GAAG,EAAE;IAChC,UAAU,CAAC,GAAG,EAAE;QACd,KAAK,CAAC,MAAM,GAAG,EAAE,CAAC;IACpB,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,sCAAsC,EAAE,
GAAG,EAAE;QAC9C,qBAAqB,CAAC;YACpB,IAAI,EAAE,OAAO;YACb,MAAM,EAAE,gBAAgB;YACxB,KAAK,EAAE,qCAAqC;YAC5C,MAAM,EAAE,CAAC;YACT,MAAM,EAAE;gBACN,EAAE;gBACF,sEAAsE;gBACtE,+BAA+B;gBAC/B,sEAAsE;gBACtE,IAAI,CAAC,SAAS,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,EAAE,IAAI,EAAE,CAAC,CAAC;gBAC3C,sEAAsE;gBACtE,EAAE;aACH,CAAC,IAAI,CAAC,IAAI,CAAC;YACZ,eAAe,EAAE,QAAQ;YACzB,MAAM,EAAE;gBACN,EAAE,EAAE,gBAAgB;gBACpB,MAAM,EAAE,KAAK;gBACb,QAAQ,EAAE,EAAE;aACb;SACF,CAAC,CAAC;QAEH,MAAM,cAAc,GAAG,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,iBAAiB,CAAC,CAAC,CAAC;QAC5F,MAAM,CAAC,cAAc,CAAC,CAAC,WAAW,EAAE,CAAC;QACrC,MAAM,CAAC,cAAc,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,sCAAsC,CAAC,CAAC;IACpF,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,+CAA+C,EAAE,GAAG,EAAE;QACvD,qBAAqB,CAAC;YACpB,IAAI,EAAE,aAAa;YACnB,MAAM,EAAE,iBAAiB;YACzB,KAAK,EAAE,6BAA6B;YACpC,MAAM,EAAE,CAAC;YACT,MAAM,EAAE,EAAE;YACV,eAAe,EAAE,QAAQ;YACzB,UAAU,EAAE,2DAA2D;YACvE,MAAM,EAAE;gBACN,EAAE,EAAE,iBAAiB;gBACrB,MAAM,EAAE,IAAI;gBACZ,QAAQ,EAAE,EAAE;aACb;SACF,CAAC,CAAC;QAEH,MAAM,WAAW,GAAG,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC;QACpF,MAAM,CAAC,WAAW,CAAC,CAAC,WAAW,EAAE,CAAC;QAClC,MAAM,CAAC,WAAW,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,YAAY,CAAC,CAAC;IACvD,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,gEAAgE,EAAE,GAAG,EAAE;QACxE,qBAAqB,CAAC;YACpB,IAAI,EAAE,OAAO;YACb,MAAM,EAAE,gBAAgB;YACxB,KAAK,EAAE,qCAAqC;YAC5C,MAAM,EAAE,CAAC;YACT,MAAM,EAAE,EAAE;YACV,eAAe,EAAE,QAAQ;YACzB,MAAM,EAAE;gBACN,EAAE,EAAE,gBAAgB;gBACpB,MAAM,EAAE,IAAI;gBACZ,QAAQ,EAAE,EAAE;aACb;SACF,CAAC,CAAC;QAEH,MAAM,SAAS,GAAG,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC;QAClF,MAAM,CAAC,SAAS,CAAC,CAAC,WAAW,EAAE,CAAC;QAChC,MAAM,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC,SAAS,CAAC,wBAAwB,CAAC,CAAC;QAC5D,MAAM,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC,GAAG,CAAC,SAAS,CAAC,kBAAkB,CAAC,CAAC;QAC1D,MAAM,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC,OAAO,CAAC,uCAAuC,CAAC,CAAC;IAC3E,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n
 * Verifies that saved harness artifacts include diagnosis data and Markdown reports.\n *\n * Why this exists:\n * - artifact folders should be reviewable without rerunning the agent\n * - diagnosis.json is the quick pointer to the likely subsystem\n * - report.md should preserve Mermaid blocks for artifact viewers\n * - artifact folder timestamps should stay in local time with offset, not UTC `Z`\n * - the writer should persist both files for saved runs\n */\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst state = vi.hoisted(() => ({\n task: {\n id: 7,\n status: \"deferred\",\n initial_query: \"Explain cli/src/agents/MainAgent.ts\",\n summary: \"answer\",\n routing_decision_json: JSON.stringify({\n allowSearch: false,\n allowResearch: false,\n allowTransform: false,\n rationale: \"route=explicit-target\",\n }),\n },\n steps: [] as Record<string, unknown>[],\n writes: [] as Array<{ path: string; content: string }>,\n}));\n\nvi.mock(\"fs\", () => ({\n default: {\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n },\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n}));\n\nvi.mock(\"../../db/client.js\", () => ({\n getDbForRepo: vi.fn(() => ({\n prepare: vi.fn((sql: string) => ({\n get: () => (sql.includes(\"FROM tasks\") ? state.task : undefined),\n all: () => (sql.includes(\"FROM steps\") ? 
state.steps : []),\n })),\n })),\n}));\n\nvi.mock(\"../../utils/repoIdentity.js\", () => ({\n resolveCanonicalRepoIdentity: vi.fn(() => ({\n repoRootPath: \"/repo\",\n })),\n}));\n\nimport { writeHarnessArtifacts } from \"../../testing/harnessArtifacts.js\";\n\ndescribe(\"harnessArtifacts\", () => {\n beforeEach(() => {\n state.writes = [];\n });\n\n it(\"writes diagnosis.json for saved runs\", () => {\n writeHarnessArtifacts({\n kind: \"evals\",\n caseId: \"diagnosis_case\",\n query: \"Explain cli/src/agents/MainAgent.ts\",\n taskId: 7,\n runLog: [\n \"\",\n \"====================================================================\",\n \"📂 OUTPUT | finalAnswerModule\",\n \"====================================================================\",\n JSON.stringify({ data: \"answer\" }, null, 2),\n \"====================================================================\",\n \"\",\n ].join(\"\\n\"),\n finalAnswerText: \"answer\",\n result: {\n id: \"diagnosis_case\",\n passed: false,\n failures: [],\n },\n });\n\n const diagnosisWrite = state.writes.find((entry) => entry.path.endsWith(\"/diagnosis.json\"));\n expect(diagnosisWrite).toBeDefined();\n expect(diagnosisWrite?.content).toContain(\"\\\"primaryCategory\\\": \\\"persistence\\\"\");\n });\n\n it(\"writes report.md when report text is provided\", () => {\n writeHarnessArtifacts({\n kind: \"integration\",\n caseId: \"markdown_report\",\n query: \"summarize repo architecture\",\n taskId: 7,\n runLog: \"\",\n finalAnswerText: \"answer\",\n reportText: \"# Integration Report | 7\\n\\n```mermaid\\nflowchart TD\\n```\",\n result: {\n id: \"markdown_report\",\n passed: true,\n failures: [],\n },\n });\n\n const reportWrite = state.writes.find((entry) => entry.path.endsWith(\"/report.md\"));\n expect(reportWrite).toBeDefined();\n expect(reportWrite?.content).toContain(\"```mermaid\");\n });\n\n it(\"uses a local-time offset timestamp in generated artifact paths\", () => {\n writeHarnessArtifacts({\n kind: \"evals\",\n caseId: 
\"timestamp_case\",\n query: \"Explain cli/src/agents/MainAgent.ts\",\n taskId: 7,\n runLog: \"\",\n finalAnswerText: \"answer\",\n result: {\n id: \"timestamp_case\",\n passed: true,\n failures: [],\n },\n });\n\n const caseWrite = state.writes.find((entry) => entry.path.endsWith(\"/case.json\"));\n expect(caseWrite).toBeDefined();\n expect(caseWrite?.path).toContain(\"/repo/artifacts/evals/\");\n expect(caseWrite?.path).not.toContain(\"Z_timestamp_case\");\n expect(caseWrite?.path).toMatch(/[+-]\\d{4}_timestamp_case\\/case\\.json$/);\n });\n});\n"]}
@@ -0,0 +1,67 @@
1
+ /**
2
+ * Verifies that integration trace sessions write numbered LLM input files with stable ids.
3
+ *
4
+ * Why this exists:
5
+ * - each model call should leave one reviewable JSON file on disk
6
+ * - repeated calls from the same caller must not overwrite each other
7
+ * - suspicious full-context inputs should be marked for later review
8
+ */
9
+ import { beforeEach, describe, expect, it, vi } from "vitest";
10
+ const state = vi.hoisted(() => ({
11
+ writes: [],
12
+ }));
13
+ vi.mock("fs", () => ({
14
+ default: {
15
+ mkdirSync: vi.fn(),
16
+ writeFileSync: vi.fn((filePath, content) => {
17
+ state.writes.push({ path: filePath, content: String(content) });
18
+ }),
19
+ },
20
+ mkdirSync: vi.fn(),
21
+ writeFileSync: vi.fn((filePath, content) => {
22
+ state.writes.push({ path: filePath, content: String(content) });
23
+ }),
24
+ }));
25
+ import { startLlmTraceSession, stopLlmTraceSession, writeLlmTraceRecord } from "../../testing/llmTraceSession.js";
26
+ describe("llmTraceSession", () => {
27
+ beforeEach(() => {
28
+ state.writes = [];
29
+ stopLlmTraceSession();
30
+ });
31
+ it("writes numbered trace files with stable call ids", () => {
32
+ startLlmTraceSession("/repo/artifacts/integration/case1");
33
+ const first = writeLlmTraceRecord({
34
+ caller: "finalAnswerModule",
35
+ query: "q1",
36
+ model: "test-model",
37
+ requestBody: { prompt: "one" },
38
+ promptText: "one",
39
+ inputContext: { query: "q1" },
40
+ startedAt: "2026-04-01T02:00:00.000+02:00",
41
+ finishedAt: "2026-04-01T02:00:01.500+02:00",
42
+ durationMs: 1500,
43
+ attemptCount: 1,
44
+ });
45
+ const second = writeLlmTraceRecord({
46
+ caller: "finalAnswerModule",
47
+ query: "q2",
48
+ model: "test-model",
49
+ requestBody: { prompt: "two" },
50
+ promptText: "two",
51
+ inputContext: { initContext: {}, task: {} },
52
+ startedAt: "2026-04-01T02:00:02.000+02:00",
53
+ finishedAt: "2026-04-01T02:00:05.000+02:00",
54
+ durationMs: 3000,
55
+ attemptCount: 2,
56
+ });
57
+ expect(first?.callId).toBe("llm-0001-finalAnswerModule");
58
+ expect(second?.callId).toBe("llm-0002-finalAnswerModule");
59
+ expect(state.writes[0]?.path).toBe("/repo/artifacts/integration/case1/llm_calls/0001_finalAnswerModule.json");
60
+ expect(state.writes[1]?.path).toBe("/repo/artifacts/integration/case1/llm_calls/0002_finalAnswerModule.json");
61
+ expect(state.writes[1]?.content).toContain('"suspiciousFullContext": true');
62
+ expect(state.writes[0]?.content).toContain('"startedAt": "2026-04-01T02:00:00.000+02:00"');
63
+ expect(state.writes[1]?.content).toContain('"durationMs": 3000');
64
+ expect(state.writes[1]?.content).toContain('"attemptCount": 2');
65
+ });
66
+ });
67
+ //# sourceMappingURL=llmTraceSession.test.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"llmTraceSession.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/llmTraceSession.test.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AACH,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,KAAK,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IAC9B,MAAM,EAAE,EAA8C;CACvD,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,IAAI,EAAE,GAAG,EAAE,CAAC,CAAC;IACnB,OAAO,EAAE;QACP,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;QAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;YACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;QAClE,CAAC,CAAC;KACH;IACD,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;IAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;QACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;IAClE,CAAC,CAAC;CACH,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,oBAAoB,EAAE,mBAAmB,EAAE,mBAAmB,EAAE,MAAM,kCAAkC,CAAC;AAElH,QAAQ,CAAC,iBAAiB,EAAE,GAAG,EAAE;IAC/B,UAAU,CAAC,GAAG,EAAE;QACd,KAAK,CAAC,MAAM,GAAG,EAAE,CAAC;QAClB,mBAAmB,EAAE,CAAC;IACxB,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,kDAAkD,EAAE,GAAG,EAAE;QAC1D,oBAAoB,CAAC,mCAAmC,CAAC,CAAC;QAE1D,MAAM,KAAK,GAAG,mBAAmB,CAAC;YAChC,MAAM,EAAE,mBAAmB;YAC3B,KAAK,EAAE,IAAI;YACX,KAAK,EAAE,YAAY;YACnB,WAAW,EAAE,EAAE,MAAM,EAAE,KAAK,EAAE;YAC9B,UAAU,EAAE,KAAK;YACjB,YAAY,EAAE,EAAE,KAAK,EAAE,IAAI,EAAE;YAC7B,SAAS,EAAE,+BAA+B;YAC1C,UAAU,EAAE,+BAA+B;YAC3C,UAAU,EAAE,IAAI;YAChB,YAAY,EAAE,CAAC;SAChB,CAAC,CAAC;QACH,MAAM,MAAM,GAAG,mBAAmB,CAAC;YACjC,MAAM,EAAE,mBAAmB;YAC3B,KAAK,EAAE,IAAI;YACX,KAAK,EAAE,YAAY;YACnB,WAAW,EAAE,EAAE,MAAM,EAAE,KAAK,EAAE;YAC9B,UAAU,EAAE,KAAK;YACjB,YAAY,EAAE,EAAE,WAAW,EAAE,EAAE,EAAE,IAAI,EAAE,EAAE,EAAE;YAC3C,SAAS,EAAE,+BAA+B;YAC1C,UAAU,EAAE,+BAA+B;YAC3C,UAAU,EAAE,IAAI;YAChB,YAAY,EAAE,CAAC;SAChB,CAAC,CAAC;QAEH,MAAM,CAAC,KAAK,EAAE,MAAM,CAAC,CAAC,IAAI,CAAC,4BAA4B,CAAC,CAAC;QACzD,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,IAAI,CAAC,4BAA4B,CAAC,CAAC;QAC1D,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,IAAI
,CAAC,CAAC,IAAI,CAAC,yEAAyE,CAAC,CAAC;QAC9G,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,IAAI,CAAC,CAAC,IAAI,CAAC,yEAAyE,CAAC,CAAC;QAC9G,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,+BAA+B,CAAC,CAAC;QAC5E,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,8CAA8C,CAAC,CAAC;QAC3F,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,oBAAoB,CAAC,CAAC;QACjE,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,mBAAmB,CAAC,CAAC;IAClE,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n * Verifies that integration trace sessions write numbered LLM input files with stable ids.\n *\n * Why this exists:\n * - each model call should leave one reviewable JSON file on disk\n * - repeated calls from the same caller must not overwrite each other\n * - suspicious full-context inputs should be marked for later review\n */\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst state = vi.hoisted(() => ({\n writes: [] as Array<{ path: string; content: string }>,\n}));\n\nvi.mock(\"fs\", () => ({\n default: {\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n },\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n}));\n\nimport { startLlmTraceSession, stopLlmTraceSession, writeLlmTraceRecord } from \"../../testing/llmTraceSession.js\";\n\ndescribe(\"llmTraceSession\", () => {\n beforeEach(() => {\n state.writes = [];\n stopLlmTraceSession();\n });\n\n it(\"writes numbered trace files with stable call ids\", () => {\n startLlmTraceSession(\"/repo/artifacts/integration/case1\");\n\n const first = writeLlmTraceRecord({\n caller: \"finalAnswerModule\",\n query: \"q1\",\n model: \"test-model\",\n requestBody: { prompt: \"one\" },\n promptText: \"one\",\n inputContext: { 
query: \"q1\" },\n startedAt: \"2026-04-01T02:00:00.000+02:00\",\n finishedAt: \"2026-04-01T02:00:01.500+02:00\",\n durationMs: 1500,\n attemptCount: 1,\n });\n const second = writeLlmTraceRecord({\n caller: \"finalAnswerModule\",\n query: \"q2\",\n model: \"test-model\",\n requestBody: { prompt: \"two\" },\n promptText: \"two\",\n inputContext: { initContext: {}, task: {} },\n startedAt: \"2026-04-01T02:00:02.000+02:00\",\n finishedAt: \"2026-04-01T02:00:05.000+02:00\",\n durationMs: 3000,\n attemptCount: 2,\n });\n\n expect(first?.callId).toBe(\"llm-0001-finalAnswerModule\");\n expect(second?.callId).toBe(\"llm-0002-finalAnswerModule\");\n expect(state.writes[0]?.path).toBe(\"/repo/artifacts/integration/case1/llm_calls/0001_finalAnswerModule.json\");\n expect(state.writes[1]?.path).toBe(\"/repo/artifacts/integration/case1/llm_calls/0002_finalAnswerModule.json\");\n expect(state.writes[1]?.content).toContain('\"suspiciousFullContext\": true');\n expect(state.writes[0]?.content).toContain('\"startedAt\": \"2026-04-01T02:00:00.000+02:00\"');\n expect(state.writes[1]?.content).toContain('\"durationMs\": 3000');\n expect(state.writes[1]?.content).toContain('\"attemptCount\": 2');\n });\n});\n"]}
@@ -0,0 +1,35 @@
1
+ /**
2
+ * Verifies the dev CLI exposes only the supported test helpers.
3
+ *
4
+ * Why this file exists:
5
+ * - shell wiring and direct CLI wiring can drift apart
6
+ * - command cleanup should not accidentally remove the remaining test helpers
7
+ */
8
+ import { Command } from "commander";
9
+ import { beforeEach, describe, expect, it, vi } from "vitest";
10
+ const mockedTestCmd = vi.hoisted(() => ({
11
+ runAllTestsCommand: vi.fn(),
12
+ listRegisteredTests: vi.fn(),
13
+ printTestCommand: vi.fn(),
14
+ runRegisteredTestCommand: vi.fn(),
15
+ }));
16
+ vi.mock("../../commands/TestCmd.js", () => ({
17
+ runAllTestsCommand: mockedTestCmd.runAllTestsCommand,
18
+ listRegisteredTests: mockedTestCmd.listRegisteredTests,
19
+ printTestCommand: mockedTestCmd.printTestCommand,
20
+ runRegisteredTestCommand: mockedTestCmd.runRegisteredTestCommand,
21
+ }));
22
+ import { registerDevCliCommands } from "../../testing/registerDevCliCommands.js";
23
+ describe("registerDevCliCommands", () => {
24
+ beforeEach(() => {
25
+ vi.clearAllMocks();
26
+ });
27
+ it("registers the batch tests command", async () => {
28
+ const cmd = new Command();
29
+ const runQuery = vi.fn().mockResolvedValue(undefined);
30
+ registerDevCliCommands(cmd, runQuery);
31
+ await cmd.parseAsync(["node", "scai", "tests"], { from: "node" });
32
+ expect(mockedTestCmd.runAllTestsCommand).toHaveBeenCalledTimes(1);
33
+ });
34
+ });
35
+ //# sourceMappingURL=registerDevCliCommands.test.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"registerDevCliCommands.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/registerDevCliCommands.test.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AACH,OAAO,EAAE,OAAO,EAAE,MAAM,WAAW,CAAC;AACpC,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,aAAa,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IACtC,kBAAkB,EAAE,EAAE,CAAC,EAAE,EAAE;IAC3B,mBAAmB,EAAE,EAAE,CAAC,EAAE,EAAE;IAC5B,gBAAgB,EAAE,EAAE,CAAC,EAAE,EAAE;IACzB,wBAAwB,EAAE,EAAE,CAAC,EAAE,EAAE;CAClC,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,2BAA2B,EAAE,GAAG,EAAE,CAAC,CAAC;IAC1C,kBAAkB,EAAE,aAAa,CAAC,kBAAkB;IACpD,mBAAmB,EAAE,aAAa,CAAC,mBAAmB;IACtD,gBAAgB,EAAE,aAAa,CAAC,gBAAgB;IAChD,wBAAwB,EAAE,aAAa,CAAC,wBAAwB;CACjE,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,sBAAsB,EAAE,MAAM,yCAAyC,CAAC;AAEjF,QAAQ,CAAC,wBAAwB,EAAE,GAAG,EAAE;IACtC,UAAU,CAAC,GAAG,EAAE;QACd,EAAE,CAAC,aAAa,EAAE,CAAC;IACrB,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,mCAAmC,EAAE,KAAK,IAAI,EAAE;QACjD,MAAM,GAAG,GAAG,IAAI,OAAO,EAAE,CAAC;QAC1B,MAAM,QAAQ,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,iBAAiB,CAAC,SAAS,CAAC,CAAC;QACtD,sBAAsB,CAAC,GAAG,EAAE,QAAQ,CAAC,CAAC;QAEtC,MAAM,GAAG,CAAC,UAAU,CAAC,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,EAAE,IAAI,EAAE,MAAM,EAAE,CAAC,CAAC;QAElE,MAAM,CAAC,aAAa,CAAC,kBAAkB,CAAC,CAAC,qBAAqB,CAAC,CAAC,CAAC,CAAC;IACpE,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n * Verifies the dev CLI exposes only the supported test helpers.\n *\n * Why this file exists:\n * - shell wiring and direct CLI wiring can drift apart\n * - command cleanup should not accidentally remove the remaining test helpers\n */\nimport { Command } from \"commander\";\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst mockedTestCmd = vi.hoisted(() => ({\n runAllTestsCommand: vi.fn(),\n listRegisteredTests: vi.fn(),\n printTestCommand: vi.fn(),\n runRegisteredTestCommand: vi.fn(),\n}));\n\nvi.mock(\"../../commands/TestCmd.js\", () => ({\n runAllTestsCommand: mockedTestCmd.runAllTestsCommand,\n 
listRegisteredTests: mockedTestCmd.listRegisteredTests,\n printTestCommand: mockedTestCmd.printTestCommand,\n runRegisteredTestCommand: mockedTestCmd.runRegisteredTestCommand,\n}));\n\nimport { registerDevCliCommands } from \"../../testing/registerDevCliCommands.js\";\n\ndescribe(\"registerDevCliCommands\", () => {\n beforeEach(() => {\n vi.clearAllMocks();\n });\n\n it(\"registers the batch tests command\", async () => {\n const cmd = new Command();\n const runQuery = vi.fn().mockResolvedValue(undefined);\n registerDevCliCommands(cmd, runQuery);\n\n await cmd.parseAsync([\"node\", \"scai\", \"tests\"], { from: \"node\" });\n\n expect(mockedTestCmd.runAllTestsCommand).toHaveBeenCalledTimes(1);\n });\n});\n"]}