scai 0.1.178 → 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +162 -267
- package/dist/__tests__/CommitSuggesterCmd.test.js +112 -0
- package/dist/__tests__/CommitSuggesterCmd.test.js.map +1 -0
- package/dist/__tests__/EvalReportCmd.test.js +645 -0
- package/dist/__tests__/EvalReportCmd.test.js.map +1 -0
- package/dist/__tests__/ModelCmd.test.js +64 -0
- package/dist/__tests__/ModelCmd.test.js.map +1 -0
- package/dist/__tests__/agents/agentActions.test.js +345 -0
- package/dist/__tests__/agents/agentActions.test.js.map +1 -0
- package/dist/__tests__/agents/agentFeedback.test.js +118 -0
- package/dist/__tests__/agents/agentFeedback.test.js.map +1 -0
- package/dist/__tests__/agents/agentGeneralScope.test.js +74 -0
- package/dist/__tests__/agents/agentGeneralScope.test.js.map +1 -0
- package/dist/__tests__/agents/agentLoop.test.js +1723 -0
- package/dist/__tests__/agents/agentLoop.test.js.map +1 -0
- package/dist/__tests__/agents/agentPolicyState.test.js +948 -0
- package/dist/__tests__/agents/agentPolicyState.test.js.map +1 -0
- package/dist/__tests__/agents/agentReadEvidence.test.js +170 -0
- package/dist/__tests__/agents/agentReadEvidence.test.js.map +1 -0
- package/dist/__tests__/agents/agentReadPersistence.test.js +129 -0
- package/dist/__tests__/agents/agentReadPersistence.test.js.map +1 -0
- package/dist/__tests__/agents/agentResumeCheckpoint.test.js +90 -0
- package/dist/__tests__/agents/agentResumeCheckpoint.test.js.map +1 -0
- package/dist/__tests__/agents/agentSearchBatchPlanner.test.js +289 -0
- package/dist/__tests__/agents/agentSearchBatchPlanner.test.js.map +1 -0
- package/dist/__tests__/agents/agentSearchOwnership.test.js +166 -0
- package/dist/__tests__/agents/agentSearchOwnership.test.js.map +1 -0
- package/dist/__tests__/agents/agentSearchRanking.test.js +139 -0
- package/dist/__tests__/agents/agentSearchRanking.test.js.map +1 -0
- package/dist/__tests__/agents/agentSearchRouting.test.js +584 -0
- package/dist/__tests__/agents/agentSearchRouting.test.js.map +1 -0
- package/dist/__tests__/agents/agentSearchScoring.test.js +23 -0
- package/dist/__tests__/agents/agentSearchScoring.test.js.map +1 -0
- package/dist/__tests__/agents/agentSearchShared.test.js +78 -0
- package/dist/__tests__/agents/agentSearchShared.test.js.map +1 -0
- package/dist/__tests__/agents/agentStateMachine.test.js +58 -0
- package/dist/__tests__/agents/agentStateMachine.test.js.map +1 -0
- package/dist/__tests__/agents/agentTaskPersistence.test.js +156 -0
- package/dist/__tests__/agents/agentTaskPersistence.test.js.map +1 -0
- package/dist/__tests__/agents/agentTools.test.js +69 -0
- package/dist/__tests__/agents/agentTools.test.js.map +1 -0
- package/dist/__tests__/agents/agentTransform.test.js +779 -0
- package/dist/__tests__/agents/agentTransform.test.js.map +1 -0
- package/dist/__tests__/agents/analysisPlanGenStep.test.js +157 -0
- package/dist/__tests__/agents/analysisPlanGenStep.test.js.map +1 -0
- package/dist/__tests__/agents/answerOnlyCompletion.test.js +75 -0
- package/dist/__tests__/agents/answerOnlyCompletion.test.js.map +1 -0
- package/dist/__tests__/agents/decideNextAction.test.js +1662 -0
- package/dist/__tests__/agents/decideNextAction.test.js.map +1 -0
- package/dist/__tests__/agents/deriveFocusFromSearchStep.test.js +258 -0
- package/dist/__tests__/agents/deriveFocusFromSearchStep.test.js.map +1 -0
- package/dist/__tests__/agents/evidenceVerifierStep.test.js +113 -0
- package/dist/__tests__/agents/evidenceVerifierStep.test.js.map +1 -0
- package/dist/__tests__/agents/executionPolicyResolver.test.js +208 -0
- package/dist/__tests__/agents/executionPolicyResolver.test.js.map +1 -0
- package/dist/__tests__/agents/fileCheckStep.test.js +299 -0
- package/dist/__tests__/agents/fileCheckStep.test.js.map +1 -0
- package/dist/__tests__/agents/giveUpEvaluatorStep.test.js +35 -0
- package/dist/__tests__/agents/giveUpEvaluatorStep.test.js.map +1 -0
- package/dist/__tests__/agents/guardState.test.js +297 -0
- package/dist/__tests__/agents/guardState.test.js.map +1 -0
- package/dist/__tests__/agents/mainAgentHeuristics.test.js +72 -0
- package/dist/__tests__/agents/mainAgentHeuristics.test.js.map +1 -0
- package/dist/__tests__/agents/objectiveEvaluatorStep.test.js +60 -0
- package/dist/__tests__/agents/objectiveEvaluatorStep.test.js.map +1 -0
- package/dist/__tests__/agents/outerLoopRecoveryEvaluator.test.js +207 -0
- package/dist/__tests__/agents/outerLoopRecoveryEvaluator.test.js.map +1 -0
- package/dist/__tests__/agents/prompting.test.js +363 -0
- package/dist/__tests__/agents/prompting.test.js.map +1 -0
- package/dist/__tests__/agents/readinessGateStep.test.js +180 -0
- package/dist/__tests__/agents/readinessGateStep.test.js.map +1 -0
- package/dist/__tests__/agents/reasonNextStep.test.js +56 -0
- package/dist/__tests__/agents/reasonNextStep.test.js.map +1 -0
- package/dist/__tests__/agents/reasonNextTaskStep.test.js +284 -0
- package/dist/__tests__/agents/reasonNextTaskStep.test.js.map +1 -0
- package/dist/__tests__/agents/resolveAgentTargetClassification.test.js +170 -0
- package/dist/__tests__/agents/resolveAgentTargetClassification.test.js.map +1 -0
- package/dist/__tests__/agents/resolveProgressState.test.js +526 -0
- package/dist/__tests__/agents/resolveProgressState.test.js.map +1 -0
- package/dist/__tests__/agents/resumeCheckpoint.test.js +50 -0
- package/dist/__tests__/agents/resumeCheckpoint.test.js.map +1 -0
- package/dist/__tests__/agents/routingDecisionStep.test.js +134 -0
- package/dist/__tests__/agents/routingDecisionStep.test.js.map +1 -0
- package/dist/__tests__/agents/scopeClassificationStep.test.js +118 -0
- package/dist/__tests__/agents/scopeClassificationStep.test.js.map +1 -0
- package/dist/__tests__/agents/searchContext.test.js +97 -0
- package/dist/__tests__/agents/searchContext.test.js.map +1 -0
- package/dist/__tests__/agents/selectRelevantSourcesStep.test.js +73 -0
- package/dist/__tests__/agents/selectRelevantSourcesStep.test.js.map +1 -0
- package/dist/__tests__/agents/structuredOutput.test.js +45 -0
- package/dist/__tests__/agents/structuredOutput.test.js.map +1 -0
- package/dist/__tests__/agents/transformPlanGenStep.fallback.test.js +59 -0
- package/dist/__tests__/agents/transformPlanGenStep.fallback.test.js.map +1 -0
- package/dist/__tests__/agents/transformPlanGenStep.test.js +92 -0
- package/dist/__tests__/agents/transformPlanGenStep.test.js.map +1 -0
- package/dist/__tests__/agents/understandIntentStep.test.js +237 -0
- package/dist/__tests__/agents/understandIntentStep.test.js.map +1 -0
- package/dist/__tests__/agents/understandResumeContext.test.js +65 -0
- package/dist/__tests__/agents/understandResumeContext.test.js.map +1 -0
- package/dist/__tests__/agents/understandScope.test.js +227 -0
- package/dist/__tests__/agents/understandScope.test.js.map +1 -0
- package/dist/__tests__/agents/validateChangesStep.test.js +52 -0
- package/dist/__tests__/agents/validateChangesStep.test.js.map +1 -0
- package/dist/__tests__/askCommandTaskBinding.test.js +176 -0
- package/dist/__tests__/askCommandTaskBinding.test.js.map +1 -0
- package/dist/__tests__/commandVisibility.test.js +25 -0
- package/dist/__tests__/commandVisibility.test.js.map +1 -0
- package/dist/__tests__/config.devOutput.test.js +82 -0
- package/dist/__tests__/config.devOutput.test.js.map +1 -0
- package/dist/__tests__/currentContext.test.js +43 -0
- package/dist/__tests__/currentContext.test.js.map +1 -0
- package/dist/__tests__/daemonWorker.test.js +51 -0
- package/dist/__tests__/daemonWorker.test.js.map +1 -0
- package/dist/__tests__/dialogState.test.js +113 -0
- package/dist/__tests__/dialogState.test.js.map +1 -0
- package/dist/__tests__/evalCommands.test.js +506 -0
- package/dist/__tests__/evalCommands.test.js.map +1 -0
- package/dist/__tests__/evalCommandsSummary.test.js +68 -0
- package/dist/__tests__/evalCommandsSummary.test.js.map +1 -0
- package/dist/__tests__/example.test.js +1 -0
- package/dist/__tests__/example.test.js.map +1 -0
- package/dist/__tests__/factory.commitCommand.test.js +45 -0
- package/dist/__tests__/factory.commitCommand.test.js.map +1 -0
- package/dist/__tests__/factory.devOutputCommand.test.js +122 -0
- package/dist/__tests__/factory.devOutputCommand.test.js.map +1 -0
- package/dist/__tests__/factory.evalCommands.test.js +38 -0
- package/dist/__tests__/factory.evalCommands.test.js.map +1 -0
- package/dist/__tests__/factory.planCommand.test.js +35 -0
- package/dist/__tests__/factory.planCommand.test.js.map +1 -0
- package/dist/__tests__/factory.setupCommand.test.js +34 -0
- package/dist/__tests__/factory.setupCommand.test.js.map +1 -0
- package/dist/__tests__/factory.statusCommand.test.js +54 -0
- package/dist/__tests__/factory.statusCommand.test.js.map +1 -0
- package/dist/__tests__/fileRules/queryTokenRules.test.js +35 -0
- package/dist/__tests__/fileRules/queryTokenRules.test.js.map +1 -0
- package/dist/__tests__/fileRules/searchPathClassification.test.js +57 -0
- package/dist/__tests__/fileRules/searchPathClassification.test.js.map +1 -0
- package/dist/__tests__/generate.ollamaRecovery.test.js +344 -0
- package/dist/__tests__/generate.ollamaRecovery.test.js.map +1 -0
- package/dist/__tests__/index.modelStartup.test.js +24 -0
- package/dist/__tests__/index.modelStartup.test.js.map +1 -0
- package/dist/__tests__/indexCmd.test.js +85 -0
- package/dist/__tests__/indexCmd.test.js.map +1 -0
- package/dist/__tests__/indexSlashCommand.test.js +50 -0
- package/dist/__tests__/indexSlashCommand.test.js.map +1 -0
- package/dist/__tests__/ollamaService.test.js +103 -0
- package/dist/__tests__/ollamaService.test.js.map +1 -0
- package/dist/__tests__/pipeline/modules/codeTransformModule.small-file.test.js +68 -0
- package/dist/__tests__/pipeline/modules/codeTransformModule.small-file.test.js.map +1 -0
- package/dist/__tests__/pipeline/modules/commitSuggesterModule.test.js +68 -0
- package/dist/__tests__/pipeline/modules/commitSuggesterModule.test.js.map +1 -0
- package/dist/__tests__/pipeline/modules/fileSearchModule.test.js +284 -0
- package/dist/__tests__/pipeline/modules/fileSearchModule.test.js.map +1 -0
- package/dist/__tests__/pipeline/modules/finalAnswerModule.test.js +1139 -0
- package/dist/__tests__/pipeline/modules/finalAnswerModule.test.js.map +1 -0
- package/dist/__tests__/pipeline/modules/readFileModule.test.js +146 -0
- package/dist/__tests__/pipeline/modules/readFileModule.test.js.map +1 -0
- package/dist/__tests__/pipeline/modules/semanticAnalysisModule.test.js +192 -0
- package/dist/__tests__/pipeline/modules/semanticAnalysisModule.test.js.map +1 -0
- package/dist/__tests__/repoIdentity.test.js +31 -0
- package/dist/__tests__/repoIdentity.test.js.map +1 -0
- package/dist/__tests__/resumeContext.test.js +87 -0
- package/dist/__tests__/resumeContext.test.js.map +1 -0
- package/dist/__tests__/resumeState.test.js +239 -0
- package/dist/__tests__/resumeState.test.js.map +1 -0
- package/dist/__tests__/search/SearchOrchestrator.test.js +836 -0
- package/dist/__tests__/search/SearchOrchestrator.test.js.map +1 -0
- package/dist/__tests__/shellDialogUi.test.js +52 -0
- package/dist/__tests__/shellDialogUi.test.js.map +1 -0
- package/dist/__tests__/shellSession.test.js +102 -0
- package/dist/__tests__/shellSession.test.js.map +1 -0
- package/dist/__tests__/statusOwner.test.js +215 -0
- package/dist/__tests__/statusOwner.test.js.map +1 -0
- package/dist/__tests__/testing/contextEval.test.js +244 -0
- package/dist/__tests__/testing/contextEval.test.js.map +1 -0
- package/dist/__tests__/testing/harnessArtifacts.test.js +124 -0
- package/dist/__tests__/testing/harnessArtifacts.test.js.map +1 -0
- package/dist/__tests__/testing/llmTraceSession.test.js +67 -0
- package/dist/__tests__/testing/llmTraceSession.test.js.map +1 -0
- package/dist/__tests__/testing/registerDevCliCommands.test.js +35 -0
- package/dist/__tests__/testing/registerDevCliCommands.test.js.map +1 -0
- package/dist/__tests__/testing/runDiagnosis.test.js +159 -0
- package/dist/__tests__/testing/runDiagnosis.test.js.map +1 -0
- package/dist/__tests__/testing/runtimeLogReader.test.js +66 -0
- package/dist/__tests__/testing/runtimeLogReader.test.js.map +1 -0
- package/dist/__tests__/testing/testCommands.test.js +53 -0
- package/dist/__tests__/testing/testCommands.test.js.map +1 -0
- package/dist/__tests__/utils/compileSearchQuery.test.js +38 -0
- package/dist/__tests__/utils/compileSearchQuery.test.js.map +1 -0
- package/dist/__tests__/utils/consolePresentation.test.js +105 -0
- package/dist/__tests__/utils/consolePresentation.test.js.map +1 -0
- package/dist/__tests__/utils/extractFileReferences.test.js +41 -0
- package/dist/__tests__/utils/extractFileReferences.test.js.map +1 -0
- package/dist/__tests__/utils/log.test.js +34 -0
- package/dist/__tests__/utils/log.test.js.map +1 -0
- package/dist/__tests__/utils/runtimeLogger.test.js +200 -0
- package/dist/__tests__/utils/runtimeLogger.test.js.map +1 -0
- package/dist/__tests__/utils/spinner.test.js +31 -0
- package/dist/__tests__/utils/spinner.test.js.map +1 -0
- package/dist/__tests__/utils/verifyFocusPreference.test.js +41 -0
- package/dist/__tests__/utils/verifyFocusPreference.test.js.map +1 -0
- package/dist/agent/actions/index.js +301 -0
- package/dist/agent/actions/index.js.map +1 -0
- package/dist/agent/actions/normalize.js +360 -0
- package/dist/agent/actions/normalize.js.map +1 -0
- package/dist/agent/actions/schemas.js +129 -0
- package/dist/agent/actions/schemas.js.map +1 -0
- package/dist/agent/evidence/index.js +320 -0
- package/dist/agent/evidence/index.js.map +1 -0
- package/dist/agent/feedback/index.js +187 -0
- package/dist/agent/feedback/index.js.map +1 -0
- package/dist/agent/finalization/index.js +35 -0
- package/dist/agent/finalization/index.js.map +1 -0
- package/dist/agent/index.js +126 -0
- package/dist/agent/index.js.map +1 -0
- package/dist/agent/logging/index.js +350 -0
- package/dist/agent/logging/index.js.map +1 -0
- package/dist/agent/persistence/boot.js +58 -0
- package/dist/agent/persistence/boot.js.map +1 -0
- package/dist/agent/persistence/currentTask.js +36 -0
- package/dist/agent/persistence/currentTask.js.map +1 -0
- package/dist/agent/persistence/hydrate.js +42 -0
- package/dist/agent/persistence/hydrate.js.map +1 -0
- package/dist/agent/persistence/index.js +15 -0
- package/dist/agent/persistence/index.js.map +1 -0
- package/dist/agent/persistence/snapshots.js +97 -0
- package/dist/agent/persistence/snapshots.js.map +1 -0
- package/dist/agent/persistence/steps.js +95 -0
- package/dist/agent/persistence/steps.js.map +1 -0
- package/dist/agent/persistence/tasks.js +195 -0
- package/dist/agent/persistence/tasks.js.map +1 -0
- package/dist/agent/persistence/turns.js +92 -0
- package/dist/agent/persistence/turns.js.map +1 -0
- package/dist/agent/policy/ambiguityResolution.js +226 -0
- package/dist/agent/policy/ambiguityResolution.js.map +1 -0
- package/dist/agent/policy/contracts.js +2 -0
- package/dist/agent/policy/contracts.js.map +1 -0
- package/dist/agent/policy/coveragePolicy.js +309 -0
- package/dist/agent/policy/coveragePolicy.js.map +1 -0
- package/dist/agent/policy/endDecisionPolicy.js +31 -0
- package/dist/agent/policy/endDecisionPolicy.js.map +1 -0
- package/dist/agent/policy/index.js +344 -0
- package/dist/agent/policy/index.js.map +1 -0
- package/dist/agent/policy/loopReview.js +778 -0
- package/dist/agent/policy/loopReview.js.map +1 -0
- package/dist/agent/policy/readinessPolicy.js +108 -0
- package/dist/agent/policy/readinessPolicy.js.map +1 -0
- package/dist/agent/policy/resolutionPipeline.js +356 -0
- package/dist/agent/policy/resolutionPipeline.js.map +1 -0
- package/dist/agent/policy/targetClassification.js +33 -0
- package/dist/agent/policy/targetClassification.js.map +1 -0
- package/dist/agent/prompting/actionChoice.js +90 -0
- package/dist/agent/prompting/actionChoice.js.map +1 -0
- package/dist/agent/prompting/finalAnswer.js +38 -0
- package/dist/agent/prompting/finalAnswer.js.map +1 -0
- package/dist/agent/prompting/index.js +14 -0
- package/dist/agent/prompting/index.js.map +1 -0
- package/dist/agent/prompting/plan.js +59 -0
- package/dist/agent/prompting/plan.js.map +1 -0
- package/dist/agent/prompting/transform.js +175 -0
- package/dist/agent/prompting/transform.js.map +1 -0
- package/dist/agent/prompting/understand.js +70 -0
- package/dist/agent/prompting/understand.js.map +1 -0
- package/dist/agent/read/freshness.js +29 -0
- package/dist/agent/read/freshness.js.map +1 -0
- package/dist/agent/read/fullReadPrompt.js +43 -0
- package/dist/agent/read/fullReadPrompt.js.map +1 -0
- package/dist/agent/read/index.js +140 -0
- package/dist/agent/read/index.js.map +1 -0
- package/dist/agent/read/persistence.js +88 -0
- package/dist/agent/read/persistence.js.map +1 -0
- package/dist/agent/read/summarizeReadEvidence.js +733 -0
- package/dist/agent/read/summarizeReadEvidence.js.map +1 -0
- package/dist/agent/read/targetResolution.js +126 -0
- package/dist/agent/read/targetResolution.js.map +1 -0
- package/dist/agent/resume/checkpoint.js +41 -0
- package/dist/agent/resume/checkpoint.js.map +1 -0
- package/dist/agent/runtime/lifecycle.js +67 -0
- package/dist/agent/runtime/lifecycle.js.map +1 -0
- package/dist/agent/runtime/progress.js +178 -0
- package/dist/agent/runtime/progress.js.map +1 -0
- package/dist/agent/runtime/runAgentLoop.js +402 -0
- package/dist/agent/runtime/runAgentLoop.js.map +1 -0
- package/dist/agent/runtime/runAgentPlanOnly.js +127 -0
- package/dist/agent/runtime/runAgentPlanOnly.js.map +1 -0
- package/dist/agent/runtime/understand.js +336 -0
- package/dist/agent/runtime/understand.js.map +1 -0
- package/dist/agent/search/batchPlanner.js +274 -0
- package/dist/agent/search/batchPlanner.js.map +1 -0
- package/dist/agent/search/candidateRetentionPolicy.js +184 -0
- package/dist/agent/search/candidateRetentionPolicy.js.map +1 -0
- package/dist/agent/search/directory.js +51 -0
- package/dist/agent/search/directory.js.map +1 -0
- package/dist/agent/search/exactTarget.js +151 -0
- package/dist/agent/search/exactTarget.js.map +1 -0
- package/dist/agent/search/fragment.js +110 -0
- package/dist/agent/search/fragment.js.map +1 -0
- package/dist/agent/search/index.js +166 -0
- package/dist/agent/search/index.js.map +1 -0
- package/dist/agent/search/laneClassifier.js +119 -0
- package/dist/agent/search/laneClassifier.js.map +1 -0
- package/dist/agent/search/limits.js +10 -0
- package/dist/agent/search/limits.js.map +1 -0
- package/dist/agent/search/ranking.js +22 -0
- package/dist/agent/search/ranking.js.map +1 -0
- package/dist/agent/search/regex.js +83 -0
- package/dist/agent/search/regex.js.map +1 -0
- package/dist/agent/search/routePolicy.js +11 -0
- package/dist/agent/search/routePolicy.js.map +1 -0
- package/dist/agent/search/searchContext.js +128 -0
- package/dist/agent/search/searchContext.js.map +1 -0
- package/dist/agent/search/semantic.js +113 -0
- package/dist/agent/search/semantic.js.map +1 -0
- package/dist/agent/search/semanticIndexSearch.js +202 -0
- package/dist/agent/search/semanticIndexSearch.js.map +1 -0
- package/dist/agent/search/shared.js +283 -0
- package/dist/agent/search/shared.js.map +1 -0
- package/dist/agent/search/shell.js +202 -0
- package/dist/agent/search/shell.js.map +1 -0
- package/dist/agent/search/snippetEvidence.js +57 -0
- package/dist/agent/search/snippetEvidence.js.map +1 -0
- package/dist/agent/search/types.js +2 -0
- package/dist/agent/search/types.js.map +1 -0
- package/dist/agent/state/index.js +99 -0
- package/dist/agent/state/index.js.map +1 -0
- package/dist/agent/state/memory.js +56 -0
- package/dist/agent/state/memory.js.map +1 -0
- package/dist/agent/structuredOutput/index.js +28 -0
- package/dist/agent/structuredOutput/index.js.map +1 -0
- package/dist/agent/tools/index.js +199 -0
- package/dist/agent/tools/index.js.map +1 -0
- package/dist/agent/transform/index.js +519 -0
- package/dist/agent/transform/index.js.map +1 -0
- package/dist/agent/transform/syntax.js +49 -0
- package/dist/agent/transform/syntax.js.map +1 -0
- package/dist/agent/types.js +20 -0
- package/dist/agent/types.js.map +1 -0
- package/dist/agents/actionRegistry.js +114 -0
- package/dist/agents/actionRegistry.js.map +1 -0
- package/dist/agents/agent.js +5 -0
- package/dist/agents/agent.js.map +1 -0
- package/dist/agents/agentActions.js +5 -0
- package/dist/agents/agentActions.js.map +1 -0
- package/dist/agents/agentEvidence.js +5 -0
- package/dist/agents/agentEvidence.js.map +1 -0
- package/dist/agents/agentFeedback.js +5 -0
- package/dist/agents/agentFeedback.js.map +1 -0
- package/dist/agents/agentLogging.js +5 -0
- package/dist/agents/agentLogging.js.map +1 -0
- package/dist/agents/agentLoop.js +5 -0
- package/dist/agents/agentLoop.js.map +1 -0
- package/dist/agents/agentMemory.js +5 -0
- package/dist/agents/agentMemory.js.map +1 -0
- package/dist/agents/agentPlanMode.js +5 -0
- package/dist/agents/agentPlanMode.js.map +1 -0
- package/dist/agents/agentPolicyState.js +5 -0
- package/dist/agents/agentPolicyState.js.map +1 -0
- package/dist/agents/agentProgress.js +93 -0
- package/dist/agents/agentProgress.js.map +1 -0
- package/dist/agents/agentSchemas.js +5 -0
- package/dist/agents/agentSchemas.js.map +1 -0
- package/dist/agents/agentSearchScoring.js +5 -0
- package/dist/agents/agentSearchScoring.js.map +1 -0
- package/dist/agents/agentStateMachine.js +5 -0
- package/dist/agents/agentStateMachine.js.map +1 -0
- package/dist/agents/agentTools.js +5 -0
- package/dist/agents/agentTools.js.map +1 -0
- package/dist/agents/agentTypes.js +5 -0
- package/dist/agents/agentTypes.js.map +1 -0
- package/dist/agents/agentUnderstand.js +5 -0
- package/dist/agents/agentUnderstand.js.map +1 -0
- package/dist/agents/analysisPlanGenStep.js +194 -17
- package/dist/agents/analysisPlanGenStep.js.map +1 -0
- package/dist/agents/answerOnlyCompletion.js +32 -0
- package/dist/agents/answerOnlyCompletion.js.map +1 -0
- package/dist/agents/collaboratorStep.js +1 -0
- package/dist/agents/collaboratorStep.js.map +1 -0
- package/dist/agents/decideNextAction.js +444 -0
- package/dist/agents/decideNextAction.js.map +1 -0
- package/dist/agents/deriveFocusFromSearchStep.js +83 -0
- package/dist/agents/deriveFocusFromSearchStep.js.map +1 -0
- package/dist/agents/evidenceVerifierStep.js +104 -13
- package/dist/agents/evidenceVerifierStep.js.map +1 -0
- package/dist/agents/fileCheckStep.js +381 -12
- package/dist/agents/fileCheckStep.js.map +1 -0
- package/dist/agents/giveUpEvaluatorStep.js +63 -0
- package/dist/agents/giveUpEvaluatorStep.js.map +1 -0
- package/dist/agents/guardPolicy.js +20 -0
- package/dist/agents/guardPolicy.js.map +1 -0
- package/dist/agents/guards/executionPolicyResolver.js +165 -0
- package/dist/agents/guards/executionPolicyResolver.js.map +1 -0
- package/dist/agents/guards/guardState.js +195 -0
- package/dist/agents/guards/guardState.js.map +1 -0
- package/dist/agents/guards/resolveProgressState.js +403 -0
- package/dist/agents/guards/resolveProgressState.js.map +1 -0
- package/dist/agents/infoPlanGenStep.js +66 -8
- package/dist/agents/infoPlanGenStep.js.map +1 -0
- package/dist/agents/integrateFeedbackStep.js +1 -0
- package/dist/agents/integrateFeedbackStep.js.map +1 -0
- package/dist/agents/iterationFileSelector.js +8 -7
- package/dist/agents/iterationFileSelector.js.map +1 -0
- package/dist/agents/mainAgentActivityLog.js +85 -0
- package/dist/agents/mainAgentActivityLog.js.map +1 -0
- package/dist/agents/mainAgentHeuristics.js +173 -0
- package/dist/agents/mainAgentHeuristics.js.map +1 -0
- package/dist/agents/mainAgentVerify.js +159 -0
- package/dist/agents/mainAgentVerify.js.map +1 -0
- package/dist/agents/objectiveEvaluatorStep.js +103 -0
- package/dist/agents/objectiveEvaluatorStep.js.map +1 -0
- package/dist/agents/outerLoopRecoveryEvaluator.js +108 -0
- package/dist/agents/outerLoopRecoveryEvaluator.js.map +1 -0
- package/dist/agents/readinessGateStep.js +95 -9
- package/dist/agents/readinessGateStep.js.map +1 -0
- package/dist/agents/reasonNextStep.js +9 -8
- package/dist/agents/reasonNextStep.js.map +1 -0
- package/dist/agents/reasonNextTaskStep.js +267 -144
- package/dist/agents/reasonNextTaskStep.js.map +1 -0
- package/dist/agents/researchPlanGenStep.js +61 -25
- package/dist/agents/researchPlanGenStep.js.map +1 -0
- package/dist/agents/resolveAgentTargetClassification.js +5 -0
- package/dist/agents/resolveAgentTargetClassification.js.map +1 -0
- package/dist/agents/resolveExecutionModeStep.js +1 -0
- package/dist/agents/resolveExecutionModeStep.js.map +1 -0
- package/dist/agents/resolveExplicitTargetsStep.js +74 -0
- package/dist/agents/resolveExplicitTargetsStep.js.map +1 -0
- package/dist/agents/routingDecisionStep.js +58 -11
- package/dist/agents/routingDecisionStep.js.map +1 -0
- package/dist/agents/scopeClassificationStep.js +66 -3
- package/dist/agents/scopeClassificationStep.js.map +1 -0
- package/dist/agents/selectRelevantSourcesStep.js +13 -5
- package/dist/agents/selectRelevantSourcesStep.js.map +1 -0
- package/dist/agents/structuralPreloadStep.js +3 -4
- package/dist/agents/structuralPreloadStep.js.map +1 -0
- package/dist/agents/transformPlanGenStep.js +105 -18
- package/dist/agents/transformPlanGenStep.js.map +1 -0
- package/dist/agents/understandIntentStep.js +237 -17
- package/dist/agents/understandIntentStep.js.map +1 -0
- package/dist/agents/validateChangesStep.js +16 -2
- package/dist/agents/validateChangesStep.js.map +1 -0
- package/dist/agents/writeFileStep.js +1 -0
- package/dist/agents/writeFileStep.js.map +1 -0
- package/dist/commands/AskCmd.js +139 -44
- package/dist/commands/AskCmd.js.map +1 -0
- package/dist/commands/BackupCmd.js +1 -0
- package/dist/commands/BackupCmd.js.map +1 -0
- package/dist/commands/ChangeLogUpdateCmd.js +1 -0
- package/dist/commands/ChangeLogUpdateCmd.js.map +1 -0
- package/dist/commands/CommitSuggesterCmd.js +55 -13
- package/dist/commands/CommitSuggesterCmd.js.map +1 -0
- package/dist/commands/DaemonCmd.js +52 -14
- package/dist/commands/DaemonCmd.js.map +1 -0
- package/dist/commands/DeleteIndex.js +1 -0
- package/dist/commands/DeleteIndex.js.map +1 -0
- package/dist/commands/EvalReportCmd.js +374 -0
- package/dist/commands/EvalReportCmd.js.map +1 -0
- package/dist/commands/FindCmd.js +1 -0
- package/dist/commands/FindCmd.js.map +1 -0
- package/dist/commands/GitCmd.js +1 -0
- package/dist/commands/GitCmd.js.map +1 -0
- package/dist/commands/IndexCmd.js +11 -79
- package/dist/commands/IndexCmd.js.map +1 -0
- package/dist/commands/InspectCmd.js +1 -0
- package/dist/commands/InspectCmd.js.map +1 -0
- package/dist/commands/ModelCmd.js +24 -0
- package/dist/commands/ModelCmd.js.map +1 -0
- package/dist/commands/ReadlineSingleton.js +1 -0
- package/dist/commands/ReadlineSingleton.js.map +1 -0
- package/dist/commands/ResetDbCmd.js +18 -1
- package/dist/commands/ResetDbCmd.js.map +1 -0
- package/dist/commands/ReviewCmd.js +1 -0
- package/dist/commands/ReviewCmd.js.map +1 -0
- package/dist/commands/StatusCmd.js +22 -0
- package/dist/commands/StatusCmd.js.map +1 -0
- package/dist/commands/StopDaemonCmd.js +1 -0
- package/dist/commands/StopDaemonCmd.js.map +1 -0
- package/dist/commands/SummaryCmd.js +1 -0
- package/dist/commands/SummaryCmd.js.map +1 -0
- package/dist/commands/SwitchCmd.js +9 -15
- package/dist/commands/SwitchCmd.js.map +1 -0
- package/dist/commands/TasksCmd.js +142 -57
- package/dist/commands/TasksCmd.js.map +1 -0
- package/dist/commands/TestCmd.js +66 -0
- package/dist/commands/TestCmd.js.map +1 -0
- package/dist/commands/WorkflowCmd.js +1 -0
- package/dist/commands/WorkflowCmd.js.map +1 -0
- package/dist/commands/commandVisibility.js +27 -0
- package/dist/commands/commandVisibility.js.map +1 -0
- package/dist/commands/evalCommands.js +1337 -0
- package/dist/commands/evalCommands.js.map +1 -0
- package/dist/commands/factory.js +206 -38
- package/dist/commands/factory.js.map +1 -0
- package/dist/config.js +62 -11
- package/dist/config.js.map +1 -0
- package/dist/constants.js +21 -3
- package/dist/constants.js.map +1 -0
- package/dist/context.js +33 -32
- package/dist/context.js.map +1 -0
- package/dist/daemon/daemonQueues.js +1 -20
- package/dist/daemon/daemonQueues.js.map +1 -0
- package/dist/daemon/daemonWorker.js +26 -37
- package/dist/daemon/daemonWorker.js.map +1 -0
- package/dist/daemon/generateSummaries.js +1 -0
- package/dist/daemon/generateSummaries.js.map +1 -0
- package/dist/daemon/runFolderCapsuleBatch.js +1 -0
- package/dist/daemon/runFolderCapsuleBatch.js.map +1 -0
- package/dist/daemon/runIndexingBatch.js +1 -0
- package/dist/daemon/runIndexingBatch.js.map +1 -0
- package/dist/daemon/runKgBatch.js +9 -1
- package/dist/daemon/runKgBatch.js.map +1 -0
- package/dist/db/backup.js +1 -0
- package/dist/db/backup.js.map +1 -0
- package/dist/db/client.js +18 -3
- package/dist/db/client.js.map +1 -0
- package/dist/db/fileIndex.js +110 -152
- package/dist/db/fileIndex.js.map +1 -0
- package/dist/db/functionExtractors/extractFromJava.js +1 -0
- package/dist/db/functionExtractors/extractFromJava.js.map +1 -0
- package/dist/db/functionExtractors/extractFromJs.js +1 -0
- package/dist/db/functionExtractors/extractFromJs.js.map +1 -0
- package/dist/db/functionExtractors/extractFromTs.js +1 -0
- package/dist/db/functionExtractors/extractFromTs.js.map +1 -0
- package/dist/db/functionExtractors/extractFromXML.js +1 -0
- package/dist/db/functionExtractors/extractFromXML.js.map +1 -0
- package/dist/db/functionExtractors/index.js +1 -0
- package/dist/db/functionExtractors/index.js.map +1 -0
- package/dist/db/functionIndex.js +9 -0
- package/dist/db/functionIndex.js.map +1 -0
- package/dist/db/schema.js +314 -99
- package/dist/db/schema.js.map +1 -0
- package/dist/db/sqlTemplates.js +1 -0
- package/dist/db/sqlTemplates.js.map +1 -0
- package/dist/fileRules/builtins.js +1 -0
- package/dist/fileRules/builtins.js.map +1 -0
- package/dist/fileRules/classifyFile.js +1 -0
- package/dist/fileRules/classifyFile.js.map +1 -0
- package/dist/fileRules/codeAllowedExtensions.js +1 -0
- package/dist/fileRules/codeAllowedExtensions.js.map +1 -0
- package/dist/fileRules/detectFileType.js +1 -0
- package/dist/fileRules/detectFileType.js.map +1 -0
- package/dist/fileRules/fileClassifier.js +1 -0
- package/dist/fileRules/fileClassifier.js.map +1 -0
- package/dist/fileRules/fileExceptions.js +1 -0
- package/dist/fileRules/fileExceptions.js.map +1 -0
- package/dist/fileRules/ignoredExtensions.js +1 -0
- package/dist/fileRules/ignoredExtensions.js.map +1 -0
- package/dist/fileRules/ignoredPaths.js +48 -5
- package/dist/fileRules/ignoredPaths.js.map +1 -0
- package/dist/fileRules/queryTokenRules.js +176 -0
- package/dist/fileRules/queryTokenRules.js.map +1 -0
- package/dist/fileRules/searchPathClassification.js +58 -0
- package/dist/fileRules/searchPathClassification.js.map +1 -0
- package/dist/fileRules/shouldIgnoreFiles.js +1 -0
- package/dist/fileRules/shouldIgnoreFiles.js.map +1 -0
- package/dist/fileRules/stopWords.js +9 -0
- package/dist/fileRules/stopWords.js.map +1 -0
- package/dist/fileRules/wellKnownRepoFiles.js +1 -0
- package/dist/fileRules/wellKnownRepoFiles.js.map +1 -0
- package/dist/git/commitSummary.js +227 -0
- package/dist/git/commitSummary.js.map +1 -0
- package/dist/github/api.js +1 -0
- package/dist/github/api.js.map +1 -0
- package/dist/github/auth.js +1 -0
- package/dist/github/auth.js.map +1 -0
- package/dist/github/github.js +1 -0
- package/dist/github/github.js.map +1 -0
- package/dist/github/githubAuthCheck.js +1 -0
- package/dist/github/githubAuthCheck.js.map +1 -0
- package/dist/github/postComments.js +1 -0
- package/dist/github/postComments.js.map +1 -0
- package/dist/github/repo.js +15 -24
- package/dist/github/repo.js.map +1 -0
- package/dist/github/token.js +1 -0
- package/dist/github/token.js.map +1 -0
- package/dist/github/types.js +1 -0
- package/dist/github/types.js.map +1 -0
- package/dist/index.js +318 -37
- package/dist/index.js.map +1 -0
- package/dist/lib/generate.js +264 -20
- package/dist/lib/generate.js.map +1 -0
- package/dist/lib/generateFolderCapsules.js +1 -0
- package/dist/lib/generateFolderCapsules.js.map +1 -0
- package/dist/lib/ollamaModelPolicy.js +59 -0
- package/dist/lib/ollamaModelPolicy.js.map +1 -0
- package/dist/lib/spinner.js +29 -9
- package/dist/lib/spinner.js.map +1 -0
- package/dist/modelSetup.js +25 -78
- package/dist/modelSetup.js.map +1 -0
- package/dist/pipeline/modules/changeLogModule.js +10 -1
- package/dist/pipeline/modules/changeLogModule.js.map +1 -0
- package/dist/pipeline/modules/cleanupModule.js +1 -0
- package/dist/pipeline/modules/cleanupModule.js.map +1 -0
- package/dist/pipeline/modules/codeTransformModule.js +10 -16
- package/dist/pipeline/modules/codeTransformModule.js.map +1 -0
- package/dist/pipeline/modules/commentModule.js +12 -0
- package/dist/pipeline/modules/commentModule.js.map +1 -0
- package/dist/pipeline/modules/commitSuggesterModule.js +82 -12
- package/dist/pipeline/modules/commitSuggesterModule.js.map +1 -0
- package/dist/pipeline/modules/contextReviewModule.js +12 -1
- package/dist/pipeline/modules/contextReviewModule.js.map +1 -0
- package/dist/pipeline/modules/dialogAnswerModule.js +58 -0
- package/dist/pipeline/modules/dialogAnswerModule.js.map +1 -0
- package/dist/pipeline/modules/fileSearchModule.js +5 -143
- package/dist/pipeline/modules/fileSearchModule.js.map +1 -0
- package/dist/pipeline/modules/finalAnswerModule.js +1176 -151
- package/dist/pipeline/modules/finalAnswerModule.js.map +1 -0
- package/dist/pipeline/modules/kgModule.js +18 -1
- package/dist/pipeline/modules/kgModule.js.map +1 -0
- package/dist/pipeline/modules/planAnswerModule.js +99 -0
- package/dist/pipeline/modules/planAnswerModule.js.map +1 -0
- package/dist/pipeline/modules/readFileModule.js +300 -0
- package/dist/pipeline/modules/readFileModule.js.map +1 -0
- package/dist/pipeline/modules/reviewModule.js +10 -1
- package/dist/pipeline/modules/reviewModule.js.map +1 -0
- package/dist/pipeline/modules/searchDbModule.js +159 -0
- package/dist/pipeline/modules/searchDbModule.js.map +1 -0
- package/dist/pipeline/modules/searchListDirectoryModule.js +62 -0
- package/dist/pipeline/modules/searchListDirectoryModule.js.map +1 -0
- package/dist/pipeline/modules/searchModuleShared.js +71 -0
- package/dist/pipeline/modules/searchModuleShared.js.map +1 -0
- package/dist/pipeline/modules/searchRegexModule.js +59 -0
- package/dist/pipeline/modules/searchRegexModule.js.map +1 -0
- package/dist/pipeline/modules/semanticAnalysisModule.js +185 -28
- package/dist/pipeline/modules/semanticAnalysisModule.js.map +1 -0
- package/dist/pipeline/modules/summaryModule.js +11 -1
- package/dist/pipeline/modules/summaryModule.js.map +1 -0
- package/dist/pipeline/registry/moduleRegistry.js +9 -0
- package/dist/pipeline/registry/moduleRegistry.js.map +1 -0
- package/dist/pipeline/runModulePipeline.js +1 -0
- package/dist/pipeline/runModulePipeline.js.map +1 -0
- package/dist/scripts/dbScriptSupport.js +172 -0
- package/dist/scripts/dbScriptSupport.js.map +1 -0
- package/dist/scripts/dbcheck.js +173 -267
- package/dist/scripts/dbcheck.js.map +1 -0
- package/dist/scripts/dboverview.js +161 -0
- package/dist/scripts/dboverview.js.map +1 -0
- package/dist/scripts/migrateDb.js +1 -0
- package/dist/scripts/migrateDb.js.map +1 -0
- package/dist/search/SearchOrchestrator.js +928 -0
- package/dist/search/SearchOrchestrator.js.map +1 -0
- package/dist/search/sharedRankingPolicy.js +283 -0
- package/dist/search/sharedRankingPolicy.js.map +1 -0
- package/dist/setup/reindexOwner.js +97 -0
- package/dist/setup/reindexOwner.js.map +1 -0
- package/dist/setup/setupOwner.js +100 -0
- package/dist/setup/setupOwner.js.map +1 -0
- package/dist/shell/dialogUi.js +81 -0
- package/dist/shell/dialogUi.js.map +1 -0
- package/dist/shellSession.js +126 -0
- package/dist/shellSession.js.map +1 -0
- package/dist/status/statusOwner.js +239 -0
- package/dist/status/statusOwner.js.map +1 -0
- package/dist/testing/contextEval.js +514 -0
- package/dist/testing/contextEval.js.map +1 -0
- package/dist/testing/fixtures/transform/small-file.input.js +5 -0
- package/dist/testing/fixtures/transform/small-file.input.js.map +1 -0
- package/dist/testing/harnessArtifacts.js +112 -0
- package/dist/testing/harnessArtifacts.js.map +1 -0
- package/dist/testing/llmTraceSession.js +67 -0
- package/dist/testing/llmTraceSession.js.map +1 -0
- package/dist/testing/registerDevCliCommands.js +43 -0
- package/dist/testing/registerDevCliCommands.js.map +1 -0
- package/dist/testing/runDiagnosis.js +248 -0
- package/dist/testing/runDiagnosis.js.map +1 -0
- package/dist/testing/runtimeLogReader.js +144 -0
- package/dist/testing/runtimeLogReader.js.map +1 -0
- package/dist/testing/testCommands.js +35 -303
- package/dist/testing/testCommands.js.map +1 -0
- package/dist/testing/testRegistry.js +233 -0
- package/dist/testing/testRegistry.js.map +1 -0
- package/dist/types.js +1 -0
- package/dist/types.js.map +1 -0
- package/dist/utils/buildContextualPrompt.js +26 -75
- package/dist/utils/buildContextualPrompt.js.map +1 -0
- package/dist/utils/changeLogPrompt.js +1 -0
- package/dist/utils/changeLogPrompt.js.map +1 -0
- package/dist/utils/checkModel.js +17 -92
- package/dist/utils/checkModel.js.map +1 -0
- package/dist/utils/commentMap.js +1 -0
- package/dist/utils/commentMap.js.map +1 -0
- package/dist/utils/compileSearchQuery.js +23 -9
- package/dist/utils/compileSearchQuery.js.map +1 -0
- package/dist/utils/consolePresentation.js +208 -0
- package/dist/utils/consolePresentation.js.map +1 -0
- package/dist/utils/contentUtils.js +17 -2
- package/dist/utils/contentUtils.js.map +1 -0
- package/dist/utils/debugContext.js +1 -0
- package/dist/utils/debugContext.js.map +1 -0
- package/dist/utils/dialogState.js +201 -0
- package/dist/utils/dialogState.js.map +1 -0
- package/dist/utils/editor.js +1 -0
- package/dist/utils/editor.js.map +1 -0
- package/dist/utils/executionEvidence.js +50 -0
- package/dist/utils/executionEvidence.js.map +1 -0
- package/dist/utils/extractFileReferences.js +140 -6
- package/dist/utils/extractFileReferences.js.map +1 -0
- package/dist/utils/fileEvidenceCache.js +50 -0
- package/dist/utils/fileEvidenceCache.js.map +1 -0
- package/dist/utils/fileTree.js +1 -0
- package/dist/utils/fileTree.js.map +1 -0
- package/dist/utils/loadRelevantFolderCapsules.js +35 -5
- package/dist/utils/loadRelevantFolderCapsules.js.map +1 -0
- package/dist/utils/log.js +10 -1
- package/dist/utils/log.js.map +1 -0
- package/dist/utils/normalizeData.js +1 -0
- package/dist/utils/normalizeData.js.map +1 -0
- package/dist/utils/ollamaModelStatus.js +28 -0
- package/dist/utils/ollamaModelStatus.js.map +1 -0
- package/dist/utils/ollamaService.js +294 -0
- package/dist/utils/ollamaService.js.map +1 -0
- package/dist/utils/outputFormatter.js +1 -0
- package/dist/utils/outputFormatter.js.map +1 -0
- package/dist/utils/parseTaggedContent.js +1 -0
- package/dist/utils/parseTaggedContent.js.map +1 -0
- package/dist/utils/planActions.js +27 -46
- package/dist/utils/planActions.js.map +1 -0
- package/dist/utils/promptBuilderHelper.js +1 -0
- package/dist/utils/promptBuilderHelper.js.map +1 -0
- package/dist/utils/promptLogHelper.js +29 -13
- package/dist/utils/promptLogHelper.js.map +1 -0
- package/dist/utils/queryAnchors.js +71 -0
- package/dist/utils/queryAnchors.js.map +1 -0
- package/dist/utils/repoIdentity.js +82 -0
- package/dist/utils/repoIdentity.js.map +1 -0
- package/dist/utils/repoKey.js +1 -0
- package/dist/utils/repoKey.js.map +1 -0
- package/dist/utils/resolveTargetsToFiles.js +1 -0
- package/dist/utils/resolveTargetsToFiles.js.map +1 -0
- package/dist/utils/resumeContext.js +219 -0
- package/dist/utils/resumeContext.js.map +1 -0
- package/dist/utils/resumeState.js +310 -0
- package/dist/utils/resumeState.js.map +1 -0
- package/dist/utils/rollingPlan.js +118 -0
- package/dist/utils/rollingPlan.js.map +1 -0
- package/dist/utils/runQueryWithDaemonControl.js +11 -3
- package/dist/utils/runQueryWithDaemonControl.js.map +1 -0
- package/dist/utils/runtimeLogger.js +252 -0
- package/dist/utils/runtimeLogger.js.map +1 -0
- package/dist/utils/sanitizeQuery.js +1 -0
- package/dist/utils/sanitizeQuery.js.map +1 -0
- package/dist/utils/sharedUtils.js +1 -0
- package/dist/utils/sharedUtils.js.map +1 -0
- package/dist/utils/sleep.js +1 -0
- package/dist/utils/sleep.js.map +1 -0
- package/dist/utils/splitCodeIntoChunk.js +1 -0
- package/dist/utils/splitCodeIntoChunk.js.map +1 -0
- package/dist/utils/time.js +66 -0
- package/dist/utils/time.js.map +1 -0
- package/dist/utils/verifyFocusPreference.js +107 -0
- package/dist/utils/verifyFocusPreference.js.map +1 -0
- package/dist/utils/vscode.js +1 -0
- package/dist/utils/vscode.js.map +1 -0
- package/dist/workflow/workflowResolver.js +1 -0
- package/dist/workflow/workflowResolver.js.map +1 -0
- package/dist/workflow/workflowRunner.js +1 -0
- package/dist/workflow/workflowRunner.js.map +1 -0
- package/package.json +3 -3
- package/dist/agents/MainAgent.js +0 -1886
- package/dist/agents/contextReviewStep.js +0 -101
- package/dist/agents/finalPlanGenStep.js +0 -107
- package/dist/agents/structuralAnalysisStep.js +0 -46
- package/dist/agents/validationAnalysisStep.js +0 -87
- package/dist/pipeline/modules/chunkManagerModule.js +0 -24
- package/dist/pipeline/modules/cleanGeneratedTestsModule.js +0 -33
- package/dist/pipeline/modules/fileReaderModule.js +0 -72
- package/dist/pipeline/modules/gatherInfoModule.js +0 -181
- package/dist/pipeline/modules/generateTestsModule.js +0 -68
- package/dist/pipeline/modules/preserveCodeModule.js +0 -195
- package/dist/pipeline/modules/refactorModule.js +0 -40
- package/dist/pipeline/modules/repairTestsModule.js +0 -48
- package/dist/pipeline/modules/runTestsModule.js +0 -37
|
@@ -0,0 +1,244 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Verifies that context eval flags repeated planner prompts, prompt bloat, and missing decomposition.
|
|
3
|
+
*
|
|
4
|
+
* Why this exists:
|
|
5
|
+
* - context audit rules should stay deterministic across saved trace shapes
|
|
6
|
+
* - planner retries and final-answer prompt growth are easy to reintroduce during routing work
|
|
7
|
+
* - multi-question queries need explicit regression coverage so they do not collapse silently
|
|
8
|
+
*/
|
|
9
|
+
import { beforeEach, describe, expect, it, vi } from "vitest";
|
|
10
|
+
const state = vi.hoisted(() => ({
|
|
11
|
+
dirEntries: new Map(),
|
|
12
|
+
fileContents: new Map(),
|
|
13
|
+
}));
|
|
14
|
+
vi.mock("fs", () => ({
|
|
15
|
+
default: {
|
|
16
|
+
existsSync: vi.fn((filePath) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),
|
|
17
|
+
readFileSync: vi.fn((filePath) => state.fileContents.get(filePath) ?? ""),
|
|
18
|
+
readdirSync: vi.fn((dirPath, options) => {
|
|
19
|
+
const entries = state.dirEntries.get(dirPath) ?? [];
|
|
20
|
+
if (options?.withFileTypes) {
|
|
21
|
+
return entries.map((name) => ({
|
|
22
|
+
name,
|
|
23
|
+
isDirectory: () => true,
|
|
24
|
+
}));
|
|
25
|
+
}
|
|
26
|
+
return entries;
|
|
27
|
+
}),
|
|
28
|
+
},
|
|
29
|
+
existsSync: vi.fn((filePath) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),
|
|
30
|
+
readFileSync: vi.fn((filePath) => state.fileContents.get(filePath) ?? ""),
|
|
31
|
+
readdirSync: vi.fn((dirPath, options) => {
|
|
32
|
+
const entries = state.dirEntries.get(dirPath) ?? [];
|
|
33
|
+
if (options?.withFileTypes) {
|
|
34
|
+
return entries.map((name) => ({
|
|
35
|
+
name,
|
|
36
|
+
isDirectory: () => true,
|
|
37
|
+
}));
|
|
38
|
+
}
|
|
39
|
+
return entries;
|
|
40
|
+
}),
|
|
41
|
+
}));
|
|
42
|
+
vi.mock("../../utils/repoIdentity.js", () => ({
|
|
43
|
+
resolveCanonicalRepoIdentity: vi.fn(() => ({
|
|
44
|
+
repoRootPath: "/repo",
|
|
45
|
+
})),
|
|
46
|
+
}));
|
|
47
|
+
import { buildContextEval } from "../../testing/contextEval.js";
|
|
48
|
+
describe("contextEval", () => {
|
|
49
|
+
beforeEach(() => {
|
|
50
|
+
state.dirEntries = new Map();
|
|
51
|
+
state.fileContents = new Map();
|
|
52
|
+
});
|
|
53
|
+
it("warns when planner retries reuse identical prompts", () => {
|
|
54
|
+
state.dirEntries.set("/artifact/llm_calls", [
|
|
55
|
+
"0006_analysisPlanGenStep.json",
|
|
56
|
+
"0007_analysisPlanGenStep.json",
|
|
57
|
+
]);
|
|
58
|
+
const promptText = "User query:\nsummarize architecture\nAllowed actions:\n[semanticAnalysis]";
|
|
59
|
+
for (const fileName of ["0006_analysisPlanGenStep.json", "0007_analysisPlanGenStep.json"]) {
|
|
60
|
+
state.fileContents.set(`/artifact/llm_calls/${fileName}`, JSON.stringify({
|
|
61
|
+
callId: `llm-${fileName.slice(0, 4)}-analysisPlanGenStep`,
|
|
62
|
+
caller: "analysisPlanGenStep",
|
|
63
|
+
query: "summarize architecture",
|
|
64
|
+
promptText,
|
|
65
|
+
inputContext: {},
|
|
66
|
+
}, null, 2));
|
|
67
|
+
}
|
|
68
|
+
const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
|
|
69
|
+
const duplicateCheck = result.checks.find((check) => check.name === "duplicate-replan-calls");
|
|
70
|
+
expect(duplicateCheck?.ok).toBe(false);
|
|
71
|
+
expect(duplicateCheck?.finding?.actualContext).toContain("2 identical analysisPlanGenStep prompts");
|
|
72
|
+
});
|
|
73
|
+
it("warns when progress state records stalled planner retries", () => {
|
|
74
|
+
state.dirEntries.set("/artifact/llm_calls", ["0001_analysisPlanGenStep.json"]);
|
|
75
|
+
state.fileContents.set("/artifact/llm_calls/0001_analysisPlanGenStep.json", JSON.stringify({
|
|
76
|
+
callId: "llm-0001-analysisPlanGenStep",
|
|
77
|
+
caller: "analysisPlanGenStep",
|
|
78
|
+
query: "Explain how tests run",
|
|
79
|
+
promptText: "Prompt",
|
|
80
|
+
inputContext: {},
|
|
81
|
+
}, null, 2));
|
|
82
|
+
const divider = "=".repeat(68);
|
|
83
|
+
const runLog = [
|
|
84
|
+
"📂 OUTPUT | progressState",
|
|
85
|
+
divider,
|
|
86
|
+
JSON.stringify({
|
|
87
|
+
research: {
|
|
88
|
+
status: "optional",
|
|
89
|
+
pendingSteps: [],
|
|
90
|
+
noNewInfoCount: 0,
|
|
91
|
+
reason: "No research is currently required. Planner retried the same target without frontier change (3 identical attempt(s)).",
|
|
92
|
+
plannerRetry: {
|
|
93
|
+
targetFile: "/repo/cli/src/testing/testCommands.ts",
|
|
94
|
+
signature: "sig:testCommands",
|
|
95
|
+
count: 3,
|
|
96
|
+
stalled: true,
|
|
97
|
+
reason: "Planner retried the same target without frontier change (3 identical attempt(s)).",
|
|
98
|
+
},
|
|
99
|
+
},
|
|
100
|
+
}, null, 2),
|
|
101
|
+
divider,
|
|
102
|
+
"",
|
|
103
|
+
].join("\n");
|
|
104
|
+
const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog });
|
|
105
|
+
const stalledCheck = result.checks.find((check) => check.name === "stalled-planner-progress");
|
|
106
|
+
expect(stalledCheck?.ok).toBe(false);
|
|
107
|
+
expect(stalledCheck?.finding?.actualContext).toContain("target=/repo/cli/src/testing/testCommands.ts");
|
|
108
|
+
expect(stalledCheck?.finding?.actualContext).toContain("count=3");
|
|
109
|
+
});
|
|
110
|
+
it("warns when a continuity query carries a large resumed capsule", () => {
|
|
111
|
+
state.dirEntries.set("/artifact/llm_calls", ["0008_scopeClassificationStep.json"]);
|
|
112
|
+
state.fileContents.set("/artifact/llm_calls/0008_scopeClassificationStep.json", JSON.stringify({
|
|
113
|
+
callId: "llm-0008-scopeClassificationStep",
|
|
114
|
+
caller: "scopeClassificationStep",
|
|
115
|
+
query: "where were we?",
|
|
116
|
+
promptText: "User query:\nwhere were we?",
|
|
117
|
+
inputContext: {
|
|
118
|
+
resumedContextCapsule: "Original task:\n" + "x".repeat(400),
|
|
119
|
+
},
|
|
120
|
+
}, null, 2));
|
|
121
|
+
const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
|
|
122
|
+
const continuityCheck = result.checks.find((check) => check.name === "continuity-overprompting");
|
|
123
|
+
expect(continuityCheck?.ok).toBe(false);
|
|
124
|
+
expect(continuityCheck?.finding?.details).toContain("short continuity query");
|
|
125
|
+
});
|
|
126
|
+
it("warns when final grounding carries oversized supporting excerpts", () => {
|
|
127
|
+
state.dirEntries.set("/artifact/llm_calls", ["0010_finalAnswerModule.json"]);
|
|
128
|
+
state.fileContents.set("/artifact/llm_calls/0010_finalAnswerModule.json", JSON.stringify({
|
|
129
|
+
callId: "llm-0010-finalAnswerModule",
|
|
130
|
+
caller: "finalAnswerModule",
|
|
131
|
+
query: "Where are SQLite queries defined?",
|
|
132
|
+
promptText: "User query:\nWhere are SQLite queries defined?",
|
|
133
|
+
inputContext: {
|
|
134
|
+
supportingExcerpts: [
|
|
135
|
+
{
|
|
136
|
+
filePath: "/repo/cli/src/db/fileIndex.ts",
|
|
137
|
+
excerpts: ["a".repeat(1600)],
|
|
138
|
+
},
|
|
139
|
+
{
|
|
140
|
+
filePath: "/repo/cli/src/db/client.ts",
|
|
141
|
+
excerpts: ["b".repeat(700)],
|
|
142
|
+
},
|
|
143
|
+
],
|
|
144
|
+
},
|
|
145
|
+
}, null, 2));
|
|
146
|
+
const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
|
|
147
|
+
const sizeCheck = result.checks.find((check) => check.name === "oversized-final-grounding-context");
|
|
148
|
+
expect(sizeCheck?.ok).toBe(false);
|
|
149
|
+
expect(sizeCheck?.finding?.actualContext).toContain("supporting excerpts chars=2300");
|
|
150
|
+
});
|
|
151
|
+
it("warns when adjacent planner retries reuse the same rationale but change other prompt sections", () => {
|
|
152
|
+
state.dirEntries.set("/artifact/llm_calls", [
|
|
153
|
+
"0006_analysisPlanGenStep.json",
|
|
154
|
+
"0007_analysisPlanGenStep.json",
|
|
155
|
+
]);
|
|
156
|
+
state.fileContents.set("/artifact/llm_calls/0006_analysisPlanGenStep.json", JSON.stringify({
|
|
157
|
+
callId: "llm-0006-analysisPlanGenStep",
|
|
158
|
+
caller: "analysisPlanGenStep",
|
|
159
|
+
query: "Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?",
|
|
160
|
+
promptText: "Prompt A",
|
|
161
|
+
inputContext: {
|
|
162
|
+
targetFile: "/repo/cli/src/db/fileIndex.ts",
|
|
163
|
+
rationaleText: "Both files are relevant to the SQLite query definitions.",
|
|
164
|
+
allowedActions: [
|
|
165
|
+
{ actionId: "semanticAnalysis" },
|
|
166
|
+
{ actionId: "read-file" },
|
|
167
|
+
{ actionId: "research-impact-map" },
|
|
168
|
+
{ actionId: "research-symbol-trace" },
|
|
169
|
+
{ actionId: "research-risk-check" },
|
|
170
|
+
{ actionId: "research-architecture-synthesis" },
|
|
171
|
+
],
|
|
172
|
+
},
|
|
173
|
+
}, null, 2));
|
|
174
|
+
state.fileContents.set("/artifact/llm_calls/0007_analysisPlanGenStep.json", JSON.stringify({
|
|
175
|
+
callId: "llm-0007-analysisPlanGenStep",
|
|
176
|
+
caller: "analysisPlanGenStep",
|
|
177
|
+
query: "Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?",
|
|
178
|
+
promptText: "Prompt B",
|
|
179
|
+
inputContext: {
|
|
180
|
+
targetFile: "/repo/cli/src/db/fileIndex.ts",
|
|
181
|
+
rationaleText: "Both files are relevant to the SQLite query definitions.",
|
|
182
|
+
allowedActions: [
|
|
183
|
+
{ actionId: "semanticAnalysis" },
|
|
184
|
+
{ actionId: "read-file" },
|
|
185
|
+
{ actionId: "research-impact-map" },
|
|
186
|
+
{ actionId: "research-symbol-trace" },
|
|
187
|
+
{ actionId: "research-risk-check" },
|
|
188
|
+
{ actionId: "research-architecture-synthesis" },
|
|
189
|
+
],
|
|
190
|
+
},
|
|
191
|
+
}, null, 2));
|
|
192
|
+
const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
|
|
193
|
+
const rationaleCheck = result.checks.find((check) => check.name === "stale-planner-rationale");
|
|
194
|
+
const catalogCheck = result.checks.find((check) => check.name === "repeated-planner-action-catalog");
|
|
195
|
+
expect(rationaleCheck?.ok).toBe(false);
|
|
196
|
+
expect(rationaleCheck?.finding?.details).toContain("same focus rationale");
|
|
197
|
+
expect(catalogCheck?.ok).toBe(false);
|
|
198
|
+
expect(catalogCheck?.finding?.actualContext).toContain("6 actions repeated");
|
|
199
|
+
});
|
|
200
|
+
it("warns when a multi-part query never becomes ordered question parts", () => {
|
|
201
|
+
state.dirEntries.set("/artifact/llm_calls", [
|
|
202
|
+
"0001_understandIntentStep.json",
|
|
203
|
+
"0002_scopeClassificationStep.json",
|
|
204
|
+
"0006_analysisPlanGenStep.json",
|
|
205
|
+
]);
|
|
206
|
+
state.fileContents.set("/artifact/llm_calls/0001_understandIntentStep.json", JSON.stringify({
|
|
207
|
+
callId: "llm-0001-understandIntentStep",
|
|
208
|
+
caller: "understandIntentStep",
|
|
209
|
+
query: "Where is search routed? How is verify triggered?",
|
|
210
|
+
promptText: "User query:\nWhere is search routed? How is verify triggered?",
|
|
211
|
+
inputContext: {
|
|
212
|
+
userQuery: "Where is search routed? How is verify triggered?",
|
|
213
|
+
},
|
|
214
|
+
}, null, 2));
|
|
215
|
+
state.fileContents.set("/artifact/llm_calls/0002_scopeClassificationStep.json", JSON.stringify({
|
|
216
|
+
callId: "llm-0002-scopeClassificationStep",
|
|
217
|
+
caller: "scopeClassificationStep",
|
|
218
|
+
query: "Where is search routed? How is verify triggered?",
|
|
219
|
+
promptText: "User query:\nWhere is search routed? How is verify triggered?",
|
|
220
|
+
inputContext: {
|
|
221
|
+
query: "Where is search routed? How is verify triggered?",
|
|
222
|
+
},
|
|
223
|
+
}, null, 2));
|
|
224
|
+
state.fileContents.set("/artifact/llm_calls/0006_analysisPlanGenStep.json", JSON.stringify({
|
|
225
|
+
callId: "llm-0006-analysisPlanGenStep",
|
|
226
|
+
caller: "analysisPlanGenStep",
|
|
227
|
+
query: "Where is search routed? How is verify triggered?",
|
|
228
|
+
promptText: "Prompt",
|
|
229
|
+
inputContext: {
|
|
230
|
+
orderedQuestions: [
|
|
231
|
+
{
|
|
232
|
+
id: "q1",
|
|
233
|
+
text: "Where is search routed? How is verify triggered?",
|
|
234
|
+
},
|
|
235
|
+
],
|
|
236
|
+
},
|
|
237
|
+
}, null, 2));
|
|
238
|
+
const result = buildContextEval({ taskId: 1, artifactDir: "/artifact", runLog: "" });
|
|
239
|
+
const questionCheck = result.checks.find((check) => check.name === "missing-question-decomposition");
|
|
240
|
+
expect(questionCheck?.ok).toBe(false);
|
|
241
|
+
expect(questionCheck?.finding?.actualContext).toContain("max orderedQuestions=1");
|
|
242
|
+
});
|
|
243
|
+
});
|
|
244
|
+
//# sourceMappingURL=contextEval.test.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"contextEval.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/contextEval.test.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AACH,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,KAAK,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IAC9B,UAAU,EAAE,IAAI,GAAG,EAAoB;IACvC,YAAY,EAAE,IAAI,GAAG,EAAkB;CACxC,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,IAAI,EAAE,GAAG,EAAE,CAAC,CAAC;IACnB,OAAO,EAAE;QACP,UAAU,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;QAC3G,YAAY,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAC;QACjF,WAAW,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,OAAe,EAAE,OAAqC,EAAE,EAAE;YAC5E,MAAM,OAAO,GAAG,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;YACpD,IAAI,OAAO,EAAE,aAAa,EAAE,CAAC;gBAC3B,OAAO,OAAO,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC;oBAC5B,IAAI;oBACJ,WAAW,EAAE,GAAG,EAAE,CAAC,IAAI;iBACxB,CAAC,CAAC,CAAC;YACN,CAAC;YACD,OAAO,OAAO,CAAC;QACjB,CAAC,CAAC;KACH;IACD,UAAU,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;IAC3G,YAAY,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,EAAE,CAAC,KAAK,CAAC,YAAY,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAC;IACjF,WAAW,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,OAAe,EAAE,OAAqC,EAAE,EAAE;QAC5E,MAAM,OAAO,GAAG,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;QACpD,IAAI,OAAO,EAAE,aAAa,EAAE,CAAC;YAC3B,OAAO,OAAO,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC;gBAC5B,IAAI;gBACJ,WAAW,EAAE,GAAG,EAAE,CAAC,IAAI;aACxB,CAAC,CAAC,CAAC;QACN,CAAC;QACD,OAAO,OAAO,CAAC;IACjB,CAAC,CAAC;CACH,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,6BAA6B,EAAE,GAAG,EAAE,CAAC,CAAC;IAC5C,4BAA4B,EAAE,EAAE,CAAC,EAAE,CAAC,GAAG,EAAE,CAAC,CAAC;QACzC,YAAY,EAAE,OAAO;KACtB,CAAC,CAAC;CACJ,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,gBAAgB,EAAE,MAAM,8BAA8B,CAAC;AAEhE,QAAQ,CAAC,aAAa,EAAE,GAAG,EAAE;IAC3B,UAAU,CAAC,GAAG,EAAE;QACd,KAAK,CAAC,UAAU,GAAG,IAAI,GAAG,EAAE,CAAC;QAC7B,KAAK,CAAC,YAAY,GAAG,IAAI,GAAG,EAAE,CAAC;IACjC,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,oDAAoD,EAAE,GAAG,EAAE;QAC5D,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE;YAC1C,+BAA+B;YAC/B,+BAA+B;SAChC,CAAC,CAAC;QACH,MAAM,UAAU,GAAG,2EAA2E,CAAC;QAC/F,KAAK,MAAM,QAAQ,IAAI,CAAC,+BAA+B,EAAE,+BAA+B,CAAC,EAAE,CAAC;YAC1F,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,uBAAuB,QAAQ,EAAE,EACjC,IAAI,CAAC,SAAS,CACZ;gBACE,MAAM,EAAE,OAAO,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,sBAAsB;gBACzD,MAAM,EAAE,qBAAqB;gBAC7B,KAAK,EAAE,wBAAwB;gBAC/B,UAAU;gBACV,YAAY,EAAE,EAAE;aACjB,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACJ,CAAC;QAED,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,cAAc,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,wBAAwB,CAAC,CAAC;QAE9F,MAAM,CAAC,cAAc,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACvC,MAAM,CAAC,cAAc,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,yCAAyC,CAAC,CAAC;IACtG,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,2DAA2D,EAAE,GAAG,EAAE;QACnE,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE,CAAC,+BAA+B,CAAC,CAAC,CAAC;QAC/E,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,uBAAuB;YAC9B,UAAU,EAAE,QAAQ;YACpB,YAAY,EAAE,EAAE;SACjB,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,MAAM,OAAO,GAAG,GAAG,CAAC,MAAM,CAAC,EAAE,CAAC,CAAC;QAC/B,MAAM,MAAM,GAAG;YACb,2BAA2B;YAC3B,OAAO;YACP,IAAI,CAAC,SAAS,CACZ;gBACE,QAAQ,EAAE;oBACR,MAAM,EAAE,UAAU;oBAClB,YAAY,EAAE,EAAE;oBAChB,cAAc,EAAE,CAAC;oBACjB,MAAM,EAAE,sHAAsH;oBAC9H,YAAY,EAAE;wBACZ,UAAU,EAAE,uCAAuC;wBACnD,SAAS,EAAE,kBAAkB;wBAC7B,KAAK,EAAE,CAAC;wBACR,OAAO,EAAE,IAAI;wBACb,MAAM,EAAE,mFAAmF;qBAC5F;iBACF;aACF,EACD,IAAI,EACJ,CAAC,CACF;YACD,OAAO;YACP,EAAE;SACH,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAEb,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,CAAC,CAAC;QACjF,MAAM,YAAY,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,0BAA0B,CAAC,CAAC;QAE9F,MAAM,CAAC,YAAY,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACrC,MAAM,CAAC,YAAY,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,8CAA8C,CAAC,CAAC;QACvG,MAAM,CAAC,YAAY,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,SAAS,CAAC,CAAC;IACpE,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,+DAA+D,EAAE,GAAG,EAAE;QACvE,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE,CAAC,mCAAmC,CAAC,CAAC,CAAC;QACnF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,uDAAuD,EACvD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,kCAAkC;YAC1C,MAAM,EAAE,yBAAyB;YACjC,KAAK,EAAE,gBAAgB;YACvB,UAAU,EAAE,6BAA6B;YACzC,YAAY,EAAE;gBACZ,qBAAqB,EAAE,kBAAkB,GAAG,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC;aAC5D;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,eAAe,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,0BAA0B,CAAC,CAAC;QAEjG,MAAM,CAAC,eAAe,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACxC,MAAM,CAAC,eAAe,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,wBAAwB,CAAC,CAAC;IAChF,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,kEAAkE,EAAE,GAAG,EAAE;QAC1E,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE,CAAC,6BAA6B,CAAC,CAAC,CAAC;QAC7E,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,iDAAiD,EACjD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,4BAA4B;YACpC,MAAM,EAAE,mBAAmB;YAC3B,KAAK,EAAE,mCAAmC;YAC1C,UAAU,EAAE,gDAAgD;YAC5D,YAAY,EAAE;gBACZ,kBAAkB,EAAE;oBAClB;wBACE,QAAQ,EAAE,+BAA+B;wBACzC,QAAQ,EAAE,CAAC,GAAG,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;qBAC7B;oBACD;wBACE,QAAQ,EAAE,4BAA4B;wBACtC,QAAQ,EAAE,CAAC,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC;qBAC5B;iBACF;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,SAAS,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,mCAAmC,CAAC,CAAC;QAEpG,MAAM,CAAC,SAAS,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAClC,MAAM,CAAC,SAAS,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,gCAAgC,CAAC,CAAC;IACxF,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,+FAA+F,EAAE,GAAG,EAAE;QACvG,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE;YAC1C,+BAA+B;YAC/B,+BAA+B;SAChC,CAAC,CAAC;QACH,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,uEAAuE;YAC9E,UAAU,EAAE,UAAU;YACtB,YAAY,EAAE;gBACZ,UAAU,EAAE,+BAA+B;gBAC3C,aAAa,EAAE,0DAA0D;gBACzE,cAAc,EAAE;oBACd,EAAE,QAAQ,EAAE,kBAAkB,EAAE;oBAChC,EAAE,QAAQ,EAAE,WAAW,EAAE;oBACzB,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,uBAAuB,EAAE;oBACrC,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,iCAAiC,EAAE;iBAChD;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,uEAAuE;YAC9E,UAAU,EAAE,UAAU;YACtB,YAAY,EAAE;gBACZ,UAAU,EAAE,+BAA+B;gBAC3C,aAAa,EAAE,0DAA0D;gBACzE,cAAc,EAAE;oBACd,EAAE,QAAQ,EAAE,kBAAkB,EAAE;oBAChC,EAAE,QAAQ,EAAE,WAAW,EAAE;oBACzB,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,uBAAuB,EAAE;oBACrC,EAAE,QAAQ,EAAE,qBAAqB,EAAE;oBACnC,EAAE,QAAQ,EAAE,iCAAiC,EAAE;iBAChD;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,cAAc,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,yBAAyB,CAAC,CAAC;QAC/F,MAAM,YAAY,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,iCAAiC,CAAC,CAAC;QAErG,MAAM,CAAC,cAAc,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACvC,MAAM,CAAC,cAAc,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,sBAAsB,CAAC,CAAC;QAC3E,MAAM,CAAC,YAAY,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACrC,MAAM,CAAC,YAAY,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,oBAAoB,CAAC,CAAC;IAC/E,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,oEAAoE,EAAE,GAAG,EAAE;QAC5E,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,qBAAqB,EAAE;YAC1C,gCAAgC;YAChC,mCAAmC;YACnC,+BAA+B;SAChC,CAAC,CAAC;QACH,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,oDAAoD,EACpD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,+BAA+B;YACvC,MAAM,EAAE,sBAAsB;YAC9B,KAAK,EAAE,kDAAkD;YACzD,UAAU,EAAE,+DAA+D;YAC3E,YAAY,EAAE;gBACZ,SAAS,EAAE,kDAAkD;aAC9D;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,uDAAuD,EACvD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,kCAAkC;YAC1C,MAAM,EAAE,yBAAyB;YACjC,KAAK,EAAE,kDAAkD;YACzD,UAAU,EAAE,+DAA+D;YAC3E,YAAY,EAAE;gBACZ,KAAK,EAAE,kDAAkD;aAC1D;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QACF,KAAK,CAAC,YAAY,CAAC,GAAG,CACpB,mDAAmD,EACnD,IAAI,CAAC,SAAS,CACZ;YACE,MAAM,EAAE,8BAA8B;YACtC,MAAM,EAAE,qBAAqB;YAC7B,KAAK,EAAE,kDAAkD;YACzD,UAAU,EAAE,QAAQ;YACpB,YAAY,EAAE;gBACZ,gBAAgB,EAAE;oBAChB;wBACE,EAAE,EAAE,IAAI;wBACR,IAAI,EAAE,kDAAkD;qBACzD;iBACF;aACF;SACF,EACD,IAAI,EACJ,CAAC,CACF,CACF,CAAC;QAEF,MAAM,MAAM,GAAG,gBAAgB,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC,CAAC;QACrF,MAAM,aAAa,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,gCAAgC,CAAC,CAAC;QAErG,MAAM,CAAC,aAAa,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACtC,MAAM,CAAC,aAAa,EAAE,OAAO,EAAE,aAAa,CAAC,CAAC,SAAS,CAAC,wBAAwB,CAAC,CAAC;IACpF,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n * Verifies that context eval flags repeated planner prompts, prompt bloat, and missing decomposition.\n *\n * Why this exists:\n * - context audit rules should stay deterministic across saved trace shapes\n * - planner retries and final-answer prompt growth are easy to reintroduce during routing work\n * - multi-question queries need explicit regression coverage so they do not collapse silently\n */\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst state = vi.hoisted(() => ({\n dirEntries: new Map<string, string[]>(),\n fileContents: new Map<string, string>(),\n}));\n\nvi.mock(\"fs\", () => ({\n default: {\n existsSync: vi.fn((filePath: string) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),\n readFileSync: vi.fn((filePath: string) => state.fileContents.get(filePath) ?? \"\"),\n readdirSync: vi.fn((dirPath: string, options?: { withFileTypes?: boolean }) => {\n const entries = state.dirEntries.get(dirPath) ?? [];\n if (options?.withFileTypes) {\n return entries.map((name) => ({\n name,\n isDirectory: () => true,\n }));\n }\n return entries;\n }),\n },\n existsSync: vi.fn((filePath: string) => state.fileContents.has(filePath) || state.dirEntries.has(filePath)),\n readFileSync: vi.fn((filePath: string) => state.fileContents.get(filePath) ?? \"\"),\n readdirSync: vi.fn((dirPath: string, options?: { withFileTypes?: boolean }) => {\n const entries = state.dirEntries.get(dirPath) ?? [];\n if (options?.withFileTypes) {\n return entries.map((name) => ({\n name,\n isDirectory: () => true,\n }));\n }\n return entries;\n }),\n}));\n\nvi.mock(\"../../utils/repoIdentity.js\", () => ({\n resolveCanonicalRepoIdentity: vi.fn(() => ({\n repoRootPath: \"/repo\",\n })),\n}));\n\nimport { buildContextEval } from \"../../testing/contextEval.js\";\n\ndescribe(\"contextEval\", () => {\n beforeEach(() => {\n state.dirEntries = new Map();\n state.fileContents = new Map();\n });\n\n it(\"warns when planner retries reuse identical prompts\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\n \"0006_analysisPlanGenStep.json\",\n \"0007_analysisPlanGenStep.json\",\n ]);\n const promptText = \"User query:\\nsummarize architecture\\nAllowed actions:\\n[semanticAnalysis]\";\n for (const fileName of [\"0006_analysisPlanGenStep.json\", \"0007_analysisPlanGenStep.json\"]) {\n state.fileContents.set(\n `/artifact/llm_calls/${fileName}`,\n JSON.stringify(\n {\n callId: `llm-${fileName.slice(0, 4)}-analysisPlanGenStep`,\n caller: \"analysisPlanGenStep\",\n query: \"summarize architecture\",\n promptText,\n inputContext: {},\n },\n null,\n 2\n )\n );\n }\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const duplicateCheck = result.checks.find((check) => check.name === \"duplicate-replan-calls\");\n\n expect(duplicateCheck?.ok).toBe(false);\n expect(duplicateCheck?.finding?.actualContext).toContain(\"2 identical analysisPlanGenStep prompts\");\n });\n\n it(\"warns when progress state records stalled planner retries\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\"0001_analysisPlanGenStep.json\"]);\n state.fileContents.set(\n \"/artifact/llm_calls/0001_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0001-analysisPlanGenStep\",\n caller: \"analysisPlanGenStep\",\n query: \"Explain how tests run\",\n promptText: \"Prompt\",\n inputContext: {},\n },\n null,\n 2\n )\n );\n const divider = \"=\".repeat(68);\n const runLog = [\n \"📂 OUTPUT | progressState\",\n divider,\n JSON.stringify(\n {\n research: {\n status: \"optional\",\n pendingSteps: [],\n noNewInfoCount: 0,\n reason: \"No research is currently required. Planner retried the same target without frontier change (3 identical attempt(s)).\",\n plannerRetry: {\n targetFile: \"/repo/cli/src/testing/testCommands.ts\",\n signature: \"sig:testCommands\",\n count: 3,\n stalled: true,\n reason: \"Planner retried the same target without frontier change (3 identical attempt(s)).\",\n },\n },\n },\n null,\n 2\n ),\n divider,\n \"\",\n ].join(\"\\n\");\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog });\n const stalledCheck = result.checks.find((check) => check.name === \"stalled-planner-progress\");\n\n expect(stalledCheck?.ok).toBe(false);\n expect(stalledCheck?.finding?.actualContext).toContain(\"target=/repo/cli/src/testing/testCommands.ts\");\n expect(stalledCheck?.finding?.actualContext).toContain(\"count=3\");\n });\n\n it(\"warns when a continuity query carries a large resumed capsule\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\"0008_scopeClassificationStep.json\"]);\n state.fileContents.set(\n \"/artifact/llm_calls/0008_scopeClassificationStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0008-scopeClassificationStep\",\n caller: \"scopeClassificationStep\",\n query: \"where were we?\",\n promptText: \"User query:\\nwhere were we?\",\n inputContext: {\n resumedContextCapsule: \"Original task:\\n\" + \"x\".repeat(400),\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const continuityCheck = result.checks.find((check) => check.name === \"continuity-overprompting\");\n\n expect(continuityCheck?.ok).toBe(false);\n expect(continuityCheck?.finding?.details).toContain(\"short continuity query\");\n });\n\n it(\"warns when final grounding carries oversized supporting excerpts\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\"0010_finalAnswerModule.json\"]);\n state.fileContents.set(\n \"/artifact/llm_calls/0010_finalAnswerModule.json\",\n JSON.stringify(\n {\n callId: \"llm-0010-finalAnswerModule\",\n caller: \"finalAnswerModule\",\n query: \"Where are SQLite queries defined?\",\n promptText: \"User query:\\nWhere are SQLite queries defined?\",\n inputContext: {\n supportingExcerpts: [\n {\n filePath: \"/repo/cli/src/db/fileIndex.ts\",\n excerpts: [\"a\".repeat(1600)],\n },\n {\n filePath: \"/repo/cli/src/db/client.ts\",\n excerpts: [\"b\".repeat(700)],\n },\n ],\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const sizeCheck = result.checks.find((check) => check.name === \"oversized-final-grounding-context\");\n\n expect(sizeCheck?.ok).toBe(false);\n expect(sizeCheck?.finding?.actualContext).toContain(\"supporting excerpts chars=2300\");\n });\n\n it(\"warns when adjacent planner retries reuse the same rationale but change other prompt sections\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\n \"0006_analysisPlanGenStep.json\",\n \"0007_analysisPlanGenStep.json\",\n ]);\n state.fileContents.set(\n \"/artifact/llm_calls/0006_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0006-analysisPlanGenStep\",\n caller: \"analysisPlanGenStep\",\n query: \"Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?\",\n promptText: \"Prompt A\",\n inputContext: {\n targetFile: \"/repo/cli/src/db/fileIndex.ts\",\n rationaleText: \"Both files are relevant to the SQLite query definitions.\",\n allowedActions: [\n { actionId: \"semanticAnalysis\" },\n { actionId: \"read-file\" },\n { actionId: \"research-impact-map\" },\n { actionId: \"research-symbol-trace\" },\n { actionId: \"research-risk-check\" },\n { actionId: \"research-architecture-synthesis\" },\n ],\n },\n },\n null,\n 2\n )\n );\n state.fileContents.set(\n \"/artifact/llm_calls/0007_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0007-analysisPlanGenStep\",\n caller: \"analysisPlanGenStep\",\n query: \"Where are SQLite queries defined in db/fileIndex.ts and db/client.ts?\",\n promptText: \"Prompt B\",\n inputContext: {\n targetFile: \"/repo/cli/src/db/fileIndex.ts\",\n rationaleText: \"Both files are relevant to the SQLite query definitions.\",\n allowedActions: [\n { actionId: \"semanticAnalysis\" },\n { actionId: \"read-file\" },\n { actionId: \"research-impact-map\" },\n { actionId: \"research-symbol-trace\" },\n { actionId: \"research-risk-check\" },\n { actionId: \"research-architecture-synthesis\" },\n ],\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const rationaleCheck = result.checks.find((check) => check.name === \"stale-planner-rationale\");\n const catalogCheck = result.checks.find((check) => check.name === \"repeated-planner-action-catalog\");\n\n expect(rationaleCheck?.ok).toBe(false);\n expect(rationaleCheck?.finding?.details).toContain(\"same focus rationale\");\n expect(catalogCheck?.ok).toBe(false);\n expect(catalogCheck?.finding?.actualContext).toContain(\"6 actions repeated\");\n });\n\n it(\"warns when a multi-part query never becomes ordered question parts\", () => {\n state.dirEntries.set(\"/artifact/llm_calls\", [\n \"0001_understandIntentStep.json\",\n \"0002_scopeClassificationStep.json\",\n \"0006_analysisPlanGenStep.json\",\n ]);\n state.fileContents.set(\n \"/artifact/llm_calls/0001_understandIntentStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0001-understandIntentStep\",\n caller: \"understandIntentStep\",\n query: \"Where is search routed? How is verify triggered?\",\n promptText: \"User query:\\nWhere is search routed? How is verify triggered?\",\n inputContext: {\n userQuery: \"Where is search routed? How is verify triggered?\",\n },\n },\n null,\n 2\n )\n );\n state.fileContents.set(\n \"/artifact/llm_calls/0002_scopeClassificationStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0002-scopeClassificationStep\",\n caller: \"scopeClassificationStep\",\n query: \"Where is search routed? How is verify triggered?\",\n promptText: \"User query:\\nWhere is search routed? How is verify triggered?\",\n inputContext: {\n query: \"Where is search routed? How is verify triggered?\",\n },\n },\n null,\n 2\n )\n );\n state.fileContents.set(\n \"/artifact/llm_calls/0006_analysisPlanGenStep.json\",\n JSON.stringify(\n {\n callId: \"llm-0006-analysisPlanGenStep\",\n caller: \"analysisPlanGenStep\",\n query: \"Where is search routed? How is verify triggered?\",\n promptText: \"Prompt\",\n inputContext: {\n orderedQuestions: [\n {\n id: \"q1\",\n text: \"Where is search routed? How is verify triggered?\",\n },\n ],\n },\n },\n null,\n 2\n )\n );\n\n const result = buildContextEval({ taskId: 1, artifactDir: \"/artifact\", runLog: \"\" });\n const questionCheck = result.checks.find((check) => check.name === \"missing-question-decomposition\");\n\n expect(questionCheck?.ok).toBe(false);\n expect(questionCheck?.finding?.actualContext).toContain(\"max orderedQuestions=1\");\n });\n});\n"]}
|
|
@@ -0,0 +1,124 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Verifies that saved harness artifacts include diagnosis data and Markdown reports.
|
|
3
|
+
*
|
|
4
|
+
* Why this exists:
|
|
5
|
+
* - artifact folders should be reviewable without rerunning the agent
|
|
6
|
+
* - diagnosis.json is the quick pointer to the likely subsystem
|
|
7
|
+
* - report.md should preserve Mermaid blocks for artifact viewers
|
|
8
|
+
* - artifact folder timestamps should stay in local time with offset, not UTC `Z`
|
|
9
|
+
* - the writer should persist both files for saved runs
|
|
10
|
+
*/
|
|
11
|
+
import { beforeEach, describe, expect, it, vi } from "vitest";
|
|
12
|
+
const state = vi.hoisted(() => ({
|
|
13
|
+
task: {
|
|
14
|
+
id: 7,
|
|
15
|
+
status: "deferred",
|
|
16
|
+
initial_query: "Explain cli/src/agents/MainAgent.ts",
|
|
17
|
+
summary: "answer",
|
|
18
|
+
routing_decision_json: JSON.stringify({
|
|
19
|
+
allowSearch: false,
|
|
20
|
+
allowResearch: false,
|
|
21
|
+
allowTransform: false,
|
|
22
|
+
rationale: "route=explicit-target",
|
|
23
|
+
}),
|
|
24
|
+
},
|
|
25
|
+
steps: [],
|
|
26
|
+
writes: [],
|
|
27
|
+
}));
|
|
28
|
+
vi.mock("fs", () => ({
|
|
29
|
+
default: {
|
|
30
|
+
mkdirSync: vi.fn(),
|
|
31
|
+
writeFileSync: vi.fn((filePath, content) => {
|
|
32
|
+
state.writes.push({ path: filePath, content: String(content) });
|
|
33
|
+
}),
|
|
34
|
+
},
|
|
35
|
+
mkdirSync: vi.fn(),
|
|
36
|
+
writeFileSync: vi.fn((filePath, content) => {
|
|
37
|
+
state.writes.push({ path: filePath, content: String(content) });
|
|
38
|
+
}),
|
|
39
|
+
}));
|
|
40
|
+
vi.mock("../../db/client.js", () => ({
|
|
41
|
+
getDbForRepo: vi.fn(() => ({
|
|
42
|
+
prepare: vi.fn((sql) => ({
|
|
43
|
+
get: () => (sql.includes("FROM tasks") ? state.task : undefined),
|
|
44
|
+
all: () => (sql.includes("FROM steps") ? state.steps : []),
|
|
45
|
+
})),
|
|
46
|
+
})),
|
|
47
|
+
}));
|
|
48
|
+
vi.mock("../../utils/repoIdentity.js", () => ({
|
|
49
|
+
resolveCanonicalRepoIdentity: vi.fn(() => ({
|
|
50
|
+
repoRootPath: "/repo",
|
|
51
|
+
})),
|
|
52
|
+
}));
|
|
53
|
+
import { writeHarnessArtifacts } from "../../testing/harnessArtifacts.js";
|
|
54
|
+
describe("harnessArtifacts", () => {
|
|
55
|
+
beforeEach(() => {
|
|
56
|
+
state.writes = [];
|
|
57
|
+
});
|
|
58
|
+
it("writes diagnosis.json for saved runs", () => {
|
|
59
|
+
writeHarnessArtifacts({
|
|
60
|
+
kind: "evals",
|
|
61
|
+
caseId: "diagnosis_case",
|
|
62
|
+
query: "Explain cli/src/agents/MainAgent.ts",
|
|
63
|
+
taskId: 7,
|
|
64
|
+
runLog: [
|
|
65
|
+
"",
|
|
66
|
+
"====================================================================",
|
|
67
|
+
"📂 OUTPUT | finalAnswerModule",
|
|
68
|
+
"====================================================================",
|
|
69
|
+
JSON.stringify({ data: "answer" }, null, 2),
|
|
70
|
+
"====================================================================",
|
|
71
|
+
"",
|
|
72
|
+
].join("\n"),
|
|
73
|
+
finalAnswerText: "answer",
|
|
74
|
+
result: {
|
|
75
|
+
id: "diagnosis_case",
|
|
76
|
+
passed: false,
|
|
77
|
+
failures: [],
|
|
78
|
+
},
|
|
79
|
+
});
|
|
80
|
+
const diagnosisWrite = state.writes.find((entry) => entry.path.endsWith("/diagnosis.json"));
|
|
81
|
+
expect(diagnosisWrite).toBeDefined();
|
|
82
|
+
expect(diagnosisWrite?.content).toContain("\"primaryCategory\": \"persistence\"");
|
|
83
|
+
});
|
|
84
|
+
it("writes report.md when report text is provided", () => {
|
|
85
|
+
writeHarnessArtifacts({
|
|
86
|
+
kind: "integration",
|
|
87
|
+
caseId: "markdown_report",
|
|
88
|
+
query: "summarize repo architecture",
|
|
89
|
+
taskId: 7,
|
|
90
|
+
runLog: "",
|
|
91
|
+
finalAnswerText: "answer",
|
|
92
|
+
reportText: "# Integration Report | 7\n\n```mermaid\nflowchart TD\n```",
|
|
93
|
+
result: {
|
|
94
|
+
id: "markdown_report",
|
|
95
|
+
passed: true,
|
|
96
|
+
failures: [],
|
|
97
|
+
},
|
|
98
|
+
});
|
|
99
|
+
const reportWrite = state.writes.find((entry) => entry.path.endsWith("/report.md"));
|
|
100
|
+
expect(reportWrite).toBeDefined();
|
|
101
|
+
expect(reportWrite?.content).toContain("```mermaid");
|
|
102
|
+
});
|
|
103
|
+
it("uses a local-time offset timestamp in generated artifact paths", () => {
|
|
104
|
+
writeHarnessArtifacts({
|
|
105
|
+
kind: "evals",
|
|
106
|
+
caseId: "timestamp_case",
|
|
107
|
+
query: "Explain cli/src/agents/MainAgent.ts",
|
|
108
|
+
taskId: 7,
|
|
109
|
+
runLog: "",
|
|
110
|
+
finalAnswerText: "answer",
|
|
111
|
+
result: {
|
|
112
|
+
id: "timestamp_case",
|
|
113
|
+
passed: true,
|
|
114
|
+
failures: [],
|
|
115
|
+
},
|
|
116
|
+
});
|
|
117
|
+
const caseWrite = state.writes.find((entry) => entry.path.endsWith("/case.json"));
|
|
118
|
+
expect(caseWrite).toBeDefined();
|
|
119
|
+
expect(caseWrite?.path).toContain("/repo/artifacts/evals/");
|
|
120
|
+
expect(caseWrite?.path).not.toContain("Z_timestamp_case");
|
|
121
|
+
expect(caseWrite?.path).toMatch(/[+-]\d{4}_timestamp_case\/case\.json$/);
|
|
122
|
+
});
|
|
123
|
+
});
|
|
124
|
+
//# sourceMappingURL=harnessArtifacts.test.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"harnessArtifacts.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/harnessArtifacts.test.ts"],"names":[],"mappings":"AAAA;;;;;;;;;GASG;AACH,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,KAAK,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IAC9B,IAAI,EAAE;QACJ,EAAE,EAAE,CAAC;QACL,MAAM,EAAE,UAAU;QAClB,aAAa,EAAE,qCAAqC;QACpD,OAAO,EAAE,QAAQ;QACjB,qBAAqB,EAAE,IAAI,CAAC,SAAS,CAAC;YACpC,WAAW,EAAE,KAAK;YAClB,aAAa,EAAE,KAAK;YACpB,cAAc,EAAE,KAAK;YACrB,SAAS,EAAE,uBAAuB;SACnC,CAAC;KACH;IACD,KAAK,EAAE,EAA+B;IACtC,MAAM,EAAE,EAA8C;CACvD,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,IAAI,EAAE,GAAG,EAAE,CAAC,CAAC;IACnB,OAAO,EAAE;QACP,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;QAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;YACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;QAClE,CAAC,CAAC;KACH;IACD,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;IAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;QACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;IAClE,CAAC,CAAC;CACH,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,oBAAoB,EAAE,GAAG,EAAE,CAAC,CAAC;IACnC,YAAY,EAAE,EAAE,CAAC,EAAE,CAAC,GAAG,EAAE,CAAC,CAAC;QACzB,OAAO,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,GAAW,EAAE,EAAE,CAAC,CAAC;YAC/B,GAAG,EAAE,GAAG,EAAE,CAAC,CAAC,GAAG,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,SAAS,CAAC;YAChE,GAAG,EAAE,GAAG,EAAE,CAAC,CAAC,GAAG,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC;SAC3D,CAAC,CAAC;KACJ,CAAC,CAAC;CACJ,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,6BAA6B,EAAE,GAAG,EAAE,CAAC,CAAC;IAC5C,4BAA4B,EAAE,EAAE,CAAC,EAAE,CAAC,GAAG,EAAE,CAAC,CAAC;QACzC,YAAY,EAAE,OAAO;KACtB,CAAC,CAAC;CACJ,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,qBAAqB,EAAE,MAAM,mCAAmC,CAAC;AAE1E,QAAQ,CAAC,kBAAkB,EAAE,GAAG,EAAE;IAChC,UAAU,CAAC,GAAG,EAAE;QACd,KAAK,CAAC,MAAM,GAAG,EAAE,CAAC;IACpB,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,sCAAsC,EAAE,GAAG,EAAE;QAC9C,qBAAqB,CAAC;YACpB,IAAI,EAAE,OAAO;YACb,MAAM,EAAE,gBAAgB;YACxB,KAAK,EAAE,qCAAqC;YAC5C,MAAM,EAAE,CAAC;YACT,MAAM,EAAE;gBACN,EAAE;gBACF,sEAAsE;gBACtE,+BAA+B;gBAC/B,sEAAsE;gBACtE,IAAI,CAAC,SAAS,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,EAAE,IAAI,EAAE,CAAC,CAAC;gBAC3C,sEAAsE;gBACtE,EAAE;aACH,CAAC,IAAI,CAAC,IAAI,CAAC;YACZ,eAAe,EAAE,QAAQ;YACzB,MAAM,EAAE;gBACN,EAAE,EAAE,gBAAgB;gBACpB,MAAM,EAAE,KAAK;gBACb,QAAQ,EAAE,EAAE;aACb;SACF,CAAC,CAAC;QAEH,MAAM,cAAc,GAAG,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,iBAAiB,CAAC,CAAC,CAAC;QAC5F,MAAM,CAAC,cAAc,CAAC,CAAC,WAAW,EAAE,CAAC;QACrC,MAAM,CAAC,cAAc,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,sCAAsC,CAAC,CAAC;IACpF,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,+CAA+C,EAAE,GAAG,EAAE;QACvD,qBAAqB,CAAC;YACpB,IAAI,EAAE,aAAa;YACnB,MAAM,EAAE,iBAAiB;YACzB,KAAK,EAAE,6BAA6B;YACpC,MAAM,EAAE,CAAC;YACT,MAAM,EAAE,EAAE;YACV,eAAe,EAAE,QAAQ;YACzB,UAAU,EAAE,2DAA2D;YACvE,MAAM,EAAE;gBACN,EAAE,EAAE,iBAAiB;gBACrB,MAAM,EAAE,IAAI;gBACZ,QAAQ,EAAE,EAAE;aACb;SACF,CAAC,CAAC;QAEH,MAAM,WAAW,GAAG,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC;QACpF,MAAM,CAAC,WAAW,CAAC,CAAC,WAAW,EAAE,CAAC;QAClC,MAAM,CAAC,WAAW,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,YAAY,CAAC,CAAC;IACvD,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,gEAAgE,EAAE,GAAG,EAAE;QACxE,qBAAqB,CAAC;YACpB,IAAI,EAAE,OAAO;YACb,MAAM,EAAE,gBAAgB;YACxB,KAAK,EAAE,qCAAqC;YAC5C,MAAM,EAAE,CAAC;YACT,MAAM,EAAE,EAAE;YACV,eAAe,EAAE,QAAQ;YACzB,MAAM,EAAE;gBACN,EAAE,EAAE,gBAAgB;gBACpB,MAAM,EAAE,IAAI;gBACZ,QAAQ,EAAE,EAAE;aACb;SACF,CAAC,CAAC;QAEH,MAAM,SAAS,GAAG,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC;QAClF,MAAM,CAAC,SAAS,CAAC,CAAC,WAAW,EAAE,CAAC;QAChC,MAAM,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC,SAAS,CAAC,wBAAwB,CAAC,CAAC;QAC5D,MAAM,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC,GAAG,CAAC,SAAS,CAAC,kBAAkB,CAAC,CAAC;QAC1D,MAAM,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC,OAAO,CAAC,uCAAuC,CAAC,CAAC;IAC3E,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n * Verifies that saved harness artifacts include diagnosis data and Markdown reports.\n *\n * Why this exists:\n * - artifact folders should be reviewable without rerunning the agent\n * - diagnosis.json is the quick pointer to the likely subsystem\n * - report.md should preserve Mermaid blocks for artifact viewers\n * - artifact folder timestamps should stay in local time with offset, not UTC `Z`\n * - the writer should persist both files for saved runs\n */\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst state = vi.hoisted(() => ({\n task: {\n id: 7,\n status: \"deferred\",\n initial_query: \"Explain cli/src/agents/MainAgent.ts\",\n summary: \"answer\",\n routing_decision_json: JSON.stringify({\n allowSearch: false,\n allowResearch: false,\n allowTransform: false,\n rationale: \"route=explicit-target\",\n }),\n },\n steps: [] as Record<string, unknown>[],\n writes: [] as Array<{ path: string; content: string }>,\n}));\n\nvi.mock(\"fs\", () => ({\n default: {\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n },\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n}));\n\nvi.mock(\"../../db/client.js\", () => ({\n getDbForRepo: vi.fn(() => ({\n prepare: vi.fn((sql: string) => ({\n get: () => (sql.includes(\"FROM tasks\") ? state.task : undefined),\n all: () => (sql.includes(\"FROM steps\") ? state.steps : []),\n })),\n })),\n}));\n\nvi.mock(\"../../utils/repoIdentity.js\", () => ({\n resolveCanonicalRepoIdentity: vi.fn(() => ({\n repoRootPath: \"/repo\",\n })),\n}));\n\nimport { writeHarnessArtifacts } from \"../../testing/harnessArtifacts.js\";\n\ndescribe(\"harnessArtifacts\", () => {\n beforeEach(() => {\n state.writes = [];\n });\n\n it(\"writes diagnosis.json for saved runs\", () => {\n writeHarnessArtifacts({\n kind: \"evals\",\n caseId: \"diagnosis_case\",\n query: \"Explain cli/src/agents/MainAgent.ts\",\n taskId: 7,\n runLog: [\n \"\",\n \"====================================================================\",\n \"📂 OUTPUT | finalAnswerModule\",\n \"====================================================================\",\n JSON.stringify({ data: \"answer\" }, null, 2),\n \"====================================================================\",\n \"\",\n ].join(\"\\n\"),\n finalAnswerText: \"answer\",\n result: {\n id: \"diagnosis_case\",\n passed: false,\n failures: [],\n },\n });\n\n const diagnosisWrite = state.writes.find((entry) => entry.path.endsWith(\"/diagnosis.json\"));\n expect(diagnosisWrite).toBeDefined();\n expect(diagnosisWrite?.content).toContain(\"\\\"primaryCategory\\\": \\\"persistence\\\"\");\n });\n\n it(\"writes report.md when report text is provided\", () => {\n writeHarnessArtifacts({\n kind: \"integration\",\n caseId: \"markdown_report\",\n query: \"summarize repo architecture\",\n taskId: 7,\n runLog: \"\",\n finalAnswerText: \"answer\",\n reportText: \"# Integration Report | 7\\n\\n```mermaid\\nflowchart TD\\n```\",\n result: {\n id: \"markdown_report\",\n passed: true,\n failures: [],\n },\n });\n\n const reportWrite = state.writes.find((entry) => entry.path.endsWith(\"/report.md\"));\n expect(reportWrite).toBeDefined();\n expect(reportWrite?.content).toContain(\"```mermaid\");\n });\n\n it(\"uses a local-time offset timestamp in generated artifact paths\", () => {\n writeHarnessArtifacts({\n kind: \"evals\",\n caseId: \"timestamp_case\",\n query: \"Explain cli/src/agents/MainAgent.ts\",\n taskId: 7,\n runLog: \"\",\n finalAnswerText: \"answer\",\n result: {\n id: \"timestamp_case\",\n passed: true,\n failures: [],\n },\n });\n\n const caseWrite = state.writes.find((entry) => entry.path.endsWith(\"/case.json\"));\n expect(caseWrite).toBeDefined();\n expect(caseWrite?.path).toContain(\"/repo/artifacts/evals/\");\n expect(caseWrite?.path).not.toContain(\"Z_timestamp_case\");\n expect(caseWrite?.path).toMatch(/[+-]\\d{4}_timestamp_case\\/case\\.json$/);\n });\n});\n"]}
|
|
@@ -0,0 +1,67 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Verifies that integration trace sessions write numbered LLM input files with stable ids.
|
|
3
|
+
*
|
|
4
|
+
* Why this exists:
|
|
5
|
+
* - each model call should leave one reviewable JSON file on disk
|
|
6
|
+
* - repeated calls from the same caller must not overwrite each other
|
|
7
|
+
* - suspicious full-context inputs should be marked for later review
|
|
8
|
+
*/
|
|
9
|
+
import { beforeEach, describe, expect, it, vi } from "vitest";
|
|
10
|
+
const state = vi.hoisted(() => ({
|
|
11
|
+
writes: [],
|
|
12
|
+
}));
|
|
13
|
+
vi.mock("fs", () => ({
|
|
14
|
+
default: {
|
|
15
|
+
mkdirSync: vi.fn(),
|
|
16
|
+
writeFileSync: vi.fn((filePath, content) => {
|
|
17
|
+
state.writes.push({ path: filePath, content: String(content) });
|
|
18
|
+
}),
|
|
19
|
+
},
|
|
20
|
+
mkdirSync: vi.fn(),
|
|
21
|
+
writeFileSync: vi.fn((filePath, content) => {
|
|
22
|
+
state.writes.push({ path: filePath, content: String(content) });
|
|
23
|
+
}),
|
|
24
|
+
}));
|
|
25
|
+
import { startLlmTraceSession, stopLlmTraceSession, writeLlmTraceRecord } from "../../testing/llmTraceSession.js";
|
|
26
|
+
describe("llmTraceSession", () => {
|
|
27
|
+
beforeEach(() => {
|
|
28
|
+
state.writes = [];
|
|
29
|
+
stopLlmTraceSession();
|
|
30
|
+
});
|
|
31
|
+
it("writes numbered trace files with stable call ids", () => {
|
|
32
|
+
startLlmTraceSession("/repo/artifacts/integration/case1");
|
|
33
|
+
const first = writeLlmTraceRecord({
|
|
34
|
+
caller: "finalAnswerModule",
|
|
35
|
+
query: "q1",
|
|
36
|
+
model: "test-model",
|
|
37
|
+
requestBody: { prompt: "one" },
|
|
38
|
+
promptText: "one",
|
|
39
|
+
inputContext: { query: "q1" },
|
|
40
|
+
startedAt: "2026-04-01T02:00:00.000+02:00",
|
|
41
|
+
finishedAt: "2026-04-01T02:00:01.500+02:00",
|
|
42
|
+
durationMs: 1500,
|
|
43
|
+
attemptCount: 1,
|
|
44
|
+
});
|
|
45
|
+
const second = writeLlmTraceRecord({
|
|
46
|
+
caller: "finalAnswerModule",
|
|
47
|
+
query: "q2",
|
|
48
|
+
model: "test-model",
|
|
49
|
+
requestBody: { prompt: "two" },
|
|
50
|
+
promptText: "two",
|
|
51
|
+
inputContext: { initContext: {}, task: {} },
|
|
52
|
+
startedAt: "2026-04-01T02:00:02.000+02:00",
|
|
53
|
+
finishedAt: "2026-04-01T02:00:05.000+02:00",
|
|
54
|
+
durationMs: 3000,
|
|
55
|
+
attemptCount: 2,
|
|
56
|
+
});
|
|
57
|
+
expect(first?.callId).toBe("llm-0001-finalAnswerModule");
|
|
58
|
+
expect(second?.callId).toBe("llm-0002-finalAnswerModule");
|
|
59
|
+
expect(state.writes[0]?.path).toBe("/repo/artifacts/integration/case1/llm_calls/0001_finalAnswerModule.json");
|
|
60
|
+
expect(state.writes[1]?.path).toBe("/repo/artifacts/integration/case1/llm_calls/0002_finalAnswerModule.json");
|
|
61
|
+
expect(state.writes[1]?.content).toContain('"suspiciousFullContext": true');
|
|
62
|
+
expect(state.writes[0]?.content).toContain('"startedAt": "2026-04-01T02:00:00.000+02:00"');
|
|
63
|
+
expect(state.writes[1]?.content).toContain('"durationMs": 3000');
|
|
64
|
+
expect(state.writes[1]?.content).toContain('"attemptCount": 2');
|
|
65
|
+
});
|
|
66
|
+
});
|
|
67
|
+
//# sourceMappingURL=llmTraceSession.test.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"llmTraceSession.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/llmTraceSession.test.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AACH,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,KAAK,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IAC9B,MAAM,EAAE,EAA8C;CACvD,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,IAAI,EAAE,GAAG,EAAE,CAAC,CAAC;IACnB,OAAO,EAAE;QACP,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;QAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;YACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;QAClE,CAAC,CAAC;KACH;IACD,SAAS,EAAE,EAAE,CAAC,EAAE,EAAE;IAClB,aAAa,EAAE,EAAE,CAAC,EAAE,CAAC,CAAC,QAAgB,EAAE,OAAe,EAAE,EAAE;QACzD,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;IAClE,CAAC,CAAC;CACH,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,oBAAoB,EAAE,mBAAmB,EAAE,mBAAmB,EAAE,MAAM,kCAAkC,CAAC;AAElH,QAAQ,CAAC,iBAAiB,EAAE,GAAG,EAAE;IAC/B,UAAU,CAAC,GAAG,EAAE;QACd,KAAK,CAAC,MAAM,GAAG,EAAE,CAAC;QAClB,mBAAmB,EAAE,CAAC;IACxB,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,kDAAkD,EAAE,GAAG,EAAE;QAC1D,oBAAoB,CAAC,mCAAmC,CAAC,CAAC;QAE1D,MAAM,KAAK,GAAG,mBAAmB,CAAC;YAChC,MAAM,EAAE,mBAAmB;YAC3B,KAAK,EAAE,IAAI;YACX,KAAK,EAAE,YAAY;YACnB,WAAW,EAAE,EAAE,MAAM,EAAE,KAAK,EAAE;YAC9B,UAAU,EAAE,KAAK;YACjB,YAAY,EAAE,EAAE,KAAK,EAAE,IAAI,EAAE;YAC7B,SAAS,EAAE,+BAA+B;YAC1C,UAAU,EAAE,+BAA+B;YAC3C,UAAU,EAAE,IAAI;YAChB,YAAY,EAAE,CAAC;SAChB,CAAC,CAAC;QACH,MAAM,MAAM,GAAG,mBAAmB,CAAC;YACjC,MAAM,EAAE,mBAAmB;YAC3B,KAAK,EAAE,IAAI;YACX,KAAK,EAAE,YAAY;YACnB,WAAW,EAAE,EAAE,MAAM,EAAE,KAAK,EAAE;YAC9B,UAAU,EAAE,KAAK;YACjB,YAAY,EAAE,EAAE,WAAW,EAAE,EAAE,EAAE,IAAI,EAAE,EAAE,EAAE;YAC3C,SAAS,EAAE,+BAA+B;YAC1C,UAAU,EAAE,+BAA+B;YAC3C,UAAU,EAAE,IAAI;YAChB,YAAY,EAAE,CAAC;SAChB,CAAC,CAAC;QAEH,MAAM,CAAC,KAAK,EAAE,MAAM,CAAC,CAAC,IAAI,CAAC,4BAA4B,CAAC,CAAC;QACzD,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,IAAI,CAAC,4BAA4B,CAAC,CAAC;QAC1D,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,IAAI,CAAC,CAAC,IAAI,CAAC,yEAAyE,CAAC,CAAC;QAC9G,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,IAAI,CAAC,CAAC,IAAI,CAAC,yEAAyE,CAAC,CAAC;QAC9G,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,+BAA+B,CAAC,CAAC;QAC5E,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,8CAA8C,CAAC,CAAC;QAC3F,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,oBAAoB,CAAC,CAAC;QACjE,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,SAAS,CAAC,mBAAmB,CAAC,CAAC;IAClE,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n * Verifies that integration trace sessions write numbered LLM input files with stable ids.\n *\n * Why this exists:\n * - each model call should leave one reviewable JSON file on disk\n * - repeated calls from the same caller must not overwrite each other\n * - suspicious full-context inputs should be marked for later review\n */\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst state = vi.hoisted(() => ({\n writes: [] as Array<{ path: string; content: string }>,\n}));\n\nvi.mock(\"fs\", () => ({\n default: {\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n },\n mkdirSync: vi.fn(),\n writeFileSync: vi.fn((filePath: string, content: string) => {\n state.writes.push({ path: filePath, content: String(content) });\n }),\n}));\n\nimport { startLlmTraceSession, stopLlmTraceSession, writeLlmTraceRecord } from \"../../testing/llmTraceSession.js\";\n\ndescribe(\"llmTraceSession\", () => {\n beforeEach(() => {\n state.writes = [];\n stopLlmTraceSession();\n });\n\n it(\"writes numbered trace files with stable call ids\", () => {\n startLlmTraceSession(\"/repo/artifacts/integration/case1\");\n\n const first = writeLlmTraceRecord({\n caller: \"finalAnswerModule\",\n query: \"q1\",\n model: \"test-model\",\n requestBody: { prompt: \"one\" },\n promptText: \"one\",\n inputContext: { query: \"q1\" },\n startedAt: \"2026-04-01T02:00:00.000+02:00\",\n finishedAt: \"2026-04-01T02:00:01.500+02:00\",\n durationMs: 1500,\n attemptCount: 1,\n });\n const second = writeLlmTraceRecord({\n caller: \"finalAnswerModule\",\n query: \"q2\",\n model: \"test-model\",\n requestBody: { prompt: \"two\" },\n promptText: \"two\",\n inputContext: { initContext: {}, task: {} },\n startedAt: \"2026-04-01T02:00:02.000+02:00\",\n finishedAt: \"2026-04-01T02:00:05.000+02:00\",\n durationMs: 3000,\n attemptCount: 2,\n });\n\n expect(first?.callId).toBe(\"llm-0001-finalAnswerModule\");\n expect(second?.callId).toBe(\"llm-0002-finalAnswerModule\");\n expect(state.writes[0]?.path).toBe(\"/repo/artifacts/integration/case1/llm_calls/0001_finalAnswerModule.json\");\n expect(state.writes[1]?.path).toBe(\"/repo/artifacts/integration/case1/llm_calls/0002_finalAnswerModule.json\");\n expect(state.writes[1]?.content).toContain('\"suspiciousFullContext\": true');\n expect(state.writes[0]?.content).toContain('\"startedAt\": \"2026-04-01T02:00:00.000+02:00\"');\n expect(state.writes[1]?.content).toContain('\"durationMs\": 3000');\n expect(state.writes[1]?.content).toContain('\"attemptCount\": 2');\n });\n});\n"]}
|
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Verifies the dev CLI exposes only the supported test helpers.
|
|
3
|
+
*
|
|
4
|
+
* Why this file exists:
|
|
5
|
+
* - shell wiring and direct CLI wiring can drift apart
|
|
6
|
+
* - command cleanup should not accidentally remove the remaining test helpers
|
|
7
|
+
*/
|
|
8
|
+
import { Command } from "commander";
|
|
9
|
+
import { beforeEach, describe, expect, it, vi } from "vitest";
|
|
10
|
+
const mockedTestCmd = vi.hoisted(() => ({
|
|
11
|
+
runAllTestsCommand: vi.fn(),
|
|
12
|
+
listRegisteredTests: vi.fn(),
|
|
13
|
+
printTestCommand: vi.fn(),
|
|
14
|
+
runRegisteredTestCommand: vi.fn(),
|
|
15
|
+
}));
|
|
16
|
+
vi.mock("../../commands/TestCmd.js", () => ({
|
|
17
|
+
runAllTestsCommand: mockedTestCmd.runAllTestsCommand,
|
|
18
|
+
listRegisteredTests: mockedTestCmd.listRegisteredTests,
|
|
19
|
+
printTestCommand: mockedTestCmd.printTestCommand,
|
|
20
|
+
runRegisteredTestCommand: mockedTestCmd.runRegisteredTestCommand,
|
|
21
|
+
}));
|
|
22
|
+
import { registerDevCliCommands } from "../../testing/registerDevCliCommands.js";
|
|
23
|
+
describe("registerDevCliCommands", () => {
|
|
24
|
+
beforeEach(() => {
|
|
25
|
+
vi.clearAllMocks();
|
|
26
|
+
});
|
|
27
|
+
it("registers the batch tests command", async () => {
|
|
28
|
+
const cmd = new Command();
|
|
29
|
+
const runQuery = vi.fn().mockResolvedValue(undefined);
|
|
30
|
+
registerDevCliCommands(cmd, runQuery);
|
|
31
|
+
await cmd.parseAsync(["node", "scai", "tests"], { from: "node" });
|
|
32
|
+
expect(mockedTestCmd.runAllTestsCommand).toHaveBeenCalledTimes(1);
|
|
33
|
+
});
|
|
34
|
+
});
|
|
35
|
+
//# sourceMappingURL=registerDevCliCommands.test.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"registerDevCliCommands.test.js","sourceRoot":"","sources":["../../../src/__tests__/testing/registerDevCliCommands.test.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AACH,OAAO,EAAE,OAAO,EAAE,MAAM,WAAW,CAAC;AACpC,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAC;AAE9D,MAAM,aAAa,GAAG,EAAE,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IACtC,kBAAkB,EAAE,EAAE,CAAC,EAAE,EAAE;IAC3B,mBAAmB,EAAE,EAAE,CAAC,EAAE,EAAE;IAC5B,gBAAgB,EAAE,EAAE,CAAC,EAAE,EAAE;IACzB,wBAAwB,EAAE,EAAE,CAAC,EAAE,EAAE;CAClC,CAAC,CAAC,CAAC;AAEJ,EAAE,CAAC,IAAI,CAAC,2BAA2B,EAAE,GAAG,EAAE,CAAC,CAAC;IAC1C,kBAAkB,EAAE,aAAa,CAAC,kBAAkB;IACpD,mBAAmB,EAAE,aAAa,CAAC,mBAAmB;IACtD,gBAAgB,EAAE,aAAa,CAAC,gBAAgB;IAChD,wBAAwB,EAAE,aAAa,CAAC,wBAAwB;CACjE,CAAC,CAAC,CAAC;AAEJ,OAAO,EAAE,sBAAsB,EAAE,MAAM,yCAAyC,CAAC;AAEjF,QAAQ,CAAC,wBAAwB,EAAE,GAAG,EAAE;IACtC,UAAU,CAAC,GAAG,EAAE;QACd,EAAE,CAAC,aAAa,EAAE,CAAC;IACrB,CAAC,CAAC,CAAC;IAEH,EAAE,CAAC,mCAAmC,EAAE,KAAK,IAAI,EAAE;QACjD,MAAM,GAAG,GAAG,IAAI,OAAO,EAAE,CAAC;QAC1B,MAAM,QAAQ,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,iBAAiB,CAAC,SAAS,CAAC,CAAC;QACtD,sBAAsB,CAAC,GAAG,EAAE,QAAQ,CAAC,CAAC;QAEtC,MAAM,GAAG,CAAC,UAAU,CAAC,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,EAAE,IAAI,EAAE,MAAM,EAAE,CAAC,CAAC;QAElE,MAAM,CAAC,aAAa,CAAC,kBAAkB,CAAC,CAAC,qBAAqB,CAAC,CAAC,CAAC,CAAC;IACpE,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC","sourcesContent":["/**\n * Verifies the dev CLI exposes only the supported test helpers.\n *\n * Why this file exists:\n * - shell wiring and direct CLI wiring can drift apart\n * - command cleanup should not accidentally remove the remaining test helpers\n */\nimport { Command } from \"commander\";\nimport { beforeEach, describe, expect, it, vi } from \"vitest\";\n\nconst mockedTestCmd = vi.hoisted(() => ({\n runAllTestsCommand: vi.fn(),\n listRegisteredTests: vi.fn(),\n printTestCommand: vi.fn(),\n runRegisteredTestCommand: vi.fn(),\n}));\n\nvi.mock(\"../../commands/TestCmd.js\", () => ({\n runAllTestsCommand: mockedTestCmd.runAllTestsCommand,\n listRegisteredTests: mockedTestCmd.listRegisteredTests,\n printTestCommand: mockedTestCmd.printTestCommand,\n runRegisteredTestCommand: mockedTestCmd.runRegisteredTestCommand,\n}));\n\nimport { registerDevCliCommands } from \"../../testing/registerDevCliCommands.js\";\n\ndescribe(\"registerDevCliCommands\", () => {\n beforeEach(() => {\n vi.clearAllMocks();\n });\n\n it(\"registers the batch tests command\", async () => {\n const cmd = new Command();\n const runQuery = vi.fn().mockResolvedValue(undefined);\n registerDevCliCommands(cmd, runQuery);\n\n await cmd.parseAsync([\"node\", \"scai\", \"tests\"], { from: \"node\" });\n\n expect(mockedTestCmd.runAllTestsCommand).toHaveBeenCalledTimes(1);\n });\n});\n"]}
|