model-test-bench 1.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (288) hide show
  1. package/LICENSE +201 -0
  2. package/README.md +389 -0
  3. package/dist/bin/mtb.d.ts +3 -0
  4. package/dist/bin/mtb.d.ts.map +1 -0
  5. package/dist/bin/mtb.js +148 -0
  6. package/dist/bin/mtb.js.map +1 -0
  7. package/dist/server/index.d.ts +13 -0
  8. package/dist/server/index.d.ts.map +1 -0
  9. package/dist/server/index.js +72 -0
  10. package/dist/server/index.js.map +1 -0
  11. package/dist/server/interfaces/evaluator.d.ts +15 -0
  12. package/dist/server/interfaces/evaluator.d.ts.map +1 -0
  13. package/dist/server/interfaces/evaluator.js +2 -0
  14. package/dist/server/interfaces/evaluator.js.map +1 -0
  15. package/dist/server/interfaces/logger.d.ts +9 -0
  16. package/dist/server/interfaces/logger.d.ts.map +1 -0
  17. package/dist/server/interfaces/logger.js +2 -0
  18. package/dist/server/interfaces/logger.js.map +1 -0
  19. package/dist/server/interfaces/runner.d.ts +9 -0
  20. package/dist/server/interfaces/runner.d.ts.map +1 -0
  21. package/dist/server/interfaces/runner.js +2 -0
  22. package/dist/server/interfaces/runner.js.map +1 -0
  23. package/dist/server/interfaces/storage.d.ts +36 -0
  24. package/dist/server/interfaces/storage.d.ts.map +1 -0
  25. package/dist/server/interfaces/storage.js +2 -0
  26. package/dist/server/interfaces/storage.js.map +1 -0
  27. package/dist/server/routes/eval-queue.d.ts +23 -0
  28. package/dist/server/routes/eval-queue.d.ts.map +1 -0
  29. package/dist/server/routes/eval-queue.js +45 -0
  30. package/dist/server/routes/eval-queue.js.map +1 -0
  31. package/dist/server/routes/evaluations.d.ts +8 -0
  32. package/dist/server/routes/evaluations.d.ts.map +1 -0
  33. package/dist/server/routes/evaluations.js +221 -0
  34. package/dist/server/routes/evaluations.js.map +1 -0
  35. package/dist/server/routes/providers.d.ts +5 -0
  36. package/dist/server/routes/providers.d.ts.map +1 -0
  37. package/dist/server/routes/providers.js +179 -0
  38. package/dist/server/routes/providers.js.map +1 -0
  39. package/dist/server/routes/run-queue.d.ts +17 -0
  40. package/dist/server/routes/run-queue.d.ts.map +1 -0
  41. package/dist/server/routes/run-queue.js +34 -0
  42. package/dist/server/routes/run-queue.js.map +1 -0
  43. package/dist/server/routes/run-sse.d.ts +18 -0
  44. package/dist/server/routes/run-sse.d.ts.map +1 -0
  45. package/dist/server/routes/run-sse.js +57 -0
  46. package/dist/server/routes/run-sse.js.map +1 -0
  47. package/dist/server/routes/runs.d.ts +9 -0
  48. package/dist/server/routes/runs.d.ts.map +1 -0
  49. package/dist/server/routes/runs.js +380 -0
  50. package/dist/server/routes/runs.js.map +1 -0
  51. package/dist/server/routes/scenarios.d.ts +5 -0
  52. package/dist/server/routes/scenarios.d.ts.map +1 -0
  53. package/dist/server/routes/scenarios.js +181 -0
  54. package/dist/server/routes/scenarios.js.map +1 -0
  55. package/dist/server/services/eval-helpers.d.ts +22 -0
  56. package/dist/server/services/eval-helpers.d.ts.map +1 -0
  57. package/dist/server/services/eval-helpers.js +75 -0
  58. package/dist/server/services/eval-helpers.js.map +1 -0
  59. package/dist/server/services/eval-parsers-debate-impl.d.ts +11 -0
  60. package/dist/server/services/eval-parsers-debate-impl.d.ts.map +1 -0
  61. package/dist/server/services/eval-parsers-debate-impl.js +133 -0
  62. package/dist/server/services/eval-parsers-debate-impl.js.map +1 -0
  63. package/dist/server/services/eval-parsers.d.ts +24 -0
  64. package/dist/server/services/eval-parsers.d.ts.map +1 -0
  65. package/dist/server/services/eval-parsers.js +153 -0
  66. package/dist/server/services/eval-parsers.js.map +1 -0
  67. package/dist/server/services/eval-prompts.d.ts +9 -0
  68. package/dist/server/services/eval-prompts.d.ts.map +1 -0
  69. package/dist/server/services/eval-prompts.js +164 -0
  70. package/dist/server/services/eval-prompts.js.map +1 -0
  71. package/dist/server/services/evaluator.d.ts +10 -0
  72. package/dist/server/services/evaluator.d.ts.map +1 -0
  73. package/dist/server/services/evaluator.js +143 -0
  74. package/dist/server/services/evaluator.js.map +1 -0
  75. package/dist/server/services/fs-adapter.d.ts +20 -0
  76. package/dist/server/services/fs-adapter.d.ts.map +1 -0
  77. package/dist/server/services/fs-adapter.js +13 -0
  78. package/dist/server/services/fs-adapter.js.map +1 -0
  79. package/dist/server/services/instruction-parser.d.ts +26 -0
  80. package/dist/server/services/instruction-parser.d.ts.map +1 -0
  81. package/dist/server/services/instruction-parser.js +121 -0
  82. package/dist/server/services/instruction-parser.js.map +1 -0
  83. package/dist/server/services/log-rotator.d.ts +20 -0
  84. package/dist/server/services/log-rotator.d.ts.map +1 -0
  85. package/dist/server/services/log-rotator.js +60 -0
  86. package/dist/server/services/log-rotator.js.map +1 -0
  87. package/dist/server/services/logger.d.ts +15 -0
  88. package/dist/server/services/logger.d.ts.map +1 -0
  89. package/dist/server/services/logger.js +69 -0
  90. package/dist/server/services/logger.js.map +1 -0
  91. package/dist/server/services/model-factory.d.ts +10 -0
  92. package/dist/server/services/model-factory.d.ts.map +1 -0
  93. package/dist/server/services/model-factory.js +33 -0
  94. package/dist/server/services/model-factory.js.map +1 -0
  95. package/dist/server/services/runner.d.ts +9 -0
  96. package/dist/server/services/runner.d.ts.map +1 -0
  97. package/dist/server/services/runner.js +99 -0
  98. package/dist/server/services/runner.js.map +1 -0
  99. package/dist/server/services/seeder.d.ts +5 -0
  100. package/dist/server/services/seeder.d.ts.map +1 -0
  101. package/dist/server/services/seeder.js +79 -0
  102. package/dist/server/services/seeder.js.map +1 -0
  103. package/dist/server/services/storage-test-helpers.d.ts +15 -0
  104. package/dist/server/services/storage-test-helpers.d.ts.map +1 -0
  105. package/dist/server/services/storage-test-helpers.js +151 -0
  106. package/dist/server/services/storage-test-helpers.js.map +1 -0
  107. package/dist/server/services/storage.d.ts +35 -0
  108. package/dist/server/services/storage.d.ts.map +1 -0
  109. package/dist/server/services/storage.js +219 -0
  110. package/dist/server/services/storage.js.map +1 -0
  111. package/dist/server/services/tools.d.ts +6 -0
  112. package/dist/server/services/tools.d.ts.map +1 -0
  113. package/dist/server/services/tools.js +94 -0
  114. package/dist/server/services/tools.js.map +1 -0
  115. package/dist/server/services/transcript-formatter.d.ts +18 -0
  116. package/dist/server/services/transcript-formatter.d.ts.map +1 -0
  117. package/dist/server/services/transcript-formatter.js +227 -0
  118. package/dist/server/services/transcript-formatter.js.map +1 -0
  119. package/dist/server/services/update-checker.d.ts +3 -0
  120. package/dist/server/services/update-checker.d.ts.map +1 -0
  121. package/dist/server/services/update-checker.js +34 -0
  122. package/dist/server/services/update-checker.js.map +1 -0
  123. package/dist/server/types/evaluation.d.ts +94 -0
  124. package/dist/server/types/evaluation.d.ts.map +1 -0
  125. package/dist/server/types/evaluation.js +5 -0
  126. package/dist/server/types/evaluation.js.map +1 -0
  127. package/dist/server/types/index.d.ts +5 -0
  128. package/dist/server/types/index.d.ts.map +1 -0
  129. package/dist/server/types/index.js +5 -0
  130. package/dist/server/types/index.js.map +1 -0
  131. package/dist/server/types/provider.d.ts +23 -0
  132. package/dist/server/types/provider.d.ts.map +1 -0
  133. package/dist/server/types/provider.js +5 -0
  134. package/dist/server/types/provider.js.map +1 -0
  135. package/dist/server/types/run.d.ts +31 -0
  136. package/dist/server/types/run.d.ts.map +1 -0
  137. package/dist/server/types/run.js +5 -0
  138. package/dist/server/types/run.js.map +1 -0
  139. package/dist/server/types/scenario.d.ts +19 -0
  140. package/dist/server/types/scenario.d.ts.map +1 -0
  141. package/dist/server/types/scenario.js +5 -0
  142. package/dist/server/types/scenario.js.map +1 -0
  143. package/dist/src/server/index.d.ts +13 -0
  144. package/dist/src/server/index.d.ts.map +1 -0
  145. package/dist/src/server/index.js +72 -0
  146. package/dist/src/server/index.js.map +1 -0
  147. package/dist/src/server/interfaces/evaluator.d.ts +15 -0
  148. package/dist/src/server/interfaces/evaluator.d.ts.map +1 -0
  149. package/dist/src/server/interfaces/evaluator.js +2 -0
  150. package/dist/src/server/interfaces/evaluator.js.map +1 -0
  151. package/dist/src/server/interfaces/logger.d.ts +9 -0
  152. package/dist/src/server/interfaces/logger.d.ts.map +1 -0
  153. package/dist/src/server/interfaces/logger.js +2 -0
  154. package/dist/src/server/interfaces/logger.js.map +1 -0
  155. package/dist/src/server/interfaces/runner.d.ts +9 -0
  156. package/dist/src/server/interfaces/runner.d.ts.map +1 -0
  157. package/dist/src/server/interfaces/runner.js +2 -0
  158. package/dist/src/server/interfaces/runner.js.map +1 -0
  159. package/dist/src/server/interfaces/storage.d.ts +36 -0
  160. package/dist/src/server/interfaces/storage.d.ts.map +1 -0
  161. package/dist/src/server/interfaces/storage.js +2 -0
  162. package/dist/src/server/interfaces/storage.js.map +1 -0
  163. package/dist/src/server/routes/eval-queue.d.ts +23 -0
  164. package/dist/src/server/routes/eval-queue.d.ts.map +1 -0
  165. package/dist/src/server/routes/eval-queue.js +45 -0
  166. package/dist/src/server/routes/eval-queue.js.map +1 -0
  167. package/dist/src/server/routes/evaluations.d.ts +8 -0
  168. package/dist/src/server/routes/evaluations.d.ts.map +1 -0
  169. package/dist/src/server/routes/evaluations.js +221 -0
  170. package/dist/src/server/routes/evaluations.js.map +1 -0
  171. package/dist/src/server/routes/providers.d.ts +5 -0
  172. package/dist/src/server/routes/providers.d.ts.map +1 -0
  173. package/dist/src/server/routes/providers.js +179 -0
  174. package/dist/src/server/routes/providers.js.map +1 -0
  175. package/dist/src/server/routes/run-queue.d.ts +17 -0
  176. package/dist/src/server/routes/run-queue.d.ts.map +1 -0
  177. package/dist/src/server/routes/run-queue.js +34 -0
  178. package/dist/src/server/routes/run-queue.js.map +1 -0
  179. package/dist/src/server/routes/run-sse.d.ts +18 -0
  180. package/dist/src/server/routes/run-sse.d.ts.map +1 -0
  181. package/dist/src/server/routes/run-sse.js +57 -0
  182. package/dist/src/server/routes/run-sse.js.map +1 -0
  183. package/dist/src/server/routes/runs.d.ts +9 -0
  184. package/dist/src/server/routes/runs.d.ts.map +1 -0
  185. package/dist/src/server/routes/runs.js +380 -0
  186. package/dist/src/server/routes/runs.js.map +1 -0
  187. package/dist/src/server/routes/scenarios.d.ts +5 -0
  188. package/dist/src/server/routes/scenarios.d.ts.map +1 -0
  189. package/dist/src/server/routes/scenarios.js +181 -0
  190. package/dist/src/server/routes/scenarios.js.map +1 -0
  191. package/dist/src/server/services/eval-helpers.d.ts +22 -0
  192. package/dist/src/server/services/eval-helpers.d.ts.map +1 -0
  193. package/dist/src/server/services/eval-helpers.js +75 -0
  194. package/dist/src/server/services/eval-helpers.js.map +1 -0
  195. package/dist/src/server/services/eval-parsers-debate-impl.d.ts +11 -0
  196. package/dist/src/server/services/eval-parsers-debate-impl.d.ts.map +1 -0
  197. package/dist/src/server/services/eval-parsers-debate-impl.js +133 -0
  198. package/dist/src/server/services/eval-parsers-debate-impl.js.map +1 -0
  199. package/dist/src/server/services/eval-parsers.d.ts +24 -0
  200. package/dist/src/server/services/eval-parsers.d.ts.map +1 -0
  201. package/dist/src/server/services/eval-parsers.js +153 -0
  202. package/dist/src/server/services/eval-parsers.js.map +1 -0
  203. package/dist/src/server/services/eval-prompts.d.ts +9 -0
  204. package/dist/src/server/services/eval-prompts.d.ts.map +1 -0
  205. package/dist/src/server/services/eval-prompts.js +164 -0
  206. package/dist/src/server/services/eval-prompts.js.map +1 -0
  207. package/dist/src/server/services/evaluator.d.ts +10 -0
  208. package/dist/src/server/services/evaluator.d.ts.map +1 -0
  209. package/dist/src/server/services/evaluator.js +143 -0
  210. package/dist/src/server/services/evaluator.js.map +1 -0
  211. package/dist/src/server/services/fs-adapter.d.ts +20 -0
  212. package/dist/src/server/services/fs-adapter.d.ts.map +1 -0
  213. package/dist/src/server/services/fs-adapter.js +13 -0
  214. package/dist/src/server/services/fs-adapter.js.map +1 -0
  215. package/dist/src/server/services/instruction-parser.d.ts +26 -0
  216. package/dist/src/server/services/instruction-parser.d.ts.map +1 -0
  217. package/dist/src/server/services/instruction-parser.js +121 -0
  218. package/dist/src/server/services/instruction-parser.js.map +1 -0
  219. package/dist/src/server/services/log-rotator.d.ts +20 -0
  220. package/dist/src/server/services/log-rotator.d.ts.map +1 -0
  221. package/dist/src/server/services/log-rotator.js +60 -0
  222. package/dist/src/server/services/log-rotator.js.map +1 -0
  223. package/dist/src/server/services/logger.d.ts +15 -0
  224. package/dist/src/server/services/logger.d.ts.map +1 -0
  225. package/dist/src/server/services/logger.js +69 -0
  226. package/dist/src/server/services/logger.js.map +1 -0
  227. package/dist/src/server/services/model-factory.d.ts +10 -0
  228. package/dist/src/server/services/model-factory.d.ts.map +1 -0
  229. package/dist/src/server/services/model-factory.js +33 -0
  230. package/dist/src/server/services/model-factory.js.map +1 -0
  231. package/dist/src/server/services/runner.d.ts +9 -0
  232. package/dist/src/server/services/runner.d.ts.map +1 -0
  233. package/dist/src/server/services/runner.js +99 -0
  234. package/dist/src/server/services/runner.js.map +1 -0
  235. package/dist/src/server/services/seeder.d.ts +5 -0
  236. package/dist/src/server/services/seeder.d.ts.map +1 -0
  237. package/dist/src/server/services/seeder.js +79 -0
  238. package/dist/src/server/services/seeder.js.map +1 -0
  239. package/dist/src/server/services/storage.d.ts +35 -0
  240. package/dist/src/server/services/storage.d.ts.map +1 -0
  241. package/dist/src/server/services/storage.js +219 -0
  242. package/dist/src/server/services/storage.js.map +1 -0
  243. package/dist/src/server/services/tools.d.ts +6 -0
  244. package/dist/src/server/services/tools.d.ts.map +1 -0
  245. package/dist/src/server/services/tools.js +94 -0
  246. package/dist/src/server/services/tools.js.map +1 -0
  247. package/dist/src/server/services/transcript-formatter.d.ts +18 -0
  248. package/dist/src/server/services/transcript-formatter.d.ts.map +1 -0
  249. package/dist/src/server/services/transcript-formatter.js +227 -0
  250. package/dist/src/server/services/transcript-formatter.js.map +1 -0
  251. package/dist/src/server/services/update-checker.d.ts +3 -0
  252. package/dist/src/server/services/update-checker.d.ts.map +1 -0
  253. package/dist/src/server/services/update-checker.js +34 -0
  254. package/dist/src/server/services/update-checker.js.map +1 -0
  255. package/dist/src/server/types/evaluation.d.ts +94 -0
  256. package/dist/src/server/types/evaluation.d.ts.map +1 -0
  257. package/dist/src/server/types/evaluation.js +5 -0
  258. package/dist/src/server/types/evaluation.js.map +1 -0
  259. package/dist/src/server/types/index.d.ts +5 -0
  260. package/dist/src/server/types/index.d.ts.map +1 -0
  261. package/dist/src/server/types/index.js +5 -0
  262. package/dist/src/server/types/index.js.map +1 -0
  263. package/dist/src/server/types/provider.d.ts +23 -0
  264. package/dist/src/server/types/provider.d.ts.map +1 -0
  265. package/dist/src/server/types/provider.js +5 -0
  266. package/dist/src/server/types/provider.js.map +1 -0
  267. package/dist/src/server/types/run.d.ts +31 -0
  268. package/dist/src/server/types/run.d.ts.map +1 -0
  269. package/dist/src/server/types/run.js +5 -0
  270. package/dist/src/server/types/run.js.map +1 -0
  271. package/dist/src/server/types/scenario.d.ts +19 -0
  272. package/dist/src/server/types/scenario.d.ts.map +1 -0
  273. package/dist/src/server/types/scenario.js +5 -0
  274. package/dist/src/server/types/scenario.js.map +1 -0
  275. package/dist/web/assets/index-AJu1Yn5F.js +70 -0
  276. package/dist/web/assets/index-C_ioEISr.css +1 -0
  277. package/dist/web/index.html +15 -0
  278. package/docs/schemas/provider-api.example.json +12 -0
  279. package/docs/schemas/provider-openai.example.json +11 -0
  280. package/docs/schemas/scenario-baseline.example.json +24 -0
  281. package/docs/schemas/scenario-carwash-baseline.example.json +22 -0
  282. package/docs/schemas/scenario-carwash-with-system-prompt.example.json +24 -0
  283. package/docs/schemas/scenario-golden-rules-baseline.example.json +24 -0
  284. package/docs/schemas/scenario-golden-rules-with-system-prompt.example.json +28 -0
  285. package/docs/schemas/scenario-negative-analysis-baseline.example.json +23 -0
  286. package/docs/schemas/scenario-negative-analysis-with-system-prompt.example.json +25 -0
  287. package/docs/schemas/scenario-with-system-prompt.example.json +25 -0
  288. package/package.json +97 -0
@@ -0,0 +1,143 @@
1
+ // ---------------------------------------------------------------------------
2
+ // Evaluator — orchestrates evaluation pipeline via Vercel AI SDK
3
+ // ---------------------------------------------------------------------------
4
+ import { generateText } from 'ai';
5
+ import { createModel } from './model-factory.js';
6
+ import { formatTranscript } from './transcript-formatter.js';
7
+ import { parseAllInstructions } from './instruction-parser.js';
8
+ import { buildScorePrompt, buildCompliancePrompt, buildDebatePrompt, buildSynthesisPrompt, } from './eval-prompts.js';
9
+ import { parseScoreResponse, parseComplianceResponse, parseSynthesisResponse, parseDebateResponse, toIndividualEvaluations, } from './eval-parsers.js';
10
+ import { checkConsensus, buildAnswerComparison, buildCriticalResults, mergeCompliance, } from './eval-helpers.js';
11
+ // ---------------------------------------------------------------------------
12
+ // Implementation
13
+ // ---------------------------------------------------------------------------
14
+ export class EvaluationOrchestrator {
15
+ async evaluateRun(run, scenario, provider, request, callbacks) {
16
+ callbacks.onStatusChange('running');
17
+ callbacks.onProgress('preparing', 'Formatting transcript and parsing instructions...');
18
+ const { text: transcript, summary } = formatTranscript(run.messages);
19
+ const instructions = parseAllInstructions(scenario.systemPrompt
20
+ ? [{ content: scenario.systemPrompt, source: 'system_prompt' }]
21
+ : []);
22
+ const accumulators = request.evaluators.map((e) => ({
23
+ role: e.role, costUsd: 0, tokensIn: 0, tokensOut: 0, rounds: 0,
24
+ scoreResult: {}, complianceResult: {}, assessmentText: '',
25
+ }));
26
+ // ── Round 1 ──────────────────────────────────────────────────────
27
+ callbacks.onProgress('scoring', `Running score and compliance queries (${request.evaluators.length} evaluator${request.evaluators.length > 1 ? 's' : ''})...`);
28
+ const round1Evals = await this.runRound1(request.evaluators, accumulators, transcript, scenario, provider, instructions, summary, callbacks);
29
+ const round1Consensus = request.maxRounds <= 1 || checkConsensus(accumulators);
30
+ const rounds = [{
31
+ roundNumber: 1, evaluations: round1Evals,
32
+ consensusReached: round1Consensus, timestamp: new Date().toISOString(),
33
+ }];
34
+ // ── Multi-round debate ───────────────────────────────────────────
35
+ if (request.maxRounds > 1 && !round1Consensus) {
36
+ for (let roundNum = 2; roundNum <= request.maxRounds; roundNum++) {
37
+ callbacks.onProgress('debate', `Debate round ${roundNum} of ${request.maxRounds}...`);
38
+ const debateEvals = await this.runDebateRound(request.evaluators, accumulators, roundNum, callbacks);
39
+ const consensus = checkConsensus(accumulators);
40
+ rounds.push({
41
+ roundNumber: roundNum, evaluations: debateEvals,
42
+ consensusReached: consensus, timestamp: new Date().toISOString(),
43
+ });
44
+ if (consensus)
45
+ break;
46
+ }
47
+ }
48
+ // ── Synthesis ────────────────────────────────────────────────────
49
+ callbacks.onProgress('synthesis', 'Synthesizing final scores and confidence...');
50
+ const latestRound = rounds[rounds.length - 1];
51
+ const latestEvals = latestRound.evaluations;
52
+ const synthesizer = request.evaluators[request.evaluators.length - 1];
53
+ const synthInfo = { phase: 'synthesis', evaluatorRole: synthesizer.role, roundNumber: rounds.length };
54
+ const synthResult = await this.runSynthesis(synthesizer, latestEvals, scenario, provider, accumulators, callbacks, synthInfo);
55
+ // ── Assemble final evaluation ────────────────────────────────────
56
+ const ledger = accumulators.map((a) => ({
57
+ evaluatorRole: a.role, totalCostUsd: a.costUsd,
58
+ totalTokensIn: a.tokensIn, totalTokensOut: a.tokensOut, roundsParticipated: a.rounds,
59
+ }));
60
+ const now = new Date().toISOString();
61
+ callbacks.onProgress('complete', 'Evaluation finished.');
62
+ callbacks.onStatusChange('completed');
63
+ return {
64
+ id: '', runId: run.id, status: 'completed', evaluators: request.evaluators, rounds,
65
+ answerComparison: buildAnswerComparison(accumulators),
66
+ criticalResults: buildCriticalResults(accumulators, scenario),
67
+ setupCompliance: { instructionCompliance: mergeCompliance(accumulators) },
68
+ synthesis: {
69
+ dimensionScores: synthResult.dimensionScores ?? {}, weightedTotal: synthResult.weightedTotal ?? 0,
70
+ confidence: synthResult.confidence ?? 0, dissenting: synthResult.dissenting ?? [],
71
+ },
72
+ ledger, totalCostUsd: ledger.reduce((sum, l) => sum + l.totalCostUsd, 0),
73
+ createdAt: now, updatedAt: now,
74
+ };
75
+ }
76
+ // ─── Round 1: Score + Compliance ─────────────────────────────────────
77
+ async runRound1(evaluators, accumulators, transcript, scenario, provider, instructions, summary, callbacks) {
78
+ const promises = evaluators.map(async (evaluator, idx) => {
79
+ const acc = accumulators[idx];
80
+ acc.rounds++;
81
+ const scoreInfo = { phase: 'score', evaluatorRole: evaluator.role, roundNumber: 1 };
82
+ const scoreResp = await this.runQuery(evaluator, buildScorePrompt(transcript, scenario, summary), callbacks, scoreInfo);
83
+ acc.costUsd += scoreResp.costUsd;
84
+ acc.scoreResult = parseScoreResponse(scoreResp.text);
85
+ acc.assessmentText = scoreResp.text;
86
+ const compInfo = { phase: 'compliance', evaluatorRole: evaluator.role, roundNumber: 1 };
87
+ const compResp = await this.runQuery(evaluator, buildCompliancePrompt(transcript, scenario, instructions), callbacks, compInfo);
88
+ acc.costUsd += compResp.costUsd;
89
+ acc.complianceResult = parseComplianceResponse(compResp.text);
90
+ return toIndividualEvaluations(acc.scoreResult.scores ?? {}, evaluator.role, {});
91
+ });
92
+ return (await Promise.all(promises)).flat();
93
+ }
94
+ // ─── Multi-round debate ──────────────────────────────────────────────
95
+ async runDebateRound(evaluators, accumulators, roundNumber, callbacks) {
96
+ const promises = evaluators.map(async (evaluator, idx) => {
97
+ const acc = accumulators[idx];
98
+ acc.rounds++;
99
+ const others = accumulators.filter((_, i) => i !== idx).map((a) => a.assessmentText);
100
+ const info = { phase: 'debate', evaluatorRole: evaluator.role, roundNumber };
101
+ const resp = await this.runQuery(evaluator, buildDebatePrompt(acc.assessmentText, others, roundNumber), callbacks, info);
102
+ acc.costUsd += resp.costUsd;
103
+ const result = parseDebateResponse(resp.text);
104
+ if (result.updatedScores && Object.keys(result.updatedScores).length > 0) {
105
+ acc.scoreResult = { ...acc.scoreResult, scores: result.updatedScores };
106
+ }
107
+ acc.assessmentText = resp.text;
108
+ return toIndividualEvaluations(acc.scoreResult.scores ?? {}, evaluator.role, {});
109
+ });
110
+ return (await Promise.all(promises)).flat();
111
+ }
112
+ // ─── Synthesis ───────────────────────────────────────────────────────
113
+ async runSynthesis(synthesizer, allEvals, scenario, provider, accumulators, callbacks, info) {
114
+ const resp = await this.runQuery(synthesizer, buildSynthesisPrompt(allEvals, scenario, provider), callbacks, info);
115
+ const acc = accumulators.find((a) => a.role === synthesizer.role);
116
+ if (acc)
117
+ acc.costUsd += resp.costUsd;
118
+ return parseSynthesisResponse(resp.text);
119
+ }
120
+ // ─── AI SDK query wrapper ─────────────────────────────────────────────
121
+ async runQuery(evaluator, prompt, callbacks, info) {
122
+ const model = createModel({
123
+ providerName: evaluator.providerName,
124
+ model: evaluator.model,
125
+ apiKey: evaluator.apiKey,
126
+ baseUrl: evaluator.baseUrl,
127
+ });
128
+ const result = await generateText({ model, prompt, maxOutputTokens: 4096 });
129
+ const record = {
130
+ timestamp: new Date().toISOString(),
131
+ message: {
132
+ type: 'eval_response',
133
+ text: result.text,
134
+ usage: result.usage,
135
+ },
136
+ };
137
+ callbacks.onMessage(info, record);
138
+ // Token-based cost calculation (provider-specific pricing TBD)
139
+ const costUsd = 0;
140
+ return { text: result.text, costUsd };
141
+ }
142
+ }
143
+ //# sourceMappingURL=evaluator.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"evaluator.js","sourceRoot":"","sources":["../../../src/server/services/evaluator.ts"],"names":[],"mappings":"AAAA,8EAA8E;AAC9E,iEAAiE;AACjE,8EAA8E;AAE9E,OAAO,EAAE,YAAY,EAAE,MAAM,IAAI,CAAC;AAclC,OAAO,EAAE,WAAW,EAAE,MAAM,oBAAoB,CAAC;AACjD,OAAO,EAAE,gBAAgB,EAAE,MAAM,2BAA2B,CAAC;AAC7D,OAAO,EAAE,oBAAoB,EAAE,MAAM,yBAAyB,CAAC;AAC/D,OAAO,EACL,gBAAgB,EAChB,qBAAqB,EACrB,iBAAiB,EACjB,oBAAoB,GACrB,MAAM,mBAAmB,CAAC;AAC3B,OAAO,EACL,kBAAkB,EAClB,uBAAuB,EACvB,sBAAsB,EACtB,mBAAmB,EACnB,uBAAuB,GACxB,MAAM,mBAAmB,CAAC;AAC3B,OAAO,EACL,cAAc,EACd,qBAAqB,EACrB,oBAAoB,EACpB,eAAe,GAChB,MAAM,mBAAmB,CAAC;AAG3B,8EAA8E;AAC9E,iBAAiB;AACjB,8EAA8E;AAE9E,MAAM,OAAO,sBAAsB;IACjC,KAAK,CAAC,WAAW,CACf,GAAQ,EACR,QAAkB,EAClB,QAAkB,EAClB,OAA0B,EAC1B,SAA8B;QAE9B,SAAS,CAAC,cAAc,CAAC,SAAS,CAAC,CAAC;QACpC,SAAS,CAAC,UAAU,CAAC,WAAW,EAAE,mDAAmD,CAAC,CAAC;QAEvF,MAAM,EAAE,IAAI,EAAE,UAAU,EAAE,OAAO,EAAE,GAAG,gBAAgB,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;QACrE,MAAM,YAAY,GAAG,oBAAoB,CACvC,QAAQ,CAAC,YAAY;YACnB,CAAC,CAAC,CAAC,EAAE,OAAO,EAAE,QAAQ,CAAC,YAAY,EAAE,MAAM,EAAE,eAAe,EAAE,CAAC;YAC/D,CAAC,CAAC,EAAE,CACP,CAAC;QAEF,MAAM,YAAY,GAA2B,OAAO,CAAC,UAAU,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;YAC1E,IAAI,EAAE,CAAC,CAAC,IAAI,EAAE,OAAO,EAAE,CAAC,EAAE,QAAQ,EAAE,CAAC,EAAE,SAAS,EAAE,CAAC,EAAE,MAAM,EAAE,CAAC;YAC9D,WAAW,EAAE,EAAE,EAAE,gBAAgB,EAAE,EAAE,EAAE,cAAc,EAAE,EAAE;SAC1D,CAAC,CAAC,CAAC;QAEJ,oEAAoE;QACpE,SAAS,CAAC,UAAU,CAAC,SAAS,EAAE,yCAAyC,OAAO,CAAC,UAAU,CAAC,MAAM,aAAa,OAAO,CAAC,UAAU,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,MAAM,CAAC,CAAC;QAC/J,MAAM,WAAW,GAAG,MAAM,IAAI,CAAC,SAAS,CACtC,OAAO,CAAC,UAAU,EAAE,YAAY,EAAE,UAAU,EAAE,QAAQ,EAAE,QAAQ,EAAE,YAAY,EAAE,OAAO,EAAE,SAAS,CACnG,CAAC;QACF,MAAM,eAAe,GAAG,OAAO,CAAC,SAAS,IAAI,CAAC,IAAI,cAAc,CAAC,YAAY,CAAC,CAAC;QAC/E,MAAM,MAAM,GAAsB,CAAC;gBACjC,WAAW,EAAE,CAAC,EAAE,WAAW,EAAE,WAAW;gBACxC,gBAAgB,EAAE,eAAe,EAAE,SAAS,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;aACvE,CAAC,CAAC;QAEH,oEAAoE;QACpE,IAAI,OAAO,CAAC,SAAS,GAAG,CAAC,IAAI,CAAC,eAAe,EAAE,CAAC;YAC9C,KAAK,IAAI,QAAQ,GAAG,CAAC,EAAE,QAAQ,IAAI,OAAO,CAAC,SAAS,EAAE,QAAQ,EAAE,EAAE,CAAC;gBACjE,SAAS,CAAC,UAAU,CAAC,QAAQ,EAAE,gBAAgB,QAAQ,OAAO,OAAO,CAAC,SAAS,KAAK,CAAC,CAAC;gBACtF,MAAM,WAAW,GAAG,MAAM,IAAI,CAAC,cAAc,CAAC,OAAO,CAAC,UAAU,EAAE,YAAY,EAAE,QAAQ,EAAE,SAAS,CAAC,CAAC;gBACrG,MAAM,SAAS,GAAG,cAAc,CAAC,YAAY,CAAC,CAAC;gBAC/C,MAAM,CAAC,IAAI,CAAC;oBACV,WAAW,EAAE,QAAQ,EAAE,WAAW,EAAE,WAAW;oBAC/C,gBAAgB,EAAE,SAAS,EAAE,SAAS,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;iBACjE,CAAC,CAAC;gBACH,IAAI,SAAS;oBAAE,MAAM;YACvB,CAAC;QACH,CAAC;QAED,oEAAoE;QACpE,SAAS,CAAC,UAAU,CAAC,WAAW,EAAE,6CAA6C,CAAC,CAAC;QACjF,MAAM,WAAW,GAAG,MAAM,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;QAC9C,MAAM,WAAW,GAAG,WAAW,CAAC,WAAW,CAAC;QAC5C,MAAM,WAAW,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,UAAU,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;QACtE,MAAM,SAAS,GAAoB,EAAE,KAAK,EAAE,WAAW,EAAE,aAAa,EAAE,WAAW,CAAC,IAAI,EAAE,WAAW,EAAE,MAAM,CAAC,MAAM,EAAE,CAAC;QACvH,MAAM,WAAW,GAAG,MAAM,IAAI,CAAC,YAAY,CAAC,WAAW,EAAE,WAAW,EAAE,QAAQ,EAAE,QAAQ,EAAE,YAAY,EAAE,SAAS,EAAE,SAAS,CAAC,CAAC;QAE9H,oEAAoE;QACpE,MAAM,MAAM,GAAsB,YAAY,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;YACzD,aAAa,EAAE,CAAC,CAAC,IAAI,EAAE,YAAY,EAAE,CAAC,CAAC,OAAO;YAC9C,aAAa,EAAE,CAAC,CAAC,QAAQ,EAAE,cAAc,EAAE,CAAC,CAAC,SAAS,EAAE,kBAAkB,EAAE,CAAC,CAAC,MAAM;SACrF,CAAC,CAAC,CAAC;QACJ,MAAM,GAAG,GAAG,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC;QACrC,SAAS,CAAC,UAAU,CAAC,UAAU,EAAE,sBAAsB,CAAC,CAAC;QACzD,SAAS,CAAC,cAAc,CAAC,WAAW,CAAC,CAAC;QAEtC,OAAO;YACL,EAAE,EAAE,EAAE,EAAE,KAAK,EAAE,GAAG,CAAC,EAAE,EAAE,MAAM,EAAE,WAAW,EAAE,UAAU,EAAE,OAAO,CAAC,UAAU,EAAE,MAAM;YAClF,gBAAgB,EAAE,qBAAqB,CAAC,YAAY,CAAC;YACrD,eAAe,EAAE,oBAAoB,CAAC,YAAY,EAAE,QAAQ,CAAC;YAC7D,eAAe,EAAE,EAAE,qBAAqB,EAAE,eAAe,CAAC,YAAY,CAAC,EAAE;YACzE,SAAS,EAAE;gBACT,eAAe,EAAE,WAAW,CAAC,eAAe,IAAI,EAAE,EAAE,aAAa,EAAE,WAAW,CAAC,aAAa,IAAI,CAAC;gBACjG,UAAU,EAAE,WAAW,CAAC,UAAU,IAAI,CAAC,EAAE,UAAU,EAAE,WAAW,CAAC,UAAU,IAAI,EAAE;aAClF;YACD,MAAM,EAAE,YAAY,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,GAAG,GAAG,CAAC,CAAC,YAAY,EAAE,CAAC,CAAC;YACxE,SAAS,EAAE,GAAG,EAAE,SAAS,EAAE,GAAG;SAC/B,CAAC;IACJ,CAAC;IAED,wEAAwE;IAEhE,KAAK,CAAC,SAAS,CACrB,UAAsC,EACtC,YAAoC,EACpC,UAAkB,EAClB,QAAkB,EAClB,QAAkB,EAClB,YAAqD,EACrD,OAAuD,EACvD,SAA8B;QAE9B,MAAM,QAAQ,GAAG,UAAU,CAAC,GAAG,CAAC,KAAK,EAAE,SAAS,EAAE,GAAG,EAAE,EAAE;YACvD,MAAM,GAAG,GAAG,YAAY,CAAC,GAAG,CAAC,CAAC;YAC9B,GAAG,CAAC,MAAM,EAAE,CAAC;YACb,MAAM,SAAS,GAAoB,EAAE,KAAK,EAAE,OAAO,EAAE,aAAa,EAAE,SAAS,CAAC,IAAI,EAAE,WAAW,EAAE,CAAC,EAAE,CAAC;YACrG,MAAM,SAAS,GAAG,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,EAAE,gBAAgB,CAAC,UAAU,EAAE,QAAQ,EAAE,OAAO,CAAC,EAAE,SAAS,EAAE,SAAS,CAAC,CAAC;YACxH,GAAG,CAAC,OAAO,IAAI,SAAS,CAAC,OAAO,CAAC;YACjC,GAAG,CAAC,WAAW,GAAG,kBAAkB,CAAC,SAAS,CAAC,IAAI,CAAC,CAAC;YACrD,GAAG,CAAC,cAAc,GAAG,SAAS,CAAC,IAAI,CAAC;YACpC,MAAM,QAAQ,GAAoB,EAAE,KAAK,EAAE,YAAY,EAAE,aAAa,EAAE,SAAS,CAAC,IAAI,EAAE,WAAW,EAAE,CAAC,EAAE,CAAC;YACzG,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,EAAE,qBAAqB,CAAC,UAAU,EAAE,QAAQ,EAAE,YAAY,CAAC,EAAE,SAAS,EAAE,QAAQ,CAAC,CAAC;YAChI,GAAG,CAAC,OAAO,IAAI,QAAQ,CAAC,OAAO,CAAC;YAChC,GAAG,CAAC,gBAAgB,GAAG,uBAAuB,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAC;YAC9D,OAAO,uBAAuB,CAAC,GAAG,CAAC,WAAW,CAAC,MAAM,IAAI,EAAE,EAAE,SAAS,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC;QACnF,CAAC,CAAC,CAAC;QACH,OAAO,CAAC,MAAM,OAAO,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;IAC9C,CAAC;IAED,wEAAwE;IAEhE,KAAK,CAAC,cAAc,CAC1B,UAAsC,EACtC,YAAoC,EACpC,WAAmB,EACnB,SAA8B;QAE9B,MAAM,QAAQ,GAAG,UAAU,CAAC,GAAG,CAAC,KAAK,EAAE,SAAS,EAAE,GAAG,EAAE,EAAE;YACvD,MAAM,GAAG,GAAG,YAAY,CAAC,GAAG,CAAC,CAAC;YAC9B,GAAG,CAAC,MAAM,EAAE,CAAC;YACb,MAAM,MAAM,GAAG,YAAY,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,KAAK,GAAG,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,cAAc,CAAC,CAAC;YACrF,MAAM,IAAI,GAAoB,EAAE,KAAK,EAAE,QAAQ,EAAE,aAAa,EAAE,SAAS,CAAC,IAAI,EAAE,WAAW,EAAE,CAAC;YAC9F,MAAM,IAAI,GAAG,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,EAAE,iBAAiB,CAAC,GAAG,CAAC,cAAc,EAAE,MAAM,EAAE,WAAW,CAAC,EAAE,SAAS,EAAE,IAAI,CAAC,CAAC;YACzH,GAAG,CAAC,OAAO,IAAI,IAAI,CAAC,OAAO,CAAC;YAC5B,MAAM,MAAM,GAAG,mBAAmB,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;YAC9C,IAAI,MAAM,CAAC,aAAa,IAAI,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,aAAa,CAAC,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBACzE,GAAG,CAAC,WAAW,GAAG,EAAE,GAAG,GAAG,CAAC,WAAW,EAAE,MAAM,EAAE,MAAM,CAAC,aAAa,EAAE,CAAC;YACzE,CAAC;YACD,GAAG,CAAC,cAAc,GAAG,IAAI,CAAC,IAAI,CAAC;YAC/B,OAAO,uBAAuB,CAAC,GAAG,CAAC,WAAW,CAAC,MAAM,IAAI,EAAE,EAAE,SAAS,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC;QACnF,CAAC,CAAC,CAAC;QACH,OAAO,CAAC,MAAM,OAAO,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;IAC9C,CAAC;IAED,wEAAwE;IAEhE,KAAK,CAAC,YAAY,CACxB,WAA4B,EAC5B,QAAyC,EACzC,QAAkB,EAClB,QAAkB,EAClB,YAAoC,EACpC,SAA8B,EAC9B,IAAqB;QAErB,MAAM,IAAI,GAAG,MAAM,IAAI,CAAC,QAAQ,CAAC,WAAW,EAAE,oBAAoB,CAAC,QAAQ,EAAE,QAAQ,EAAE,QAAQ,CAAC,EAAE,SAAS,EAAE,IAAI,CAAC,CAAC;QACnH,MAAM,GAAG,GAAG,YAAY,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,WAAW,CAAC,IAAI,CAAC,CAAC;QAClE,IAAI,GAAG;YAAE,GAAG,CAAC,OAAO,IAAI,IAAI,CAAC,OAAO,CAAC;QACrC,OAAO,sBAAsB,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAC3C,CAAC;IAED,yEAAyE;IAEjE,KAAK,CAAC,QAAQ,CACpB,SAA0B,EAC1B,MAAc,EACd,SAA8B,EAC9B,IAAqB;QAErB,MAAM,KAAK,GAAG,WAAW,CAAC;YACxB,YAAY,EAAE,SAAS,CAAC,YAAY;YACpC,KAAK,EAAE,SAAS,CAAC,KAAK;YACtB,MAAM,EAAE,SAAS,CAAC,MAAM;YACxB,OAAO,EAAE,SAAS,CAAC,OAAO;SAC3B,CAAC,CAAC;QAEH,MAAM,MAAM,GAAG,MAAM,YAAY,CAAC,EAAE,KAAK,EAAE,MAAM,EAAE,eAAe,EAAE,IAAI,EAAE,CAAC,CAAC;QAE5E,MAAM,MAAM,GAAqB;YAC/B,SAAS,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;YACnC,OAAO,EAAE;gBACP,IAAI,EAAE,eAAe;gBACrB,IAAI,EAAE,MAAM,CAAC,IAAI;gBACjB,KAAK,EAAE,MAAM,CAAC,KAAK;aACkB;SACxC,CAAC;QACF,SAAS,CAAC,SAAS,CAAC,IAAI,EAAE,MAAM,CAAC,CAAC;QAElC,+DAA+D;QAC/D,MAAM,OAAO,GAAG,CAAC,CAAC;QAClB,OAAO,EAAE,IAAI,EAAE,MAAM,CAAC,IAAI,EAAE,OAAO,EAAE,CAAC;IACxC,CAAC;CACF"}
@@ -0,0 +1,20 @@
1
+ /** File system abstraction for testing */
2
+ export interface FsAdapter {
3
+ mkdir(dirPath: string, opts: {
4
+ recursive: boolean;
5
+ }): Promise<void>;
6
+ writeFile(filePath: string, data: string, opts?: {
7
+ mode?: number;
8
+ }): Promise<void>;
9
+ readFile(filePath: string, encoding: BufferEncoding): Promise<string>;
10
+ readdir(dirPath: string): Promise<string[]>;
11
+ unlink(filePath: string): Promise<void>;
12
+ rename(oldPath: string, newPath: string): Promise<void>;
13
+ stat(filePath: string): Promise<{
14
+ isFile(): boolean;
15
+ }>;
16
+ access(filePath: string): Promise<void>;
17
+ }
18
+ /** Default adapter that delegates to node:fs/promises */
19
+ export declare const defaultFs: FsAdapter;
20
+ //# sourceMappingURL=fs-adapter.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"fs-adapter.d.ts","sourceRoot":"","sources":["../../../src/server/services/fs-adapter.ts"],"names":[],"mappings":"AAEA,0CAA0C;AAC1C,MAAM,WAAW,SAAS;IACxB,KAAK,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,EAAE;QAAE,SAAS,EAAE,OAAO,CAAA;KAAE,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IACpE,SAAS,CAAC,QAAQ,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE;QAAE,IAAI,CAAC,EAAE,MAAM,CAAA;KAAE,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IACnF,QAAQ,CAAC,QAAQ,EAAE,MAAM,EAAE,QAAQ,EAAE,cAAc,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC;IACtE,OAAO,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC;IAC5C,MAAM,CAAC,QAAQ,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IACxC,MAAM,CAAC,OAAO,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IACxD,IAAI,CAAC,QAAQ,EAAE,MAAM,GAAG,OAAO,CAAC;QAAE,MAAM,IAAI,OAAO,CAAA;KAAE,CAAC,CAAC;IACvD,MAAM,CAAC,QAAQ,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;CACzC;AAED,yDAAyD;AACzD,eAAO,MAAM,SAAS,EAAE,SAUvB,CAAC"}
@@ -0,0 +1,13 @@
1
+ import fs from 'node:fs/promises';
2
+ /** Default adapter that delegates to node:fs/promises */
3
+ export const defaultFs = {
4
+ mkdir: (dirPath, opts) => fs.mkdir(dirPath, opts).then(() => undefined),
5
+ writeFile: (filePath, data, opts) => fs.writeFile(filePath, data, opts).then(() => undefined),
6
+ readFile: (filePath, encoding) => fs.readFile(filePath, encoding),
7
+ readdir: (dirPath) => fs.readdir(dirPath).then((entries) => entries.map(String)),
8
+ unlink: (filePath) => fs.unlink(filePath),
9
+ rename: (oldPath, newPath) => fs.rename(oldPath, newPath),
10
+ stat: (filePath) => fs.stat(filePath),
11
+ access: (filePath) => fs.access(filePath),
12
+ };
13
+ //# sourceMappingURL=fs-adapter.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"fs-adapter.js","sourceRoot":"","sources":["../../../src/server/services/fs-adapter.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,kBAAkB,CAAC;AAclC,yDAAyD;AACzD,MAAM,CAAC,MAAM,SAAS,GAAc;IAClC,KAAK,EAAE,CAAC,OAAO,EAAE,IAAI,EAAE,EAAE,CAAC,EAAE,CAAC,KAAK,CAAC,OAAO,EAAE,IAAI,CAAC,CAAC,IAAI,CAAC,GAAG,EAAE,CAAC,SAAS,CAAC;IACvE,SAAS,EAAE,CAAC,QAAQ,EAAE,IAAI,EAAE,IAAI,EAAE,EAAE,CAClC,EAAE,CAAC,SAAS,CAAC,QAAQ,EAAE,IAAI,EAAE,IAAI,CAAC,CAAC,IAAI,CAAC,GAAG,EAAE,CAAC,SAAS,CAAC;IAC1D,QAAQ,EAAE,CAAC,QAAQ,EAAE,QAAQ,EAAE,EAAE,CAAC,EAAE,CAAC,QAAQ,CAAC,QAAQ,EAAE,QAAQ,CAAC;IACjE,OAAO,EAAE,CAAC,OAAO,EAAE,EAAE,CAAC,EAAE,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,IAAI,CAAC,CAAC,OAAO,EAAE,EAAE,CAAC,OAAO,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC;IAChF,MAAM,EAAE,CAAC,QAAQ,EAAE,EAAE,CAAC,EAAE,CAAC,MAAM,CAAC,QAAQ,CAAC;IACzC,MAAM,EAAE,CAAC,OAAO,EAAE,OAAO,EAAE,EAAE,CAAC,EAAE,CAAC,MAAM,CAAC,OAAO,EAAE,OAAO,CAAC;IACzD,IAAI,EAAE,CAAC,QAAQ,EAAE,EAAE,CAAC,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC;IACrC,MAAM,EAAE,CAAC,QAAQ,EAAE,EAAE,CAAC,EAAE,CAAC,MAAM,CAAC,QAAQ,CAAC;CAC1C,CAAC"}
@@ -0,0 +1,26 @@
1
+ /** A single testable instruction block extracted from rules content. */
2
+ export interface InstructionBlock {
3
+ readonly source: string;
4
+ readonly text: string;
5
+ }
6
+ /**
7
+ * Parse rules/CLAUDE.md content into semantic instruction blocks.
8
+ *
9
+ * Splits on:
10
+ * - Markdown headings (# / ## / ### etc.)
11
+ * - Numbered lists (1. / 2. etc.)
12
+ * - Bulleted lists (- / * / + prefixed lines)
13
+ * - Paragraph breaks (double newlines)
14
+ *
15
+ * Each block is trimmed and deduplicated. Empty blocks are discarded.
16
+ */
17
+ export declare function parseInstructions(content: string, source: string): InstructionBlock[];
18
+ /**
19
+ * Parse multiple sources (e.g. CLAUDE.md files + rule entries) into a
20
+ * combined list of instruction blocks.
21
+ */
22
+ export declare function parseAllInstructions(entries: readonly {
23
+ content: string;
24
+ source: string;
25
+ }[]): InstructionBlock[];
26
+ //# sourceMappingURL=instruction-parser.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"instruction-parser.d.ts","sourceRoot":"","sources":["../../../src/server/services/instruction-parser.ts"],"names":[],"mappings":"AAIA,wEAAwE;AACxE,MAAM,WAAW,gBAAgB;IAC/B,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC;IACxB,QAAQ,CAAC,IAAI,EAAE,MAAM,CAAC;CACvB;AAED;;;;;;;;;;GAUG;AACH,wBAAgB,iBAAiB,CAAC,OAAO,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,GAAG,gBAAgB,EAAE,CAerF;AAED;;;GAGG;AACH,wBAAgB,oBAAoB,CAClC,OAAO,EAAE,SAAS;IAAE,OAAO,EAAE,MAAM,CAAC;IAAC,MAAM,EAAE,MAAM,CAAA;CAAE,EAAE,GACtD,gBAAgB,EAAE,CAMpB"}
@@ -0,0 +1,121 @@
1
+ // ---------------------------------------------------------------------------
2
+ // Instruction Parser — splits CLAUDE.md / rules content into testable blocks
3
+ // ---------------------------------------------------------------------------
4
+ /**
5
+ * Parse rules/CLAUDE.md content into semantic instruction blocks.
6
+ *
7
+ * Splits on:
8
+ * - Markdown headings (# / ## / ### etc.)
9
+ * - Numbered lists (1. / 2. etc.)
10
+ * - Bulleted lists (- / * / + prefixed lines)
11
+ * - Paragraph breaks (double newlines)
12
+ *
13
+ * Each block is trimmed and deduplicated. Empty blocks are discarded.
14
+ */
15
+ export function parseInstructions(content, source) {
16
+ if (!content.trim())
17
+ return [];
18
+ const rawBlocks = splitIntoBlocks(content);
19
+ const seen = new Set();
20
+ const blocks = [];
21
+ for (const raw of rawBlocks) {
22
+ const text = cleanBlock(raw);
23
+ if (!text || seen.has(text))
24
+ continue;
25
+ seen.add(text);
26
+ blocks.push({ source, text });
27
+ }
28
+ return blocks;
29
+ }
30
+ /**
31
+ * Parse multiple sources (e.g. CLAUDE.md files + rule entries) into a
32
+ * combined list of instruction blocks.
33
+ */
34
+ export function parseAllInstructions(entries) {
35
+ const allBlocks = [];
36
+ for (const entry of entries) {
37
+ allBlocks.push(...parseInstructions(entry.content, entry.source));
38
+ }
39
+ return allBlocks;
40
+ }
41
+ // ---------------------------------------------------------------------------
42
+ // Internal helpers
43
+ // ---------------------------------------------------------------------------
44
+ /** Split content into raw blocks using heading/list/paragraph boundaries. */
45
+ function splitIntoBlocks(content) {
46
+ const lines = content.split('\n');
47
+ const blocks = [];
48
+ let current = [];
49
+ let currentHeadingContext = '';
50
+ for (const line of lines) {
51
+ const isHeading = /^#{1,6}\s+/.test(line);
52
+ const isListItem = /^\s*(?:[-*+]|\d+\.)\s+/.test(line);
53
+ const isBlankLine = line.trim() === '';
54
+ if (isHeading || (isListItem && current.length > 0) || isBlankLine) {
55
+ if (current.length > 0) {
56
+ blocks.push(current.join('\n'));
57
+ current = [];
58
+ }
59
+ }
60
+ if (!isBlankLine) {
61
+ if (isHeading) {
62
+ const headingText = line.replace(/^#{1,6}\s+/, '').trim();
63
+ if (headingText && !isOnlyFormatting(headingText)) {
64
+ if (isActionableHeading(headingText)) {
65
+ // Actionable headings are testable instructions on their own
66
+ blocks.push(headingText);
67
+ currentHeadingContext = '';
68
+ }
69
+ else {
70
+ // Non-actionable headings become context for child instructions
71
+ currentHeadingContext = headingText;
72
+ }
73
+ }
74
+ }
75
+ else {
76
+ // Prepend heading context to child instructions for grouping
77
+ if (currentHeadingContext && current.length === 0) {
78
+ current.push(`[${currentHeadingContext}]`);
79
+ }
80
+ current.push(line);
81
+ }
82
+ }
83
+ }
84
+ if (current.length > 0) {
85
+ blocks.push(current.join('\n'));
86
+ }
87
+ return blocks;
88
+ }
89
+ /**
90
+ * Check if heading text contains imperative/actionable language.
91
+ * A heading is actionable if it starts with a verb or contains directive keywords.
92
+ */
93
+ function isActionableHeading(text) {
94
+ const lower = text.toLowerCase();
95
+ // Contains directive keywords
96
+ if (/\b(must|should|always|never|do not|don't|ensure|require|avoid)\b/i.test(lower)) {
97
+ return true;
98
+ }
99
+ // Starts with an imperative verb (common instruction patterns)
100
+ if (/^(use|run|add|set|create|delete|remove|install|configure|enable|disable|check|verify|test|write|read|update|fix|apply|follow|include|exclude|import|export|call|return|throw|handle|log|format|lint|build|deploy|commit|push|pull|merge|rebase)\b/i.test(lower)) {
101
+ return true;
102
+ }
103
+ return false;
104
+ }
105
+ /** Clean up a raw block: strip list markers, collapse whitespace. */
106
+ function cleanBlock(raw) {
107
+ let text = raw.trim();
108
+ // Remove leading list markers
109
+ text = text.replace(/^\s*(?:[-*+]|\d+\.)\s+/, '');
110
+ // Collapse internal whitespace
111
+ text = text.replace(/\s+/g, ' ').trim();
112
+ // Skip very short blocks (likely formatting artifacts)
113
+ if (text.length < 5)
114
+ return '';
115
+ return text;
116
+ }
117
+ /** Check if a string is only formatting characters (dashes, equals, etc.). */
118
+ function isOnlyFormatting(text) {
119
+ return /^[-=_*#~`]+$/.test(text.trim());
120
+ }
121
+ //# sourceMappingURL=instruction-parser.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"instruction-parser.js","sourceRoot":"","sources":["../../../src/server/services/instruction-parser.ts"],"names":[],"mappings":"AAAA,8EAA8E;AAC9E,6EAA6E;AAC7E,8EAA8E;AAQ9E;;;;;;;;;;GAUG;AACH,MAAM,UAAU,iBAAiB,CAAC,OAAe,EAAE,MAAc;IAC/D,IAAI,CAAC,OAAO,CAAC,IAAI,EAAE;QAAE,OAAO,EAAE,CAAC;IAE/B,MAAM,SAAS,GAAG,eAAe,CAAC,OAAO,CAAC,CAAC;IAC3C,MAAM,IAAI,GAAG,IAAI,GAAG,EAAU,CAAC;IAC/B,MAAM,MAAM,GAAuB,EAAE,CAAC;IAEtC,KAAK,MAAM,GAAG,IAAI,SAAS,EAAE,CAAC;QAC5B,MAAM,IAAI,GAAG,UAAU,CAAC,GAAG,CAAC,CAAC;QAC7B,IAAI,CAAC,IAAI,IAAI,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC;YAAE,SAAS;QACtC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;QACf,MAAM,CAAC,IAAI,CAAC,EAAE,MAAM,EAAE,IAAI,EAAE,CAAC,CAAC;IAChC,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;;GAGG;AACH,MAAM,UAAU,oBAAoB,CAClC,OAAuD;IAEvD,MAAM,SAAS,GAAuB,EAAE,CAAC;IACzC,KAAK,MAAM,KAAK,IAAI,OAAO,EAAE,CAAC;QAC5B,SAAS,CAAC,IAAI,CAAC,GAAG,iBAAiB,CAAC,KAAK,CAAC,OAAO,EAAE,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC;IACpE,CAAC;IACD,OAAO,SAAS,CAAC;AACnB,CAAC;AAED,8EAA8E;AAC9E,mBAAmB;AACnB,8EAA8E;AAE9E,6EAA6E;AAC7E,SAAS,eAAe,CAAC,OAAe;IACtC,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC;IAClC,MAAM,MAAM,GAAa,EAAE,CAAC;IAC5B,IAAI,OAAO,GAAa,EAAE,CAAC;IAC3B,IAAI,qBAAqB,GAAG,EAAE,CAAC;IAE/B,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,MAAM,SAAS,GAAG,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAC1C,MAAM,UAAU,GAAG,wBAAwB,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QACvD,MAAM,WAAW,GAAG,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC;QAEvC,IAAI,SAAS,IAAI,CAAC,UAAU,IAAI,OAAO,CAAC,MAAM,GAAG,CAAC,CAAC,IAAI,WAAW,EAAE,CAAC;YACnE,IAAI,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBACvB,MAAM,CAAC,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC;gBAChC,OAAO,GAAG,EAAE,CAAC;YACf,CAAC;QACH,CAAC;QAED,IAAI,CAAC,WAAW,EAAE,CAAC;YACjB,IAAI,SAAS,EAAE,CAAC;gBACd,MAAM,WAAW,GAAG,IAAI,CAAC,OAAO,CAAC,YAAY,EAAE,EAAE,CAAC,CAAC,IAAI,EAAE,CAAC;gBAC1D,IAAI,WAAW,IAAI,CAAC,gBAAgB,CAAC,WAAW,CAAC,EAAE,CAAC;oBAClD,IAAI,mBAAmB,CAAC,WAAW,CAAC,EAAE,CAAC;wBACrC,6DAA6D;wBAC7D,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;wBACzB,qBAAqB,GAAG,EAAE,CAAC;oBAC7B,CAAC;yBAAM,CAAC;wBACN,gEAAgE;wBAChE,qBAAqB,GAAG,WAAW,CAAC;oBACtC,CAAC;gBACH,CAAC;YACH,CAAC;iBAAM,CAAC;gBACN,6DAA6D;gBAC7D,IAAI,qBAAqB,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;oBAClD,OAAO,CAAC,IAAI,CAAC,IAAI,qBAAqB,GAAG,CAAC,CAAC;gBAC7C,CAAC;gBACD,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;YACrB,CAAC;QACH,CAAC;IACH,CAAC;IAED,IAAI,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACvB,MAAM,CAAC,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC;IAClC,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;;GAGG;AACH,SAAS,mBAAmB,CAAC,IAAY;IACvC,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,EAAE,CAAC;IACjC,8BAA8B;IAC9B,IAAI,mEAAmE,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC;QACpF,OAAO,IAAI,CAAC;IACd,CAAC;IACD,+DAA+D;IAC/D,IAAI,oPAAoP,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC;QACrQ,OAAO,IAAI,CAAC;IACd,CAAC;IACD,OAAO,KAAK,CAAC;AACf,CAAC;AAED,qEAAqE;AACrE,SAAS,UAAU,CAAC,GAAW;IAC7B,IAAI,IAAI,GAAG,GAAG,CAAC,IAAI,EAAE,CAAC;IACtB,8BAA8B;IAC9B,IAAI,GAAG,IAAI,CAAC,OAAO,CAAC,wBAAwB,EAAE,EAAE,CAAC,CAAC;IAClD,+BAA+B;IAC/B,IAAI,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC,IAAI,EAAE,CAAC;IACxC,uDAAuD;IACvD,IAAI,IAAI,CAAC,MAAM,GAAG,CAAC;QAAE,OAAO,EAAE,CAAC;IAC/B,OAAO,IAAI,CAAC;AACd,CAAC;AAED,8EAA8E;AAC9E,SAAS,gBAAgB,CAAC,IAAY;IACpC,OAAO,cAAc,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,EAAE,CAAC,CAAC;AAC1C,CAAC"}
@@ -0,0 +1,20 @@
1
+ export interface RotationConfig {
2
+ /** Maximum file size in bytes before rotation (default: 2MB). */
3
+ maxBytes: number;
4
+ /** Maximum number of rotated files to keep (default: 25). */
5
+ maxFiles: number;
6
+ }
7
+ export declare const DEFAULT_ROTATION: RotationConfig;
8
+ /**
9
+ * Rotate a log file if it exceeds `config.maxBytes`.
10
+ *
11
+ * Rotation scheme (e.g. for ctb.log):
12
+ * ctb.24.log → deleted
13
+ * ctb.23.log → ctb.24.log
14
+ * ...
15
+ * ctb.1.log → ctb.2.log
16
+ * ctb.log → ctb.1.log
17
+ * (a fresh ctb.log is NOT created here — the caller appends)
18
+ */
19
+ export declare function rotateIfNeeded(filePath: string, config?: RotationConfig): void;
20
+ //# sourceMappingURL=log-rotator.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"log-rotator.d.ts","sourceRoot":"","sources":["../../../src/server/services/log-rotator.ts"],"names":[],"mappings":"AAGA,MAAM,WAAW,cAAc;IAC7B,iEAAiE;IACjE,QAAQ,EAAE,MAAM,CAAC;IACjB,6DAA6D;IAC7D,QAAQ,EAAE,MAAM,CAAC;CAClB;AAED,eAAO,MAAM,gBAAgB,EAAE,cAG9B,CAAC;AAEF;;;;;;;;;;GAUG;AACH,wBAAgB,cAAc,CAC5B,QAAQ,EAAE,MAAM,EAChB,MAAM,GAAE,cAAiC,GACxC,IAAI,CAmCN"}
@@ -0,0 +1,60 @@
1
+ import fs from 'node:fs';
2
+ import path from 'node:path';
3
+ export const DEFAULT_ROTATION = {
4
+ maxBytes: 2 * 1024 * 1024, // 2 MB
5
+ maxFiles: 25,
6
+ };
7
+ /**
8
+ * Rotate a log file if it exceeds `config.maxBytes`.
9
+ *
10
+ * Rotation scheme (e.g. for ctb.log):
11
+ * ctb.24.log → deleted
12
+ * ctb.23.log → ctb.24.log
13
+ * ...
14
+ * ctb.1.log → ctb.2.log
15
+ * ctb.log → ctb.1.log
16
+ * (a fresh ctb.log is NOT created here — the caller appends)
17
+ */
18
+ export function rotateIfNeeded(filePath, config = DEFAULT_ROTATION) {
19
+ let size;
20
+ try {
21
+ const stat = fs.statSync(filePath);
22
+ size = stat.size;
23
+ }
24
+ catch {
25
+ // File does not exist yet — nothing to rotate.
26
+ return;
27
+ }
28
+ if (size < config.maxBytes)
29
+ return;
30
+ const dir = path.dirname(filePath);
31
+ const ext = path.extname(filePath); // .log
32
+ const base = path.basename(filePath, ext); // ctb
33
+ // Shift numbered files: N → N+1. Delete the oldest if at maxFiles.
34
+ for (let i = config.maxFiles; i >= 1; i--) {
35
+ const src = path.join(dir, `${base}.${i}${ext}`);
36
+ if (i === config.maxFiles) {
37
+ // Delete the oldest file
38
+ try {
39
+ fs.unlinkSync(src);
40
+ }
41
+ catch { /* noop */ }
42
+ }
43
+ else {
44
+ const dst = path.join(dir, `${base}.${i + 1}${ext}`);
45
+ try {
46
+ fs.renameSync(src, dst);
47
+ }
48
+ catch { /* noop */ }
49
+ }
50
+ }
51
+ // Move current file → .1
52
+ const firstRotated = path.join(dir, `${base}.1${ext}`);
53
+ try {
54
+ fs.renameSync(filePath, firstRotated);
55
+ }
56
+ catch {
57
+ // If rename fails, continue — the caller will append to the same file.
58
+ }
59
+ }
60
+ //# sourceMappingURL=log-rotator.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"log-rotator.js","sourceRoot":"","sources":["../../../src/server/services/log-rotator.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,SAAS,CAAC;AACzB,OAAO,IAAI,MAAM,WAAW,CAAC;AAS7B,MAAM,CAAC,MAAM,gBAAgB,GAAmB;IAC9C,QAAQ,EAAE,CAAC,GAAG,IAAI,GAAG,IAAI,EAAG,OAAO;IACnC,QAAQ,EAAE,EAAE;CACb,CAAC;AAEF;;;;;;;;;;GAUG;AACH,MAAM,UAAU,cAAc,CAC5B,QAAgB,EAChB,SAAyB,gBAAgB;IAEzC,IAAI,IAAY,CAAC;IACjB,IAAI,CAAC;QACH,MAAM,IAAI,GAAG,EAAE,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC;QACnC,IAAI,GAAG,IAAI,CAAC,IAAI,CAAC;IACnB,CAAC;IAAC,MAAM,CAAC;QACP,+CAA+C;QAC/C,OAAO;IACT,CAAC;IAED,IAAI,IAAI,GAAG,MAAM,CAAC,QAAQ;QAAE,OAAO;IAEnC,MAAM,GAAG,GAAG,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC;IACnC,MAAM,GAAG,GAAG,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC,CAAW,OAAO;IACrD,MAAM,IAAI,GAAG,IAAI,CAAC,QAAQ,CAAC,QAAQ,EAAE,GAAG,CAAC,CAAC,CAAK,MAAM;IAErD,oEAAoE;IACpE,KAAK,IAAI,CAAC,GAAG,MAAM,CAAC,QAAQ,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;QAC1C,MAAM,GAAG,GAAG,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,GAAG,IAAI,IAAI,CAAC,GAAG,GAAG,EAAE,CAAC,CAAC;QACjD,IAAI,CAAC,KAAK,MAAM,CAAC,QAAQ,EAAE,CAAC;YAC1B,yBAAyB;YACzB,IAAI,CAAC;gBAAC,EAAE,CAAC,UAAU,CAAC,GAAG,CAAC,CAAC;YAAC,CAAC;YAAC,MAAM,CAAC,CAAC,UAAU,CAAC,CAAC;QAClD,CAAC;aAAM,CAAC;YACN,MAAM,GAAG,GAAG,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,GAAG,IAAI,IAAI,CAAC,GAAG,CAAC,GAAG,GAAG,EAAE,CAAC,CAAC;YACrD,IAAI,CAAC;gBAAC,EAAE,CAAC,UAAU,CAAC,GAAG,EAAE,GAAG,CAAC,CAAC;YAAC,CAAC;YAAC,MAAM,CAAC,CAAC,UAAU,CAAC,CAAC;QACvD,CAAC;IACH,CAAC;IAED,yBAAyB;IACzB,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,GAAG,IAAI,KAAK,GAAG,EAAE,CAAC,CAAC;IACvD,IAAI,CAAC;QACH,EAAE,CAAC,UAAU,CAAC,QAAQ,EAAE,YAAY,CAAC,CAAC;IACxC,CAAC;IAAC,MAAM,CAAC;QACP,uEAAuE;IACzE,CAAC;AACH,CAAC"}
@@ -0,0 +1,15 @@
1
+ import type { ILogger, LogLevel } from '../interfaces/logger.js';
2
+ export declare class JsonLogger implements ILogger {
3
+ private readonly level;
4
+ private readonly baseAttrs;
5
+ private readonly writeFn;
6
+ private readonly logFilePath;
7
+ constructor(level?: LogLevel, baseAttrs?: Record<string, unknown>, writeFn?: (line: string) => void, logFilePath?: string);
8
+ debug(msg: string, attrs?: Record<string, unknown>): void;
9
+ info(msg: string, attrs?: Record<string, unknown>): void;
10
+ warn(msg: string, attrs?: Record<string, unknown>): void;
11
+ error(msg: string, attrs?: Record<string, unknown>): void;
12
+ child(attrs: Record<string, unknown>): ILogger;
13
+ private log;
14
+ }
15
+ //# sourceMappingURL=logger.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"logger.d.ts","sourceRoot":"","sources":["../../../src/server/services/logger.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,OAAO,EAAE,QAAQ,EAAE,MAAM,yBAAyB,CAAC;AAiBjE,qBAAa,UAAW,YAAW,OAAO;IACxC,OAAO,CAAC,QAAQ,CAAC,KAAK,CAAW;IACjC,OAAO,CAAC,QAAQ,CAAC,SAAS,CAA0B;IACpD,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAyB;IACjD,OAAO,CAAC,QAAQ,CAAC,WAAW,CAAqB;gBAG/C,KAAK,GAAE,QAAiB,EACxB,SAAS,GAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAM,EACvC,OAAO,CAAC,EAAE,CAAC,IAAI,EAAE,MAAM,KAAK,IAAI,EAChC,WAAW,CAAC,EAAE,MAAM;IAYtB,KAAK,CAAC,GAAG,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAIzD,IAAI,CAAC,GAAG,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAIxD,IAAI,CAAC,GAAG,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAIxD,KAAK,CAAC,GAAG,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAIzD,KAAK,CAAC,KAAK,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,OAAO;IAI9C,OAAO,CAAC,GAAG;CAyBZ"}
@@ -0,0 +1,69 @@
1
+ import fs from 'node:fs';
2
+ import path from 'node:path';
3
+ import { rotateIfNeeded, DEFAULT_ROTATION } from './log-rotator.js';
4
+ const LOG_LEVEL_ORDER = {
5
+ debug: 0,
6
+ info: 1,
7
+ warn: 2,
8
+ error: 3,
9
+ };
10
+ const LOG_LEVEL_LABEL = {
11
+ debug: 'DEBUG',
12
+ info: 'INFO',
13
+ warn: 'WARN',
14
+ error: 'ERROR',
15
+ };
16
+ export class JsonLogger {
17
+ level;
18
+ baseAttrs;
19
+ writeFn;
20
+ logFilePath;
21
+ constructor(level = 'info', baseAttrs = {}, writeFn, logFilePath) {
22
+ this.level = level;
23
+ this.baseAttrs = baseAttrs;
24
+ this.writeFn = writeFn ?? ((line) => process.stderr.write(line + '\n'));
25
+ this.logFilePath = logFilePath;
26
+ if (logFilePath) {
27
+ fs.mkdirSync(path.dirname(logFilePath), { recursive: true });
28
+ }
29
+ }
30
+ debug(msg, attrs) {
31
+ this.log('debug', msg, attrs);
32
+ }
33
+ info(msg, attrs) {
34
+ this.log('info', msg, attrs);
35
+ }
36
+ warn(msg, attrs) {
37
+ this.log('warn', msg, attrs);
38
+ }
39
+ error(msg, attrs) {
40
+ this.log('error', msg, attrs);
41
+ }
42
+ child(attrs) {
43
+ return new JsonLogger(this.level, { ...this.baseAttrs, ...attrs }, this.writeFn, this.logFilePath);
44
+ }
45
+ log(level, msg, attrs) {
46
+ if (LOG_LEVEL_ORDER[level] < LOG_LEVEL_ORDER[this.level]) {
47
+ return;
48
+ }
49
+ const entry = {
50
+ ...this.baseAttrs,
51
+ ...attrs,
52
+ time: new Date().toISOString(),
53
+ level: LOG_LEVEL_LABEL[level],
54
+ msg,
55
+ };
56
+ const line = JSON.stringify(entry);
57
+ this.writeFn(line);
58
+ if (this.logFilePath) {
59
+ try {
60
+ fs.appendFileSync(this.logFilePath, line + '\n');
61
+ rotateIfNeeded(this.logFilePath, DEFAULT_ROTATION);
62
+ }
63
+ catch {
64
+ // Best-effort file logging — do not crash the process.
65
+ }
66
+ }
67
+ }
68
+ }
69
+ //# sourceMappingURL=logger.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"logger.js","sourceRoot":"","sources":["../../../src/server/services/logger.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,SAAS,CAAC;AACzB,OAAO,IAAI,MAAM,WAAW,CAAC;AAE7B,OAAO,EAAE,cAAc,EAAE,gBAAgB,EAAE,MAAM,kBAAkB,CAAC;AAEpE,MAAM,eAAe,GAA6B;IAChD,KAAK,EAAE,CAAC;IACR,IAAI,EAAE,CAAC;IACP,IAAI,EAAE,CAAC;IACP,KAAK,EAAE,CAAC;CACT,CAAC;AAEF,MAAM,eAAe,GAA6B;IAChD,KAAK,EAAE,OAAO;IACd,IAAI,EAAE,MAAM;IACZ,IAAI,EAAE,MAAM;IACZ,KAAK,EAAE,OAAO;CACf,CAAC;AAEF,MAAM,OAAO,UAAU;IACJ,KAAK,CAAW;IAChB,SAAS,CAA0B;IACnC,OAAO,CAAyB;IAChC,WAAW,CAAqB;IAEjD,YACE,QAAkB,MAAM,EACxB,YAAqC,EAAE,EACvC,OAAgC,EAChC,WAAoB;QAEpB,IAAI,CAAC,KAAK,GAAG,KAAK,CAAC;QACnB,IAAI,CAAC,SAAS,GAAG,SAAS,CAAC;QAC3B,IAAI,CAAC,OAAO,GAAG,OAAO,IAAI,CAAC,CAAC,IAAY,EAAE,EAAE,CAAC,OAAO,CAAC,MAAM,CAAC,KAAK,CAAC,IAAI,GAAG,IAAI,CAAC,CAAC,CAAC;QAChF,IAAI,CAAC,WAAW,GAAG,WAAW,CAAC;QAE/B,IAAI,WAAW,EAAE,CAAC;YAChB,EAAE,CAAC,SAAS,CAAC,IAAI,CAAC,OAAO,CAAC,WAAW,CAAC,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;QAC/D,CAAC;IACH,CAAC;IAED,KAAK,CAAC,GAAW,EAAE,KAA+B;QAChD,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,GAAG,EAAE,KAAK,CAAC,CAAC;IAChC,CAAC;IAED,IAAI,CAAC,GAAW,EAAE,KAA+B;QAC/C,IAAI,CAAC,GAAG,CAAC,MAAM,EAAE,GAAG,EAAE,KAAK,CAAC,CAAC;IAC/B,CAAC;IAED,IAAI,CAAC,GAAW,EAAE,KAA+B;QAC/C,IAAI,CAAC,GAAG,CAAC,MAAM,EAAE,GAAG,EAAE,KAAK,CAAC,CAAC;IAC/B,CAAC;IAED,KAAK,CAAC,GAAW,EAAE,KAA+B;QAChD,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,GAAG,EAAE,KAAK,CAAC,CAAC;IAChC,CAAC;IAED,KAAK,CAAC,KAA8B;QAClC,OAAO,IAAI,UAAU,CAAC,IAAI,CAAC,KAAK,EAAE,EAAE,GAAG,IAAI,CAAC,SAAS,EAAE,GAAG,KAAK,EAAE,EAAE,IAAI,CAAC,OAAO,EAAE,IAAI,CAAC,WAAW,CAAC,CAAC;IACrG,CAAC;IAEO,GAAG,CAAC,KAAe,EAAE,GAAW,EAAE,KAA+B;QACvE,IAAI,eAAe,CAAC,KAAK,CAAC,GAAG,eAAe,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC;YACzD,OAAO;QACT,CAAC;QAED,MAAM,KAAK,GAA4B;YACrC,GAAG,IAAI,CAAC,SAAS;YACjB,GAAG,KAAK;YACR,IAAI,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;YAC9B,KAAK,EAAE,eAAe,CAAC,KAAK,CAAC;YAC7B,GAAG;SACJ,CAAC;QAEF,MAAM,IAAI,GAAG,IAAI,CAAC,SAAS,CAAC,KAAK,CAAC,CAAC;QACnC,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;QAEnB,IAAI,IAAI,CAAC,WAAW,EAAE,CAAC;YACrB,IAAI,CAAC;gBACH,EAAE,CAAC,cAAc,CAAC,IAAI,CAAC,WAAW,EAAE,IAAI,GAAG,IAAI,CAAC,CAAC;gBACjD,cAAc,CAAC,IAAI,CAAC,WAAW,EAAE,gBAAgB,CAAC,CAAC;YACrD,CAAC;YAAC,MAAM,CAAC;gBACP,uDAAuD;YACzD,CAAC;QACH,CAAC;IACH,CAAC;CACF"}
@@ -0,0 +1,10 @@
1
+ import type { LanguageModel } from 'ai';
2
+ export interface ModelConfig {
3
+ readonly providerName: string;
4
+ readonly model: string;
5
+ readonly apiKey: string;
6
+ readonly baseUrl?: string;
7
+ }
8
+ export declare function createModel(config: ModelConfig): LanguageModel;
9
+ export declare function isSupportedProvider(name: string): boolean;
10
+ //# sourceMappingURL=model-factory.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"model-factory.d.ts","sourceRoot":"","sources":["../../../src/server/services/model-factory.ts"],"names":[],"mappings":"AAOA,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,IAAI,CAAC;AAExC,MAAM,WAAW,WAAW;IAC1B,QAAQ,CAAC,YAAY,EAAE,MAAM,CAAC;IAC9B,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC;IACxB,QAAQ,CAAC,OAAO,CAAC,EAAE,MAAM,CAAC;CAC3B;AAID,wBAAgB,WAAW,CAAC,MAAM,EAAE,WAAW,GAAG,aAAa,CA0B9D;AAED,wBAAgB,mBAAmB,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAEzD"}
@@ -0,0 +1,33 @@
1
+ // ---------------------------------------------------------------------------
2
+ // Model Factory — creates AI SDK model instances from provider config
3
+ // ---------------------------------------------------------------------------
4
+ import { createAnthropic } from '@ai-sdk/anthropic';
5
+ import { createOpenAI } from '@ai-sdk/openai';
6
+ import { createGoogleGenerativeAI } from '@ai-sdk/google';
7
+ const SUPPORTED_PROVIDERS = ['anthropic', 'openai', 'google'];
8
+ export function createModel(config) {
9
+ switch (config.providerName) {
10
+ case 'anthropic':
11
+ return createAnthropic({
12
+ apiKey: config.apiKey,
13
+ ...(config.baseUrl ? { baseURL: config.baseUrl } : {}),
14
+ })(config.model);
15
+ case 'openai':
16
+ return createOpenAI({
17
+ apiKey: config.apiKey,
18
+ ...(config.baseUrl ? { baseURL: config.baseUrl } : {}),
19
+ })(config.model);
20
+ case 'google':
21
+ return createGoogleGenerativeAI({
22
+ apiKey: config.apiKey,
23
+ ...(config.baseUrl ? { baseURL: config.baseUrl } : {}),
24
+ })(config.model);
25
+ default:
26
+ throw new Error(`Unsupported provider: "${config.providerName}". ` +
27
+ `Supported providers: ${SUPPORTED_PROVIDERS.join(', ')}`);
28
+ }
29
+ }
30
+ export function isSupportedProvider(name) {
31
+ return SUPPORTED_PROVIDERS.includes(name);
32
+ }
33
+ //# sourceMappingURL=model-factory.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"model-factory.js","sourceRoot":"","sources":["../../../src/server/services/model-factory.ts"],"names":[],"mappings":"AAAA,8EAA8E;AAC9E,sEAAsE;AACtE,8EAA8E;AAE9E,OAAO,EAAE,eAAe,EAAE,MAAM,mBAAmB,CAAC;AACpD,OAAO,EAAE,YAAY,EAAE,MAAM,gBAAgB,CAAC;AAC9C,OAAO,EAAE,wBAAwB,EAAE,MAAM,gBAAgB,CAAC;AAU1D,MAAM,mBAAmB,GAAG,CAAC,WAAW,EAAE,QAAQ,EAAE,QAAQ,CAAU,CAAC;AAEvE,MAAM,UAAU,WAAW,CAAC,MAAmB;IAC7C,QAAQ,MAAM,CAAC,YAAY,EAAE,CAAC;QAC5B,KAAK,WAAW;YACd,OAAO,eAAe,CAAC;gBACrB,MAAM,EAAE,MAAM,CAAC,MAAM;gBACrB,GAAG,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;aACvD,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC;QAEnB,KAAK,QAAQ;YACX,OAAO,YAAY,CAAC;gBAClB,MAAM,EAAE,MAAM,CAAC,MAAM;gBACrB,GAAG,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;aACvD,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC;QAEnB,KAAK,QAAQ;YACX,OAAO,wBAAwB,CAAC;gBAC9B,MAAM,EAAE,MAAM,CAAC,MAAM;gBACrB,GAAG,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,OAAO,EAAE,MAAM,CAAC,OAAO,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;aACvD,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC;QAEnB;YACE,MAAM,IAAI,KAAK,CACb,0BAA0B,MAAM,CAAC,YAAY,KAAK;gBAClD,wBAAwB,mBAAmB,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CACzD,CAAC;IACN,CAAC;AACH,CAAC;AAED,MAAM,UAAU,mBAAmB,CAAC,IAAY;IAC9C,OAAQ,mBAAyC,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAC;AACnE,CAAC"}
@@ -0,0 +1,9 @@
1
+ import type { IRunner, RunCallbacks } from '../interfaces/runner.js';
2
+ import type { ILogger } from '../interfaces/logger.js';
3
+ import type { Provider, Scenario, Run } from '../types/index.js';
4
+ export declare class AiSdkRunner implements IRunner {
5
+ private readonly logger;
6
+ constructor(logger: ILogger);
7
+ executeRun(provider: Provider, scenario: Scenario, run: Run, callbacks: RunCallbacks, externalAbortController?: AbortController): Promise<Run>;
8
+ }
9
+ //# sourceMappingURL=runner.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"runner.d.ts","sourceRoot":"","sources":["../../../src/server/services/runner.ts"],"names":[],"mappings":"AAKA,OAAO,KAAK,EAAE,OAAO,EAAE,YAAY,EAAE,MAAM,yBAAyB,CAAC;AACrE,OAAO,KAAK,EAAE,OAAO,EAAE,MAAM,yBAAyB,CAAC;AACvD,OAAO,KAAK,EAAE,QAAQ,EAAE,QAAQ,EAAE,GAAG,EAAoB,MAAM,mBAAmB,CAAC;AAQnF,qBAAa,WAAY,YAAW,OAAO;IAC7B,OAAO,CAAC,QAAQ,CAAC,MAAM;gBAAN,MAAM,EAAE,OAAO;IAEtC,UAAU,CACd,QAAQ,EAAE,QAAQ,EAClB,QAAQ,EAAE,QAAQ,EAClB,GAAG,EAAE,GAAG,EACR,SAAS,EAAE,YAAY,EACvB,uBAAuB,CAAC,EAAE,eAAe,GACxC,OAAO,CAAC,GAAG,CAAC;CA0FhB"}