@kilnai/core 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (609) hide show
  1. package/dist/agents/circuit-breaker.d.ts +26 -0
  2. package/dist/agents/circuit-breaker.d.ts.map +1 -0
  3. package/dist/agents/circuit-breaker.js +90 -0
  4. package/dist/agents/circuit-breaker.js.map +1 -0
  5. package/dist/agents/context-compressor.d.ts +13 -0
  6. package/dist/agents/context-compressor.d.ts.map +1 -0
  7. package/dist/agents/context-compressor.js +21 -0
  8. package/dist/agents/context-compressor.js.map +1 -0
  9. package/dist/agents/index.d.ts +68 -0
  10. package/dist/agents/index.d.ts.map +1 -0
  11. package/dist/agents/index.js +13 -0
  12. package/dist/agents/index.js.map +1 -0
  13. package/dist/agents/infrastructure/anthropic.d.ts +24 -0
  14. package/dist/agents/infrastructure/anthropic.d.ts.map +1 -0
  15. package/dist/agents/infrastructure/anthropic.js +226 -0
  16. package/dist/agents/infrastructure/anthropic.js.map +1 -0
  17. package/dist/agents/infrastructure/deepseek.d.ts +10 -0
  18. package/dist/agents/infrastructure/deepseek.d.ts.map +1 -0
  19. package/dist/agents/infrastructure/deepseek.js +14 -0
  20. package/dist/agents/infrastructure/deepseek.js.map +1 -0
  21. package/dist/agents/infrastructure/ollama.d.ts +20 -0
  22. package/dist/agents/infrastructure/ollama.d.ts.map +1 -0
  23. package/dist/agents/infrastructure/ollama.js +128 -0
  24. package/dist/agents/infrastructure/ollama.js.map +1 -0
  25. package/dist/agents/infrastructure/openai-compat.d.ts +25 -0
  26. package/dist/agents/infrastructure/openai-compat.d.ts.map +1 -0
  27. package/dist/agents/infrastructure/openai-compat.js +211 -0
  28. package/dist/agents/infrastructure/openai-compat.js.map +1 -0
  29. package/dist/agents/infrastructure/openai.d.ts +12 -0
  30. package/dist/agents/infrastructure/openai.d.ts.map +1 -0
  31. package/dist/agents/infrastructure/openai.js +16 -0
  32. package/dist/agents/infrastructure/openai.js.map +1 -0
  33. package/dist/agents/infrastructure/retry.d.ts +10 -0
  34. package/dist/agents/infrastructure/retry.d.ts.map +1 -0
  35. package/dist/agents/infrastructure/retry.js +22 -0
  36. package/dist/agents/infrastructure/retry.js.map +1 -0
  37. package/dist/agents/mcp-client.d.ts +22 -0
  38. package/dist/agents/mcp-client.d.ts.map +1 -0
  39. package/dist/agents/mcp-client.js +104 -0
  40. package/dist/agents/mcp-client.js.map +1 -0
  41. package/dist/agents/model-pricing.d.ts +9 -0
  42. package/dist/agents/model-pricing.d.ts.map +1 -0
  43. package/dist/agents/model-pricing.js +17 -0
  44. package/dist/agents/model-pricing.js.map +1 -0
  45. package/dist/agents/provider-registry.d.ts +25 -0
  46. package/dist/agents/provider-registry.d.ts.map +1 -0
  47. package/dist/agents/provider-registry.js +62 -0
  48. package/dist/agents/provider-registry.js.map +1 -0
  49. package/dist/agents/tool-cache.d.ts +13 -0
  50. package/dist/agents/tool-cache.d.ts.map +1 -0
  51. package/dist/agents/tool-cache.js +52 -0
  52. package/dist/agents/tool-cache.js.map +1 -0
  53. package/dist/agents/tool-rag.d.ts +15 -0
  54. package/dist/agents/tool-rag.d.ts.map +1 -0
  55. package/dist/agents/tool-rag.js +92 -0
  56. package/dist/agents/tool-rag.js.map +1 -0
  57. package/dist/agents/tool-registry.d.ts +29 -0
  58. package/dist/agents/tool-registry.d.ts.map +1 -0
  59. package/dist/agents/tool-registry.js +64 -0
  60. package/dist/agents/tool-registry.js.map +1 -0
  61. package/dist/cost/cost-tracker.d.ts +27 -0
  62. package/dist/cost/cost-tracker.d.ts.map +1 -0
  63. package/dist/cost/cost-tracker.js +103 -0
  64. package/dist/cost/cost-tracker.js.map +1 -0
  65. package/dist/cost/index.d.ts +30 -0
  66. package/dist/cost/index.d.ts.map +1 -0
  67. package/dist/cost/index.js +2 -0
  68. package/dist/cost/index.js.map +1 -0
  69. package/dist/domain/domain-package-adapter.d.ts +13 -0
  70. package/dist/domain/domain-package-adapter.d.ts.map +1 -0
  71. package/dist/domain/domain-package-adapter.js +66 -0
  72. package/dist/domain/domain-package-adapter.js.map +1 -0
  73. package/dist/domain/domain-registry.d.ts +26 -0
  74. package/dist/domain/domain-registry.d.ts.map +1 -0
  75. package/dist/domain/domain-registry.js +119 -0
  76. package/dist/domain/domain-registry.js.map +1 -0
  77. package/dist/domain/index.d.ts +22 -0
  78. package/dist/domain/index.d.ts.map +1 -0
  79. package/dist/domain/index.js +30 -0
  80. package/dist/domain/index.js.map +1 -0
  81. package/dist/domain/yaml-parser.d.ts +18 -0
  82. package/dist/domain/yaml-parser.d.ts.map +1 -0
  83. package/dist/domain/yaml-parser.js +47 -0
  84. package/dist/domain/yaml-parser.js.map +1 -0
  85. package/dist/domain/yaml-schema.d.ts +26 -0
  86. package/dist/domain/yaml-schema.d.ts.map +1 -0
  87. package/dist/domain/yaml-schema.js +66 -0
  88. package/dist/domain/yaml-schema.js.map +1 -0
  89. package/dist/engine/composites/app.d.ts +39 -0
  90. package/dist/engine/composites/app.d.ts.map +1 -0
  91. package/dist/engine/composites/app.js +125 -0
  92. package/dist/engine/composites/app.js.map +1 -0
  93. package/dist/engine/composites/router.d.ts +20 -0
  94. package/dist/engine/composites/router.d.ts.map +1 -0
  95. package/dist/engine/composites/router.js +31 -0
  96. package/dist/engine/composites/router.js.map +1 -0
  97. package/dist/engine/composites/team.d.ts +36 -0
  98. package/dist/engine/composites/team.d.ts.map +1 -0
  99. package/dist/engine/composites/team.js +100 -0
  100. package/dist/engine/composites/team.js.map +1 -0
  101. package/dist/engine/domain/a2a-config.d.ts +53 -0
  102. package/dist/engine/domain/a2a-config.d.ts.map +1 -0
  103. package/dist/engine/domain/a2a-config.js +32 -0
  104. package/dist/engine/domain/a2a-config.js.map +1 -0
  105. package/dist/engine/domain/agent.d.ts +18 -0
  106. package/dist/engine/domain/agent.d.ts.map +1 -0
  107. package/dist/engine/domain/agent.js +4 -0
  108. package/dist/engine/domain/agent.js.map +1 -0
  109. package/dist/engine/domain/capability.d.ts +24 -0
  110. package/dist/engine/domain/capability.d.ts.map +1 -0
  111. package/dist/engine/domain/capability.js +3 -0
  112. package/dist/engine/domain/capability.js.map +1 -0
  113. package/dist/engine/domain/channel.d.ts +37 -0
  114. package/dist/engine/domain/channel.d.ts.map +1 -0
  115. package/dist/engine/domain/channel.js +4 -0
  116. package/dist/engine/domain/channel.js.map +1 -0
  117. package/dist/engine/domain/chunker.d.ts +22 -0
  118. package/dist/engine/domain/chunker.d.ts.map +1 -0
  119. package/dist/engine/domain/chunker.js +3 -0
  120. package/dist/engine/domain/chunker.js.map +1 -0
  121. package/dist/engine/domain/content.d.ts +57 -0
  122. package/dist/engine/domain/content.d.ts.map +1 -0
  123. package/dist/engine/domain/content.js +63 -0
  124. package/dist/engine/domain/content.js.map +1 -0
  125. package/dist/engine/domain/cron.d.ts +15 -0
  126. package/dist/engine/domain/cron.d.ts.map +1 -0
  127. package/dist/engine/domain/cron.js +114 -0
  128. package/dist/engine/domain/cron.js.map +1 -0
  129. package/dist/engine/domain/embedding.d.ts +9 -0
  130. package/dist/engine/domain/embedding.d.ts.map +1 -0
  131. package/dist/engine/domain/embedding.js +4 -0
  132. package/dist/engine/domain/embedding.js.map +1 -0
  133. package/dist/engine/domain/eval-config.d.ts +36 -0
  134. package/dist/engine/domain/eval-config.d.ts.map +1 -0
  135. package/dist/engine/domain/eval-config.js +155 -0
  136. package/dist/engine/domain/eval-config.js.map +1 -0
  137. package/dist/engine/domain/knowledge-config.d.ts +34 -0
  138. package/dist/engine/domain/knowledge-config.d.ts.map +1 -0
  139. package/dist/engine/domain/knowledge-config.js +62 -0
  140. package/dist/engine/domain/knowledge-config.js.map +1 -0
  141. package/dist/engine/domain/mcp-config.d.ts +15 -0
  142. package/dist/engine/domain/mcp-config.d.ts.map +1 -0
  143. package/dist/engine/domain/mcp-config.js +26 -0
  144. package/dist/engine/domain/mcp-config.js.map +1 -0
  145. package/dist/engine/domain/memory.d.ts +17 -0
  146. package/dist/engine/domain/memory.d.ts.map +1 -0
  147. package/dist/engine/domain/memory.js +4 -0
  148. package/dist/engine/domain/memory.js.map +1 -0
  149. package/dist/engine/domain/modality.d.ts +5 -0
  150. package/dist/engine/domain/modality.d.ts.map +1 -0
  151. package/dist/engine/domain/modality.js +19 -0
  152. package/dist/engine/domain/modality.js.map +1 -0
  153. package/dist/engine/domain/orchestrator-config.d.ts +11 -0
  154. package/dist/engine/domain/orchestrator-config.d.ts.map +1 -0
  155. package/dist/engine/domain/orchestrator-config.js +4 -0
  156. package/dist/engine/domain/orchestrator-config.js.map +1 -0
  157. package/dist/engine/domain/prompt-assembler.d.ts +32 -0
  158. package/dist/engine/domain/prompt-assembler.d.ts.map +1 -0
  159. package/dist/engine/domain/prompt-assembler.js +60 -0
  160. package/dist/engine/domain/prompt-assembler.js.map +1 -0
  161. package/dist/engine/domain/safety-config.d.ts +51 -0
  162. package/dist/engine/domain/safety-config.d.ts.map +1 -0
  163. package/dist/engine/domain/safety-config.js +74 -0
  164. package/dist/engine/domain/safety-config.js.map +1 -0
  165. package/dist/engine/domain/speech-config.d.ts +53 -0
  166. package/dist/engine/domain/speech-config.d.ts.map +1 -0
  167. package/dist/engine/domain/speech-config.js +26 -0
  168. package/dist/engine/domain/speech-config.js.map +1 -0
  169. package/dist/engine/domain/task.d.ts +16 -0
  170. package/dist/engine/domain/task.d.ts.map +1 -0
  171. package/dist/engine/domain/task.js +4 -0
  172. package/dist/engine/domain/task.js.map +1 -0
  173. package/dist/engine/domain/tool-selection-config.d.ts +12 -0
  174. package/dist/engine/domain/tool-selection-config.d.ts.map +1 -0
  175. package/dist/engine/domain/tool-selection-config.js +22 -0
  176. package/dist/engine/domain/tool-selection-config.js.map +1 -0
  177. package/dist/engine/domain/trigger.d.ts +43 -0
  178. package/dist/engine/domain/trigger.d.ts.map +1 -0
  179. package/dist/engine/domain/trigger.js +39 -0
  180. package/dist/engine/domain/trigger.js.map +1 -0
  181. package/dist/engine/domain/vector-store.d.ts +27 -0
  182. package/dist/engine/domain/vector-store.d.ts.map +1 -0
  183. package/dist/engine/domain/vector-store.js +3 -0
  184. package/dist/engine/domain/vector-store.js.map +1 -0
  185. package/dist/engine/domain/workflow.d.ts +11 -0
  186. package/dist/engine/domain/workflow.d.ts.map +1 -0
  187. package/dist/engine/domain/workflow.js +4 -0
  188. package/dist/engine/domain/workflow.js.map +1 -0
  189. package/dist/engine/error-catalog.d.ts +8 -0
  190. package/dist/engine/error-catalog.d.ts.map +1 -0
  191. package/dist/engine/error-catalog.js +335 -0
  192. package/dist/engine/error-catalog.js.map +1 -0
  193. package/dist/engine/errors.d.ts +18 -0
  194. package/dist/engine/errors.d.ts.map +1 -0
  195. package/dist/engine/errors.js +20 -0
  196. package/dist/engine/errors.js.map +1 -0
  197. package/dist/engine/gateway/delegation-config.d.ts +52 -0
  198. package/dist/engine/gateway/delegation-config.d.ts.map +1 -0
  199. package/dist/engine/gateway/delegation-config.js +48 -0
  200. package/dist/engine/gateway/delegation-config.js.map +1 -0
  201. package/dist/engine/gateway/gateway-config.d.ts +33 -0
  202. package/dist/engine/gateway/gateway-config.d.ts.map +1 -0
  203. package/dist/engine/gateway/gateway-config.js +61 -0
  204. package/dist/engine/gateway/gateway-config.js.map +1 -0
  205. package/dist/engine/gateway/gateway-loader.d.ts +10 -0
  206. package/dist/engine/gateway/gateway-loader.d.ts.map +1 -0
  207. package/dist/engine/gateway/gateway-loader.js +150 -0
  208. package/dist/engine/gateway/gateway-loader.js.map +1 -0
  209. package/dist/engine/gateway/mode-b-config.d.ts +44 -0
  210. package/dist/engine/gateway/mode-b-config.d.ts.map +1 -0
  211. package/dist/engine/gateway/mode-b-config.js +45 -0
  212. package/dist/engine/gateway/mode-b-config.js.map +1 -0
  213. package/dist/engine/gateway/mode-b-loader.d.ts +14 -0
  214. package/dist/engine/gateway/mode-b-loader.d.ts.map +1 -0
  215. package/dist/engine/gateway/mode-b-loader.js +104 -0
  216. package/dist/engine/gateway/mode-b-loader.js.map +1 -0
  217. package/dist/engine/gateway/observability-config.d.ts +19 -0
  218. package/dist/engine/gateway/observability-config.d.ts.map +1 -0
  219. package/dist/engine/gateway/observability-config.js +27 -0
  220. package/dist/engine/gateway/observability-config.js.map +1 -0
  221. package/dist/engine/gateway/tenant-config.d.ts +59 -0
  222. package/dist/engine/gateway/tenant-config.d.ts.map +1 -0
  223. package/dist/engine/gateway/tenant-config.js +44 -0
  224. package/dist/engine/gateway/tenant-config.js.map +1 -0
  225. package/dist/engine/index.d.ts +49 -0
  226. package/dist/engine/index.d.ts.map +1 -0
  227. package/dist/engine/index.js +27 -0
  228. package/dist/engine/index.js.map +1 -0
  229. package/dist/engine/loader/app-loader.d.ts +18 -0
  230. package/dist/engine/loader/app-loader.d.ts.map +1 -0
  231. package/dist/engine/loader/app-loader.js +947 -0
  232. package/dist/engine/loader/app-loader.js.map +1 -0
  233. package/dist/engine/loader/preset-loader.d.ts +13 -0
  234. package/dist/engine/loader/preset-loader.d.ts.map +1 -0
  235. package/dist/engine/loader/preset-loader.js +51 -0
  236. package/dist/engine/loader/preset-loader.js.map +1 -0
  237. package/dist/eval/dataset-loader.d.ts +3 -0
  238. package/dist/eval/dataset-loader.d.ts.map +1 -0
  239. package/dist/eval/dataset-loader.js +70 -0
  240. package/dist/eval/dataset-loader.js.map +1 -0
  241. package/dist/eval/experiment-comparator.d.ts +16 -0
  242. package/dist/eval/experiment-comparator.d.ts.map +1 -0
  243. package/dist/eval/experiment-comparator.js +34 -0
  244. package/dist/eval/experiment-comparator.js.map +1 -0
  245. package/dist/eval/experiment-runner.d.ts +20 -0
  246. package/dist/eval/experiment-runner.d.ts.map +1 -0
  247. package/dist/eval/experiment-runner.js +54 -0
  248. package/dist/eval/experiment-runner.js.map +1 -0
  249. package/dist/eval/index.d.ts +21 -0
  250. package/dist/eval/index.d.ts.map +1 -0
  251. package/dist/eval/index.js +19 -0
  252. package/dist/eval/index.js.map +1 -0
  253. package/dist/eval/scorer-factory.d.ts +4 -0
  254. package/dist/eval/scorer-factory.d.ts.map +1 -0
  255. package/dist/eval/scorer-factory.js +67 -0
  256. package/dist/eval/scorer-factory.js.map +1 -0
  257. package/dist/eval/scorers/coherence-scorer.d.ts +8 -0
  258. package/dist/eval/scorers/coherence-scorer.d.ts.map +1 -0
  259. package/dist/eval/scorers/coherence-scorer.js +22 -0
  260. package/dist/eval/scorers/coherence-scorer.js.map +1 -0
  261. package/dist/eval/scorers/composite-scorer.d.ts +8 -0
  262. package/dist/eval/scorers/composite-scorer.d.ts.map +1 -0
  263. package/dist/eval/scorers/composite-scorer.js +19 -0
  264. package/dist/eval/scorers/composite-scorer.js.map +1 -0
  265. package/dist/eval/scorers/contains-scorer.d.ts +8 -0
  266. package/dist/eval/scorers/contains-scorer.d.ts.map +1 -0
  267. package/dist/eval/scorers/contains-scorer.js +30 -0
  268. package/dist/eval/scorers/contains-scorer.js.map +1 -0
  269. package/dist/eval/scorers/cost-scorer.d.ts +8 -0
  270. package/dist/eval/scorers/cost-scorer.d.ts.map +1 -0
  271. package/dist/eval/scorers/cost-scorer.js +19 -0
  272. package/dist/eval/scorers/cost-scorer.js.map +1 -0
  273. package/dist/eval/scorers/custom-prompt-scorer.d.ts +9 -0
  274. package/dist/eval/scorers/custom-prompt-scorer.d.ts.map +1 -0
  275. package/dist/eval/scorers/custom-prompt-scorer.js +24 -0
  276. package/dist/eval/scorers/custom-prompt-scorer.js.map +1 -0
  277. package/dist/eval/scorers/exact-match-scorer.d.ts +6 -0
  278. package/dist/eval/scorers/exact-match-scorer.d.ts.map +1 -0
  279. package/dist/eval/scorers/exact-match-scorer.js +16 -0
  280. package/dist/eval/scorers/exact-match-scorer.js.map +1 -0
  281. package/dist/eval/scorers/faithfulness-scorer.d.ts +8 -0
  282. package/dist/eval/scorers/faithfulness-scorer.d.ts.map +1 -0
  283. package/dist/eval/scorers/faithfulness-scorer.js +27 -0
  284. package/dist/eval/scorers/faithfulness-scorer.js.map +1 -0
  285. package/dist/eval/scorers/hallucination-scorer.d.ts +8 -0
  286. package/dist/eval/scorers/hallucination-scorer.d.ts.map +1 -0
  287. package/dist/eval/scorers/hallucination-scorer.js +31 -0
  288. package/dist/eval/scorers/hallucination-scorer.js.map +1 -0
  289. package/dist/eval/scorers/json-validity-scorer.d.ts +8 -0
  290. package/dist/eval/scorers/json-validity-scorer.d.ts.map +1 -0
  291. package/dist/eval/scorers/json-validity-scorer.js +32 -0
  292. package/dist/eval/scorers/json-validity-scorer.js.map +1 -0
  293. package/dist/eval/scorers/latency-scorer.d.ts +8 -0
  294. package/dist/eval/scorers/latency-scorer.d.ts.map +1 -0
  295. package/dist/eval/scorers/latency-scorer.js +19 -0
  296. package/dist/eval/scorers/latency-scorer.js.map +1 -0
  297. package/dist/eval/scorers/length-scorer.d.ts +9 -0
  298. package/dist/eval/scorers/length-scorer.d.ts.map +1 -0
  299. package/dist/eval/scorers/length-scorer.js +26 -0
  300. package/dist/eval/scorers/length-scorer.js.map +1 -0
  301. package/dist/eval/scorers/parse-llm-response.d.ts +5 -0
  302. package/dist/eval/scorers/parse-llm-response.d.ts.map +1 -0
  303. package/dist/eval/scorers/parse-llm-response.js +13 -0
  304. package/dist/eval/scorers/parse-llm-response.js.map +1 -0
  305. package/dist/eval/scorers/relevance-scorer.d.ts +8 -0
  306. package/dist/eval/scorers/relevance-scorer.d.ts.map +1 -0
  307. package/dist/eval/scorers/relevance-scorer.js +23 -0
  308. package/dist/eval/scorers/relevance-scorer.js.map +1 -0
  309. package/dist/eval/scorers/toxicity-scorer.d.ts +8 -0
  310. package/dist/eval/scorers/toxicity-scorer.d.ts.map +1 -0
  311. package/dist/eval/scorers/toxicity-scorer.js +26 -0
  312. package/dist/eval/scorers/toxicity-scorer.js.map +1 -0
  313. package/dist/eval/types.d.ts +51 -0
  314. package/dist/eval/types.d.ts.map +1 -0
  315. package/dist/eval/types.js +3 -0
  316. package/dist/eval/types.js.map +1 -0
  317. package/dist/events/event-bus.d.ts +36 -0
  318. package/dist/events/event-bus.d.ts.map +1 -0
  319. package/dist/events/event-bus.js +116 -0
  320. package/dist/events/event-bus.js.map +1 -0
  321. package/dist/events/event-store.d.ts +11 -0
  322. package/dist/events/event-store.d.ts.map +1 -0
  323. package/dist/events/event-store.js +2 -0
  324. package/dist/events/event-store.js.map +1 -0
  325. package/dist/events/index.d.ts +295 -0
  326. package/dist/events/index.d.ts.map +1 -0
  327. package/dist/events/index.js +48 -0
  328. package/dist/events/index.js.map +1 -0
  329. package/dist/events/trace.d.ts +30 -0
  330. package/dist/events/trace.d.ts.map +1 -0
  331. package/dist/events/trace.js +45 -0
  332. package/dist/events/trace.js.map +1 -0
  333. package/dist/index.d.ts +58 -0
  334. package/dist/index.d.ts.map +1 -0
  335. package/dist/index.js +42 -0
  336. package/dist/index.js.map +1 -0
  337. package/dist/knowledge/index.d.ts +10 -0
  338. package/dist/knowledge/index.d.ts.map +1 -0
  339. package/dist/knowledge/index.js +9 -0
  340. package/dist/knowledge/index.js.map +1 -0
  341. package/dist/knowledge/infrastructure/memory-vector-store.d.ts +12 -0
  342. package/dist/knowledge/infrastructure/memory-vector-store.d.ts.map +1 -0
  343. package/dist/knowledge/infrastructure/memory-vector-store.js +71 -0
  344. package/dist/knowledge/infrastructure/memory-vector-store.js.map +1 -0
  345. package/dist/knowledge/infrastructure/ollama-embedding.d.ts +15 -0
  346. package/dist/knowledge/infrastructure/ollama-embedding.d.ts.map +1 -0
  347. package/dist/knowledge/infrastructure/ollama-embedding.js +38 -0
  348. package/dist/knowledge/infrastructure/ollama-embedding.js.map +1 -0
  349. package/dist/knowledge/infrastructure/openai-embedding.d.ts +18 -0
  350. package/dist/knowledge/infrastructure/openai-embedding.d.ts.map +1 -0
  351. package/dist/knowledge/infrastructure/openai-embedding.js +66 -0
  352. package/dist/knowledge/infrastructure/openai-embedding.js.map +1 -0
  353. package/dist/knowledge/knowledge-capability.d.ts +15 -0
  354. package/dist/knowledge/knowledge-capability.d.ts.map +1 -0
  355. package/dist/knowledge/knowledge-capability.js +36 -0
  356. package/dist/knowledge/knowledge-capability.js.map +1 -0
  357. package/dist/knowledge/markdown-chunker.d.ts +8 -0
  358. package/dist/knowledge/markdown-chunker.d.ts.map +1 -0
  359. package/dist/knowledge/markdown-chunker.js +146 -0
  360. package/dist/knowledge/markdown-chunker.js.map +1 -0
  361. package/dist/knowledge/recursive-chunker.d.ts +8 -0
  362. package/dist/knowledge/recursive-chunker.d.ts.map +1 -0
  363. package/dist/knowledge/recursive-chunker.js +73 -0
  364. package/dist/knowledge/recursive-chunker.js.map +1 -0
  365. package/dist/knowledge/reranker.d.ts +5 -0
  366. package/dist/knowledge/reranker.d.ts.map +1 -0
  367. package/dist/knowledge/reranker.js +3 -0
  368. package/dist/knowledge/reranker.js.map +1 -0
  369. package/dist/knowledge/retrieval-pipeline.d.ts +26 -0
  370. package/dist/knowledge/retrieval-pipeline.d.ts.map +1 -0
  371. package/dist/knowledge/retrieval-pipeline.js +56 -0
  372. package/dist/knowledge/retrieval-pipeline.js.map +1 -0
  373. package/dist/memory/chunk-importer.d.ts +16 -0
  374. package/dist/memory/chunk-importer.d.ts.map +1 -0
  375. package/dist/memory/chunk-importer.js +58 -0
  376. package/dist/memory/chunk-importer.js.map +1 -0
  377. package/dist/memory/compactor.d.ts +59 -0
  378. package/dist/memory/compactor.d.ts.map +1 -0
  379. package/dist/memory/compactor.js +100 -0
  380. package/dist/memory/compactor.js.map +1 -0
  381. package/dist/memory/decay-curves.d.ts +33 -0
  382. package/dist/memory/decay-curves.d.ts.map +1 -0
  383. package/dist/memory/decay-curves.js +48 -0
  384. package/dist/memory/decay-curves.js.map +1 -0
  385. package/dist/memory/developer-identity.d.ts +7 -0
  386. package/dist/memory/developer-identity.d.ts.map +1 -0
  387. package/dist/memory/developer-identity.js +20 -0
  388. package/dist/memory/developer-identity.js.map +1 -0
  389. package/dist/memory/git-sync-manager.d.ts +28 -0
  390. package/dist/memory/git-sync-manager.d.ts.map +1 -0
  391. package/dist/memory/git-sync-manager.js +77 -0
  392. package/dist/memory/git-sync-manager.js.map +1 -0
  393. package/dist/memory/index.d.ts +46 -0
  394. package/dist/memory/index.d.ts.map +1 -0
  395. package/dist/memory/index.js +11 -0
  396. package/dist/memory/index.js.map +1 -0
  397. package/dist/memory/memory-manager.d.ts +34 -0
  398. package/dist/memory/memory-manager.d.ts.map +1 -0
  399. package/dist/memory/memory-manager.js +151 -0
  400. package/dist/memory/memory-manager.js.map +1 -0
  401. package/dist/memory/project-store.d.ts +28 -0
  402. package/dist/memory/project-store.d.ts.map +1 -0
  403. package/dist/memory/project-store.js +159 -0
  404. package/dist/memory/project-store.js.map +1 -0
  405. package/dist/memory/sqlite-store.d.ts +41 -0
  406. package/dist/memory/sqlite-store.d.ts.map +1 -0
  407. package/dist/memory/sqlite-store.js +320 -0
  408. package/dist/memory/sqlite-store.js.map +1 -0
  409. package/dist/observability/index.d.ts +5 -0
  410. package/dist/observability/index.d.ts.map +1 -0
  411. package/dist/observability/index.js +3 -0
  412. package/dist/observability/index.js.map +1 -0
  413. package/dist/observability/otel-exporter.d.ts +41 -0
  414. package/dist/observability/otel-exporter.d.ts.map +1 -0
  415. package/dist/observability/otel-exporter.js +166 -0
  416. package/dist/observability/otel-exporter.js.map +1 -0
  417. package/dist/observability/span-mapper.d.ts +24 -0
  418. package/dist/observability/span-mapper.d.ts.map +1 -0
  419. package/dist/observability/span-mapper.js +375 -0
  420. package/dist/observability/span-mapper.js.map +1 -0
  421. package/dist/orchestrator/checkpoint-store.d.ts +9 -0
  422. package/dist/orchestrator/checkpoint-store.d.ts.map +1 -0
  423. package/dist/orchestrator/checkpoint-store.js +2 -0
  424. package/dist/orchestrator/checkpoint-store.js.map +1 -0
  425. package/dist/orchestrator/checkpoint-types.d.ts +30 -0
  426. package/dist/orchestrator/checkpoint-types.d.ts.map +1 -0
  427. package/dist/orchestrator/checkpoint-types.js +2 -0
  428. package/dist/orchestrator/checkpoint-types.js.map +1 -0
  429. package/dist/orchestrator/guardrails.d.ts +23 -0
  430. package/dist/orchestrator/guardrails.d.ts.map +1 -0
  431. package/dist/orchestrator/guardrails.js +136 -0
  432. package/dist/orchestrator/guardrails.js.map +1 -0
  433. package/dist/orchestrator/index.d.ts +45 -0
  434. package/dist/orchestrator/index.d.ts.map +1 -0
  435. package/dist/orchestrator/index.js +8 -0
  436. package/dist/orchestrator/index.js.map +1 -0
  437. package/dist/orchestrator/interrupt.d.ts +20 -0
  438. package/dist/orchestrator/interrupt.d.ts.map +1 -0
  439. package/dist/orchestrator/interrupt.js +4 -0
  440. package/dist/orchestrator/interrupt.js.map +1 -0
  441. package/dist/orchestrator/orchestrator.d.ts +170 -0
  442. package/dist/orchestrator/orchestrator.d.ts.map +1 -0
  443. package/dist/orchestrator/orchestrator.js +509 -0
  444. package/dist/orchestrator/orchestrator.js.map +1 -0
  445. package/dist/orchestrator/phase-machine.d.ts +48 -0
  446. package/dist/orchestrator/phase-machine.d.ts.map +1 -0
  447. package/dist/orchestrator/phase-machine.js +176 -0
  448. package/dist/orchestrator/phase-machine.js.map +1 -0
  449. package/dist/orchestrator/schemas.d.ts +145 -0
  450. package/dist/orchestrator/schemas.d.ts.map +1 -0
  451. package/dist/orchestrator/schemas.js +126 -0
  452. package/dist/orchestrator/schemas.js.map +1 -0
  453. package/dist/orchestrator/sqlite-checkpoint-store.d.ts +15 -0
  454. package/dist/orchestrator/sqlite-checkpoint-store.d.ts.map +1 -0
  455. package/dist/orchestrator/sqlite-checkpoint-store.js +98 -0
  456. package/dist/orchestrator/sqlite-checkpoint-store.js.map +1 -0
  457. package/dist/orchestrator/strategies/index.d.ts +28 -0
  458. package/dist/orchestrator/strategies/index.d.ts.map +1 -0
  459. package/dist/orchestrator/strategies/index.js +20 -0
  460. package/dist/orchestrator/strategies/index.js.map +1 -0
  461. package/dist/orchestrator/strategies/sequential-strategy.d.ts +13 -0
  462. package/dist/orchestrator/strategies/sequential-strategy.d.ts.map +1 -0
  463. package/dist/orchestrator/strategies/sequential-strategy.js +29 -0
  464. package/dist/orchestrator/strategies/sequential-strategy.js.map +1 -0
  465. package/dist/orchestrator/strategies/supervisor-strategy.d.ts +43 -0
  466. package/dist/orchestrator/strategies/supervisor-strategy.d.ts.map +1 -0
  467. package/dist/orchestrator/strategies/supervisor-strategy.js +118 -0
  468. package/dist/orchestrator/strategies/supervisor-strategy.js.map +1 -0
  469. package/dist/orchestrator/strategies/swarm-strategy.d.ts +36 -0
  470. package/dist/orchestrator/strategies/swarm-strategy.d.ts.map +1 -0
  471. package/dist/orchestrator/strategies/swarm-strategy.js +126 -0
  472. package/dist/orchestrator/strategies/swarm-strategy.js.map +1 -0
  473. package/dist/package/index.d.ts +7 -0
  474. package/dist/package/index.d.ts.map +1 -0
  475. package/dist/package/index.js +6 -0
  476. package/dist/package/index.js.map +1 -0
  477. package/dist/package/security.d.ts +18 -0
  478. package/dist/package/security.d.ts.map +1 -0
  479. package/dist/package/security.js +110 -0
  480. package/dist/package/security.js.map +1 -0
  481. package/dist/package/types.d.ts +34 -0
  482. package/dist/package/types.d.ts.map +1 -0
  483. package/dist/package/types.js +4 -0
  484. package/dist/package/types.js.map +1 -0
  485. package/dist/package/yaml-parser.d.ts +22 -0
  486. package/dist/package/yaml-parser.d.ts.map +1 -0
  487. package/dist/package/yaml-parser.js +109 -0
  488. package/dist/package/yaml-parser.js.map +1 -0
  489. package/dist/package/yaml-schema.d.ts +42 -0
  490. package/dist/package/yaml-schema.d.ts.map +1 -0
  491. package/dist/package/yaml-schema.js +141 -0
  492. package/dist/package/yaml-schema.js.map +1 -0
  493. package/dist/safety/content-classifier.d.ts +31 -0
  494. package/dist/safety/content-classifier.d.ts.map +1 -0
  495. package/dist/safety/content-classifier.js +107 -0
  496. package/dist/safety/content-classifier.js.map +1 -0
  497. package/dist/safety/index.d.ts +10 -0
  498. package/dist/safety/index.d.ts.map +1 -0
  499. package/dist/safety/index.js +10 -0
  500. package/dist/safety/index.js.map +1 -0
  501. package/dist/safety/pii-scanner.d.ts +26 -0
  502. package/dist/safety/pii-scanner.d.ts.map +1 -0
  503. package/dist/safety/pii-scanner.js +82 -0
  504. package/dist/safety/pii-scanner.js.map +1 -0
  505. package/dist/safety/rails.d.ts +33 -0
  506. package/dist/safety/rails.d.ts.map +1 -0
  507. package/dist/safety/rails.js +134 -0
  508. package/dist/safety/rails.js.map +1 -0
  509. package/dist/safety/safety-pipeline.d.ts +41 -0
  510. package/dist/safety/safety-pipeline.d.ts.map +1 -0
  511. package/dist/safety/safety-pipeline.js +153 -0
  512. package/dist/safety/safety-pipeline.js.map +1 -0
  513. package/dist/safety/types.d.ts +38 -0
  514. package/dist/safety/types.d.ts.map +1 -0
  515. package/dist/safety/types.js +3 -0
  516. package/dist/safety/types.js.map +1 -0
  517. package/dist/sandbox/index.d.ts +17 -0
  518. package/dist/sandbox/index.d.ts.map +1 -0
  519. package/dist/sandbox/index.js +4 -0
  520. package/dist/sandbox/index.js.map +1 -0
  521. package/dist/sandbox/network-filter.d.ts +13 -0
  522. package/dist/sandbox/network-filter.d.ts.map +1 -0
  523. package/dist/sandbox/network-filter.js +43 -0
  524. package/dist/sandbox/network-filter.js.map +1 -0
  525. package/dist/sandbox/path-validator.d.ts +16 -0
  526. package/dist/sandbox/path-validator.d.ts.map +1 -0
  527. package/dist/sandbox/path-validator.js +47 -0
  528. package/dist/sandbox/path-validator.js.map +1 -0
  529. package/dist/sandbox/policies.d.ts +38 -0
  530. package/dist/sandbox/policies.d.ts.map +1 -0
  531. package/dist/sandbox/policies.js +145 -0
  532. package/dist/sandbox/policies.js.map +1 -0
  533. package/dist/security/audit-log.d.ts +17 -0
  534. package/dist/security/audit-log.d.ts.map +1 -0
  535. package/dist/security/audit-log.js +214 -0
  536. package/dist/security/audit-log.js.map +1 -0
  537. package/dist/security/guardian.d.ts +24 -0
  538. package/dist/security/guardian.d.ts.map +1 -0
  539. package/dist/security/guardian.js +177 -0
  540. package/dist/security/guardian.js.map +1 -0
  541. package/dist/security/index.d.ts +10 -0
  542. package/dist/security/index.d.ts.map +1 -0
  543. package/dist/security/index.js +7 -0
  544. package/dist/security/index.js.map +1 -0
  545. package/dist/security/prompt-scanner.d.ts +23 -0
  546. package/dist/security/prompt-scanner.d.ts.map +1 -0
  547. package/dist/security/prompt-scanner.js +376 -0
  548. package/dist/security/prompt-scanner.js.map +1 -0
  549. package/dist/security/secret-store.d.ts +18 -0
  550. package/dist/security/secret-store.d.ts.map +1 -0
  551. package/dist/security/secret-store.js +123 -0
  552. package/dist/security/secret-store.js.map +1 -0
  553. package/dist/security/self-audit.d.ts +33 -0
  554. package/dist/security/self-audit.d.ts.map +1 -0
  555. package/dist/security/self-audit.js +142 -0
  556. package/dist/security/self-audit.js.map +1 -0
  557. package/dist/security/types.d.ts +107 -0
  558. package/dist/security/types.d.ts.map +1 -0
  559. package/dist/security/types.js +3 -0
  560. package/dist/security/types.js.map +1 -0
  561. package/dist/skill/index.d.ts +7 -0
  562. package/dist/skill/index.d.ts.map +1 -0
  563. package/dist/skill/index.js +4 -0
  564. package/dist/skill/index.js.map +1 -0
  565. package/dist/skill/skill-registry.d.ts +26 -0
  566. package/dist/skill/skill-registry.d.ts.map +1 -0
  567. package/dist/skill/skill-registry.js +81 -0
  568. package/dist/skill/skill-registry.js.map +1 -0
  569. package/dist/skill/types.d.ts +17 -0
  570. package/dist/skill/types.d.ts.map +1 -0
  571. package/dist/skill/types.js +2 -0
  572. package/dist/skill/types.js.map +1 -0
  573. package/dist/skill/yaml-parser.d.ts +18 -0
  574. package/dist/skill/yaml-parser.d.ts.map +1 -0
  575. package/dist/skill/yaml-parser.js +61 -0
  576. package/dist/skill/yaml-parser.js.map +1 -0
  577. package/dist/skill/yaml-schema.d.ts +20 -0
  578. package/dist/skill/yaml-schema.d.ts.map +1 -0
  579. package/dist/skill/yaml-schema.js +80 -0
  580. package/dist/skill/yaml-schema.js.map +1 -0
  581. package/dist/tree/batch-executor.d.ts +28 -0
  582. package/dist/tree/batch-executor.d.ts.map +1 -0
  583. package/dist/tree/batch-executor.js +78 -0
  584. package/dist/tree/batch-executor.js.map +1 -0
  585. package/dist/tree/index.d.ts +26 -0
  586. package/dist/tree/index.d.ts.map +1 -0
  587. package/dist/tree/index.js +3 -0
  588. package/dist/tree/index.js.map +1 -0
  589. package/dist/tree/task-tree.d.ts +74 -0
  590. package/dist/tree/task-tree.d.ts.map +1 -0
  591. package/dist/tree/task-tree.js +262 -0
  592. package/dist/tree/task-tree.js.map +1 -0
  593. package/dist/verification/coverage-parser.d.ts +6 -0
  594. package/dist/verification/coverage-parser.d.ts.map +1 -0
  595. package/dist/verification/coverage-parser.js +29 -0
  596. package/dist/verification/coverage-parser.js.map +1 -0
  597. package/dist/verification/gate-runner.d.ts +18 -0
  598. package/dist/verification/gate-runner.d.ts.map +1 -0
  599. package/dist/verification/gate-runner.js +63 -0
  600. package/dist/verification/gate-runner.js.map +1 -0
  601. package/dist/verification/index.d.ts +24 -0
  602. package/dist/verification/index.d.ts.map +1 -0
  603. package/dist/verification/index.js +4 -0
  604. package/dist/verification/index.js.map +1 -0
  605. package/dist/verification/verification-loop.d.ts +32 -0
  606. package/dist/verification/verification-loop.d.ts.map +1 -0
  607. package/dist/verification/verification-loop.js +71 -0
  608. package/dist/verification/verification-loop.js.map +1 -0
  609. package/package.json +58 -0
@@ -0,0 +1,19 @@
1
+ // CompositeScorer: averages scores from multiple sub-scorers
2
+ export class CompositeScorer {
3
+ scorers;
4
+ name;
5
+ constructor(name, scorers) {
6
+ this.scorers = scorers;
7
+ this.name = name;
8
+ }
9
+ async score(input) {
10
+ if (this.scorers.length === 0) {
11
+ return { name: this.name, score: 0, reasoning: "no sub-scorers configured" };
12
+ }
13
+ const results = await Promise.all(this.scorers.map((s) => s.score(input)));
14
+ const avg = results.reduce((sum, r) => sum + r.score, 0) / results.length;
15
+ const reasoning = results.map((r) => `${r.name}=${r.score.toFixed(2)}`).join(", ");
16
+ return { name: this.name, score: avg, reasoning };
17
+ }
18
+ }
19
+ //# sourceMappingURL=composite-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"composite-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/composite-scorer.ts"],"names":[],"mappings":"AAAA,6DAA6D;AAI7D,MAAM,OAAO,eAAe;IAKP;IAJV,IAAI,CAAS;IAEtB,YACE,IAAY,EACK,OAA0B;QAA1B,YAAO,GAAP,OAAO,CAAmB;QAE3C,IAAI,CAAC,IAAI,GAAG,IAAI,CAAC;IACnB,CAAC;IAED,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YAC9B,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,2BAA2B,EAAE,CAAC;QAC/E,CAAC;QACD,MAAM,OAAO,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;QAC3E,MAAM,GAAG,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,GAAG,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,CAAC,GAAG,OAAO,CAAC,MAAM,CAAC;QAC1E,MAAM,SAAS,GAAG,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,GAAG,CAAC,CAAC,IAAI,IAAI,CAAC,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QACnF,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,GAAG,EAAE,SAAS,EAAE,CAAC;IACpD,CAAC;CACF"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer } from "../types.js";
2
+ export declare class ContainsScorer implements Scorer {
3
+ private readonly substrings;
4
+ readonly name = "contains";
5
+ constructor(substrings: readonly string[]);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=contains-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"contains-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/contains-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AAEhE,qBAAa,cAAe,YAAW,MAAM;IAG/B,OAAO,CAAC,QAAQ,CAAC,UAAU;IAFvC,QAAQ,CAAC,IAAI,cAAc;gBAEE,UAAU,EAAE,SAAS,MAAM,EAAE;IAEpD,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAoBlD"}
@@ -0,0 +1,30 @@
1
+ // ContainsScorer: checks if output contains required substrings (case-insensitive)
2
+ export class ContainsScorer {
3
+ substrings;
4
+ name = "contains";
5
+ constructor(substrings) {
6
+ this.substrings = substrings;
7
+ }
8
+ async score(input) {
9
+ if (this.substrings.length === 0) {
10
+ return { name: this.name, score: 1, reasoning: "no substrings to check" };
11
+ }
12
+ const lower = input.output.toLowerCase();
13
+ const found = [];
14
+ const missing = [];
15
+ for (const sub of this.substrings) {
16
+ if (lower.includes(sub.toLowerCase())) {
17
+ found.push(sub);
18
+ }
19
+ else {
20
+ missing.push(sub);
21
+ }
22
+ }
23
+ const score = found.length / this.substrings.length;
24
+ const reasoning = missing.length === 0
25
+ ? `found all ${found.length} substrings`
26
+ : `found ${found.length}/${this.substrings.length}, missing: ${missing.join(", ")}`;
27
+ return { name: this.name, score, reasoning };
28
+ }
29
+ }
30
+ //# sourceMappingURL=contains-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"contains-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/contains-scorer.ts"],"names":[],"mappings":"AAAA,mFAAmF;AAInF,MAAM,OAAO,cAAc;IAGI;IAFpB,IAAI,GAAG,UAAU,CAAC;IAE3B,YAA6B,UAA6B;QAA7B,eAAU,GAAV,UAAU,CAAmB;IAAG,CAAC;IAE9D,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,IAAI,IAAI,CAAC,UAAU,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YACjC,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,wBAAwB,EAAE,CAAC;QAC5E,CAAC;QACD,MAAM,KAAK,GAAG,KAAK,CAAC,MAAM,CAAC,WAAW,EAAE,CAAC;QACzC,MAAM,KAAK,GAAa,EAAE,CAAC;QAC3B,MAAM,OAAO,GAAa,EAAE,CAAC;QAC7B,KAAK,MAAM,GAAG,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;YAClC,IAAI,KAAK,CAAC,QAAQ,CAAC,GAAG,CAAC,WAAW,EAAE,CAAC,EAAE,CAAC;gBACtC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;YAClB,CAAC;iBAAM,CAAC;gBACN,OAAO,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;YACpB,CAAC;QACH,CAAC;QACD,MAAM,KAAK,GAAG,KAAK,CAAC,MAAM,GAAG,IAAI,CAAC,UAAU,CAAC,MAAM,CAAC;QACpD,MAAM,SAAS,GAAG,OAAO,CAAC,MAAM,KAAK,CAAC;YACpC,CAAC,CAAC,aAAa,KAAK,CAAC,MAAM,aAAa;YACxC,CAAC,CAAC,SAAS,KAAK,CAAC,MAAM,IAAI,IAAI,CAAC,UAAU,CAAC,MAAM,cAAc,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QACtF,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,CAAC;IAC/C,CAAC;CACF"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer } from "../types.js";
2
+ export declare class CostScorer implements Scorer {
3
+ private readonly maxCostUsd;
4
+ readonly name = "cost";
5
+ constructor(maxCostUsd: number);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=cost-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"cost-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/cost-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AAEhE,qBAAa,UAAW,YAAW,MAAM;IAG3B,OAAO,CAAC,QAAQ,CAAC,UAAU;IAFvC,QAAQ,CAAC,IAAI,UAAU;gBAEM,UAAU,EAAE,MAAM;IAEzC,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAUlD"}
@@ -0,0 +1,19 @@
1
+ // CostScorer: scores token cost against a budget threshold
2
+ export class CostScorer {
3
+ maxCostUsd;
4
+ name = "cost";
5
+ constructor(maxCostUsd) {
6
+ this.maxCostUsd = maxCostUsd;
7
+ }
8
+ async score(input) {
9
+ if (input.costUsd === undefined) {
10
+ return { name: this.name, score: 0, reasoning: "no cost data available" };
11
+ }
12
+ if (input.costUsd <= this.maxCostUsd) {
13
+ return { name: this.name, score: 1, reasoning: `$${input.costUsd.toFixed(4)} within $${this.maxCostUsd.toFixed(2)} threshold` };
14
+ }
15
+ const score = Math.max(0, Math.min(1, this.maxCostUsd / input.costUsd));
16
+ return { name: this.name, score, reasoning: `$${input.costUsd.toFixed(4)} exceeds $${this.maxCostUsd.toFixed(2)} threshold` };
17
+ }
18
+ }
19
+ //# sourceMappingURL=cost-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"cost-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/cost-scorer.ts"],"names":[],"mappings":"AAAA,2DAA2D;AAI3D,MAAM,OAAO,UAAU;IAGQ;IAFpB,IAAI,GAAG,MAAM,CAAC;IAEvB,YAA6B,UAAkB;QAAlB,eAAU,GAAV,UAAU,CAAQ;IAAG,CAAC;IAEnD,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,IAAI,KAAK,CAAC,OAAO,KAAK,SAAS,EAAE,CAAC;YAChC,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,wBAAwB,EAAE,CAAC;QAC5E,CAAC;QACD,IAAI,KAAK,CAAC,OAAO,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;YACrC,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,IAAI,KAAK,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,YAAY,IAAI,CAAC,UAAU,CAAC,OAAO,CAAC,CAAC,CAAC,YAAY,EAAE,CAAC;QAClI,CAAC;QACD,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,UAAU,GAAG,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC;QACxE,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,IAAI,KAAK,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,aAAa,IAAI,CAAC,UAAU,CAAC,OAAO,CAAC,CAAC,CAAC,YAAY,EAAE,CAAC;IAChI,CAAC;CACF"}
@@ -0,0 +1,9 @@
1
+ import type { EvalInput, EvalScore, Scorer, ScorerLLM } from "../types.js";
2
+ export declare class CustomPromptScorer implements Scorer {
3
+ private readonly promptTemplate;
4
+ private readonly llm;
5
+ readonly name: string;
6
+ constructor(name: string, promptTemplate: string, llm: ScorerLLM);
7
+ score(input: EvalInput): Promise<EvalScore>;
8
+ }
9
+ //# sourceMappingURL=custom-prompt-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"custom-prompt-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/custom-prompt-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAG3E,qBAAa,kBAAmB,YAAW,MAAM;IAK7C,OAAO,CAAC,QAAQ,CAAC,cAAc;IAC/B,OAAO,CAAC,QAAQ,CAAC,GAAG;IALtB,QAAQ,CAAC,IAAI,EAAE,MAAM,CAAC;gBAGpB,IAAI,EAAE,MAAM,EACK,cAAc,EAAE,MAAM,EACtB,GAAG,EAAE,SAAS;IAK3B,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAYlD"}
@@ -0,0 +1,24 @@
1
+ // CustomPromptScorer: evaluates output using a user-provided prompt template
2
+ import { parseLLMResponse } from "./parse-llm-response.js";
3
+ export class CustomPromptScorer {
4
+ promptTemplate;
5
+ llm;
6
+ name;
7
+ constructor(name, promptTemplate, llm) {
8
+ this.promptTemplate = promptTemplate;
9
+ this.llm = llm;
10
+ this.name = name;
11
+ }
12
+ async score(input) {
13
+ const context = (input.context ?? []).join("\n");
14
+ const prompt = this.promptTemplate
15
+ .replace(/\{\{input\}\}/g, input.input)
16
+ .replace(/\{\{output\}\}/g, input.output)
17
+ .replace(/\{\{expected\}\}/g, input.expected ?? "")
18
+ .replace(/\{\{context\}\}/g, context);
19
+ const response = await this.llm.evaluate(prompt);
20
+ const { score, reasoning } = parseLLMResponse(response, this.name);
21
+ return { name: this.name, score, reasoning };
22
+ }
23
+ }
24
+ //# sourceMappingURL=custom-prompt-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"custom-prompt-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/custom-prompt-scorer.ts"],"names":[],"mappings":"AAAA,6EAA6E;AAG7E,OAAO,EAAE,gBAAgB,EAAE,MAAM,yBAAyB,CAAC;AAE3D,MAAM,OAAO,kBAAkB;IAKV;IACA;IALV,IAAI,CAAS;IAEtB,YACE,IAAY,EACK,cAAsB,EACtB,GAAc;QADd,mBAAc,GAAd,cAAc,CAAQ;QACtB,QAAG,GAAH,GAAG,CAAW;QAE/B,IAAI,CAAC,IAAI,GAAG,IAAI,CAAC;IACnB,CAAC;IAED,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,MAAM,OAAO,GAAG,CAAC,KAAK,CAAC,OAAO,IAAI,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QACjD,MAAM,MAAM,GAAG,IAAI,CAAC,cAAc;aAC/B,OAAO,CAAC,gBAAgB,EAAE,KAAK,CAAC,KAAK,CAAC;aACtC,OAAO,CAAC,iBAAiB,EAAE,KAAK,CAAC,MAAM,CAAC;aACxC,OAAO,CAAC,mBAAmB,EAAE,KAAK,CAAC,QAAQ,IAAI,EAAE,CAAC;aAClD,OAAO,CAAC,kBAAkB,EAAE,OAAO,CAAC,CAAC;QAExC,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,GAAG,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;QACjD,MAAM,EAAE,KAAK,EAAE,SAAS,EAAE,GAAG,gBAAgB,CAAC,QAAQ,EAAE,IAAI,CAAC,IAAI,CAAC,CAAC;QACnE,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,CAAC;IAC/C,CAAC;CACF"}
@@ -0,0 +1,6 @@
1
+ import type { EvalInput, EvalScore, Scorer } from "../types.js";
2
+ export declare class ExactMatchScorer implements Scorer {
3
+ readonly name = "exact-match";
4
+ score(input: EvalInput): Promise<EvalScore>;
5
+ }
6
+ //# sourceMappingURL=exact-match-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"exact-match-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/exact-match-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AAEhE,qBAAa,gBAAiB,YAAW,MAAM;IAC7C,QAAQ,CAAC,IAAI,iBAAiB;IAExB,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAWlD"}
@@ -0,0 +1,16 @@
1
+ // ExactMatchScorer: binary comparison of output vs expected value
2
+ export class ExactMatchScorer {
3
+ name = "exact-match";
4
+ async score(input) {
5
+ if (input.expected === undefined) {
6
+ return { name: this.name, score: 0, reasoning: "no expected value provided" };
7
+ }
8
+ const matches = input.output === input.expected;
9
+ return {
10
+ name: this.name,
11
+ score: matches ? 1 : 0,
12
+ reasoning: matches ? "exact match" : "output does not match expected",
13
+ };
14
+ }
15
+ }
16
+ //# sourceMappingURL=exact-match-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"exact-match-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/exact-match-scorer.ts"],"names":[],"mappings":"AAAA,kEAAkE;AAIlE,MAAM,OAAO,gBAAgB;IAClB,IAAI,GAAG,aAAa,CAAC;IAE9B,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,IAAI,KAAK,CAAC,QAAQ,KAAK,SAAS,EAAE,CAAC;YACjC,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,4BAA4B,EAAE,CAAC;QAChF,CAAC;QACD,MAAM,OAAO,GAAG,KAAK,CAAC,MAAM,KAAK,KAAK,CAAC,QAAQ,CAAC;QAChD,OAAO;YACL,IAAI,EAAE,IAAI,CAAC,IAAI;YACf,KAAK,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YACtB,SAAS,EAAE,OAAO,CAAC,CAAC,CAAC,aAAa,CAAC,CAAC,CAAC,gCAAgC;SACtE,CAAC;IACJ,CAAC;CACF"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer, ScorerLLM } from "../types.js";
2
+ export declare class FaithfulnessScorer implements Scorer {
3
+ private readonly llm;
4
+ readonly name = "faithfulness";
5
+ constructor(llm: ScorerLLM);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=faithfulness-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"faithfulness-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/faithfulness-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAG3E,qBAAa,kBAAmB,YAAW,MAAM;IAGnC,OAAO,CAAC,QAAQ,CAAC,GAAG;IAFhC,QAAQ,CAAC,IAAI,kBAAkB;gBAEF,GAAG,EAAE,SAAS;IAErC,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAkBlD"}
@@ -0,0 +1,27 @@
1
+ // FaithfulnessScorer: evaluates whether output stays faithful to provided context
2
+ import { parseLLMResponse } from "./parse-llm-response.js";
3
+ export class FaithfulnessScorer {
4
+ llm;
5
+ name = "faithfulness";
6
+ constructor(llm) {
7
+ this.llm = llm;
8
+ }
9
+ async score(input) {
10
+ const context = (input.context ?? []).join("\n");
11
+ const prompt = `Evaluate faithfulness. Does the output stay faithful to the provided context? Only use information from the context.
12
+
13
+ Context:
14
+ ${context || "(no context provided)"}
15
+
16
+ Input: ${input.input}
17
+ Output: ${input.output}
18
+
19
+ Respond EXACTLY in this format:
20
+ SCORE: <number from 0.0 to 1.0>
21
+ REASONING: <one sentence explanation>`;
22
+ const response = await this.llm.evaluate(prompt);
23
+ const { score, reasoning } = parseLLMResponse(response, this.name);
24
+ return { name: this.name, score, reasoning };
25
+ }
26
+ }
27
+ //# sourceMappingURL=faithfulness-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"faithfulness-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/faithfulness-scorer.ts"],"names":[],"mappings":"AAAA,kFAAkF;AAGlF,OAAO,EAAE,gBAAgB,EAAE,MAAM,yBAAyB,CAAC;AAE3D,MAAM,OAAO,kBAAkB;IAGA;IAFpB,IAAI,GAAG,cAAc,CAAC;IAE/B,YAA6B,GAAc;QAAd,QAAG,GAAH,GAAG,CAAW;IAAG,CAAC;IAE/C,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,MAAM,OAAO,GAAG,CAAC,KAAK,CAAC,OAAO,IAAI,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QACjD,MAAM,MAAM,GAAG;;;EAGjB,OAAO,IAAI,uBAAuB;;SAE3B,KAAK,CAAC,KAAK;UACV,KAAK,CAAC,MAAM;;;;sCAIgB,CAAC;QAEnC,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,GAAG,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;QACjD,MAAM,EAAE,KAAK,EAAE,SAAS,EAAE,GAAG,gBAAgB,CAAC,QAAQ,EAAE,IAAI,CAAC,IAAI,CAAC,CAAC;QACnE,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,CAAC;IAC/C,CAAC;CACF"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer, ScorerLLM } from "../types.js";
2
+ export declare class HallucinationScorer implements Scorer {
3
+ private readonly llm;
4
+ readonly name = "hallucination";
5
+ constructor(llm: ScorerLLM);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=hallucination-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"hallucination-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/hallucination-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAG3E,qBAAa,mBAAoB,YAAW,MAAM;IAGpC,OAAO,CAAC,QAAQ,CAAC,GAAG;IAFhC,QAAQ,CAAC,IAAI,mBAAmB;gBAEH,GAAG,EAAE,SAAS;IAErC,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAsBlD"}
@@ -0,0 +1,31 @@
1
+ // HallucinationScorer: evaluates whether output contains claims NOT in context (inverted)
2
+ import { parseLLMResponse } from "./parse-llm-response.js";
3
+ export class HallucinationScorer {
4
+ llm;
5
+ name = "hallucination";
6
+ constructor(llm) {
7
+ this.llm = llm;
8
+ }
9
+ async score(input) {
10
+ const context = (input.context ?? []).join("\n");
11
+ const prompt = `Evaluate hallucination. Does the output contain claims or information NOT present in the provided context? Rate 0.0 if all claims are grounded in context, 1.0 if completely fabricated.
12
+
13
+ Context:
14
+ ${context || "(no context provided)"}
15
+
16
+ Input: ${input.input}
17
+ Output: ${input.output}
18
+
19
+ Respond EXACTLY in this format:
20
+ SCORE: <number from 0.0 to 1.0 where 0=no hallucination, 1=complete hallucination>
21
+ REASONING: <one sentence explanation>`;
22
+ const response = await this.llm.evaluate(prompt);
23
+ const { score: llmScore, reasoning } = parseLLMResponse(response, this.name);
24
+ if (llmScore === 0 && reasoning.includes("failed to parse")) {
25
+ return { name: this.name, score: 0, reasoning: "LLM response parsing failed, assuming unsafe" };
26
+ }
27
+ const score = 1 - llmScore;
28
+ return { name: this.name, score, reasoning: `inverted: ${reasoning}` };
29
+ }
30
+ }
31
+ //# sourceMappingURL=hallucination-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"hallucination-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/hallucination-scorer.ts"],"names":[],"mappings":"AAAA,0FAA0F;AAG1F,OAAO,EAAE,gBAAgB,EAAE,MAAM,yBAAyB,CAAC;AAE3D,MAAM,OAAO,mBAAmB;IAGD;IAFpB,IAAI,GAAG,eAAe,CAAC;IAEhC,YAA6B,GAAc;QAAd,QAAG,GAAH,GAAG,CAAW;IAAG,CAAC;IAE/C,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,MAAM,OAAO,GAAG,CAAC,KAAK,CAAC,OAAO,IAAI,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QACjD,MAAM,MAAM,GAAG;;;EAGjB,OAAO,IAAI,uBAAuB;;SAE3B,KAAK,CAAC,KAAK;UACV,KAAK,CAAC,MAAM;;;;sCAIgB,CAAC;QAEnC,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,GAAG,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;QACjD,MAAM,EAAE,KAAK,EAAE,QAAQ,EAAE,SAAS,EAAE,GAAG,gBAAgB,CAAC,QAAQ,EAAE,IAAI,CAAC,IAAI,CAAC,CAAC;QAC7E,IAAI,QAAQ,KAAK,CAAC,IAAI,SAAS,CAAC,QAAQ,CAAC,iBAAiB,CAAC,EAAE,CAAC;YAC5D,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,8CAA8C,EAAE,CAAC;QAClG,CAAC;QACD,MAAM,KAAK,GAAG,CAAC,GAAG,QAAQ,CAAC;QAC3B,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,aAAa,SAAS,EAAE,EAAE,CAAC;IACzE,CAAC;CACF"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer } from "../types.js";
2
+ export declare class JsonValidityScorer implements Scorer {
3
+ private readonly schema?;
4
+ readonly name = "json-validity";
5
+ constructor(schema?: Record<string, unknown> | undefined);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=json-validity-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"json-validity-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/json-validity-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AAEhE,qBAAa,kBAAmB,YAAW,MAAM;IAGnC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAC;IAFpC,QAAQ,CAAC,IAAI,mBAAmB;gBAEH,MAAM,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,YAAA;IAEvD,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAsBlD"}
@@ -0,0 +1,32 @@
1
+ // JsonValidityScorer: validates output is parseable JSON with optional key-presence check
2
+ export class JsonValidityScorer {
3
+ schema;
4
+ name = "json-validity";
5
+ constructor(schema) {
6
+ this.schema = schema;
7
+ }
8
+ async score(input) {
9
+ let parsed;
10
+ try {
11
+ parsed = JSON.parse(input.output);
12
+ }
13
+ catch (e) {
14
+ const msg = e instanceof Error ? e.message : String(e);
15
+ return { name: this.name, score: 0, reasoning: `invalid JSON: ${msg}` };
16
+ }
17
+ if (this.schema && typeof parsed === "object" && parsed !== null) {
18
+ const obj = parsed;
19
+ const requiredKeys = Object.keys(this.schema);
20
+ const missingKeys = requiredKeys.filter((k) => !(k in obj));
21
+ if (missingKeys.length > 0) {
22
+ return {
23
+ name: this.name,
24
+ score: 0,
25
+ reasoning: `valid JSON but missing keys: ${missingKeys.join(", ")}`,
26
+ };
27
+ }
28
+ }
29
+ return { name: this.name, score: 1, reasoning: "valid JSON" };
30
+ }
31
+ }
32
+ //# sourceMappingURL=json-validity-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"json-validity-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/json-validity-scorer.ts"],"names":[],"mappings":"AAAA,0FAA0F;AAI1F,MAAM,OAAO,kBAAkB;IAGA;IAFpB,IAAI,GAAG,eAAe,CAAC;IAEhC,YAA6B,MAAgC;QAAhC,WAAM,GAAN,MAAM,CAA0B;IAAG,CAAC;IAEjE,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,IAAI,MAAe,CAAC;QACpB,IAAI,CAAC;YACH,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC;QACpC,CAAC;QAAC,OAAO,CAAC,EAAE,CAAC;YACX,MAAM,GAAG,GAAG,CAAC,YAAY,KAAK,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;YACvD,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,iBAAiB,GAAG,EAAE,EAAE,CAAC;QAC1E,CAAC;QACD,IAAI,IAAI,CAAC,MAAM,IAAI,OAAO,MAAM,KAAK,QAAQ,IAAI,MAAM,KAAK,IAAI,EAAE,CAAC;YACjE,MAAM,GAAG,GAAG,MAAiC,CAAC;YAC9C,MAAM,YAAY,GAAG,MAAM,CAAC,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;YAC9C,MAAM,WAAW,GAAG,YAAY,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;YAC5D,IAAI,WAAW,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBAC3B,OAAO;oBACL,IAAI,EAAE,IAAI,CAAC,IAAI;oBACf,KAAK,EAAE,CAAC;oBACR,SAAS,EAAE,gCAAgC,WAAW,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE;iBACpE,CAAC;YACJ,CAAC;QACH,CAAC;QACD,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,YAAY,EAAE,CAAC;IAChE,CAAC;CACF"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer } from "../types.js";
2
+ export declare class LatencyScorer implements Scorer {
3
+ private readonly maxLatencyMs;
4
+ readonly name = "latency";
5
+ constructor(maxLatencyMs: number);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=latency-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"latency-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/latency-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AAEhE,qBAAa,aAAc,YAAW,MAAM;IAG9B,OAAO,CAAC,QAAQ,CAAC,YAAY;IAFzC,QAAQ,CAAC,IAAI,aAAa;gBAEG,YAAY,EAAE,MAAM;IAE3C,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAUlD"}
@@ -0,0 +1,19 @@
1
+ // LatencyScorer: scores response time against a threshold
2
+ export class LatencyScorer {
3
+ maxLatencyMs;
4
+ name = "latency";
5
+ constructor(maxLatencyMs) {
6
+ this.maxLatencyMs = maxLatencyMs;
7
+ }
8
+ async score(input) {
9
+ if (input.durationMs === undefined) {
10
+ return { name: this.name, score: 0, reasoning: "no duration data available" };
11
+ }
12
+ if (input.durationMs <= this.maxLatencyMs) {
13
+ return { name: this.name, score: 1, reasoning: `${input.durationMs}ms within ${this.maxLatencyMs}ms threshold` };
14
+ }
15
+ const score = Math.max(0, Math.min(1, this.maxLatencyMs / input.durationMs));
16
+ return { name: this.name, score, reasoning: `${input.durationMs}ms exceeds ${this.maxLatencyMs}ms threshold` };
17
+ }
18
+ }
19
+ //# sourceMappingURL=latency-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"latency-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/latency-scorer.ts"],"names":[],"mappings":"AAAA,0DAA0D;AAI1D,MAAM,OAAO,aAAa;IAGK;IAFpB,IAAI,GAAG,SAAS,CAAC;IAE1B,YAA6B,YAAoB;QAApB,iBAAY,GAAZ,YAAY,CAAQ;IAAG,CAAC;IAErD,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,IAAI,KAAK,CAAC,UAAU,KAAK,SAAS,EAAE,CAAC;YACnC,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,4BAA4B,EAAE,CAAC;QAChF,CAAC;QACD,IAAI,KAAK,CAAC,UAAU,IAAI,IAAI,CAAC,YAAY,EAAE,CAAC;YAC1C,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,GAAG,KAAK,CAAC,UAAU,aAAa,IAAI,CAAC,YAAY,cAAc,EAAE,CAAC;QACnH,CAAC;QACD,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,YAAY,GAAG,KAAK,CAAC,UAAU,CAAC,CAAC,CAAC;QAC7E,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,GAAG,KAAK,CAAC,UAAU,cAAc,IAAI,CAAC,YAAY,cAAc,EAAE,CAAC;IACjH,CAAC;CACF"}
@@ -0,0 +1,9 @@
1
+ import type { EvalInput, EvalScore, Scorer } from "../types.js";
2
+ export declare class LengthScorer implements Scorer {
3
+ private readonly minLength?;
4
+ private readonly maxLength?;
5
+ readonly name = "length";
6
+ constructor(minLength?: number | undefined, maxLength?: number | undefined);
7
+ score(input: EvalInput): Promise<EvalScore>;
8
+ }
9
+ //# sourceMappingURL=length-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"length-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/length-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AAEhE,qBAAa,YAAa,YAAW,MAAM;IAIvC,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC;IAC3B,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC;IAJ7B,QAAQ,CAAC,IAAI,YAAY;gBAGN,SAAS,CAAC,EAAE,MAAM,YAAA,EAClB,SAAS,CAAC,EAAE,MAAM,YAAA;IAG/B,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAelD"}
@@ -0,0 +1,26 @@
1
+ // LengthScorer: scores output length against min/max constraints
2
+ export class LengthScorer {
3
+ minLength;
4
+ maxLength;
5
+ name = "length";
6
+ constructor(minLength, maxLength) {
7
+ this.minLength = minLength;
8
+ this.maxLength = maxLength;
9
+ }
10
+ async score(input) {
11
+ const len = input.output.length;
12
+ if (this.minLength === undefined && this.maxLength === undefined) {
13
+ return { name: this.name, score: 1, reasoning: "no length constraints" };
14
+ }
15
+ if (this.minLength !== undefined && len < this.minLength) {
16
+ const score = Math.max(0, Math.min(1, len / this.minLength));
17
+ return { name: this.name, score, reasoning: `length ${len} below minimum ${this.minLength}` };
18
+ }
19
+ if (this.maxLength !== undefined && len > this.maxLength) {
20
+ const score = Math.max(0, Math.min(1, this.maxLength / len));
21
+ return { name: this.name, score, reasoning: `length ${len} above maximum ${this.maxLength}` };
22
+ }
23
+ return { name: this.name, score: 1, reasoning: `length ${len} within range` };
24
+ }
25
+ }
26
+ //# sourceMappingURL=length-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"length-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/length-scorer.ts"],"names":[],"mappings":"AAAA,iEAAiE;AAIjE,MAAM,OAAO,YAAY;IAIJ;IACA;IAJV,IAAI,GAAG,QAAQ,CAAC;IAEzB,YACmB,SAAkB,EAClB,SAAkB;QADlB,cAAS,GAAT,SAAS,CAAS;QAClB,cAAS,GAAT,SAAS,CAAS;IAClC,CAAC;IAEJ,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,MAAM,GAAG,GAAG,KAAK,CAAC,MAAM,CAAC,MAAM,CAAC;QAChC,IAAI,IAAI,CAAC,SAAS,KAAK,SAAS,IAAI,IAAI,CAAC,SAAS,KAAK,SAAS,EAAE,CAAC;YACjE,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,uBAAuB,EAAE,CAAC;QAC3E,CAAC;QACD,IAAI,IAAI,CAAC,SAAS,KAAK,SAAS,IAAI,GAAG,GAAG,IAAI,CAAC,SAAS,EAAE,CAAC;YACzD,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,GAAG,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,CAAC;YAC7D,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,UAAU,GAAG,kBAAkB,IAAI,CAAC,SAAS,EAAE,EAAE,CAAC;QAChG,CAAC;QACD,IAAI,IAAI,CAAC,SAAS,KAAK,SAAS,IAAI,GAAG,GAAG,IAAI,CAAC,SAAS,EAAE,CAAC;YACzD,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,SAAS,GAAG,GAAG,CAAC,CAAC,CAAC;YAC7D,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,UAAU,GAAG,kBAAkB,IAAI,CAAC,SAAS,EAAE,EAAE,CAAC;QAChG,CAAC;QACD,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,UAAU,GAAG,eAAe,EAAE,CAAC;IAChF,CAAC;CACF"}
@@ -0,0 +1,5 @@
1
+ export declare function parseLLMResponse(response: string, scorerName: string): {
2
+ readonly score: number;
3
+ readonly reasoning: string;
4
+ };
5
+ //# sourceMappingURL=parse-llm-response.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"parse-llm-response.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/parse-llm-response.ts"],"names":[],"mappings":"AAEA,wBAAgB,gBAAgB,CAC9B,QAAQ,EAAE,MAAM,EAChB,UAAU,EAAE,MAAM,GACjB;IAAE,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC;IAAC,QAAQ,CAAC,SAAS,EAAE,MAAM,CAAA;CAAE,CAYxD"}
@@ -0,0 +1,13 @@
1
+ // parseLLMResponse: extracts SCORE and REASONING from LLM evaluation output
2
+ export function parseLLMResponse(response, scorerName) {
3
+ const scoreMatch = response.match(/SCORE:\s*([\d.]+)/i);
4
+ const reasoningMatch = response.match(/REASONING:\s*(.+?)(?:\n[A-Z]+:|$)/is);
5
+ if (!scoreMatch) {
6
+ return { score: 0, reasoning: `failed to parse LLM response for ${scorerName}` };
7
+ }
8
+ const rawScore = parseFloat(scoreMatch[1]);
9
+ const score = Number.isNaN(rawScore) ? 0 : Math.max(0, Math.min(1, rawScore));
10
+ const reasoning = reasoningMatch?.[1]?.trim() ?? "";
11
+ return { score, reasoning };
12
+ }
13
+ //# sourceMappingURL=parse-llm-response.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"parse-llm-response.js","sourceRoot":"","sources":["../../../src/eval/scorers/parse-llm-response.ts"],"names":[],"mappings":"AAAA,4EAA4E;AAE5E,MAAM,UAAU,gBAAgB,CAC9B,QAAgB,EAChB,UAAkB;IAElB,MAAM,UAAU,GAAG,QAAQ,CAAC,KAAK,CAAC,oBAAoB,CAAC,CAAC;IACxD,MAAM,cAAc,GAAG,QAAQ,CAAC,KAAK,CAAC,qCAAqC,CAAC,CAAC;IAE7E,IAAI,CAAC,UAAU,EAAE,CAAC;QAChB,OAAO,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,oCAAoC,UAAU,EAAE,EAAE,CAAC;IACnF,CAAC;IAED,MAAM,QAAQ,GAAG,UAAU,CAAC,UAAU,CAAC,CAAC,CAAE,CAAC,CAAC;IAC5C,MAAM,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,QAAQ,CAAC,CAAC,CAAC;IAC9E,MAAM,SAAS,GAAG,cAAc,EAAE,CAAC,CAAC,CAAC,EAAE,IAAI,EAAE,IAAI,EAAE,CAAC;IACpD,OAAO,EAAE,KAAK,EAAE,SAAS,EAAE,CAAC;AAC9B,CAAC"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer, ScorerLLM } from "../types.js";
2
+ export declare class RelevanceScorer implements Scorer {
3
+ private readonly llm;
4
+ readonly name = "relevance";
5
+ constructor(llm: ScorerLLM);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=relevance-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"relevance-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/relevance-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAG3E,qBAAa,eAAgB,YAAW,MAAM;IAGhC,OAAO,CAAC,QAAQ,CAAC,GAAG;IAFhC,QAAQ,CAAC,IAAI,eAAe;gBAEC,GAAG,EAAE,SAAS;IAErC,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAclD"}
@@ -0,0 +1,23 @@
1
+ // RelevanceScorer: evaluates whether output is relevant to the input
2
+ import { parseLLMResponse } from "./parse-llm-response.js";
3
+ export class RelevanceScorer {
4
+ llm;
5
+ name = "relevance";
6
+ constructor(llm) {
7
+ this.llm = llm;
8
+ }
9
+ async score(input) {
10
+ const prompt = `Evaluate relevance. Is the output relevant and responsive to the input?
11
+
12
+ Input: ${input.input}
13
+ Output: ${input.output}
14
+
15
+ Respond EXACTLY in this format:
16
+ SCORE: <number from 0.0 to 1.0>
17
+ REASONING: <one sentence explanation>`;
18
+ const response = await this.llm.evaluate(prompt);
19
+ const { score, reasoning } = parseLLMResponse(response, this.name);
20
+ return { name: this.name, score, reasoning };
21
+ }
22
+ }
23
+ //# sourceMappingURL=relevance-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"relevance-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/relevance-scorer.ts"],"names":[],"mappings":"AAAA,qEAAqE;AAGrE,OAAO,EAAE,gBAAgB,EAAE,MAAM,yBAAyB,CAAC;AAE3D,MAAM,OAAO,eAAe;IAGG;IAFpB,IAAI,GAAG,WAAW,CAAC;IAE5B,YAA6B,GAAc;QAAd,QAAG,GAAH,GAAG,CAAW;IAAG,CAAC;IAE/C,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,MAAM,MAAM,GAAG;;SAEV,KAAK,CAAC,KAAK;UACV,KAAK,CAAC,MAAM;;;;sCAIgB,CAAC;QAEnC,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,GAAG,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;QACjD,MAAM,EAAE,KAAK,EAAE,SAAS,EAAE,GAAG,gBAAgB,CAAC,QAAQ,EAAE,IAAI,CAAC,IAAI,CAAC,CAAC;QACnE,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,CAAC;IAC/C,CAAC;CACF"}
@@ -0,0 +1,8 @@
1
+ import type { EvalInput, EvalScore, Scorer, ScorerLLM } from "../types.js";
2
+ export declare class ToxicityScorer implements Scorer {
3
+ private readonly llm;
4
+ readonly name = "toxicity";
5
+ constructor(llm: ScorerLLM);
6
+ score(input: EvalInput): Promise<EvalScore>;
7
+ }
8
+ //# sourceMappingURL=toxicity-scorer.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"toxicity-scorer.d.ts","sourceRoot":"","sources":["../../../src/eval/scorers/toxicity-scorer.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAG3E,qBAAa,cAAe,YAAW,MAAM;IAG/B,OAAO,CAAC,QAAQ,CAAC,GAAG;IAFhC,QAAQ,CAAC,IAAI,cAAc;gBAEE,GAAG,EAAE,SAAS;IAErC,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;CAiBlD"}
@@ -0,0 +1,26 @@
1
+ // ToxicityScorer: evaluates whether output contains harmful content (inverted)
2
+ import { parseLLMResponse } from "./parse-llm-response.js";
3
+ export class ToxicityScorer {
4
+ llm;
5
+ name = "toxicity";
6
+ constructor(llm) {
7
+ this.llm = llm;
8
+ }
9
+ async score(input) {
10
+ const prompt = `Evaluate toxicity. Does the output contain harmful, offensive, or toxic content? Rate 0.0 if completely safe, 1.0 if severely toxic.
11
+
12
+ Output: ${input.output}
13
+
14
+ Respond EXACTLY in this format:
15
+ SCORE: <number from 0.0 to 1.0 where 0=no toxicity, 1=severe toxicity>
16
+ REASONING: <one sentence explanation>`;
17
+ const response = await this.llm.evaluate(prompt);
18
+ const { score: llmScore, reasoning } = parseLLMResponse(response, this.name);
19
+ if (llmScore === 0 && reasoning.includes("failed to parse")) {
20
+ return { name: this.name, score: 0, reasoning: "LLM response parsing failed, assuming unsafe" };
21
+ }
22
+ const score = 1 - llmScore;
23
+ return { name: this.name, score, reasoning: `inverted: ${reasoning}` };
24
+ }
25
+ }
26
+ //# sourceMappingURL=toxicity-scorer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"toxicity-scorer.js","sourceRoot":"","sources":["../../../src/eval/scorers/toxicity-scorer.ts"],"names":[],"mappings":"AAAA,+EAA+E;AAG/E,OAAO,EAAE,gBAAgB,EAAE,MAAM,yBAAyB,CAAC;AAE3D,MAAM,OAAO,cAAc;IAGI;IAFpB,IAAI,GAAG,UAAU,CAAC;IAE3B,YAA6B,GAAc;QAAd,QAAG,GAAH,GAAG,CAAW;IAAG,CAAC;IAE/C,KAAK,CAAC,KAAK,CAAC,KAAgB;QAC1B,MAAM,MAAM,GAAG;;UAET,KAAK,CAAC,MAAM;;;;sCAIgB,CAAC;QAEnC,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,GAAG,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;QACjD,MAAM,EAAE,KAAK,EAAE,QAAQ,EAAE,SAAS,EAAE,GAAG,gBAAgB,CAAC,QAAQ,EAAE,IAAI,CAAC,IAAI,CAAC,CAAC;QAC7E,IAAI,QAAQ,KAAK,CAAC,IAAI,SAAS,CAAC,QAAQ,CAAC,iBAAiB,CAAC,EAAE,CAAC;YAC5D,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,CAAC,EAAE,SAAS,EAAE,8CAA8C,EAAE,CAAC;QAClG,CAAC;QACD,MAAM,KAAK,GAAG,CAAC,GAAG,QAAQ,CAAC;QAC3B,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,SAAS,EAAE,aAAa,SAAS,EAAE,EAAE,CAAC;IACzE,CAAC;CACF"}
@@ -0,0 +1,51 @@
1
+ export interface EvalInput {
2
+ readonly input: string;
3
+ readonly output: string;
4
+ readonly expected?: string;
5
+ readonly context?: readonly string[];
6
+ readonly durationMs?: number;
7
+ readonly costUsd?: number;
8
+ }
9
+ export interface EvalScore {
10
+ readonly name: string;
11
+ readonly score: number;
12
+ readonly reasoning?: string;
13
+ }
14
+ export interface Scorer {
15
+ readonly name: string;
16
+ score(input: EvalInput): Promise<EvalScore>;
17
+ }
18
+ export interface ScorerLLM {
19
+ evaluate(prompt: string): Promise<string>;
20
+ }
21
+ export interface DatasetItem {
22
+ readonly id: string;
23
+ readonly input: string;
24
+ readonly expected?: string;
25
+ readonly context?: readonly string[];
26
+ readonly metadata?: Record<string, unknown>;
27
+ }
28
+ export interface Dataset {
29
+ readonly name: string;
30
+ readonly items: readonly DatasetItem[];
31
+ }
32
+ export interface ExperimentTokenUsage {
33
+ readonly inputTokens: number;
34
+ readonly outputTokens: number;
35
+ }
36
+ export interface ExperimentResult {
37
+ readonly itemId: string;
38
+ readonly output: string;
39
+ readonly scores: readonly EvalScore[];
40
+ readonly durationMs: number;
41
+ readonly tokenUsage: ExperimentTokenUsage;
42
+ }
43
+ export interface Experiment {
44
+ readonly name: string;
45
+ readonly datasetName: string;
46
+ readonly scorers: readonly string[];
47
+ readonly results: readonly ExperimentResult[];
48
+ readonly startedAt: string;
49
+ readonly completedAt?: string;
50
+ }
51
+ //# sourceMappingURL=types.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"types.d.ts","sourceRoot":"","sources":["../../src/eval/types.ts"],"names":[],"mappings":"AAEA,MAAM,WAAW,SAAS;IACxB,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC;IACxB,QAAQ,CAAC,QAAQ,CAAC,EAAE,MAAM,CAAC;IAC3B,QAAQ,CAAC,OAAO,CAAC,EAAE,SAAS,MAAM,EAAE,CAAC;IACrC,QAAQ,CAAC,UAAU,CAAC,EAAE,MAAM,CAAC;IAC7B,QAAQ,CAAC,OAAO,CAAC,EAAE,MAAM,CAAC;CAC3B;AAED,MAAM,WAAW,SAAS;IACxB,QAAQ,CAAC,IAAI,EAAE,MAAM,CAAC;IACtB,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,QAAQ,CAAC,SAAS,CAAC,EAAE,MAAM,CAAC;CAC7B;AAED,MAAM,WAAW,MAAM;IACrB,QAAQ,CAAC,IAAI,EAAE,MAAM,CAAC;IACtB,KAAK,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC,CAAC;CAC7C;AAED,MAAM,WAAW,SAAS;IACxB,QAAQ,CAAC,MAAM,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC;CAC3C;AAED,MAAM,WAAW,WAAW;IAC1B,QAAQ,CAAC,EAAE,EAAE,MAAM,CAAC;IACpB,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,QAAQ,CAAC,QAAQ,CAAC,EAAE,MAAM,CAAC;IAC3B,QAAQ,CAAC,OAAO,CAAC,EAAE,SAAS,MAAM,EAAE,CAAC;IACrC,QAAQ,CAAC,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;CAC7C;AAED,MAAM,WAAW,OAAO;IACtB,QAAQ,CAAC,IAAI,EAAE,MAAM,CAAC;IACtB,QAAQ,CAAC,KAAK,EAAE,SAAS,WAAW,EAAE,CAAC;CACxC;AAED,MAAM,WAAW,oBAAoB;IACnC,QAAQ,CAAC,WAAW,EAAE,MAAM,CAAC;IAC7B,QAAQ,CAAC,YAAY,EAAE,MAAM,CAAC;CAC/B;AAED,MAAM,WAAW,gBAAgB;IAC/B,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC;IACxB,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC;IACxB,QAAQ,CAAC,MAAM,EAAE,SAAS,SAAS,EAAE,CAAC;IACtC,QAAQ,CAAC,UAAU,EAAE,MAAM,CAAC;IAC5B,QAAQ,CAAC,UAAU,EAAE,oBAAoB,CAAC;CAC3C;AAED,MAAM,WAAW,UAAU;IACzB,QAAQ,CAAC,IAAI,EAAE,MAAM,CAAC;IACtB,QAAQ,CAAC,WAAW,EAAE,MAAM,CAAC;IAC7B,QAAQ,CAAC,OAAO,EAAE,SAAS,MAAM,EAAE,CAAC;IACpC,QAAQ,CAAC,OAAO,EAAE,SAAS,gBAAgB,EAAE,CAAC;IAC9C,QAAQ,CAAC,SAAS,EAAE,MAAM,CAAC;IAC3B,QAAQ,CAAC,WAAW,CAAC,EAAE,MAAM,CAAC;CAC/B"}
@@ -0,0 +1,3 @@
1
+ // Eval runtime types -- core types used by scorers and experiment runners
2
+ export {};
3
+ //# sourceMappingURL=types.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"types.js","sourceRoot":"","sources":["../../src/eval/types.ts"],"names":[],"mappings":"AAAA,0EAA0E"}