cognitive-core 0.0.2 → 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (329) hide show
  1. package/README.md +302 -116
  2. package/SKILL.md +193 -0
  3. package/dist/agents/index.d.ts +3 -0
  4. package/dist/agents/index.d.ts.map +1 -0
  5. package/dist/agents/index.js +5 -0
  6. package/dist/agents/index.js.map +1 -0
  7. package/dist/agents/mock-provider.d.ts +23 -0
  8. package/dist/agents/mock-provider.d.ts.map +1 -0
  9. package/dist/agents/mock-provider.js +71 -0
  10. package/dist/agents/mock-provider.js.map +1 -0
  11. package/dist/agents/types.d.ts +98 -0
  12. package/dist/agents/types.d.ts.map +1 -0
  13. package/dist/agents/types.js +44 -0
  14. package/dist/agents/types.js.map +1 -0
  15. package/dist/atlas.d.ts +196 -0
  16. package/dist/atlas.d.ts.map +1 -0
  17. package/dist/atlas.js +373 -0
  18. package/dist/atlas.js.map +1 -0
  19. package/dist/bin/cognitive-core.d.ts +18 -0
  20. package/dist/bin/cognitive-core.d.ts.map +1 -0
  21. package/dist/bin/cognitive-core.js +419 -0
  22. package/dist/bin/cognitive-core.js.map +1 -0
  23. package/dist/embeddings/bm25.d.ts +104 -0
  24. package/dist/embeddings/bm25.d.ts.map +1 -0
  25. package/dist/embeddings/bm25.js +264 -0
  26. package/dist/embeddings/bm25.js.map +1 -0
  27. package/dist/embeddings/index.d.ts +12 -0
  28. package/dist/embeddings/index.d.ts.map +1 -0
  29. package/dist/embeddings/index.js +16 -0
  30. package/dist/embeddings/index.js.map +1 -0
  31. package/dist/embeddings/manager.d.ts +112 -0
  32. package/dist/embeddings/manager.d.ts.map +1 -0
  33. package/dist/embeddings/manager.js +215 -0
  34. package/dist/embeddings/manager.js.map +1 -0
  35. package/dist/embeddings/provider.d.ts +101 -0
  36. package/dist/embeddings/provider.d.ts.map +1 -0
  37. package/dist/embeddings/provider.js +232 -0
  38. package/dist/embeddings/provider.js.map +1 -0
  39. package/dist/embeddings/vector-store.d.ts +101 -0
  40. package/dist/embeddings/vector-store.d.ts.map +1 -0
  41. package/dist/embeddings/vector-store.js +256 -0
  42. package/dist/embeddings/vector-store.js.map +1 -0
  43. package/dist/factory.d.ts +193 -0
  44. package/dist/factory.d.ts.map +1 -0
  45. package/dist/factory.js +109 -0
  46. package/dist/factory.js.map +1 -0
  47. package/dist/index.d.ts +30 -453
  48. package/dist/index.d.ts.map +1 -0
  49. package/dist/index.js +84 -509
  50. package/dist/index.js.map +1 -0
  51. package/dist/learning/analyzer.d.ts +110 -0
  52. package/dist/learning/analyzer.d.ts.map +1 -0
  53. package/dist/learning/analyzer.js +213 -0
  54. package/dist/learning/analyzer.js.map +1 -0
  55. package/dist/learning/effectiveness.d.ts +158 -0
  56. package/dist/learning/effectiveness.d.ts.map +1 -0
  57. package/dist/learning/effectiveness.js +251 -0
  58. package/dist/learning/effectiveness.js.map +1 -0
  59. package/dist/learning/index.d.ts +8 -0
  60. package/dist/learning/index.d.ts.map +1 -0
  61. package/dist/learning/index.js +11 -0
  62. package/dist/learning/index.js.map +1 -0
  63. package/dist/learning/llm-extractor.d.ts +88 -0
  64. package/dist/learning/llm-extractor.d.ts.map +1 -0
  65. package/dist/learning/llm-extractor.js +372 -0
  66. package/dist/learning/llm-extractor.js.map +1 -0
  67. package/dist/learning/meta-learner.d.ts +80 -0
  68. package/dist/learning/meta-learner.d.ts.map +1 -0
  69. package/dist/learning/meta-learner.js +355 -0
  70. package/dist/learning/meta-learner.js.map +1 -0
  71. package/dist/learning/pipeline.d.ts +65 -0
  72. package/dist/learning/pipeline.d.ts.map +1 -0
  73. package/dist/learning/pipeline.js +170 -0
  74. package/dist/learning/pipeline.js.map +1 -0
  75. package/dist/learning/playbook-extractor.d.ts +113 -0
  76. package/dist/learning/playbook-extractor.d.ts.map +1 -0
  77. package/dist/learning/playbook-extractor.js +523 -0
  78. package/dist/learning/playbook-extractor.js.map +1 -0
  79. package/dist/learning/usage-inference.d.ts +82 -0
  80. package/dist/learning/usage-inference.d.ts.map +1 -0
  81. package/dist/learning/usage-inference.js +261 -0
  82. package/dist/learning/usage-inference.js.map +1 -0
  83. package/dist/mcp/index.d.ts +6 -0
  84. package/dist/mcp/index.d.ts.map +1 -0
  85. package/dist/mcp/index.js +6 -0
  86. package/dist/mcp/index.js.map +1 -0
  87. package/dist/mcp/playbook-server.d.ts +120 -0
  88. package/dist/mcp/playbook-server.d.ts.map +1 -0
  89. package/dist/mcp/playbook-server.js +427 -0
  90. package/dist/mcp/playbook-server.js.map +1 -0
  91. package/dist/memory/curated-loader.d.ts +62 -0
  92. package/dist/memory/curated-loader.d.ts.map +1 -0
  93. package/dist/memory/curated-loader.js +106 -0
  94. package/dist/memory/curated-loader.js.map +1 -0
  95. package/dist/memory/experience.d.ts +122 -0
  96. package/dist/memory/experience.d.ts.map +1 -0
  97. package/dist/memory/experience.js +392 -0
  98. package/dist/memory/experience.js.map +1 -0
  99. package/dist/memory/index.d.ts +6 -0
  100. package/dist/memory/index.d.ts.map +1 -0
  101. package/dist/memory/index.js +9 -0
  102. package/dist/memory/index.js.map +1 -0
  103. package/dist/memory/meta.d.ts +90 -0
  104. package/dist/memory/meta.d.ts.map +1 -0
  105. package/dist/memory/meta.js +362 -0
  106. package/dist/memory/meta.js.map +1 -0
  107. package/dist/memory/playbook.d.ts +133 -0
  108. package/dist/memory/playbook.d.ts.map +1 -0
  109. package/dist/memory/playbook.js +357 -0
  110. package/dist/memory/playbook.js.map +1 -0
  111. package/dist/memory/system.d.ts +167 -0
  112. package/dist/memory/system.d.ts.map +1 -0
  113. package/dist/memory/system.js +383 -0
  114. package/dist/memory/system.js.map +1 -0
  115. package/dist/runtime/backends/acp.d.ts +67 -0
  116. package/dist/runtime/backends/acp.d.ts.map +1 -0
  117. package/dist/runtime/backends/acp.js +290 -0
  118. package/dist/runtime/backends/acp.js.map +1 -0
  119. package/dist/runtime/backends/index.d.ts +5 -0
  120. package/dist/runtime/backends/index.d.ts.map +1 -0
  121. package/dist/runtime/backends/index.js +6 -0
  122. package/dist/runtime/backends/index.js.map +1 -0
  123. package/dist/runtime/backends/mock.d.ts +67 -0
  124. package/dist/runtime/backends/mock.d.ts.map +1 -0
  125. package/dist/runtime/backends/mock.js +153 -0
  126. package/dist/runtime/backends/mock.js.map +1 -0
  127. package/dist/runtime/backends/subprocess.d.ts +56 -0
  128. package/dist/runtime/backends/subprocess.d.ts.map +1 -0
  129. package/dist/runtime/backends/subprocess.js +260 -0
  130. package/dist/runtime/backends/subprocess.js.map +1 -0
  131. package/dist/runtime/flows/learning.d.ts +73 -0
  132. package/dist/runtime/flows/learning.d.ts.map +1 -0
  133. package/dist/runtime/flows/learning.js +116 -0
  134. package/dist/runtime/flows/learning.js.map +1 -0
  135. package/dist/runtime/flows/validation.d.ts +122 -0
  136. package/dist/runtime/flows/validation.d.ts.map +1 -0
  137. package/dist/runtime/flows/validation.js +223 -0
  138. package/dist/runtime/flows/validation.js.map +1 -0
  139. package/dist/runtime/index.d.ts +6 -0
  140. package/dist/runtime/index.d.ts.map +1 -0
  141. package/dist/runtime/index.js +8 -0
  142. package/dist/runtime/index.js.map +1 -0
  143. package/dist/runtime/manager.d.ts +116 -0
  144. package/dist/runtime/manager.d.ts.map +1 -0
  145. package/dist/runtime/manager.js +416 -0
  146. package/dist/runtime/manager.js.map +1 -0
  147. package/dist/runtime/types.d.ts +138 -0
  148. package/dist/runtime/types.d.ts.map +1 -0
  149. package/dist/runtime/types.js +2 -0
  150. package/dist/runtime/types.js.map +1 -0
  151. package/dist/search/evaluator.d.ts +102 -0
  152. package/dist/search/evaluator.d.ts.map +1 -0
  153. package/dist/search/evaluator.js +352 -0
  154. package/dist/search/evaluator.js.map +1 -0
  155. package/dist/search/index.d.ts +7 -0
  156. package/dist/search/index.d.ts.map +1 -0
  157. package/dist/search/index.js +11 -0
  158. package/dist/search/index.js.map +1 -0
  159. package/dist/search/refinement-loop.d.ts +73 -0
  160. package/dist/search/refinement-loop.d.ts.map +1 -0
  161. package/dist/search/refinement-loop.js +245 -0
  162. package/dist/search/refinement-loop.js.map +1 -0
  163. package/dist/search/refinement-types.d.ts +154 -0
  164. package/dist/search/refinement-types.d.ts.map +1 -0
  165. package/dist/search/refinement-types.js +99 -0
  166. package/dist/search/refinement-types.js.map +1 -0
  167. package/dist/search/router.d.ts +61 -0
  168. package/dist/search/router.d.ts.map +1 -0
  169. package/dist/search/router.js +197 -0
  170. package/dist/search/router.js.map +1 -0
  171. package/dist/search/solver.d.ts +75 -0
  172. package/dist/search/solver.d.ts.map +1 -0
  173. package/dist/search/solver.js +216 -0
  174. package/dist/search/solver.js.map +1 -0
  175. package/dist/search/verification-runner.d.ts +125 -0
  176. package/dist/search/verification-runner.d.ts.map +1 -0
  177. package/dist/search/verification-runner.js +440 -0
  178. package/dist/search/verification-runner.js.map +1 -0
  179. package/dist/surfacing/index.d.ts +2 -0
  180. package/dist/surfacing/index.d.ts.map +1 -0
  181. package/dist/surfacing/index.js +2 -0
  182. package/dist/surfacing/index.js.map +1 -0
  183. package/dist/surfacing/skill-library.d.ts +158 -0
  184. package/dist/surfacing/skill-library.d.ts.map +1 -0
  185. package/dist/surfacing/skill-library.js +429 -0
  186. package/dist/surfacing/skill-library.js.map +1 -0
  187. package/dist/types/config.d.ts +1113 -0
  188. package/dist/types/config.d.ts.map +1 -0
  189. package/dist/types/config.js +274 -0
  190. package/dist/types/config.js.map +1 -0
  191. package/dist/types/index.d.ts +9 -0
  192. package/dist/types/index.d.ts.map +1 -0
  193. package/dist/types/index.js +14 -0
  194. package/dist/types/index.js.map +1 -0
  195. package/dist/types/memory.d.ts +339 -0
  196. package/dist/types/memory.d.ts.map +1 -0
  197. package/dist/types/memory.js +207 -0
  198. package/dist/types/memory.js.map +1 -0
  199. package/dist/types/meta.d.ts +146 -0
  200. package/dist/types/meta.d.ts.map +1 -0
  201. package/dist/types/meta.js +51 -0
  202. package/dist/types/meta.js.map +1 -0
  203. package/dist/types/outcome.d.ts +42 -0
  204. package/dist/types/outcome.d.ts.map +1 -0
  205. package/dist/types/outcome.js +50 -0
  206. package/dist/types/outcome.js.map +1 -0
  207. package/dist/types/playbook.d.ts +119 -0
  208. package/dist/types/playbook.d.ts.map +1 -0
  209. package/dist/types/playbook.js +71 -0
  210. package/dist/types/playbook.js.map +1 -0
  211. package/dist/types/step.d.ts +44 -0
  212. package/dist/types/step.d.ts.map +1 -0
  213. package/dist/types/step.js +32 -0
  214. package/dist/types/step.js.map +1 -0
  215. package/dist/types/task.d.ts +91 -0
  216. package/dist/types/task.d.ts.map +1 -0
  217. package/dist/types/task.js +39 -0
  218. package/dist/types/task.js.map +1 -0
  219. package/dist/types/trajectory.d.ts +221 -0
  220. package/dist/types/trajectory.d.ts.map +1 -0
  221. package/dist/types/trajectory.js +60 -0
  222. package/dist/types/trajectory.js.map +1 -0
  223. package/dist/utils/index.d.ts +4 -0
  224. package/dist/utils/index.d.ts.map +1 -0
  225. package/dist/utils/index.js +4 -0
  226. package/dist/utils/index.js.map +1 -0
  227. package/dist/utils/similarity.d.ts +31 -0
  228. package/dist/utils/similarity.d.ts.map +1 -0
  229. package/dist/utils/similarity.js +107 -0
  230. package/dist/utils/similarity.js.map +1 -0
  231. package/dist/utils/storage.d.ts +106 -0
  232. package/dist/utils/storage.d.ts.map +1 -0
  233. package/dist/utils/storage.js +203 -0
  234. package/dist/utils/storage.js.map +1 -0
  235. package/dist/utils/validation.d.ts +129 -0
  236. package/dist/utils/validation.d.ts.map +1 -0
  237. package/dist/utils/validation.js +171 -0
  238. package/dist/utils/validation.js.map +1 -0
  239. package/package.json +50 -34
  240. package/scripts/migrate-to-playbooks.ts +307 -0
  241. package/src/agents/index.ts +14 -0
  242. package/src/agents/mock-provider.ts +93 -0
  243. package/src/agents/types.ts +137 -0
  244. package/src/atlas.ts +560 -0
  245. package/src/bin/cognitive-core.ts +470 -0
  246. package/src/embeddings/bm25.ts +337 -0
  247. package/src/embeddings/index.ts +39 -0
  248. package/src/embeddings/manager.ts +288 -0
  249. package/src/embeddings/provider.ts +311 -0
  250. package/src/embeddings/vector-store.ts +353 -0
  251. package/src/factory.ts +263 -0
  252. package/src/index.ts +246 -0
  253. package/src/learning/analyzer.ts +335 -0
  254. package/src/learning/effectiveness.ts +428 -0
  255. package/src/learning/index.ts +58 -0
  256. package/src/learning/llm-extractor.ts +542 -0
  257. package/src/learning/meta-learner.ts +516 -0
  258. package/src/learning/pipeline.ts +244 -0
  259. package/src/learning/playbook-extractor.ts +702 -0
  260. package/src/learning/usage-inference.ts +372 -0
  261. package/src/mcp/index.ts +12 -0
  262. package/src/mcp/playbook-server.ts +565 -0
  263. package/src/memory/curated-loader.ts +160 -0
  264. package/src/memory/experience.ts +515 -0
  265. package/src/memory/index.ts +27 -0
  266. package/src/memory/meta.ts +506 -0
  267. package/src/memory/playbook.ts +493 -0
  268. package/src/memory/system.ts +551 -0
  269. package/src/runtime/backends/acp.ts +378 -0
  270. package/src/runtime/backends/index.ts +24 -0
  271. package/src/runtime/backends/mock.ts +218 -0
  272. package/src/runtime/backends/subprocess.ts +356 -0
  273. package/src/runtime/flows/learning.ts +183 -0
  274. package/src/runtime/flows/validation.ts +381 -0
  275. package/src/runtime/index.ts +53 -0
  276. package/src/runtime/manager.ts +541 -0
  277. package/src/runtime/types.ts +157 -0
  278. package/src/search/evaluator.ts +474 -0
  279. package/src/search/index.ts +59 -0
  280. package/src/search/refinement-loop.ts +363 -0
  281. package/src/search/refinement-types.ts +159 -0
  282. package/src/search/router.ts +261 -0
  283. package/src/search/solver.ts +303 -0
  284. package/src/search/verification-runner.ts +570 -0
  285. package/src/surfacing/index.ts +6 -0
  286. package/src/surfacing/skill-library.ts +594 -0
  287. package/src/types/config.ts +333 -0
  288. package/src/types/index.ts +130 -0
  289. package/src/types/memory.ts +270 -0
  290. package/src/types/meta.ts +218 -0
  291. package/src/types/outcome.ts +66 -0
  292. package/src/types/playbook.ts +196 -0
  293. package/src/types/step.ts +40 -0
  294. package/src/types/task.ts +52 -0
  295. package/src/types/trajectory.ts +80 -0
  296. package/src/utils/index.ts +38 -0
  297. package/src/utils/similarity.ts +139 -0
  298. package/src/utils/storage.ts +249 -0
  299. package/src/utils/validation.ts +286 -0
  300. package/tests/embeddings/bm25.test.ts +130 -0
  301. package/tests/embeddings/manager.test.ts +205 -0
  302. package/tests/integration/atlas.test.ts +266 -0
  303. package/tests/integration/e2e.test.ts +929 -0
  304. package/tests/learning/analyzer.test.ts +426 -0
  305. package/tests/learning/effectiveness.test.ts +542 -0
  306. package/tests/learning/pipeline.test.ts +176 -0
  307. package/tests/learning/playbook-extractor-provenance.test.ts +114 -0
  308. package/tests/learning/usage-inference.test.ts +254 -0
  309. package/tests/mcp/playbook-server.test.ts +252 -0
  310. package/tests/memory/experience.test.ts +198 -0
  311. package/tests/memory/playbook.test.ts +338 -0
  312. package/tests/memory/provenance.test.ts +639 -0
  313. package/tests/memory/system.test.ts +325 -0
  314. package/tests/runtime/agent-manager.test.ts +512 -0
  315. package/tests/runtime/mock-backend.test.ts +248 -0
  316. package/tests/search/refinement-loop.test.ts +468 -0
  317. package/tests/search/refinement.test.ts +267 -0
  318. package/tests/search/router.test.ts +427 -0
  319. package/tests/surfacing/skill-library.test.ts +292 -0
  320. package/tests/types/outcome.test.ts +147 -0
  321. package/tests/types/step.test.ts +133 -0
  322. package/tests/types/task.test.ts +158 -0
  323. package/tests/types/trajectory.test.ts +253 -0
  324. package/tests/utils/similarity.test.ts +188 -0
  325. package/tests/utils/validation.test.ts +252 -0
  326. package/tsconfig.json +25 -0
  327. package/vitest.config.ts +22 -0
  328. package/dist/index.d.mts +0 -466
  329. package/dist/index.mjs +0 -478
@@ -0,0 +1,223 @@
1
/**
 * Validation Flow
 * Orchestrates: Knowledge injection → Agent execution → Performance measurement
 *
 * This flow is for the "injection" direction:
 * - Test how well learning is working
 * - Compare performance with vs without knowledge
 * - Measure improvement over time
 *
 * The flow only talks to the supplied manager through two async methods,
 * `spawn(config)` (run with knowledge) and `spawnBaseline(config)` (run
 * without). From each returned result it reads `success`,
 * `metrics.totalTime` and `metrics.toolCallCount`.
 */
export class ValidationFlow {
    manager;
    config;

    /**
     * @param manager Object exposing async `spawn` and `spawnBaseline`.
     * @param _memory Unused; reserved for future memory state tracking.
     * @param config Optional overrides. Defaults: `runsPerTask: 1`,
     *   `runComparison: true`, `taskTimeout: 300000` (5 minutes).
     *   `agentType` is forwarded to the manager as-is.
     */
    constructor(manager, _memory, config) {
        this.manager = manager;
        this.config = {
            runsPerTask: 1,
            runComparison: true,
            taskTimeout: 300000, // 5 minutes
            ...config,
        };
    }

    /**
     * Execute every run needed for one task: `runsPerTask` knowledge-injected
     * runs, followed (only when `runComparison` is enabled) by the same number
     * of baseline runs. Runs are awaited one at a time, in that order.
     *
     * Shared by `validateTask` and `validate` so that baseline agents are
     * spawned exactly once per task and the aggregate comparison is computed
     * from the same baseline runs as the per-task data.
     *
     * @param task Task forwarded unchanged to the manager.
     * @returns {Promise<{results: Array, baselineResults: Array}>}
     */
    async collectRuns(task) {
        const runsPerTask = this.config.runsPerTask ?? 1;
        const spawnConfig = {
            agentType: this.config.agentType,
            task,
            timeout: this.config.taskTimeout,
            captureToolCalls: true,
        };
        const results = [];
        const baselineResults = [];
        // Run with knowledge injection
        for (let i = 0; i < runsPerTask; i++) {
            results.push(await this.manager.spawn({ ...spawnConfig }));
        }
        // Run baseline if comparison enabled
        if (this.config.runComparison) {
            for (let i = 0; i < runsPerTask; i++) {
                baselineResults.push(await this.manager.spawnBaseline({ ...spawnConfig }));
            }
        }
        return { results, baselineResults };
    }

    /**
     * Validate on a single task
     *
     * @param task Task to run.
     * @returns {Promise<{task, results, metrics, comparison}>} `comparison` is
     *   `undefined` when comparison is disabled or no baseline run happened.
     */
    async validateTask(task) {
        const { results, baselineResults } = await this.collectRuns(task);
        const metrics = this.calculateMetrics(results);
        let comparison;
        if (this.config.runComparison && baselineResults.length > 0) {
            const baselineMetrics = this.calculateMetrics(baselineResults);
            comparison = this.calculateComparison(metrics, baselineMetrics);
        }
        return { task, results, metrics, comparison };
    }

    /**
     * Validate on multiple tasks
     *
     * Tasks are processed sequentially. Per-task entries carry `task`,
     * `results` and `metrics`; the aggregate metrics and the optional
     * aggregate comparison are computed over all runs of all tasks.
     *
     * @param tasks Iterable of tasks.
     * @returns {Promise<{taskResults, aggregateMetrics, comparison}>}
     */
    async validate(tasks) {
        const taskResults = [];
        const allResults = [];
        const allBaselineResults = [];
        for (const task of tasks) {
            // One pass per task: the baseline runs gathered here feed the
            // aggregate comparison directly instead of being executed twice.
            const { results, baselineResults } = await this.collectRuns(task);
            taskResults.push({
                task,
                results,
                metrics: this.calculateMetrics(results),
            });
            allResults.push(...results);
            allBaselineResults.push(...baselineResults);
        }
        const aggregateMetrics = this.calculateMetrics(allResults);
        let comparison;
        if (this.config.runComparison && allBaselineResults.length > 0) {
            const baselineMetrics = this.calculateMetrics(allBaselineResults);
            comparison = this.calculateComparison(aggregateMetrics, baselineMetrics);
        }
        return {
            taskResults,
            aggregateMetrics,
            comparison,
        };
    }

    /**
     * Quick validation - single run per task, with comparison
     *
     * For each task the knowledge-injected run and the baseline run are
     * started together and awaited with `Promise.all`; tasks themselves are
     * processed one after another. Only the `success` flag of each run is kept.
     *
     * @param tasks Iterable of tasks.
     * @returns {Promise<{successRateWithKnowledge: number,
     *   successRateBaseline: number, improvement: number, details: Array}>}
     *   Rates are fractions in [0, 1]; both are 0 when `tasks` is empty.
     */
    async quickValidate(tasks) {
        const details = [];
        for (const task of tasks) {
            const [withKnowledge, baseline] = await Promise.all([
                this.manager.spawn({
                    agentType: this.config.agentType,
                    task,
                    timeout: this.config.taskTimeout,
                }),
                this.manager.spawnBaseline({
                    agentType: this.config.agentType,
                    task,
                    timeout: this.config.taskTimeout,
                }),
            ]);
            details.push({
                task,
                withKnowledge: withKnowledge.success,
                baseline: baseline.success,
            });
        }
        // Guard the division: with no tasks the rates would otherwise be NaN.
        const rateOf = (predicate) => details.length === 0 ? 0 : details.filter(predicate).length / details.length;
        const successRateWithKnowledge = rateOf((d) => d.withKnowledge);
        const successRateBaseline = rateOf((d) => d.baseline);
        return {
            successRateWithKnowledge,
            successRateBaseline,
            improvement: successRateWithKnowledge - successRateBaseline,
            details,
        };
    }

    /**
     * Calculate metrics from results
     *
     * @param results Array of run results (each with `success` and
     *   `metrics.totalTime` / `metrics.toolCallCount`).
     * @returns {{successRate: number, avgTime: number, avgToolCalls: number,
     *   timeStdDev: number, totalRuns: number}} All zeros for an empty array.
     *   `timeStdDev` is the population standard deviation (divides by N).
     */
    calculateMetrics(results) {
        if (results.length === 0) {
            return {
                successRate: 0,
                avgTime: 0,
                avgToolCalls: 0,
                timeStdDev: 0,
                totalRuns: 0,
            };
        }
        const successCount = results.filter((r) => r.success).length;
        const times = results.map((r) => r.metrics.totalTime);
        const toolCalls = results.map((r) => r.metrics.toolCallCount);
        const avgTime = times.reduce((a, b) => a + b, 0) / times.length;
        const avgToolCalls = toolCalls.reduce((a, b) => a + b, 0) / toolCalls.length;
        // Calculate standard deviation
        const timeVariance = times.reduce((sum, t) => sum + Math.pow(t - avgTime, 2), 0) /
            times.length;
        const timeStdDev = Math.sqrt(timeVariance);
        return {
            successRate: successCount / results.length,
            avgTime,
            avgToolCalls,
            timeStdDev,
            totalRuns: results.length,
        };
    }

    /**
     * Calculate comparison between two sets of metrics
     *
     * Percent deltas are expressed relative to the baseline and are positive
     * when the knowledge-injected runs used less time / fewer tool calls;
     * they fall back to 0 when the baseline average is not positive.
     *
     * @param withKnowledge Metrics object from `calculateMetrics`.
     * @param baseline Metrics object from `calculateMetrics`.
     * @returns {{withKnowledge, baseline, improvement: {successRateDelta: number,
     *   timeDeltaPercent: number, toolCallDeltaPercent: number,
     *   isSignificant: boolean}}}
     */
    calculateComparison(withKnowledge, baseline) {
        const successRateDelta = withKnowledge.successRate - baseline.successRate;
        const timeDeltaPercent = baseline.avgTime > 0
            ? ((baseline.avgTime - withKnowledge.avgTime) / baseline.avgTime) * 100
            : 0;
        const toolCallDeltaPercent = baseline.avgToolCalls > 0
            ? ((baseline.avgToolCalls - withKnowledge.avgToolCalls) /
                baseline.avgToolCalls) *
                100
            : 0;
        // Simple significance test (would need proper statistical test in production)
        // Using a rough heuristic: significant if improvement > 2 std devs
        // NOTE(review): with a single run per side both std devs are 0, so any
        // non-zero time difference is reported as significant.
        const isSignificant = Math.abs(withKnowledge.avgTime - baseline.avgTime) >
            2 * Math.max(withKnowledge.timeStdDev, baseline.timeStdDev);
        return {
            withKnowledge,
            baseline,
            improvement: {
                successRateDelta,
                timeDeltaPercent,
                toolCallDeltaPercent,
                isSignificant,
            },
        };
    }

    /**
     * Generate a validation report
     *
     * @param result Object shaped like the return value of `validate`.
     * @returns {string} Markdown text: aggregate metrics, an optional
     *   comparison table, then one section per task (heading is the first 50
     *   characters of `task.description` followed by `...`).
     */
    generateReport(result) {
        const lines = [
            '# Atlas Validation Report',
            '',
            '## Aggregate Metrics',
            `- Success Rate: ${(result.aggregateMetrics.successRate * 100).toFixed(1)}%`,
            `- Avg Time: ${result.aggregateMetrics.avgTime.toFixed(0)}ms`,
            `- Avg Tool Calls: ${result.aggregateMetrics.avgToolCalls.toFixed(1)}`,
            `- Total Runs: ${result.aggregateMetrics.totalRuns}`,
            '',
        ];
        if (result.comparison) {
            const c = result.comparison;
            lines.push('## Comparison (With Knowledge vs Baseline)', '', '| Metric | With Knowledge | Baseline | Improvement |', '|--------|---------------|----------|-------------|', `| Success Rate | ${(c.withKnowledge.successRate * 100).toFixed(1)}% | ${(c.baseline.successRate * 100).toFixed(1)}% | ${c.improvement.successRateDelta > 0 ? '+' : ''}${(c.improvement.successRateDelta * 100).toFixed(1)}% |`, `| Avg Time | ${c.withKnowledge.avgTime.toFixed(0)}ms | ${c.baseline.avgTime.toFixed(0)}ms | ${c.improvement.timeDeltaPercent > 0 ? '+' : ''}${c.improvement.timeDeltaPercent.toFixed(1)}% faster |`, `| Avg Tool Calls | ${c.withKnowledge.avgToolCalls.toFixed(1)} | ${c.baseline.avgToolCalls.toFixed(1)} | ${c.improvement.toolCallDeltaPercent > 0 ? '+' : ''}${c.improvement.toolCallDeltaPercent.toFixed(1)}% fewer |`, '', `Statistical Significance: ${c.improvement.isSignificant ? '✓ Yes' : '✗ No'}`, '');
        }
        lines.push('## Per-Task Results', '');
        for (const taskResult of result.taskResults) {
            lines.push(`### ${taskResult.task.description.slice(0, 50)}...`, `- Success Rate: ${(taskResult.metrics.successRate * 100).toFixed(1)}%`, `- Avg Time: ${taskResult.metrics.avgTime.toFixed(0)}ms`, '');
        }
        return lines.join('\n');
    }
}
217
/**
 * Factory for ValidationFlow.
 *
 * Forwards `manager`, `memory` and `config` unchanged to the
 * ValidationFlow constructor and hands back the new instance.
 */
export function createValidationFlow(manager, memory, config) {
    const flow = new ValidationFlow(manager, memory, config);
    return flow;
}
223
+ //# sourceMappingURL=validation.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"validation.js","sourceRoot":"","sources":["../../../src/runtime/flows/validation.ts"],"names":[],"mappings":"AAqEA;;;;;;;;GAQG;AACH,MAAM,OAAO,cAAc;IACjB,OAAO,CAAe;IACtB,MAAM,CAAuB;IAErC,YACE,OAAqB,EACrB,OAAqB,EAAE,4CAA4C;IACnE,MAA4B;QAE5B,IAAI,CAAC,OAAO,GAAG,OAAO,CAAC;QACvB,IAAI,CAAC,MAAM,GAAG;YACZ,WAAW,EAAE,CAAC;YACd,aAAa,EAAE,IAAI;YACnB,WAAW,EAAE,MAAM,EAAE,YAAY;YACjC,GAAG,MAAM;SACV,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,YAAY,CAAC,IAAU;QAM3B,MAAM,WAAW,GAAG,IAAI,CAAC,MAAM,CAAC,WAAW,IAAI,CAAC,CAAC;QACjD,MAAM,OAAO,GAAkB,EAAE,CAAC;QAClC,MAAM,eAAe,GAAkB,EAAE,CAAC;QAE1C,+BAA+B;QAC/B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,WAAW,EAAE,CAAC,EAAE,EAAE,CAAC;YACrC,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC;gBACtC,SAAS,EAAE,IAAI,CAAC,MAAM,CAAC,SAAS;gBAChC,IAAI;gBACJ,OAAO,EAAE,IAAI,CAAC,MAAM,CAAC,WAAW;gBAChC,gBAAgB,EAAE,IAAI;aACvB,CAAC,CAAC;YACH,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QACvB,CAAC;QAED,qCAAqC;QACrC,IAAI,IAAI,CAAC,MAAM,CAAC,aAAa,EAAE,CAAC;YAC9B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,WAAW,EAAE,CAAC,EAAE,EAAE,CAAC;gBACrC,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,aAAa,CAAC;oBAC9C,SAAS,EAAE,IAAI,CAAC,MAAM,CAAC,SAAS;oBAChC,IAAI;oBACJ,OAAO,EAAE,IAAI,CAAC,MAAM,CAAC,WAAW;oBAChC,gBAAgB,EAAE,IAAI;iBACvB,CAAC,CAAC;gBACH,eAAe,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;YAC/B,CAAC;QACH,CAAC;QAED,MAAM,OAAO,GAAG,IAAI,CAAC,gBAAgB,CAAC,OAAO,CAAC,CAAC;QAC/C,IAAI,UAAwC,CAAC;QAE7C,IAAI,IAAI,CAAC,MAAM,CAAC,aAAa,IAAI,eAAe,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC5D,MAAM,eAAe,GAAG,IAAI,CAAC,gBAAgB,CAAC,eAAe,CAAC,CAAC;YAC/D,UAAU,GAAG,IAAI,CAAC,mBAAmB,CAAC,OAAO,EAAE,eAAe,CAAC,CAAC;QAClE,CAAC;QAED,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE,OAAO,EAAE,UAAU,EAAE,CAAC;IAChD,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,QAAQ,CAAC,KAAa;QAC1B,MAAM,WAAW,GAAwC,EAAE,CAAC;QAC5D,MAAM,UAAU,GAAkB,EAAE,CAAC;QACrC,MAAM,kBAAkB,GAAkB,EAAE,CAAC;QAE7C,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;YACzB,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,YAAY,CAAC,IAAI,CAAC,CAAC;YAC7C,WAAW,CAAC,IAAI,CAAC;gBACf,IAAI,EAAE,MAAM,CAAC,IAAI;gBACjB,OAAO,EAAE,MAAM,CAAC,OAAO;g
BACvB,OAAO,EAAE,MAAM,CAAC,OAAO;aACxB,CAAC,CAAC;YAEH,UAAU,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,OAAO,CAAC,CAAC;YAEnC,oDAAoD;YACpD,IAAI,IAAI,CAAC,MAAM,CAAC,aAAa,EAAE,CAAC;gBAC9B,sEAAsE;gBACtE,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,CAAC,IAAI,CAAC,MAAM,CAAC,WAAW,IAAI,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;oBACxD,MAAM,cAAc,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,aAAa,CAAC;wBACtD,SAAS,EAAE,IAAI,CAAC,MAAM,CAAC,SAAS;wBAChC,IAAI;wBACJ,OAAO,EAAE,IAAI,CAAC,MAAM,CAAC,WAAW;wBAChC,gBAAgB,EAAE,IAAI;qBACvB,CAAC,CAAC;oBACH,kBAAkB,CAAC,IAAI,CAAC,cAAc,CAAC,CAAC;gBAC1C,CAAC;YACH,CAAC;QACH,CAAC;QAED,MAAM,gBAAgB,GAAG,IAAI,CAAC,gBAAgB,CAAC,UAAU,CAAC,CAAC;QAC3D,IAAI,UAAwC,CAAC;QAE7C,IAAI,IAAI,CAAC,MAAM,CAAC,aAAa,IAAI,kBAAkB,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC/D,MAAM,eAAe,GAAG,IAAI,CAAC,gBAAgB,CAAC,kBAAkB,CAAC,CAAC;YAClE,UAAU,GAAG,IAAI,CAAC,mBAAmB,CAAC,gBAAgB,EAAE,eAAe,CAAC,CAAC;QAC3E,CAAC;QAED,OAAO;YACL,WAAW;YACX,gBAAgB;YAChB,UAAU;SACX,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,aAAa,CAAC,KAAa;QAU/B,MAAM,OAAO,GAIR,EAAE,CAAC;QAER,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;YACzB,MAAM,CAAC,aAAa,EAAE,QAAQ,CAAC,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;gBAClD,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC;oBACjB,SAAS,EAAE,IAAI,CAAC,MAAM,CAAC,SAAS;oBAChC,IAAI;oBACJ,OAAO,EAAE,IAAI,CAAC,MAAM,CAAC,WAAW;iBACjC,CAAC;gBACF,IAAI,CAAC,OAAO,CAAC,aAAa,CAAC;oBACzB,SAAS,EAAE,IAAI,CAAC,MAAM,CAAC,SAAS;oBAChC,IAAI;oBACJ,OAAO,EAAE,IAAI,CAAC,MAAM,CAAC,WAAW;iBACjC,CAAC;aACH,CAAC,CAAC;YAEH,OAAO,CAAC,IAAI,CAAC;gBACX,IAAI;gBACJ,aAAa,EAAE,aAAa,CAAC,OAAO;gBACpC,QAAQ,EAAE,QAAQ,CAAC,OAAO;aAC3B,CAAC,CAAC;QACL,CAAC;QAED,MAAM,wBAAwB,GAC5B,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,aAAa,CAAC,CAAC,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;QACjE,MAAM,mBAAmB,GACvB,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;QAE5D,OAAO;YACL,wBAAwB;YACxB,mBAAmB;YACnB,WAAW,EAAE,wBAAwB,GAAG,mBAAmB;YAC3D,OAAO;SACR,CAAC;IACJ,CAAC;IAED;;OAEG;IACK,gBAAgB,CAAC,OAAsB;QAC7C,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YACzB,OAAO;gBACL,WAAW,EAAE,CAAC;gBACd,OAAO,EAAE,
CAAC;gBACV,YAAY,EAAE,CAAC;gBACf,UAAU,EAAE,CAAC;gBACb,SAAS,EAAE,CAAC;aACb,CAAC;QACJ,CAAC;QAED,MAAM,YAAY,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,MAAM,CAAC;QAC7D,MAAM,KAAK,GAAG,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,OAAO,CAAC,SAAS,CAAC,CAAC;QACtD,MAAM,SAAS,GAAG,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,OAAO,CAAC,aAAa,CAAC,CAAC;QAE9D,MAAM,OAAO,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC,GAAG,KAAK,CAAC,MAAM,CAAC;QAChE,MAAM,YAAY,GAChB,SAAS,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC,GAAG,SAAS,CAAC,MAAM,CAAC;QAE1D,+BAA+B;QAC/B,MAAM,YAAY,GAChB,KAAK,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,GAAG,OAAO,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC;YAC3D,KAAK,CAAC,MAAM,CAAC;QACf,MAAM,UAAU,GAAG,IAAI,CAAC,IAAI,CAAC,YAAY,CAAC,CAAC;QAE3C,OAAO;YACL,WAAW,EAAE,YAAY,GAAG,OAAO,CAAC,MAAM;YAC1C,OAAO;YACP,YAAY;YACZ,UAAU;YACV,SAAS,EAAE,OAAO,CAAC,MAAM;SAC1B,CAAC;IACJ,CAAC;IAED;;OAEG;IACK,mBAAmB,CACzB,aAAgC,EAChC,QAA2B;QAE3B,MAAM,gBAAgB,GACpB,aAAa,CAAC,WAAW,GAAG,QAAQ,CAAC,WAAW,CAAC;QAEnD,MAAM,gBAAgB,GACpB,QAAQ,CAAC,OAAO,GAAG,CAAC;YAClB,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,OAAO,GAAG,aAAa,CAAC,OAAO,CAAC,GAAG,QAAQ,CAAC,OAAO,CAAC,GAAG,GAAG;YACvE,CAAC,CAAC,CAAC,CAAC;QAER,MAAM,oBAAoB,GACxB,QAAQ,CAAC,YAAY,GAAG,CAAC;YACvB,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,YAAY,GAAG,aAAa,CAAC,YAAY,CAAC;gBACnD,QAAQ,CAAC,YAAY,CAAC;gBACxB,GAAG;YACL,CAAC,CAAC,CAAC,CAAC;QAER,8EAA8E;QAC9E,mEAAmE;QACnE,MAAM,aAAa,GACjB,IAAI,CAAC,GAAG,CAAC,aAAa,CAAC,OAAO,GAAG,QAAQ,CAAC,OAAO,CAAC;YAClD,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,aAAa,CAAC,UAAU,EAAE,QAAQ,CAAC,UAAU,CAAC,CAAC;QAE9D,OAAO;YACL,aAAa;YACb,QAAQ;YACR,WAAW,EAAE;gBACX,gBAAgB;gBAChB,gBAAgB;gBAChB,oBAAoB;gBACpB,aAAa;aACd;SACF,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,cAAc,CAAC,MAA4B;QACzC,MAAM,KAAK,GAAa;YACtB,2BAA2B;YAC3B,EAAE;YACF,sBAAsB;YACtB,mBAAmB,CAAC,MAAM,CAAC,gBAAgB,CAAC,WAAW,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG;YAC5E,eAAe,M
AAM,CAAC,gBAAgB,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI;YAC7D,qBAAqB,MAAM,CAAC,gBAAgB,CAAC,YAAY,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE;YACtE,iBAAiB,MAAM,CAAC,gBAAgB,CAAC,SAAS,EAAE;YACpD,EAAE;SACH,CAAC;QAEF,IAAI,MAAM,CAAC,UAAU,EAAE,CAAC;YACtB,MAAM,CAAC,GAAG,MAAM,CAAC,UAAU,CAAC;YAC5B,KAAK,CAAC,IAAI,CACR,4CAA4C,EAC5C,EAAE,EACF,sDAAsD,EACtD,qDAAqD,EACrD,oBAAoB,CAAC,CAAC,CAAC,aAAa,CAAC,WAAW,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,QAAQ,CAAC,WAAW,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,WAAW,CAAC,gBAAgB,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,GAAG,CAAC,CAAC,CAAC,WAAW,CAAC,gBAAgB,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,KAAK,EAC/N,gBAAgB,CAAC,CAAC,aAAa,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,QAAQ,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,WAAW,CAAC,gBAAgB,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,GAAG,CAAC,CAAC,WAAW,CAAC,gBAAgB,CAAC,OAAO,CAAC,CAAC,CAAC,YAAY,EACpM,sBAAsB,CAAC,CAAC,aAAa,CAAC,YAAY,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,QAAQ,CAAC,YAAY,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,WAAW,CAAC,oBAAoB,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,GAAG,CAAC,CAAC,WAAW,CAAC,oBAAoB,CAAC,OAAO,CAAC,CAAC,CAAC,WAAW,EACvN,EAAE,EACF,6BAA6B,CAAC,CAAC,WAAW,CAAC,aAAa,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,EAAE,EAC7E,EAAE,CACH,CAAC;QACJ,CAAC;QAED,KAAK,CAAC,IAAI,CACR,qBAAqB,EACrB,EAAE,CACH,CAAC;QAEF,KAAK,MAAM,UAAU,IAAI,MAAM,CAAC,WAAW,EAAE,CAAC;YAC5C,KAAK,CAAC,IAAI,CACR,OAAO,UAAU,CAAC,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,KAAK,EACpD,mBAAmB,CAAC,UAAU,CAAC,OAAO,CAAC,WAAW,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,EACvE,eAAe,UAAU,CAAC,OAAO,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI,EACxD,EAAE,CACH,CAAC;QACJ,CAAC;QAED,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAC1B,CAAC;CACF;AAED;;GAEG;AACH,MAAM,UAAU,oBAAoB,CAClC,OAAqB,EACrB,MAAoB,EACpB,MAA4B;IAE5B,OAAO,IAAI,cAAc,CAAC,OAAO,EAAE,MAAM,EAAE,MAAM,CAAC,CAAC;AACrD,CAAC"}
@@ -0,0 +1,6 @@
1
+ export type { AgentMessage, ToolCall, AgentState, AgentSession, AgentSpawnConfig, AgentResult, AgentBackend, KnowledgeInjector, TrajectoryExtractor, AgentObserverCallbacks, } from './types.js';
2
+ export { AgentManager, createAgentManager, DefaultKnowledgeInjector, DefaultTrajectoryExtractor, } from './manager.js';
3
+ export { SubprocessBackend, createSubprocessBackend, claudeCodeConfig, type SubprocessAgentConfig, MockBackend, createMockBackend, type MockAgentBehavior, ACPBackend, createACPBackend, claudeCodeACPConfig, claudeCodeDirectConfig, type ACPAgentConfig, } from './backends/index.js';
4
+ export { LearningFlow, createLearningFlow, type LearningFlowConfig, type LearningFlowResult, } from './flows/learning.js';
5
+ export { ValidationFlow, createValidationFlow, type ValidationFlowConfig, type ValidationFlowResult, type ValidationMetrics, } from './flows/validation.js';
6
+ //# sourceMappingURL=index.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/runtime/index.ts"],"names":[],"mappings":"AACA,YAAY,EACV,YAAY,EACZ,QAAQ,EACR,UAAU,EACV,YAAY,EACZ,gBAAgB,EAChB,WAAW,EACX,YAAY,EACZ,iBAAiB,EACjB,mBAAmB,EACnB,sBAAsB,GACvB,MAAM,YAAY,CAAC;AAGpB,OAAO,EACL,YAAY,EACZ,kBAAkB,EAClB,wBAAwB,EACxB,0BAA0B,GAC3B,MAAM,cAAc,CAAC;AAGtB,OAAO,EACL,iBAAiB,EACjB,uBAAuB,EACvB,gBAAgB,EAChB,KAAK,qBAAqB,EAC1B,WAAW,EACX,iBAAiB,EACjB,KAAK,iBAAiB,EACtB,UAAU,EACV,gBAAgB,EAChB,mBAAmB,EACnB,sBAAsB,EACtB,KAAK,cAAc,GACpB,MAAM,qBAAqB,CAAC;AAG7B,OAAO,EACL,YAAY,EACZ,kBAAkB,EAClB,KAAK,kBAAkB,EACvB,KAAK,kBAAkB,GACxB,MAAM,qBAAqB,CAAC;AAE7B,OAAO,EACL,cAAc,EACd,oBAAoB,EACpB,KAAK,oBAAoB,EACzB,KAAK,oBAAoB,EACzB,KAAK,iBAAiB,GACvB,MAAM,uBAAuB,CAAC"}
@@ -0,0 +1,8 @@
1
+ // Manager
2
+ export { AgentManager, createAgentManager, DefaultKnowledgeInjector, DefaultTrajectoryExtractor, } from './manager.js';
3
+ // Backends
4
+ export { SubprocessBackend, createSubprocessBackend, claudeCodeConfig, MockBackend, createMockBackend, ACPBackend, createACPBackend, claudeCodeACPConfig, claudeCodeDirectConfig, } from './backends/index.js';
5
+ // Flows
6
+ export { LearningFlow, createLearningFlow, } from './flows/learning.js';
7
+ export { ValidationFlow, createValidationFlow, } from './flows/validation.js';
8
+ //# sourceMappingURL=index.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.js","sourceRoot":"","sources":["../../src/runtime/index.ts"],"names":[],"mappings":"AAcA,UAAU;AACV,OAAO,EACL,YAAY,EACZ,kBAAkB,EAClB,wBAAwB,EACxB,0BAA0B,GAC3B,MAAM,cAAc,CAAC;AAEtB,WAAW;AACX,OAAO,EACL,iBAAiB,EACjB,uBAAuB,EACvB,gBAAgB,EAEhB,WAAW,EACX,iBAAiB,EAEjB,UAAU,EACV,gBAAgB,EAChB,mBAAmB,EACnB,sBAAsB,GAEvB,MAAM,qBAAqB,CAAC;AAE7B,QAAQ;AACR,OAAO,EACL,YAAY,EACZ,kBAAkB,GAGnB,MAAM,qBAAqB,CAAC;AAE7B,OAAO,EACL,cAAc,EACd,oBAAoB,GAIrB,MAAM,uBAAuB,CAAC"}
@@ -0,0 +1,116 @@
1
+ import type { Task, Trajectory } from '../types/index.js';
2
+ import type { MemorySystem, MemoryQueryResultV2 } from '../memory/system.js';
3
+ import type { AgentBackend, AgentSpawnConfig, AgentSession, AgentResult, AgentObserverCallbacks, KnowledgeInjector, TrajectoryExtractor } from './types.js';
4
+ /**
5
+ * Default knowledge injector - formats memory for context injection. Implements KnowledgeInjector: `format()` takes a MemoryQueryResultV2 and an agent type string and returns a string. The optional `options.format` is one of 'markdown', 'json' or 'xml' (presumably the output layout) and `options.maxTokens` is an optional number (presumably a size budget - confirm against the implementation). The remaining members are private and carry no type information in this declaration.
6
+ */
7
+ export declare class DefaultKnowledgeInjector implements KnowledgeInjector {
8
+ format(knowledge: MemoryQueryResultV2, _agentType: string, options?: {
9
+ maxTokens?: number;
10
+ format?: 'markdown' | 'json' | 'xml';
11
+ }): string;
12
+ private formatMarkdown;
13
+ private formatXml;
14
+ private escapeXml;
15
+ }
16
+ /**
17
+ * Default trajectory extractor - converts agent sessions to trajectories. Implements TrajectoryExtractor: `extract()` takes an AgentSession together with a Task and returns a single Trajectory. The remaining members are private and carry no type information in this declaration.
18
+ */
19
+ export declare class DefaultTrajectoryExtractor implements TrajectoryExtractor {
20
+ extract(session: AgentSession, task: Task): Trajectory;
21
+ private extractThought;
22
+ private summarizeInput;
23
+ private summarizeOutput;
24
+ }
25
+ /**
26
+ * Agent Manager - orchestrates agent spawning, observation, and learning. Constructed from a MemorySystem, with an optional custom KnowledgeInjector and TrajectoryExtractor supplied through `options`.
27
+ */
28
+ export declare class AgentManager {
29
+ private backends;
30
+ private memory;
31
+ private injector;
32
+ private extractor;
33
+ private observers;
34
+ private activeSessions;
35
+ constructor(memory: MemorySystem, options?: {
36
+ injector?: KnowledgeInjector;
37
+ extractor?: TrajectoryExtractor;
38
+ });
39
+ /**
40
+ * Register an agent backend (an AgentBackend instance); returns nothing
41
+ */
42
+ registerBackend(backend: AgentBackend): void;
43
+ /**
44
+ * Get a registered backend by name; the result may be undefined, presumably when no backend with that name is registered
45
+ */
46
+ getBackend(name: string): AgentBackend | undefined;
47
+ /**
48
+ * List available backends as an array of strings (presumably the registered backend names - confirm)
49
+ */
50
+ listBackends(): string[];
51
+ /**
52
+ * Add an observer for agent events, given as an AgentObserverCallbacks object
53
+ */
54
+ addObserver(callbacks: AgentObserverCallbacks): void;
55
+ /**
56
+ * Remove an observer (presumably the same AgentObserverCallbacks object that was passed to addObserver - confirm)
57
+ */
58
+ removeObserver(callbacks: AgentObserverCallbacks): void;
59
+ /**
60
+ * Spawn an agent to execute a task
61
+ * This is the main entry point for running agents; it takes an AgentSpawnConfig and resolves to an AgentResult
62
+ */
63
+ spawn(config: AgentSpawnConfig): Promise<AgentResult>;
64
+ /**
65
+ * Spawn an agent WITHOUT knowledge injection (for baseline/control); the config type omits `injectedKnowledge` and the call resolves to an AgentResult
66
+ */
67
+ spawnBaseline(config: Omit<AgentSpawnConfig, 'injectedKnowledge'>): Promise<AgentResult>;
68
+ /**
69
+ * Run an A/B comparison: with and without knowledge injection. Resolves to both AgentResults (`withKnowledge`, `baseline`) plus numeric `timeDelta`, `toolCallDelta` and `successDelta` under `improvement`
70
+ */
71
+ compareWithKnowledge(config: Omit<AgentSpawnConfig, 'injectedKnowledge'>): Promise<{
72
+ withKnowledge: AgentResult;
73
+ baseline: AgentResult;
74
+ improvement: {
75
+ timeDelta: number;
76
+ toolCallDelta: number;
77
+ successDelta: number;
78
+ };
79
+ }>;
80
+ /**
81
+ * Observe an external agent session and learn from it
82
+ * Use this when you have access to another agent's execution; takes the AgentSession and a Task and resolves to a Trajectory
83
+ */
84
+ observeAndLearn(session: AgentSession, task: Task): Promise<Trajectory>;
85
+ /**
86
+ * Get active sessions as an array of AgentSession
87
+ */
88
+ getActiveSessions(): AgentSession[];
89
+ /**
90
+ * Terminate a session, identified by its session id string
91
+ */
92
+ terminate(sessionId: string): Promise<void>;
93
+ /**
94
+ * Terminate all active sessions
95
+ */
96
+ terminateAll(): Promise<void>;
97
+ /**
98
+ * Close the manager and clean up resources
99
+ * Terminates all active sessions and clears all state
100
+ */
101
+ close(): Promise<void>;
102
+ private findBackend;
103
+ private waitForCompletion;
104
+ private notifySessionStart;
105
+ private notifyMessage;
106
+ private notifyToolCall;
107
+ private notifySessionEnd;
108
+ }
109
+ /**
110
+ * Create an agent manager. Takes a MemorySystem and an optional `options` object with `injector` (KnowledgeInjector) and `extractor` (TrajectoryExtractor) overrides - the same parameter shape as the AgentManager constructor - and returns an AgentManager.
111
+ */
112
+ export declare function createAgentManager(memory: MemorySystem, options?: {
113
+ injector?: KnowledgeInjector;
114
+ extractor?: TrajectoryExtractor;
115
+ }): AgentManager;
116
+ //# sourceMappingURL=manager.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"manager.d.ts","sourceRoot":"","sources":["../../src/runtime/manager.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,IAAI,EAAE,UAAU,EAAQ,MAAM,mBAAmB,CAAC;AAOhE,OAAO,KAAK,EAAE,YAAY,EAAE,mBAAmB,EAAE,MAAM,qBAAqB,CAAC;AAC7E,OAAO,KAAK,EACV,YAAY,EACZ,gBAAgB,EAChB,YAAY,EACZ,WAAW,EAGX,sBAAsB,EACtB,iBAAiB,EACjB,mBAAmB,EACpB,MAAM,YAAY,CAAC;AAEpB;;GAEG;AACH,qBAAa,wBAAyB,YAAW,iBAAiB;IAChE,MAAM,CACJ,SAAS,EAAE,mBAAmB,EAC9B,UAAU,EAAE,MAAM,EAClB,OAAO,CAAC,EAAE;QAAE,SAAS,CAAC,EAAE,MAAM,CAAC;QAAC,MAAM,CAAC,EAAE,UAAU,GAAG,MAAM,GAAG,KAAK,CAAA;KAAE,GACrE,MAAM;IAcT,OAAO,CAAC,cAAc;IAmCtB,OAAO,CAAC,SAAS;IAoCjB,OAAO,CAAC,SAAS;CAOlB;AAED;;GAEG;AACH,qBAAa,0BAA2B,YAAW,mBAAmB;IACpE,OAAO,CAAC,OAAO,EAAE,YAAY,EAAE,IAAI,EAAE,IAAI,GAAG,UAAU;IAgDtD,OAAO,CAAC,cAAc;IAsBtB,OAAO,CAAC,cAAc;IAWtB,OAAO,CAAC,eAAe;CAWxB;AAED;;GAEG;AACH,qBAAa,YAAY;IACvB,OAAO,CAAC,QAAQ,CAAwC;IACxD,OAAO,CAAC,MAAM,CAAe;IAC7B,OAAO,CAAC,QAAQ,CAAoB;IACpC,OAAO,CAAC,SAAS,CAAsB;IACvC,OAAO,CAAC,SAAS,CAAgC;IACjD,OAAO,CAAC,cAAc,CAAwC;gBAG5D,MAAM,EAAE,YAAY,EACpB,OAAO,CAAC,EAAE;QACR,QAAQ,CAAC,EAAE,iBAAiB,CAAC;QAC7B,SAAS,CAAC,EAAE,mBAAmB,CAAC;KACjC;IAOH;;OAEG;IACH,eAAe,CAAC,OAAO,EAAE,YAAY,GAAG,IAAI;IAI5C;;OAEG;IACH,UAAU,CAAC,IAAI,EAAE,MAAM,GAAG,YAAY,GAAG,SAAS;IAIlD;;OAEG;IACH,YAAY,IAAI,MAAM,EAAE;IAIxB;;OAEG;IACH,WAAW,CAAC,SAAS,EAAE,sBAAsB,GAAG,IAAI;IAIpD;;OAEG;IACH,cAAc,CAAC,SAAS,EAAE,sBAAsB,GAAG,IAAI;IAOvD;;;OAGG;IACG,KAAK,CAAC,MAAM,EAAE,gBAAgB,GAAG,OAAO,CAAC,WAAW,CAAC;IA6E3D;;OAEG;IACG,aAAa,CACjB,MAAM,EAAE,IAAI,CAAC,gBAAgB,EAAE,mBAAmB,CAAC,GAClD,OAAO,CAAC,WAAW,CAAC;IAUvB;;OAEG;IACG,oBAAoB,CACxB,MAAM,EAAE,IAAI,CAAC,gBAAgB,EAAE,mBAAmB,CAAC,GAClD,OAAO,CAAC;QACT,aAAa,EAAE,WAAW,CAAC;QAC3B,QAAQ,EAAE,WAAW,CAAC;QACtB,WAAW,EAAE;YACX,SAAS,EAAE,MAAM,CAAC;YAClB,aAAa,EAAE,MAAM,CAAC;YACtB,YAAY,EAAE,MAAM,CAAC;SACtB,CAAC;KACH,CAAC;IAoBF;;;OAGG;IACG,eAAe,CAAC,OAAO,EAAE,YAAY,EAAE,IAAI,EAAE,IAAI,GAAG,OAAO,CAAC,UAAU,CAAC;IAS7E;;OAEG;IACH,iBAAiB,IAAI,YAAY,EAAE;IAInC;;OAEG;IACG,SAAS,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAYjD;;OAEG;
IACG,YAAY,IAAI,OAAO,CAAC,IAAI,CAAC;IAKnC;;;OAGG;IACG,KAAK,IAAI,OAAO,CAAC,IAAI,CAAC;IAa5B,OAAO,CAAC,WAAW;YAWL,iBAAiB;IAuB/B,OAAO,CAAC,kBAAkB;IAM1B,OAAO,CAAC,aAAa;IAMrB,OAAO,CAAC,cAAc;IAMtB,OAAO,CAAC,gBAAgB;CAKzB;AAED;;GAEG;AACH,wBAAgB,kBAAkB,CAChC,MAAM,EAAE,YAAY,EACpB,OAAO,CAAC,EAAE;IACR,QAAQ,CAAC,EAAE,iBAAiB,CAAC;IAC7B,SAAS,CAAC,EAAE,mBAAmB,CAAC;CACjC,GACA,YAAY,CAEd"}