@namzu/sdk 0.4.0 → 0.4.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (480) hide show
  1. package/CHANGELOG.md +86 -0
  2. package/dist/__tests__/replay-public-surface.test.d.ts +2 -0
  3. package/dist/__tests__/replay-public-surface.test.d.ts.map +1 -0
  4. package/dist/__tests__/replay-public-surface.test.js +45 -0
  5. package/dist/__tests__/replay-public-surface.test.js.map +1 -0
  6. package/dist/agents/SupervisorAgent.d.ts.map +1 -1
  7. package/dist/agents/SupervisorAgent.js.map +1 -1
  8. package/dist/bridge/a2a/task.d.ts +2 -2
  9. package/dist/bridge/a2a/task.d.ts.map +1 -1
  10. package/dist/bridge/a2a/task.js.map +1 -1
  11. package/dist/config/runtime.d.ts +24 -25
  12. package/dist/config/runtime.d.ts.map +1 -1
  13. package/dist/config/runtime.js.map +1 -1
  14. package/dist/contracts/api.d.ts +2 -2
  15. package/dist/contracts/api.d.ts.map +1 -1
  16. package/dist/contracts/index.d.ts +1 -2
  17. package/dist/contracts/index.d.ts.map +1 -1
  18. package/dist/contracts/index.js.map +1 -1
  19. package/dist/contracts/schemas.d.ts +10 -10
  20. package/dist/index.d.ts +3 -103
  21. package/dist/index.d.ts.map +1 -1
  22. package/dist/index.js +9 -89
  23. package/dist/index.js.map +1 -1
  24. package/dist/manager/agent/__tests__/lifecycle.test.js.map +1 -1
  25. package/dist/manager/agent/lifecycle.d.ts +1 -1
  26. package/dist/manager/agent/lifecycle.d.ts.map +1 -1
  27. package/dist/manager/agent/lifecycle.js +1 -1
  28. package/dist/manager/agent/lifecycle.js.map +1 -1
  29. package/dist/manager/run/persistence.d.ts +3 -3
  30. package/dist/manager/run/persistence.d.ts.map +1 -1
  31. package/dist/manager/run/persistence.js.map +1 -1
  32. package/dist/manager/thread/__tests__/lifecycle.test.js.map +1 -1
  33. package/dist/manager/thread/lifecycle.d.ts +1 -1
  34. package/dist/manager/thread/lifecycle.d.ts.map +1 -1
  35. package/dist/plugin/loader.d.ts +0 -5
  36. package/dist/plugin/loader.d.ts.map +1 -1
  37. package/dist/plugin/loader.js +1 -13
  38. package/dist/plugin/loader.js.map +1 -1
  39. package/dist/public-runtime.d.ts +70 -0
  40. package/dist/public-runtime.d.ts.map +1 -0
  41. package/dist/public-runtime.js +108 -0
  42. package/dist/public-runtime.js.map +1 -0
  43. package/dist/public-tools.d.ts +19 -0
  44. package/dist/public-tools.d.ts.map +1 -0
  45. package/dist/public-tools.js +34 -0
  46. package/dist/public-tools.js.map +1 -0
  47. package/dist/public-types.d.ts +55 -0
  48. package/dist/public-types.d.ts.map +1 -0
  49. package/dist/public-types.js +14 -0
  50. package/dist/public-types.js.map +1 -0
  51. package/dist/rag/rag-tool.d.ts +1 -1
  52. package/dist/run/LimitChecker.d.ts +0 -1
  53. package/dist/run/LimitChecker.d.ts.map +1 -1
  54. package/dist/run/LimitChecker.js +0 -6
  55. package/dist/run/LimitChecker.js.map +1 -1
  56. package/dist/run/reporter.d.ts +2 -2
  57. package/dist/run/reporter.d.ts.map +1 -1
  58. package/dist/run/reporter.js.map +1 -1
  59. package/dist/runtime/query/__tests__/checkpoint.test.d.ts +2 -0
  60. package/dist/runtime/query/__tests__/checkpoint.test.d.ts.map +1 -0
  61. package/dist/runtime/query/__tests__/checkpoint.test.js +150 -0
  62. package/dist/runtime/query/__tests__/checkpoint.test.js.map +1 -0
  63. package/dist/runtime/query/checkpoint.d.ts +23 -0
  64. package/dist/runtime/query/checkpoint.d.ts.map +1 -1
  65. package/dist/runtime/query/checkpoint.js +49 -0
  66. package/dist/runtime/query/checkpoint.js.map +1 -1
  67. package/dist/runtime/query/context.d.ts +0 -2
  68. package/dist/runtime/query/context.d.ts.map +1 -1
  69. package/dist/runtime/query/context.js +0 -4
  70. package/dist/runtime/query/context.js.map +1 -1
  71. package/dist/runtime/query/index.d.ts +3 -3
  72. package/dist/runtime/query/index.d.ts.map +1 -1
  73. package/dist/runtime/query/replay/__tests__/mutate.test.d.ts +2 -0
  74. package/dist/runtime/query/replay/__tests__/mutate.test.d.ts.map +1 -0
  75. package/dist/runtime/query/replay/__tests__/mutate.test.js +123 -0
  76. package/dist/runtime/query/replay/__tests__/mutate.test.js.map +1 -0
  77. package/dist/runtime/query/replay/__tests__/prepare.test.d.ts +2 -0
  78. package/dist/runtime/query/replay/__tests__/prepare.test.d.ts.map +1 -0
  79. package/dist/runtime/query/replay/__tests__/prepare.test.js +171 -0
  80. package/dist/runtime/query/replay/__tests__/prepare.test.js.map +1 -0
  81. package/dist/runtime/query/replay/list.d.ts +24 -0
  82. package/dist/runtime/query/replay/list.d.ts.map +1 -0
  83. package/dist/runtime/query/replay/list.js +21 -0
  84. package/dist/runtime/query/replay/list.js.map +1 -0
  85. package/dist/runtime/query/replay/mutate.d.ts +17 -0
  86. package/dist/runtime/query/replay/mutate.d.ts.map +1 -0
  87. package/dist/runtime/query/replay/mutate.js +62 -0
  88. package/dist/runtime/query/replay/mutate.js.map +1 -0
  89. package/dist/runtime/query/replay/prepare.d.ts +56 -0
  90. package/dist/runtime/query/replay/prepare.d.ts.map +1 -0
  91. package/dist/runtime/query/replay/prepare.js +65 -0
  92. package/dist/runtime/query/replay/prepare.js.map +1 -0
  93. package/dist/runtime/query/result.d.ts +2 -2
  94. package/dist/runtime/query/result.d.ts.map +1 -1
  95. package/dist/session/__tests__/integration/_fixtures.d.ts +4 -4
  96. package/dist/session/__tests__/integration/_fixtures.d.ts.map +1 -1
  97. package/dist/session/__tests__/integration/_fixtures.js.map +1 -1
  98. package/dist/session/__tests__/integration/archive-gate.test.js.map +1 -1
  99. package/dist/session/__tests__/integration/capacity-caps.test.js.map +1 -1
  100. package/dist/session/__tests__/integration/e2e-spawn.test.js.map +1 -1
  101. package/dist/session/__tests__/integration/handoff-broadcast-e2e.test.js.map +1 -1
  102. package/dist/session/__tests__/integration/handoff-single-e2e.test.js.map +1 -1
  103. package/dist/session/__tests__/integration/prev-artifact-dag.test.js.map +1 -1
  104. package/dist/session/__tests__/integration/retention-archive.test.js.map +1 -1
  105. package/dist/session/__tests__/integration/spawn-rollback.test.js.map +1 -1
  106. package/dist/session/__tests__/integration/summary-materialization-e2e.test.js +1 -1
  107. package/dist/session/__tests__/integration/summary-materialization-e2e.test.js.map +1 -1
  108. package/dist/session/errors.d.ts +1 -1
  109. package/dist/session/errors.d.ts.map +1 -1
  110. package/dist/session/events/index.d.ts +3 -3
  111. package/dist/session/events/index.d.ts.map +1 -1
  112. package/dist/session/events/index.js +3 -2
  113. package/dist/session/events/index.js.map +1 -1
  114. package/dist/session/handoff/__tests__/broadcast.test.js.map +1 -1
  115. package/dist/session/handoff/__tests__/capacity.test.js.map +1 -1
  116. package/dist/session/handoff/__tests__/single.test.js.map +1 -1
  117. package/dist/session/handoff/assignment.d.ts +1 -1
  118. package/dist/session/handoff/assignment.d.ts.map +1 -1
  119. package/dist/session/handoff/broadcast.d.ts.map +1 -1
  120. package/dist/session/handoff/broadcast.js.map +1 -1
  121. package/dist/session/handoff/single.d.ts.map +1 -1
  122. package/dist/session/handoff/single.js.map +1 -1
  123. package/dist/session/index.d.ts +0 -1
  124. package/dist/session/index.d.ts.map +1 -1
  125. package/dist/session/index.js +7 -6
  126. package/dist/session/index.js.map +1 -1
  127. package/dist/session/intervention/__tests__/prev-artifact.test.js.map +1 -1
  128. package/dist/session/intervention/prev-artifact.d.ts +1 -1
  129. package/dist/session/intervention/prev-artifact.d.ts.map +1 -1
  130. package/dist/session/retention/__tests__/archive.test.js.map +1 -1
  131. package/dist/session/retention/__tests__/disk-backend.test.js.map +1 -1
  132. package/dist/session/retention/archive.d.ts +1 -1
  133. package/dist/session/retention/archive.d.ts.map +1 -1
  134. package/dist/session/retention/backend.d.ts +4 -4
  135. package/dist/session/retention/backend.d.ts.map +1 -1
  136. package/dist/session/retention/disk-backend.d.ts +1 -1
  137. package/dist/session/retention/disk-backend.d.ts.map +1 -1
  138. package/dist/session/retention/index.d.ts +3 -3
  139. package/dist/session/retention/index.d.ts.map +1 -1
  140. package/dist/session/retention/index.js +4 -2
  141. package/dist/session/retention/index.js.map +1 -1
  142. package/dist/session/status/__tests__/derive.test.d.ts +2 -0
  143. package/dist/session/status/__tests__/derive.test.d.ts.map +1 -0
  144. package/dist/session/{hierarchy/__tests__/session.test.js → status/__tests__/derive.test.js} +2 -2
  145. package/dist/session/status/__tests__/derive.test.js.map +1 -0
  146. package/dist/session/status/derive.d.ts +33 -0
  147. package/dist/session/status/derive.d.ts.map +1 -0
  148. package/dist/session/{hierarchy/session.js → status/derive.js} +6 -1
  149. package/dist/session/status/derive.js.map +1 -0
  150. package/dist/session/summary/__tests__/materialize.test.js +2 -1
  151. package/dist/session/summary/__tests__/materialize.test.js.map +1 -1
  152. package/dist/session/summary/errors.d.ts +43 -0
  153. package/dist/session/summary/errors.d.ts.map +1 -0
  154. package/dist/session/summary/errors.js +37 -0
  155. package/dist/session/summary/errors.js.map +1 -0
  156. package/dist/session/summary/index.d.ts +4 -3
  157. package/dist/session/summary/index.d.ts.map +1 -1
  158. package/dist/session/summary/index.js +5 -4
  159. package/dist/session/summary/index.js.map +1 -1
  160. package/dist/session/summary/materialize.d.ts +2 -2
  161. package/dist/session/summary/materialize.d.ts.map +1 -1
  162. package/dist/session/summary/materialize.js +2 -1
  163. package/dist/session/summary/materialize.js.map +1 -1
  164. package/dist/session/workspace/__tests__/git-worktree.test.js.map +1 -1
  165. package/dist/session/workspace/driver.d.ts +2 -2
  166. package/dist/session/workspace/driver.d.ts.map +1 -1
  167. package/dist/session/workspace/git-worktree.d.ts +1 -1
  168. package/dist/session/workspace/git-worktree.d.ts.map +1 -1
  169. package/dist/session/workspace/git-worktree.js.map +1 -1
  170. package/dist/session/workspace/index.d.ts +1 -1
  171. package/dist/session/workspace/index.d.ts.map +1 -1
  172. package/dist/session/workspace/index.js +3 -2
  173. package/dist/session/workspace/index.js.map +1 -1
  174. package/dist/store/run/disk.d.ts +4 -4
  175. package/dist/store/run/disk.d.ts.map +1 -1
  176. package/dist/store/run/disk.js.map +1 -1
  177. package/dist/store/session/__tests__/disk.test.js.map +1 -1
  178. package/dist/store/session/__tests__/memory.test.js.map +1 -1
  179. package/dist/store/session/disk.d.ts +6 -6
  180. package/dist/store/session/disk.d.ts.map +1 -1
  181. package/dist/store/session/disk.js +1 -1
  182. package/dist/store/session/disk.js.map +1 -1
  183. package/dist/store/session/index.d.ts +1 -1
  184. package/dist/store/session/index.d.ts.map +1 -1
  185. package/dist/store/session/index.js +2 -1
  186. package/dist/store/session/index.js.map +1 -1
  187. package/dist/store/session/linkage.d.ts +1 -1
  188. package/dist/store/session/linkage.d.ts.map +1 -1
  189. package/dist/store/session/memory.d.ts +5 -5
  190. package/dist/store/session/memory.d.ts.map +1 -1
  191. package/dist/store/session/memory.js +1 -1
  192. package/dist/store/session/memory.js.map +1 -1
  193. package/dist/store/thread/disk.d.ts +1 -1
  194. package/dist/store/thread/disk.d.ts.map +1 -1
  195. package/dist/store/thread/memory.d.ts +1 -1
  196. package/dist/store/thread/memory.d.ts.map +1 -1
  197. package/dist/telemetry/attributes.d.ts +0 -1
  198. package/dist/telemetry/attributes.d.ts.map +1 -1
  199. package/dist/telemetry/attributes.js +0 -3
  200. package/dist/telemetry/attributes.js.map +1 -1
  201. package/dist/telemetry/runtime-accessors.d.ts +1 -2
  202. package/dist/telemetry/runtime-accessors.d.ts.map +1 -1
  203. package/dist/telemetry/runtime-accessors.js +1 -4
  204. package/dist/telemetry/runtime-accessors.js.map +1 -1
  205. package/dist/tools/builtins/bash.d.ts +1 -1
  206. package/dist/tools/builtins/computer-use.d.ts +4 -4
  207. package/dist/tools/builtins/edit.d.ts +1 -1
  208. package/dist/tools/builtins/glob.d.ts +1 -1
  209. package/dist/tools/builtins/grep.d.ts +1 -1
  210. package/dist/tools/builtins/ls.d.ts +1 -1
  211. package/dist/tools/builtins/read-file.d.ts +1 -1
  212. package/dist/tools/builtins/search-tools.d.ts +1 -1
  213. package/dist/tools/builtins/write-file.d.ts +1 -1
  214. package/dist/types/agent/task.d.ts +2 -2
  215. package/dist/types/agent/task.d.ts.map +1 -1
  216. package/dist/{session/hierarchy/project.d.ts → types/project/entity.d.ts} +4 -4
  217. package/dist/types/project/entity.d.ts.map +1 -0
  218. package/dist/types/project/entity.js +2 -0
  219. package/dist/types/project/entity.js.map +1 -0
  220. package/dist/types/project/index.d.ts +2 -0
  221. package/dist/types/project/index.d.ts.map +1 -0
  222. package/dist/types/project/index.js +4 -0
  223. package/dist/types/project/index.js.map +1 -0
  224. package/dist/types/retention/archive-backend-ref.d.ts.map +1 -0
  225. package/dist/types/retention/archive-backend-ref.js.map +1 -0
  226. package/dist/types/retention/index.d.ts +4 -0
  227. package/dist/types/retention/index.d.ts.map +1 -0
  228. package/dist/types/retention/index.js +4 -0
  229. package/dist/types/retention/index.js.map +1 -0
  230. package/dist/types/retention/policy.d.ts.map +1 -0
  231. package/dist/types/retention/policy.js.map +1 -0
  232. package/dist/types/run/entity.d.ts +56 -0
  233. package/dist/types/run/entity.d.ts.map +1 -0
  234. package/dist/types/run/entity.js +2 -0
  235. package/dist/types/run/entity.js.map +1 -0
  236. package/dist/types/run/events.d.ts +2 -2
  237. package/dist/types/run/events.d.ts.map +1 -1
  238. package/dist/types/run/index.d.ts +7 -1
  239. package/dist/types/run/index.d.ts.map +1 -1
  240. package/dist/types/run/index.js +8 -9
  241. package/dist/types/run/index.js.map +1 -1
  242. package/dist/{session/hierarchy → types/run}/lineage.d.ts +1 -1
  243. package/dist/types/run/lineage.d.ts.map +1 -0
  244. package/dist/types/run/lineage.js.map +1 -0
  245. package/dist/types/run/replay.d.ts +53 -0
  246. package/dist/types/run/replay.d.ts.map +1 -0
  247. package/dist/types/run/replay.js +15 -0
  248. package/dist/types/run/replay.js.map +1 -0
  249. package/dist/types/run/schema-version.d.ts.map +1 -0
  250. package/dist/types/run/schema-version.js.map +1 -0
  251. package/dist/{session/events/types.d.ts → types/run/subsession-events.d.ts} +5 -5
  252. package/dist/types/run/subsession-events.d.ts.map +1 -0
  253. package/dist/types/run/subsession-events.js +2 -0
  254. package/dist/types/run/subsession-events.js.map +1 -0
  255. package/dist/{session/hierarchy → types/session}/actor.d.ts +1 -1
  256. package/dist/types/session/actor.d.ts.map +1 -0
  257. package/dist/{session/hierarchy → types/session}/actor.js.map +1 -1
  258. package/dist/types/session/entity.d.ts +51 -0
  259. package/dist/types/session/entity.d.ts.map +1 -0
  260. package/dist/types/session/entity.js +2 -0
  261. package/dist/types/session/entity.js.map +1 -0
  262. package/dist/types/session/index.d.ts +4 -0
  263. package/dist/types/session/index.d.ts.map +1 -1
  264. package/dist/{store → types}/session/messages.d.ts +2 -2
  265. package/dist/{store → types}/session/messages.d.ts.map +1 -1
  266. package/dist/types/session/messages.js.map +1 -0
  267. package/dist/types/session/store.d.ts +6 -6
  268. package/dist/types/session/store.d.ts.map +1 -1
  269. package/dist/{session/hierarchy → types/session}/sub-session.d.ts +9 -9
  270. package/dist/types/session/sub-session.d.ts.map +1 -0
  271. package/dist/types/session/sub-session.js.map +1 -0
  272. package/dist/{session → types}/summary/deliverable.d.ts +2 -2
  273. package/dist/types/summary/deliverable.d.ts.map +1 -0
  274. package/dist/types/summary/deliverable.js.map +1 -0
  275. package/dist/types/summary/index.d.ts +4 -0
  276. package/dist/types/summary/index.d.ts.map +1 -0
  277. package/dist/types/summary/index.js +4 -0
  278. package/dist/types/summary/index.js.map +1 -0
  279. package/dist/{session → types}/summary/ref.d.ts +9 -36
  280. package/dist/types/summary/ref.d.ts.map +1 -0
  281. package/dist/types/summary/ref.js +28 -0
  282. package/dist/types/summary/ref.js.map +1 -0
  283. package/dist/{session/hierarchy/tenant.d.ts → types/tenant/entity.d.ts} +2 -2
  284. package/dist/types/tenant/entity.d.ts.map +1 -0
  285. package/dist/types/tenant/entity.js +2 -0
  286. package/dist/types/tenant/entity.js.map +1 -0
  287. package/dist/types/tenant/index.d.ts +2 -0
  288. package/dist/types/tenant/index.d.ts.map +1 -0
  289. package/dist/types/tenant/index.js +4 -0
  290. package/dist/types/tenant/index.js.map +1 -0
  291. package/dist/{session/hierarchy/thread.d.ts → types/thread/entity.d.ts} +31 -7
  292. package/dist/types/thread/entity.d.ts.map +1 -0
  293. package/dist/types/thread/entity.js +2 -0
  294. package/dist/types/thread/entity.js.map +1 -0
  295. package/dist/types/thread/index.d.ts +1 -0
  296. package/dist/types/thread/index.d.ts.map +1 -1
  297. package/dist/types/thread/store.d.ts +1 -1
  298. package/dist/types/thread/store.d.ts.map +1 -1
  299. package/dist/types/workspace/index.d.ts +2 -0
  300. package/dist/types/workspace/index.d.ts.map +1 -0
  301. package/dist/types/workspace/index.js +7 -0
  302. package/dist/types/workspace/index.js.map +1 -0
  303. package/dist/{session → types}/workspace/ref.d.ts +1 -1
  304. package/dist/types/workspace/ref.d.ts.map +1 -0
  305. package/dist/types/workspace/ref.js.map +1 -0
  306. package/package.json +1 -1
  307. package/src/__tests__/replay-public-surface.test.ts +54 -0
  308. package/src/agents/SupervisorAgent.ts +1 -1
  309. package/src/bridge/a2a/task.ts +4 -4
  310. package/src/config/runtime.ts +0 -2
  311. package/src/contracts/api.ts +2 -2
  312. package/src/contracts/index.ts +1 -3
  313. package/src/index.ts +11 -362
  314. package/src/manager/agent/__tests__/lifecycle.test.ts +2 -2
  315. package/src/manager/agent/lifecycle.ts +5 -5
  316. package/src/manager/run/persistence.ts +4 -4
  317. package/src/manager/thread/__tests__/lifecycle.test.ts +1 -1
  318. package/src/manager/thread/lifecycle.ts +2 -2
  319. package/src/plugin/loader.ts +0 -16
  320. package/src/public-runtime.ts +373 -0
  321. package/src/public-tools.ts +63 -0
  322. package/src/public-types.ts +156 -0
  323. package/src/run/LimitChecker.ts +0 -9
  324. package/src/run/reporter.ts +3 -3
  325. package/src/runtime/query/__tests__/checkpoint.test.ts +169 -0
  326. package/src/runtime/query/checkpoint.ts +54 -0
  327. package/src/runtime/query/context.ts +0 -5
  328. package/src/runtime/query/index.ts +4 -4
  329. package/src/runtime/query/replay/__tests__/mutate.test.ts +134 -0
  330. package/src/runtime/query/replay/__tests__/prepare.test.ts +207 -0
  331. package/src/runtime/query/replay/list.ts +32 -0
  332. package/src/runtime/query/replay/mutate.ts +76 -0
  333. package/src/runtime/query/replay/prepare.ts +114 -0
  334. package/src/runtime/query/result.ts +2 -2
  335. package/src/session/__tests__/integration/_fixtures.ts +2 -2
  336. package/src/session/__tests__/integration/archive-gate.test.ts +1 -1
  337. package/src/session/__tests__/integration/capacity-caps.test.ts +1 -1
  338. package/src/session/__tests__/integration/e2e-spawn.test.ts +1 -1
  339. package/src/session/__tests__/integration/handoff-broadcast-e2e.test.ts +1 -1
  340. package/src/session/__tests__/integration/handoff-single-e2e.test.ts +1 -1
  341. package/src/session/__tests__/integration/prev-artifact-dag.test.ts +4 -1
  342. package/src/session/__tests__/integration/retention-archive.test.ts +1 -1
  343. package/src/session/__tests__/integration/spawn-rollback.test.ts +2 -2
  344. package/src/session/__tests__/integration/summary-materialization-e2e.test.ts +1 -1
  345. package/src/session/errors.ts +1 -1
  346. package/src/session/events/index.ts +5 -4
  347. package/src/session/handoff/__tests__/broadcast.test.ts +1 -1
  348. package/src/session/handoff/__tests__/capacity.test.ts +1 -1
  349. package/src/session/handoff/__tests__/single.test.ts +1 -1
  350. package/src/session/handoff/assignment.ts +1 -1
  351. package/src/session/handoff/broadcast.ts +2 -2
  352. package/src/session/handoff/single.ts +2 -2
  353. package/src/session/index.ts +7 -6
  354. package/src/session/intervention/__tests__/prev-artifact.test.ts +4 -1
  355. package/src/session/intervention/prev-artifact.ts +1 -1
  356. package/src/session/retention/__tests__/archive.test.ts +3 -3
  357. package/src/session/retention/__tests__/disk-backend.test.ts +4 -4
  358. package/src/session/retention/archive.ts +2 -2
  359. package/src/session/retention/backend.ts +4 -4
  360. package/src/session/retention/disk-backend.ts +4 -4
  361. package/src/session/retention/index.ts +6 -4
  362. package/src/session/{hierarchy/__tests__/session.test.ts → status/__tests__/derive.test.ts} +3 -2
  363. package/src/session/{hierarchy/session.ts → status/derive.ts} +9 -55
  364. package/src/session/summary/__tests__/materialize.test.ts +4 -7
  365. package/src/session/summary/errors.ts +51 -0
  366. package/src/session/summary/index.ts +7 -10
  367. package/src/session/summary/materialize.ts +4 -5
  368. package/src/session/workspace/__tests__/git-worktree.test.ts +1 -1
  369. package/src/session/workspace/driver.ts +2 -2
  370. package/src/session/workspace/git-worktree.ts +1 -1
  371. package/src/session/workspace/index.ts +7 -6
  372. package/src/store/run/disk.ts +4 -4
  373. package/src/store/session/__tests__/disk.test.ts +2 -2
  374. package/src/store/session/__tests__/memory.test.ts +2 -2
  375. package/src/store/session/disk.ts +12 -12
  376. package/src/store/session/index.ts +3 -2
  377. package/src/store/session/linkage.ts +1 -1
  378. package/src/store/session/memory.ts +6 -6
  379. package/src/store/thread/disk.ts +1 -1
  380. package/src/store/thread/memory.ts +1 -1
  381. package/src/telemetry/attributes.ts +0 -4
  382. package/src/telemetry/runtime-accessors.ts +1 -5
  383. package/src/types/agent/task.ts +2 -2
  384. package/src/{session/hierarchy/project.ts → types/project/entity.ts} +3 -3
  385. package/src/types/project/index.ts +4 -0
  386. package/src/types/retention/index.ts +6 -0
  387. package/src/types/run/entity.ts +63 -0
  388. package/src/types/run/events.ts +6 -6
  389. package/src/types/run/index.ts +16 -9
  390. package/src/{session/hierarchy → types/run}/lineage.ts +1 -1
  391. package/src/types/run/replay.ts +61 -0
  392. package/src/{session/events/types.ts → types/run/subsession-events.ts} +4 -4
  393. package/src/{session/hierarchy → types/session}/actor.ts +1 -1
  394. package/src/types/session/entity.ts +59 -0
  395. package/src/types/session/index.ts +15 -0
  396. package/src/{store → types}/session/messages.ts +2 -2
  397. package/src/types/session/store.ts +6 -6
  398. package/src/{session/hierarchy → types/session}/sub-session.ts +9 -9
  399. package/src/{session → types}/summary/deliverable.ts +2 -2
  400. package/src/types/summary/index.ts +18 -0
  401. package/src/{session → types}/summary/ref.ts +9 -44
  402. package/src/{session/hierarchy/tenant.ts → types/tenant/entity.ts} +1 -1
  403. package/src/types/tenant/index.ts +4 -0
  404. package/src/{session/hierarchy/thread.ts → types/thread/entity.ts} +30 -6
  405. package/src/types/thread/index.ts +1 -0
  406. package/src/types/thread/store.ts +1 -1
  407. package/src/types/workspace/index.ts +12 -0
  408. package/src/{session → types}/workspace/ref.ts +1 -1
  409. package/dist/contracts/ids.d.ts +0 -2
  410. package/dist/contracts/ids.d.ts.map +0 -1
  411. package/dist/contracts/ids.js +0 -2
  412. package/dist/contracts/ids.js.map +0 -1
  413. package/dist/session/events/schema-version.d.ts.map +0 -1
  414. package/dist/session/events/schema-version.js.map +0 -1
  415. package/dist/session/events/types.d.ts.map +0 -1
  416. package/dist/session/events/types.js +0 -2
  417. package/dist/session/events/types.js.map +0 -1
  418. package/dist/session/hierarchy/__tests__/session.test.d.ts +0 -2
  419. package/dist/session/hierarchy/__tests__/session.test.d.ts.map +0 -1
  420. package/dist/session/hierarchy/__tests__/session.test.js.map +0 -1
  421. package/dist/session/hierarchy/actor.d.ts.map +0 -1
  422. package/dist/session/hierarchy/index.d.ts +0 -9
  423. package/dist/session/hierarchy/index.d.ts.map +0 -1
  424. package/dist/session/hierarchy/index.js +0 -4
  425. package/dist/session/hierarchy/index.js.map +0 -1
  426. package/dist/session/hierarchy/lineage.d.ts.map +0 -1
  427. package/dist/session/hierarchy/lineage.js.map +0 -1
  428. package/dist/session/hierarchy/project.d.ts.map +0 -1
  429. package/dist/session/hierarchy/project.js +0 -2
  430. package/dist/session/hierarchy/project.js.map +0 -1
  431. package/dist/session/hierarchy/session.d.ts +0 -71
  432. package/dist/session/hierarchy/session.d.ts.map +0 -1
  433. package/dist/session/hierarchy/session.js.map +0 -1
  434. package/dist/session/hierarchy/sub-session.d.ts.map +0 -1
  435. package/dist/session/hierarchy/sub-session.js.map +0 -1
  436. package/dist/session/hierarchy/tenant.d.ts.map +0 -1
  437. package/dist/session/hierarchy/tenant.js +0 -2
  438. package/dist/session/hierarchy/tenant.js.map +0 -1
  439. package/dist/session/hierarchy/thread.d.ts.map +0 -1
  440. package/dist/session/hierarchy/thread.js +0 -2
  441. package/dist/session/hierarchy/thread.js.map +0 -1
  442. package/dist/session/retention/archive-backend-ref.d.ts.map +0 -1
  443. package/dist/session/retention/archive-backend-ref.js.map +0 -1
  444. package/dist/session/retention/policy.d.ts.map +0 -1
  445. package/dist/session/retention/policy.js.map +0 -1
  446. package/dist/session/summary/deliverable.d.ts.map +0 -1
  447. package/dist/session/summary/deliverable.js.map +0 -1
  448. package/dist/session/summary/ref.d.ts.map +0 -1
  449. package/dist/session/summary/ref.js +0 -51
  450. package/dist/session/summary/ref.js.map +0 -1
  451. package/dist/session/workspace/ref.d.ts.map +0 -1
  452. package/dist/session/workspace/ref.js.map +0 -1
  453. package/dist/store/session/messages.js.map +0 -1
  454. package/dist/tools/builtins/__tests__/structuredOutput.example.d.ts +0 -140
  455. package/dist/tools/builtins/__tests__/structuredOutput.example.d.ts.map +0 -1
  456. package/dist/tools/builtins/__tests__/structuredOutput.example.js +0 -183
  457. package/dist/tools/builtins/__tests__/structuredOutput.example.js.map +0 -1
  458. package/dist/types/run/state.d.ts +0 -30
  459. package/dist/types/run/state.d.ts.map +0 -1
  460. package/dist/types/run/state.js +0 -2
  461. package/dist/types/run/state.js.map +0 -1
  462. package/src/contracts/ids.ts +0 -1
  463. package/src/session/hierarchy/index.ts +0 -18
  464. package/src/tools/builtins/__tests__/structuredOutput.example.ts +0 -221
  465. package/src/types/run/state.ts +0 -35
  466. /package/dist/{session → types}/retention/archive-backend-ref.d.ts +0 -0
  467. /package/dist/{session → types}/retention/archive-backend-ref.js +0 -0
  468. /package/dist/{session → types}/retention/policy.d.ts +0 -0
  469. /package/dist/{session → types}/retention/policy.js +0 -0
  470. /package/dist/{session/hierarchy → types/run}/lineage.js +0 -0
  471. /package/dist/{session/events → types/run}/schema-version.d.ts +0 -0
  472. /package/dist/{session/events → types/run}/schema-version.js +0 -0
  473. /package/dist/{session/hierarchy → types/session}/actor.js +0 -0
  474. /package/dist/{store → types}/session/messages.js +0 -0
  475. /package/dist/{session/hierarchy → types/session}/sub-session.js +0 -0
  476. /package/dist/{session → types}/summary/deliverable.js +0 -0
  477. /package/dist/{session → types}/workspace/ref.js +0 -0
  478. /package/src/{session → types}/retention/archive-backend-ref.ts +0 -0
  479. /package/src/{session → types}/retention/policy.ts +0 -0
  480. /package/src/{session/events → types/run}/schema-version.ts +0 -0
@@ -0,0 +1,169 @@
1
+ import { describe, expect, it } from 'vitest'
2
+ import type { RunDiskStore } from '../../../store/run/disk.js'
3
+ import type { CheckpointId, IterationCheckpoint } from '../../../types/hitl/index.js'
4
+ import type { EmergencySaveId, RunId } from '../../../types/ids/index.js'
5
+ import type { EmergencySaveData } from '../../../types/run/emergency.js'
6
+ import { CheckpointManager, projectEmergencyToCheckpoint } from '../checkpoint.js'
7
+
8
/**
 * Build an `IterationCheckpoint` fixture for the tests in this file.
 *
 * Every field gets a fixed placeholder value (zeroed token usage and cost,
 * a single user message, iteration 1) except `createdAt`, which is taken
 * from `Date.now()` at call time.
 *
 * @param overrides - Fields that replace the corresponding defaults.
 * @returns The defaults shallow-merged with `overrides`.
 */
function makeCheckpoint(overrides: Partial<IterationCheckpoint> = {}): IterationCheckpoint {
  const defaults: IterationCheckpoint = {
    id: 'cp_test_a' as CheckpointId,
    runId: 'run_test' as RunId,
    iteration: 1,
    messages: [{ role: 'user', content: 'hello' }],
    tokenUsage: {
      promptTokens: 0,
      completionTokens: 0,
      totalTokens: 0,
      cachedTokens: 0,
      cacheWriteTokens: 0,
    },
    costInfo: {
      inputCostPer1M: 0,
      outputCostPer1M: 0,
      totalCost: 0,
      cacheDiscount: 0,
    },
    guardState: { iterationCount: 1, elapsedMs: 100 },
    createdAt: Date.now(),
  }

  // Overrides are spread last so any caller-supplied field wins.
  return { ...defaults, ...overrides }
}
32
+
33
/**
 * Create a minimal stand-in for `RunDiskStore` that only implements
 * `listCheckpoints`, resolving to the array passed in.
 *
 * The double cast is deliberate: the stub does not implement the rest of the
 * store surface, so it cannot be assigned to `RunDiskStore` directly.
 *
 * @param checkpoints - The checkpoints `listCheckpoints()` resolves to.
 */
function makeStoreStub(checkpoints: IterationCheckpoint[]): RunDiskStore {
  const stub = {
    async listCheckpoints() {
      return checkpoints
    },
  }
  return stub as unknown as RunDiskStore
}
38
+
39
// Verifies that CheckpointManager.listEntries() returns one summary entry per
// stored checkpoint and leaves the heavier checkpoint fields out.
describe('CheckpointManager.listEntries', () => {
  it('projects stored checkpoints to CheckpointListEntry', async () => {
    const twoMessages = makeCheckpoint({
      id: 'cp_a' as CheckpointId,
      iteration: 1,
      createdAt: 1000,
      messages: [
        { role: 'user', content: 'hi' },
        { role: 'assistant', content: 'hello' },
      ],
    })
    const threeMessages = makeCheckpoint({
      id: 'cp_b' as CheckpointId,
      iteration: 2,
      createdAt: 2000,
      messages: [
        { role: 'user', content: 'hi' },
        { role: 'assistant', content: 'hello' },
        { role: 'user', content: 'more' },
      ],
    })

    const manager = new CheckpointManager(makeStoreStub([twoMessages, threeMessages]))
    const listed = await manager.listEntries()

    expect(listed).toHaveLength(2)
    // messageCount is expected to match the number of messages in each fixture.
    expect(listed[0]).toEqual({
      id: 'cp_a',
      runId: 'run_test',
      iteration: 1,
      createdAt: 1000,
      messageCount: 2,
    })
    expect(listed[1]).toEqual({
      id: 'cp_b',
      runId: 'run_test',
      iteration: 2,
      createdAt: 2000,
      messageCount: 3,
    })
  })

  it('returns empty array when no checkpoints exist', async () => {
    const manager = new CheckpointManager(makeStoreStub([]))
    const listed = await manager.listEntries()
    expect(listed).toEqual([])
  })

  it('does not include full checkpoint payload fields', async () => {
    const withOptionalFields = makeCheckpoint({
      toolResultHashes: { call_x: 'hash' },
      branchStack: [{ agentId: 'a', decision: 'd', confidence: 1, timestamp: 0 }],
    })
    const manager = new CheckpointManager(makeStoreStub([withOptionalFields]))
    const [entry] = await manager.listEntries()

    // None of these checkpoint fields may appear on a list entry.
    const omittedFields = [
      'tokenUsage',
      'costInfo',
      'toolResultHashes',
      'branchStack',
      'guardState',
      'messages',
    ]
    for (const field of omittedFields) {
      expect(entry).not.toHaveProperty(field)
    }
  })
})
106
+
107
/**
 * Build an `EmergencySaveData` fixture for the tests in this file.
 *
 * The defaults describe a dump saved at iteration 7 with two messages,
 * `startedAt` 1000, `savedAt` 2500 and a `SIGTERM` process signal.
 *
 * @param overrides - Fields that replace the corresponding defaults.
 * @returns The defaults shallow-merged with `overrides`.
 */
function makeEmergencyDump(overrides: Partial<EmergencySaveData> = {}): EmergencySaveData {
  const defaults: EmergencySaveData = {
    id: 'esave_dump_a' as EmergencySaveId,
    runId: 'run_victim' as RunId,
    messages: [
      { role: 'user', content: 'before the crash' },
      { role: 'assistant', content: 'working' },
    ],
    tokenUsage: {
      promptTokens: 10,
      completionTokens: 5,
      totalTokens: 15,
      cachedTokens: 0,
      cacheWriteTokens: 0,
    },
    currentIteration: 7,
    startedAt: 1_000,
    savedAt: 2_500,
    processSignal: 'SIGTERM',
  }

  // Overrides are spread last so any caller-supplied field wins.
  return { ...defaults, ...overrides }
}
129
+
130
// Verifies how projectEmergencyToCheckpoint() maps an emergency dump onto the
// IterationCheckpoint shape.
describe('projectEmergencyToCheckpoint', () => {
  it('produces an IterationCheckpoint with all required fields', () => {
    const source = makeEmergencyDump()
    const projected = projectEmergencyToCheckpoint(source)
    const zeroCost = {
      inputCostPer1M: 0,
      outputCostPer1M: 0,
      totalCost: 0,
      cacheDiscount: 0,
    }

    expect(projected.runId).toBe('run_victim')
    expect(projected.iteration).toBe(7)
    // toBe: messages and tokenUsage must be the same references as on the dump.
    expect(projected.messages).toBe(source.messages)
    expect(projected.tokenUsage).toBe(source.tokenUsage)
    expect(projected.createdAt).toBe(2_500)
    // 1_500 is savedAt (2_500) minus startedAt (1_000) from the fixture defaults.
    expect(projected.guardState).toEqual({ iterationCount: 7, elapsedMs: 1_500 })
    expect(projected.costInfo).toEqual(zeroCost)
  })

  it('derives a deterministic CheckpointId from the emergency save id', () => {
    const source = makeEmergencyDump({ id: 'esave_xyz123' as EmergencySaveId })
    const first = projectEmergencyToCheckpoint(source)
    const second = projectEmergencyToCheckpoint(source)

    expect(first.id).toBe('cp_emergency_xyz123')
    expect(first.id).toBe(second.id)
  })

  it('clamps guardState.elapsedMs to 0 when savedAt precedes startedAt', () => {
    const skewed = makeEmergencyDump({ startedAt: 2_000, savedAt: 1_000 })
    const { guardState } = projectEmergencyToCheckpoint(skewed)
    expect(guardState.elapsedMs).toBe(0)
  })

  it('leaves optional fields (toolResultHashes, branchStack, activeNode) unset', () => {
    const { toolResultHashes, branchStack, activeNode } = projectEmergencyToCheckpoint(
      makeEmergencyDump(),
    )
    expect(toolResultHashes).toBeUndefined()
    expect(branchStack).toBeUndefined()
    expect(activeNode).toBeUndefined()
  })
})
@@ -8,9 +8,52 @@ import type {
8
8
  IterationCheckpoint,
9
9
  } from '../../types/hitl/index.js'
10
10
  import type { AssistantMessage } from '../../types/message/index.js'
11
+ import type { EmergencySaveData } from '../../types/run/emergency.js'
12
+ import type { CheckpointListEntry } from '../../types/run/replay.js'
13
+ import { ZERO_COST } from '../../utils/cost.js'
11
14
  import { buildToolResultHashes } from '../../utils/hash.js'
12
15
  import { generateCheckpointId } from '../../utils/id.js'
13
16
 
17
/**
 * Reduce a full checkpoint to its listing projection: the identifying
 * fields plus the number of messages it holds (not the messages themselves).
 */
function toCheckpointListEntry(cp: IterationCheckpoint): CheckpointListEntry {
  const { id, runId, iteration, createdAt, messages } = cp
  return { id, runId, iteration, createdAt, messageCount: messages.length }
}
26
+
27
/**
 * Project an {@link EmergencySaveData} dump to an {@link IterationCheckpoint}
 * shape so `replay({ fromCheckpoint: 'emergency' })` can consume it through
 * the same restore path as any other checkpoint.
 *
 * What the projection fills in:
 * - `id` is `cp_emergency_<suffix>`, where `<suffix>` is the emergency save
 *   id with a leading `esave_` removed. The derivation is deterministic, so
 *   re-projecting the same dump yields the same {@link CheckpointId}.
 * - `runId`, `messages` and `tokenUsage` are carried over as-is (same
 *   references, no copy); `iteration` and `guardState.iterationCount` both
 *   come from `currentIteration`; `createdAt` is the dump's `savedAt`.
 * - `guardState.elapsedMs` is `savedAt - startedAt`, clamped to be
 *   non-negative.
 * - `costInfo` is a fresh copy of `ZERO_COST`.
 *
 * The projection is lossy: `toolResultHashes`, `branchStack`, and
 * `activeNode` are not set on the returned checkpoint.
 *
 * See ses_005-deterministic-replay design §2 + §5.2.
 *
 * @param dump - The emergency save to project.
 * @returns A synthetic checkpoint built from the dump.
 */
export function projectEmergencyToCheckpoint(dump: EmergencySaveData): IterationCheckpoint {
  const { id, runId, currentIteration, messages, tokenUsage, startedAt, savedAt } = dump
  const checkpointId = `cp_emergency_${id.replace(/^esave_/, '')}` as CheckpointId
  // Guard against clock skew / bad data producing a negative duration.
  const elapsedMs = Math.max(0, savedAt - startedAt)

  return {
    id: checkpointId,
    runId,
    iteration: currentIteration,
    messages,
    tokenUsage,
    costInfo: { ...ZERO_COST },
    guardState: { iterationCount: currentIteration, elapsedMs },
    createdAt: savedAt,
  }
}
56
+
14
57
  export class CheckpointManager {
15
58
  private store: RunDiskStore
16
59
 
@@ -60,6 +103,17 @@ export class CheckpointManager {
60
103
  return this.store.listCheckpoints()
61
104
  }
62
105
 
106
/**
 * Lightweight view of the stored checkpoints, used by the public
 * `listCheckpoints` API. Each stored checkpoint is mapped through
 * `toCheckpointListEntry`, so callers get only what is needed to pick a
 * fork point for {@link import('./replay/prepare.js').prepareReplayState},
 * never the full checkpoint payload. Order follows the underlying store.
 * See ses_005-deterministic-replay design §3.1.
 */
async listEntries(): Promise<CheckpointListEntry[]> {
  const entries: CheckpointListEntry[] = []
  for (const checkpoint of await this.store.listCheckpoints()) {
    entries.push(toCheckpointListEntry(checkpoint))
  }
  return entries
}
+
63
117
  async prune(keepLast: number): Promise<void> {
64
118
  const all = await this.list()
65
119
  if (all.length <= keepLast) return
@@ -99,11 +99,6 @@ export interface RunContext {
99
99
  */
100
100
  const migrationPromises = new Map<string, Promise<FilesystemMigrationResult>>()
101
101
 
102
- /** Testing hook — clears the first-call guard cache. */
103
- export function __resetMigrationGuardForTests(): void {
104
- migrationPromises.clear()
105
- }
106
-
107
102
  export class RunContextFactory {
108
103
  /**
109
104
  * Run the boot-time filesystem migration for `rootDir` at most once per
@@ -27,7 +27,7 @@ import { type Message, createSystemMessage } from '../../types/message/index.js'
27
27
  import type { AgentPersona } from '../../types/persona/index.js'
28
28
  import type { LLMProvider } from '../../types/provider/index.js'
29
29
  import type { TaskRouterConfig } from '../../types/router/index.js'
30
- import type { AgentRun, AgentRunConfig, RunEvent, RunEventListener } from '../../types/run/index.js'
30
+ import type { AgentRunConfig, Run, RunEvent, RunEventListener } from '../../types/run/index.js'
31
31
  import type { Sandbox, SandboxProvider } from '../../types/sandbox/index.js'
32
32
  import type { ProjectId, ThreadId } from '../../types/session/ids.js'
33
33
  import type { Skill } from '../../types/skills/index.js'
@@ -136,7 +136,7 @@ export interface QueryParams {
136
136
  invocationState?: InvocationState
137
137
  }
138
138
 
139
- export async function* query(params: QueryParams): AsyncGenerator<RunEvent, AgentRun> {
139
+ export async function* query(params: QueryParams): AsyncGenerator<RunEvent, Run> {
140
140
  // Boot-time filesystem migration (session-hierarchy.md §13.4.1). First
141
141
  // call per process per root actually runs; subsequent calls short-circuit
142
142
  // via the in-memory guard in `context.ts`. Kept here rather than inside
@@ -335,7 +335,7 @@ export async function* query(params: QueryParams): AsyncGenerator<RunEvent, Agen
335
335
 
336
336
  const tracer = getTracer()
337
337
 
338
- return yield* (async function* (): AsyncGenerator<RunEvent, AgentRun> {
338
+ return yield* (async function* (): AsyncGenerator<RunEvent, Run> {
339
339
  const rootSpan = tracer.startSpan(agentRunSpanName(params.agentName))
340
340
  rootSpan.setAttributes({
341
341
  [NAMZU.RUN_ID]: ctx.runMgr.id,
@@ -515,7 +515,7 @@ export async function* query(params: QueryParams): AsyncGenerator<RunEvent, Agen
515
515
  export async function drainQuery(
516
516
  params: Omit<QueryParams, 'resumeHandler'> & { resumeHandler?: ResumeHandler },
517
517
  listener?: RunEventListener,
518
- ): Promise<AgentRun> {
518
+ ): Promise<Run> {
519
519
  const fullParams: QueryParams = {
520
520
  ...params,
521
521
  resumeHandler: params.resumeHandler ?? autoApproveHandler,
@@ -0,0 +1,134 @@
1
+ import { describe, expect, it } from 'vitest'
2
+ import type { ToolCallId } from '../../../../types/ids/index.js'
3
+ import type { AssistantMessage, Message, ToolMessage } from '../../../../types/message/index.js'
4
+ import { type Mutation, MutationNotApplicableError } from '../../../../types/run/replay.js'
5
+ import { applyMutations } from '../mutate.js'
6
+
7
/**
 * Build an assistant message with no text content that requests one `noop`
 * function call (empty JSON arguments) per supplied tool call id.
 */
function assistantWithCalls(toolCallIds: string[]): AssistantMessage {
  const toolCalls = toolCallIds.map((id) => ({
    id,
    type: 'function' as const,
    function: { name: 'noop', arguments: '{}' },
  }))
  return { role: 'assistant', content: null, toolCalls }
}
18
+
19
/**
 * Run `action`, which is expected to throw, and return what it threw as a
 * {@link MutationNotApplicableError}.
 *
 * The type assertion happens outside the `try`, so a missing throw (or a
 * throw of the wrong type) fails with a direct "expected instance of"
 * message instead of being swallowed by a surrounding `catch`.
 */
function captureMutationError(action: () => unknown): MutationNotApplicableError {
  let thrown: unknown
  try {
    action()
  } catch (err) {
    thrown = err
  }
  expect(thrown).toBeInstanceOf(MutationNotApplicableError)
  return thrown as MutationNotApplicableError
}

// Behaviour of the `injectToolResponse` mutation as applied by `applyMutations`.
describe('applyMutations / injectToolResponse', () => {
  it('appends a ToolMessage when the toolCallId is pending', () => {
    const messages: Message[] = [
      { role: 'user', content: 'do stuff' },
      assistantWithCalls(['call_a', 'call_b']),
      { role: 'tool', content: 'a done', toolCallId: 'call_a' },
    ]
    const mutations: Mutation[] = [
      {
        type: 'injectToolResponse',
        toolCallId: 'call_b' as ToolCallId,
        response: { success: true, output: 'mocked-b', data: { x: 1 } },
      },
    ]

    const result = applyMutations(messages, mutations)

    expect(result).toHaveLength(4)
    const last = result[3] as ToolMessage
    expect(last.role).toBe('tool')
    expect(last.toolCallId).toBe('call_b')
    expect(last.content).toBe('mocked-b')
  })

  it('throws MutationNotApplicableError when no pending tool calls exist', () => {
    const messages: Message[] = [
      { role: 'user', content: 'hi' },
      { role: 'assistant', content: 'hello' },
    ]
    expect(() =>
      applyMutations(messages, [
        {
          type: 'injectToolResponse',
          toolCallId: 'call_missing' as ToolCallId,
          response: { success: true, output: 'x' },
        },
      ]),
    ).toThrow(MutationNotApplicableError)
  })

  it('throws with availableToolCallIds populated when toolCallId is not pending', () => {
    const messages: Message[] = [
      { role: 'user', content: 'do stuff' },
      assistantWithCalls(['call_a', 'call_b']),
    ]

    const error = captureMutationError(() =>
      applyMutations(messages, [
        {
          type: 'injectToolResponse',
          toolCallId: 'call_z' as ToolCallId,
          response: { success: true, output: 'x' },
        },
      ]),
    )

    expect(error.availableToolCallIds).toEqual(['call_a', 'call_b'])
  })

  it('considers a tool call satisfied only when a subsequent ToolMessage responds to it', () => {
    const messages: Message[] = [
      { role: 'user', content: 'do stuff' },
      assistantWithCalls(['call_a', 'call_b', 'call_c']),
      { role: 'tool', content: 'a done', toolCallId: 'call_a' },
      { role: 'tool', content: 'c done', toolCallId: 'call_c' },
    ]

    // call_a already has a response, so re-answering it must be rejected and
    // only call_b should be reported as still pending.
    const error = captureMutationError(() =>
      applyMutations(messages, [
        {
          type: 'injectToolResponse',
          toolCallId: 'call_a' as ToolCallId,
          response: { success: true, output: 're-answered' },
        },
      ]),
    )

    expect(error.availableToolCallIds).toEqual(['call_b'])
  })

  it('applies mutations in order so a later mutation sees earlier ones', () => {
    const messages: Message[] = [
      { role: 'user', content: 'two calls pending' },
      assistantWithCalls(['call_x', 'call_y']),
    ]
    const result = applyMutations(messages, [
      {
        type: 'injectToolResponse',
        toolCallId: 'call_x' as ToolCallId,
        response: { success: true, output: 'x-result' },
      },
      {
        type: 'injectToolResponse',
        toolCallId: 'call_y' as ToolCallId,
        response: { success: true, output: 'y-result' },
      },
    ])

    expect(result).toHaveLength(4)
    expect((result[2] as ToolMessage).toolCallId).toBe('call_x')
    expect((result[3] as ToolMessage).toolCallId).toBe('call_y')
  })

  it('returns the original messages unchanged when the mutation list is empty', () => {
    const messages: Message[] = [
      { role: 'user', content: 'no-op' },
      { role: 'assistant', content: 'ok' },
    ]
    const result = applyMutations(messages, [])
    // Same content, but a different array instance.
    expect(result).toEqual(messages)
    expect(result).not.toBe(messages)
  })
})
@@ -0,0 +1,207 @@
1
import { mkdir, mkdtemp, rm, writeFile } from 'node:fs/promises'
import { tmpdir } from 'node:os'
import { join } from 'node:path'
import { afterEach, beforeEach, describe, expect, it } from 'vitest'
import type { CheckpointId, IterationCheckpoint } from '../../../../types/hitl/index.js'
import type { EmergencySaveId, RunId, ToolCallId } from '../../../../types/ids/index.js'
import type { AssistantMessage, ToolMessage } from '../../../../types/message/index.js'
import type { EmergencySaveData } from '../../../../types/run/emergency.js'
import type { Mutation } from '../../../../types/run/replay.js'
import { prepareReplayState } from '../prepare.js'
11
+
12
+ const RUN_ID = 'run_source' as RunId
13
+
14
/**
 * Test fixture: a minimal checkpoint for `RUN_ID` (iteration 1, one user
 * message, zeroed token/cost counters, `createdAt` = now) with any supplied
 * `overrides` taking precedence over the defaults.
 */
function makeCheckpoint(overrides: Partial<IterationCheckpoint>): IterationCheckpoint {
  const defaults: IterationCheckpoint = {
    id: 'cp_default' as CheckpointId,
    runId: RUN_ID,
    iteration: 1,
    messages: [{ role: 'user', content: 'hi' }],
    tokenUsage: {
      promptTokens: 0,
      completionTokens: 0,
      totalTokens: 0,
      cachedTokens: 0,
      cacheWriteTokens: 0,
    },
    costInfo: { inputCostPer1M: 0, outputCostPer1M: 0, totalCost: 0, cacheDiscount: 0 },
    guardState: { iterationCount: 1, elapsedMs: 0 },
    createdAt: Date.now(),
  }
  return { ...defaults, ...overrides }
}
33
+
34
/**
 * Test fixture: write `cp` as JSON to
 * `<baseDir>/<runId>/checkpoints/<checkpointId>.json`, creating the
 * directory tree first if needed.
 */
async function seedCheckpoint(baseDir: string, cp: IterationCheckpoint): Promise<void> {
  const checkpointsDir = join(baseDir, cp.runId, 'checkpoints')
  const targetFile = join(checkpointsDir, `${cp.id}.json`)
  await mkdir(checkpointsDir, { recursive: true })
  await writeFile(targetFile, JSON.stringify(cp), 'utf-8')
}
39
+
40
/**
 * Test fixture: write `dump` as JSON to `<emergencyDir>/<runId>.json`,
 * creating `emergencyDir` first if needed.
 */
async function seedEmergency(emergencyDir: string, dump: EmergencySaveData): Promise<void> {
  const targetFile = join(emergencyDir, `${dump.runId}.json`)
  await mkdir(emergencyDir, { recursive: true })
  await writeFile(targetFile, JSON.stringify(dump), 'utf-8')
}
44
+
45
// Exercises prepareReplayState against real files in a per-test scratch directory.
describe('prepareReplayState', () => {
  // Root of the per-test scratch tree. Directories made with `mkdtemp` are
  // not cleaned up automatically, so `afterEach` removes it explicitly.
  let scratchRoot: string | undefined
  let baseDir: string
  let emergencyDir: string

  beforeEach(async () => {
    const root = await mkdtemp(join(tmpdir(), 'namzu-prepare-replay-'))
    scratchRoot = root
    baseDir = join(root, 'runs')
    // Deliberately not created here: some tests need the emergency dir absent.
    emergencyDir = join(root, 'emergency')
    await mkdir(baseDir, { recursive: true })
  })

  afterEach(async () => {
    // `beforeEach` may have failed before a scratch root was created.
    if (scratchRoot === undefined) return
    await rm(scratchRoot, { recursive: true, force: true })
    scratchRoot = undefined
  })

  it('resolves a specific CheckpointId and returns the checkpoint messages', async () => {
    const cp = makeCheckpoint({
      id: 'cp_one' as CheckpointId,
      iteration: 3,
      messages: [
        { role: 'user', content: 'start' },
        { role: 'assistant', content: 'ok' },
      ],
    })
    await seedCheckpoint(baseDir, cp)

    const prepared = await prepareReplayState({
      baseDir,
      runId: RUN_ID,
      fromCheckpoint: 'cp_one' as CheckpointId,
    })

    expect(prepared.sourceCheckpoint.id).toBe('cp_one')
    expect(prepared.messages).toEqual(cp.messages)
    expect(prepared.attribution.sourceRunId).toBe(RUN_ID)
    expect(prepared.attribution.fromCheckpointId).toBe('cp_one')
    expect(prepared.attribution.mutations).toEqual([])
    expect(prepared.attribution.replayedAt).toBeGreaterThan(0)
  })

  it("resolves 'latest' to the checkpoint with the highest iteration", async () => {
    await seedCheckpoint(baseDir, makeCheckpoint({ id: 'cp_a' as CheckpointId, iteration: 1 }))
    await seedCheckpoint(baseDir, makeCheckpoint({ id: 'cp_b' as CheckpointId, iteration: 5 }))
    await seedCheckpoint(baseDir, makeCheckpoint({ id: 'cp_c' as CheckpointId, iteration: 3 }))

    const prepared = await prepareReplayState({
      baseDir,
      runId: RUN_ID,
      fromCheckpoint: 'latest',
    })

    expect(prepared.sourceCheckpoint.id).toBe('cp_b')
    expect(prepared.sourceCheckpoint.iteration).toBe(5)
  })

  it("throws when 'latest' is requested but no checkpoints exist", async () => {
    await expect(
      prepareReplayState({
        baseDir,
        runId: RUN_ID,
        fromCheckpoint: 'latest',
      }),
    ).rejects.toThrow(/No checkpoints found/)
  })

  it('throws when a specific CheckpointId does not resolve', async () => {
    await expect(
      prepareReplayState({
        baseDir,
        runId: RUN_ID,
        fromCheckpoint: 'cp_missing' as CheckpointId,
      }),
    ).rejects.toThrow(/not found/)
  })

  it('applies injectToolResponse mutations at the fork point', async () => {
    const assistantMsg: AssistantMessage = {
      role: 'assistant',
      content: null,
      toolCalls: [{ id: 'call_a', type: 'function', function: { name: 'noop', arguments: '{}' } }],
    }
    const cp = makeCheckpoint({
      id: 'cp_with_tool' as CheckpointId,
      messages: [{ role: 'user', content: 'run tool' }, assistantMsg],
    })
    await seedCheckpoint(baseDir, cp)

    const mutations: Mutation[] = [
      {
        type: 'injectToolResponse',
        toolCallId: 'call_a' as ToolCallId,
        response: { success: true, output: 'mocked-a' },
      },
    ]

    const prepared = await prepareReplayState({
      baseDir,
      runId: RUN_ID,
      fromCheckpoint: 'cp_with_tool' as CheckpointId,
      mutate: mutations,
    })

    expect(prepared.messages).toHaveLength(3)
    const appended = prepared.messages[2] as ToolMessage
    expect(appended.role).toBe('tool')
    expect(appended.toolCallId).toBe('call_a')
    expect(appended.content).toBe('mocked-a')
    expect(prepared.attribution.mutations).toEqual(mutations)
  })

  it("resolves 'emergency' via the emergency dump and projects it to a checkpoint", async () => {
    const dump: EmergencySaveData = {
      id: 'esave_xyz' as EmergencySaveId,
      runId: RUN_ID,
      messages: [{ role: 'user', content: 'before crash' }],
      tokenUsage: {
        promptTokens: 4,
        completionTokens: 2,
        totalTokens: 6,
        cachedTokens: 0,
        cacheWriteTokens: 0,
      },
      currentIteration: 9,
      startedAt: 1_000,
      savedAt: 2_000,
      processSignal: 'SIGTERM',
    }
    await seedEmergency(emergencyDir, dump)

    const prepared = await prepareReplayState({
      baseDir,
      runId: RUN_ID,
      fromCheckpoint: 'emergency',
      emergencyDir,
    })

    expect(prepared.sourceCheckpoint.id).toBe('cp_emergency_xyz')
    expect(prepared.sourceCheckpoint.iteration).toBe(9)
    expect(prepared.messages).toEqual(dump.messages)
    expect(prepared.attribution.fromCheckpointId).toBe('cp_emergency_xyz')
  })

  it("throws when 'emergency' is requested without emergencyDir", async () => {
    await expect(
      prepareReplayState({
        baseDir,
        runId: RUN_ID,
        fromCheckpoint: 'emergency',
      }),
    ).rejects.toThrow(/emergencyDir/)
  })

  it("throws when 'emergency' dump file is missing", async () => {
    await expect(
      prepareReplayState({
        baseDir,
        runId: RUN_ID,
        fromCheckpoint: 'emergency',
        emergencyDir,
      }),
    ).rejects.toThrow(/No emergency dump/)
  })
})
@@ -0,0 +1,32 @@
1
+ import { RunDiskStore } from '../../../store/run/disk.js'
2
+ import type { RunId } from '../../../types/ids/index.js'
3
+ import type { CheckpointListEntry } from '../../../types/run/replay.js'
4
+ import type { Logger } from '../../../utils/logger.js'
5
+ import { CheckpointManager } from '../checkpoint.js'
6
+
7
/** Arguments accepted by {@link listCheckpoints}. */
export interface ListCheckpointsInput {
  /** Directory that contains `<runId>/` for the target run. */
  baseDir: string
  /** Run whose checkpoints should be listed. */
  runId: RunId
  /** Optional logger; passed through to the disk store when provided. */
  logger?: Logger
}
14
+
15
/**
 * List a run's checkpoints for use with {@link
 * import('./prepare.js').prepareReplayState}. Resolves to the public
 * {@link CheckpointListEntry} projection — just enough for a caller to
 * pick a fork point — rather than full `IterationCheckpoint` payloads.
 *
 * Entries come back in whatever order the underlying store yields them
 * (reportedly `createdAt` ascending for the disk store — verify against
 * `RunDiskStore`). Callers that need a specific order should sort
 * client-side.
 *
 * NOTE(review): this is intended as a read-only API, yet it calls
 * `store.initRun(runId)` before listing — confirm that call has no
 * unwanted side effects (e.g. creating directories for unknown run ids).
 *
 * See ses_005-deterministic-replay/design.md §3.1.
 *
 * @param input - Location of the run on disk plus an optional logger.
 * @returns One listing entry per stored checkpoint of the run.
 */
export async function listCheckpoints(input: ListCheckpointsInput): Promise<CheckpointListEntry[]> {
  const { baseDir, runId, logger } = input
  const store = new RunDiskStore({ baseDir, logger })
  await store.initRun(runId)
  return new CheckpointManager(store).listEntries()
}