saeeol 1.2.9 → 1.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (539) hide show
  1. package/.turbo/turbo-typecheck.log +1 -0
  2. package/AGENTS.md +72 -0
  3. package/BUN_SHELL_MIGRATION_PLAN.md +136 -0
  4. package/Dockerfile +18 -0
  5. package/assets/saeeol.ico +0 -0
  6. package/bin/saeeol.cjs +0 -0
  7. package/database.db +0 -0
  8. package/drizzle.config.ts +10 -0
  9. package/git +0 -0
  10. package/migration/20260127222353_familiar_lady_ursula/migration.sql +90 -0
  11. package/migration/20260127222353_familiar_lady_ursula/snapshot.json +796 -0
  12. package/migration/20260211171708_add_project_commands/migration.sql +1 -0
  13. package/migration/20260211171708_add_project_commands/snapshot.json +806 -0
  14. package/migration/20260213144116_wakeful_the_professor/migration.sql +11 -0
  15. package/migration/20260213144116_wakeful_the_professor/snapshot.json +897 -0
  16. package/migration/20260225215848_workspace/migration.sql +7 -0
  17. package/migration/20260225215848_workspace/snapshot.json +959 -0
  18. package/migration/20260227213759_add_session_workspace_id/migration.sql +2 -0
  19. package/migration/20260227213759_add_session_workspace_id/snapshot.json +983 -0
  20. package/migration/20260228203230_blue_harpoon/migration.sql +17 -0
  21. package/migration/20260228203230_blue_harpoon/snapshot.json +1102 -0
  22. package/migration/20260303231226_add_workspace_fields/migration.sql +5 -0
  23. package/migration/20260303231226_add_workspace_fields/snapshot.json +1013 -0
  24. package/migration/20260309230000_move_org_to_state/migration.sql +3 -0
  25. package/migration/20260309230000_move_org_to_state/snapshot.json +1156 -0
  26. package/migration/20260312043431_session_message_cursor/migration.sql +4 -0
  27. package/migration/20260312043431_session_message_cursor/snapshot.json +1168 -0
  28. package/migration/20260323234822_events/migration.sql +13 -0
  29. package/migration/20260323234822_events/snapshot.json +1271 -0
  30. package/migration/20260410174513_workspace-name/migration.sql +16 -0
  31. package/migration/20260410174513_workspace-name/snapshot.json +1271 -0
  32. package/migration/20260413175956_chief_energizer/migration.sql +13 -0
  33. package/migration/20260413175956_chief_energizer/snapshot.json +1399 -0
  34. package/migration/20260423070820_add_icon_url_override/migration.sql +2 -0
  35. package/migration/20260423070820_add_icon_url_override/snapshot.json +1409 -0
  36. package/migration/20260428004200_add_session_path/migration.sql +1 -0
  37. package/migration/20260428004200_add_session_path/snapshot.json +1419 -0
  38. package/npm/bin/saeeol +42 -0
  39. package/npm/package.json +39 -0
  40. package/npm/postinstall.js +162 -0
  41. package/package.json +201 -207
  42. package/parsers-config.ts +289 -0
  43. package/script/build.ts +393 -0
  44. package/script/check-migrations.ts +16 -0
  45. package/script/fix-node-pty.ts +34 -0
  46. package/script/generate.ts +23 -0
  47. package/script/postinstall.mjs +189 -0
  48. package/script/publish.ts +200 -0
  49. package/script/run-workspace-server +106 -0
  50. package/script/schema.ts +63 -0
  51. package/script/test-runner.ts +420 -0
  52. package/script/time.ts +6 -0
  53. package/script/trace-imports.ts +153 -0
  54. package/script/upgrade-opentui.ts +64 -0
  55. package/scripts/diff-sdk-types.sh +52 -0
  56. package/specs/effect/facades.md +221 -0
  57. package/specs/effect/http-api.md +401 -0
  58. package/specs/effect/instance-context.md +309 -0
  59. package/specs/effect/loose-ends.md +34 -0
  60. package/specs/effect/migration.md +299 -0
  61. package/specs/effect/routes.md +64 -0
  62. package/specs/effect/schema.md +399 -0
  63. package/specs/effect/server-package.md +668 -0
  64. package/specs/effect/tools.md +90 -0
  65. package/specs/tui-plugins.md +433 -0
  66. package/specs/v2/api.ts +67 -0
  67. package/specs/v2/keymappings.md +10 -0
  68. package/specs/v2/message-shape.md +136 -0
  69. package/src/acp/agent-message.ts +1 -1
  70. package/src/acp/agent-utils.ts +1 -1
  71. package/src/boxes/ansi.ts +17 -0
  72. package/src/boxes/atomic-write.ts +35 -0
  73. package/src/boxes/b64.ts +58 -0
  74. package/src/boxes/bash-security.ts +129 -0
  75. package/src/boxes/bom.ts +18 -0
  76. package/src/boxes/cancel.ts +16 -0
  77. package/src/boxes/chop.ts +12 -0
  78. package/src/boxes/clamp.ts +3 -0
  79. package/src/boxes/compact.ts +9 -0
  80. package/src/boxes/cost-tracker.ts +116 -0
  81. package/src/boxes/dataurl.ts +29 -0
  82. package/src/boxes/delay.ts +27 -0
  83. package/src/boxes/diff-apply.ts +53 -0
  84. package/src/boxes/disposable.ts +13 -0
  85. package/src/boxes/err.ts +34 -0
  86. package/src/boxes/human.ts +47 -0
  87. package/src/boxes/iife.ts +9 -0
  88. package/src/boxes/latch.ts +8 -0
  89. package/src/boxes/memory.ts +198 -0
  90. package/src/boxes/net.ts +16 -0
  91. package/src/boxes/plural.ts +4 -0
  92. package/src/boxes/puny.ts +21 -0
  93. package/src/boxes/retry.ts +49 -0
  94. package/src/boxes/rwlock.ts +41 -0
  95. package/src/boxes/schedule.ts +71 -0
  96. package/src/boxes/scope.ts +21 -0
  97. package/src/boxes/tokens.ts +9 -0
  98. package/src/boxes/ttl-cache.ts +63 -0
  99. package/src/boxes/typed-event.ts +51 -0
  100. package/src/boxes/uid.ts +50 -0
  101. package/src/boxes/wave6.test.ts +296 -0
  102. package/src/boxes/wildcard.ts +58 -0
  103. package/src/bus/global.ts +1 -1
  104. package/src/cli/cmd/github-run-api.ts +2 -2
  105. package/src/cli/cmd/run-events.ts +2 -2
  106. package/src/cli/cmd/tui/component/logo.tsx +1 -1
  107. package/src/cli/cmd/tui/component/prompt/use-prompt-memos.ts +2 -2
  108. package/src/cli/cmd/tui/context/app/editor-zed.ts +1 -1
  109. package/src/cli/cmd/tui/context/app/editor.ts +1 -1
  110. package/src/cli/cmd/tui/context/app/helper.tsx +1 -0
  111. package/src/cli/cmd/tui/context/app/theme.tsx +1 -0
  112. package/src/cli/cmd/tui/util/revert-diff.ts +1 -1
  113. package/src/overlay/cli/cmd/roll-call-call.ts +1 -1
  114. package/src/overlay/cost-tracker/format.ts +1 -1
  115. package/src/overlay/cost-tracker/index.ts +4 -4
  116. package/src/overlay/cost-tracker/state.ts +2 -2
  117. package/src/overlay/cost-tracker/types.ts +2 -2
  118. package/src/overlay/memory/age.ts +1 -1
  119. package/src/overlay/memory/index.ts +4 -4
  120. package/src/overlay/memory/paths.ts +2 -2
  121. package/src/overlay/memory/scan.ts +1 -1
  122. package/src/overlay/memory/types.ts +2 -2
  123. package/src/overlay/tool/bash-security.ts +3 -3
  124. package/src/overlay/util/url.ts +1 -1
  125. package/src/plugin/codex-auth.ts +1 -1
  126. package/src/provider/model-cache.ts +2 -2
  127. package/src/provider/provider-resolve.ts +3 -3
  128. package/src/provider/transform-message.ts +1 -1
  129. package/src/server/routes/game.ts +284 -0
  130. package/src/server/server.ts +2 -0
  131. package/src/session/core/compaction/compaction-helpers.ts +1 -1
  132. package/src/session/core/compaction/compaction.ts +1 -1
  133. package/src/session/core/session-events.ts +50 -8
  134. package/src/session/core/session.ts +2 -0
  135. package/src/sessions/ingest-queue.ts +2 -2
  136. package/src/sessions/remote-ws.ts +1 -1
  137. package/src/tool/workflow/question.ts +1 -1
  138. package/src/util/abort.ts +1 -1
  139. package/src/util/bom.ts +2 -2
  140. package/src/util/color.ts +1 -1
  141. package/src/util/data-url.ts +1 -1
  142. package/src/util/defer.ts +1 -1
  143. package/src/util/error.ts +2 -2
  144. package/src/util/filesystem.ts +2 -2
  145. package/src/util/format.ts +1 -1
  146. package/src/util/iife.ts +1 -1
  147. package/src/util/local-context.ts +1 -1
  148. package/src/util/locale.ts +2 -2
  149. package/src/util/lock.ts +1 -1
  150. package/src/util/network.ts +1 -1
  151. package/src/util/signal.ts +1 -1
  152. package/src/util/token.ts +1 -1
  153. package/src/util/wildcard.ts +1 -1
  154. package/sst-env.d.ts +10 -0
  155. package/test/AGENTS.md +133 -0
  156. package/test/account/repo.test.ts +352 -0
  157. package/test/account/service.test.ts +456 -0
  158. package/test/acp/agent-interface.test.ts +51 -0
  159. package/test/acp/event-subscription.test.ts +725 -0
  160. package/test/agent/agent.test.ts +890 -0
  161. package/test/auth/auth.test.ts +86 -0
  162. package/test/bun/registry.test.ts +75 -0
  163. package/test/bus/bus-effect.test.ts +161 -0
  164. package/test/bus/bus-integration.test.ts +87 -0
  165. package/test/bus/bus.test.ts +219 -0
  166. package/test/cli/account.test.ts +26 -0
  167. package/test/cli/auto-mode.test.ts +75 -0
  168. package/test/cli/bin-saeeol.test.ts +8 -0
  169. package/test/cli/cmd/tui/prompt-part.test.ts +47 -0
  170. package/test/cli/cmd/tui/prompt-traits.test.ts +38 -0
  171. package/test/cli/cmd/tui/sync.test.tsx +159 -0
  172. package/test/cli/error.test.ts +18 -0
  173. package/test/cli/github-action.test.ts +198 -0
  174. package/test/cli/github-remote.test.ts +85 -0
  175. package/test/cli/import.test.ts +97 -0
  176. package/test/cli/install-artifact.test.ts +72 -0
  177. package/test/cli/plugin-auth-picker.test.ts +120 -0
  178. package/test/cli/pr.test.ts +59 -0
  179. package/test/cli/tui/editor-context-zed.test.ts +356 -0
  180. package/test/cli/tui/editor-context.test.tsx +228 -0
  181. package/test/cli/tui/keybind-plugin.test.ts +90 -0
  182. package/test/cli/tui/markdown.test.ts +161 -0
  183. package/test/cli/tui/plugin-add.test.ts +111 -0
  184. package/test/cli/tui/plugin-install.test.ts +87 -0
  185. package/test/cli/tui/plugin-lifecycle.test.ts +224 -0
  186. package/test/cli/tui/plugin-loader-entrypoint.test.ts +484 -0
  187. package/test/cli/tui/plugin-loader-pure.test.ts +71 -0
  188. package/test/cli/tui/plugin-loader.test.ts +816 -0
  189. package/test/cli/tui/plugin-toggle.test.ts +157 -0
  190. package/test/cli/tui/revert-diff.test.ts +35 -0
  191. package/test/cli/tui/slot-replace.test.tsx +47 -0
  192. package/test/cli/tui/theme-store.test.ts +54 -0
  193. package/test/cli/tui/thread.test.ts +28 -0
  194. package/test/cli/tui/transcript.test.ts +426 -0
  195. package/test/cli/tui/usage.test.ts +60 -0
  196. package/test/cli/tui/use-event.test.tsx +175 -0
  197. package/test/config/agent-color.test.ts +67 -0
  198. package/test/config/config.test.ts +2544 -0
  199. package/test/config/fixtures/empty-frontmatter.md +4 -0
  200. package/test/config/fixtures/frontmatter.md +28 -0
  201. package/test/config/fixtures/markdown-header.md +11 -0
  202. package/test/config/fixtures/no-frontmatter.md +1 -0
  203. package/test/config/fixtures/weird-model-id.md +13 -0
  204. package/test/config/lsp.test.ts +87 -0
  205. package/test/config/markdown.test.ts +228 -0
  206. package/test/config/plugin.test.ts +0 -0
  207. package/test/config/tui.test.ts +624 -0
  208. package/test/control-plane/adapters.test.ts +71 -0
  209. package/test/control-plane/workspace.test.ts +1526 -0
  210. package/test/effect/app-runtime-logger.test.ts +98 -0
  211. package/test/effect/config-service.test.ts +65 -0
  212. package/test/effect/instance-state.test.ts +394 -0
  213. package/test/effect/run-service.test.ts +89 -0
  214. package/test/effect/runner.test.ts +523 -0
  215. package/test/fake/provider.ts +82 -0
  216. package/test/file/fsmonitor.test.ts +68 -0
  217. package/test/file/ignore.test.ts +10 -0
  218. package/test/file/index.test.ts +954 -0
  219. package/test/file/path-traversal.test.ts +205 -0
  220. package/test/file/ripgrep.test.ts +226 -0
  221. package/test/file/watcher.test.ts +249 -0
  222. package/test/filesystem/filesystem.test.ts +319 -0
  223. package/test/fixture/db.ts +11 -0
  224. package/test/fixture/fixture.test.ts +26 -0
  225. package/test/fixture/fixture.ts +175 -0
  226. package/test/fixture/flock-worker.ts +72 -0
  227. package/test/fixture/log-init-worker.ts +62 -0
  228. package/test/fixture/lsp/fake-lsp-server.js +249 -0
  229. package/test/fixture/plug-worker.ts +93 -0
  230. package/test/fixture/plugin-meta-worker.ts +19 -0
  231. package/test/fixture/skills/agents-sdk/SKILL.md +152 -0
  232. package/test/fixture/skills/cloudflare/SKILL.md +211 -0
  233. package/test/fixture/skills/index.json +6 -0
  234. package/test/fixture/tui-plugin.ts +323 -0
  235. package/test/fixture/tui-runtime.ts +31 -0
  236. package/test/format/format.test.ts +272 -0
  237. package/test/git/git.test.ts +128 -0
  238. package/test/ide/ide.test.ts +82 -0
  239. package/test/installation/installation.test.ts +168 -0
  240. package/test/keybind.test.ts +421 -0
  241. package/test/lib/effect.ts +53 -0
  242. package/test/lib/filesystem.ts +10 -0
  243. package/test/lib/llm-server.ts +778 -0
  244. package/test/lib/websocket.ts +46 -0
  245. package/test/lsp/client.test.ts +482 -0
  246. package/test/lsp/index.test.ts +160 -0
  247. package/test/lsp/launch.test.ts +22 -0
  248. package/test/lsp/lifecycle.test.ts +184 -0
  249. package/test/ltm/ltm.test.ts +230 -0
  250. package/test/mcp/headers.test.ts +178 -0
  251. package/test/mcp/lifecycle.test.ts +787 -0
  252. package/test/mcp/oauth-auto-connect.test.ts +311 -0
  253. package/test/mcp/oauth-browser.test.ts +276 -0
  254. package/test/mcp/oauth-callback.test.ts +34 -0
  255. package/test/memory/abort-leak-webfetch.ts +49 -0
  256. package/test/memory/abort-leak.test.ts +128 -0
  257. package/test/patch/patch.test.ts +348 -0
  258. package/test/permission/arity.test.ts +33 -0
  259. package/test/permission/next.test.ts +1227 -0
  260. package/test/permission/next.toConfig.test.ts +110 -0
  261. package/test/permission-task.test.ts +326 -0
  262. package/test/plugin/auth-override.test.ts +79 -0
  263. package/test/plugin/cloudflare.test.ts +68 -0
  264. package/test/plugin/codex.test.ts +123 -0
  265. package/test/plugin/github-copilot-models.test.ts +261 -0
  266. package/test/plugin/install-concurrency.test.ts +140 -0
  267. package/test/plugin/install.test.ts +570 -0
  268. package/test/plugin/loader-shared.test.ts +1169 -0
  269. package/test/plugin/meta.test.ts +137 -0
  270. package/test/plugin/plugin-contract.test.ts +291 -0
  271. package/test/plugin/shared.test.ts +88 -0
  272. package/test/plugin/trigger.test.ts +102 -0
  273. package/test/plugin/workspace-adapter.test.ts +109 -0
  274. package/test/preload.ts +77 -0
  275. package/test/project/instance.test.ts +276 -0
  276. package/test/project/migrate-global.test.ts +152 -0
  277. package/test/project/project.test.ts +600 -0
  278. package/test/project/vcs.test.ts +286 -0
  279. package/test/project/worktree-remove.test.ts +126 -0
  280. package/test/project/worktree.test.ts +223 -0
  281. package/test/provider/amazon-bedrock.test.ts +462 -0
  282. package/test/provider/copilot/convert-to-copilot-messages.test.ts +523 -0
  283. package/test/provider/copilot/copilot-chat-model.test.ts +592 -0
  284. package/test/provider/gitlab-duo.test.ts +413 -0
  285. package/test/provider/local.test.ts +208 -0
  286. package/test/provider/models.test.ts +261 -0
  287. package/test/provider/provider-category.test.ts +190 -0
  288. package/test/provider/provider.test.ts +2758 -0
  289. package/test/provider/transform.test.ts +3681 -0
  290. package/test/pty/pty-output-isolation.test.ts +147 -0
  291. package/test/pty/pty-session.test.ts +102 -0
  292. package/test/pty/pty-shell.test.ts +104 -0
  293. package/test/question/question.test.ts +490 -0
  294. package/test/saeeol/agent-global-config-dirs.test.ts +24 -0
  295. package/test/saeeol/agent-manager-tool.test.ts +71 -0
  296. package/test/saeeol/agent-permission-overrides.test.ts +75 -0
  297. package/test/saeeol/agent-skill-permissions.test.ts +37 -0
  298. package/test/saeeol/ask-agent-permissions.test.ts +303 -0
  299. package/test/saeeol/bash-hierarchy.test.ts +64 -0
  300. package/test/saeeol/bash-permission-metadata.test.ts +66 -0
  301. package/test/saeeol/bash-security-extended.test.ts +243 -0
  302. package/test/saeeol/bedrock-claude-empty-content.test.ts +138 -0
  303. package/test/saeeol/boxes-integration.test.ts +415 -0
  304. package/test/saeeol/builtin-skills.test.ts +75 -0
  305. package/test/saeeol/cleanup.ts +28 -0
  306. package/test/saeeol/cli/dev-setup.test.ts +74 -0
  307. package/test/saeeol/cli/roll-call.test.ts +161 -0
  308. package/test/saeeol/cli-run-auto-helper.test.ts +58 -0
  309. package/test/saeeol/codex-auth-refresh.test.ts +124 -0
  310. package/test/saeeol/commit-message/generate.test.ts +188 -0
  311. package/test/saeeol/commit-message/git-context.test.ts +303 -0
  312. package/test/saeeol/commit-message-windows.test.ts +38 -0
  313. package/test/saeeol/compaction-payload-recovery.test.ts +406 -0
  314. package/test/saeeol/compaction-preservation-audit.test.ts +122 -0
  315. package/test/saeeol/compaction-skip-guard.test.ts +224 -0
  316. package/test/saeeol/compaction-smart-select.test.ts +100 -0
  317. package/test/saeeol/config/config.test.ts +166 -0
  318. package/test/saeeol/config/indexing-default-plugin.test.ts +82 -0
  319. package/test/saeeol/config/opentelemetry-default.test.ts +29 -0
  320. package/test/saeeol/config-gitignore.test.ts +70 -0
  321. package/test/saeeol/config-injector.test.ts +305 -0
  322. package/test/saeeol/config-resilience.test.ts +234 -0
  323. package/test/saeeol/config-validation.test.ts +183 -0
  324. package/test/saeeol/cost-propagation.test.ts +94 -0
  325. package/test/saeeol/cost-tracker-extended.test.ts +141 -0
  326. package/test/saeeol/cost-tracker.test.ts +64 -0
  327. package/test/saeeol/custom-provider-delete.test.ts +149 -0
  328. package/test/saeeol/diff-full.test.ts +226 -0
  329. package/test/saeeol/edit-permission-filediff.test.ts +223 -0
  330. package/test/saeeol/encoding.test.ts +364 -0
  331. package/test/saeeol/enhance-prompt.test.ts +61 -0
  332. package/test/saeeol/ensure-plan-dir.test.ts +32 -0
  333. package/test/saeeol/errors.test.ts +144 -0
  334. package/test/saeeol/external-directory-boundary.test.ts +96 -0
  335. package/test/saeeol/gateway-headers.test.ts +88 -0
  336. package/test/saeeol/help.test.ts +191 -0
  337. package/test/saeeol/ignore-migrator.test.ts +308 -0
  338. package/test/saeeol/indexing-auth.test.ts +45 -0
  339. package/test/saeeol/indexing-feature.test.ts +44 -0
  340. package/test/saeeol/indexing-label.test.ts +70 -0
  341. package/test/saeeol/indexing-startup.test.ts +381 -0
  342. package/test/saeeol/indexing-worktree.test.ts +73 -0
  343. package/test/saeeol/instruction.test.ts +136 -0
  344. package/test/saeeol/lancedb-runtime.test.ts +116 -0
  345. package/test/saeeol/loader-auth.test.ts +168 -0
  346. package/test/saeeol/local-model.test.ts +621 -0
  347. package/test/saeeol/logo.test.ts +31 -0
  348. package/test/saeeol/lsp-typescript-lightweight.test.ts +89 -0
  349. package/test/saeeol/mcp-branding.test.ts +33 -0
  350. package/test/saeeol/mcp-docker-rm.test.ts +32 -0
  351. package/test/saeeol/mcp-migrator.test.ts +736 -0
  352. package/test/saeeol/mcp-oauth-callback.test.ts +33 -0
  353. package/test/saeeol/memory-io.test.ts +198 -0
  354. package/test/saeeol/memory-paths.test.ts +87 -0
  355. package/test/saeeol/memory-security.test.ts +166 -0
  356. package/test/saeeol/model-cache-org.test.ts +164 -0
  357. package/test/saeeol/model-info-panel-utils.test.ts +52 -0
  358. package/test/saeeol/model-info-panel.types.test.ts +7 -0
  359. package/test/saeeol/models-401-fallback.test.ts +52 -0
  360. package/test/saeeol/modes-migrator.test.ts +320 -0
  361. package/test/saeeol/nvidia-headers.test.ts +74 -0
  362. package/test/saeeol/patch-jsonc.test.ts +73 -0
  363. package/test/saeeol/patch.test.ts +172 -0
  364. package/test/saeeol/paths.test.ts +265 -0
  365. package/test/saeeol/permission/config-paths.test.ts +174 -0
  366. package/test/saeeol/permission/env-read.test.ts +149 -0
  367. package/test/saeeol/permission/external-directory-allow.test.ts +327 -0
  368. package/test/saeeol/permission/next.always-rules.test.ts +882 -0
  369. package/test/saeeol/permission/next.reply-http.test.ts +205 -0
  370. package/test/saeeol/permission/next.reply-routing.test.ts +184 -0
  371. package/test/saeeol/plan-exit-detection.test.ts +494 -0
  372. package/test/saeeol/plan-followup.test.ts +1376 -0
  373. package/test/saeeol/project-config-update.test.ts +120 -0
  374. package/test/saeeol/project-id.test.ts +455 -0
  375. package/test/saeeol/provider-cost.test.ts +171 -0
  376. package/test/saeeol/provider-list-failed-state.test.ts +100 -0
  377. package/test/saeeol/question-dismiss-all.test.ts +174 -0
  378. package/test/saeeol/read-directory.test.ts +116 -0
  379. package/test/saeeol/rules-migrator.test.ts +257 -0
  380. package/test/saeeol/run-auto.test.ts +176 -0
  381. package/test/saeeol/run-network.test.ts +224 -0
  382. package/test/saeeol/semantic-search.test.ts +186 -0
  383. package/test/saeeol/server/permission-allow-everything.test.ts +125 -0
  384. package/test/saeeol/session/instruction-substitution.test.ts +72 -0
  385. package/test/saeeol/session/platform-attribution.test.ts +118 -0
  386. package/test/saeeol/session/session.test.ts +105 -0
  387. package/test/saeeol/session-compaction-cap.test.ts +399 -0
  388. package/test/saeeol/session-compaction-chunks.test.ts +501 -0
  389. package/test/saeeol/session-compaction-safety.test.ts +481 -0
  390. package/test/saeeol/session-fork-remap.test.ts +251 -0
  391. package/test/saeeol/session-import-service.test.ts +114 -0
  392. package/test/saeeol/session-list.test.ts +47 -0
  393. package/test/saeeol/session-message-metadata.test.ts +128 -0
  394. package/test/saeeol/session-overflow.test.ts +78 -0
  395. package/test/saeeol/session-processor-empty-tool-calls.test.ts +571 -0
  396. package/test/saeeol/session-processor-network-offline.test.ts +204 -0
  397. package/test/saeeol/session-processor-retry-limit.test.ts +238 -0
  398. package/test/saeeol/session-processor-review-telemetry.test.ts +82 -0
  399. package/test/saeeol/session-prompt-compaction-safety.test.ts +517 -0
  400. package/test/saeeol/session-prompt-queue.test.ts +815 -0
  401. package/test/saeeol/sessions/inflight-cache.test.ts +157 -0
  402. package/test/saeeol/sessions/ingest-queue.test.ts +402 -0
  403. package/test/saeeol/sessions/remote-protocol.test.ts +258 -0
  404. package/test/saeeol/sessions/remote-sender.test.ts +1036 -0
  405. package/test/saeeol/sessions/remote-ws.test.ts +367 -0
  406. package/test/saeeol/sessions/sessions-enable-remote.test.disable +181 -0
  407. package/test/saeeol/slot-prop-reactivity.test.ts +142 -0
  408. package/test/saeeol/snapshot-cache.test.ts +84 -0
  409. package/test/saeeol/snapshot-freeze-repro.test.ts +100 -0
  410. package/test/saeeol/snapshot-track-timeout.test.ts +519 -0
  411. package/test/saeeol/stats-subagent-cost.test.ts +123 -0
  412. package/test/saeeol/suggestion/auto-dismiss.test.ts +65 -0
  413. package/test/saeeol/suggestion/suggestion.test.ts +145 -0
  414. package/test/saeeol/suggestion/tool.test.ts +298 -0
  415. package/test/saeeol/summary-file-diff.test.ts +28 -0
  416. package/test/saeeol/system-prompt.test.ts +142 -0
  417. package/test/saeeol/task-nesting.test.ts +193 -0
  418. package/test/saeeol/telemetry/feedback.test.ts +8 -0
  419. package/test/saeeol/todo-view.test.ts +57 -0
  420. package/test/saeeol/tool-encoding.test.ts +455 -0
  421. package/test/saeeol/tool-registry-indexing-import-failure.test.ts +49 -0
  422. package/test/saeeol/tool-registry-indexing.test.ts +236 -0
  423. package/test/saeeol/tool-registry-semantic-import-failure.test.ts +55 -0
  424. package/test/saeeol/tool-task-model.test.ts +352 -0
  425. package/test/saeeol/transform-opus-4.7.test.ts +89 -0
  426. package/test/saeeol/tui-diff.test.ts +91 -0
  427. package/test/saeeol/tui-sync.test.ts +80 -0
  428. package/test/saeeol/util/url.test.ts +141 -0
  429. package/test/saeeol/workflows-migrator.test.ts +261 -0
  430. package/test/saeeol/worktree-diff-summary.test.ts +64 -0
  431. package/test/saeeol/worktree-diff.test.ts +223 -0
  432. package/test/saeeol/worktree-remove-lock.test.ts +82 -0
  433. package/test/server/AGENTS.md +15 -0
  434. package/test/server/contract.test.ts +357 -0
  435. package/test/server/experimental-session-list.test.ts +157 -0
  436. package/test/server/global-session-list.test.ts +155 -0
  437. package/test/server/httpapi-authorization.test.ts +103 -0
  438. package/test/server/httpapi-bridge.test.ts +440 -0
  439. package/test/server/httpapi-config.test.ts +67 -0
  440. package/test/server/httpapi-cors.test.ts +89 -0
  441. package/test/server/httpapi-event.test.ts +57 -0
  442. package/test/server/httpapi-experimental.test.ts +219 -0
  443. package/test/server/httpapi-file.test.ts +79 -0
  444. package/test/server/httpapi-instance-context.test.ts +237 -0
  445. package/test/server/httpapi-instance.legacy.test.ts +140 -0
  446. package/test/server/httpapi-instance.test.ts +83 -0
  447. package/test/server/httpapi-json-parity.test.ts +263 -0
  448. package/test/server/httpapi-mcp-oauth.test.ts +76 -0
  449. package/test/server/httpapi-mcp.test.ts +189 -0
  450. package/test/server/httpapi-provider.test.ts +153 -0
  451. package/test/server/httpapi-pty-websocket.test.ts +16 -0
  452. package/test/server/httpapi-pty.test.ts +175 -0
  453. package/test/server/httpapi-raw-route-auth.test.ts +89 -0
  454. package/test/server/httpapi-sdk.test.ts +681 -0
  455. package/test/server/httpapi-session.test.ts +464 -0
  456. package/test/server/httpapi-sync.test.ts +130 -0
  457. package/test/server/httpapi-tui.test.ts +121 -0
  458. package/test/server/httpapi-workspace-routing.test.ts +471 -0
  459. package/test/server/httpapi-workspace.test.ts +427 -0
  460. package/test/server/lib/conformance.ts +88 -0
  461. package/test/server/lib/stateful.ts +112 -0
  462. package/test/server/project-init-git.test.ts +113 -0
  463. package/test/server/proxy-util.test.ts +113 -0
  464. package/test/server/session-actions.test.ts +49 -0
  465. package/test/server/session-list.test.ts +238 -0
  466. package/test/server/session-messages.test.ts +167 -0
  467. package/test/server/session-select.test.ts +100 -0
  468. package/test/server/trace-attributes.test.ts +76 -0
  469. package/test/server/workspace-proxy.test.ts +165 -0
  470. package/test/server/workspace-routing.test.ts +85 -0
  471. package/test/session/compaction.test.ts +2420 -0
  472. package/test/session/instruction.test.ts +247 -0
  473. package/test/session/llm.test.ts +1273 -0
  474. package/test/session/message-v2.test.ts +1291 -0
  475. package/test/session/messages-pagination.test.ts +1173 -0
  476. package/test/session/network.test.ts +249 -0
  477. package/test/session/processor-effect.test.ts +847 -0
  478. package/test/session/prompt.test.ts +2131 -0
  479. package/test/session/retry.test.ts +340 -0
  480. package/test/session/revert-compact.test.ts +639 -0
  481. package/test/session/schema-decoding.test.ts +311 -0
  482. package/test/session/session-entry-stepper.test.ts +917 -0
  483. package/test/session/session-schema.test.ts +76 -0
  484. package/test/session/snapshot-tool-race.test.ts +257 -0
  485. package/test/session/structured-output-integration.test.ts +265 -0
  486. package/test/session/structured-output.test.ts +381 -0
  487. package/test/session/system.test.ts +73 -0
  488. package/test/share/share-next.test.ts +333 -0
  489. package/test/shell/shell.test.ts +99 -0
  490. package/test/skill/discovery.test.ts +116 -0
  491. package/test/skill/skill.test.ts +393 -0
  492. package/test/snapshot/snapshot.test.ts +1531 -0
  493. package/test/storage/db.test.ts +23 -0
  494. package/test/storage/json-migration.test.ts +832 -0
  495. package/test/storage/storage.test.ts +293 -0
  496. package/test/suggestion/suggestion.test.ts +1 -0
  497. package/test/sync/index.test.ts +256 -0
  498. package/test/tool/__snapshots__/parameters.test.ts.snap +500 -0
  499. package/test/tool/__snapshots__/tool.test.ts.snap +9 -0
  500. package/test/tool/apply_patch.test.ts +614 -0
  501. package/test/tool/bash.test.ts +1225 -0
  502. package/test/tool/diagnostics-filter.test.ts +55 -0
  503. package/test/tool/edit.test.ts +754 -0
  504. package/test/tool/external-directory.test.ts +169 -0
  505. package/test/tool/fixtures/large-image.png +0 -0
  506. package/test/tool/fixtures/models-api.json +65179 -0
  507. package/test/tool/glob.test.ts +107 -0
  508. package/test/tool/grep.test.ts +114 -0
  509. package/test/tool/lsp.test.ts +187 -0
  510. package/test/tool/parameters.test.ts +243 -0
  511. package/test/tool/question.test.ts +129 -0
  512. package/test/tool/read.test.ts +500 -0
  513. package/test/tool/recall.test.ts +151 -0
  514. package/test/tool/registry.test.ts +203 -0
  515. package/test/tool/skill.test.ts +135 -0
  516. package/test/tool/suggest.test.ts +1 -0
  517. package/test/tool/task.test.ts +612 -0
  518. package/test/tool/tool-define.test.ts +99 -0
  519. package/test/tool/truncation.test.ts +260 -0
  520. package/test/tool/webfetch.test.ts +103 -0
  521. package/test/tool/write.test.ts +291 -0
  522. package/test/util/data-url.test.ts +14 -0
  523. package/test/util/effect-zod.test.ts +754 -0
  524. package/test/util/error.test.ts +38 -0
  525. package/test/util/filesystem.test.ts +656 -0
  526. package/test/util/format.test.ts +59 -0
  527. package/test/util/glob.test.ts +164 -0
  528. package/test/util/iife.test.ts +36 -0
  529. package/test/util/lazy.test.ts +50 -0
  530. package/test/util/lock.test.ts +72 -0
  531. package/test/util/log.test.ts +86 -0
  532. package/test/util/module.test.ts +59 -0
  533. package/test/util/process.test.ts +128 -0
  534. package/test/util/timeout.test.ts +21 -0
  535. package/test/util/which.test.ts +100 -0
  536. package/test/util/wildcard.test.ts +90 -0
  537. package/test/workspace/workspace-restore.test.ts +296 -0
  538. package/src/provider/models-snapshot.d.ts +0 -2
  539. package/src/provider/models-snapshot.js +0 -3
@@ -0,0 +1,2420 @@
1
+ import { afterEach, describe, expect, mock, test } from "bun:test"
2
+ import { APICallError } from "ai"
3
+ import { Cause, Effect, Exit, Layer, ManagedRuntime } from "effect"
4
+ import * as Stream from "effect/Stream"
5
+ import z from "zod"
6
+ import { Bus } from "../../src/bus"
7
+ import { Config } from "@/config/config"
8
+ import { Agent } from "../../src/agent/agent"
9
+ import { LLM } from "../../src/session/llm"
10
+ import { SessionCompaction } from "../../src/session/compaction"
11
+ import { Token } from "@/util/token"
12
+ import { Instance } from "../../src/project/instance"
13
+ import * as Log from "@saeeol/core/util/log"
14
+ import { Permission } from "../../src/permission"
15
+ import { Plugin } from "../../src/plugin"
16
+ import { provideTmpdirInstance, tmpdir } from "../fixture/fixture"
17
+ import { Session as SessionNs } from "@/session/session"
18
+ import { MessageV2 } from "../../src/session/message-v2"
19
+ import { MessageID, PartID, SessionID } from "../../src/session/schema"
20
+ import { SessionStatus } from "../../src/session/status"
21
+ import { SessionSummary } from "../../src/session/summary"
22
+ import { ModelID, ProviderID } from "../../src/provider/schema"
23
+ import type { Provider } from "@/provider/provider"
24
+ import * as SessionProcessorModule from "../../src/session/processor"
25
+ import { Snapshot } from "../../src/snapshot"
26
+ import { ProviderTest } from "../fake/provider"
27
+ import { testEffect } from "../lib/effect"
28
+ import { CrossSpawnSpawner } from "@saeeol/core/cross-spawn-spawner"
29
+
30
+ void Log.init({ print: false })
31
+
32
+ function run<A, E>(fx: Effect.Effect<A, E, SessionNs.Service>) {
33
+ return Effect.runPromise(fx.pipe(Effect.provide(SessionNs.defaultLayer)))
34
+ }
35
+
36
+ const svc = {
37
+ ...SessionNs,
38
+ create(input?: SessionNs.CreateInput) {
39
+ return run(SessionNs.Service.use((svc) => svc.create(input)))
40
+ },
41
+ messages(input: z.output<typeof SessionNs.MessagesInput.zod>) {
42
+ return run(SessionNs.Service.use((svc) => svc.messages(input)))
43
+ },
44
+ updateMessage<T extends MessageV2.Info>(msg: T) {
45
+ return run(SessionNs.Service.use((svc) => svc.updateMessage(msg)))
46
+ },
47
+ updatePart<T extends MessageV2.Part>(part: T) {
48
+ return run(SessionNs.Service.use((svc) => svc.updatePart(part)))
49
+ },
50
+ }
51
+
52
+ const summary = Layer.succeed(
53
+ SessionSummary.Service,
54
+ SessionSummary.Service.of({
55
+ summarize: () => Effect.void,
56
+ diff: () => Effect.succeed([]),
57
+ computeDiff: () => Effect.succeed([]),
58
+ }),
59
+ )
60
+
61
+ const ref = {
62
+ providerID: ProviderID.make("test"),
63
+ modelID: ModelID.make("test-model"),
64
+ }
65
+
66
+ afterEach(() => {
67
+ mock.restore()
68
+ })
69
+
70
+ function createModel(opts: {
71
+ context: number
72
+ output: number
73
+ input?: number
74
+ cost?: Provider.Model["cost"]
75
+ npm?: string
76
+ }): Provider.Model {
77
+ return {
78
+ id: "test-model",
79
+ providerID: "test",
80
+ name: "Test",
81
+ limit: {
82
+ context: opts.context,
83
+ input: opts.input,
84
+ output: opts.output,
85
+ },
86
+ cost: opts.cost ?? { input: 0, output: 0, cache: { read: 0, write: 0 } },
87
+ capabilities: {
88
+ toolcall: true,
89
+ attachment: false,
90
+ reasoning: false,
91
+ temperature: true,
92
+ input: { text: true, image: false, audio: false, video: false },
93
+ output: { text: true, image: false, audio: false, video: false },
94
+ },
95
+ api: { npm: opts.npm ?? "@ai-sdk/anthropic" },
96
+ options: {},
97
+ } as Provider.Model
98
+ }
99
+
100
+ const wide = () => ProviderTest.fake({ model: createModel({ context: 100_000, output: 32_000 }) })
101
+
102
+ async function user(sessionID: SessionID, text: string) {
103
+ const msg = await svc.updateMessage({
104
+ id: MessageID.ascending(),
105
+ role: "user",
106
+ sessionID,
107
+ agent: "build",
108
+ model: ref,
109
+ time: { created: Date.now() },
110
+ })
111
+ await svc.updatePart({
112
+ id: PartID.ascending(),
113
+ messageID: msg.id,
114
+ sessionID,
115
+ type: "text",
116
+ text,
117
+ })
118
+ return msg
119
+ }
120
+
121
+ async function assistant(sessionID: SessionID, parentID: MessageID, root: string) {
122
+ const msg: MessageV2.Assistant = {
123
+ id: MessageID.ascending(),
124
+ role: "assistant",
125
+ sessionID,
126
+ mode: "build",
127
+ agent: "build",
128
+ path: { cwd: root, root },
129
+ cost: 0,
130
+ tokens: {
131
+ output: 0,
132
+ input: 0,
133
+ reasoning: 0,
134
+ cache: { read: 0, write: 0 },
135
+ },
136
+ modelID: ref.modelID,
137
+ providerID: ref.providerID,
138
+ parentID,
139
+ time: { created: Date.now() },
140
+ finish: "end_turn",
141
+ }
142
+ await svc.updateMessage(msg)
143
+ return msg
144
+ }
145
+
146
+ async function summaryAssistant(sessionID: SessionID, parentID: MessageID, root: string, text: string) {
147
+ const msg: MessageV2.Assistant = {
148
+ id: MessageID.ascending(),
149
+ role: "assistant",
150
+ sessionID,
151
+ mode: "compaction",
152
+ agent: "compaction",
153
+ path: { cwd: root, root },
154
+ cost: 0,
155
+ tokens: {
156
+ output: 0,
157
+ input: 0,
158
+ reasoning: 0,
159
+ cache: { read: 0, write: 0 },
160
+ },
161
+ modelID: ref.modelID,
162
+ providerID: ref.providerID,
163
+ parentID,
164
+ summary: true,
165
+ time: { created: Date.now() },
166
+ finish: "end_turn",
167
+ }
168
+ await svc.updateMessage(msg)
169
+ await svc.updatePart({
170
+ id: PartID.ascending(),
171
+ messageID: msg.id,
172
+ sessionID,
173
+ type: "text",
174
+ text,
175
+ })
176
+ return msg
177
+ }
178
+
179
+ async function lastCompactionPart(sessionID: SessionID) {
180
+ return (await svc.messages({ sessionID }))
181
+ .at(-2)
182
+ ?.parts.find((item): item is MessageV2.CompactionPart => item.type === "compaction")
183
+ }
184
+
185
+ function fake(
186
+ input: Parameters<SessionProcessorModule.SessionProcessor.Interface["create"]>[0],
187
+ result: "continue" | "compact",
188
+ ) {
189
+ const msg = input.assistantMessage
190
+ return {
191
+ get message() {
192
+ return msg
193
+ },
194
+ updateToolCall: Effect.fn("TestSessionProcessor.updateToolCall")(() => Effect.succeed(undefined)),
195
+ completeToolCall: Effect.fn("TestSessionProcessor.completeToolCall")(() => Effect.void),
196
+ process: Effect.fn("TestSessionProcessor.process")(() => Effect.succeed(result)),
197
+ } satisfies SessionProcessorModule.SessionProcessor.Handle
198
+ }
199
+
200
+ function layer(result: "continue" | "compact") {
201
+ return Layer.succeed(
202
+ SessionProcessorModule.SessionProcessor.Service,
203
+ SessionProcessorModule.SessionProcessor.Service.of({
204
+ create: Effect.fn("TestSessionProcessor.create")((input) => Effect.succeed(fake(input, result))),
205
+ }),
206
+ )
207
+ }
208
+
209
+ function cfg(compaction?: Config.Info["compaction"]) {
210
+ const base = Config.Info.zod.parse({})
211
+ return Layer.mock(Config.Service)({
212
+ get: () => Effect.succeed({ ...base, compaction }),
213
+ })
214
+ }
215
+
216
+ function runtime(
217
+ result: "continue" | "compact",
218
+ plugin = Plugin.defaultLayer,
219
+ provider = ProviderTest.fake(),
220
+ config = Config.defaultLayer,
221
+ ) {
222
+ const bus = Bus.layer
223
+ return ManagedRuntime.make(
224
+ Layer.mergeAll(SessionCompaction.layer, bus).pipe(
225
+ Layer.provide(provider.layer),
226
+ Layer.provide(SessionNs.defaultLayer),
227
+ Layer.provide(layer(result)),
228
+ Layer.provide(Agent.defaultLayer),
229
+ Layer.provide(plugin),
230
+ Layer.provide(bus),
231
+ Layer.provide(config),
232
+ ),
233
+ )
234
+ }
235
+
236
+ const deps = Layer.mergeAll(
237
+ ProviderTest.fake().layer,
238
+ layer("continue"),
239
+ Agent.defaultLayer,
240
+ Plugin.defaultLayer,
241
+ Bus.layer,
242
+ Config.defaultLayer,
243
+ )
244
+
245
+ const env = Layer.mergeAll(
246
+ SessionNs.defaultLayer,
247
+ CrossSpawnSpawner.defaultLayer,
248
+ SessionCompaction.layer.pipe(Layer.provide(SessionNs.defaultLayer), Layer.provideMerge(deps)),
249
+ )
250
+
251
+ const it = testEffect(env)
252
+
253
+ function llm() {
254
+ const queue: Array<
255
+ Stream.Stream<LLM.Event, unknown> | ((input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown>)
256
+ > = []
257
+
258
+ return {
259
+ push(stream: Stream.Stream<LLM.Event, unknown> | ((input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown>)) {
260
+ queue.push(stream)
261
+ },
262
+ layer: Layer.succeed(
263
+ LLM.Service,
264
+ LLM.Service.of({
265
+ stream: (input) => {
266
+ const item = queue.shift() ?? Stream.empty
267
+ const stream = typeof item === "function" ? item(input) : item
268
+ return stream.pipe(Stream.mapEffect((event) => Effect.succeed(event)))
269
+ },
270
+ raw: () => Effect.die("raw not implemented in test LLM"),
271
+ }),
272
+ ),
273
+ }
274
+ }
275
+
276
+ function liveRuntime(layer: Layer.Layer<LLM.Service>, provider = ProviderTest.fake(), config = Config.defaultLayer) {
277
+ const bus = Bus.layer
278
+ const status = SessionStatus.layer.pipe(Layer.provide(bus))
279
+ const processor = SessionProcessorModule.SessionProcessor.layer.pipe(Layer.provide(summary))
280
+ return ManagedRuntime.make(
281
+ Layer.mergeAll(SessionCompaction.layer.pipe(Layer.provide(processor)), processor, bus, status).pipe(
282
+ Layer.provide(provider.layer),
283
+ Layer.provide(SessionNs.defaultLayer),
284
+ Layer.provide(Snapshot.defaultLayer),
285
+ Layer.provide(layer),
286
+ Layer.provide(Permission.defaultLayer),
287
+ Layer.provide(Agent.defaultLayer),
288
+ Layer.provide(Plugin.defaultLayer),
289
+ Layer.provide(status),
290
+ Layer.provide(bus),
291
+ Layer.provide(config),
292
+ ),
293
+ )
294
+ }
295
+
296
+ function reply(
297
+ text: string,
298
+ capture?: (input: LLM.StreamInput) => void,
299
+ ): (input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown> {
300
+ return (input) => {
301
+ capture?.(input)
302
+ return Stream.make(
303
+ { type: "start" } satisfies LLM.Event,
304
+ { type: "text-start", id: "txt-0" } satisfies LLM.Event,
305
+ { type: "text-delta", id: "txt-0", delta: text, text } as LLM.Event,
306
+ { type: "text-end", id: "txt-0" } satisfies LLM.Event,
307
+ {
308
+ type: "finish-step",
309
+ finishReason: "stop",
310
+ rawFinishReason: "stop",
311
+ response: { id: "res", modelId: "test-model", timestamp: new Date() },
312
+ providerMetadata: undefined,
313
+ usage: {
314
+ inputTokens: 1,
315
+ outputTokens: 1,
316
+ totalTokens: 2,
317
+ inputTokenDetails: {
318
+ noCacheTokens: undefined,
319
+ cacheReadTokens: undefined,
320
+ cacheWriteTokens: undefined,
321
+ },
322
+ outputTokenDetails: {
323
+ textTokens: undefined,
324
+ reasoningTokens: undefined,
325
+ },
326
+ },
327
+ } satisfies LLM.Event,
328
+ {
329
+ type: "finish",
330
+ finishReason: "stop",
331
+ rawFinishReason: "stop",
332
+ totalUsage: {
333
+ inputTokens: 1,
334
+ outputTokens: 1,
335
+ totalTokens: 2,
336
+ inputTokenDetails: {
337
+ noCacheTokens: undefined,
338
+ cacheReadTokens: undefined,
339
+ cacheWriteTokens: undefined,
340
+ },
341
+ outputTokenDetails: {
342
+ textTokens: undefined,
343
+ reasoningTokens: undefined,
344
+ },
345
+ },
346
+ } satisfies LLM.Event,
347
+ )
348
+ }
349
+ }
350
+
351
+ function wait(ms = 50) {
352
+ return new Promise((resolve) => setTimeout(resolve, ms))
353
+ }
354
+
355
+ function defer() {
356
+ let resolve!: () => void
357
+ const promise = new Promise<void>((done) => {
358
+ resolve = done
359
+ })
360
+ return { promise, resolve }
361
+ }
362
+
363
+ function plugin(ready: ReturnType<typeof defer>) {
364
+ return Layer.mock(Plugin.Service)({
365
+ trigger: <Name extends string, Input, Output>(name: Name, _input: Input, output: Output) => {
366
+ if (name !== "experimental.session.compacting") return Effect.succeed(output)
367
+ return Effect.sync(() => ready.resolve()).pipe(Effect.andThen(Effect.never), Effect.as(output))
368
+ },
369
+ list: () => Effect.succeed([]),
370
+ init: () => Effect.void,
371
+ })
372
+ }
373
+
374
+ function autocontinue(enabled: boolean) {
375
+ return Layer.mock(Plugin.Service)({
376
+ trigger: <Name extends string, Input, Output>(name: Name, _input: Input, output: Output) => {
377
+ if (name !== "experimental.compaction.autocontinue") return Effect.succeed(output)
378
+ return Effect.sync(() => {
379
+ ;(output as { enabled: boolean }).enabled = enabled
380
+ return output
381
+ })
382
+ },
383
+ list: () => Effect.succeed([]),
384
+ init: () => Effect.void,
385
+ })
386
+ }
387
+
388
+ describe("session.compaction.isOverflow", () => {
389
+ it.live(
390
+ "returns true when token count exceeds usable context",
391
+ provideTmpdirInstance(() =>
392
+ Effect.gen(function* () {
393
+ const compact = yield* SessionCompaction.Service
394
+ const model = createModel({ context: 100_000, output: 32_000 })
395
+ const tokens = { input: 75_000, output: 5_000, reasoning: 0, cache: { read: 0, write: 0 } }
396
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
397
+ }),
398
+ ),
399
+ )
400
+
401
+ it.live(
402
+ "returns false when token count within usable context",
403
+ provideTmpdirInstance(() =>
404
+ Effect.gen(function* () {
405
+ const compact = yield* SessionCompaction.Service
406
+ const model = createModel({ context: 200_000, output: 32_000 })
407
+ const tokens = { input: 100_000, output: 10_000, reasoning: 0, cache: { read: 0, write: 0 } }
408
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
409
+ }),
410
+ ),
411
+ )
412
+
413
+ it.live(
414
+ "includes cache.read in token count",
415
+ provideTmpdirInstance(() =>
416
+ Effect.gen(function* () {
417
+ const compact = yield* SessionCompaction.Service
418
+ const model = createModel({ context: 100_000, output: 32_000 })
419
+ const tokens = { input: 60_000, output: 10_000, reasoning: 0, cache: { read: 10_000, write: 0 } }
420
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
421
+ }),
422
+ ),
423
+ )
424
+
425
+ it.live(
426
+ "respects input limit for input caps",
427
+ provideTmpdirInstance(() =>
428
+ Effect.gen(function* () {
429
+ const compact = yield* SessionCompaction.Service
430
+ const model = createModel({ context: 400_000, input: 272_000, output: 128_000 })
431
+ const tokens = { input: 271_000, output: 1_000, reasoning: 0, cache: { read: 2_000, write: 0 } }
432
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
433
+ }),
434
+ ),
435
+ )
436
+
437
+ it.live(
438
+ "returns false when input/output are within input caps",
439
+ provideTmpdirInstance(() =>
440
+ Effect.gen(function* () {
441
+ const compact = yield* SessionCompaction.Service
442
+ const model = createModel({ context: 400_000, input: 272_000, output: 128_000 })
443
+ const tokens = { input: 200_000, output: 20_000, reasoning: 0, cache: { read: 10_000, write: 0 } }
444
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
445
+ }),
446
+ ),
447
+ )
448
+
449
+ it.live(
450
+ "returns false when output within limit with input caps",
451
+ provideTmpdirInstance(() =>
452
+ Effect.gen(function* () {
453
+ const compact = yield* SessionCompaction.Service
454
+ const model = createModel({ context: 200_000, input: 120_000, output: 10_000 })
455
+ const tokens = { input: 50_000, output: 9_999, reasoning: 0, cache: { read: 0, write: 0 } }
456
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
457
+ }),
458
+ ),
459
+ )
460
+
461
+ // ─── Bug reproduction tests ───────────────────────────────────────────
462
+ // These tests demonstrate that when limit.input is set, isOverflow()
463
+ // does not subtract any headroom for the next model response. This means
464
+ // compaction only triggers AFTER we've already consumed the full input
465
+ // budget, leaving zero room for the next API call's output tokens.
466
+ //
467
+ // Compare: without limit.input, usable = context - output (reserves space).
468
+ // With limit.input, usable = limit.input (reserves nothing).
469
+ //
470
+ // Related issues: #10634, #8089, #11086, #12621
471
+ // Open PRs: #6875, #12924
472
+
473
+ it.live(
474
+ "BUG: no headroom when limit.input is set — compaction should trigger near boundary but does not",
475
+ provideTmpdirInstance(() =>
476
+ Effect.gen(function* () {
477
+ const compact = yield* SessionCompaction.Service
478
+ // Simulate Claude with prompt caching: input limit = 200K, output limit = 32K
479
+ const model = createModel({ context: 200_000, input: 200_000, output: 32_000 })
480
+
481
+ // We've used 198K tokens total. Only 2K under the input limit.
482
+ // On the next turn, the full conversation (198K) becomes input,
483
+ // plus the model needs room to generate output — this WILL overflow.
484
+ const tokens = { input: 180_000, output: 15_000, reasoning: 0, cache: { read: 3_000, write: 0 } }
485
+ // count = 180K + 3K + 15K = 198K
486
+ // usable = limit.input = 200K (no output subtracted!)
487
+ // 198K > 200K = false → no compaction triggered
488
+
489
+ // WITHOUT limit.input: usable = 200K - 32K = 168K, and 198K > 168K = true ✓
490
+ // WITH limit.input: usable = 200K, and 198K > 200K = false ✗
491
+
492
+ // With 198K used and only 2K headroom, the next turn will overflow.
493
+ // Compaction MUST trigger here.
494
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
495
+ }),
496
+ ),
497
+ )
498
+
499
+ it.live(
500
+ "BUG: without limit.input, same token count correctly triggers compaction",
501
+ provideTmpdirInstance(() =>
502
+ Effect.gen(function* () {
503
+ const compact = yield* SessionCompaction.Service
504
+ // Same model but without limit.input — uses context - output instead
505
+ const model = createModel({ context: 200_000, output: 32_000 })
506
+
507
+ // Same token usage as above
508
+ const tokens = { input: 180_000, output: 15_000, reasoning: 0, cache: { read: 3_000, write: 0 } }
509
+ // count = 198K
510
+ // usable = context - output = 200K - 32K = 168K
511
+ // 198K > 168K = true → compaction correctly triggered
512
+
513
+ const result = yield* compact.isOverflow({ tokens, model })
514
+ expect(result).toBe(true) // ← Correct: headroom is reserved
515
+ }),
516
+ ),
517
+ )
518
+
519
+ it.live(
520
+ "BUG: asymmetry — limit.input model allows 30K more usage before compaction than equivalent model without it",
521
+ provideTmpdirInstance(() =>
522
+ Effect.gen(function* () {
523
+ const compact = yield* SessionCompaction.Service
524
+ // Two models with identical context/output limits, differing only in limit.input
525
+ const withInputLimit = createModel({ context: 200_000, input: 200_000, output: 32_000 })
526
+ const withoutInputLimit = createModel({ context: 200_000, output: 32_000 })
527
+
528
+ // 181K total tokens (166K input + 5K cache read + 10K output) — above context-output (168K) but below input limit (200K)
529
+ const tokens = { input: 166_000, output: 10_000, reasoning: 0, cache: { read: 5_000, write: 0 } }
530
+
531
+ const withLimit = yield* compact.isOverflow({ tokens, model: withInputLimit })
532
+ const withoutLimit = yield* compact.isOverflow({ tokens, model: withoutInputLimit })
533
+
534
+ // Both models have identical real capacity — they should agree:
535
+ expect(withLimit).toBe(true) // should compact (181K leaves no room for 32K output)
536
+ expect(withoutLimit).toBe(true) // correctly compacts (181K > 168K)
537
+ }),
538
+ ),
539
+ )
540
+
541
+ it.live(
542
+ "returns false when model context limit is 0",
543
+ provideTmpdirInstance(() =>
544
+ Effect.gen(function* () {
545
+ const compact = yield* SessionCompaction.Service
546
+ const model = createModel({ context: 0, output: 32_000 })
547
+ const tokens = { input: 100_000, output: 10_000, reasoning: 0, cache: { read: 0, write: 0 } }
548
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
549
+ }),
550
+ ),
551
+ )
552
+
553
+ it.live(
554
+ "returns false when compaction.auto is disabled",
555
+ provideTmpdirInstance(
556
+ () =>
557
+ Effect.gen(function* () {
558
+ const compact = yield* SessionCompaction.Service
559
+ const model = createModel({ context: 100_000, output: 32_000 })
560
+ const tokens = { input: 75_000, output: 5_000, reasoning: 0, cache: { read: 0, write: 0 } }
561
+ expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
562
+ }),
563
+ {
564
+ config: {
565
+ compaction: { auto: false },
566
+ },
567
+ },
568
+ ),
569
+ )
570
+ })
571
+
572
+ describe("session.compaction.create", () => {
573
+ it.live(
574
+ "creates a compaction user message and part",
575
+ provideTmpdirInstance(() =>
576
+ Effect.gen(function* () {
577
+ const compact = yield* SessionCompaction.Service
578
+ const ssn = yield* SessionNs.Service
579
+
580
+ const info = yield* ssn.create({})
581
+
582
+ yield* compact.create({
583
+ sessionID: info.id,
584
+ agent: "build",
585
+ model: ref,
586
+ auto: true,
587
+ overflow: true,
588
+ })
589
+
590
+ const msgs = yield* ssn.messages({ sessionID: info.id })
591
+ expect(msgs).toHaveLength(1)
592
+ expect(msgs[0].info.role).toBe("user")
593
+ expect(msgs[0].parts).toHaveLength(1)
594
+ expect(msgs[0].parts[0]).toMatchObject({
595
+ type: "compaction",
596
+ auto: true,
597
+ overflow: true,
598
+ })
599
+ }),
600
+ ),
601
+ )
602
+ })
603
+
604
+ describe("session.compaction.prune", () => {
605
+ it.live(
606
+ "compacts old completed tool output",
607
+ provideTmpdirInstance(
608
+ (dir) =>
609
+ Effect.gen(function* () {
610
+ const compact = yield* SessionCompaction.Service
611
+ const ssn = yield* SessionNs.Service
612
+ const info = yield* ssn.create({})
613
+ const a = yield* ssn.updateMessage({
614
+ id: MessageID.ascending(),
615
+ role: "user",
616
+ sessionID: info.id,
617
+ agent: "build",
618
+ model: ref,
619
+ time: { created: Date.now() },
620
+ })
621
+ yield* ssn.updatePart({
622
+ id: PartID.ascending(),
623
+ messageID: a.id,
624
+ sessionID: info.id,
625
+ type: "text",
626
+ text: "first",
627
+ })
628
+ const b: MessageV2.Assistant = {
629
+ id: MessageID.ascending(),
630
+ role: "assistant",
631
+ sessionID: info.id,
632
+ mode: "build",
633
+ agent: "build",
634
+ path: { cwd: dir, root: dir },
635
+ cost: 0,
636
+ tokens: {
637
+ output: 0,
638
+ input: 0,
639
+ reasoning: 0,
640
+ cache: { read: 0, write: 0 },
641
+ },
642
+ modelID: ref.modelID,
643
+ providerID: ref.providerID,
644
+ parentID: a.id,
645
+ time: { created: Date.now() },
646
+ finish: "end_turn",
647
+ }
648
+ yield* ssn.updateMessage(b)
649
+ yield* ssn.updatePart({
650
+ id: PartID.ascending(),
651
+ messageID: b.id,
652
+ sessionID: info.id,
653
+ type: "tool",
654
+ callID: crypto.randomUUID(),
655
+ tool: "bash",
656
+ state: {
657
+ status: "completed",
658
+ input: {},
659
+ output: "x".repeat(200_000),
660
+ title: "done",
661
+ metadata: {},
662
+ time: { start: Date.now(), end: Date.now() },
663
+ },
664
+ })
665
+ for (const text of ["second", "third"]) {
666
+ const msg = yield* ssn.updateMessage({
667
+ id: MessageID.ascending(),
668
+ role: "user",
669
+ sessionID: info.id,
670
+ agent: "build",
671
+ model: ref,
672
+ time: { created: Date.now() },
673
+ })
674
+ yield* ssn.updatePart({
675
+ id: PartID.ascending(),
676
+ messageID: msg.id,
677
+ sessionID: info.id,
678
+ type: "text",
679
+ text,
680
+ })
681
+ }
682
+
683
+ yield* compact.prune({ sessionID: info.id })
684
+
685
+ const msgs = yield* ssn.messages({ sessionID: info.id })
686
+ const part = msgs.flatMap((msg) => msg.parts).find((part) => part.type === "tool")
687
+ expect(part?.type).toBe("tool")
688
+ expect(part?.state.status).toBe("completed")
689
+ if (part?.type === "tool" && part.state.status === "completed") {
690
+ expect(part.state.time.compacted).toBeNumber()
691
+ }
692
+ }),
693
+
694
+ {
695
+ config: {
696
+ compaction: { prune: true },
697
+ },
698
+ },
699
+ ),
700
+ )
701
+
702
+ it.live(
703
+ "skips protected skill tool output",
704
+ provideTmpdirInstance((dir) =>
705
+ Effect.gen(function* () {
706
+ const compact = yield* SessionCompaction.Service
707
+ const ssn = yield* SessionNs.Service
708
+ const info = yield* ssn.create({})
709
+ const a = yield* ssn.updateMessage({
710
+ id: MessageID.ascending(),
711
+ role: "user",
712
+ sessionID: info.id,
713
+ agent: "build",
714
+ model: ref,
715
+ time: { created: Date.now() },
716
+ })
717
+ yield* ssn.updatePart({
718
+ id: PartID.ascending(),
719
+ messageID: a.id,
720
+ sessionID: info.id,
721
+ type: "text",
722
+ text: "first",
723
+ })
724
+ const b: MessageV2.Assistant = {
725
+ id: MessageID.ascending(),
726
+ role: "assistant",
727
+ sessionID: info.id,
728
+ mode: "build",
729
+ agent: "build",
730
+ path: { cwd: dir, root: dir },
731
+ cost: 0,
732
+ tokens: {
733
+ output: 0,
734
+ input: 0,
735
+ reasoning: 0,
736
+ cache: { read: 0, write: 0 },
737
+ },
738
+ modelID: ref.modelID,
739
+ providerID: ref.providerID,
740
+ parentID: a.id,
741
+ time: { created: Date.now() },
742
+ finish: "end_turn",
743
+ }
744
+ yield* ssn.updateMessage(b)
745
+ yield* ssn.updatePart({
746
+ id: PartID.ascending(),
747
+ messageID: b.id,
748
+ sessionID: info.id,
749
+ type: "tool",
750
+ callID: crypto.randomUUID(),
751
+ tool: "skill",
752
+ state: {
753
+ status: "completed",
754
+ input: {},
755
+ output: "x".repeat(200_000),
756
+ title: "done",
757
+ metadata: {},
758
+ time: { start: Date.now(), end: Date.now() },
759
+ },
760
+ })
761
+ for (const text of ["second", "third"]) {
762
+ const msg = yield* ssn.updateMessage({
763
+ id: MessageID.ascending(),
764
+ role: "user",
765
+ sessionID: info.id,
766
+ agent: "build",
767
+ model: ref,
768
+ time: { created: Date.now() },
769
+ })
770
+ yield* ssn.updatePart({
771
+ id: PartID.ascending(),
772
+ messageID: msg.id,
773
+ sessionID: info.id,
774
+ type: "text",
775
+ text,
776
+ })
777
+ }
778
+
779
+ yield* compact.prune({ sessionID: info.id })
780
+
781
+ const msgs = yield* ssn.messages({ sessionID: info.id })
782
+ const part = msgs.flatMap((msg) => msg.parts).find((part) => part.type === "tool")
783
+ expect(part?.type).toBe("tool")
784
+ if (part?.type === "tool" && part.state.status === "completed") {
785
+ expect(part.state.time.compacted).toBeUndefined()
786
+ }
787
+ }),
788
+ ),
789
+ )
790
+ })
791
+
792
+ describe("session.compaction.process", () => {
793
+ test("throws when parent is not a user message", async () => {
794
+ await using tmp = await tmpdir()
795
+ await Instance.provide({
796
+ directory: tmp.path,
797
+ fn: async () => {
798
+ const session = await svc.create({})
799
+ const msg = await user(session.id, "hello")
800
+ const reply = await assistant(session.id, msg.id, tmp.path)
801
+ const rt = runtime("continue")
802
+ try {
803
+ const msgs = await svc.messages({ sessionID: session.id })
804
+ await expect(
805
+ rt.runPromise(
806
+ SessionCompaction.Service.use((svc) =>
807
+ svc.process({
808
+ parentID: reply.id,
809
+ messages: msgs,
810
+ sessionID: session.id,
811
+ auto: false,
812
+ }),
813
+ ),
814
+ ),
815
+ ).rejects.toThrow(`Compaction parent must be a user message: ${reply.id}`)
816
+ } finally {
817
+ await rt.dispose()
818
+ }
819
+ },
820
+ })
821
+ })
822
+
823
+ test("publishes compacted event on continue", async () => {
824
+ await using tmp = await tmpdir()
825
+ await Instance.provide({
826
+ directory: tmp.path,
827
+ fn: async () => {
828
+ const session = await svc.create({})
829
+ const msg = await user(session.id, "hello")
830
+ const msgs = await svc.messages({ sessionID: session.id })
831
+ const done = defer()
832
+ let seen = false
833
+ const rt = runtime("continue", Plugin.defaultLayer, wide())
834
+ let unsub: (() => void) | undefined
835
+ try {
836
+ unsub = await rt.runPromise(
837
+ Bus.Service.use((svc) =>
838
+ svc.subscribeCallback(SessionCompaction.Event.Compacted, (evt) => {
839
+ if (evt.properties.sessionID !== session.id) return
840
+ seen = true
841
+ done.resolve()
842
+ }),
843
+ ),
844
+ )
845
+
846
+ const result = await rt.runPromise(
847
+ SessionCompaction.Service.use((svc) =>
848
+ svc.process({
849
+ parentID: msg.id,
850
+ messages: msgs,
851
+ sessionID: session.id,
852
+ auto: false,
853
+ }),
854
+ ),
855
+ )
856
+
857
+ await Promise.race([
858
+ done.promise,
859
+ wait(500).then(() => {
860
+ throw new Error("timed out waiting for compacted event")
861
+ }),
862
+ ])
863
+ expect(result).toBe("continue")
864
+ expect(seen).toBe(true)
865
+ } finally {
866
+ unsub?.()
867
+ await rt.dispose()
868
+ }
869
+ },
870
+ })
871
+ })
872
+
873
+ test("marks summary message as errored on compact result", async () => {
874
+ await using tmp = await tmpdir()
875
+ await Instance.provide({
876
+ directory: tmp.path,
877
+ fn: async () => {
878
+ const session = await svc.create({})
879
+ const msg = await user(session.id, "hello")
880
+ const rt = runtime("compact", Plugin.defaultLayer, wide())
881
+ try {
882
+ const msgs = await svc.messages({ sessionID: session.id })
883
+ const result = await rt.runPromise(
884
+ SessionCompaction.Service.use((svc) =>
885
+ svc.process({
886
+ parentID: msg.id,
887
+ messages: msgs,
888
+ sessionID: session.id,
889
+ auto: false,
890
+ }),
891
+ ),
892
+ )
893
+
894
+ const summary = (await svc.messages({ sessionID: session.id })).find(
895
+ (msg) => msg.info.role === "assistant" && msg.info.summary,
896
+ )
897
+
898
+ expect(result).toBe("stop")
899
+ expect(summary?.info.role).toBe("assistant")
900
+ if (summary?.info.role === "assistant") {
901
+ expect(summary.info.finish).toBe("error")
902
+ expect(JSON.stringify(summary.info.error)).toContain("Session too large to compact")
903
+ }
904
+ } finally {
905
+ await rt.dispose()
906
+ }
907
+ },
908
+ })
909
+ })
910
+
911
+ test("adds synthetic continue prompt when auto is enabled", async () => {
912
+ await using tmp = await tmpdir()
913
+ await Instance.provide({
914
+ directory: tmp.path,
915
+ fn: async () => {
916
+ const session = await svc.create({})
917
+ const msg = await user(session.id, "hello")
918
+ const rt = runtime("continue", Plugin.defaultLayer, wide())
919
+ try {
920
+ const msgs = await svc.messages({ sessionID: session.id })
921
+ const result = await rt.runPromise(
922
+ SessionCompaction.Service.use((svc) =>
923
+ svc.process({
924
+ parentID: msg.id,
925
+ messages: msgs,
926
+ sessionID: session.id,
927
+ auto: true,
928
+ }),
929
+ ),
930
+ )
931
+
932
+ const all = await svc.messages({ sessionID: session.id })
933
+ const last = all.at(-1)
934
+
935
+ expect(result).toBe("continue")
936
+ expect(last?.info.role).toBe("user")
937
+ expect(last?.parts[0]).toMatchObject({
938
+ type: "text",
939
+ synthetic: true,
940
+ metadata: { compaction_continue: true },
941
+ })
942
+ if (last?.parts[0]?.type === "text") {
943
+ expect(last.parts[0].text).toContain("Continue if you have next steps")
944
+ }
945
+ } finally {
946
+ await rt.dispose()
947
+ }
948
+ },
949
+ })
950
+ })
951
+
952
+ test("persists tail_start_id for retained recent turns", async () => { // Three user messages, tail_turns: 2 and a 10_000 budget: the compaction part must record the "second" message as tail start.
953
+ await using tmp = await tmpdir()
954
+ await Instance.provide({
955
+ directory: tmp.path,
956
+ fn: async () => {
957
+ const session = await svc.create({})
958
+ await user(session.id, "first")
959
+ const keep = await user(session.id, "second") // its id is the expected tail_start_id asserted below
960
+ await user(session.id, "third")
961
+ await SessionCompaction.create({
962
+ sessionID: session.id,
963
+ agent: "build",
964
+ model: ref,
965
+ auto: false,
966
+ })
967
+
968
+ const rt = runtime( // runtime() is defined outside this view; it is disposed in the finally block
969
+ "continue",
970
+ Plugin.defaultLayer,
971
+ wide(),
972
+ cfg({ tail_turns: 2, preserve_recent_tokens: 10_000 }),
973
+ )
974
+ try {
975
+ const msgs = await svc.messages({ sessionID: session.id })
976
+ const parent = msgs.at(-1)?.info.id // id of the newest stored message; presumably the one SessionCompaction.create just added (confirm)
977
+ expect(parent).toBeTruthy()
978
+ await rt.runPromise(
979
+ SessionCompaction.Service.use((svc) => // this svc is the compaction service and shadows the outer svc
980
+ svc.process({
981
+ parentID: parent!,
982
+ messages: msgs,
983
+ sessionID: session.id,
984
+ auto: false,
985
+ }),
986
+ ),
987
+ )
988
+
989
+ const part = await lastCompactionPart(session.id)
990
+ expect(part?.type).toBe("compaction")
991
+ expect(part?.tail_start_id).toBe(keep.id)
992
+ } finally {
993
+ await rt.dispose() // always release the runtime, even when an expectation throws
994
+ }
995
+ },
996
+ })
997
+ })
998
+
999
+ test("shrinks retained tail to fit preserve token budget", async () => { // tail_turns: 2 with a 100 budget: expects the tail to start at the small "tiny" message rather than the 2_000-char one.
1000
+ await using tmp = await tmpdir()
1001
+ await Instance.provide({
1002
+ directory: tmp.path,
1003
+ fn: async () => {
1004
+ const session = await svc.create({})
1005
+ await user(session.id, "first")
1006
+ await user(session.id, "x".repeat(2_000)) // 2_000 chars; about 500 tokens if the budget uses the 4-chars-per-token estimate tested in this file (assumption)
1007
+ const keep = await user(session.id, "tiny") // expected tail start
1008
+ await SessionCompaction.create({
1009
+ sessionID: session.id,
1010
+ agent: "build",
1011
+ model: ref,
1012
+ auto: false,
1013
+ })
1014
+
1015
+ const rt = runtime("continue", Plugin.defaultLayer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 100 }))
1016
+ try {
1017
+ const msgs = await svc.messages({ sessionID: session.id })
1018
+ const parent = msgs.at(-1)?.info.id // id of the newest stored message
1019
+ expect(parent).toBeTruthy()
1020
+ await rt.runPromise(
1021
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1022
+ svc.process({
1023
+ parentID: parent!,
1024
+ messages: msgs,
1025
+ sessionID: session.id,
1026
+ auto: false,
1027
+ }),
1028
+ ),
1029
+ )
1030
+
1031
+ const part = await lastCompactionPart(session.id)
1032
+ expect(part?.type).toBe("compaction")
1033
+ expect(part?.tail_start_id).toBe(keep.id)
1034
+ } finally {
1035
+ await rt.dispose()
1036
+ }
1037
+ },
1038
+ })
1039
+ })
1040
+
1041
+ test("falls back to full summary when even one recent turn exceeds preserve token budget", async () => { // tail_turns: 1 with a 20 budget: expects no tail_start_id and the large message inside the summary input.
1042
+ await using tmp = await tmpdir({ git: true })
1043
+ const stub = llm()
1044
+ let captured = "" // JSON of the messages handed to the stubbed reply
1045
+ stub.push(
1046
+ reply("summary", (input) => {
1047
+ captured = JSON.stringify(input.messages)
1048
+ }),
1049
+ )
1050
+ await Instance.provide({
1051
+ directory: tmp.path,
1052
+ fn: async () => {
1053
+ const session = await svc.create({})
1054
+ await user(session.id, "first")
1055
+ await user(session.id, "y".repeat(2_000)) // the only recent turn, 2_000 chars long
1056
+ await SessionCompaction.create({
1057
+ sessionID: session.id,
1058
+ agent: "build",
1059
+ model: ref,
1060
+ auto: false,
1061
+ })
1062
+
1063
+ const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 20 }))
1064
+ try {
1065
+ const msgs = await svc.messages({ sessionID: session.id })
1066
+ const parent = msgs.at(-1)?.info.id // id of the newest stored message
1067
+ expect(parent).toBeTruthy()
1068
+ await rt.runPromise(
1069
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1070
+ svc.process({
1071
+ parentID: parent!,
1072
+ messages: msgs,
1073
+ sessionID: session.id,
1074
+ auto: false,
1075
+ }),
1076
+ ),
1077
+ )
1078
+
1079
+ const part = await lastCompactionPart(session.id)
1080
+ expect(part?.type).toBe("compaction")
1081
+ expect(part?.tail_start_id).toBeUndefined() // nothing retained as tail
1082
+ expect(captured).toContain("yyyy") // the oversized turn was sent to the summarizer instead
1083
+ } finally {
1084
+ await rt.dispose()
1085
+ }
1086
+ },
1087
+ })
1088
+ })
1089
+
1090
+ test("falls back to full summary when retained tail media exceeds preserve token budget", async () => { // A recent turn carrying a 4_000-char data URL image must not be kept as tail under a 100 budget.
1091
+ await using tmp = await tmpdir({ git: true })
1092
+ const stub = llm()
1093
+ let captured = "" // JSON of the messages handed to the stubbed reply
1094
+ stub.push(
1095
+ reply("summary", (input) => {
1096
+ captured = JSON.stringify(input.messages)
1097
+ }),
1098
+ )
1099
+ await Instance.provide({
1100
+ directory: tmp.path,
1101
+ fn: async () => {
1102
+ const session = await svc.create({})
1103
+ await user(session.id, "older")
1104
+ const recent = await user(session.id, "recent image turn")
1105
+ await svc.updatePart({ // attaches a file part to the recent user message
1106
+ id: PartID.ascending(),
1107
+ messageID: recent.id,
1108
+ sessionID: session.id,
1109
+ type: "file",
1110
+ mime: "image/png",
1111
+ filename: "big.png",
1112
+ url: `data:image/png;base64,${"a".repeat(4_000)}`,
1113
+ })
1114
+ await SessionCompaction.create({
1115
+ sessionID: session.id,
1116
+ agent: "build",
1117
+ model: ref,
1118
+ auto: false,
1119
+ })
1120
+
1121
+ const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 100 }))
1122
+ try {
1123
+ const msgs = await svc.messages({ sessionID: session.id })
1124
+ const parent = msgs.at(-1)?.info.id // id of the newest stored message
1125
+ expect(parent).toBeTruthy()
1126
+ await rt.runPromise(
1127
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1128
+ svc.process({
1129
+ parentID: parent!,
1130
+ messages: msgs,
1131
+ sessionID: session.id,
1132
+ auto: false,
1133
+ }),
1134
+ ),
1135
+ )
1136
+
1137
+ const part = await lastCompactionPart(session.id)
1138
+ expect(part?.type).toBe("compaction")
1139
+ expect(part?.tail_start_id).toBeUndefined() // no retained tail
1140
+ expect(captured).toContain("recent image turn")
1141
+ expect(captured).toContain("Attached image/png: big.png") // the summary input carries a textual mention of the attachment
1142
+ } finally {
1143
+ await rt.dispose()
1144
+ }
1145
+ },
1146
+ })
1147
+ })
1148
+
1149
+ test("retains a split turn suffix when a later message fits the preserve token budget", async () => { // One turn with a large and a small assistant reply: only the small one is expected to stay as tail.
1150
+ await using tmp = await tmpdir({ git: true })
1151
+ const stub = llm()
1152
+ let captured = "" // JSON of the messages handed to the stubbed reply
1153
+ stub.push(
1154
+ reply("summary", (input) => {
1155
+ captured = JSON.stringify(input.messages)
1156
+ }),
1157
+ )
1158
+ await Instance.provide({
1159
+ directory: tmp.path,
1160
+ fn: async () => {
1161
+ const session = await svc.create({})
1162
+ await user(session.id, "older")
1163
+ const recent = await user(session.id, "recent turn")
1164
+ const large = await assistant(session.id, recent.id, tmp.path) // first assistant message of the turn, given 2_000 chars of text below
1165
+ await svc.updatePart({
1166
+ id: PartID.ascending(),
1167
+ messageID: large.id,
1168
+ sessionID: session.id,
1169
+ type: "text",
1170
+ text: "z".repeat(2_000),
1171
+ })
1172
+ const keep = await assistant(session.id, recent.id, tmp.path) // second assistant message of the same turn; expected tail start
1173
+ await svc.updatePart({
1174
+ id: PartID.ascending(),
1175
+ messageID: keep.id,
1176
+ sessionID: session.id,
1177
+ type: "text",
1178
+ text: "keep tail",
1179
+ })
1180
+ await SessionCompaction.create({
1181
+ sessionID: session.id,
1182
+ agent: "build",
1183
+ model: ref,
1184
+ auto: false,
1185
+ })
1186
+
1187
+ const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 100 }))
1188
+ try {
1189
+ const msgs = await svc.messages({ sessionID: session.id })
1190
+ const parent = msgs.at(-1)?.info.id // id of the newest stored message
1191
+ expect(parent).toBeTruthy()
1192
+ await rt.runPromise(
1193
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1194
+ svc.process({
1195
+ parentID: parent!,
1196
+ messages: msgs,
1197
+ sessionID: session.id,
1198
+ auto: false,
1199
+ }),
1200
+ ),
1201
+ )
1202
+
1203
+ const part = await lastCompactionPart(session.id)
1204
+ expect(part?.type).toBe("compaction")
1205
+ expect(part?.tail_start_id).toBe(keep.id)
1206
+ expect(captured).toContain("zzzz") // the large reply went into the summary input
1207
+ expect(captured).not.toContain("keep tail") // the retained reply did not
1208
+
1209
+ const filtered = MessageV2.filterCompacted(MessageV2.stream(session.id))
1210
+ expect(filtered[0]?.info.id).toBe(keep.id) // filtered history starts at the retained message
1211
+ expect(filtered.map((msg) => msg.info.id)).not.toContain(large.id)
1212
+ } finally {
1213
+ await rt.dispose()
1214
+ }
1215
+ },
1216
+ })
1217
+ })
1218
+
1219
+ test("allows plugins to disable synthetic continue prompt", async () => { // With autocontinue(false), an auto compaction must not append the synthetic "Continue if you have next steps" user message.
1220
+ await using tmp = await tmpdir()
1221
+ await Instance.provide({
1222
+ directory: tmp.path,
1223
+ fn: async () => {
1224
+ const session = await svc.create({})
1225
+ const msg = await user(session.id, "hello")
1226
+ const rt = runtime("continue", autocontinue(false), wide()) // autocontinue() is defined outside this view; presumably a plugin layer that turns the prompt off
1227
+ try {
1228
+ const msgs = await svc.messages({ sessionID: session.id })
1229
+ const result = await rt.runPromise(
1230
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1231
+ svc.process({
1232
+ parentID: msg.id,
1233
+ messages: msgs,
1234
+ sessionID: session.id,
1235
+ auto: true,
1236
+ }),
1237
+ ),
1238
+ )
1239
+
1240
+ const all = await svc.messages({ sessionID: session.id })
1241
+ const last = all.at(-1)
1242
+
1243
+ expect(result).toBe("continue")
1244
+ expect(last?.info.role).toBe("assistant") // no user message was appended after the assistant message
1245
+ expect(
1246
+ all.some( // true if any user message holds a synthetic text part with the continue prompt
1247
+ (msg) =>
1248
+ msg.info.role === "user" &&
1249
+ msg.parts.some(
1250
+ (part) =>
1251
+ part.type === "text" && part.synthetic && part.text.includes("Continue if you have next steps"),
1252
+ ),
1253
+ ),
1254
+ ).toBe(false)
1255
+ } finally {
1256
+ await rt.dispose()
1257
+ }
1258
+ },
1259
+ })
1260
+ })
1261
+
1262
+ test("replays the prior user turn on overflow when earlier context exists", async () => { // On overflow the last message must be a user message whose file part is replaced by an "Attached image/png: cat.png" text mention.
1263
+ await using tmp = await tmpdir()
1264
+ await Instance.provide({
1265
+ directory: tmp.path,
1266
+ fn: async () => {
1267
+ const session = await svc.create({})
1268
+ await user(session.id, "root")
1269
+ const replay = await user(session.id, "image")
1270
+ await svc.updatePart({ // attaches an image file part to the "image" user message
1271
+ id: PartID.ascending(),
1272
+ messageID: replay.id,
1273
+ sessionID: session.id,
1274
+ type: "file",
1275
+ mime: "image/png",
1276
+ filename: "cat.png",
1277
+ url: "https://example.com/cat.png",
1278
+ })
1279
+ const msg = await user(session.id, "current") // used as parentID for the compaction run
1280
+ const rt = runtime("continue", Plugin.defaultLayer, wide())
1281
+ try {
1282
+ const msgs = await svc.messages({ sessionID: session.id })
1283
+ const result = await rt.runPromise(
1284
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1285
+ svc.process({
1286
+ parentID: msg.id,
1287
+ messages: msgs,
1288
+ sessionID: session.id,
1289
+ auto: true,
1290
+ overflow: true,
1291
+ }),
1292
+ ),
1293
+ )
1294
+
1295
+ const last = (await svc.messages({ sessionID: session.id })).at(-1)
1296
+
1297
+ expect(result).toBe("continue")
1298
+ expect(last?.info.role).toBe("user")
1299
+ expect(last?.parts.some((part) => part.type === "file")).toBe(false) // the file part itself is not carried over
1300
+ expect(
1301
+ last?.parts.some((part) => part.type === "text" && part.text.includes("Attached image/png: cat.png")),
1302
+ ).toBe(true)
1303
+ } finally {
1304
+ await rt.dispose()
1305
+ }
1306
+ },
1307
+ })
1308
+ })
1309
+
1310
+ test("falls back to overflow guidance when no replayable turn exists", async () => { // On overflow with nothing to replay, the last message must be a user message whose first part is the overflow guidance text.
1311
+ await using tmp = await tmpdir()
1312
+ await Instance.provide({
1313
+ directory: tmp.path,
1314
+ fn: async () => {
1315
+ const session = await svc.create({})
1316
+ await user(session.id, "earlier")
1317
+ const msg = await user(session.id, "current") // used as parentID for the compaction run
1318
+
1319
+ const rt = runtime("continue", Plugin.defaultLayer, wide())
1320
+ try {
1321
+ const msgs = await svc.messages({ sessionID: session.id })
1322
+ const result = await rt.runPromise(
1323
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1324
+ svc.process({
1325
+ parentID: msg.id,
1326
+ messages: msgs,
1327
+ sessionID: session.id,
1328
+ auto: true,
1329
+ overflow: true,
1330
+ }),
1331
+ ),
1332
+ )
1333
+
1334
+ const last = (await svc.messages({ sessionID: session.id })).at(-1)
1335
+
1336
+ expect(result).toBe("continue")
1337
+ expect(last?.info.role).toBe("user")
1338
+ const first = last?.parts[0]
1339
+ expect(first?.type).toBe("text") // assert the part kind unconditionally so a missing or non-text part fails the test instead of skipping the check
1340
+ expect(first?.type === "text" ? first.text : "").toContain("previous request exceeded the provider's size limit")
1341
+ } finally {
1342
+ await rt.dispose()
1343
+ }
1344
+ },
1345
+ })
1346
+ })
1347
+
1348
+ test("stops quickly when aborted during retry backoff", async () => { // The stubbed stream fails with a retryable 503; once a retry status is published, aborting must settle the run as "stop" within 2 s.
1349
+ const stub = llm()
1350
+ const ready = defer() // resolved by the status subscription below when a retry status arrives
1351
+ stub.push(
1352
+ Stream.fromAsyncIterable(
1353
+ {
1354
+ async *[Symbol.asyncIterator]() {
1355
+ yield { type: "start" } as LLM.Event
1356
+ throw new APICallError({ // thrown after the first event
1357
+ message: "boom",
1358
+ url: "https://example.com/v1/chat/completions",
1359
+ requestBodyValues: {},
1360
+ statusCode: 503,
1361
+ responseHeaders: { "retry-after-ms": "10000" }, // presumably makes the retry backoff about 10 s, far longer than the 2 s limit below (confirm against the retry logic)
1362
+ responseBody: '{"error":"boom"}',
1363
+ isRetryable: true,
1364
+ })
1365
+ },
1366
+ },
1367
+ (err) => err,
1368
+ ),
1369
+ )
1370
+
1371
+ await using tmp = await tmpdir({ git: true })
1372
+ await Instance.provide({
1373
+ directory: tmp.path,
1374
+ fn: async () => {
1375
+ const session = await svc.create({})
1376
+ const msg = await user(session.id, "hello")
1377
+ const msgs = await svc.messages({ sessionID: session.id })
1378
+ const abort = new AbortController()
1379
+ const rt = liveRuntime(stub.layer, wide())
1380
+ let off: (() => void) | undefined // unsubscribe handle, called in finally
1381
+ let run: Promise<"continue" | "stop"> | undefined
1382
+ try {
1383
+ off = await rt.runPromise(
1384
+ Bus.Service.use((svc) =>
1385
+ svc.subscribeCallback(SessionStatus.Event.Status, (evt) => {
1386
+ if (evt.properties.sessionID !== session.id) return // ignore other sessions
1387
+ if (evt.properties.status.type !== "retry") return // only a retry status counts
1388
+ ready.resolve()
1389
+ }),
1390
+ ),
1391
+ )
1392
+
1393
+ run = rt // started but not awaited yet, so the test can abort it mid-flight
1394
+ .runPromiseExit(
1395
+ SessionCompaction.Service.use((svc) =>
1396
+ svc.process({
1397
+ parentID: msg.id,
1398
+ messages: msgs,
1399
+ sessionID: session.id,
1400
+ auto: false,
1401
+ }),
1402
+ ),
1403
+ { signal: abort.signal },
1404
+ )
1405
+ .then((exit) => {
1406
+ if (Exit.isFailure(exit)) {
1407
+ if (Cause.hasInterrupts(exit.cause) && abort.signal.aborted) return "stop" // an interrupt caused by our own abort is mapped to "stop"
1408
+ throw Cause.squash(exit.cause) // any other failure is rethrown
1409
+ }
1410
+ return exit.value
1411
+ })
1412
+
1413
+ await Promise.race([ // wait for the retry status, failing after 5 s
1414
+ ready.promise,
1415
+ wait(5000).then(() => {
1416
+ throw new Error("timed out waiting for retry status")
1417
+ }),
1418
+ ])
1419
+
1420
+ const start = Date.now()
1421
+ abort.abort()
1422
+ const result = await Promise.race([ // either the run settles or the 2 s timer wins
1423
+ run.then((value) => ({ kind: "done" as const, value, ms: Date.now() - start })),
1424
+ wait(2000).then(() => ({ kind: "timeout" as const })),
1425
+ ])
1426
+
1427
+ expect(result.kind).toBe("done")
1428
+ if (result.kind === "done") { // narrows the union; the kind itself is asserted on the line above
1429
+ expect(result.value).toBe("stop")
1430
+ expect(result.ms).toBeLessThan(2000)
1431
+ }
1432
+ } finally {
1433
+ off?.()
1434
+ abort.abort() // repeated here so the run is also aborted when an earlier step threw
1435
+ await rt.dispose()
1436
+ await run?.catch(() => undefined) // wait for the run to settle; a rejection here is deliberately ignored during cleanup
1437
+ }
1438
+ },
1439
+ })
1440
+ })
1441
+
1442
+ test("does not leave a summary assistant when aborted before processor setup", async () => { // Aborts once `ready` resolves and checks that no assistant message flagged as summary was stored.
1443
+ const ready = defer()
1444
+
1445
+ await using tmp = await tmpdir({ git: true })
1446
+ await Instance.provide({
1447
+ directory: tmp.path,
1448
+ fn: async () => {
1449
+ const session = await svc.create({})
1450
+ const msg = await user(session.id, "hello")
1451
+ const msgs = await svc.messages({ sessionID: session.id })
1452
+ const abort = new AbortController()
1453
+ const rt = runtime("continue", plugin(ready), wide()) // plugin() is defined outside this view; presumably resolves `ready` from a compaction hook, per the timeout message below
1454
+ let run: Promise<"continue" | "stop"> | undefined
1455
+ try {
1456
+ run = rt // started but not awaited yet, so the test can abort it mid-flight
1457
+ .runPromiseExit(
1458
+ SessionCompaction.Service.use((svc) =>
1459
+ svc.process({
1460
+ parentID: msg.id,
1461
+ messages: msgs,
1462
+ sessionID: session.id,
1463
+ auto: false,
1464
+ }),
1465
+ ),
1466
+ { signal: abort.signal },
1467
+ )
1468
+ .then((exit) => {
1469
+ if (Exit.isFailure(exit)) {
1470
+ if (Cause.hasInterrupts(exit.cause) && abort.signal.aborted) return "stop" // an interrupt caused by our own abort is mapped to "stop"
1471
+ throw Cause.squash(exit.cause) // any other failure is rethrown
1472
+ }
1473
+ return exit.value
1474
+ })
1475
+
1476
+ await Promise.race([ // wait for `ready`, failing after 1 s
1477
+ ready.promise,
1478
+ wait(1000).then(() => {
1479
+ throw new Error("timed out waiting for compaction hook")
1480
+ }),
1481
+ ])
1482
+
1483
+ abort.abort()
1484
+ expect(await run).toBe("stop")
1485
+
1486
+ const all = await svc.messages({ sessionID: session.id })
1487
+ expect(all.some((msg) => msg.info.role === "assistant" && msg.info.summary)).toBe(false)
1488
+ } finally {
1489
+ abort.abort() // repeated here so the run is also aborted when an earlier step threw
1490
+ await rt.dispose()
1491
+ await run?.catch(() => undefined) // wait for the run to settle; a rejection here is deliberately ignored during cleanup
1492
+ }
1493
+ },
1494
+ })
1495
+ })
1496
+
1497
+ test("does not allow tool calls while generating the summary", async () => { // The stubbed stream emits a "_noop" tool call; the stored summary message must contain no tool part.
1498
+ const stub = llm()
1499
+ stub.push(
1500
+ Stream.make( // fixed event sequence: start, tool-input-start, tool-call, finish-step, finish
1501
+ { type: "start" } satisfies LLM.Event,
1502
+ { type: "tool-input-start", id: "call-1", toolName: "_noop" } satisfies LLM.Event,
1503
+ { type: "tool-call", toolCallId: "call-1", toolName: "_noop", input: {} } satisfies LLM.Event,
1504
+ {
1505
+ type: "finish-step",
1506
+ finishReason: "tool-calls",
1507
+ rawFinishReason: "tool_calls",
1508
+ response: { id: "res", modelId: "test-model", timestamp: new Date() },
1509
+ providerMetadata: undefined,
1510
+ usage: {
1511
+ inputTokens: 1,
1512
+ outputTokens: 1,
1513
+ totalTokens: 2,
1514
+ inputTokenDetails: {
1515
+ noCacheTokens: undefined,
1516
+ cacheReadTokens: undefined,
1517
+ cacheWriteTokens: undefined,
1518
+ },
1519
+ outputTokenDetails: {
1520
+ textTokens: undefined,
1521
+ reasoningTokens: undefined,
1522
+ },
1523
+ },
1524
+ } satisfies LLM.Event,
1525
+ {
1526
+ type: "finish",
1527
+ finishReason: "tool-calls",
1528
+ rawFinishReason: "tool_calls",
1529
+ totalUsage: {
1530
+ inputTokens: 1,
1531
+ outputTokens: 1,
1532
+ totalTokens: 2,
1533
+ inputTokenDetails: {
1534
+ noCacheTokens: undefined,
1535
+ cacheReadTokens: undefined,
1536
+ cacheWriteTokens: undefined,
1537
+ },
1538
+ outputTokenDetails: {
1539
+ textTokens: undefined,
1540
+ reasoningTokens: undefined,
1541
+ },
1542
+ },
1543
+ } satisfies LLM.Event,
1544
+ ),
1545
+ )
1546
+
1547
+ await using tmp = await tmpdir({ git: true })
1548
+ await Instance.provide({
1549
+ directory: tmp.path,
1550
+ fn: async () => {
1551
+ const session = await svc.create({})
1552
+ const msg = await user(session.id, "hello")
1553
+ const rt = liveRuntime(stub.layer, wide())
1554
+ try {
1555
+ const msgs = await svc.messages({ sessionID: session.id })
1556
+ await rt.runPromise(
1557
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1558
+ svc.process({
1559
+ parentID: msg.id,
1560
+ messages: msgs,
1561
+ sessionID: session.id,
1562
+ auto: false,
1563
+ }),
1564
+ ),
1565
+ )
1566
+
1567
+ const summary = (await svc.messages({ sessionID: session.id })).find( // first assistant message flagged as summary
1568
+ (item) => item.info.role === "assistant" && item.info.summary,
1569
+ )
1570
+
1571
+ expect(summary?.info.role).toBe("assistant") // fails when no summary message was found
1572
+ expect(summary?.parts.some((part) => part.type === "tool")).toBe(false)
1573
+ } finally {
1574
+ await rt.dispose()
1575
+ }
1576
+ },
1577
+ })
1578
+ })
1579
+
1580
+ test("summarizes only the head while keeping recent tail out of summary input", async () => { // With the default config only "older context" may appear in the captured summary input.
1581
+ const stub = llm()
1582
+ let captured = "" // JSON of the messages handed to the stubbed reply
1583
+ stub.push(
1584
+ reply("summary", (input) => {
1585
+ captured = JSON.stringify(input.messages)
1586
+ }),
1587
+ )
1588
+
1589
+ await using tmp = await tmpdir({ git: true })
1590
+ await Instance.provide({
1591
+ directory: tmp.path,
1592
+ fn: async () => {
1593
+ const session = await svc.create({})
1594
+ await user(session.id, "older context")
1595
+ await user(session.id, "keep this turn")
1596
+ await user(session.id, "and this one too")
1597
+ await SessionCompaction.create({
1598
+ sessionID: session.id,
1599
+ agent: "build",
1600
+ model: ref,
1601
+ auto: false,
1602
+ })
1603
+
1604
+ const rt = liveRuntime(stub.layer, wide()) // no cfg() override here, so whatever defaults liveRuntime applies are in effect
1605
+ try {
1606
+ const msgs = await svc.messages({ sessionID: session.id })
1607
+ const parent = msgs.at(-1)?.info.id // id of the newest stored message
1608
+ expect(parent).toBeTruthy()
1609
+ await rt.runPromise(
1610
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1611
+ svc.process({
1612
+ parentID: parent!,
1613
+ messages: msgs,
1614
+ sessionID: session.id,
1615
+ auto: false,
1616
+ }),
1617
+ ),
1618
+ )
1619
+
1620
+ expect(captured).toContain("older context")
1621
+ expect(captured).not.toContain("keep this turn")
1622
+ expect(captured).not.toContain("and this one too")
1623
+ expect(captured).not.toContain("What did we do so far?") // NOTE(review): this string is not produced anywhere in this view; presumably a prompt that must stay out of the summary input
1624
+ } finally {
1625
+ await rt.dispose()
1626
+ }
1627
+ },
1628
+ })
1629
+ })
1630
+
1631
+ test("anchors repeated compactions with the previous summary", async () => { // Runs two compactions and inspects the second summary request: it must carry the first summary once, inside a <previous-summary> marker.
1632
+ const stub = llm()
1633
+ let captured = "" // JSON of the messages handed to the second stubbed reply only
1634
+ stub.push(reply("summary one"))
1635
+ stub.push(
1636
+ reply("summary two", (input) => {
1637
+ captured = JSON.stringify(input.messages)
1638
+ }),
1639
+ )
1640
+
1641
+ await using tmp = await tmpdir({ git: true })
1642
+ await Instance.provide({
1643
+ directory: tmp.path,
1644
+ fn: async () => {
1645
+ const session = await svc.create({})
1646
+ await user(session.id, "older context")
1647
+ await user(session.id, "keep this turn")
1648
+ await SessionCompaction.create({
1649
+ sessionID: session.id,
1650
+ agent: "build",
1651
+ model: ref,
1652
+ auto: false,
1653
+ })
1654
+
1655
+ const rt = liveRuntime(stub.layer, wide())
1656
+ try {
1657
+ let msgs = await svc.messages({ sessionID: session.id }) // reassigned before the second run
1658
+ let parent = msgs.at(-1)?.info.id
1659
+ expect(parent).toBeTruthy()
1660
+ await rt.runPromise( // first compaction
1661
+ SessionCompaction.Service.use((svc) =>
1662
+ svc.process({
1663
+ parentID: parent!,
1664
+ messages: msgs,
1665
+ sessionID: session.id,
1666
+ auto: false,
1667
+ }),
1668
+ ),
1669
+ )
1670
+
1671
+ await user(session.id, "latest turn")
1672
+ await SessionCompaction.create({
1673
+ sessionID: session.id,
1674
+ agent: "build",
1675
+ model: ref,
1676
+ auto: false,
1677
+ })
1678
+
1679
+ msgs = MessageV2.filterCompacted(MessageV2.stream(session.id)) // the second run is fed the filtered history rather than svc.messages
1680
+ parent = msgs.at(-1)?.info.id
1681
+ expect(parent).toBeTruthy()
1682
+ await rt.runPromise( // second compaction
1683
+ SessionCompaction.Service.use((svc) =>
1684
+ svc.process({
1685
+ parentID: parent!,
1686
+ messages: msgs,
1687
+ sessionID: session.id,
1688
+ auto: false,
1689
+ }),
1690
+ ),
1691
+ )
1692
+
1693
+ expect(captured).toContain("<previous-summary>")
1694
+ expect(captured).toContain("summary one")
1695
+ expect(captured.match(/summary one/g)?.length).toBe(1) // exactly one occurrence of the first summary
1696
+ expect(captured).toContain("## Constraints & Preferences")
1697
+ expect(captured).toContain("## Progress")
1698
+ } finally {
1699
+ await rt.dispose()
1700
+ }
1701
+ },
1702
+ })
1703
+ })
1704
+
1705
+ test("keeps recent pre-compaction turns across repeated compactions", async () => { // After two compactions with tail_turns: 2, the filtered history must hold u3 and u4 but not u1 or u2.
1706
+ const stub = llm()
1707
+ stub.push(reply("summary one"))
1708
+ stub.push(reply("summary two"))
1709
+ await using tmp = await tmpdir()
1710
+ await Instance.provide({
1711
+ directory: tmp.path,
1712
+ fn: async () => {
1713
+ const session = await svc.create({})
1714
+ const u1 = await user(session.id, "one")
1715
+ const u2 = await user(session.id, "two")
1716
+ const u3 = await user(session.id, "three")
1717
+ await SessionCompaction.create({
1718
+ sessionID: session.id,
1719
+ agent: "build",
1720
+ model: ref,
1721
+ auto: false,
1722
+ })
1723
+
1724
+ const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 10_000 }))
1725
+ try {
1726
+ let msgs = await svc.messages({ sessionID: session.id }) // reassigned before the second run
1727
+ let parent = msgs.at(-1)?.info.id
1728
+ expect(parent).toBeTruthy()
1729
+ await rt.runPromise( // first compaction
1730
+ SessionCompaction.Service.use((svc) =>
1731
+ svc.process({
1732
+ parentID: parent!,
1733
+ messages: msgs,
1734
+ sessionID: session.id,
1735
+ auto: false,
1736
+ }),
1737
+ ),
1738
+ )
1739
+
1740
+ const u4 = await user(session.id, "four")
1741
+ await SessionCompaction.create({
1742
+ sessionID: session.id,
1743
+ agent: "build",
1744
+ model: ref,
1745
+ auto: false,
1746
+ })
1747
+
1748
+ msgs = MessageV2.filterCompacted(MessageV2.stream(session.id)) // the second run is fed the filtered history
1749
+ parent = msgs.at(-1)?.info.id
1750
+ expect(parent).toBeTruthy()
1751
+ await rt.runPromise( // second compaction
1752
+ SessionCompaction.Service.use((svc) =>
1753
+ svc.process({
1754
+ parentID: parent!,
1755
+ messages: msgs,
1756
+ sessionID: session.id,
1757
+ auto: false,
1758
+ }),
1759
+ ),
1760
+ )
1761
+
1762
+ const filtered = MessageV2.filterCompacted(MessageV2.stream(session.id))
1763
+ const ids = filtered.map((msg) => msg.info.id)
1764
+
1765
+ expect(ids).not.toContain(u1.id)
1766
+ expect(ids).not.toContain(u2.id)
1767
+ expect(ids).toContain(u3.id)
1768
+ expect(ids).toContain(u4.id)
1769
+ expect(filtered.some((msg) => msg.info.role === "assistant" && msg.info.summary)).toBe(true) // a summary assistant message is present
1770
+ expect(
1771
+ filtered.some((msg) => msg.info.role === "user" && msg.parts.some((part) => part.type === "compaction")), // and so is a user message holding a compaction part
1772
+ ).toBe(true)
1773
+ } finally {
1774
+ await rt.dispose()
1775
+ }
1776
+ },
1777
+ })
1778
+ })
1779
+
1780
+ test("ignores previous summaries when sizing the retained tail", async () => { // A long earlier summary sits between two turns; with tail_turns: 2 and a 500 budget the tail must still start at `keep`.
1781
+ await using tmp = await tmpdir()
1782
+ await Instance.provide({
1783
+ directory: tmp.path,
1784
+ fn: async () => {
1785
+ const session = await svc.create({})
1786
+ await user(session.id, "older")
1787
+ const keep = await user(session.id, "keep this turn") // expected tail start
1788
+ const keepReply = await assistant(session.id, keep.id, tmp.path)
1789
+ await svc.updatePart({
1790
+ id: PartID.ascending(),
1791
+ messageID: keepReply.id,
1792
+ sessionID: session.id,
1793
+ type: "text",
1794
+ text: "keep reply",
1795
+ })
1796
+
1797
+ await SessionCompaction.create({
1798
+ sessionID: session.id,
1799
+ agent: "build",
1800
+ model: ref,
1801
+ auto: false,
1802
+ })
1803
+ const firstCompaction = (await svc.messages({ sessionID: session.id })).at(-1)?.info.id // id of the newest message right after the create call
1804
+ expect(firstCompaction).toBeTruthy()
1805
+ await summaryAssistant(session.id, firstCompaction!, tmp.path, "summary ".repeat(800)) // 6_400 chars of summary text written directly via the helper (defined outside this view)
1806
+
1807
+ const recent = await user(session.id, "recent turn")
1808
+ const recentReply = await assistant(session.id, recent.id, tmp.path)
1809
+ await svc.updatePart({
1810
+ id: PartID.ascending(),
1811
+ messageID: recentReply.id,
1812
+ sessionID: session.id,
1813
+ type: "text",
1814
+ text: "recent reply",
1815
+ })
1816
+
1817
+ await SessionCompaction.create({
1818
+ sessionID: session.id,
1819
+ agent: "build",
1820
+ model: ref,
1821
+ auto: false,
1822
+ })
1823
+
1824
+ const rt = runtime("continue", Plugin.defaultLayer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 500 }))
1825
+ try {
1826
+ const msgs = await svc.messages({ sessionID: session.id })
1827
+ const parent = msgs.at(-1)?.info.id // id of the newest stored message
1828
+ expect(parent).toBeTruthy()
1829
+ await rt.runPromise(
1830
+ SessionCompaction.Service.use((svc) => // compaction service; shadows the outer svc
1831
+ svc.process({
1832
+ parentID: parent!,
1833
+ messages: msgs,
1834
+ sessionID: session.id,
1835
+ auto: false,
1836
+ }),
1837
+ ),
1838
+ )
1839
+
1840
+ const part = await lastCompactionPart(session.id)
1841
+ expect(part?.type).toBe("compaction")
1842
+ expect(part?.tail_start_id).toBe(keep.id)
1843
+ } finally {
1844
+ await rt.dispose()
1845
+ }
1846
+ },
1847
+ })
1848
+ })
1849
+ })
1850
+
1851
+ describe("util.token.estimate", () => { // Pins Token.estimate to length / 4 for the inputs below.
1852
+ test("estimates tokens from text (4 chars per token)", () => {
1853
+ const text = "x".repeat(4000)
1854
+ expect(Token.estimate(text)).toBe(1000) // 4000 chars / 4
1855
+ })
1856
+
1857
+ test("estimates tokens from larger text", () => {
1858
+ const text = "y".repeat(20_000)
1859
+ expect(Token.estimate(text)).toBe(5000) // 20_000 chars / 4
1860
+ })
1861
+
1862
+ test("returns 0 for empty string", () => {
1863
+ expect(Token.estimate("")).toBe(0)
1864
+ })
1865
+ })
1866
+
1867
+ describe("SessionNs.getUsage", () => {
1868
+ test("normalizes standard usage to token format", () => {
1869
+ const model = createModel({ context: 100_000, output: 32_000 })
1870
+ const result = SessionNs.getUsage({
1871
+ model,
1872
+ usage: {
1873
+ inputTokens: 1000,
1874
+ outputTokens: 500,
1875
+ totalTokens: 1500,
1876
+ inputTokenDetails: {
1877
+ noCacheTokens: undefined,
1878
+ cacheReadTokens: undefined,
1879
+ cacheWriteTokens: undefined,
1880
+ },
1881
+ outputTokenDetails: {
1882
+ textTokens: undefined,
1883
+ reasoningTokens: undefined,
1884
+ },
1885
+ },
1886
+ })
1887
+
1888
+ expect(result.tokens.input).toBe(1000)
1889
+ expect(result.tokens.output).toBe(500)
1890
+ expect(result.tokens.reasoning).toBe(0)
1891
+ expect(result.tokens.cache.read).toBe(0)
1892
+ expect(result.tokens.cache.write).toBe(0)
1893
+ })
1894
+
1895
+ test("extracts cached tokens to cache.read", () => {
1896
+ const model = createModel({ context: 100_000, output: 32_000 })
1897
+ const result = SessionNs.getUsage({
1898
+ model,
1899
+ usage: {
1900
+ inputTokens: 1000,
1901
+ outputTokens: 500,
1902
+ totalTokens: 1500,
1903
+ inputTokenDetails: {
1904
+ noCacheTokens: 800,
1905
+ cacheReadTokens: 200,
1906
+ cacheWriteTokens: undefined,
1907
+ },
1908
+ outputTokenDetails: {
1909
+ textTokens: undefined,
1910
+ reasoningTokens: undefined,
1911
+ },
1912
+ },
1913
+ })
1914
+
1915
+ expect(result.tokens.input).toBe(800)
1916
+ expect(result.tokens.cache.read).toBe(200)
1917
+ })
1918
+
1919
+ test("handles anthropic cache write metadata", () => {
1920
+ const model = createModel({ context: 100_000, output: 32_000 })
1921
+ const result = SessionNs.getUsage({
1922
+ model,
1923
+ usage: {
1924
+ inputTokens: 1000,
1925
+ outputTokens: 500,
1926
+ totalTokens: 1500,
1927
+ inputTokenDetails: {
1928
+ noCacheTokens: undefined,
1929
+ cacheReadTokens: undefined,
1930
+ cacheWriteTokens: undefined,
1931
+ },
1932
+ outputTokenDetails: {
1933
+ textTokens: undefined,
1934
+ reasoningTokens: undefined,
1935
+ },
1936
+ },
1937
+ metadata: {
1938
+ anthropic: {
1939
+ cacheCreationInputTokens: 300,
1940
+ },
1941
+ },
1942
+ })
1943
+
1944
+ expect(result.tokens.cache.write).toBe(300)
1945
+ })
1946
+
1947
+ test("subtracts cached tokens for anthropic provider", () => {
1948
+ const model = createModel({ context: 100_000, output: 32_000 })
1949
+ // AI SDK v6 normalizes inputTokens to include cached tokens for all providers
1950
+ const result = SessionNs.getUsage({
1951
+ model,
1952
+ usage: {
1953
+ inputTokens: 1000,
1954
+ outputTokens: 500,
1955
+ totalTokens: 1500,
1956
+ inputTokenDetails: {
1957
+ noCacheTokens: 800,
1958
+ cacheReadTokens: 200,
1959
+ cacheWriteTokens: undefined,
1960
+ },
1961
+ outputTokenDetails: {
1962
+ textTokens: undefined,
1963
+ reasoningTokens: undefined,
1964
+ },
1965
+ },
1966
+ metadata: {
1967
+ anthropic: {},
1968
+ },
1969
+ })
1970
+
1971
+ expect(result.tokens.input).toBe(800)
1972
+ expect(result.tokens.cache.read).toBe(200)
1973
+ })
1974
+
1975
+ test("separates reasoning tokens from output tokens", () => {
1976
+ const model = createModel({ context: 100_000, output: 32_000 })
1977
+ const result = SessionNs.getUsage({
1978
+ model,
1979
+ usage: {
1980
+ inputTokens: 1000,
1981
+ outputTokens: 500,
1982
+ totalTokens: 1500,
1983
+ inputTokenDetails: {
1984
+ noCacheTokens: undefined,
1985
+ cacheReadTokens: undefined,
1986
+ cacheWriteTokens: undefined,
1987
+ },
1988
+ outputTokenDetails: {
1989
+ textTokens: 400,
1990
+ reasoningTokens: 100,
1991
+ },
1992
+ },
1993
+ })
1994
+
1995
+ expect(result.tokens.input).toBe(1000)
1996
+ expect(result.tokens.output).toBe(400)
1997
+ expect(result.tokens.reasoning).toBe(100)
1998
+ expect(result.tokens.total).toBe(1500)
1999
+ })
2000
+
2001
+ test("does not double count reasoning tokens in cost", () => {
2002
+ const model = createModel({
2003
+ context: 100_000,
2004
+ output: 32_000,
2005
+ cost: {
2006
+ input: 0,
2007
+ output: 15,
2008
+ cache: { read: 0, write: 0 },
2009
+ },
2010
+ })
2011
+ const result = SessionNs.getUsage({
2012
+ model,
2013
+ usage: {
2014
+ inputTokens: 0,
2015
+ outputTokens: 1_000_000,
2016
+ totalTokens: 1_000_000,
2017
+ inputTokenDetails: {
2018
+ noCacheTokens: undefined,
2019
+ cacheReadTokens: undefined,
2020
+ cacheWriteTokens: undefined,
2021
+ },
2022
+ outputTokenDetails: {
2023
+ textTokens: 750_000,
2024
+ reasoningTokens: 250_000,
2025
+ },
2026
+ },
2027
+ })
2028
+
2029
+ expect(result.tokens.output).toBe(750_000)
2030
+ expect(result.tokens.reasoning).toBe(250_000)
2031
+ expect(result.cost).toBe(15)
2032
+ })
2033
+
2034
+ test("handles undefined optional values gracefully", () => {
2035
+ const model = createModel({ context: 100_000, output: 32_000 })
2036
+ const result = SessionNs.getUsage({
2037
+ model,
2038
+ usage: {
2039
+ inputTokens: 0,
2040
+ outputTokens: 0,
2041
+ totalTokens: 0,
2042
+ inputTokenDetails: {
2043
+ noCacheTokens: undefined,
2044
+ cacheReadTokens: undefined,
2045
+ cacheWriteTokens: undefined,
2046
+ },
2047
+ outputTokenDetails: {
2048
+ textTokens: undefined,
2049
+ reasoningTokens: undefined,
2050
+ },
2051
+ },
2052
+ })
2053
+
2054
+ expect(result.tokens.input).toBe(0)
2055
+ expect(result.tokens.output).toBe(0)
2056
+ expect(result.tokens.reasoning).toBe(0)
2057
+ expect(result.tokens.cache.read).toBe(0)
2058
+ expect(result.tokens.cache.write).toBe(0)
2059
+ expect(Number.isNaN(result.cost)).toBe(false)
2060
+ })
2061
+
2062
// With no provider metadata the cost is derived from the model's own rates.
// The expected 3 + 1.5 is consistent with per-million-token pricing
// (1M input at 3, 100k output at 15) — presumably the unit used by getUsage.
test("calculates cost correctly", () => {
  const rates = {
    input: 3,
    output: 15,
    cache: { read: 0.3, write: 3.75 },
  }
  const pricedModel = createModel({ context: 100_000, output: 32_000, cost: rates })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: {
      noCacheTokens: undefined,
      cacheReadTokens: undefined,
      cacheWriteTokens: undefined,
    },
    outputTokenDetails: {
      textTokens: undefined,
      reasoningTokens: undefined,
    },
  }

  const { cost } = SessionNs.getUsage({ model: pricedModel, usage: reportedUsage })

  expect(cost).toBe(3 + 1.5)
})
2092
// A cost reported under metadata.openrouter.usage wins over the locally calculated one.
test("uses openrouter provider cost when available", () => {
  const pricedModel = createModel({
    context: 100_000,
    output: 32_000,
    cost: { input: 3, output: 15, cache: { read: 0.3, write: 3.75 } },
  })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
    outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
  }

  const { cost } = SessionNs.getUsage({
    model: pricedModel,
    usage: reportedUsage,
    metadata: {
      openrouter: {
        // Provider-reported figure; expected to replace the calculated value.
        usage: { cost: 0.42 },
      },
    },
  })

  // The model rates alone would yield 4.5 for this usage; 0.42 proves the override.
  expect(cost).toBe(0.42)
})
2123
+
2124
// metadata.openrouter.usage exists but carries no cost field, so the
// model-rate calculation must be used instead.
test("falls back to calculated cost when openrouter cost is not available", () => {
  const pricedModel = createModel({
    context: 100_000,
    output: 32_000,
    cost: { input: 3, output: 15, cache: { read: 0.3, write: 3.75 } },
  })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
    outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
  }

  const { cost } = SessionNs.getUsage({
    model: pricedModel,
    usage: reportedUsage,
    metadata: {
      openrouter: {
        // Deliberately empty: no cost reported by the provider.
        usage: {},
      },
    },
  })

  // Same value as the plain calculated-cost case.
  expect(cost).toBe(3 + 1.5)
})
2155
+
2156
// metadata.openrouter is present but has no usage object at all; the
// calculated cost must still be returned.
test("falls back to calculated cost when openrouter metadata is empty", () => {
  const pricedModel = createModel({
    context: 100_000,
    output: 32_000,
    cost: { input: 3, output: 15, cache: { read: 0.3, write: 3.75 } },
  })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
    outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
  }

  const { cost } = SessionNs.getUsage({
    model: pricedModel,
    usage: reportedUsage,
    metadata: { openrouter: {} },
  })

  // Same value as the plain calculated-cost case.
  expect(cost).toBe(3 + 1.5)
})
2183
+
2184
// For the "saeeol" provider the upstream inference cost from costDetails is
// expected to be reported instead of the top-level OpenRouter cost.
test("uses upstreamInferenceCost for Saeeol provider", () => {
  const saeeolProvider = { id: "saeeol" } as Provider.Info
  const pricedModel = createModel({
    context: 100_000,
    output: 32_000,
    cost: { input: 3, output: 15, cache: { read: 0.3, write: 3.75 } },
  })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
    outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
  }

  const { cost } = SessionNs.getUsage({
    model: pricedModel,
    provider: saeeolProvider,
    usage: reportedUsage,
    metadata: {
      openrouter: {
        usage: {
          // OpenRouter's 5% fee on the upstream amount.
          cost: 0.01,
          costDetails: {
            // The actual inference cost.
            upstreamInferenceCost: 0.2,
          },
        },
      },
    },
  })

  // Saeeol (BYOK) reports the upstream inference cost.
  expect(cost).toBe(0.2)
})
2220
+
2221
// For the "openrouter" provider the top-level cost is reported even when an
// upstreamInferenceCost is also present in costDetails.
test("uses regular cost for OpenRouter provider", () => {
  const openrouterProvider = { id: "openrouter" } as Provider.Info
  const pricedModel = createModel({
    context: 100_000,
    output: 32_000,
    cost: { input: 3, output: 15, cache: { read: 0.3, write: 3.75 } },
  })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
    outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
  }

  const { cost } = SessionNs.getUsage({
    model: pricedModel,
    provider: openrouterProvider,
    usage: reportedUsage,
    metadata: {
      openrouter: {
        usage: {
          // Regular OpenRouter cost; this is the value expected back.
          cost: 0.5,
          costDetails: {
            upstreamInferenceCost: 0.45,
          },
        },
      },
    },
  })

  // The upstream figure (0.45) must be ignored for this provider.
  expect(cost).toBe(0.5)
})
2257
+
2258
// No provider argument is passed: the top-level OpenRouter cost is expected,
// not the upstreamInferenceCost from costDetails.
test("falls back to regular cost when provider is not specified", () => {
  const pricedModel = createModel({
    context: 100_000,
    output: 32_000,
    cost: { input: 3, output: 15, cache: { read: 0.3, write: 3.75 } },
  })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
    outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
  }

  const { cost } = SessionNs.getUsage({
    model: pricedModel,
    usage: reportedUsage,
    metadata: {
      openrouter: {
        usage: {
          cost: 0.3,
          costDetails: {
            upstreamInferenceCost: 0.25,
          },
        },
      },
    },
  })

  // Regular cost is used when the provider is unknown.
  expect(cost).toBe(0.3)
})
2292
+
2293
// Saeeol provider, but the metadata has no costDetails: the top-level cost
// field is the expected fallback.
test("uses regular cost when upstreamInferenceCost is missing for Saeeol", () => {
  const saeeolProvider = { id: "saeeol" } as Provider.Info
  const pricedModel = createModel({
    context: 100_000,
    output: 32_000,
    cost: { input: 3, output: 15, cache: { read: 0.3, write: 3.75 } },
  })
  const reportedUsage = {
    inputTokens: 1_000_000,
    outputTokens: 100_000,
    totalTokens: 1_100_000,
    inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
    outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
  }

  const { cost } = SessionNs.getUsage({
    model: pricedModel,
    provider: saeeolProvider,
    usage: reportedUsage,
    metadata: {
      openrouter: {
        usage: {
          // Only the regular cost is present; costDetails is intentionally omitted.
          cost: 0.01,
        },
      },
    },
  })

  // With no upstream cost available, the regular cost field is returned.
  expect(cost).toBe(0.01)
})
2327
+
2328
+ // Tests for Anthropic Messages / OpenAI Responses / Vercel AI Gateway cost extraction
2329
+ // live in test/saeeol/provider-cost.test.ts (saeeol_change).
2330
+
2331
// Runs once per Anthropic-family SDK package. The cache-write count arrives via
// provider metadata: under bedrock.usage.cacheWriteInputTokens for Bedrock, and
// under anthropic.cacheCreationInputTokens for the other two packages.
test.each(["@ai-sdk/anthropic", "@ai-sdk/amazon-bedrock", "@ai-sdk/google-vertex/anthropic"])(
  "computes total from components for %s models",
  (sdkPackage) => {
    const model = createModel({ context: 100_000, output: 32_000, npm: sdkPackage })
    // AI SDK v6: inputTokens includes cached tokens for all providers
    const usage = {
      inputTokens: 1000,
      outputTokens: 500,
      totalTokens: 1500,
      inputTokenDetails: {
        noCacheTokens: 800,
        cacheReadTokens: 200,
        cacheWriteTokens: undefined,
      },
      outputTokenDetails: {
        textTokens: undefined,
        reasoningTokens: undefined,
      },
    }

    // Only the metadata shape differs between providers; the expectations are shared.
    const result =
      sdkPackage === "@ai-sdk/amazon-bedrock"
        ? SessionNs.getUsage({
            model,
            usage,
            metadata: {
              bedrock: {
                usage: {
                  cacheWriteInputTokens: 300,
                },
              },
            },
          })
        : SessionNs.getUsage({
            model,
            usage,
            metadata: {
              anthropic: {
                cacheCreationInputTokens: 300,
              },
            },
          })

    // inputTokens (1000) includes cache, so adjusted = 1000 - 200 - 300 = 500
    expect(result.tokens.input).toBe(500)
    expect(result.tokens.cache.read).toBe(200)
    expect(result.tokens.cache.write).toBe(300)
    // total = adjusted (500) + output (500) + cacheRead (200) + cacheWrite (300)
    expect(result.tokens.total).toBe(1500)
  },
)
2390
+
2391
// Same fixture as the Anthropic-family cases, but the cache-write count is
// supplied under the "vertex" metadata key instead of "anthropic".
test("extracts cache write tokens from vertex metadata key", () => {
  const vertexModel = createModel({
    context: 100_000,
    output: 32_000,
    npm: "@ai-sdk/google-vertex/anthropic",
  })
  const reportedUsage = {
    inputTokens: 1000,
    outputTokens: 500,
    totalTokens: 1500,
    inputTokenDetails: {
      noCacheTokens: 800,
      cacheReadTokens: 200,
      cacheWriteTokens: undefined,
    },
    outputTokenDetails: {
      textTokens: undefined,
      reasoningTokens: undefined,
    },
  }

  const { tokens } = SessionNs.getUsage({
    model: vertexModel,
    usage: reportedUsage,
    metadata: {
      vertex: {
        cacheCreationInputTokens: 300,
      },
    },
  })

  // 1000 reported input - 200 cache read - 300 cache write = 500 uncached input.
  expect(tokens.input).toBe(500)
  expect(tokens.cache.read).toBe(200)
  expect(tokens.cache.write).toBe(300)
})
2420
+ })