saeeol 1.2.4 → 1.2.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (483) hide show
  1. package/bin/saeeol.cjs +2 -1
  2. package/package.json +15 -12
  3. package/src/ltm/config.ts +15 -15
  4. package/src/ltm/events.ts +1 -1
  5. package/src/ltm/index.ts +1 -1
  6. package/src/ltm/pipeline.ts +23 -23
  7. package/src/ltm/scheduler.ts +91 -17
  8. package/src/ltm/store.ts +9 -7
  9. package/src/ltm/types.ts +15 -15
  10. package/src/provider/local/embedder.ts +24 -24
  11. package/src/provider/models-snapshot.d.ts +2 -0
  12. package/src/provider/models-snapshot.js +3 -0
  13. package/src/session/message/message-errors.ts +1 -1
  14. package/src/session/message/message-parts.ts +1 -1
  15. package/src/session/message/message-transform.ts +1 -1
  16. package/src/session/message/message-types.ts +1 -1
  17. package/src/tool/core/tool.ts +1 -1
  18. package/AGENTS.md +0 -72
  19. package/BUN_SHELL_MIGRATION_PLAN.md +0 -136
  20. package/Dockerfile +0 -18
  21. package/assets/saeeol.ico +0 -0
  22. package/bin/saeeol +0 -187
  23. package/bunfig.toml +0 -7
  24. package/database.db +0 -0
  25. package/drizzle.config.ts +0 -10
  26. package/git +0 -0
  27. package/migration/20260127222353_familiar_lady_ursula/migration.sql +0 -90
  28. package/migration/20260127222353_familiar_lady_ursula/snapshot.json +0 -796
  29. package/migration/20260211171708_add_project_commands/migration.sql +0 -1
  30. package/migration/20260211171708_add_project_commands/snapshot.json +0 -806
  31. package/migration/20260213144116_wakeful_the_professor/migration.sql +0 -11
  32. package/migration/20260213144116_wakeful_the_professor/snapshot.json +0 -897
  33. package/migration/20260225215848_workspace/migration.sql +0 -7
  34. package/migration/20260225215848_workspace/snapshot.json +0 -959
  35. package/migration/20260227213759_add_session_workspace_id/migration.sql +0 -2
  36. package/migration/20260227213759_add_session_workspace_id/snapshot.json +0 -983
  37. package/migration/20260228203230_blue_harpoon/migration.sql +0 -17
  38. package/migration/20260228203230_blue_harpoon/snapshot.json +0 -1102
  39. package/migration/20260303231226_add_workspace_fields/migration.sql +0 -5
  40. package/migration/20260303231226_add_workspace_fields/snapshot.json +0 -1013
  41. package/migration/20260309230000_move_org_to_state/migration.sql +0 -3
  42. package/migration/20260309230000_move_org_to_state/snapshot.json +0 -1156
  43. package/migration/20260312043431_session_message_cursor/migration.sql +0 -4
  44. package/migration/20260312043431_session_message_cursor/snapshot.json +0 -1168
  45. package/migration/20260323234822_events/migration.sql +0 -13
  46. package/migration/20260323234822_events/snapshot.json +0 -1271
  47. package/migration/20260410174513_workspace-name/migration.sql +0 -16
  48. package/migration/20260410174513_workspace-name/snapshot.json +0 -1271
  49. package/migration/20260413175956_chief_energizer/migration.sql +0 -13
  50. package/migration/20260413175956_chief_energizer/snapshot.json +0 -1399
  51. package/migration/20260423070820_add_icon_url_override/migration.sql +0 -2
  52. package/migration/20260423070820_add_icon_url_override/snapshot.json +0 -1409
  53. package/migration/20260428004200_add_session_path/migration.sql +0 -1
  54. package/migration/20260428004200_add_session_path/snapshot.json +0 -1419
  55. package/npm/bin/saeeol +0 -42
  56. package/npm/package.json +0 -39
  57. package/npm/postinstall.js +0 -162
  58. package/parsers-config.ts +0 -289
  59. package/script/build.ts +0 -393
  60. package/script/check-migrations.ts +0 -16
  61. package/script/fix-node-pty.ts +0 -34
  62. package/script/generate.ts +0 -23
  63. package/script/postinstall.mjs +0 -189
  64. package/script/publish.ts +0 -200
  65. package/script/run-workspace-server +0 -106
  66. package/script/schema.ts +0 -63
  67. package/script/test-runner.ts +0 -420
  68. package/script/time.ts +0 -6
  69. package/script/trace-imports.ts +0 -153
  70. package/script/upgrade-opentui.ts +0 -64
  71. package/scripts/diff-sdk-types.sh +0 -52
  72. package/specs/effect/facades.md +0 -221
  73. package/specs/effect/http-api.md +0 -401
  74. package/specs/effect/instance-context.md +0 -309
  75. package/specs/effect/loose-ends.md +0 -34
  76. package/specs/effect/migration.md +0 -299
  77. package/specs/effect/routes.md +0 -64
  78. package/specs/effect/schema.md +0 -399
  79. package/specs/effect/server-package.md +0 -668
  80. package/specs/effect/tools.md +0 -90
  81. package/specs/tui-plugins.md +0 -433
  82. package/specs/v2/api.ts +0 -67
  83. package/specs/v2/keymappings.md +0 -10
  84. package/specs/v2/message-shape.md +0 -136
  85. package/src/tool/apply_patch.txt +0 -33
  86. package/src/tool/bash.txt +0 -119
  87. package/src/tool/edit.txt +0 -10
  88. package/src/tool/glob.txt +0 -6
  89. package/src/tool/grep.txt +0 -8
  90. package/src/tool/lsp.txt +0 -24
  91. package/src/tool/plan-enter.txt +0 -14
  92. package/src/tool/plan-exit.txt +0 -13
  93. package/src/tool/question.txt +0 -11
  94. package/src/tool/read.txt +0 -14
  95. package/src/tool/recall.txt +0 -12
  96. package/src/tool/skill.txt +0 -5
  97. package/src/tool/task.txt +0 -57
  98. package/src/tool/todowrite.txt +0 -167
  99. package/src/tool/warpgrep.txt +0 -10
  100. package/src/tool/webfetch.txt +0 -13
  101. package/src/tool/websearch.txt +0 -14
  102. package/src/tool/write.txt +0 -8
  103. package/sst-env.d.ts +0 -10
  104. package/test/AGENTS.md +0 -133
  105. package/test/account/repo.test.ts +0 -352
  106. package/test/account/service.test.ts +0 -456
  107. package/test/acp/agent-interface.test.ts +0 -51
  108. package/test/acp/event-subscription.test.ts +0 -725
  109. package/test/agent/agent.test.ts +0 -890
  110. package/test/auth/auth.test.ts +0 -86
  111. package/test/bun/registry.test.ts +0 -75
  112. package/test/bus/bus-effect.test.ts +0 -161
  113. package/test/bus/bus-integration.test.ts +0 -87
  114. package/test/bus/bus.test.ts +0 -219
  115. package/test/cli/account.test.ts +0 -26
  116. package/test/cli/auto-mode.test.ts +0 -75
  117. package/test/cli/bin-saeeol.test.ts +0 -8
  118. package/test/cli/cmd/tui/prompt-part.test.ts +0 -47
  119. package/test/cli/cmd/tui/prompt-traits.test.ts +0 -38
  120. package/test/cli/cmd/tui/sync.test.tsx +0 -159
  121. package/test/cli/error.test.ts +0 -18
  122. package/test/cli/github-action.test.ts +0 -198
  123. package/test/cli/github-remote.test.ts +0 -85
  124. package/test/cli/import.test.ts +0 -97
  125. package/test/cli/install-artifact.test.ts +0 -72
  126. package/test/cli/plugin-auth-picker.test.ts +0 -120
  127. package/test/cli/pr.test.ts +0 -59
  128. package/test/cli/tui/editor-context-zed.test.ts +0 -356
  129. package/test/cli/tui/editor-context.test.tsx +0 -228
  130. package/test/cli/tui/keybind-plugin.test.ts +0 -90
  131. package/test/cli/tui/markdown.test.ts +0 -161
  132. package/test/cli/tui/plugin-add.test.ts +0 -111
  133. package/test/cli/tui/plugin-install.test.ts +0 -87
  134. package/test/cli/tui/plugin-lifecycle.test.ts +0 -224
  135. package/test/cli/tui/plugin-loader-entrypoint.test.ts +0 -484
  136. package/test/cli/tui/plugin-loader-pure.test.ts +0 -71
  137. package/test/cli/tui/plugin-loader.test.ts +0 -816
  138. package/test/cli/tui/plugin-toggle.test.ts +0 -157
  139. package/test/cli/tui/revert-diff.test.ts +0 -35
  140. package/test/cli/tui/slot-replace.test.tsx +0 -47
  141. package/test/cli/tui/theme-store.test.ts +0 -54
  142. package/test/cli/tui/thread.test.ts +0 -28
  143. package/test/cli/tui/transcript.test.ts +0 -426
  144. package/test/cli/tui/usage.test.ts +0 -60
  145. package/test/cli/tui/use-event.test.tsx +0 -175
  146. package/test/config/agent-color.test.ts +0 -67
  147. package/test/config/config.test.ts +0 -2544
  148. package/test/config/fixtures/empty-frontmatter.md +0 -4
  149. package/test/config/fixtures/frontmatter.md +0 -28
  150. package/test/config/fixtures/markdown-header.md +0 -11
  151. package/test/config/fixtures/no-frontmatter.md +0 -1
  152. package/test/config/fixtures/weird-model-id.md +0 -13
  153. package/test/config/lsp.test.ts +0 -87
  154. package/test/config/markdown.test.ts +0 -228
  155. package/test/config/plugin.test.ts +0 -0
  156. package/test/config/tui.test.ts +0 -624
  157. package/test/control-plane/adapters.test.ts +0 -71
  158. package/test/control-plane/workspace.test.ts +0 -1526
  159. package/test/effect/app-runtime-logger.test.ts +0 -98
  160. package/test/effect/config-service.test.ts +0 -65
  161. package/test/effect/instance-state.test.ts +0 -394
  162. package/test/effect/run-service.test.ts +0 -89
  163. package/test/effect/runner.test.ts +0 -523
  164. package/test/fake/provider.ts +0 -82
  165. package/test/file/fsmonitor.test.ts +0 -68
  166. package/test/file/ignore.test.ts +0 -10
  167. package/test/file/index.test.ts +0 -954
  168. package/test/file/path-traversal.test.ts +0 -205
  169. package/test/file/ripgrep.test.ts +0 -226
  170. package/test/file/watcher.test.ts +0 -249
  171. package/test/filesystem/filesystem.test.ts +0 -319
  172. package/test/fixture/db.ts +0 -11
  173. package/test/fixture/fixture.test.ts +0 -26
  174. package/test/fixture/fixture.ts +0 -175
  175. package/test/fixture/flock-worker.ts +0 -72
  176. package/test/fixture/log-init-worker.ts +0 -62
  177. package/test/fixture/lsp/fake-lsp-server.js +0 -249
  178. package/test/fixture/plug-worker.ts +0 -93
  179. package/test/fixture/plugin-meta-worker.ts +0 -19
  180. package/test/fixture/skills/agents-sdk/SKILL.md +0 -152
  181. package/test/fixture/skills/cloudflare/SKILL.md +0 -211
  182. package/test/fixture/skills/index.json +0 -6
  183. package/test/fixture/tui-plugin.ts +0 -323
  184. package/test/fixture/tui-runtime.ts +0 -31
  185. package/test/format/format.test.ts +0 -272
  186. package/test/git/git.test.ts +0 -128
  187. package/test/ide/ide.test.ts +0 -82
  188. package/test/installation/installation.test.ts +0 -168
  189. package/test/keybind.test.ts +0 -421
  190. package/test/lib/effect.ts +0 -53
  191. package/test/lib/filesystem.ts +0 -10
  192. package/test/lib/llm-server.ts +0 -778
  193. package/test/lib/websocket.ts +0 -46
  194. package/test/lsp/client.test.ts +0 -482
  195. package/test/lsp/index.test.ts +0 -160
  196. package/test/lsp/launch.test.ts +0 -22
  197. package/test/lsp/lifecycle.test.ts +0 -184
  198. package/test/mcp/headers.test.ts +0 -178
  199. package/test/mcp/lifecycle.test.ts +0 -787
  200. package/test/mcp/oauth-auto-connect.test.ts +0 -311
  201. package/test/mcp/oauth-browser.test.ts +0 -276
  202. package/test/mcp/oauth-callback.test.ts +0 -34
  203. package/test/memory/abort-leak-webfetch.ts +0 -49
  204. package/test/memory/abort-leak.test.ts +0 -128
  205. package/test/patch/patch.test.ts +0 -348
  206. package/test/permission/arity.test.ts +0 -33
  207. package/test/permission/next.test.ts +0 -1227
  208. package/test/permission/next.toConfig.test.ts +0 -110
  209. package/test/permission-task.test.ts +0 -326
  210. package/test/plugin/auth-override.test.ts +0 -79
  211. package/test/plugin/cloudflare.test.ts +0 -68
  212. package/test/plugin/codex.test.ts +0 -123
  213. package/test/plugin/github-copilot-models.test.ts +0 -261
  214. package/test/plugin/install-concurrency.test.ts +0 -140
  215. package/test/plugin/install.test.ts +0 -570
  216. package/test/plugin/loader-shared.test.ts +0 -1169
  217. package/test/plugin/meta.test.ts +0 -137
  218. package/test/plugin/shared.test.ts +0 -88
  219. package/test/plugin/trigger.test.ts +0 -102
  220. package/test/plugin/workspace-adapter.test.ts +0 -109
  221. package/test/preload.ts +0 -77
  222. package/test/project/instance.test.ts +0 -276
  223. package/test/project/migrate-global.test.ts +0 -152
  224. package/test/project/project.test.ts +0 -600
  225. package/test/project/vcs.test.ts +0 -286
  226. package/test/project/worktree-remove.test.ts +0 -126
  227. package/test/project/worktree.test.ts +0 -223
  228. package/test/provider/amazon-bedrock.test.ts +0 -462
  229. package/test/provider/copilot/convert-to-copilot-messages.test.ts +0 -523
  230. package/test/provider/copilot/copilot-chat-model.test.ts +0 -592
  231. package/test/provider/gitlab-duo.test.ts +0 -413
  232. package/test/provider/local.test.ts +0 -208
  233. package/test/provider/models.test.ts +0 -261
  234. package/test/provider/provider-category.test.ts +0 -190
  235. package/test/provider/provider.test.ts +0 -2758
  236. package/test/provider/transform.test.ts +0 -3681
  237. package/test/pty/pty-output-isolation.test.ts +0 -147
  238. package/test/pty/pty-session.test.ts +0 -102
  239. package/test/pty/pty-shell.test.ts +0 -104
  240. package/test/question/question.test.ts +0 -490
  241. package/test/saeeol/agent-global-config-dirs.test.ts +0 -24
  242. package/test/saeeol/agent-manager-tool.test.ts +0 -71
  243. package/test/saeeol/agent-permission-overrides.test.ts +0 -75
  244. package/test/saeeol/agent-skill-permissions.test.ts +0 -37
  245. package/test/saeeol/ask-agent-permissions.test.ts +0 -303
  246. package/test/saeeol/bash-hierarchy.test.ts +0 -64
  247. package/test/saeeol/bash-permission-metadata.test.ts +0 -66
  248. package/test/saeeol/bash-security-extended.test.ts +0 -243
  249. package/test/saeeol/bedrock-claude-empty-content.test.ts +0 -138
  250. package/test/saeeol/boxes-integration.test.ts +0 -415
  251. package/test/saeeol/builtin-skills.test.ts +0 -75
  252. package/test/saeeol/cleanup.ts +0 -28
  253. package/test/saeeol/cli/dev-setup.test.ts +0 -74
  254. package/test/saeeol/cli/roll-call.test.ts +0 -161
  255. package/test/saeeol/cli-run-auto-helper.test.ts +0 -58
  256. package/test/saeeol/codex-auth-refresh.test.ts +0 -124
  257. package/test/saeeol/commit-message/generate.test.ts +0 -188
  258. package/test/saeeol/commit-message/git-context.test.ts +0 -303
  259. package/test/saeeol/commit-message-windows.test.ts +0 -38
  260. package/test/saeeol/compaction-payload-recovery.test.ts +0 -406
  261. package/test/saeeol/compaction-preservation-audit.test.ts +0 -122
  262. package/test/saeeol/compaction-skip-guard.test.ts +0 -224
  263. package/test/saeeol/compaction-smart-select.test.ts +0 -100
  264. package/test/saeeol/config/config.test.ts +0 -166
  265. package/test/saeeol/config/indexing-default-plugin.test.ts +0 -82
  266. package/test/saeeol/config/opentelemetry-default.test.ts +0 -29
  267. package/test/saeeol/config-gitignore.test.ts +0 -70
  268. package/test/saeeol/config-injector.test.ts +0 -305
  269. package/test/saeeol/config-resilience.test.ts +0 -234
  270. package/test/saeeol/config-validation.test.ts +0 -183
  271. package/test/saeeol/cost-propagation.test.ts +0 -94
  272. package/test/saeeol/cost-tracker-extended.test.ts +0 -141
  273. package/test/saeeol/cost-tracker.test.ts +0 -64
  274. package/test/saeeol/custom-provider-delete.test.ts +0 -149
  275. package/test/saeeol/diff-full.test.ts +0 -226
  276. package/test/saeeol/edit-permission-filediff.test.ts +0 -223
  277. package/test/saeeol/encoding.test.ts +0 -364
  278. package/test/saeeol/enhance-prompt.test.ts +0 -61
  279. package/test/saeeol/ensure-plan-dir.test.ts +0 -32
  280. package/test/saeeol/errors.test.ts +0 -144
  281. package/test/saeeol/external-directory-boundary.test.ts +0 -96
  282. package/test/saeeol/gateway-headers.test.ts +0 -88
  283. package/test/saeeol/help.test.ts +0 -191
  284. package/test/saeeol/ignore-migrator.test.ts +0 -308
  285. package/test/saeeol/indexing-auth.test.ts +0 -45
  286. package/test/saeeol/indexing-feature.test.ts +0 -44
  287. package/test/saeeol/indexing-label.test.ts +0 -70
  288. package/test/saeeol/indexing-startup.test.ts +0 -381
  289. package/test/saeeol/indexing-worktree.test.ts +0 -73
  290. package/test/saeeol/instruction.test.ts +0 -136
  291. package/test/saeeol/lancedb-runtime.test.ts +0 -116
  292. package/test/saeeol/loader-auth.test.ts +0 -168
  293. package/test/saeeol/local-model.test.ts +0 -621
  294. package/test/saeeol/logo.test.ts +0 -31
  295. package/test/saeeol/lsp-typescript-lightweight.test.ts +0 -89
  296. package/test/saeeol/mcp-branding.test.ts +0 -33
  297. package/test/saeeol/mcp-docker-rm.test.ts +0 -32
  298. package/test/saeeol/mcp-migrator.test.ts +0 -736
  299. package/test/saeeol/mcp-oauth-callback.test.ts +0 -33
  300. package/test/saeeol/memory-io.test.ts +0 -198
  301. package/test/saeeol/memory-paths.test.ts +0 -87
  302. package/test/saeeol/memory-security.test.ts +0 -166
  303. package/test/saeeol/model-cache-org.test.ts +0 -164
  304. package/test/saeeol/model-info-panel-utils.test.ts +0 -52
  305. package/test/saeeol/model-info-panel.types.test.ts +0 -7
  306. package/test/saeeol/models-401-fallback.test.ts +0 -52
  307. package/test/saeeol/modes-migrator.test.ts +0 -320
  308. package/test/saeeol/nvidia-headers.test.ts +0 -74
  309. package/test/saeeol/patch-jsonc.test.ts +0 -73
  310. package/test/saeeol/patch.test.ts +0 -172
  311. package/test/saeeol/paths.test.ts +0 -265
  312. package/test/saeeol/permission/config-paths.test.ts +0 -174
  313. package/test/saeeol/permission/env-read.test.ts +0 -149
  314. package/test/saeeol/permission/external-directory-allow.test.ts +0 -327
  315. package/test/saeeol/permission/next.always-rules.test.ts +0 -882
  316. package/test/saeeol/permission/next.reply-http.test.ts +0 -205
  317. package/test/saeeol/permission/next.reply-routing.test.ts +0 -184
  318. package/test/saeeol/plan-exit-detection.test.ts +0 -494
  319. package/test/saeeol/plan-followup.test.ts +0 -1376
  320. package/test/saeeol/project-config-update.test.ts +0 -120
  321. package/test/saeeol/project-id.test.ts +0 -455
  322. package/test/saeeol/provider-cost.test.ts +0 -171
  323. package/test/saeeol/provider-list-failed-state.test.ts +0 -100
  324. package/test/saeeol/question-dismiss-all.test.ts +0 -174
  325. package/test/saeeol/read-directory.test.ts +0 -116
  326. package/test/saeeol/rules-migrator.test.ts +0 -257
  327. package/test/saeeol/run-auto.test.ts +0 -176
  328. package/test/saeeol/run-network.test.ts +0 -224
  329. package/test/saeeol/semantic-search.test.ts +0 -186
  330. package/test/saeeol/server/permission-allow-everything.test.ts +0 -125
  331. package/test/saeeol/session/instruction-substitution.test.ts +0 -72
  332. package/test/saeeol/session/platform-attribution.test.ts +0 -118
  333. package/test/saeeol/session/session.test.ts +0 -105
  334. package/test/saeeol/session-compaction-cap.test.ts +0 -399
  335. package/test/saeeol/session-compaction-chunks.test.ts +0 -501
  336. package/test/saeeol/session-compaction-safety.test.ts +0 -481
  337. package/test/saeeol/session-fork-remap.test.ts +0 -251
  338. package/test/saeeol/session-import-service.test.ts +0 -114
  339. package/test/saeeol/session-list.test.ts +0 -47
  340. package/test/saeeol/session-message-metadata.test.ts +0 -128
  341. package/test/saeeol/session-overflow.test.ts +0 -78
  342. package/test/saeeol/session-processor-empty-tool-calls.test.ts +0 -571
  343. package/test/saeeol/session-processor-network-offline.test.ts +0 -204
  344. package/test/saeeol/session-processor-retry-limit.test.ts +0 -238
  345. package/test/saeeol/session-processor-review-telemetry.test.ts +0 -82
  346. package/test/saeeol/session-prompt-compaction-safety.test.ts +0 -517
  347. package/test/saeeol/session-prompt-queue.test.ts +0 -815
  348. package/test/saeeol/sessions/inflight-cache.test.ts +0 -157
  349. package/test/saeeol/sessions/ingest-queue.test.ts +0 -402
  350. package/test/saeeol/sessions/remote-protocol.test.ts +0 -258
  351. package/test/saeeol/sessions/remote-sender.test.ts +0 -1036
  352. package/test/saeeol/sessions/remote-ws.test.ts +0 -367
  353. package/test/saeeol/sessions/sessions-enable-remote.test.disable +0 -181
  354. package/test/saeeol/slot-prop-reactivity.test.ts +0 -142
  355. package/test/saeeol/snapshot-cache.test.ts +0 -84
  356. package/test/saeeol/snapshot-freeze-repro.test.ts +0 -100
  357. package/test/saeeol/snapshot-track-timeout.test.ts +0 -519
  358. package/test/saeeol/stats-subagent-cost.test.ts +0 -123
  359. package/test/saeeol/suggestion/auto-dismiss.test.ts +0 -65
  360. package/test/saeeol/suggestion/suggestion.test.ts +0 -145
  361. package/test/saeeol/suggestion/tool.test.ts +0 -298
  362. package/test/saeeol/summary-file-diff.test.ts +0 -28
  363. package/test/saeeol/system-prompt.test.ts +0 -142
  364. package/test/saeeol/task-nesting.test.ts +0 -193
  365. package/test/saeeol/telemetry/feedback.test.ts +0 -8
  366. package/test/saeeol/todo-view.test.ts +0 -57
  367. package/test/saeeol/tool-encoding.test.ts +0 -455
  368. package/test/saeeol/tool-registry-indexing-import-failure.test.ts +0 -49
  369. package/test/saeeol/tool-registry-indexing.test.ts +0 -236
  370. package/test/saeeol/tool-registry-semantic-import-failure.test.ts +0 -55
  371. package/test/saeeol/tool-task-model.test.ts +0 -352
  372. package/test/saeeol/transform-opus-4.7.test.ts +0 -89
  373. package/test/saeeol/tui-diff.test.ts +0 -91
  374. package/test/saeeol/tui-sync.test.ts +0 -80
  375. package/test/saeeol/util/url.test.ts +0 -141
  376. package/test/saeeol/workflows-migrator.test.ts +0 -261
  377. package/test/saeeol/worktree-diff-summary.test.ts +0 -64
  378. package/test/saeeol/worktree-diff.test.ts +0 -223
  379. package/test/saeeol/worktree-remove-lock.test.ts +0 -82
  380. package/test/server/AGENTS.md +0 -15
  381. package/test/server/contract.test.ts +0 -249
  382. package/test/server/experimental-session-list.test.ts +0 -157
  383. package/test/server/global-session-list.test.ts +0 -155
  384. package/test/server/httpapi-authorization.test.ts +0 -103
  385. package/test/server/httpapi-bridge.test.ts +0 -440
  386. package/test/server/httpapi-config.test.ts +0 -67
  387. package/test/server/httpapi-cors.test.ts +0 -89
  388. package/test/server/httpapi-event.test.ts +0 -57
  389. package/test/server/httpapi-experimental.test.ts +0 -219
  390. package/test/server/httpapi-file.test.ts +0 -79
  391. package/test/server/httpapi-instance-context.test.ts +0 -237
  392. package/test/server/httpapi-instance.legacy.test.ts +0 -140
  393. package/test/server/httpapi-instance.test.ts +0 -83
  394. package/test/server/httpapi-json-parity.test.ts +0 -263
  395. package/test/server/httpapi-mcp-oauth.test.ts +0 -76
  396. package/test/server/httpapi-mcp.test.ts +0 -189
  397. package/test/server/httpapi-provider.test.ts +0 -153
  398. package/test/server/httpapi-pty-websocket.test.ts +0 -16
  399. package/test/server/httpapi-pty.test.ts +0 -175
  400. package/test/server/httpapi-raw-route-auth.test.ts +0 -89
  401. package/test/server/httpapi-sdk.test.ts +0 -679
  402. package/test/server/httpapi-session.test.ts +0 -464
  403. package/test/server/httpapi-sync.test.ts +0 -130
  404. package/test/server/httpapi-tui.test.ts +0 -121
  405. package/test/server/httpapi-workspace-routing.test.ts +0 -471
  406. package/test/server/httpapi-workspace.test.ts +0 -427
  407. package/test/server/project-init-git.test.ts +0 -113
  408. package/test/server/proxy-util.test.ts +0 -113
  409. package/test/server/session-actions.test.ts +0 -49
  410. package/test/server/session-list.test.ts +0 -238
  411. package/test/server/session-messages.test.ts +0 -167
  412. package/test/server/session-select.test.ts +0 -100
  413. package/test/server/trace-attributes.test.ts +0 -76
  414. package/test/server/workspace-proxy.test.ts +0 -165
  415. package/test/server/workspace-routing.test.ts +0 -85
  416. package/test/session/compaction.test.ts +0 -2420
  417. package/test/session/instruction.test.ts +0 -247
  418. package/test/session/llm.test.ts +0 -1273
  419. package/test/session/message-v2.test.ts +0 -1291
  420. package/test/session/messages-pagination.test.ts +0 -1173
  421. package/test/session/network.test.ts +0 -249
  422. package/test/session/processor-effect.test.ts +0 -847
  423. package/test/session/prompt.test.ts +0 -2131
  424. package/test/session/retry.test.ts +0 -340
  425. package/test/session/revert-compact.test.ts +0 -639
  426. package/test/session/schema-decoding.test.ts +0 -311
  427. package/test/session/session-entry-stepper.test.ts +0 -917
  428. package/test/session/session-schema.test.ts +0 -76
  429. package/test/session/snapshot-tool-race.test.ts +0 -257
  430. package/test/session/structured-output-integration.test.ts +0 -265
  431. package/test/session/structured-output.test.ts +0 -381
  432. package/test/session/system.test.ts +0 -73
  433. package/test/share/share-next.test.ts +0 -333
  434. package/test/shell/shell.test.ts +0 -99
  435. package/test/skill/discovery.test.ts +0 -116
  436. package/test/skill/skill.test.ts +0 -393
  437. package/test/snapshot/snapshot.test.ts +0 -1531
  438. package/test/storage/db.test.ts +0 -23
  439. package/test/storage/json-migration.test.ts +0 -832
  440. package/test/storage/storage.test.ts +0 -293
  441. package/test/suggestion/suggestion.test.ts +0 -1
  442. package/test/sync/index.test.ts +0 -256
  443. package/test/tool/__snapshots__/parameters.test.ts.snap +0 -500
  444. package/test/tool/__snapshots__/tool.test.ts.snap +0 -9
  445. package/test/tool/apply_patch.test.ts +0 -614
  446. package/test/tool/bash.test.ts +0 -1225
  447. package/test/tool/diagnostics-filter.test.ts +0 -55
  448. package/test/tool/edit.test.ts +0 -754
  449. package/test/tool/external-directory.test.ts +0 -169
  450. package/test/tool/fixtures/large-image.png +0 -0
  451. package/test/tool/fixtures/models-api.json +0 -65179
  452. package/test/tool/glob.test.ts +0 -107
  453. package/test/tool/grep.test.ts +0 -114
  454. package/test/tool/lsp.test.ts +0 -187
  455. package/test/tool/parameters.test.ts +0 -243
  456. package/test/tool/question.test.ts +0 -129
  457. package/test/tool/read.test.ts +0 -500
  458. package/test/tool/recall.test.ts +0 -151
  459. package/test/tool/registry.test.ts +0 -203
  460. package/test/tool/skill.test.ts +0 -135
  461. package/test/tool/suggest.test.ts +0 -1
  462. package/test/tool/task.test.ts +0 -612
  463. package/test/tool/tool-define.test.ts +0 -99
  464. package/test/tool/truncation.test.ts +0 -260
  465. package/test/tool/webfetch.test.ts +0 -103
  466. package/test/tool/write.test.ts +0 -291
  467. package/test/util/data-url.test.ts +0 -14
  468. package/test/util/effect-zod.test.ts +0 -754
  469. package/test/util/error.test.ts +0 -38
  470. package/test/util/filesystem.test.ts +0 -656
  471. package/test/util/format.test.ts +0 -59
  472. package/test/util/glob.test.ts +0 -164
  473. package/test/util/iife.test.ts +0 -36
  474. package/test/util/lazy.test.ts +0 -50
  475. package/test/util/lock.test.ts +0 -72
  476. package/test/util/log.test.ts +0 -86
  477. package/test/util/module.test.ts +0 -59
  478. package/test/util/process.test.ts +0 -128
  479. package/test/util/timeout.test.ts +0 -21
  480. package/test/util/which.test.ts +0 -100
  481. package/test/util/wildcard.test.ts +0 -90
  482. package/test/workspace/workspace-restore.test.ts +0 -296
  483. package/tsconfig.json +0 -19
@@ -1,2420 +0,0 @@
1
- import { afterEach, describe, expect, mock, test } from "bun:test"
2
- import { APICallError } from "ai"
3
- import { Cause, Effect, Exit, Layer, ManagedRuntime } from "effect"
4
- import * as Stream from "effect/Stream"
5
- import z from "zod"
6
- import { Bus } from "../../src/bus"
7
- import { Config } from "@/config/config"
8
- import { Agent } from "../../src/agent/agent"
9
- import { LLM } from "../../src/session/llm"
10
- import { SessionCompaction } from "../../src/session/compaction"
11
- import { Token } from "@/util/token"
12
- import { Instance } from "../../src/project/instance"
13
- import * as Log from "@saeeol/core/util/log"
14
- import { Permission } from "../../src/permission"
15
- import { Plugin } from "../../src/plugin"
16
- import { provideTmpdirInstance, tmpdir } from "../fixture/fixture"
17
- import { Session as SessionNs } from "@/session/session"
18
- import { MessageV2 } from "../../src/session/message-v2"
19
- import { MessageID, PartID, SessionID } from "../../src/session/schema"
20
- import { SessionStatus } from "../../src/session/status"
21
- import { SessionSummary } from "../../src/session/summary"
22
- import { ModelID, ProviderID } from "../../src/provider/schema"
23
- import type { Provider } from "@/provider/provider"
24
- import * as SessionProcessorModule from "../../src/session/processor"
25
- import { Snapshot } from "../../src/snapshot"
26
- import { ProviderTest } from "../fake/provider"
27
- import { testEffect } from "../lib/effect"
28
- import { CrossSpawnSpawner } from "@saeeol/core/cross-spawn-spawner"
29
-
30
- void Log.init({ print: false })
31
-
32
- function run<A, E>(fx: Effect.Effect<A, E, SessionNs.Service>) {
33
- return Effect.runPromise(fx.pipe(Effect.provide(SessionNs.defaultLayer)))
34
- }
35
-
36
- const svc = {
37
- ...SessionNs,
38
- create(input?: SessionNs.CreateInput) {
39
- return run(SessionNs.Service.use((svc) => svc.create(input)))
40
- },
41
- messages(input: z.output<typeof SessionNs.MessagesInput.zod>) {
42
- return run(SessionNs.Service.use((svc) => svc.messages(input)))
43
- },
44
- updateMessage<T extends MessageV2.Info>(msg: T) {
45
- return run(SessionNs.Service.use((svc) => svc.updateMessage(msg)))
46
- },
47
- updatePart<T extends MessageV2.Part>(part: T) {
48
- return run(SessionNs.Service.use((svc) => svc.updatePart(part)))
49
- },
50
- }
51
-
52
- const summary = Layer.succeed(
53
- SessionSummary.Service,
54
- SessionSummary.Service.of({
55
- summarize: () => Effect.void,
56
- diff: () => Effect.succeed([]),
57
- computeDiff: () => Effect.succeed([]),
58
- }),
59
- )
60
-
61
- const ref = {
62
- providerID: ProviderID.make("test"),
63
- modelID: ModelID.make("test-model"),
64
- }
65
-
66
- afterEach(() => {
67
- mock.restore()
68
- })
69
-
70
- function createModel(opts: {
71
- context: number
72
- output: number
73
- input?: number
74
- cost?: Provider.Model["cost"]
75
- npm?: string
76
- }): Provider.Model {
77
- return {
78
- id: "test-model",
79
- providerID: "test",
80
- name: "Test",
81
- limit: {
82
- context: opts.context,
83
- input: opts.input,
84
- output: opts.output,
85
- },
86
- cost: opts.cost ?? { input: 0, output: 0, cache: { read: 0, write: 0 } },
87
- capabilities: {
88
- toolcall: true,
89
- attachment: false,
90
- reasoning: false,
91
- temperature: true,
92
- input: { text: true, image: false, audio: false, video: false },
93
- output: { text: true, image: false, audio: false, video: false },
94
- },
95
- api: { npm: opts.npm ?? "@ai-sdk/anthropic" },
96
- options: {},
97
- } as Provider.Model
98
- }
99
-
100
- const wide = () => ProviderTest.fake({ model: createModel({ context: 100_000, output: 32_000 }) })
101
-
102
- async function user(sessionID: SessionID, text: string) {
103
- const msg = await svc.updateMessage({
104
- id: MessageID.ascending(),
105
- role: "user",
106
- sessionID,
107
- agent: "build",
108
- model: ref,
109
- time: { created: Date.now() },
110
- })
111
- await svc.updatePart({
112
- id: PartID.ascending(),
113
- messageID: msg.id,
114
- sessionID,
115
- type: "text",
116
- text,
117
- })
118
- return msg
119
- }
120
-
121
- async function assistant(sessionID: SessionID, parentID: MessageID, root: string) {
122
- const msg: MessageV2.Assistant = {
123
- id: MessageID.ascending(),
124
- role: "assistant",
125
- sessionID,
126
- mode: "build",
127
- agent: "build",
128
- path: { cwd: root, root },
129
- cost: 0,
130
- tokens: {
131
- output: 0,
132
- input: 0,
133
- reasoning: 0,
134
- cache: { read: 0, write: 0 },
135
- },
136
- modelID: ref.modelID,
137
- providerID: ref.providerID,
138
- parentID,
139
- time: { created: Date.now() },
140
- finish: "end_turn",
141
- }
142
- await svc.updateMessage(msg)
143
- return msg
144
- }
145
-
146
- async function summaryAssistant(sessionID: SessionID, parentID: MessageID, root: string, text: string) {
147
- const msg: MessageV2.Assistant = {
148
- id: MessageID.ascending(),
149
- role: "assistant",
150
- sessionID,
151
- mode: "compaction",
152
- agent: "compaction",
153
- path: { cwd: root, root },
154
- cost: 0,
155
- tokens: {
156
- output: 0,
157
- input: 0,
158
- reasoning: 0,
159
- cache: { read: 0, write: 0 },
160
- },
161
- modelID: ref.modelID,
162
- providerID: ref.providerID,
163
- parentID,
164
- summary: true,
165
- time: { created: Date.now() },
166
- finish: "end_turn",
167
- }
168
- await svc.updateMessage(msg)
169
- await svc.updatePart({
170
- id: PartID.ascending(),
171
- messageID: msg.id,
172
- sessionID,
173
- type: "text",
174
- text,
175
- })
176
- return msg
177
- }
178
-
179
- async function lastCompactionPart(sessionID: SessionID) {
180
- return (await svc.messages({ sessionID }))
181
- .at(-2)
182
- ?.parts.find((item): item is MessageV2.CompactionPart => item.type === "compaction")
183
- }
184
-
185
- function fake(
186
- input: Parameters<SessionProcessorModule.SessionProcessor.Interface["create"]>[0],
187
- result: "continue" | "compact",
188
- ) {
189
- const msg = input.assistantMessage
190
- return {
191
- get message() {
192
- return msg
193
- },
194
- updateToolCall: Effect.fn("TestSessionProcessor.updateToolCall")(() => Effect.succeed(undefined)),
195
- completeToolCall: Effect.fn("TestSessionProcessor.completeToolCall")(() => Effect.void),
196
- process: Effect.fn("TestSessionProcessor.process")(() => Effect.succeed(result)),
197
- } satisfies SessionProcessorModule.SessionProcessor.Handle
198
- }
199
-
200
- function layer(result: "continue" | "compact") {
201
- return Layer.succeed(
202
- SessionProcessorModule.SessionProcessor.Service,
203
- SessionProcessorModule.SessionProcessor.Service.of({
204
- create: Effect.fn("TestSessionProcessor.create")((input) => Effect.succeed(fake(input, result))),
205
- }),
206
- )
207
- }
208
-
209
- function cfg(compaction?: Config.Info["compaction"]) {
210
- const base = Config.Info.zod.parse({})
211
- return Layer.mock(Config.Service)({
212
- get: () => Effect.succeed({ ...base, compaction }),
213
- })
214
- }
215
-
216
- function runtime(
217
- result: "continue" | "compact",
218
- plugin = Plugin.defaultLayer,
219
- provider = ProviderTest.fake(),
220
- config = Config.defaultLayer,
221
- ) {
222
- const bus = Bus.layer
223
- return ManagedRuntime.make(
224
- Layer.mergeAll(SessionCompaction.layer, bus).pipe(
225
- Layer.provide(provider.layer),
226
- Layer.provide(SessionNs.defaultLayer),
227
- Layer.provide(layer(result)),
228
- Layer.provide(Agent.defaultLayer),
229
- Layer.provide(plugin),
230
- Layer.provide(bus),
231
- Layer.provide(config),
232
- ),
233
- )
234
- }
235
-
236
- const deps = Layer.mergeAll(
237
- ProviderTest.fake().layer,
238
- layer("continue"),
239
- Agent.defaultLayer,
240
- Plugin.defaultLayer,
241
- Bus.layer,
242
- Config.defaultLayer,
243
- )
244
-
245
- const env = Layer.mergeAll(
246
- SessionNs.defaultLayer,
247
- CrossSpawnSpawner.defaultLayer,
248
- SessionCompaction.layer.pipe(Layer.provide(SessionNs.defaultLayer), Layer.provideMerge(deps)),
249
- )
250
-
251
- const it = testEffect(env)
252
-
253
- function llm() {
254
- const queue: Array<
255
- Stream.Stream<LLM.Event, unknown> | ((input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown>)
256
- > = []
257
-
258
- return {
259
- push(stream: Stream.Stream<LLM.Event, unknown> | ((input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown>)) {
260
- queue.push(stream)
261
- },
262
- layer: Layer.succeed(
263
- LLM.Service,
264
- LLM.Service.of({
265
- stream: (input) => {
266
- const item = queue.shift() ?? Stream.empty
267
- const stream = typeof item === "function" ? item(input) : item
268
- return stream.pipe(Stream.mapEffect((event) => Effect.succeed(event)))
269
- },
270
- raw: () => Effect.die("raw not implemented in test LLM"),
271
- }),
272
- ),
273
- }
274
- }
275
-
276
- function liveRuntime(layer: Layer.Layer<LLM.Service>, provider = ProviderTest.fake(), config = Config.defaultLayer) {
277
- const bus = Bus.layer
278
- const status = SessionStatus.layer.pipe(Layer.provide(bus))
279
- const processor = SessionProcessorModule.SessionProcessor.layer.pipe(Layer.provide(summary))
280
- return ManagedRuntime.make(
281
- Layer.mergeAll(SessionCompaction.layer.pipe(Layer.provide(processor)), processor, bus, status).pipe(
282
- Layer.provide(provider.layer),
283
- Layer.provide(SessionNs.defaultLayer),
284
- Layer.provide(Snapshot.defaultLayer),
285
- Layer.provide(layer),
286
- Layer.provide(Permission.defaultLayer),
287
- Layer.provide(Agent.defaultLayer),
288
- Layer.provide(Plugin.defaultLayer),
289
- Layer.provide(status),
290
- Layer.provide(bus),
291
- Layer.provide(config),
292
- ),
293
- )
294
- }
295
-
296
- function reply(
297
- text: string,
298
- capture?: (input: LLM.StreamInput) => void,
299
- ): (input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown> {
300
- return (input) => {
301
- capture?.(input)
302
- return Stream.make(
303
- { type: "start" } satisfies LLM.Event,
304
- { type: "text-start", id: "txt-0" } satisfies LLM.Event,
305
- { type: "text-delta", id: "txt-0", delta: text, text } as LLM.Event,
306
- { type: "text-end", id: "txt-0" } satisfies LLM.Event,
307
- {
308
- type: "finish-step",
309
- finishReason: "stop",
310
- rawFinishReason: "stop",
311
- response: { id: "res", modelId: "test-model", timestamp: new Date() },
312
- providerMetadata: undefined,
313
- usage: {
314
- inputTokens: 1,
315
- outputTokens: 1,
316
- totalTokens: 2,
317
- inputTokenDetails: {
318
- noCacheTokens: undefined,
319
- cacheReadTokens: undefined,
320
- cacheWriteTokens: undefined,
321
- },
322
- outputTokenDetails: {
323
- textTokens: undefined,
324
- reasoningTokens: undefined,
325
- },
326
- },
327
- } satisfies LLM.Event,
328
- {
329
- type: "finish",
330
- finishReason: "stop",
331
- rawFinishReason: "stop",
332
- totalUsage: {
333
- inputTokens: 1,
334
- outputTokens: 1,
335
- totalTokens: 2,
336
- inputTokenDetails: {
337
- noCacheTokens: undefined,
338
- cacheReadTokens: undefined,
339
- cacheWriteTokens: undefined,
340
- },
341
- outputTokenDetails: {
342
- textTokens: undefined,
343
- reasoningTokens: undefined,
344
- },
345
- },
346
- } satisfies LLM.Event,
347
- )
348
- }
349
- }
350
-
351
- function wait(ms = 50) {
352
- return new Promise((resolve) => setTimeout(resolve, ms))
353
- }
354
-
355
- function defer() {
356
- let resolve!: () => void
357
- const promise = new Promise<void>((done) => {
358
- resolve = done
359
- })
360
- return { promise, resolve }
361
- }
362
-
363
- function plugin(ready: ReturnType<typeof defer>) {
364
- return Layer.mock(Plugin.Service)({
365
- trigger: <Name extends string, Input, Output>(name: Name, _input: Input, output: Output) => {
366
- if (name !== "experimental.session.compacting") return Effect.succeed(output)
367
- return Effect.sync(() => ready.resolve()).pipe(Effect.andThen(Effect.never), Effect.as(output))
368
- },
369
- list: () => Effect.succeed([]),
370
- init: () => Effect.void,
371
- })
372
- }
373
-
374
- function autocontinue(enabled: boolean) {
375
- return Layer.mock(Plugin.Service)({
376
- trigger: <Name extends string, Input, Output>(name: Name, _input: Input, output: Output) => {
377
- if (name !== "experimental.compaction.autocontinue") return Effect.succeed(output)
378
- return Effect.sync(() => {
379
- ;(output as { enabled: boolean }).enabled = enabled
380
- return output
381
- })
382
- },
383
- list: () => Effect.succeed([]),
384
- init: () => Effect.void,
385
- })
386
- }
387
-
388
- describe("session.compaction.isOverflow", () => {
389
- it.live(
390
- "returns true when token count exceeds usable context",
391
- provideTmpdirInstance(() =>
392
- Effect.gen(function* () {
393
- const compact = yield* SessionCompaction.Service
394
- const model = createModel({ context: 100_000, output: 32_000 })
395
- const tokens = { input: 75_000, output: 5_000, reasoning: 0, cache: { read: 0, write: 0 } }
396
- expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
397
- }),
398
- ),
399
- )
400
-
401
- it.live(
402
- "returns false when token count within usable context",
403
- provideTmpdirInstance(() =>
404
- Effect.gen(function* () {
405
- const compact = yield* SessionCompaction.Service
406
- const model = createModel({ context: 200_000, output: 32_000 })
407
- const tokens = { input: 100_000, output: 10_000, reasoning: 0, cache: { read: 0, write: 0 } }
408
- expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
409
- }),
410
- ),
411
- )
412
-
413
- it.live(
414
- "includes cache.read in token count",
415
- provideTmpdirInstance(() =>
416
- Effect.gen(function* () {
417
- const compact = yield* SessionCompaction.Service
418
- const model = createModel({ context: 100_000, output: 32_000 })
419
- const tokens = { input: 60_000, output: 10_000, reasoning: 0, cache: { read: 10_000, write: 0 } }
420
- expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
421
- }),
422
- ),
423
- )
424
-
425
- it.live(
426
- "respects input limit for input caps",
427
- provideTmpdirInstance(() =>
428
- Effect.gen(function* () {
429
- const compact = yield* SessionCompaction.Service
430
- const model = createModel({ context: 400_000, input: 272_000, output: 128_000 })
431
- const tokens = { input: 271_000, output: 1_000, reasoning: 0, cache: { read: 2_000, write: 0 } }
432
- expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
433
- }),
434
- ),
435
- )
436
-
437
- it.live(
438
- "returns false when input/output are within input caps",
439
- provideTmpdirInstance(() =>
440
- Effect.gen(function* () {
441
- const compact = yield* SessionCompaction.Service
442
- const model = createModel({ context: 400_000, input: 272_000, output: 128_000 })
443
- const tokens = { input: 200_000, output: 20_000, reasoning: 0, cache: { read: 10_000, write: 0 } }
444
- expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
445
- }),
446
- ),
447
- )
448
-
449
- it.live(
450
- "returns false when output within limit with input caps",
451
- provideTmpdirInstance(() =>
452
- Effect.gen(function* () {
453
- const compact = yield* SessionCompaction.Service
454
- const model = createModel({ context: 200_000, input: 120_000, output: 10_000 })
455
- const tokens = { input: 50_000, output: 9_999, reasoning: 0, cache: { read: 0, write: 0 } }
456
- expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
457
- }),
458
- ),
459
- )
460
-
461
- // ─── Bug reproduction tests ───────────────────────────────────────────
462
- // These tests demonstrate that when limit.input is set, isOverflow()
463
- // does not subtract any headroom for the next model response. This means
464
- // compaction only triggers AFTER we've already consumed the full input
465
- // budget, leaving zero room for the next API call's output tokens.
466
- //
467
- // Compare: without limit.input, usable = context - output (reserves space).
468
- // With limit.input, usable = limit.input (reserves nothing).
469
- //
470
- // Related issues: #10634, #8089, #11086, #12621
471
- // Open PRs: #6875, #12924
472
-
473
- it.live(
474
- "BUG: no headroom when limit.input is set — compaction should trigger near boundary but does not",
475
- provideTmpdirInstance(() =>
476
- Effect.gen(function* () {
477
- const compact = yield* SessionCompaction.Service
478
- // Simulate Claude with prompt caching: input limit = 200K, output limit = 32K
479
- const model = createModel({ context: 200_000, input: 200_000, output: 32_000 })
480
-
481
- // We've used 198K tokens total. Only 2K under the input limit.
482
- // On the next turn, the full conversation (198K) becomes input,
483
- // plus the model needs room to generate output — this WILL overflow.
484
- const tokens = { input: 180_000, output: 15_000, reasoning: 0, cache: { read: 3_000, write: 0 } }
485
- // count = 180K + 3K + 15K = 198K
486
- // usable = limit.input = 200K (no output subtracted!)
487
- // 198K > 200K = false → no compaction triggered
488
-
489
- // WITHOUT limit.input: usable = 200K - 32K = 168K, and 198K > 168K = true ✓
490
- // WITH limit.input: usable = 200K, and 198K > 200K = false ✗
491
-
492
- // With 198K used and only 2K headroom, the next turn will overflow.
493
- // Compaction MUST trigger here.
494
- expect(yield* compact.isOverflow({ tokens, model })).toBe(true)
495
- }),
496
- ),
497
- )
498
-
499
- it.live(
500
- "BUG: without limit.input, same token count correctly triggers compaction",
501
- provideTmpdirInstance(() =>
502
- Effect.gen(function* () {
503
- const compact = yield* SessionCompaction.Service
504
- // Same model but without limit.input — uses context - output instead
505
- const model = createModel({ context: 200_000, output: 32_000 })
506
-
507
- // Same token usage as above
508
- const tokens = { input: 180_000, output: 15_000, reasoning: 0, cache: { read: 3_000, write: 0 } }
509
- // count = 198K
510
- // usable = context - output = 200K - 32K = 168K
511
- // 198K > 168K = true → compaction correctly triggered
512
-
513
- const result = yield* compact.isOverflow({ tokens, model })
514
- expect(result).toBe(true) // ← Correct: headroom is reserved
515
- }),
516
- ),
517
- )
518
-
519
- it.live(
520
- "BUG: asymmetry — limit.input model allows 30K more usage before compaction than equivalent model without it",
521
- provideTmpdirInstance(() =>
522
- Effect.gen(function* () {
523
- const compact = yield* SessionCompaction.Service
524
- // Two models with identical context/output limits, differing only in limit.input
525
- const withInputLimit = createModel({ context: 200_000, input: 200_000, output: 32_000 })
526
- const withoutInputLimit = createModel({ context: 200_000, output: 32_000 })
527
-
528
- // 170K total tokens — well above context-output (168K) but below input limit (200K)
529
- const tokens = { input: 166_000, output: 10_000, reasoning: 0, cache: { read: 5_000, write: 0 } }
530
-
531
- const withLimit = yield* compact.isOverflow({ tokens, model: withInputLimit })
532
- const withoutLimit = yield* compact.isOverflow({ tokens, model: withoutInputLimit })
533
-
534
- // Both models have identical real capacity — they should agree:
535
- expect(withLimit).toBe(true) // should compact (170K leaves no room for 32K output)
536
- expect(withoutLimit).toBe(true) // correctly compacts (170K > 168K)
537
- }),
538
- ),
539
- )
540
-
541
- it.live(
542
- "returns false when model context limit is 0",
543
- provideTmpdirInstance(() =>
544
- Effect.gen(function* () {
545
- const compact = yield* SessionCompaction.Service
546
- const model = createModel({ context: 0, output: 32_000 })
547
- const tokens = { input: 100_000, output: 10_000, reasoning: 0, cache: { read: 0, write: 0 } }
548
- expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
549
- }),
550
- ),
551
- )
552
-
553
- it.live(
554
- "returns false when compaction.auto is disabled",
555
- provideTmpdirInstance(
556
- () =>
557
- Effect.gen(function* () {
558
- const compact = yield* SessionCompaction.Service
559
- const model = createModel({ context: 100_000, output: 32_000 })
560
- const tokens = { input: 75_000, output: 5_000, reasoning: 0, cache: { read: 0, write: 0 } }
561
- expect(yield* compact.isOverflow({ tokens, model })).toBe(false)
562
- }),
563
- {
564
- config: {
565
- compaction: { auto: false },
566
- },
567
- },
568
- ),
569
- )
570
- })
571
-
572
- describe("session.compaction.create", () => {
573
- it.live(
574
- "creates a compaction user message and part",
575
- provideTmpdirInstance(() =>
576
- Effect.gen(function* () {
577
- const compact = yield* SessionCompaction.Service
578
- const ssn = yield* SessionNs.Service
579
-
580
- const info = yield* ssn.create({})
581
-
582
- yield* compact.create({
583
- sessionID: info.id,
584
- agent: "build",
585
- model: ref,
586
- auto: true,
587
- overflow: true,
588
- })
589
-
590
- const msgs = yield* ssn.messages({ sessionID: info.id })
591
- expect(msgs).toHaveLength(1)
592
- expect(msgs[0].info.role).toBe("user")
593
- expect(msgs[0].parts).toHaveLength(1)
594
- expect(msgs[0].parts[0]).toMatchObject({
595
- type: "compaction",
596
- auto: true,
597
- overflow: true,
598
- })
599
- }),
600
- ),
601
- )
602
- })
603
-
604
- describe("session.compaction.prune", () => {
605
- it.live(
606
- "compacts old completed tool output",
607
- provideTmpdirInstance(
608
- (dir) =>
609
- Effect.gen(function* () {
610
- const compact = yield* SessionCompaction.Service
611
- const ssn = yield* SessionNs.Service
612
- const info = yield* ssn.create({})
613
- const a = yield* ssn.updateMessage({
614
- id: MessageID.ascending(),
615
- role: "user",
616
- sessionID: info.id,
617
- agent: "build",
618
- model: ref,
619
- time: { created: Date.now() },
620
- })
621
- yield* ssn.updatePart({
622
- id: PartID.ascending(),
623
- messageID: a.id,
624
- sessionID: info.id,
625
- type: "text",
626
- text: "first",
627
- })
628
- const b: MessageV2.Assistant = {
629
- id: MessageID.ascending(),
630
- role: "assistant",
631
- sessionID: info.id,
632
- mode: "build",
633
- agent: "build",
634
- path: { cwd: dir, root: dir },
635
- cost: 0,
636
- tokens: {
637
- output: 0,
638
- input: 0,
639
- reasoning: 0,
640
- cache: { read: 0, write: 0 },
641
- },
642
- modelID: ref.modelID,
643
- providerID: ref.providerID,
644
- parentID: a.id,
645
- time: { created: Date.now() },
646
- finish: "end_turn",
647
- }
648
- yield* ssn.updateMessage(b)
649
- yield* ssn.updatePart({
650
- id: PartID.ascending(),
651
- messageID: b.id,
652
- sessionID: info.id,
653
- type: "tool",
654
- callID: crypto.randomUUID(),
655
- tool: "bash",
656
- state: {
657
- status: "completed",
658
- input: {},
659
- output: "x".repeat(200_000),
660
- title: "done",
661
- metadata: {},
662
- time: { start: Date.now(), end: Date.now() },
663
- },
664
- })
665
- for (const text of ["second", "third"]) {
666
- const msg = yield* ssn.updateMessage({
667
- id: MessageID.ascending(),
668
- role: "user",
669
- sessionID: info.id,
670
- agent: "build",
671
- model: ref,
672
- time: { created: Date.now() },
673
- })
674
- yield* ssn.updatePart({
675
- id: PartID.ascending(),
676
- messageID: msg.id,
677
- sessionID: info.id,
678
- type: "text",
679
- text,
680
- })
681
- }
682
-
683
- yield* compact.prune({ sessionID: info.id })
684
-
685
- const msgs = yield* ssn.messages({ sessionID: info.id })
686
- const part = msgs.flatMap((msg) => msg.parts).find((part) => part.type === "tool")
687
- expect(part?.type).toBe("tool")
688
- expect(part?.state.status).toBe("completed")
689
- if (part?.type === "tool" && part.state.status === "completed") {
690
- expect(part.state.time.compacted).toBeNumber()
691
- }
692
- }),
693
-
694
- {
695
- config: {
696
- compaction: { prune: true },
697
- },
698
- },
699
- ),
700
- )
701
-
702
- it.live(
703
- "skips protected skill tool output",
704
- provideTmpdirInstance((dir) =>
705
- Effect.gen(function* () {
706
- const compact = yield* SessionCompaction.Service
707
- const ssn = yield* SessionNs.Service
708
- const info = yield* ssn.create({})
709
- const a = yield* ssn.updateMessage({
710
- id: MessageID.ascending(),
711
- role: "user",
712
- sessionID: info.id,
713
- agent: "build",
714
- model: ref,
715
- time: { created: Date.now() },
716
- })
717
- yield* ssn.updatePart({
718
- id: PartID.ascending(),
719
- messageID: a.id,
720
- sessionID: info.id,
721
- type: "text",
722
- text: "first",
723
- })
724
- const b: MessageV2.Assistant = {
725
- id: MessageID.ascending(),
726
- role: "assistant",
727
- sessionID: info.id,
728
- mode: "build",
729
- agent: "build",
730
- path: { cwd: dir, root: dir },
731
- cost: 0,
732
- tokens: {
733
- output: 0,
734
- input: 0,
735
- reasoning: 0,
736
- cache: { read: 0, write: 0 },
737
- },
738
- modelID: ref.modelID,
739
- providerID: ref.providerID,
740
- parentID: a.id,
741
- time: { created: Date.now() },
742
- finish: "end_turn",
743
- }
744
- yield* ssn.updateMessage(b)
745
- yield* ssn.updatePart({
746
- id: PartID.ascending(),
747
- messageID: b.id,
748
- sessionID: info.id,
749
- type: "tool",
750
- callID: crypto.randomUUID(),
751
- tool: "skill",
752
- state: {
753
- status: "completed",
754
- input: {},
755
- output: "x".repeat(200_000),
756
- title: "done",
757
- metadata: {},
758
- time: { start: Date.now(), end: Date.now() },
759
- },
760
- })
761
- for (const text of ["second", "third"]) {
762
- const msg = yield* ssn.updateMessage({
763
- id: MessageID.ascending(),
764
- role: "user",
765
- sessionID: info.id,
766
- agent: "build",
767
- model: ref,
768
- time: { created: Date.now() },
769
- })
770
- yield* ssn.updatePart({
771
- id: PartID.ascending(),
772
- messageID: msg.id,
773
- sessionID: info.id,
774
- type: "text",
775
- text,
776
- })
777
- }
778
-
779
- yield* compact.prune({ sessionID: info.id })
780
-
781
- const msgs = yield* ssn.messages({ sessionID: info.id })
782
- const part = msgs.flatMap((msg) => msg.parts).find((part) => part.type === "tool")
783
- expect(part?.type).toBe("tool")
784
- if (part?.type === "tool" && part.state.status === "completed") {
785
- expect(part.state.time.compacted).toBeUndefined()
786
- }
787
- }),
788
- ),
789
- )
790
- })
791
-
792
- describe("session.compaction.process", () => {
793
- test("throws when parent is not a user message", async () => {
794
- await using tmp = await tmpdir()
795
- await Instance.provide({
796
- directory: tmp.path,
797
- fn: async () => {
798
- const session = await svc.create({})
799
- const msg = await user(session.id, "hello")
800
- const reply = await assistant(session.id, msg.id, tmp.path)
801
- const rt = runtime("continue")
802
- try {
803
- const msgs = await svc.messages({ sessionID: session.id })
804
- await expect(
805
- rt.runPromise(
806
- SessionCompaction.Service.use((svc) =>
807
- svc.process({
808
- parentID: reply.id,
809
- messages: msgs,
810
- sessionID: session.id,
811
- auto: false,
812
- }),
813
- ),
814
- ),
815
- ).rejects.toThrow(`Compaction parent must be a user message: ${reply.id}`)
816
- } finally {
817
- await rt.dispose()
818
- }
819
- },
820
- })
821
- })
822
-
823
- test("publishes compacted event on continue", async () => {
824
- await using tmp = await tmpdir()
825
- await Instance.provide({
826
- directory: tmp.path,
827
- fn: async () => {
828
- const session = await svc.create({})
829
- const msg = await user(session.id, "hello")
830
- const msgs = await svc.messages({ sessionID: session.id })
831
- const done = defer()
832
- let seen = false
833
- const rt = runtime("continue", Plugin.defaultLayer, wide())
834
- let unsub: (() => void) | undefined
835
- try {
836
- unsub = await rt.runPromise(
837
- Bus.Service.use((svc) =>
838
- svc.subscribeCallback(SessionCompaction.Event.Compacted, (evt) => {
839
- if (evt.properties.sessionID !== session.id) return
840
- seen = true
841
- done.resolve()
842
- }),
843
- ),
844
- )
845
-
846
- const result = await rt.runPromise(
847
- SessionCompaction.Service.use((svc) =>
848
- svc.process({
849
- parentID: msg.id,
850
- messages: msgs,
851
- sessionID: session.id,
852
- auto: false,
853
- }),
854
- ),
855
- )
856
-
857
- await Promise.race([
858
- done.promise,
859
- wait(500).then(() => {
860
- throw new Error("timed out waiting for compacted event")
861
- }),
862
- ])
863
- expect(result).toBe("continue")
864
- expect(seen).toBe(true)
865
- } finally {
866
- unsub?.()
867
- await rt.dispose()
868
- }
869
- },
870
- })
871
- })
872
-
873
- test("marks summary message as errored on compact result", async () => {
874
- await using tmp = await tmpdir()
875
- await Instance.provide({
876
- directory: tmp.path,
877
- fn: async () => {
878
- const session = await svc.create({})
879
- const msg = await user(session.id, "hello")
880
- const rt = runtime("compact", Plugin.defaultLayer, wide())
881
- try {
882
- const msgs = await svc.messages({ sessionID: session.id })
883
- const result = await rt.runPromise(
884
- SessionCompaction.Service.use((svc) =>
885
- svc.process({
886
- parentID: msg.id,
887
- messages: msgs,
888
- sessionID: session.id,
889
- auto: false,
890
- }),
891
- ),
892
- )
893
-
894
- const summary = (await svc.messages({ sessionID: session.id })).find(
895
- (msg) => msg.info.role === "assistant" && msg.info.summary,
896
- )
897
-
898
- expect(result).toBe("stop")
899
- expect(summary?.info.role).toBe("assistant")
900
- if (summary?.info.role === "assistant") {
901
- expect(summary.info.finish).toBe("error")
902
- expect(JSON.stringify(summary.info.error)).toContain("Session too large to compact")
903
- }
904
- } finally {
905
- await rt.dispose()
906
- }
907
- },
908
- })
909
- })
910
-
911
- test("adds synthetic continue prompt when auto is enabled", async () => {
912
- await using tmp = await tmpdir()
913
- await Instance.provide({
914
- directory: tmp.path,
915
- fn: async () => {
916
- const session = await svc.create({})
917
- const msg = await user(session.id, "hello")
918
- const rt = runtime("continue", Plugin.defaultLayer, wide())
919
- try {
920
- const msgs = await svc.messages({ sessionID: session.id })
921
- const result = await rt.runPromise(
922
- SessionCompaction.Service.use((svc) =>
923
- svc.process({
924
- parentID: msg.id,
925
- messages: msgs,
926
- sessionID: session.id,
927
- auto: true,
928
- }),
929
- ),
930
- )
931
-
932
- const all = await svc.messages({ sessionID: session.id })
933
- const last = all.at(-1)
934
-
935
- expect(result).toBe("continue")
936
- expect(last?.info.role).toBe("user")
937
- expect(last?.parts[0]).toMatchObject({
938
- type: "text",
939
- synthetic: true,
940
- metadata: { compaction_continue: true },
941
- })
942
- if (last?.parts[0]?.type === "text") {
943
- expect(last.parts[0].text).toContain("Continue if you have next steps")
944
- }
945
- } finally {
946
- await rt.dispose()
947
- }
948
- },
949
- })
950
- })
951
-
952
- test("persists tail_start_id for retained recent turns", async () => {
953
- await using tmp = await tmpdir()
954
- await Instance.provide({
955
- directory: tmp.path,
956
- fn: async () => {
957
- const session = await svc.create({})
958
- await user(session.id, "first")
959
- const keep = await user(session.id, "second")
960
- await user(session.id, "third")
961
- await SessionCompaction.create({
962
- sessionID: session.id,
963
- agent: "build",
964
- model: ref,
965
- auto: false,
966
- })
967
-
968
- const rt = runtime(
969
- "continue",
970
- Plugin.defaultLayer,
971
- wide(),
972
- cfg({ tail_turns: 2, preserve_recent_tokens: 10_000 }),
973
- )
974
- try {
975
- const msgs = await svc.messages({ sessionID: session.id })
976
- const parent = msgs.at(-1)?.info.id
977
- expect(parent).toBeTruthy()
978
- await rt.runPromise(
979
- SessionCompaction.Service.use((svc) =>
980
- svc.process({
981
- parentID: parent!,
982
- messages: msgs,
983
- sessionID: session.id,
984
- auto: false,
985
- }),
986
- ),
987
- )
988
-
989
- const part = await lastCompactionPart(session.id)
990
- expect(part?.type).toBe("compaction")
991
- expect(part?.tail_start_id).toBe(keep.id)
992
- } finally {
993
- await rt.dispose()
994
- }
995
- },
996
- })
997
- })
998
-
999
- test("shrinks retained tail to fit preserve token budget", async () => {
1000
- await using tmp = await tmpdir()
1001
- await Instance.provide({
1002
- directory: tmp.path,
1003
- fn: async () => {
1004
- const session = await svc.create({})
1005
- await user(session.id, "first")
1006
- await user(session.id, "x".repeat(2_000))
1007
- const keep = await user(session.id, "tiny")
1008
- await SessionCompaction.create({
1009
- sessionID: session.id,
1010
- agent: "build",
1011
- model: ref,
1012
- auto: false,
1013
- })
1014
-
1015
- const rt = runtime("continue", Plugin.defaultLayer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 100 }))
1016
- try {
1017
- const msgs = await svc.messages({ sessionID: session.id })
1018
- const parent = msgs.at(-1)?.info.id
1019
- expect(parent).toBeTruthy()
1020
- await rt.runPromise(
1021
- SessionCompaction.Service.use((svc) =>
1022
- svc.process({
1023
- parentID: parent!,
1024
- messages: msgs,
1025
- sessionID: session.id,
1026
- auto: false,
1027
- }),
1028
- ),
1029
- )
1030
-
1031
- const part = await lastCompactionPart(session.id)
1032
- expect(part?.type).toBe("compaction")
1033
- expect(part?.tail_start_id).toBe(keep.id)
1034
- } finally {
1035
- await rt.dispose()
1036
- }
1037
- },
1038
- })
1039
- })
1040
-
1041
- test("falls back to full summary when even one recent turn exceeds preserve token budget", async () => {
1042
- await using tmp = await tmpdir({ git: true })
1043
- const stub = llm()
1044
- let captured = ""
1045
- stub.push(
1046
- reply("summary", (input) => {
1047
- captured = JSON.stringify(input.messages)
1048
- }),
1049
- )
1050
- await Instance.provide({
1051
- directory: tmp.path,
1052
- fn: async () => {
1053
- const session = await svc.create({})
1054
- await user(session.id, "first")
1055
- await user(session.id, "y".repeat(2_000))
1056
- await SessionCompaction.create({
1057
- sessionID: session.id,
1058
- agent: "build",
1059
- model: ref,
1060
- auto: false,
1061
- })
1062
-
1063
- const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 20 }))
1064
- try {
1065
- const msgs = await svc.messages({ sessionID: session.id })
1066
- const parent = msgs.at(-1)?.info.id
1067
- expect(parent).toBeTruthy()
1068
- await rt.runPromise(
1069
- SessionCompaction.Service.use((svc) =>
1070
- svc.process({
1071
- parentID: parent!,
1072
- messages: msgs,
1073
- sessionID: session.id,
1074
- auto: false,
1075
- }),
1076
- ),
1077
- )
1078
-
1079
- const part = await lastCompactionPart(session.id)
1080
- expect(part?.type).toBe("compaction")
1081
- expect(part?.tail_start_id).toBeUndefined()
1082
- expect(captured).toContain("yyyy")
1083
- } finally {
1084
- await rt.dispose()
1085
- }
1086
- },
1087
- })
1088
- })
1089
-
1090
- test("falls back to full summary when retained tail media exceeds preserve token budget", async () => {
1091
- await using tmp = await tmpdir({ git: true })
1092
- const stub = llm()
1093
- let captured = ""
1094
- stub.push(
1095
- reply("summary", (input) => {
1096
- captured = JSON.stringify(input.messages)
1097
- }),
1098
- )
1099
- await Instance.provide({
1100
- directory: tmp.path,
1101
- fn: async () => {
1102
- const session = await svc.create({})
1103
- await user(session.id, "older")
1104
- const recent = await user(session.id, "recent image turn")
1105
- await svc.updatePart({
1106
- id: PartID.ascending(),
1107
- messageID: recent.id,
1108
- sessionID: session.id,
1109
- type: "file",
1110
- mime: "image/png",
1111
- filename: "big.png",
1112
- url: `data:image/png;base64,${"a".repeat(4_000)}`,
1113
- })
1114
- await SessionCompaction.create({
1115
- sessionID: session.id,
1116
- agent: "build",
1117
- model: ref,
1118
- auto: false,
1119
- })
1120
-
1121
- const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 100 }))
1122
- try {
1123
- const msgs = await svc.messages({ sessionID: session.id })
1124
- const parent = msgs.at(-1)?.info.id
1125
- expect(parent).toBeTruthy()
1126
- await rt.runPromise(
1127
- SessionCompaction.Service.use((svc) =>
1128
- svc.process({
1129
- parentID: parent!,
1130
- messages: msgs,
1131
- sessionID: session.id,
1132
- auto: false,
1133
- }),
1134
- ),
1135
- )
1136
-
1137
- const part = await lastCompactionPart(session.id)
1138
- expect(part?.type).toBe("compaction")
1139
- expect(part?.tail_start_id).toBeUndefined()
1140
- expect(captured).toContain("recent image turn")
1141
- expect(captured).toContain("Attached image/png: big.png")
1142
- } finally {
1143
- await rt.dispose()
1144
- }
1145
- },
1146
- })
1147
- })
1148
-
1149
- test("retains a split turn suffix when a later message fits the preserve token budget", async () => {
1150
- await using tmp = await tmpdir({ git: true })
1151
- const stub = llm()
1152
- let captured = ""
1153
- stub.push(
1154
- reply("summary", (input) => {
1155
- captured = JSON.stringify(input.messages)
1156
- }),
1157
- )
1158
- await Instance.provide({
1159
- directory: tmp.path,
1160
- fn: async () => {
1161
- const session = await svc.create({})
1162
- await user(session.id, "older")
1163
- const recent = await user(session.id, "recent turn")
1164
- const large = await assistant(session.id, recent.id, tmp.path)
1165
- await svc.updatePart({
1166
- id: PartID.ascending(),
1167
- messageID: large.id,
1168
- sessionID: session.id,
1169
- type: "text",
1170
- text: "z".repeat(2_000),
1171
- })
1172
- const keep = await assistant(session.id, recent.id, tmp.path)
1173
- await svc.updatePart({
1174
- id: PartID.ascending(),
1175
- messageID: keep.id,
1176
- sessionID: session.id,
1177
- type: "text",
1178
- text: "keep tail",
1179
- })
1180
- await SessionCompaction.create({
1181
- sessionID: session.id,
1182
- agent: "build",
1183
- model: ref,
1184
- auto: false,
1185
- })
1186
-
1187
- const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 100 }))
1188
- try {
1189
- const msgs = await svc.messages({ sessionID: session.id })
1190
- const parent = msgs.at(-1)?.info.id
1191
- expect(parent).toBeTruthy()
1192
- await rt.runPromise(
1193
- SessionCompaction.Service.use((svc) =>
1194
- svc.process({
1195
- parentID: parent!,
1196
- messages: msgs,
1197
- sessionID: session.id,
1198
- auto: false,
1199
- }),
1200
- ),
1201
- )
1202
-
1203
- const part = await lastCompactionPart(session.id)
1204
- expect(part?.type).toBe("compaction")
1205
- expect(part?.tail_start_id).toBe(keep.id)
1206
- expect(captured).toContain("zzzz")
1207
- expect(captured).not.toContain("keep tail")
1208
-
1209
- const filtered = MessageV2.filterCompacted(MessageV2.stream(session.id))
1210
- expect(filtered[0]?.info.id).toBe(keep.id)
1211
- expect(filtered.map((msg) => msg.info.id)).not.toContain(large.id)
1212
- } finally {
1213
- await rt.dispose()
1214
- }
1215
- },
1216
- })
1217
- })
1218
-
1219
- test("allows plugins to disable synthetic continue prompt", async () => {
1220
- await using tmp = await tmpdir()
1221
- await Instance.provide({
1222
- directory: tmp.path,
1223
- fn: async () => {
1224
- const session = await svc.create({})
1225
- const msg = await user(session.id, "hello")
1226
- const rt = runtime("continue", autocontinue(false), wide())
1227
- try {
1228
- const msgs = await svc.messages({ sessionID: session.id })
1229
- const result = await rt.runPromise(
1230
- SessionCompaction.Service.use((svc) =>
1231
- svc.process({
1232
- parentID: msg.id,
1233
- messages: msgs,
1234
- sessionID: session.id,
1235
- auto: true,
1236
- }),
1237
- ),
1238
- )
1239
-
1240
- const all = await svc.messages({ sessionID: session.id })
1241
- const last = all.at(-1)
1242
-
1243
- expect(result).toBe("continue")
1244
- expect(last?.info.role).toBe("assistant")
1245
- expect(
1246
- all.some(
1247
- (msg) =>
1248
- msg.info.role === "user" &&
1249
- msg.parts.some(
1250
- (part) =>
1251
- part.type === "text" && part.synthetic && part.text.includes("Continue if you have next steps"),
1252
- ),
1253
- ),
1254
- ).toBe(false)
1255
- } finally {
1256
- await rt.dispose()
1257
- }
1258
- },
1259
- })
1260
- })
1261
-
1262
- test("replays the prior user turn on overflow when earlier context exists", async () => {
1263
- await using tmp = await tmpdir()
1264
- await Instance.provide({
1265
- directory: tmp.path,
1266
- fn: async () => {
1267
- const session = await svc.create({})
1268
- await user(session.id, "root")
1269
- const replay = await user(session.id, "image")
1270
- await svc.updatePart({
1271
- id: PartID.ascending(),
1272
- messageID: replay.id,
1273
- sessionID: session.id,
1274
- type: "file",
1275
- mime: "image/png",
1276
- filename: "cat.png",
1277
- url: "https://example.com/cat.png",
1278
- })
1279
- const msg = await user(session.id, "current")
1280
- const rt = runtime("continue", Plugin.defaultLayer, wide())
1281
- try {
1282
- const msgs = await svc.messages({ sessionID: session.id })
1283
- const result = await rt.runPromise(
1284
- SessionCompaction.Service.use((svc) =>
1285
- svc.process({
1286
- parentID: msg.id,
1287
- messages: msgs,
1288
- sessionID: session.id,
1289
- auto: true,
1290
- overflow: true,
1291
- }),
1292
- ),
1293
- )
1294
-
1295
- const last = (await svc.messages({ sessionID: session.id })).at(-1)
1296
-
1297
- expect(result).toBe("continue")
1298
- expect(last?.info.role).toBe("user")
1299
- expect(last?.parts.some((part) => part.type === "file")).toBe(false)
1300
- expect(
1301
- last?.parts.some((part) => part.type === "text" && part.text.includes("Attached image/png: cat.png")),
1302
- ).toBe(true)
1303
- } finally {
1304
- await rt.dispose()
1305
- }
1306
- },
1307
- })
1308
- })
1309
-
1310
- test("falls back to overflow guidance when no replayable turn exists", async () => {
1311
- await using tmp = await tmpdir()
1312
- await Instance.provide({
1313
- directory: tmp.path,
1314
- fn: async () => {
1315
- const session = await svc.create({})
1316
- await user(session.id, "earlier")
1317
- const msg = await user(session.id, "current")
1318
-
1319
- const rt = runtime("continue", Plugin.defaultLayer, wide())
1320
- try {
1321
- const msgs = await svc.messages({ sessionID: session.id })
1322
- const result = await rt.runPromise(
1323
- SessionCompaction.Service.use((svc) =>
1324
- svc.process({
1325
- parentID: msg.id,
1326
- messages: msgs,
1327
- sessionID: session.id,
1328
- auto: true,
1329
- overflow: true,
1330
- }),
1331
- ),
1332
- )
1333
-
1334
- const last = (await svc.messages({ sessionID: session.id })).at(-1)
1335
-
1336
- expect(result).toBe("continue")
1337
- expect(last?.info.role).toBe("user")
1338
- if (last?.parts[0]?.type === "text") {
1339
- expect(last.parts[0].text).toContain("previous request exceeded the provider's size limit")
1340
- }
1341
- } finally {
1342
- await rt.dispose()
1343
- }
1344
- },
1345
- })
1346
- })
1347
-
1348
- test("stops quickly when aborted during retry backoff", async () => {
1349
- const stub = llm()
1350
- const ready = defer()
1351
- stub.push(
1352
- Stream.fromAsyncIterable(
1353
- {
1354
- async *[Symbol.asyncIterator]() {
1355
- yield { type: "start" } as LLM.Event
1356
- throw new APICallError({
1357
- message: "boom",
1358
- url: "https://example.com/v1/chat/completions",
1359
- requestBodyValues: {},
1360
- statusCode: 503,
1361
- responseHeaders: { "retry-after-ms": "10000" },
1362
- responseBody: '{"error":"boom"}',
1363
- isRetryable: true,
1364
- })
1365
- },
1366
- },
1367
- (err) => err,
1368
- ),
1369
- )
1370
-
1371
- await using tmp = await tmpdir({ git: true })
1372
- await Instance.provide({
1373
- directory: tmp.path,
1374
- fn: async () => {
1375
- const session = await svc.create({})
1376
- const msg = await user(session.id, "hello")
1377
- const msgs = await svc.messages({ sessionID: session.id })
1378
- const abort = new AbortController()
1379
- const rt = liveRuntime(stub.layer, wide())
1380
- let off: (() => void) | undefined
1381
- let run: Promise<"continue" | "stop"> | undefined
1382
- try {
1383
- off = await rt.runPromise(
1384
- Bus.Service.use((svc) =>
1385
- svc.subscribeCallback(SessionStatus.Event.Status, (evt) => {
1386
- if (evt.properties.sessionID !== session.id) return
1387
- if (evt.properties.status.type !== "retry") return
1388
- ready.resolve()
1389
- }),
1390
- ),
1391
- )
1392
-
1393
- run = rt
1394
- .runPromiseExit(
1395
- SessionCompaction.Service.use((svc) =>
1396
- svc.process({
1397
- parentID: msg.id,
1398
- messages: msgs,
1399
- sessionID: session.id,
1400
- auto: false,
1401
- }),
1402
- ),
1403
- { signal: abort.signal },
1404
- )
1405
- .then((exit) => {
1406
- if (Exit.isFailure(exit)) {
1407
- if (Cause.hasInterrupts(exit.cause) && abort.signal.aborted) return "stop"
1408
- throw Cause.squash(exit.cause)
1409
- }
1410
- return exit.value
1411
- })
1412
-
1413
- await Promise.race([
1414
- ready.promise,
1415
- wait(5000).then(() => {
1416
- throw new Error("timed out waiting for retry status")
1417
- }),
1418
- ])
1419
-
1420
- const start = Date.now()
1421
- abort.abort()
1422
- const result = await Promise.race([
1423
- run.then((value) => ({ kind: "done" as const, value, ms: Date.now() - start })),
1424
- wait(2000).then(() => ({ kind: "timeout" as const })),
1425
- ])
1426
-
1427
- expect(result.kind).toBe("done")
1428
- if (result.kind === "done") {
1429
- expect(result.value).toBe("stop")
1430
- expect(result.ms).toBeLessThan(2000)
1431
- }
1432
- } finally {
1433
- off?.()
1434
- abort.abort()
1435
- await rt.dispose()
1436
- await run?.catch(() => undefined)
1437
- }
1438
- },
1439
- })
1440
- })
1441
-
1442
- test("does not leave a summary assistant when aborted before processor setup", async () => {
1443
- const ready = defer()
1444
-
1445
- await using tmp = await tmpdir({ git: true })
1446
- await Instance.provide({
1447
- directory: tmp.path,
1448
- fn: async () => {
1449
- const session = await svc.create({})
1450
- const msg = await user(session.id, "hello")
1451
- const msgs = await svc.messages({ sessionID: session.id })
1452
- const abort = new AbortController()
1453
- const rt = runtime("continue", plugin(ready), wide())
1454
- let run: Promise<"continue" | "stop"> | undefined
1455
- try {
1456
- run = rt
1457
- .runPromiseExit(
1458
- SessionCompaction.Service.use((svc) =>
1459
- svc.process({
1460
- parentID: msg.id,
1461
- messages: msgs,
1462
- sessionID: session.id,
1463
- auto: false,
1464
- }),
1465
- ),
1466
- { signal: abort.signal },
1467
- )
1468
- .then((exit) => {
1469
- if (Exit.isFailure(exit)) {
1470
- if (Cause.hasInterrupts(exit.cause) && abort.signal.aborted) return "stop"
1471
- throw Cause.squash(exit.cause)
1472
- }
1473
- return exit.value
1474
- })
1475
-
1476
- await Promise.race([
1477
- ready.promise,
1478
- wait(1000).then(() => {
1479
- throw new Error("timed out waiting for compaction hook")
1480
- }),
1481
- ])
1482
-
1483
- abort.abort()
1484
- expect(await run).toBe("stop")
1485
-
1486
- const all = await svc.messages({ sessionID: session.id })
1487
- expect(all.some((msg) => msg.info.role === "assistant" && msg.info.summary)).toBe(false)
1488
- } finally {
1489
- abort.abort()
1490
- await rt.dispose()
1491
- await run?.catch(() => undefined)
1492
- }
1493
- },
1494
- })
1495
- })
1496
-
1497
- test("does not allow tool calls while generating the summary", async () => {
1498
- const stub = llm()
1499
- stub.push(
1500
- Stream.make(
1501
- { type: "start" } satisfies LLM.Event,
1502
- { type: "tool-input-start", id: "call-1", toolName: "_noop" } satisfies LLM.Event,
1503
- { type: "tool-call", toolCallId: "call-1", toolName: "_noop", input: {} } satisfies LLM.Event,
1504
- {
1505
- type: "finish-step",
1506
- finishReason: "tool-calls",
1507
- rawFinishReason: "tool_calls",
1508
- response: { id: "res", modelId: "test-model", timestamp: new Date() },
1509
- providerMetadata: undefined,
1510
- usage: {
1511
- inputTokens: 1,
1512
- outputTokens: 1,
1513
- totalTokens: 2,
1514
- inputTokenDetails: {
1515
- noCacheTokens: undefined,
1516
- cacheReadTokens: undefined,
1517
- cacheWriteTokens: undefined,
1518
- },
1519
- outputTokenDetails: {
1520
- textTokens: undefined,
1521
- reasoningTokens: undefined,
1522
- },
1523
- },
1524
- } satisfies LLM.Event,
1525
- {
1526
- type: "finish",
1527
- finishReason: "tool-calls",
1528
- rawFinishReason: "tool_calls",
1529
- totalUsage: {
1530
- inputTokens: 1,
1531
- outputTokens: 1,
1532
- totalTokens: 2,
1533
- inputTokenDetails: {
1534
- noCacheTokens: undefined,
1535
- cacheReadTokens: undefined,
1536
- cacheWriteTokens: undefined,
1537
- },
1538
- outputTokenDetails: {
1539
- textTokens: undefined,
1540
- reasoningTokens: undefined,
1541
- },
1542
- },
1543
- } satisfies LLM.Event,
1544
- ),
1545
- )
1546
-
1547
- await using tmp = await tmpdir({ git: true })
1548
- await Instance.provide({
1549
- directory: tmp.path,
1550
- fn: async () => {
1551
- const session = await svc.create({})
1552
- const msg = await user(session.id, "hello")
1553
- const rt = liveRuntime(stub.layer, wide())
1554
- try {
1555
- const msgs = await svc.messages({ sessionID: session.id })
1556
- await rt.runPromise(
1557
- SessionCompaction.Service.use((svc) =>
1558
- svc.process({
1559
- parentID: msg.id,
1560
- messages: msgs,
1561
- sessionID: session.id,
1562
- auto: false,
1563
- }),
1564
- ),
1565
- )
1566
-
1567
- const summary = (await svc.messages({ sessionID: session.id })).find(
1568
- (item) => item.info.role === "assistant" && item.info.summary,
1569
- )
1570
-
1571
- expect(summary?.info.role).toBe("assistant")
1572
- expect(summary?.parts.some((part) => part.type === "tool")).toBe(false)
1573
- } finally {
1574
- await rt.dispose()
1575
- }
1576
- },
1577
- })
1578
- })
1579
-
1580
- test("summarizes only the head while keeping recent tail out of summary input", async () => {
1581
- const stub = llm()
1582
- let captured = ""
1583
- stub.push(
1584
- reply("summary", (input) => {
1585
- captured = JSON.stringify(input.messages)
1586
- }),
1587
- )
1588
-
1589
- await using tmp = await tmpdir({ git: true })
1590
- await Instance.provide({
1591
- directory: tmp.path,
1592
- fn: async () => {
1593
- const session = await svc.create({})
1594
- await user(session.id, "older context")
1595
- await user(session.id, "keep this turn")
1596
- await user(session.id, "and this one too")
1597
- await SessionCompaction.create({
1598
- sessionID: session.id,
1599
- agent: "build",
1600
- model: ref,
1601
- auto: false,
1602
- })
1603
-
1604
- const rt = liveRuntime(stub.layer, wide())
1605
- try {
1606
- const msgs = await svc.messages({ sessionID: session.id })
1607
- const parent = msgs.at(-1)?.info.id
1608
- expect(parent).toBeTruthy()
1609
- await rt.runPromise(
1610
- SessionCompaction.Service.use((svc) =>
1611
- svc.process({
1612
- parentID: parent!,
1613
- messages: msgs,
1614
- sessionID: session.id,
1615
- auto: false,
1616
- }),
1617
- ),
1618
- )
1619
-
1620
- expect(captured).toContain("older context")
1621
- expect(captured).not.toContain("keep this turn")
1622
- expect(captured).not.toContain("and this one too")
1623
- expect(captured).not.toContain("What did we do so far?")
1624
- } finally {
1625
- await rt.dispose()
1626
- }
1627
- },
1628
- })
1629
- })
1630
-
1631
- test("anchors repeated compactions with the previous summary", async () => {
1632
- const stub = llm()
1633
- let captured = ""
1634
- stub.push(reply("summary one"))
1635
- stub.push(
1636
- reply("summary two", (input) => {
1637
- captured = JSON.stringify(input.messages)
1638
- }),
1639
- )
1640
-
1641
- await using tmp = await tmpdir({ git: true })
1642
- await Instance.provide({
1643
- directory: tmp.path,
1644
- fn: async () => {
1645
- const session = await svc.create({})
1646
- await user(session.id, "older context")
1647
- await user(session.id, "keep this turn")
1648
- await SessionCompaction.create({
1649
- sessionID: session.id,
1650
- agent: "build",
1651
- model: ref,
1652
- auto: false,
1653
- })
1654
-
1655
- const rt = liveRuntime(stub.layer, wide())
1656
- try {
1657
- let msgs = await svc.messages({ sessionID: session.id })
1658
- let parent = msgs.at(-1)?.info.id
1659
- expect(parent).toBeTruthy()
1660
- await rt.runPromise(
1661
- SessionCompaction.Service.use((svc) =>
1662
- svc.process({
1663
- parentID: parent!,
1664
- messages: msgs,
1665
- sessionID: session.id,
1666
- auto: false,
1667
- }),
1668
- ),
1669
- )
1670
-
1671
- await user(session.id, "latest turn")
1672
- await SessionCompaction.create({
1673
- sessionID: session.id,
1674
- agent: "build",
1675
- model: ref,
1676
- auto: false,
1677
- })
1678
-
1679
- msgs = MessageV2.filterCompacted(MessageV2.stream(session.id))
1680
- parent = msgs.at(-1)?.info.id
1681
- expect(parent).toBeTruthy()
1682
- await rt.runPromise(
1683
- SessionCompaction.Service.use((svc) =>
1684
- svc.process({
1685
- parentID: parent!,
1686
- messages: msgs,
1687
- sessionID: session.id,
1688
- auto: false,
1689
- }),
1690
- ),
1691
- )
1692
-
1693
- expect(captured).toContain("<previous-summary>")
1694
- expect(captured).toContain("summary one")
1695
- expect(captured.match(/summary one/g)?.length).toBe(1)
1696
- expect(captured).toContain("## Constraints & Preferences")
1697
- expect(captured).toContain("## Progress")
1698
- } finally {
1699
- await rt.dispose()
1700
- }
1701
- },
1702
- })
1703
- })
1704
-
1705
- test("keeps recent pre-compaction turns across repeated compactions", async () => {
1706
- const stub = llm()
1707
- stub.push(reply("summary one"))
1708
- stub.push(reply("summary two"))
1709
- await using tmp = await tmpdir()
1710
- await Instance.provide({
1711
- directory: tmp.path,
1712
- fn: async () => {
1713
- const session = await svc.create({})
1714
- const u1 = await user(session.id, "one")
1715
- const u2 = await user(session.id, "two")
1716
- const u3 = await user(session.id, "three")
1717
- await SessionCompaction.create({
1718
- sessionID: session.id,
1719
- agent: "build",
1720
- model: ref,
1721
- auto: false,
1722
- })
1723
-
1724
- const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 10_000 }))
1725
- try {
1726
- let msgs = await svc.messages({ sessionID: session.id })
1727
- let parent = msgs.at(-1)?.info.id
1728
- expect(parent).toBeTruthy()
1729
- await rt.runPromise(
1730
- SessionCompaction.Service.use((svc) =>
1731
- svc.process({
1732
- parentID: parent!,
1733
- messages: msgs,
1734
- sessionID: session.id,
1735
- auto: false,
1736
- }),
1737
- ),
1738
- )
1739
-
1740
- const u4 = await user(session.id, "four")
1741
- await SessionCompaction.create({
1742
- sessionID: session.id,
1743
- agent: "build",
1744
- model: ref,
1745
- auto: false,
1746
- })
1747
-
1748
- msgs = MessageV2.filterCompacted(MessageV2.stream(session.id))
1749
- parent = msgs.at(-1)?.info.id
1750
- expect(parent).toBeTruthy()
1751
- await rt.runPromise(
1752
- SessionCompaction.Service.use((svc) =>
1753
- svc.process({
1754
- parentID: parent!,
1755
- messages: msgs,
1756
- sessionID: session.id,
1757
- auto: false,
1758
- }),
1759
- ),
1760
- )
1761
-
1762
- const filtered = MessageV2.filterCompacted(MessageV2.stream(session.id))
1763
- const ids = filtered.map((msg) => msg.info.id)
1764
-
1765
- expect(ids).not.toContain(u1.id)
1766
- expect(ids).not.toContain(u2.id)
1767
- expect(ids).toContain(u3.id)
1768
- expect(ids).toContain(u4.id)
1769
- expect(filtered.some((msg) => msg.info.role === "assistant" && msg.info.summary)).toBe(true)
1770
- expect(
1771
- filtered.some((msg) => msg.info.role === "user" && msg.parts.some((part) => part.type === "compaction")),
1772
- ).toBe(true)
1773
- } finally {
1774
- await rt.dispose()
1775
- }
1776
- },
1777
- })
1778
- })
1779
-
1780
- test("ignores previous summaries when sizing the retained tail", async () => {
1781
- await using tmp = await tmpdir()
1782
- await Instance.provide({
1783
- directory: tmp.path,
1784
- fn: async () => {
1785
- const session = await svc.create({})
1786
- await user(session.id, "older")
1787
- const keep = await user(session.id, "keep this turn")
1788
- const keepReply = await assistant(session.id, keep.id, tmp.path)
1789
- await svc.updatePart({
1790
- id: PartID.ascending(),
1791
- messageID: keepReply.id,
1792
- sessionID: session.id,
1793
- type: "text",
1794
- text: "keep reply",
1795
- })
1796
-
1797
- await SessionCompaction.create({
1798
- sessionID: session.id,
1799
- agent: "build",
1800
- model: ref,
1801
- auto: false,
1802
- })
1803
- const firstCompaction = (await svc.messages({ sessionID: session.id })).at(-1)?.info.id
1804
- expect(firstCompaction).toBeTruthy()
1805
- await summaryAssistant(session.id, firstCompaction!, tmp.path, "summary ".repeat(800))
1806
-
1807
- const recent = await user(session.id, "recent turn")
1808
- const recentReply = await assistant(session.id, recent.id, tmp.path)
1809
- await svc.updatePart({
1810
- id: PartID.ascending(),
1811
- messageID: recentReply.id,
1812
- sessionID: session.id,
1813
- type: "text",
1814
- text: "recent reply",
1815
- })
1816
-
1817
- await SessionCompaction.create({
1818
- sessionID: session.id,
1819
- agent: "build",
1820
- model: ref,
1821
- auto: false,
1822
- })
1823
-
1824
- const rt = runtime("continue", Plugin.defaultLayer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 500 }))
1825
- try {
1826
- const msgs = await svc.messages({ sessionID: session.id })
1827
- const parent = msgs.at(-1)?.info.id
1828
- expect(parent).toBeTruthy()
1829
- await rt.runPromise(
1830
- SessionCompaction.Service.use((svc) =>
1831
- svc.process({
1832
- parentID: parent!,
1833
- messages: msgs,
1834
- sessionID: session.id,
1835
- auto: false,
1836
- }),
1837
- ),
1838
- )
1839
-
1840
- const part = await lastCompactionPart(session.id)
1841
- expect(part?.type).toBe("compaction")
1842
- expect(part?.tail_start_id).toBe(keep.id)
1843
- } finally {
1844
- await rt.dispose()
1845
- }
1846
- },
1847
- })
1848
- })
1849
- })
1850
-
1851
- describe("util.token.estimate", () => {
1852
- test("estimates tokens from text (4 chars per token)", () => {
1853
- const text = "x".repeat(4000)
1854
- expect(Token.estimate(text)).toBe(1000)
1855
- })
1856
-
1857
- test("estimates tokens from larger text", () => {
1858
- const text = "y".repeat(20_000)
1859
- expect(Token.estimate(text)).toBe(5000)
1860
- })
1861
-
1862
- test("returns 0 for empty string", () => {
1863
- expect(Token.estimate("")).toBe(0)
1864
- })
1865
- })
1866
-
1867
- describe("SessionNs.getUsage", () => {
1868
- test("normalizes standard usage to token format", () => {
1869
- const model = createModel({ context: 100_000, output: 32_000 })
1870
- const result = SessionNs.getUsage({
1871
- model,
1872
- usage: {
1873
- inputTokens: 1000,
1874
- outputTokens: 500,
1875
- totalTokens: 1500,
1876
- inputTokenDetails: {
1877
- noCacheTokens: undefined,
1878
- cacheReadTokens: undefined,
1879
- cacheWriteTokens: undefined,
1880
- },
1881
- outputTokenDetails: {
1882
- textTokens: undefined,
1883
- reasoningTokens: undefined,
1884
- },
1885
- },
1886
- })
1887
-
1888
- expect(result.tokens.input).toBe(1000)
1889
- expect(result.tokens.output).toBe(500)
1890
- expect(result.tokens.reasoning).toBe(0)
1891
- expect(result.tokens.cache.read).toBe(0)
1892
- expect(result.tokens.cache.write).toBe(0)
1893
- })
1894
-
1895
- test("extracts cached tokens to cache.read", () => {
1896
- const model = createModel({ context: 100_000, output: 32_000 })
1897
- const result = SessionNs.getUsage({
1898
- model,
1899
- usage: {
1900
- inputTokens: 1000,
1901
- outputTokens: 500,
1902
- totalTokens: 1500,
1903
- inputTokenDetails: {
1904
- noCacheTokens: 800,
1905
- cacheReadTokens: 200,
1906
- cacheWriteTokens: undefined,
1907
- },
1908
- outputTokenDetails: {
1909
- textTokens: undefined,
1910
- reasoningTokens: undefined,
1911
- },
1912
- },
1913
- })
1914
-
1915
- expect(result.tokens.input).toBe(800)
1916
- expect(result.tokens.cache.read).toBe(200)
1917
- })
1918
-
1919
- test("handles anthropic cache write metadata", () => {
1920
- const model = createModel({ context: 100_000, output: 32_000 })
1921
- const result = SessionNs.getUsage({
1922
- model,
1923
- usage: {
1924
- inputTokens: 1000,
1925
- outputTokens: 500,
1926
- totalTokens: 1500,
1927
- inputTokenDetails: {
1928
- noCacheTokens: undefined,
1929
- cacheReadTokens: undefined,
1930
- cacheWriteTokens: undefined,
1931
- },
1932
- outputTokenDetails: {
1933
- textTokens: undefined,
1934
- reasoningTokens: undefined,
1935
- },
1936
- },
1937
- metadata: {
1938
- anthropic: {
1939
- cacheCreationInputTokens: 300,
1940
- },
1941
- },
1942
- })
1943
-
1944
- expect(result.tokens.cache.write).toBe(300)
1945
- })
1946
-
1947
- test("subtracts cached tokens for anthropic provider", () => {
1948
- const model = createModel({ context: 100_000, output: 32_000 })
1949
- // AI SDK v6 normalizes inputTokens to include cached tokens for all providers
1950
- const result = SessionNs.getUsage({
1951
- model,
1952
- usage: {
1953
- inputTokens: 1000,
1954
- outputTokens: 500,
1955
- totalTokens: 1500,
1956
- inputTokenDetails: {
1957
- noCacheTokens: 800,
1958
- cacheReadTokens: 200,
1959
- cacheWriteTokens: undefined,
1960
- },
1961
- outputTokenDetails: {
1962
- textTokens: undefined,
1963
- reasoningTokens: undefined,
1964
- },
1965
- },
1966
- metadata: {
1967
- anthropic: {},
1968
- },
1969
- })
1970
-
1971
- expect(result.tokens.input).toBe(800)
1972
- expect(result.tokens.cache.read).toBe(200)
1973
- })
1974
-
1975
- test("separates reasoning tokens from output tokens", () => {
1976
- const model = createModel({ context: 100_000, output: 32_000 })
1977
- const result = SessionNs.getUsage({
1978
- model,
1979
- usage: {
1980
- inputTokens: 1000,
1981
- outputTokens: 500,
1982
- totalTokens: 1500,
1983
- inputTokenDetails: {
1984
- noCacheTokens: undefined,
1985
- cacheReadTokens: undefined,
1986
- cacheWriteTokens: undefined,
1987
- },
1988
- outputTokenDetails: {
1989
- textTokens: 400,
1990
- reasoningTokens: 100,
1991
- },
1992
- },
1993
- })
1994
-
1995
- expect(result.tokens.input).toBe(1000)
1996
- expect(result.tokens.output).toBe(400)
1997
- expect(result.tokens.reasoning).toBe(100)
1998
- expect(result.tokens.total).toBe(1500)
1999
- })
2000
-
2001
- test("does not double count reasoning tokens in cost", () => {
2002
- const model = createModel({
2003
- context: 100_000,
2004
- output: 32_000,
2005
- cost: {
2006
- input: 0,
2007
- output: 15,
2008
- cache: { read: 0, write: 0 },
2009
- },
2010
- })
2011
- const result = SessionNs.getUsage({
2012
- model,
2013
- usage: {
2014
- inputTokens: 0,
2015
- outputTokens: 1_000_000,
2016
- totalTokens: 1_000_000,
2017
- inputTokenDetails: {
2018
- noCacheTokens: undefined,
2019
- cacheReadTokens: undefined,
2020
- cacheWriteTokens: undefined,
2021
- },
2022
- outputTokenDetails: {
2023
- textTokens: 750_000,
2024
- reasoningTokens: 250_000,
2025
- },
2026
- },
2027
- })
2028
-
2029
- expect(result.tokens.output).toBe(750_000)
2030
- expect(result.tokens.reasoning).toBe(250_000)
2031
- expect(result.cost).toBe(15)
2032
- })
2033
-
2034
- test("handles undefined optional values gracefully", () => {
2035
- const model = createModel({ context: 100_000, output: 32_000 })
2036
- const result = SessionNs.getUsage({
2037
- model,
2038
- usage: {
2039
- inputTokens: 0,
2040
- outputTokens: 0,
2041
- totalTokens: 0,
2042
- inputTokenDetails: {
2043
- noCacheTokens: undefined,
2044
- cacheReadTokens: undefined,
2045
- cacheWriteTokens: undefined,
2046
- },
2047
- outputTokenDetails: {
2048
- textTokens: undefined,
2049
- reasoningTokens: undefined,
2050
- },
2051
- },
2052
- })
2053
-
2054
- expect(result.tokens.input).toBe(0)
2055
- expect(result.tokens.output).toBe(0)
2056
- expect(result.tokens.reasoning).toBe(0)
2057
- expect(result.tokens.cache.read).toBe(0)
2058
- expect(result.tokens.cache.write).toBe(0)
2059
- expect(Number.isNaN(result.cost)).toBe(false)
2060
- })
2061
-
2062
- test("calculates cost correctly", () => {
2063
- const model = createModel({
2064
- context: 100_000,
2065
- output: 32_000,
2066
- cost: {
2067
- input: 3,
2068
- output: 15,
2069
- cache: { read: 0.3, write: 3.75 },
2070
- },
2071
- })
2072
- const result = SessionNs.getUsage({
2073
- model,
2074
- usage: {
2075
- inputTokens: 1_000_000,
2076
- outputTokens: 100_000,
2077
- totalTokens: 1_100_000,
2078
- inputTokenDetails: {
2079
- noCacheTokens: undefined,
2080
- cacheReadTokens: undefined,
2081
- cacheWriteTokens: undefined,
2082
- },
2083
- outputTokenDetails: {
2084
- textTokens: undefined,
2085
- reasoningTokens: undefined,
2086
- },
2087
- },
2088
- })
2089
-
2090
- expect(result.cost).toBe(3 + 1.5)
2091
- })
2092
- test("uses openrouter provider cost when available", () => {
2093
- const model = createModel({
2094
- context: 100_000,
2095
- output: 32_000,
2096
- cost: {
2097
- input: 3,
2098
- output: 15,
2099
- cache: { read: 0.3, write: 3.75 },
2100
- },
2101
- })
2102
- const result = SessionNs.getUsage({
2103
- model,
2104
- usage: {
2105
- inputTokens: 1_000_000,
2106
- outputTokens: 100_000,
2107
- totalTokens: 1_100_000,
2108
- inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
2109
- outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
2110
- },
2111
- metadata: {
2112
- openrouter: {
2113
- usage: {
2114
- cost: 0.42, // Provider-reported cost should be used instead of calculated
2115
- },
2116
- },
2117
- },
2118
- })
2119
-
2120
- // Should use the provider cost (0.42) instead of calculated cost (4.5)
2121
- expect(result.cost).toBe(0.42)
2122
- })
2123
-
2124
- test("falls back to calculated cost when openrouter cost is not available", () => {
2125
- const model = createModel({
2126
- context: 100_000,
2127
- output: 32_000,
2128
- cost: {
2129
- input: 3,
2130
- output: 15,
2131
- cache: { read: 0.3, write: 3.75 },
2132
- },
2133
- })
2134
- const result = SessionNs.getUsage({
2135
- model,
2136
- usage: {
2137
- inputTokens: 1_000_000,
2138
- outputTokens: 100_000,
2139
- totalTokens: 1_100_000,
2140
- inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
2141
- outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
2142
- },
2143
- metadata: {
2144
- openrouter: {
2145
- usage: {
2146
- // cost is undefined
2147
- },
2148
- },
2149
- },
2150
- })
2151
-
2152
- // Should fall back to calculated cost
2153
- expect(result.cost).toBe(3 + 1.5)
2154
- })
2155
-
2156
- test("falls back to calculated cost when openrouter metadata is empty", () => {
2157
- const model = createModel({
2158
- context: 100_000,
2159
- output: 32_000,
2160
- cost: {
2161
- input: 3,
2162
- output: 15,
2163
- cache: { read: 0.3, write: 3.75 },
2164
- },
2165
- })
2166
- const result = SessionNs.getUsage({
2167
- model,
2168
- usage: {
2169
- inputTokens: 1_000_000,
2170
- outputTokens: 100_000,
2171
- totalTokens: 1_100_000,
2172
- inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
2173
- outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
2174
- },
2175
- metadata: {
2176
- openrouter: {},
2177
- },
2178
- })
2179
-
2180
- // Should fall back to calculated cost
2181
- expect(result.cost).toBe(3 + 1.5)
2182
- })
2183
-
2184
- test("uses upstreamInferenceCost for Saeeol provider", () => {
2185
- const model = createModel({
2186
- context: 100_000,
2187
- output: 32_000,
2188
- cost: {
2189
- input: 3,
2190
- output: 15,
2191
- cache: { read: 0.3, write: 3.75 },
2192
- },
2193
- })
2194
- const provider = { id: "saeeol" } as Provider.Info
2195
- const result = SessionNs.getUsage({
2196
- model,
2197
- provider,
2198
- usage: {
2199
- inputTokens: 1_000_000,
2200
- outputTokens: 100_000,
2201
- totalTokens: 1_100_000,
2202
- inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
2203
- outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
2204
- },
2205
- metadata: {
2206
- openrouter: {
2207
- usage: {
2208
- cost: 0.01, // OpenRouter 5% fee
2209
- costDetails: {
2210
- upstreamInferenceCost: 0.2, // Actual inference cost
2211
- },
2212
- },
2213
- },
2214
- },
2215
- })
2216
-
2217
- // Should use upstreamInferenceCost for Saeeol provider (BYOK)
2218
- expect(result.cost).toBe(0.2)
2219
- })
2220
-
2221
- test("uses regular cost for OpenRouter provider", () => {
2222
- const model = createModel({
2223
- context: 100_000,
2224
- output: 32_000,
2225
- cost: {
2226
- input: 3,
2227
- output: 15,
2228
- cache: { read: 0.3, write: 3.75 },
2229
- },
2230
- })
2231
- const provider = { id: "openrouter" } as Provider.Info
2232
- const result = SessionNs.getUsage({
2233
- model,
2234
- provider,
2235
- usage: {
2236
- inputTokens: 1_000_000,
2237
- outputTokens: 100_000,
2238
- totalTokens: 1_100_000,
2239
- inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
2240
- outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
2241
- },
2242
- metadata: {
2243
- openrouter: {
2244
- usage: {
2245
- cost: 0.5, // Regular OpenRouter cost
2246
- costDetails: {
2247
- upstreamInferenceCost: 0.45,
2248
- },
2249
- },
2250
- },
2251
- },
2252
- })
2253
-
2254
- // Should use regular cost for OpenRouter provider
2255
- expect(result.cost).toBe(0.5)
2256
- })
2257
-
2258
- test("falls back to regular cost when provider is not specified", () => {
2259
- const model = createModel({
2260
- context: 100_000,
2261
- output: 32_000,
2262
- cost: {
2263
- input: 3,
2264
- output: 15,
2265
- cache: { read: 0.3, write: 3.75 },
2266
- },
2267
- })
2268
- const result = SessionNs.getUsage({
2269
- model,
2270
- usage: {
2271
- inputTokens: 1_000_000,
2272
- outputTokens: 100_000,
2273
- totalTokens: 1_100_000,
2274
- inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
2275
- outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
2276
- },
2277
- metadata: {
2278
- openrouter: {
2279
- usage: {
2280
- cost: 0.3,
2281
- costDetails: {
2282
- upstreamInferenceCost: 0.25,
2283
- },
2284
- },
2285
- },
2286
- },
2287
- })
2288
-
2289
- // Should use regular cost when provider is not specified
2290
- expect(result.cost).toBe(0.3)
2291
- })
2292
-
2293
- test("uses regular cost when upstreamInferenceCost is missing for Saeeol", () => {
2294
- const model = createModel({
2295
- context: 100_000,
2296
- output: 32_000,
2297
- cost: {
2298
- input: 3,
2299
- output: 15,
2300
- cache: { read: 0.3, write: 3.75 },
2301
- },
2302
- })
2303
- const provider = { id: "saeeol" } as Provider.Info
2304
- const result = SessionNs.getUsage({
2305
- model,
2306
- provider,
2307
- usage: {
2308
- inputTokens: 1_000_000,
2309
- outputTokens: 100_000,
2310
- totalTokens: 1_100_000,
2311
- inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
2312
- outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
2313
- },
2314
- metadata: {
2315
- openrouter: {
2316
- usage: {
2317
- cost: 0.01,
2318
- // costDetails is missing
2319
- },
2320
- },
2321
- },
2322
- })
2323
-
2324
- // When upstream cost is missing for Saeeol, fall back to regular cost field
2325
- expect(result.cost).toBe(0.01)
2326
- })
2327
-
2328
- // Tests for Anthropic Messages / OpenAI Responses / Vercel AI Gateway cost extraction
2329
- // live in test/saeeol/provider-cost.test.ts (saeeol_change).
2330
-
2331
- test.each(["@ai-sdk/anthropic", "@ai-sdk/amazon-bedrock", "@ai-sdk/google-vertex/anthropic"])(
2332
- "computes total from components for %s models",
2333
- (npm) => {
2334
- const model = createModel({ context: 100_000, output: 32_000, npm })
2335
- // AI SDK v6: inputTokens includes cached tokens for all providers
2336
- const usage = {
2337
- inputTokens: 1000,
2338
- outputTokens: 500,
2339
- totalTokens: 1500,
2340
- inputTokenDetails: {
2341
- noCacheTokens: 800,
2342
- cacheReadTokens: 200,
2343
- cacheWriteTokens: undefined,
2344
- },
2345
- outputTokenDetails: {
2346
- textTokens: undefined,
2347
- reasoningTokens: undefined,
2348
- },
2349
- }
2350
- if (npm === "@ai-sdk/amazon-bedrock") {
2351
- const result = SessionNs.getUsage({
2352
- model,
2353
- usage,
2354
- metadata: {
2355
- bedrock: {
2356
- usage: {
2357
- cacheWriteInputTokens: 300,
2358
- },
2359
- },
2360
- },
2361
- })
2362
-
2363
- // inputTokens (1000) includes cache, so adjusted = 1000 - 200 - 300 = 500
2364
- expect(result.tokens.input).toBe(500)
2365
- expect(result.tokens.cache.read).toBe(200)
2366
- expect(result.tokens.cache.write).toBe(300)
2367
- // total = adjusted (500) + output (500) + cacheRead (200) + cacheWrite (300)
2368
- expect(result.tokens.total).toBe(1500)
2369
- return
2370
- }
2371
-
2372
- const result = SessionNs.getUsage({
2373
- model,
2374
- usage,
2375
- metadata: {
2376
- anthropic: {
2377
- cacheCreationInputTokens: 300,
2378
- },
2379
- },
2380
- })
2381
-
2382
- // inputTokens (1000) includes cache, so adjusted = 1000 - 200 - 300 = 500
2383
- expect(result.tokens.input).toBe(500)
2384
- expect(result.tokens.cache.read).toBe(200)
2385
- expect(result.tokens.cache.write).toBe(300)
2386
- // total = adjusted (500) + output (500) + cacheRead (200) + cacheWrite (300)
2387
- expect(result.tokens.total).toBe(1500)
2388
- },
2389
- )
2390
-
2391
- test("extracts cache write tokens from vertex metadata key", () => {
2392
- const model = createModel({ context: 100_000, output: 32_000, npm: "@ai-sdk/google-vertex/anthropic" })
2393
- const result = SessionNs.getUsage({
2394
- model,
2395
- usage: {
2396
- inputTokens: 1000,
2397
- outputTokens: 500,
2398
- totalTokens: 1500,
2399
- inputTokenDetails: {
2400
- noCacheTokens: 800,
2401
- cacheReadTokens: 200,
2402
- cacheWriteTokens: undefined,
2403
- },
2404
- outputTokenDetails: {
2405
- textTokens: undefined,
2406
- reasoningTokens: undefined,
2407
- },
2408
- },
2409
- metadata: {
2410
- vertex: {
2411
- cacheCreationInputTokens: 300,
2412
- },
2413
- },
2414
- })
2415
-
2416
- expect(result.tokens.input).toBe(500)
2417
- expect(result.tokens.cache.read).toBe(200)
2418
- expect(result.tokens.cache.write).toBe(300)
2419
- })
2420
- })