saeeol 1.3.0 → 1.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +72 -0
- package/BUN_SHELL_MIGRATION_PLAN.md +136 -0
- package/Dockerfile +18 -0
- package/assets/saeeol.ico +0 -0
- package/bin/saeeol.cjs +3 -1
- package/bunfig.toml +7 -0
- package/database.db +0 -0
- package/drizzle.config.ts +10 -0
- package/git +0 -0
- package/migration/20260127222353_familiar_lady_ursula/migration.sql +90 -0
- package/migration/20260127222353_familiar_lady_ursula/snapshot.json +796 -0
- package/migration/20260211171708_add_project_commands/migration.sql +1 -0
- package/migration/20260211171708_add_project_commands/snapshot.json +806 -0
- package/migration/20260213144116_wakeful_the_professor/migration.sql +11 -0
- package/migration/20260213144116_wakeful_the_professor/snapshot.json +897 -0
- package/migration/20260225215848_workspace/migration.sql +7 -0
- package/migration/20260225215848_workspace/snapshot.json +959 -0
- package/migration/20260227213759_add_session_workspace_id/migration.sql +2 -0
- package/migration/20260227213759_add_session_workspace_id/snapshot.json +983 -0
- package/migration/20260228203230_blue_harpoon/migration.sql +17 -0
- package/migration/20260228203230_blue_harpoon/snapshot.json +1102 -0
- package/migration/20260303231226_add_workspace_fields/migration.sql +5 -0
- package/migration/20260303231226_add_workspace_fields/snapshot.json +1013 -0
- package/migration/20260309230000_move_org_to_state/migration.sql +3 -0
- package/migration/20260309230000_move_org_to_state/snapshot.json +1156 -0
- package/migration/20260312043431_session_message_cursor/migration.sql +4 -0
- package/migration/20260312043431_session_message_cursor/snapshot.json +1168 -0
- package/migration/20260323234822_events/migration.sql +13 -0
- package/migration/20260323234822_events/snapshot.json +1271 -0
- package/migration/20260410174513_workspace-name/migration.sql +16 -0
- package/migration/20260410174513_workspace-name/snapshot.json +1271 -0
- package/migration/20260413175956_chief_energizer/migration.sql +13 -0
- package/migration/20260413175956_chief_energizer/snapshot.json +1399 -0
- package/migration/20260423070820_add_icon_url_override/migration.sql +2 -0
- package/migration/20260423070820_add_icon_url_override/snapshot.json +1409 -0
- package/migration/20260428004200_add_session_path/migration.sql +1 -0
- package/migration/20260428004200_add_session_path/snapshot.json +1419 -0
- package/npm/bin/saeeol +42 -0
- package/npm/package.json +39 -0
- package/npm/postinstall.js +162 -0
- package/package.json +201 -207
- package/parsers-config.ts +289 -0
- package/script/build.ts +393 -0
- package/script/check-migrations.ts +16 -0
- package/script/fix-node-pty.ts +34 -0
- package/script/generate.ts +23 -0
- package/script/postinstall.mjs +189 -0
- package/script/publish.ts +200 -0
- package/script/run-workspace-server +106 -0
- package/script/schema.ts +63 -0
- package/script/test-runner.ts +420 -0
- package/script/time.ts +6 -0
- package/script/trace-imports.ts +153 -0
- package/script/upgrade-opentui.ts +64 -0
- package/scripts/diff-sdk-types.sh +52 -0
- package/specs/effect/facades.md +221 -0
- package/specs/effect/http-api.md +401 -0
- package/specs/effect/instance-context.md +309 -0
- package/specs/effect/loose-ends.md +34 -0
- package/specs/effect/migration.md +299 -0
- package/specs/effect/routes.md +64 -0
- package/specs/effect/schema.md +399 -0
- package/specs/effect/server-package.md +668 -0
- package/specs/effect/tools.md +90 -0
- package/specs/tui-plugins.md +433 -0
- package/specs/v2/api.ts +67 -0
- package/specs/v2/keymappings.md +10 -0
- package/specs/v2/message-shape.md +136 -0
- package/src/acp/agent-message.ts +1 -1
- package/src/acp/agent-utils.ts +1 -1
- package/src/boxes/ansi.ts +17 -0
- package/src/boxes/atomic-write.ts +35 -0
- package/src/boxes/b64.ts +58 -0
- package/src/boxes/bash-security.ts +129 -0
- package/src/boxes/bom.ts +18 -0
- package/src/boxes/cancel.ts +16 -0
- package/src/boxes/chop.ts +12 -0
- package/src/boxes/clamp.ts +3 -0
- package/src/boxes/compact.ts +9 -0
- package/src/boxes/cost-tracker.ts +116 -0
- package/src/boxes/dataurl.ts +29 -0
- package/src/boxes/delay.ts +27 -0
- package/src/boxes/diff-apply.ts +53 -0
- package/src/boxes/disposable.ts +13 -0
- package/src/boxes/err.ts +34 -0
- package/src/boxes/human.ts +47 -0
- package/src/boxes/iife.ts +9 -0
- package/src/boxes/latch.ts +8 -0
- package/src/boxes/memory.ts +198 -0
- package/src/boxes/net.ts +16 -0
- package/src/boxes/plural.ts +4 -0
- package/src/boxes/puny.ts +21 -0
- package/src/boxes/retry.ts +49 -0
- package/src/boxes/rwlock.ts +41 -0
- package/src/boxes/schedule.ts +71 -0
- package/src/boxes/scope.ts +21 -0
- package/src/boxes/tokens.ts +9 -0
- package/src/boxes/ttl-cache.ts +63 -0
- package/src/boxes/typed-event.ts +51 -0
- package/src/boxes/uid.ts +50 -0
- package/src/boxes/wave6.test.ts +296 -0
- package/src/boxes/wildcard.ts +58 -0
- package/src/bus/global.ts +1 -1
- package/src/cli/cmd/github-run-api.ts +2 -2
- package/src/cli/cmd/run-events.ts +2 -2
- package/src/cli/cmd/tui/component/logo.tsx +1 -1
- package/src/cli/cmd/tui/component/prompt/use-prompt-memos.ts +2 -2
- package/src/cli/cmd/tui/context/app/editor-zed.ts +1 -1
- package/src/cli/cmd/tui/context/app/editor.ts +1 -1
- package/src/cli/cmd/tui/context/app/theme.tsx +1 -1
- package/src/cli/cmd/tui/preflight.ts +138 -0
- package/src/cli/cmd/tui/thread.ts +20 -0
- package/src/cli/cmd/tui/util/revert-diff.ts +1 -1
- package/src/overlay/cli/cmd/roll-call-call.ts +1 -1
- package/src/overlay/cost-tracker/format.ts +1 -1
- package/src/overlay/cost-tracker/index.ts +4 -4
- package/src/overlay/cost-tracker/state.ts +2 -2
- package/src/overlay/cost-tracker/types.ts +2 -2
- package/src/overlay/memory/age.ts +1 -1
- package/src/overlay/memory/index.ts +4 -4
- package/src/overlay/memory/paths.ts +2 -2
- package/src/overlay/memory/scan.ts +1 -1
- package/src/overlay/memory/types.ts +2 -2
- package/src/overlay/tool/bash-security.ts +3 -3
- package/src/overlay/util/url.ts +1 -1
- package/src/plugin/codex-auth.ts +1 -1
- package/src/provider/model-cache.ts +2 -2
- package/src/provider/provider-resolve.ts +3 -3
- package/src/provider/transform-message.ts +1 -1
- package/src/server/routes/game.ts +284 -0
- package/src/server/server.ts +2 -0
- package/src/session/core/compaction/compaction-helpers.ts +1 -1
- package/src/session/core/compaction/compaction.ts +1 -1
- package/src/session/core/session.ts +2 -0
- package/src/sessions/ingest-queue.ts +2 -2
- package/src/sessions/remote-ws.ts +1 -1
- package/src/tool/workflow/question.ts +1 -1
- package/src/util/abort.ts +1 -1
- package/src/util/bom.ts +2 -2
- package/src/util/color.ts +1 -1
- package/src/util/data-url.ts +1 -1
- package/src/util/defer.ts +1 -1
- package/src/util/error.ts +2 -2
- package/src/util/filesystem.ts +2 -2
- package/src/util/format.ts +1 -1
- package/src/util/iife.ts +1 -1
- package/src/util/local-context.ts +1 -1
- package/src/util/locale.ts +2 -2
- package/src/util/lock.ts +1 -1
- package/src/util/network.ts +1 -1
- package/src/util/signal.ts +1 -1
- package/src/util/token.ts +1 -1
- package/src/util/wildcard.ts +1 -1
- package/sst-env.d.ts +10 -0
- package/test/AGENTS.md +133 -0
- package/test/account/repo.test.ts +352 -0
- package/test/account/service.test.ts +456 -0
- package/test/acp/agent-interface.test.ts +51 -0
- package/test/acp/event-subscription.test.ts +725 -0
- package/test/agent/agent.test.ts +890 -0
- package/test/auth/auth.test.ts +86 -0
- package/test/bun/registry.test.ts +75 -0
- package/test/bus/bus-effect.test.ts +161 -0
- package/test/bus/bus-integration.test.ts +87 -0
- package/test/bus/bus.test.ts +219 -0
- package/test/cli/account.test.ts +26 -0
- package/test/cli/auto-mode.test.ts +75 -0
- package/test/cli/bin-saeeol.test.ts +8 -0
- package/test/cli/cmd/tui/prompt-part.test.ts +47 -0
- package/test/cli/cmd/tui/prompt-traits.test.ts +38 -0
- package/test/cli/cmd/tui/sync.test.tsx +159 -0
- package/test/cli/error.test.ts +18 -0
- package/test/cli/github-action.test.ts +198 -0
- package/test/cli/github-remote.test.ts +85 -0
- package/test/cli/import.test.ts +97 -0
- package/test/cli/install-artifact.test.ts +72 -0
- package/test/cli/plugin-auth-picker.test.ts +120 -0
- package/test/cli/pr.test.ts +59 -0
- package/test/cli/tui/editor-context-zed.test.ts +356 -0
- package/test/cli/tui/editor-context.test.tsx +228 -0
- package/test/cli/tui/keybind-plugin.test.ts +90 -0
- package/test/cli/tui/markdown.test.ts +161 -0
- package/test/cli/tui/plugin-add.test.ts +111 -0
- package/test/cli/tui/plugin-install.test.ts +87 -0
- package/test/cli/tui/plugin-lifecycle.test.ts +224 -0
- package/test/cli/tui/plugin-loader-entrypoint.test.ts +484 -0
- package/test/cli/tui/plugin-loader-pure.test.ts +71 -0
- package/test/cli/tui/plugin-loader.test.ts +816 -0
- package/test/cli/tui/plugin-toggle.test.ts +157 -0
- package/test/cli/tui/revert-diff.test.ts +35 -0
- package/test/cli/tui/slot-replace.test.tsx +47 -0
- package/test/cli/tui/theme-store.test.ts +54 -0
- package/test/cli/tui/thread.test.ts +28 -0
- package/test/cli/tui/transcript.test.ts +426 -0
- package/test/cli/tui/usage.test.ts +60 -0
- package/test/cli/tui/use-event.test.tsx +175 -0
- package/test/config/agent-color.test.ts +67 -0
- package/test/config/config.test.ts +2544 -0
- package/test/config/fixtures/empty-frontmatter.md +4 -0
- package/test/config/fixtures/frontmatter.md +28 -0
- package/test/config/fixtures/markdown-header.md +11 -0
- package/test/config/fixtures/no-frontmatter.md +1 -0
- package/test/config/fixtures/weird-model-id.md +13 -0
- package/test/config/lsp.test.ts +87 -0
- package/test/config/markdown.test.ts +228 -0
- package/test/config/plugin.test.ts +0 -0
- package/test/config/tui.test.ts +624 -0
- package/test/control-plane/adapters.test.ts +71 -0
- package/test/control-plane/workspace.test.ts +1526 -0
- package/test/effect/app-runtime-logger.test.ts +98 -0
- package/test/effect/config-service.test.ts +65 -0
- package/test/effect/instance-state.test.ts +394 -0
- package/test/effect/run-service.test.ts +89 -0
- package/test/effect/runner.test.ts +523 -0
- package/test/fake/provider.ts +82 -0
- package/test/file/fsmonitor.test.ts +68 -0
- package/test/file/ignore.test.ts +10 -0
- package/test/file/index.test.ts +954 -0
- package/test/file/path-traversal.test.ts +205 -0
- package/test/file/ripgrep.test.ts +226 -0
- package/test/file/watcher.test.ts +249 -0
- package/test/filesystem/filesystem.test.ts +319 -0
- package/test/fixture/db.ts +11 -0
- package/test/fixture/fixture.test.ts +26 -0
- package/test/fixture/fixture.ts +175 -0
- package/test/fixture/flock-worker.ts +72 -0
- package/test/fixture/log-init-worker.ts +62 -0
- package/test/fixture/lsp/fake-lsp-server.js +249 -0
- package/test/fixture/plug-worker.ts +93 -0
- package/test/fixture/plugin-meta-worker.ts +19 -0
- package/test/fixture/skills/agents-sdk/SKILL.md +152 -0
- package/test/fixture/skills/cloudflare/SKILL.md +211 -0
- package/test/fixture/skills/index.json +6 -0
- package/test/fixture/tui-plugin.ts +323 -0
- package/test/fixture/tui-runtime.ts +31 -0
- package/test/format/format.test.ts +272 -0
- package/test/git/git.test.ts +128 -0
- package/test/ide/ide.test.ts +82 -0
- package/test/installation/installation.test.ts +168 -0
- package/test/keybind.test.ts +421 -0
- package/test/lib/effect.ts +53 -0
- package/test/lib/filesystem.ts +10 -0
- package/test/lib/llm-server.ts +778 -0
- package/test/lib/websocket.ts +46 -0
- package/test/lsp/client.test.ts +482 -0
- package/test/lsp/index.test.ts +160 -0
- package/test/lsp/launch.test.ts +22 -0
- package/test/lsp/lifecycle.test.ts +184 -0
- package/test/ltm/ltm.test.ts +230 -0
- package/test/mcp/headers.test.ts +178 -0
- package/test/mcp/lifecycle.test.ts +787 -0
- package/test/mcp/oauth-auto-connect.test.ts +311 -0
- package/test/mcp/oauth-browser.test.ts +276 -0
- package/test/mcp/oauth-callback.test.ts +34 -0
- package/test/memory/abort-leak-webfetch.ts +49 -0
- package/test/memory/abort-leak.test.ts +128 -0
- package/test/patch/patch.test.ts +348 -0
- package/test/permission/arity.test.ts +33 -0
- package/test/permission/next.test.ts +1227 -0
- package/test/permission/next.toConfig.test.ts +110 -0
- package/test/permission-task.test.ts +326 -0
- package/test/plugin/auth-override.test.ts +79 -0
- package/test/plugin/cloudflare.test.ts +68 -0
- package/test/plugin/codex.test.ts +123 -0
- package/test/plugin/github-copilot-models.test.ts +261 -0
- package/test/plugin/install-concurrency.test.ts +140 -0
- package/test/plugin/install.test.ts +570 -0
- package/test/plugin/loader-shared.test.ts +1169 -0
- package/test/plugin/meta.test.ts +137 -0
- package/test/plugin/plugin-contract.test.ts +291 -0
- package/test/plugin/shared.test.ts +88 -0
- package/test/plugin/trigger.test.ts +102 -0
- package/test/plugin/workspace-adapter.test.ts +109 -0
- package/test/preload.ts +77 -0
- package/test/project/instance.test.ts +276 -0
- package/test/project/migrate-global.test.ts +152 -0
- package/test/project/project.test.ts +600 -0
- package/test/project/vcs.test.ts +286 -0
- package/test/project/worktree-remove.test.ts +126 -0
- package/test/project/worktree.test.ts +223 -0
- package/test/provider/amazon-bedrock.test.ts +462 -0
- package/test/provider/copilot/convert-to-copilot-messages.test.ts +523 -0
- package/test/provider/copilot/copilot-chat-model.test.ts +592 -0
- package/test/provider/gitlab-duo.test.ts +413 -0
- package/test/provider/local.test.ts +208 -0
- package/test/provider/models.test.ts +261 -0
- package/test/provider/provider-category.test.ts +190 -0
- package/test/provider/provider.test.ts +2758 -0
- package/test/provider/transform.test.ts +3681 -0
- package/test/pty/pty-output-isolation.test.ts +147 -0
- package/test/pty/pty-session.test.ts +102 -0
- package/test/pty/pty-shell.test.ts +104 -0
- package/test/question/question.test.ts +490 -0
- package/test/saeeol/agent-global-config-dirs.test.ts +24 -0
- package/test/saeeol/agent-manager-tool.test.ts +71 -0
- package/test/saeeol/agent-permission-overrides.test.ts +75 -0
- package/test/saeeol/agent-skill-permissions.test.ts +37 -0
- package/test/saeeol/ask-agent-permissions.test.ts +303 -0
- package/test/saeeol/bash-hierarchy.test.ts +64 -0
- package/test/saeeol/bash-permission-metadata.test.ts +66 -0
- package/test/saeeol/bash-security-extended.test.ts +243 -0
- package/test/saeeol/bedrock-claude-empty-content.test.ts +138 -0
- package/test/saeeol/boxes-integration.test.ts +415 -0
- package/test/saeeol/builtin-skills.test.ts +75 -0
- package/test/saeeol/cleanup.ts +28 -0
- package/test/saeeol/cli/dev-setup.test.ts +74 -0
- package/test/saeeol/cli/roll-call.test.ts +161 -0
- package/test/saeeol/cli-run-auto-helper.test.ts +58 -0
- package/test/saeeol/codex-auth-refresh.test.ts +124 -0
- package/test/saeeol/commit-message/generate.test.ts +188 -0
- package/test/saeeol/commit-message/git-context.test.ts +303 -0
- package/test/saeeol/commit-message-windows.test.ts +38 -0
- package/test/saeeol/compaction-payload-recovery.test.ts +406 -0
- package/test/saeeol/compaction-preservation-audit.test.ts +122 -0
- package/test/saeeol/compaction-skip-guard.test.ts +224 -0
- package/test/saeeol/compaction-smart-select.test.ts +100 -0
- package/test/saeeol/config/config.test.ts +166 -0
- package/test/saeeol/config/indexing-default-plugin.test.ts +82 -0
- package/test/saeeol/config/opentelemetry-default.test.ts +29 -0
- package/test/saeeol/config-gitignore.test.ts +70 -0
- package/test/saeeol/config-injector.test.ts +305 -0
- package/test/saeeol/config-resilience.test.ts +234 -0
- package/test/saeeol/config-validation.test.ts +183 -0
- package/test/saeeol/cost-propagation.test.ts +94 -0
- package/test/saeeol/cost-tracker-extended.test.ts +141 -0
- package/test/saeeol/cost-tracker.test.ts +64 -0
- package/test/saeeol/custom-provider-delete.test.ts +149 -0
- package/test/saeeol/diff-full.test.ts +226 -0
- package/test/saeeol/edit-permission-filediff.test.ts +223 -0
- package/test/saeeol/encoding.test.ts +364 -0
- package/test/saeeol/enhance-prompt.test.ts +61 -0
- package/test/saeeol/ensure-plan-dir.test.ts +32 -0
- package/test/saeeol/errors.test.ts +144 -0
- package/test/saeeol/external-directory-boundary.test.ts +96 -0
- package/test/saeeol/gateway-headers.test.ts +88 -0
- package/test/saeeol/help.test.ts +191 -0
- package/test/saeeol/ignore-migrator.test.ts +308 -0
- package/test/saeeol/indexing-auth.test.ts +45 -0
- package/test/saeeol/indexing-feature.test.ts +44 -0
- package/test/saeeol/indexing-label.test.ts +70 -0
- package/test/saeeol/indexing-startup.test.ts +381 -0
- package/test/saeeol/indexing-worktree.test.ts +73 -0
- package/test/saeeol/instruction.test.ts +136 -0
- package/test/saeeol/lancedb-runtime.test.ts +116 -0
- package/test/saeeol/loader-auth.test.ts +168 -0
- package/test/saeeol/local-model.test.ts +621 -0
- package/test/saeeol/logo.test.ts +31 -0
- package/test/saeeol/lsp-typescript-lightweight.test.ts +89 -0
- package/test/saeeol/mcp-branding.test.ts +33 -0
- package/test/saeeol/mcp-docker-rm.test.ts +32 -0
- package/test/saeeol/mcp-migrator.test.ts +736 -0
- package/test/saeeol/mcp-oauth-callback.test.ts +33 -0
- package/test/saeeol/memory-io.test.ts +198 -0
- package/test/saeeol/memory-paths.test.ts +87 -0
- package/test/saeeol/memory-security.test.ts +166 -0
- package/test/saeeol/model-cache-org.test.ts +164 -0
- package/test/saeeol/model-info-panel-utils.test.ts +52 -0
- package/test/saeeol/model-info-panel.types.test.ts +7 -0
- package/test/saeeol/models-401-fallback.test.ts +52 -0
- package/test/saeeol/modes-migrator.test.ts +320 -0
- package/test/saeeol/nvidia-headers.test.ts +74 -0
- package/test/saeeol/patch-jsonc.test.ts +73 -0
- package/test/saeeol/patch.test.ts +172 -0
- package/test/saeeol/paths.test.ts +265 -0
- package/test/saeeol/permission/config-paths.test.ts +174 -0
- package/test/saeeol/permission/env-read.test.ts +149 -0
- package/test/saeeol/permission/external-directory-allow.test.ts +327 -0
- package/test/saeeol/permission/next.always-rules.test.ts +882 -0
- package/test/saeeol/permission/next.reply-http.test.ts +205 -0
- package/test/saeeol/permission/next.reply-routing.test.ts +184 -0
- package/test/saeeol/plan-exit-detection.test.ts +494 -0
- package/test/saeeol/plan-followup.test.ts +1376 -0
- package/test/saeeol/project-config-update.test.ts +120 -0
- package/test/saeeol/project-id.test.ts +455 -0
- package/test/saeeol/provider-cost.test.ts +171 -0
- package/test/saeeol/provider-list-failed-state.test.ts +100 -0
- package/test/saeeol/question-dismiss-all.test.ts +174 -0
- package/test/saeeol/read-directory.test.ts +116 -0
- package/test/saeeol/rules-migrator.test.ts +257 -0
- package/test/saeeol/run-auto.test.ts +176 -0
- package/test/saeeol/run-network.test.ts +224 -0
- package/test/saeeol/semantic-search.test.ts +186 -0
- package/test/saeeol/server/permission-allow-everything.test.ts +125 -0
- package/test/saeeol/session/instruction-substitution.test.ts +72 -0
- package/test/saeeol/session/platform-attribution.test.ts +118 -0
- package/test/saeeol/session/session.test.ts +105 -0
- package/test/saeeol/session-compaction-cap.test.ts +399 -0
- package/test/saeeol/session-compaction-chunks.test.ts +501 -0
- package/test/saeeol/session-compaction-safety.test.ts +481 -0
- package/test/saeeol/session-fork-remap.test.ts +251 -0
- package/test/saeeol/session-import-service.test.ts +114 -0
- package/test/saeeol/session-list.test.ts +47 -0
- package/test/saeeol/session-message-metadata.test.ts +128 -0
- package/test/saeeol/session-overflow.test.ts +78 -0
- package/test/saeeol/session-processor-empty-tool-calls.test.ts +571 -0
- package/test/saeeol/session-processor-network-offline.test.ts +204 -0
- package/test/saeeol/session-processor-retry-limit.test.ts +238 -0
- package/test/saeeol/session-processor-review-telemetry.test.ts +82 -0
- package/test/saeeol/session-prompt-compaction-safety.test.ts +517 -0
- package/test/saeeol/session-prompt-queue.test.ts +815 -0
- package/test/saeeol/sessions/inflight-cache.test.ts +157 -0
- package/test/saeeol/sessions/ingest-queue.test.ts +402 -0
- package/test/saeeol/sessions/remote-protocol.test.ts +258 -0
- package/test/saeeol/sessions/remote-sender.test.ts +1036 -0
- package/test/saeeol/sessions/remote-ws.test.ts +367 -0
- package/test/saeeol/sessions/sessions-enable-remote.test.disable +181 -0
- package/test/saeeol/slot-prop-reactivity.test.ts +142 -0
- package/test/saeeol/snapshot-cache.test.ts +84 -0
- package/test/saeeol/snapshot-freeze-repro.test.ts +100 -0
- package/test/saeeol/snapshot-track-timeout.test.ts +519 -0
- package/test/saeeol/stats-subagent-cost.test.ts +123 -0
- package/test/saeeol/suggestion/auto-dismiss.test.ts +65 -0
- package/test/saeeol/suggestion/suggestion.test.ts +145 -0
- package/test/saeeol/suggestion/tool.test.ts +298 -0
- package/test/saeeol/summary-file-diff.test.ts +28 -0
- package/test/saeeol/system-prompt.test.ts +142 -0
- package/test/saeeol/task-nesting.test.ts +193 -0
- package/test/saeeol/telemetry/feedback.test.ts +8 -0
- package/test/saeeol/todo-view.test.ts +57 -0
- package/test/saeeol/tool-encoding.test.ts +455 -0
- package/test/saeeol/tool-registry-indexing-import-failure.test.ts +49 -0
- package/test/saeeol/tool-registry-indexing.test.ts +236 -0
- package/test/saeeol/tool-registry-semantic-import-failure.test.ts +55 -0
- package/test/saeeol/tool-task-model.test.ts +352 -0
- package/test/saeeol/transform-opus-4.7.test.ts +89 -0
- package/test/saeeol/tui-diff.test.ts +91 -0
- package/test/saeeol/tui-sync.test.ts +80 -0
- package/test/saeeol/util/url.test.ts +141 -0
- package/test/saeeol/workflows-migrator.test.ts +261 -0
- package/test/saeeol/worktree-diff-summary.test.ts +64 -0
- package/test/saeeol/worktree-diff.test.ts +223 -0
- package/test/saeeol/worktree-remove-lock.test.ts +82 -0
- package/test/server/AGENTS.md +15 -0
- package/test/server/contract.test.ts +357 -0
- package/test/server/experimental-session-list.test.ts +157 -0
- package/test/server/global-session-list.test.ts +155 -0
- package/test/server/httpapi-authorization.test.ts +103 -0
- package/test/server/httpapi-bridge.test.ts +440 -0
- package/test/server/httpapi-config.test.ts +67 -0
- package/test/server/httpapi-cors.test.ts +89 -0
- package/test/server/httpapi-event.test.ts +57 -0
- package/test/server/httpapi-experimental.test.ts +219 -0
- package/test/server/httpapi-file.test.ts +79 -0
- package/test/server/httpapi-instance-context.test.ts +237 -0
- package/test/server/httpapi-instance.legacy.test.ts +140 -0
- package/test/server/httpapi-instance.test.ts +83 -0
- package/test/server/httpapi-json-parity.test.ts +263 -0
- package/test/server/httpapi-mcp-oauth.test.ts +76 -0
- package/test/server/httpapi-mcp.test.ts +189 -0
- package/test/server/httpapi-provider.test.ts +153 -0
- package/test/server/httpapi-pty-websocket.test.ts +16 -0
- package/test/server/httpapi-pty.test.ts +175 -0
- package/test/server/httpapi-raw-route-auth.test.ts +89 -0
- package/test/server/httpapi-sdk.test.ts +681 -0
- package/test/server/httpapi-session.test.ts +464 -0
- package/test/server/httpapi-sync.test.ts +130 -0
- package/test/server/httpapi-tui.test.ts +121 -0
- package/test/server/httpapi-workspace-routing.test.ts +471 -0
- package/test/server/httpapi-workspace.test.ts +427 -0
- package/test/server/lib/conformance.ts +88 -0
- package/test/server/lib/stateful.ts +112 -0
- package/test/server/project-init-git.test.ts +113 -0
- package/test/server/proxy-util.test.ts +113 -0
- package/test/server/session-actions.test.ts +49 -0
- package/test/server/session-list.test.ts +238 -0
- package/test/server/session-messages.test.ts +167 -0
- package/test/server/session-select.test.ts +100 -0
- package/test/server/trace-attributes.test.ts +76 -0
- package/test/server/workspace-proxy.test.ts +165 -0
- package/test/server/workspace-routing.test.ts +85 -0
- package/test/session/compaction.test.ts +2420 -0
- package/test/session/instruction.test.ts +247 -0
- package/test/session/llm.test.ts +1273 -0
- package/test/session/message-v2.test.ts +1291 -0
- package/test/session/messages-pagination.test.ts +1173 -0
- package/test/session/network.test.ts +249 -0
- package/test/session/processor-effect.test.ts +847 -0
- package/test/session/prompt.test.ts +2131 -0
- package/test/session/retry.test.ts +340 -0
- package/test/session/revert-compact.test.ts +639 -0
- package/test/session/schema-decoding.test.ts +311 -0
- package/test/session/session-entry-stepper.test.ts +917 -0
- package/test/session/session-schema.test.ts +76 -0
- package/test/session/snapshot-tool-race.test.ts +257 -0
- package/test/session/structured-output-integration.test.ts +265 -0
- package/test/session/structured-output.test.ts +381 -0
- package/test/session/system.test.ts +73 -0
- package/test/share/share-next.test.ts +333 -0
- package/test/shell/shell.test.ts +99 -0
- package/test/skill/discovery.test.ts +116 -0
- package/test/skill/skill.test.ts +393 -0
- package/test/smoke/.tui-debug-output.txt +1 -0
- package/test/smoke/.tui-debug-plain.txt +1 -0
- package/test/smoke/.tui-walkthrough-report.txt +122 -0
- package/test/smoke/smoke-tui-pty.test.ts +123 -0
- package/test/smoke/smoke-tui.mjs +83 -0
- package/test/smoke/tui-walkthrough.test.ts +520 -0
- package/test/snapshot/snapshot.test.ts +1531 -0
- package/test/storage/db.test.ts +23 -0
- package/test/storage/json-migration.test.ts +832 -0
- package/test/storage/storage.test.ts +293 -0
- package/test/suggestion/suggestion.test.ts +1 -0
- package/test/sync/index.test.ts +256 -0
- package/test/tool/__snapshots__/parameters.test.ts.snap +500 -0
- package/test/tool/__snapshots__/tool.test.ts.snap +9 -0
- package/test/tool/apply_patch.test.ts +614 -0
- package/test/tool/bash.test.ts +1225 -0
- package/test/tool/diagnostics-filter.test.ts +55 -0
- package/test/tool/edit.test.ts +754 -0
- package/test/tool/external-directory.test.ts +169 -0
- package/test/tool/fixtures/large-image.png +0 -0
- package/test/tool/fixtures/models-api.json +65179 -0
- package/test/tool/glob.test.ts +107 -0
- package/test/tool/grep.test.ts +114 -0
- package/test/tool/lsp.test.ts +187 -0
- package/test/tool/parameters.test.ts +243 -0
- package/test/tool/question.test.ts +129 -0
- package/test/tool/read.test.ts +500 -0
- package/test/tool/recall.test.ts +151 -0
- package/test/tool/registry.test.ts +203 -0
- package/test/tool/skill.test.ts +135 -0
- package/test/tool/suggest.test.ts +1 -0
- package/test/tool/task.test.ts +612 -0
- package/test/tool/tool-define.test.ts +99 -0
- package/test/tool/truncation.test.ts +260 -0
- package/test/tool/webfetch.test.ts +103 -0
- package/test/tool/write.test.ts +291 -0
- package/test/util/data-url.test.ts +14 -0
- package/test/util/effect-zod.test.ts +754 -0
- package/test/util/error.test.ts +38 -0
- package/test/util/filesystem.test.ts +656 -0
- package/test/util/format.test.ts +59 -0
- package/test/util/glob.test.ts +164 -0
- package/test/util/iife.test.ts +36 -0
- package/test/util/lazy.test.ts +50 -0
- package/test/util/lock.test.ts +72 -0
- package/test/util/log.test.ts +86 -0
- package/test/util/module.test.ts +59 -0
- package/test/util/process.test.ts +128 -0
- package/test/util/timeout.test.ts +21 -0
- package/test/util/which.test.ts +100 -0
- package/test/util/wildcard.test.ts +90 -0
- package/test/workspace/workspace-restore.test.ts +296 -0
- package/src/provider/models-snapshot.d.ts +0 -2
- package/src/provider/models-snapshot.js +0 -3
|
@@ -0,0 +1,2420 @@
|
|
|
1
|
+
import { afterEach, describe, expect, mock, test } from "bun:test"
|
|
2
|
+
import { APICallError } from "ai"
|
|
3
|
+
import { Cause, Effect, Exit, Layer, ManagedRuntime } from "effect"
|
|
4
|
+
import * as Stream from "effect/Stream"
|
|
5
|
+
import z from "zod"
|
|
6
|
+
import { Bus } from "../../src/bus"
|
|
7
|
+
import { Config } from "@/config/config"
|
|
8
|
+
import { Agent } from "../../src/agent/agent"
|
|
9
|
+
import { LLM } from "../../src/session/llm"
|
|
10
|
+
import { SessionCompaction } from "../../src/session/compaction"
|
|
11
|
+
import { Token } from "@/util/token"
|
|
12
|
+
import { Instance } from "../../src/project/instance"
|
|
13
|
+
import * as Log from "@saeeol/core/util/log"
|
|
14
|
+
import { Permission } from "../../src/permission"
|
|
15
|
+
import { Plugin } from "../../src/plugin"
|
|
16
|
+
import { provideTmpdirInstance, tmpdir } from "../fixture/fixture"
|
|
17
|
+
import { Session as SessionNs } from "@/session/session"
|
|
18
|
+
import { MessageV2 } from "../../src/session/message-v2"
|
|
19
|
+
import { MessageID, PartID, SessionID } from "../../src/session/schema"
|
|
20
|
+
import { SessionStatus } from "../../src/session/status"
|
|
21
|
+
import { SessionSummary } from "../../src/session/summary"
|
|
22
|
+
import { ModelID, ProviderID } from "../../src/provider/schema"
|
|
23
|
+
import type { Provider } from "@/provider/provider"
|
|
24
|
+
import * as SessionProcessorModule from "../../src/session/processor"
|
|
25
|
+
import { Snapshot } from "../../src/snapshot"
|
|
26
|
+
import { ProviderTest } from "../fake/provider"
|
|
27
|
+
import { testEffect } from "../lib/effect"
|
|
28
|
+
import { CrossSpawnSpawner } from "@saeeol/core/cross-spawn-spawner"
|
|
29
|
+
|
|
30
|
+
void Log.init({ print: false })
|
|
31
|
+
|
|
32
|
+
function run<A, E>(fx: Effect.Effect<A, E, SessionNs.Service>) {
|
|
33
|
+
return Effect.runPromise(fx.pipe(Effect.provide(SessionNs.defaultLayer)))
|
|
34
|
+
}
|
|
35
|
+
|
|
36
|
+
const svc = {
|
|
37
|
+
...SessionNs,
|
|
38
|
+
create(input?: SessionNs.CreateInput) {
|
|
39
|
+
return run(SessionNs.Service.use((svc) => svc.create(input)))
|
|
40
|
+
},
|
|
41
|
+
messages(input: z.output<typeof SessionNs.MessagesInput.zod>) {
|
|
42
|
+
return run(SessionNs.Service.use((svc) => svc.messages(input)))
|
|
43
|
+
},
|
|
44
|
+
updateMessage<T extends MessageV2.Info>(msg: T) {
|
|
45
|
+
return run(SessionNs.Service.use((svc) => svc.updateMessage(msg)))
|
|
46
|
+
},
|
|
47
|
+
updatePart<T extends MessageV2.Part>(part: T) {
|
|
48
|
+
return run(SessionNs.Service.use((svc) => svc.updatePart(part)))
|
|
49
|
+
},
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
const summary = Layer.succeed(
|
|
53
|
+
SessionSummary.Service,
|
|
54
|
+
SessionSummary.Service.of({
|
|
55
|
+
summarize: () => Effect.void,
|
|
56
|
+
diff: () => Effect.succeed([]),
|
|
57
|
+
computeDiff: () => Effect.succeed([]),
|
|
58
|
+
}),
|
|
59
|
+
)
|
|
60
|
+
|
|
61
|
+
const ref = {
|
|
62
|
+
providerID: ProviderID.make("test"),
|
|
63
|
+
modelID: ModelID.make("test-model"),
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
afterEach(() => {
|
|
67
|
+
mock.restore()
|
|
68
|
+
})
|
|
69
|
+
|
|
70
|
+
function createModel(opts: {
|
|
71
|
+
context: number
|
|
72
|
+
output: number
|
|
73
|
+
input?: number
|
|
74
|
+
cost?: Provider.Model["cost"]
|
|
75
|
+
npm?: string
|
|
76
|
+
}): Provider.Model {
|
|
77
|
+
return {
|
|
78
|
+
id: "test-model",
|
|
79
|
+
providerID: "test",
|
|
80
|
+
name: "Test",
|
|
81
|
+
limit: {
|
|
82
|
+
context: opts.context,
|
|
83
|
+
input: opts.input,
|
|
84
|
+
output: opts.output,
|
|
85
|
+
},
|
|
86
|
+
cost: opts.cost ?? { input: 0, output: 0, cache: { read: 0, write: 0 } },
|
|
87
|
+
capabilities: {
|
|
88
|
+
toolcall: true,
|
|
89
|
+
attachment: false,
|
|
90
|
+
reasoning: false,
|
|
91
|
+
temperature: true,
|
|
92
|
+
input: { text: true, image: false, audio: false, video: false },
|
|
93
|
+
output: { text: true, image: false, audio: false, video: false },
|
|
94
|
+
},
|
|
95
|
+
api: { npm: opts.npm ?? "@ai-sdk/anthropic" },
|
|
96
|
+
options: {},
|
|
97
|
+
} as Provider.Model
|
|
98
|
+
}
|
|
99
|
+
|
|
100
|
+
// Fake provider whose model is built with a 100_000 context limit and a 32_000 output limit.
const wide = () => ProviderTest.fake({ model: createModel({ context: 100_000, output: 32_000 }) })
|
|
101
|
+
|
|
102
|
+
/**
 * Stores a user message (agent "build", model `ref`) in the given session and attaches one text part.
 *
 * @param sessionID - session the message belongs to
 * @param text - content of the single text part
 * @returns the value returned by `svc.updateMessage` for the new message
 */
async function user(sessionID: SessionID, text: string) {
  const created = await svc.updateMessage({
    id: MessageID.ascending(),
    role: "user",
    sessionID,
    agent: "build",
    model: ref,
    time: { created: Date.now() },
  })

  // The text part is linked to the message that was just stored.
  await svc.updatePart({
    id: PartID.ascending(),
    messageID: created.id,
    sessionID,
    type: "text",
    text,
  })

  return created
}
|
|
120
|
+
|
|
121
|
+
/**
 * Stores a finished ("end_turn") assistant message in "build" mode with zeroed cost and token counters.
 *
 * @param sessionID - session the message belongs to
 * @param parentID - id recorded as the message's `parentID`
 * @param root - directory used for both `path.cwd` and `path.root`
 * @returns the assistant message object that was passed to `svc.updateMessage`
 */
async function assistant(sessionID: SessionID, parentID: MessageID, root: string) {
  const info: MessageV2.Assistant = {
    id: MessageID.ascending(),
    role: "assistant",
    sessionID,
    mode: "build",
    agent: "build",
    path: { cwd: root, root },
    cost: 0,
    tokens: { output: 0, input: 0, reasoning: 0, cache: { read: 0, write: 0 } },
    modelID: ref.modelID,
    providerID: ref.providerID,
    parentID,
    time: { created: Date.now() },
    finish: "end_turn",
  }

  await svc.updateMessage(info)
  return info
}
|
|
145
|
+
|
|
146
|
+
/**
 * Stores a finished assistant message flagged `summary: true` (mode and agent "compaction")
 * and attaches one text part holding `text`.
 *
 * @param sessionID - session the message belongs to
 * @param parentID - id recorded as the message's `parentID`
 * @param root - directory used for both `path.cwd` and `path.root`
 * @param text - content of the single text part
 * @returns the assistant message object that was passed to `svc.updateMessage`
 */
async function summaryAssistant(sessionID: SessionID, parentID: MessageID, root: string, text: string) {
  const info: MessageV2.Assistant = {
    id: MessageID.ascending(),
    role: "assistant",
    sessionID,
    mode: "compaction",
    agent: "compaction",
    path: { cwd: root, root },
    cost: 0,
    tokens: { output: 0, input: 0, reasoning: 0, cache: { read: 0, write: 0 } },
    modelID: ref.modelID,
    providerID: ref.providerID,
    parentID,
    summary: true,
    time: { created: Date.now() },
    finish: "end_turn",
  }
  await svc.updateMessage(info)

  // The part is written after the message so it can reference the message id.
  await svc.updatePart({
    id: PartID.ascending(),
    messageID: info.id,
    sessionID,
    type: "text",
    text,
  })

  return info
}
|
|
178
|
+
|
|
179
|
+
/**
 * Looks at the second-to-last message of the session and returns its first part of type "compaction".
 *
 * @returns the compaction part, or `undefined` when there is no such message or part
 */
async function lastCompactionPart(sessionID: SessionID) {
  const history = await svc.messages({ sessionID })
  const candidate = history.at(-2)
  return candidate?.parts.find((item): item is MessageV2.CompactionPart => item.type === "compaction")
}
|
|
184
|
+
|
|
185
|
+
/**
 * Builds a stub session-processor handle.
 *
 * `message` always returns the assistant message captured from `input` at creation time,
 * the tool-call hooks do nothing, and `process` succeeds immediately with `result`.
 */
function fake(
  input: Parameters<SessionProcessorModule.SessionProcessor.Interface["create"]>[0],
  result: "continue" | "compact",
) {
  // Captured once so later changes to `input` do not affect the getter.
  const assistantMessage = input.assistantMessage

  const handle = {
    get message() {
      return assistantMessage
    },
    updateToolCall: Effect.fn("TestSessionProcessor.updateToolCall")(() => Effect.succeed(undefined)),
    completeToolCall: Effect.fn("TestSessionProcessor.completeToolCall")(() => Effect.void),
    process: Effect.fn("TestSessionProcessor.process")(() => Effect.succeed(result)),
  } satisfies SessionProcessorModule.SessionProcessor.Handle

  return handle
}
|
|
199
|
+
|
|
200
|
+
/**
 * Layer providing a stub SessionProcessor service whose `create` hands back a `fake` handle
 * that resolves `process` with `result`.
 */
function layer(result: "continue" | "compact") {
  const service = SessionProcessorModule.SessionProcessor.Service.of({
    create: Effect.fn("TestSessionProcessor.create")((input) => Effect.succeed(fake(input, result))),
  })
  return Layer.succeed(SessionProcessorModule.SessionProcessor.Service, service)
}
|
|
208
|
+
|
|
209
|
+
/**
 * Mock Config layer whose `get` returns the schema defaults (parsed from `{}`)
 * with the `compaction` section replaced by the given value.
 */
function cfg(compaction?: Config.Info["compaction"]) {
  const defaults = Config.Info.zod.parse({})
  const service = Layer.mock(Config.Service)
  return service({
    // A new merged object is produced on every `get` call.
    get: () => Effect.succeed({ ...defaults, compaction }),
  })
}
|
|
215
|
+
|
|
216
|
+
/**
 * Creates a ManagedRuntime exposing SessionCompaction and the Bus, backed by the stub
 * session processor from `layer(result)`.
 *
 * @param result - outcome the stub processor's `process` resolves with
 * @param plugin - Plugin layer (defaults to `Plugin.defaultLayer`)
 * @param provider - fake provider whose `.layer` is supplied (defaults to `ProviderTest.fake()`)
 * @param config - Config layer (defaults to `Config.defaultLayer`)
 */
function runtime(
  result: "continue" | "compact",
  plugin = Plugin.defaultLayer,
  provider = ProviderTest.fake(),
  config = Config.defaultLayer,
) {
  const bus = Bus.layer
  const exposed = Layer.mergeAll(SessionCompaction.layer, bus)

  // Dependencies are provided in the same order as before.
  const wired = exposed.pipe(
    Layer.provide(provider.layer),
    Layer.provide(SessionNs.defaultLayer),
    Layer.provide(layer(result)),
    Layer.provide(Agent.defaultLayer),
    Layer.provide(plugin),
    Layer.provide(bus),
    Layer.provide(config),
  )

  return ManagedRuntime.make(wired)
}
|
|
235
|
+
|
|
236
|
+
// Dependencies merged into the compaction layer for the `it.live` tests:
// fake provider, stub processor that always answers "continue", and default agent/plugin/bus/config layers.
const deps = Layer.mergeAll(
  ProviderTest.fake().layer,
  layer("continue"),
  Agent.defaultLayer,
  Plugin.defaultLayer,
  Bus.layer,
  Config.defaultLayer,
)

// Test environment: session service, process spawner, and SessionCompaction wired to `deps`.
const env = Layer.mergeAll(
  SessionNs.defaultLayer,
  CrossSpawnSpawner.defaultLayer,
  SessionCompaction.layer.pipe(Layer.provide(SessionNs.defaultLayer), Layer.provideMerge(deps)),
)

// Effect-aware test helper bound to `env`; used as `it.live(...)` below.
const it = testEffect(env)
|
|
252
|
+
|
|
253
|
+
/**
 * Scripted LLM test double.
 *
 * `push` enqueues either a ready-made event stream or a factory that builds one from the stream input.
 * Each call to the service's `stream` consumes the next queued entry (FIFO); when the queue is empty
 * it yields `Stream.empty`. `raw` dies with "raw not implemented in test LLM".
 *
 * @returns `{ push, layer }` where `layer` provides `LLM.Service`
 */
function llm() {
  type Scripted =
    | Stream.Stream<LLM.Event, unknown>
    | ((input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown>)

  const queue: Array<Scripted> = []

  const service = LLM.Service.of({
    stream: (input) => {
      const next = queue.shift() ?? Stream.empty
      const events = typeof next === "function" ? next(input) : next
      // Every event is passed through unchanged via an identity mapEffect.
      return events.pipe(Stream.mapEffect((event) => Effect.succeed(event)))
    },
    raw: () => Effect.die("raw not implemented in test LLM"),
  })

  return {
    push(stream: Scripted) {
      queue.push(stream)
    },
    layer: Layer.succeed(LLM.Service, service),
  }
}
|
|
275
|
+
|
|
276
|
+
/**
 * Creates a ManagedRuntime that uses the real SessionProcessor layer (fed by the stub `summary` layer)
 * together with SessionCompaction, the Bus and SessionStatus.
 *
 * @param layer - layer providing `LLM.Service` (e.g. the one returned by `llm()`)
 * @param provider - fake provider whose `.layer` is supplied (defaults to `ProviderTest.fake()`)
 * @param config - Config layer (defaults to `Config.defaultLayer`)
 */
function liveRuntime(layer: Layer.Layer<LLM.Service>, provider = ProviderTest.fake(), config = Config.defaultLayer) {
  const bus = Bus.layer
  const status = SessionStatus.layer.pipe(Layer.provide(bus))
  const processor = SessionProcessorModule.SessionProcessor.layer.pipe(Layer.provide(summary))
  const compaction = SessionCompaction.layer.pipe(Layer.provide(processor))

  const exposed = Layer.mergeAll(compaction, processor, bus, status)

  // Dependencies are provided in the same order as before.
  const wired = exposed.pipe(
    Layer.provide(provider.layer),
    Layer.provide(SessionNs.defaultLayer),
    Layer.provide(Snapshot.defaultLayer),
    Layer.provide(layer),
    Layer.provide(Permission.defaultLayer),
    Layer.provide(Agent.defaultLayer),
    Layer.provide(Plugin.defaultLayer),
    Layer.provide(status),
    Layer.provide(bus),
    Layer.provide(config),
  )

  return ManagedRuntime.make(wired)
}
|
|
295
|
+
|
|
296
|
+
/**
 * Builds a stream factory that emits a minimal successful text response:
 * start → text-start → one text-delta carrying `text` → text-end → finish-step → finish.
 *
 * @param text - text delivered in the single delta
 * @param capture - optional callback invoked with the stream input before the stream is built
 * @returns a function suitable for `llm().push`
 */
function reply(
  text: string,
  capture?: (input: LLM.StreamInput) => void,
): (input: LLM.StreamInput) => Stream.Stream<LLM.Event, unknown> {
  // Fresh usage record per use: 1 input + 1 output token, with no detail breakdown.
  const usage = () => ({
    inputTokens: 1,
    outputTokens: 1,
    totalTokens: 2,
    inputTokenDetails: {
      noCacheTokens: undefined,
      cacheReadTokens: undefined,
      cacheWriteTokens: undefined,
    },
    outputTokenDetails: {
      textTokens: undefined,
      reasoningTokens: undefined,
    },
  })

  return (input) => {
    capture?.(input)
    return Stream.make(
      { type: "start" } satisfies LLM.Event,
      { type: "text-start", id: "txt-0" } satisfies LLM.Event,
      { type: "text-delta", id: "txt-0", delta: text, text } as LLM.Event,
      { type: "text-end", id: "txt-0" } satisfies LLM.Event,
      {
        type: "finish-step",
        finishReason: "stop",
        rawFinishReason: "stop",
        response: { id: "res", modelId: "test-model", timestamp: new Date() },
        providerMetadata: undefined,
        usage: usage(),
      } satisfies LLM.Event,
      {
        type: "finish",
        finishReason: "stop",
        rawFinishReason: "stop",
        totalUsage: usage(),
      } satisfies LLM.Event,
    )
  }
}
|
|
350
|
+
|
|
351
|
+
/**
 * Resolves (with no value) after `ms` milliseconds.
 *
 * @param ms - delay in milliseconds; defaults to 50
 */
function wait(ms = 50) {
  return new Promise((resolve) => {
    setTimeout(resolve, ms)
  })
}
|
|
354
|
+
|
|
355
|
+
/**
 * Creates a promise together with the function that resolves it.
 *
 * @returns `{ promise, resolve }`; calling `resolve()` fulfils `promise` with no value
 */
function defer() {
  // Assigned synchronously by the Promise executor below.
  let resolve!: () => void
  const promise = new Promise<void>((settle) => {
    resolve = settle
  })
  return { promise, resolve }
}
|
|
362
|
+
|
|
363
|
+
/**
 * Mock Plugin layer that blocks compaction forever.
 *
 * When the "experimental.session.compacting" hook fires it resolves `ready` and then never completes
 * (`Effect.never`); every other hook passes `output` straight through.
 */
function plugin(ready: ReturnType<typeof defer>) {
  return Layer.mock(Plugin.Service)({
    trigger: <Name extends string, Input, Output>(name: Name, _input: Input, output: Output) => {
      if (name === "experimental.session.compacting") {
        // Signal the waiting test, then hang.
        return Effect.sync(() => ready.resolve()).pipe(Effect.andThen(Effect.never), Effect.as(output))
      }
      return Effect.succeed(output)
    },
    list: () => Effect.succeed([]),
    init: () => Effect.void,
  })
}
|
|
373
|
+
|
|
374
|
+
/**
 * Mock Plugin layer that answers the "experimental.compaction.autocontinue" hook by writing
 * `enabled` onto the hook's output object; every other hook passes `output` straight through.
 */
function autocontinue(enabled: boolean) {
  return Layer.mock(Plugin.Service)({
    trigger: <Name extends string, Input, Output>(name: Name, _input: Input, output: Output) => {
      if (name === "experimental.compaction.autocontinue") {
        return Effect.sync(() => {
          // The output object is mutated in place and then returned.
          const target = output as { enabled: boolean }
          target.enabled = enabled
          return output
        })
      }
      return Effect.succeed(output)
    },
    list: () => Effect.succeed([]),
    init: () => Effect.void,
  })
}
|
|
387
|
+
|
|
388
|
+
describe("session.compaction.isOverflow", () => {
  type Limits = Parameters<typeof createModel>[0]

  // Token usage record; `reasoning` and `cache.write` are 0 in every case below.
  const usage = (input: number, output: number, cacheRead = 0) => ({
    input,
    output,
    reasoning: 0,
    cache: { read: cacheRead, write: 0 },
  })

  // Asks the compaction service whether `tokens` overflow a model created from `limits`.
  const overflows = (limits: Limits, tokens: ReturnType<typeof usage>) =>
    Effect.gen(function* () {
      const compact = yield* SessionCompaction.Service
      const model = createModel(limits)
      return yield* compact.isOverflow({ tokens, model })
    })

  // Registers one live test asserting the overflow verdict for a single model/usage pair.
  const check = (title: string, limits: Limits, tokens: ReturnType<typeof usage>, expected: boolean) =>
    it.live(
      title,
      provideTmpdirInstance(() =>
        Effect.gen(function* () {
          expect(yield* overflows(limits, tokens)).toBe(expected)
        }),
      ),
    )

  check(
    "returns true when token count exceeds usable context",
    { context: 100_000, output: 32_000 },
    usage(75_000, 5_000),
    true,
  )

  check(
    "returns false when token count within usable context",
    { context: 200_000, output: 32_000 },
    usage(100_000, 10_000),
    false,
  )

  check("includes cache.read in token count", { context: 100_000, output: 32_000 }, usage(60_000, 10_000, 10_000), true)

  check(
    "respects input limit for input caps",
    { context: 400_000, input: 272_000, output: 128_000 },
    usage(271_000, 1_000, 2_000),
    true,
  )

  check(
    "returns false when input/output are within input caps",
    { context: 400_000, input: 272_000, output: 128_000 },
    usage(200_000, 20_000, 10_000),
    false,
  )

  check(
    "returns false when output within limit with input caps",
    { context: 200_000, input: 120_000, output: 10_000 },
    usage(50_000, 9_999),
    false,
  )

  // ─── Bug reproduction tests ───────────────────────────────────────────
  // These tests target the case where limit.input is set and isOverflow()
  // subtracts no headroom for the next model response. In that case
  // compaction only triggers AFTER the full input budget has been consumed,
  // leaving zero room for the next API call's output tokens.
  //
  // Compare: without limit.input, usable = context - output (reserves space).
  // With limit.input and no headroom, usable = limit.input (reserves nothing).
  //
  // Related issues: #10634, #8089, #11086, #12621
  // Open PRs: #6875, #12924

  // Simulates Claude with prompt caching: input limit = 200K, output limit = 32K.
  // Usage: count = 180K + 3K + 15K = 198K, only 2K under the input limit.
  // On the next turn the full conversation (198K) becomes input, plus the model
  // needs room to generate output, so this WILL overflow.
  //   WITHOUT limit.input: usable = 200K - 32K = 168K, and 198K > 168K = true
  //   WITH limit.input and no headroom: usable = 200K, and 198K > 200K = false (the bug)
  // Compaction MUST trigger here.
  check(
    "BUG: no headroom when limit.input is set — compaction should trigger near boundary but does not",
    { context: 200_000, input: 200_000, output: 32_000 },
    usage(180_000, 15_000, 3_000),
    true,
  )

  // Same model but without limit.input — uses context - output instead.
  // Same token usage as above: count = 198K, usable = 200K - 32K = 168K,
  // 198K > 168K = true → compaction correctly triggered (headroom is reserved).
  check(
    "BUG: without limit.input, same token count correctly triggers compaction",
    { context: 200_000, output: 32_000 },
    usage(180_000, 15_000, 3_000),
    true,
  )

  it.live(
    "BUG: asymmetry — limit.input model allows 30K more usage before compaction than equivalent model without it",
    provideTmpdirInstance(() =>
      Effect.gen(function* () {
        // 166K + 5K + 10K = 181K total tokens: above context - output (168K) but below the input limit (200K).
        const tokens = usage(166_000, 10_000, 5_000)

        // Two models with identical context/output limits, differing only in limit.input.
        const withLimit = yield* overflows({ context: 200_000, input: 200_000, output: 32_000 }, tokens)
        const withoutLimit = yield* overflows({ context: 200_000, output: 32_000 }, tokens)

        // Both models have identical real capacity — they should agree:
        expect(withLimit).toBe(true) // should compact (181K leaves no room for 32K output)
        expect(withoutLimit).toBe(true) // correctly compacts (181K > 168K)
      }),
    ),
  )

  check("returns false when model context limit is 0", { context: 0, output: 32_000 }, usage(100_000, 10_000), false)

  it.live(
    "returns false when compaction.auto is disabled",
    provideTmpdirInstance(
      () =>
        Effect.gen(function* () {
          // Same inputs as the first case, which overflows there; here the instance config turns auto off.
          const verdict = yield* overflows({ context: 100_000, output: 32_000 }, usage(75_000, 5_000))
          expect(verdict).toBe(false)
        }),
      {
        config: {
          compaction: { auto: false },
        },
      },
    ),
  )
})
|
|
571
|
+
|
|
572
|
+
describe("session.compaction.create", () => {
  // `create` on a fresh session must leave exactly one user message holding a single
  // compaction part that carries the `auto` / `overflow` flags it was given.
  it.live(
    "creates a compaction user message and part",
    provideTmpdirInstance(() =>
      Effect.gen(function* () {
        const compact = yield* SessionCompaction.Service
        const ssn = yield* SessionNs.Service

        const session = yield* ssn.create({})
        const request = {
          sessionID: session.id,
          agent: "build",
          model: ref,
          auto: true,
          overflow: true,
        }
        yield* compact.create(request)

        const history = yield* ssn.messages({ sessionID: session.id })
        expect(history).toHaveLength(1)

        const first = history[0]
        expect(first.info.role).toBe("user")
        expect(first.parts).toHaveLength(1)
        expect(first.parts[0]).toMatchObject({
          type: "compaction",
          auto: true,
          overflow: true,
        })
      }),
    ),
  )
})
|
|
603
|
+
|
|
604
|
+
describe("session.compaction.prune", () => {
  /**
   * Seeds a new session with the conversation both prune tests need:
   * user "first" → assistant reply holding one completed call of `tool` with a
   * 200_000-character output → user "second" → user "third".
   *
   * @param dir - directory used for the assistant message's `path.cwd` and `path.root`
   * @param tool - tool name recorded on the completed tool part
   * @returns the created session info
   */
  const seed = (dir: string, tool: string) =>
    Effect.gen(function* () {
      const ssn = yield* SessionNs.Service
      const info = yield* ssn.create({})

      const first = yield* ssn.updateMessage({
        id: MessageID.ascending(),
        role: "user",
        sessionID: info.id,
        agent: "build",
        model: ref,
        time: { created: Date.now() },
      })
      yield* ssn.updatePart({
        id: PartID.ascending(),
        messageID: first.id,
        sessionID: info.id,
        type: "text",
        text: "first",
      })

      const answer: MessageV2.Assistant = {
        id: MessageID.ascending(),
        role: "assistant",
        sessionID: info.id,
        mode: "build",
        agent: "build",
        path: { cwd: dir, root: dir },
        cost: 0,
        tokens: {
          output: 0,
          input: 0,
          reasoning: 0,
          cache: { read: 0, write: 0 },
        },
        modelID: ref.modelID,
        providerID: ref.providerID,
        parentID: first.id,
        time: { created: Date.now() },
        finish: "end_turn",
      }
      yield* ssn.updateMessage(answer)
      yield* ssn.updatePart({
        id: PartID.ascending(),
        messageID: answer.id,
        sessionID: info.id,
        type: "tool",
        callID: crypto.randomUUID(),
        tool,
        state: {
          status: "completed",
          input: {},
          output: "x".repeat(200_000),
          title: "done",
          metadata: {},
          time: { start: Date.now(), end: Date.now() },
        },
      })

      // Two later user turns follow the tool call.
      for (const text of ["second", "third"]) {
        const msg = yield* ssn.updateMessage({
          id: MessageID.ascending(),
          role: "user",
          sessionID: info.id,
          agent: "build",
          model: ref,
          time: { created: Date.now() },
        })
        yield* ssn.updatePart({
          id: PartID.ascending(),
          messageID: msg.id,
          sessionID: info.id,
          type: "text",
          text,
        })
      }

      return info
    })

  it.live(
    "compacts old completed tool output",
    provideTmpdirInstance(
      (dir) =>
        Effect.gen(function* () {
          const compact = yield* SessionCompaction.Service
          const ssn = yield* SessionNs.Service
          const info = yield* seed(dir, "bash")

          yield* compact.prune({ sessionID: info.id })

          const msgs = yield* ssn.messages({ sessionID: info.id })
          const part = msgs.flatMap((msg) => msg.parts).find((part) => part.type === "tool")
          expect(part?.type).toBe("tool")
          expect(part?.state.status).toBe("completed")
          if (part?.type === "tool" && part.state.status === "completed") {
            expect(part.state.time.compacted).toBeNumber()
          }
        }),

      {
        config: {
          compaction: { prune: true },
        },
      },
    ),
  )

  it.live(
    "skips protected skill tool output",
    // NOTE(review): unlike the test above, this one passes no `compaction: { prune: true }` config.
    // If pruning is off by default the assertion below cannot fail — confirm against the prune implementation.
    provideTmpdirInstance((dir) =>
      Effect.gen(function* () {
        const compact = yield* SessionCompaction.Service
        const ssn = yield* SessionNs.Service
        const info = yield* seed(dir, "skill")

        yield* compact.prune({ sessionID: info.id })

        const msgs = yield* ssn.messages({ sessionID: info.id })
        const part = msgs.flatMap((msg) => msg.parts).find((part) => part.type === "tool")
        expect(part?.type).toBe("tool")
        // Assert the status explicitly so the guarded check below cannot be skipped silently.
        expect(part?.state.status).toBe("completed")
        if (part?.type === "tool" && part.state.status === "completed") {
          expect(part.state.time.compacted).toBeUndefined()
        }
      }),
    ),
  )
})
|
|
791
|
+
|
|
792
|
+
describe("session.compaction.process", () => {
|
|
793
|
+
test("throws when parent is not a user message", async () => {
|
|
794
|
+
await using tmp = await tmpdir()
|
|
795
|
+
await Instance.provide({
|
|
796
|
+
directory: tmp.path,
|
|
797
|
+
fn: async () => {
|
|
798
|
+
const session = await svc.create({})
|
|
799
|
+
const msg = await user(session.id, "hello")
|
|
800
|
+
const reply = await assistant(session.id, msg.id, tmp.path)
|
|
801
|
+
const rt = runtime("continue")
|
|
802
|
+
try {
|
|
803
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
804
|
+
await expect(
|
|
805
|
+
rt.runPromise(
|
|
806
|
+
SessionCompaction.Service.use((svc) =>
|
|
807
|
+
svc.process({
|
|
808
|
+
parentID: reply.id,
|
|
809
|
+
messages: msgs,
|
|
810
|
+
sessionID: session.id,
|
|
811
|
+
auto: false,
|
|
812
|
+
}),
|
|
813
|
+
),
|
|
814
|
+
),
|
|
815
|
+
).rejects.toThrow(`Compaction parent must be a user message: ${reply.id}`)
|
|
816
|
+
} finally {
|
|
817
|
+
await rt.dispose()
|
|
818
|
+
}
|
|
819
|
+
},
|
|
820
|
+
})
|
|
821
|
+
})
|
|
822
|
+
|
|
823
|
+
test("publishes compacted event on continue", async () => {
|
|
824
|
+
await using tmp = await tmpdir()
|
|
825
|
+
await Instance.provide({
|
|
826
|
+
directory: tmp.path,
|
|
827
|
+
fn: async () => {
|
|
828
|
+
const session = await svc.create({})
|
|
829
|
+
const msg = await user(session.id, "hello")
|
|
830
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
831
|
+
const done = defer()
|
|
832
|
+
let seen = false
|
|
833
|
+
const rt = runtime("continue", Plugin.defaultLayer, wide())
|
|
834
|
+
let unsub: (() => void) | undefined
|
|
835
|
+
try {
|
|
836
|
+
unsub = await rt.runPromise(
|
|
837
|
+
Bus.Service.use((svc) =>
|
|
838
|
+
svc.subscribeCallback(SessionCompaction.Event.Compacted, (evt) => {
|
|
839
|
+
if (evt.properties.sessionID !== session.id) return
|
|
840
|
+
seen = true
|
|
841
|
+
done.resolve()
|
|
842
|
+
}),
|
|
843
|
+
),
|
|
844
|
+
)
|
|
845
|
+
|
|
846
|
+
const result = await rt.runPromise(
|
|
847
|
+
SessionCompaction.Service.use((svc) =>
|
|
848
|
+
svc.process({
|
|
849
|
+
parentID: msg.id,
|
|
850
|
+
messages: msgs,
|
|
851
|
+
sessionID: session.id,
|
|
852
|
+
auto: false,
|
|
853
|
+
}),
|
|
854
|
+
),
|
|
855
|
+
)
|
|
856
|
+
|
|
857
|
+
await Promise.race([
|
|
858
|
+
done.promise,
|
|
859
|
+
wait(500).then(() => {
|
|
860
|
+
throw new Error("timed out waiting for compacted event")
|
|
861
|
+
}),
|
|
862
|
+
])
|
|
863
|
+
expect(result).toBe("continue")
|
|
864
|
+
expect(seen).toBe(true)
|
|
865
|
+
} finally {
|
|
866
|
+
unsub?.()
|
|
867
|
+
await rt.dispose()
|
|
868
|
+
}
|
|
869
|
+
},
|
|
870
|
+
})
|
|
871
|
+
})
|
|
872
|
+
|
|
873
|
+
test("marks summary message as errored on compact result", async () => {
|
|
874
|
+
await using tmp = await tmpdir()
|
|
875
|
+
await Instance.provide({
|
|
876
|
+
directory: tmp.path,
|
|
877
|
+
fn: async () => {
|
|
878
|
+
const session = await svc.create({})
|
|
879
|
+
const msg = await user(session.id, "hello")
|
|
880
|
+
const rt = runtime("compact", Plugin.defaultLayer, wide())
|
|
881
|
+
try {
|
|
882
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
883
|
+
const result = await rt.runPromise(
|
|
884
|
+
SessionCompaction.Service.use((svc) =>
|
|
885
|
+
svc.process({
|
|
886
|
+
parentID: msg.id,
|
|
887
|
+
messages: msgs,
|
|
888
|
+
sessionID: session.id,
|
|
889
|
+
auto: false,
|
|
890
|
+
}),
|
|
891
|
+
),
|
|
892
|
+
)
|
|
893
|
+
|
|
894
|
+
const summary = (await svc.messages({ sessionID: session.id })).find(
|
|
895
|
+
(msg) => msg.info.role === "assistant" && msg.info.summary,
|
|
896
|
+
)
|
|
897
|
+
|
|
898
|
+
expect(result).toBe("stop")
|
|
899
|
+
expect(summary?.info.role).toBe("assistant")
|
|
900
|
+
if (summary?.info.role === "assistant") {
|
|
901
|
+
expect(summary.info.finish).toBe("error")
|
|
902
|
+
expect(JSON.stringify(summary.info.error)).toContain("Session too large to compact")
|
|
903
|
+
}
|
|
904
|
+
} finally {
|
|
905
|
+
await rt.dispose()
|
|
906
|
+
}
|
|
907
|
+
},
|
|
908
|
+
})
|
|
909
|
+
})
|
|
910
|
+
|
|
911
|
+
test("adds synthetic continue prompt when auto is enabled", async () => {
|
|
912
|
+
await using tmp = await tmpdir()
|
|
913
|
+
await Instance.provide({
|
|
914
|
+
directory: tmp.path,
|
|
915
|
+
fn: async () => {
|
|
916
|
+
const session = await svc.create({})
|
|
917
|
+
const msg = await user(session.id, "hello")
|
|
918
|
+
const rt = runtime("continue", Plugin.defaultLayer, wide())
|
|
919
|
+
try {
|
|
920
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
921
|
+
const result = await rt.runPromise(
|
|
922
|
+
SessionCompaction.Service.use((svc) =>
|
|
923
|
+
svc.process({
|
|
924
|
+
parentID: msg.id,
|
|
925
|
+
messages: msgs,
|
|
926
|
+
sessionID: session.id,
|
|
927
|
+
auto: true,
|
|
928
|
+
}),
|
|
929
|
+
),
|
|
930
|
+
)
|
|
931
|
+
|
|
932
|
+
const all = await svc.messages({ sessionID: session.id })
|
|
933
|
+
const last = all.at(-1)
|
|
934
|
+
|
|
935
|
+
expect(result).toBe("continue")
|
|
936
|
+
expect(last?.info.role).toBe("user")
|
|
937
|
+
expect(last?.parts[0]).toMatchObject({
|
|
938
|
+
type: "text",
|
|
939
|
+
synthetic: true,
|
|
940
|
+
metadata: { compaction_continue: true },
|
|
941
|
+
})
|
|
942
|
+
if (last?.parts[0]?.type === "text") {
|
|
943
|
+
expect(last.parts[0].text).toContain("Continue if you have next steps")
|
|
944
|
+
}
|
|
945
|
+
} finally {
|
|
946
|
+
await rt.dispose()
|
|
947
|
+
}
|
|
948
|
+
},
|
|
949
|
+
})
|
|
950
|
+
})
|
|
951
|
+
|
|
952
|
+
test("persists tail_start_id for retained recent turns", async () => {
|
|
953
|
+
await using tmp = await tmpdir()
|
|
954
|
+
await Instance.provide({
|
|
955
|
+
directory: tmp.path,
|
|
956
|
+
fn: async () => {
|
|
957
|
+
const session = await svc.create({})
|
|
958
|
+
await user(session.id, "first")
|
|
959
|
+
const keep = await user(session.id, "second")
|
|
960
|
+
await user(session.id, "third")
|
|
961
|
+
await SessionCompaction.create({
|
|
962
|
+
sessionID: session.id,
|
|
963
|
+
agent: "build",
|
|
964
|
+
model: ref,
|
|
965
|
+
auto: false,
|
|
966
|
+
})
|
|
967
|
+
|
|
968
|
+
const rt = runtime(
|
|
969
|
+
"continue",
|
|
970
|
+
Plugin.defaultLayer,
|
|
971
|
+
wide(),
|
|
972
|
+
cfg({ tail_turns: 2, preserve_recent_tokens: 10_000 }),
|
|
973
|
+
)
|
|
974
|
+
try {
|
|
975
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
976
|
+
const parent = msgs.at(-1)?.info.id
|
|
977
|
+
expect(parent).toBeTruthy()
|
|
978
|
+
await rt.runPromise(
|
|
979
|
+
SessionCompaction.Service.use((svc) =>
|
|
980
|
+
svc.process({
|
|
981
|
+
parentID: parent!,
|
|
982
|
+
messages: msgs,
|
|
983
|
+
sessionID: session.id,
|
|
984
|
+
auto: false,
|
|
985
|
+
}),
|
|
986
|
+
),
|
|
987
|
+
)
|
|
988
|
+
|
|
989
|
+
const part = await lastCompactionPart(session.id)
|
|
990
|
+
expect(part?.type).toBe("compaction")
|
|
991
|
+
expect(part?.tail_start_id).toBe(keep.id)
|
|
992
|
+
} finally {
|
|
993
|
+
await rt.dispose()
|
|
994
|
+
}
|
|
995
|
+
},
|
|
996
|
+
})
|
|
997
|
+
})
|
|
998
|
+
|
|
999
|
+
test("shrinks retained tail to fit preserve token budget", async () => {
|
|
1000
|
+
await using tmp = await tmpdir()
|
|
1001
|
+
await Instance.provide({
|
|
1002
|
+
directory: tmp.path,
|
|
1003
|
+
fn: async () => {
|
|
1004
|
+
const session = await svc.create({})
|
|
1005
|
+
await user(session.id, "first")
|
|
1006
|
+
await user(session.id, "x".repeat(2_000))
|
|
1007
|
+
const keep = await user(session.id, "tiny")
|
|
1008
|
+
await SessionCompaction.create({
|
|
1009
|
+
sessionID: session.id,
|
|
1010
|
+
agent: "build",
|
|
1011
|
+
model: ref,
|
|
1012
|
+
auto: false,
|
|
1013
|
+
})
|
|
1014
|
+
|
|
1015
|
+
const rt = runtime("continue", Plugin.defaultLayer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 100 }))
|
|
1016
|
+
try {
|
|
1017
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1018
|
+
const parent = msgs.at(-1)?.info.id
|
|
1019
|
+
expect(parent).toBeTruthy()
|
|
1020
|
+
await rt.runPromise(
|
|
1021
|
+
SessionCompaction.Service.use((svc) =>
|
|
1022
|
+
svc.process({
|
|
1023
|
+
parentID: parent!,
|
|
1024
|
+
messages: msgs,
|
|
1025
|
+
sessionID: session.id,
|
|
1026
|
+
auto: false,
|
|
1027
|
+
}),
|
|
1028
|
+
),
|
|
1029
|
+
)
|
|
1030
|
+
|
|
1031
|
+
const part = await lastCompactionPart(session.id)
|
|
1032
|
+
expect(part?.type).toBe("compaction")
|
|
1033
|
+
expect(part?.tail_start_id).toBe(keep.id)
|
|
1034
|
+
} finally {
|
|
1035
|
+
await rt.dispose()
|
|
1036
|
+
}
|
|
1037
|
+
},
|
|
1038
|
+
})
|
|
1039
|
+
})
|
|
1040
|
+
|
|
1041
|
+
test("falls back to full summary when even one recent turn exceeds preserve token budget", async () => {
|
|
1042
|
+
await using tmp = await tmpdir({ git: true })
|
|
1043
|
+
const stub = llm()
|
|
1044
|
+
let captured = ""
|
|
1045
|
+
stub.push(
|
|
1046
|
+
reply("summary", (input) => {
|
|
1047
|
+
captured = JSON.stringify(input.messages)
|
|
1048
|
+
}),
|
|
1049
|
+
)
|
|
1050
|
+
await Instance.provide({
|
|
1051
|
+
directory: tmp.path,
|
|
1052
|
+
fn: async () => {
|
|
1053
|
+
const session = await svc.create({})
|
|
1054
|
+
await user(session.id, "first")
|
|
1055
|
+
await user(session.id, "y".repeat(2_000))
|
|
1056
|
+
await SessionCompaction.create({
|
|
1057
|
+
sessionID: session.id,
|
|
1058
|
+
agent: "build",
|
|
1059
|
+
model: ref,
|
|
1060
|
+
auto: false,
|
|
1061
|
+
})
|
|
1062
|
+
|
|
1063
|
+
const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 20 }))
|
|
1064
|
+
try {
|
|
1065
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1066
|
+
const parent = msgs.at(-1)?.info.id
|
|
1067
|
+
expect(parent).toBeTruthy()
|
|
1068
|
+
await rt.runPromise(
|
|
1069
|
+
SessionCompaction.Service.use((svc) =>
|
|
1070
|
+
svc.process({
|
|
1071
|
+
parentID: parent!,
|
|
1072
|
+
messages: msgs,
|
|
1073
|
+
sessionID: session.id,
|
|
1074
|
+
auto: false,
|
|
1075
|
+
}),
|
|
1076
|
+
),
|
|
1077
|
+
)
|
|
1078
|
+
|
|
1079
|
+
const part = await lastCompactionPart(session.id)
|
|
1080
|
+
expect(part?.type).toBe("compaction")
|
|
1081
|
+
expect(part?.tail_start_id).toBeUndefined()
|
|
1082
|
+
expect(captured).toContain("yyyy")
|
|
1083
|
+
} finally {
|
|
1084
|
+
await rt.dispose()
|
|
1085
|
+
}
|
|
1086
|
+
},
|
|
1087
|
+
})
|
|
1088
|
+
})
|
|
1089
|
+
|
|
1090
|
+
test("falls back to full summary when retained tail media exceeds preserve token budget", async () => {
|
|
1091
|
+
await using tmp = await tmpdir({ git: true })
|
|
1092
|
+
const stub = llm()
|
|
1093
|
+
let captured = ""
|
|
1094
|
+
stub.push(
|
|
1095
|
+
reply("summary", (input) => {
|
|
1096
|
+
captured = JSON.stringify(input.messages)
|
|
1097
|
+
}),
|
|
1098
|
+
)
|
|
1099
|
+
await Instance.provide({
|
|
1100
|
+
directory: tmp.path,
|
|
1101
|
+
fn: async () => {
|
|
1102
|
+
const session = await svc.create({})
|
|
1103
|
+
await user(session.id, "older")
|
|
1104
|
+
const recent = await user(session.id, "recent image turn")
|
|
1105
|
+
await svc.updatePart({
|
|
1106
|
+
id: PartID.ascending(),
|
|
1107
|
+
messageID: recent.id,
|
|
1108
|
+
sessionID: session.id,
|
|
1109
|
+
type: "file",
|
|
1110
|
+
mime: "image/png",
|
|
1111
|
+
filename: "big.png",
|
|
1112
|
+
url: `data:image/png;base64,${"a".repeat(4_000)}`,
|
|
1113
|
+
})
|
|
1114
|
+
await SessionCompaction.create({
|
|
1115
|
+
sessionID: session.id,
|
|
1116
|
+
agent: "build",
|
|
1117
|
+
model: ref,
|
|
1118
|
+
auto: false,
|
|
1119
|
+
})
|
|
1120
|
+
|
|
1121
|
+
const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 100 }))
|
|
1122
|
+
try {
|
|
1123
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1124
|
+
const parent = msgs.at(-1)?.info.id
|
|
1125
|
+
expect(parent).toBeTruthy()
|
|
1126
|
+
await rt.runPromise(
|
|
1127
|
+
SessionCompaction.Service.use((svc) =>
|
|
1128
|
+
svc.process({
|
|
1129
|
+
parentID: parent!,
|
|
1130
|
+
messages: msgs,
|
|
1131
|
+
sessionID: session.id,
|
|
1132
|
+
auto: false,
|
|
1133
|
+
}),
|
|
1134
|
+
),
|
|
1135
|
+
)
|
|
1136
|
+
|
|
1137
|
+
const part = await lastCompactionPart(session.id)
|
|
1138
|
+
expect(part?.type).toBe("compaction")
|
|
1139
|
+
expect(part?.tail_start_id).toBeUndefined()
|
|
1140
|
+
expect(captured).toContain("recent image turn")
|
|
1141
|
+
expect(captured).toContain("Attached image/png: big.png")
|
|
1142
|
+
} finally {
|
|
1143
|
+
await rt.dispose()
|
|
1144
|
+
}
|
|
1145
|
+
},
|
|
1146
|
+
})
|
|
1147
|
+
})
|
|
1148
|
+
|
|
1149
|
+
test("retains a split turn suffix when a later message fits the preserve token budget", async () => {
|
|
1150
|
+
await using tmp = await tmpdir({ git: true })
|
|
1151
|
+
const stub = llm()
|
|
1152
|
+
let captured = ""
|
|
1153
|
+
stub.push(
|
|
1154
|
+
reply("summary", (input) => {
|
|
1155
|
+
captured = JSON.stringify(input.messages)
|
|
1156
|
+
}),
|
|
1157
|
+
)
|
|
1158
|
+
await Instance.provide({
|
|
1159
|
+
directory: tmp.path,
|
|
1160
|
+
fn: async () => {
|
|
1161
|
+
const session = await svc.create({})
|
|
1162
|
+
await user(session.id, "older")
|
|
1163
|
+
const recent = await user(session.id, "recent turn")
|
|
1164
|
+
const large = await assistant(session.id, recent.id, tmp.path)
|
|
1165
|
+
await svc.updatePart({
|
|
1166
|
+
id: PartID.ascending(),
|
|
1167
|
+
messageID: large.id,
|
|
1168
|
+
sessionID: session.id,
|
|
1169
|
+
type: "text",
|
|
1170
|
+
text: "z".repeat(2_000),
|
|
1171
|
+
})
|
|
1172
|
+
const keep = await assistant(session.id, recent.id, tmp.path)
|
|
1173
|
+
await svc.updatePart({
|
|
1174
|
+
id: PartID.ascending(),
|
|
1175
|
+
messageID: keep.id,
|
|
1176
|
+
sessionID: session.id,
|
|
1177
|
+
type: "text",
|
|
1178
|
+
text: "keep tail",
|
|
1179
|
+
})
|
|
1180
|
+
await SessionCompaction.create({
|
|
1181
|
+
sessionID: session.id,
|
|
1182
|
+
agent: "build",
|
|
1183
|
+
model: ref,
|
|
1184
|
+
auto: false,
|
|
1185
|
+
})
|
|
1186
|
+
|
|
1187
|
+
const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 1, preserve_recent_tokens: 100 }))
|
|
1188
|
+
try {
|
|
1189
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1190
|
+
const parent = msgs.at(-1)?.info.id
|
|
1191
|
+
expect(parent).toBeTruthy()
|
|
1192
|
+
await rt.runPromise(
|
|
1193
|
+
SessionCompaction.Service.use((svc) =>
|
|
1194
|
+
svc.process({
|
|
1195
|
+
parentID: parent!,
|
|
1196
|
+
messages: msgs,
|
|
1197
|
+
sessionID: session.id,
|
|
1198
|
+
auto: false,
|
|
1199
|
+
}),
|
|
1200
|
+
),
|
|
1201
|
+
)
|
|
1202
|
+
|
|
1203
|
+
const part = await lastCompactionPart(session.id)
|
|
1204
|
+
expect(part?.type).toBe("compaction")
|
|
1205
|
+
expect(part?.tail_start_id).toBe(keep.id)
|
|
1206
|
+
expect(captured).toContain("zzzz")
|
|
1207
|
+
expect(captured).not.toContain("keep tail")
|
|
1208
|
+
|
|
1209
|
+
const filtered = MessageV2.filterCompacted(MessageV2.stream(session.id))
|
|
1210
|
+
expect(filtered[0]?.info.id).toBe(keep.id)
|
|
1211
|
+
expect(filtered.map((msg) => msg.info.id)).not.toContain(large.id)
|
|
1212
|
+
} finally {
|
|
1213
|
+
await rt.dispose()
|
|
1214
|
+
}
|
|
1215
|
+
},
|
|
1216
|
+
})
|
|
1217
|
+
})
|
|
1218
|
+
|
|
1219
|
+
test("allows plugins to disable synthetic continue prompt", async () => {
|
|
1220
|
+
await using tmp = await tmpdir()
|
|
1221
|
+
await Instance.provide({
|
|
1222
|
+
directory: tmp.path,
|
|
1223
|
+
fn: async () => {
|
|
1224
|
+
const session = await svc.create({})
|
|
1225
|
+
const msg = await user(session.id, "hello")
|
|
1226
|
+
const rt = runtime("continue", autocontinue(false), wide())
|
|
1227
|
+
try {
|
|
1228
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1229
|
+
const result = await rt.runPromise(
|
|
1230
|
+
SessionCompaction.Service.use((svc) =>
|
|
1231
|
+
svc.process({
|
|
1232
|
+
parentID: msg.id,
|
|
1233
|
+
messages: msgs,
|
|
1234
|
+
sessionID: session.id,
|
|
1235
|
+
auto: true,
|
|
1236
|
+
}),
|
|
1237
|
+
),
|
|
1238
|
+
)
|
|
1239
|
+
|
|
1240
|
+
const all = await svc.messages({ sessionID: session.id })
|
|
1241
|
+
const last = all.at(-1)
|
|
1242
|
+
|
|
1243
|
+
expect(result).toBe("continue")
|
|
1244
|
+
expect(last?.info.role).toBe("assistant")
|
|
1245
|
+
expect(
|
|
1246
|
+
all.some(
|
|
1247
|
+
(msg) =>
|
|
1248
|
+
msg.info.role === "user" &&
|
|
1249
|
+
msg.parts.some(
|
|
1250
|
+
(part) =>
|
|
1251
|
+
part.type === "text" && part.synthetic && part.text.includes("Continue if you have next steps"),
|
|
1252
|
+
),
|
|
1253
|
+
),
|
|
1254
|
+
).toBe(false)
|
|
1255
|
+
} finally {
|
|
1256
|
+
await rt.dispose()
|
|
1257
|
+
}
|
|
1258
|
+
},
|
|
1259
|
+
})
|
|
1260
|
+
})
|
|
1261
|
+
|
|
1262
|
+
test("replays the prior user turn on overflow when earlier context exists", async () => {
|
|
1263
|
+
await using tmp = await tmpdir()
|
|
1264
|
+
await Instance.provide({
|
|
1265
|
+
directory: tmp.path,
|
|
1266
|
+
fn: async () => {
|
|
1267
|
+
const session = await svc.create({})
|
|
1268
|
+
await user(session.id, "root")
|
|
1269
|
+
const replay = await user(session.id, "image")
|
|
1270
|
+
await svc.updatePart({
|
|
1271
|
+
id: PartID.ascending(),
|
|
1272
|
+
messageID: replay.id,
|
|
1273
|
+
sessionID: session.id,
|
|
1274
|
+
type: "file",
|
|
1275
|
+
mime: "image/png",
|
|
1276
|
+
filename: "cat.png",
|
|
1277
|
+
url: "https://example.com/cat.png",
|
|
1278
|
+
})
|
|
1279
|
+
const msg = await user(session.id, "current")
|
|
1280
|
+
const rt = runtime("continue", Plugin.defaultLayer, wide())
|
|
1281
|
+
try {
|
|
1282
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1283
|
+
const result = await rt.runPromise(
|
|
1284
|
+
SessionCompaction.Service.use((svc) =>
|
|
1285
|
+
svc.process({
|
|
1286
|
+
parentID: msg.id,
|
|
1287
|
+
messages: msgs,
|
|
1288
|
+
sessionID: session.id,
|
|
1289
|
+
auto: true,
|
|
1290
|
+
overflow: true,
|
|
1291
|
+
}),
|
|
1292
|
+
),
|
|
1293
|
+
)
|
|
1294
|
+
|
|
1295
|
+
const last = (await svc.messages({ sessionID: session.id })).at(-1)
|
|
1296
|
+
|
|
1297
|
+
expect(result).toBe("continue")
|
|
1298
|
+
expect(last?.info.role).toBe("user")
|
|
1299
|
+
expect(last?.parts.some((part) => part.type === "file")).toBe(false)
|
|
1300
|
+
expect(
|
|
1301
|
+
last?.parts.some((part) => part.type === "text" && part.text.includes("Attached image/png: cat.png")),
|
|
1302
|
+
).toBe(true)
|
|
1303
|
+
} finally {
|
|
1304
|
+
await rt.dispose()
|
|
1305
|
+
}
|
|
1306
|
+
},
|
|
1307
|
+
})
|
|
1308
|
+
})
|
|
1309
|
+
|
|
1310
|
+
test("falls back to overflow guidance when no replayable turn exists", async () => {
|
|
1311
|
+
await using tmp = await tmpdir()
|
|
1312
|
+
await Instance.provide({
|
|
1313
|
+
directory: tmp.path,
|
|
1314
|
+
fn: async () => {
|
|
1315
|
+
const session = await svc.create({})
|
|
1316
|
+
await user(session.id, "earlier")
|
|
1317
|
+
const msg = await user(session.id, "current")
|
|
1318
|
+
|
|
1319
|
+
const rt = runtime("continue", Plugin.defaultLayer, wide())
|
|
1320
|
+
try {
|
|
1321
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1322
|
+
const result = await rt.runPromise(
|
|
1323
|
+
SessionCompaction.Service.use((svc) =>
|
|
1324
|
+
svc.process({
|
|
1325
|
+
parentID: msg.id,
|
|
1326
|
+
messages: msgs,
|
|
1327
|
+
sessionID: session.id,
|
|
1328
|
+
auto: true,
|
|
1329
|
+
overflow: true,
|
|
1330
|
+
}),
|
|
1331
|
+
),
|
|
1332
|
+
)
|
|
1333
|
+
|
|
1334
|
+
const last = (await svc.messages({ sessionID: session.id })).at(-1)
|
|
1335
|
+
|
|
1336
|
+
expect(result).toBe("continue")
|
|
1337
|
+
expect(last?.info.role).toBe("user")
|
|
1338
|
+
if (last?.parts[0]?.type === "text") {
|
|
1339
|
+
expect(last.parts[0].text).toContain("previous request exceeded the provider's size limit")
|
|
1340
|
+
}
|
|
1341
|
+
} finally {
|
|
1342
|
+
await rt.dispose()
|
|
1343
|
+
}
|
|
1344
|
+
},
|
|
1345
|
+
})
|
|
1346
|
+
})
|
|
1347
|
+
|
|
1348
|
+
test("stops quickly when aborted during retry backoff", async () => {
|
|
1349
|
+
const stub = llm()
|
|
1350
|
+
const ready = defer()
|
|
1351
|
+
stub.push(
|
|
1352
|
+
Stream.fromAsyncIterable(
|
|
1353
|
+
{
|
|
1354
|
+
async *[Symbol.asyncIterator]() {
|
|
1355
|
+
yield { type: "start" } as LLM.Event
|
|
1356
|
+
throw new APICallError({
|
|
1357
|
+
message: "boom",
|
|
1358
|
+
url: "https://example.com/v1/chat/completions",
|
|
1359
|
+
requestBodyValues: {},
|
|
1360
|
+
statusCode: 503,
|
|
1361
|
+
responseHeaders: { "retry-after-ms": "10000" },
|
|
1362
|
+
responseBody: '{"error":"boom"}',
|
|
1363
|
+
isRetryable: true,
|
|
1364
|
+
})
|
|
1365
|
+
},
|
|
1366
|
+
},
|
|
1367
|
+
(err) => err,
|
|
1368
|
+
),
|
|
1369
|
+
)
|
|
1370
|
+
|
|
1371
|
+
await using tmp = await tmpdir({ git: true })
|
|
1372
|
+
await Instance.provide({
|
|
1373
|
+
directory: tmp.path,
|
|
1374
|
+
fn: async () => {
|
|
1375
|
+
const session = await svc.create({})
|
|
1376
|
+
const msg = await user(session.id, "hello")
|
|
1377
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1378
|
+
const abort = new AbortController()
|
|
1379
|
+
const rt = liveRuntime(stub.layer, wide())
|
|
1380
|
+
let off: (() => void) | undefined
|
|
1381
|
+
let run: Promise<"continue" | "stop"> | undefined
|
|
1382
|
+
try {
|
|
1383
|
+
off = await rt.runPromise(
|
|
1384
|
+
Bus.Service.use((svc) =>
|
|
1385
|
+
svc.subscribeCallback(SessionStatus.Event.Status, (evt) => {
|
|
1386
|
+
if (evt.properties.sessionID !== session.id) return
|
|
1387
|
+
if (evt.properties.status.type !== "retry") return
|
|
1388
|
+
ready.resolve()
|
|
1389
|
+
}),
|
|
1390
|
+
),
|
|
1391
|
+
)
|
|
1392
|
+
|
|
1393
|
+
run = rt
|
|
1394
|
+
.runPromiseExit(
|
|
1395
|
+
SessionCompaction.Service.use((svc) =>
|
|
1396
|
+
svc.process({
|
|
1397
|
+
parentID: msg.id,
|
|
1398
|
+
messages: msgs,
|
|
1399
|
+
sessionID: session.id,
|
|
1400
|
+
auto: false,
|
|
1401
|
+
}),
|
|
1402
|
+
),
|
|
1403
|
+
{ signal: abort.signal },
|
|
1404
|
+
)
|
|
1405
|
+
.then((exit) => {
|
|
1406
|
+
if (Exit.isFailure(exit)) {
|
|
1407
|
+
if (Cause.hasInterrupts(exit.cause) && abort.signal.aborted) return "stop"
|
|
1408
|
+
throw Cause.squash(exit.cause)
|
|
1409
|
+
}
|
|
1410
|
+
return exit.value
|
|
1411
|
+
})
|
|
1412
|
+
|
|
1413
|
+
await Promise.race([
|
|
1414
|
+
ready.promise,
|
|
1415
|
+
wait(5000).then(() => {
|
|
1416
|
+
throw new Error("timed out waiting for retry status")
|
|
1417
|
+
}),
|
|
1418
|
+
])
|
|
1419
|
+
|
|
1420
|
+
const start = Date.now()
|
|
1421
|
+
abort.abort()
|
|
1422
|
+
const result = await Promise.race([
|
|
1423
|
+
run.then((value) => ({ kind: "done" as const, value, ms: Date.now() - start })),
|
|
1424
|
+
wait(2000).then(() => ({ kind: "timeout" as const })),
|
|
1425
|
+
])
|
|
1426
|
+
|
|
1427
|
+
expect(result.kind).toBe("done")
|
|
1428
|
+
if (result.kind === "done") {
|
|
1429
|
+
expect(result.value).toBe("stop")
|
|
1430
|
+
expect(result.ms).toBeLessThan(2000)
|
|
1431
|
+
}
|
|
1432
|
+
} finally {
|
|
1433
|
+
off?.()
|
|
1434
|
+
abort.abort()
|
|
1435
|
+
await rt.dispose()
|
|
1436
|
+
await run?.catch(() => undefined)
|
|
1437
|
+
}
|
|
1438
|
+
},
|
|
1439
|
+
})
|
|
1440
|
+
})
|
|
1441
|
+
|
|
1442
|
+
test("does not leave a summary assistant when aborted before processor setup", async () => {
|
|
1443
|
+
const ready = defer()
|
|
1444
|
+
|
|
1445
|
+
await using tmp = await tmpdir({ git: true })
|
|
1446
|
+
await Instance.provide({
|
|
1447
|
+
directory: tmp.path,
|
|
1448
|
+
fn: async () => {
|
|
1449
|
+
const session = await svc.create({})
|
|
1450
|
+
const msg = await user(session.id, "hello")
|
|
1451
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1452
|
+
const abort = new AbortController()
|
|
1453
|
+
const rt = runtime("continue", plugin(ready), wide())
|
|
1454
|
+
let run: Promise<"continue" | "stop"> | undefined
|
|
1455
|
+
try {
|
|
1456
|
+
run = rt
|
|
1457
|
+
.runPromiseExit(
|
|
1458
|
+
SessionCompaction.Service.use((svc) =>
|
|
1459
|
+
svc.process({
|
|
1460
|
+
parentID: msg.id,
|
|
1461
|
+
messages: msgs,
|
|
1462
|
+
sessionID: session.id,
|
|
1463
|
+
auto: false,
|
|
1464
|
+
}),
|
|
1465
|
+
),
|
|
1466
|
+
{ signal: abort.signal },
|
|
1467
|
+
)
|
|
1468
|
+
.then((exit) => {
|
|
1469
|
+
if (Exit.isFailure(exit)) {
|
|
1470
|
+
if (Cause.hasInterrupts(exit.cause) && abort.signal.aborted) return "stop"
|
|
1471
|
+
throw Cause.squash(exit.cause)
|
|
1472
|
+
}
|
|
1473
|
+
return exit.value
|
|
1474
|
+
})
|
|
1475
|
+
|
|
1476
|
+
await Promise.race([
|
|
1477
|
+
ready.promise,
|
|
1478
|
+
wait(1000).then(() => {
|
|
1479
|
+
throw new Error("timed out waiting for compaction hook")
|
|
1480
|
+
}),
|
|
1481
|
+
])
|
|
1482
|
+
|
|
1483
|
+
abort.abort()
|
|
1484
|
+
expect(await run).toBe("stop")
|
|
1485
|
+
|
|
1486
|
+
const all = await svc.messages({ sessionID: session.id })
|
|
1487
|
+
expect(all.some((msg) => msg.info.role === "assistant" && msg.info.summary)).toBe(false)
|
|
1488
|
+
} finally {
|
|
1489
|
+
abort.abort()
|
|
1490
|
+
await rt.dispose()
|
|
1491
|
+
await run?.catch(() => undefined)
|
|
1492
|
+
}
|
|
1493
|
+
},
|
|
1494
|
+
})
|
|
1495
|
+
})
|
|
1496
|
+
|
|
1497
|
+
test("does not allow tool calls while generating the summary", async () => {
|
|
1498
|
+
const stub = llm()
|
|
1499
|
+
stub.push(
|
|
1500
|
+
Stream.make(
|
|
1501
|
+
{ type: "start" } satisfies LLM.Event,
|
|
1502
|
+
{ type: "tool-input-start", id: "call-1", toolName: "_noop" } satisfies LLM.Event,
|
|
1503
|
+
{ type: "tool-call", toolCallId: "call-1", toolName: "_noop", input: {} } satisfies LLM.Event,
|
|
1504
|
+
{
|
|
1505
|
+
type: "finish-step",
|
|
1506
|
+
finishReason: "tool-calls",
|
|
1507
|
+
rawFinishReason: "tool_calls",
|
|
1508
|
+
response: { id: "res", modelId: "test-model", timestamp: new Date() },
|
|
1509
|
+
providerMetadata: undefined,
|
|
1510
|
+
usage: {
|
|
1511
|
+
inputTokens: 1,
|
|
1512
|
+
outputTokens: 1,
|
|
1513
|
+
totalTokens: 2,
|
|
1514
|
+
inputTokenDetails: {
|
|
1515
|
+
noCacheTokens: undefined,
|
|
1516
|
+
cacheReadTokens: undefined,
|
|
1517
|
+
cacheWriteTokens: undefined,
|
|
1518
|
+
},
|
|
1519
|
+
outputTokenDetails: {
|
|
1520
|
+
textTokens: undefined,
|
|
1521
|
+
reasoningTokens: undefined,
|
|
1522
|
+
},
|
|
1523
|
+
},
|
|
1524
|
+
} satisfies LLM.Event,
|
|
1525
|
+
{
|
|
1526
|
+
type: "finish",
|
|
1527
|
+
finishReason: "tool-calls",
|
|
1528
|
+
rawFinishReason: "tool_calls",
|
|
1529
|
+
totalUsage: {
|
|
1530
|
+
inputTokens: 1,
|
|
1531
|
+
outputTokens: 1,
|
|
1532
|
+
totalTokens: 2,
|
|
1533
|
+
inputTokenDetails: {
|
|
1534
|
+
noCacheTokens: undefined,
|
|
1535
|
+
cacheReadTokens: undefined,
|
|
1536
|
+
cacheWriteTokens: undefined,
|
|
1537
|
+
},
|
|
1538
|
+
outputTokenDetails: {
|
|
1539
|
+
textTokens: undefined,
|
|
1540
|
+
reasoningTokens: undefined,
|
|
1541
|
+
},
|
|
1542
|
+
},
|
|
1543
|
+
} satisfies LLM.Event,
|
|
1544
|
+
),
|
|
1545
|
+
)
|
|
1546
|
+
|
|
1547
|
+
await using tmp = await tmpdir({ git: true })
|
|
1548
|
+
await Instance.provide({
|
|
1549
|
+
directory: tmp.path,
|
|
1550
|
+
fn: async () => {
|
|
1551
|
+
const session = await svc.create({})
|
|
1552
|
+
const msg = await user(session.id, "hello")
|
|
1553
|
+
const rt = liveRuntime(stub.layer, wide())
|
|
1554
|
+
try {
|
|
1555
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1556
|
+
await rt.runPromise(
|
|
1557
|
+
SessionCompaction.Service.use((svc) =>
|
|
1558
|
+
svc.process({
|
|
1559
|
+
parentID: msg.id,
|
|
1560
|
+
messages: msgs,
|
|
1561
|
+
sessionID: session.id,
|
|
1562
|
+
auto: false,
|
|
1563
|
+
}),
|
|
1564
|
+
),
|
|
1565
|
+
)
|
|
1566
|
+
|
|
1567
|
+
const summary = (await svc.messages({ sessionID: session.id })).find(
|
|
1568
|
+
(item) => item.info.role === "assistant" && item.info.summary,
|
|
1569
|
+
)
|
|
1570
|
+
|
|
1571
|
+
expect(summary?.info.role).toBe("assistant")
|
|
1572
|
+
expect(summary?.parts.some((part) => part.type === "tool")).toBe(false)
|
|
1573
|
+
} finally {
|
|
1574
|
+
await rt.dispose()
|
|
1575
|
+
}
|
|
1576
|
+
},
|
|
1577
|
+
})
|
|
1578
|
+
})
|
|
1579
|
+
|
|
1580
|
+
test("summarizes only the head while keeping recent tail out of summary input", async () => {
|
|
1581
|
+
const stub = llm()
|
|
1582
|
+
let captured = ""
|
|
1583
|
+
stub.push(
|
|
1584
|
+
reply("summary", (input) => {
|
|
1585
|
+
captured = JSON.stringify(input.messages)
|
|
1586
|
+
}),
|
|
1587
|
+
)
|
|
1588
|
+
|
|
1589
|
+
await using tmp = await tmpdir({ git: true })
|
|
1590
|
+
await Instance.provide({
|
|
1591
|
+
directory: tmp.path,
|
|
1592
|
+
fn: async () => {
|
|
1593
|
+
const session = await svc.create({})
|
|
1594
|
+
await user(session.id, "older context")
|
|
1595
|
+
await user(session.id, "keep this turn")
|
|
1596
|
+
await user(session.id, "and this one too")
|
|
1597
|
+
await SessionCompaction.create({
|
|
1598
|
+
sessionID: session.id,
|
|
1599
|
+
agent: "build",
|
|
1600
|
+
model: ref,
|
|
1601
|
+
auto: false,
|
|
1602
|
+
})
|
|
1603
|
+
|
|
1604
|
+
const rt = liveRuntime(stub.layer, wide())
|
|
1605
|
+
try {
|
|
1606
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1607
|
+
const parent = msgs.at(-1)?.info.id
|
|
1608
|
+
expect(parent).toBeTruthy()
|
|
1609
|
+
await rt.runPromise(
|
|
1610
|
+
SessionCompaction.Service.use((svc) =>
|
|
1611
|
+
svc.process({
|
|
1612
|
+
parentID: parent!,
|
|
1613
|
+
messages: msgs,
|
|
1614
|
+
sessionID: session.id,
|
|
1615
|
+
auto: false,
|
|
1616
|
+
}),
|
|
1617
|
+
),
|
|
1618
|
+
)
|
|
1619
|
+
|
|
1620
|
+
expect(captured).toContain("older context")
|
|
1621
|
+
expect(captured).not.toContain("keep this turn")
|
|
1622
|
+
expect(captured).not.toContain("and this one too")
|
|
1623
|
+
expect(captured).not.toContain("What did we do so far?")
|
|
1624
|
+
} finally {
|
|
1625
|
+
await rt.dispose()
|
|
1626
|
+
}
|
|
1627
|
+
},
|
|
1628
|
+
})
|
|
1629
|
+
})
|
|
1630
|
+
|
|
1631
|
+
test("anchors repeated compactions with the previous summary", async () => {
|
|
1632
|
+
const stub = llm()
|
|
1633
|
+
let captured = ""
|
|
1634
|
+
stub.push(reply("summary one"))
|
|
1635
|
+
stub.push(
|
|
1636
|
+
reply("summary two", (input) => {
|
|
1637
|
+
captured = JSON.stringify(input.messages)
|
|
1638
|
+
}),
|
|
1639
|
+
)
|
|
1640
|
+
|
|
1641
|
+
await using tmp = await tmpdir({ git: true })
|
|
1642
|
+
await Instance.provide({
|
|
1643
|
+
directory: tmp.path,
|
|
1644
|
+
fn: async () => {
|
|
1645
|
+
const session = await svc.create({})
|
|
1646
|
+
await user(session.id, "older context")
|
|
1647
|
+
await user(session.id, "keep this turn")
|
|
1648
|
+
await SessionCompaction.create({
|
|
1649
|
+
sessionID: session.id,
|
|
1650
|
+
agent: "build",
|
|
1651
|
+
model: ref,
|
|
1652
|
+
auto: false,
|
|
1653
|
+
})
|
|
1654
|
+
|
|
1655
|
+
const rt = liveRuntime(stub.layer, wide())
|
|
1656
|
+
try {
|
|
1657
|
+
let msgs = await svc.messages({ sessionID: session.id })
|
|
1658
|
+
let parent = msgs.at(-1)?.info.id
|
|
1659
|
+
expect(parent).toBeTruthy()
|
|
1660
|
+
await rt.runPromise(
|
|
1661
|
+
SessionCompaction.Service.use((svc) =>
|
|
1662
|
+
svc.process({
|
|
1663
|
+
parentID: parent!,
|
|
1664
|
+
messages: msgs,
|
|
1665
|
+
sessionID: session.id,
|
|
1666
|
+
auto: false,
|
|
1667
|
+
}),
|
|
1668
|
+
),
|
|
1669
|
+
)
|
|
1670
|
+
|
|
1671
|
+
await user(session.id, "latest turn")
|
|
1672
|
+
await SessionCompaction.create({
|
|
1673
|
+
sessionID: session.id,
|
|
1674
|
+
agent: "build",
|
|
1675
|
+
model: ref,
|
|
1676
|
+
auto: false,
|
|
1677
|
+
})
|
|
1678
|
+
|
|
1679
|
+
msgs = MessageV2.filterCompacted(MessageV2.stream(session.id))
|
|
1680
|
+
parent = msgs.at(-1)?.info.id
|
|
1681
|
+
expect(parent).toBeTruthy()
|
|
1682
|
+
await rt.runPromise(
|
|
1683
|
+
SessionCompaction.Service.use((svc) =>
|
|
1684
|
+
svc.process({
|
|
1685
|
+
parentID: parent!,
|
|
1686
|
+
messages: msgs,
|
|
1687
|
+
sessionID: session.id,
|
|
1688
|
+
auto: false,
|
|
1689
|
+
}),
|
|
1690
|
+
),
|
|
1691
|
+
)
|
|
1692
|
+
|
|
1693
|
+
expect(captured).toContain("<previous-summary>")
|
|
1694
|
+
expect(captured).toContain("summary one")
|
|
1695
|
+
expect(captured.match(/summary one/g)?.length).toBe(1)
|
|
1696
|
+
expect(captured).toContain("## Constraints & Preferences")
|
|
1697
|
+
expect(captured).toContain("## Progress")
|
|
1698
|
+
} finally {
|
|
1699
|
+
await rt.dispose()
|
|
1700
|
+
}
|
|
1701
|
+
},
|
|
1702
|
+
})
|
|
1703
|
+
})
|
|
1704
|
+
|
|
1705
|
+
test("keeps recent pre-compaction turns across repeated compactions", async () => {
|
|
1706
|
+
const stub = llm()
|
|
1707
|
+
stub.push(reply("summary one"))
|
|
1708
|
+
stub.push(reply("summary two"))
|
|
1709
|
+
await using tmp = await tmpdir()
|
|
1710
|
+
await Instance.provide({
|
|
1711
|
+
directory: tmp.path,
|
|
1712
|
+
fn: async () => {
|
|
1713
|
+
const session = await svc.create({})
|
|
1714
|
+
const u1 = await user(session.id, "one")
|
|
1715
|
+
const u2 = await user(session.id, "two")
|
|
1716
|
+
const u3 = await user(session.id, "three")
|
|
1717
|
+
await SessionCompaction.create({
|
|
1718
|
+
sessionID: session.id,
|
|
1719
|
+
agent: "build",
|
|
1720
|
+
model: ref,
|
|
1721
|
+
auto: false,
|
|
1722
|
+
})
|
|
1723
|
+
|
|
1724
|
+
const rt = liveRuntime(stub.layer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 10_000 }))
|
|
1725
|
+
try {
|
|
1726
|
+
let msgs = await svc.messages({ sessionID: session.id })
|
|
1727
|
+
let parent = msgs.at(-1)?.info.id
|
|
1728
|
+
expect(parent).toBeTruthy()
|
|
1729
|
+
await rt.runPromise(
|
|
1730
|
+
SessionCompaction.Service.use((svc) =>
|
|
1731
|
+
svc.process({
|
|
1732
|
+
parentID: parent!,
|
|
1733
|
+
messages: msgs,
|
|
1734
|
+
sessionID: session.id,
|
|
1735
|
+
auto: false,
|
|
1736
|
+
}),
|
|
1737
|
+
),
|
|
1738
|
+
)
|
|
1739
|
+
|
|
1740
|
+
const u4 = await user(session.id, "four")
|
|
1741
|
+
await SessionCompaction.create({
|
|
1742
|
+
sessionID: session.id,
|
|
1743
|
+
agent: "build",
|
|
1744
|
+
model: ref,
|
|
1745
|
+
auto: false,
|
|
1746
|
+
})
|
|
1747
|
+
|
|
1748
|
+
msgs = MessageV2.filterCompacted(MessageV2.stream(session.id))
|
|
1749
|
+
parent = msgs.at(-1)?.info.id
|
|
1750
|
+
expect(parent).toBeTruthy()
|
|
1751
|
+
await rt.runPromise(
|
|
1752
|
+
SessionCompaction.Service.use((svc) =>
|
|
1753
|
+
svc.process({
|
|
1754
|
+
parentID: parent!,
|
|
1755
|
+
messages: msgs,
|
|
1756
|
+
sessionID: session.id,
|
|
1757
|
+
auto: false,
|
|
1758
|
+
}),
|
|
1759
|
+
),
|
|
1760
|
+
)
|
|
1761
|
+
|
|
1762
|
+
const filtered = MessageV2.filterCompacted(MessageV2.stream(session.id))
|
|
1763
|
+
const ids = filtered.map((msg) => msg.info.id)
|
|
1764
|
+
|
|
1765
|
+
expect(ids).not.toContain(u1.id)
|
|
1766
|
+
expect(ids).not.toContain(u2.id)
|
|
1767
|
+
expect(ids).toContain(u3.id)
|
|
1768
|
+
expect(ids).toContain(u4.id)
|
|
1769
|
+
expect(filtered.some((msg) => msg.info.role === "assistant" && msg.info.summary)).toBe(true)
|
|
1770
|
+
expect(
|
|
1771
|
+
filtered.some((msg) => msg.info.role === "user" && msg.parts.some((part) => part.type === "compaction")),
|
|
1772
|
+
).toBe(true)
|
|
1773
|
+
} finally {
|
|
1774
|
+
await rt.dispose()
|
|
1775
|
+
}
|
|
1776
|
+
},
|
|
1777
|
+
})
|
|
1778
|
+
})
|
|
1779
|
+
|
|
1780
|
+
test("ignores previous summaries when sizing the retained tail", async () => {
|
|
1781
|
+
await using tmp = await tmpdir()
|
|
1782
|
+
await Instance.provide({
|
|
1783
|
+
directory: tmp.path,
|
|
1784
|
+
fn: async () => {
|
|
1785
|
+
const session = await svc.create({})
|
|
1786
|
+
await user(session.id, "older")
|
|
1787
|
+
const keep = await user(session.id, "keep this turn")
|
|
1788
|
+
const keepReply = await assistant(session.id, keep.id, tmp.path)
|
|
1789
|
+
await svc.updatePart({
|
|
1790
|
+
id: PartID.ascending(),
|
|
1791
|
+
messageID: keepReply.id,
|
|
1792
|
+
sessionID: session.id,
|
|
1793
|
+
type: "text",
|
|
1794
|
+
text: "keep reply",
|
|
1795
|
+
})
|
|
1796
|
+
|
|
1797
|
+
await SessionCompaction.create({
|
|
1798
|
+
sessionID: session.id,
|
|
1799
|
+
agent: "build",
|
|
1800
|
+
model: ref,
|
|
1801
|
+
auto: false,
|
|
1802
|
+
})
|
|
1803
|
+
const firstCompaction = (await svc.messages({ sessionID: session.id })).at(-1)?.info.id
|
|
1804
|
+
expect(firstCompaction).toBeTruthy()
|
|
1805
|
+
await summaryAssistant(session.id, firstCompaction!, tmp.path, "summary ".repeat(800))
|
|
1806
|
+
|
|
1807
|
+
const recent = await user(session.id, "recent turn")
|
|
1808
|
+
const recentReply = await assistant(session.id, recent.id, tmp.path)
|
|
1809
|
+
await svc.updatePart({
|
|
1810
|
+
id: PartID.ascending(),
|
|
1811
|
+
messageID: recentReply.id,
|
|
1812
|
+
sessionID: session.id,
|
|
1813
|
+
type: "text",
|
|
1814
|
+
text: "recent reply",
|
|
1815
|
+
})
|
|
1816
|
+
|
|
1817
|
+
await SessionCompaction.create({
|
|
1818
|
+
sessionID: session.id,
|
|
1819
|
+
agent: "build",
|
|
1820
|
+
model: ref,
|
|
1821
|
+
auto: false,
|
|
1822
|
+
})
|
|
1823
|
+
|
|
1824
|
+
const rt = runtime("continue", Plugin.defaultLayer, wide(), cfg({ tail_turns: 2, preserve_recent_tokens: 500 }))
|
|
1825
|
+
try {
|
|
1826
|
+
const msgs = await svc.messages({ sessionID: session.id })
|
|
1827
|
+
const parent = msgs.at(-1)?.info.id
|
|
1828
|
+
expect(parent).toBeTruthy()
|
|
1829
|
+
await rt.runPromise(
|
|
1830
|
+
SessionCompaction.Service.use((svc) =>
|
|
1831
|
+
svc.process({
|
|
1832
|
+
parentID: parent!,
|
|
1833
|
+
messages: msgs,
|
|
1834
|
+
sessionID: session.id,
|
|
1835
|
+
auto: false,
|
|
1836
|
+
}),
|
|
1837
|
+
),
|
|
1838
|
+
)
|
|
1839
|
+
|
|
1840
|
+
const part = await lastCompactionPart(session.id)
|
|
1841
|
+
expect(part?.type).toBe("compaction")
|
|
1842
|
+
expect(part?.tail_start_id).toBe(keep.id)
|
|
1843
|
+
} finally {
|
|
1844
|
+
await rt.dispose()
|
|
1845
|
+
}
|
|
1846
|
+
},
|
|
1847
|
+
})
|
|
1848
|
+
})
|
|
1849
|
+
})
|
|
1850
|
+
|
|
1851
|
+
describe("util.token.estimate", () => {
|
|
1852
|
+
test("estimates tokens from text (4 chars per token)", () => {
|
|
1853
|
+
const text = "x".repeat(4000)
|
|
1854
|
+
expect(Token.estimate(text)).toBe(1000)
|
|
1855
|
+
})
|
|
1856
|
+
|
|
1857
|
+
test("estimates tokens from larger text", () => {
|
|
1858
|
+
const text = "y".repeat(20_000)
|
|
1859
|
+
expect(Token.estimate(text)).toBe(5000)
|
|
1860
|
+
})
|
|
1861
|
+
|
|
1862
|
+
test("returns 0 for empty string", () => {
|
|
1863
|
+
expect(Token.estimate("")).toBe(0)
|
|
1864
|
+
})
|
|
1865
|
+
})
|
|
1866
|
+
|
|
1867
|
+
describe("SessionNs.getUsage", () => {
|
|
1868
|
+
test("normalizes standard usage to token format", () => {
|
|
1869
|
+
const model = createModel({ context: 100_000, output: 32_000 })
|
|
1870
|
+
const result = SessionNs.getUsage({
|
|
1871
|
+
model,
|
|
1872
|
+
usage: {
|
|
1873
|
+
inputTokens: 1000,
|
|
1874
|
+
outputTokens: 500,
|
|
1875
|
+
totalTokens: 1500,
|
|
1876
|
+
inputTokenDetails: {
|
|
1877
|
+
noCacheTokens: undefined,
|
|
1878
|
+
cacheReadTokens: undefined,
|
|
1879
|
+
cacheWriteTokens: undefined,
|
|
1880
|
+
},
|
|
1881
|
+
outputTokenDetails: {
|
|
1882
|
+
textTokens: undefined,
|
|
1883
|
+
reasoningTokens: undefined,
|
|
1884
|
+
},
|
|
1885
|
+
},
|
|
1886
|
+
})
|
|
1887
|
+
|
|
1888
|
+
expect(result.tokens.input).toBe(1000)
|
|
1889
|
+
expect(result.tokens.output).toBe(500)
|
|
1890
|
+
expect(result.tokens.reasoning).toBe(0)
|
|
1891
|
+
expect(result.tokens.cache.read).toBe(0)
|
|
1892
|
+
expect(result.tokens.cache.write).toBe(0)
|
|
1893
|
+
})
|
|
1894
|
+
|
|
1895
|
+
test("extracts cached tokens to cache.read", () => {
|
|
1896
|
+
const model = createModel({ context: 100_000, output: 32_000 })
|
|
1897
|
+
const result = SessionNs.getUsage({
|
|
1898
|
+
model,
|
|
1899
|
+
usage: {
|
|
1900
|
+
inputTokens: 1000,
|
|
1901
|
+
outputTokens: 500,
|
|
1902
|
+
totalTokens: 1500,
|
|
1903
|
+
inputTokenDetails: {
|
|
1904
|
+
noCacheTokens: 800,
|
|
1905
|
+
cacheReadTokens: 200,
|
|
1906
|
+
cacheWriteTokens: undefined,
|
|
1907
|
+
},
|
|
1908
|
+
outputTokenDetails: {
|
|
1909
|
+
textTokens: undefined,
|
|
1910
|
+
reasoningTokens: undefined,
|
|
1911
|
+
},
|
|
1912
|
+
},
|
|
1913
|
+
})
|
|
1914
|
+
|
|
1915
|
+
expect(result.tokens.input).toBe(800)
|
|
1916
|
+
expect(result.tokens.cache.read).toBe(200)
|
|
1917
|
+
})
|
|
1918
|
+
|
|
1919
|
+
test("handles anthropic cache write metadata", () => {
|
|
1920
|
+
const model = createModel({ context: 100_000, output: 32_000 })
|
|
1921
|
+
const result = SessionNs.getUsage({
|
|
1922
|
+
model,
|
|
1923
|
+
usage: {
|
|
1924
|
+
inputTokens: 1000,
|
|
1925
|
+
outputTokens: 500,
|
|
1926
|
+
totalTokens: 1500,
|
|
1927
|
+
inputTokenDetails: {
|
|
1928
|
+
noCacheTokens: undefined,
|
|
1929
|
+
cacheReadTokens: undefined,
|
|
1930
|
+
cacheWriteTokens: undefined,
|
|
1931
|
+
},
|
|
1932
|
+
outputTokenDetails: {
|
|
1933
|
+
textTokens: undefined,
|
|
1934
|
+
reasoningTokens: undefined,
|
|
1935
|
+
},
|
|
1936
|
+
},
|
|
1937
|
+
metadata: {
|
|
1938
|
+
anthropic: {
|
|
1939
|
+
cacheCreationInputTokens: 300,
|
|
1940
|
+
},
|
|
1941
|
+
},
|
|
1942
|
+
})
|
|
1943
|
+
|
|
1944
|
+
expect(result.tokens.cache.write).toBe(300)
|
|
1945
|
+
})
|
|
1946
|
+
|
|
1947
|
+
test("subtracts cached tokens for anthropic provider", () => {
|
|
1948
|
+
const model = createModel({ context: 100_000, output: 32_000 })
|
|
1949
|
+
// AI SDK v6 normalizes inputTokens to include cached tokens for all providers
|
|
1950
|
+
const result = SessionNs.getUsage({
|
|
1951
|
+
model,
|
|
1952
|
+
usage: {
|
|
1953
|
+
inputTokens: 1000,
|
|
1954
|
+
outputTokens: 500,
|
|
1955
|
+
totalTokens: 1500,
|
|
1956
|
+
inputTokenDetails: {
|
|
1957
|
+
noCacheTokens: 800,
|
|
1958
|
+
cacheReadTokens: 200,
|
|
1959
|
+
cacheWriteTokens: undefined,
|
|
1960
|
+
},
|
|
1961
|
+
outputTokenDetails: {
|
|
1962
|
+
textTokens: undefined,
|
|
1963
|
+
reasoningTokens: undefined,
|
|
1964
|
+
},
|
|
1965
|
+
},
|
|
1966
|
+
metadata: {
|
|
1967
|
+
anthropic: {},
|
|
1968
|
+
},
|
|
1969
|
+
})
|
|
1970
|
+
|
|
1971
|
+
expect(result.tokens.input).toBe(800)
|
|
1972
|
+
expect(result.tokens.cache.read).toBe(200)
|
|
1973
|
+
})
|
|
1974
|
+
|
|
1975
|
+
test("separates reasoning tokens from output tokens", () => {
|
|
1976
|
+
const model = createModel({ context: 100_000, output: 32_000 })
|
|
1977
|
+
const result = SessionNs.getUsage({
|
|
1978
|
+
model,
|
|
1979
|
+
usage: {
|
|
1980
|
+
inputTokens: 1000,
|
|
1981
|
+
outputTokens: 500,
|
|
1982
|
+
totalTokens: 1500,
|
|
1983
|
+
inputTokenDetails: {
|
|
1984
|
+
noCacheTokens: undefined,
|
|
1985
|
+
cacheReadTokens: undefined,
|
|
1986
|
+
cacheWriteTokens: undefined,
|
|
1987
|
+
},
|
|
1988
|
+
outputTokenDetails: {
|
|
1989
|
+
textTokens: 400,
|
|
1990
|
+
reasoningTokens: 100,
|
|
1991
|
+
},
|
|
1992
|
+
},
|
|
1993
|
+
})
|
|
1994
|
+
|
|
1995
|
+
expect(result.tokens.input).toBe(1000)
|
|
1996
|
+
expect(result.tokens.output).toBe(400)
|
|
1997
|
+
expect(result.tokens.reasoning).toBe(100)
|
|
1998
|
+
expect(result.tokens.total).toBe(1500)
|
|
1999
|
+
})
|
|
2000
|
+
|
|
2001
|
+
test("does not double count reasoning tokens in cost", () => {
|
|
2002
|
+
const model = createModel({
|
|
2003
|
+
context: 100_000,
|
|
2004
|
+
output: 32_000,
|
|
2005
|
+
cost: {
|
|
2006
|
+
input: 0,
|
|
2007
|
+
output: 15,
|
|
2008
|
+
cache: { read: 0, write: 0 },
|
|
2009
|
+
},
|
|
2010
|
+
})
|
|
2011
|
+
const result = SessionNs.getUsage({
|
|
2012
|
+
model,
|
|
2013
|
+
usage: {
|
|
2014
|
+
inputTokens: 0,
|
|
2015
|
+
outputTokens: 1_000_000,
|
|
2016
|
+
totalTokens: 1_000_000,
|
|
2017
|
+
inputTokenDetails: {
|
|
2018
|
+
noCacheTokens: undefined,
|
|
2019
|
+
cacheReadTokens: undefined,
|
|
2020
|
+
cacheWriteTokens: undefined,
|
|
2021
|
+
},
|
|
2022
|
+
outputTokenDetails: {
|
|
2023
|
+
textTokens: 750_000,
|
|
2024
|
+
reasoningTokens: 250_000,
|
|
2025
|
+
},
|
|
2026
|
+
},
|
|
2027
|
+
})
|
|
2028
|
+
|
|
2029
|
+
expect(result.tokens.output).toBe(750_000)
|
|
2030
|
+
expect(result.tokens.reasoning).toBe(250_000)
|
|
2031
|
+
expect(result.cost).toBe(15)
|
|
2032
|
+
})
|
|
2033
|
+
|
|
2034
|
+
test("handles undefined optional values gracefully", () => {
|
|
2035
|
+
const model = createModel({ context: 100_000, output: 32_000 })
|
|
2036
|
+
const result = SessionNs.getUsage({
|
|
2037
|
+
model,
|
|
2038
|
+
usage: {
|
|
2039
|
+
inputTokens: 0,
|
|
2040
|
+
outputTokens: 0,
|
|
2041
|
+
totalTokens: 0,
|
|
2042
|
+
inputTokenDetails: {
|
|
2043
|
+
noCacheTokens: undefined,
|
|
2044
|
+
cacheReadTokens: undefined,
|
|
2045
|
+
cacheWriteTokens: undefined,
|
|
2046
|
+
},
|
|
2047
|
+
outputTokenDetails: {
|
|
2048
|
+
textTokens: undefined,
|
|
2049
|
+
reasoningTokens: undefined,
|
|
2050
|
+
},
|
|
2051
|
+
},
|
|
2052
|
+
})
|
|
2053
|
+
|
|
2054
|
+
expect(result.tokens.input).toBe(0)
|
|
2055
|
+
expect(result.tokens.output).toBe(0)
|
|
2056
|
+
expect(result.tokens.reasoning).toBe(0)
|
|
2057
|
+
expect(result.tokens.cache.read).toBe(0)
|
|
2058
|
+
expect(result.tokens.cache.write).toBe(0)
|
|
2059
|
+
expect(Number.isNaN(result.cost)).toBe(false)
|
|
2060
|
+
})
|
|
2061
|
+
|
|
2062
|
+
test("calculates cost correctly", () => {
|
|
2063
|
+
const model = createModel({
|
|
2064
|
+
context: 100_000,
|
|
2065
|
+
output: 32_000,
|
|
2066
|
+
cost: {
|
|
2067
|
+
input: 3,
|
|
2068
|
+
output: 15,
|
|
2069
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2070
|
+
},
|
|
2071
|
+
})
|
|
2072
|
+
const result = SessionNs.getUsage({
|
|
2073
|
+
model,
|
|
2074
|
+
usage: {
|
|
2075
|
+
inputTokens: 1_000_000,
|
|
2076
|
+
outputTokens: 100_000,
|
|
2077
|
+
totalTokens: 1_100_000,
|
|
2078
|
+
inputTokenDetails: {
|
|
2079
|
+
noCacheTokens: undefined,
|
|
2080
|
+
cacheReadTokens: undefined,
|
|
2081
|
+
cacheWriteTokens: undefined,
|
|
2082
|
+
},
|
|
2083
|
+
outputTokenDetails: {
|
|
2084
|
+
textTokens: undefined,
|
|
2085
|
+
reasoningTokens: undefined,
|
|
2086
|
+
},
|
|
2087
|
+
},
|
|
2088
|
+
})
|
|
2089
|
+
|
|
2090
|
+
expect(result.cost).toBe(3 + 1.5)
|
|
2091
|
+
})
|
|
2092
|
+
test("uses openrouter provider cost when available", () => {
|
|
2093
|
+
const model = createModel({
|
|
2094
|
+
context: 100_000,
|
|
2095
|
+
output: 32_000,
|
|
2096
|
+
cost: {
|
|
2097
|
+
input: 3,
|
|
2098
|
+
output: 15,
|
|
2099
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2100
|
+
},
|
|
2101
|
+
})
|
|
2102
|
+
const result = SessionNs.getUsage({
|
|
2103
|
+
model,
|
|
2104
|
+
usage: {
|
|
2105
|
+
inputTokens: 1_000_000,
|
|
2106
|
+
outputTokens: 100_000,
|
|
2107
|
+
totalTokens: 1_100_000,
|
|
2108
|
+
inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
|
|
2109
|
+
outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
|
|
2110
|
+
},
|
|
2111
|
+
metadata: {
|
|
2112
|
+
openrouter: {
|
|
2113
|
+
usage: {
|
|
2114
|
+
cost: 0.42, // Provider-reported cost should be used instead of calculated
|
|
2115
|
+
},
|
|
2116
|
+
},
|
|
2117
|
+
},
|
|
2118
|
+
})
|
|
2119
|
+
|
|
2120
|
+
// Should use the provider cost (0.42) instead of calculated cost (4.5)
|
|
2121
|
+
expect(result.cost).toBe(0.42)
|
|
2122
|
+
})
|
|
2123
|
+
|
|
2124
|
+
test("falls back to calculated cost when openrouter cost is not available", () => {
|
|
2125
|
+
const model = createModel({
|
|
2126
|
+
context: 100_000,
|
|
2127
|
+
output: 32_000,
|
|
2128
|
+
cost: {
|
|
2129
|
+
input: 3,
|
|
2130
|
+
output: 15,
|
|
2131
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2132
|
+
},
|
|
2133
|
+
})
|
|
2134
|
+
const result = SessionNs.getUsage({
|
|
2135
|
+
model,
|
|
2136
|
+
usage: {
|
|
2137
|
+
inputTokens: 1_000_000,
|
|
2138
|
+
outputTokens: 100_000,
|
|
2139
|
+
totalTokens: 1_100_000,
|
|
2140
|
+
inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
|
|
2141
|
+
outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
|
|
2142
|
+
},
|
|
2143
|
+
metadata: {
|
|
2144
|
+
openrouter: {
|
|
2145
|
+
usage: {
|
|
2146
|
+
// cost is undefined
|
|
2147
|
+
},
|
|
2148
|
+
},
|
|
2149
|
+
},
|
|
2150
|
+
})
|
|
2151
|
+
|
|
2152
|
+
// Should fall back to calculated cost
|
|
2153
|
+
expect(result.cost).toBe(3 + 1.5)
|
|
2154
|
+
})
|
|
2155
|
+
|
|
2156
|
+
test("falls back to calculated cost when openrouter metadata is empty", () => {
|
|
2157
|
+
const model = createModel({
|
|
2158
|
+
context: 100_000,
|
|
2159
|
+
output: 32_000,
|
|
2160
|
+
cost: {
|
|
2161
|
+
input: 3,
|
|
2162
|
+
output: 15,
|
|
2163
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2164
|
+
},
|
|
2165
|
+
})
|
|
2166
|
+
const result = SessionNs.getUsage({
|
|
2167
|
+
model,
|
|
2168
|
+
usage: {
|
|
2169
|
+
inputTokens: 1_000_000,
|
|
2170
|
+
outputTokens: 100_000,
|
|
2171
|
+
totalTokens: 1_100_000,
|
|
2172
|
+
inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
|
|
2173
|
+
outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
|
|
2174
|
+
},
|
|
2175
|
+
metadata: {
|
|
2176
|
+
openrouter: {},
|
|
2177
|
+
},
|
|
2178
|
+
})
|
|
2179
|
+
|
|
2180
|
+
// Should fall back to calculated cost
|
|
2181
|
+
expect(result.cost).toBe(3 + 1.5)
|
|
2182
|
+
})
|
|
2183
|
+
|
|
2184
|
+
test("uses upstreamInferenceCost for Saeeol provider", () => {
|
|
2185
|
+
const model = createModel({
|
|
2186
|
+
context: 100_000,
|
|
2187
|
+
output: 32_000,
|
|
2188
|
+
cost: {
|
|
2189
|
+
input: 3,
|
|
2190
|
+
output: 15,
|
|
2191
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2192
|
+
},
|
|
2193
|
+
})
|
|
2194
|
+
const provider = { id: "saeeol" } as Provider.Info
|
|
2195
|
+
const result = SessionNs.getUsage({
|
|
2196
|
+
model,
|
|
2197
|
+
provider,
|
|
2198
|
+
usage: {
|
|
2199
|
+
inputTokens: 1_000_000,
|
|
2200
|
+
outputTokens: 100_000,
|
|
2201
|
+
totalTokens: 1_100_000,
|
|
2202
|
+
inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
|
|
2203
|
+
outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
|
|
2204
|
+
},
|
|
2205
|
+
metadata: {
|
|
2206
|
+
openrouter: {
|
|
2207
|
+
usage: {
|
|
2208
|
+
cost: 0.01, // OpenRouter 5% fee
|
|
2209
|
+
costDetails: {
|
|
2210
|
+
upstreamInferenceCost: 0.2, // Actual inference cost
|
|
2211
|
+
},
|
|
2212
|
+
},
|
|
2213
|
+
},
|
|
2214
|
+
},
|
|
2215
|
+
})
|
|
2216
|
+
|
|
2217
|
+
// Should use upstreamInferenceCost for Saeeol provider (BYOK)
|
|
2218
|
+
expect(result.cost).toBe(0.2)
|
|
2219
|
+
})
|
|
2220
|
+
|
|
2221
|
+
test("uses regular cost for OpenRouter provider", () => {
|
|
2222
|
+
const model = createModel({
|
|
2223
|
+
context: 100_000,
|
|
2224
|
+
output: 32_000,
|
|
2225
|
+
cost: {
|
|
2226
|
+
input: 3,
|
|
2227
|
+
output: 15,
|
|
2228
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2229
|
+
},
|
|
2230
|
+
})
|
|
2231
|
+
const provider = { id: "openrouter" } as Provider.Info
|
|
2232
|
+
const result = SessionNs.getUsage({
|
|
2233
|
+
model,
|
|
2234
|
+
provider,
|
|
2235
|
+
usage: {
|
|
2236
|
+
inputTokens: 1_000_000,
|
|
2237
|
+
outputTokens: 100_000,
|
|
2238
|
+
totalTokens: 1_100_000,
|
|
2239
|
+
inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
|
|
2240
|
+
outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
|
|
2241
|
+
},
|
|
2242
|
+
metadata: {
|
|
2243
|
+
openrouter: {
|
|
2244
|
+
usage: {
|
|
2245
|
+
cost: 0.5, // Regular OpenRouter cost
|
|
2246
|
+
costDetails: {
|
|
2247
|
+
upstreamInferenceCost: 0.45,
|
|
2248
|
+
},
|
|
2249
|
+
},
|
|
2250
|
+
},
|
|
2251
|
+
},
|
|
2252
|
+
})
|
|
2253
|
+
|
|
2254
|
+
// Should use regular cost for OpenRouter provider
|
|
2255
|
+
expect(result.cost).toBe(0.5)
|
|
2256
|
+
})
|
|
2257
|
+
|
|
2258
|
+
test("falls back to regular cost when provider is not specified", () => {
|
|
2259
|
+
const model = createModel({
|
|
2260
|
+
context: 100_000,
|
|
2261
|
+
output: 32_000,
|
|
2262
|
+
cost: {
|
|
2263
|
+
input: 3,
|
|
2264
|
+
output: 15,
|
|
2265
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2266
|
+
},
|
|
2267
|
+
})
|
|
2268
|
+
const result = SessionNs.getUsage({
|
|
2269
|
+
model,
|
|
2270
|
+
usage: {
|
|
2271
|
+
inputTokens: 1_000_000,
|
|
2272
|
+
outputTokens: 100_000,
|
|
2273
|
+
totalTokens: 1_100_000,
|
|
2274
|
+
inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
|
|
2275
|
+
outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
|
|
2276
|
+
},
|
|
2277
|
+
metadata: {
|
|
2278
|
+
openrouter: {
|
|
2279
|
+
usage: {
|
|
2280
|
+
cost: 0.3,
|
|
2281
|
+
costDetails: {
|
|
2282
|
+
upstreamInferenceCost: 0.25,
|
|
2283
|
+
},
|
|
2284
|
+
},
|
|
2285
|
+
},
|
|
2286
|
+
},
|
|
2287
|
+
})
|
|
2288
|
+
|
|
2289
|
+
// Should use regular cost when provider is not specified
|
|
2290
|
+
expect(result.cost).toBe(0.3)
|
|
2291
|
+
})
|
|
2292
|
+
|
|
2293
|
+
test("uses regular cost when upstreamInferenceCost is missing for Saeeol", () => {
|
|
2294
|
+
const model = createModel({
|
|
2295
|
+
context: 100_000,
|
|
2296
|
+
output: 32_000,
|
|
2297
|
+
cost: {
|
|
2298
|
+
input: 3,
|
|
2299
|
+
output: 15,
|
|
2300
|
+
cache: { read: 0.3, write: 3.75 },
|
|
2301
|
+
},
|
|
2302
|
+
})
|
|
2303
|
+
const provider = { id: "saeeol" } as Provider.Info
|
|
2304
|
+
const result = SessionNs.getUsage({
|
|
2305
|
+
model,
|
|
2306
|
+
provider,
|
|
2307
|
+
usage: {
|
|
2308
|
+
inputTokens: 1_000_000,
|
|
2309
|
+
outputTokens: 100_000,
|
|
2310
|
+
totalTokens: 1_100_000,
|
|
2311
|
+
inputTokenDetails: { noCacheTokens: undefined, cacheReadTokens: undefined, cacheWriteTokens: undefined },
|
|
2312
|
+
outputTokenDetails: { textTokens: undefined, reasoningTokens: undefined },
|
|
2313
|
+
},
|
|
2314
|
+
metadata: {
|
|
2315
|
+
openrouter: {
|
|
2316
|
+
usage: {
|
|
2317
|
+
cost: 0.01,
|
|
2318
|
+
// costDetails is missing
|
|
2319
|
+
},
|
|
2320
|
+
},
|
|
2321
|
+
},
|
|
2322
|
+
})
|
|
2323
|
+
|
|
2324
|
+
// When upstream cost is missing for Saeeol, fall back to regular cost field
|
|
2325
|
+
expect(result.cost).toBe(0.01)
|
|
2326
|
+
})
|
|
2327
|
+
|
|
2328
|
+
// Tests for Anthropic Messages / OpenAI Responses / Vercel AI Gateway cost extraction
|
|
2329
|
+
// live in test/saeeol/provider-cost.test.ts (saeeol_change).
|
|
2330
|
+
|
|
2331
|
+
test.each(["@ai-sdk/anthropic", "@ai-sdk/amazon-bedrock", "@ai-sdk/google-vertex/anthropic"])(
|
|
2332
|
+
"computes total from components for %s models",
|
|
2333
|
+
(npm) => {
|
|
2334
|
+
const model = createModel({ context: 100_000, output: 32_000, npm })
|
|
2335
|
+
// AI SDK v6: inputTokens includes cached tokens for all providers
|
|
2336
|
+
const usage = {
|
|
2337
|
+
inputTokens: 1000,
|
|
2338
|
+
outputTokens: 500,
|
|
2339
|
+
totalTokens: 1500,
|
|
2340
|
+
inputTokenDetails: {
|
|
2341
|
+
noCacheTokens: 800,
|
|
2342
|
+
cacheReadTokens: 200,
|
|
2343
|
+
cacheWriteTokens: undefined,
|
|
2344
|
+
},
|
|
2345
|
+
outputTokenDetails: {
|
|
2346
|
+
textTokens: undefined,
|
|
2347
|
+
reasoningTokens: undefined,
|
|
2348
|
+
},
|
|
2349
|
+
}
|
|
2350
|
+
if (npm === "@ai-sdk/amazon-bedrock") {
|
|
2351
|
+
const result = SessionNs.getUsage({
|
|
2352
|
+
model,
|
|
2353
|
+
usage,
|
|
2354
|
+
metadata: {
|
|
2355
|
+
bedrock: {
|
|
2356
|
+
usage: {
|
|
2357
|
+
cacheWriteInputTokens: 300,
|
|
2358
|
+
},
|
|
2359
|
+
},
|
|
2360
|
+
},
|
|
2361
|
+
})
|
|
2362
|
+
|
|
2363
|
+
// inputTokens (1000) includes cache, so adjusted = 1000 - 200 - 300 = 500
|
|
2364
|
+
expect(result.tokens.input).toBe(500)
|
|
2365
|
+
expect(result.tokens.cache.read).toBe(200)
|
|
2366
|
+
expect(result.tokens.cache.write).toBe(300)
|
|
2367
|
+
// total = adjusted (500) + output (500) + cacheRead (200) + cacheWrite (300)
|
|
2368
|
+
expect(result.tokens.total).toBe(1500)
|
|
2369
|
+
return
|
|
2370
|
+
}
|
|
2371
|
+
|
|
2372
|
+
const result = SessionNs.getUsage({
|
|
2373
|
+
model,
|
|
2374
|
+
usage,
|
|
2375
|
+
metadata: {
|
|
2376
|
+
anthropic: {
|
|
2377
|
+
cacheCreationInputTokens: 300,
|
|
2378
|
+
},
|
|
2379
|
+
},
|
|
2380
|
+
})
|
|
2381
|
+
|
|
2382
|
+
// inputTokens (1000) includes cache, so adjusted = 1000 - 200 - 300 = 500
|
|
2383
|
+
expect(result.tokens.input).toBe(500)
|
|
2384
|
+
expect(result.tokens.cache.read).toBe(200)
|
|
2385
|
+
expect(result.tokens.cache.write).toBe(300)
|
|
2386
|
+
// total = adjusted (500) + output (500) + cacheRead (200) + cacheWrite (300)
|
|
2387
|
+
expect(result.tokens.total).toBe(1500)
|
|
2388
|
+
},
|
|
2389
|
+
)
|
|
2390
|
+
|
|
2391
|
+
test("extracts cache write tokens from vertex metadata key", () => {
|
|
2392
|
+
const model = createModel({ context: 100_000, output: 32_000, npm: "@ai-sdk/google-vertex/anthropic" })
|
|
2393
|
+
const result = SessionNs.getUsage({
|
|
2394
|
+
model,
|
|
2395
|
+
usage: {
|
|
2396
|
+
inputTokens: 1000,
|
|
2397
|
+
outputTokens: 500,
|
|
2398
|
+
totalTokens: 1500,
|
|
2399
|
+
inputTokenDetails: {
|
|
2400
|
+
noCacheTokens: 800,
|
|
2401
|
+
cacheReadTokens: 200,
|
|
2402
|
+
cacheWriteTokens: undefined,
|
|
2403
|
+
},
|
|
2404
|
+
outputTokenDetails: {
|
|
2405
|
+
textTokens: undefined,
|
|
2406
|
+
reasoningTokens: undefined,
|
|
2407
|
+
},
|
|
2408
|
+
},
|
|
2409
|
+
metadata: {
|
|
2410
|
+
vertex: {
|
|
2411
|
+
cacheCreationInputTokens: 300,
|
|
2412
|
+
},
|
|
2413
|
+
},
|
|
2414
|
+
})
|
|
2415
|
+
|
|
2416
|
+
expect(result.tokens.input).toBe(500)
|
|
2417
|
+
expect(result.tokens.cache.read).toBe(200)
|
|
2418
|
+
expect(result.tokens.cache.write).toBe(300)
|
|
2419
|
+
})
|
|
2420
|
+
})
|