mixdog 0.7.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/marketplace.json +31 -0
- package/.claude-plugin/plugin.json +20 -0
- package/.gitattributes +34 -0
- package/.mcp.json +14 -0
- package/ARCHITECTURE.md +77 -0
- package/CHANGELOG.md +7 -0
- package/CONTRIBUTING.md +45 -0
- package/DATA-FLOW.md +79 -0
- package/LICENSE +21 -0
- package/README.md +389 -0
- package/SECURITY.md +138 -0
- package/UNINSTALL.md +112 -0
- package/agents/maintenance.md +5 -0
- package/agents/memory-classification.md +30 -0
- package/agents/scheduler-task.md +18 -0
- package/agents/webhook-handler.md +27 -0
- package/agents/worker.md +24 -0
- package/bin/bridge +133 -0
- package/bin/statusline-launcher.mjs +78 -0
- package/bin/statusline-lib.mjs +550 -0
- package/bin/statusline.mjs +607 -0
- package/bun.lock +802 -0
- package/commands/config.md +16 -0
- package/commands/doctor.md +13 -0
- package/commands/setup.md +17 -0
- package/defaults/cycle3-review-prompt.md +90 -0
- package/defaults/hidden-roles.json +65 -0
- package/defaults/memory-chunk-prompt.md +63 -0
- package/defaults/memory-promote-prompt.md +135 -0
- package/defaults/mixdog-config.template.json +27 -0
- package/defaults/user-workflow.json +8 -0
- package/defaults/user-workflow.md +12 -0
- package/hooks/hooks.json +73 -0
- package/hooks/lib/active-instance.cjs +77 -0
- package/hooks/lib/permission-evaluator.cjs +411 -0
- package/hooks/lib/permission-route.cjs +63 -0
- package/hooks/lib/permission-rules.cjs +170 -0
- package/hooks/lib/settings-loader.cjs +116 -0
- package/hooks/post-tool-use.cjs +84 -0
- package/hooks/pre-mcp-sandbox.cjs +158 -0
- package/hooks/pre-tool-subagent.cjs +253 -0
- package/hooks/session-start.cjs +1372 -0
- package/hooks/turn-timer.cjs +82 -0
- package/lib/claude-md-writer.cjs +386 -0
- package/lib/config-cjs.cjs +61 -0
- package/lib/hook-pipe-path.cjs +10 -0
- package/lib/keychain-cjs.cjs +263 -0
- package/lib/plugin-paths.cjs +61 -0
- package/lib/rules-builder.cjs +241 -0
- package/lib/text-utils.cjs +61 -0
- package/native/README.md +117 -0
- package/native/prebuilt/linux-aarch64/mixdog-shim +0 -0
- package/native/prebuilt/linux-x86_64/mixdog-shim +0 -0
- package/native/prebuilt/macos-aarch64/mixdog-shim +0 -0
- package/native/prebuilt/macos-x86_64/mixdog-shim +0 -0
- package/native/prebuilt/windows-x86_64/mixdog-shim.exe +0 -0
- package/package.json +107 -0
- package/prompts/code-review.txt +16 -0
- package/prompts/security-audit.txt +17 -0
- package/rules/bridge/00-common.md +39 -0
- package/rules/bridge/20-skip-protocol.md +18 -0
- package/rules/bridge/30-explorer.md +33 -0
- package/rules/bridge/40-cycle1-agent.md +52 -0
- package/rules/bridge/41-cycle2-agent.md +62 -0
- package/rules/bridge/42-cycle3-agent.md +44 -0
- package/rules/lead/00-tool-lead.md +61 -0
- package/rules/lead/01-general.md +23 -0
- package/rules/lead/02-channels.md +49 -0
- package/rules/lead/03-team.md +27 -0
- package/rules/lead/04-workflow.md +20 -0
- package/rules/shared/00-language.md +14 -0
- package/rules/shared/01-tool.md +138 -0
- package/scripts/bootstrap.mjs +184 -0
- package/scripts/bridge-unify-smoke.mjs +308 -0
- package/scripts/build-runtime-linux.sh +348 -0
- package/scripts/build-runtime-macos.sh +217 -0
- package/scripts/build-runtime-windows.ps1 +242 -0
- package/scripts/builtin-utils-smoke.mjs +392 -0
- package/scripts/check-json.mjs +45 -0
- package/scripts/check-syntax-changed.mjs +102 -0
- package/scripts/check-syntax.mjs +58 -0
- package/scripts/code-graph-batch.test.mjs +33 -0
- package/scripts/config-preserve-smoke.mjs +180 -0
- package/scripts/doctor.mjs +484 -0
- package/scripts/edit-normalize-fuzz.mjs +130 -0
- package/scripts/edit-normalize-smoke.mjs +401 -0
- package/scripts/edit-operation-smoke.mjs +369 -0
- package/scripts/edit2-smoke.mjs +63 -0
- package/scripts/fuzzy-e2e.mjs +28 -0
- package/scripts/fuzzy-smoke.mjs +26 -0
- package/scripts/generate-runtime-manifest.mjs +166 -0
- package/scripts/guard-smoke.mjs +66 -0
- package/scripts/hidden-role-schema-smoke.mjs +162 -0
- package/scripts/hook-routing-smoke.mjs +29 -0
- package/scripts/inject-input.ps1 +204 -0
- package/scripts/io-complex-smoke.mjs +667 -0
- package/scripts/io-explore-bench.mjs +424 -0
- package/scripts/io-guardrails-smoke.mjs +205 -0
- package/scripts/io-mini-bench-baseline.json +11 -0
- package/scripts/io-mini-bench.mjs +216 -0
- package/scripts/io-route-harness.mjs +933 -0
- package/scripts/io-telemetry-report.mjs +691 -0
- package/scripts/mutation-bench.mjs +564 -0
- package/scripts/mutation-io-smoke.mjs +1081 -0
- package/scripts/native-patch-bridge-smoke.mjs +288 -0
- package/scripts/native-patch-smoke.mjs +304 -0
- package/scripts/patch-interior-context-smoke.mjs +49 -0
- package/scripts/patch-newline-utf8-smoke.mjs +157 -0
- package/scripts/perf-hook-smoke.mjs +71 -0
- package/scripts/permission-eval-smoke.mjs +426 -0
- package/scripts/prep-patch.mjs +53 -0
- package/scripts/prep-shim.mjs +96 -0
- package/scripts/provider-cache-smoke.mjs +687 -0
- package/scripts/report-runtime-health.mjs +132 -0
- package/scripts/run-mcp.mjs +1547 -0
- package/scripts/salvage-v4a-shatter.test.mjs +58 -0
- package/scripts/scoped-cache-io-smoke.mjs +103 -0
- package/scripts/shell-policy-round3-smoke.mjs +46 -0
- package/scripts/smoke-runtime-negative.ps1 +100 -0
- package/scripts/smoke-runtime-negative.sh +95 -0
- package/scripts/stall-policy-smoke.mjs +50 -0
- package/scripts/start-memory-worker.mjs +23 -0
- package/scripts/statusline-launcher-smoke.mjs +82 -0
- package/scripts/stress-atomic-write.mjs +1028 -0
- package/scripts/test-config-rmw-restore.mjs +122 -0
- package/scripts/test-fault-inject.mjs +164 -0
- package/scripts/test-large-file.mjs +174 -0
- package/scripts/tool-edge-smoke.mjs +209 -0
- package/scripts/uninstall.mjs +201 -0
- package/scripts/webhook-selfheal-smoke.mjs +29 -0
- package/scripts/write-overwrite-guard-smoke.mjs +56 -0
- package/server-main.mjs +3055 -0
- package/server.mjs +468 -0
- package/setup/config-merge.mjs +254 -0
- package/setup/install.mjs +120 -0
- package/setup/launch-core.mjs +507 -0
- package/setup/launch.mjs +101 -0
- package/setup/setup-server.mjs +3206 -0
- package/setup/setup.html +3693 -0
- package/skills/retro-skill-proposer/SKILL.md +92 -0
- package/skills/schedule-add/SKILL.md +77 -0
- package/skills/setup/SKILL.md +346 -0
- package/skills/webhook-add/SKILL.md +81 -0
- package/src/agent/bridge-stall-watchdog.mjs +337 -0
- package/src/agent/index.mjs +2138 -0
- package/src/agent/orchestrator/activity-bus.mjs +38 -0
- package/src/agent/orchestrator/ai-wrapped-dispatch.mjs +1010 -0
- package/src/agent/orchestrator/bridge-retry.mjs +220 -0
- package/src/agent/orchestrator/bridge-trace.mjs +583 -0
- package/src/agent/orchestrator/cache-mtime.mjs +58 -0
- package/src/agent/orchestrator/config.mjs +358 -0
- package/src/agent/orchestrator/context/collect.mjs +651 -0
- package/src/agent/orchestrator/dispatch-persist.mjs +549 -0
- package/src/agent/orchestrator/drain-registry.mjs +50 -0
- package/src/agent/orchestrator/explore-validator.mjs +8 -0
- package/src/agent/orchestrator/internal-roles.mjs +118 -0
- package/src/agent/orchestrator/internal-tools.mjs +88 -0
- package/src/agent/orchestrator/jobs.mjs +116 -0
- package/src/agent/orchestrator/mcp/client.mjs +364 -0
- package/src/agent/orchestrator/providers/anthropic-betas.mjs +21 -0
- package/src/agent/orchestrator/providers/anthropic-oauth.mjs +1745 -0
- package/src/agent/orchestrator/providers/anthropic.mjs +437 -0
- package/src/agent/orchestrator/providers/gemini.mjs +1175 -0
- package/src/agent/orchestrator/providers/grok-oauth.mjs +782 -0
- package/src/agent/orchestrator/providers/model-catalog.mjs +241 -0
- package/src/agent/orchestrator/providers/openai-compat.mjs +1467 -0
- package/src/agent/orchestrator/providers/openai-oauth-ws.mjs +1890 -0
- package/src/agent/orchestrator/providers/openai-oauth.mjs +1307 -0
- package/src/agent/orchestrator/providers/openai-ws.mjs +104 -0
- package/src/agent/orchestrator/providers/registry.mjs +192 -0
- package/src/agent/orchestrator/providers/retry-classifier.mjs +325 -0
- package/src/agent/orchestrator/session/abort-lookup.mjs +13 -0
- package/src/agent/orchestrator/session/cache/post-edit-marks.mjs +42 -0
- package/src/agent/orchestrator/session/cache/prefetch-cache.mjs +142 -0
- package/src/agent/orchestrator/session/cache/read-cache.mjs +319 -0
- package/src/agent/orchestrator/session/cache/scoped-cache-outcome.mjs +11 -0
- package/src/agent/orchestrator/session/cache/scoped-cache.mjs +361 -0
- package/src/agent/orchestrator/session/cache/util.mjs +49 -0
- package/src/agent/orchestrator/session/loop.mjs +1478 -0
- package/src/agent/orchestrator/session/manager.mjs +1975 -0
- package/src/agent/orchestrator/session/read-dedup.mjs +6 -0
- package/src/agent/orchestrator/session/result-classification.mjs +65 -0
- package/src/agent/orchestrator/session/save-session-worker.mjs +18 -0
- package/src/agent/orchestrator/session/store.mjs +624 -0
- package/src/agent/orchestrator/session/stream-watchdog.mjs +130 -0
- package/src/agent/orchestrator/session/tool-result-offload.mjs +166 -0
- package/src/agent/orchestrator/session/trim.mjs +491 -0
- package/src/agent/orchestrator/smart-bridge/CACHE-SHARD.md +115 -0
- package/src/agent/orchestrator/smart-bridge/bridge-llm.mjs +327 -0
- package/src/agent/orchestrator/smart-bridge/cache-obs.mjs +150 -0
- package/src/agent/orchestrator/smart-bridge/cache-strategy.mjs +228 -0
- package/src/agent/orchestrator/smart-bridge/index.mjs +215 -0
- package/src/agent/orchestrator/smart-bridge/profiles.mjs +37 -0
- package/src/agent/orchestrator/smart-bridge/registry.mjs +348 -0
- package/src/agent/orchestrator/smart-bridge/session-builder.mjs +116 -0
- package/src/agent/orchestrator/stall-policy.mjs +195 -0
- package/src/agent/orchestrator/tool-loop-guard.mjs +75 -0
- package/src/agent/orchestrator/tools/bash-policy-scan.mjs +77 -0
- package/src/agent/orchestrator/tools/bash-session.mjs +721 -0
- package/src/agent/orchestrator/tools/builtin/advisory-lock.mjs +171 -0
- package/src/agent/orchestrator/tools/builtin/arg-guard.mjs +455 -0
- package/src/agent/orchestrator/tools/builtin/atomic-write.mjs +236 -0
- package/src/agent/orchestrator/tools/builtin/bash-tool.mjs +480 -0
- package/src/agent/orchestrator/tools/builtin/binary-file.mjs +76 -0
- package/src/agent/orchestrator/tools/builtin/builtin-tools.mjs +256 -0
- package/src/agent/orchestrator/tools/builtin/cache-layers.mjs +386 -0
- package/src/agent/orchestrator/tools/builtin/cwd-utils.mjs +37 -0
- package/src/agent/orchestrator/tools/builtin/device-paths.mjs +154 -0
- package/src/agent/orchestrator/tools/builtin/diagnostics-tool.mjs +292 -0
- package/src/agent/orchestrator/tools/builtin/diff-utils.mjs +109 -0
- package/src/agent/orchestrator/tools/builtin/edit-base-guard.mjs +58 -0
- package/src/agent/orchestrator/tools/builtin/edit-byte-plan.mjs +240 -0
- package/src/agent/orchestrator/tools/builtin/edit-byte-utils.mjs +113 -0
- package/src/agent/orchestrator/tools/builtin/edit-commit.mjs +74 -0
- package/src/agent/orchestrator/tools/builtin/edit-context-utils.mjs +242 -0
- package/src/agent/orchestrator/tools/builtin/edit-diagnostics.mjs +211 -0
- package/src/agent/orchestrator/tools/builtin/edit-engine.mjs +1364 -0
- package/src/agent/orchestrator/tools/builtin/edit-failure-context.mjs +126 -0
- package/src/agent/orchestrator/tools/builtin/edit-hint.mjs +141 -0
- package/src/agent/orchestrator/tools/builtin/edit-match-utils.mjs +194 -0
- package/src/agent/orchestrator/tools/builtin/edit-partial-write.mjs +60 -0
- package/src/agent/orchestrator/tools/builtin/edit-stale-refresh.mjs +168 -0
- package/src/agent/orchestrator/tools/builtin/edit-tool.mjs +173 -0
- package/src/agent/orchestrator/tools/builtin/edit-utf8-guard.mjs +48 -0
- package/src/agent/orchestrator/tools/builtin/fs-reachability.mjs +48 -0
- package/src/agent/orchestrator/tools/builtin/fuzzy-match.mjs +99 -0
- package/src/agent/orchestrator/tools/builtin/glob-walk.mjs +170 -0
- package/src/agent/orchestrator/tools/builtin/grep-formatting.mjs +113 -0
- package/src/agent/orchestrator/tools/builtin/hash-utils.mjs +6 -0
- package/src/agent/orchestrator/tools/builtin/list-formatting.mjs +7 -0
- package/src/agent/orchestrator/tools/builtin/list-tool.mjs +593 -0
- package/src/agent/orchestrator/tools/builtin/native-edit-runner.mjs +89 -0
- package/src/agent/orchestrator/tools/builtin/notebook-edit-tool.mjs +300 -0
- package/src/agent/orchestrator/tools/builtin/open-config-tool.mjs +26 -0
- package/src/agent/orchestrator/tools/builtin/path-diagnostics.mjs +152 -0
- package/src/agent/orchestrator/tools/builtin/path-locks.mjs +35 -0
- package/src/agent/orchestrator/tools/builtin/path-utils.mjs +201 -0
- package/src/agent/orchestrator/tools/builtin/read-args.mjs +103 -0
- package/src/agent/orchestrator/tools/builtin/read-batch.mjs +172 -0
- package/src/agent/orchestrator/tools/builtin/read-constants.mjs +40 -0
- package/src/agent/orchestrator/tools/builtin/read-formatting.mjs +118 -0
- package/src/agent/orchestrator/tools/builtin/read-image-resize.mjs +189 -0
- package/src/agent/orchestrator/tools/builtin/read-image.mjs +88 -0
- package/src/agent/orchestrator/tools/builtin/read-lines.mjs +12 -0
- package/src/agent/orchestrator/tools/builtin/read-mode-tool.mjs +455 -0
- package/src/agent/orchestrator/tools/builtin/read-open.mjs +190 -0
- package/src/agent/orchestrator/tools/builtin/read-range-index.mjs +271 -0
- package/src/agent/orchestrator/tools/builtin/read-ranges.mjs +26 -0
- package/src/agent/orchestrator/tools/builtin/read-single-tool.mjs +728 -0
- package/src/agent/orchestrator/tools/builtin/read-snapshot-runtime.mjs +173 -0
- package/src/agent/orchestrator/tools/builtin/read-special-files.mjs +268 -0
- package/src/agent/orchestrator/tools/builtin/read-streaming.mjs +602 -0
- package/src/agent/orchestrator/tools/builtin/read-tool.mjs +530 -0
- package/src/agent/orchestrator/tools/builtin/read-windows.mjs +107 -0
- package/src/agent/orchestrator/tools/builtin/rename-tool.mjs +196 -0
- package/src/agent/orchestrator/tools/builtin/rg-runner.mjs +422 -0
- package/src/agent/orchestrator/tools/builtin/search-builders.mjs +158 -0
- package/src/agent/orchestrator/tools/builtin/search-tool.mjs +869 -0
- package/src/agent/orchestrator/tools/builtin/shell-analysis.mjs +653 -0
- package/src/agent/orchestrator/tools/builtin/shell-jobs.mjs +936 -0
- package/src/agent/orchestrator/tools/builtin/shell-output.mjs +36 -0
- package/src/agent/orchestrator/tools/builtin/shell-runtime.mjs +214 -0
- package/src/agent/orchestrator/tools/builtin/snapshot-helpers.mjs +143 -0
- package/src/agent/orchestrator/tools/builtin/snapshot-store.mjs +206 -0
- package/src/agent/orchestrator/tools/builtin/snapshot-validation.mjs +98 -0
- package/src/agent/orchestrator/tools/builtin/text-stats.mjs +69 -0
- package/src/agent/orchestrator/tools/builtin/windows-roots.mjs +23 -0
- package/src/agent/orchestrator/tools/builtin/write-tool.mjs +401 -0
- package/src/agent/orchestrator/tools/builtin.mjs +500 -0
- package/src/agent/orchestrator/tools/code-graph-prewarm-worker.mjs +39 -0
- package/src/agent/orchestrator/tools/code-graph-tool-defs.mjs +24 -0
- package/src/agent/orchestrator/tools/code-graph.mjs +4095 -0
- package/src/agent/orchestrator/tools/cwd-tool.mjs +298 -0
- package/src/agent/orchestrator/tools/destructive-warning.mjs +323 -0
- package/src/agent/orchestrator/tools/edit-normalize.mjs +603 -0
- package/src/agent/orchestrator/tools/env-scrub.mjs +100 -0
- package/src/agent/orchestrator/tools/graph-binary-fetcher.mjs +144 -0
- package/src/agent/orchestrator/tools/graph-manifest.json +26 -0
- package/src/agent/orchestrator/tools/host-input.mjs +204 -0
- package/src/agent/orchestrator/tools/mutation-content-cache.mjs +67 -0
- package/src/agent/orchestrator/tools/mutation-planner.mjs +75 -0
- package/src/agent/orchestrator/tools/next-call-utils.mjs +48 -0
- package/src/agent/orchestrator/tools/patch-binary-fetcher.mjs +133 -0
- package/src/agent/orchestrator/tools/patch-manifest.json +26 -0
- package/src/agent/orchestrator/tools/patch-tool-defs.mjs +20 -0
- package/src/agent/orchestrator/tools/patch.mjs +2754 -0
- package/src/agent/orchestrator/tools/progress-message.mjs +118 -0
- package/src/agent/orchestrator/tools/result-compression.mjs +279 -0
- package/src/agent/orchestrator/tools/shell-command.mjs +865 -0
- package/src/agent/orchestrator/tools/shell-exec-policy.mjs +89 -0
- package/src/agent/orchestrator/tools/shell-policy-danger-target.mjs +27 -0
- package/src/agent/orchestrator/tools/shell-policy-imports.mjs +7 -0
- package/src/agent/orchestrator/tools/shell-policy.mjs +345 -0
- package/src/agent/orchestrator/tools/shell-snapshot.mjs +313 -0
- package/src/agent/orchestrator/workflow-store.mjs +93 -0
- package/src/agent/tool-defs.mjs +103 -0
- package/src/channels/backends/discord.mjs +784 -0
- package/src/channels/data/voice-runtime-manifest.json +138 -0
- package/src/channels/index.mjs +3229 -0
- package/src/channels/lib/cli-worker-host.mjs +12 -0
- package/src/channels/lib/config-lock.mjs +13 -0
- package/src/channels/lib/config.mjs +292 -0
- package/src/channels/lib/drop-trace.mjs +71 -0
- package/src/channels/lib/event-pipeline.mjs +81 -0
- package/src/channels/lib/event-queue.mjs +345 -0
- package/src/channels/lib/executor.mjs +168 -0
- package/src/channels/lib/format.mjs +188 -0
- package/src/channels/lib/holidays.mjs +138 -0
- package/src/channels/lib/hook-pipe-server.mjs +802 -0
- package/src/channels/lib/interaction-workflows.mjs +184 -0
- package/src/channels/lib/memory-client.mjs +149 -0
- package/src/channels/lib/output-forwarder.mjs +765 -0
- package/src/channels/lib/runtime-paths.mjs +479 -0
- package/src/channels/lib/scheduler.mjs +723 -0
- package/src/channels/lib/session-control.mjs +36 -0
- package/src/channels/lib/session-discovery.mjs +103 -0
- package/src/channels/lib/settings.mjs +11 -0
- package/src/channels/lib/state-file.mjs +68 -0
- package/src/channels/lib/status-snapshot.mjs +219 -0
- package/src/channels/lib/tool-format.mjs +140 -0
- package/src/channels/lib/transcript-discovery.mjs +195 -0
- package/src/channels/lib/voice-runtime-fetcher.mjs +734 -0
- package/src/channels/lib/webhook.mjs +1179 -0
- package/src/channels/lib/whisper-server.mjs +477 -0
- package/src/channels/tool-defs.mjs +170 -0
- package/src/daemon/host.mjs +118 -0
- package/src/daemon/mcp-transport.mjs +47 -0
- package/src/daemon/session.mjs +100 -0
- package/src/daemon/thin-client.mjs +71 -0
- package/src/daemon/transport.mjs +163 -0
- package/src/memory/data/runtime-manifest.json +40 -0
- package/src/memory/index.mjs +3305 -0
- package/src/memory/lib/agent-ipc.mjs +93 -0
- package/src/memory/lib/bridge-trace-queries.mjs +120 -0
- package/src/memory/lib/core-memory-store.mjs +330 -0
- package/src/memory/lib/embedding-provider.mjs +269 -0
- package/src/memory/lib/embedding-worker.mjs +323 -0
- package/src/memory/lib/llm-worker-host.mjs +17 -0
- package/src/memory/lib/memory-cycle.mjs +11 -0
- package/src/memory/lib/memory-cycle1.mjs +641 -0
- package/src/memory/lib/memory-cycle2.mjs +1284 -0
- package/src/memory/lib/memory-cycle3.mjs +540 -0
- package/src/memory/lib/memory-embed.mjs +299 -0
- package/src/memory/lib/memory-extraction.mjs +5 -0
- package/src/memory/lib/memory-maintenance-store.mjs +32 -0
- package/src/memory/lib/memory-ops-policy.mjs +190 -0
- package/src/memory/lib/memory-recall-id-patch.mjs +15 -0
- package/src/memory/lib/memory-recall-read-query.mjs +7 -0
- package/src/memory/lib/memory-recall-scope-filter.mjs +63 -0
- package/src/memory/lib/memory-recall-store.mjs +621 -0
- package/src/memory/lib/memory-retrievers.mjs +112 -0
- package/src/memory/lib/memory-score.mjs +71 -0
- package/src/memory/lib/memory-text-utils.mjs +58 -0
- package/src/memory/lib/memory.mjs +412 -0
- package/src/memory/lib/model-profile.mjs +85 -0
- package/src/memory/lib/pg/adapter.mjs +308 -0
- package/src/memory/lib/pg/process.mjs +360 -0
- package/src/memory/lib/pg/supervisor.mjs +396 -0
- package/src/memory/lib/project-id-resolver.mjs +86 -0
- package/src/memory/lib/runtime-fetcher.mjs +442 -0
- package/src/memory/lib/trace-store.mjs +728 -0
- package/src/memory/tool-defs.mjs +79 -0
- package/src/search/index.mjs +1173 -0
- package/src/search/lib/backends/anthropic-oauth.mjs +98 -0
- package/src/search/lib/backends/exa.mjs +50 -0
- package/src/search/lib/backends/firecrawl.mjs +61 -0
- package/src/search/lib/backends/gemini-api.mjs +83 -0
- package/src/search/lib/backends/grok-oauth.mjs +86 -0
- package/src/search/lib/backends/index.mjs +150 -0
- package/src/search/lib/backends/openai-api.mjs +144 -0
- package/src/search/lib/backends/openai-oauth.mjs +98 -0
- package/src/search/lib/backends/openai-web-search.mjs +76 -0
- package/src/search/lib/backends/tavily.mjs +55 -0
- package/src/search/lib/backends/xai-api.mjs +113 -0
- package/src/search/lib/cache.mjs +131 -0
- package/src/search/lib/config.mjs +192 -0
- package/src/search/lib/formatter.mjs +115 -0
- package/src/search/lib/provider-usage.mjs +67 -0
- package/src/search/lib/providers.mjs +47 -0
- package/src/search/lib/search-intent.mjs +109 -0
- package/src/search/lib/setup-handler.mjs +261 -0
- package/src/search/lib/state.mjs +201 -0
- package/src/search/lib/web-tools.mjs +1207 -0
- package/src/search/tool-defs.mjs +83 -0
- package/src/setup/defender-exclusion.mjs +183 -0
- package/src/shared/abort-controller.mjs +15 -0
- package/src/shared/atomic-file.mjs +420 -0
- package/src/shared/config.mjs +350 -0
- package/src/shared/daemon-recycle.mjs +108 -0
- package/src/shared/disable-claude-builtins.mjs +88 -0
- package/src/shared/err-text.mjs +12 -0
- package/src/shared/llm/cost.mjs +66 -0
- package/src/shared/llm/http-agent.mjs +123 -0
- package/src/shared/llm/index.mjs +41 -0
- package/src/shared/llm/pid-cleanup.mjs +27 -0
- package/src/shared/llm/usage-log.mjs +47 -0
- package/src/shared/plugin-paths.mjs +58 -0
- package/src/shared/schedules-store.mjs +70 -0
- package/src/shared/seed.mjs +119 -0
- package/src/shared/user-cwd.mjs +213 -0
- package/src/shared/user-data-guard.mjs +238 -0
- package/src/status/aggregator.mjs +584 -0
- package/src/status/server.mjs +413 -0
- package/tools.json +1653 -0
|
@@ -0,0 +1,728 @@
|
|
|
1
|
+
import { closeSync, lstatSync, openSync, readFileSync, readSync, realpathSync, statSync } from 'fs';
|
|
2
|
+
import * as fsPromises from 'fs/promises';
|
|
3
|
+
import { readFile } from 'fs/promises';
|
|
4
|
+
import { extname } from 'path';
|
|
5
|
+
import { normalizeInputPath } from './path-utils.mjs';
|
|
6
|
+
import { findFileByBasename } from './path-diagnostics.mjs';
|
|
7
|
+
import { getReadSnapshot } from './read-snapshot-runtime.mjs';
|
|
8
|
+
import { snapshotCoversFullFile, statMatchesSnapshot } from './snapshot-helpers.mjs';
|
|
9
|
+
import { formatBinaryReadPreview } from './binary-file.mjs';
|
|
10
|
+
|
|
11
|
+
function snapshotBodyWasReturnedByRead(snapshot) {
|
|
12
|
+
return String(snapshot?.source || '').startsWith('read');
|
|
13
|
+
}
|
|
14
|
+
|
|
15
|
+
// Optional context-budget for a whole-file read: `max_lines:N` requests a
|
|
16
|
+
// TIGHTER head+tail elision than the default 600-line / 200+100 cap, to bound
|
|
17
|
+
// lead-context cost when only a glance is needed. Returns null (= default) when
|
|
18
|
+
// unset. No heuristic guessing — the budget is explicit and reuses the existing
|
|
19
|
+
// smartReadTruncate head/tail invariant. (`budget:'compact'` is a SEPARATE,
|
|
20
|
+
// pre-existing knob handled upstream in read-tool.mjs applyCompactReadBudget —
|
|
21
|
+
// it remaps a whole-file read to mode:'count' stats, not head+tail content.)
|
|
22
|
+
function resolveReadBudget(args) {
|
|
23
|
+
const ml = Number(args?.max_lines);
|
|
24
|
+
if (Number.isFinite(ml) && ml > 0) {
|
|
25
|
+
const maxLines = Math.trunc(ml);
|
|
26
|
+
const headLines = Math.max(1, Math.ceil(maxLines * 0.7));
|
|
27
|
+
return { maxLines, headLines, tailLines: Math.max(0, maxLines - headLines) };
|
|
28
|
+
}
|
|
29
|
+
return null;
|
|
30
|
+
}
|
|
31
|
+
|
|
32
|
+
function withSymbolReadNote(text, args) {
|
|
33
|
+
const note = typeof args?._symbolReadNote === 'string' ? args._symbolReadNote.trim() : '';
|
|
34
|
+
if (!note || typeof text !== 'string') return text;
|
|
35
|
+
return `${note}\n\n${text}`;
|
|
36
|
+
}
|
|
37
|
+
|
|
38
|
+
// BOM-only read-encoding detection. Mirrors write-tool.mjs
|
|
39
|
+
// detectExistingEncoding and CC fileRead.ts:34
|
|
40
|
+
// (buffer[0]===0xff && buffer[1]===0xfe -> 'utf16le') / file.ts
|
|
41
|
+
// detectFileEncoding. STRICTLY a leading-BOM rule — no content sniffing
|
|
42
|
+
// and no heuristic fallback, the same invariant the write path uses so a
|
|
43
|
+
// UTF-16LE file round-trips (write preserves FF FE -> read reverses it).
|
|
44
|
+
// Returns the decoder name plus the BOM byte length to strip before
|
|
45
|
+
// decoding. utf8-with-BOM (EF BB BF) keeps the utf-8 decoder; its leading
|
|
46
|
+
// U+FEFF is stripped for display downstream, so bomLen is reported but not
|
|
47
|
+
// applied for utf8.
|
|
48
|
+
function detectReadEncoding(fullPath) {
|
|
49
|
+
let fd;
|
|
50
|
+
try {
|
|
51
|
+
fd = openSync(fullPath, 'r');
|
|
52
|
+
const head = Buffer.alloc(3);
|
|
53
|
+
const n = readSync(fd, head, 0, 3, 0);
|
|
54
|
+
if (n >= 2 && head[0] === 0xff && head[1] === 0xfe) {
|
|
55
|
+
return { encoding: 'utf16le', bomLen: 2 };
|
|
56
|
+
}
|
|
57
|
+
if (n >= 2 && head[0] === 0xfe && head[1] === 0xff) {
|
|
58
|
+
return { encoding: 'utf16be', bomLen: 2 };
|
|
59
|
+
}
|
|
60
|
+
if (n >= 3 && head[0] === 0xef && head[1] === 0xbb && head[2] === 0xbf) {
|
|
61
|
+
return { encoding: 'utf8', bomLen: 3 };
|
|
62
|
+
}
|
|
63
|
+
return { encoding: 'utf8', bomLen: 0 };
|
|
64
|
+
} catch {
|
|
65
|
+
return { encoding: 'utf8', bomLen: 0 };
|
|
66
|
+
} finally {
|
|
67
|
+
if (fd !== undefined) { try { closeSync(fd); } catch {} }
|
|
68
|
+
}
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
export async function executeSingleReadTool(args, workDir, readStateScope, options = {}, helpers = {}) {
|
|
72
|
+
const {
|
|
73
|
+
appendReadContextAdvisory,
|
|
74
|
+
classifyResultKind,
|
|
75
|
+
extractIpynbText,
|
|
76
|
+
extractPdfText,
|
|
77
|
+
findSimilarFile,
|
|
78
|
+
isBinaryFile,
|
|
79
|
+
isBlockedDevicePath,
|
|
80
|
+
isUncPath,
|
|
81
|
+
isWindowsDevicePath,
|
|
82
|
+
hasUnsafeWin32Component,
|
|
83
|
+
isSpecialFileStat,
|
|
84
|
+
normalizeErrorMessage,
|
|
85
|
+
normalizeOutputPath,
|
|
86
|
+
parseLineLimitArg,
|
|
87
|
+
parseOffsetArg,
|
|
88
|
+
renderReadLine,
|
|
89
|
+
resolveAgainstCwd,
|
|
90
|
+
smartReadTruncate,
|
|
91
|
+
streamReadRange,
|
|
92
|
+
streamSmartReadSummary,
|
|
93
|
+
READ_MAX_OUTPUT_BYTES,
|
|
94
|
+
READ_MAX_SIZE_BYTES,
|
|
95
|
+
READ_SMART_STREAM_MIN_BYTES,
|
|
96
|
+
READ_STREAM_RANGE_MIN_BYTES,
|
|
97
|
+
_cacheGetEntry,
|
|
98
|
+
_cacheSet,
|
|
99
|
+
_hashText,
|
|
100
|
+
_rangeHashesForReadRanges,
|
|
101
|
+
_rangeHashesFromRenderedReadText,
|
|
102
|
+
_rawContentCacheGet,
|
|
103
|
+
_rawContentCacheSet,
|
|
104
|
+
_recordReadSnapshot,
|
|
105
|
+
} = helpers;
|
|
106
|
+
// Normalize path (strip whitespace, expand ~, posix→windows) up front so
|
|
107
|
+
// LLM-injected stray spaces don't trigger an ENOENT retry that pollutes
|
|
108
|
+
// the conversation history and breaks the cache prefix on later turns.
|
|
109
|
+
if (typeof args.path === 'string') args.path = normalizeInputPath(args.path);
|
|
110
|
+
const filePath = args.path;
|
|
111
|
+
if (!filePath)
|
|
112
|
+
return 'Error: path is required.';
|
|
113
|
+
// R1: UNC / SMB share reject (\\server\share, //server/share). Reading
|
|
114
|
+
// these on Windows auto-authenticates to the remote host and leaks the
|
|
115
|
+
// NTLM hash of the current user to any attacker-controlled SMB target.
|
|
116
|
+
// CC parity: FileReadTool.ts:461 rejects the same prefix before stat.
|
|
117
|
+
// Must run before resolveAgainstCwd so a relative path can't be coerced
|
|
118
|
+
// into a UNC share by the cwd resolution.
|
|
119
|
+
if (typeof isUncPath === 'function' && isUncPath(filePath))
|
|
120
|
+
return `Error: cannot read UNC / SMB path (network credential leak risk): ${normalizeOutputPath(filePath)}`;
|
|
121
|
+
// R2: Windows reserved device names (CON / NUL / PRN / AUX / COM[0-9] /
|
|
122
|
+
// LPT[0-9]) and raw-device namespaces (\\.\ and \\?\). These are kernel
|
|
123
|
+
// aliases that never resolve to real files and can hang or grant raw
|
|
124
|
+
// device access regardless of directory.
|
|
125
|
+
if (typeof isWindowsDevicePath === 'function' && isWindowsDevicePath(filePath))
|
|
126
|
+
return `Error: cannot read Windows device path (reserved name or raw-device namespace): ${normalizeOutputPath(filePath)}`;
|
|
127
|
+
// R12: Win32 component guard. Trailing dot/space or embedded ':' in
|
|
128
|
+
// any path component lets Win32 silently resolve to a different file
|
|
129
|
+
// (stripped dot/space) or an NTFS Alternate Data Stream attached to
|
|
130
|
+
// another file, bypassing the string-based device/UNC checks above.
|
|
131
|
+
if (typeof hasUnsafeWin32Component === 'function' && hasUnsafeWin32Component(filePath))
|
|
132
|
+
return `Error: cannot read Windows path with trailing dot/space or NTFS ADS suffix (bypasses device guard): ${normalizeOutputPath(filePath)}`;
|
|
133
|
+
// G6: block device pseudo-files (would hang / produce infinite output).
|
|
134
|
+
if (isBlockedDevicePath(filePath))
|
|
135
|
+
return `Error: cannot read device file (would block or produce infinite output): ${normalizeOutputPath(filePath)}`;
|
|
136
|
+
const fullPath = resolveAgainstCwd(filePath, workDir);
|
|
137
|
+
// R1: re-check the resolved path — `resolveAgainstCwd` could have produced
|
|
138
|
+
// a UNC / Windows device path even when the user-supplied string did not
|
|
139
|
+
// (rare, but possible with custom cwd containing a UNC root).
|
|
140
|
+
if (typeof isUncPath === 'function' && isUncPath(fullPath))
|
|
141
|
+
return `Error: cannot read UNC / SMB path (network credential leak risk): ${normalizeOutputPath(fullPath)}`;
|
|
142
|
+
if (typeof isWindowsDevicePath === 'function' && isWindowsDevicePath(fullPath))
|
|
143
|
+
return `Error: cannot read Windows device path (reserved name or raw-device namespace): ${normalizeOutputPath(fullPath)}`;
|
|
144
|
+
if (typeof hasUnsafeWin32Component === 'function' && hasUnsafeWin32Component(fullPath))
|
|
145
|
+
return `Error: cannot read Windows path with trailing dot/space or NTFS ADS suffix (bypasses device guard): ${normalizeOutputPath(fullPath)}`;
|
|
146
|
+
// Pre-read size cap (Anthropic FileReadTool/limits.ts pattern):
|
|
147
|
+
// throw a small error response when the file is too big rather
|
|
148
|
+
// than truncating to 25K tokens of content. Throw is decisively
|
|
149
|
+
// more token-efficient (Anthropic #21841 reverted truncation).
|
|
150
|
+
// Large-file branch: if offset/limit is provided, stream the
|
|
151
|
+
// requested line window instead of throwing (Task B). Without
|
|
152
|
+
// range args the cap still throws so small-file default path
|
|
153
|
+
// can't be weaponised to pull megabytes by accident.
|
|
154
|
+
const hasOffsetArg = args.offset !== undefined && args.offset !== null;
|
|
155
|
+
const hasLimitArg = args.limit !== undefined && args.limit !== null;
|
|
156
|
+
const hasRangeArgs = hasOffsetArg || hasLimitArg;
|
|
157
|
+
const wantFull = args.full === true;
|
|
158
|
+
const offset = parseOffsetArg(args.offset);
|
|
159
|
+
// full:true bypasses the default 2000-line cap so the whole file
|
|
160
|
+
// can be returned in one call; the byte-cap path below still
|
|
161
|
+
// emits a compact truncation marker when rendered bytes overflow
|
|
162
|
+
// READ_MAX_OUTPUT_BYTES.
|
|
163
|
+
const limit = parseLineLimitArg(args.limit, wantFull ? Infinity : 2000);
|
|
164
|
+
// Context-budget (compact / max_lines) — only meaningful on a whole-file
|
|
165
|
+
// read (no range, not full). Ignored otherwise.
|
|
166
|
+
const _readBudget = (!hasRangeArgs && !wantFull) ? resolveReadBudget(args) : null;
|
|
167
|
+
let st;
|
|
168
|
+
let _statErr;
|
|
169
|
+
try {
|
|
170
|
+
st = statSync(fullPath);
|
|
171
|
+
} catch (err) {
|
|
172
|
+
// Fall through to the existing similar-file recovery path below.
|
|
173
|
+
st = null;
|
|
174
|
+
_statErr = err;
|
|
175
|
+
}
|
|
176
|
+
if (st) {
|
|
177
|
+
// R2: special-file reject AFTER stat. FIFOs, char devices, block
|
|
178
|
+
// devices, and sockets pass a normal stat but reading them either
|
|
179
|
+
// hangs (FIFO with no writer, socket) or produces unbounded output
|
|
180
|
+
// (/dev/zero, /dev/random). Catches arbitrary user paths that point
|
|
181
|
+
// at a special inode (custom mknod, etc.) that the string-based
|
|
182
|
+
// device guard above doesn't know about.
|
|
183
|
+
if (typeof isSpecialFileStat === 'function' && isSpecialFileStat(st))
|
|
184
|
+
return `Error: cannot read special file (FIFO / character / block device / socket): ${normalizeOutputPath(filePath)}`;
|
|
185
|
+
// R1+R2: realpath the resolved path so a symlink → /dev/zero (or any
|
|
186
|
+
// other blocked device, UNC, or Windows reserved name) is caught on
|
|
187
|
+
// the REAL target, not the symlink name. lstatSync detects whether
|
|
188
|
+
// the entry IS a symlink first so realpathSync is only called when
|
|
189
|
+
// it would actually differ — saves a syscall on the common case.
|
|
190
|
+
try {
|
|
191
|
+
const _lst = lstatSync(fullPath);
|
|
192
|
+
if (_lst && typeof _lst.isSymbolicLink === 'function' && _lst.isSymbolicLink()) {
|
|
193
|
+
let _realTarget = null;
|
|
194
|
+
try { _realTarget = realpathSync(fullPath); } catch { _realTarget = null; }
|
|
195
|
+
if (_realTarget && _realTarget !== fullPath) {
|
|
196
|
+
if (isBlockedDevicePath(_realTarget))
|
|
197
|
+
return `Error: cannot read device file via symlink (would block or produce infinite output): ${normalizeOutputPath(filePath)} → ${normalizeOutputPath(_realTarget)}`;
|
|
198
|
+
if (typeof isUncPath === 'function' && isUncPath(_realTarget))
|
|
199
|
+
return `Error: cannot read UNC / SMB path via symlink (network credential leak risk): ${normalizeOutputPath(filePath)} → ${normalizeOutputPath(_realTarget)}`;
|
|
200
|
+
if (typeof isWindowsDevicePath === 'function' && isWindowsDevicePath(_realTarget))
|
|
201
|
+
return `Error: cannot read Windows device path via symlink (reserved name or raw-device namespace): ${normalizeOutputPath(filePath)} → ${normalizeOutputPath(_realTarget)}`;
|
|
202
|
+
// Re-run the special-file stat on the real target — the
|
|
203
|
+
// symlink itself was already checked above via `st`, but
|
|
204
|
+
// the target stat could differ from the link stat in
|
|
205
|
+
// pathological cases (replaced under us).
|
|
206
|
+
try {
|
|
207
|
+
const _rst = statSync(_realTarget);
|
|
208
|
+
if (typeof isSpecialFileStat === 'function' && isSpecialFileStat(_rst))
|
|
209
|
+
return `Error: cannot read special file via symlink (FIFO / character / block device / socket): ${normalizeOutputPath(filePath)} → ${normalizeOutputPath(_realTarget)}`;
|
|
210
|
+
} catch { /* if the target is gone, let the normal path surface ENOENT */ }
|
|
211
|
+
}
|
|
212
|
+
}
|
|
213
|
+
} catch { /* lstat failure is non-fatal; the original `st` is authoritative */ }
|
|
214
|
+
}
|
|
215
|
+
if (!st) {
|
|
216
|
+
const err = _statErr;
|
|
217
|
+
const similar = findSimilarFile(fullPath);
|
|
218
|
+
let hint = similar ? ` Did you mean "${normalizeOutputPath(similar)}"?` : '';
|
|
219
|
+
// Right-name / wrong-directory miss: findSimilarFile only checks the
|
|
220
|
+
// same dir. Locate the basename elsewhere in the tree and name the real
|
|
221
|
+
// path(s) directly — the route a model would otherwise reconstruct with
|
|
222
|
+
// a grep/glob storm.
|
|
223
|
+
if (!similar) {
|
|
224
|
+
const elsewhere = findFileByBasename(workDir, fullPath);
|
|
225
|
+
if (elsewhere.length) {
|
|
226
|
+
hint = ` Not found at this path; the same filename exists at: ${elsewhere.map((p) => `"${normalizeOutputPath(p)}"`).join(', ')}. Read that path directly.`;
|
|
227
|
+
}
|
|
228
|
+
}
|
|
229
|
+
const _rawMsg = err instanceof Error ? err.message : String(err);
|
|
230
|
+
const _safeMsg = normalizeErrorMessage(_rawMsg, workDir);
|
|
231
|
+
return `Error: ${_safeMsg}${hint}`;
|
|
232
|
+
}
|
|
233
|
+
// MEDIA-WINS: .pdf/.ipynb dispatch runs BEFORE any cache/snapshot fast
|
|
234
|
+
// path. A media file previously read as text can carry a stale result-
|
|
235
|
+
// cache or read-snapshot entry; returning that cached TEXT instead of the
|
|
236
|
+
// fresh media shape (PDF document block / ipynb content-block array) is
|
|
237
|
+
// wrong — media must win. Hoisted here, right after the UNC/device/ADS
|
|
238
|
+
// guards + stat but before _cacheGetEntry / getReadSnapshot, so neither
|
|
239
|
+
// fast path can short-circuit a media read. extractPdfText /
|
|
240
|
+
// extractIpynbText own their size handling internally (PDF >20MB → text
|
|
241
|
+
// fallback via PDF_DOCUMENT_MAX_BYTES, page-range filter, ipynb range
|
|
242
|
+
// refusal), so this single early dispatch supersedes the old >10MiB media
|
|
243
|
+
// lines and the old post-cache media lines without bypassing those
|
|
244
|
+
// decisions. mediaTextOnly (batch dispatcher) must produce a flat string,
|
|
245
|
+
// never a content-block object, so a batch aggregate's String()+join can't
|
|
246
|
+
// stringify it to "[object Object]"; scalar reads leave it unset and get
|
|
247
|
+
// the rich block shapes.
|
|
248
|
+
const _mediaTextOnly = options?.mediaTextOnly === true;
|
|
249
|
+
const _mediaExt = extname(fullPath).toLowerCase();
|
|
250
|
+
if (_mediaExt === '.pdf') return extractPdfText(fullPath, args.pages, { maxOutputBytes: READ_MAX_OUTPUT_BYTES, textOnly: _mediaTextOnly });
|
|
251
|
+
if (_mediaExt === '.ipynb') {
|
|
252
|
+
const _ipynbOut = await extractIpynbText(fullPath, { maxOutputBytes: READ_MAX_OUTPUT_BYTES, hasRangeArgs: hasRangeArgs || args.line !== undefined, textOnly: _mediaTextOnly });
|
|
253
|
+
// Record a full-file read snapshot so notebook_edit's read-before-write
|
|
254
|
+
// guard (and edit/write consistency) can recognise the notebook was
|
|
255
|
+
// seen. A rendered ipynb read returns a media/text shape, not the raw
|
|
256
|
+
// JSON, so without this the structural editor could never satisfy its
|
|
257
|
+
// prior-read requirement. Skipped on an Error string (no real read).
|
|
258
|
+
if (typeof _ipynbOut !== 'string' || !_ipynbOut.startsWith('Error:')) {
|
|
259
|
+
_recordReadSnapshot(fullPath, st, readStateScope, { source: 'read', replaceExisting: true });
|
|
260
|
+
}
|
|
261
|
+
return _ipynbOut;
|
|
262
|
+
}
|
|
263
|
+
const cacheKey = `read|${fullPath}|${st.mtimeMs}|${st.size}|${hasOffsetArg ? offset : 'd'}|${hasLimitArg ? limit : 'd'}|${wantFull ? 'f' : 's'}|${_readBudget ? `b${_readBudget.maxLines}` : 'd'}`;
|
|
264
|
+
// Race-guard helper: same-mtime same-size rapid rewrite (NTFS / exFAT 1 s
|
|
265
|
+
// resolution) can pass mtimeMs+size yet differ in content. When the cache
|
|
266
|
+
// entry stores a contentPrefixHash, recompute the current prefix and bail
|
|
267
|
+
// to a fresh read on mismatch. Helper kept local (not hoisted) so it can
|
|
268
|
+
// close over fullPath and st without an extra arg.
|
|
269
|
+
const _readPrefixHashForCacheGuard = () => {
|
|
270
|
+
try {
|
|
271
|
+
if (st.size <= 65536) {
|
|
272
|
+
return _hashText(readFileSync(fullPath, 'utf-8'));
|
|
273
|
+
}
|
|
274
|
+
const _fd = openSync(fullPath, 'r');
|
|
275
|
+
try {
|
|
276
|
+
const _buf = Buffer.allocUnsafe(65536);
|
|
277
|
+
const _n = readSync(_fd, _buf, 0, 65536, 0);
|
|
278
|
+
return _hashText(_buf.subarray(0, _n));
|
|
279
|
+
} finally { try { closeSync(_fd); } catch {} }
|
|
280
|
+
} catch { return ''; }
|
|
281
|
+
};
|
|
282
|
+
const cachedEntry = _cacheGetEntry(cacheKey);
|
|
283
|
+
if (cachedEntry !== null) {
|
|
284
|
+
let _entryStillValid = true;
|
|
285
|
+
// Single-pass cache-hit guard. The cache key already pins
|
|
286
|
+
// mtimeMs+size, so a hit means only a same-mtime/same-size rewrite
|
|
287
|
+
// (NTFS / exFAT 1 s resolution) could differ — caught by re-hashing
|
|
288
|
+
// the on-disk body. Previously this ran as two passes: a 64KiB
|
|
289
|
+
// prefix-hash guard, then a separate full-content guard that
|
|
290
|
+
// re-read the whole file again. For ≤64KiB files contentPrefixHash
|
|
291
|
+
// and contentHash are computed over the identical body at the read
|
|
292
|
+
// result-cache set sites (:360 and :367) and are byte-equal by
|
|
293
|
+
// construction, so the two passes read+hashed the same bytes twice
|
|
294
|
+
// for nothing. Collapse to one read + one hash per hit.
|
|
295
|
+
const _prefixHash = cachedEntry.contentPrefixHash;
|
|
296
|
+
const _snapHash = cachedEntry.readSnapshotMeta?.contentHash;
|
|
297
|
+
if (_prefixHash || _snapHash) {
|
|
298
|
+
if (st.size <= 65536) {
|
|
299
|
+
// ≤64KiB: one full-body read validates whichever hash the
|
|
300
|
+
// entry carries — prefix == full at this size. Prefer the
|
|
301
|
+
// exact full contentHash when present, else the prefix hash
|
|
302
|
+
// (also full-body here). A read failure drops to fresh read.
|
|
303
|
+
try {
|
|
304
|
+
const _freshHash = _hashText(readFileSync(fullPath, 'utf-8'));
|
|
305
|
+
const _expect = _snapHash || _prefixHash;
|
|
306
|
+
if (!_freshHash || _freshHash !== _expect) _entryStillValid = false;
|
|
307
|
+
} catch { _entryStillValid = false; }
|
|
308
|
+
} else if (_prefixHash) {
|
|
309
|
+
// >64KiB: contentHash may still be stored (full-file reads
|
|
310
|
+
// keep it up to the 10MB read cap), but validating it here
|
|
311
|
+
// means a synchronous full-content sha that blocks the main
|
|
312
|
+
// thread on a multi-megabyte body every cache check — so the
|
|
313
|
+
// validation, not the storage, is size-gated: for >64KiB only
|
|
314
|
+
// the 64KiB head prefix is checked. It catches same-mtime/
|
|
315
|
+
// same-size rewrites within the first 64KiB (the common case);
|
|
316
|
+
// writes through edit/apply_patch/write invalidate by path,
|
|
317
|
+
// and shell mutationMode='global' wipes both builtin +
|
|
318
|
+
// code-graph caches, bounding stale risk past the head.
|
|
319
|
+
const _curHash = _readPrefixHashForCacheGuard();
|
|
320
|
+
if (!_curHash || _curHash !== _prefixHash) _entryStillValid = false;
|
|
321
|
+
}
|
|
322
|
+
}
|
|
323
|
+
if (_entryStillValid) {
|
|
324
|
+
// Cross-session stub guard: RESULT_CACHE is process-global, so a
|
|
325
|
+
// cache hit can be an entry SET BY ANOTHER SESSION whose body this
|
|
326
|
+
// conversation never received. The file_unchanged stub assumes the
|
|
327
|
+
// full body is already in a prior tool_result of THIS session — only
|
|
328
|
+
// true when a session-scoped snapshot exists, matches the current
|
|
329
|
+
// stat, and was itself produced by a body-returning read. Probe that
|
|
330
|
+
// BEFORE recording the snapshot below (which would otherwise mark the
|
|
331
|
+
// file as body-returned and mask the cross-session case). A null
|
|
332
|
+
// readStateScope has no session evidence, so it always fails the gate
|
|
333
|
+
// and falls through to the full cached body.
|
|
334
|
+
const _sessionSnap = readStateScope ? getReadSnapshot(fullPath, readStateScope) : null;
|
|
335
|
+
const _stubBodyAlreadySent = !!_sessionSnap
|
|
336
|
+
&& statMatchesSnapshot(st, _sessionSnap)
|
|
337
|
+
&& snapshotBodyWasReturnedByRead(_sessionSnap)
|
|
338
|
+
// Range-coverage guard: snapshotBodyWasReturnedByRead only
|
|
339
|
+
// proves SOME body was returned, not WHICH lines. A session
|
|
340
|
+
// that read just lines 1-10 (ranged, source 'read', stat
|
|
341
|
+
// matches) must NOT get an unchanged stub on a later full
|
|
342
|
+
// read whose body it never saw — another session's full read
|
|
343
|
+
// populated the global cache. For a full-file read require
|
|
344
|
+
// the session snapshot to cover the whole file. For a ranged
|
|
345
|
+
// read there is no requested-window-coverage helper
|
|
346
|
+
// (snapshotRangesCoverAllLines checks ALL lines, not the
|
|
347
|
+
// window), so conservatively require full coverage there too:
|
|
348
|
+
// failing the gate only falls through to the full cached body
|
|
349
|
+
// (a few extra tokens), which is never incorrect. The
|
|
350
|
+
// path-snapshot fallback at the size-gated branch below
|
|
351
|
+
// already requires snapshotCoversFullFile for this reason.
|
|
352
|
+
&& snapshotCoversFullFile(_sessionSnap);
|
|
353
|
+
_recordReadSnapshot(fullPath, st, readStateScope, cachedEntry.readSnapshotMeta || { source: 'read_cached' });
|
|
354
|
+
// G6: file_unchanged stub. The full body is already in the
|
|
355
|
+
// prior tool_result; resending it wastes cache_creation
|
|
356
|
+
// tokens (Claude Code upstream measured ~18% on Read calls).
|
|
357
|
+
// The stub keeps the snapshot tracking intact (Edit
|
|
358
|
+
// validation still works) while collapsing the response
|
|
359
|
+
// payload. Falls back to the full body when the cached
|
|
360
|
+
// value is itself a stub-incompatible error string, or when
|
|
361
|
+
// this session has no body-returned snapshot proving it saw the
|
|
362
|
+
// body (cross-session cache hit — emit the full cached body so
|
|
363
|
+
// the recorded snapshot above is honestly body-returned here).
|
|
364
|
+
const _cachedVal = cachedEntry.value;
|
|
365
|
+
if (typeof _cachedVal === 'string' && classifyResultKind(_cachedVal) !== 'error') {
|
|
366
|
+
if (_stubBodyAlreadySent && options?.suppressReadUnchangedStub !== true) {
|
|
367
|
+
return withSymbolReadNote(`[file unchanged: ${normalizeOutputPath(filePath)}]`, args);
|
|
368
|
+
}
|
|
369
|
+
}
|
|
370
|
+
return withSymbolReadNote(_cachedVal, args);
|
|
371
|
+
}
|
|
372
|
+
// Race detected — fall through to fresh read below.
|
|
373
|
+
}
|
|
374
|
+
// Path-snapshot fallback: exact cache-key hits above can still collapse
|
|
375
|
+
// duplicate reads. Size-gate the fallback so a missing cache entry never
|
|
376
|
+
// hashes a large file just to emit an unchanged stub.
|
|
377
|
+
if (!hasRangeArgs && st.size <= 65536) {
|
|
378
|
+
const _snap = getReadSnapshot(fullPath, readStateScope);
|
|
379
|
+
if (_snap
|
|
380
|
+
&& statMatchesSnapshot(st, _snap)
|
|
381
|
+
&& snapshotCoversFullFile(_snap)
|
|
382
|
+
&& snapshotBodyWasReturnedByRead(_snap)
|
|
383
|
+
&& typeof _snap.contentHash === 'string'
|
|
384
|
+
&& _snap.contentHash) {
|
|
385
|
+
let _diskHash = '';
|
|
386
|
+
try { _diskHash = _hashText(readFileSync(fullPath, 'utf-8')); } catch {}
|
|
387
|
+
if (_diskHash && _diskHash === _snap.contentHash) {
|
|
388
|
+
if (options?.suppressReadUnchangedStub !== true) {
|
|
389
|
+
return withSymbolReadNote(`[file unchanged: ${normalizeOutputPath(filePath)}]`, args);
|
|
390
|
+
}
|
|
391
|
+
}
|
|
392
|
+
}
|
|
393
|
+
}
|
|
394
|
+
// BOM-only encoding detection runs BEFORE the >10MiB size branch so a
|
|
395
|
+
// large UTF-16LE+BOM file is recognized as text up front and routed to
|
|
396
|
+
// the bounded in-memory utf16le path below, never mis-decoded as utf-8
|
|
397
|
+
// or rejected by the utf-8 streaming/binary branch (Bug 1).
|
|
398
|
+
const _readEnc = detectReadEncoding(fullPath);
|
|
399
|
+
// UTF-16 (LE or BE) reads share one constraint: the streaming/binary
|
|
400
|
+
// paths decode chunks as utf-8, so a BOM-flagged UTF-16 file must route
|
|
401
|
+
// to the bounded in-memory decode below regardless of byte order.
|
|
402
|
+
const _isUtf16 = _readEnc.encoding === 'utf16le' || _readEnc.encoding === 'utf16be';
|
|
403
|
+
if (st.size > READ_MAX_SIZE_BYTES) {
|
|
404
|
+
// .pdf/.ipynb were already dispatched up front (MEDIA-WINS), so this
|
|
405
|
+
// >10MiB branch only handles the non-media text path from here on.
|
|
406
|
+
// utf16le bound (Bug 2): utf16le reads route through a single
|
|
407
|
+
// in-memory full read+decode+split (streamReadRange is gated off
|
|
408
|
+
// for utf16le because it decodes chunks as utf-8). Keep that one
|
|
409
|
+
// path but cap it — a >10MiB utf16le file would otherwise be
|
|
410
|
+
// unbounded in memory or mis-routed into the utf-8 stream/binary
|
|
411
|
+
// branch. Refuse so utf16le memory is always <= READ_MAX_SIZE_BYTES.
|
|
412
|
+
if (_isUtf16) {
|
|
413
|
+
return `Error: UTF-16 file size ${st.size} bytes exceeds ${READ_MAX_SIZE_BYTES} bytes; utf16 ranged reads are bounded — convert to UTF-8 or narrow the range.`;
|
|
414
|
+
}
|
|
415
|
+
if (!hasRangeArgs) {
|
|
416
|
+
return `Error: file size ${st.size} bytes exceeds ${READ_MAX_SIZE_BYTES}-byte cap.`;
|
|
417
|
+
}
|
|
418
|
+
if (isBinaryFile(fullPath, st.size)) {
|
|
419
|
+
const { text, snapshotMeta } = formatBinaryReadPreview(fullPath, normalizeOutputPath(filePath), st.size);
|
|
420
|
+
_recordReadSnapshot(fullPath, st, readStateScope, snapshotMeta);
|
|
421
|
+
_cacheSet(cacheKey, text, { paths: [fullPath], readSnapshotMeta: snapshotMeta });
|
|
422
|
+
return withSymbolReadNote(text, args);
|
|
423
|
+
}
|
|
424
|
+
try {
|
|
425
|
+
const _streamRes = await streamReadRange(fullPath, offset, limit, st, { displayPath: filePath });
|
|
426
|
+
const out = _streamRes.text;
|
|
427
|
+
// W1 H: snapshot only emitted line bounds, not the
|
|
428
|
+
// requested window — byte-cap truncation can stop short.
|
|
429
|
+
const _emittedRanges = (_streamRes.firstEmitted && _streamRes.lastEmitted)
|
|
430
|
+
? [{ startLine: _streamRes.firstEmitted, endLine: _streamRes.lastEmitted }]
|
|
431
|
+
: [];
|
|
432
|
+
const snapshotMeta = {
|
|
433
|
+
source: 'read',
|
|
434
|
+
ranges: _emittedRanges,
|
|
435
|
+
// D-R1-1: rangeHash covers the exact text returned so
|
|
436
|
+
// _isSnapshotStale can detect same-mtime+same-size
|
|
437
|
+
// rewrites within the read window at edit time.
|
|
438
|
+
// Fix J-1 (b): hash raw line text, not rendered
|
|
439
|
+
// "N\ttext" form, to match _isSnapshotStale which
|
|
440
|
+
// hashes _lines.slice().join('\n') (raw content).
|
|
441
|
+
// Strip the rendered line-number prefix from each
|
|
442
|
+
// returned line before hashing so both sides match.
|
|
443
|
+
rangeHashes: _rangeHashesFromRenderedReadText(out, _emittedRanges),
|
|
444
|
+
};
|
|
445
|
+
// Compute prefix hash for race-guard on next cache hit.
|
|
446
|
+
// Async to avoid blocking the event loop on a 64KB read
|
|
447
|
+
// for every large-file streaming path.
|
|
448
|
+
const _streamPrefixHash = _streamRes.prefixHash || await (async () => {
|
|
449
|
+
try {
|
|
450
|
+
if (st.size <= 65536) return _hashText(await readFile(fullPath, 'utf-8'));
|
|
451
|
+
const fh = await fsPromises.open(fullPath, 'r');
|
|
452
|
+
try {
|
|
453
|
+
const _buf = Buffer.allocUnsafe(65536);
|
|
454
|
+
const _readRes = await fh.read(_buf, 0, 65536, 0);
|
|
455
|
+
return _hashText(_buf.subarray(0, _readRes.bytesRead));
|
|
456
|
+
} finally { await fh.close().catch(() => {}); }
|
|
457
|
+
} catch { return ''; }
|
|
458
|
+
})();
|
|
459
|
+
_cacheSet(cacheKey, out, { paths: [fullPath], readSnapshotMeta: snapshotMeta, contentPrefixHash: _streamPrefixHash });
|
|
460
|
+
_recordReadSnapshot(fullPath, st, readStateScope, snapshotMeta);
|
|
461
|
+
return withSymbolReadNote(out, args);
|
|
462
|
+
} catch (err) {
|
|
463
|
+
return `Error: ${normalizeErrorMessage(err instanceof Error ? err.message : String(err))}`;
|
|
464
|
+
}
|
|
465
|
+
}
|
|
466
|
+
// Non-text special formats (.pdf/.ipynb) were intercepted up front
|
|
467
|
+
// (MEDIA-WINS, before the cache/snapshot fast paths), so the binary check
|
|
468
|
+
// below only ever sees the non-media text path.
|
|
469
|
+
// BOM-only encoding peek BEFORE the binary/NUL check. A UTF-16LE+BOM
|
|
470
|
+
// file is full of 0x00 bytes (the high byte of every ASCII char), so
|
|
471
|
+
// isBinaryFile would wrongly reject it. The FF FE BOM is an
|
|
472
|
+
// unambiguous TEXT signal, so classify it as utf16le up front and skip
|
|
473
|
+
// NUL rejection. The write tool preserves this encoding
|
|
474
|
+
// (write-tool.mjs detectExistingEncoding); decoding it here reverses
|
|
475
|
+
// that so the file round-trips. (_readEnc was detected above, before
|
|
476
|
+
// the >10MiB size branch, so the large-file path can classify utf16le.)
|
|
477
|
+
if (!_isUtf16 && isBinaryFile(fullPath, st.size)) {
|
|
478
|
+
const { text, snapshotMeta } = formatBinaryReadPreview(fullPath, normalizeOutputPath(filePath), st.size);
|
|
479
|
+
_recordReadSnapshot(fullPath, st, readStateScope, snapshotMeta);
|
|
480
|
+
_cacheSet(cacheKey, text, { paths: [fullPath], readSnapshotMeta: snapshotMeta });
|
|
481
|
+
return withSymbolReadNote(text, args);
|
|
482
|
+
}
|
|
483
|
+
// Whole-file reads above READ_WHOLE_FILE_MAX_BYTES use stream smart-elide
|
|
484
|
+
// (then READ_MAX_OUTPUT_BYTES truncation) instead of refusing. Absolute
|
|
485
|
+
// in-memory ceiling remains READ_MAX_SIZE_BYTES (10 MiB) above.
|
|
486
|
+
// The streaming paths (smart-summary + range) decode chunks as utf-8;
|
|
487
|
+
// a utf16le file must instead fall through to the encoding-aware
|
|
488
|
+
// in-memory regular read below, which still runs smartReadTruncate so
|
|
489
|
+
// smart-elide stays intact. utf-8 keeps the streaming fast path.
|
|
490
|
+
if (!_isUtf16 && !hasRangeArgs && !wantFull && st.size >= READ_SMART_STREAM_MIN_BYTES) {
|
|
491
|
+
try {
|
|
492
|
+
const _streamSmart = typeof streamSmartReadSummary === 'function'
|
|
493
|
+
? await streamSmartReadSummary(fullPath, st, 'read_smart_stream')
|
|
494
|
+
: null;
|
|
495
|
+
if (_streamSmart?.text) {
|
|
496
|
+
let out = _streamSmart.text;
|
|
497
|
+
// Honor a compact/max_lines budget on a large file: the stream
|
|
498
|
+
// already elided to head 200/tail 100; re-apply the tighter
|
|
499
|
+
// head+tail so the lead sees only the requested glance.
|
|
500
|
+
if (_readBudget) {
|
|
501
|
+
// Use the file's REAL line count from the stream pass
|
|
502
|
+
// (snapshotMeta.fileLineCount — the result has no top-level
|
|
503
|
+
// totalLines), not the already-elided output's row count: the
|
|
504
|
+
// re-budget marker otherwise reports "[TRUNCATED - 301 lines]"
|
|
505
|
+
// for a 3800-line file.
|
|
506
|
+
const _rebud = smartReadTruncate(out, _streamSmart.snapshotMeta?.fileLineCount || out.split('\n').length, st.size, filePath, _readBudget);
|
|
507
|
+
if (_rebud?.truncated) out = _rebud.text;
|
|
508
|
+
}
|
|
509
|
+
const snapshotMeta = _streamSmart.snapshotMeta || {
|
|
510
|
+
source: 'read_smart_stream',
|
|
511
|
+
ranges: [],
|
|
512
|
+
};
|
|
513
|
+
const _streamPrefixHash = _streamSmart.prefixHash || await (async () => {
|
|
514
|
+
try {
|
|
515
|
+
if (st.size <= 65536) return _hashText(await readFile(fullPath, 'utf-8'));
|
|
516
|
+
const fh = await fsPromises.open(fullPath, 'r');
|
|
517
|
+
try {
|
|
518
|
+
const _buf = Buffer.allocUnsafe(65536);
|
|
519
|
+
const _readRes = await fh.read(_buf, 0, 65536, 0);
|
|
520
|
+
return _hashText(_buf.subarray(0, _readRes.bytesRead));
|
|
521
|
+
} finally { await fh.close().catch(() => {}); }
|
|
522
|
+
} catch { return ''; }
|
|
523
|
+
})();
|
|
524
|
+
_cacheSet(cacheKey, out, { paths: [fullPath], readSnapshotMeta: snapshotMeta, contentPrefixHash: _streamPrefixHash });
|
|
525
|
+
_recordReadSnapshot(fullPath, st, readStateScope, snapshotMeta);
|
|
526
|
+
return withSymbolReadNote(out, args);
|
|
527
|
+
}
|
|
528
|
+
} catch {
|
|
529
|
+
// Fall through to the regular read path; it still enforces output caps.
|
|
530
|
+
}
|
|
531
|
+
}
|
|
532
|
+
if (!_isUtf16 && hasRangeArgs && !wantFull && st.size > READ_STREAM_RANGE_MIN_BYTES) {
|
|
533
|
+
try {
|
|
534
|
+
const _streamRes = await streamReadRange(fullPath, offset, limit, st, { displayPath: filePath });
|
|
535
|
+
const out = _streamRes.text;
|
|
536
|
+
const _emittedRanges = (_streamRes.firstEmitted && _streamRes.lastEmitted)
|
|
537
|
+
? [{ startLine: _streamRes.firstEmitted, endLine: _streamRes.lastEmitted }]
|
|
538
|
+
: [];
|
|
539
|
+
const snapshotMeta = {
|
|
540
|
+
source: 'read_stream_range',
|
|
541
|
+
ranges: _emittedRanges,
|
|
542
|
+
rangeHashes: _rangeHashesFromRenderedReadText(out, _emittedRanges),
|
|
543
|
+
};
|
|
544
|
+
const _streamPrefixHash = _streamRes.prefixHash || await (async () => {
|
|
545
|
+
try {
|
|
546
|
+
if (st.size <= 65536) return _hashText(await readFile(fullPath, 'utf-8'));
|
|
547
|
+
const fh = await fsPromises.open(fullPath, 'r');
|
|
548
|
+
try {
|
|
549
|
+
const _buf = Buffer.allocUnsafe(65536);
|
|
550
|
+
const _readRes = await fh.read(_buf, 0, 65536, 0);
|
|
551
|
+
return _hashText(_buf.subarray(0, _readRes.bytesRead));
|
|
552
|
+
} finally { await fh.close().catch(() => {}); }
|
|
553
|
+
} catch { return ''; }
|
|
554
|
+
})();
|
|
555
|
+
_cacheSet(cacheKey, out, { paths: [fullPath], readSnapshotMeta: snapshotMeta, contentPrefixHash: _streamPrefixHash });
|
|
556
|
+
_recordReadSnapshot(fullPath, st, readStateScope, snapshotMeta);
|
|
557
|
+
return withSymbolReadNote(out, args);
|
|
558
|
+
} catch (err) {
|
|
559
|
+
return `Error: ${normalizeErrorMessage(err instanceof Error ? err.message : String(err))}`;
|
|
560
|
+
}
|
|
561
|
+
}
|
|
562
|
+
try {
|
|
563
|
+
const cachedRawBuf = _rawContentCacheGet ? _rawContentCacheGet(fullPath, st) : null;
|
|
564
|
+
const rawBuf = cachedRawBuf || await readFile(fullPath);
|
|
565
|
+
// Encoding-aware decode (fresh read AND raw-content cache hit both
|
|
566
|
+
// flow through here). For a BOM-flagged UTF-16LE file, strip the
|
|
567
|
+
// 2-byte FF FE BOM and decode as utf16le so it reverses the write
|
|
568
|
+
// tool's preservation; utf-8 stays byte-identical to before (the
|
|
569
|
+
// leading U+FEFF of a utf8-BOM file is stripped later at the
|
|
570
|
+
// line[0] charCodeAt check for display).
|
|
571
|
+
// UTF-16BE has no Node string encoding: swap byte pairs to LE (swap16
|
|
572
|
+
// needs an even length) then decode as utf16le, so a BE file reverses
|
|
573
|
+
// the same way a LE file does.
|
|
574
|
+
let content;
|
|
575
|
+
if (_readEnc.encoding === 'utf16le') {
|
|
576
|
+
content = rawBuf.subarray(_readEnc.bomLen).toString('utf16le');
|
|
577
|
+
} else if (_readEnc.encoding === 'utf16be') {
|
|
578
|
+
const _body = rawBuf.subarray(_readEnc.bomLen);
|
|
579
|
+
const _even = _body.length & ~1;
|
|
580
|
+
content = Buffer.from(_body.subarray(0, _even)).swap16().toString('utf16le');
|
|
581
|
+
} else {
|
|
582
|
+
content = rawBuf.toString('utf-8');
|
|
583
|
+
}
|
|
584
|
+
// W1 M: re-stat after the async readFile so a concurrent
|
|
585
|
+
// Write that landed during the read is detected before
|
|
586
|
+
// the cache + snapshot record stale bytes.
|
|
587
|
+
let _stPostRead;
|
|
588
|
+
let _readStableForRawCache = true;
|
|
589
|
+
if (cachedRawBuf) {
|
|
590
|
+
_stPostRead = st;
|
|
591
|
+
} else {
|
|
592
|
+
try { _stPostRead = await fsPromises.stat(fullPath); } catch { _stPostRead = st; }
|
|
593
|
+
if (_stPostRead.mtimeMs !== st.mtimeMs || _stPostRead.size !== st.size) {
|
|
594
|
+
st = _stPostRead;
|
|
595
|
+
_readStableForRawCache = false;
|
|
596
|
+
}
|
|
597
|
+
}
|
|
598
|
+
const lines = content.split(/\r?\n/);
|
|
599
|
+
if (lines.length > 0 && lines[0].charCodeAt(0) === 0xFEFF) lines[0] = lines[0].slice(1);
|
|
600
|
+
// wc-l compatible line count: a trailing newline ends a line, it
|
|
601
|
+
// does not start a new empty one. Display count must match the
|
|
602
|
+
// count emitted by mode:"count" so footer and count agree.
|
|
603
|
+
const lineCount = lines.length > 0 && lines[lines.length - 1] === '' ? lines.length - 1 : lines.length;
|
|
604
|
+
const renderEnd = (!hasRangeArgs && !wantFull)
|
|
605
|
+
? lineCount
|
|
606
|
+
: Math.min(offset + limit, lineCount);
|
|
607
|
+
const sliced = lines.slice(offset, renderEnd);
|
|
608
|
+
const rendered = sliced
|
|
609
|
+
.map((line, i) => renderReadLine(offset + i + 1, line, { truncateLongLine: !wantFull }))
|
|
610
|
+
.join('\n');
|
|
611
|
+
// Output byte cap protects against many-line slices that
|
|
612
|
+
// individually pass the file-size check but explode after
|
|
613
|
+
// line-number prefixing.
|
|
614
|
+
let out;
|
|
615
|
+
// W1 H: track lines actually rendered so the snapshot below
|
|
616
|
+
// doesn't mark byte-cap-truncated lines as editable.
|
|
617
|
+
let _renderedLineCount = sliced.length;
|
|
618
|
+
// W1 H: byte-cap truncation drops trailing lines the model never
|
|
619
|
+
// saw. Track it so isFullFileView below records partial coverage
|
|
620
|
+
// (rangeHashes over the visible window) instead of a full-file
|
|
621
|
+
// contentHash — otherwise snapshotCoversFullFile would wrongly
|
|
622
|
+
// green-light an overwrite against bytes the read never returned.
|
|
623
|
+
let _byteCapTruncated = false;
|
|
624
|
+
const smart = (!hasRangeArgs && !wantFull && typeof smartReadTruncate === 'function')
|
|
625
|
+
? smartReadTruncate(rendered, lineCount, st.size, filePath, _readBudget)
|
|
626
|
+
: null;
|
|
627
|
+
let _smartTruncated = false;
|
|
628
|
+
let _smartVisibleRanges = null;
|
|
629
|
+
if (smart?.truncated) {
|
|
630
|
+
out = smart.text;
|
|
631
|
+
_smartTruncated = true;
|
|
632
|
+
_smartVisibleRanges = Array.isArray(smart.ranges) ? smart.ranges : null;
|
|
633
|
+
_renderedLineCount = 0;
|
|
634
|
+
} else if (Buffer.byteLength(rendered, 'utf8') > READ_MAX_OUTPUT_BYTES) {
|
|
635
|
+
let lo = 0;
|
|
636
|
+
let hi = rendered.length;
|
|
637
|
+
while (lo < hi) {
|
|
638
|
+
const mid = Math.ceil((lo + hi) / 2);
|
|
639
|
+
if (Buffer.byteLength(rendered.slice(0, mid), 'utf8') <= READ_MAX_OUTPUT_BYTES) lo = mid;
|
|
640
|
+
else hi = mid - 1;
|
|
641
|
+
}
|
|
642
|
+
const slice = rendered.slice(0, lo);
|
|
643
|
+
const completeRenderedLines = Math.max(0, slice.split('\n').length - 1);
|
|
644
|
+
_renderedLineCount = completeRenderedLines;
|
|
645
|
+
_byteCapTruncated = true;
|
|
646
|
+
out = slice + `\n\n... [output truncated at ${Math.round(READ_MAX_OUTPUT_BYTES/1024)} KB] ...`;
|
|
647
|
+
} else {
|
|
648
|
+
out = rendered;
|
|
649
|
+
}
|
|
650
|
+
if (hasRangeArgs) {
|
|
651
|
+
if (sliced.length === 0 && offset >= lineCount) {
|
|
652
|
+
out = `(no lines in range; file has ${lineCount} lines)`;
|
|
653
|
+
} else if (_byteCapTruncated) {
|
|
654
|
+
const emittedStart = offset + 1;
|
|
655
|
+
const emittedEnd = offset + _renderedLineCount;
|
|
656
|
+
const capKb = Math.round(READ_MAX_OUTPUT_BYTES / 1024);
|
|
657
|
+
const footer = `[lines ${emittedStart}-${emittedEnd} of ${lineCount}; output truncated at ${capKb} KB${emittedEnd < lineCount ? `; pass offset:${emittedEnd} to continue` : ''}]`;
|
|
658
|
+
out += `${out ? '\n' : ''}${footer}`;
|
|
659
|
+
} else if (Buffer.byteLength(rendered, 'utf8') <= READ_MAX_OUTPUT_BYTES) {
|
|
660
|
+
const emittedStart = offset + 1;
|
|
661
|
+
const emittedEnd = offset + sliced.length;
|
|
662
|
+
const footer = `[lines ${emittedStart}-${emittedEnd} of ${lineCount}${emittedEnd < lineCount ? `; pass offset:${emittedEnd} to continue` : ''}]`;
|
|
663
|
+
out += `${out ? '\n' : ''}${footer}`;
|
|
664
|
+
}
|
|
665
|
+
}
|
|
666
|
+
// Smart cap. Only engages when the caller asked for
|
|
667
|
+
// the default read (no offset/limit, full:false) AND the file
|
|
668
|
+
// is over the line/byte threshold. Explicit ranges always see
|
|
669
|
+
// byte-exact output.
|
|
670
|
+
// W1 H: smart-middle elision drops lines the model never
|
|
671
|
+
// saw — don't claim full-file coverage when it triggered.
|
|
672
|
+
if (!hasRangeArgs && !wantFull) {
|
|
673
|
+
if (!_smartTruncated && content.length > 0) {
|
|
674
|
+
out = appendReadContextAdvisory(out, { filePath, lineCount, bytes: st.size });
|
|
675
|
+
}
|
|
676
|
+
}
|
|
677
|
+
// CC parity: empty file gets a system-reminder instead of
|
|
678
|
+
// a bare `1│` line. The reminder makes the empty-state
|
|
679
|
+
// explicit so the agent doesn't assume content was elided.
|
|
680
|
+
if (content.length === 0) {
|
|
681
|
+
// W1 M: filename can contain `<` or `</system-reminder>`
|
|
682
|
+
// sequences; XML-escape before interpolation so a hostile
|
|
683
|
+
// path can't terminate the envelope and inject markup.
|
|
684
|
+
const _safePath = normalizeOutputPath(filePath)
|
|
685
|
+
.replace(/&/g, '&')
|
|
686
|
+
.replace(/</g, '<')
|
|
687
|
+
.replace(/>/g, '>');
|
|
688
|
+
out = `<system-reminder>File exists but has empty contents: ${_safePath}</system-reminder>`;
|
|
689
|
+
}
|
|
690
|
+
const isFullFileView = offset === 0 && offset + limit >= lineCount && !_smartTruncated && !_byteCapTruncated;
|
|
691
|
+
const _visibleRanges = _smartTruncated && _smartVisibleRanges
|
|
692
|
+
? _smartVisibleRanges
|
|
693
|
+
: (_renderedLineCount > 0
|
|
694
|
+
? [{ startLine: offset + 1, endLine: Math.min(lineCount, offset + _renderedLineCount) }]
|
|
695
|
+
: []);
|
|
696
|
+
const _rangeHashes = !isFullFileView ? _rangeHashesForReadRanges(content, _visibleRanges) : [];
|
|
697
|
+
// Hash the full body once when the whole file is in view: both the
|
|
698
|
+
// snapshot contentHash and (for ≤64KiB) the race-guard prefix hash
|
|
699
|
+
// are SHA-256 over the identical `content`, so computing it twice
|
|
700
|
+
// here was pure duplicate CPU on the common small full-file read.
|
|
701
|
+
const _fullContentHash = isFullFileView ? _hashText(content) : '';
|
|
702
|
+
const snapshotMeta = {
|
|
703
|
+
source: 'read',
|
|
704
|
+
fileLineCount: lineCount,
|
|
705
|
+
ranges: isFullFileView
|
|
706
|
+
? [{ startLine: 1, endLine: Infinity }]
|
|
707
|
+
: _visibleRanges,
|
|
708
|
+
...(isFullFileView ? { contentHash: _fullContentHash } : {}),
|
|
709
|
+
...(_rangeHashes.length > 0 ? { rangeHashes: _rangeHashes } : {}),
|
|
710
|
+
};
|
|
711
|
+
// Race-guard prefix hash. content is the full file body here
|
|
712
|
+
// (regular branch, st.size <= READ_MAX_SIZE_BYTES). For files
|
|
713
|
+
// ≤64KiB the prefix hash equals the full-content hash, so reuse
|
|
714
|
+
// _fullContentHash when it was computed; otherwise hash the 64KiB
|
|
715
|
+
// head (sufficient to detect a same-mtime / same-size rewrite of
|
|
716
|
+
// any bytes within the first 64KiB — the common case).
|
|
717
|
+
const _regPrefixHash = (content.length <= 65536 && _fullContentHash)
|
|
718
|
+
? _fullContentHash
|
|
719
|
+
: _hashText(content.length <= 65536 ? content : content.slice(0, 65536));
|
|
720
|
+
_cacheSet(cacheKey, out, { paths: [fullPath], readSnapshotMeta: snapshotMeta, contentPrefixHash: _regPrefixHash });
|
|
721
|
+
if (_readStableForRawCache) _rawContentCacheSet(fullPath, st, rawBuf);
|
|
722
|
+
_recordReadSnapshot(fullPath, st, readStateScope, snapshotMeta);
|
|
723
|
+
return withSymbolReadNote(out, args);
|
|
724
|
+
}
|
|
725
|
+
catch (err) {
|
|
726
|
+
return `Error: ${normalizeErrorMessage(err instanceof Error ? err.message : String(err))}`;
|
|
727
|
+
}
|
|
728
|
+
}
|