@pugi/cli 0.1.0-beta.4 → 0.1.0-beta.41
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/THIRD_PARTY_NOTICES.md +40 -0
- package/assets/pugi-mascot.ansi +15 -25
- package/bin/run.js +33 -1
- package/dist/commands/jobs-watch.js +201 -0
- package/dist/commands/jobs.js +15 -0
- package/dist/commands/smoke.js +133 -0
- package/dist/core/agent-progress/cleanup.js +134 -0
- package/dist/core/agent-progress/schema.js +144 -0
- package/dist/core/agent-progress/writer.js +101 -0
- package/dist/core/artifact-chain/dispatcher.js +148 -0
- package/dist/core/artifact-chain/exporter.js +164 -0
- package/dist/core/artifact-chain/state.js +243 -0
- package/dist/core/artifact-chain/steps.js +169 -0
- package/dist/core/auth/ensure-authenticated.js +129 -0
- package/dist/core/auth/env-provider.js +238 -0
- package/dist/core/auto-update/channels.js +122 -0
- package/dist/core/auto-update/checker.js +241 -0
- package/dist/core/auto-update/state.js +235 -0
- package/dist/core/bare-mode/index.js +107 -0
- package/dist/core/bash-classifier.js +108 -1
- package/dist/core/checkpoint/resumer.js +149 -0
- package/dist/core/checkpoint/rewinder.js +291 -0
- package/dist/core/codegraph/decision-store.js +248 -0
- package/dist/core/codegraph/detect-repo.js +459 -0
- package/dist/core/codegraph/install.js +134 -0
- package/dist/core/codegraph/offer-hook.js +220 -0
- package/dist/core/compact/auto-trigger.js +96 -0
- package/dist/core/compact/buffer-rewriter.js +115 -0
- package/dist/core/compact/summarizer.js +208 -0
- package/dist/core/compact/token-counter.js +108 -0
- package/dist/core/consensus/diff-capture.js +73 -0
- package/dist/core/context/index.js +7 -0
- package/dist/core/context/markdown-traverse.js +255 -0
- package/dist/core/cost/rate-card.js +129 -0
- package/dist/core/cost/tracker.js +221 -0
- package/dist/core/denial-tracking/index.js +8 -0
- package/dist/core/denial-tracking/state.js +264 -0
- package/dist/core/diagnostics/probe-runner.js +93 -0
- package/dist/core/diagnostics/probes/api.js +46 -0
- package/dist/core/diagnostics/probes/auth.js +86 -0
- package/dist/core/diagnostics/probes/bare-mode.js +42 -0
- package/dist/core/diagnostics/probes/cli-version.js +127 -0
- package/dist/core/diagnostics/probes/config.js +72 -0
- package/dist/core/diagnostics/probes/denial-tracking.js +57 -0
- package/dist/core/diagnostics/probes/disk.js +81 -0
- package/dist/core/diagnostics/probes/git.js +65 -0
- package/dist/core/diagnostics/probes/mcp.js +75 -0
- package/dist/core/diagnostics/probes/node.js +59 -0
- package/dist/core/diagnostics/probes/pnpm.js +36 -0
- package/dist/core/diagnostics/probes/pugi-md.js +89 -0
- package/dist/core/diagnostics/probes/session.js +74 -0
- package/dist/core/diagnostics/probes/status-snapshot.js +488 -0
- package/dist/core/diagnostics/probes/workspace.js +63 -0
- package/dist/core/diagnostics/types.js +70 -0
- package/dist/core/dispatch/cache-cleanup.js +197 -0
- package/dist/core/dispatch/cache-handoff.js +295 -0
- package/dist/core/edits/dispatch.js +218 -2
- package/dist/core/edits/journal.js +199 -0
- package/dist/core/edits/layer-d-ast.js +557 -14
- package/dist/core/edits/verify-hook.js +273 -0
- package/dist/core/edits/worktree.js +322 -0
- package/dist/core/engine/anvil-client.js +115 -5
- package/dist/core/engine/budgets.js +98 -0
- package/dist/core/engine/context-prefix.js +155 -0
- package/dist/core/engine/intent.js +260 -0
- package/dist/core/engine/native-pugi.js +860 -211
- package/dist/core/engine/prompts.js +88 -2
- package/dist/core/engine/strip-internal-fields.js +124 -0
- package/dist/core/engine/tool-bridge.js +1045 -36
- package/dist/core/feedback/queue.js +177 -0
- package/dist/core/feedback/submitter.js +145 -0
- package/dist/core/file-cache.js +113 -1
- package/dist/core/hooks/events.js +44 -0
- package/dist/core/hooks/index.js +15 -0
- package/dist/core/hooks/registry.js +213 -0
- package/dist/core/hooks/runner.js +236 -0
- package/dist/core/hooks/v2/event-emitter.js +115 -0
- package/dist/core/hooks/v2/executor.js +282 -0
- package/dist/core/hooks/v2/index.js +25 -0
- package/dist/core/hooks/v2/lifecycle.js +104 -0
- package/dist/core/hooks/v2/loader.js +216 -0
- package/dist/core/hooks/v2/matcher.js +125 -0
- package/dist/core/hooks/v2/trust.js +143 -0
- package/dist/core/hooks/v2/types.js +86 -0
- package/dist/core/lsp/cache.js +105 -0
- package/dist/core/lsp/client.js +776 -0
- package/dist/core/lsp/language-detect.js +66 -0
- package/dist/core/lsp/post-edit-diagnostics.js +171 -0
- package/dist/core/mcp/client.js +75 -6
- package/dist/core/mcp/http-server.js +553 -0
- package/dist/core/mcp/orchestrator-tools.js +662 -0
- package/dist/core/mcp/permission.js +190 -0
- package/dist/core/mcp/registry.js +24 -2
- package/dist/core/mcp/server-tools.js +219 -0
- package/dist/core/mcp/server.js +397 -0
- package/dist/core/memory/dual-write.js +416 -0
- package/dist/core/memory/phase1-kinds.js +20 -0
- package/dist/core/memory-sync/queue.js +158 -0
- package/dist/core/onboarding/ensure-initialized.js +133 -0
- package/dist/core/onboarding/marker.js +111 -0
- package/dist/core/onboarding/telemetry-state.js +108 -0
- package/dist/core/output-style/presets.js +176 -0
- package/dist/core/output-style/state.js +185 -0
- package/dist/core/permissions/auto-classifier.js +124 -0
- package/dist/core/permissions/circuit-breaker.js +83 -0
- package/dist/core/permissions/gate.js +278 -0
- package/dist/core/permissions/index.js +20 -0
- package/dist/core/permissions/mode.js +174 -0
- package/dist/core/permissions/state.js +241 -0
- package/dist/core/permissions/tool-class.js +93 -0
- package/dist/core/prd-check/parser.js +215 -0
- package/dist/core/prd-check/reporter.js +127 -0
- package/dist/core/prd-check/session-review.js +557 -0
- package/dist/core/prd-check/verifiers.js +223 -0
- package/dist/core/pugi-md/context-injector.js +76 -0
- package/dist/core/pugi-md/walk-up.js +207 -0
- package/dist/core/release-notes/parser.js +241 -0
- package/dist/core/release-notes/state.js +116 -0
- package/dist/core/repl/history.js +11 -1
- package/dist/core/repl/model-pricing.js +135 -0
- package/dist/core/repl/session.js +1899 -38
- package/dist/core/repl/slash-commands.js +406 -21
- package/dist/core/repl/store/session-store.js +31 -2
- package/dist/core/repl/workspace-context.js +22 -0
- package/dist/core/repo-map/build.js +125 -0
- package/dist/core/repo-map/cache.js +185 -0
- package/dist/core/repo-map/extractor.js +254 -0
- package/dist/core/repo-map/formatter.js +145 -0
- package/dist/core/repo-map/scanner.js +211 -0
- package/dist/core/retry-budget/budget.js +284 -0
- package/dist/core/retry-budget/index.js +5 -0
- package/dist/core/session.js +92 -0
- package/dist/core/settings.js +80 -0
- package/dist/core/share/formatter.js +271 -0
- package/dist/core/share/redactor.js +221 -0
- package/dist/core/share/uploader.js +267 -0
- package/dist/core/skills/defaults.js +457 -0
- package/dist/core/smoke/headless-driver.js +174 -0
- package/dist/core/smoke/orchestrator.js +194 -0
- package/dist/core/smoke/runner.js +238 -0
- package/dist/core/smoke/scenario-parser.js +316 -0
- package/dist/core/subagents/dispatcher-real.js +600 -0
- package/dist/core/subagents/dispatcher.js +113 -24
- package/dist/core/subagents/index.js +18 -5
- package/dist/core/subagents/isolation-matrix.js +213 -0
- package/dist/core/subagents/spawn.js +19 -4
- package/dist/core/telemetry/emitter.js +229 -0
- package/dist/core/telemetry/queue.js +251 -0
- package/dist/core/theme/context.js +91 -0
- package/dist/core/theme/presets.js +228 -0
- package/dist/core/theme/state.js +181 -0
- package/dist/core/todos/invariant.js +10 -0
- package/dist/core/todos/state.js +177 -0
- package/dist/core/transport/version-interceptor.js +166 -0
- package/dist/core/vim/keymap.js +288 -0
- package/dist/core/vim/state.js +92 -0
- package/dist/index.js +28 -0
- package/dist/runtime/bootstrap.js +190 -0
- package/dist/runtime/cli.js +3073 -321
- package/dist/runtime/commands/cancel.js +231 -0
- package/dist/runtime/commands/chain.js +489 -0
- package/dist/runtime/commands/codegraph-status.js +227 -0
- package/dist/runtime/commands/compact.js +297 -0
- package/dist/runtime/commands/cost.js +199 -0
- package/dist/runtime/commands/delegate.js +242 -11
- package/dist/runtime/commands/dispatch.js +126 -0
- package/dist/runtime/commands/doctor.js +390 -0
- package/dist/runtime/commands/feedback.js +184 -0
- package/dist/runtime/commands/hooks.js +184 -0
- package/dist/runtime/commands/lsp.js +368 -0
- package/dist/runtime/commands/mcp.js +879 -0
- package/dist/runtime/commands/memory.js +508 -0
- package/dist/runtime/commands/model.js +237 -0
- package/dist/runtime/commands/onboarding.js +275 -0
- package/dist/runtime/commands/patch.js +128 -0
- package/dist/runtime/commands/permissions.js +112 -0
- package/dist/runtime/commands/plan.js +143 -0
- package/dist/runtime/commands/prd-check.js +285 -0
- package/dist/runtime/commands/redo-blob-store.js +92 -0
- package/dist/runtime/commands/redo.js +361 -0
- package/dist/runtime/commands/release-notes.js +229 -0
- package/dist/runtime/commands/repo-map.js +95 -0
- package/dist/runtime/commands/report.js +299 -0
- package/dist/runtime/commands/resume.js +118 -0
- package/dist/runtime/commands/review-consensus.js +17 -2
- package/dist/runtime/commands/rewind.js +333 -0
- package/dist/runtime/commands/sessions.js +163 -0
- package/dist/runtime/commands/share.js +316 -0
- package/dist/runtime/commands/status.js +186 -0
- package/dist/runtime/commands/stickers.js +82 -0
- package/dist/runtime/commands/style.js +194 -0
- package/dist/runtime/commands/theme.js +196 -0
- package/dist/runtime/commands/undo.js +32 -0
- package/dist/runtime/commands/update.js +289 -0
- package/dist/runtime/commands/vim.js +140 -0
- package/dist/runtime/commands/worktree.js +177 -0
- package/dist/runtime/headless-repl.js +195 -0
- package/dist/runtime/headless.js +543 -0
- package/dist/runtime/load-hooks-or-exit.js +71 -0
- package/dist/runtime/plan-decompose.js +531 -0
- package/dist/runtime/version.js +65 -0
- package/dist/tools/agent-tool.js +229 -0
- package/dist/tools/apply-patch.js +556 -0
- package/dist/tools/ask-user-question.js +213 -0
- package/dist/tools/ask-user.js +115 -0
- package/dist/tools/file-tools.js +85 -14
- package/dist/tools/lsp-tools.js +189 -0
- package/dist/tools/mcp-tool.js +260 -0
- package/dist/tools/multi-edit.js +361 -0
- package/dist/tools/powershell.js +156 -0
- package/dist/tools/registry.js +51 -0
- package/dist/tools/skill-tool.js +96 -0
- package/dist/tools/tasks.js +208 -0
- package/dist/tools/todo-write.js +184 -0
- package/dist/tools/web-fetch.js +147 -2
- package/dist/tools/web-search.js +458 -0
- package/dist/tui/agent-progress-card.js +111 -0
- package/dist/tui/agent-tree.js +10 -0
- package/dist/tui/ask-modal.js +2 -2
- package/dist/tui/ask-user-question-prompt.js +192 -0
- package/dist/tui/compact-banner.js +81 -0
- package/dist/tui/conversation-pane.js +82 -8
- package/dist/tui/cost-table.js +111 -0
- package/dist/tui/doctor-table.js +46 -0
- package/dist/tui/feedback-prompt.js +156 -0
- package/dist/tui/input-box.js +69 -2
- package/dist/tui/markdown-render.js +4 -4
- package/dist/tui/onboarding-wizard.js +240 -0
- package/dist/tui/permissions-picker.js +86 -0
- package/dist/tui/render.js +35 -0
- package/dist/tui/repl-render.js +303 -13
- package/dist/tui/repl-splash.js +2 -2
- package/dist/tui/repl.js +72 -14
- package/dist/tui/splash.js +1 -1
- package/dist/tui/status-bar.js +94 -16
- package/dist/tui/status-table.js +7 -0
- package/dist/tui/stickers-art.js +136 -0
- package/dist/tui/style-table.js +28 -0
- package/dist/tui/theme-table.js +29 -0
- package/dist/tui/tool-stream-pane.js +52 -3
- package/dist/tui/update-banner.js +20 -2
- package/dist/tui/vim-input.js +267 -0
- package/docs/examples/codegraph.mcp.json +10 -0
- package/package.json +12 -6
- package/test/scenarios/codegen-create-file.scenario.txt +13 -0
- package/test/scenarios/compact-force.scenario.txt +11 -0
- package/test/scenarios/identity.scenario.txt +11 -0
- package/test/scenarios/persona-handoff.scenario.txt +11 -0
- package/test/scenarios/walkback.scenario.txt +12 -0
- package/dist/core/engine/compaction-hook.js +0 -154
|
@@ -0,0 +1,108 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Approximate token counter for the `/compact` auto-trigger gate.
|
|
3
|
+
*
|
|
4
|
+
* Pugi does not bundle tiktoken — adding a 3 MB native module for a
|
|
5
|
+
* single heuristic check after every turn is the wrong trade. We instead
|
|
6
|
+
* use the OpenAI rule-of-thumb that 1 token ≈ 4 characters of English
|
|
7
|
+
* (≈ ¾ of a word). For mixed-language conversations the approximation
|
|
8
|
+
* skews high by 10-20% which is the safe direction — the auto-compact
|
|
9
|
+
* threshold trips slightly EARLY, never LATE. A late trigger would
|
|
10
|
+
* exceed the model's actual context window and crash the next turn.
|
|
11
|
+
*
|
|
12
|
+
* Per-model context windows are exported from `MODEL_CONTEXT_WINDOW` so
|
|
13
|
+
* the caller can resolve the budget from the active model slug without
|
|
14
|
+
* round-tripping to the server. New models added in Anvil should grow
|
|
15
|
+
* this table in lockstep; the fall-back is the conservative 32k window.
|
|
16
|
+
*
|
|
17
|
+
* Override hook: when `PUGI_TOKEN_COUNTER_OVERRIDE` is set the function
|
|
18
|
+
* parses it as a JSON object `{"text": <n>}` (number of tokens to claim
|
|
19
|
+
* per char). Used only by the integration spec — never by production.
|
|
20
|
+
*/
|
|
21
|
+
/** Default chars-per-token ratio for the OpenAI rule-of-thumb. */
|
|
22
|
+
const DEFAULT_CHARS_PER_TOKEN = 4;
|
|
23
|
+
/**
|
|
24
|
+
* Conservative fallback window when the model slug is unknown. 32k is
|
|
25
|
+
* the smallest window any current Anvil-served model exposes; using it
|
|
26
|
+
* as a fall-back guarantees we never overestimate budget and skip a
|
|
27
|
+
* compaction that should have fired.
|
|
28
|
+
*/
|
|
29
|
+
const FALLBACK_WINDOW = 32_000;
|
|
30
|
+
/**
|
|
31
|
+
* Known context windows for models Anvil exposes today. Keep in sync
|
|
32
|
+
* with `apps/admin-api/src/pugi/model-registry.ts` — when a new model
|
|
33
|
+
* lands there, add it here. The table is intentionally narrow: only
|
|
34
|
+
* models we have actually validated.
|
|
35
|
+
*/
|
|
36
|
+
export const MODEL_CONTEXT_WINDOW = Object.freeze({
|
|
37
|
+
'sonnet-4.6': 200_000,
|
|
38
|
+
'sonnet-4.5': 200_000,
|
|
39
|
+
'opus-4.7': 1_000_000,
|
|
40
|
+
'opus-4.6': 200_000,
|
|
41
|
+
'haiku-4.5': 200_000,
|
|
42
|
+
'deepseek-chat-v3.1': 128_000,
|
|
43
|
+
'gpt-5': 200_000,
|
|
44
|
+
'gemini-2.5-pro': 1_000_000,
|
|
45
|
+
});
|
|
46
|
+
/**
|
|
47
|
+
* Estimate the token count of a single string. Returns a positive
|
|
48
|
+
* integer for non-empty input and zero for empty input. The function is
|
|
49
|
+
* pure — same input always yields the same output.
|
|
50
|
+
*
|
|
51
|
+
* The approximation is `ceil(byteLength / chars-per-token)`. We use
|
|
52
|
+
* `Buffer.byteLength` so multi-byte UTF-8 sequences count proportionally
|
|
53
|
+
* to their on-the-wire size, not their char count — this matches the
|
|
54
|
+
* tokenizer's behaviour on CJK / cyrillic / emoji where one char often
|
|
55
|
+
* eats 3-4 tokens.
|
|
56
|
+
*/
|
|
57
|
+
export function estimateTokens(text) {
|
|
58
|
+
if (text.length === 0)
|
|
59
|
+
return 0;
|
|
60
|
+
const ratio = readCharsPerTokenOverride() ?? DEFAULT_CHARS_PER_TOKEN;
|
|
61
|
+
const bytes = Buffer.byteLength(text, 'utf8');
|
|
62
|
+
return Math.max(1, Math.ceil(bytes / ratio));
|
|
63
|
+
}
|
|
64
|
+
/**
|
|
65
|
+
* Resolve the context window in tokens for the given model slug. Falls
|
|
66
|
+
* back to the conservative 32k window when the slug is unknown.
|
|
67
|
+
*/
|
|
68
|
+
export function contextWindowForModel(model) {
|
|
69
|
+
if (!model)
|
|
70
|
+
return FALLBACK_WINDOW;
|
|
71
|
+
const known = MODEL_CONTEXT_WINDOW[model];
|
|
72
|
+
return known ?? FALLBACK_WINDOW;
|
|
73
|
+
}
|
|
74
|
+
/**
|
|
75
|
+
* Sum the token estimates of an arbitrary list of strings. Convenience
|
|
76
|
+
* for the auto-trigger which has to count across N transcript turns.
|
|
77
|
+
*/
|
|
78
|
+
export function estimateTokensInMany(parts) {
|
|
79
|
+
let total = 0;
|
|
80
|
+
for (const part of parts) {
|
|
81
|
+
total += estimateTokens(part);
|
|
82
|
+
}
|
|
83
|
+
return total;
|
|
84
|
+
}
|
|
85
|
+
/**
|
|
86
|
+
* Read the test override env. Returns the parsed chars-per-token ratio
|
|
87
|
+
* when set, or undefined when absent / malformed. Never throws.
|
|
88
|
+
*/
|
|
89
|
+
function readCharsPerTokenOverride() {
|
|
90
|
+
const raw = process.env['PUGI_TOKEN_COUNTER_OVERRIDE'];
|
|
91
|
+
if (!raw)
|
|
92
|
+
return undefined;
|
|
93
|
+
try {
|
|
94
|
+
const parsed = JSON.parse(raw);
|
|
95
|
+
if (typeof parsed === 'object'
|
|
96
|
+
&& parsed !== null
|
|
97
|
+
&& typeof parsed.charsPerToken === 'number') {
|
|
98
|
+
const ratio = parsed.charsPerToken;
|
|
99
|
+
if (Number.isFinite(ratio) && ratio > 0)
|
|
100
|
+
return ratio;
|
|
101
|
+
}
|
|
102
|
+
}
|
|
103
|
+
catch {
|
|
104
|
+
/* malformed env, fall through */
|
|
105
|
+
}
|
|
106
|
+
return undefined;
|
|
107
|
+
}
|
|
108
|
+
//# sourceMappingURL=token-counter.js.map
|
|
@@ -6,6 +6,10 @@
|
|
|
6
6
|
*
|
|
7
7
|
* 1. `--pr <number>` — uses `gh pr diff <num>` (gh CLI required).
|
|
8
8
|
* 2. `--commit <sha>` — diff of that commit vs its first parent.
|
|
9
|
+
* When `--base <ref>` is ALSO provided, the
|
|
10
|
+
* diff is the range `<base>..<commit>` instead
|
|
11
|
+
* (mirrors `git diff base..commit` — covers the
|
|
12
|
+
* full PR-style payload, not just the tip).
|
|
9
13
|
* 3. `--branch <name>` — diff of HEAD vs `origin/<name>` merge-base.
|
|
10
14
|
* 4. (default) — diff of HEAD vs `origin/main` merge-base
|
|
11
15
|
* covering BOTH committed-since-base AND
|
|
@@ -95,6 +99,16 @@ export function captureDiff(spec) {
|
|
|
95
99
|
return captureFromPr(cwd, spec.pr);
|
|
96
100
|
}
|
|
97
101
|
if (typeof spec.commit === 'string' && spec.commit.length > 0) {
|
|
102
|
+
// When `--base` is supplied alongside `--commit`, callers want the
|
|
103
|
+
// full PR-style range diff (`base..commit`), not just the tip
|
|
104
|
+
// commit's parent diff. This matches the convention used by
|
|
105
|
+
// `git diff <base>..<commit>` everywhere else in the toolchain and
|
|
106
|
+
// is the verified-correct mode for reviewing a PR head ref. Without
|
|
107
|
+
// this branch, `--base` was silently ignored when `--commit` was
|
|
108
|
+
// present — see feedback_pugi_review_use_range_diff_not_worktree.
|
|
109
|
+
if (typeof spec.baseRef === 'string' && spec.baseRef.length > 0) {
|
|
110
|
+
return captureFromRange(cwd, spec.baseRef, spec.commit);
|
|
111
|
+
}
|
|
98
112
|
return captureFromCommit(cwd, spec.commit);
|
|
99
113
|
}
|
|
100
114
|
if (typeof spec.branch === 'string' && spec.branch.length > 0) {
|
|
@@ -192,6 +206,65 @@ function captureFromCommit(cwd, commit) {
|
|
|
192
206
|
},
|
|
193
207
|
};
|
|
194
208
|
}
|
|
209
|
+
/**
|
|
210
|
+
* Range capture for `--commit <X> --base <Y>` — diff equivalent to
|
|
211
|
+
* `git diff <base>..<commit>`. Used when the operator names BOTH endpoints
|
|
212
|
+
* (typical PR review against a remote head SHA).
|
|
213
|
+
*
|
|
214
|
+
* Critical: this MUST be a pure read-only range diff against named refs.
|
|
215
|
+
* The previous behavior fell through to `captureFromCommit` which only
|
|
216
|
+
* showed the tip commit (`commit~1..commit`) — fine for single-commit
|
|
217
|
+
* review, wrong for multi-commit PRs. Worse, a stale fallback path was
|
|
218
|
+
* sending the working tree diff (`git diff` with no args), which caused
|
|
219
|
+
* every review on 2026-05-27 to surface identical noise from uncommitted
|
|
220
|
+
* `.gitignore` edits instead of the actual PR contents.
|
|
221
|
+
*
|
|
222
|
+
* Working tree integrity: only `git diff <ref>..<ref>` and metadata
|
|
223
|
+
* `log` / `rev-parse` / `name-rev` are used — none of these touch the
|
|
224
|
+
* index, working tree, or HEAD.
|
|
225
|
+
*/
|
|
226
|
+
function captureFromRange(cwd, baseRef, commit) {
|
|
227
|
+
// Resolve both endpoints up front so an unknown ref errors with a
|
|
228
|
+
// clear message before the diff invocation. `rev-parse` is read-only.
|
|
229
|
+
const fullCommit = safeExec(cwd, 'git', ['rev-parse', commit]).trim();
|
|
230
|
+
if (!fullCommit)
|
|
231
|
+
throw new Error(`Unknown commit ref: ${commit}`);
|
|
232
|
+
// Resolve the base: accept already-qualified refs (`origin/main`,
|
|
233
|
+
// `refs/heads/foo`) and bare branch names. If the bare name isn't
|
|
234
|
+
// locally resolvable, retry against `origin/<name>` — the common
|
|
235
|
+
// CI shape where local main is absent but the remote tracking ref is.
|
|
236
|
+
let resolvedBase = safeExecOptional(cwd, 'git', ['rev-parse', baseRef]).trim();
|
|
237
|
+
let effectiveBase = baseRef;
|
|
238
|
+
if (!resolvedBase && !baseRef.includes('/')) {
|
|
239
|
+
const remoteBase = `origin/${baseRef}`;
|
|
240
|
+
resolvedBase = safeExecOptional(cwd, 'git', ['rev-parse', remoteBase]).trim();
|
|
241
|
+
if (resolvedBase)
|
|
242
|
+
effectiveBase = remoteBase;
|
|
243
|
+
}
|
|
244
|
+
if (!resolvedBase)
|
|
245
|
+
throw new Error(`Unknown base ref: ${baseRef}`);
|
|
246
|
+
const diff = safeExec(cwd, 'git', [
|
|
247
|
+
'diff',
|
|
248
|
+
`${resolvedBase}..${fullCommit}`,
|
|
249
|
+
'--',
|
|
250
|
+
'.',
|
|
251
|
+
...PROTECTED_PATHSPEC_EXCLUDES,
|
|
252
|
+
]);
|
|
253
|
+
const cappedDiff = capDiff(diff);
|
|
254
|
+
const subject = safeExec(cwd, 'git', ['log', '-1', '--pretty=%s', fullCommit]).trim();
|
|
255
|
+
const branch = safeExec(cwd, 'git', ['name-rev', '--name-only', fullCommit]).trim() || 'detached';
|
|
256
|
+
const stats = computeStats(cappedDiff);
|
|
257
|
+
return {
|
|
258
|
+
diff: cappedDiff,
|
|
259
|
+
context: {
|
|
260
|
+
branch,
|
|
261
|
+
commit: shortSha(fullCommit),
|
|
262
|
+
title: subject || `commit ${shortSha(fullCommit)}`,
|
|
263
|
+
ref: `range:${effectiveBase}..${shortSha(fullCommit)}`,
|
|
264
|
+
stats,
|
|
265
|
+
},
|
|
266
|
+
};
|
|
267
|
+
}
|
|
195
268
|
function captureFromBranch(cwd, branch, baseRef) {
|
|
196
269
|
const remoteRef = branch.includes('/') ? branch : `origin/${branch}`;
|
|
197
270
|
const mergeBase = safeExec(cwd, 'git', ['merge-base', baseRef, remoteRef]).trim();
|
|
@@ -18,4 +18,11 @@ export { BASELINE_IGNORE_PATTERNS, SECRET_IGNORE_PATTERNS, globalPugiIgnorePath,
|
|
|
18
18
|
export { COLLAPSE_DIR_ENTRIES, MAX_README_LINES, MAX_SKELETON_BYTES, MAX_TREE_DEPTH, MAX_WALK_NODES, TOP_LANGUAGES, buildRepoSkeleton, detectPackageManager, languageForExtension, readGitBranch, readPackageJson, readReadme, renderSkeleton, topLanguages, } from './repo-skeleton.js';
|
|
19
19
|
export { DEFAULT_WORKING_SET_CAPACITY, WorkingSet, } from './working-set.js';
|
|
20
20
|
export { MAX_WATCHED_PATHS, PugiWatcher, THROTTLE_WINDOW_MS, } from './watcher.js';
|
|
21
|
+
/**
|
|
22
|
+
* β5a R4+P5 — per-directory PUGI.md / AGENTS.md / CLAUDE.md / GEMINI.md
|
|
23
|
+
* traverse-up. Loads agent-context markdown at every directory between
|
|
24
|
+
* `cwd` and `workspaceRoot` (workspace root file is owned by
|
|
25
|
+
* `loadMarkdownContext` in `markdown-loader.ts` — no double-load).
|
|
26
|
+
*/
|
|
27
|
+
export { MAX_TRAVERSE_BYTES, MAX_TRAVERSE_PER_FILE_BYTES, MAX_TRAVERSE_DEPTH, TRAVERSE_SOURCES, loadTraversedMarkdown, } from './markdown-traverse.js';
|
|
21
28
|
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1,255 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Per-directory PUGI.md / AGENTS.md / CLAUDE.md / GEMINI.md traverse-up
|
|
3
|
+
* loader — β5a R4+P5.
|
|
4
|
+
*
|
|
5
|
+
* Claude Code, Codex CLI, and Gemini CLI all support a "walk up from
|
|
6
|
+
* cwd to the workspace root, pick up agent-context markdown at every
|
|
7
|
+
* level" pattern. Without this, a `pugi explain` invoked from
|
|
8
|
+
* `apps/admin-api/` cannot see project-local conventions encoded in
|
|
9
|
+
* `apps/admin-api/PUGI.md` (or the cross-CLI shim files) — the
|
|
10
|
+
* existing `loadMarkdownContext` only reads files at `workspaceRoot`.
|
|
11
|
+
*
|
|
12
|
+
* The β5a quality gate (≥80% win-rate vs Claude Code per CEO 2026-05-26)
|
|
13
|
+
* surfaces this gap repeatedly: monorepo-local conventions (NestJS
|
|
14
|
+
* controller style, Prisma migration name format, cabinet brand voice
|
|
15
|
+
* gates) live in per-app context files, and Pugi was blind to them
|
|
16
|
+
* pre-β5a.
|
|
17
|
+
*
|
|
18
|
+
* Contract:
|
|
19
|
+
*
|
|
20
|
+
* - Walk from `cwd` upward until we reach `workspaceRoot` OR cross
|
|
21
|
+
* the filesystem boundary. The workspace root file itself is
|
|
22
|
+
* loaded by the legacy `loadMarkdownContext` so we do NOT include
|
|
23
|
+
* it here (no double-load, no double-budget-charge).
|
|
24
|
+
*
|
|
25
|
+
* - At each intermediate directory, look for the four canonical
|
|
26
|
+
* filenames: `PUGI.md` (native), `AGENTS.md` (cross-CLI shim),
|
|
27
|
+
* `CLAUDE.md` (Claude Code compat), `GEMINI.md` (Gemini CLI compat).
|
|
28
|
+
*
|
|
29
|
+
* - HTML comments stripped, identical to the legacy loader.
|
|
30
|
+
*
|
|
31
|
+
* - `@import` expansion is intentionally NOT performed here — the
|
|
32
|
+
* per-dir surface is "drop a small file with the local
|
|
33
|
+
* conventions"; deep @import chains belong at workspace root.
|
|
34
|
+
* Keeping this surface flat means the per-dir budget cannot be
|
|
35
|
+
* blown out by a runaway @import in an unrelated subtree.
|
|
36
|
+
*
|
|
37
|
+
* - Aggregate budget: `MAX_TRAVERSE_BYTES` across ALL files found
|
|
38
|
+
* in the walk. When exhausted, remaining files are skipped with
|
|
39
|
+
* a `budget_exhausted` warning. Default 32 KB — half the
|
|
40
|
+
* workspace-root budget, because per-dir files are meant to be
|
|
41
|
+
* terse delta conventions, not full project briefs.
|
|
42
|
+
*
|
|
43
|
+
* - The walk is bounded: `MAX_TRAVERSE_DEPTH` levels above
|
|
44
|
+
* workspaceRoot are NEVER traversed (defense against being
|
|
45
|
+
* invoked from a malicious cwd outside the workspace; in
|
|
46
|
+
* practice cwd is always inside workspaceRoot but the symlink
|
|
47
|
+
* case demands belt + suspenders).
|
|
48
|
+
*
|
|
49
|
+
* - Order returned: shallowest-first (workspace root would be
|
|
50
|
+
* first if included, then each level closer to cwd). Closest-
|
|
51
|
+
* to-cwd files are the most specific and the context builder
|
|
52
|
+
* emits them LAST so the model treats them as the highest-
|
|
53
|
+
* priority conventions.
|
|
54
|
+
*
|
|
55
|
+
* This module is pure: no logging, no network, no fs writes. Filesystem
|
|
56
|
+
* reads only.
|
|
57
|
+
*/
|
|
58
|
+
import { existsSync, readFileSync, realpathSync, statSync } from 'node:fs';
|
|
59
|
+
import { dirname, isAbsolute, relative, resolve, sep } from 'node:path';
|
|
60
|
+
import { stripHtmlComments } from './markdown-loader.js';
|
|
61
|
+
/**
|
|
62
|
+
* Per-traverse total byte cap. Half the workspace-root budget — these
|
|
63
|
+
* files are meant to be terse "in this subdir, do X". 32 KB still fits
|
|
64
|
+
* ~8000 words of guidance.
|
|
65
|
+
*/
|
|
66
|
+
export const MAX_TRAVERSE_BYTES = 32 * 1024;
|
|
67
|
+
/**
|
|
68
|
+
* Per-file byte cap. A single per-dir file should never dominate; the
|
|
69
|
+
* 8 KB cap keeps any one level honest. Files larger than this are
|
|
70
|
+
* loaded up to the cap and flagged truncated.
|
|
71
|
+
*/
|
|
72
|
+
export const MAX_TRAVERSE_PER_FILE_BYTES = 8 * 1024;
|
|
73
|
+
/**
|
|
74
|
+
* Maximum number of parent directories above workspaceRoot we will
|
|
75
|
+
* traverse. Zero in normal operation — cwd is always inside the
|
|
76
|
+
* workspace; the cap exists so a misconfigured invocation never
|
|
77
|
+
* walks the whole filesystem looking for AGENTS.md.
|
|
78
|
+
*/
|
|
79
|
+
export const MAX_TRAVERSE_DEPTH = 0;
|
|
80
|
+
/**
|
|
81
|
+
* Filenames we look for at every level of the walk. The order here
|
|
82
|
+
* also defines the per-directory load order: PUGI.md first (highest
|
|
83
|
+
* trust), then cross-CLI compat shims. When the same directory has
|
|
84
|
+
* multiple files (e.g. both PUGI.md AND CLAUDE.md), all are loaded
|
|
85
|
+
* — operators sometimes keep both during a tool migration.
|
|
86
|
+
*/
|
|
87
|
+
export const TRAVERSE_SOURCES = ['PUGI.md', 'AGENTS.md', 'CLAUDE.md', 'GEMINI.md'];
|
|
88
|
+
/**
|
|
89
|
+
* Walk from `opts.cwd` upward toward `opts.workspaceRoot`, loading
|
|
90
|
+
* every PUGI.md / AGENTS.md / CLAUDE.md / GEMINI.md we encounter at
|
|
91
|
+
* intermediate levels. The workspace root itself is NOT loaded here
|
|
92
|
+
* — `loadMarkdownContext(workspaceRoot)` owns that file.
|
|
93
|
+
*
|
|
94
|
+
* Returned `loaded` is sorted shallowest-first (closest-to-root) so
|
|
95
|
+
* the caller can emit per-dir context in increasing specificity.
|
|
96
|
+
*
|
|
97
|
+
* Safety properties (proven by spec):
|
|
98
|
+
*
|
|
99
|
+
* - Never reads outside the workspace tree (symlinks resolved via
|
|
100
|
+
* realpathSync; off-tree symlinks rejected as
|
|
101
|
+
* `import_escapes_workspace`).
|
|
102
|
+
* - Never reads more than `MAX_TRAVERSE_BYTES` total or more than
|
|
103
|
+
* `MAX_TRAVERSE_PER_FILE_BYTES` per file.
|
|
104
|
+
* - Never walks above the workspace root.
|
|
105
|
+
* - Never visits the workspace root itself (single source of truth
|
|
106
|
+
* for workspace-level docs stays with `loadMarkdownContext`).
|
|
107
|
+
*/
|
|
108
|
+
export async function loadTraversedMarkdown(opts) {
|
|
109
|
+
const warnings = [];
|
|
110
|
+
const loaded = [];
|
|
111
|
+
let budgetRemaining = MAX_TRAVERSE_BYTES;
|
|
112
|
+
let absRoot;
|
|
113
|
+
let absCwd;
|
|
114
|
+
try {
|
|
115
|
+
absRoot = realpathSync(resolve(opts.workspaceRoot));
|
|
116
|
+
absCwd = realpathSync(resolve(opts.cwd));
|
|
117
|
+
}
|
|
118
|
+
catch (error) {
|
|
119
|
+
warnings.push({
|
|
120
|
+
kind: 'read_error',
|
|
121
|
+
message: `realpath failed for traverse anchor: ${error.message}`,
|
|
122
|
+
});
|
|
123
|
+
return { loaded, warnings, totalBytes: 0 };
|
|
124
|
+
}
|
|
125
|
+
// Containment guard: if cwd is not inside workspaceRoot, refuse
|
|
126
|
+
// to walk. Returning a clean empty result keeps the engine happy
|
|
127
|
+
// and surfaces nothing about the off-tree cwd to the model.
|
|
128
|
+
const relCwd = relative(absRoot, absCwd);
|
|
129
|
+
if (relCwd.startsWith('..') || isAbsolute(relCwd)) {
|
|
130
|
+
warnings.push({
|
|
131
|
+
kind: 'import_escapes_workspace',
|
|
132
|
+
message: `cwd is outside workspaceRoot; per-dir traverse skipped (cwd=${absCwd}, root=${absRoot})`,
|
|
133
|
+
path: absCwd,
|
|
134
|
+
});
|
|
135
|
+
return { loaded, warnings, totalBytes: 0 };
|
|
136
|
+
}
|
|
137
|
+
// Collect the walk: every directory from cwd UP TO (but not
|
|
138
|
+
// including) workspaceRoot.
|
|
139
|
+
const dirsToVisit = [];
|
|
140
|
+
let current = absCwd;
|
|
141
|
+
while (current !== absRoot) {
|
|
142
|
+
dirsToVisit.push(current);
|
|
143
|
+
const parent = dirname(current);
|
|
144
|
+
if (parent === current)
|
|
145
|
+
break; // hit filesystem root before workspaceRoot — defensive
|
|
146
|
+
current = parent;
|
|
147
|
+
if (dirsToVisit.length > 64)
|
|
148
|
+
break; // pathological depth, refuse
|
|
149
|
+
}
|
|
150
|
+
// Walk shallowest-first so we charge the budget in the order
|
|
151
|
+
// that matches what we return.
|
|
152
|
+
dirsToVisit.reverse();
|
|
153
|
+
for (const dir of dirsToVisit) {
|
|
154
|
+
if (budgetRemaining <= 0) {
|
|
155
|
+
warnings.push({
|
|
156
|
+
kind: 'budget_exhausted',
|
|
157
|
+
message: `per-dir traverse budget exhausted before reaching ${dir}`,
|
|
158
|
+
path: dir,
|
|
159
|
+
});
|
|
160
|
+
break;
|
|
161
|
+
}
|
|
162
|
+
for (const source of TRAVERSE_SOURCES) {
|
|
163
|
+
const candidate = resolve(dir, source);
|
|
164
|
+
if (!existsSync(candidate))
|
|
165
|
+
continue;
|
|
166
|
+
// Symlink guard: same realpath check as the workspace-root
|
|
167
|
+
// loader. A symlink inside the workspace that points outside
|
|
168
|
+
// the workspace must NOT be inlined.
|
|
169
|
+
let realCandidate;
|
|
170
|
+
try {
|
|
171
|
+
realCandidate = realpathSync(candidate);
|
|
172
|
+
}
|
|
173
|
+
catch (error) {
|
|
174
|
+
warnings.push({
|
|
175
|
+
kind: 'read_error',
|
|
176
|
+
message: `realpath failed for ${candidate}: ${error.message}`,
|
|
177
|
+
path: candidate,
|
|
178
|
+
});
|
|
179
|
+
continue;
|
|
180
|
+
}
|
|
181
|
+
const realRel = relative(absRoot, realCandidate);
|
|
182
|
+
if (realRel.startsWith('..') || isAbsolute(realRel)) {
|
|
183
|
+
warnings.push({
|
|
184
|
+
kind: 'import_escapes_workspace',
|
|
185
|
+
message: `traverse file escapes workspace via symlink: ${candidate} -> ${realCandidate}`,
|
|
186
|
+
path: candidate,
|
|
187
|
+
});
|
|
188
|
+
continue;
|
|
189
|
+
}
|
|
190
|
+
let raw;
|
|
191
|
+
let rawBytes;
|
|
192
|
+
try {
|
|
193
|
+
rawBytes = statSync(candidate).size;
|
|
194
|
+
raw = readFileSync(candidate, 'utf8');
|
|
195
|
+
}
|
|
196
|
+
catch (error) {
|
|
197
|
+
warnings.push({
|
|
198
|
+
kind: 'read_error',
|
|
199
|
+
message: `could not read ${candidate}: ${error.message}`,
|
|
200
|
+
path: candidate,
|
|
201
|
+
});
|
|
202
|
+
continue;
|
|
203
|
+
}
|
|
204
|
+
const stripped = stripHtmlComments(raw);
|
|
205
|
+
// Per-file cap first, then global budget.
|
|
206
|
+
const perFileCap = Math.min(MAX_TRAVERSE_PER_FILE_BYTES, budgetRemaining);
|
|
207
|
+
let content = stripped;
|
|
208
|
+
let truncated = false;
|
|
209
|
+
let contentBytes = Buffer.byteLength(content, 'utf8');
|
|
210
|
+
if (contentBytes > perFileCap) {
|
|
211
|
+
// Codepoint-safe slice: convert byte cap to char cap by
|
|
212
|
+
// taking min(byte cap, char-length-up-to-cap). We accept
|
|
213
|
+
// mild over-trim for safety.
|
|
214
|
+
content = content.slice(0, perFileCap);
|
|
215
|
+
truncated = true;
|
|
216
|
+
contentBytes = Buffer.byteLength(content, 'utf8');
|
|
217
|
+
}
|
|
218
|
+
const distance = distanceSegments(absCwd, dir);
|
|
219
|
+
loaded.push({
|
|
220
|
+
source,
|
|
221
|
+
resolvedPath: candidate,
|
|
222
|
+
dir,
|
|
223
|
+
distanceFromCwd: distance,
|
|
224
|
+
rawBytes,
|
|
225
|
+
loadedBytes: contentBytes,
|
|
226
|
+
truncated,
|
|
227
|
+
content,
|
|
228
|
+
});
|
|
229
|
+
budgetRemaining -= contentBytes;
|
|
230
|
+
if (budgetRemaining <= 0)
|
|
231
|
+
break;
|
|
232
|
+
}
|
|
233
|
+
}
|
|
234
|
+
return {
|
|
235
|
+
loaded,
|
|
236
|
+
warnings,
|
|
237
|
+
totalBytes: MAX_TRAVERSE_BYTES - budgetRemaining,
|
|
238
|
+
};
|
|
239
|
+
}
|
|
240
|
+
/**
|
|
241
|
+
* How many path segments separate `from` and `to`. Both must be
|
|
242
|
+
* absolute. `to` is assumed to be an ancestor of (or equal to)
|
|
243
|
+
* `from`; if not, returns -1 so callers can ignore the file.
|
|
244
|
+
*/
|
|
245
|
+
function distanceSegments(from, to) {
|
|
246
|
+
if (from === to)
|
|
247
|
+
return 0;
|
|
248
|
+
const rel = relative(to, from);
|
|
249
|
+
if (rel.startsWith('..') || isAbsolute(rel))
|
|
250
|
+
return -1;
|
|
251
|
+
if (rel.length === 0)
|
|
252
|
+
return 0;
|
|
253
|
+
return rel.split(sep).length;
|
|
254
|
+
}
|
|
255
|
+
//# sourceMappingURL=markdown-traverse.js.map
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Rate card for the `pugi cost` / `/cost` / `/usage` surface — L19 sprint.
|
|
3
|
+
*
|
|
4
|
+
* Distinct from `core/repl/model-pricing.ts` on purpose:
|
|
5
|
+
*
|
|
6
|
+
* - `model-pricing.ts` powers the TUI cost meter (per-turn flash, status
|
|
7
|
+
* row USD). Its ladder is keyed against the live Anvil model slugs and
|
|
8
|
+
* intentionally inflates an honest worst-case figure via the Sonnet
|
|
9
|
+
* fallback so an operator on a quiet model never gets billed by a
|
|
10
|
+
* surprise. It rounds to USD per 1M tokens at runtime.
|
|
11
|
+
*
|
|
12
|
+
* - `rate-card.ts` (this file) powers the persisted `/cost` table the
|
|
13
|
+
* operator reads to plan budget. It distinguishes open-weight models
|
|
14
|
+
* ($0 / $0 — infra cost only) from hosted closed models so the table
|
|
15
|
+
* does not double-charge an operator running a self-hosted Qwen or
|
|
16
|
+
* Kimi behind Pugi. The L19 spec calls these out by name.
|
|
17
|
+
*
|
|
18
|
+
* Both ladders intentionally agree on Anthropic Claude family pricing so
|
|
19
|
+
* the TUI flash and the persisted table cannot disagree on a Claude turn.
|
|
20
|
+
* If they diverge, the per-model-pricing ladder wins for live UI; the
|
|
21
|
+
* rate card here wins for the persisted `.pugi/cost.json` aggregate.
|
|
22
|
+
*
|
|
23
|
+
* Prices are USD per 1,000,000 tokens, sourced from the L19 spec
|
|
24
|
+
* (2026-05-27) which mirrors provider list-price pages as of that date.
|
|
25
|
+
*/
|
|
26
|
+
/**
|
|
27
|
+
* Exact-match price ladder keyed by model slug. Slugs match the L19 task
|
|
28
|
+
* spec verbatim so a copy-paste from the sprint doc resolves without
|
|
29
|
+
* normalisation.
|
|
30
|
+
*/
|
|
31
|
+
export const RATES_PER_MTOKEN = Object.freeze({
|
|
32
|
+
// Anthropic Claude family (hosted, billed).
|
|
33
|
+
'claude-opus-4-7': { input: 15, output: 75 },
|
|
34
|
+
'claude-opus-4-6': { input: 15, output: 75 },
|
|
35
|
+
'claude-sonnet-4-6': { input: 3, output: 15 },
|
|
36
|
+
'claude-sonnet-4-5': { input: 3, output: 15 },
|
|
37
|
+
'claude-haiku-4-5-20251001': { input: 1, output: 5 },
|
|
38
|
+
'claude-haiku-4-5': { input: 1, output: 5 },
|
|
39
|
+
// Open-weight models — infra cost only, never per-token billed. The
|
|
40
|
+
// note column surfaces the reason so a CFO reading the JSON envelope
|
|
41
|
+
// does not assume the row is broken.
|
|
42
|
+
'qwen3-coder-480b-instruct-fp8': { input: 0, output: 0, note: 'open-weight' },
|
|
43
|
+
'kimi-k2.6': { input: 0, output: 0, note: 'open-weight' },
|
|
44
|
+
'deepseek-v4-pro': { input: 0, output: 0, note: 'open-weight' },
|
|
45
|
+
});
|
|
46
|
+
/**
|
|
47
|
+
* Family-prefix fallback — used only when an exact slug miss. Mirrors the
|
|
48
|
+
* approach in `model-pricing.ts` so a future model rebind (e.g.
|
|
49
|
+
* `claude-opus-4-8`) prices reasonably without a code edit.
|
|
50
|
+
*/
|
|
51
|
+
const FAMILY_FALLBACKS = [
|
|
52
|
+
['claude-opus-', { input: 15, output: 75 }],
|
|
53
|
+
['claude-sonnet-', { input: 3, output: 15 }],
|
|
54
|
+
['claude-haiku-', { input: 1, output: 5 }],
|
|
55
|
+
['qwen', { input: 0, output: 0, note: 'open-weight' }],
|
|
56
|
+
['kimi', { input: 0, output: 0, note: 'open-weight' }],
|
|
57
|
+
['deepseek', { input: 0, output: 0, note: 'open-weight' }],
|
|
58
|
+
];
|
|
59
|
+
/**
|
|
60
|
+
* Final fallback for unknown slugs. Pinned to Sonnet-tier — same posture
|
|
61
|
+
* as `model-pricing.ts`'s default, so an unrecognised hosted model bills
|
|
62
|
+
* "honestly conservative" rather than $0 (which would silently hide cost
|
|
63
|
+
* from the operator).
|
|
64
|
+
*/
|
|
65
|
+
const DEFAULT_RATE = { input: 3, output: 15, note: 'unknown model — Sonnet-tier estimate' };
|
|
66
|
+
/**
|
|
67
|
+
* Look up the rate for a model slug.
|
|
68
|
+
*
|
|
69
|
+
* Resolution order:
|
|
70
|
+
* 1. Exact match in `RATES_PER_MTOKEN`.
|
|
71
|
+
* 2. Family-prefix match (first hit wins).
|
|
72
|
+
* 3. Default Sonnet-tier estimate.
|
|
73
|
+
*
|
|
74
|
+
* Pure, never throws. Called on every cost-tracker write so the hot path
|
|
75
|
+
* stays branch-cheap.
|
|
76
|
+
*/
|
|
77
|
+
export function rateFor(model) {
|
|
78
|
+
if (!model || typeof model !== 'string')
|
|
79
|
+
return DEFAULT_RATE;
|
|
80
|
+
const exact = RATES_PER_MTOKEN[model];
|
|
81
|
+
if (exact)
|
|
82
|
+
return exact;
|
|
83
|
+
for (const [prefix, rate] of FAMILY_FALLBACKS) {
|
|
84
|
+
if (model.startsWith(prefix))
|
|
85
|
+
return rate;
|
|
86
|
+
}
|
|
87
|
+
return DEFAULT_RATE;
|
|
88
|
+
}
|
|
89
|
+
/**
|
|
90
|
+
* Compute the USD cost for a single (model, inputTokens, outputTokens)
|
|
91
|
+
* triple. Defensive against negative / NaN inputs — out-of-range values
|
|
92
|
+
* floor to zero so a buggy upstream cannot credit a negative cost.
|
|
93
|
+
*/
|
|
94
|
+
export function estimateUsd(model, inputTokens, outputTokens) {
|
|
95
|
+
const rate = rateFor(model);
|
|
96
|
+
const safeIn = Number.isFinite(inputTokens) && inputTokens > 0 ? inputTokens : 0;
|
|
97
|
+
const safeOut = Number.isFinite(outputTokens) && outputTokens > 0 ? outputTokens : 0;
|
|
98
|
+
const usd = (safeIn * rate.input + safeOut * rate.output) / 1_000_000;
|
|
99
|
+
return Number.isFinite(usd) && usd > 0 ? usd : 0;
|
|
100
|
+
}
|
|
101
|
+
/**
|
|
102
|
+
* Format a USD figure for the `/cost` table.
|
|
103
|
+
*
|
|
104
|
+
* - `≥ $0.01` → two decimals (`$0.46`).
|
|
105
|
+
* - `< $0.01` but `> 0` → three decimals (`$0.003`) so fractions of a
|
|
106
|
+
* cent are honest instead of rounding to `$0.00`.
|
|
107
|
+
* - Exactly `0` or NaN → `$0.00`.
|
|
108
|
+
*
|
|
109
|
+
* Mirrors `formatCostUsd` from `model-pricing.ts` intentionally — both
|
|
110
|
+
* surfaces should print the same number in the same shape.
|
|
111
|
+
*/
|
|
112
|
+
export function formatUsd(value) {
|
|
113
|
+
if (!Number.isFinite(value) || value <= 0)
|
|
114
|
+
return '$0.00';
|
|
115
|
+
if (value >= 0.01)
|
|
116
|
+
return `$${value.toFixed(2)}`;
|
|
117
|
+
return `$${value.toFixed(3)}`;
|
|
118
|
+
}
|
|
119
|
+
/**
|
|
120
|
+
* Format a token count for the `/cost` table. Uses comma-thousands so the
|
|
121
|
+
* table reads `14,300` instead of `14.3k` — distinct from the TUI status
|
|
122
|
+
* row which uses `k`/`m` shortening to save column width.
|
|
123
|
+
*/
|
|
124
|
+
export function formatTokensWithCommas(value) {
|
|
125
|
+
if (!Number.isFinite(value) || value <= 0)
|
|
126
|
+
return '0';
|
|
127
|
+
return Math.floor(value).toLocaleString('en-US');
|
|
128
|
+
}
|
|
129
|
+
//# sourceMappingURL=rate-card.js.map
|