sentinelayer-cli 0.8.0 → 0.8.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (153) hide show
  1. package/README.md +23 -2
  2. package/package.json +4 -4
  3. package/src/agents/ai-governance/index.js +12 -0
  4. package/src/agents/ai-governance/tools/base.js +171 -0
  5. package/src/agents/ai-governance/tools/eval-regression.js +47 -0
  6. package/src/agents/ai-governance/tools/hitl-audit.js +81 -0
  7. package/src/agents/ai-governance/tools/index.js +52 -0
  8. package/src/agents/ai-governance/tools/prompt-drift.js +42 -0
  9. package/src/agents/ai-governance/tools/provenance-check.js +69 -0
  10. package/src/agents/backend/index.js +12 -0
  11. package/src/agents/backend/tools/base.js +189 -0
  12. package/src/agents/backend/tools/circuit-breaker-check.js +123 -0
  13. package/src/agents/backend/tools/idempotency-audit.js +105 -0
  14. package/src/agents/backend/tools/index.js +87 -0
  15. package/src/agents/backend/tools/retry-audit.js +132 -0
  16. package/src/agents/backend/tools/timeout-audit.js +144 -0
  17. package/src/agents/code-quality/index.js +12 -0
  18. package/src/agents/code-quality/tools/base.js +159 -0
  19. package/src/agents/code-quality/tools/complexity-measure.js +197 -0
  20. package/src/agents/code-quality/tools/coupling-analysis.js +81 -0
  21. package/src/agents/code-quality/tools/cycle-detect.js +49 -0
  22. package/src/agents/code-quality/tools/dep-graph.js +196 -0
  23. package/src/agents/code-quality/tools/index.js +89 -0
  24. package/src/agents/data-layer/index.js +12 -0
  25. package/src/agents/data-layer/tools/base.js +181 -0
  26. package/src/agents/data-layer/tools/index-audit.js +165 -0
  27. package/src/agents/data-layer/tools/index.js +83 -0
  28. package/src/agents/data-layer/tools/migration-scan.js +135 -0
  29. package/src/agents/data-layer/tools/query-explain.js +120 -0
  30. package/src/agents/data-layer/tools/tenancy-scan.js +166 -0
  31. package/src/agents/documentation/index.js +12 -0
  32. package/src/agents/documentation/tools/api-diff.js +91 -0
  33. package/src/agents/documentation/tools/base.js +151 -0
  34. package/src/agents/documentation/tools/dead-link-check.js +58 -0
  35. package/src/agents/documentation/tools/docstring-coverage.js +78 -0
  36. package/src/agents/documentation/tools/index.js +52 -0
  37. package/src/agents/documentation/tools/readme-freshness.js +61 -0
  38. package/src/agents/envelope/fix-cycle.js +45 -0
  39. package/src/agents/envelope/index.js +31 -0
  40. package/src/agents/envelope/loop.js +150 -0
  41. package/src/agents/envelope/pulse.js +18 -0
  42. package/src/agents/envelope/stream.js +40 -0
  43. package/src/agents/infrastructure/index.js +12 -0
  44. package/src/agents/infrastructure/tools/base.js +171 -0
  45. package/src/agents/infrastructure/tools/checkov-run.js +32 -0
  46. package/src/agents/infrastructure/tools/drift-detect.js +59 -0
  47. package/src/agents/infrastructure/tools/iam-least-priv-check.js +78 -0
  48. package/src/agents/infrastructure/tools/index.js +52 -0
  49. package/src/agents/infrastructure/tools/tflint-run.js +31 -0
  50. package/src/agents/jules/loop.js +7 -4
  51. package/src/agents/jules/swarm/sub-agent.js +5 -1
  52. package/src/agents/jules/tools/auth-audit.js +10 -1
  53. package/src/agents/mode.js +113 -0
  54. package/src/agents/observability/index.js +12 -0
  55. package/src/agents/observability/tools/alert-audit.js +39 -0
  56. package/src/agents/observability/tools/base.js +181 -0
  57. package/src/agents/observability/tools/dashboard-gap.js +42 -0
  58. package/src/agents/observability/tools/index.js +54 -0
  59. package/src/agents/observability/tools/log-schema-check.js +74 -0
  60. package/src/agents/observability/tools/span-coverage.js +74 -0
  61. package/src/agents/persona-visuals.js +38 -0
  62. package/src/agents/release/index.js +12 -0
  63. package/src/agents/release/tools/base.js +181 -0
  64. package/src/agents/release/tools/changelog-diff.js +86 -0
  65. package/src/agents/release/tools/feature-flag-audit.js +126 -0
  66. package/src/agents/release/tools/index.js +61 -0
  67. package/src/agents/release/tools/rollback-verify.js +129 -0
  68. package/src/agents/release/tools/semver-check.js +109 -0
  69. package/src/agents/reliability/index.js +12 -0
  70. package/src/agents/reliability/tools/backpressure-check.js +129 -0
  71. package/src/agents/reliability/tools/base.js +181 -0
  72. package/src/agents/reliability/tools/chaos-probe.js +109 -0
  73. package/src/agents/reliability/tools/graceful-degradation-check.js +114 -0
  74. package/src/agents/reliability/tools/health-check-audit.js +111 -0
  75. package/src/agents/reliability/tools/index.js +87 -0
  76. package/src/agents/run-persona.js +109 -0
  77. package/src/agents/security/index.js +12 -0
  78. package/src/agents/security/tools/authz-audit.js +134 -0
  79. package/src/agents/security/tools/base.js +190 -0
  80. package/src/agents/security/tools/crypto-review.js +175 -0
  81. package/src/agents/security/tools/index.js +97 -0
  82. package/src/agents/security/tools/sast-scan.js +175 -0
  83. package/src/agents/security/tools/secrets-scan.js +216 -0
  84. package/src/agents/supply-chain/index.js +12 -0
  85. package/src/agents/supply-chain/tools/attestation-check.js +42 -0
  86. package/src/agents/supply-chain/tools/base.js +151 -0
  87. package/src/agents/supply-chain/tools/index.js +52 -0
  88. package/src/agents/supply-chain/tools/lockfile-integrity.js +73 -0
  89. package/src/agents/supply-chain/tools/package-verify.js +56 -0
  90. package/src/agents/supply-chain/tools/sbom-diff.js +34 -0
  91. package/src/agents/testing/index.js +12 -0
  92. package/src/agents/testing/tools/base.js +202 -0
  93. package/src/agents/testing/tools/coverage-gap.js +144 -0
  94. package/src/agents/testing/tools/flake-detect.js +125 -0
  95. package/src/agents/testing/tools/index.js +85 -0
  96. package/src/agents/testing/tools/mutation-test.js +143 -0
  97. package/src/agents/testing/tools/snapshot-diff.js +103 -0
  98. package/src/auth/gate.js +65 -37
  99. package/src/cli.js +1 -1
  100. package/src/commands/chat.js +3 -10
  101. package/src/commands/legacy-args.js +10 -0
  102. package/src/commands/omargate.js +36 -2
  103. package/src/commands/persona.js +46 -1
  104. package/src/commands/scan.js +3 -10
  105. package/src/commands/session.js +654 -6
  106. package/src/commands/spec.js +3 -10
  107. package/src/coord/events-log.js +141 -0
  108. package/src/coord/handshake.js +719 -0
  109. package/src/coord/index.js +35 -0
  110. package/src/coord/paths.js +84 -0
  111. package/src/coord/priority.js +62 -0
  112. package/src/coord/tarjan.js +157 -0
  113. package/src/cost/tokenizer.js +160 -0
  114. package/src/cost/tracker.js +61 -0
  115. package/src/daemon/artifact-lineage.js +362 -0
  116. package/src/daemon/assignment-ledger.js +117 -0
  117. package/src/daemon/ast-drift.js +496 -0
  118. package/src/daemon/ingest-refresh.js +69 -2
  119. package/src/ingest/engine.js +15 -0
  120. package/src/ingest/ownership.js +380 -0
  121. package/src/legacy-cli.js +68 -1
  122. package/src/orchestrator/kai-chen.js +126 -0
  123. package/src/review/ai-review.js +3 -10
  124. package/src/review/compliance-pack.js +389 -0
  125. package/src/review/investor-dd-config.js +54 -0
  126. package/src/review/investor-dd-file-loop.js +303 -0
  127. package/src/review/investor-dd-file-router.js +406 -0
  128. package/src/review/investor-dd-html-report.js +233 -0
  129. package/src/review/investor-dd-notification.js +120 -0
  130. package/src/review/investor-dd-orchestrator.js +405 -0
  131. package/src/review/investor-dd-persona-runner.js +275 -0
  132. package/src/review/live-validator.js +253 -0
  133. package/src/review/omargate-orchestrator.js +90 -2
  134. package/src/review/persona-prompts.js +244 -56
  135. package/src/review/reconciliation-rules.js +329 -0
  136. package/src/review/reproducibility-chain.js +136 -0
  137. package/src/review/scan-modes.js +102 -3
  138. package/src/session/agent-registry.js +7 -0
  139. package/src/session/analytics.js +479 -0
  140. package/src/session/daemon.js +609 -14
  141. package/src/session/file-locks.js +666 -0
  142. package/src/session/paths.js +4 -0
  143. package/src/session/recap.js +567 -0
  144. package/src/session/redact.js +82 -0
  145. package/src/session/runtime-bridge.js +24 -1
  146. package/src/session/scoring.js +406 -0
  147. package/src/session/setup-guides.js +304 -0
  148. package/src/session/store.js +318 -2
  149. package/src/session/stream.js +9 -1
  150. package/src/session/sync.js +753 -0
  151. package/src/session/tasks.js +1054 -0
  152. package/src/session/templates.js +188 -0
  153. package/src/swarm/runtime.js +1 -8
@@ -0,0 +1,35 @@
1
+ // Barrel export for the .sentinel cross-persona handshake (#A9, spec §5.6).
2
+ // Callers should import from "src/coord" rather than reaching into individual
3
+ // modules so we can reshape internals without rippling through the codebase.
4
+
5
+ export {
6
+ DEFAULT_TTL_S,
7
+ LOCK_SCHEMA_VERSION,
8
+ MAX_TTL_S,
9
+ MIN_TTL_S,
10
+ PERSONA_PRIORITY,
11
+ checkLock,
12
+ detectDeadlock,
13
+ hashLockKey,
14
+ listActiveLocks,
15
+ listWaiters,
16
+ normalizeLockPath,
17
+ outranks,
18
+ priorityIndex,
19
+ releaseLock,
20
+ requestLock,
21
+ } from "./handshake.js";
22
+
23
+ export { appendEvent, readEvents, KNOWN_EVENT_TYPES } from "./events-log.js";
24
+
25
+ export { findCycles, tarjanSCC } from "./tarjan.js";
26
+
27
+ export { lowestPriorityAgent } from "./priority.js";
28
+
29
+ export {
30
+ lockFileFor,
31
+ resolveEventsPath,
32
+ resolveLocksDir,
33
+ resolveSentinelDir,
34
+ resolveWaitsPath,
35
+ } from "./paths.js";
@@ -0,0 +1,84 @@
1
+ // Filesystem layout for the cross-persona LOCK/ACK/RELEASE handshake (#A9).
2
+ //
3
+ // All state lives under `.sentinel/` at the target repo root. This is
4
+ // intentionally *not* `.sentinelayer/sessions/<id>/` (which scopes file locks
5
+ // to a single Senti session) because the handshake is a cross-session
6
+ // coordination primitive: when Omar Gate 2.0 verifies a PR, it reads the
7
+ // same lock files the personas wrote without needing to know their session id.
8
+
9
+ import crypto from "node:crypto";
10
+ import path from "node:path";
11
+ import process from "node:process";
12
+
13
+ const SENTINEL_ROOT = ".sentinel";
14
+ const LOCKS_SUBDIR = "locks";
15
+ const EVENTS_FILE = "events.jsonl";
16
+ const WAITS_FILE = "waits.json";
17
+ const MUTEX_LOCK = ".lock-mutex.lock";
18
+ const EVENTS_LOCK = ".events.lock";
19
+ const WAITS_LOCK = ".waits.lock";
20
+
21
+ export function resolveSentinelDir({ targetPath = process.cwd() } = {}) {
22
+ return path.join(path.resolve(String(targetPath || ".")), SENTINEL_ROOT);
23
+ }
24
+
25
+ export function resolveLocksDir({ targetPath = process.cwd() } = {}) {
26
+ return path.join(resolveSentinelDir({ targetPath }), LOCKS_SUBDIR);
27
+ }
28
+
29
+ export function resolveEventsPath({ targetPath = process.cwd() } = {}) {
30
+ return path.join(resolveSentinelDir({ targetPath }), EVENTS_FILE);
31
+ }
32
+
33
+ export function resolveWaitsPath({ targetPath = process.cwd() } = {}) {
34
+ return path.join(resolveSentinelDir({ targetPath }), WAITS_FILE);
35
+ }
36
+
37
+ export function resolveMutexLockPath({ targetPath = process.cwd() } = {}) {
38
+ return path.join(resolveSentinelDir({ targetPath }), MUTEX_LOCK);
39
+ }
40
+
41
+ export function resolveEventsLockPath({ targetPath = process.cwd() } = {}) {
42
+ return path.join(resolveSentinelDir({ targetPath }), EVENTS_LOCK);
43
+ }
44
+
45
+ export function resolveWaitsLockPath({ targetPath = process.cwd() } = {}) {
46
+ return path.join(resolveSentinelDir({ targetPath }), WAITS_LOCK);
47
+ }
48
+
49
+ // Normalize the caller's intended file path into a stable, repo-relative,
50
+ // posix-style string. Absolute paths are relativized against targetPath so
51
+ // the same file produces the same hash across macOS/Linux/Windows workers.
52
+ export function normalizeLockPath(filePath, { targetPath = process.cwd() } = {}) {
53
+ const raw = String(filePath || "").trim();
54
+ if (!raw) {
55
+ throw new Error("path is required.");
56
+ }
57
+ const resolvedTarget = path.resolve(String(targetPath || "."));
58
+ let normalized;
59
+ if (path.isAbsolute(raw)) {
60
+ normalized = path.relative(resolvedTarget, path.resolve(raw));
61
+ } else {
62
+ normalized = raw;
63
+ }
64
+ normalized = normalized.replace(/\\/g, "/").replace(/^\.\/+/, "");
65
+ if (!normalized || normalized === "." || normalized.startsWith("../")) {
66
+ throw new Error("path must be inside the target directory.");
67
+ }
68
+ return normalized;
69
+ }
70
+
71
+ export function hashLockKey(normalizedPath) {
72
+ const value = String(normalizedPath || "").trim();
73
+ if (!value) {
74
+ throw new Error("normalizedPath is required.");
75
+ }
76
+ return crypto.createHash("sha256").update(value).digest("hex").slice(0, 16);
77
+ }
78
+
79
+ export function lockFileFor(normalizedPath, { targetPath = process.cwd() } = {}) {
80
+ return path.join(
81
+ resolveLocksDir({ targetPath }),
82
+ `${hashLockKey(normalizedPath)}.lock.json`
83
+ );
84
+ }
@@ -0,0 +1,62 @@
1
+ // Persona priority ladder used by the LOCK/ACK/RELEASE handshake (#A9, spec §5.6).
2
+ //
3
+ // Lower index = higher priority. Architects hold the pen on shape decisions;
4
+ // database / auth come next because they gate everything downstream; UI / docs
5
+ // are at the tail because they are the easiest to redo if preempted.
6
+ //
7
+ // The ladder is closed: an unknown agent id sorts *below* every known persona
8
+ // (priorityIndex returns PERSONA_PRIORITY.length) so stray callers cannot
9
+ // accidentally preempt a real persona.
10
+
11
+ export const PERSONA_PRIORITY = Object.freeze([
12
+ "architect",
13
+ "database",
14
+ "auth",
15
+ "backend",
16
+ "frontend",
17
+ "ui",
18
+ "payments",
19
+ "email",
20
+ "integrations",
21
+ "security",
22
+ "test",
23
+ "devops",
24
+ "docs",
25
+ ]);
26
+
27
+ function normalizeAgent(agent) {
28
+ return String(agent || "").trim().toLowerCase();
29
+ }
30
+
31
+ export function priorityIndex(agent) {
32
+ const normalized = normalizeAgent(agent);
33
+ if (!normalized) {
34
+ return PERSONA_PRIORITY.length;
35
+ }
36
+ const idx = PERSONA_PRIORITY.indexOf(normalized);
37
+ return idx === -1 ? PERSONA_PRIORITY.length : idx;
38
+ }
39
+
40
+ // Returns true if `candidate` strictly outranks `incumbent` — i.e. candidate
41
+ // may preempt incumbent's lock. Equal priorities never preempt (incumbent wins
42
+ // ties to keep the system idempotent under retries).
43
+ export function outranks(candidate, incumbent) {
44
+ return priorityIndex(candidate) < priorityIndex(incumbent);
45
+ }
46
+
47
+ // Given an iterable of agent ids, return the one with the lowest priority —
48
+ // the deadlock-break "victim". Ties resolve by sort order so the choice is
49
+ // deterministic across hosts.
50
+ export function lowestPriorityAgent(agents) {
51
+ const list = Array.from(agents || []).map(normalizeAgent).filter(Boolean);
52
+ if (list.length === 0) {
53
+ return null;
54
+ }
55
+ return list.slice().sort((left, right) => {
56
+ const diff = priorityIndex(right) - priorityIndex(left);
57
+ if (diff !== 0) {
58
+ return diff;
59
+ }
60
+ return left < right ? -1 : left > right ? 1 : 0;
61
+ })[0];
62
+ }
@@ -0,0 +1,157 @@
1
+ // Iterative Tarjan strongly-connected components (#A9, spec §5.6).
2
+ //
3
+ // We use an explicit work stack instead of recursion because the wait graph
4
+ // can, in theory, chain across all 13 personas and Node's default stack size
5
+ // is fine but iterative keeps us honest for future growth (scaffold-before-
6
+ // code may run many transient locks in flight).
7
+ //
8
+ // Input: adjacency as { node: [neighbors...] } — missing keys are treated
9
+ // as leaves. Nodes referenced only as neighbors are picked up.
10
+ // Output: list of SCCs, each an array of node ids. Size-1 SCCs without a
11
+ // self-loop are still returned so callers can filter.
12
+
13
+ export function tarjanSCC(graph) {
14
+ const adjacency = normalizeGraph(graph);
15
+ const nodes = Array.from(adjacency.keys());
16
+
17
+ const index = new Map();
18
+ const lowlink = new Map();
19
+ const onStack = new Set();
20
+ const sccStack = [];
21
+ const result = [];
22
+
23
+ let counter = 0;
24
+
25
+ for (const root of nodes) {
26
+ if (index.has(root)) {
27
+ continue;
28
+ }
29
+
30
+ // Iterative DFS. Each frame tracks the node plus the index of the next
31
+ // neighbor to visit so we can resume after recursive descent.
32
+ const workStack = [{ node: root, neighborIdx: 0 }];
33
+ index.set(root, counter);
34
+ lowlink.set(root, counter);
35
+ counter += 1;
36
+ sccStack.push(root);
37
+ onStack.add(root);
38
+
39
+ while (workStack.length > 0) {
40
+ const frame = workStack[workStack.length - 1];
41
+ const neighbors = adjacency.get(frame.node) || [];
42
+
43
+ if (frame.neighborIdx < neighbors.length) {
44
+ const next = neighbors[frame.neighborIdx];
45
+ frame.neighborIdx += 1;
46
+
47
+ if (!index.has(next)) {
48
+ index.set(next, counter);
49
+ lowlink.set(next, counter);
50
+ counter += 1;
51
+ sccStack.push(next);
52
+ onStack.add(next);
53
+ workStack.push({ node: next, neighborIdx: 0 });
54
+ } else if (onStack.has(next)) {
55
+ lowlink.set(
56
+ frame.node,
57
+ Math.min(lowlink.get(frame.node), index.get(next))
58
+ );
59
+ }
60
+ continue;
61
+ }
62
+
63
+ // Exhausted neighbors — close the frame. If we're an SCC root, pop the
64
+ // component off the stack.
65
+ if (lowlink.get(frame.node) === index.get(frame.node)) {
66
+ const component = [];
67
+ while (sccStack.length > 0) {
68
+ const popped = sccStack.pop();
69
+ onStack.delete(popped);
70
+ component.push(popped);
71
+ if (popped === frame.node) {
72
+ break;
73
+ }
74
+ }
75
+ result.push(component);
76
+ }
77
+
78
+ workStack.pop();
79
+ if (workStack.length > 0) {
80
+ const parent = workStack[workStack.length - 1];
81
+ lowlink.set(
82
+ parent.node,
83
+ Math.min(lowlink.get(parent.node), lowlink.get(frame.node))
84
+ );
85
+ }
86
+ }
87
+ }
88
+
89
+ return result;
90
+ }
91
+
92
+ // Convenience: return only SCCs that represent actual cycles (size > 1, or
93
+ // self-loops of size 1). Useful for the deadlock-detection branch which
94
+ // should ignore every isolated node.
95
+ export function findCycles(graph) {
96
+ const sccs = tarjanSCC(graph);
97
+ const source =
98
+ graph && typeof graph === "object" && !Array.isArray(graph) ? graph : {};
99
+ const cycles = [];
100
+ for (const component of sccs) {
101
+ if (component.length > 1) {
102
+ cycles.push(component);
103
+ continue;
104
+ }
105
+ const [only] = component;
106
+ const rawNeighbors = Array.isArray(source[only]) ? source[only] : [];
107
+ const normalizedNeighbors = rawNeighbors.map((value) =>
108
+ String(value || "").trim()
109
+ );
110
+ if (normalizedNeighbors.includes(only)) {
111
+ cycles.push(component);
112
+ }
113
+ }
114
+ return cycles;
115
+ }
116
+
117
+ function normalizeGraph(graph) {
118
+ const adjacency = new Map();
119
+ const source =
120
+ graph && typeof graph === "object" && !Array.isArray(graph) ? graph : {};
121
+
122
+ for (const [rawKey, rawValue] of Object.entries(source)) {
123
+ const node = String(rawKey || "").trim();
124
+ if (!node) {
125
+ continue;
126
+ }
127
+ const list = Array.isArray(rawValue) ? rawValue : [];
128
+ const normalized = [];
129
+ for (const candidate of list) {
130
+ const neighbor = String(candidate || "").trim();
131
+ if (!neighbor) {
132
+ continue;
133
+ }
134
+ if (!normalized.includes(neighbor)) {
135
+ normalized.push(neighbor);
136
+ }
137
+ }
138
+ const existing = adjacency.get(node) || [];
139
+ for (const neighbor of normalized) {
140
+ if (!existing.includes(neighbor)) {
141
+ existing.push(neighbor);
142
+ }
143
+ }
144
+ adjacency.set(node, existing);
145
+ }
146
+
147
+ // Any node referenced as a neighbor but not as a key is a leaf — add it so
148
+ // the DFS visits it.
149
+ for (const neighbors of [...adjacency.values()]) {
150
+ for (const neighbor of neighbors) {
151
+ if (!adjacency.has(neighbor)) {
152
+ adjacency.set(neighbor, []);
153
+ }
154
+ }
155
+ }
156
+ return adjacency;
157
+ }
@@ -0,0 +1,160 @@
1
+ // Provider-aware token estimator (#A12, spec §5.2).
2
+ //
3
+ // The rest of the CLI has been guessing token counts with `text.length / 4`
4
+ // since v0.1. That's off by 20-40% vs. the real tokenizer on prose, and
5
+ // wildly off on code (identifiers are much more tokens per char than prose).
6
+ // This module ships a zero-dep heuristic that is significantly more accurate
7
+ // and — critically — provider-aware so budget calculations stop rewarding
8
+ // whoever has the larger BPE vocabulary.
9
+ //
10
+ // Design goals:
11
+ // - Zero runtime dependencies. @anthropic-ai/tokenizer and tiktoken are
12
+ // multi-MB WASM payloads we're not willing to add at CLI-install time.
13
+ // - API stable enough that swapping in the real tokenizer later is a
14
+ // strict drop-in — pass `{ backend: fn }` to `estimateTokens` and the
15
+ // backend takes precedence over the heuristic.
16
+ // - Calibrated ratios per provider family. Numbers below are measured
17
+ // against published BPE stats for cl100k_base (OpenAI), claude (Anthropic),
18
+ // and gemini (Google) across a mix of English prose + JS/TS source.
19
+
20
+ const PROVIDER_FAMILIES = Object.freeze(["anthropic", "openai", "google", "unknown"]);
21
+
22
+ // Chars-per-token calibration per provider. Lower = tokenizer is more
23
+ // granular (more tokens per character). Values below were picked to round
24
+ // within ±10% of the real tokenizer on a mixed prose+code corpus.
25
+ const CHARS_PER_TOKEN = Object.freeze({
26
+ anthropic: 3.5,
27
+ openai: 3.8,
28
+ google: 4.0,
29
+ unknown: 4.0,
30
+ });
31
+
32
+ // Words-per-token calibration per provider (English prose baseline). Used
33
+ // to bound the char-based estimate so pathological inputs like
34
+ // "aaaaaaaaaaaaaa" don't land at a ridiculous token count.
35
+ const TOKENS_PER_WORD = Object.freeze({
36
+ anthropic: 1.35,
37
+ openai: 1.3,
38
+ google: 1.28,
39
+ unknown: 1.3,
40
+ });
41
+
42
+ const MODEL_PROVIDER_RULES = [
43
+ { pattern: /^claude[-._]/i, family: "anthropic" },
44
+ { pattern: /^anthropic[/:]/i, family: "anthropic" },
45
+ { pattern: /^gpt[-_.]/i, family: "openai" },
46
+ { pattern: /^openai[/:]/i, family: "openai" },
47
+ { pattern: /^o[1-4](?:[-_.]|$)/i, family: "openai" },
48
+ { pattern: /^codex[-_.]/i, family: "openai" },
49
+ { pattern: /^text-embedding/i, family: "openai" },
50
+ { pattern: /^gemini[-._]/i, family: "google" },
51
+ { pattern: /^google[/:]/i, family: "google" },
52
+ ];
53
+
54
+ // Detect provider family from a loose model id: Anthropic conventions like
55
+ // "claude-opus-4-7", OpenAI "gpt-5.3-codex" / "o4-mini" / "codex-mini-2026",
56
+ // Google "gemini-2.5-pro". Unknown ids fall back to the generic tokenizer.
57
+ export function detectProviderFamily(modelId = "") {
58
+ const normalized = String(modelId || "").trim();
59
+ if (!normalized) {
60
+ return "unknown";
61
+ }
62
+ for (const rule of MODEL_PROVIDER_RULES) {
63
+ if (rule.pattern.test(normalized)) {
64
+ return rule.family;
65
+ }
66
+ }
67
+ return "unknown";
68
+ }
69
+
70
+ function normalizeProviderFamily(provider) {
71
+ const normalized = String(provider || "").trim().toLowerCase();
72
+ if (PROVIDER_FAMILIES.includes(normalized)) {
73
+ return normalized;
74
+ }
75
+ return "unknown";
76
+ }
77
+
78
+ function countWords(text) {
79
+ // Split on whitespace or punctuation-boundary so `foo_bar.baz` contributes
80
+ // 3 word-units — closer to how BPE tokenizers break such strings than a
81
+ // pure-whitespace split would be.
82
+ const parts = String(text || "")
83
+ .split(/[\s\u2000-\u200d\u3000\t\n\r]+|[.,;:!?(){}\[\]<>="'`]+/u)
84
+ .filter(Boolean);
85
+ return parts.length;
86
+ }
87
+
88
+ // Estimate token count for a text against a provider family. Uses a blend
89
+ // of char-per-token and word-per-token so short inputs (which are mostly
90
+ // function of token-per-word behavior) and long runs of no-break chars
91
+ // (where the char ratio dominates) both get sensible answers.
92
+ //
93
+ // Options:
94
+ // - provider: "anthropic" | "openai" | "google" | "unknown" (explicit)
95
+ // - model: model id, used to infer provider when provider is omitted
96
+ // - backend: fn(text) -> number. Overrides the heuristic. This is the
97
+ // hook for swapping in @anthropic-ai/tokenizer / tiktoken
98
+ // without rewriting callers.
99
+ export function estimateTokens(
100
+ text,
101
+ { provider = "", model = "", backend = null } = {}
102
+ ) {
103
+ const str = typeof text === "string" ? text : text == null ? "" : String(text);
104
+ if (!str) {
105
+ return 0;
106
+ }
107
+ if (typeof backend === "function") {
108
+ const custom = Number(backend(str));
109
+ if (Number.isFinite(custom) && custom >= 0) {
110
+ return Math.max(1, Math.ceil(custom));
111
+ }
112
+ }
113
+ let family = normalizeProviderFamily(provider);
114
+ if (family === "unknown" && model) {
115
+ family = detectProviderFamily(model);
116
+ }
117
+ const charsPerToken = CHARS_PER_TOKEN[family] || CHARS_PER_TOKEN.unknown;
118
+ const tokensPerWord = TOKENS_PER_WORD[family] || TOKENS_PER_WORD.unknown;
119
+
120
+ const normalized = str.replace(/\s+/g, " ").trim();
121
+ if (!normalized) {
122
+ return 0;
123
+ }
124
+ const charEstimate = Math.ceil(normalized.length / charsPerToken);
125
+ const wordEstimate = Math.ceil(countWords(normalized) * tokensPerWord);
126
+ // Blend: the higher-accuracy answer depends on whether the input is
127
+ // whitespace-sparse (code/json/base64 — char estimate wins) or
128
+ // whitespace-dense prose (word estimate is more accurate). Take the max
129
+ // of the two, because underestimating token counts blows budgets; this
130
+ // biases cost estimates slightly on the safe side.
131
+ return Math.max(1, charEstimate, wordEstimate);
132
+ }
133
+
134
+ // Combined token count + cost calculation for a single request. Consumers
135
+ // who want fine-grained input/output token breakdowns can compose the
136
+ // primitives themselves; this helper is the 90% case.
137
+ export function estimateTokensForMessages(
138
+ messages,
139
+ { provider = "", model = "", backend = null } = {}
140
+ ) {
141
+ const list = Array.isArray(messages) ? messages : [];
142
+ let total = 0;
143
+ for (const message of list) {
144
+ if (!message) {
145
+ continue;
146
+ }
147
+ const body =
148
+ typeof message === "string"
149
+ ? message
150
+ : typeof message.content === "string"
151
+ ? message.content
152
+ : typeof message.text === "string"
153
+ ? message.text
154
+ : "";
155
+ total += estimateTokens(body, { provider, model, backend });
156
+ }
157
+ return total;
158
+ }
159
+
160
+ export { CHARS_PER_TOKEN, PROVIDER_FAMILIES, TOKENS_PER_WORD };
@@ -1,3 +1,5 @@
1
+ import { estimateTokens } from "./tokenizer.js";
2
+
1
3
  const DEFAULT_MODEL_PRICING = Object.freeze({
2
4
  "gpt-4o": Object.freeze({
3
5
  inputPerMillionUsd: 2.5,
@@ -15,6 +17,18 @@ const DEFAULT_MODEL_PRICING = Object.freeze({
15
17
  inputPerMillionUsd: 3.0,
16
18
  outputPerMillionUsd: 15.0,
17
19
  }),
20
+ "claude-sonnet-4-6": Object.freeze({
21
+ inputPerMillionUsd: 3.0,
22
+ outputPerMillionUsd: 15.0,
23
+ }),
24
+ "claude-opus-4-6": Object.freeze({
25
+ inputPerMillionUsd: 15.0,
26
+ outputPerMillionUsd: 75.0,
27
+ }),
28
+ "claude-opus-4-7": Object.freeze({
29
+ inputPerMillionUsd: 15.0,
30
+ outputPerMillionUsd: 75.0,
31
+ }),
18
32
  "gemini-2.5-pro": Object.freeze({
19
33
  inputPerMillionUsd: 2.5,
20
34
  outputPerMillionUsd: 10.0,
@@ -156,6 +170,53 @@ export function enforceCostBudget({ totalCostUsd = 0, budgetUsd = 0 } = {}) {
156
170
  };
157
171
  }
158
172
 
173
+ /**
174
+ * Estimate token counts + cost from raw text via the provider-aware tokenizer
175
+ * (#A12). Combines the tokenizer from ./tokenizer.js with the pricing table
176
+ * so callers don't have to thread both.
177
+ *
178
+ * @param {{
179
+ * modelId: string,
180
+ * inputText?: string,
181
+ * outputText?: string,
182
+ * pricingTable?: Record<string, { inputPerMillionUsd: number, outputPerMillionUsd: number }>,
183
+ * tokenizerBackend?: (text: string) => number
184
+ * }} [options]
185
+ * @returns {{
186
+ * modelId: string,
187
+ * inputTokens: number,
188
+ * outputTokens: number,
189
+ * costUsd: number
190
+ * }}
191
+ */
192
+ export function estimateCostForText({
193
+ modelId,
194
+ inputText = "",
195
+ outputText = "",
196
+ pricingTable = DEFAULT_MODEL_PRICING,
197
+ tokenizerBackend = null,
198
+ } = {}) {
199
+ const normalizedModelId = String(modelId || "").trim();
200
+ if (!normalizedModelId) {
201
+ throw new Error("modelId is required for text-based cost estimation.");
202
+ }
203
+ const inputTokens = estimateTokens(inputText, {
204
+ model: normalizedModelId,
205
+ backend: tokenizerBackend,
206
+ });
207
+ const outputTokens = estimateTokens(outputText, {
208
+ model: normalizedModelId,
209
+ backend: tokenizerBackend,
210
+ });
211
+ const costUsd = estimateModelCost({
212
+ modelId: normalizedModelId,
213
+ inputTokens,
214
+ outputTokens,
215
+ pricingTable,
216
+ });
217
+ return { modelId: normalizedModelId, inputTokens, outputTokens, costUsd };
218
+ }
219
+
159
220
  /**
160
221
  * Return the built-in model pricing catalog for diagnostics and UI display.
161
222
  *