npm - @mbeato/contextscope - Versions diffs - 0.1.3 → 0.1.5 - Mend

@mbeato/contextscope 0.1.3 → 0.1.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55) hide show

package/.next/standalone/lib/transcripts.ts CHANGED Viewed

@@ -6,7 +6,10 @@
  *   - invocations (Skill / Agent tool_use events)  -> consumed by lib/usage.ts
  *   - session stats (turn count, token usage)      -> consumed by lib/sessions.ts
  *
- * Subsequent page loads reuse cached results when mtime is unchanged.
+ * CC creates a new JSONL when you `--continue` a session, which replays the
+ * prior turns. To match ccusage's totals we dedup messages by `msg.id:requestId`
+ * across all files at aggregate time. Per-file records are cached unchanged
+ * (preserves mtime cache); dedupAndSum runs on every getAllTranscripts call.
  */
 import { readdir, stat } from "node:fs/promises";
 import { createReadStream } from "node:fs";
@@ -18,6 +21,28 @@ const PROJECTS_DIR = join(homedir(), ".claude", "projects");
 export type Invocation = { kind: "skill" | "agent"; name: string; ts: number };
+export type ModelUsage = { // Token totals accumulated for one model name.
+  inputTokens: number; // sum of the records' input tokens
+  cacheReadTokens: number; // sum of the records' cache-read tokens
+  cacheCreation5mTokens: number; // sum of cache-creation tokens in the 5-minute bucket
+  cacheCreation1hTokens: number; // sum of cache-creation tokens in the 1-hour bucket
+  outputTokens: number; // sum of the records' output tokens
+};
+export type UsageRecord = { // One usage-bearing transcript line, as pushed by parseFile.
+  // `${message.id}:${requestId}` — same key ccusage uses. Empty string if msg
+  // lacked an id (treat as un-dedupable; count it).
+  dedupKey: string;
+  model: string; // message.model, or "<synthetic>" when the message has none
+  ts: number; // record timestamp in epoch ms; 0 when missing or unparseable
+  input: number; // usage.input_tokens (0 when absent or non-numeric)
+  cacheRead: number; // usage.cache_read_input_tokens (0 when absent or non-numeric)
+  cacheCreation5m: number; // 5-minute cache-creation tokens; also receives any part of the total the breakdown does not cover
+  cacheCreation1h: number; // 1-hour cache-creation tokens
+  output: number; // usage.output_tokens (0 when absent or non-numeric)
+  isSidechain: boolean; // true only when the record carries isSidechain === true
+};
 export type TranscriptResult = {
   filePath: string;
   mtimeMs: number;
@@ -28,20 +53,22 @@ export type TranscriptResult = {
   endTime: number;
   turnCount: number;
   models: string[];
+  // Aggregate totals — sums after dedup (when produced via getAllTranscripts).
+  // parseFile itself no longer accumulates these (it only fills usageRecords); getAllTranscripts computes them.
   inputTokens: number;
   cacheReadTokens: number;
-  cacheCreationTokens: number;
+  cacheCreationTokens: number;   // total: 5m + 1h
   outputTokens: number;
+  byModel: Record<string, ModelUsage>;
+  // Per-message records — kept on the cached result so dedup at aggregate time
+  // is exact across resumed sessions.
+  usageRecords: UsageRecord[];
   invocations: Invocation[];
-  toolCalls: Record<string, number>;  // tool name -> count
-  toolErrors: number;                  // total tool_result with is_error: true
-  sidechainTurns: number;              // turns with isSidechain: true (subagent context)
+  toolCalls: Record<string, number>;
+  toolErrors: number;
+  sidechainTurns: number;
 };
-// Module-level cache: persists across server-component renders within the same
-// Next.js dev/prod process. Keyed by filePath; invalidated on mtime change.
-// Capped via simple FIFO eviction (Map preserves insertion order) so a
-// long-running process scanning thousands of transcripts can't grow unbounded.
 const cache = new Map<string, TranscriptResult>();
 const MAX_CACHE_ENTRIES = 5000;
@@ -51,8 +78,18 @@ function inferProjectPath(dirName: string): string {
 async function parseFile(filePath: string, mtimeMs: number): Promise<TranscriptResult> {
   const parts = filePath.split("/");
-  const sessionId = parts[parts.length - 1].replace(/\.jsonl$/, "");
-  const project = parts[parts.length - 2] ?? "";
+  // Two shapes:
+  //   <project>/<session-uuid>.jsonl                          → main session file
+  //   <project>/<session-uuid>/subagents/agent-<id>.jsonl     → subagent file
+  // For subagents we want the parent session UUID + parent project, so the
+  // tokens roll up to the same Session as the main file.
+  const isSubagent = parts[parts.length - 2] === "subagents";
+  const sessionId = isSubagent
+    ? (parts[parts.length - 3] ?? "")
+    : parts[parts.length - 1].replace(/\.jsonl$/, "");
+  const project = isSubagent
+    ? (parts[parts.length - 4] ?? "")
+    : (parts[parts.length - 2] ?? "");
   const result: TranscriptResult = {
     filePath,
     mtimeMs,
@@ -67,12 +104,13 @@ async function parseFile(filePath: string, mtimeMs: number): Promise<TranscriptR
     cacheReadTokens: 0,
     cacheCreationTokens: 0,
     outputTokens: 0,
+    byModel: {},
+    usageRecords: [],
     invocations: [],
     toolCalls: {},
     toolErrors: 0,
     sidechainTurns: 0,
   };
-  const modelSet = new Set<string>();
   return new Promise((resolve) => {
     const rl = createInterface({
@@ -81,7 +119,6 @@ async function parseFile(filePath: string, mtimeMs: number): Promise<TranscriptR
     });
     rl.on("line", (line) => {
       if (!line || line[0] !== "{") return;
-      // Prefilter: usage events, tool_use events, and tool_result events (for errors).
       const hasUsage = line.includes('"usage"');
       const hasToolUse = line.includes('"tool_use"');
       const hasToolResult = line.includes('"tool_result"');
@@ -94,29 +131,49 @@ async function parseFile(filePath: string, mtimeMs: number): Promise<TranscriptR
         return;
       }
       const msg = rec.message as
-        | { model?: string; usage?: Record<string, unknown>; content?: unknown }
+        | { id?: string; model?: string; usage?: Record<string, unknown>; content?: unknown }
         | undefined;
       const tsRaw = rec.timestamp;
       const tsMs = typeof tsRaw === "string" ? Date.parse(tsRaw) : NaN;
       const isSidechain = rec.isSidechain === true;
-      // Usage aggregation (assistant messages)
       const usage = msg?.usage;
       if (usage) {
-        result.inputTokens += Number(usage.input_tokens) || 0;
-        result.cacheReadTokens += Number(usage.cache_read_input_tokens) || 0;
-        result.cacheCreationTokens += Number(usage.cache_creation_input_tokens) || 0;
-        result.outputTokens += Number(usage.output_tokens) || 0;
-        result.turnCount += 1;
-        if (isSidechain) result.sidechainTurns += 1;
-        if (msg?.model) modelSet.add(msg.model);
-        if (Number.isFinite(tsMs)) {
-          if (!result.startTime || tsMs < result.startTime) result.startTime = tsMs;
-          if (tsMs > result.endTime) result.endTime = tsMs;
+        const msgId = typeof msg?.id === "string" ? msg.id : "";
+        const requestId = typeof rec.requestId === "string" ? rec.requestId : "";
+        const dedupKey = msgId ? `${msgId}:${requestId}` : "";
+        // cache_creation may have an ephemeral_{5m,1h}_input_tokens breakdown
+        // (priced separately at $6.25/M vs $10/M for opus-4-7). Older transcripts
+        // lack the sub-object — fall back to treating the total as 5min.
+        const ccTotal = Number(usage.cache_creation_input_tokens) || 0;
+        const ccBreakdown = (usage.cache_creation ?? null) as
+          | { ephemeral_5m_input_tokens?: number; ephemeral_1h_input_tokens?: number }
+          | null;
+        let cc5m = 0;
+        let cc1h = 0;
+        if (ccBreakdown && typeof ccBreakdown === "object") {
+          cc5m = Number(ccBreakdown.ephemeral_5m_input_tokens) || 0;
+          cc1h = Number(ccBreakdown.ephemeral_1h_input_tokens) || 0;
+          // If the breakdown is present but sums to less than the parent total,
+          // trust the parent and attribute the shortfall to 5min (conservative).
+          const diff = ccTotal - (cc5m + cc1h);
+          if (diff > 0) cc5m += diff;
+        } else {
+          cc5m = ccTotal;
         }
+        result.usageRecords.push({
+          dedupKey,
+          model: msg?.model || "<synthetic>",
+          ts: Number.isFinite(tsMs) ? tsMs : 0,
+          input: Number(usage.input_tokens) || 0,
+          cacheRead: Number(usage.cache_read_input_tokens) || 0,
+          cacheCreation5m: cc5m,
+          cacheCreation1h: cc1h,
+          output: Number(usage.output_tokens) || 0,
+          isSidechain,
+        });
       }
-      // Content scan: tool_use (counts + invocations) and tool_result (errors)
       if (Array.isArray(msg?.content)) {
         for (const c of msg.content) {
           if (!c || typeof c !== "object") continue;
@@ -146,14 +203,8 @@ async function parseFile(filePath: string, mtimeMs: number): Promise<TranscriptR
         }
       }
     });
-    rl.on("close", () => {
-      result.models = [...modelSet];
-      resolve(result);
-    });
-    rl.on("error", () => {
-      result.models = [...modelSet];
-      resolve(result);
-    });
+    rl.on("close", () => resolve(result));
+    rl.on("error", () => resolve(result));
   });
 }
@@ -161,7 +212,7 @@ async function getFileResult(filePath: string, mtimeMs: number): Promise<Transcr
   const cached = cache.get(filePath);
   if (cached && cached.mtimeMs === mtimeMs) return cached;
   const fresh = await parseFile(filePath, mtimeMs);
-  if (cached) cache.delete(filePath); // re-insert at tail so FIFO eviction stays correct
+  if (cached) cache.delete(filePath);
   cache.set(filePath, fresh);
   while (cache.size > MAX_CACHE_ENTRIES) {
     const oldest = cache.keys().next().value;
@@ -185,7 +236,135 @@ async function pMapLimit<T, R>(items: T[], limit: number, fn: (x: T) => Promise<
   return out;
 }
-/** Scan all transcripts modified in the last N days. Cached per (filePath, mtime). */
+/**
+ * Walk raw per-file results oldest first, dedup messages globally by
+ * (msg.id, requestId), and merge multiple files belonging to the same logical
+ * session (main + subagents/*) into one TranscriptResult per session.
+ *
+ * Important: do NOT mutate the cached `raws` objects — they're shared across
+ * calls.
+ *
+ * Details worth knowing before changing this:
+ *   - "Oldest first" means ascending `mtimeMs`. A usage record whose dedupKey
+ *     appears in several files is counted once, in the first file visited.
+ *   - Records with an empty dedupKey are never deduplicated; each is counted.
+ *   - Token totals, turnCount, sidechainTurns, models, byModel and
+ *     startTime/endTime are rebuilt from the surviving usage records.
+ *   - invocations, toolCalls and toolErrors are summed across the merged files
+ *     as-is; no dedup is applied to them.
+ *   - The returned objects are new; their `usageRecords` array is left empty.
+ *
+ * @param raws per-file results (typically the cached parseFile output)
+ * @returns one merged result per (project, sessionId), in first-seen order
+ */
+function dedupAndSum(raws: TranscriptResult[]): TranscriptResult[] {
+  const sorted = [...raws].sort((a, b) => a.mtimeMs - b.mtimeMs); // sort a copy so the caller's array is untouched
+  const seen = new Set<string>(); // dedup keys already counted, shared across all sessions
+  const merged = new Map<string, TranscriptResult>(); // one accumulator per project + sessionId
+  for (const r of sorted) {
+    const key = `${r.project}\x00${r.sessionId}`; // NUL separates the two parts of the map key
+    let t = merged.get(key);
+    if (!t) {
+      t = { // fresh accumulator: identity fields copied from the first file seen, counters zeroed
+        filePath: r.filePath,
+        mtimeMs: r.mtimeMs,
+        sessionId: r.sessionId,
+        project: r.project,
+        projectPath: r.projectPath,
+        startTime: 0,
+        endTime: 0,
+        turnCount: 0,
+        models: [],
+        inputTokens: 0,
+        cacheReadTokens: 0,
+        cacheCreationTokens: 0,
+        outputTokens: 0,
+        byModel: {},
+        usageRecords: [],
+        invocations: [],
+        toolCalls: {},
+        toolErrors: 0,
+        sidechainTurns: 0,
+      };
+      merged.set(key, t);
+    } else {
+      // Prefer the main session file's path/mtime as the canonical reference;
+      // a subagent file landed first only if no main yet, which is rare.
+      const incomingIsMain = !r.filePath.includes("/subagents/"); // path test uses "/" separators
+      if (incomingIsMain) {
+        t.filePath = r.filePath;
+        t.mtimeMs = Math.max(t.mtimeMs, r.mtimeMs);
+      }
+    }
+    // Accumulate ancillary fields
+    for (const inv of r.invocations) t.invocations.push(inv); // pushes the same Invocation objects; they are not modified
+    for (const [name, n] of Object.entries(r.toolCalls)) {
+      t.toolCalls[name] = (t.toolCalls[name] ?? 0) + n;
+    }
+    t.toolErrors += r.toolErrors;
+    const modelSet = new Set<string>(t.models); // start from models already collected for this session
+    for (const u of r.usageRecords) {
+      if (u.dedupKey) { // empty key: cannot dedup, fall through and count it
+        if (seen.has(u.dedupKey)) continue; // already counted from an earlier file
+        seen.add(u.dedupKey);
+      }
+      t.inputTokens += u.input;
+      t.cacheReadTokens += u.cacheRead;
+      t.cacheCreationTokens += u.cacheCreation5m + u.cacheCreation1h; // session total combines both buckets
+      t.outputTokens += u.output;
+      t.turnCount += 1;
+      if (u.isSidechain) t.sidechainTurns += 1;
+      modelSet.add(u.model);
+      const bm = t.byModel[u.model] ?? { // per-model bucket, created on first use
+        inputTokens: 0,
+        cacheReadTokens: 0,
+        cacheCreation5mTokens: 0,
+        cacheCreation1hTokens: 0,
+        outputTokens: 0,
+      };
+      bm.inputTokens += u.input;
+      bm.cacheReadTokens += u.cacheRead;
+      bm.cacheCreation5mTokens += u.cacheCreation5m;
+      bm.cacheCreation1hTokens += u.cacheCreation1h;
+      bm.outputTokens += u.output;
+      t.byModel[u.model] = bm;
+      if (u.ts > 0) { // ts of 0 marks a missing timestamp; ignore it for the time range
+        if (!t.startTime || u.ts < t.startTime) t.startTime = u.ts;
+        if (u.ts > t.endTime) t.endTime = u.ts;
+      }
+    }
+    t.models = [...modelSet];
+  }
+  return [...merged.values()];
+}
+async function collectJsonlFiles( // Recursively append .jsonl files under `dir` with mtimeMs >= `cutoff` to `out`.
+  dir: string, // directory to scan
+  cutoff: number, // minimum mtimeMs (inclusive) for a file to be collected
+  out: { filePath: string; mtimeMs: number }[], // results are pushed here; the function itself resolves to nothing
+  depth: number = 0 // how many levels below the starting directory `dir` is
+): Promise<void> {
+  if (depth > 3) return; // <project>/<session>/subagents/<file> is the deepest expected shape
+  let entries;
+  try {
+    entries = await readdir(dir, { withFileTypes: true });
+  } catch { // directory could not be read: contribute nothing from it
+    return;
+  }
+  for (const e of entries) {
+    const fp = join(dir, e.name);
+    if (e.isDirectory()) {
+      await collectJsonlFiles(fp, cutoff, out, depth + 1); // subdirectories are walked one at a time
+      continue;
+    }
+    if (!e.isFile() || !e.name.endsWith(".jsonl")) continue;
+    try {
+      const st = await stat(fp);
+      if (st.mtimeMs >= cutoff) out.push({ filePath: fp, mtimeMs: st.mtimeMs });
+    } catch {
+      // stat failed: skip this file
+    }
+  }
+}
+/**
+ * Scan all transcripts modified in the last N days. Scans both main session
+ * files (<project>/<session>.jsonl) and subagent files
+ * (<project>/<session>/subagents/agent-*.jsonl), then attributes subagent
+ * tokens to their parent session via shared sessionId. Deduped globally by
+ * (msg.id, requestId).
+ */
 export async function getAllTranscripts(daysBack: number = 30): Promise<TranscriptResult[]> {
   const cutoff = Date.now() - daysBack * 24 * 60 * 60 * 1000;
   let projDirs: import("node:fs").Dirent[];
@@ -198,24 +377,9 @@ export async function getAllTranscripts(daysBack: number = 30): Promise<Transcri
   await Promise.all(
     projDirs.map(async (d) => {
       if (!d.isDirectory()) return;
-      const dir = join(PROJECTS_DIR, String(d.name));
-      let entries;
-      try {
-        entries = await readdir(dir, { withFileTypes: true });
-      } catch {
-        return;
-      }
-      for (const e of entries) {
-        if (!e.isFile() || !e.name.endsWith(".jsonl")) continue;
-        const fp = join(dir, e.name);
-        try {
-          const st = await stat(fp);
-          if (st.mtimeMs >= cutoff) candidates.push({ filePath: fp, mtimeMs: st.mtimeMs });
-        } catch {
-          // skip
-        }
-      }
+      await collectJsonlFiles(join(PROJECTS_DIR, String(d.name)), cutoff, candidates);
     })
   );
-  return pMapLimit(candidates, 16, (c) => getFileResult(c.filePath, c.mtimeMs));
+  const raws = await pMapLimit(candidates, 16, (c) => getFileResult(c.filePath, c.mtimeMs));
+  return dedupAndSum(raws);
 }

package/.next/standalone/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@mbeato/contextscope",
-  "version": "0.1.3",
+  "version": "0.1.5",
   "description": "Local dashboard auditing Claude Code's per-turn token context (skills, agents, commands, CLAUDE.md, MEMORY.md, hooks, MCP) with toggle-based disable and session analytics.",
   "type": "module",
   "bin": {
@@ -12,6 +12,7 @@
     "start": "next start",
     "prod": "next build && next start",
     "lint": "eslint",
+    "refresh-prices": "node scripts/refresh-prices.mjs",
     "prepublishOnly": "next build",
     "release": "test -f .env.publish || (echo 'missing .env.publish — copy .env.publish.example and add your NPM_TOKEN' && exit 1) && set -a && . ./.env.publish && set +a && npm publish"
   },

package/.next/standalone/scripts/refresh-prices.mjs ADDED Viewed

@@ -0,0 +1,58 @@
+#!/usr/bin/env node
+/**
+ * Refresh lib/model-prices.json from LiteLLM's authoritative price list.
+ *
+ * Pulls https://raw.githubusercontent.com/BerriAI/litellm/main/model_prices_and_context_window.json,
+ * keeps only Anthropic models with the cost fields we use, and writes a pruned
+ * JSON to lib/model-prices.json. Run before each contextscope release so npm
+ * users get current prices.
+ *
+ * Usage: node scripts/refresh-prices.mjs
+ */
+import { writeFile } from "node:fs/promises";
+import { fileURLToPath } from "node:url";
+import { dirname, join } from "node:path";
+const SRC = "https://raw.githubusercontent.com/BerriAI/litellm/main/model_prices_and_context_window.json";
+const HERE = dirname(fileURLToPath(import.meta.url));
+const DST = join(HERE, "..", "lib", "model-prices.json");
+const res = await fetch(SRC);
+if (!res.ok) {
+  console.error(`fetch failed: ${res.status} ${res.statusText}`);
+  process.exit(1);
+}
+const all = await res.json();
+const pruned = {};
+for (const [name, m] of Object.entries(all)) {
+  if (m?.litellm_provider !== "anthropic") continue;
+  if (typeof m.input_cost_per_token !== "number") continue;
+  const cc5m = m.cache_creation_input_token_cost ?? 0;
+  pruned[name] = {
+    input: m.input_cost_per_token,
+    output: m.output_cost_per_token ?? 0,
+    cache_read: m.cache_read_input_token_cost ?? 0,
+    cache_creation_5m: cc5m,
+    // Anthropic's documented 1hr cache rate is 2x the 5min rate.
+    // Fall back to 2x when LiteLLM doesn't list it explicitly.
+    cache_creation_1h: m.cache_creation_input_token_cost_above_1hr ?? cc5m * 2,
+  };
+}
+const sorted = Object.fromEntries(Object.entries(pruned).sort(([a], [b]) => a.localeCompare(b)));
+await writeFile(
+  DST,
+  JSON.stringify(
+    {
+      _source: SRC,
+      _refreshedAt: new Date().toISOString(),
+      _description: "Anthropic model prices in USD per token (input, output, cache_read, cache_creation 5min default). Refresh with `npm run refresh-prices`.",
+      models: sorted,
+    },
+    null,
+    2
+  ) + "\n",
+  "utf8"
+);
+console.log(`wrote ${Object.keys(sorted).length} anthropic models → ${DST}`);