npm - modelmeter-collect - Versions diffs - 0.8.0 → 0.10.0 - Mend

modelmeter-collect 0.8.0 → 0.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

package/README.md CHANGED

@@ -12,13 +12,23 @@ It dedupes (state in `~/.modelmeter/collector-state.json`), so every run is safe
 Not covered: the **ChatGPT** consumer app (no per-message token data exists) and **Cursor**
 on a Pro plan (usage stays on Cursor's servers).
-## Quick start
+## Try it, no account
+```bash
+# See where your Claude Code / Codex tokens go - signals + tips, runs locally:
+npx modelmeter-collect
+```
+With no token configured this reads your local logs and prints your cache reuse, top MCP
+server, context-bloat, and recommendations. Nothing is sent.
+## Track it over time
 ```bash
 # 1. Grab an ingest token from the Providers tab at https://modelmeter.dev, then:
 npx modelmeter-collect init mm_live_xxxxxxxx
-# 2. Backfill the last couple of weeks:
+# 2. Backfill the last couple of weeks (now that a token is saved, it reports usage):
 npx modelmeter-collect
 # Preview what would be sent, without sending:

package/cli.mjs CHANGED

@@ -23,6 +23,7 @@ import {
   claudeSessionSummary,
   codexSessionSummary,
   buildLocalRecommendations,
+  summarizeSignals,
 } from './lib.mjs'
 const HOME = homedir()
@@ -72,8 +73,9 @@ Commands:
           status, and exactly what would be sent. Add --recommendations for
           local optimization tips (cache, MCP, output, context bloat), or
           --payload for the raw JSON (token counts only, never transcript text).
-  (none)  Scan Claude Code + Codex logs and report token counts. Deduped,
-          so it is safe to run repeatedly. MODELMETER_DRYRUN=1 previews only.
+  (none)  No token yet? Shows your local optimization signals + tips from
+          Claude Code / Codex logs, no account needed. With a token saved,
+          it scans and reports usage (deduped, safe to run repeatedly).
 It sends only model names and token counts. Never your prompts, never your keys.
 Get an ingest token from the Providers tab at https://modelmeter.dev`)
@@ -185,7 +187,7 @@ function recentSessionFiles(dir, cutoffMs, limit) {
     .map((x) => x.p)
 }
-function printRecommendations(cutoffMs) {
+function readSummaries(cutoffMs) {
   const summaries = []
   const sources = [
     [join(HOME, '.claude', 'projects'), claudeSessionSummary],
@@ -203,6 +205,27 @@ function printRecommendations(cutoffMs) {
       if (summary) summaries.push(summary)
     }
   }
+  return summaries
+}
+function pct(x) {
+  return `${Math.round(x * 100)}%`
+}
+// A glance at the optimization signals (the same dimensions ModelMeter surfaces), so
+// the command shows value, not just discovery.
+function printSignals(summaries) {
+  if (summaries.length === 0) return
+  const s = summarizeSignals(summaries)
+  console.log(`\nOptimization signals (last 14 days, ${s.sessions} sessions, computed locally):`)
+  console.log(`  cache reuse:    ${pct(s.cacheRate)}`)
+  console.log(`  output share:   ${pct(s.outputShare)}`)
+  if (s.reasoningShare >= 0.005) console.log(`  reasoning:      ${pct(s.reasoningShare)} of output`)
+  if (s.topMcp) console.log(`  top MCP:        ${s.topMcp} (${pct(s.topMcpShare)} of tool tokens)`)
+  console.log(`  context bloat:  ${s.bloatedSessions} session${s.bloatedSessions === 1 ? '' : 's'} grew past 2x`)
+}
+function printRecommendations(summaries) {
   console.log('\nLocal recommendations (computed from your logs, nothing sent):')
   const recs = buildLocalRecommendations(summaries)
   if (recs.length === 0) {
@@ -233,7 +256,7 @@ if (cmd === 'doctor') {
     }),
   )
   if (args.includes('--recommendations')) {
-    printRecommendations(cutoffMs)
+    printRecommendations(readSummaries(cutoffMs))
     process.exit(0)
   }
   if (args.includes('--payload')) {
@@ -241,6 +264,7 @@ if (cmd === 'doctor') {
     process.env.MODELMETER_DRYRUN = '1'
     await runCollector() // prints the exact payload (counts only), then exits
   } else {
+    printSignals(readSummaries(cutoffMs))
     console.log(
       '\nRun `npx modelmeter-collect doctor --recommendations` for local optimization tips, or',
     )
@@ -249,5 +273,25 @@ if (cmd === 'doctor') {
   }
 }
-// Default: scan and report.
-await runCollector()
+// Default: with a token configured, scan and report (the hook / scheduled path).
+// Without one, this is a new user trying it - show the local value, no account needed.
+const cfg = readConfig()
+const configured = Boolean(process.env.MODELMETER_TOKEN || cfg.token)
+if (configured) {
+  await runCollector()
+} else {
+  const cutoffMs = Date.now() - 14 * 86_400_000
+  const summaries = readSummaries(cutoffMs)
+  console.log('ModelMeter: where your Claude Code and Codex tokens go. Local, token counts only.\n')
+  if (summaries.length === 0) {
+    console.log('No Claude Code or Codex session logs found in the last 14 days.')
+    console.log('Use one of those tools, then run `npx modelmeter-collect` again.')
+    process.exit(0)
+  }
+  printSignals(summaries)
+  printRecommendations(summaries)
+  console.log('\nThis ran entirely on your machine. Nothing was sent.')
+  console.log('Track it over time, across repos, or for your team: get a token at')
+  console.log('https://modelmeter.dev, then `npx modelmeter-collect init <token>`.')
+  process.exit(0)
+}

package/collect.mjs CHANGED

@@ -19,7 +19,8 @@ import {
   chmodSync,
 } from 'node:fs'
 import { homedir } from 'node:os'
-import { join } from 'node:path'
+import { join, dirname } from 'node:path'
+import { createHash } from 'node:crypto'
 import {
   findLastTokenCount,
   codexToolFromEvent,
@@ -29,8 +30,9 @@ import {
   aggregateDaily,
   aggregateHourly,
   aggregateTools,
-  pruneClaudeState,
-  mergeDetailBatches,
+  claudeSessionSummary,
+  codexSessionSummary,
+  sessionSendRow,
 } from './lib.mjs'
 const HOME = homedir()
@@ -64,6 +66,11 @@ const TOKEN = process.env.MODELMETER_TOKEN || cfg.token
 const INGEST_URL = process.env.MODELMETER_INGEST_URL || cfg.ingestUrl
 if (!TOKEN || !INGEST_URL) process.exit(0) // not configured: do nothing, never block
+// Repo attribution is opt-in for the human-readable label only. A repo hash is always
+// sent (opaque). The label (the repo folder name, never the full path) is sent only
+// when explicitly enabled, so a repo name never leaves the machine by default.
+const REPO_LABELS = process.env.MODELMETER_REPO_LABELS === '1' || cfg.repoLabels === true
 // POST JSON with a hard timeout so a stuck network path can never hang a Stop
 // hook or pile up scheduled collectors. Callers handle the thrown abort/error.
 async function postJson(url, body) {
@@ -81,29 +88,13 @@ async function postJson(url, body) {
   }
 }
-let state = { claude: {}, codex: {}, pendingDetail: { hours: [], tools: [] } }
+let state = { claude: {}, codex: {} }
 try {
-  state = {
-    claude: {},
-    codex: {},
-    pendingDetail: { hours: [], tools: [] },
-    ...JSON.parse(readFileSync(STATE_PATH, 'utf8')),
-  }
+  state = { claude: {}, codex: {}, ...JSON.parse(readFileSync(STATE_PATH, 'utf8')) }
 } catch {
   // first run
 }
-function saveState() {
-  if (!existsSync(MM_DIR)) mkdirSync(MM_DIR, { recursive: true })
-  state.claude = pruneClaudeState(state.claude, CLAUDE_STATE_CAP)
-  writeFileSync(STATE_PATH, JSON.stringify(state))
-  try {
-    chmodSync(STATE_PATH, 0o600) // usage metadata is not secret, but keep it owner-only
-  } catch {
-    // best effort on platforms without POSIX perms
-  }
-}
 // --- invocation detection -------------------------------------------------
 let hookInput = null
 if (!process.stdin.isTTY) {
@@ -177,7 +168,7 @@ function scanClaude(files) {
       }
       const ev = claudeEventFromLine(o)
       if (!ev || !ev.id || state.claude[ev.id]) continue
-      state.claude[ev.id] = { ts: ev.occurredAt || ev.occurredOn || '' }
+      state.claude[ev.id] = 1
       events.push(ev)
     }
   }
@@ -234,13 +225,66 @@ function scanCodex(files) {
   }
 }
+let claudeFiles = []
+let codexFiles = []
 if (hookInput?.transcript_path) {
-  scanClaude([hookInput.transcript_path]) // Claude Code hook: just this session
+  claudeFiles = [hookInput.transcript_path] // Claude Code hook: just this session
 } else if (codexNotify) {
-  scanCodex(recentFiles(join(HOME, '.codex', 'sessions'), 2)) // Codex notify: newest session(s)
+  codexFiles = recentFiles(join(HOME, '.codex', 'sessions'), 2) // Codex notify: newest session(s)
 } else {
-  scanClaude(recentFiles(join(HOME, '.claude', 'projects')))
-  scanCodex(recentFiles(join(HOME, '.codex', 'sessions')))
+  claudeFiles = recentFiles(join(HOME, '.claude', 'projects'))
+  codexFiles = recentFiles(join(HOME, '.codex', 'sessions'))
+}
+scanClaude(claudeFiles)
+scanCodex(codexFiles)
+// Per-session summaries (context bloat, comparisons) for the detail endpoint. Hash
+// the session-file basename (the session id), never the path, so no repo/project
+// label leaks here. Recomputed in full each run; the backend overwrites by hash.
+const SESSION_CAP = 500
+function sessionHashFor(file) {
+  const base = file.split('/').pop() || file
+  return createHash('sha256').update(base).digest('hex').slice(0, 40)
+}
+// Resolve a cwd to its git-root for a stable repo identity (so subdirs of one repo do
+// not fragment). Falls back to the cwd if no .git is found (e.g. the repo is gone).
+function repoRoot(cwd) {
+  if (!cwd) return ''
+  let dir = cwd
+  for (let i = 0; i < 12; i++) {
+    try {
+      if (existsSync(join(dir, '.git'))) return dir
+    } catch {
+      // ignore
+    }
+    const parent = dirname(dir)
+    if (parent === dir) break
+    dir = parent
+  }
+  return cwd
+}
+const sessions = []
+for (const [files, summarize] of [
+  [claudeFiles, claudeSessionSummary],
+  [codexFiles, codexSessionSummary],
+]) {
+  for (const file of files.slice(0, SESSION_CAP)) {
+    let text = ''
+    try {
+      text = readFileSync(file, 'utf8')
+    } catch {
+      continue
+    }
+    const summary = summarize(text)
+    const row = sessionSendRow(summary, sessionHashFor(file))
+    if (!row) continue
+    const root = repoRoot(summary.cwd)
+    if (root) {
+      row.repoHash = createHash('sha256').update(root).digest('hex').slice(0, 40)
+      if (REPO_LABELS) row.repoLabel = (root.split('/').pop() || root).slice(0, 80)
+    }
+    sessions.push(row)
+  }
 }
 // Collapse to one row per (provider, model, day) so the request stays small.
@@ -255,11 +299,10 @@ const HOURLY_URL = deriveHourlyUrl(INGEST_URL, process.env.MODELMETER_HOURLY_ING
 // Per-tool / per-MCP attribution. Claude even-splits each turn's tokens across the
 // tools it called; Codex contributes precomputed deltas. Calls are exact.
 const toolsPayload = aggregateTools(events, codexToolDeltas, today)
-const currentDetail = { hours: hourly, tools: toolsPayload }
-const detailBatch = mergeDetailBatches(state.pendingDetail, currentDetail)
-const hasDetail = detailBatch.hours.length > 0 || detailBatch.tools.length > 0
-if (payload.length === 0 && !hasDetail) {
+const haveDaily = payload.length > 0
+const haveDetail = hourly.length > 0 || toolsPayload.length > 0 || sessions.length > 0
+if (!haveDaily && !haveDetail) {
   process.exit(0)
 }
@@ -267,23 +310,34 @@ if (process.env.MODELMETER_DRYRUN) {
   const tally = {}
   for (const e of events) tally[e.provider] = (tally[e.provider] || 0) + 1
   console.log(`DRY RUN: ${events.length} raw events -> ${payload.length} daily rows`, tally)
-  console.log(`         + ${hourly.length} recent hourly rows, ${toolsPayload.length} tool rows -> ${HOURLY_URL}`)
-  if (state.pendingDetail?.hours?.length || state.pendingDetail?.tools?.length) {
-    console.log(
-      `         + pending retry rows: ${state.pendingDetail.hours?.length || 0} hourly, ${state.pendingDetail.tools?.length || 0} tool`,
-    )
-  }
+  console.log(`         + ${hourly.length} recent hourly rows, ${toolsPayload.length} tool rows, ${sessions.length} session summaries -> ${HOURLY_URL}`)
   console.log(JSON.stringify(payload, null, 2))
   if (toolsPayload.length) console.log('tools:', JSON.stringify(toolsPayload, null, 2))
+  if (sessions.length) console.log('sessions:', JSON.stringify(sessions.slice(0, 3), null, 2))
   process.exit(0)
 }
-let committed = false
-if (payload.length > 0) {
+// With no new daily events there is nothing to commit, but session summaries (and any
+// timestamped detail) are recomputed in full each run and must still be sent, so treat
+// that case as already committed.
+let committed = !haveDaily
+if (haveDaily) {
   try {
     const res = await postJson(INGEST_URL, { source: 'collector', events: payload })
     if (res.ok) {
-      saveState()
+      if (!existsSync(MM_DIR)) mkdirSync(MM_DIR, { recursive: true })
+      const claudeIds = Object.keys(state.claude)
+      if (claudeIds.length > CLAUDE_STATE_CAP) {
+        const next = {}
+        for (const id of claudeIds.slice(-CLAUDE_STATE_CAP)) next[id] = 1
+        state.claude = next
+      }
+      writeFileSync(STATE_PATH, JSON.stringify(state))
+      try {
+        chmodSync(STATE_PATH, 0o600) // usage metadata is not secret, but keep it owner-only
+      } catch {
+        // best effort on platforms without POSIX perms
+      }
       committed = true
       console.error(`modelmeter: reported ${payload.length} usage rows`)
     } else {
@@ -292,32 +346,24 @@ if (payload.length > 0) {
   } catch (err) {
     console.error(`modelmeter: ${err.message}`)
   }
-} else {
-  committed = true // retrying previously committed detail rows
 }
-// Additive detail rows are sent only after daily usage is committed. If the detail
-// endpoint fails, keep the merged batch in state and retry on the next run.
-if (committed && hasDetail) {
-  if (!HOURLY_URL) {
-    state.pendingDetail = detailBatch
-    saveState()
-    console.error('modelmeter: detail ingest URL could not be derived; set MODELMETER_HOURLY_INGEST_URL')
-    process.exit(0)
-  }
-  let detailSent = false
+// Detail rows go only after the daily batch is committed (or when there was none), so a
+// daily retry cannot race them. The endpoint applies them in one transaction; retry once
+// to cover a transient failure, then give up (the window self-heals as new data flows).
+if (committed && haveDetail) {
   for (let attempt = 0; attempt < 2; attempt++) {
     try {
-      const res = await postJson(HOURLY_URL, { source: 'collector', ...detailBatch })
-      if (res.ok) {
-        detailSent = true
-        break
-      }
+      const res = await postJson(HOURLY_URL, {
+        source: 'collector',
+        hours: hourly,
+        tools: toolsPayload,
+        sessions,
+      })
+      if (res.ok) break
     } catch {
       // fall through to one retry, then give up
     }
   }
-  state.pendingDetail = detailSent ? { hours: [], tools: [] } : detailBatch
-  saveState()
 }
 process.exit(0)

package/lib.mjs CHANGED

@@ -356,7 +356,9 @@ export function claudeSessionSummary(text) {
     }
   }
   if (requests === 0) return null
-  return { provider: 'anthropic', model, uncached, cacheRead, cacheCreate, output, requests, firstTs, lastTs, cwd, contextSeq, tools }
+  // Claude folds extended-thinking into output_tokens with no separate field, so
+  // reasoning is 0 here (the breakdown is only available for Codex).
+  return { provider: 'anthropic', model, uncached, cacheRead, cacheCreate, output, reasoning: 0, requests, firstTs, lastTs, cwd, contextSeq, tools }
 }
 // Summarize one Codex session from its final cumulative token_count. Codex totals are
@@ -401,7 +403,11 @@ export function codexSessionSummary(text) {
   if (!totals) return null
   const cacheRead = totals.cached_input_tokens || 0
   const uncached = Math.max(0, (totals.input_tokens || 0) - cacheRead)
-  const output = (totals.output_tokens || 0) + (totals.reasoning_output_tokens || 0)
+  // Reasoning tokens bill as output (the priciest tier) but are reported separately and
+  // are otherwise hidden, so keep the breakdown: output is the total billed output and
+  // reasoning is the share of it spent thinking.
+  const reasoning = totals.reasoning_output_tokens || 0
+  const output = (totals.output_tokens || 0) + reasoning
   return {
     provider: 'openai',
     model,
@@ -409,6 +415,7 @@ export function codexSessionSummary(text) {
     cacheRead,
     cacheCreate: 0,
     output,
+    reasoning,
     requests: Math.max(1, requests),
     firstTs,
     lastTs,
@@ -439,6 +446,7 @@ export function sessionSendRow(summary, sessionHash) {
     cacheRead: summary.cacheRead,
     cacheCreation: summary.cacheCreate,
     output: summary.output,
+    reasoning: summary.reasoning || 0,
     maxInputTurn: bloat ? bloat.max : 0,
     first5Avg: bloat ? bloat.first5 : 0,
     last5Avg: bloat ? bloat.last5 : 0,
@@ -464,6 +472,7 @@ export function buildLocalRecommendations(summaries) {
   let cacheRead = 0
   let cacheCreate = 0
   let output = 0
+  let reasoning = 0
   let requests = 0
   const tools = {}
   for (const s of list) {
@@ -471,6 +480,7 @@ export function buildLocalRecommendations(summaries) {
     cacheRead += s.cacheRead
     cacheCreate += s.cacheCreate
     output += s.output
+    reasoning += s.reasoning || 0
     requests += s.requests
     for (const [g, v] of Object.entries(s.tools || {})) {
       const cur = tools[g] || { tokens: 0, calls: 0 }
@@ -547,7 +557,19 @@ export function buildLocalRecommendations(summaries) {
     })
   }
-  // 4. Context bloat (Claude sessions carry a per-turn sequence).
+  // 4. Reasoning share (Codex). Reasoning bills as output, the priciest tier, but is
+  // hidden by default, so a large reasoning share is invisible cost.
+  if (output > 100_000 && reasoning / output > 0.4) {
+    recs.push({
+      kind: 'reasoning',
+      level: 'warn',
+      text: `Reasoning is ${pct(
+        reasoning / output,
+      )} of your output tokens, the priciest tier, and hidden by default. Lower the reasoning effort for routine tasks and reserve high effort for genuinely hard problems.`,
+    })
+  }
+  // 5. Context bloat (Claude sessions carry a per-turn sequence).
   let worst = null
   for (const s of list) {
     const b = sessionBloat(s.contextSeq)
@@ -567,3 +589,45 @@ export function buildLocalRecommendations(summaries) {
   return recs
 }
+// Headline optimization signals (metrics, not recommendations) for `doctor` to show
+// at a glance: the same dimensions ModelMeter surfaces, computed locally.
+export function summarizeSignals(summaries) {
+  const list = (summaries || []).filter(Boolean)
+  let uncached = 0
+  let cacheRead = 0
+  let cacheCreate = 0
+  let output = 0
+  let reasoning = 0
+  let bloated = 0
+  const tools = {}
+  for (const s of list) {
+    uncached += s.uncached
+    cacheRead += s.cacheRead
+    cacheCreate += s.cacheCreate
+    output += s.output
+    reasoning += s.reasoning || 0
+    const b = sessionBloat(s.contextSeq)
+    if (b && b.last5 > b.first5 * 2 && b.last5 > 30_000) bloated++
+    for (const [g, v] of Object.entries(s.tools || {})) {
+      tools[g] = (tools[g] || 0) + v.tokens
+    }
+  }
+  const inputTotal = uncached + cacheRead + cacheCreate
+  const total = inputTotal + output
+  const toolArr = Object.entries(tools)
+    .map(([tool, tok]) => ({ tool, tok }))
+    .sort((a, b) => b.tok - a.tok)
+  const toolTotal = toolArr.reduce((n, t) => n + t.tok, 0)
+  const topMcp = toolArr.find((t) => t.tool.startsWith('mcp:'))
+  return {
+    sessions: list.length,
+    totalTokens: total,
+    cacheRate: inputTotal > 0 ? cacheRead / inputTotal : 0,
+    outputShare: total > 0 ? output / total : 0,
+    reasoningShare: output > 0 ? reasoning / output : 0,
+    topMcp: topMcp ? topMcp.tool : null,
+    topMcpShare: topMcp && toolTotal > 0 ? topMcp.tok / toolTotal : 0,
+    bloatedSessions: bloated,
+  }
+}

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "modelmeter-collect",
-  "version": "0.8.0",
+  "version": "0.10.0",
   "description": "Report LLM token usage from local Claude Code / Codex logs to ModelMeter. Token counts only, never prompts or keys.",
   "type": "module",
   "bin": {