npm - @jhizzard/termdeck - Versions diffs - 1.0.1 → 1.0.3 - Mend

@jhizzard/termdeck 1.0.1 → 1.0.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/package.json +2 -1
package/packages/cli/src/init-mnestra.js +175 -3
package/packages/cli/src/init-rumen.js +35 -8
package/packages/server/src/setup/audit-upgrade.js +126 -3
package/packages/server/src/setup/mnestra-migrations/017_memory_sessions_session_metadata.sql +94 -0
package/packages/stack-installer/README.md +73 -0
package/packages/stack-installer/assets/hooks/README.md +172 -0
package/packages/stack-installer/assets/hooks/memory-session-end.js +898 -0

package/packages/stack-installer/assets/hooks/memory-session-end.js ADDED Viewed

@@ -0,0 +1,898 @@
+/**
+ * TermDeck session-end memory hook (Mnestra-direct, no rag-system dependency).
+ *
+ * Vendored into ~/.claude/hooks/memory-session-end.js by @jhizzard/termdeck-stack.
+ * Wired into ~/.claude/settings.json under hooks.SessionEnd — fires once per
+ * Claude Code session close (`/exit`, Ctrl+D, terminal close, or process kill).
+ *
+ * History: this hook was originally registered under hooks.Stop, which fires
+ * after every assistant turn. That meant the same transcript got embedded and
+ * INSERTed dozens of times per session (and most fired with env-var-missing
+ * because Claude Code launched outside TermDeck doesn't have SUPABASE_URL in
+ * scope). Sprint 48 close-out moved registration to SessionEnd (one row per
+ * session, fires deterministically on /exit) AND added the secrets-env
+ * fallback below so a standalone-Claude-Code launch picks up the credentials
+ * without needing them in the parent shell.
+ *
+ * Behavior:
+ *   1. Reads {transcript_path, cwd, session_id, sessionType?, source_agent?}
+ *      from stdin (Claude Code SessionEnd payload, or — Sprint 50 T1 — a
+ *      server-driven invocation for non-Claude agents). source_agent
+ *      defaults to 'claude' when absent (Claude Code's existing hook
+ *      payload doesn't carry it; the TermDeck server's per-adapter
+ *      onPanelClose interceptor sets it explicitly for codex/gemini/grok).
+ *   2. Loads ~/.termdeck/secrets.env into process.env if any required key is
+ *      absent OR is a literal `${VAR}` placeholder (Sprint 47.5 hotfix
+ *      discipline — Claude Code does not expand `${VAR}` in MCP env, and we
+ *      can't trust the parent shell to have sourced secrets.env).
+ *   3. Skips small transcripts (< MIN_TRANSCRIPT_BYTES, default 5KB).
+ *   4. Validates env vars; logs and exits cleanly if any required key is still
+ *      missing after the secrets.env fallback.
+ *   5. Detects project from cwd against PROJECT_MAP (else "global"). Extend the
+ *      map by editing the array below — see assets/hooks/README.md for guidance.
+ *   6. Dispatches to a transcript parser by sessionType (Sprint 45 T4): Claude
+ *      JSONL, Codex JSONL, Gemini single-JSON, or auto-detect when sessionType
+ *      is absent. Builds a coarse summary from the resulting message list
+ *      (last ~30 message excerpts).
+ *   7. Embeds the summary via OpenAI text-embedding-3-small.
+ *   8. POSTs ONE row to Supabase /rest/v1/memory_items with source_type='session_summary'.
+ *   9. (Sprint 51.6 T3) POSTs ONE row to Supabase /rest/v1/memory_sessions with
+ *      Prefer: resolution=merge-duplicates so SessionEnd-fires-twice resolves
+ *      to a single row. Requires Mnestra migration 017 on canonical installs;
+ *      petvetbid already has the rich schema from rag-system bootstrap.
+ *  10. Logs every step to ~/.claude/hooks/memory-hook.log.
+ *
+ * Version stamp (Sprint 51.6 T3 — hook upgrade gap fix):
+ *   The marker `@termdeck/stack-installer-hook v<N>` below is read by both
+ *   stack-installer's installSessionEndHook (version-aware overwrite under
+ *   --yes) and `termdeck init --mnestra` (refreshBundledHookIfNewer step).
+ *   Bump the integer whenever a change to this file should overwrite an
+ *   already-installed copy on the user's machine — e.g. a new write path,
+ *   a new transcript parser, a default PROJECT_MAP change. Comment-only
+ *   tweaks do not need a bump.
+ *
+ *   v2 (Sprint 51.7 T2 — metadata completeness + wire-up insurance):
+ *     - parseTranscriptMetadata() now populates memory_sessions.started_at /
+ *       duration_minutes / facts_extracted from per-message timestamps and
+ *       memory_remember tool_use counts, closing the v1 "minimum viable row"
+ *       gap Codex flagged at Sprint 51.6 Phase B.
+ *     - Stamp bump load-bearing as INSURANCE for the Sprint 51.6 wire-up bug
+ *       (T1 fix landing in same v1.0.3 wave): an installed-v1 user upgrading
+ *       to bundled-v2 always passes the `installed >= bundled` short-circuit
+ *       at init-mnestra.js:550 and reaches the refresh path.
+ *
+ * @termdeck/stack-installer-hook v2
+ *
+ * Required env vars (validated at entry, after the secrets.env fallback):
+ *   - SUPABASE_URL              e.g. https://<project-ref>.supabase.co
+ *   - SUPABASE_SERVICE_ROLE_KEY      service-role key (NOT the anon key — needs INSERT on memory_items)
+ *   - OPENAI_API_KEY            sk-... for text-embedding-3-small
+ *
+ * Optional:
+ *   - TERMDECK_HOOK_DEBUG=1            verbose logging
+ *   - TERMDECK_HOOK_MIN_BYTES=5000     transcript size threshold
+ *   - TERMDECK_SESSION_TYPE=...        override sessionType when payload lacks it
+ *
+ * Fail-soft contract: any error (network, parse, env-var-missing, malformed transcript)
+ * logs and exits 0. Never blocks Claude Code session close.
+ *
+ * Co-existence with Joshua's personal rag-system hook: this bundled hook writes
+ * source_type='session_summary' (one row per session). Joshua's personal hook
+ * writes source_type='fact' (multiple rows from extractFacts pipeline). Different
+ * source_types coexist in memory_items without dedup collisions.
+ */
+'use strict';
+const { existsSync, statSync, appendFileSync, readFileSync } = require('fs');
+const { join } = require('path');
+const os = require('os');
+const LOG_FILE = join(os.homedir(), '.claude', 'hooks', 'memory-hook.log');
+// Resolved per-call so tests can override via TERMDECK_HOOK_SECRETS_PATH
+// (the const-at-load-time pattern would freeze the path before any test
+// that mutates HOME or the override env var gets a chance to take effect).
+function resolveSecretsPath() {
+  return process.env.TERMDECK_HOOK_SECRETS_PATH
+    || join(os.homedir(), '.termdeck', 'secrets.env');
+}
+// PROJECT_MAP — most-specific-first ordering (Sprint 41 design).
+// Patterns match against the cwd reported by Claude Code at SessionEnd.
+// First match wins; falls through to "global".
+//
+// Sprint 51.6 (T1 side finding b): a previous version shipped this array
+// empty, which caused every session to tag as "global" — orphaning rows
+// from project-scoped memory_recall queries. The default below restores
+// the most-specific-first taxonomy from Sprint 41 T1, generalized for
+// universal shipping. Users still extend in place by editing this array.
+//
+// Patterns NOT specific to Joshua's filesystem (e.g. /\/PVB\//i, /\/DOR\//i)
+// are kept because they're benign on other machines — the regex simply
+// doesn't fire on cwds that don't contain those segments. The chopin-
+// nashville catch-all stays LAST (structural invariant) so a TermDeck cwd
+// inside ChopinNashville/SideHustles/ resolves to "termdeck", not the
+// catch-all.
+const PROJECT_MAP = [
+  // ── Active code projects (most-specific FIRST) ──
+  { pattern: /\/SideHustles\/TermDeck\/termdeck/i,           project: 'termdeck' },
+  { pattern: /\/Graciella\/engram(\/|$)/i,                    project: 'mnestra' },
+  { pattern: /\/Graciella\/rumen(\/|$)/i,                     project: 'rumen' },
+  { pattern: /\/Graciella\/rag-system(\/|$)/i,                project: 'rag-system' },
+  { pattern: /\/ChopinInBohemia\/podium(\/|$)/i,              project: 'podium' },
+  { pattern: /\/ChopinInBohemia(\/|$)/i,                      project: 'chopin-in-bohemia' },
+  { pattern: /\/SideHustles\/SchedulingApp(\/|$)/i,           project: 'chopin-scheduler' },
+  { pattern: /\/ChopinNashville\/SchedulingApp(\/|$)/i,       project: 'chopin-scheduler' },
+  { pattern: /\/Graciella\/PVB(\/|$)|\/PVB\/pvb(\/|$)/i,      project: 'pvb' },
+  { pattern: /\/Unagi\/gorgias-ticket-monitor(\/|$)/i,        project: 'claimguard' },
+  { pattern: /\/ChopinNashville\/SideHustles\/ClaimGuard(\/|$)/i, project: 'claimguard' },
+  { pattern: /\/Documents\/DOR(\/|$)/i,                       project: 'dor' },
+  { pattern: /\/Graciella\/joshuaizzard-dev(\/|$)/i,          project: 'portfolio' },
+  { pattern: /\/Graciella\/imessage-reader(\/|$)/i,           project: 'imessage-reader' },
+  // ── chopin-nashville catch-all (MUST be LAST among /ChopinNashville/ matchers).
+  // Sprint 35 + 41 lesson: any /ChopinNashville/-matching pattern placed below
+  // this entry gets shadowed and the row mis-tags as 'chopin-nashville'.
+  { pattern: /\/ChopinNashville(\/|$)/i,                      project: 'chopin-nashville' },
+];
+const MIN_TRANSCRIPT_BYTES = parseInt(process.env.TERMDECK_HOOK_MIN_BYTES || '5000', 10);
+const DEBUG = process.env.TERMDECK_HOOK_DEBUG === '1';
+function log(msg) {
+  try { appendFileSync(LOG_FILE, `[${new Date().toISOString()}] ${msg}\n`); }
+  catch (_) { /* fail-soft */ }
+}
+function debug(msg) { if (DEBUG) log(`[debug] ${msg}`); }
+function detectProject(cwd) {
+  for (const { pattern, project } of PROJECT_MAP) {
+    if (pattern.test(cwd)) return project;
+  }
+  return 'global';
+}
+// Treat values shaped like `${VAR}` as unset. Claude Code does not expand
+// shell placeholders in MCP env or hook env, so a literal `${SUPABASE_URL}`
+// is non-empty-but-invalid — the same trap that caused the Sprint 47.5
+// hotfix on the stack-installer + mnestra MCP. Mirroring that discipline
+// here keeps the hook resilient if any future tooling regresses to the
+// placeholder pattern.
+function isUnexpandedPlaceholder(v) {
+  return typeof v === 'string' && v.startsWith('${') && v.endsWith('}');
+}
+// Load ~/.termdeck/secrets.env into process.env when keys are absent or
+// hold an unexpanded `${VAR}` placeholder. Concrete values already in
+// process.env always win — the fallback only fills gaps. Silent no-op if
+// the file is missing. Mirrors mnestra's loadTermdeckSecretsFallback so
+// the hook works in three launch contexts:
+//   1. Inside TermDeck PTY (Sprint 48 T4 PTY env merge supplies the vars).
+//   2. Standalone Claude Code launched from a shell with secrets.env sourced.
+//   3. Standalone Claude Code launched from a vanilla shell (this fallback).
+function loadTermdeckSecretsFallback() {
+  const secretsPath = resolveSecretsPath();
+  if (!existsSync(secretsPath)) return;
+  let raw;
+  try { raw = readFileSync(secretsPath, 'utf8'); }
+  catch (err) {
+    log(`secrets-env-read-failed: ${err && err.message ? err.message : String(err)}`);
+    return;
+  }
+  let loaded = 0;
+  for (const line of raw.split('\n')) {
+    const trimmed = line.trim();
+    if (!trimmed || trimmed.startsWith('#')) continue;
+    const m = trimmed.match(/^([A-Z_][A-Z0-9_]*)=(.*)$/);
+    if (!m) continue;
+    const key = m[1];
+    const cur = process.env[key];
+    if (cur && !isUnexpandedPlaceholder(cur)) continue;
+    let v = m[2];
+    if (v.length >= 2 && (v[0] === '"' || v[0] === "'") && v[v.length - 1] === v[0]) {
+      v = v.slice(1, -1);
+    }
+    process.env[key] = v;
+    loaded++;
+  }
+  if (loaded > 0) debug(`secrets-env-loaded: ${loaded} keys from ${secretsPath}`);
+}
+function readEnv() {
+  loadTermdeckSecretsFallback();
+  const required = ['SUPABASE_URL', 'SUPABASE_SERVICE_ROLE_KEY', 'OPENAI_API_KEY'];
+  const missing = required.filter((k) => {
+    const v = process.env[k];
+    return !v || isUnexpandedPlaceholder(v);
+  });
+  if (missing.length) {
+    log(`env-var-missing: ${missing.join(', ')} — set these in ~/.termdeck/secrets.env or your shell to enable Mnestra ingestion. Skipping.`);
+    return null;
+  }
+  return {
+    supabaseUrl: process.env.SUPABASE_URL.replace(/\/$/, ''),
+    supabaseKey: process.env.SUPABASE_SERVICE_ROLE_KEY,
+    openaiKey: process.env.OPENAI_API_KEY,
+  };
+}
+// ──────────────────────────────────────────────────────────────────────────
+// Sprint 45 T4 — adapter-pluggable transcript parsers.
+//
+// Each parser takes raw transcript file contents (string) and returns a
+// `{ role: 'user'|'assistant', content: string }[]` array — the shape
+// buildSummary() consumes. Adapters in packages/server/src/agent-adapters/
+// own the canonical parser logic; this file inlines copies because the
+// hook ships standalone to ~/.claude/hooks/ where it can't `require()`
+// from the TermDeck server package. When new agents add adapters, mirror
+// their parseTranscript function body here — keep the two in sync.
+// (Sprint 46 candidate: a sync script that codegens this section from
+// agent-adapters/*.js, analogous to scripts/sync-agent-instructions.js
+// for CLAUDE.md / AGENTS.md / GEMINI.md mirroring.)
+//
+// When sessionType is absent or unknown, parseAutoDetect runs a per-line
+// best-effort that handles Claude JSONL, Codex JSONL, AND Gemini's single
+// JSON-object shape. This is the pre-T4 stop-gap T1+T2 landed inline —
+// preserved as the fallback so existing hook payloads (Claude Code Stop,
+// no sessionType field) continue working for any of the three agents.
+// Once Sprint 46 wires sessionType into payloads, the auto path narrows
+// to a legacy compatibility role.
+// ──────────────────────────────────────────────────────────────────────────
+function parseClaudeJsonl(raw) {
+  if (typeof raw !== 'string' || raw.length === 0) return [];
+  const lines = raw.split('\n').filter(Boolean);
+  const messages = [];
+  for (const line of lines) {
+    let msg;
+    try { msg = JSON.parse(line); } catch (_) { continue; }
+    const role = msg && msg.message && msg.message.role;
+    if (role !== 'user' && role !== 'assistant') continue;
+    const content = msg.message.content;
+    let text = '';
+    if (typeof content === 'string') {
+      text = content;
+    } else if (Array.isArray(content)) {
+      text = content
+        .filter((c) => c && c.type === 'text')
+        .map((c) => c.text || '')
+        .join(' ');
+    }
+    if (text) messages.push({ role, content: text.slice(0, 400) });
+  }
+  return messages;
+}
+function parseCodexJsonl(raw) {
+  if (typeof raw !== 'string' || raw.length === 0) return [];
+  const lines = raw.split('\n').filter(Boolean);
+  const messages = [];
+  for (const line of lines) {
+    let msg;
+    try { msg = JSON.parse(line); } catch (_) { continue; }
+    if (!msg || msg.type !== 'response_item') continue;
+    const payload = msg.payload;
+    if (!payload || payload.type !== 'message') continue;
+    const role = payload.role;
+    // Codex's `developer` role carries the sandbox/permissions prelude — skip.
+    if (role !== 'user' && role !== 'assistant') continue;
+    const content = payload.content;
+    let text = '';
+    if (typeof content === 'string') {
+      text = content;
+    } else if (Array.isArray(content)) {
+      // Codex uses `input_text` (user) and `output_text` (assistant); accept
+      // plain `text` for forward-compat with future Codex CLI versions.
+      text = content
+        .filter((c) => c && (c.type === 'input_text' || c.type === 'output_text' || c.type === 'text'))
+        .map((c) => c.text || '')
+        .join(' ');
+    }
+    if (text) messages.push({ role, content: text.slice(0, 400) });
+  }
+  return messages;
+}
+function parseGeminiJson(raw) {
+  // Gemini CLI persists each session as a single JSON object (NOT JSONL):
+  //   { sessionId, projectHash, startTime, lastUpdated, kind,
+  //     messages: [{ id, timestamp, type: 'user'|'gemini', content }] }
+  // user content: [{ text }]; gemini content: string. Map type='gemini' →
+  // role='assistant' to match the rest of the dispatch shape.
+  if (typeof raw !== 'string' || raw.length === 0) return [];
+  let obj;
+  try { obj = JSON.parse(raw); } catch (_) { return []; }
+  if (!obj || !Array.isArray(obj.messages)) return [];
+  const messages = [];
+  for (const msg of obj.messages) {
+    if (!msg || typeof msg !== 'object') continue;
+    let role;
+    if (msg.type === 'user') role = 'user';
+    else if (msg.type === 'gemini' || msg.type === 'assistant') role = 'assistant';
+    else continue;
+    const content = msg.content;
+    let text = '';
+    if (typeof content === 'string') {
+      text = content;
+    } else if (Array.isArray(content)) {
+      text = content
+        .filter((c) => c && typeof c.text === 'string')
+        .map((c) => c.text)
+        .join(' ');
+    }
+    if (text) messages.push({ role, content: text.slice(0, 400) });
+  }
+  return messages;
+}
+// Sprint 50 T1 — Grok parser. Mirrors packages/server/src/agent-adapters/grok.js
+// parseTranscript: accepts either a JSON array or JSONL of `{role, content}`
+// objects, where content is a string OR an array of `{type, text, ...}` parts
+// (AI SDK provider shape). Tool-call / tool-result / reasoning parts are
+// skipped — only the `type:'text'` parts contribute to the summary.
+//
+// The JSON envelope is produced server-side by the Grok adapter's
+// `resolveTranscriptPath` (which extracts from ~/.grok/grok.db SQLite via
+// better-sqlite3 and writes a tempfile). The hook itself never opens grok.db
+// — that would require better-sqlite3 to be reachable from ~/.claude/hooks/,
+// which isn't part of the install contract. The transcript_path the server
+// hands the hook is the tempfile, and the sessionType in the payload is
+// 'grok' so this parser is the one selected.
+function parseGrokJson(raw) {
+  if (typeof raw !== 'string' || raw.length === 0) return [];
+  let messages = null;
+  try {
+    const parsed = JSON.parse(raw);
+    if (Array.isArray(parsed)) messages = parsed;
+  } catch (_) { /* fall through to JSONL */ }
+  if (!messages) {
+    messages = [];
+    for (const line of raw.split('\n')) {
+      const trimmed = line.trim();
+      if (!trimmed) continue;
+      try {
+        const obj = JSON.parse(trimmed);
+        if (obj && typeof obj === 'object') messages.push(obj);
+      } catch (_) { continue; }
+    }
+  }
+  const out = [];
+  for (const msg of messages) {
+    if (!msg || typeof msg !== 'object') continue;
+    const role = msg.role;
+    if (role !== 'user' && role !== 'assistant') continue;
+    const content = msg.content;
+    let text = '';
+    if (typeof content === 'string') {
+      text = content;
+    } else if (Array.isArray(content)) {
+      text = content
+        .filter((c) => c && c.type === 'text' && typeof c.text === 'string')
+        .map((c) => c.text)
+        .join(' ');
+    }
+    if (text) out.push({ role, content: text.slice(0, 400) });
+  }
+  return out;
+}
+function parseAutoDetect(raw) {
+  // Fallback when sessionType is absent. Tries Gemini's single-JSON shape
+  // first (cheap to detect — starts with `{` and has a top-level `messages`
+  // array), then falls through to per-line Claude/Codex JSONL detection.
+  // This preserves T1+T2's pre-T4 multi-shape stop-gap so any Claude Code
+  // Stop payload (which doesn't carry sessionType) keeps ingesting whichever
+  // CLI's transcript path landed there.
+  if (typeof raw !== 'string' || raw.length === 0) return [];
+  const trimmed = raw.trim();
+  if (trimmed.startsWith('{')) {
+    const geminiTry = parseGeminiJson(raw);
+    if (geminiTry.length > 0) return geminiTry;
+  }
+  const lines = raw.split('\n').filter(Boolean);
+  const messages = [];
+  for (const line of lines) {
+    let msg;
+    try { msg = JSON.parse(line); } catch (_) { continue; }
+    let role;
+    let content;
+    let textBlockType = 'text';
+    if (msg && msg.message && (msg.message.role === 'user' || msg.message.role === 'assistant')) {
+      role = msg.message.role;
+      content = msg.message.content;
+    } else if (msg && msg.type === 'response_item' && msg.payload && msg.payload.type === 'message') {
+      role = msg.payload.role;
+      if (role !== 'user' && role !== 'assistant') continue;
+      content = msg.payload.content;
+      textBlockType = null; // Codex content blocks use input_text/output_text
+    } else {
+      continue;
+    }
+    let text = '';
+    if (typeof content === 'string') {
+      text = content;
+    } else if (Array.isArray(content)) {
+      text = content
+        .filter((c) => c && (
+          textBlockType === null
+            ? (c.type === 'input_text' || c.type === 'output_text' || c.type === 'text')
+            : c.type === textBlockType
+        ))
+        .map((c) => c.text || '')
+        .join(' ');
+    }
+    if (text) messages.push({ role, content: text.slice(0, 400) });
+  }
+  return messages;
+}
+const TRANSCRIPT_PARSERS = {
+  'claude-code': parseClaudeJsonl,
+  'codex': parseCodexJsonl,
+  'gemini': parseGeminiJson,
+  // Sprint 50 T1 — grok parser. Server-side `resolveTranscriptPath` extracts
+  // ~/.grok/grok.db rows via better-sqlite3 and writes a JSON envelope to a
+  // tempfile; the hook reads that tempfile with parseGrokJson here.
+  'grok': parseGrokJson,
+};
+const DEFAULT_SESSION_TYPE = 'auto';
+function selectTranscriptParser(sessionType) {
+  if (sessionType && TRANSCRIPT_PARSERS[sessionType]) {
+    return { parser: TRANSCRIPT_PARSERS[sessionType], sessionType };
+  }
+  return { parser: parseAutoDetect, sessionType: 'auto' };
+}
+// ──────────────────────────────────────────────────────────────────────────
+// Sprint 51.7 T2 — transcript metadata extractor for memory_sessions.
+//
+// The v1 bundled hook (Sprint 51.6 T3) intentionally shipped the "minimum
+// viable row" — postMemorySession set started_at, duration_minutes, and
+// facts_extracted to NULL/0 because v1 omitted transcript parsing for
+// per-message timestamps. The legacy rag-system writer
+// (~/Documents/Graciella/rag-system/src/scripts/process-session.ts) populated
+// those fields by parsing the transcript JSONL passed to it on stdin, and
+// petvetbid's 289 baseline rows carried the rich shape from that writer.
+// v2 closes the gap in pure Node so the bundled hook reaches parity without
+// the rag-system dependency (Class E hidden-dependency rule).
+//
+// Heuristic for facts_extracted: count distinct `tool_use` blocks whose
+// `name` matches a memory_remember MCP tool. Conservative by design — a
+// regex like /Remember:/ inside summary text would over-match quoted user
+// content (e.g., "the user typed 'Remember:' in their prompt"). Counting
+// tool_use blocks instead measures what was actually written into the store
+// during the session, which is the semantic the rag-system writer used.
+//
+// Tool name variants observed in real transcripts (T4-CODEX 11:09 ET pre-
+// audit confirmed both prefixes are live in `~/.claude/projects/`):
+//   - `memory_remember`               (bare; CC native + future-proofing)
+//   - `mcp__mnestra__memory_remember` (current Mnestra MCP, post-rename)
+//   - `mcp__memory__memory_remember`  (legacy MCP server name from when
+//                                       the project was called "memory")
+// Counting all three avoids undercounting on existing user transcripts.
+// ──────────────────────────────────────────────────────────────────────────
+const FACT_TOOL_NAMES = new Set([
+  'memory_remember',
+  'mcp__mnestra__memory_remember',
+  'mcp__memory__memory_remember',
+]);
+// Sprint 51.7 T2 / T4-CODEX 11:13 ET catch: each adapter shipped by this
+// hook stores message content under a different key shape, and we have to
+// match all of them or facts_extracted under-counts whenever a non-Claude
+// session writes to memory_sessions. Mirror the shapes already documented
+// at the top of TRANSCRIPT_PARSERS:
+//
+//   - Claude Code (current):  msg.message.content[]
+//   - Grok (Sprint 50 T1):    msg.content[] (flat, AI SDK provider shape)
+//   - Codex (response_item):  msg.payload.content[] when msg.type === 'response_item'
+//
+// Gemini's single-JSON envelope doesn't apply per-line — its content lives
+// inside a top-level messages array, and each entry's content is a flat
+// array OR a string. extractContentBlocks() handles flat arrays; strings
+// are skipped (no tool_use can hide inside a string).
+function extractContentBlocks(msg) {
+  if (!msg || typeof msg !== 'object') return null;
+  if (msg.message && Array.isArray(msg.message.content)) return msg.message.content;
+  if (Array.isArray(msg.content)) return msg.content;
+  if (msg.type === 'response_item' && msg.payload && Array.isArray(msg.payload.content)) {
+    return msg.payload.content;
+  }
+  return null;
+}
+function parseTranscriptMetadata(rawJsonl) {
+  if (typeof rawJsonl !== 'string' || rawJsonl.length === 0) {
+    return { startedAt: null, endedAt: null, durationMinutes: null, factsExtracted: 0 };
+  }
+  const lines = rawJsonl.split('\n').filter(Boolean);
+  let earliestTs = null;
+  let latestTs = null;
+  let factsExtracted = 0;
+  for (const line of lines) {
+    let msg;
+    try { msg = JSON.parse(line); } catch (_) { continue; }
+    if (!msg || typeof msg !== 'object') continue;
+    // Timestamp: top-level `timestamp` is the canonical Claude Code shape.
+    // Fall back to `msg.message.timestamp` for any future / alt-shape that
+    // nests it (Codex/Gemini/Grok adapters preserve the top-level form, so
+    // this is mostly forward-compat).
+    const ts = msg.timestamp || (msg.message && msg.message.timestamp);
+    if (typeof ts === 'string' || typeof ts === 'number') {
+      const t = Date.parse(ts);
+      if (!Number.isNaN(t)) {
+        if (earliestTs === null || t < earliestTs) earliestTs = t;
+        if (latestTs === null || t > latestTs) latestTs = t;
+      }
+    }
+    // facts_extracted: count tool_use blocks matching a memory_remember
+    // MCP tool name. See FACT_TOOL_NAMES + extractContentBlocks above.
+    const blocks = extractContentBlocks(msg);
+    if (blocks) {
+      for (const b of blocks) {
+        if (b && b.type === 'tool_use' && typeof b.name === 'string' && FACT_TOOL_NAMES.has(b.name)) {
+          factsExtracted += 1;
+        }
+      }
+    }
+  }
+  const startedAt = earliestTs !== null ? new Date(earliestTs).toISOString() : null;
+  const endedAt = latestTs !== null ? new Date(latestTs).toISOString() : null;
+  const durationMinutes = (earliestTs !== null && latestTs !== null)
+    ? Math.max(0, Math.round((latestTs - earliestTs) / 60000))
+    : null;
+  return { startedAt, endedAt, durationMinutes, factsExtracted };
+}
+// Sprint 51.6 T3 → 51.7 T2: `buildSummary` now also returns parser-derived
+// metadata (startedAt, endedAt, durationMinutes, factsExtracted) merged into
+// the result object. parseTranscriptMetadata reuses the same raw string —
+// no second readFileSync. Returns null when the transcript is unreadable or
+// has fewer than 5 messages (skip semantics unchanged from v1).
+function buildSummary(transcriptPath, sessionType) {
+  let raw;
+  try { raw = readFileSync(transcriptPath, 'utf8'); }
+  catch (e) { log(`read-transcript-failed: ${e.message}`); return null; }
+  const { parser, sessionType: resolvedType } = selectTranscriptParser(sessionType);
+  if (sessionType && resolvedType !== sessionType) {
+    debug(`unknown-session-type="${sessionType}", falling back to ${resolvedType}`);
+  }
+  const messages = parser(raw);
+  if (messages.length < 5) {
+    debug(`session-too-short: ${messages.length} messages (parser=${resolvedType}), skipping`);
+    return null;
+  }
+  const tail = messages.slice(-30);
+  const summary =
+    `Session with ${messages.length} messages.\n\n` +
+    tail.map((m) => `[${m.role}] ${m.content}`).join('\n');
+  // OpenAI text-embedding-3-small accepts up to 8192 tokens (~32K chars).
+  // 7000 chars is a safe headroom that survives multibyte expansion.
+  // Sprint 51.7 T2: merge transcript-derived metadata so the caller (
+  // processStdinPayload → postMemorySession) can populate the
+  // memory_sessions.started_at/duration_minutes/facts_extracted fields the
+  // v1 hook left NULL/0.
+  const metadata = parseTranscriptMetadata(raw);
+  return {
+    summary: summary.slice(0, 7000),
+    messagesCount: messages.length,
+    ...metadata,
+  };
+}
+async function embedText(text, openaiKey) {
+  try {
+    const res = await fetch('https://api.openai.com/v1/embeddings', {
+      method: 'POST',
+      headers: {
+        'Content-Type': 'application/json',
+        'Authorization': `Bearer ${openaiKey}`,
+      },
+      body: JSON.stringify({ model: 'text-embedding-3-small', input: text }),
+    });
+    if (!res.ok) {
+      const body = await res.text().catch(() => '');
+      log(`openai-embed-failed: HTTP ${res.status} ${body.slice(0, 200)}`);
+      return null;
+    }
+    const data = await res.json();
+    return data?.data?.[0]?.embedding || null;
+  } catch (e) {
+    log(`openai-embed-exception: ${e.message}`);
+    return null;
+  }
+}
+// Sprint 50 T2: every row written by this hook carries an LLM-provenance
+// tag (memory_items.source_agent). Defaults to 'claude' for backwards
+// compat with Claude Code's existing SessionEnd payload, which doesn't
+// supply the field; TermDeck server's per-adapter onPanelClose
+// interceptor (Sprint 50 T1) sets it explicitly to 'codex'/'gemini'/'grok'
+// for non-Claude panels. The set is open-ended on the server side; this
+// constant gates only the spelling-mistake/empty-string case.
+const ALLOWED_SOURCE_AGENTS = new Set([
+  'claude', 'codex', 'gemini', 'grok', 'orchestrator',
+]);
+function normalizeSourceAgent(raw) {
+  if (typeof raw !== 'string') return 'claude';
+  const v = raw.trim().toLowerCase();
+  if (!v) return 'claude';
+  return ALLOWED_SOURCE_AGENTS.has(v) ? v : 'claude';
+}
+async function postMemoryItem({ supabaseUrl, supabaseKey, content, embedding, project, sessionId, sourceAgent }) {
+  try {
+    const res = await fetch(`${supabaseUrl}/rest/v1/memory_items`, {
+      method: 'POST',
+      headers: {
+        'Content-Type': 'application/json',
+        'apikey': supabaseKey,
+        'Authorization': `Bearer ${supabaseKey}`,
+        'Prefer': 'return=minimal',
+      },
+      body: JSON.stringify({
+        content,
+        embedding: `[${embedding.join(',')}]`,
+        source_type: 'session_summary',
+        category: 'workflow',
+        project,
+        source_session_id: sessionId || null,
+        source_agent: normalizeSourceAgent(sourceAgent),
+      }),
+    });
+    if (!res.ok) {
+      const body = await res.text().catch(() => '');
+      log(`supabase-insert-failed: HTTP ${res.status} ${body.slice(0, 200)}`);
+      return false;
+    }
+    return true;
+  } catch (e) {
+    log(`supabase-insert-exception: ${e.message}`);
+    return false;
+  }
+}
+// Sprint 51.6 T3 — companion write to memory_sessions.
+//
+// History: the bundled hook never wrote memory_sessions until v1.0.2. Joshua's
+// PRIOR personal rag-system hook spawned process-session.ts which inserted
+// memory_sessions rows; the Sprint 38 P0 rewrite replaced that hook with a
+// Mnestra-direct hook that only wrote memory_items. Result: from 2026-05-02
+// 13:24 ET (when bundled overwrote personal) until v1.0.2, no memory_sessions
+// rows accumulated. Sprint 51.6 T1+T2+T3 documented the gap; this function
+// closes it.
+//
+// Schema target: Mnestra migration 017 brings canonical engram in line with
+// petvetbid's rag-system flavor (session_id, summary_embedding, started_at,
+// ended_at, duration_minutes, messages_count, transcript_path, etc). The
+// bundled hook writes the rich shape on every install — fresh-canonical
+// (post-mig-017) and petvetbid alike.
+//
+// Idempotency: Prefer: resolution=merge-duplicates relies on the
+// memory_sessions_session_id_key unique constraint. Mig 017 adds it where
+// absent. SessionEnd-fires-twice (e.g. /exit then PTY close) resolves to a
+// single row.
+async function postMemorySession({
+  supabaseUrl, supabaseKey,
+  summary, summaryEmbedding,
+  project, sessionId,
+  transcriptPath, messagesCount,
+  endedAt,
+  // Sprint 51.7 T2 — transcript-derived metadata (closes Sprint 51.6's
+  // started_at/duration_minutes/facts_extracted=NULL gap). All optional;
+  // null/null/0 fallback preserves the v1 minimum-viable-row shape when the
+  // transcript carries no timestamps (e.g. legacy fixtures, pre-CC-2.x
+  // payloads, or hand-fed test inputs).
+  startedAt = null,
+  durationMinutes = null,
+  factsExtracted = 0,
+}) {
+  if (!sessionId) {
+    log('memory-sessions-skip: sessionId missing — cannot satisfy session_id NOT NULL/UNIQUE.');
+    return false;
+  }
+  try {
+    // Sprint 51.6 T3 / T4-CODEX audit 20:23 ET: PostgREST requires both
+    // `Prefer: resolution=merge-duplicates` AND `?on_conflict=<column>`
+    // on the URL to trigger an UPSERT. Without `on_conflict=session_id`
+    // a duplicate fire would error against memory_sessions_session_id_key.
+    const res = await fetch(`${supabaseUrl}/rest/v1/memory_sessions?on_conflict=session_id`, {
+      method: 'POST',
+      headers: {
+        'Content-Type': 'application/json',
+        'apikey': supabaseKey,
+        'Authorization': `Bearer ${supabaseKey}`,
+        'Prefer': 'resolution=merge-duplicates,return=minimal',
+      },
+      body: JSON.stringify({
+        session_id: sessionId,
+        summary,
+        summary_embedding: Array.isArray(summaryEmbedding)
+          ? `[${summaryEmbedding.join(',')}]`
+          : null,
+        project,
+        // Sprint 51.7 T2: started_at + duration_minutes + facts_extracted now
+        // populated from parseTranscriptMetadata when transcript timestamps
+        // are present. files_changed and topics remain unpopulated (would
+        // require diff parsing the bundled hook doesn't have; deferred).
+        started_at: typeof startedAt === 'string' ? startedAt : null,
+        ended_at: (endedAt instanceof Date ? endedAt : new Date()).toISOString(),
+        duration_minutes: typeof durationMinutes === 'number' ? durationMinutes : null,
+        messages_count: typeof messagesCount === 'number' ? messagesCount : 0,
+        facts_extracted: typeof factsExtracted === 'number' ? factsExtracted : 0,
+        transcript_path: transcriptPath || null,
+      }),
+    });
+    if (!res.ok) {
+      const body = await res.text().catch(() => '');
+      log(`memory-sessions-insert-failed: HTTP ${res.status} ${body.slice(0, 200)}`);
+      return false;
+    }
+    return true;
+  } catch (e) {
+    log(`memory-sessions-insert-exception: ${e.message}`);
+    return false;
+  }
+}
+async function processStdinPayload(input) {
+  let data;
+  try { data = JSON.parse(input); }
+  catch (e) { log(`parse-stdin-failed: ${e.message}`); return; }
+  const transcriptPath = data.transcript_path;
+  const cwd = data.cwd || '';
+  const sessionId =
+    data.session_id ||
+    (transcriptPath ? transcriptPath.split('/').pop().replace('.jsonl', '') : null);
+  // Sprint 45 T4: sessionType drives buildSummary's parser dispatch.
+  // Read order: payload (server-driven invocations) → env var (TermDeck
+  // server can set TERMDECK_SESSION_TYPE in the spawned PTY's env) →
+  // 'auto' default (parseAutoDetect handles Claude + Codex + Gemini).
+  const sessionType =
+    data.sessionType ||
+    data.session_type ||
+    process.env.TERMDECK_SESSION_TYPE ||
+    DEFAULT_SESSION_TYPE;
+  // Sprint 50 T2: provenance tag the row with the LLM that produced it.
+  // Default 'claude' — Claude Code's native SessionEnd payload doesn't
+  // carry source_agent, so any unset path is implicitly Claude. The
+  // TermDeck server's per-adapter onPanelClose interceptor (Sprint 50 T1)
+  // sets it explicitly for non-Claude panels.
+  const sourceAgent =
+    data.source_agent ||
+    data.sourceAgent ||
+    process.env.TERMDECK_SOURCE_AGENT ||
+    'claude';
+  if (!transcriptPath) { log('no-transcript-path: skipping'); return; }
+  let stat;
+  try { stat = statSync(transcriptPath); }
+  catch (e) { log(`cannot-stat-transcript: ${transcriptPath} — ${e.message}`); return; }
+  if (stat.size < MIN_TRANSCRIPT_BYTES) {
+    debug(`small-transcript: ${stat.size} bytes < ${MIN_TRANSCRIPT_BYTES}, skipping`);
+    return;
+  }
+  const env = readEnv();
+  if (!env) return;
+  const project = detectProject(cwd);
+  debug(`project="${project}", session=${sessionId}, sessionType=${sessionType}`);
+  const built = buildSummary(transcriptPath, sessionType);
+  if (!built) return;
+  const {
+    summary,
+    messagesCount,
+    startedAt: parsedStartedAt,
+    endedAt: parsedEndedAt,
+    durationMinutes,
+    factsExtracted,
+  } = built;
+  const embedding = await embedText(summary, env.openaiKey);
+  if (!embedding) return;
+  const itemOk = await postMemoryItem({
+    supabaseUrl: env.supabaseUrl,
+    supabaseKey: env.supabaseKey,
+    content: summary,
+    embedding,
+    project,
+    sessionId,
+    sourceAgent,
+  });
+  // Sprint 51.6 T3: companion memory_sessions write. Independent of the
+  // memory_items write — a memory_items failure shouldn't suppress the
+  // memory_sessions row, and vice versa. Both errors fail-soft.
+  //
+  // Sprint 51.7 T2: prefer parser-derived `endedAt` (last-message
+  // timestamp) over hook-fire-time when the transcript carried timestamps.
+  // Matches the rag-system writer's semantics — `ended_at` is "when the
+  // conversation last had activity," not "when the SessionEnd hook
+  // happened to fire." Falls back to `new Date()` when the parser found
+  // no timestamps, preserving v1 behavior.
+  const sessionOk = await postMemorySession({
+    supabaseUrl: env.supabaseUrl,
+    supabaseKey: env.supabaseKey,
+    summary,
+    summaryEmbedding: embedding,
+    project,
+    sessionId,
+    transcriptPath,
+    messagesCount,
+    endedAt: parsedEndedAt ? new Date(parsedEndedAt) : new Date(),
+    startedAt: parsedStartedAt,
+    durationMinutes,
+    factsExtracted,
+  });
+  if (itemOk || sessionOk) {
+    log(`ingested: project="${project}" session=${sessionId} bytes=${summary.length} messages=${messagesCount} sessionType=${sessionType} sourceAgent=${normalizeSourceAgent(sourceAgent)} startedAt=${parsedStartedAt || 'null'} durationMin=${durationMinutes === null ? 'null' : durationMinutes} factsExtracted=${factsExtracted} memory_items=${itemOk ? 'ok' : 'fail'} memory_sessions=${sessionOk ? 'ok' : 'fail'}`);
+  }
+}
+// Module-export contract for testability. When run as a script (require.main === module),
+// read stdin and process. When require()d (tests), expose helpers.
+if (require.main === module) {
+  let input = '';
+  process.stdin.setEncoding('utf8');
+  process.stdin.on('data', (chunk) => { input += chunk; });
+  process.stdin.on('end', () => {
+    processStdinPayload(input).catch((e) => log(`hook-error: ${e.message}`));
+  });
+} else {
+  module.exports = {
+    PROJECT_MAP,
+    detectProject,
+    readEnv,
+    buildSummary,
+    embedText,
+    postMemoryItem,
+    // Sprint 51.6 T3 — memory_sessions write companion.
+    postMemorySession,
+    processStdinPayload,
+    LOG_FILE,
+    // Sprint 45 T4 — adapter-pluggable transcript-parser surface.
+    TRANSCRIPT_PARSERS,
+    DEFAULT_SESSION_TYPE,
+    parseClaudeJsonl,
+    parseCodexJsonl,
+    parseGeminiJson,
+    parseGrokJson,
+    parseAutoDetect,
+    selectTranscriptParser,
+    // Sprint 50 T2 — source_agent provenance plumbing.
+    normalizeSourceAgent,
+    ALLOWED_SOURCE_AGENTS,
+    // Sprint 51.7 T2 — transcript-metadata extractor for memory_sessions.
+    parseTranscriptMetadata,
+    FACT_TOOL_NAMES,
+    extractContentBlocks,
+  };
+}