npm - selftune - Versions diffs - 0.1.4 → 0.2.1 - Mend

selftune 0.1.4 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (153) hide show

package/.claude/agents/diagnosis-analyst.md +156 -0
package/.claude/agents/evolution-reviewer.md +180 -0
package/.claude/agents/integration-guide.md +212 -0
package/.claude/agents/pattern-analyst.md +160 -0
package/CHANGELOG.md +46 -1
package/README.md +105 -257
package/apps/local-dashboard/dist/assets/geist-cyrillic-wght-normal-CHSlOQsW.woff2 +0 -0
package/apps/local-dashboard/dist/assets/geist-latin-ext-wght-normal-DMtmJ5ZE.woff2 +0 -0
package/apps/local-dashboard/dist/assets/geist-latin-wght-normal-Dm3htQBi.woff2 +0 -0
package/apps/local-dashboard/dist/assets/index-C4EOTFZ2.js +15 -0
package/apps/local-dashboard/dist/assets/index-bl-Webyd.css +1 -0
package/apps/local-dashboard/dist/assets/vendor-react-U7zYD9Rg.js +60 -0
package/apps/local-dashboard/dist/assets/vendor-table-B7VF2Ipl.js +26 -0
package/apps/local-dashboard/dist/assets/vendor-ui-D7_zX_qy.js +346 -0
package/apps/local-dashboard/dist/favicon.png +0 -0
package/apps/local-dashboard/dist/index.html +17 -0
package/apps/local-dashboard/dist/logo.png +0 -0
package/apps/local-dashboard/dist/logo.svg +9 -0
package/assets/BeforeAfter.gif +0 -0
package/assets/FeedbackLoop.gif +0 -0
package/assets/logo.svg +9 -0
package/assets/skill-health-badge.svg +20 -0
package/cli/selftune/activation-rules.ts +171 -0
package/cli/selftune/badge/badge-data.ts +108 -0
package/cli/selftune/badge/badge-svg.ts +212 -0
package/cli/selftune/badge/badge.ts +99 -0
package/cli/selftune/canonical-export.ts +183 -0
package/cli/selftune/constants.ts +103 -1
package/cli/selftune/contribute/bundle.ts +314 -0
package/cli/selftune/contribute/contribute.ts +214 -0
package/cli/selftune/contribute/sanitize.ts +162 -0
package/cli/selftune/cron/setup.ts +266 -0
package/cli/selftune/dashboard-contract.ts +202 -0
package/cli/selftune/dashboard-server.ts +1049 -0
package/cli/selftune/dashboard.ts +43 -156
package/cli/selftune/eval/baseline.ts +248 -0
package/cli/selftune/eval/composability-v2.ts +273 -0
package/cli/selftune/eval/composability.ts +117 -0
package/cli/selftune/eval/generate-unit-tests.ts +143 -0
package/cli/selftune/eval/hooks-to-evals.ts +101 -16
package/cli/selftune/eval/import-skillsbench.ts +221 -0
package/cli/selftune/eval/synthetic-evals.ts +172 -0
package/cli/selftune/eval/unit-test-cli.ts +152 -0
package/cli/selftune/eval/unit-test.ts +196 -0
package/cli/selftune/evolution/deploy-proposal.ts +142 -1
package/cli/selftune/evolution/evidence.ts +26 -0
package/cli/selftune/evolution/evolve-body.ts +586 -0
package/cli/selftune/evolution/evolve.ts +825 -116
package/cli/selftune/evolution/extract-patterns.ts +105 -16
package/cli/selftune/evolution/pareto.ts +314 -0
package/cli/selftune/evolution/propose-body.ts +171 -0
package/cli/selftune/evolution/propose-description.ts +100 -2
package/cli/selftune/evolution/propose-routing.ts +166 -0
package/cli/selftune/evolution/refine-body.ts +141 -0
package/cli/selftune/evolution/rollback.ts +21 -4
package/cli/selftune/evolution/validate-body.ts +254 -0
package/cli/selftune/evolution/validate-proposal.ts +257 -35
package/cli/selftune/evolution/validate-routing.ts +177 -0
package/cli/selftune/grading/auto-grade.ts +200 -0
package/cli/selftune/grading/grade-session.ts +513 -42
package/cli/selftune/grading/pre-gates.ts +104 -0
package/cli/selftune/grading/results.ts +42 -0
package/cli/selftune/hooks/auto-activate.ts +185 -0
package/cli/selftune/hooks/evolution-guard.ts +165 -0
package/cli/selftune/hooks/prompt-log.ts +172 -2
package/cli/selftune/hooks/session-stop.ts +123 -3
package/cli/selftune/hooks/skill-change-guard.ts +112 -0
package/cli/selftune/hooks/skill-eval.ts +119 -3
package/cli/selftune/index.ts +415 -48
package/cli/selftune/ingestors/claude-replay.ts +377 -0
package/cli/selftune/ingestors/codex-rollout.ts +345 -46
package/cli/selftune/ingestors/codex-wrapper.ts +207 -39
package/cli/selftune/ingestors/openclaw-ingest.ts +573 -0
package/cli/selftune/ingestors/opencode-ingest.ts +193 -17
package/cli/selftune/init.ts +376 -16
package/cli/selftune/last.ts +14 -5
package/cli/selftune/localdb/db.ts +63 -0
package/cli/selftune/localdb/materialize.ts +428 -0
package/cli/selftune/localdb/queries.ts +376 -0
package/cli/selftune/localdb/schema.ts +204 -0
package/cli/selftune/memory/writer.ts +447 -0
package/cli/selftune/monitoring/watch.ts +90 -16
package/cli/selftune/normalization.ts +682 -0
package/cli/selftune/observability.ts +19 -44
package/cli/selftune/orchestrate.ts +1073 -0
package/cli/selftune/quickstart.ts +203 -0
package/cli/selftune/repair/skill-usage.ts +576 -0
package/cli/selftune/schedule.ts +561 -0
package/cli/selftune/status.ts +59 -33
package/cli/selftune/sync.ts +627 -0
package/cli/selftune/types.ts +525 -5
package/cli/selftune/utils/canonical-log.ts +45 -0
package/cli/selftune/utils/frontmatter.ts +217 -0
package/cli/selftune/utils/hooks.ts +41 -0
package/cli/selftune/utils/html.ts +27 -0
package/cli/selftune/utils/llm-call.ts +103 -19
package/cli/selftune/utils/math.ts +10 -0
package/cli/selftune/utils/query-filter.ts +139 -0
package/cli/selftune/utils/skill-discovery.ts +340 -0
package/cli/selftune/utils/skill-log.ts +68 -0
package/cli/selftune/utils/skill-usage-confidence.ts +18 -0
package/cli/selftune/utils/transcript.ts +307 -26
package/cli/selftune/utils/trigger-check.ts +89 -0
package/cli/selftune/utils/tui.ts +156 -0
package/cli/selftune/workflows/discover.ts +254 -0
package/cli/selftune/workflows/skill-md-writer.ts +288 -0
package/cli/selftune/workflows/workflows.ts +188 -0
package/package.json +28 -11
package/packages/telemetry-contract/README.md +11 -0
package/packages/telemetry-contract/fixtures/golden.json +87 -0
package/packages/telemetry-contract/fixtures/golden.test.ts +42 -0
package/packages/telemetry-contract/index.ts +1 -0
package/packages/telemetry-contract/package.json +19 -0
package/packages/telemetry-contract/src/index.ts +2 -0
package/packages/telemetry-contract/src/types.ts +163 -0
package/packages/telemetry-contract/src/validators.ts +109 -0
package/skill/SKILL.md +180 -33
package/skill/Workflows/AutoActivation.md +145 -0
package/skill/Workflows/Badge.md +124 -0
package/skill/Workflows/Baseline.md +144 -0
package/skill/Workflows/Composability.md +107 -0
package/skill/Workflows/Contribute.md +94 -0
package/skill/Workflows/Cron.md +132 -0
package/skill/Workflows/Dashboard.md +214 -0
package/skill/Workflows/Doctor.md +63 -14
package/skill/Workflows/Evals.md +110 -18
package/skill/Workflows/EvolutionMemory.md +154 -0
package/skill/Workflows/Evolve.md +181 -21
package/skill/Workflows/EvolveBody.md +159 -0
package/skill/Workflows/Grade.md +36 -31
package/skill/Workflows/ImportSkillsBench.md +117 -0
package/skill/Workflows/Ingest.md +142 -21
package/skill/Workflows/Initialize.md +91 -23
package/skill/Workflows/Orchestrate.md +139 -0
package/skill/Workflows/Replay.md +91 -0
package/skill/Workflows/Rollback.md +23 -4
package/skill/Workflows/Schedule.md +61 -0
package/skill/Workflows/Sync.md +88 -0
package/skill/Workflows/UnitTest.md +150 -0
package/skill/Workflows/Watch.md +33 -1
package/skill/Workflows/Workflows.md +129 -0
package/skill/assets/activation-rules-default.json +26 -0
package/skill/assets/multi-skill-settings.json +63 -0
package/skill/assets/single-skill-settings.json +57 -0
package/skill/references/invocation-taxonomy.md +2 -2
package/skill/references/logs.md +164 -2
package/skill/references/setup-patterns.md +65 -0
package/skill/references/version-history.md +40 -0
package/skill/settings_snippet.json +23 -0
package/templates/activation-rules-default.json +27 -0
package/templates/multi-skill-settings.json +64 -0
package/templates/single-skill-settings.json +58 -0
package/dashboard/index.html +0 -1119

package/cli/selftune/utils/transcript.ts CHANGED Viewed

@@ -2,9 +2,11 @@
  * Transcript parsing utilities shared by hooks and grading.
  */
-import { existsSync, readFileSync } from "node:fs";
+import { existsSync, readdirSync, readFileSync, statSync } from "node:fs";
 import { basename, dirname } from "node:path";
-import type { TranscriptMetrics } from "../types.js";
+import { CLAUDE_CODE_PROJECTS_DIR } from "../constants.js";
+import type { SessionTelemetryRecord, TranscriptMetrics } from "../types.js";
+import { isActionableQueryText } from "./query-filter.js";
 /**
  * Parse a Claude Code transcript JSONL and extract process metrics.
@@ -23,9 +25,14 @@ export function parseTranscript(transcriptPath: string): TranscriptMetrics {
   const toolCalls: Record<string, number> = {};
   const bashCommands: string[] = [];
   const skillsTriggered: string[] = [];
+  const skillsInvoked: string[] = [];
   let errors = 0;
   let assistantTurns = 0;
   let lastUserQuery = "";
+  let inputTokens = 0;
+  let outputTokens = 0;
+  let firstTimestamp: string | null = null;
+  let lastTimestamp: string | null = null;
   for (const raw of lines) {
     const line = raw.trim();
@@ -38,6 +45,22 @@ export function parseTranscript(transcriptPath: string): TranscriptMetrics {
       continue;
     }
+    // Track timestamps for duration calculation
+    const ts = entry.timestamp as string | undefined;
+    if (ts) {
+      if (!firstTimestamp) firstTimestamp = ts;
+      lastTimestamp = ts;
+    }
+    // Accumulate token usage from usage objects
+    const usage = (entry.usage ?? (entry.message as Record<string, unknown>)?.usage) as
+      | Record<string, unknown>
+      | undefined;
+    if (usage && typeof usage === "object") {
+      if (typeof usage.input_tokens === "number") inputTokens += usage.input_tokens;
+      if (typeof usage.output_tokens === "number") outputTokens += usage.output_tokens;
+    }
     // Normalise: unwrap nested message if present
     const msg = (entry.message as Record<string, unknown>) ?? entry;
     const role = (msg.role as string) ?? (entry.role as string) ?? "";
@@ -45,19 +68,8 @@ export function parseTranscript(transcriptPath: string): TranscriptMetrics {
     // Track last user query
     if (role === "user") {
-      if (typeof content === "string" && content.trim()) {
-        lastUserQuery = content.trim();
-      } else if (Array.isArray(content)) {
-        const texts = content
-          .filter(
-            (p): p is Record<string, unknown> =>
-              typeof p === "object" && p !== null && (p as Record<string, unknown>).type === "text",
-          )
-          .map((p) => (p.text as string) ?? "")
-          .filter(Boolean);
-        const text = texts.join(" ").trim();
-        if (text) lastUserQuery = text;
-      }
+      const text = extractActionableUserText(content);
+      if (text) lastUserQuery = text;
     }
     // Count assistant turns and parse tool use
@@ -72,7 +84,7 @@ export function parseTranscript(transcriptPath: string): TranscriptMetrics {
           toolCalls[toolName] = (toolCalls[toolName] ?? 0) + 1;
           const inp = (b.input as Record<string, unknown>) ?? {};
-          // Track SKILL.md reads
+          // Track SKILL.md reads (may be browsing — kept for backwards compat)
           const filePath = (inp.file_path as string) ?? "";
           if (basename(filePath).toUpperCase() === "SKILL.MD") {
             const skillName = basename(dirname(filePath));
@@ -81,6 +93,14 @@ export function parseTranscript(transcriptPath: string): TranscriptMetrics {
             }
           }
+          // Track actual Skill tool invocations (high-confidence signal)
+          if (toolName === "Skill") {
+            const skillArg = (inp.skill as string) ?? (inp.name as string) ?? "";
+            if (skillArg && !skillsInvoked.includes(skillArg)) {
+              skillsInvoked.push(skillArg);
+            }
+          }
           // Track bash commands
           if (toolName === "Bash") {
             const cmd = ((inp.command as string) ?? "").trim();
@@ -110,15 +130,167 @@ export function parseTranscript(transcriptPath: string): TranscriptMetrics {
     }
   }
+  // Compute duration from first to last timestamp
+  let durationMs: number | undefined;
+  if (firstTimestamp && lastTimestamp && firstTimestamp !== lastTimestamp) {
+    const start = new Date(firstTimestamp).getTime();
+    const end = new Date(lastTimestamp).getTime();
+    if (!Number.isNaN(start) && !Number.isNaN(end) && end > start) {
+      durationMs = end - start;
+    }
+  }
   return {
     tool_calls: toolCalls,
     total_tool_calls: Object.values(toolCalls).reduce((a, b) => a + b, 0),
     bash_commands: bashCommands,
     skills_triggered: skillsTriggered,
+    skills_invoked: skillsInvoked,
     assistant_turns: assistantTurns,
     errors_encountered: errors,
     transcript_chars: totalChars,
     last_user_query: lastUserQuery,
+    ...(inputTokens > 0 ? { input_tokens: inputTokens } : {}),
+    ...(outputTokens > 0 ? { output_tokens: outputTokens } : {}),
+    ...(durationMs !== undefined ? { duration_ms: durationMs } : {}),
+  };
+}
+/**
+ * Extract actionable user queries from a Claude transcript.
+ *
+ * Reads the JSONL file line by line, keeps entries whose role is "user"
+ * (either top-level or on a nested `message` object), and passes each message
+ * body through `extractActionableUserText`. Texts shorter than four characters
+ * are dropped.
+ *
+ * @param transcriptPath - Path to the transcript JSONL file.
+ * @returns Query/timestamp pairs in file order; `timestamp` is "" when the
+ *   entry carries none. Returns [] when the file is missing or unreadable.
+ */
+export function extractActionableUserQueries(
+  transcriptPath: string,
+): Array<{ query: string; timestamp: string }> {
+  if (!existsSync(transcriptPath)) return [];
+  let content: string;
+  try {
+    content = readFileSync(transcriptPath, "utf-8");
+  } catch {
+    return [];
+  }
+  const results: Array<{ query: string; timestamp: string }> = [];
+  for (const raw of content.split("\n")) {
+    const line = raw.trim();
+    if (!line) continue;
+    let parsed: unknown;
+    try {
+      parsed = JSON.parse(line);
+    } catch {
+      continue;
+    }
+    // A line can hold valid JSON that is not an object (`null`, a number, a
+    // string). Skip it instead of throwing on property access below.
+    if (typeof parsed !== "object" || parsed === null) continue;
+    const entry = parsed as Record<string, unknown>;
+    const msg = (entry.message as Record<string, unknown>) ?? entry;
+    const role = (msg.role as string) ?? (entry.role as string) ?? "";
+    if (role !== "user") continue;
+    const text = extractActionableUserText(msg.content ?? entry.content ?? "");
+    if (!text || text.length < 4) continue;
+    const timestamp = (entry.timestamp as string) ?? (msg.timestamp as string) ?? "";
+    results.push({ query: text, timestamp });
+  }
+  return results;
+}
+/**
+ * Collect every `.jsonl` file beneath a projects directory, descending into
+ * subdirectories.
+ *
+ * @param projectsDir - Root directory to scan.
+ * @param since - When given, files whose mtime is earlier than this are skipped.
+ * @returns Sorted list of matching paths; [] when `projectsDir` does not exist.
+ */
+export function findTranscriptFiles(projectsDir: string, since?: Date): string[] {
+  const found: string[] = [];
+  if (!existsSync(projectsDir)) return found;
+  function visit(directory: string): void {
+    let names: string[];
+    try {
+      names = readdirSync(directory).sort();
+    } catch {
+      // Unlistable directory: leave it out of the results.
+      return;
+    }
+    names.forEach((name) => {
+      const fullPath = `${directory}/${name}`;
+      try {
+        const info = statSync(fullPath);
+        if (info.isDirectory()) {
+          visit(fullPath);
+          return;
+        }
+        const isTranscript = info.isFile() && name.endsWith(".jsonl");
+        if (!isTranscript) return;
+        if (since && info.mtime < since) return;
+        found.push(fullPath);
+      } catch {
+        // Ignore unreadable files and keep scanning.
+      }
+    });
+  }
+  visit(projectsDir);
+  return found.sort();
+}
+/**
+ * Locate the transcript whose file name is `<sessionId>.jsonl`.
+ *
+ * @param sessionId - Session identifier used as the file's base name.
+ * @param projectsDir - Directory tree to search; defaults to CLAUDE_CODE_PROJECTS_DIR.
+ * @returns The first matching path in sorted order, or null when none matches.
+ */
+export function findTranscriptPathForSession(
+  sessionId: string,
+  projectsDir: string = CLAUDE_CODE_PROJECTS_DIR,
+): string | null {
+  const wanted = `${sessionId}.jsonl`;
+  const hit = findTranscriptFiles(projectsDir).find(
+    (candidate) => basename(candidate) === wanted,
+  );
+  return hit ?? null;
+}
+/**
+ * Assemble a SessionTelemetryRecord from nothing but a transcript file.
+ *
+ * Metrics come from `parseTranscript`. The record's timestamp is the timestamp
+ * of the first actionable user query; when that is missing or empty it falls
+ * back to the file's mtime, and to the current time if the file cannot be
+ * stat'ed. `cwd` is always written as an empty string.
+ *
+ * @param sessionId - Session identifier stored on the record.
+ * @param transcriptPath - Path to the transcript JSONL file.
+ * @param source - Value stored in the record's `source` field.
+ * @returns The record, or null when the transcript file does not exist.
+ */
+export function buildTelemetryFromTranscript(
+  sessionId: string,
+  transcriptPath: string,
+  source = "claude_code_transcript_fallback",
+): SessionTelemetryRecord | null {
+  if (!existsSync(transcriptPath)) return null;
+  const metrics = parseTranscript(transcriptPath);
+  const [firstQuery] = extractActionableUserQueries(transcriptPath);
+  const resolveTimestamp = (): string => {
+    const fromQuery = firstQuery?.timestamp ?? "";
+    if (fromQuery) return fromQuery;
+    try {
+      return statSync(transcriptPath).mtime.toISOString();
+    } catch {
+      return new Date().toISOString();
+    }
+  };
+  const timestamp = resolveTimestamp();
+  return {
+    timestamp,
+    session_id: sessionId,
+    cwd: "",
+    transcript_path: transcriptPath,
+    tool_calls: metrics.tool_calls,
+    total_tool_calls: metrics.total_tool_calls,
+    bash_commands: metrics.bash_commands,
+    skills_triggered: metrics.skills_triggered,
+    skills_invoked: metrics.skills_invoked,
+    assistant_turns: metrics.assistant_turns,
+    errors_encountered: metrics.errors_encountered,
+    transcript_chars: metrics.transcript_chars,
+    last_user_query: metrics.last_user_query,
+    source,
+    input_tokens: metrics.input_tokens,
+    output_tokens: metrics.output_tokens,
   };
 }
@@ -142,14 +314,14 @@ export function getLastUserMessage(transcriptPath: string): string | null {
       // Format 1: top-level role field
       if (entry.role === "user") {
-        const text = extractUserText(entry.content);
+        const text = extractActionableUserText(entry.content);
         if (text) return text;
       }
       // Format 2: nested message object
       const msg = entry.message as Record<string, unknown> | undefined;
       if (msg && typeof msg === "object" && msg.role === "user") {
-        const text = extractUserText(msg.content);
+        const text = extractActionableUserText(msg.content);
         if (text) return text;
       }
     }
@@ -160,6 +332,40 @@ export function getLastUserMessage(transcriptPath: string): string | null {
   return null;
 }
+/**
+ * Join the text of every `{ type: "text" }` part in a content array.
+ *
+ * Parts that are not objects, have another `type`, or carry a falsy `text` are
+ * skipped. Returns "" when `content` is not an array.
+ */
+function extractTextParts(content: unknown): string {
+  if (!Array.isArray(content)) return "";
+  const pieces: unknown[] = [];
+  for (const part of content) {
+    if (typeof part !== "object" || part === null) continue;
+    const record = part as Record<string, unknown>;
+    if (record.type !== "text") continue;
+    if (record.text) pieces.push(record.text);
+  }
+  return pieces.join(" ").trim();
+}
+/**
+ * Reduce a function call's JSON-encoded arguments to a short summary.
+ *
+ * Picks the first non-blank string among the parsed object's `cmd`, `command`,
+ * `file_path`, `path`, and `query` fields; if none qualifies, or the text is
+ * not parseable JSON, the trimmed raw text is used. The result is capped at
+ * 200 characters. Non-string or blank input yields "".
+ */
+function summarizeCodexFunctionArguments(argumentsText: unknown): string {
+  if (typeof argumentsText !== "string") return "";
+  const rawText = argumentsText.trim();
+  if (!rawText) return "";
+  try {
+    const parsed = JSON.parse(argumentsText) as Record<string, unknown>;
+    for (const key of ["cmd", "command", "file_path", "path", "query"]) {
+      const value = parsed[key];
+      if (typeof value !== "string") continue;
+      const trimmed = value.trim();
+      if (trimmed) return trimmed.slice(0, 200);
+    }
+  } catch {
+    // Not JSON (or not indexable): fall through to the raw text.
+  }
+  return rawText.slice(0, 200);
+}
 /**
  * Parse a transcript into a human-readable excerpt for the grader.
  */
@@ -184,19 +390,13 @@ export function readExcerpt(transcriptPath: string, maxChars = 8000): string {
     const msg = (entry.message as Record<string, unknown>) ?? entry;
     const role = (msg.role as string) ?? (entry.role as string) ?? "";
     const entryContent = msg.content ?? entry.content ?? "";
+    const eventType = (entry.type as string) ?? "";
     if (role === "user") {
       if (typeof entryContent === "string") {
         readable.push(`[USER] ${entryContent.slice(0, 200)}`);
       } else if (Array.isArray(entryContent)) {
-        const texts = entryContent
-          .filter(
-            (p): p is Record<string, unknown> =>
-              typeof p === "object" && p !== null && (p as Record<string, unknown>).type === "text",
-          )
-          .map((p) => (p.text as string) ?? "")
-          .filter(Boolean);
-        const text = texts.join(" ").trim().slice(0, 200);
+        const text = extractTextParts(entryContent).slice(0, 200);
         if (text) readable.push(`[USER] ${text}`);
       }
     } else if (role === "assistant") {
@@ -218,6 +418,45 @@ export function readExcerpt(transcriptPath: string, maxChars = 8000): string {
           }
         }
       }
+    } else if (eventType === "event_msg") {
+      const payload = (entry.payload as Record<string, unknown>) ?? {};
+      if (payload.type === "user_message") {
+        const text = extractActionableUserText(payload.message)?.slice(0, 200) ?? "";
+        if (text) readable.push(`[USER] ${text}`);
+      }
+    } else if (eventType === "turn.completed") {
+      const text = extractActionableUserText(entry.user_message)?.slice(0, 200) ?? "";
+      if (text) readable.push(`[USER] ${text}`);
+    } else if (eventType === "response_item") {
+      const payload = (entry.payload as Record<string, unknown>) ?? {};
+      const itemType = (payload.type as string) ?? "";
+      if (itemType === "function_call") {
+        const name = (payload.name as string) ?? "function_call";
+        const detail = summarizeCodexFunctionArguments(payload.arguments);
+        if (detail) readable.push(`[TOOL:${name}] ${detail}`);
+      } else if (itemType === "agent_reasoning") {
+        const text = ((payload.text as string) ?? "").trim().slice(0, 200);
+        if (text) readable.push(`[ASSISTANT] ${text}`);
+      } else if (itemType === "message" && (payload.role as string) === "assistant") {
+        const text = extractTextParts(payload.content).slice(0, 200);
+        if (text) readable.push(`[ASSISTANT] ${text}`);
+      }
+    } else if (
+      eventType === "item.completed" ||
+      eventType === "item.started" ||
+      eventType === "item.updated"
+    ) {
+      const item = (entry.item as Record<string, unknown>) ?? {};
+      const itemType = (item.item_type as string) ?? (item.type as string) ?? "";
+      if (itemType === "command_execution") {
+        const command = ((item.command as string) ?? "").trim().slice(0, 200);
+        if (command) readable.push(`[TOOL:command_execution] ${command}`);
+      } else {
+        const text = ((item.text as string) ?? "").trim().slice(0, 200);
+        if (text) readable.push(`[ASSISTANT] ${text}`);
+      }
     }
   }
@@ -228,12 +467,48 @@ export function readExcerpt(transcriptPath: string, maxChars = 8000): string {
   return `${full.slice(0, head)}\n\n... [truncated] ...\n\n${full.slice(-tail)}`;
 }
+/**
+ * Extract token usage from a transcript JSONL by summing usage fields.
+ *
+ * For each JSON line, reads a `usage` object from the entry itself or, when
+ * the entry has none, from its nested `message` object (the same lookup
+ * `parseTranscript` performs), and adds up numeric `input_tokens` and
+ * `output_tokens`.
+ *
+ * @param transcriptPath - Path to the transcript JSONL file.
+ * @returns Summed token counts; both are 0 when the file is missing,
+ *   unreadable, or contains no usage data.
+ */
+export function extractTokenUsage(transcriptPath: string): { input: number; output: number } {
+  const totals = { input: 0, output: 0 };
+  if (!existsSync(transcriptPath)) return totals;
+  let content: string;
+  try {
+    content = readFileSync(transcriptPath, "utf-8");
+  } catch {
+    // Unreadable file (permissions, removed after the existence check):
+    // report zero usage instead of throwing.
+    return totals;
+  }
+  for (const raw of content.split("\n")) {
+    const line = raw.trim();
+    if (!line) continue;
+    let parsed: unknown;
+    try {
+      parsed = JSON.parse(line);
+    } catch {
+      continue;
+    }
+    // Valid JSON that is not an object (e.g. `null`) has no usage to read.
+    if (typeof parsed !== "object" || parsed === null) continue;
+    const entry = parsed as Record<string, unknown>;
+    const message = entry.message;
+    const nestedUsage =
+      typeof message === "object" && message !== null
+        ? (message as Record<string, unknown>).usage
+        : undefined;
+    const usage = entry.usage ?? nestedUsage;
+    if (typeof usage !== "object" || usage === null) continue;
+    const counts = usage as Record<string, unknown>;
+    if (typeof counts.input_tokens === "number") totals.input += counts.input_tokens;
+    if (typeof counts.output_tokens === "number") totals.output += counts.output_tokens;
+  }
+  return totals;
+}
 function emptyMetrics(): TranscriptMetrics {
   return {
     tool_calls: {},
     total_tool_calls: 0,
     bash_commands: [],
     skills_triggered: [],
+    skills_invoked: [],
     assistant_turns: 0,
     errors_encountered: 0,
     transcript_chars: 0,
@@ -258,3 +533,9 @@ function extractUserText(content: unknown): string | null {
   }
   return null;
 }
+/**
+ * Return the user text in `content` only when `isActionableQueryText` accepts
+ * it; otherwise (no text, or text rejected by the filter) return null.
+ */
+function extractActionableUserText(content: unknown): string | null {
+  const candidate = extractUserText(content);
+  return candidate && isActionableQueryText(candidate) ? candidate : null;
+}

package/cli/selftune/utils/trigger-check.ts ADDED Viewed

@@ -0,0 +1,89 @@
+/**
+ * Shared trigger-check utilities.
+ *
+ * Extracted from validate-proposal.ts so other modules (e.g. body validation,
+ * routing validation) can reuse the same prompt-building and response-parsing
+ * logic without depending on the evolution layer.
+ */
+// ---------------------------------------------------------------------------
+// Prompt building
+// ---------------------------------------------------------------------------
+/**
+ * Build the single-query trigger check prompt for the LLM.
+ *
+ * @param description - Skill description the query is judged against.
+ * @param query - User query to classify.
+ * @returns Prompt text asking for a bare YES or NO answer.
+ */
+export function buildTriggerCheckPrompt(description: string, query: string): string {
+  const instructions =
+    "Given this skill description, would the following user query trigger this skill?\n" +
+    "Respond YES or NO only.";
+  return `${instructions}\n\nSkill description:\n${description}\n\nUser query:\n${query}`;
+}
+// ---------------------------------------------------------------------------
+// Response parsing
+// ---------------------------------------------------------------------------
+/**
+ * Parse YES/NO from an LLM response.
+ *
+ * @param response - Raw model output.
+ * @returns true only when the trimmed, upper-cased response starts with "YES".
+ *   "NO" and anything unrecognised both map to false (the conservative default).
+ */
+export function parseTriggerResponse(response: string): boolean {
+  return response.trim().toUpperCase().startsWith("YES");
+}
+// ---------------------------------------------------------------------------
+// Batch prompt building
+// ---------------------------------------------------------------------------
+/**
+ * Build a batch trigger check prompt covering several queries at once.
+ *
+ * @param description - Skill description the queries are judged against.
+ * @param queries - Queries to classify; each is listed as `N. "query"`,
+ *   numbered from 1.
+ * @returns Prompt text asking for one numbered YES/NO answer per line.
+ */
+export function buildBatchTriggerCheckPrompt(description: string, queries: string[]): string {
+  const header =
+    "Given this skill description, would each query trigger this skill?\n" +
+    "Respond with the query number followed by YES or NO, one per line.";
+  const listing = queries.map((query, index) => `${index + 1}. "${query}"`).join("\n");
+  return `${header}\n\nSkill description:\n${description}\n\nQueries:\n${listing}`;
+}
+// ---------------------------------------------------------------------------
+// Batch response parsing
+// ---------------------------------------------------------------------------
+/**
+ * Parse a batch YES/NO response into booleans aligned with the query order.
+ *
+ * Each response line is expected to start with a 1-based query number followed
+ * by `.`, `)`, `:` or whitespace and then the answer. A slot becomes true only
+ * when its answer starts with "YES" (case-insensitive); lines that do not
+ * parse, out-of-range numbers, and missing entries leave the slot false.
+ *
+ * @param response - Raw model output.
+ * @param queryCount - Number of queries that were asked.
+ * @returns Array of length `queryCount`.
+ */
+export function parseBatchTriggerResponse(response: string, queryCount: number): boolean[] {
+  const verdicts: boolean[] = new Array(queryCount).fill(false);
+  for (const rawLine of response.trim().split("\n")) {
+    // Accepted prefixes: "1. YES", "1: YES", "1 YES", "1) YES"
+    const parsed = /^(\d+)[.):\s]+\s*(.*)/.exec(rawLine.trim());
+    if (parsed === null) continue;
+    const slot = Number.parseInt(parsed[1], 10) - 1; // 1-based to 0-based
+    const inRange = slot >= 0 && slot < queryCount;
+    if (inRange && parsed[2].trim().toUpperCase().startsWith("YES")) {
+      verdicts[slot] = true;
+    }
+  }
+  return verdicts;
+}

package/cli/selftune/utils/tui.ts ADDED Viewed

@@ -0,0 +1,156 @@
+/**
+ * tui.ts
+ *
+ * Zero-dependency TUI primitives for the selftune evolve pipeline.
+ * Uses raw ANSI escape codes for spinners, timers, and step progression.
+ * All output goes to stderr to keep stdout clean for JSON results.
+ */
+/** Spinner glyphs, shown one per tick in this order. */
+const SPINNER_FRAMES = Array.from("⠋⠙⠹⠸⠼⠴⠦⠧⠇⠏");
+/** Milliseconds between spinner redraws. */
+const TICK_MS = 80;
+export interface EvolveTUI {
+  /** Start a new step with a spinner. A step that is still active is first completed with a checkmark under its own label. */
+  step(label: string): void;
+  /** Complete the current step with a checkmark, printing `label` in place of the step's original label. */
+  done(label: string): void;
+  /** Complete the current step as failed with a cross mark, printing `label` in place of the step's original label. */
+  fail(label: string): void;
+  /** Stop all timers and print a summary line. */
+  finish(summary: string): void;
+  /** Clean up timers without printing a summary. Intended for error paths. */
+  destroy(): void;
+}
+/** Build an EvolveTUI whose methods all do nothing. */
+function createNoopTUI(): EvolveTUI {
+  const ignore = (): void => {};
+  return { step: ignore, done: ignore, fail: ignore, finish: ignore, destroy: ignore };
+}
+/**
+ * Create the stderr progress reporter for an evolve run.
+ *
+ * Returns the no-op implementation when stderr is not a TTY, unless the
+ * SELFTUNE_TUI_FORCE environment variable is set. Otherwise prints a header
+ * immediately and returns an object that draws a spinner row with an elapsed
+ * time for the active step and rewrites that row when the step ends. When
+ * NO_COLOR is set, ASCII markers (`>`, `+`, `x`) replace the spinner glyphs,
+ * checkmark, and cross mark.
+ *
+ * @param opts - Skill name and model shown in the header line.
+ * @returns The reporter; after `finish()` or `destroy()` every method is a no-op.
+ */
+export function createEvolveTUI(opts: { skillName: string; model: string }): EvolveTUI {
+  const plain = !!process.env.NO_COLOR;
+  const interactive = !!process.stderr.isTTY;
+  // If not a TTY, return no-op to avoid ANSI noise in pipes/tests
+  if (!interactive && !process.env.SELFTUNE_TUI_FORCE) {
+    return createNoopTUI();
+  }
+  const emit = (text: string) => process.stderr.write(text);
+  let frameIndex = 0;
+  let startedAt = Date.now();
+  let activeLabel = "";
+  let spinnerVisible = false;
+  let timer: ReturnType<typeof setInterval> | null = null;
+  let closed = false;
+  const okMark = plain ? "+" : "\u2713";
+  const failMark = plain ? "x" : "\u2717";
+  // Print header
+  emit(`\n  selftune evolve \u2500\u2500 ${opts.skillName} \u2500\u2500 ${opts.model}\n\n`);
+  const seconds = (ms: number): string => `${(ms / 1000).toFixed(1)}s`;
+  // Spinner rows and completed rows share one layout: marker, label, padding
+  // out to column 48 (at least one space), then the elapsed time.
+  const emitRow = (marker: string, label: string, elapsedMs: number): void => {
+    const gap = " ".repeat(Math.max(1, 48 - label.length));
+    emit(`  ${marker} ${label}${gap}${seconds(elapsedMs)}\n`);
+  };
+  const eraseSpinner = (): void => {
+    // Move the cursor up one line and clear it, so the next row overwrites
+    // the spinner row.
+    if (spinnerVisible) emit("\x1b[A\x1b[2K");
+  };
+  const drawSpinner = (): void => {
+    const glyph = plain ? ">" : SPINNER_FRAMES[frameIndex % SPINNER_FRAMES.length];
+    emitRow(glyph, activeLabel, Date.now() - startedAt);
+    spinnerVisible = true;
+  };
+  const haltTimer = (): void => {
+    if (timer === null) return;
+    clearInterval(timer);
+    timer = null;
+  };
+  const beginSpinner = (label: string): void => {
+    activeLabel = label;
+    startedAt = Date.now();
+    frameIndex = 0;
+    drawSpinner();
+    timer = setInterval(() => {
+      frameIndex += 1;
+      eraseSpinner();
+      drawSpinner();
+    }, TICK_MS);
+  };
+  // Replace the live spinner row with a final row carrying `marker`.
+  const settleActive = (marker: string, label: string): void => {
+    const elapsedMs = Date.now() - startedAt;
+    haltTimer();
+    eraseSpinner();
+    spinnerVisible = false;
+    emitRow(marker, label, elapsedMs);
+  };
+  // done() and fail() differ only in the marker they print.
+  const conclude = (marker: string, label: string): void => {
+    if (closed) return;
+    if (spinnerVisible) {
+      settleActive(marker, label);
+    } else {
+      // No active spinner — instant step
+      emitRow(marker, label, 0);
+    }
+    activeLabel = "";
+  };
+  return {
+    step(label: string): void {
+      if (closed) return;
+      // Complete previous step if there was one
+      if (spinnerVisible) settleActive(okMark, activeLabel);
+      beginSpinner(label);
+    },
+    done(label: string): void {
+      conclude(okMark, label);
+    },
+    fail(label: string): void {
+      conclude(failMark, label);
+    },
+    finish(summary: string): void {
+      if (closed) return;
+      if (spinnerVisible) settleActive(okMark, activeLabel);
+      haltTimer();
+      emit(`\n  ${summary}\n`);
+      closed = true;
+    },
+    destroy(): void {
+      if (closed) return;
+      haltTimer();
+      eraseSpinner();
+      spinnerVisible = false;
+      closed = true;
+    },
+  };
+}