npm - selftune - Versions diffs - 0.1.4 → 0.2.1 - Mend

selftune 0.1.4 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (153) hide show

package/.claude/agents/diagnosis-analyst.md +156 -0
package/.claude/agents/evolution-reviewer.md +180 -0
package/.claude/agents/integration-guide.md +212 -0
package/.claude/agents/pattern-analyst.md +160 -0
package/CHANGELOG.md +46 -1
package/README.md +105 -257
package/apps/local-dashboard/dist/assets/geist-cyrillic-wght-normal-CHSlOQsW.woff2 +0 -0
package/apps/local-dashboard/dist/assets/geist-latin-ext-wght-normal-DMtmJ5ZE.woff2 +0 -0
package/apps/local-dashboard/dist/assets/geist-latin-wght-normal-Dm3htQBi.woff2 +0 -0
package/apps/local-dashboard/dist/assets/index-C4EOTFZ2.js +15 -0
package/apps/local-dashboard/dist/assets/index-bl-Webyd.css +1 -0
package/apps/local-dashboard/dist/assets/vendor-react-U7zYD9Rg.js +60 -0
package/apps/local-dashboard/dist/assets/vendor-table-B7VF2Ipl.js +26 -0
package/apps/local-dashboard/dist/assets/vendor-ui-D7_zX_qy.js +346 -0
package/apps/local-dashboard/dist/favicon.png +0 -0
package/apps/local-dashboard/dist/index.html +17 -0
package/apps/local-dashboard/dist/logo.png +0 -0
package/apps/local-dashboard/dist/logo.svg +9 -0
package/assets/BeforeAfter.gif +0 -0
package/assets/FeedbackLoop.gif +0 -0
package/assets/logo.svg +9 -0
package/assets/skill-health-badge.svg +20 -0
package/cli/selftune/activation-rules.ts +171 -0
package/cli/selftune/badge/badge-data.ts +108 -0
package/cli/selftune/badge/badge-svg.ts +212 -0
package/cli/selftune/badge/badge.ts +99 -0
package/cli/selftune/canonical-export.ts +183 -0
package/cli/selftune/constants.ts +103 -1
package/cli/selftune/contribute/bundle.ts +314 -0
package/cli/selftune/contribute/contribute.ts +214 -0
package/cli/selftune/contribute/sanitize.ts +162 -0
package/cli/selftune/cron/setup.ts +266 -0
package/cli/selftune/dashboard-contract.ts +202 -0
package/cli/selftune/dashboard-server.ts +1049 -0
package/cli/selftune/dashboard.ts +43 -156
package/cli/selftune/eval/baseline.ts +248 -0
package/cli/selftune/eval/composability-v2.ts +273 -0
package/cli/selftune/eval/composability.ts +117 -0
package/cli/selftune/eval/generate-unit-tests.ts +143 -0
package/cli/selftune/eval/hooks-to-evals.ts +101 -16
package/cli/selftune/eval/import-skillsbench.ts +221 -0
package/cli/selftune/eval/synthetic-evals.ts +172 -0
package/cli/selftune/eval/unit-test-cli.ts +152 -0
package/cli/selftune/eval/unit-test.ts +196 -0
package/cli/selftune/evolution/deploy-proposal.ts +142 -1
package/cli/selftune/evolution/evidence.ts +26 -0
package/cli/selftune/evolution/evolve-body.ts +586 -0
package/cli/selftune/evolution/evolve.ts +825 -116
package/cli/selftune/evolution/extract-patterns.ts +105 -16
package/cli/selftune/evolution/pareto.ts +314 -0
package/cli/selftune/evolution/propose-body.ts +171 -0
package/cli/selftune/evolution/propose-description.ts +100 -2
package/cli/selftune/evolution/propose-routing.ts +166 -0
package/cli/selftune/evolution/refine-body.ts +141 -0
package/cli/selftune/evolution/rollback.ts +21 -4
package/cli/selftune/evolution/validate-body.ts +254 -0
package/cli/selftune/evolution/validate-proposal.ts +257 -35
package/cli/selftune/evolution/validate-routing.ts +177 -0
package/cli/selftune/grading/auto-grade.ts +200 -0
package/cli/selftune/grading/grade-session.ts +513 -42
package/cli/selftune/grading/pre-gates.ts +104 -0
package/cli/selftune/grading/results.ts +42 -0
package/cli/selftune/hooks/auto-activate.ts +185 -0
package/cli/selftune/hooks/evolution-guard.ts +165 -0
package/cli/selftune/hooks/prompt-log.ts +172 -2
package/cli/selftune/hooks/session-stop.ts +123 -3
package/cli/selftune/hooks/skill-change-guard.ts +112 -0
package/cli/selftune/hooks/skill-eval.ts +119 -3
package/cli/selftune/index.ts +415 -48
package/cli/selftune/ingestors/claude-replay.ts +377 -0
package/cli/selftune/ingestors/codex-rollout.ts +345 -46
package/cli/selftune/ingestors/codex-wrapper.ts +207 -39
package/cli/selftune/ingestors/openclaw-ingest.ts +573 -0
package/cli/selftune/ingestors/opencode-ingest.ts +193 -17
package/cli/selftune/init.ts +376 -16
package/cli/selftune/last.ts +14 -5
package/cli/selftune/localdb/db.ts +63 -0
package/cli/selftune/localdb/materialize.ts +428 -0
package/cli/selftune/localdb/queries.ts +376 -0
package/cli/selftune/localdb/schema.ts +204 -0
package/cli/selftune/memory/writer.ts +447 -0
package/cli/selftune/monitoring/watch.ts +90 -16
package/cli/selftune/normalization.ts +682 -0
package/cli/selftune/observability.ts +19 -44
package/cli/selftune/orchestrate.ts +1073 -0
package/cli/selftune/quickstart.ts +203 -0
package/cli/selftune/repair/skill-usage.ts +576 -0
package/cli/selftune/schedule.ts +561 -0
package/cli/selftune/status.ts +59 -33
package/cli/selftune/sync.ts +627 -0
package/cli/selftune/types.ts +525 -5
package/cli/selftune/utils/canonical-log.ts +45 -0
package/cli/selftune/utils/frontmatter.ts +217 -0
package/cli/selftune/utils/hooks.ts +41 -0
package/cli/selftune/utils/html.ts +27 -0
package/cli/selftune/utils/llm-call.ts +103 -19
package/cli/selftune/utils/math.ts +10 -0
package/cli/selftune/utils/query-filter.ts +139 -0
package/cli/selftune/utils/skill-discovery.ts +340 -0
package/cli/selftune/utils/skill-log.ts +68 -0
package/cli/selftune/utils/skill-usage-confidence.ts +18 -0
package/cli/selftune/utils/transcript.ts +307 -26
package/cli/selftune/utils/trigger-check.ts +89 -0
package/cli/selftune/utils/tui.ts +156 -0
package/cli/selftune/workflows/discover.ts +254 -0
package/cli/selftune/workflows/skill-md-writer.ts +288 -0
package/cli/selftune/workflows/workflows.ts +188 -0
package/package.json +28 -11
package/packages/telemetry-contract/README.md +11 -0
package/packages/telemetry-contract/fixtures/golden.json +87 -0
package/packages/telemetry-contract/fixtures/golden.test.ts +42 -0
package/packages/telemetry-contract/index.ts +1 -0
package/packages/telemetry-contract/package.json +19 -0
package/packages/telemetry-contract/src/index.ts +2 -0
package/packages/telemetry-contract/src/types.ts +163 -0
package/packages/telemetry-contract/src/validators.ts +109 -0
package/skill/SKILL.md +180 -33
package/skill/Workflows/AutoActivation.md +145 -0
package/skill/Workflows/Badge.md +124 -0
package/skill/Workflows/Baseline.md +144 -0
package/skill/Workflows/Composability.md +107 -0
package/skill/Workflows/Contribute.md +94 -0
package/skill/Workflows/Cron.md +132 -0
package/skill/Workflows/Dashboard.md +214 -0
package/skill/Workflows/Doctor.md +63 -14
package/skill/Workflows/Evals.md +110 -18
package/skill/Workflows/EvolutionMemory.md +154 -0
package/skill/Workflows/Evolve.md +181 -21
package/skill/Workflows/EvolveBody.md +159 -0
package/skill/Workflows/Grade.md +36 -31
package/skill/Workflows/ImportSkillsBench.md +117 -0
package/skill/Workflows/Ingest.md +142 -21
package/skill/Workflows/Initialize.md +91 -23
package/skill/Workflows/Orchestrate.md +139 -0
package/skill/Workflows/Replay.md +91 -0
package/skill/Workflows/Rollback.md +23 -4
package/skill/Workflows/Schedule.md +61 -0
package/skill/Workflows/Sync.md +88 -0
package/skill/Workflows/UnitTest.md +150 -0
package/skill/Workflows/Watch.md +33 -1
package/skill/Workflows/Workflows.md +129 -0
package/skill/assets/activation-rules-default.json +26 -0
package/skill/assets/multi-skill-settings.json +63 -0
package/skill/assets/single-skill-settings.json +57 -0
package/skill/references/invocation-taxonomy.md +2 -2
package/skill/references/logs.md +164 -2
package/skill/references/setup-patterns.md +65 -0
package/skill/references/version-history.md +40 -0
package/skill/settings_snippet.json +23 -0
package/templates/activation-rules-default.json +27 -0
package/templates/multi-skill-settings.json +64 -0
package/templates/single-skill-settings.json +58 -0
package/dashboard/index.html +0 -1119

package/cli/selftune/memory/writer.ts ADDED Viewed

@@ -0,0 +1,447 @@
+/**
+ * Memory writer — pure functions for reading/writing evolution memory files.
+ *
+ * Memory files live at ~/.selftune/memory/ and provide human-readable session
+ * context that survives context resets. Three files:
+ *   - context.md  — active evolutions, known issues
+ *   - plan.md     — current priorities, strategy
+ *   - decisions.md — append-only decision log
+ *
+ * All functions accept an optional memoryDir parameter for testability.
+ * Default: MEMORY_DIR from constants.
+ */
+import { appendFileSync, existsSync, mkdirSync, readFileSync, writeFileSync } from "node:fs";
+import { join } from "node:path";
+import { MEMORY_DIR } from "../constants.js";
+import type { EvolveResult } from "../evolution/evolve.js";
+import type { RollbackResult } from "../evolution/rollback.js";
+import type {
+  DecisionRecord,
+  EvolutionProposal,
+  MemoryContext,
+  MemoryPlan,
+  MonitoringSnapshot,
+} from "../types.js";
+// ---------------------------------------------------------------------------
+// Directory management
+// ---------------------------------------------------------------------------
+/**
+ * Make sure the memory directory exists, creating it (and any missing
+ * parents) when nothing is present at that path yet.
+ *
+ * @param memoryDir - Directory to create; defaults to MEMORY_DIR.
+ */
+export function ensureMemoryDir(memoryDir: string = MEMORY_DIR): void {
+  // Nothing to do when something already exists at the path.
+  if (existsSync(memoryDir)) return;
+  mkdirSync(memoryDir, { recursive: true });
+}
+// ---------------------------------------------------------------------------
+// context.md
+// ---------------------------------------------------------------------------
+/**
+ * Render a MemoryContext as the markdown document stored in context.md.
+ *
+ * Layout: a "# Selftune Context" title followed by "## Active Evolutions",
+ * "## Known Issues" and "## Last Updated" sections. An empty list is written
+ * as a single "- (none)" placeholder bullet.
+ *
+ * Each bullet has to fit on one physical line because parseContext reads the
+ * document line by line. Line breaks inside a field are therefore folded into
+ * single spaces; otherwise a multi-line description would be truncated on
+ * read-back and could inject stray bullets or headings.
+ *
+ * @param data - Context to serialize.
+ * @returns Markdown text terminated by a newline.
+ */
+function formatContext(data: MemoryContext): string {
+  // Collapse every run of line breaks (plus surrounding whitespace) to one space.
+  const oneLine = (value: string): string => String(value).replace(/\s*[\r\n]+\s*/g, " ");
+  const evolutionLines = data.activeEvolutions.map(
+    (evo) => `- ${oneLine(evo.skillName)}: ${oneLine(evo.status)} — ${oneLine(evo.description)}`,
+  );
+  const issueLines = data.knownIssues.map((issue) => `- ${oneLine(issue)}`);
+  return [
+    "# Selftune Context",
+    "",
+    "## Active Evolutions",
+    ...(evolutionLines.length > 0 ? evolutionLines : ["- (none)"]),
+    "",
+    "## Known Issues",
+    ...(issueLines.length > 0 ? issueLines : ["- (none)"]),
+    "",
+    "## Last Updated",
+    data.lastUpdated,
+    "",
+  ].join("\n");
+}
+/**
+ * Parse the markdown text of context.md back into a MemoryContext.
+ *
+ * The text is scanned line by line. The three known "## " headings select the
+ * section being read, any "# " title line clears it, and "- (none)"
+ * placeholder bullets are ignored. Evolution bullets have the shape
+ * "- skillName: status — description"; bullets without a colon are skipped and
+ * bullets without an em dash get an empty description. Only the first
+ * non-empty line after "## Last Updated" is kept.
+ *
+ * @param content - Raw markdown text.
+ * @returns The parsed context; fields that are absent stay empty.
+ */
+function parseContext(content: string): MemoryContext {
+  const sectionByHeading = new Map<string, string>([
+    ["## Active Evolutions", "evolutions"],
+    ["## Known Issues", "issues"],
+    ["## Last Updated", "updated"],
+  ]);
+  const parsed: MemoryContext = { activeEvolutions: [], knownIssues: [], lastUpdated: "" };
+  let current = "";
+  for (const rawLine of content.split("\n")) {
+    const text = rawLine.trim();
+    const heading = sectionByHeading.get(text);
+    if (heading !== undefined) {
+      current = heading;
+      continue;
+    }
+    if (text.startsWith("# ")) {
+      current = "";
+      continue;
+    }
+    const isBullet = text.startsWith("- ") && text !== "- (none)";
+    switch (current) {
+      case "evolutions": {
+        if (!isBullet) break;
+        // Format: "- skillName: status — description"
+        const entry = text.slice(2);
+        const colonAt = entry.indexOf(":");
+        if (colonAt === -1) break;
+        const skillName = entry.slice(0, colonAt).trim();
+        const remainder = entry.slice(colonAt + 1).trim();
+        const dashAt = remainder.indexOf("—");
+        const status = dashAt === -1 ? remainder.trim() : remainder.slice(0, dashAt).trim();
+        const description = dashAt === -1 ? "" : remainder.slice(dashAt + 1).trim();
+        parsed.activeEvolutions.push({ skillName, status, description });
+        break;
+      }
+      case "issues":
+        if (isBullet) parsed.knownIssues.push(text.slice(2));
+        break;
+      case "updated":
+        if (text.length > 0) {
+          parsed.lastUpdated = text;
+          // Anything after the timestamp line is ignored.
+          current = "";
+        }
+        break;
+    }
+  }
+  return parsed;
+}
+/**
+ * Serialize the context and overwrite context.md inside the memory directory,
+ * creating the directory first when it is missing.
+ *
+ * @param data - Context to persist.
+ * @param memoryDir - Target directory; defaults to MEMORY_DIR.
+ */
+export function writeContext(data: MemoryContext, memoryDir: string = MEMORY_DIR): void {
+  ensureMemoryDir(memoryDir);
+  const markdown = formatContext(data);
+  writeFileSync(join(memoryDir, "context.md"), markdown, "utf-8");
+}
+/**
+ * Load context.md from the memory directory.
+ *
+ * @param memoryDir - Directory to read from; defaults to MEMORY_DIR.
+ * @returns The parsed context, or an empty context when the file does not exist.
+ */
+export function readContext(memoryDir: string = MEMORY_DIR): MemoryContext {
+  const contextFile = join(memoryDir, "context.md");
+  return existsSync(contextFile)
+    ? parseContext(readFileSync(contextFile, "utf-8"))
+    : { activeEvolutions: [], knownIssues: [], lastUpdated: "" };
+}
+// ---------------------------------------------------------------------------
+// plan.md
+// ---------------------------------------------------------------------------
+/**
+ * Render a MemoryPlan as the markdown document stored in plan.md.
+ *
+ * Priorities become a numbered list starting at 1 (or the placeholder
+ * "1. (none)" when the list is empty), and a falsy strategy is written as
+ * "(no strategy defined)".
+ *
+ * @param data - Plan to serialize.
+ * @returns Markdown text terminated by a newline.
+ */
+function formatPlan(data: MemoryPlan): string {
+  const numbered = data.currentPriorities.map(
+    (priority, position) => `${position + 1}. ${priority}`,
+  );
+  const document = [
+    "# Evolution Plan",
+    "",
+    "## Current Priorities",
+    ...(numbered.length === 0 ? ["1. (none)"] : numbered),
+    "",
+    "## Strategy",
+    data.strategy || "(no strategy defined)",
+    "",
+    "## Last Updated",
+    data.lastUpdated,
+    "",
+  ];
+  return document.join("\n");
+}
+/**
+ * Parse the markdown text of plan.md back into a MemoryPlan.
+ *
+ * The text is scanned line by line. The three known "## " headings select the
+ * section being read and any "# " title line clears it. Priorities are lines
+ * of the form "N. text"; the "(none)" placeholder is ignored. The strategy is
+ * the first non-empty line of its section, ignoring the
+ * "(no strategy defined)" placeholder. Only the first non-empty line after
+ * "## Last Updated" is kept.
+ *
+ * @param content - Raw markdown text.
+ * @returns The parsed plan; fields that are absent stay empty.
+ */
+function parsePlan(content: string): MemoryPlan {
+  const result: MemoryPlan = {
+    currentPriorities: [],
+    strategy: "",
+    lastUpdated: "",
+  };
+  let section = "";
+  for (const line of content.split("\n")) {
+    const trimmed = line.trim();
+    if (trimmed === "## Current Priorities") {
+      section = "priorities";
+      continue;
+    }
+    if (trimmed === "## Strategy") {
+      section = "strategy";
+      continue;
+    }
+    if (trimmed === "## Last Updated") {
+      section = "updated";
+      continue;
+    }
+    if (trimmed.startsWith("# ")) {
+      section = "";
+      continue;
+    }
+    if (section === "priorities") {
+      // Format: "1. priority text"
+      const match = trimmed.match(/^\d+\.\s+(.+)$/);
+      if (match && match[1] !== "(none)") {
+        result.currentPriorities.push(match[1]);
+      }
+    } else if (section === "strategy") {
+      // Intentionally keep only the FIRST non-empty line as the strategy. The
+      // emptiness guard matters: without it each later line of a multi-line
+      // strategy would overwrite the earlier one and the last line would win.
+      if (
+        result.strategy === "" &&
+        trimmed.length > 0 &&
+        trimmed !== "(no strategy defined)"
+      ) {
+        result.strategy = trimmed;
+      }
+    } else if (section === "updated" && trimmed.length > 0) {
+      result.lastUpdated = trimmed;
+      // Anything after the timestamp line is ignored.
+      section = "";
+    }
+  }
+  return result;
+}
+/**
+ * Serialize the plan and overwrite plan.md inside the memory directory,
+ * creating the directory first when it is missing.
+ *
+ * @param data - Plan to persist.
+ * @param memoryDir - Target directory; defaults to MEMORY_DIR.
+ */
+export function writePlan(data: MemoryPlan, memoryDir: string = MEMORY_DIR): void {
+  ensureMemoryDir(memoryDir);
+  const markdown = formatPlan(data);
+  writeFileSync(join(memoryDir, "plan.md"), markdown, "utf-8");
+}
+/**
+ * Load plan.md from the memory directory.
+ *
+ * @param memoryDir - Directory to read from; defaults to MEMORY_DIR.
+ * @returns The parsed plan, or an empty plan when the file does not exist.
+ */
+export function readPlan(memoryDir: string = MEMORY_DIR): MemoryPlan {
+  const planFile = join(memoryDir, "plan.md");
+  return existsSync(planFile)
+    ? parsePlan(readFileSync(planFile, "utf-8"))
+    : { currentPriorities: [], strategy: "", lastUpdated: "" };
+}
+// ---------------------------------------------------------------------------
+// decisions.md (append-only)
+// ---------------------------------------------------------------------------
+/**
+ * Render one decision record as a markdown entry for decisions.md.
+ *
+ * The entry is a "## timestamp — actionType" heading, four
+ * "- **Field:** value" bullets, a blank line and a "---" separator line.
+ *
+ * parseDecisions splits the log on "---" lines and reads one field per line,
+ * so line breaks inside a field are folded into single spaces. Without that, a
+ * multi-line rationale would be truncated on read-back and an embedded "---"
+ * line would cut the record in two.
+ *
+ * @param record - Decision to serialize.
+ * @returns Markdown text terminated by a newline after the separator.
+ */
+function formatDecisionEntry(record: DecisionRecord): string {
+  // Collapse every run of line breaks (plus surrounding whitespace) to one space.
+  const oneLine = (value: string): string => String(value).replace(/\s*[\r\n]+\s*/g, " ");
+  const lines: string[] = [
+    `## ${oneLine(record.timestamp)} — ${oneLine(record.actionType)}`,
+    `- **Skill:** ${oneLine(record.skillName)}`,
+    `- **Action:** ${oneLine(record.action)}`,
+    `- **Rationale:** ${oneLine(record.rationale)}`,
+    `- **Result:** ${oneLine(record.result)}`,
+    "",
+    "---",
+    "",
+  ];
+  return lines.join("\n");
+}
+/**
+ * Parse the markdown text of decisions.md into decision records.
+ *
+ * The text is split on lines consisting solely of "---". Within each chunk a
+ * "## timestamp — actionType" heading and the "- **Field:** value" bullets
+ * are read. An unrecognised action value leaves the default "watched" in
+ * place. A chunk only yields a record when it has both a timestamp and a
+ * skill name.
+ *
+ * @param content - Raw markdown text.
+ * @returns Records in file order.
+ */
+function parseDecisions(content: string): DecisionRecord[] {
+  const SKILL = "- **Skill:**";
+  const ACTION = "- **Action:**";
+  const RATIONALE = "- **Rationale:**";
+  const RESULT = "- **Result:**";
+  const parsed: DecisionRecord[] = [];
+  // Split on --- separators
+  for (const chunk of content.split(/^---$/m)) {
+    const entry: DecisionRecord = {
+      timestamp: "",
+      actionType: "",
+      skillName: "",
+      action: "watched",
+      rationale: "",
+      result: "",
+    };
+    for (const rawLine of chunk.split("\n")) {
+      const text = rawLine.trim();
+      if (text.length === 0) continue;
+      // Header: "## 2026-03-01T00:00:00Z — evolve"
+      const header = /^## (.+?) — (.+)$/.exec(text);
+      if (header) {
+        entry.timestamp = header[1];
+        entry.actionType = header[2];
+        continue;
+      }
+      if (text.startsWith(SKILL)) {
+        entry.skillName = text.slice(SKILL.length).trim();
+      } else if (text.startsWith(ACTION)) {
+        const value = text.slice(ACTION.length).trim();
+        if (value === "evolved" || value === "rolled-back" || value === "watched") {
+          entry.action = value;
+        }
+      } else if (text.startsWith(RATIONALE)) {
+        entry.rationale = text.slice(RATIONALE.length).trim();
+      } else if (text.startsWith(RESULT)) {
+        entry.result = text.slice(RESULT.length).trim();
+      }
+    }
+    if (entry.timestamp && entry.skillName) {
+      parsed.push(entry);
+    }
+  }
+  return parsed;
+}
+/**
+ * Append one decision entry to decisions.md in the memory directory.
+ *
+ * The directory is created when missing, and a new log file is started with
+ * a "# Decision Log" title before the first entry is appended.
+ *
+ * @param record - Decision to record.
+ * @param memoryDir - Target directory; defaults to MEMORY_DIR.
+ */
+export function appendDecision(record: DecisionRecord, memoryDir: string = MEMORY_DIR): void {
+  ensureMemoryDir(memoryDir);
+  const logFile = join(memoryDir, "decisions.md");
+  const logExists = existsSync(logFile);
+  if (!logExists) {
+    writeFileSync(logFile, "# Decision Log\n\n", "utf-8");
+  }
+  appendFileSync(logFile, formatDecisionEntry(record), "utf-8");
+}
+/**
+ * Load every decision recorded in decisions.md.
+ *
+ * @param memoryDir - Directory to read from; defaults to MEMORY_DIR.
+ * @returns Parsed records, or an empty array when the file does not exist.
+ */
+export function readDecisions(memoryDir: string = MEMORY_DIR): DecisionRecord[] {
+  const logFile = join(memoryDir, "decisions.md");
+  return existsSync(logFile) ? parseDecisions(readFileSync(logFile, "utf-8")) : [];
+}
+// ---------------------------------------------------------------------------
+// High-level helpers for integration
+// ---------------------------------------------------------------------------
+/**
+ * Record the outcome of an evolve run in the memory files.
+ *
+ * The skill's entry in context.md is replaced (or added) with status
+ * "deployed" or "failed", the context timestamp is refreshed, and an
+ * "evolve" entry is appended to decisions.md.
+ *
+ * @param skillName - Skill that was evolved.
+ * @param proposal - Proposal whose rationale is used as the description when non-empty.
+ * @param result - Evolve outcome; `deployed` selects the status, `reason` is the fallback text.
+ * @param memoryDir - Memory directory; defaults to MEMORY_DIR.
+ */
+export function updateContextAfterEvolve(
+  skillName: string,
+  proposal: EvolutionProposal,
+  result: EvolveResult,
+  memoryDir: string = MEMORY_DIR,
+): void {
+  const timestamp = new Date().toISOString();
+  const memory = readContext(memoryDir);
+  const entry = {
+    skillName,
+    status: result.deployed ? "deployed" : "failed",
+    description: proposal.rationale || result.reason,
+  };
+  // Replace the skill's existing entry in place, otherwise add a new one.
+  const existingAt = memory.activeEvolutions.findIndex((evo) => evo.skillName === skillName);
+  if (existingAt === -1) {
+    memory.activeEvolutions.push(entry);
+  } else {
+    memory.activeEvolutions[existingAt] = entry;
+  }
+  memory.lastUpdated = timestamp;
+  writeContext(memory, memoryDir);
+  const decision: DecisionRecord = {
+    timestamp,
+    actionType: "evolve",
+    skillName,
+    action: "evolved",
+    rationale: proposal.rationale || "Evolution triggered",
+    result: result.reason,
+  };
+  appendDecision(decision, memoryDir);
+}
+/**
+ * Record the outcome of a rollback in the memory files.
+ *
+ * The skill's entry in context.md is replaced (or added) with status
+ * "rolled-back" or "rollback-failed", the context timestamp is refreshed, and
+ * a "rollback" entry is appended to decisions.md.
+ *
+ * @param skillName - Skill that was rolled back.
+ * @param result - Rollback outcome; `rolledBack` selects the status, `reason` is the description.
+ * @param memoryDir - Memory directory; defaults to MEMORY_DIR.
+ */
+export function updateContextAfterRollback(
+  skillName: string,
+  result: RollbackResult,
+  memoryDir: string = MEMORY_DIR,
+): void {
+  const timestamp = new Date().toISOString();
+  const memory = readContext(memoryDir);
+  const succeeded = result.rolledBack;
+  const entry = {
+    skillName,
+    status: succeeded ? "rolled-back" : "rollback-failed",
+    description: result.reason,
+  };
+  // Replace the skill's existing entry in place, otherwise add a new one.
+  const existingAt = memory.activeEvolutions.findIndex((evo) => evo.skillName === skillName);
+  if (existingAt === -1) {
+    memory.activeEvolutions.push(entry);
+  } else {
+    memory.activeEvolutions[existingAt] = entry;
+  }
+  memory.lastUpdated = timestamp;
+  writeContext(memory, memoryDir);
+  const decision: DecisionRecord = {
+    timestamp,
+    actionType: "rollback",
+    skillName,
+    action: "rolled-back",
+    rationale: result.reason,
+    result: succeeded ? "Successfully rolled back" : "Rollback failed",
+  };
+  appendDecision(decision, memoryDir);
+}
+/**
+ * Record the outcome of a monitoring check in the memory files.
+ *
+ * The skill's entry in context.md is replaced (or added) with status
+ * "regression" or "healthy" plus the pass-rate figures. When a regression is
+ * detected, a known issue is added unless one is already listed for this
+ * skill. The context timestamp is refreshed and a "watch" entry is appended
+ * to decisions.md.
+ *
+ * @param skillName - Skill that was monitored.
+ * @param snapshot - Monitoring snapshot supplying pass_rate, baseline_pass_rate and regression_detected.
+ * @param memoryDir - Memory directory; defaults to MEMORY_DIR.
+ */
+export function updateContextAfterWatch(
+  skillName: string,
+  snapshot: MonitoringSnapshot,
+  memoryDir: string = MEMORY_DIR,
+): void {
+  const now = new Date().toISOString();
+  const context = readContext(memoryDir);
+  const passRate = snapshot.pass_rate.toFixed(2);
+  const baseline = snapshot.baseline_pass_rate.toFixed(2);
+  const status = snapshot.regression_detected ? "regression" : "healthy";
+  const description = `pass_rate=${passRate}, baseline=${baseline}`;
+  const idx = context.activeEvolutions.findIndex((e) => e.skillName === skillName);
+  if (idx >= 0) {
+    context.activeEvolutions[idx] = { skillName, status, description };
+  } else {
+    context.activeEvolutions.push({ skillName, status, description });
+  }
+  // Add known issue if regression detected
+  if (snapshot.regression_detected) {
+    // Match on the exact generated prefix (skill name plus colon). A plain
+    // substring test would let an existing issue for "pdf-tools" suppress the
+    // issue for "pdf".
+    const issuePrefix = `Regression detected for ${skillName}:`;
+    if (!context.knownIssues.some((issue) => issue.startsWith(issuePrefix))) {
+      context.knownIssues.push(`${issuePrefix} pass_rate=${passRate} below baseline=${baseline}`);
+    }
+  }
+  // NOTE(review): a listed regression is not removed here once the skill is
+  // healthy again — confirm whether something else prunes knownIssues.
+  context.lastUpdated = now;
+  writeContext(context, memoryDir);
+  appendDecision(
+    {
+      timestamp: now,
+      actionType: "watch",
+      skillName,
+      action: "watched",
+      rationale: `Monitoring check: pass_rate=${passRate}, regression=${snapshot.regression_detected}`,
+      result: snapshot.regression_detected
+        ? `Regression detected (pass_rate=${passRate})`
+        : `Healthy (pass_rate=${passRate})`,
+    },
+    memoryDir,
+  );
+}

package/cli/selftune/monitoring/watch.ts CHANGED Viewed

@@ -9,7 +9,10 @@
 import { parseArgs } from "node:util";
 import { QUERY_LOG, SKILL_LOG, TELEMETRY_LOG } from "../constants.js";
+import { classifyInvocation } from "../eval/hooks-to-evals.js";
 import { getLastDeployedProposal } from "../evolution/audit.js";
+import { updateContextAfterWatch } from "../memory/writer.js";
+import type { SyncResult } from "../sync.js";
 import type {
   InvocationType,
   MonitoringSnapshot,
@@ -18,6 +21,11 @@ import type {
   SkillUsageRecord,
 } from "../types.js";
 import { readJsonl } from "../utils/jsonl.js";
+import {
+  filterActionableQueryRecords,
+  filterActionableSkillUsageRecords,
+} from "../utils/query-filter.js";
+import { readEffectiveSkillUsageRecords } from "../utils/skill-log.js";
 // ---------------------------------------------------------------------------
 // Public interfaces
@@ -40,6 +48,10 @@ export interface WatchOptions {
     skillPath: string;
     proposalId?: string;
   }) => Promise<{ rolledBack: boolean; restoredDescription: string; reason: string }>;
+  /** Source-truth refresh before reading logs. */
+  syncFirst?: boolean;
+  syncForce?: boolean;
+  _syncFn?: typeof import("../sync.js").syncSources;
 }
 export interface WatchResult {
@@ -47,6 +59,7 @@ export interface WatchResult {
   alert: string | null;
   rolledBack: boolean;
   recommendation: string;
+  sync_result?: SyncResult;
 }
 // ---------------------------------------------------------------------------
@@ -55,6 +68,7 @@ export interface WatchResult {
 const DEFAULT_BASELINE_PASS_RATE = 0.5;
 const DEFAULT_REGRESSION_THRESHOLD = 0.1;
+export const MIN_MONITORING_SKILL_CHECKS = 3;
 // ---------------------------------------------------------------------------
 // computeMonitoringSnapshot - pure function
@@ -64,9 +78,9 @@ const DEFAULT_REGRESSION_THRESHOLD = 0.1;
  * Compute a monitoring snapshot from raw log records.
  *
  * The function windows telemetry to the last `windowSessions` entries, then
- * scopes skill and query records to those sessions. If telemetry is empty or
- * no records match the windowed session IDs, all provided skill/query records
- * are used directly (unfiltered by session).
+ * scopes skill and actionable query records to those sessions. If telemetry is
+ * empty or no records match the windowed session IDs, all provided skill/query
+ * records are used directly (unfiltered by session).
  *
  * @param skillName        - The skill to monitor
  * @param telemetry        - All session telemetry records
@@ -86,43 +100,53 @@ export function computeMonitoringSnapshot(
   regressionThreshold: number = DEFAULT_REGRESSION_THRESHOLD,
 ): MonitoringSnapshot {
   // 1. Window the telemetry to the last N sessions (by array order, assumed chronological)
+  const actionableSkillRecords = filterActionableSkillUsageRecords(skillRecords);
+  const actionableQueryRecords = filterActionableQueryRecords(queryRecords);
   const windowedTelemetry = telemetry.slice(-windowSessions);
   const windowedSessionIds = new Set(windowedTelemetry.map((t) => t.session_id));
   // 2. Filter skill records by skill name first
-  const skillNameFiltered = skillRecords.filter((r) => r.skill_name === skillName);
+  const skillNameFiltered = actionableSkillRecords.filter((r) => r.skill_name === skillName);
   // 3. Apply session ID windowing only if telemetry is present and overlaps
   const hasSessionOverlap =
     windowedSessionIds.size > 0 &&
     (skillNameFiltered.some((r) => windowedSessionIds.has(r.session_id)) ||
-      queryRecords.some((r) => windowedSessionIds.has(r.session_id)));
+      actionableQueryRecords.some((r) => windowedSessionIds.has(r.session_id)));
   const filteredSkillRecords = hasSessionOverlap
     ? skillNameFiltered.filter((r) => windowedSessionIds.has(r.session_id))
     : skillNameFiltered;
   const filteredQueryRecords = hasSessionOverlap
-    ? queryRecords.filter((r) => windowedSessionIds.has(r.session_id))
-    : queryRecords;
+    ? actionableQueryRecords.filter((r) => windowedSessionIds.has(r.session_id))
+    : actionableQueryRecords;
-  // 4. Compute pass rate: triggered_count / total_query_count
+  // 4. Compute pass rate from explicit skill checks, not from all queries.
   const triggeredCount = filteredSkillRecords.filter((r) => r.triggered).length;
-  const totalQueries = filteredQueryRecords.length;
-  const passRate = totalQueries === 0 ? 1.0 : triggeredCount / totalQueries;
+  const totalSkillChecks = filteredSkillRecords.length;
+  const passRate = totalSkillChecks === 0 ? 0 : triggeredCount / totalSkillChecks;
   // 5. Compute false negative rate from skill usage records
-  const totalSkillChecks = filteredSkillRecords.length;
   const falseNegatives = filteredSkillRecords.filter((r) => !r.triggered).length;
   const falseNegativeRate = totalSkillChecks === 0 ? 0 : falseNegatives / totalSkillChecks;
-  // 6. by_invocation_type: MVP classifies everything as "implicit"
+  // 6. by_invocation_type: classify each skill record using classifyInvocation
   const byInvocationType: Record<InvocationType, { passed: number; total: number }> = {
     explicit: { passed: 0, total: 0 },
-    implicit: { passed: triggeredCount, total: totalSkillChecks },
+    implicit: { passed: 0, total: 0 },
     contextual: { passed: 0, total: 0 },
     negative: { passed: 0, total: 0 },
   };
+  for (const record of filteredSkillRecords) {
+    const invType = classifyInvocation(
+      typeof record.query === "string" ? record.query : "",
+      skillName,
+    );
+    byInvocationType[invType].total++;
+    if (record.triggered) {
+      byInvocationType[invType].passed++;
+    }
+  }
   // 7. Regression detection: pass_rate < baseline - threshold
   // Use rounding to avoid floating-point boundary issues (e.g. 0.8 - 0.1 = 0.7000000000000001)
@@ -130,12 +154,16 @@ export function computeMonitoringSnapshot(
   const adjustedThreshold =
     Math.round((baselinePassRate - regressionThreshold) * precision) / precision;
   const roundedPassRate = Math.round(passRate * precision) / precision;
-  const regressionDetected = roundedPassRate < adjustedThreshold;
+  const hasEnoughSignalForRegression =
+    totalSkillChecks >= MIN_MONITORING_SKILL_CHECKS ||
+    (totalSkillChecks === 0 && filteredQueryRecords.length >= MIN_MONITORING_SKILL_CHECKS);
+  const regressionDetected = hasEnoughSignalForRegression && roundedPassRate < adjustedThreshold;
   return {
     timestamp: new Date().toISOString(),
     skill_name: skillName,
     window_sessions: windowSessions,
+    skill_checks: totalSkillChecks,
     pass_rate: passRate,
     false_negative_rate: falseNegativeRate,
     by_invocation_type: byInvocationType,
@@ -163,11 +191,28 @@ export async function watch(options: WatchOptions): Promise<WatchResult> {
     _queryLogPath = QUERY_LOG,
     _auditLogPath,
     _rollbackFn,
+    syncFirst = false,
+    syncForce = false,
+    _syncFn,
   } = options;
+  let syncResult: SyncResult | undefined;
+  if (syncFirst) {
+    const { createDefaultSyncOptions, syncSources: realSyncSources } = await import("../sync.js");
+    const syncRunner = _syncFn ?? realSyncSources;
+    syncResult = syncRunner(
+      createDefaultSyncOptions({
+        force: syncForce,
+      }),
+    );
+  }
   // 1. Read log files
   const telemetry = readJsonl<SessionTelemetryRecord>(_telemetryLogPath);
-  const skillRecords = readJsonl<SkillUsageRecord>(_skillLogPath);
+  const skillRecords =
+    _skillLogPath === SKILL_LOG
+      ? readEffectiveSkillUsageRecords()
+      : readJsonl<SkillUsageRecord>(_skillLogPath);
   const queryRecords = readJsonl<QueryLogRecord>(_queryLogPath);
   // 2. Determine baseline pass rate from last deployed audit entry
@@ -208,15 +253,34 @@ export async function watch(options: WatchOptions): Promise<WatchResult> {
     recommendation = rolledBack
       ? `Rolled back "${skillName}" to previous version. Monitor to confirm recovery.`
       : `Consider running: selftune rollback --skill "${skillName}" --skill-path "${skillPath}"`;
+  } else if (snapshot.skill_checks < MIN_MONITORING_SKILL_CHECKS) {
+    recommendation =
+      `Skill "${skillName}" has only ${snapshot.skill_checks} actionable check(s) in the current window. ` +
+      `Need at least ${MIN_MONITORING_SKILL_CHECKS} before calling it stable.`;
   } else {
     recommendation = `Skill "${skillName}" is stable. Pass rate ${snapshot.pass_rate.toFixed(2)} is within acceptable range of baseline ${baselinePassRate.toFixed(2)}.`;
   }
+  // Update evolution memory (fail-open)
+  try {
+    updateContextAfterWatch(skillName, snapshot);
+  } catch (err) {
+    // Fail-open: memory writes should never fail the main operation
+    console.error(
+      JSON.stringify({
+        level: "debug",
+        code: "memory_write_failed",
+        message: `Failed to update memory after watch for "${skillName}": ${err instanceof Error ? err.message : String(err)}`,
+      }),
+    );
+  }
   return {
     snapshot,
     alert,
     rolledBack,
     recommendation,
+    ...(syncResult ? { sync_result: syncResult } : {}),
   };
 }
@@ -260,6 +324,8 @@ export async function cliMain(): Promise<void> {
       window: { type: "string", default: "20" },
       threshold: { type: "string", default: "0.1" },
       "auto-rollback": { type: "boolean", default: false },
+      "sync-first": { type: "boolean", default: false },
+      "sync-force": { type: "boolean", default: false },
       help: { type: "boolean", default: false },
     },
     strict: true,
@@ -277,6 +343,8 @@ Options:
   --window            Number of recent sessions to consider (default: 20)
   --threshold         Regression threshold below baseline (default: 0.1)
   --auto-rollback     Automatically rollback on regression detection
+  --sync-first        Refresh source-truth telemetry before reading watch inputs
+  --sync-force        Force a full rescan during --sync-first
   --help              Show this help message`);
     process.exit(0);
   }
@@ -285,6 +353,10 @@ Options:
     console.error("[ERROR] --skill and --skill-path are required");
     process.exit(1);
   }
+  if ((values["sync-force"] ?? false) && !(values["sync-first"] ?? false)) {
+    console.error("[ERROR] --sync-force requires --sync-first");
+    process.exit(1);
+  }
   const rawWindow = values.window ?? "20";
   if (!/^\d+$/.test(rawWindow)) {
@@ -314,6 +386,8 @@ Options:
     windowSessions,
     regressionThreshold,
     autoRollback: values["auto-rollback"] ?? false,
+    syncFirst: values["sync-first"] ?? false,
+    syncForce: values["sync-force"] ?? false,
   });
   console.log(JSON.stringify(result, null, 2));