npm - openhermes - Versions diffs - 4.3.0 → 4.11.2 - Mend

openhermes 4.3.0 → 4.11.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (143) hide show

package/CONTEXT.md +10 -1
package/README.md +54 -42
package/bootstrap.ts +396 -142
package/harness/agents/oh-browser.md +97 -0
package/harness/agents/oh-builder.md +78 -0
package/harness/agents/oh-facade.md +75 -0
package/harness/agents/oh-fusion.md +45 -0
package/harness/agents/oh-gauntlet.md +71 -0
package/harness/agents/oh-grill.md +71 -0
package/harness/agents/oh-investigate.md +60 -0
package/harness/agents/oh-manifest.md +95 -0
package/harness/agents/oh-plan-review.md +40 -0
package/harness/agents/oh-planner.md +50 -0
package/harness/agents/oh-refactor.md +37 -0
package/harness/agents/oh-retro.md +46 -0
package/harness/agents/oh-review.md +85 -0
package/harness/agents/oh-security.md +83 -0
package/harness/agents/oh-ship.md +76 -0
package/harness/agents/oh-skill-craft.md +38 -0
package/harness/agents/openhermes.md +28 -73
package/harness/codex/AUTOPILOT.md +235 -87
package/harness/codex/CHARTER.md +80 -0
package/harness/instructions/SHELL.md +76 -0
package/harness/lib/background/background.test.ts +197 -0
package/harness/lib/background/index.ts +7 -0
package/harness/lib/background/interfaces.ts +31 -0
package/harness/lib/background/manager.ts +320 -0
package/harness/lib/composer/compose.test.ts +168 -0
package/harness/lib/composer/compose.ts +65 -0
package/harness/lib/composer/fragments/01-identity.md +1 -0
package/harness/lib/composer/fragments/02-delegation.md +6 -0
package/harness/lib/composer/fragments/03-permissions.md +13 -0
package/harness/lib/composer/fragments/04-task-flow.md +15 -0
package/harness/lib/composer/fragments/05-confidence.md +5 -0
package/harness/lib/composer/fragments/06-parallelization.md +17 -0
package/harness/lib/composer/fragments/07-shell.md +41 -0
package/harness/lib/composer/fragments/08-routing.md +8 -0
package/harness/lib/composer/fragments/09-guardrails.md +12 -0
package/harness/lib/composer/index.ts +1 -0
package/harness/lib/hooks/builtins/confidence-gate-hook.ts +70 -0
package/harness/lib/hooks/builtins/delegation-depth-hook.ts +59 -0
package/harness/lib/hooks/builtins/error-recovery-hook.ts +107 -0
package/harness/lib/hooks/builtins/memory-sync-hook.ts +73 -0
package/harness/lib/hooks/builtins/plan-check-hook.ts +43 -0
package/harness/lib/hooks/builtins/route-tracking-hook.ts +147 -0
package/harness/lib/hooks/builtins/sanity-check-hook.ts +52 -0
package/harness/lib/hooks/builtins/shell-detect-hook.ts +96 -0
package/harness/lib/hooks/hooks.test.ts +1016 -0
package/harness/lib/hooks/index.ts +30 -0
package/harness/lib/hooks/registry.ts +416 -0
package/harness/lib/hooks/types.ts +71 -0
package/harness/lib/memory/index.ts +18 -0
package/harness/lib/memory/interfaces.ts +53 -0
package/harness/lib/memory/memory-manager.ts +205 -0
package/harness/lib/memory/memory.test.ts +491 -0
package/harness/lib/memory/plan-store.ts +366 -0
package/harness/lib/recovery/handler.ts +243 -0
package/harness/lib/recovery/index.ts +14 -0
package/harness/lib/recovery/interfaces.ts +48 -0
package/harness/lib/recovery/patterns.ts +149 -0
package/harness/lib/recovery/recovery.test.ts +312 -0
package/harness/lib/sanity/anomaly-tracker.ts +127 -0
package/harness/lib/sanity/checker.ts +178 -0
package/harness/lib/sanity/index.ts +13 -0
package/harness/lib/sanity/interfaces.ts +24 -0
package/harness/lib/sanity/sanity.test.ts +472 -0
package/harness/lib/sync/file-watcher.ts +174 -0
package/harness/lib/sync/index.ts +11 -0
package/harness/lib/sync/interfaces.ts +27 -0
package/harness/lib/sync/plan-sync.ts +536 -0
package/harness/lib/sync/sync.test.ts +832 -0
package/harness/skills/oh-ascii/DEEP.md +292 -0
package/harness/skills/oh-ascii/SKILL.md +31 -0
package/harness/skills/oh-ascii/scripts/check_ascii_alignment.py +596 -0
package/harness/skills/oh-browser/DEEP.md +54 -0
package/harness/skills/oh-browser/SKILL.md +30 -0
package/harness/skills/oh-builder/DEEP.md +63 -0
package/harness/skills/oh-builder/SKILL.md +12 -90
package/harness/skills/oh-expert/DEEP.md +85 -0
package/harness/skills/oh-expert/SKILL.md +13 -106
package/harness/skills/oh-facade/DEEP.md +182 -0
package/harness/skills/oh-facade/SKILL.md +15 -279
package/harness/skills/oh-freeze/DEEP.md +18 -0
package/harness/skills/oh-freeze/SKILL.md +10 -19
package/harness/skills/oh-full-output/DEEP.md +25 -0
package/harness/skills/oh-full-output/SKILL.md +12 -65
package/harness/skills/oh-fusion/DEEP.md +120 -0
package/harness/skills/oh-fusion/SKILL.md +17 -295
package/harness/skills/oh-gauntlet/DEEP.md +77 -0
package/harness/skills/oh-gauntlet/SKILL.md +13 -105
package/harness/skills/oh-grill/DEEP.md +51 -0
package/harness/skills/oh-grill/SKILL.md +12 -63
package/harness/skills/oh-guard/DEEP.md +19 -0
package/harness/skills/oh-guard/SKILL.md +10 -24
package/harness/skills/oh-handoff/DEEP.md +48 -0
package/harness/skills/oh-handoff/SKILL.md +13 -23
package/harness/skills/oh-health/DEEP.md +74 -0
package/harness/skills/oh-health/SKILL.md +13 -76
package/harness/skills/oh-init/DEEP.md +85 -0
package/harness/skills/oh-init/SKILL.md +13 -127
package/harness/skills/oh-investigate/DEEP.md +171 -0
package/harness/skills/oh-investigate/SKILL.md +13 -66
package/harness/skills/oh-issue/DEEP.md +21 -0
package/harness/skills/oh-issue/SKILL.md +11 -27
package/harness/skills/oh-manifest/DEEP.md +92 -0
package/harness/skills/oh-manifest/SKILL.md +12 -109
package/harness/skills/oh-plan-review/DEEP.md +90 -0
package/harness/skills/oh-plan-review/SKILL.md +13 -115
package/harness/skills/oh-planner/DEEP.md +172 -0
package/harness/skills/oh-planner/SKILL.md +12 -149
package/harness/skills/oh-prd/DEEP.md +45 -0
package/harness/skills/oh-prd/SKILL.md +10 -26
package/harness/skills/oh-refactor/DEEP.md +122 -0
package/harness/skills/oh-refactor/SKILL.md +17 -410
package/harness/skills/oh-retro/DEEP.md +26 -0
package/harness/skills/oh-retro/SKILL.md +12 -24
package/harness/skills/oh-review/DEEP.md +87 -0
package/harness/skills/oh-review/SKILL.md +11 -97
package/harness/skills/oh-security/DEEP.md +83 -0
package/harness/skills/oh-security/SKILL.md +14 -96
package/harness/skills/oh-ship/DEEP.md +141 -0
package/harness/skills/oh-ship/SKILL.md +14 -32
package/harness/skills/oh-skill-craft/DEEP.md +369 -0
package/harness/skills/oh-skill-craft/SKILL.md +13 -177
package/harness/skills/oh-skills-link/DEEP.md +16 -0
package/harness/skills/oh-skills-link/SKILL.md +10 -20
package/harness/skills/oh-skills-list/DEEP.md +20 -0
package/harness/skills/oh-skills-list/SKILL.md +9 -22
package/harness/skills/oh-triage/DEEP.md +23 -0
package/harness/skills/oh-triage/SKILL.md +8 -24
package/harness/skills/oh-worktree/DEEP.md +169 -0
package/harness/skills/oh-worktree/SKILL.md +32 -0
package/lib/harness-resolver.ts +8 -10
package/package.json +7 -5
package/tsconfig.json +1 -1
package/harness/codex/CONSTITUTION.md +0 -73
package/harness/codex/ROUTING.md +0 -92
package/harness/commands/oh-doctor.md +0 -26
package/harness/commands/oh-log.md +0 -18
package/harness/instructions/RUNTIME.md +0 -30
package/harness/skills/oh-caveman/SKILL.md +0 -42
package/harness/skills/oh-learn/SKILL.md +0 -101
package/lib/logger.ts +0 -75

package/harness/lib/recovery/patterns.ts ADDED Viewed

@@ -0,0 +1,149 @@
+// Categorized error patterns with recovery action generators.
+// Each pattern is a RegExp matched against error messages.
+// The first match wins. If none match, the handler escalates.
+import type { ErrorCategory, ErrorContext, RecoveryAction } from "./interfaces.ts";
+export interface ErrorPattern { // One classification rule: a matcher, the category it assigns, and the recovery it proposes.
+  pattern: RegExp; // Matched against the error message; rules are tried in array order and the first match wins.
+  category: ErrorCategory; // Category assigned to errors that match `pattern`.
+  getAction: (ctx: ErrorContext) => RecoveryAction; // Builds the recovery action for the matching error context.
+}
+/**
+ * Default backoff delays (ms) for retries: [initial, second, third]
+ *
+ * The tables are indexed by the zero-based `ctx.attempt`; attempts beyond the
+ * end of a table reuse its last (largest) delay. At every step the rate-limit
+ * delay is twice the network delay.
+ */
+const RATE_LIMIT_BACKOFF = [1_000, 2_000, 4_000] as const;
+const NETWORK_BACKOFF = [500, 1_000, 2_000] as const;
+/**
+ * Picks the delay for a retry attempt from a backoff table.
+ *
+ * The attempt number is truncated to an integer and clamped to the table's
+ * bounds, so negative, fractional or NaN attempts can never index outside the
+ * table and produce an `undefined` delay.
+ *
+ * @param schedule - Delays in milliseconds, ordered from first retry to last.
+ * @param attempt - Zero-based attempt number taken from the error context.
+ * @returns The delay for that attempt; the last entry is reused once the
+ *   attempt number runs past the end of the table.
+ */
+function backoffDelay(schedule: readonly number[], attempt: number): number {
+  const step = Number.isNaN(attempt) ? 0 : Math.trunc(attempt);
+  const index = Math.min(Math.max(step, 0), schedule.length - 1);
+  return schedule[index] ?? 0;
+}
+/**
+ * Ordered classification table: the first entry whose `pattern` matches the
+ * error message decides the category and the recovery action.
+ *
+ * Order matters. Specific patterns come first; the broad gibberish heuristic
+ * is deliberately LAST, because it matches any run of ten non-letter
+ * characters (timestamps, ids, separator lines) and would otherwise steal
+ * errors that belong to a more specific category such as `timeout` or
+ * `lsp_diagnostic`.
+ */
+export const PATTERNS: ErrorPattern[] = [
+  // ── rate_limit ─────────────────────────────────────────────────────
+  {
+    // The lookarounds keep "429" from matching inside longer numbers such as
+    // request ids or ports ("4290", "14291").
+    pattern: /rate.?limit|too.?many.?requests|(?<!\d)429(?!\d)/i,
+    category: "rate_limit",
+    getAction: (ctx: ErrorContext): RecoveryAction => {
+      const delay = backoffDelay(RATE_LIMIT_BACKOFF, ctx.attempt);
+      return {
+        type: "retry",
+        delay,
+        maxAttempts: 3,
+        reason: `Rate limited (attempt ${ctx.attempt + 1}): backing off ${delay}ms`,
+        modifyPrompt: undefined,
+      };
+    },
+  },
+  // ── context_overflow ──────────────────────────────────────────────
+  {
+    pattern: /context.?length|token.?limit|maximum.?context/i,
+    category: "context_overflow",
+    getAction: (): RecoveryAction => ({
+      type: "compact",
+      maxAttempts: 2,
+      reason: "Context overflow detected: compacting before retry",
+      modifyPrompt:
+        "--- COMPACTED: Previous context exceeded token limits. Continue from here, preserving only essential state. ---",
+    }),
+  },
+  // ── network ───────────────────────────────────────────────────────
+  {
+    pattern: /ECONNREFUSED|ETIMEDOUT|network|fetch.?failed/i,
+    category: "network",
+    getAction: (ctx: ErrorContext): RecoveryAction => {
+      const delay = backoffDelay(NETWORK_BACKOFF, ctx.attempt);
+      return {
+        type: "retry",
+        delay,
+        maxAttempts: 3,
+        reason: `Network error (attempt ${ctx.attempt + 1}): retrying in ${delay}ms`,
+      };
+    },
+  },
+  // ── session ───────────────────────────────────────────────────────
+  {
+    pattern: /session.?not.?found|session.?expired/i,
+    category: "session",
+    getAction: (): RecoveryAction => ({
+      type: "abort",
+      reason: "Session not found or expired — cannot recover",
+    }),
+  },
+  // ── tool_error ────────────────────────────────────────────────────
+  {
+    pattern: /tool.?not.?found|unknown.?tool/i,
+    category: "tool_error",
+    getAction: (): RecoveryAction => ({
+      type: "escalate",
+      reason: "Unknown or missing tool — orchestrator must decide",
+    }),
+  },
+  // ── parse_error ───────────────────────────────────────────────────
+  {
+    pattern: /parse.?error|invalid.?json|syntax.?error/i,
+    category: "parse_error",
+    getAction: (ctx: ErrorContext): RecoveryAction => ({
+      type: "retry",
+      delay: 0,
+      maxAttempts: 2,
+      reason: `Parse error on attempt ${ctx.attempt + 1}: retrying without modification`,
+    }),
+  },
+  // ── lsp_diagnostic ────────────────────────────────────────────────
+  {
+    pattern: /lsp.?diagnostic|tsc.?error|eslint.?error/i,
+    category: "lsp_diagnostic",
+    getAction: (): RecoveryAction => ({
+      type: "retry",
+      delay: 0,
+      maxAttempts: 2,
+      reason: "LSP diagnostic error — retrying with diagnostics in context",
+      modifyPrompt:
+        "--- RECOVERY: The following LSP diagnostics were detected in the last attempt. Fix them before continuing. ---",
+    }),
+  },
+  // ── timeout ───────────────────────────────────────────────────────
+  {
+    pattern: /execution.?timed.?out|timeout/i,
+    category: "timeout",
+    getAction: (): RecoveryAction => ({
+      type: "retry",
+      delay: 0,
+      maxAttempts: 2,
+      reason: "Execution timed out — retrying with task breakdown hint",
+      modifyPrompt:
+        "--- RECOVERY: Previous execution timed out. Break the task into smaller steps. ---",
+    }),
+  },
+  // ── gibberish ─────────────────────────────────────────────────────
+  // Broad heuristic on output quality — catches gibberish, keyboard mash,
+  // repeated single characters, and long non-alphabetic sequences.
+  // Keep this entry last: its catch-all alternatives also match ordinary
+  // messages that merely contain a long number or a separator line.
+  {
+    pattern: /gibberish|nonsens|unintelligible|asdfgh|qwerty|xxxxx|sdfsdf|[^a-z\s]{10,}|(.)\1{4,}/i,
+    category: "gibberish",
+    getAction: (): RecoveryAction => ({
+      type: "retry",
+      delay: 0,
+      maxAttempts: 2,
+      reason: "Gibberish output detected — retrying with clean context",
+      modifyPrompt:
+        "--- RECOVERY: Previous response was incoherent. Restart with only essential instructions. ---",
+    }),
+  },
+];
+/**
+ * Fallback recovery action used when no pattern matches the error.
+ *
+ * @param ctx - Context of the failed call; only `ctx.error.message` is read.
+ * @returns An "escalate" action whose reason quotes the original error message.
+ */
+export function escalateAction(ctx: ErrorContext): RecoveryAction {
+  const { message } = ctx.error;
+  const fallback: RecoveryAction = {
+    type: "escalate",
+    reason: `Unrecognized error "${message}" — escalating to orchestrator`,
+  };
+  return fallback;
+}

package/harness/lib/recovery/recovery.test.ts ADDED Viewed

@@ -0,0 +1,312 @@
+import { describe, it, before, after } from "node:test";
+import assert from "node:assert/strict";
+import { RecoveryHandler } from "./handler.ts";
+import type { ErrorContext, RecoveryAction } from "./interfaces.ts";
+/**
+ * Test helper: builds an ErrorContext around a fresh Error carrying `message`,
+ * timestamped with the current time.
+ *
+ * @param sessionId - Session the error is attributed to.
+ * @param message - Text of the Error to wrap.
+ * @param attempt - Zero-based attempt number (defaults to 0).
+ * @param agent - Optional agent name; left undefined when omitted.
+ */
+function ctx(
+  sessionId: string,
+  message: string,
+  attempt = 0,
+  agent?: string,
+): ErrorContext {
+  const error = new Error(message);
+  const timestamp = Date.now();
+  return { sessionId, error, attempt, timestamp, agent };
+}
+/**
+ * Test helper: asserts that `action` has the expected type and, when a
+ * substring is supplied, that its reason contains it (case-insensitively).
+ * An omitted or empty `reasonSubstring` skips the reason check.
+ */
+function assertAction(
+  action: RecoveryAction,
+  type: string,
+  reasonSubstring?: string,
+): void {
+  assert.equal(action.type, type, `expected type ${type}, got ${action.type}`);
+  if (!reasonSubstring) {
+    return;
+  }
+  const haystack = action.reason.toLowerCase();
+  const needle = reasonSubstring.toLowerCase();
+  assert.ok(
+    haystack.includes(needle),
+    `expected reason to include "${reasonSubstring}", got "${action.reason}"`,
+  );
+}
+// ── Pattern classification: one test per error category, the escalate fallback, and stats/history/session bookkeeping ──
+describe("RecoveryHandler — pattern classification", () => {
+  let handler: RecoveryHandler;
+  before(() => { // runs once for the whole suite, not before each test
+    handler = RecoveryHandler.getInstance();
+    handler.reset();
+  });
+  after(() => { // leave the handler clean for whatever runs next
+    handler.reset();
+  });
+  // ── 9 category tests ─────────────────────────────────────────────
+  it("classifies rate_limit errors → retry with backoff", () => {
+    const action = handler.handleError(ctx("s1", "rate limit exceeded", 0));
+    assertAction(action, "retry", "rate");
+    assert.ok(action.delay! >= 1_000, `expected delay >= 1000, got ${action.delay}`);
+    // Second attempt gets longer backoff
+    const action2 = handler.handleError(ctx("s1", "429 Too Many Requests", 1));
+    assertAction(action2, "retry", "rate");
+    assert.ok(action2.delay! >= 2_000, `expected delay >= 2000, got ${action2.delay}`);
+  });
+  it("classifies context_overflow errors → compact", () => {
+    const action = handler.handleError(ctx("s1", "context length exceeded", 0));
+    assertAction(action, "compact", "context");
+    assert.ok(action.modifyPrompt, "compact action should include modifyPrompt");
+  });
+  it("classifies network errors → retry with backoff", () => {
+    const action = handler.handleError(ctx("s1", "ECONNREFUSED", 0));
+    assertAction(action, "retry", "network");
+    assert.ok(action.delay! >= 500, `expected delay >= 500, got ${action.delay}`);
+    const action2 = handler.handleError(ctx("s1", "fetch failed", 1));
+    assertAction(action2, "retry", "network");
+  });
+  it("classifies session errors → abort", () => {
+    const action = handler.handleError(ctx("s1", "session not found", 0));
+    assertAction(action, "abort", "session");
+  });
+  it("classifies tool_error → escalate", () => {
+    const action = handler.handleError(ctx("s1", "unknown tool: foo", 0));
+    assertAction(action, "escalate", "tool");
+  });
+  it("classifies parse_error → retry (max 2)", () => {
+    const action = handler.handleError(ctx("s1", "parse error at line 42", 0));
+    assertAction(action, "retry", "parse");
+    assert.equal(action.maxAttempts, 2);
+  });
+  it("classifies gibberish (explicit) → retry with clean context", () => {
+    // The gibberish pattern matches the literal words "gibberish" and "nonsens",
+    // keyboard mash, and other low-quality output markers in error messages.
+    const action = handler.handleError(ctx("s1", "gibberish output detected", 0));
+    assertAction(action, "retry", "gibberish");
+    assert.ok(action.modifyPrompt, "gibberish action should include modifyPrompt");
+  });
+  it("classifies lsp_diagnostic → retry with diagnostic prompt", () => {
+    const action = handler.handleError(ctx("s1", "tsc error: Type 'X' not assignable", 0));
+    assertAction(action, "retry", "lsp");
+    assert.ok(action.modifyPrompt, "lsp action should include modifyPrompt");
+  });
+  it("classifies timeout → retry with breakdown hint", () => {
+    const action = handler.handleError(ctx("s1", "execution timed out", 0));
+    assertAction(action, "retry", "timed out");
+    assert.ok(action.modifyPrompt, "timeout action should include modifyPrompt");
+    assert.equal(action.maxAttempts, 2);
+  });
+  // ── Unknown error → escalate ──────────────────────────────────────
+  it("unknown error pattern → escalate", () => {
+    const action = handler.handleError(ctx("s1", "some weird error nobody expected", 0));
+    assertAction(action, "escalate", "unrecognized");
+  });
+  // ── Stats tracking ────────────────────────────────────────────────
+  it("getStats() reflects classified errors", () => {
+    handler.reset(); // start from empty stats so the counts below are exact
+    handler.handleError(ctx("s1", "rate limit", 0));
+    handler.handleError(ctx("s1", "ECONNREFUSED", 0));
+    handler.handleError(ctx("s1", "context length", 0));
+    handler.handleError(ctx("s1", "session not found", 0));
+    handler.handleError(ctx("s1", "unknown tool", 0));
+    handler.handleError(ctx("s1", "parse error", 0));
+    const stats = handler.getStats();
+    assert.equal(stats.totalRecoveries, 6);
+    assert.equal(stats.byCategory.rate_limit, 1);
+    assert.equal(stats.byCategory.network, 1);
+    assert.equal(stats.byCategory.context_overflow, 1);
+    assert.equal(stats.byCategory.session, 1);
+    assert.equal(stats.byCategory.tool_error, 1);
+    assert.equal(stats.byCategory.parse_error, 1);
+    // Categories that received no errors in this test should be 0
+    assert.equal(stats.byCategory.gibberish, 0);
+    assert.equal(stats.byCategory.lsp_diagnostic, 0);
+    assert.equal(stats.byCategory.timeout, 0);
+  });
+  it("getStats() tracks action types", () => {
+    handler.reset();
+    handler.handleError(ctx("s1", "rate limit", 0));       // retry
+    handler.handleError(ctx("s1", "session expired", 0));  // abort
+    handler.handleError(ctx("s1", "unknown tool", 0));     // escalate
+    handler.handleError(ctx("s1", "context length", 0));   // compact
+    const stats = handler.getStats();
+    assert.equal(stats.byAction.retry, 1);
+    assert.equal(stats.byAction.abort, 1);
+    assert.equal(stats.byAction.escalate, 1);
+    assert.equal(stats.byAction.compact, 1);
+  });
+  // ── getHistory ──────────────────────────────────────────────────
+  it("getHistory() returns records most recent first", () => {
+    handler.reset();
+    handler.handleError(ctx("s2", "rate limit", 0));
+    handler.handleError(ctx("s2", "timeout", 0));
+    const history = handler.getHistory();
+    assert.equal(history.length, 2);
+    assert.ok(history[0].timestamp >= history[1].timestamp); // non-strict comparison: equal timestamps also pass
+  });
+  it("getHistory(limit) respects limit", () => {
+    handler.reset();
+    handler.handleError(ctx("s3", "rate limit", 0));
+    handler.handleError(ctx("s3", "timeout", 0));
+    handler.handleError(ctx("s3", "ECONNREFUSED", 0));
+    const limited = handler.getHistory(2);
+    assert.equal(limited.length, 2);
+  });
+  // ── clearSession ────────────────────────────────────────────────
+  it("clearSession() removes records for a session", () => {
+    handler.reset();
+    handler.handleError(ctx("s_a", "rate limit", 0));
+    handler.handleError(ctx("s_b", "timeout", 0));
+    handler.handleError(ctx("s_a", "ECONNREFUSED", 0));
+    assert.equal(handler.getHistory().length, 3);
+    handler.clearSession("s_a"); // drops both s_a records, leaving only the s_b one
+    const remaining = handler.getHistory();
+    assert.equal(remaining.length, 1);
+    assert.equal(remaining[0].context.sessionId, "s_b");
+  });
+});
+// ── withRecovery integration: first-try success, retry, abort/escalate rethrow, and attempt limits ──
+describe("RecoveryHandler — withRecovery", () => {
+  let handler: RecoveryHandler;
+  before(() => { // runs once for the whole suite, not before each test
+    handler = RecoveryHandler.getInstance();
+    handler.reset();
+  });
+  after(() => {
+    handler.reset();
+  });
+  it("succeeds on first attempt", async () => {
+    const result = await handler.withRecovery("wr1", async () => "hello");
+    assert.equal(result, "hello");
+  });
+  it("retries on retryable error then succeeds", async () => {
+    handler.reset();
+    let callCount = 0;
+    const result = await handler.withRecovery("wr2", async () => {
+      callCount++;
+      if (callCount === 1) throw new Error("parse error: invalid json"); // fail only the first call
+      return "ok-after-retry";
+    });
+    assert.equal(result, "ok-after-retry");
+    assert.equal(callCount, 2);
+  });
+  it("throws on abort action", async () => {
+    handler.reset();
+    await assert.rejects(
+      handler.withRecovery("wr3", async () => {
+        throw new Error("session not found");
+      }),
+      /session not found/,
+    );
+  });
+  it("throws on escalate action", async () => {
+    handler.reset();
+    await assert.rejects(
+      handler.withRecovery("wr4", async () => {
+        throw new Error("unknown tool: foo");
+      }),
+      /unknown tool/,
+    );
+  });
+  it("respects category maxAttempts and then throws", async () => {
+    handler.reset();
+    await assert.rejects(
+      handler.withRecovery("wr5", async () => {
+        throw new Error("parse error: bad json"); // fails on every attempt
+      }),
+      /parse error/,
+    );
+  });
+  it("respects global maxAttempts option", async () => {
+    handler.reset();
+    let callCount = 0;
+    // An unrecognized error would escalate (and throw) on the first try no matter what the limit is,
+    // so use a timeout error instead: its category allows maxAttempts=2, and the global option caps that at 1.
+    await assert.rejects(
+      handler.withRecovery(
+        "wr6",
+        async () => {
+          callCount++;
+          throw new Error("execution timed out");
+        },
+        { maxAttempts: 1 },
+      ),
+    );
+    // With maxAttempts=1, it should only be called once
+    assert.equal(callCount, 1);
+  });
+  it("tracks success and failure in stats", async () => {
+    handler.reset();
+    // One success
+    await handler.withRecovery("wr7", async () => "good");
+    // One abort (failure)
+    await assert.rejects(
+      handler.withRecovery("wr7", async () => {
+        throw new Error("session expired");
+      }),
+    );
+    const stats = handler.getStats();
+    assert.ok(stats.successRate > 0); // mixed outcome: rate must be strictly between 0 and 1
+    assert.ok(stats.successRate < 1);
+  });
+});

package/harness/lib/sanity/anomaly-tracker.ts ADDED Viewed

@@ -0,0 +1,127 @@
+// ---------------------------------------------------------------------------
+// AnomalyTracker — singleton that tracks consecutive anomaly records per session
+// ---------------------------------------------------------------------------
+import type { AnomalyRecord, AnomalyTrackerConfig, SanityResult } from "./interfaces.ts";
+const DEFAULT_CONFIG: AnomalyTrackerConfig = { // Defaults for any field the caller does not override.
+  maxConsecutiveAnomalies: 2, // Escalate once a session reaches this many unhealthy results in a row.
+  escalationMessage: "recovery: compact context", // Returned as `recoveryMessage` when escalation triggers.
+};
+/**
+ * Process-wide singleton that counts consecutive unhealthy sanity results per
+ * session and separately detects the same output text being produced over
+ * and over.
+ *
+ * The per-session counters are keyed by session id. The repeated-output
+ * detector is NOT keyed by session: it compares each text with the previous
+ * text passed to `trackOutput`, whichever caller supplied it.
+ */
+export class AnomalyTracker {
+  private static instance: AnomalyTracker;
+  /** Consecutive-anomaly record per session id. */
+  private records = new Map<string, AnomalyRecord>();
+  private config: AnomalyTrackerConfig;
+  // ── Cross-invocation identical output detection ────────────────
+  /** Text most recently passed to `trackOutput`, or null before the first call. */
+  private lastOutput: string | null = null;
+  /** Number of times in a row the output has repeated `lastOutput`. */
+  private identicalOutputCount = 0;
+  /** Repeat count at which `trackOutput` starts flagging output as degenerate. */
+  readonly MAX_IDENTICAL_OUTPUTS = 3;
+  private constructor(config?: Partial<AnomalyTrackerConfig>) {
+    this.config = { ...DEFAULT_CONFIG, ...config };
+  }
+  /**
+   * Get the singleton instance.
+   *
+   * `config` is only honoured by the call that creates the instance; later
+   * calls return the existing instance and ignore it. Use `setConfig` to
+   * change settings afterwards.
+   */
+  static getInstance(config?: Partial<AnomalyTrackerConfig>): AnomalyTracker {
+    if (!AnomalyTracker.instance) {
+      AnomalyTracker.instance = new AnomalyTracker(config);
+    }
+    return AnomalyTracker.instance;
+  }
+  /**
+   * Record a sanity result for a session.
+   * If unhealthy: increments consecutive count, updates reason/timestamp.
+   * If healthy: resets consecutive count to 0.
+   * Returns tracking info including whether escalation is needed.
+   *
+   * @param sessionId - Session the result belongs to.
+   * @param result - Sanity verdict; `result.reason` is stored when unhealthy.
+   * @returns `shouldEscalate` is true once the consecutive count reaches
+   *   `maxConsecutiveAnomalies`; `recoveryMessage` is set only in that case.
+   */
+  record(
+    sessionId: string,
+    result: SanityResult,
+  ): {
+    shouldEscalate: boolean;
+    consecutiveAnomalies: number;
+    recoveryMessage?: string;
+  } {
+    const existing = this.records.get(sessionId);
+    if (!result.isHealthy) {
+      const count = (existing?.count ?? 0) + 1;
+      this.records.set(sessionId, {
+        sessionId,
+        count,
+        lastReason: result.reason ?? "Unknown anomaly",
+        lastTimestamp: Date.now(),
+      });
+      const shouldEscalate = count >= this.config.maxConsecutiveAnomalies;
+      return {
+        shouldEscalate,
+        consecutiveAnomalies: count,
+        recoveryMessage: shouldEscalate ? this.config.escalationMessage : undefined,
+      };
+    }
+    // Healthy output — reset counter. A session that never had an anomaly
+    // gets no record at all.
+    if (existing) {
+      this.records.set(sessionId, {
+        ...existing,
+        count: 0,
+        lastReason: "reset on healthy output",
+        lastTimestamp: Date.now(),
+      });
+    }
+    return {
+      shouldEscalate: false,
+      consecutiveAnomalies: 0,
+    };
+  }
+  /** Get the current anomaly record for a session. */
+  getRecord(sessionId: string): AnomalyRecord | undefined {
+    return this.records.get(sessionId);
+  }
+  /**
+   * Clear anomaly record for a specific session.
+   * The repeated-output detector is not per-session and is left untouched.
+   */
+  clearSession(sessionId: string): void {
+    this.records.delete(sessionId);
+  }
+  /**
+   * Reset all tracking state (useful in tests).
+   *
+   * Clears the per-session records AND the repeated-output detector, so state
+   * left by earlier `trackOutput` calls on this singleton cannot leak into
+   * whatever runs after the reset. Configuration is not changed.
+   */
+  resetAll(): void {
+    this.records.clear();
+    this.lastOutput = null;
+    this.identicalOutputCount = 0;
+  }
+  /** Get a copy of the current config. */
+  getConfig(): AnomalyTrackerConfig {
+    return { ...this.config };
+  }
+  /** Update config at runtime; fields not supplied keep their current value. */
+  setConfig(config: Partial<AnomalyTrackerConfig>): void {
+    this.config = { ...this.config, ...config };
+  }
+  /**
+   * Track output for repeated identical content.
+   * Returns true if output should be flagged as degenerate.
+   *
+   * Only repeats are counted, so the first flag is raised on the fourth
+   * identical output in a row (the original plus MAX_IDENTICAL_OUTPUTS
+   * repeats). Any different text resets the count.
+   */
+  trackOutput(text: string): boolean {
+    if (text === this.lastOutput) {
+      this.identicalOutputCount++;
+      if (this.identicalOutputCount >= this.MAX_IDENTICAL_OUTPUTS) {
+        return true; // Flagged — repeated identical output
+      }
+    } else {
+      this.identicalOutputCount = 0;
+    }
+    this.lastOutput = text;
+    return false;
+  }
+}