npm - @rosh100yx/outlier - Versions diffs - 0.4.25 → 0.10.2 - Mend

@rosh100yx/outlier 0.4.25 → 0.10.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12) hide show

package/src/insights.ts ADDED Viewed

@@ -0,0 +1,109 @@
+// Insight rules engine — turns the raw metrics into meaning + one action.
+//
+// The numbers (75% AI, $63, blast radius HIGH) are data. Insights are what they MEAN
+// together: high AI authorship is only alarming if your agents can also deploy; a low
+// AI% next to heavy token use usually means missing trailers, not human authorship.
+// Each rule combines signals and returns a plain message + a concrete next step.
+import type { AuthorshipStats } from './git';
+import type { CarbonStats } from './carbon';
+import type { CapabilitiesStats } from './capabilities';
+// Urgency of an insight. The members are written from most to least alarming.
+export type Severity =
+  | 'critical'
+  | 'warn'
+  | 'info'
+  | 'good';
+// One finding: what the combined signals mean, plus a single concrete next step.
+export interface Insight {
+  // How urgent the finding is.
+  severity: Severity;
+  // Short headline.
+  title: string;
+  // One plain sentence of why.
+  detail: string;
+  // The one thing to do.
+  action: string;
+}
+// Sort key for the returned list: a lower rank is listed first.
+const RANK: Record<Severity, number> = { critical: 0, warn: 1, info: 2, good: 3 };
+// Inputs to deriveInsights. Any of the three stats objects may be null; rules that need a
+// missing input are simply skipped.
+export interface InsightInput {
+  authorship: AuthorshipStats | null;
+  carbon: CarbonStats | null;
+  caps: CapabilitiesStats | null;
+  policyCap?: number; // 0..1, default 0.70
+}
+// Runs every rule against the supplied metrics and returns the resulting insights sorted by
+// severity (critical, warn, info, good). The list is never empty: when no rule fires, a
+// single 'good' insight is returned instead.
+//
+// Rules 1 and 2 are mutually exclusive (1 is the compound form of 2); rules 3-6 are
+// evaluated independently, so one input can produce several insights.
+export function deriveInsights({ authorship, carbon, caps, policyCap = 0.70 }: InsightInput): Insight[] {
+  const out: Insight[] = [];
+  // A non-finite ratio (such as NaN) fails every comparison below and would end up printed
+  // as "NaN%" in the fallback message, so it is treated like missing authorship data.
+  const ai = authorship && Number.isFinite(authorship.ratio) ? authorship.ratio : null;
+  // Share of all tokens that were cache reads; null when there is no token total to divide by.
+  const cachePct = carbon && carbon.totalTokens ? (carbon.cacheReadTokens / carbon.totalTokens) * 100 : null;
+  const blast = caps ? caps.blastRadius : null;
+  // Number of MCP entries whose reach is one of the write/exec/deploy/money kinds.
+  const writeOrDeploy = caps ? caps.mcps.filter(m => ['money', 'exec', 'deploy', 'write-remote', 'write-local'].includes(m.reach)).length : 0;
+  const heavyTokens = carbon ? carbon.totalTokens > 1_000_000 : false;
+  // 1. The compound one: high reliance AND high reach = you may not own code that can ship.
+  if (ai !== null && ai > 0.7 && (blast === 'HIGH' || blast === 'CRITICAL')) {
+    out.push({
+      severity: 'critical',
+      title: 'High reliance + high reach',
+      detail: `AI wrote ${(ai * 100).toFixed(0)}% here and your agents can ${writeOrDeploy ? 'write/deploy' : 'reach external services'}. You may not own code that can ship to prod.`,
+      action: 'Review the core paths yourself before delegating more this session.',
+    });
+  } else if (ai !== null && ai > 0.7) {
+    // 2. High reliance alone.
+    out.push({
+      severity: 'warn',
+      title: 'You are mostly reviewing, not writing',
+      detail: `AI wrote ${(ai * 100).toFixed(0)}% of recent commits — you risk losing the skill to debug it unaided.`,
+      action: 'Read the AI-written code through, or hand-write the next core change.',
+    });
+  }
+  // 3. Honesty rule: low AI% next to heavy token use = missing trailers, not human authorship.
+  if (ai !== null && ai < 0.1 && heavyTokens) {
+    out.push({
+      severity: 'info',
+      title: 'Low AI% may be misleading',
+      detail: 'Heavy token use but few AI-tagged commits — your agent probably is not writing Co-Authored-By trailers.',
+      action: 'Treat the authorship number as a floor, not the truth, until trailers are on.',
+    });
+  }
+  // 4. Reach / blast radius, independent of authorship.
+  if (caps && (blast === 'CRITICAL' || blast === 'HIGH')) {
+    out.push({
+      severity: blast === 'CRITICAL' ? 'critical' : 'warn',
+      title: `Blast radius ${blast}`,
+      // At most the first two reasons are quoted; with none, a generic phrase is used.
+      detail: `If an agent (or a prompt injection) drives your tools, it ${caps.blastReasons.slice(0, 2).join(' and ') || 'has broad reach'}.`,
+      action: 'Disable the write/deploy MCP tools you do not need this session.',
+    });
+  }
+  // 5. Cache waste = where the money goes.
+  if (cachePct !== null && cachePct > 80) {
+    out.push({
+      severity: 'warn',
+      title: 'Most of your spend is re-sent context',
+      detail: `${cachePct.toFixed(0)}% of your tokens just re-read old context — that is most of the bill, not new work.`,
+      action: 'Start fresh sessions for new tasks; keep context tight.',
+    });
+  }
+  // 6. Over the policy limit.
+  if (ai !== null && ai > policyCap) {
+    out.push({
+      severity: 'warn',
+      title: 'Over your AI-authorship limit',
+      detail: `AI authorship is ${(ai * 100).toFixed(0)}%, over your ${(policyCap * 100).toFixed(0)}% limit.`,
+      action: 'Either raise the cap deliberately, or write the next change yourself.',
+    });
+  }
+  // 7. Nothing wrong — say so (don't manufacture alarm).
+  if (out.length === 0) {
+    let detail = 'No AI logs or git history found to flag.';
+    if (ai !== null) {
+      // Only claim "you wrote most of this" when the human share really is above half. An AI
+      // share from 50% up to the thresholds above is unflagged, but it is not mostly human.
+      detail = ai < 0.5
+        ? `You wrote most of this (${(100 - ai * 100).toFixed(0)}%) and your agents have limited reach.`
+        : `AI wrote ${(ai * 100).toFixed(0)}% of recent commits, which is within your limit, and nothing else was flagged.`;
+    }
+    out.push({
+      severity: 'good',
+      title: 'Low risk',
+      detail,
+      action: 'Carry on — re-run before your next big delegation.',
+    });
+  }
+  // `out` is local to this call, so sorting it in place does not affect any caller data.
+  return out.sort((a, b) => RANK[a.severity] - RANK[b.severity]);
+}

package/src/sources.ts ADDED Viewed

@@ -0,0 +1,110 @@
+// Source Detector — the foundation for being tool-agnostic.
+//
+// outlier reads whatever AI telemetry the developer's tools already leave on disk, then
+// uses the richest source per metric and labels its provenance. This keeps us local-first
+// (we never call a tool's API — we read the local trace it writes) and lets us add new
+// tools without changing the receipt.
+//
+// Provenance ladder (per metric): MEASURED > ESTIMATED > PROXY > NONE.
+import { homedir } from 'os';
+import { join } from 'path';
+import { existsSync } from 'fs';
+import { execSync } from 'child_process';
+// How a metric's value was obtained.
+export type Provenance =
+  | 'measured'
+  | 'estimated'
+  | 'proxy'
+  | 'none';
+// Result of fingerprinting the machine: the tools found, and the chosen source per metric.
+export interface DetectedSources {
+  // tools/CLIs found on this machine
+  tools: string[];
+  // Chosen source for token/cost figures.
+  tokenSource: {
+    name: string;
+    provenance: Provenance;
+  };
+  // Chosen source for carbon figures.
+  carbonSource: {
+    name: string;
+    provenance: Provenance;
+  };
+  // Chosen source for agent capability data.
+  capabilitySource: {
+    name: string;
+    provenance: Provenance;
+  };
+}
+// Home directory of the current user, looked up once when the module loads.
+const HOME: string = homedir();
+// Reports whether `cmd` resolves to an executable file on PATH, without running it.
+//
+// Returns false when the name is not a plain command name, when the lookup fails, or when
+// the shell resolves the name to something that is not a file on disk.
+function hasCli(cmd: string): boolean {
+  // The name is interpolated into a shell command line below, so accept only plain command
+  // names: no whitespace, no shell metacharacters, and no leading '-' (option-like).
+  if (!/^[A-Za-z0-9][A-Za-z0-9._+-]*$/.test(cmd)) return false;
+  try {
+    // `command -v` is POSIX and does not execute the target.
+    const resolved = execSync(`command -v ${cmd}`, {
+      encoding: 'utf8',
+      stdio: ['ignore', 'pipe', 'ignore'],
+    });
+    // `command -v` also exits 0 for shell builtins, reserved words, functions and aliases
+    // (e.g. `continue`), printing a bare name or an alias definition. Only a utility found
+    // through PATH is printed as an absolute pathname, so that is the only output accepted.
+    return resolved.trim().startsWith('/');
+  } catch {
+    // Non-zero exit (not found) or no usable shell: report the CLI as absent.
+    return false;
+  }
+}
+// True when `p` exists on disk. If the existence check itself throws, the answer is false.
+function hasPath(p: string): boolean {
+  let found = false;
+  try {
+    found = existsSync(p);
+  } catch {
+    // Keep the default: a failed check counts as "not there".
+  }
+  return found;
+}
+// Fingerprints the local environment using existence checks only (CLI on PATH, file or
+// directory present); no file contents are read. `cwd` defaults to the process's current
+// working directory. Returns the tools found plus the chosen source for each metric.
+export function detectSources(cwd: string = process.cwd()): DetectedSources {
+  // Insertion-ordered and duplicate-free: a tool seen both as a CLI and as a config entry is
+  // listed once, at the position where it was first seen.
+  const found = new Set<string>();
+  // AI coding agents: first by CLI on PATH...
+  const agentClis = ['claude', 'cursor', 'aider', 'gemini', 'opencode', 'cody', 'continue', 'codex'];
+  agentClis.filter((cli) => hasCli(cli)).forEach((cli) => found.add(cli));
+  // ...then by a config entry under the home directory.
+  const agentConfigs: Array<[string, string]> = [
+    ['claude', '.claude'],
+    ['cursor', '.cursor'],
+    ['gemini', '.gemini'],
+    ['codeium', '.codeium'],
+    ['continue', '.continue'],
+    ['aider', '.aider.conf.yml'],
+  ];
+  for (const [tool, entry] of agentConfigs) {
+    if (hasPath(join(HOME, entry))) found.add(tool);
+  }
+  // Carbon/cost tooling that writes local data we can trust.
+  for (const cli of ['codecarbon', 'ccusage']) {
+    if (hasCli(cli)) found.add(cli);
+  }
+  const tools = Array.from(found);
+  // ---- Token / cost source (richest first) ----
+  // The per-project directory name is the working directory with every '/' turned into '-'.
+  const projectSlug = cwd.split('/').join('-');
+  const pickTokenSource = (): DetectedSources['tokenSource'] => {
+    // Custom Stop hook log: carries a real cost_usd field -> measured cost.
+    if (hasPath(join(HOME, '.claude', 'tokenomics-log.jsonl'))) {
+      return { name: 'caveman tokenomics log', provenance: 'measured' };
+    }
+    // Standard transcripts: real tokens, estimated cost.
+    if (hasPath(join(HOME, '.claude', 'projects', projectSlug))) {
+      return { name: 'Claude Code transcripts', provenance: 'estimated' };
+    }
+    if (found.has('ccusage')) {
+      return { name: 'ccusage', provenance: 'estimated' };
+    }
+    return { name: 'none', provenance: 'none' };
+  };
+  const tokenSource = pickTokenSource();
+  // ---- Carbon source ----
+  // The baseline is the bundled offline model+grid ESTIMATE. "Measured" is claimed only when
+  // an emissions.csv actually exists (in the project or under ~/.codecarbon), never merely
+  // because the CodeCarbon CLI is installed. The parser for that file is wired in a later pass.
+  const emissionsFiles = [
+    join(cwd, 'emissions.csv'),
+    join(HOME, '.codecarbon', 'emissions.csv'),
+  ];
+  const pickCarbonSource = (): DetectedSources['carbonSource'] => {
+    if (emissionsFiles.some((file) => hasPath(file))) {
+      return { name: 'CodeCarbon emissions.csv', provenance: 'measured' };
+    }
+    // Without any token source there is nothing to base an estimate on.
+    if (tokenSource.provenance === 'none') {
+      return { name: 'none', provenance: 'none' };
+    }
+    return { name: 'model+grid estimate', provenance: 'estimated' };
+  };
+  const carbonSource = pickCarbonSource();
+  // ---- Capability source ----
+  const capabilityFiles = [
+    join(HOME, '.claude', 'settings.json'),
+    join(cwd, 'AGENTS.md'),
+    join(cwd, '.mcp.json'),
+  ];
+  const capabilitySource: DetectedSources['capabilitySource'] = capabilityFiles.some((file) => hasPath(file))
+    ? { name: 'local config (settings/AGENTS/MCP)', provenance: 'measured' }
+    : { name: 'none', provenance: 'none' };
+  return { tools, tokenSource, carbonSource, capabilitySource };
+}
+// Receipt label for a source: "<provenance> · <name>", e.g. "measured · caveman tokenomics
+// log". A source whose provenance is 'none' always reads "no local data".
+export function provLabel(s: { name: string; provenance: Provenance }): string {
+  const { name, provenance } = s;
+  return provenance === 'none' ? 'no local data' : `${provenance} · ${name}`;
+}