npm - harness-evolver - Versions diffs - 0.5.0 → 0.6.0 - Mend

harness-evolver 0.5.0 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/LICENSE +1 -1
package/agents/harness-evolver-proposer.md +2 -0
package/bin/install.js +98 -83
package/examples/classifier/harness.py +1 -1
package/package.json +2 -2
package/skills/compare/SKILL.md +1 -1
package/skills/deploy/SKILL.md +1 -1
package/skills/diagnose/SKILL.md +1 -1
package/skills/evolve/SKILL.md +1 -1
package/skills/init/SKILL.md +1 -1
package/skills/status/SKILL.md +1 -1
package/tools/init.py +34 -0

package/LICENSE CHANGED Viewed

@@ -1,6 +1,6 @@
 MIT License
-Copyright (c) 2026 Raphael Valdetaro Christi Cordeiro
+Copyright (c) 2026 Raphael Valdetaro
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal

package/agents/harness-evolver-proposer.md CHANGED Viewed

@@ -106,6 +106,8 @@ Append a summary to `PROPOSER_HISTORY.md`.
 6. **Prefer readable harnesses over defensive ones.** If the harness has grown past 2x the baseline size without proportional score improvement, consider simplifying. Accumulated try/catch blocks, redundant fallbacks, and growing if-chains are a code smell in evolved harnesses.
+7. **Use available API keys from environment.** Check `config.json` field `api_keys` to see which LLM APIs are available (Anthropic, OpenAI, Gemini, OpenRouter, etc.). Always read keys via `os.environ.get("KEY_NAME")` — never hardcode values. If an evolution strategy requires an API that isn't available, note it in `proposal.md` and choose an alternative.
 ## Documentation Lookup (if Context7 available)
 - Read `config.json` field `stack.detected` to see which libraries the harness uses.

package/bin/install.js CHANGED Viewed

@@ -1,7 +1,7 @@
 #!/usr/bin/env node
 /**
  * Harness Evolver installer.
- * Interactive setup with runtime selection, global/local choice.
+ * Copies plugin to Claude Code plugin cache and registers it.
  *
  * Usage: npx harness-evolver@latest
  */
@@ -15,8 +15,8 @@ const VERSION = require("../package.json").version;
 const PLUGIN_ROOT = path.resolve(__dirname, "..");
 const HOME = process.env.HOME || process.env.USERPROFILE;
-// ANSI colors
-const CYAN = "\x1b[36m";
+const MAGENTA = "\x1b[35m";
+const BRIGHT_MAGENTA = "\x1b[95m";
 const GREEN = "\x1b[32m";
 const YELLOW = "\x1b[33m";
 const RED = "\x1b[31m";
@@ -25,13 +25,13 @@ const BOLD = "\x1b[1m";
 const RESET = "\x1b[0m";
 const LOGO = `
-${CYAN}  ██╗  ██╗ █████╗ ██████╗ ███╗   ██╗███████╗███████╗███████╗
+${BRIGHT_MAGENTA}  ██╗  ██╗ █████╗ ██████╗ ███╗   ██╗███████╗███████╗███████╗
   ██║  ██║██╔══██╗██╔══██╗████╗  ██║██╔════╝██╔════╝██╔════╝
   ███████║███████║██████╔╝██╔██╗ ██║█████╗  ███████╗███████╗
   ██╔══██║██╔══██║██╔══██╗██║╚██╗██║██╔══╝  ╚════██║╚════██║
   ██║  ██║██║  ██║██║  ██║██║ ╚████║███████╗███████║███████║
   ╚═╝  ╚═╝╚═╝  ╚═╝╚═╝  ╚═╝╚═╝  ╚═══╝╚══════╝╚══════╝╚══════╝
-  ${BOLD}███████╗██╗   ██╗ ██████╗ ██╗    ██╗   ██╗███████╗██████╗
+  ${MAGENTA}${BOLD}███████╗██╗   ██╗ ██████╗ ██╗    ██╗   ██╗███████╗██████╗
   ██╔════╝██║   ██║██╔═══██╗██║    ██║   ██║██╔════╝██╔══██╗
   █████╗  ██║   ██║██║   ██║██║    ██║   ██║█████╗  ██████╔╝
   ██╔══╝  ╚██╗ ██╔╝██║   ██║██║    ╚██╗ ██╔╝██╔══╝  ██╔══██╗
@@ -39,13 +39,6 @@ ${CYAN}  ██╗  ██╗ █████╗ ██████╗ ███
   ╚══════╝  ╚═══╝   ╚═════╝ ╚══════╝ ╚═══╝  ╚══════╝╚═╝  ╚═╝${RESET}
 `;
-const RUNTIMES = [
-  { name: "Claude Code", dir: ".claude", detected: () => fs.existsSync(path.join(HOME, ".claude")) },
-  { name: "Cursor", dir: ".cursor", detected: () => fs.existsSync(path.join(HOME, ".cursor")) },
-  { name: "Codex", dir: ".codex", detected: () => fs.existsSync(path.join(HOME, ".codex")) },
-  { name: "Windsurf", dir: ".windsurf", detected: () => fs.existsSync(path.join(HOME, ".windsurf")) },
-];
 function ask(rl, question) {
   return new Promise((resolve) => rl.question(question, resolve));
 }
@@ -56,6 +49,7 @@ function copyDir(src, dest) {
     const srcPath = path.join(src, entry.name);
     const destPath = path.join(dest, entry.name);
     if (entry.isDirectory()) {
+      if (entry.name === "node_modules" || entry.name === ".git" || entry.name === "__pycache__" || entry.name === "tests" || entry.name === "docs") continue;
       copyDir(srcPath, destPath);
     } else {
       fs.copyFileSync(srcPath, destPath);
@@ -63,11 +57,6 @@ function copyDir(src, dest) {
   }
 }
-function copyFile(src, dest) {
-  fs.mkdirSync(path.dirname(dest), { recursive: true });
-  fs.copyFileSync(src, dest);
-}
 function checkPython() {
   try {
     execSync("python3 --version", { stdio: "pipe" });
@@ -77,47 +66,80 @@ function checkPython() {
   }
 }
-function installForRuntime(runtimeDir, scope) {
+function readJSON(filepath) {
+  try {
+    return JSON.parse(fs.readFileSync(filepath, "utf8"));
+  } catch {
+    return null;
+  }
+}
+function writeJSON(filepath, data) {
+  fs.mkdirSync(path.dirname(filepath), { recursive: true });
+  fs.writeFileSync(filepath, JSON.stringify(data, null, 2) + "\n");
+}
+function installPlugin(runtimeDir, scope) {
   const baseDir = scope === "local"
     ? path.join(process.cwd(), runtimeDir)
     : path.join(HOME, runtimeDir);
-  const commandsDir = path.join(baseDir, "commands", "harness-evolver");
-  const agentsDir = path.join(baseDir, "agents");
-  // Skills
-  const skillsSource = path.join(PLUGIN_ROOT, "skills");
-  if (fs.existsSync(skillsSource)) {
-    for (const skill of fs.readdirSync(skillsSource, { withFileTypes: true })) {
-      if (skill.isDirectory()) {
-        copyDir(path.join(skillsSource, skill.name), path.join(commandsDir, skill.name));
-        console.log(`  ${GREEN}✓${RESET} Installed skill: ${skill.name}`);
-      }
-    }
-  }
-  // Agents
-  const agentsSource = path.join(PLUGIN_ROOT, "agents");
-  if (fs.existsSync(agentsSource)) {
-    fs.mkdirSync(agentsDir, { recursive: true });
-    for (const agent of fs.readdirSync(agentsSource)) {
-      copyFile(path.join(agentsSource, agent), path.join(agentsDir, agent));
-      console.log(`  ${GREEN}✓${RESET} Installed agent: ${agent}`);
-    }
-  }
+  // 1. Copy plugin to cache
+  const cacheDir = path.join(baseDir, "plugins", "cache", "local", "harness-evolver", VERSION);
+  console.log(`  Copying plugin to ${scope === "local" ? "." : "~"}/${runtimeDir}/plugins/cache/...`);
+  copyDir(PLUGIN_ROOT, cacheDir);
+  console.log(`  ${GREEN}✓${RESET} Plugin files copied`);
+  // 2. Register in installed_plugins.json
+  const installedPath = path.join(baseDir, "plugins", "installed_plugins.json");
+  let installed = readJSON(installedPath) || { version: 2, plugins: {} };
+  if (!installed.plugins) installed.plugins = {};
+  installed.plugins["harness-evolver@local"] = [{
+    scope: "user",
+    installPath: cacheDir,
+    version: VERSION,
+    installedAt: new Date().toISOString(),
+    lastUpdated: new Date().toISOString(),
+  }];
+  writeJSON(installedPath, installed);
+  console.log(`  ${GREEN}✓${RESET} Registered in installed_plugins.json`);
+  // 3. Enable in settings.json
+  const settingsPath = path.join(baseDir, "settings.json");
+  let settings = readJSON(settingsPath) || {};
+  if (!settings.enabledPlugins) settings.enabledPlugins = {};
+  settings.enabledPlugins["harness-evolver@local"] = true;
+  writeJSON(settingsPath, settings);
+  console.log(`  ${GREEN}✓${RESET} Enabled in settings.json`);
+  // Count installed items
+  const skillCount = fs.existsSync(path.join(cacheDir, "skills"))
+    ? fs.readdirSync(path.join(cacheDir, "skills")).filter(f =>
+        fs.statSync(path.join(cacheDir, "skills", f)).isDirectory()
+      ).length
+    : 0;
+  const agentCount = fs.existsSync(path.join(cacheDir, "agents"))
+    ? fs.readdirSync(path.join(cacheDir, "agents")).length
+    : 0;
+  const toolCount = fs.existsSync(path.join(cacheDir, "tools"))
+    ? fs.readdirSync(path.join(cacheDir, "tools")).filter(f => f.endsWith(".py")).length
+    : 0;
+  console.log(`  ${GREEN}✓${RESET} ${skillCount} skills, ${agentCount} agent, ${toolCount} tools`);
 }
-function installTools() {
+function installToolsGlobal() {
   const toolsDir = path.join(HOME, ".harness-evolver", "tools");
   const toolsSource = path.join(PLUGIN_ROOT, "tools");
   if (fs.existsSync(toolsSource)) {
     fs.mkdirSync(toolsDir, { recursive: true });
     for (const tool of fs.readdirSync(toolsSource)) {
       if (tool.endsWith(".py")) {
-        copyFile(path.join(toolsSource, tool), path.join(toolsDir, tool));
-        console.log(`  ${GREEN}✓${RESET} Installed tool: ${tool}`);
+        fs.copyFileSync(path.join(toolsSource, tool), path.join(toolsDir, tool));
       }
     }
+    console.log(`  ${GREEN}✓${RESET} Tools copied to ~/.harness-evolver/tools/`);
   }
 }
@@ -126,7 +148,7 @@ function installExamples() {
   const examplesSource = path.join(PLUGIN_ROOT, "examples");
   if (fs.existsSync(examplesSource)) {
     copyDir(examplesSource, examplesDir);
-    console.log(`  ${GREEN}✓${RESET} Installed examples: classifier`);
+    console.log(`  ${GREEN}✓${RESET} Examples copied to ~/.harness-evolver/examples/`);
   }
 }
@@ -136,7 +158,6 @@ async function main() {
   console.log(`  ${DIM}Meta-Harness-style autonomous harness optimization${RESET}`);
   console.log();
-  // Check python
   if (!checkPython()) {
     console.error(`  ${RED}ERROR:${RESET} python3 not found in PATH. Install Python 3.8+ first.`);
     process.exit(1);
@@ -144,8 +165,14 @@ async function main() {
   console.log(`  ${GREEN}✓${RESET} python3 found`);
   // Detect runtimes
-  const available = RUNTIMES.filter((r) => r.detected());
-  if (available.length === 0) {
+  const RUNTIMES = [
+    { name: "Claude Code", dir: ".claude" },
+    { name: "Cursor", dir: ".cursor" },
+    { name: "Codex", dir: ".codex" },
+    { name: "Windsurf", dir: ".windsurf" },
+  ].filter(r => fs.existsSync(path.join(HOME, r.dir)));
+  if (RUNTIMES.length === 0) {
     console.error(`\n  ${RED}ERROR:${RESET} No supported runtime detected.`);
     console.error(`  Install Claude Code, Cursor, Codex, or Windsurf first.`);
     process.exit(1);
@@ -155,74 +182,62 @@ async function main() {
   // Runtime selection
   console.log(`\n  ${YELLOW}Which runtime(s) would you like to install for?${RESET}\n`);
-  available.forEach((r, i) => {
-    console.log(`  ${i + 1}) ${r.name.padEnd(14)} (~/${r.dir})`);
-  });
-  if (available.length > 1) {
-    console.log(`  ${available.length + 1}) All`);
+  RUNTIMES.forEach((r, i) => console.log(`  ${i + 1}) ${r.name.padEnd(14)} (~/${r.dir})`));
+  if (RUNTIMES.length > 1) {
+    console.log(`  ${RUNTIMES.length + 1}) All`);
     console.log(`\n  ${DIM}Select multiple: 1,2 or 1 2${RESET}`);
   }
-  const defaultChoice = "1";
-  const runtimeAnswer = await ask(rl, `\n  ${YELLOW}Choice [${defaultChoice}]:${RESET} `);
-  const runtimeInput = (runtimeAnswer.trim() || defaultChoice);
+  const runtimeAnswer = await ask(rl, `\n  ${YELLOW}Choice [1]:${RESET} `);
+  const runtimeInput = (runtimeAnswer.trim() || "1");
-  let selectedRuntimes;
-  if (runtimeInput === String(available.length + 1)) {
-    selectedRuntimes = available;
+  let selected;
+  if (runtimeInput === String(RUNTIMES.length + 1)) {
+    selected = RUNTIMES;
   } else {
-    const indices = runtimeInput.split(/[,\s]+/).map((s) => parseInt(s, 10) - 1);
-    selectedRuntimes = indices
-      .filter((i) => i >= 0 && i < available.length)
-      .map((i) => available[i]);
-  }
-  if (selectedRuntimes.length === 0) {
-    selectedRuntimes = [available[0]];
+    const indices = runtimeInput.split(/[,\s]+/).map(s => parseInt(s, 10) - 1);
+    selected = indices.filter(i => i >= 0 && i < RUNTIMES.length).map(i => RUNTIMES[i]);
   }
+  if (selected.length === 0) selected = [RUNTIMES[0]];
   // Scope selection
   console.log(`\n  ${YELLOW}Where would you like to install?${RESET}\n`);
-  console.log(`  1) Global  (~/${selectedRuntimes[0].dir}) - available in all projects`);
-  console.log(`  2) Local   (./${selectedRuntimes[0].dir}) - this project only`);
+  console.log(`  1) Global  (~/${selected[0].dir}) - available in all projects`);
+  console.log(`  2) Local   (./${selected[0].dir}) - this project only`);
   const scopeAnswer = await ask(rl, `\n  ${YELLOW}Choice [1]:${RESET} `);
   const scope = (scopeAnswer.trim() === "2") ? "local" : "global";
   console.log();
-  // Install for each selected runtime
-  for (const runtime of selectedRuntimes) {
-    const target = scope === "local" ? `./${runtime.dir}` : `~/${runtime.dir}`;
-    console.log(`  Installing for ${CYAN}${runtime.name}${RESET} to ${target}`);
+  // Install
+  for (const runtime of selected) {
+    console.log(`  Installing for ${BRIGHT_MAGENTA}${runtime.name}${RESET}\n`);
+    installPlugin(runtime.dir, scope);
     console.log();
-    installForRuntime(runtime.dir, scope);
   }
-  // Tools and examples are always global
-  installTools();
+  installToolsGlobal();
   installExamples();
-  // Write version file
+  // Version marker
   const versionPath = path.join(HOME, ".harness-evolver", "VERSION");
   fs.mkdirSync(path.dirname(versionPath), { recursive: true });
   fs.writeFileSync(versionPath, VERSION);
-  console.log(`  ${GREEN}✓${RESET} Wrote VERSION (${VERSION})`);
+  console.log(`  ${GREEN}✓${RESET} VERSION ${VERSION}`);
-  console.log(`\n  ${GREEN}Done!${RESET} Open a project in Claude Code and run ${CYAN}/harness-evolver:init${RESET}`);
+  console.log(`\n  ${GREEN}Done!${RESET} Open a project in Claude Code and run ${BRIGHT_MAGENTA}/harness-evolver:init${RESET}`);
   console.log(`\n  ${DIM}Quick start with example:${RESET}`);
   console.log(`    cp -r ~/.harness-evolver/examples/classifier ./my-project`);
   console.log(`    cd my-project && claude`);
   console.log(`    /harness-evolver:init`);
   console.log(`    /harness-evolver:evolve`);
-  console.log(`\n  ${DIM}GitHub: https://github.com/raphaelchristi/harness-evolver${RESET}`);
-  console.log();
+  console.log(`\n  ${DIM}GitHub: https://github.com/raphaelchristi/harness-evolver${RESET}\n`);
   rl.close();
 }
-main().catch((err) => {
+main().catch(err => {
   console.error(`  ${RED}ERROR:${RESET} ${err.message}`);
   process.exit(1);
 });

package/examples/classifier/harness.py CHANGED Viewed

@@ -39,7 +39,7 @@ def classify_mock(text):
 def classify_llm(text, config):
     import urllib.request
-    api_key = config.get("api_key", os.environ.get("ANTHROPIC_API_KEY", ""))
+    api_key = os.environ.get("ANTHROPIC_API_KEY", "")
     model = config.get("model", "claude-haiku-4-5-20251001")
     prompt = (

package/package.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "name": "harness-evolver",
-  "version": "0.5.0",
+  "version": "0.6.0",
   "description": "Meta-Harness-style autonomous harness optimization for Claude Code",
-  "author": "Raphael Valdetaro Christi Cordeiro",
+  "author": "Raphael Valdetaro",
   "license": "MIT",
   "repository": {
     "type": "git",

package/skills/compare/SKILL.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-name: compare
+name: harness-evolver:compare
 description: "Use when the user wants to compare two harness versions, understand what changed between iterations, see why one version scored better than another, or debug a regression."
 argument-hint: "<vA> <vB>"
 allowed-tools: [Read, Bash, Glob, Grep]

package/skills/deploy/SKILL.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-name: deploy
+name: harness-evolver:deploy
 description: "Use when the user wants to use the best evolved harness in their project, promote a version to production, copy the winning harness back, or is done evolving and wants to apply the result."
 argument-hint: "[version]"
 allowed-tools: [Read, Write, Bash, Glob]

package/skills/diagnose/SKILL.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-name: diagnose
+name: harness-evolver:diagnose
 description: "Use when the user wants to understand why a specific harness version failed, investigate a regression, analyze trace data, or debug a low score. Also use when the user says 'why did v003 fail' or 'what went wrong'."
 argument-hint: "[version]"
 allowed-tools: [Read, Bash, Glob, Grep]

package/skills/evolve/SKILL.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-name: evolve
+name: harness-evolver:evolve
 description: "Use when the user wants to run the optimization loop, improve harness performance, evolve the harness, or iterate on harness quality. Requires .harness-evolver/ to exist (run harness-evolver:init first)."
 argument-hint: "[--iterations N]"
 allowed-tools: [Read, Write, Edit, Bash, Glob, Grep, Agent]

package/skills/init/SKILL.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-name: init
+name: harness-evolver:init
 description: "Use when the user wants to set up harness optimization in their project, optimize an LLM agent, improve a harness, or mentions harness-evolver for the first time in a project without .harness-evolver/ directory."
 argument-hint: "[directory]"
 allowed-tools: [Read, Write, Edit, Bash, Glob, Grep, Agent]

package/skills/status/SKILL.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-name: status
+name: harness-evolver:status
 description: "Use when the user asks about evolution progress, current scores, best harness version, how many iterations ran, or whether the loop is stagnating. Also use when the user says 'status', 'progress', or 'how is it going'."
 allowed-tools: [Read, Bash]
 ---

package/tools/init.py CHANGED Viewed

@@ -89,6 +89,30 @@ def _auto_detect(search_dir):
     return harness, eval_script, tasks, config
+def _detect_api_keys():
+    """Detect which LLM/service API keys are available in the environment."""
+    KNOWN_KEYS = {
+        "ANTHROPIC_API_KEY": "Anthropic (Claude)",
+        "OPENAI_API_KEY": "OpenAI (GPT)",
+        "GOOGLE_API_KEY": "Google (Gemini)",
+        "GEMINI_API_KEY": "Google Gemini",
+        "OPENROUTER_API_KEY": "OpenRouter",
+        "LANGSMITH_API_KEY": "LangSmith",
+        "TOGETHER_API_KEY": "Together AI",
+        "GROQ_API_KEY": "Groq",
+        "MISTRAL_API_KEY": "Mistral",
+        "COHERE_API_KEY": "Cohere",
+        "FIREWORKS_API_KEY": "Fireworks AI",
+        "DEEPSEEK_API_KEY": "DeepSeek",
+        "XAI_API_KEY": "xAI (Grok)",
+    }
+    detected = {}
+    for env_var, display_name in KNOWN_KEYS.items():
+        if os.environ.get(env_var):
+            detected[env_var] = {"name": display_name, "status": "detected"}
+    return detected
 def _detect_langsmith():
     """Auto-detect LangSmith API key and return config section."""
     if os.environ.get("LANGSMITH_API_KEY"):
@@ -252,9 +276,19 @@ def main():
             "harnesses": "harnesses/",
         },
     }
+    # Detect API keys available in environment
+    api_keys = _detect_api_keys()
+    config["api_keys"] = api_keys
     with open(os.path.join(base, "config.json"), "w") as f:
         json.dump(config, f, indent=2)
+    if api_keys:
+        print("API keys detected:")
+        for env_var, info in api_keys.items():
+            print(f"  {info['name']} ({env_var})")
+        print()
     ls_config = config["eval"].get("langsmith", {})
     if ls_config.get("enabled"):
         print("  LangSmith tracing enabled (LANGSMITH_API_KEY detected)")