npm - harness-evolver - Versions diffs - 0.4.0 → 0.5.1 - Mend

harness-evolver 0.4.0 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

package/agents/harness-evolver-proposer.md +2 -0
package/bin/install.js +156 -52
package/examples/classifier/harness.py +1 -1
package/package.json +1 -1
package/tools/init.py +34 -0

package/agents/harness-evolver-proposer.md CHANGED Viewed

@@ -106,6 +106,8 @@ Append a summary to `PROPOSER_HISTORY.md`.
 6. **Prefer readable harnesses over defensive ones.** If the harness has grown past 2x the baseline size without proportional score improvement, consider simplifying. Accumulated try/catch blocks, redundant fallbacks, and growing if-chains are a code smell in evolved harnesses.
+7. **Use available API keys from environment.** Check `config.json` field `api_keys` to see which LLM APIs are available (Anthropic, OpenAI, Gemini, OpenRouter, etc.). Always read keys via `os.environ.get("KEY_NAME")` — never hardcode values. If an evolution strategy requires an API that isn't available, note it in `proposal.md` and choose an alternative.
 ## Documentation Lookup (if Context7 available)
 - Read `config.json` field `stack.detected` to see which libraries the harness uses.

package/bin/install.js CHANGED Viewed

@@ -1,26 +1,54 @@
 #!/usr/bin/env node
 /**
  * Harness Evolver installer.
- * Detects Claude Code, copies skills/agents/tools to the right locations.
+ * Interactive setup with runtime selection, global/local choice.
  *
  * Usage: npx harness-evolver@latest
  */
 const fs = require("fs");
 const path = require("path");
+const readline = require("readline");
 const { execSync } = require("child_process");
+const VERSION = require("../package.json").version;
 const PLUGIN_ROOT = path.resolve(__dirname, "..");
 const HOME = process.env.HOME || process.env.USERPROFILE;
-const CLAUDE_DIR = path.join(HOME, ".claude");
-const COMMANDS_DIR = path.join(CLAUDE_DIR, "commands", "harness-evolver");
-const AGENTS_DIR = path.join(CLAUDE_DIR, "agents");
-const TOOLS_DIR = path.join(HOME, ".harness-evolver", "tools");
-const EXAMPLES_DIR = path.join(HOME, ".harness-evolver", "examples");
-function log(msg) {
-  console.log(`  ${msg}`);
+// ANSI escape sequences (SGR codes) interpolated into console output to color and style it
+const MAGENTA = "\x1b[35m";
+const BRIGHT_MAGENTA = "\x1b[95m";
+const GREEN = "\x1b[32m";
+const YELLOW = "\x1b[33m";
+const RED = "\x1b[31m";
+const DIM = "\x1b[2m"; // SGR 2: faint/dim intensity
+const BOLD = "\x1b[1m"; // SGR 1: bold intensity
+const RESET = "\x1b[0m"; // SGR 0: clears all styling set by the codes above
+const LOGO = `
+${BRIGHT_MAGENTA}  ██╗  ██╗ █████╗ ██████╗ ███╗   ██╗███████╗███████╗███████╗
+  ██║  ██║██╔══██╗██╔══██╗████╗  ██║██╔════╝██╔════╝██╔════╝
+  ███████║███████║██████╔╝██╔██╗ ██║█████╗  ███████╗███████╗
+  ██╔══██║██╔══██║██╔══██╗██║╚██╗██║██╔══╝  ╚════██║╚════██║
+  ██║  ██║██║  ██║██║  ██║██║ ╚████║███████╗███████║███████║
+  ╚═╝  ╚═╝╚═╝  ╚═╝╚═╝  ╚═╝╚═╝  ╚═══╝╚══════╝╚══════╝╚══════╝
+  ${MAGENTA}${BOLD}███████╗██╗   ██╗ ██████╗ ██╗    ██╗   ██╗███████╗██████╗
+  ██╔════╝██║   ██║██╔═══██╗██║    ██║   ██║██╔════╝██╔══██╗
+  █████╗  ██║   ██║██║   ██║██║    ██║   ██║█████╗  ██████╔╝
+  ██╔══╝  ╚██╗ ██╔╝██║   ██║██║    ╚██╗ ██╔╝██╔══╝  ██╔══██╗
+  ███████╗ ╚████╔╝ ╚██████╔╝███████╗╚████╔╝ ███████╗██║  ██║
+  ╚══════╝  ╚═══╝   ╚═════╝ ╚══════╝ ╚═══╝  ╚══════╝╚═╝  ╚═╝${RESET}
+`; // Banner printed first by main(); first word in bright magenta, second in bold magenta, then styling is reset
+const RUNTIMES = [ // Supported runtimes: display name, config directory name, and a check that the directory exists under HOME
+  { name: "Claude Code", dir: ".claude", detected: () => fs.existsSync(path.join(HOME, ".claude")) },
+  { name: "Cursor", dir: ".cursor", detected: () => fs.existsSync(path.join(HOME, ".cursor")) },
+  { name: "Codex", dir: ".codex", detected: () => fs.existsSync(path.join(HOME, ".codex")) },
+  { name: "Windsurf", dir: ".windsurf", detected: () => fs.existsSync(path.join(HOME, ".windsurf")) },
+]; // NOTE(review): detection is always against HOME, even when the user later picks a local (cwd) install
+function ask(rl, question) { // Promise wrapper around rl.question: resolves with whatever rl.question passes to its callback
+  return new Promise((resolve) => rl.question(question, resolve)); // never rejects; there is no error or close handling here
 }
 function copyDir(src, dest) {
@@ -50,76 +78,152 @@ function checkPython() {
   }
 }
-function main() {
-  console.log("\n  Harness Evolver v0.1.0\n");
+function installForRuntime(runtimeDir, scope) { // Copies the bundled skills and agents into one runtime's config directory
+  const baseDir = scope === "local" // "local" targets the current working directory; any other scope value targets HOME
+    ? path.join(process.cwd(), runtimeDir)
+    : path.join(HOME, runtimeDir);
-  if (!checkPython()) {
-    console.error("  ERROR: python3 not found in PATH. Install Python 3.8+ first.");
-    process.exit(1);
-  }
-  log("\u2713 python3 found");
+  const commandsDir = path.join(baseDir, "commands", "harness-evolver");
+  const agentsDir = path.join(baseDir, "agents");
-  if (!fs.existsSync(CLAUDE_DIR)) {
-    console.error(`  ERROR: Claude Code directory not found at ${CLAUDE_DIR}`);
-    console.error("  Install Claude Code first: https://claude.ai/code");
-    process.exit(1);
-  }
-  log("\u2713 Claude Code detected");
-  // Copy skills
+  // Skills: each subdirectory of PLUGIN_ROOT/skills is copied to commands/harness-evolver/<skill name>; plain files are skipped
   const skillsSource = path.join(PLUGIN_ROOT, "skills");
   if (fs.existsSync(skillsSource)) {
     for (const skill of fs.readdirSync(skillsSource, { withFileTypes: true })) {
       if (skill.isDirectory()) {
-        const src = path.join(skillsSource, skill.name);
-        const dest = path.join(COMMANDS_DIR, skill.name);
-        copyDir(src, dest);
-        log(`  skill: ${skill.name}`);
+        copyDir(path.join(skillsSource, skill.name), path.join(commandsDir, skill.name));
+        console.log(`  ${GREEN}✓${RESET} Installed skill: ${skill.name}`);
       }
     }
   }
-  // Copy agents
+  // Agents: every entry of PLUGIN_ROOT/agents is copied into <baseDir>/agents under the same name
   const agentsSource = path.join(PLUGIN_ROOT, "agents");
   if (fs.existsSync(agentsSource)) {
-    fs.mkdirSync(AGENTS_DIR, { recursive: true });
+    fs.mkdirSync(agentsDir, { recursive: true });
     for (const agent of fs.readdirSync(agentsSource)) {
-      copyFile(
-        path.join(agentsSource, agent),
-        path.join(AGENTS_DIR, agent)
-      );
-      log(`  agent: ${agent}`);
+      copyFile(path.join(agentsSource, agent), path.join(agentsDir, agent)); // NOTE(review): entries are not filtered, so a subdirectory would also reach copyFile — confirm copyFile tolerates that
+      console.log(`  ${GREEN}✓${RESET} Installed agent: ${agent}`);
     }
   }
+}
-  // Copy tools
+function installTools() { // Copies the bundled Python tools into HOME/.harness-evolver/tools, independent of the chosen runtime or scope
+  const toolsDir = path.join(HOME, ".harness-evolver", "tools");
   const toolsSource = path.join(PLUGIN_ROOT, "tools");
   if (fs.existsSync(toolsSource)) {
-    fs.mkdirSync(TOOLS_DIR, { recursive: true });
+    fs.mkdirSync(toolsDir, { recursive: true });
     for (const tool of fs.readdirSync(toolsSource)) {
       if (tool.endsWith(".py")) {
-        copyFile(
-          path.join(toolsSource, tool),
-          path.join(TOOLS_DIR, tool)
-        );
-        log(`  tool: ${tool}`);
+        copyFile(path.join(toolsSource, tool), path.join(toolsDir, tool)); // only top-level entries whose name ends in ".py" are copied
+        console.log(`  ${GREEN}✓${RESET} Installed tool: ${tool}`);
       }
     }
   }
+}
-  // Copy examples
+function installExamples() { // Copies the whole bundled examples directory into HOME/.harness-evolver/examples
+  const examplesDir = path.join(HOME, ".harness-evolver", "examples");
   const examplesSource = path.join(PLUGIN_ROOT, "examples");
   if (fs.existsSync(examplesSource)) {
-    copyDir(examplesSource, EXAMPLES_DIR);
-    log("  examples: classifier");
+    copyDir(examplesSource, examplesDir);
+    console.log(`  ${GREEN}✓${RESET} Installed examples: classifier`); // NOTE(review): "classifier" is hard-coded; the message does not reflect what copyDir actually copied
+  }
+}
+async function main() { // Interactive installer: checks python3, detects runtimes, prompts for runtime(s) and scope, then copies files
+  console.log(LOGO);
+  console.log(`  ${DIM}Harness Evolver v${VERSION}${RESET}`);
+  console.log(`  ${DIM}Meta-Harness-style autonomous harness optimization${RESET}`);
+  console.log();
+  // Check python: abort with exit status 1 before prompting if checkPython() reports failure
+  if (!checkPython()) {
+    console.error(`  ${RED}ERROR:${RESET} python3 not found in PATH. Install Python 3.8+ first.`);
+    process.exit(1);
+  }
+  console.log(`  ${GREEN}✓${RESET} python3 found`);
+  // Detect runtimes: keep only RUNTIMES entries whose detected() check passes; abort if none do
+  const available = RUNTIMES.filter((r) => r.detected());
+  if (available.length === 0) {
+    console.error(`\n  ${RED}ERROR:${RESET} No supported runtime detected.`);
+    console.error(`  Install Claude Code, Cursor, Codex, or Windsurf first.`);
+    process.exit(1);
   }
-  console.log("\n  \u2713 Installed successfully!\n");
-  console.log("  Next steps:");
-  console.log("    1. Copy an example:  cp -r ~/.harness-evolver/examples/classifier ./my-project");
-  console.log("    2. cd my-project");
-  console.log("    3. /harness-evolve-init --harness harness.py --eval eval.py --tasks tasks/");
-  console.log("    4. /harness-evolve --iterations 5\n");
+  const rl = readline.createInterface({ input: process.stdin, output: process.stdout });
+  // Runtime selection: list detected runtimes numbered from 1; the "All" entry is printed only when more than one is available
+  console.log(`\n  ${YELLOW}Which runtime(s) would you like to install for?${RESET}\n`);
+  available.forEach((r, i) => {
+    console.log(`  ${i + 1}) ${r.name.padEnd(14)} (~/${r.dir})`);
+  });
+  if (available.length > 1) {
+    console.log(`  ${available.length + 1}) All`);
+    console.log(`\n  ${DIM}Select multiple: 1,2 or 1 2${RESET}`);
+  }
+  const defaultChoice = "1"; // an empty answer selects the first detected runtime
+  const runtimeAnswer = await ask(rl, `\n  ${YELLOW}Choice [${defaultChoice}]:${RESET} `);
+  const runtimeInput = (runtimeAnswer.trim() || defaultChoice);
+  let selectedRuntimes;
+  if (runtimeInput === String(available.length + 1)) { // NOTE(review): the "All" number is accepted even when only one runtime exists and the option was not printed
+    selectedRuntimes = available;
+  } else {
+    const indices = runtimeInput.split(/[,\s]+/).map((s) => parseInt(s, 10) - 1);
+    selectedRuntimes = indices // comma- or whitespace-separated 1-based numbers, converted to 0-based indices above
+      .filter((i) => i >= 0 && i < available.length) // drops NaN and out-of-range entries; NOTE(review): duplicates such as "1,1" are kept, so that runtime is installed twice
+      .map((i) => available[i]);
+  }
+  if (selectedRuntimes.length === 0) { // nothing valid was entered: fall back to the first detected runtime
+    selectedRuntimes = [available[0]];
+  }
+  // Scope selection: one answer applies to every selected runtime; any answer other than "2" means global
+  console.log(`\n  ${YELLOW}Where would you like to install?${RESET}\n`);
+  console.log(`  1) Global  (~/${selectedRuntimes[0].dir}) - available in all projects`); // NOTE(review): only the first selected runtime's directory is shown here
+  console.log(`  2) Local   (./${selectedRuntimes[0].dir}) - this project only`);
+  const scopeAnswer = await ask(rl, `\n  ${YELLOW}Choice [1]:${RESET} `);
+  const scope = (scopeAnswer.trim() === "2") ? "local" : "global";
+  console.log();
+  // Install for each selected runtime
+  for (const runtime of selectedRuntimes) {
+    const target = scope === "local" ? `./${runtime.dir}` : `~/${runtime.dir}`; // display string only; the real path is built inside installForRuntime
+    console.log(`  Installing for ${BRIGHT_MAGENTA}${runtime.name}${RESET} to ${target}`);
+    console.log();
+    installForRuntime(runtime.dir, scope);
+  }
+  // Tools and examples are always global
+  installTools();
+  installExamples();
+  // Write version file: HOME/.harness-evolver/VERSION holds the version string read from package.json
+  const versionPath = path.join(HOME, ".harness-evolver", "VERSION");
+  fs.mkdirSync(path.dirname(versionPath), { recursive: true });
+  fs.writeFileSync(versionPath, VERSION);
+  console.log(`  ${GREEN}✓${RESET} Wrote VERSION (${VERSION})`);
+  console.log(`\n  ${GREEN}Done!${RESET} Open a project in Claude Code and run ${BRIGHT_MAGENTA}/harness-evolver:init${RESET}`); // NOTE(review): names Claude Code even when a different runtime was selected
+  console.log(`\n  ${DIM}Quick start with example:${RESET}`);
+  console.log(`    cp -r ~/.harness-evolver/examples/classifier ./my-project`);
+  console.log(`    cd my-project && claude`);
+  console.log(`    /harness-evolver:init`);
+  console.log(`    /harness-evolver:evolve`);
+  console.log(`\n  ${DIM}GitHub: https://github.com/raphaelchristi/harness-evolver${RESET}`);
+  console.log();
+  rl.close(); // NOTE(review): reached only on the success path; an exception thrown above skips this close
 }
-main();
+main().catch((err) => { // Entry point: run the installer; on rejection print the error message and exit with status 1
+  console.error(`  ${RED}ERROR:${RESET} ${err.message}`); // only err.message is printed; the stack trace is not shown
+  process.exit(1);
+});

package/examples/classifier/harness.py CHANGED Viewed

@@ -39,7 +39,7 @@ def classify_mock(text):
 def classify_llm(text, config):
     import urllib.request
-    api_key = config.get("api_key", os.environ.get("ANTHROPIC_API_KEY", ""))
+    api_key = os.environ.get("ANTHROPIC_API_KEY", "")
     model = config.get("model", "claude-haiku-4-5-20251001")
     prompt = (

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "harness-evolver",
-  "version": "0.4.0",
+  "version": "0.5.1",
   "description": "Meta-Harness-style autonomous harness optimization for Claude Code",
   "author": "Raphael Valdetaro Christi Cordeiro",
   "license": "MIT",

package/tools/init.py CHANGED Viewed

@@ -89,6 +89,30 @@ def _auto_detect(search_dir):
     return harness, eval_script, tasks, config
+def _detect_api_keys():
+    """Detect which LLM/service API keys are available in the environment."""
+    KNOWN_KEYS = {  # environment variable name -> human-readable provider name
+        "ANTHROPIC_API_KEY": "Anthropic (Claude)",
+        "OPENAI_API_KEY": "OpenAI (GPT)",
+        "GOOGLE_API_KEY": "Google (Gemini)",
+        "GEMINI_API_KEY": "Google Gemini",
+        "OPENROUTER_API_KEY": "OpenRouter",
+        "LANGSMITH_API_KEY": "LangSmith",
+        "TOGETHER_API_KEY": "Together AI",
+        "GROQ_API_KEY": "Groq",
+        "MISTRAL_API_KEY": "Mistral",
+        "COHERE_API_KEY": "Cohere",
+        "FIREWORKS_API_KEY": "Fireworks AI",
+        "DEEPSEEK_API_KEY": "DeepSeek",
+        "XAI_API_KEY": "xAI (Grok)",
+    }
+    detected = {}  # returned mapping: env var name -> {"name": ..., "status": "detected"}
+    for env_var, display_name in KNOWN_KEYS.items():
+        if os.environ.get(env_var):  # unset and empty-string values both count as not available
+            detected[env_var] = {"name": display_name, "status": "detected"}  # records the variable name only, never the key's value
+    return detected
 def _detect_langsmith():
     """Auto-detect LangSmith API key and return config section."""
     if os.environ.get("LANGSMITH_API_KEY"):
@@ -252,9 +276,19 @@ def main():
             "harnesses": "harnesses/",
         },
     }
+    # Detect API keys available in environment
+    api_keys = _detect_api_keys()
+    config["api_keys"] = api_keys
     with open(os.path.join(base, "config.json"), "w") as f:
         json.dump(config, f, indent=2)
+    if api_keys:
+        print("API keys detected:")
+        for env_var, info in api_keys.items():
+            print(f"  {info['name']} ({env_var})")
+        print()
     ls_config = config["eval"].get("langsmith", {})
     if ls_config.get("enabled"):
         print("  LangSmith tracing enabled (LANGSMITH_API_KEY detected)")