npm - @evomap/evolver - Versions diffs - 1.87.2 → 1.87.3 - Mend

@evomap/evolver 1.87.2 → 1.87.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (65)

package/README.ja-JP.md +1 -1
package/README.ko-KR.md +1 -1
package/README.md +9 -8
package/README.zh-CN.md +9 -8
package/package.json +1 -1
package/scripts/build_binaries.js +31 -7
package/src/atp/atpExecute.js +35 -8
package/src/atp/autoBuyer.js +71 -16
package/src/atp/autoDeliver.js +16 -0
package/src/atp/cliAutobuyPrompt.js +8 -22
package/src/atp/hubClient.js +42 -4
package/src/evolve/guards.js +1 -1
package/src/evolve/pipeline/collect.js +1 -1
package/src/evolve/pipeline/dispatch.js +1 -1
package/src/evolve/pipeline/enrich.js +1 -1
package/src/evolve/pipeline/hub.js +1 -1
package/src/evolve/pipeline/select.js +1 -1
package/src/evolve/pipeline/signals.js +1 -1
package/src/evolve/utils.js +1 -1
package/src/evolve.js +1 -1
package/src/gep/a2aProtocol.js +1 -1
package/src/gep/assetStore.js +52 -5
package/src/gep/candidateEval.js +1 -1
package/src/gep/candidates.js +1 -1
package/src/gep/contentHash.js +1 -1
package/src/gep/crypto.js +1 -1
package/src/gep/curriculum.js +1 -1
package/src/gep/deviceId.js +1 -1
package/src/gep/envFingerprint.js +1 -1
package/src/gep/epigenetics.js +1 -1
package/src/gep/explore.js +1 -1
package/src/gep/hash.js +1 -1
package/src/gep/hubFetch.js +1 -1
package/src/gep/hubReview.js +1 -1
package/src/gep/hubSearch.js +1 -1
package/src/gep/hubVerify.js +1 -1
package/src/gep/learningSignals.js +1 -1
package/src/gep/memoryGraph.js +1 -1
package/src/gep/memoryGraphAdapter.js +1 -1
package/src/gep/mutation.js +1 -1
package/src/gep/narrativeMemory.js +1 -1
package/src/gep/openPRRegistry.js +1 -1
package/src/gep/paths.js +6 -2
package/src/gep/personality.js +1 -1
package/src/gep/policyCheck.js +1 -1
package/src/gep/prompt.js +1 -1
package/src/gep/recallVerifier.js +1 -1
package/src/gep/reflection.js +1 -1
package/src/gep/sanitize.js +57 -3
package/src/gep/selector.js +1 -1
package/src/gep/selfPR.js +34 -1
package/src/gep/skill2gep.js +108 -29
package/src/gep/skillDistiller.js +1 -1
package/src/gep/solidify.js +1 -1
package/src/gep/strategy.js +1 -1
package/src/gep/workspaceKeychain.js +1 -1
package/src/proxy/lifecycle/manager.js +97 -37
package/src/proxy/router/messages_route.js +25 -0
package/src/proxy/sync/engine.js +68 -31
package/assets/gep/candidates.jsonl +0 -1
package/assets/gep/capsules.json +0 -4
package/assets/gep/events.jsonl +0 -0
package/assets/gep/failed_capsules.json +0 -4
package/assets/gep/genes.json +0 -245
package/assets/gep/genes.jsonl +0 -0

package/README.ja-JP.md CHANGED Viewed

@@ -32,7 +32,7 @@
 >
 > Evolver はこの結論を実装に落とし込んだオープンソースエンジンです。GEP プロトコルの下で、エージェントの経験を場当たり的なプロンプトやスキルドキュメントではなく、Gene と Capsule として符号化します。*なぜ* Evolver が長いスキルドキュメントではなく Gene にこだわるのか疑問に思ったことがあるなら、読むべきはこの論文です。
 >
-> 応用事例を見たい方へ：[OpenClaw x EvoMap：CritPt 評価レポート](https://evomap.ai/blog/openclaw-critpt-report) では、OpenClaw エージェントが CritPt Physics Solver 上の 5 バージョン（Beta → v2.2）にわたって、同じ Gene ベース進化ループによってスコアを 0.00% から 18.57% まで押し上げる全過程を、トークンコストの軌跡、遺伝子活性化マップ、そして推論が再利用可能な Gene に圧縮されるときに現れる「トークンが上昇してから下降する」シグネチャとともに詳述しています。
+> 応用事例を見たい方へ：[OpenClaw x EvoMap：CritPt 評価レポート](https://evomap.ai/blog/openclaw-critpt-report) では、OpenClaw エージェントが CritPt Physics Solver 上の 5 バージョン（Beta → v2.2）にわたって、同じ Gene ベース進化ループによってスコアを 9.1% から 18.57% まで押し上げる全過程を、トークンコストの軌跡、遺伝子活性化マップ、そして推論が再利用可能な Gene に圧縮されるときに現れる「トークンが上昇してから下降する」シグネチャとともに詳述しています。
 ---

package/README.ko-KR.md CHANGED Viewed

@@ -32,7 +32,7 @@
 >
 > Evolver는 이 결과를 실제로 구현하는 오픈소스 엔진입니다. GEP 프로토콜 아래 에이전트의 경험을 임시 프롬프트나 스킬 문서가 아니라 Gene과 Capsule로 인코딩합니다. *왜* Evolver가 더 긴 스킬 문서 대신 Gene을 고집하는지 궁금했다면, 바로 이 논문을 읽어야 합니다.
 >
-> 적용 사례가 궁금하신가요? [OpenClaw x EvoMap: CritPt 평가 보고서](https://evomap.ai/blog/openclaw-critpt-report)는 동일한 Gene 기반 진화 루프가 OpenClaw 에이전트를 CritPt Physics Solver의 5개 버전(Beta → v2.2)에 걸쳐 0.00%에서 18.57%까지 끌어올리는 과정을, 전체 토큰 비용 궤적, 유전자 활성화 매핑, 그리고 추론이 재사용 가능한 Gene으로 압축될 때 나타나는 "토큰이 먼저 상승한 뒤 하강하는" 시그니처와 함께 단계별로 보여줍니다.
+> 적용 사례가 궁금하신가요? [OpenClaw x EvoMap: CritPt 평가 보고서](https://evomap.ai/blog/openclaw-critpt-report)는 동일한 Gene 기반 진화 루프가 OpenClaw 에이전트를 CritPt Physics Solver의 5개 버전(Beta → v2.2)에 걸쳐 9.1%에서 18.57%까지 끌어올리는 과정을, 전체 토큰 비용 궤적, 유전자 활성화 매핑, 그리고 추론이 재사용 가능한 Gene으로 압축될 때 나타나는 "토큰이 먼저 상승한 뒤 하강하는" 시그니처와 함께 단계별로 보여줍니다.
 ---

package/README.md CHANGED Viewed

@@ -32,7 +32,7 @@
 >
 > Evolver is the open-source engine that puts this result into practice: it encodes agent experience as Genes and Capsules under the GEP protocol, not as ad hoc prompts or skill docs. If you've ever wondered *why* Evolver insists on Genes instead of longer skill docs, this is the paper to read.
 >
-> Want the applied version? [OpenClaw x EvoMap: CritPt Evaluation Report](https://evomap.ai/blog/openclaw-critpt-report) walks through how the same Gene-based evolution loop drives an OpenClaw agent from 0.00% to 18.57% on CritPt Physics Solver across five versions (Beta -> v2.2), with full token-cost trajectories, gene activation mapping, and the "tokens rise then fall" signature of reasoning getting compressed into reusable genes.
+> Want the applied version? [OpenClaw x EvoMap: CritPt Evaluation Report](https://evomap.ai/blog/openclaw-critpt-report) walks through how the same Gene-based evolution loop drives an OpenClaw agent from 9.1% to 18.57% on CritPt Physics Solver across five versions (Beta -> v2.2), with full token-cost trajectories, gene activation mapping, and the "tokens rise then fall" signature of reasoning getting compressed into reusable genes.
 ---
@@ -184,7 +184,7 @@ Every `evolver <flag>` invocation in the rest of this README maps 1:1 to `node i
 **Evolver is a prompt generator, not a code patcher.** Each evolution cycle:
 1. Scans your `memory/` directory for runtime logs, error patterns, and signals.
-2. Selects the best-matching [Gene or Capsule](https://evomap.ai/wiki) from `assets/gep/`.
+2. Selects the best-matching [Gene or Capsule](https://evomap.ai/wiki) from the local GEP asset store.
 3. Emits a strict, protocol-bound GEP prompt that guides the next evolution step.
 4. Records an auditable [EvolutionEvent](https://evomap.ai/wiki) for traceability.
@@ -377,16 +377,17 @@ The [evomap.ai](https://evomap.ai) dashboard has a "Worker" toggle on the node d
 This repo includes a protocol-constrained prompt mode based on [GEP (Genome Evolution Protocol)](https://evomap.ai/wiki).
-- **Structured assets** live in `assets/gep/`:
-  - `assets/gep/genes.json`
-  - `assets/gep/capsules.json`
-  - `assets/gep/events.jsonl`
+- **Structured runtime assets** live in `<workspace>/.evolver/gep/` by default:
+  - `<workspace>/.evolver/gep/genes.json`
+  - `<workspace>/.evolver/gep/capsules.json`
+  - `<workspace>/.evolver/gep/events.jsonl`
+- Set `GEP_ASSETS_DIR` to place the runtime asset store elsewhere.
 - **Selector** logic uses extracted signals to prefer existing Genes/Capsules and emits a JSON selector decision in the prompt.
 - **Constraints**: Only the DNA emoji is allowed in documentation; all other emoji are disallowed.
 ### Your local asset store is never overwritten by upgrades
-`assets/gep/genes.json`, `assets/gep/capsules.json`, and `assets/gep/events.jsonl` are owned by your runtime. Starting with 1.78.3, the npm tarball no longer contains these files, so `npm i -g @evomap/evolver` (or `git pull` of the public repo) never clobbers your accumulated Genes, Capsules, or EvolutionEvents. New installs still receive the curated starter Genes through `assets/gep/genes.seed.json`, which is applied only when `genes.json` is absent.
+`<workspace>/.evolver/gep/genes.json`, `<workspace>/.evolver/gep/capsules.json`, and `<workspace>/.evolver/gep/events.jsonl` are owned by your runtime and ignored by git. `assets/gep/` is reserved for bundled starter assets. On first run, evolver copies any legacy runtime files from `assets/gep/` into `.evolver/gep/` without deleting the originals, then seeds `genes.json` from the bundled starter genes only when no local `genes.json` exists.
 If you ran an older evolver version that wiped your local assets, pull back everything you Promoted or published to the Hub with a single command:
@@ -396,7 +397,7 @@ A2A_HUB_URL=https://evomap.ai evolver sync --scope=all --export=backup.gepx
 This hits `/a2a/assets/purchased` (Promoted-to-you plus self-purchased) and `/a2a/assets/published-by-me` (your own drafts and published assets), re-materializes the full payloads into `genes.json` / `capsules.json`, and packs a portable `.gepx` bundle. Previously-purchased payloads re-fetch at zero cost.
-Purely local assets that were never uploaded to the Hub have no remote copy -- recover them from your git history (for example `git show <old_tag>:assets/gep/genes.json > restored.json`) or from disk snapshots.
+Purely local assets that were never uploaded to the Hub have no remote copy -- recover them from `.evolver/gep/`, from an older `assets/gep/` checkout, or from disk snapshots.
 ## Configuration & Decoupling

package/README.zh-CN.md CHANGED Viewed

@@ -32,7 +32,7 @@
 >
 > Evolver 正是把这一结论落地的开源引擎：它基于 GEP 协议，把 Agent 的经验沉淀为 Gene 与 Capsule，而不是散落的 prompt 或技能文档。如果你想知道 *为什么* Evolver 坚持使用 Gene 而不是更长的 skill 文档，这就是那篇该读的论文。
 >
-> 想看应用落地的样本？[OpenClaw x EvoMap：CritPt 评测报告](https://evomap.ai/blog/openclaw-critpt-report) 以 OpenClaw Agent 在 CritPt Physics Solver 上的五个版本演进（Beta → v2.2）为例，完整拆解了同一套 Gene 进化闭环如何把得分从 0.00% 推到 18.57%，并给出 token 成本轨迹、基因激活映射，以及推理被压缩成可复用基因后所呈现的「token 先升后降」特征。
+> 想看应用落地的样本？[OpenClaw x EvoMap：CritPt 评测报告](https://evomap.ai/blog/openclaw-critpt-report) 以 OpenClaw Agent 在 CritPt Physics Solver 上的五个版本演进（Beta → v2.2）为例，完整拆解了同一套 Gene 进化闭环如何把得分从 9.1% 推到 18.57%，并给出 token 成本轨迹、基因激活映射，以及推理被压缩成可复用基因后所呈现的「token 先升后降」特征。
 ---
@@ -159,7 +159,7 @@ evolver --loop
 **Evolver 是一个提示词生成器，不是代码修改器。** 每个进化周期：
 1. 扫描 `memory/` 目录中的运行日志、错误模式和信号。
-2. 从 `assets/gep/` 中选择最匹配的 [Gene 或 Capsule](https://evomap.ai/wiki)。
+2. 从本地 GEP 资产库中选择最匹配的 [Gene 或 Capsule](https://evomap.ai/wiki)。
 3. 输出一份严格的、受协议约束的 GEP 提示词来引导下一步进化。
 4. 记录可审计的 [EvolutionEvent](https://evomap.ai/wiki) 以便追溯。
@@ -351,16 +351,17 @@ WORKER_ENABLED=1 WORKER_DOMAINS=repair,harden WORKER_MAX_LOAD=3 evolver --loop
 本仓库内置基于 [GEP（基因组进化协议）](https://evomap.ai/wiki)的协议受限提示词模式。
-- **结构化资产目录**：`assets/gep/`
-  - `assets/gep/genes.json`
-  - `assets/gep/capsules.json`
-  - `assets/gep/events.jsonl`
+- **结构化运行时资产目录**：默认位于 `<workspace>/.evolver/gep/`
+  - `<workspace>/.evolver/gep/genes.json`
+  - `<workspace>/.evolver/gep/capsules.json`
+  - `<workspace>/.evolver/gep/events.jsonl`
+- 可通过 `GEP_ASSETS_DIR` 把运行时资产库放到其他位置。
 - **Selector 选择器**：根据日志提取 signals，优先复用已有 Gene/Capsule，并在提示词中输出可审计的 Selector 决策 JSON。
 - **约束**：除 🧬 外，禁止使用其他 emoji。
 ### 升级不再覆盖你的本地资产库
-`assets/gep/genes.json`、`assets/gep/capsules.json`、`assets/gep/events.jsonl` 属于你本地运行时。从 1.78.3 起，npm 发行包不再包含这三个文件，`npm i -g @evomap/evolver`（或公共仓库的 `git pull`）不会再覆盖你累积的 Gene、Capsule 和 EvolutionEvent。新装用户依然会通过 `assets/gep/genes.seed.json` 拿到引擎维护的 starter Gene —— 只有在本地 `genes.json` 不存在时才会应用一次。
+`<workspace>/.evolver/gep/genes.json`、`<workspace>/.evolver/gep/capsules.json`、`<workspace>/.evolver/gep/events.jsonl` 属于你本地运行时，并被 git 忽略。`assets/gep/` 保留给随包发布的 starter 资产。首次运行时，evolver 会把旧版遗留在 `assets/gep/` 的运行时文件复制到 `.evolver/gep/`，不会删除原文件；只有在本地 `genes.json` 不存在时，才会从随包 starter Gene 初始化。
 如果你之前用老版本被覆盖过，现在可以一键把所有被 Promoted 给你、以及你自己上传到 Hub 的资产拉回来：
@@ -370,7 +371,7 @@ A2A_HUB_URL=https://evomap.ai evolver sync --scope=all --export=backup.gepx
 它会去 `/a2a/assets/purchased`（被 Promoted 给你 + 自购）和 `/a2a/assets/published-by-me`（你自己发布的，含 draft）拉回完整 payload，直接回写 `genes.json` / `capsules.json`，并顺便打成 `.gepx` 整包备份。已购买过的 payload 这次重新拉取不收费。
-纯本地、从未上传过的资产 Hub 没有副本，只能从 git 历史恢复（例如 `git show <老tag>:assets/gep/genes.json > restored.json`）或从磁盘快照找回。
+纯本地、从未上传过的资产 Hub 没有副本，只能从 `.evolver/gep/`、旧版 `assets/gep/` checkout 或磁盘快照找回。
 ## 配置与解耦

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@evomap/evolver",
-  "version": "1.87.2",
+  "version": "1.87.3",
   "description": "A GEP-powered self-evolution engine for AI agents. Features automated log analysis and Genome Evolution Protocol (GEP) for auditable, reusable evolution assets.",
   "main": "index.js",
   "bin": {

package/scripts/build_binaries.js CHANGED Viewed

@@ -192,7 +192,14 @@ step('Stage 1 — bun bundle (resolve require tree to one file)');
 ensureDir(STAGE_DIR);
 const BUNDLED_JS = path.join(STAGE_DIR, 'bundled.js');
-run('bun', ['build', ENTRY, '--target=node', `--outfile=${BUNDLED_JS}`]);
+// `--external '@napi-rs/keyring'`: keyring is an optional dep loaded via
+// dynamic require() in workspace-id; bun otherwise tries to bundle the
+// platform-specific `.node` file as a second output asset, which makes
+// `bun build … --outfile=…` fail with "cannot write multiple output files
+// without an output directory". Treating it as external preserves the
+// existing optional-fallback behaviour (require throws → FS path used) in
+// the standalone binaries.
+run('bun', ['build', ENTRY, '--target=node', `--outfile=${BUNDLED_JS}`, '--external', '@napi-rs/keyring']);
 const bundleSize = OPTS.dryRun ? 0 : fs.statSync(BUNDLED_JS).size;
 console.log(`  bundled.js: ${(bundleSize / 1024 / 1024).toFixed(2)} MB`);
@@ -266,13 +273,30 @@ if (!OPTS.skipObfuscate) {
       const obfSecs = ((Date.now() - t0) / 1000).toFixed(1);
       const check = spawnSync('node', ['--check', OBF_JS], { encoding: 'utf8' });
-      if (check.status === 0) {
-        console.log(`  obfuscation: ${obfSecs}s, output ${(obfSize / 1024 / 1024).toFixed(2)} MB (attempt ${attempt}/${MAX_OBF_ATTEMPTS}, seed=0x${usedSeed.toString(16)})`);
-        succeeded = true;
-        break;
+      if (check.status !== 0) {
+        lastValidationErr = (check.stderr || check.stdout || '').split('\n').slice(0, 3).join(' | ');
+        console.warn(`  attempt ${attempt}/${MAX_OBF_ATTEMPTS}: obfuscator output failed node --check (${lastValidationErr.slice(0, 200)}); retrying with perturbed seed...`);
+        continue;
       }
-      lastValidationErr = (check.stderr || check.stdout || '').split('\n').slice(0, 3).join(' | ');
-      console.warn(`  attempt ${attempt}/${MAX_OBF_ATTEMPTS}: obfuscator output failed node --check (${lastValidationErr.slice(0, 200)}); retrying with perturbed seed...`);
+      // Second gate: bun's compile-time parser is stricter than node's.
+      // 1.87.x (post `@napi-rs/keyring` dep) revealed that ~5% of obfuscator
+      // outputs that pass `node --check` still trip bun with errors like
+      // `Expected "in" but found ","`. Probe with a cheap bundle-only call
+      // (no --compile, native target) to fail fast and feed back into the
+      // seed-perturbation loop instead of dying in stage 3.
+      const bunProbe = spawnSync('bun', [
+        'build', OBF_JS,
+        '--target=bun',
+        `--outfile=${path.join(STAGE_DIR, 'bundled.obf.bunprobe.js')}`,
+      ], { encoding: 'utf8' });
+      if (bunProbe.status !== 0) {
+        lastValidationErr = (bunProbe.stderr || bunProbe.stdout || '').split('\n').slice(0, 3).join(' | ');
+        console.warn(`  attempt ${attempt}/${MAX_OBF_ATTEMPTS}: obfuscator output rejected by bun parser (${lastValidationErr.slice(0, 200)}); retrying with perturbed seed...`);
+        continue;
+      }
+      console.log(`  obfuscation: ${obfSecs}s, output ${(obfSize / 1024 / 1024).toFixed(2)} MB (attempt ${attempt}/${MAX_OBF_ATTEMPTS}, seed=0x${usedSeed.toString(16)})`);
+      succeeded = true;
+      break;
     }
     if (!succeeded) {
       console.error(`  ERROR: javascript-obfuscator produced syntactically invalid output in ${MAX_OBF_ATTEMPTS} attempts.`);

package/src/atp/atpExecute.js CHANGED Viewed

@@ -27,6 +27,7 @@ const https = require('https');
 const crypto = require('crypto');
 const { computeAssetId } = require('../gep/contentHash');
+const { enforceHubScheme, strictHttpsAgent } = require('../gep/hubFetch');
 const {
   getNodeId,
   getHubUrl,
@@ -114,6 +115,19 @@ function _publishUrl() {
 function _postJson(urlStr, body, timeoutMs) {
   return new Promise(function (resolve) {
+    // Same TLS posture as hubFetch: refuse plain http:// unless
+    // EVOMAP_HUB_ALLOW_INSECURE=1. Before this guard the function
+    // silently fell back to `lib = http` for any non-https URL, so an
+    // operator override `A2A_HUB_URL=http://...` would send /a2a/publish
+    // and /a2a/task/complete in cleartext while hubFetch-routed calls
+    // (e.g. /a2a/verify-solidify) refused the same URL — inconsistent
+    // TLS enforcement across modules.
+    try {
+      enforceHubScheme(urlStr);
+    } catch (e) {
+      resolve({ ok: false, error: 'tls_refused: ' + (e && e.message) });
+      return;
+    }
     let parsed;
     try {
       parsed = new URL(urlStr);
@@ -128,15 +142,28 @@ function _postJson(urlStr, body, timeoutMs) {
       { 'Content-Type': 'application/json', 'Content-Length': Buffer.byteLength(payload) },
       buildHubHeaders() || {},
     );
+    // Pin TLS cert verification for https calls so a globally-disabled
+    // NODE_TLS_REJECT_UNAUTHORIZED=0 cannot weaken the Hub channel
+    // (Cursor Security Reviewer #160 Medium). hubFetch enforces the
+    // same via its undici dispatcher; this is the Node-native-https
+    // equivalent.
+    //
+    // Skipped under EVOMAP_HUB_ALLOW_INSECURE=1 so local-dev / self-
+    // signed mock hubs that legitimately rely on
+    // NODE_TLS_REJECT_UNAUTHORIZED=0 still work.
+    const requestOpts = {
+      hostname: parsed.hostname,
+      port: parsed.port || (isHttps ? 443 : 80),
+      path: parsed.pathname + (parsed.search || ''),
+      method: 'POST',
+      headers: headers,
+      timeout: timeoutMs || PUBLISH_TIMEOUT_MS,
+    };
+    if (isHttps && process.env.EVOMAP_HUB_ALLOW_INSECURE !== '1') {
+      requestOpts.agent = strictHttpsAgent;
+    }
     const req = lib.request(
-      {
-        hostname: parsed.hostname,
-        port: parsed.port || (isHttps ? 443 : 80),
-        path: parsed.pathname + (parsed.search || ''),
-        method: 'POST',
-        headers: headers,
-        timeout: timeoutMs || PUBLISH_TIMEOUT_MS,
-      },
+      requestOpts,
       function (res) {
         const chunks = [];
         res.on('data', function (c) { chunks.push(c); });

package/src/atp/autoBuyer.js CHANGED Viewed

@@ -36,7 +36,13 @@ const DEFAULT_DAILY_CAP = 50;
 const DEFAULT_PER_ORDER_CAP = 10;
 const DEFAULT_ORDER_TIMEOUT_MS = 3000;
 const COLD_START_WINDOW_MS = 5 * 60 * 1000;
+// Successful orders dedup for 24h so the same capability gap is only paid for
+// once per day. Failed orders dedup for 5 minutes only — long enough to
+// absorb tight retry loops (the original goal of "don't hammer the hub")
+// without making the user wait 24h to retry a question after a transient
+// 503/network blip.
 const DEDUP_TTL_MS = 24 * 60 * 60 * 1000;
+const DEDUP_FAILURE_TTL_MS = 5 * 60 * 1000;
 const LEDGER_FILENAME = 'atp-autobuyer-ledger.json';
 const ACK_FILENAME = 'atp-autobuy-ack.json';
@@ -145,13 +151,22 @@ function _rotateIfNewDay(ledger, now) {
 }
 function _pruneDedup(ledger, now) {
-  const cutoff = (typeof now === 'number' ? now : Date.now()) - DEDUP_TTL_MS;
+  const nowMs = typeof now === 'number' ? now : Date.now();
   const out = {};
   const src = ledger.dedup || {};
   const keys = Object.keys(src);
   for (let i = 0; i < keys.length; i++) {
     const k = keys[i];
-    if (typeof src[k] === 'number' && src[k] >= cutoff) out[k] = src[k];
+    const entry = src[k];
+    // Legacy ledgers written by older versions stored plain timestamps; treat
+    // them as successful orders (the original behaviour) so an upgrade does
+    // not suddenly forget recent dedups.
+    if (typeof entry === 'number') {
+      if (entry >= nowMs - DEDUP_TTL_MS) out[k] = entry;
+    } else if (entry && typeof entry.ts === 'number') {
+      const ttl = entry.failed ? DEDUP_FAILURE_TTL_MS : DEDUP_TTL_MS;
+      if (entry.ts >= nowMs - ttl) out[k] = entry;
+    }
   }
   ledger.dedup = out;
   return ledger;
@@ -205,11 +220,36 @@ function _withTimeout(promise, timeoutMs) {
   ]);
 }
-async function considerOrder(opts) {
-  if (!_started) return { ok: false, skipped: true, reason: 'not_started' };
+// Single-flight queue: serialize the read → cap-check → placeOrder → write
+// pipeline so two concurrent considerOrder() calls cannot both pass the cap
+// check on the same ledger snapshot and silently double-spend.
+//
+// Without this, two parallel calls (e.g. user runs Claude Code in two tabs
+// through the same proxy, or two capability gaps fire in the same tick) both
+// read spent=40, both compute remaining=10, both await placeOrder, both
+// increment to spent=50, and write — silently exceeding the daily cap by one
+// full order each. autoBuyer is single-process so an in-memory queue is
+// sufficient; a file lock would only be needed if multiple OS processes
+// shared the same ledger file (not the current deployment model).
+let _orderQueue = Promise.resolve();
+function considerOrder(opts) {
+  if (!_started) return Promise.resolve({ ok: false, skipped: true, reason: 'not_started' });
   if (!opts || !Array.isArray(opts.capabilities) || opts.capabilities.length === 0) {
-    return { ok: false, skipped: true, reason: 'no_capabilities' };
+    return Promise.resolve({ ok: false, skipped: true, reason: 'no_capabilities' });
   }
+  const next = _orderQueue.then(
+    () => _considerOrderSerialized(opts),
+    () => _considerOrderSerialized(opts), // never let a prior rejection break the chain
+  );
+  // Swallow rejection on the queue tail so a single thrown error here does
+  // not poison every subsequent call; the original `next` promise still
+  // surfaces the error to the caller.
+  _orderQueue = next.then(() => {}, () => {});
+  return next;
+}
+async function _considerOrderSerialized(opts) {
   const now = Date.now();
   let ledger = _readLedger();
   ledger = _rotateIfNewDay(ledger, now);
@@ -248,15 +288,17 @@ async function considerOrder(opts) {
   if (result && result.ok) {
     ledger.spent = (ledger.spent || 0) + budget;
-    ledger.dedup[hash] = now;
+    ledger.dedup[hash] = { ts: now, failed: false };
     _writeLedger(ledger);
     console.log('[ATP-AutoBuyer] Order placed: ' + (result.data && result.data.order_id) + ' budget=' + budget + ' remaining_today=' + Math.max(0, dailyCap - ledger.spent));
     return { ok: true, data: result.data, spent: budget };
   }
-  // On failure still record dedup so we don't hammer the hub for the same
-  // capability gap within the TTL window (but do NOT charge the spend).
-  ledger.dedup[hash] = now;
+  // On failure record a SHORT-TTL dedup entry (5 min) so we don't hammer the
+  // hub for the same capability gap inside a tight retry loop, but the user
+  // can retry the same question once the transient error clears — far better
+  // than the previous 24h block for a single 503.
+  ledger.dedup[hash] = { ts: now, failed: true };
   _writeLedger(ledger);
   return { ok: false, error: (result && result.error) || 'unknown_error' };
 }
@@ -267,15 +309,25 @@ async function considerOrder(opts) {
 // via .tmp + rename so a crash mid-write never produces a corrupt ack file.
 function setConsent(enabled) {
   const dir = getMemoryDir();
-  try { if (!fs.existsSync(dir)) fs.mkdirSync(dir, { recursive: true }); } catch (_) {}
   const body = {
     enabled: !!enabled,
     acknowledged_at: new Date().toISOString(),
     version: 1,
   };
   const tmp = _ackPath() + '.tmp';
-  fs.writeFileSync(tmp, JSON.stringify(body, null, 2) + '\n', 'utf8');
-  fs.renameSync(tmp, _ackPath());
+  // Single try/catch over the whole pipeline. Previously the mkdirSync was
+  // wrapped in its own swallowing try/catch, so an EACCES on the parent dir
+  // would surface to the caller as a confusing ENOENT from writeFileSync.
+  // Surface the original error verbatim and best-effort clean up any
+  // partial .tmp file so a retry from a TTY prompt sees a clean slate.
+  try {
+    if (!fs.existsSync(dir)) fs.mkdirSync(dir, { recursive: true });
+    fs.writeFileSync(tmp, JSON.stringify(body, null, 2) + '\n', 'utf8');
+    fs.renameSync(tmp, _ackPath());
+  } catch (err) {
+    try { fs.unlinkSync(tmp); } catch (_) {}
+    throw err;
+  }
   return body;
 }
@@ -288,6 +340,7 @@ function _resetForTests() {
     perOrderCap: DEFAULT_PER_ORDER_CAP,
     timeoutMs: DEFAULT_ORDER_TIMEOUT_MS,
   };
+  _orderQueue = Promise.resolve();
 }
 module.exports = {
@@ -306,22 +359,24 @@ module.exports = {
   readAck: _readAck,
   ACK_FILENAME,
   // Exposed for tests and diagnostics only; callers should not depend on
-  // these internals in production code paths.
+  // these internals in production code paths. Ack-file helpers
+  // (getAckPath / readAck / ACK_FILENAME) are intentionally NOT mirrored
+  // here — production and tests both go through the public surface above,
+  // so a single source of truth survives schema changes (Bugbot PR #141 R6
+  // follow-up: keep "test-only" honest, no production caller may reach in).
   __internals: {
     readLedger: _readLedger,
     writeLedger: _writeLedger,
     questionHash: _questionHash,
     effectiveCap: _effectiveCap,
     resetForTests: _resetForTests,
-    ackPath: _ackPath,
-    readAck: _readAck,
     constants: {
       DEFAULT_DAILY_CAP,
       DEFAULT_PER_ORDER_CAP,
       COLD_START_WINDOW_MS,
       DEDUP_TTL_MS,
+      DEDUP_FAILURE_TTL_MS,
       LEDGER_FILENAME,
-      ACK_FILENAME,
     },
   },
 };

package/src/atp/autoDeliver.js CHANGED Viewed

@@ -155,6 +155,18 @@ function start(opts) {
   _pollInterval = setInterval(function () {
     _tick().catch(function () { /* swallowed in _tick */ });
   }, _pollMs);
+  // .unref() so this background poller does NOT keep the Node event
+  // loop alive on its own. `evolver run` (single-shot) writes its
+  // artifacts and expects to exit — without unref, the setInterval
+  // handle pins the process and the run sits as a residual `node`
+  // process until manually killed (public issue #553). `evolver --loop`
+  // (daemon) keeps the foreground evolve loop alive on its own
+  // schedule, so an unref'd poller still polls — unref only changes
+  // whether THIS handle alone keeps the loop alive, not whether the
+  // handle fires.
+  if (_pollInterval && typeof _pollInterval.unref === 'function') {
+    _pollInterval.unref();
+  }
   // Do not await -- fire the first tick asynchronously so start() returns
   // immediately. This matches the autoBuyer start() semantics.
   _tick().catch(function () { /* swallowed in _tick */ });
@@ -189,6 +201,10 @@ module.exports = {
     writeLedger: _writeLedger,
     buildProofPayload: _buildProofPayload,
     resetForTests: _resetForTests,
+    // Test-only accessor for the active poll Timeout. Used to assert
+    // the timer was `.unref()`ed so it does not pin the Node event
+    // loop (regression guard for public issue #553).
+    getPollIntervalForTest: () => _pollInterval,
     constants: {
       DEFAULT_POLL_MS,
       MIN_POLL_MS,

package/src/atp/cliAutobuyPrompt.js CHANGED Viewed

@@ -22,22 +22,13 @@
 const readline = require("readline");
 const autoBuyer = require("./autoBuyer");
-// All ack file plumbing is owned by autoBuyer: filename constant, path
-// resolution, read (strict validation), and write (atomic tmp+rename).
-// cliAutobuyPrompt delegates through the public API (not __internals) so
-// the two modules cannot diverge on schema or validation — pre-
-// consolidation drift bit us twice (Bugbot PR #141: duplicate writers +
-// lenient-vs-strict reader). Using public exports keeps the "test-only"
-// contract on __internals honest (Bugbot PR #141 R6).
-const ACK_FILE_NAME = autoBuyer.ACK_FILENAME;
-function _getAckPath() {
-  return autoBuyer.getAckPath();
-}
-function _readAck() {
-  return autoBuyer.readAck();
-}
+// All ack file plumbing lives on autoBuyer (filename constant, path
+// resolution, read with strict validation, atomic write via tmp+rename).
+// cliAutobuyPrompt always reaches it through the public surface so the
+// two modules cannot diverge on schema or validation — pre-consolidation
+// drift bit us twice (Bugbot PR #141: duplicate writers + lenient-vs-
+// strict reader). No __internals re-export here either: tests import
+// autoBuyer directly so a future rename trips a single set of asserts.
 /**
  * @returns {"ack_present"|"env_set"|"non_tty"|"eligible"}
@@ -50,7 +41,7 @@ function classify(env, stdin) {
   if (!stdin || !stdin.isTTY) {
     return "non_tty";
   }
-  if (_readAck()) {
+  if (autoBuyer.readAck()) {
     return "ack_present";
   }
   return "eligible";
@@ -160,9 +151,4 @@ async function runPrompt(opts) {
 module.exports = {
   runPrompt,
   classify,
-  __internals: {
-    ACK_FILE_NAME,
-    _readAck,
-    _getAckPath,
-  },
 };

package/src/atp/hubClient.js CHANGED Viewed

@@ -16,6 +16,7 @@
 const http = require('http');
 const { getHubUrl, buildHubHeaders, getNodeId } = require('../gep/a2aProtocol');
+const { hubFetch } = require('../gep/hubFetch');
 const { getProxyUrl, getProxyToken } = require('../proxy/server/settings');
 function _isProxyMode() {
@@ -68,12 +69,33 @@ function _proxyRequest(method, path, body, timeoutMs) {
   });
 }
+// Route through hubFetch() rather than the global `fetch()` for two
+// reasons (both flagged by Cursor reviewers on PR #160):
+//
+//   1. Dispatcher mixing (Bugbot HIGH): `strictUndiciAgent` is an Agent
+//      from the *installed* `undici` package, but `global.fetch` is
+//      backed by Node's *internal* undici. Passing one to the other
+//      throws `UND_ERR_INVALID_ARG: invalid onRequestStart method` at
+//      request time — exactly the failure mode the comment at the top
+//      of hubFetch.js calls out. hubFetch already routes through
+//      `undici.fetch` from the same package as its Agent, so all calls
+//      that go through hubFetch are immune.
+//
+//   2. Case-sensitive scheme check (Security Reviewer MEDIUM): a hand-
+//      rolled `endpoint.startsWith('https:')` would skip the strict
+//      dispatcher for `HTTPS://...`. hubFetch's `_validateHubUrl` uses
+//      `new URL(url).protocol`, which normalises to lowercase, so
+//      routing through it eliminates the bug class.
+//
+// Routing through hubFetch also inherits the URL-scheme enforcement and
+// the EVOMAP_HUB_ALLOW_INSECURE escape hatch automatically; we no
+// longer need the explicit `enforceHubScheme` guard here.
 function _hubPost(pathSuffix, body, timeoutMs) {
   const hubUrl = getHubUrl();
   if (!hubUrl) return Promise.resolve({ ok: false, error: 'no_hub_url' });
   const endpoint = hubUrl.replace(/\/+$/, '') + pathSuffix;
   const timeout = timeoutMs || require('../config').HTTP_TRANSPORT_TIMEOUT_MS;
-  return fetch(endpoint, {
+  return hubFetch(endpoint, {
     method: 'POST',
     headers: buildHubHeaders(),
     body: JSON.stringify(body),
@@ -83,7 +105,17 @@ function _hubPost(pathSuffix, body, timeoutMs) {
       if (!res.ok) return res.text().then(function (t) { return { ok: false, status: res.status, error: t.slice(0, 400) }; });
       return res.json().then(function (data) { return { ok: true, data: data }; });
     })
-    .catch(function (err) { return { ok: false, error: err.message }; });
+    .catch(function (err) {
+      // hubFetch throws synchronously (rejected Promise) when the URL
+      // fails scheme validation in secure mode. Translate to the same
+      // structured envelope the previous in-line guard produced so the
+      // caller contract is unchanged.
+      const msg = (err && err.message) || String(err);
+      if (msg.indexOf('[hubFetch]') !== -1) {
+        return { ok: false, error: 'tls_refused: ' + msg };
+      }
+      return { ok: false, error: msg };
+    });
 }
 function _hubGet(pathSuffix, timeoutMs) {
@@ -91,7 +123,7 @@ function _hubGet(pathSuffix, timeoutMs) {
   if (!hubUrl) return Promise.resolve({ ok: false, error: 'no_hub_url' });
   const endpoint = hubUrl.replace(/\/+$/, '') + pathSuffix;
   const timeout = timeoutMs || require('../config').HTTP_TRANSPORT_TIMEOUT_MS;
-  return fetch(endpoint, {
+  return hubFetch(endpoint, {
     method: 'GET',
     headers: buildHubHeaders(),
     signal: AbortSignal.timeout(timeout),
@@ -100,7 +132,13 @@ function _hubGet(pathSuffix, timeoutMs) {
       if (!res.ok) return res.text().then(function (t) { return { ok: false, status: res.status, error: t.slice(0, 400) }; });
       return res.json().then(function (data) { return { ok: true, data: data }; });
     })
-    .catch(function (err) { return { ok: false, error: err.message }; });
+    .catch(function (err) {
+      const msg = (err && err.message) || String(err);
+      if (msg.indexOf('[hubFetch]') !== -1) {
+        return { ok: false, error: 'tls_refused: ' + msg };
+      }
+      return { ok: false, error: msg };
+    });
 }
 // Dispatcher: choose proxy or direct hub based on env + proxy availability.