@joshuaswarren/openclaw-engram 9.1.16 → 9.1.17

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md CHANGED
@@ -68,13 +68,18 @@ After installation, add Engram to your `openclaw.json`:
   "openclaw-engram": {
     "enabled": true,
     "config": {
-      // Use OpenAI for extraction:
+      // Option 1: Use OpenAI for extraction:
       "openaiApiKey": "${OPENAI_API_KEY}"

-      // OR use a local LLM (no API key needed):
+      // Option 2: Use a local LLM (no API key needed):
       // "localLlmEnabled": true,
       // "localLlmUrl": "http://localhost:1234/v1",
       // "localLlmModel": "qwen2.5-32b-instruct"
+
+      // Option 3: Use the gateway model chain (multi-provider fallback):
+      // "modelSource": "gateway",
+      // "gatewayAgentId": "engram-llm",
+      // "fastGatewayAgentId": "engram-llm-fast"
     }
   }
 }
@@ -82,6 +87,8 @@ After installation, add Engram to your `openclaw.json`:
 }
 ```

+> **Gateway model source:** When `modelSource` is `"gateway"`, Engram routes all LLM calls (extraction, consolidation, reranking) through an OpenClaw agent persona's model chain instead of its own config. Define agent personas in `openclaw.json → agents.list[]` with a `primary` model and `fallbacks[]` array — Engram tries each in order until one succeeds. This lets you build multi-provider fallback chains like Fireworks → local LLM → cloud OpenAI. See the [Gateway Model Source](docs/config-reference.md#gateway-model-source) guide for full setup.
+
 Restart the gateway:

 ```bash
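To make the gateway note concrete, here is a minimal sketch of a persona-based fallback chain. The `agents.list[]`, `primary`, and `fallbacks[]` keys and the chain order (Fireworks → local LLM → cloud OpenAI) come from the note above; the model identifiers and the exact shape of each entry are illustrative assumptions, not values taken from the package.

```json5
{
  "agents": {
    "list": [
      {
        // Persona name matches "gatewayAgentId" in the Engram config.
        "id": "engram-llm",
        // Tried first; the model-id format here is an assumption.
        "primary": "fireworks/llama-v3p1-70b-instruct",
        // Tried in order until one succeeds.
        "fallbacks": ["local/qwen2.5-32b-instruct", "openai/gpt-4o-mini"]
      }
      // A lighter persona (e.g. "engram-llm-fast") for "fastGatewayAgentId"
      // would be defined the same way.
    ]
  },
  "openclaw-engram": {
    "enabled": true,
    "config": {
      "modelSource": "gateway",
      "gatewayAgentId": "engram-llm",
      "fastGatewayAgentId": "engram-llm-fast"
    }
  }
}
```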
@@ -192,9 +199,9 @@ OpenClaw's built-in memory is basic — it works for getting started, but lacks

 Engram uses hybrid search (BM25 + vector + reranking via [QMD](https://github.com/tobilu/qmd)) to find semantically relevant memories. It doesn't just match keywords — it understands what you're working on and surfaces the right context.

-### OpenAI or local LLM — your choice
+### Flexible LLM routing — OpenAI, local, or gateway model chain

-Use OpenAI for extraction and reranking, or run entirely offline with a local LLM via Ollama, LM Studio, or any OpenAI-compatible endpoint. The `local-llm-heavy` preset is optimized for fully local operation. See the [Local LLM Guide](docs/guides/local-llm.md).
+Use OpenAI for extraction and reranking, run entirely offline with a local LLM (Ollama, LM Studio), or route through the **gateway model chain** to use any provider with automatic fallback. The `local-llm-heavy` preset is optimized for fully local operation. See the [Local LLM Guide](docs/guides/local-llm.md) and the [Gateway Model Source](docs/config-reference.md#gateway-model-source) section for multi-provider setups.

 ### Progressive complexity

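For the fully local option, the commented-out keys from the config diff above can be enabled directly. This sketch only recombines values already shown there; the Ollama URL in the comment assumes its default OpenAI-compatible endpoint.

```json5
"openclaw-engram": {
  "enabled": true,
  "config": {
    // Fully offline: no "openaiApiKey" required.
    "localLlmEnabled": true,
    "localLlmUrl": "http://localhost:1234/v1", // LM Studio default; Ollama would be http://localhost:11434/v1
    "localLlmModel": "qwen2.5-32b-instruct"
  }
}
```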
@@ -3,7 +3,7 @@ import {
   EngramAccessService,
   Orchestrator,
   parseConfig
-} from "./chunk-W7435EXA.js";
+} from "./chunk-ZZF2FYBV.js";
 import "./chunk-MQ5EZ6VE.js";
 import "./chunk-IMMYYNXG.js";
 import "./chunk-TS3YC3MY.js";
@@ -21945,6 +21945,19 @@ var Orchestrator = class _Orchestrator {
     const result = await this.fastLlm.chatCompletion(messages, options);
     return result ? { content: result.content } : null;
   }
+  /**
+   * Get a fast-tier LLM client compatible with the rerank interface.
+   * When gateway model source is active, routes through the gateway fast chain.
+   * Otherwise returns the local fast LLM directly.
+   */
+  get fastLlmForRerank() {
+    if (this.fastGatewayLlm && this.config.modelSource === "gateway") {
+      return {
+        chatCompletion: (messages, options) => this.fastChatCompletion(messages, options ?? {})
+      };
+    }
+    return this.fastLlm;
+  }
   async initialize() {
     await this.storage.ensureDirectories();
     await this.storage.loadAliases();
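The getter above gives both branches the same rerank-facing surface: an object with `chatCompletion(messages, options)`. On the gateway path, `fastChatCompletion` normalizes the result to `{ content }` or `null` (visible in the lines just before the getter); the local `fastLlm` client is returned as-is, so callers should only rely on `.content`. A hypothetical caller, with the variable name and prompt invented for illustration:

```javascript
// Hypothetical usage sketch: the caller does not care whether the gateway
// fast chain or the local fast LLM sits behind the client.
const client = orchestrator.fastLlmForRerank;
const result = await client.chatCompletion(
  [{ role: "user", content: "Rate this snippet's relevance to the query: ..." }],
  {} // fields beyond the options object's existence are not specified in this diff
);
if (result) {
  console.log(result.content); // both paths expose .content on a truthy result
}
```

This uniform shape is what lets the two rerank call sites below swap `this.fastLlm` for `this.fastLlmForRerank` with no other changes.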
@@ -25879,7 +25892,7 @@ ${tmtNode.summary}`
       id: r.path,
       snippet: r.snippet || r.path
     })),
-    local: this.fastLlm,
+    local: this.fastLlmForRerank,
     enabled: true,
     timeoutMs: this.config.rerankTimeoutMs,
     maxCandidates: this.config.rerankMaxCandidates,
@@ -29159,7 +29172,7 @@ ${lines.join("\n\n")}`;
       id: r.path,
       snippet: r.snippet || r.path
     })),
-    local: this.fastLlm,
+    local: this.fastLlmForRerank,
     enabled: true,
     timeoutMs: this.config.rerankTimeoutMs,
     maxCandidates: this.config.rerankMaxCandidates,
@@ -31521,4 +31534,4 @@ export {
   EngramAccessInputError,
   EngramAccessService
 };
-//# sourceMappingURL=chunk-W7435EXA.js.map
+//# sourceMappingURL=chunk-ZZF2FYBV.js.map