@possumtech/rummy 0.5.0 → 2.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.env.example +21 -5
- package/PLUGINS.md +389 -194
- package/README.md +25 -8
- package/SPEC.md +850 -373
- package/bin/demo.js +166 -0
- package/bin/rummy.js +9 -3
- package/biome/no-fallbacks.grit +50 -0
- package/lang/en.json +2 -2
- package/migrations/001_initial_schema.sql +88 -37
- package/package.json +6 -4
- package/service.js +50 -9
- package/src/agent/AgentLoop.js +460 -330
- package/src/agent/ContextAssembler.js +4 -4
- package/src/agent/Entries.js +655 -0
- package/src/agent/ProjectAgent.js +30 -18
- package/src/agent/TurnExecutor.js +229 -421
- package/src/agent/XmlParser.js +99 -33
- package/src/agent/budget.js +56 -0
- package/src/agent/errors.js +22 -0
- package/src/agent/httpStatus.js +39 -0
- package/src/agent/known_checks.sql +8 -4
- package/src/agent/known_queries.sql +9 -13
- package/src/agent/known_store.sql +275 -125
- package/src/agent/materializeContext.js +102 -0
- package/src/agent/runs.sql +10 -7
- package/src/agent/schemes.sql +14 -3
- package/src/agent/turns.sql +9 -9
- package/src/hooks/HookRegistry.js +6 -5
- package/src/hooks/Hooks.js +44 -3
- package/src/hooks/PluginContext.js +29 -21
- package/src/{server → hooks}/RpcRegistry.js +2 -1
- package/src/hooks/RummyContext.js +135 -35
- package/src/hooks/ToolRegistry.js +21 -16
- package/src/llm/LlmProvider.js +64 -90
- package/src/llm/errors.js +21 -0
- package/src/plugins/ask_user/README.md +1 -1
- package/src/plugins/ask_user/ask_user.js +37 -12
- package/src/plugins/ask_user/ask_userDoc.js +2 -25
- package/src/plugins/ask_user/ask_userDoc.md +10 -0
- package/src/plugins/budget/README.md +27 -25
- package/src/plugins/budget/budget.js +260 -88
- package/src/plugins/cp/README.md +2 -2
- package/src/plugins/cp/cp.js +29 -11
- package/src/plugins/cp/cpDoc.js +2 -15
- package/src/plugins/cp/cpDoc.md +7 -0
- package/src/plugins/engine/README.md +2 -2
- package/src/plugins/engine/engine.sql +4 -4
- package/src/plugins/engine/turn_context.sql +10 -10
- package/src/plugins/env/README.md +20 -5
- package/src/plugins/env/env.js +45 -6
- package/src/plugins/env/envDoc.js +2 -23
- package/src/plugins/env/envDoc.md +13 -0
- package/src/plugins/error/README.md +16 -0
- package/src/plugins/error/error.js +151 -0
- package/src/plugins/file/README.md +6 -6
- package/src/plugins/file/file.js +15 -2
- package/src/plugins/get/README.md +1 -1
- package/src/plugins/get/get.js +103 -48
- package/src/plugins/get/getDoc.js +2 -32
- package/src/plugins/get/getDoc.md +36 -0
- package/src/plugins/hedberg/README.md +1 -2
- package/src/plugins/hedberg/hedberg.js +8 -4
- package/src/plugins/hedberg/matcher.js +16 -17
- package/src/plugins/hedberg/normalize.js +0 -48
- package/src/plugins/helpers.js +42 -2
- package/src/plugins/index.js +146 -123
- package/src/plugins/instructions/README.md +35 -9
- package/src/plugins/instructions/instructions.js +122 -9
- package/src/plugins/instructions/instructions.md +25 -0
- package/src/plugins/instructions/instructions_104.md +7 -0
- package/src/plugins/instructions/instructions_105.md +46 -0
- package/src/plugins/instructions/instructions_106.md +0 -0
- package/src/plugins/instructions/instructions_107.md +0 -0
- package/src/plugins/instructions/instructions_108.md +8 -0
- package/src/plugins/instructions/protocol.js +12 -0
- package/src/plugins/known/README.md +2 -2
- package/src/plugins/known/known.js +67 -36
- package/src/plugins/known/knownDoc.js +2 -17
- package/src/plugins/known/knownDoc.md +8 -0
- package/src/plugins/log/README.md +48 -0
- package/src/plugins/log/log.js +109 -0
- package/src/plugins/mv/README.md +2 -2
- package/src/plugins/mv/mv.js +55 -22
- package/src/plugins/mv/mvDoc.js +2 -18
- package/src/plugins/mv/mvDoc.md +10 -0
- package/src/plugins/ollama/README.md +15 -0
- package/src/{llm/OllamaClient.js → plugins/ollama/ollama.js} +40 -18
- package/src/plugins/openai/README.md +17 -0
- package/src/plugins/openai/openai.js +120 -0
- package/src/plugins/openrouter/README.md +27 -0
- package/src/plugins/openrouter/openrouter.js +121 -0
- package/src/plugins/persona/README.md +20 -0
- package/src/plugins/persona/persona.js +9 -16
- package/src/plugins/policy/README.md +21 -0
- package/src/plugins/policy/policy.js +29 -14
- package/src/plugins/prompt/README.md +1 -1
- package/src/plugins/prompt/prompt.js +58 -16
- package/src/plugins/rm/README.md +1 -1
- package/src/plugins/rm/rm.js +56 -12
- package/src/plugins/rm/rmDoc.js +2 -20
- package/src/plugins/rm/rmDoc.md +13 -0
- package/src/plugins/rpc/README.md +2 -2
- package/src/plugins/rpc/rpc.js +515 -296
- package/src/plugins/set/README.md +1 -1
- package/src/plugins/set/set.js +318 -75
- package/src/plugins/set/setDoc.js +2 -35
- package/src/plugins/set/setDoc.md +22 -0
- package/src/plugins/sh/README.md +28 -5
- package/src/plugins/sh/sh.js +50 -6
- package/src/plugins/sh/shDoc.js +2 -23
- package/src/plugins/sh/shDoc.md +13 -0
- package/src/plugins/skill/README.md +23 -0
- package/src/plugins/skill/skill.js +14 -18
- package/src/plugins/stream/README.md +101 -0
- package/src/plugins/stream/stream.js +290 -0
- package/src/plugins/telemetry/README.md +1 -1
- package/src/plugins/telemetry/telemetry.js +129 -80
- package/src/plugins/think/README.md +1 -1
- package/src/plugins/think/think.js +12 -0
- package/src/plugins/think/thinkDoc.js +2 -15
- package/src/plugins/think/thinkDoc.md +7 -0
- package/src/plugins/unknown/README.md +3 -3
- package/src/plugins/unknown/unknown.js +47 -19
- package/src/plugins/unknown/unknownDoc.js +2 -21
- package/src/plugins/unknown/unknownDoc.md +11 -0
- package/src/plugins/update/README.md +1 -1
- package/src/plugins/update/update.js +67 -5
- package/src/plugins/update/updateDoc.js +2 -30
- package/src/plugins/update/updateDoc.md +8 -0
- package/src/plugins/xai/README.md +23 -0
- package/src/{llm/XaiClient.js → plugins/xai/xai.js} +58 -37
- package/src/server/ClientConnection.js +64 -37
- package/src/server/SocketServer.js +23 -10
- package/src/server/protocol.js +11 -0
- package/src/sql/v_model_context.sql +27 -31
- package/src/sql/v_run_log.sql +9 -14
- package/EXCEPTIONS.md +0 -46
- package/FIDELITY_CONTRACT.md +0 -172
- package/src/agent/KnownStore.js +0 -337
- package/src/agent/ResponseHealer.js +0 -241
- package/src/llm/OpenAiClient.js +0 -100
- package/src/llm/OpenRouterClient.js +0 -100
- package/src/plugins/budget/recovery.js +0 -47
- package/src/plugins/instructions/preamble.md +0 -45
- package/src/plugins/performed/README.md +0 -15
- package/src/plugins/performed/performed.js +0 -45
- package/src/plugins/previous/README.md +0 -16
- package/src/plugins/previous/previous.js +0 -56
- package/src/plugins/progress/README.md +0 -16
- package/src/plugins/progress/progress.js +0 -43
- package/src/plugins/summarize/README.md +0 -19
- package/src/plugins/summarize/summarize.js +0 -32
- package/src/plugins/summarize/summarizeDoc.js +0 -27
package/src/llm/LlmProvider.js
CHANGED
@@ -1,46 +1,30 @@
 import msg from "../agent/messages.js";
-import
-
-
-
-
+import {
+  ContextExceededError,
+  isContextExceededMessage,
+  isTransientMessage,
+} from "./errors.js";
+
+const MAX_TRANSIENT_RETRIES = 3;
+
+/**
+ * Thin dispatcher over the LLM provider registry (`hooks.llm.providers`).
+ * Resolves the model alias via the DB, finds the highest-priority provider
+ * whose `matches()` returns true, and delegates. Wraps the call with
+ * transient-error retry and surfaces context-exceeded as a typed
+ * ContextExceededError.
+ *
+ * Vendor-specific HTTP is owned by per-vendor plugins under
+ * `src/plugins/{openai,ollama,xai,openrouter,...}/`. Adding a new vendor
+ * is a matter of adding a plugin — no changes here.
+ */
 export default class LlmProvider {
   #db;
-  #
-  #ollama;
-  #openAi;
-  #xai;
+  #hooks;
 
-  constructor(db) {
+  constructor(db, hooks) {
     this.#db = db;
-
-
-  #getOpenRouter() {
-    this.#openRouter ??= new OpenRouterClient(process.env.OPENROUTER_API_KEY);
-    return this.#openRouter;
-  }
-
-  #getOllama() {
-    this.#ollama ??= new OllamaClient(process.env.OLLAMA_BASE_URL);
-    return this.#ollama;
-  }
-
-  #getOpenAi() {
-    if (!this.#openAi) {
-      const baseUrl = process.env.OPENAI_BASE_URL;
-      if (!baseUrl) throw new Error(msg("error.openai_base_url_missing"));
-      this.#openAi = new OpenAiClient(baseUrl, process.env.OPENAI_API_KEY);
-    }
-    return this.#openAi;
-  }
-
-  #getXai() {
-    if (!this.#xai) {
-      const baseUrl = process.env.XAI_BASE_URL;
-      if (!baseUrl) throw new Error(msg("error.xai_base_url_missing"));
-      this.#xai = new XaiClient(baseUrl, process.env.XAI_API_KEY);
-    }
-    return this.#xai;
+    this.#hooks = hooks;
   }
 
   async resolve(alias) {
@@ -49,6 +33,10 @@ export default class LlmProvider {
     throw new Error(msg("error.model_alias_unknown", { alias }));
   }
 
+  #selectProvider(modelAlias) {
+    return this.#hooks.llm.providers.find((p) => p.matches(modelAlias));
+  }
+
   async completion(messages, model, options = {}) {
     const resolvedModel = await this.resolve(model);
 
@@ -59,68 +47,54 @@ export default class LlmProvider {
       : undefined);
     const resolvedOptions = { ...options, temperature };
 
-
-
-
-
-
-        resolvedOptions,
-      );
-    }
-
-    if (resolvedModel.startsWith("openai/")) {
-      const localModel = resolvedModel.replace("openai/", "");
-      return this.#getOpenAi().completion(
-        messages,
-        localModel,
-        resolvedOptions,
+    const provider = this.#selectProvider(resolvedModel);
+    if (!provider) {
+      throw new Error(
+        `No LLM provider registered for model "${resolvedModel}". ` +
+          `Check your RUMMY_* env vars or register a provider plugin.`,
       );
     }
 
-
-
-
+    for (let attempt = 0; ; attempt++) {
+      try {
+        return await provider.completion(
+          messages,
+          resolvedModel,
+          resolvedOptions,
+        );
+      } catch (err) {
+        if (isContextExceededMessage(err.message)) {
+          throw new ContextExceededError(err.message, { cause: err });
+        }
+        if (
+          isTransientMessage(err.message) &&
+          attempt < MAX_TRANSIENT_RETRIES
+        ) {
+          const delay = 1000 * 2 ** attempt;
+          await new Promise((r) => setTimeout(r, delay));
+          continue;
+        }
+        throw err;
+      }
     }
-
-    return this.#getOpenRouter().completion(
-      messages,
-      resolvedModel,
-      resolvedOptions,
-    );
   }
 
   async getContextSize(model) {
-
-    if (
-      const row = await this.#db.get_model_by_alias.get({ alias: model });
-      if (row?.context_length) return row.context_length;
-    }
+    const row = await this.#db.get_model_by_alias.get({ alias: model });
+    if (row?.context_length) return row.context_length;
 
-    // Fall back to API query
     const resolvedModel = await this.resolve(model);
-
-    if (
-
-
-
-      size = await this.#getOpenAi().getContextSize(resolvedModel);
-    } else if (resolvedModel.startsWith("x.ai/")) {
-      const localModel = resolvedModel.replace("x.ai/", "");
-      size = await this.#getXai().getContextSize(localModel);
-    } else {
-      size = await this.#getOpenRouter().getContextSize(resolvedModel);
-    }
-
-    // Cache back to DB for next time
-    if (this.#db && size) {
-      await this.#db.update_model_context_length
-        .run({
-          alias: model,
-          context_length: size,
-        })
-        .catch(() => {});
+    const provider = this.#selectProvider(resolvedModel);
+    if (!provider) {
+      throw new Error(
+        `No LLM provider registered for model "${resolvedModel}".`,
+      );
     }
-
+    const size = await provider.getContextSize(resolvedModel);
+    await this.#db.update_model_context_length.run({
+      alias: model,
+      context_length: size,
+    });
     return size;
   }
 }
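The registry lookup the diff introduces (`#selectProvider`) can be sketched in isolation. The two provider objects below are illustrative stubs, not the real ollama/openrouter plugins; only the find-first-match logic comes from the diff:

```javascript
// Stand-in registry mirroring hooks.llm.providers. Array order is
// priority order; the first provider whose matches() passes wins,
// exactly as in the new LlmProvider#selectProvider.
const providers = [
  { name: "ollama", matches: (m) => m.startsWith("ollama/") },
  { name: "openrouter", matches: () => true }, // stub catch-all, lowest priority
];

function selectProvider(modelAlias) {
  return providers.find((p) => p.matches(modelAlias));
}

console.log(selectProvider("ollama/llama3").name); // "ollama"
console.log(selectProvider("x.ai/grok-2").name);   // "openrouter"
```

Because `find` returns `undefined` when nothing matches, the caller's `if (!provider)` guard is what turns a registry miss into the "No LLM provider registered" error.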
package/src/llm/errors.js
ADDED
@@ -0,0 +1,21 @@
+export class ContextExceededError extends Error {
+  constructor(message, { cause } = {}) {
+    super(message);
+    this.name = "ContextExceededError";
+    if (cause) this.cause = cause;
+  }
+}
+
+const CONTEXT_EXCEEDED_PATTERN =
+  /\b(context.*(size|length|limit)|token.*(limit|exceed)|too.*(long|large))\b/i;
+
+export function isContextExceededMessage(message) {
+  return CONTEXT_EXCEEDED_PATTERN.test(String(message));
+}
+
+const TRANSIENT_PATTERN =
+  /\b(503|429|timeout|ECONNREFUSED|ECONNRESET|unavailable)\b/i;
+
+export function isTransientMessage(message) {
+  return TRANSIENT_PATTERN.test(String(message));
+}
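The two message classifiers are pure regex tests, so their behavior is easy to pin down. The regexes below are copied verbatim from the new errors.js; the sample messages are made up for illustration:

```javascript
// Classifier regexes copied verbatim from the new errors.js.
const CONTEXT_EXCEEDED_PATTERN =
  /\b(context.*(size|length|limit)|token.*(limit|exceed)|too.*(long|large))\b/i;
const TRANSIENT_PATTERN =
  /\b(503|429|timeout|ECONNREFUSED|ECONNRESET|unavailable)\b/i;

const isContextExceededMessage = (m) => CONTEXT_EXCEEDED_PATTERN.test(String(m));
const isTransientMessage = (m) => TRANSIENT_PATTERN.test(String(m));

console.log(isContextExceededMessage("prompt exceeds the context length limit")); // true
console.log(isTransientMessage("upstream returned 429, retry later"));            // true
console.log(isTransientMessage("invalid API key"));                               // false
```

In `LlmProvider.completion` the context-exceeded check runs before the transient check, so a message matching both patterns is surfaced as a `ContextExceededError` rather than retried.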
package/src/plugins/ask_user/ask_user.js
CHANGED
@@ -1,5 +1,7 @@
 import docs from "./ask_userDoc.js";
 
+const LOG_ACTION_RE = /^log:\/\/turn_\d+\/(\w+)\//;
+
 export default class AskUser {
   #core;
 
@@ -7,28 +9,50 @@ export default class AskUser {
     this.#core = core;
     core.registerScheme();
     core.on("handler", this.handler.bind(this));
-    core.on("
-    core.on("
+    core.on("visible", this.full.bind(this));
+    core.on("summarized", this.summary.bind(this));
     core.filter("instructions.toolDocs", async (docsMap) => {
       docsMap.ask_user = docs;
       return docsMap;
     });
+    core.on("proposal.accepted", this.#onResolved.bind(this));
+    core.on("proposal.rejected", this.#onResolved.bind(this));
+  }
+
+  async #onResolved(ctx) {
+    const m = LOG_ACTION_RE.exec(ctx.path);
+    if (m?.[1] !== "ask_user") return;
+    if (!ctx.output) return;
+    const turn = (await ctx.db.get_run_by_id.get({ id: ctx.runId })).next_turn;
+    await ctx.entries.set({
+      runId: ctx.runId,
+      turn,
+      path: ctx.path,
+      body: ctx.resolvedBody,
+      attributes: { ...ctx.attrs, answer: ctx.output },
+    });
   }
 
   async handler(entry, rummy) {
     const { entries: store, sequence: turn, runId, loopId } = rummy;
+    // XmlParser resolved question/options from attr-or-body already.
     const { question, options: rawOptions } = entry.attributes;
 
-
-
-
-
-
-
-
-
+    let options = [];
+    if (rawOptions) {
+      const delimiter = rawOptions.includes(";") ? ";" : ",";
+      options = rawOptions
+        .split(delimiter)
+        .map((o) => o.trim())
+        .filter(Boolean);
+    }
 
-    await store.
+    await store.set({
+      runId,
+      turn,
+      path: entry.resultPath,
+      body: entry.body,
+      state: "proposed",
       attributes: { question, options },
       loopId,
     });
@@ -44,6 +68,7 @@ export default class AskUser {
 
   summary(entry) {
     const { question, answer } = entry.attributes;
-
+    if (answer) return `${question} → ${answer}`;
+    return question;
   }
 }
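The new options parse in `handler` sniffs the delimiter, with semicolons winning over commas. Extracted here as a standalone function for illustration (the name `parseOptions` is hypothetical; the body is the logic from the diff):

```javascript
// Delimiter sniffing as added to ask_user.handler: prefer ";" when
// present, otherwise fall back to ",", then trim and drop empties.
function parseOptions(rawOptions) {
  if (!rawOptions) return [];
  const delimiter = rawOptions.includes(";") ? ";" : ",";
  return rawOptions
    .split(delimiter)
    .map((o) => o.trim())
    .filter(Boolean);
}

console.log(parseOptions("Mocha; Jest; Node Native")); // ["Mocha", "Jest", "Node Native"]
console.log(parseOptions("staging,production"));       // ["staging", "production"]
console.log(parseOptions(undefined));                  // []
```

The semicolon preference lets individual options contain commas, matching the `option1; option2; ...` shape the tool doc advertises.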
package/src/plugins/ask_user/ask_userDoc.js
CHANGED
@@ -1,26 +1,3 @@
-
-// Text goes to the model. Rationale stays in source.
-// Changing ANY line requires reading ALL rationales first.
-const LINES = [
-  [
-    '## <ask_user question="[Question?]">[option1; option2; ...]</ask_user> - Ask the user a question',
-  ],
-  [
-    "* YOU SHOULD use for decisions, preferences, or approvals the user must make",
-    "Positive framing. Shows what ask_user IS for.",
-  ],
-  [
-    "* YOU SHOULD use <get></get> to find information before asking the user",
-    "Gentle redirect. Encourages self-sufficiency.",
-  ],
-  [
-    'Example: <ask_user question="Which test framework?">Mocha; Jest; Node Native</ask_user>',
-    "Preference decision. Model truly cannot know this without asking.",
-  ],
-  [
-    'Example: <ask_user question="Deploy to staging or production?">staging; production</ask_user>',
-    "Consequential action. High-stakes choice.",
-  ],
-];
+import { loadDoc } from "../helpers.js";
 
-export default
+export default loadDoc(import.meta.url, "ask_userDoc.md");
package/src/plugins/ask_user/ask_userDoc.md
ADDED
@@ -0,0 +1,10 @@
+## <ask_user question="[Question?]">[option1; option2; ...]</ask_user> - Ask the user a question
+
+* YOU SHOULD ONLY use for decisions, preferences, or approvals the user must make
+<!-- Positive framing. Shows what ask_user IS for. -->
+
+Example: <ask_user question="Which test framework?">Mocha; Jest; Node Native</ask_user>
+<!-- Preference decision. Model truly cannot know this without asking. -->
+
+Example: <ask_user question="Deploy to staging or production?">staging; production</ask_user>
+<!-- Consequential action. High-stakes choice. -->
package/src/plugins/budget/README.md
CHANGED
@@ -1,41 +1,43 @@
-# budget
+# budget {#budget_plugin}
 
 Context ceiling enforcement.
 
 ## Design
 
-Ceiling = `floor(contextSize × 0.9)
-operating room for graceful overflow
-tools run uninterrupted. Enforcement
+Ceiling = `floor(contextSize × RUMMY_BUDGET_CEILING)` (default 0.9). The
+10% headroom is the system's operating room for graceful overflow
+handling. No per-write gating — tools run uninterrupted. Enforcement
+happens at boundaries.
 
 ## Enforcement Points
 
-1. **Pre-LLM enforce** (`budget.enforce`): checks assembled context
-   before the LLM call. If over ceiling → Prompt Demotion
-   the incoming prompt).
+1. **Pre-LLM enforce** (`hooks.budget.enforce`): checks assembled context
+   before the LLM call. If over ceiling on turn 1 → Prompt Demotion
+   (demote the incoming prompt, re-materialize, re-check). Runs in the
+   headroom if that fits. On non-first turns or still-over after
+   Prompt Demotion, emits a 413 error via `hooks.error.log` so the
+   strike system treats the overflow as a turn-level event.
 
-2. **Post-dispatch Turn Demotion
-
-   (
-
-
-
+2. **Post-dispatch Turn Demotion** (`hooks.budget.postDispatch`): after
+   all tools dispatch, re-materialize and check. If over ceiling →
+   demote ALL visible entries from this turn (status < 400, status
+   preserved — demotion only changes visibility). Emits a 413 error
+   with the 50% rule directive as its message; the error entry is
+   what the model sees next turn.
 
-3. **LLM rejection** (`isContextExceeded`): turn-1
-   drift causes LLM to reject. Same
-
-4. **AgentLoop recovery**: pre-LLM 413 that Prompt Demotion can't
-   resolve. Batch-demote all full entries, budget entry, model gets
-   recovery turns. 3 strikes without progress → hard 413 to client.
-   Only path where 413 reaches the client.
+3. **LLM rejection** (`isContextExceeded` in TurnExecutor): turn-1
+   token estimate drift causes LLM to reject. Same 413 error path as
+   pre-LLM overflow.
 
 ## Files
 
-- **budget.js** — Plugin.
-
+- **budget.js** — Plugin. Enforce + postDispatch methods exposed on
+  `core.hooks.budget`.
 
 ## Registration
 
-- **Hook**: `hooks.budget.enforce` — pre-LLM ceiling check
-
-
+- **Hook**: `hooks.budget.enforce` — pre-LLM ceiling check + first-turn
+  Prompt Demotion.
+- **Hook**: `hooks.budget.postDispatch` — post-dispatch re-check + Turn
+  Demotion. Emits 413 errors through the unified error channel; there
+  is no separate `budget://` scheme.