npm - @agentforge-io/core - Versions diffs - 2.1.0 → 2.1.1 - Mend

@agentforge-io/core 2.1.0 → 2.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/dist/services/agent-runner.service.js +43 -4
package/package.json +1 -1

package/dist/services/agent-runner.service.js CHANGED Viewed

@@ -11,6 +11,38 @@ const model_strategy_1 = require("../types/model-strategy");
 const noopLogger = {
     log: () => { }, warn: () => { }, debug: () => { }, error: () => { },
 };
+/**
+ * Anthropic's newer model families deprecated the `temperature` parameter
+ * entirely — they auto-tune sampling internally and return 400
+ * `invalid_request_error: \`temperature\` is deprecated for this model` if
+ * the caller still sends one. Older families (3.x, the original 4.0
+ * releases) accept it fine.
+ *
+ * Detection by string match on the model id rather than a hard-coded
+ * allowlist: new model ids land between SDK releases, and we don't want
+ * to break temperature on legacy agents the day a new family ships.
+ * Pattern: anything that contains `-4-5`, `-4-6`, `-4-7`, …, `-5-*`,
+ * `-6-*`, etc. counts as "newer." Old 4-0 / 4-1 / 3-x ids are unaffected.
+ *
+ * Heuristic, not exhaustive — if a future family lands with a different
+ * naming convention we'll have to extend this. The cost of being wrong
+ * is a single 400 the operator can fix by clearing the temperature in
+ * the editor; the cost of NOT filtering is the same 400 today.
+ */
+function modelRejectsTemperature(model) {
+    if (!model) // no model id (undefined, null, '') — answer "does not reject temperature"
+        return false;
+    // Normalize: lowercase, then drop every bracketed segment, e.g. the "[1m]" in "claude-opus-4-7[1m]" (long-context variant).
+    // Vendor prefixes like "anthropic/claude-..." are NOT stripped; they are tolerated only because both regexes below are unanchored.
+    const m = model.toLowerCase().replace(/\[[^\]]*\]/g, ''); // assumes `model` is a string — a truthy non-string would throw here
+    // claude-<letters>-4-<one digit 5..9>. A date right after "-4-" (e.g. "-4-20250514") fails the digit class; \b rejects a following digit ("-4-50"); "-4-10" is not matched either.
+    if (/claude-[a-z]+-4-([5-9])\b/.test(m))
+        return true;
+    // claude-<letters>-<5..9>-… (future major bumps). Requires a hyphen after the major digit, so an id that ends right at e.g. "-5" does not match.
+    if (/claude-[a-z]+-([5-9])-/.test(m))
+        return true;
+    return false; // everything else, including ids where a digit directly follows "claude-" (e.g. "claude-3-5-..."), since [a-z]+ needs letters there
+}
 /**
  * Framework-free runner for Claude. Handles the agentic loop (tool calls) for
  * sync runs and exposes streaming as an `AsyncGenerator<StreamChunk>` so any
@@ -74,12 +106,17 @@ class AgentRunnerService {
             if (this.logger && selection.reason !== 'default' && selection.reason !== 'forced') {
                 this.logger.debug(`[modelRouter] agent=${agent.id} ${selection.reason}=${selection.trigger} → ${model}`);
             }
+            // Per-turn temperature gating. The PER-MODEL filter runs INSIDE
+            // the loop because `model` can change between turns (model
+            // strategy can route a long-context turn to a different family
+            // than the short turns above it). Computing once outside would
+            // either over-strip (drop temperature for a legacy follow-up
+            // model) or under-strip (forward it to a new-family upgrade).
+            const includeTemperature = typeof temperature === 'number' && !modelRejectsTemperature(model);
             const response = await this.client.messages.create({
                 model,
                 max_tokens: maxTokens,
-                // Only include temperature when explicitly declared — newer
-                // models 400 on `temperature` when tools are present.
-                ...(typeof temperature === 'number' ? { temperature } : {}),
+                ...(includeTemperature ? { temperature } : {}),
                 system: systemPrompt,
                 messages: currentMessages,
                 tools: tools,
@@ -193,10 +230,12 @@ class AgentRunnerService {
             if (this.logger && selection.reason !== 'default' && selection.reason !== 'forced') {
                 this.logger.debug(`[modelRouter] agent=${agent.id} ${selection.reason}=${selection.trigger} → ${model}`);
             }
+            // Per-turn temperature gating — see `run()` above for rationale.
+            const includeTemperature = typeof temperature === 'number' && !modelRejectsTemperature(model);
             const stream = this.client.messages.stream({
                 model,
                 max_tokens: maxTokens,
-                ...(typeof temperature === 'number' ? { temperature } : {}),
+                ...(includeTemperature ? { temperature } : {}),
                 system: systemPrompt,
                 messages: currentMessages,
                 tools: tools,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@agentforge-io/core",
-  "version": "2.1.0",
+  "version": "2.1.1",
   "description": "Framework-free AI runtime SDK. Owns: agent loop (Anthropic), conversations, tools, streaming, agent-job queue, SdkHooks. Identity, billing, infra (email/uploads/secrets) live in the host's modules — not here.",
   "license": "MIT",
   "main": "dist/index.js",