npm - @askalf/dario - Versions diffs - 4.8.49 → 4.8.51 - Mend

@askalf/dario 4.8.49 → 4.8.51

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (4)

package/dist/cc-template.js CHANGED Viewed

@@ -1426,6 +1426,21 @@ export function buildCCRequest(clientBody, billingTag, cacheControl, identity, o
         // wire footprint).
         ccRequest.tools = CC_TOOL_DEFINITIONS;
     }
+    else if (model.toLowerCase().includes('fable')) {
+        // Fable refuses tool-less CC-shaped MULTI-TURN requests (live replay
+        // bisect 2026-06-09): scrubbed system + zero tools + an assistant turn
+        // in history → 200 + stop_reason "refusal" with empty content on every
+        // request, while the byte-identical body WITH CC's tool array answers.
+        // Real CC always sends its tool array, so zero-tools is itself a
+        // fingerprint divergence (see the merge-tools note above) — fable's
+        // refusal layer is just the first model to punish it. Emit the CC base
+        // array pinned with `tool_choice: none` so the model cannot call tools
+        // the client never declared (without the pin it DOES — verified
+        // spurious WebFetch on a weather prompt). Other families keep the
+        // legacy tool-less shape, which they demonstrably accept.
+        ccRequest.tools = CC_TOOL_DEFINITIONS;
+        ccRequest.tool_choice = { type: 'none' };
+    }
     // Metadata
     ccRequest.metadata = {
         user_id: JSON.stringify({

package/dist/proxy.d.ts CHANGED Viewed

@@ -37,6 +37,23 @@ export declare function betaForModel(base: string, model: string | null | undefi
  * very end of the id. Exported for tests.
  */
 export declare function stripContext1mTag(model: string): string;
+/**
+ * Resolve an inbound API path to its upstream target + forwarding mode.
+ * Allowlist semantics — anything unlisted is 403'd (prevents SSRF through
+ * the OAuth-bearing proxy).
+ *
+ * `thin: true` marks endpoints forwarded WITHOUT template injection —
+ * OAuth swap + model-id normalization only. `/v1/messages/count_tokens`
+ * is thin because the endpoint counts the CLIENT's own prompt: bolting on
+ * CC's system/tools/effort would distort the count (and `output_config`
+ * is not a count_tokens request field). `?beta=true` stays a /v1/messages
+ * affordance (billing classification) — not appended for count_tokens.
+ * Exported for tests.
+ */
+export declare function resolveProxyTarget(urlPath: string, isOpenAI: boolean): {
+    target: string;
+    thin: boolean;
+} | null;
 export declare const ORCHESTRATION_TAG_NAMES: string[];
 /**
  * Build the regex list that actually strips orchestration tags.

package/dist/proxy.js CHANGED Viewed

@@ -220,6 +220,29 @@ export function stripContext1mTag(model) {
         return model;
     return model.replace(/\[1m\]$/i, '');
 }
+/**
+ * Resolve an inbound API path to its upstream target + forwarding mode.
+ * Allowlist semantics — anything unlisted is 403'd (prevents SSRF through
+ * the OAuth-bearing proxy).
+ *
+ * `thin: true` marks endpoints forwarded WITHOUT template injection —
+ * OAuth swap + model-id normalization only. `/v1/messages/count_tokens`
+ * is thin because the endpoint counts the CLIENT's own prompt: bolting on
+ * CC's system/tools/effort would distort the count (and `output_config`
+ * is not a count_tokens request field). `?beta=true` stays a /v1/messages
+ * affordance (billing classification) — not appended for count_tokens.
+ * Exported for tests.
+ */
+export function resolveProxyTarget(urlPath, isOpenAI) {
+    if (isOpenAI)
+        return { target: `${ANTHROPIC_API}/v1/messages?beta=true`, thin: false };
+    const allowed = {
+        '/v1/messages': { target: `${ANTHROPIC_API}/v1/messages?beta=true`, thin: false },
+        '/v1/messages/count_tokens': { target: `${ANTHROPIC_API}/v1/messages/count_tokens`, thin: true },
+        '/v1/complete': { target: `${ANTHROPIC_API}/v1/complete`, thin: false },
+    };
+    return allowed[urlPath] ?? null;
+}
 // Orchestration tags injected by agents (Aider, Cursor, OpenCode, etc.)
 // that confuse Claude when passed through. Strip before forwarding.
 export const ORCHESTRATION_TAG_NAMES = [
@@ -940,7 +963,7 @@ export async function startProxy(opts = {}) {
     const JSON_HEADERS = { 'Content-Type': 'application/json', ...SECURITY_HEADERS };
     const MODELS_JSON = JSON.stringify(OPENAI_MODELS_LIST);
     const ERR_UNAUTH = JSON.stringify({ error: 'Unauthorized', message: 'Invalid or missing API key' });
-    const ERR_FORBIDDEN = JSON.stringify({ error: 'Forbidden', message: 'Path not allowed. Supported paths: POST /v1/messages, POST /v1/chat/completions, GET /v1/models' });
+    const ERR_FORBIDDEN = JSON.stringify({ error: 'Forbidden', message: 'Path not allowed. Supported paths: POST /v1/messages, POST /v1/messages/count_tokens, POST /v1/chat/completions, GET /v1/models' });
     const ERR_METHOD = JSON.stringify({ error: 'Method not allowed' });
     function checkAuth(req) {
         return authenticateRequest(req.headers, apiKeyBuf);
@@ -1170,18 +1193,16 @@ export async function startProxy(opts = {}) {
         }
         // Detect OpenAI-format requests
         const isOpenAI = urlPath === '/v1/chat/completions';
-        // Allowlisted API paths — only these are proxied (prevents SSRF)
-        // ?beta=true matches native Claude Code behavior for billing classification
-        const allowedPaths = {
-            '/v1/messages': `${ANTHROPIC_API}/v1/messages?beta=true`,
-            '/v1/complete': `${ANTHROPIC_API}/v1/complete`,
-        };
-        const targetBase = isOpenAI ? `${ANTHROPIC_API}/v1/messages?beta=true` : allowedPaths[urlPath];
-        if (!targetBase) {
+        // Allowlisted API paths — only these are proxied (prevents SSRF).
+        // count_tokens forwards thin (no template injection) — see resolveProxyTarget.
+        const route = resolveProxyTarget(urlPath, isOpenAI);
+        if (!route) {
             res.writeHead(403, JSON_HEADERS);
             res.end(ERR_FORBIDDEN);
             return;
         }
+        const targetBase = route.target;
+        const isCountTokens = route.thin;
         if (req.method !== 'POST') {
             res.writeHead(405, JSON_HEADERS);
             res.end(ERR_METHOD);
@@ -1436,8 +1457,10 @@ export async function startProxy(opts = {}) {
                     const result = isOpenAI ? openaiToAnthropic(parsed, modelOverride) : (modelOverride ? { ...parsed, model: modelOverride } : parsed);
                     const r = result;
                     requestModel = (r.model || '').toLowerCase();
-                    // In passthrough mode, skip all Claude-specific injection — OAuth swap only
-                    if (!passthrough) {
+                    // In passthrough mode, skip all Claude-specific injection — OAuth swap only.
+                    // count_tokens also forwards thin (see resolveProxyTarget) — the endpoint
+                    // counts the CLIENT's own prompt, so template injection would distort it.
+                    if (!passthrough && !isCountTokens) {
                         // ── Template replay: replace the entire request with a CC template ──
                         // Instead of transforming signals one by one, we build a new request
                         // from CC's exact template and inject only the conversation content.
@@ -1563,6 +1586,12 @@ export async function startProxy(opts = {}) {
                         // logic (family buckets, fable beta/effort) sees the user intent.
                         r.model = stripContext1mTag(r.model);
                     }
+                    else if (isCountTokens && typeof r.model === 'string') {
+                        // Thin count_tokens forward still normalizes the model id —
+                        // the literal `[1m]` label 404s upstream here exactly as it
+                        // does on /v1/messages.
+                        r.model = stripContext1mTag(r.model);
+                    }
                     finalBody = Buffer.from(JSON.stringify(r));
                 }
                 catch { /* not JSON, send as-is */ }
@@ -1588,8 +1617,9 @@ export async function startProxy(opts = {}) {
             // Beta headers
             const clientBeta = req.headers['anthropic-beta'];
             let beta;
-            if (passthrough) {
-                // Passthrough: only add oauth beta, forward client betas as-is
+            if (passthrough || isCountTokens) {
+                // Passthrough (and thin count_tokens): only add oauth beta,
+                // forward client betas as-is — no template beta set.
                 beta = 'oauth-2025-04-20';
                 if (clientBeta)
                     beta += ',' + clientBeta;

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@askalf/dario",
-  "version": "4.8.49",
+  "version": "4.8.51",
   "description": "Use your Claude Pro/Max subscription in any tool — Cursor, Cline, Aider, the Agent SDK, your scripts — at subscription pricing, not per-token API bills. One local Anthropic + OpenAI-compatible endpoint.",
   "type": "module",
   "bin": {