npm - @aion0/forge - Versions diffs - 0.10.57 → 0.10.64 - Mend

@aion0/forge 0.10.57 → 0.10.64

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10) hide show

package/RELEASE_NOTES.md +3 -3
package/app/chat/page.tsx +134 -2
package/lib/agents/known-models.json +104 -0
package/lib/agents/known-models.ts +7 -67
package/lib/chat/agent-loop.ts +4 -2
package/lib/chat/llm/anthropic.ts +5 -1
package/lib/chat/llm/openai.ts +5 -1
package/lib/chat/llm/types.ts +6 -0
package/package.json +1 -1
package/publish.sh +24 -0

package/RELEASE_NOTES.md CHANGED Viewed

@@ -1,8 +1,8 @@
-# Forge v0.10.57
+# Forge v0.10.64
 Released: 2026-06-10
-## Changes since v0.10.56
+## Changes since v0.10.63
-**Full Changelog**: https://github.com/aiwatching/forge/compare/v0.10.56...v0.10.57
+**Full Changelog**: https://github.com/aiwatching/forge/compare/v0.10.63...v0.10.64

package/app/chat/page.tsx CHANGED Viewed

@@ -43,6 +43,17 @@ interface ChatSession extends Session {
   meta?: { kind?: 'main' | 'temp'; [k: string]: unknown };
 }
+// One configured API profile, as the header's quick-switcher lists them.
+// Mirrors settings.apiProfiles entries (apiKey is masked by /api/settings —
+// we never read it here, just id/name/provider/model to label the option).
+interface ProfileOption {
+  id: string; // key of the entry in settings.apiProfiles; compared against session.provider
+  name: string; // display label; the loader falls back to the id when no name is set
+  provider: string; // provider id; the loader falls back to 'anthropic' when unset
+  model: string; // configured model id, or the placeholder 'default' when none is set
+  enabled: boolean; // derived as `enabled !== false`; the loader drops disabled profiles, so listed options are true
+}
 export default function ChatPage() {
   const [sessions, setSessions] = useState<ChatSession[]>([]);
   // Inline rename state — only one row edits at a time. editingId is the
@@ -63,6 +74,13 @@ export default function ChatPage() {
   const [memory, setMemory] = useState<MemoryStatus | null>(null);
   const [memoryOpen, setMemoryOpen] = useState(false);
   const [error, setError] = useState('');
+  // Configured API profiles + the header quick-switch dropdown's open state.
+  const [profiles, setProfiles] = useState<ProfileOption[]>([]);
+  const [switchOpen, setSwitchOpen] = useState(false);
+  // The model the backend ACTUALLY served on the last turn (from the
+  // provider response, not the model's self-description). Reset on session
+  // switch so it never shows a stale value from a different conversation.
+  const [servedModel, setServedModel] = useState('');
   const eventSrcRef = useRef<EventSource | null>(null);
   const scrollRef = useRef<HTMLDivElement>(null);
@@ -108,9 +126,32 @@ export default function ChatPage() {
   }, []);
   useEffect(() => {
+    setServedModel(''); // stale across sessions — cleared until next turn reports
     if (activeId) loadMessages(activeId);
   }, [activeId, loadMessages]);
+  // ─── Load configured API profiles (for the header quick-switcher) ──
+  // Runs once on mount. Served by next-server's /api/settings (same origin) with apiKeys masked.
+  useEffect(() => {
+    (async () => {
+      try {
+        const r = await fetch('/api/settings');
+        if (!r.ok) return; // non-2xx: leave the profile list empty
+        const s = (await r.json()) as { apiProfiles?: Record<string, { name?: string; enabled?: boolean; provider?: string; model?: string }> };
+        const list: ProfileOption[] = Object.entries(s.apiProfiles || {})
+          .filter(([, p]) => p && p.enabled !== false) // drop empty entries and explicitly disabled profiles
+          .map(([id, p]) => ({
+            id,
+            name: p.name || id,
+            provider: p.provider || 'anthropic',
+            model: p.model || 'default', // NOTE(review): 'default' is a display placeholder, yet switchProfile sends p.model to the backend as the session model — confirm that is intended
+            enabled: p.enabled !== false, // always true here: disabled profiles were filtered out above
+          }));
+        setProfiles(list);
+      } catch { /* non-fatal — header just falls back to plain text */ }
+    })();
+  }, []);
   // ─── SSE subscription ─────────────────────────────────────
   useEffect(() => {
     if (!activeId) return;
@@ -139,6 +180,7 @@ export default function ChatPage() {
         setStreaming(false);
         setStopRequested(false);
         setPartial('');
+        if (data.served_model) setServedModel(String(data.served_model));
         loadMessages(activeId);
         refreshSessions();
       } else if (type === 'watch_status') {
@@ -320,6 +362,32 @@ export default function ChatPage() {
     }
   }
+  // Switch the active session's API profile. session.provider holds the
+  // apiProfile id; session.model the (optional) override. We set both to the
+  // chosen profile's id + its configured model so the next turn uses it —
+  // updateSession merges with ?? semantics, so passing the model explicitly
+  // avoids carrying a stale model from the previous profile.
+  async function switchProfile(p: ProfileOption) {
+    setSwitchOpen(false); // close the dropdown first, whatever happens next
+    if (!activeId) return;
+    if (activeSession?.provider === p.id) return; // already on it — the session's current model override is left untouched
+    try {
+      const r = await fetch(`${PROXY}/sessions/${activeId}`, {
+        method: 'PATCH',
+        headers: { 'content-type': 'application/json' },
+        body: JSON.stringify({ provider: p.id, model: p.model }), // NOTE(review): p.model is the placeholder 'default' for profiles without a configured model — confirm the backend accepts that value
+      });
+      if (!r.ok) {
+        const j = await r.json().catch(() => ({})); // tolerate a non-JSON error body
+        setError(j.error || `switch failed (HTTP ${r.status})`);
+        return;
+      }
+      await refreshSessions(); // presumably reloads the session list so the header shows the new provider/model — verify
+    } catch (e) {
+      setError(e instanceof Error ? e.message : String(e));
+    }
+  }
   async function clearMessages() {
     if (!activeId) return;
     if (!confirm('Clear all messages in this session?')) return;
@@ -497,10 +565,74 @@ export default function ChatPage() {
                 'No session'}
             </div>
             {activeSession && (
-              <div className="text-[11px] text-[var(--text-secondary)]">
-                {activeSession.provider || 'auto'} · {activeSession.model || 'default'}
+              <div className="relative inline-block">
+                <button
+                  type="button"
+                  onClick={() => setSwitchOpen((v) => !v)}
+                  disabled={profiles.length === 0}
+                  title={profiles.length ? 'Switch API profile for this conversation' : 'No API profiles configured'}
+                  className="flex items-center gap-1 text-[11px] text-[var(--text-secondary)] hover:text-[var(--text-primary)] disabled:cursor-default disabled:hover:text-[var(--text-secondary)] transition-colors"
+                >
+                  <span>
+                    {(() => {
+                      const cur = profiles.find((p) => p.id === activeSession.provider);
+                      const label = cur?.name || activeSession.provider || 'auto';
+                      return `${label} · ${activeSession.model || cur?.model || 'default'}`;
+                    })()}
+                  </span>
+                  {profiles.length > 0 && <span className="opacity-50 text-[9px]">▼</span>}
+                </button>
+                {switchOpen && profiles.length > 0 && (
+                  <>
+                    {/* click-away backdrop */}
+                    <div className="fixed inset-0 z-10" onClick={() => setSwitchOpen(false)} />
+                    <div className="absolute left-0 top-full mt-1 z-20 min-w-[200px] max-h-[60vh] overflow-y-auto rounded-md border border-[var(--border)] bg-[var(--bg-secondary)] shadow-lg py-1">
+                      {profiles.map((p) => {
+                        const active = p.id === activeSession.provider;
+                        return (
+                          <button
+                            key={p.id}
+                            type="button"
+                            onClick={() => switchProfile(p)}
+                            className={`w-full text-left px-3 py-1.5 text-[11px] hover:bg-[var(--bg-tertiary)] transition-colors ${
+                              active ? 'text-[var(--accent)]' : 'text-[var(--text-primary)]'
+                            }`}
+                          >
+                            <div className="flex items-center gap-1.5">
+                              {active && <span className="text-[9px]">✓</span>}
+                              <span className="font-medium truncate">{p.name}</span>
+                            </div>
+                            <div className="text-[10px] text-[var(--text-secondary)] truncate pl-0.5">
+                              {p.provider} · {p.model}
+                            </div>
+                          </button>
+                        );
+                      })}
+                    </div>
+                  </>
+                )}
               </div>
             )}
+            {servedModel && (() => {
+              // The honest backend identity, as reported for the last turn. Tint
+              // amber when it differs from the configured model — that means the
+              // proxy (litellm) fell back server-side (e.g. qwen → claude), which
+              // is the usual cause of "why is everything claude".
+              const cur = profiles.find((p) => p.id === activeSession?.provider);
+              const configured = activeSession?.model || cur?.model || '';
+              // 'default' is the placeholder the profile loader substitutes when a
+              // profile has no model configured (and switchProfile copies it into
+              // session.model). It names no concrete model, so there is nothing to
+              // compare against — without this guard every such reply would be
+              // flagged as a server-side fallback.
+              const requested = configured === 'default' ? '' : configured;
+              // servedModel is already known to be non-empty (outer && guard).
+              const mismatch = requested !== '' && servedModel !== requested;
+              return (
+                <div
+                  className="text-[10px] mt-0.5"
+                  style={{ color: mismatch ? '#fbbf24' : 'var(--text-secondary)' }}
+                  title={mismatch
+                    ? `Backend actually served "${servedModel}" — differs from the requested "${requested}". The proxy fell back server-side.`
+                    : `Backend-reported model for the last reply (trustworthy — not the model's self-description)`}
+                >
+                  served: {servedModel}{mismatch ? ` ⚠ (≠ ${requested})` : ''}
+                </div>
+              );
+            })()}
           </div>
           <button
             onClick={clearMessages}

package/lib/agents/known-models.json ADDED Viewed

@@ -0,0 +1,104 @@
+{
+  "$schema": "https://raw.githubusercontent.com/aiwatching/forge-public-info/main/models/registry.schema.json",
+  "version": 1,
+  "updatedAt": "2026-06-10",
+  "note": "Forge consumes this at startup via lib/public-info/fetch.ts (24h cache). 'agents' holds CLI agent types (claude-code, codex, aider); 'providers' holds API providers (anthropic, openai, etc). UI looks up by cliType for CLI profiles and by provider for API profiles.",
+  "agents": {
+    "claude-code": {
+      "displayName": "Claude Code",
+      "default": "claude-sonnet-4-6",
+      "aliases": [
+        { "id": "default", "label": "default (CLI decides)" },
+        { "id": "fable",   "label": "fable (alias → latest fable)" },
+        { "id": "sonnet",  "label": "sonnet (alias → latest sonnet)" },
+        { "id": "opus",    "label": "opus (alias → latest opus)" },
+        { "id": "haiku",   "label": "haiku (alias → latest haiku)" }
+      ],
+      "models": [
+        { "id": "claude-fable-5",           "label": "Fable 5",    "tier": "premium",  "default": false },
+        { "id": "claude-opus-4-8",          "label": "Opus 4.8",   "tier": "premium",  "default": false },
+        { "id": "claude-sonnet-4-6",        "label": "Sonnet 4.6", "tier": "standard", "default": true  },
+        { "id": "claude-haiku-4-5-20251001","label": "Haiku 4.5",  "tier": "fast",     "default": false }
+      ]
+    },
+    "codex": {
+      "displayName": "OpenAI Codex",
+      "default": "o4-mini",
+      "aliases": [
+        { "id": "default", "label": "default (CLI decides)" }
+      ],
+      "models": [
+        { "id": "o4-mini",  "label": "o4-mini",  "tier": "fast",     "default": true  },
+        { "id": "o3-mini",  "label": "o3-mini",  "tier": "fast",     "default": false },
+        { "id": "gpt-4.1",  "label": "GPT-4.1",  "tier": "standard", "default": false }
+      ]
+    },
+    "aider": {
+      "displayName": "Aider",
+      "default": "default",
+      "aliases": [
+        { "id": "default", "label": "default (CLI decides)" }
+      ],
+      "models": []
+    }
+  },
+  "providers": {
+    "anthropic": {
+      "displayName": "Anthropic API",
+      "default": "claude-sonnet-4-6",
+      "aliases": [],
+      "models": [
+        { "id": "claude-fable-5",            "label": "Fable 5",    "tier": "premium",  "default": false },
+        { "id": "claude-opus-4-8",           "label": "Opus 4.8",   "tier": "premium",  "default": false },
+        { "id": "claude-sonnet-4-6",         "label": "Sonnet 4.6", "tier": "standard", "default": true  },
+        { "id": "claude-haiku-4-5-20251001", "label": "Haiku 4.5",  "tier": "fast",     "default": false }
+      ]
+    },
+    "openai": {
+      "displayName": "OpenAI API",
+      "default": "gpt-4.1",
+      "aliases": [],
+      "models": [
+        { "id": "gpt-4.1",  "label": "GPT-4.1",  "tier": "premium",  "default": true  },
+        { "id": "gpt-4o",   "label": "GPT-4o",   "tier": "standard", "default": false },
+        { "id": "o4-mini",  "label": "o4-mini",  "tier": "fast",     "default": false },
+        { "id": "o3-mini",  "label": "o3-mini",  "tier": "fast",     "default": false }
+      ]
+    },
+    "grok": {
+      "displayName": "Grok / xAI",
+      "default": "grok-4",
+      "aliases": [],
+      "models": [
+        { "id": "grok-4",      "label": "Grok 4",      "tier": "premium",  "default": true  },
+        { "id": "grok-3",      "label": "Grok 3",      "tier": "standard", "default": false },
+        { "id": "grok-3-mini", "label": "Grok 3 Mini", "tier": "fast",     "default": false }
+      ]
+    },
+    "google": {
+      "displayName": "Google / Gemini",
+      "default": "gemini-2.5-pro",
+      "aliases": [],
+      "models": [
+        { "id": "gemini-2.5-pro",   "label": "Gemini 2.5 Pro",   "tier": "premium",  "default": true  },
+        { "id": "gemini-2.5-flash", "label": "Gemini 2.5 Flash", "tier": "standard", "default": false },
+        { "id": "gemini-2.0-flash", "label": "Gemini 2.0 Flash", "tier": "fast",     "default": false }
+      ]
+    },
+    "deepseek": {
+      "displayName": "DeepSeek",
+      "default": "deepseek-chat",
+      "aliases": [],
+      "models": [
+        { "id": "deepseek-chat",     "label": "DeepSeek Chat",     "tier": "standard", "default": true  },
+        { "id": "deepseek-reasoner", "label": "DeepSeek Reasoner", "tier": "premium",  "default": false }
+      ]
+    },
+    "litellm": {
+      "displayName": "LiteLLM (OpenAI-compatible proxy)",
+      "default": "",
+      "aliases": [],
+      "models": []
+    }
+  }
+}

package/lib/agents/known-models.ts CHANGED Viewed

@@ -4,74 +4,14 @@
  * when the network is unreachable, the file is malformed, or the
  * user is on first-run before the cache is populated.
  *
- * Keep this list reasonably current — if the registry is permanently
- * unreachable, this is what users see. New models in the wild should
- * land in the public-info repo first (no code change required), and
- * trickle into this fallback whenever the next forge release happens.
+ * This is a build-time SNAPSHOT of forge-public-info/models/registry.json,
+ * refreshed automatically by `publish.sh` at each release — do NOT hand-edit
+ * `known-models.json`. To change models, edit the public-info repo; running
+ * installs pick it up within the 24h cache, fresh/offline installs pick it up
+ * at the next forge release when the snapshot is re-pulled.
  */
 import type { ModelsRegistry } from '../public-info/types';
+import snapshot from './known-models.json';
-export const KNOWN_MODELS_FALLBACK: ModelsRegistry = {
-  version: 1,
-  updatedAt: '2026-06-10',
-  note: 'Bundled fallback — actual current list lives in forge-public-info/models/registry.json',
-  agents: {
-    'claude-code': {
-      displayName: 'Claude Code',
-      default: 'claude-sonnet-4-6',
-      aliases: [
-        { id: 'default', label: 'default (CLI decides)' },
-        { id: 'fable',   label: 'fable (alias)' },
-        { id: 'sonnet',  label: 'sonnet (alias)' },
-        { id: 'opus',    label: 'opus (alias)' },
-        { id: 'haiku',   label: 'haiku (alias)' },
-      ],
-      models: [
-        { id: 'claude-fable-5',            label: 'Fable 5',    tier: 'premium'  },
-        { id: 'claude-opus-4-8',           label: 'Opus 4.8',   tier: 'premium'  },
-        { id: 'claude-sonnet-4-6',         label: 'Sonnet 4.6', tier: 'standard', default: true },
-        { id: 'claude-haiku-4-5-20251001', label: 'Haiku 4.5',  tier: 'fast'     },
-      ],
-    },
-    codex: {
-      displayName: 'OpenAI Codex',
-      default: 'o4-mini',
-      aliases: [{ id: 'default', label: 'default (CLI decides)' }],
-      models: [
-        { id: 'o4-mini', label: 'o4-mini', tier: 'fast',     default: true },
-        { id: 'o3-mini', label: 'o3-mini', tier: 'fast'                    },
-        { id: 'gpt-4.1', label: 'GPT-4.1', tier: 'standard'                },
-      ],
-    },
-    aider: {
-      displayName: 'Aider',
-      default: 'default',
-      aliases: [{ id: 'default', label: 'default (CLI decides)' }],
-      models: [],
-    },
-  },
-  providers: {
-    anthropic: {
-      displayName: 'Anthropic API',
-      default: 'claude-sonnet-4-6',
-      aliases: [],
-      models: [
-        { id: 'claude-opus-4-8',           label: 'Opus 4.8',   tier: 'premium'  },
-        { id: 'claude-sonnet-4-6',         label: 'Sonnet 4.6', tier: 'standard', default: true },
-        { id: 'claude-haiku-4-5-20251001', label: 'Haiku 4.5',  tier: 'fast'     },
-      ],
-    },
-    openai: {
-      displayName: 'OpenAI API',
-      default: 'gpt-4.1',
-      aliases: [],
-      models: [
-        { id: 'gpt-4.1', label: 'GPT-4.1', tier: 'premium', default: true },
-        { id: 'gpt-4o',  label: 'GPT-4o',  tier: 'standard' },
-        { id: 'o4-mini', label: 'o4-mini', tier: 'fast' },
-        { id: 'o3-mini', label: 'o3-mini', tier: 'fast' },
-      ],
-    },
-  },
-};
+export const KNOWN_MODELS_FALLBACK: ModelsRegistry = snapshot as ModelsRegistry; // unchecked assertion: the JSON snapshot's shape is not validated here

package/lib/chat/agent-loop.ts CHANGED Viewed

@@ -773,6 +773,7 @@ export async function runTurn(args: RunTurnArgs): Promise<{ ok: boolean; error?:
   let iter = 0;
   let lastStop = '';
+  let lastServedModelId = '';
   let assistantBlocksAccum: ContentBlock[] = [];
   // beginTurn already ran at function entry (see top of runTurn). The
@@ -933,8 +934,9 @@ export async function runTurn(args: RunTurnArgs): Promise<{ ok: boolean; error?:
       // ── Real usage from the provider (when reported) ──
       if (result.usage) {
         const u = result.usage;
-        console.log(`[chat-tokens] session=${args.sessionId} turn=${iter} REAL in=${u.inputTokens ?? '?'} out=${u.outputTokens ?? '?'} cache_read=${u.cacheReadTokens ?? 0} cache_create=${u.cacheCreationTokens ?? 0} stop=${result.stopReason}`);
+        console.log(`[chat-tokens] session=${args.sessionId} turn=${iter} REAL in=${u.inputTokens ?? '?'} out=${u.outputTokens ?? '?'} cache_read=${u.cacheReadTokens ?? 0} cache_create=${u.cacheCreationTokens ?? 0} stop=${result.stopReason} served=${result.servedModelId ?? '?'}`);
       }
+      if (result.servedModelId) lastServedModelId = result.servedModelId;
       lastStop = result.stopReason;
       assistantBlocksAccum = result.content;
@@ -1008,7 +1010,7 @@ export async function runTurn(args: RunTurnArgs): Promise<{ ok: boolean; error?:
       cb({ type: 'error', data: { error: `iteration limit (${MAX_ITERATIONS}) exceeded` } });
     }
-    cb({ type: 'turn_done', data: { iterations: iter, stop_reason: lastStop } });
+    cb({ type: 'turn_done', data: { iterations: iter, stop_reason: lastStop, served_model: lastServedModelId || undefined, requested_model: provider.model, profile: provider.name } });
     return { ok: true };
   } catch (err) {
     let msg = err instanceof Error ? err.message : String(err);

package/lib/chat/llm/anthropic.ts CHANGED Viewed

@@ -203,6 +203,10 @@ export const anthropicAdapter: LlmAdapter = {
         };
       }
     } catch {}
-    return { stopReason: mapStop(finishReason), content, usage };
+    // The model the backend ACTUALLY served — may differ from req.model
+    // when a litellm/relay proxy falls back (e.g. forti-coder → claude).
+    let servedModelId: string | undefined;
+    try { servedModelId = (await result.response)?.modelId; } catch {}
+    return { stopReason: mapStop(finishReason), content, usage, servedModelId };
   },
 };

package/lib/chat/llm/openai.ts CHANGED Viewed

@@ -123,6 +123,10 @@ export const openaiAdapter: LlmAdapter = {
         };
       }
     } catch {}
-    return { stopReason: mapStop(finishReason), content, usage };
+    // The model the backend ACTUALLY served — may differ from req.model
+    // when a litellm/relay proxy falls back (e.g. forti-coder → claude).
+    let servedModelId: string | undefined;
+    try { servedModelId = (await result.response)?.modelId; } catch {}
+    return { stopReason: mapStop(finishReason), content, usage, servedModelId };
   },
 };

package/lib/chat/llm/types.ts CHANGED Viewed

@@ -35,6 +35,12 @@ export interface LlmTurnResult {
   /** Token usage from the provider, if reported. May be partially-filled
    *  or absent for proxies that don't expose it. */
   usage?: LlmTurnUsage;
+  /** The model id the backend actually served, read from the response
+   *  (`response.modelId`). For litellm/relay proxies this can DIFFER from
+   *  the requested model — the proxy may silently fall back (e.g. qwen →
+   *  claude-sonnet-4-6). This is the only trustworthy identity, since the
+   *  model's own self-description in the text is often wrong. */
+  servedModelId?: string;
 }
 export interface LlmRequest {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@aion0/forge",
-  "version": "0.10.57",
+  "version": "0.10.64",
   "description": "Unified AI workflow platform — multi-model task orchestration, persistent sessions, web terminal, remote access",
   "type": "module",
   "scripts": {

package/publish.sh CHANGED Viewed

@@ -9,6 +9,13 @@
 set -e
+# Preflight: fail BEFORE any version bump / commit / tag / push if gh is installed
+# but not authenticated (the check is skipped when gh is absent). Otherwise the release step
+# 401s after everything else already happened, leaving a tag pushed without a GitHub Release.
+if command -v gh &> /dev/null; then
+  gh auth status &> /dev/null || { echo "✗ gh is not authenticated — run 'gh auth login' first (the GitHub Release step would 401)."; exit 1; }
+fi
 VERSION_ARG=${1:-patch}
 CURRENT=$(node -p "require('./package.json').version")
@@ -32,6 +39,23 @@ fi
 echo "Version: $CURRENT → $NEW_VERSION"
 echo ""
+# Refresh the bundled model-registry snapshot from public-info.
+# This is the offline/first-run fallback for lib/agents/known-models.ts —
+# pulling it here keeps it from drifting against the live registry.
+# The download lands in a temp file and only replaces the snapshot once it
+# parses as JSON AND carries the top-level "agents" / "providers" objects,
+# because known-models.ts casts the file to ModelsRegistry with no runtime check.
+REGISTRY_URL="https://raw.githubusercontent.com/aiwatching/forge-public-info/main/models/registry.json"
+SNAPSHOT_PATH="lib/agents/known-models.json"
+echo "Refreshing model snapshot from $REGISTRY_URL ..."
+TMP_SNAPSHOT=$(mktemp)
+# Validate the registry file given as $1. The path is handed to node as an
+# argument (process.argv[1]) rather than spliced into the JS source, so
+# unusual characters in the temp path cannot break or alter the script.
+validate_snapshot() {
+  node -e '
+    const reg = JSON.parse(require("fs").readFileSync(process.argv[1], "utf8"));
+    const isObj = (v) => v !== null && typeof v === "object" && !Array.isArray(v);
+    if (!isObj(reg) || !isObj(reg.agents) || !isObj(reg.providers)) {
+      console.error("model registry is missing the agents/providers objects");
+      process.exit(1);
+    }
+  ' "$1"
+}
+if curl -fsSL "$REGISTRY_URL" -o "$TMP_SNAPSHOT" && validate_snapshot "$TMP_SNAPSHOT"; then
+  # mktemp creates the file with mode 0600 and mv keeps that mode; restore
+  # normal source-file permissions before it replaces the snapshot.
+  chmod 644 "$TMP_SNAPSHOT"
+  mv "$TMP_SNAPSHOT" "$SNAPSHOT_PATH"
+  echo "✓ Updated $SNAPSHOT_PATH"
+else
+  rm -f "$TMP_SNAPSHOT"
+  echo "✗ Failed to fetch/validate model registry — aborting publish (keeping old snapshot)."
+  exit 1
+fi
+echo ""
 # Update package.json
 sed -i '' "s/\"version\": \"$CURRENT\"/\"version\": \"$NEW_VERSION\"/" package.json