npm - free-coding-models - Versions diffs - 0.3.68 → 0.3.70 - Mend

free-coding-models 0.3.68 → 0.3.70

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

package/README.md +13 -13
package/changelog/v0.3.69.md +47 -0
package/changelog/v0.3.70.md +8 -0
package/package.json +2 -2
package/sources.js +92 -66
package/src/app.js +89 -358
package/src/ping-loop.js +105 -0
package/src/render-table.js +79 -3
package/src/tui-filters.js +128 -0
package/src/tui-state.js +265 -0
package/src/updater.js +1 -105
package/web/dist/assets/{index-Cfy_uz7_.js → index-BTwSEyBT.js} +4 -4
package/web/dist/assets/{index-DwztVNMT.css → index-CGN-0_A0.css} +1 -1
package/web/dist/index.html +2 -2
package/web/src/App.jsx +7 -0
package/web/src/components/layout/Sidebar.jsx +1 -0
package/web/src/components/map/MapView.jsx +17 -0
package/web/src/components/map/MapView.module.css +25 -0

package/README.md CHANGED Viewed

@@ -16,7 +16,7 @@
   <img src="https://img.shields.io/npm/v/free-coding-models?color=3d6b00&label=npm&logo=npm" alt="npm version" width="200"><br>
   <img src="https://img.shields.io/node/v/free-coding-models?color=3d6b00&logo=node.js" alt="node version" width="200"><br>
   <img src="https://img.shields.io/npm/l/free-coding-models?color=3d6b00" alt="license" width="200"><br>
-  <img src="https://img.shields.io/badge/models-170+-3d6b00?logo=nvidia" alt="models count" width="200"><br>
+  <img src="https://img.shields.io/badge/models-157+-3d6b00?logo=nvidia" alt="models count" width="200"><br>
   <img src="https://img.shields.io/badge/providers-16-1a56db" alt="providers count" width="200">
 </p>
@@ -59,7 +59,7 @@ free-coding-models
 ## 💡 Why this tool?
-There are **~170 cataloged free or free-limited coding models** across ~15 vetted providers. Which one is fastest right now? Which one is actually stable versus just lucky on the last ping?
+There are **~157 cataloged free or free-limited coding models** across 16 vetted providers. Which one is fastest right now? Which one is actually stable versus just lucky on the last ping?
 This CLI pings them all in parallel, shows live latency, and calculates a **live Stability Score (0-100)**. Average latency alone is misleading if a model randomly spikes to 6 seconds; the stability score measures true reliability by combining **p95 latency** (30%), **jitter/variance** (30%), **spike rate** (20%), and **uptime** (20%).
@@ -73,26 +73,26 @@ It then writes the model you pick directly into your coding tool's config — so
 Create a free account on one provider below to get started:
-**~170 coding models** across ~15 active providers, ranked by practical free-tier usefulness.
+**~157 coding models** across 16 active providers, ranked by practical free-tier usefulness.
 | # | Provider | Models | Tier range | Free tier | Env var |
 |---|----------|--------|-----------|-----------|--------|
-| 1 | [NVIDIA NIM](https://build.nvidia.com) | 42 | S+ → C | ~40 RPM (no credit card) | `NVIDIA_API_KEY` |
+| 1 | [NVIDIA NIM](https://build.nvidia.com) | 26 | S+ → C | ~40 RPM (no credit card) | `NVIDIA_API_KEY` |
 | 2 | [Groq](https://console.groq.com/keys) | 8 | S → B | 30 RPM, 1K‑14.4K req/day (no credit card) | `GROQ_API_KEY` |
-| 3 | [Cerebras](https://cloud.cerebras.ai) | 4 | S+ → B | 30 RPM, 1M tokens/day (no credit card) | `CEREBRAS_API_KEY` |
-| 4 | [Google AI Studio](https://aistudio.google.com/apikey) | 6 | S+ → A | Gemini free quotas vary by model/region | `GOOGLE_API_KEY` |
+| 3 | [Cerebras](https://cloud.cerebras.ai) | 2 | S+ → S | 30 RPM, 1M tokens/day (no credit card) | `CEREBRAS_API_KEY` |
+| 4 | [Google AI Studio](https://aistudio.google.com/apikey) | 7 | S+ → A | Gemini free quotas vary by model/region | `GOOGLE_API_KEY` |
 | 5 | [GitHub Models](https://models.github.ai) | 15 | S+ → C | Quota depends on GitHub/Copilot tier | `GITHUB_TOKEN` |
-| 6 | [Mistral La Plateforme](https://console.mistral.ai/api-keys) | 7 | S+ → A | Experiment plan, free evaluation tier | `MISTRAL_API_KEY` |
-| 7 | [Cloudflare Workers AI](https://dash.cloudflare.com) | 15 | S+ → B | 10K neurons/day, 300 RPM (no credit card) | `CLOUDFLARE_API_TOKEN` + `CLOUDFLARE_ACCOUNT_ID` |
-| 8 | [OpenRouter](https://openrouter.ai/keys) | 31 | S+ → C | 50 req/day free, 1K/day with $10 spend | `OPENROUTER_API_KEY` |
-| 9 | [SambaNova](https://cloud.sambanova.ai/apis) | 6 | S+ → A- | Small developer quota, useful for light usage | `SAMBANOVA_API_KEY` |
+| 6 | [Mistral La Plateforme](https://console.mistral.ai/api-keys) | 5 | S+ → A | Experiment plan, free evaluation tier | `MISTRAL_API_KEY` |
+| 7 | [Cloudflare Workers AI](https://dash.cloudflare.com) | 14 | S+ → B | 10K neurons/day, 300 RPM (no credit card) | `CLOUDFLARE_API_TOKEN` + `CLOUDFLARE_ACCOUNT_ID` |
+| 8 | [OpenRouter](https://openrouter.ai/keys) | 26 | S+ → C | 50 req/day free, 1K/day with $10 spend | `OPENROUTER_API_KEY` |
+| 9 | [SambaNova](https://cloud.sambanova.ai/apis) | 7 | S+ → B+ | Small developer quota, useful for light usage | `SAMBANOVA_API_KEY` |
 | 10 | [OVHcloud AI Endpoints](https://endpoints.ai.cloud.ovh.net) | 10 | S → B | 2 req/min/IP free, 400 RPM with key | `OVH_AI_ENDPOINTS_ACCESS_TOKEN` |
 | 11 | [Codestral](https://console.mistral.ai/api-keys) | 1 | B+ | 30 RPM, 2K req/day | `MISTRAL_API_KEY` |
 | 12 | [ZAI](https://z.ai) | 2 | S | Free Flash models only | `ZAI_API_KEY` |
 | 13 | [Scaleway](https://console.scaleway.com/iam/api-keys) | 10 | S+ → B | 1M free tokens | `SCALEWAY_API_KEY` |
-| 14 | [Alibaba DashScope](https://modelstudio.console.alibabacloud.com) | 9 | S+ → A | 1M free tokens/model, Singapore, 90 days | `DASHSCOPE_API_KEY` |
-| 15 | [Gemini CLI](https://github.com/google-gemini/gemini-cli) | 6 | S+ → A | 1,000 req/day with personal Google account | CLI tool ♊ |
-| 16 | [OpenCode Zen](https://opencode.ai/zen) | 8 | S+ → A | Free with OpenCode account | Zen models ✨ |
+| 14 | [Alibaba DashScope](https://modelstudio.console.alibabacloud.com) | 11 | S+ → A+ | 1M free tokens/model, Singapore, 90 days | `DASHSCOPE_API_KEY` |
+| 15 | [Gemini CLI](https://github.com/google-gemini/gemini-cli) | 7 | S+ → A | 1,000 req/day with personal Google account | CLI tool ♊ |
+| 16 | [OpenCode Zen](https://opencode.ai/zen) | 6 | S+ → A | Free with OpenCode account | Zen models ✨ |
 > 💡 One key is enough. Add more at any time with **`P`** inside the TUI.

package/changelog/v0.3.69.md ADDED Viewed

@@ -0,0 +1,47 @@
+# Changelog v0.3.69 - 2026-05-26
+### Changed
+- **Full provider audit** — Every model across all 16 providers was verified against official APIs and documentation on 2026-05-26. Outdated, deprecated, and phantom models were removed; new models were added; context windows and scores were corrected.
+- **~170 → ~157 models** — Net reduction of ~13 models after removing deprecated/phantom entries and adding new ones. The catalog is now leaner and more accurate.
+### Removed (deprecated / shutdown / phantom)
+- **Cerebras**: `qwen-3-235b-a22b-instruct-2507`, `llama3.1-8b` — deprecated May 27, 2026
+- **SambaNova**: `MiniMax-M2.5` — deprecated May 18, replaced by M2.7
+- **OpenRouter**: `tencent/hy3-preview:free`, `inclusionai/ling-2.6-1t:free`, `google/gemma-3n-e2b-it:free`, `google/gemma-3-27b-it:free`, `google/gemma-3-12b-it:free`, `google/gemma-3n-e4b-it:free`, `google/gemma-3-4b-it:free` — free tiers removed by providers; `google/gemma-4-31b-a4b-it:free` — never existed (data error)
+- **Mistral**: `devstral-medium-latest`, `devstral-small-latest`, `magistral-small-latest` — deprecated, replaced by unified Devstral 2 and Mistral Small 4
+- **Google AI / Gemini CLI**: `gemini-3.1-flash-lite-preview` — endpoint shutdown May 25, 2026
+- **Cloudflare**: `@cf/google/gemma-4-31b-it` — never existed on Cloudflare; `@cf/meta/llama-3.1-8b-instruct` — deprecated May 30 + actual context only 8k
+- **OVHcloud**: `Llama-3.1-8B-Instruct` — delisted from catalog
+- **OpenCode Zen**: `hy3-preview-free`, `ling-2.6-flash-free`, `trinity-mini-free`, `trinity-large-preview-free` — deleted from Zen platform
+### Added (new models)
+- **SambaNova**: `MiniMax-M2.7` (S+, 192k), `gemma-3-12b-it` (B+, 128k)
+- **OpenRouter**: `deepseek/deepseek-v4-flash:free` (S, 1M), `arcee-ai/trinity-large-thinking:free` (A, 262k), `baidu/cobuddy:free` (B+, 131k)
+- **Google AI / Gemini CLI**: `gemini-3.5-flash` (S+, 1M — new GA model), `gemini-3.1-flash-lite` (A+, 1M — graduated from preview)
+- **Qwen (DashScope)**: `qwen3.7-max` (S+, 1M — new flagship), `qwen3.6-plus` (S+, 1M), `qwen3.6-flash` (A+, 1M)
+- **Cloudflare**: `@cf/deepseek-ai/deepseek-r1-distill-qwen-32b` (A-, 80k)
+- **OVHcloud**: `Qwen3.5-397B-A17B` (S, 262k — new on OVHcloud)
+- **OpenCode Zen**: `deepseek-v4-flash-free` (S+, 200k), `qwen3.6-plus-free` (S+, 1M)
+### Fixed
+- **Mistral model IDs** updated from `-latest` aliases to versioned IDs (`mistral-large-2512`, `mistral-medium-3-5`, `mistral-small-2603`, `devstral-2512`, `magistral-medium-2509`)
+- **Codestral** ID updated to `codestral-2508`, context corrected from 256k → 128k
+- **Groq**: 4 models context corrected from 128k → 131k (actual Groq limit)
+- **Cerebras**: 2 models context corrected (gpt-oss-120b 128k→131k, zai-glm-4.7 200k→131k)
+- **SambaNova**: Llama-4-Maverick context corrected from 1M → 128k (SambaNova actual limit)
+- **Scaleway**: 7 models context windows corrected (major fixes: holo2 131k→22k, gemma-3-27b 128k→40k, devstral 256k→200k, qwen3-coder 32k→128k)
+- **OpenRouter**: 7 context corrections, MiniMax M2.5 score updated 74.0% → 80.2%, Laguna models 256k→131k, Owl Alpha 128k→1M
+- **Qwen**: 4 context corrections (qwen3-max 1M→256k, qwen3-coder-plus 256k→1M, qwen3-coder-flash 256k→1M, qwen3-32b 128k→256k), model ID fixed `qwen3-235b-a22b-instruct` → `qwen3-235b-a22b`
+- **Cloudflare**: kimi-k2.6 context corrected 256k → 262k
+- **OVHcloud**: 4 context corrections (Qwen3.5-9B 128k→262k, Mistral-Nemo 128k→118k, Mistral-7B 32k→127k, Mistral-Small 131k→128k)
+- **OpenCode Zen**: nemotron-3-super-free context corrected from 1M → 200k (Zen limits it)
+- **GitHub Models**: ministral-3b context corrected from 32k → 128k
+### Docs
+- Added 14 provider audit reports in `provider_updates/` (one per provider)
+- Updated README.md model counts and provider table

package/changelog/v0.3.70.md ADDED Viewed

@@ -0,0 +1,8 @@
+# Changelog v0.3.70 - 2026-05-27
+### Changed
+- Bumped version to 0.3.70 as part of release process.
+- Updated documentation and internal references for the new version.
+### Fixed
+- (No functional changes in this bump; included for completeness.)

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "free-coding-models",
-  "version": "0.3.68",
-  "description": "Find the fastest coding LLM models in seconds \u2014 ping free models from multiple providers, pick the best one for OpenCode, Cursor, or any AI coding assistant.",
+  "version": "0.3.70",
+  "description": "Find the fastest coding LLM models in seconds — ping free models from multiple providers, pick the best one for OpenCode, Cursor, or any AI coding assistant.",
   "keywords": [
     "nvidia",
     "nim",

package/sources.js CHANGED Viewed

@@ -84,11 +84,11 @@ export const nvidiaNim = [
 // 📖 Groq source - https://console.groq.com
 // 📖 Free API keys available at https://console.groq.com/keys
 export const groq = [
-  ['llama-3.3-70b-versatile',              'Llama 3.3 70B',      'A-', '39.5%', '128k'],
+  ['llama-3.3-70b-versatile',              'Llama 3.3 70B',      'A-', '39.5%', '131k'],
   ['meta-llama/llama-4-scout-17b-16e-instruct', 'Llama 4 Scout',  'A',  '44.0%', '131k'],
-  ['llama-3.1-8b-instant',                 'Llama 3.1 8B',       'B',  '28.8%', '128k'],
-  ['openai/gpt-oss-120b',                  'GPT OSS 120B',       'S',  '60.0%', '128k'],
-  ['openai/gpt-oss-20b',                   'GPT OSS 20B',        'A',  '42.0%', '128k'],
+  ['llama-3.1-8b-instant',                 'Llama 3.1 8B',       'B',  '28.8%', '131k'],
+  ['openai/gpt-oss-120b',                  'GPT OSS 120B',       'S',  '60.0%', '131k'],
+  ['openai/gpt-oss-20b',                   'GPT OSS 20B',        'A',  '42.0%', '131k'],
   ['qwen/qwen3-32b',                       'Qwen3 32B',          'A+', '50.0%', '131k'],
   ['groq/compound',                        'Groq Compound',      'A',  '45.0%', '131k'],
   ['groq/compound-mini',                   'Groq Compound Mini', 'B+', '32.0%', '131k'],
@@ -97,10 +97,10 @@ export const groq = [
 // 📖 Cerebras source - https://cloud.cerebras.ai
 // 📖 Free API keys available at https://cloud.cerebras.ai
 export const cerebras = [
-  ['gpt-oss-120b',                         'GPT OSS 120B',       'S',  '60.0%', '128k'],
-  ['qwen-3-235b-a22b-instruct-2507',       'Qwen3 235B',         'S+', '70.0%', '128k'], // ⚠️ Deprecation: May 27, 2026
-  ['llama3.1-8b',                          'Llama 3.1 8B',       'B',  '28.8%', '128k'],
-  ['zai-glm-4.7',                          'GLM 4.7',            'S+', '73.8%', '200k'],
+  ['gpt-oss-120b',                         'GPT OSS 120B',       'S',  '60.0%', '131k'],
+  ['zai-glm-4.7',                          'GLM 4.7',            'S+', '73.8%', '131k'],
+  // Removed (2026-05-26): qwen-3-235b-a22b-instruct-2507 (deprecated May 27, 2026)
+  // Removed (2026-05-26): llama3.1-8b (deprecated May 27, 2026)
 ]
 // 📖 SambaNova source - https://cloud.sambanova.ai
@@ -108,14 +108,18 @@ export const cerebras = [
 // 📖 Keep this catalog conservative: only models surfaced in current SambaNova docs.
 export const sambanova = [
   // ── S+ tier ──
-  ['MiniMax-M2.5',                         'MiniMax M2.5',       'S+', '74.0%', '160k'],
+  ['MiniMax-M2.7',                         'MiniMax M2.7',       'S+', '56.2%', '192k'],
   // ── S tier ──
   ['DeepSeek-V3.1',                        'DeepSeek V3.1',      'S',  '62.0%', '128k'],
   ['DeepSeek-V3.2',                        'DeepSeek V3.2',      'S+', '70.0%', '32k'],
-  ['Llama-4-Maverick-17B-128E-Instruct',   'Llama 4 Maverick',   'S',  '62.0%', '1M'],
+  ['Llama-4-Maverick-17B-128E-Instruct',   'Llama 4 Maverick',   'S',  '62.0%', '128k'],
   ['gpt-oss-120b',                         'GPT OSS 120B',       'S',  '60.0%', '128k'],
   // ── A- tier ──
   ['Meta-Llama-3.3-70B-Instruct',          'Llama 3.3 70B',      'A-', '39.5%', '128k'],
+  // ── B+ tier ──
+  ['gemma-3-12b-it',                        'Gemma 3 12B IT',     'B+', '46.0%', '128k'],
+  // Removed (2026-05-26): MiniMax-M2.5 (deprecated, replaced by MiniMax-M2.7)
+  // Fix (2026-05-26): Llama-4-Maverick context 1M → 128k (SambaNova actual limit)
 ]
 // 📖 OpenRouter source - https://openrouter.ai
@@ -131,24 +135,24 @@ export const sambanova = [
 export const openrouter = [
   // ── S+ tier — live :free chat/coding models ──
   ['qwen/qwen3-coder:free',                     'Qwen3 Coder 480B',   'S+', '70.6%', '262k'],
-  ['minimax/minimax-m2.5:free',                 'MiniMax M2.5',       'S+', '74.0%', '197k'],
+  ['minimax/minimax-m2.5:free',                 'MiniMax M2.5',       'S+', '80.2%', '197k'],
   ['z-ai/glm-4.5-air:free',                     'GLM 4.5 Air',        'S+', '72.0%', '131k'],
-  ['tencent/hy3-preview:free',                   'Tencent HY3 Preview','S+', '-',     '262k'],
-  ['poolside/laguna-m.1:free',                  'Poolside Laguna M.1', 'S+', '-',     '256k'],
-  ['poolside/laguna-xs.2:free',                 'Poolside Laguna XS.2','S+', '-',     '256k'],
+  ['deepseek/deepseek-v4-flash:free',           'DeepSeek V4 Flash',  'S',  '-',     '1M'],
+  ['poolside/laguna-m.1:free',                  'Poolside Laguna M.1', 'S+', '-',     '131k'],
+  ['poolside/laguna-xs.2:free',                 'Poolside Laguna XS.2','S+', '-',     '131k'],
   // ── S tier — live :free chat/coding models ──
-  ['qwen/qwen3-next-80b-a3b-instruct:free',     'Qwen3 80B Instruct', 'S',  '65.0%', '131k'],
+  ['qwen/qwen3-next-80b-a3b-instruct:free',     'Qwen3 80B Instruct', 'S',  '65.0%', '262k'],
   ['openai/gpt-oss-120b:free',                  'GPT OSS 120B',       'S',  '60.0%', '131k'],
-  ['inclusionai/ling-2.6-1t:free',              'Ling 2.6 1T',        'S',  '-',     '128k'],
+  ['arcee-ai/trinity-large-thinking:free',      'Arcee Trinity Large', 'A',  '-',     '262k'],
   ['nvidia/nemotron-3-super-120b-a12b:free',    'Nemotron 3 Super',   'A+', '56.0%', '262k'],
   // ── A+ tier — live :free chat/coding models ──
-  ['nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free', 'Nemotron 3 Omni', 'A+', '52.0%', '128k'],
+  ['nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free', 'Nemotron 3 Omni', 'A+', '52.0%', '256k'],
   ['nvidia/nemotron-nano-12b-v2-vl:free',       'Nemotron Nano 12B VL','A',  '20.0%', '128k'],
-  ['openrouter/owl-alpha',                      'Owl Alpha',          'A+', '-',     '128k'],
+  ['openrouter/owl-alpha',                      'Owl Alpha',          'A+', '-',     '1M'],
   // ── A tier — live :free chat/coding models ──
   ['nousresearch/hermes-3-llama-3.1-405b:free', 'Hermes 3 405B',      'A',  '44.0%', '131k'],
   ['openai/gpt-oss-20b:free',                   'GPT OSS 20B',        'A',  '42.0%', '131k'],
-  ['nvidia/nemotron-3-nano-30b-a3b:free',       'Nemotron Nano 30B',  'A',  '43.0%', '128k'],
+  ['nvidia/nemotron-nano-30b-a3b:free',         'Nemotron Nano 30B',  'A',  '43.0%', '256k'],
   ['cognitivecomputations/dolphin-mistral-24b-venice-edition:free', 'Dolphin Mistral 24B', 'B+', '30.0%', '33k'],
   ['google/gemma-4-31b-it:free',                'Gemma 4 31B',        'A',  '45.0%', '256k'],
   ['google/gemma-4-26b-a4b-it:free',            'Gemma 4 26B MoE',    'A-', '38.0%', '256k'],
@@ -157,17 +161,20 @@ export const openrouter = [
   ['meta-llama/llama-3.2-3b-instruct:free',     'Llama 3.2 3B',       'B',  '20.0%', '128k'],
   // ── B+ tier ──
   ['nvidia/nemotron-nano-9b-v2:free',           'Nemotron Nano 9B',   'B+', '18.0%', '128k'],
-  ['google/gemma-3n-e2b-it:free',               'Gemma 3n E2B',       'B+', '-',     '8k'],
+  ['baidu/cobuddy:free',                        'Baidu CoBuddy',      'B+', '-',     '131k'],
   // ── B tier ──
-  ['google/gemma-3-27b-it:free',                'Gemma 3 27B',        'B',  '22.0%', '131k'],
-  ['google/gemma-4-31b-a4b-it:free',            'Gemma 4 31B MoE',    'B',  '-',     '256k'],
-  ['openrouter/free',                           'OpenRouter Free',    'B',  '-',     '128k'],
+  ['openrouter/free',                           'OpenRouter Free',    'B',  '-',     '200k'],
   // ── C tier ──
-  ['google/gemma-3-12b-it:free',                'Gemma 3 12B',        'C',  '15.0%', '131k'],
-  ['google/gemma-3n-e4b-it:free',               'Gemma 3n E4B',       'C',  '10.0%', '8k'],
-  ['google/gemma-3-4b-it:free',                 'Gemma 3 4B',         'C',  '10.0%', '33k'],
   ['liquid/lfm-2.5-1.2b-instruct:free',         'LFM 2.5 1.2B',       'C',  '-',     '32k'],
   ['liquid/lfm-2.5-1.2b-thinking:free',         'LFM 2.5 Thinking',   'C',  '-',     '32k'],
+  // Removed (2026-05-26): tencent/hy3-preview:free (free tier removed)
+  // Removed (2026-05-26): inclusionai/ling-2.6-1t:free (free tier removed)
+  // Removed (2026-05-26): google/gemma-3n-e2b-it:free (free tier removed)
+  // Removed (2026-05-26): google/gemma-3-27b-it:free (free tier removed)
+  // Removed (2026-05-26): google/gemma-3-12b-it:free (free tier removed)
+  // Removed (2026-05-26): google/gemma-3n-e4b-it:free (free tier removed)
+  // Removed (2026-05-26): google/gemma-3-4b-it:free (free tier removed)
+  // Removed (2026-05-26): google/gemma-4-31b-a4b-it:free (never existed — data error)
 ]
 // 📖 GitHub Models source - https://models.github.ai
@@ -188,53 +195,57 @@ export const githubModels = [
   ['mistral-ai/codestral-2501',                   'Codestral 2501',      'B+', '34.0%', '256k'],
   ['mistral-ai/mistral-medium-2505',              'Mistral Medium 2505', 'A',  '48.0%', '128k'],
   ['mistral-ai/mistral-small-2503',               'Mistral Small 2503',  'B+', '30.0%', '128k'],
-  ['mistral-ai/ministral-3b',                     'Ministral 3B',        'C',  '-',     '32k'],
+  ['mistral-ai/ministral-3b',                     'Ministral 3B',        'C',  '-',     '128k'],
 ]
 // 📖 Mistral La Plateforme source - https://console.mistral.ai
 // 📖 Experiment plan is free for evaluation/prototyping and exposes general + coding models.
 // 📖 Keep Codestral as a separate provider key for backward compatibility with existing configs.
 export const mistral = [
-  ['mistral-large-latest',                        'Mistral Large',       'S+', '70.0%', '256k'],
-  ['mistral-medium-latest',                       'Mistral Medium',      'S',  '66.0%', '128k'],
-  ['mistral-small-latest',                        'Mistral Small',       'A',  '48.0%', '128k'],
-  ['devstral-medium-latest',                      'Devstral Medium',     'S+', '72.2%', '128k'],
-  ['devstral-small-latest',                       'Devstral Small',      'A+', '55.0%', '128k'],
-  ['magistral-medium-latest',                     'Magistral Medium',    'A+', '52.0%', '128k'],
-  ['magistral-small-latest',                      'Magistral Small',     'A',  '45.0%', '128k'],
+  ['mistral-large-2512',        'Mistral Large 3',     'S+', '70.0%', '256k'],
+  ['mistral-medium-3-5',        'Mistral Medium 3.5',  'S+', '77.6%', '256k'],
+  ['devstral-2512',             'Devstral 2',          'S+', '72.2%', '256k'],
+  ['magistral-medium-2509',     'Magistral Medium 1.2','A+', '52.0%', '128k'],
+  ['mistral-small-2603',        'Mistral Small 4',     'A',  '48.0%', '256k'],
+  // Removed (2026-05-26): devstral-medium-latest (deprecated, replaced by devstral-2512)
+  // Removed (2026-05-26): devstral-small-latest (deprecated, replaced by devstral-2512)
+  // Removed (2026-05-26): magistral-small-latest (deprecated, replaced by mistral-small-2603)
 ]
 // 📖 Mistral Codestral source - https://codestral.mistral.ai
 // 📖 Free coding model — 30 req/min, 2000/day (phone number required for key)
 // 📖 API keys now use the Mistral platform key format; CODESTRAL_API_KEY remains supported as an alias.
 export const codestral = [
-  ['codestral-latest',                         'Codestral',          'B+', '34.0%', '256k'],
+  ['codestral-2508',            'Codestral',           'B+', '34.0%', '128k'],
 ]
 // 📖 Scaleway source - https://console.scaleway.com
 // 📖 1M free tokens — API keys at https://console.scaleway.com/iam/api-keys
 export const scaleway = [
-  ['devstral-2-123b-instruct-2512',            'Devstral 2 123B',     'S+', '72.2%', '256k'],
+  ['devstral-2-123b-instruct-2512',            'Devstral 2 123B',     'S+', '72.2%', '200k'],
   ['qwen3.5-397b-a17b',                        'Qwen3.5 400B VLM',   'S',  '68.0%', '250k'],
   ['mistral/mistral-large-3-675b-instruct-2512','Mistral Large 675B', 'A+', '58.0%', '250k'],
-  ['qwen3-235b-a22b-instruct-2507',            'Qwen3 235B',         'S+', '70.0%', '128k'],
-  ['gpt-oss-120b',                             'GPT OSS 120B',       'S',  '60.0%', '131k'],
-  ['qwen3-coder-30b-a3b-instruct',             'Qwen3 Coder 30B',    'A+', '55.0%', '32k'],
-  ['holo2-30b-a3b',                            'Holo2 30B',          'A+', '52.0%', '131k'],
-  ['llama-3.3-70b-instruct',                   'Llama 3.3 70B',      'A-', '39.5%', '128k'],
+  ['qwen3-235b-a22b-instruct-2507',            'Qwen3 235B',         'S+', '70.0%', '250k'],
+  ['gpt-oss-120b',                             'GPT OSS 120B',       'S',  '60.0%', '128k'],
+  ['qwen3-coder-30b-a3b-instruct',             'Qwen3 Coder 30B',    'A+', '55.0%', '128k'],
+  ['holo2-30b-a3b',                            'Holo2 30B',          'A+', '52.0%', '22k'],
+  ['llama-3.3-70b-instruct',                   'Llama 3.3 70B',      'A-', '39.5%', '100k'],
   ['mistral-small-3.2-24b-instruct-2506',      'Mistral Small 3.2',  'B+', '30.0%', '128k'],
-  ['gemma-3-27b-it',                           'Gemma 3 27B',        'B',  '22.0%', '128k'],
+  ['gemma-3-27b-it',                           'Gemma 3 27B',        'B',  '22.0%', '40k'],
 ]
 // 📖 Google AI Studio source - https://aistudio.google.com
 // 📖 OpenAI-compatible endpoint exposes Gemini models; free quotas vary by model and region.
 export const googleai = [
+  ['gemini-3.5-flash',                          'Gemini 3.5 Flash',             'S+', '-',     '1M'],
   ['gemini-3.1-pro-preview',                    'Gemini 3.1 Pro Preview',       'S+', '78.0%', '1M'],
   ['gemini-3-flash-preview',                    'Gemini 3 Flash Preview',       'S',  '65.0%', '1M'],
-  ['gemini-3.1-flash-lite-preview',             'Gemini 3.1 Flash Lite Preview','A+', '55.0%', '1M'],
+  ['gemini-3.1-flash-lite',                     'Gemini 3.1 Flash Lite',        'A+', '55.0%', '1M'],
+  // ⚠️ DEPRECATED — shutdown Oct 16, 2026
   ['gemini-2.5-pro',                            'Gemini 2.5 Pro',               'S+', '63.2%', '1M'],
   ['gemini-2.5-flash',                          'Gemini 2.5 Flash',             'A+', '50.0%', '1M'],
   ['gemini-2.5-flash-lite',                     'Gemini 2.5 Flash Lite',        'A',  '42.0%', '1M'],
+  // Removed (2026-05-26): gemini-3.1-flash-lite-preview (endpoint shutdown May 25, 2026 → replaced by gemini-3.1-flash-lite)
 ]
 // 📖 ZAI source - https://open.z.ai
@@ -252,17 +263,22 @@ export const zai = [
 // 📖 Qwen3-Coder models: optimized coding models with excellent SWE-bench scores
 export const qwen = [
   // ── S+ tier — SWE-bench Verified ≥70% ──
-  ['qwen3-max',                               'Qwen3 Max',          'S+', '78.8%', '1M'],
-  ['qwen3-235b-a22b-instruct',                'Qwen3 235B',         'S+', '70.0%', '256k'],
+  ['qwen3.7-max',                               'Qwen3.7 Max',       'S+', '80.0%', '1M'],
+  ['qwen3-max',                               'Qwen3 Max',          'S+', '78.8%', '256k'],
+  ['qwen3.6-plus',                             'Qwen3.6 Plus',      'S+', '72.0%', '1M'],
+  ['qwen3-235b-a22b',                          'Qwen3 235B',         'S+', '70.0%', '256k'],
   // ── S tier — SWE-bench Verified 60–70% ──
   ['qwen3.5-plus',                             'Qwen3.5 Plus',      'S',  '68.0%', '1M'],
-  ['qwen3-coder-plus',                        'Qwen3 Coder Plus',  'S',  '69.6%', '256k'],
+  ['qwen3-coder-plus',                        'Qwen3 Coder Plus',  'S',  '69.6%', '1M'],
   ['qwen3-coder-next',                        'Qwen3 Coder Next',  'S',  '65.0%', '256k'],
   // ── A+ tier — SWE-bench Verified 50–60% ──
+  ['qwen3.6-flash',                           'Qwen3.6 Flash',     'A+', '60.0%', '1M'],
   ['qwen3.5-flash',                           'Qwen3.5 Flash',     'A+', '55.0%', '1M'],
-  ['qwen3-coder-flash',                       'Qwen3 Coder Flash', 'A+', '55.0%', '256k'],
-  ['qwen3-32b',                               'Qwen3 32B',          'A+', '50.0%', '128k'],
-  ['qwen2.5-coder-32b-instruct',              'Qwen2.5 Coder 32B',  'A',  '46.0%', '32k'],
+  ['qwen3-coder-flash',                       'Qwen3 Coder Flash', 'A+', '55.0%', '1M'],
+  ['qwen3-32b',                               'Qwen3 32B',          'A+', '50.0%', '256k'],
+  // Removed (2026-05-26): qwen2.5-coder-32b-instruct (legacy, replaced by qwen3-coder-plus/flash)
+  // Fix (2026-05-26): qwen3-max ctx 1M→256k, qwen3-coder-plus ctx 256k→1M, qwen3-coder-flash ctx 256k→1M, qwen3-32b ctx 128k→256k
+  // Fix (2026-05-26): qwen3-235b-a22b-instruct ID → qwen3-235b-a22b
 ]
 // 📖 Cloudflare Workers AI source - https://developers.cloudflare.com/workers-ai
@@ -271,7 +287,7 @@ export const qwen = [
 // 📖 Free plan includes daily neuron quota and provider-level request limits.
 export const cloudflare = [
   // ── S+ tier ──
-  ['@cf/moonshotai/kimi-k2.6',                'Kimi K2.6',         'S+', '76.8%', '256k'],
+  ['@cf/moonshotai/kimi-k2.6',                'Kimi K2.6',         'S+', '76.8%', '262k'],
   // ── S tier ──
   ['@cf/zai-org/glm-4.7-flash',               'GLM-4.7-Flash',     'S',  '59.2%', '131k'],
   ['@cf/openai/gpt-oss-120b',                 'GPT OSS 120B',      'S',  '60.0%', '128k'],
@@ -285,12 +301,14 @@ export const cloudflare = [
   ['@cf/openai/gpt-oss-20b',                  'GPT OSS 20B',       'A',  '42.0%', '128k'],
   // ── A- tier ──
   ['@cf/meta/llama-3.3-70b-instruct-fp8-fast','Llama 3.3 70B',     'A-', '39.5%', '128k'],
-  ['@cf/google/gemma-4-31b-it',               'Gemma 4 31B',       'A',  '45.0%', '256k'],
   ['@cf/google/gemma-4-26b-a4b-it',           'Gemma 4 26B MoE',   'A-', '38.0%', '256k'],
   ['@cf/mistralai/mistral-small-3.1-24b-instruct', 'Mistral Small 3.1', 'B+', '30.0%', '128k'],
+  ['@cf/deepseek-ai/deepseek-r1-distill-qwen-32b', 'DeepSeek R1 Distill 32B', 'A-', '45.0%', '80k'],
   // ── B tier ──
   ['@cf/ibm/granite-4.0-h-micro',             'Granite 4.0 Micro', 'B+', '30.0%', '128k'],
-  ['@cf/meta/llama-3.1-8b-instruct',          'Llama 3.1 8B',      'B',  '28.8%', '128k'],
+  // Removed (2026-05-26): @cf/google/gemma-4-31b-it (never existed on Cloudflare)
+  // Removed (2026-05-26): @cf/meta/llama-3.1-8b-instruct (deprecated May 30 + actual ctx = 8k, not 128k)
+  // Fix (2026-05-26): @cf/moonshotai/kimi-k2.6 ctx 256k → 262k
 ]
 // 📖 OVHcloud AI Endpoints - https://endpoints.ai.cloud.ovh.net
@@ -298,16 +316,18 @@ export const cloudflare = [
 // 📖 Free sandbox: 2 req/min per IP per model (no API key needed), 400 RPM with API key
 // 📖 Env var: OVH_AI_ENDPOINTS_ACCESS_TOKEN
 export const ovhcloud = [
+  ['Qwen3.5-397B-A17B',                         'Qwen3.5 397B MoE',    'S',  '-',     '262k'],
   ['Qwen3-Coder-30B-A3B-Instruct',             'Qwen3 Coder 30B MoE',  'A+', '55.0%', '256k'],
   ['gpt-oss-120b',                              'GPT OSS 120B',         'S',  '60.0%', '131k'],
   ['gpt-oss-20b',                               'GPT OSS 20B',          'A',  '42.0%', '131k'],
   ['Meta-Llama-3_3-70B-Instruct',               'Llama 3.3 70B',        'A-', '39.5%', '131k'],
   ['Qwen3-32B',                                 'Qwen3 32B',            'A+', '50.0%', '32k'],
-  ['Mistral-Small-3.2-24B-Instruct-2506',       'Mistral Small 3.2',    'B+', '34.0%', '131k'],
-  ['Mistral-7B-Instruct-v0.3',                  'Mistral 7B Instruct',  'B',  '25.0%', '32k'],
-  ['Mistral-Nemo-Instruct-2407',                'Mistral Nemo',         'B+', '30.0%', '128k'],
-  ['Qwen3.5-9B',                                'Qwen3.5 9B',           'B+', '30.0%', '128k'],
-  ['Llama-3.1-8B-Instruct',                     'Llama 3.1 8B',         'B',  '28.8%', '131k'],
+  ['Mistral-Small-3.2-24B-Instruct-2506',       'Mistral Small 3.2',    'B+', '34.0%', '128k'],
+  ['Mistral-7B-Instruct-v0.3',                  'Mistral 7B Instruct',  'B',  '25.0%', '127k'],
+  ['Mistral-Nemo-Instruct-2407',                'Mistral Nemo',         'B+', '30.0%', '118k'],
+  ['Qwen3.5-9B',                                'Qwen3.5 9B',           'B+', '30.0%', '262k'],
+  // Removed (2026-05-26): Llama-3.1-8B-Instruct (delisted from OVHcloud catalog)
+  // Fix (2026-05-26): Qwen3.5-9B ctx 128k→262k, Mistral-Small ctx 131k→128k, Mistral-Nemo ctx 128k→118k, Mistral-7B ctx 32k→127k
 ]
 // 📖 Gemini CLI source - https://github.com/google-gemini/gemini-cli
@@ -317,12 +337,15 @@ export const ovhcloud = [
 // 📖 Models track Google AI Studio IDs; no stale google/ prefix.
 // 📖 Supports custom OpenAI-compatible providers via GEMINI_API_BASE_URL
 export const gemini = [
+  ['gemini-3.5-flash',                   'Gemini 3.5 Flash',             'S+', '-',     '1M'],
   ['gemini-3.1-pro-preview',            'Gemini 3.1 Pro Preview',       'S+', '78.0%', '1M'],
   ['gemini-3-flash-preview',            'Gemini 3 Flash Preview',       'S',  '65.0%', '1M'],
-  ['gemini-3.1-flash-lite-preview',     'Gemini 3.1 Flash Lite Preview','A+', '55.0%', '1M'],
+  ['gemini-3.1-flash-lite',             'Gemini 3.1 Flash Lite',        'A+', '55.0%', '1M'],
+  // ⚠️ DEPRECATED — shutdown Oct 16, 2026
   ['gemini-2.5-pro',                    'Gemini 2.5 Pro',               'S+', '63.2%', '1M'],
   ['gemini-2.5-flash',                  'Gemini 2.5 Flash',             'A+', '50.0%', '1M'],
   ['gemini-2.5-flash-lite',             'Gemini 2.5 Flash Lite',        'A',  '42.0%', '1M'],
+  // Removed (2026-05-26): gemini-3.1-flash-lite-preview (endpoint shutdown May 25, 2026)
 ]
 // 📖 OpenCode Zen free models — hosted AI gateway accessed through OpenCode CLI/Desktop
@@ -331,14 +354,17 @@ export const gemini = [
 // 📖 Login: https://opencode.ai/auth — get your Zen API key
 // 📖 Config: set provider to opencode/<model-id> in OpenCode config
 export const opencodeZen = [
-  ['big-pickle',                              'Big Pickle',           'S+', '72.0%', '200k'],
-  ['minimax-m2.5-free',                       'MiniMax M2.5 Free',   'S+', '80.2%', '200k'],
-  ['nemotron-3-super-free',                   'Nemotron 3 Super Free','A+', '52.0%', '1M'],
-  ['gpt-5-nano',                              'GPT 5 Nano',          'S',  '65.0%', '400k'],
-  ['hy3-preview-free',                        'HY3 Preview Free',    'A+', '-',     '128k'],
-  ['ling-2.6-flash-free',                     'Ling 2.6 Flash Free', 'S',  '-',     '128k'],
-  ['trinity-mini-free',                       'Trinity Mini Preview', 'A',  '-',     '128k'],
-  ['trinity-large-preview-free',              'Trinity Large Preview','S',  '-',     '128k'],
+  ['big-pickle',                       'Big Pickle',              'S+', '72.0%', '200k'],
+  ['minimax-m2.5-free',                'MiniMax M2.5 Free',      'S+', '80.2%', '200k'],
+  ['deepseek-v4-flash-free',           'DeepSeek V4 Flash Free',  'S+', '79.0%', '200k'],
+  ['qwen3.6-plus-free',                'Qwen3.6 Plus Free',       'S+', '78.8%', '1M'],
+  ['nemotron-3-super-free',            'Nemotron 3 Super Free',   'A+', '52.0%', '200k'],
+  ['gpt-5-nano',                       'GPT 5 Nano',              'S',  '65.0%', '400k'],
+  // Removed (2026-05-26): hy3-preview-free (deleted from Zen)
+  // Removed (2026-05-26): ling-2.6-flash-free (deleted from Zen)
+  // Removed (2026-05-26): trinity-mini-free (deleted from Zen)
+  // Removed (2026-05-26): trinity-large-preview-free (deleted from Zen)
+  // Fix (2026-05-26): nemotron-3-super-free ctx 1M → 200k (Zen limits it)
 ]
 // 📖 All sources combined - used by the main script