npm - pi-free - Versions diffs - 2.0.13 → 2.0.15 - Mend

pi-free 2.0.13 → 2.0.15

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30) hide show

package/CHANGELOG.md +28 -0
package/README.md +9 -5
package/config.ts +15 -0
package/constants.ts +3 -0
package/index.ts +135 -0
package/lib/built-in-toggle.ts +4 -4
package/lib/probe-cache.ts +86 -0
package/lib/provider-compat.ts +33 -0
package/lib/registry.ts +25 -3
package/lib/telemetry.ts +328 -0
package/lib/util.ts +10 -1
package/package.json +1 -1
package/provider-failover/benchmark-lookup.ts +94 -8
package/provider-failover/benchmarks-chunk-0.ts +599 -890
package/provider-failover/benchmarks-chunk-1.ts +655 -924
package/provider-failover/benchmarks-chunk-2.ts +675 -966
package/provider-failover/benchmarks-chunk-3.ts +676 -967
package/provider-failover/benchmarks-chunk-4.ts +704 -954
package/provider-failover/benchmarks-chunk-5.ts +1301 -0
package/provider-failover/hardcoded-benchmarks.ts +9 -3
package/providers/cline/cline-models.ts +200 -68
package/providers/cline/cline.ts +3 -3
package/providers/dynamic-built-in/index.ts +1 -1
package/providers/kilo/kilo.ts +2 -2
package/providers/model-fetcher.ts +3 -1
package/providers/nvidia/nvidia.ts +54 -16
package/providers/ollama/ollama.ts +103 -46
package/providers/opencode-session.ts +398 -371
package/providers/qwen/qwen.ts +2 -2
package/providers/routeway/routeway.ts +391 -0

package/provider-failover/benchmarks-chunk-3.ts CHANGED Viewed

@@ -1,23 +1,20 @@
 // Auto-generated benchmark data chunk 3
-// Models: gemini-2.5-pro-preview-may-25 .. phi-3-mini-instruct-3.8b (90 entries)
+// Models: llama-3.1-instruct-70b .. magistral-medium-1 (90 entries)
+// Last updated: 2026-06-01
 // DO NOT EDIT MANUALLY — generated by scripts/update-benchmarks.ts
 import type { HardcodedBenchmark } from "./hardcoded-benchmarks.ts";
 export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
-	"gemini-2.5-pro-preview-may-25": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 29.5,
-		normalizedScore: 42,
+	"llama-3.1-instruct-70b": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 10.9,
+		mathIndex: 4,
 		// Academic benchmarks
-		mmluPro: 0.837,
-		gpqa: 0.822,
-		hle: 0.154,
+		mmluPro: 0.676,
+		gpqa: 0.409,
+		hle: 0.046,
 		// Capabilities
 		contextWindow: 8192,
@@ -25,21 +22,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 3.1 Instruct 70B",
 	},
-	"gemini-2.5-flash-preview-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 17.8,
-		normalizedScore: 25,
+	"llama-3.1-instruct-8b": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 4.9,
+		mathIndex: 4.3,
 		// Academic benchmarks
-		mmluPro: 0.783,
-		gpqa: 0.594,
-		hle: 0.05,
+		mmluPro: 0.476,
+		gpqa: 0.259,
+		hle: 0.051,
 		// Capabilities
 		contextWindow: 8192,
@@ -47,21 +41,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 3.1 Instruct 8B",
 	},
-	"gemini-1.5-pro-may-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12,
-		normalizedScore: 17,
+	"llama-3.2-instruct-3b": {
 		// AA specific benchmarks
-		codingIndex: 19.8,
-		mathIndex: undefined,
+		codingIndex: undefined,
+		mathIndex: 3.3,
 		// Academic benchmarks
-		mmluPro: 0.657,
-		gpqa: 0.371,
-		hle: 0.039,
+		mmluPro: 0.347,
+		gpqa: 0.255,
+		hle: 0.052,
 		// Capabilities
 		contextWindow: 8192,
@@ -69,21 +60,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 3.2 Instruct 3B",
 	},
-	"gemini-2.5-flash-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 20.6,
-		normalizedScore: 29,
+	"llama-3-instruct-70b": {
 		// AA specific benchmarks
-		codingIndex: 17.8,
-		mathIndex: 60.3,
+		codingIndex: 6.8,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.809,
-		gpqa: 0.683,
-		hle: 0.051,
+		mmluPro: 0.574,
+		gpqa: 0.379,
+		hle: 0.044,
 		// Capabilities
 		contextWindow: 8192,
@@ -91,21 +79,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 3 Instruct 70B",
 	},
-	"gemini-2.5-flash-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 27,
-		normalizedScore: 39,
+	"llama-3-instruct-8b": {
 		// AA specific benchmarks
-		codingIndex: 22.2,
-		mathIndex: 73.3,
+		codingIndex: 4,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.832,
-		gpqa: 0.79,
-		hle: 0.111,
+		mmluPro: 0.405,
+		gpqa: 0.296,
+		hle: 0.051,
 		// Capabilities
 		contextWindow: 8192,
@@ -113,21 +98,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 3 Instruct 8B",
 	},
-	"gemini-2.5-flash-preview-sep-25-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 25.7,
-		normalizedScore: 37,
+	"llama-3.2-instruct-1b": {
 		// AA specific benchmarks
-		codingIndex: 22.1,
-		mathIndex: 56.7,
+		codingIndex: 0.6,
+		mathIndex: 0,
 		// Academic benchmarks
-		mmluPro: 0.836,
-		gpqa: 0.766,
-		hle: 0.078,
+		mmluPro: 0.2,
+		gpqa: 0.196,
+		hle: 0.053,
 		// Capabilities
 		contextWindow: 8192,
@@ -135,21 +117,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 3.2 Instruct 1B",
 	},
-	"gemma-3n-e4b-instruct-preview-may-25": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 10.1,
-		normalizedScore: 14,
+	"llama-2-chat-70b": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.483,
-		gpqa: 0.278,
-		hle: 0.049,
+		mmluPro: 0.406,
+		gpqa: 0.327,
+		hle: 0.05,
 		// Capabilities
 		contextWindow: 8192,
@@ -157,21 +136,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 2 Chat 70B",
 	},
-	"gemini-1.5-flash-may-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 10.5,
-		normalizedScore: 15,
+	"llama-2-chat-7b": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.574,
-		gpqa: 0.324,
-		hle: 0.042,
+		mmluPro: 0.164,
+		gpqa: 0.227,
+		hle: 0.058,
 		// Capabilities
 		contextWindow: 8192,
@@ -179,21 +155,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 2 Chat 7B",
 	},
-	"gemini-2.5-flash-lite-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 17.6,
-		normalizedScore: 25,
+	"llama-2-chat-13b": {
 		// AA specific benchmarks
-		codingIndex: 9.5,
-		mathIndex: 53.3,
+		codingIndex: undefined,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.759,
-		gpqa: 0.625,
-		hle: 0.064,
+		mmluPro: 0.406,
+		gpqa: 0.321,
+		hle: 0.047,
 		// Capabilities
 		contextWindow: 8192,
@@ -201,21 +174,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Llama 2 Chat 13B",
 	},
-	"gemini-2-flash-lite-feb-25": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 14.7,
-		normalizedScore: 21,
+	"gemini-2.0-pro-experimental-feb-25": {
 		// AA specific benchmarks
-		codingIndex: undefined,
+		codingIndex: 25.5,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.724,
-		gpqa: 0.535,
-		hle: 0.036,
+		mmluPro: 0.805,
+		gpqa: 0.622,
+		hle: 0.068,
 		// Capabilities
 		contextWindow: 8192,
@@ -223,21 +193,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.0 Pro Experimental (Feb '25)",
 	},
-	"gemini-2.5-flash-preview-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 24.3,
-		normalizedScore: 35,
+	"gemini-2.0-flash-experimental": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.8,
-		gpqa: 0.698,
-		hle: 0.116,
+		mmluPro: 0.782,
+		gpqa: 0.636,
+		hle: 0.047,
 		// Capabilities
 		contextWindow: 8192,
@@ -245,21 +212,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.0 Flash (experimental)",
 	},
-	"gemini-2.5-pro-preview-mar-25": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 30.3,
-		normalizedScore: 43,
+	"gemini-1.5-pro-sep-24": {
 		// AA specific benchmarks
-		codingIndex: 46.7,
+		codingIndex: 23.6,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.858,
-		gpqa: 0.836,
-		hle: 0.171,
+		mmluPro: 0.75,
+		gpqa: 0.589,
+		hle: 0.049,
 		// Capabilities
 		contextWindow: 8192,
@@ -267,21 +231,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 1.5 Pro (Sep '24)",
 	},
-	"gemini-1-ultra": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 10.1,
-		normalizedScore: 14,
+	"gemini-2.0-flash-lite-preview": {
 		// AA specific benchmarks
-		codingIndex: 17.6,
+		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
 		mmluPro: undefined,
-		gpqa: undefined,
-		hle: undefined,
+		gpqa: 0.542,
+		hle: 0.044,
 		// Capabilities
 		contextWindow: 8192,
@@ -289,21 +250,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.0 Flash-Lite (Preview)",
 	},
-	"gemini-2.5-flash-preview-sep-25-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 31.1,
-		normalizedScore: 44,
+	"gemini-2.0-flash-feb-25": {
 		// AA specific benchmarks
-		codingIndex: 24.6,
-		mathIndex: 78.3,
+		codingIndex: 13.6,
+		mathIndex: 21.7,
 		// Academic benchmarks
-		mmluPro: 0.842,
-		gpqa: 0.793,
-		hle: 0.127,
+		mmluPro: 0.779,
+		gpqa: 0.623,
+		hle: 0.053,
 		// Capabilities
 		contextWindow: 8192,
@@ -311,21 +269,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.0 Flash (Feb '25)",
 	},
-	"claude-3.5-sonnet-oct-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 15.9,
-		normalizedScore: 23,
+	"gemini-1.5-flash-sep-24": {
 		// AA specific benchmarks
-		codingIndex: 30.2,
+		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.772,
-		gpqa: 0.599,
-		hle: 0.039,
+		mmluPro: 0.68,
+		gpqa: 0.463,
+		hle: 0.035,
 		// Capabilities
 		contextWindow: 8192,
@@ -333,21 +288,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 1.5 Flash (Sep '24)",
 	},
-	"claude-3.5-sonnet-june-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 14.2,
-		normalizedScore: 20,
+	"gemini-1.5-flash-8b": {
 		// AA specific benchmarks
-		codingIndex: 26,
+		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.751,
-		gpqa: 0.56,
-		hle: 0.037,
+		mmluPro: 0.569,
+		gpqa: 0.359,
+		hle: 0.045,
 		// Capabilities
 		contextWindow: 8192,
@@ -355,21 +307,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 1.5 Flash-8B",
 	},
-	"claude-3-opus": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 18,
-		normalizedScore: 26,
+	"gemma-3-1b-instruct": {
 		// AA specific benchmarks
-		codingIndex: 19.5,
-		mathIndex: undefined,
+		codingIndex: 0.2,
+		mathIndex: 3.3,
 		// Academic benchmarks
-		mmluPro: 0.696,
-		gpqa: 0.489,
-		hle: 0.031,
+		mmluPro: 0.135,
+		gpqa: 0.237,
+		hle: 0.052,
 		// Capabilities
 		contextWindow: 8192,
@@ -377,21 +326,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemma 3 1B Instruct",
 	},
-	"claude-3.5-haiku": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 18.7,
-		normalizedScore: 27,
+	"gemini-2.5-flash-lite-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 10.7,
-		mathIndex: undefined,
+		codingIndex: 7.4,
+		mathIndex: 35.3,
 		// Academic benchmarks
-		mmluPro: 0.634,
-		gpqa: 0.408,
-		hle: 0.035,
+		mmluPro: 0.724,
+		gpqa: 0.474,
+		hle: 0.037,
 		// Capabilities
 		contextWindow: 8192,
@@ -399,21 +345,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash-Lite (Non-reasoning)",
 	},
-	"claude-3-sonnet": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 10.3,
-		normalizedScore: 15,
+	"gemini-3-pro-preview-high": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 46.5,
+		mathIndex: 95.7,
 		// Academic benchmarks
-		mmluPro: 0.579,
-		gpqa: 0.4,
-		hle: 0.038,
+		mmluPro: 0.898,
+		gpqa: 0.908,
+		hle: 0.372,
 		// Capabilities
 		contextWindow: 8192,
@@ -421,21 +364,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 3 Pro Preview (high)",
 	},
-	"claude-3-haiku": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12.3,
-		normalizedScore: 18,
+	"gemma-3n-e2b-instruct": {
 		// AA specific benchmarks
-		codingIndex: 6.7,
-		mathIndex: undefined,
+		codingIndex: 2.2,
+		mathIndex: 10.3,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: 0.374,
-		hle: 0.039,
+		mmluPro: 0.378,
+		gpqa: 0.229,
+		hle: 0.04,
 		// Capabilities
 		contextWindow: 8192,
@@ -443,21 +383,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemma 3n E2B Instruct",
 	},
-	"claude-instant": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 7.4,
-		normalizedScore: 11,
+	"gemma-3-12b-instruct": {
 		// AA specific benchmarks
-		codingIndex: 7.8,
-		mathIndex: undefined,
+		codingIndex: 6.3,
+		mathIndex: 18.3,
 		// Academic benchmarks
-		mmluPro: 0.434,
-		gpqa: 0.33,
-		hle: 0.038,
+		mmluPro: 0.595,
+		gpqa: 0.349,
+		hle: 0.048,
 		// Capabilities
 		contextWindow: 8192,
@@ -465,21 +402,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemma 3 12B Instruct",
 	},
-	"claude-3.7-sonnet-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 30.8,
-		normalizedScore: 44,
+	"gemma-3-27b-instruct": {
 		// AA specific benchmarks
-		codingIndex: 26.7,
-		mathIndex: 21,
+		codingIndex: 9.6,
+		mathIndex: 20.7,
 		// Academic benchmarks
-		mmluPro: 0.803,
-		gpqa: 0.656,
-		hle: 0.048,
+		mmluPro: 0.669,
+		gpqa: 0.428,
+		hle: 0.047,
 		// Capabilities
 		contextWindow: 8192,
@@ -487,21 +421,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemma 3 27B Instruct",
 	},
-	"claude-2.1": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9.3,
-		normalizedScore: 13,
+	"gemini-2.5-flash-preview-sep-25-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 14,
-		mathIndex: undefined,
+		codingIndex: 24.6,
+		mathIndex: 78.3,
 		// Academic benchmarks
-		mmluPro: 0.495,
-		gpqa: 0.319,
-		hle: 0.042,
+		mmluPro: 0.842,
+		gpqa: 0.793,
+		hle: 0.127,
 		// Capabilities
 		contextWindow: 8192,
@@ -509,21 +440,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash Preview (Sep '25) (Reasoning)",
 	},
-	"claude-3.7-sonnet-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 34.7,
-		normalizedScore: 50,
+	"gemini-1.5-pro-may-24": {
 		// AA specific benchmarks
-		codingIndex: 27.6,
-		mathIndex: 56.3,
+		codingIndex: 19.8,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.837,
-		gpqa: 0.772,
-		hle: 0.103,
+		mmluPro: 0.657,
+		gpqa: 0.371,
+		hle: 0.039,
 		// Capabilities
 		contextWindow: 8192,
@@ -531,21 +459,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 1.5 Pro (May '24)",
 	},
-	"claude-4.1-opus-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 36,
-		normalizedScore: 51,
+	"gemma-3-4b-instruct": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 2.9,
+		mathIndex: 12.7,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: undefined,
-		hle: undefined,
+		mmluPro: 0.417,
+		gpqa: 0.291,
+		hle: 0.052,
 		// Capabilities
 		contextWindow: 8192,
@@ -553,21 +478,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemma 3 4B Instruct",
 	},
-	"claude-4.1-opus-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 42,
-		normalizedScore: 60,
+	"gemini-2.5-pro-preview-may-25": {
 		// AA specific benchmarks
-		codingIndex: 36.5,
-		mathIndex: 80.3,
+		codingIndex: undefined,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.88,
-		gpqa: 0.809,
-		hle: 0.119,
+		mmluPro: 0.837,
+		gpqa: 0.822,
+		hle: 0.154,
 		// Capabilities
 		contextWindow: 8192,
@@ -575,21 +497,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Pro Preview (May' 25)",
 	},
-	"claude-4-sonnet-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 33,
-		normalizedScore: 47,
+	"gemini-2.0-flash-thinking-experimental-jan-25": {
 		// AA specific benchmarks
-		codingIndex: 30.6,
-		mathIndex: 38,
+		codingIndex: 24.1,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.837,
-		gpqa: 0.683,
-		hle: 0.04,
+		mmluPro: 0.798,
+		gpqa: 0.701,
+		hle: 0.071,
 		// Capabilities
 		contextWindow: 8192,
@@ -597,21 +516,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.0 Flash Thinking Experimental (Jan '25)",
 	},
-	"claude-4-opus-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 33,
-		normalizedScore: 47,
+	"gemma-3n-e4b-instruct-preview-may-25": {
 		// AA specific benchmarks
 		codingIndex: undefined,
-		mathIndex: 36.3,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.86,
-		gpqa: 0.701,
-		hle: 0.059,
+		mmluPro: 0.483,
+		gpqa: 0.278,
+		hle: 0.049,
 		// Capabilities
 		contextWindow: 8192,
@@ -619,21 +535,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemma 3n E4B Instruct Preview (May '25)",
 	},
-	"claude-4-sonnet-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 38.7,
-		normalizedScore: 55,
+	"gemini-1.0-ultra": {
 		// AA specific benchmarks
-		codingIndex: 34.1,
-		mathIndex: 74.3,
+		codingIndex: 17.6,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.842,
-		gpqa: 0.777,
-		hle: 0.096,
+		mmluPro: undefined,
+		gpqa: undefined,
+		hle: undefined,
 		// Capabilities
 		contextWindow: 8192,
@@ -641,43 +554,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 1.0 Ultra",
 	},
-	"claude-opus-4.5-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 43.1,
-		normalizedScore: 62,
+	"gemma-3n-e4b-instruct": {
 		// AA specific benchmarks
-		codingIndex: 42.9,
-		mathIndex: 62.7,
-		// Academic benchmarks
-		mmluPro: 0.889,
-		gpqa: 0.81,
-		hle: 0.129,
-		// Capabilities
-		contextWindow: 8192,
-		supportsReasoning: false,
-		supportsVision: false,
-		// Metadata
-		lastUpdated: "2026-04-06",
-	},
-	"claude-opus-4.5-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 49.7,
-		normalizedScore: 71,
-		// AA specific benchmarks
-		codingIndex: 47.8,
-		mathIndex: 91.3,
+		codingIndex: 4.2,
+		mathIndex: 14.3,
 		// Academic benchmarks
-		mmluPro: 0.895,
-		gpqa: 0.866,
-		hle: 0.284,
+		mmluPro: 0.488,
+		gpqa: 0.296,
+		hle: 0.044,
 		// Capabilities
 		contextWindow: 8192,
@@ -685,21 +573,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemma 3n E4B Instruct",
 	},
-	"claude-4-opus-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 39,
-		normalizedScore: 56,
+	"gemini-2.5-flash-lite-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 34,
-		mathIndex: 73.3,
+		codingIndex: 9.5,
+		mathIndex: 53.3,
 		// Academic benchmarks
-		mmluPro: 0.873,
-		gpqa: 0.796,
-		hle: 0.117,
+		mmluPro: 0.759,
+		gpqa: 0.625,
+		hle: 0.064,
 		// Capabilities
 		contextWindow: 8192,
@@ -707,21 +592,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash-Lite (Reasoning)",
 	},
-	"claude-4.5-sonnet-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 37.1,
-		normalizedScore: 53,
+	"gemini-2.0-flash-thinking-experimental-dec-24": {
 		// AA specific benchmarks
-		codingIndex: 33.5,
-		mathIndex: 37,
+		codingIndex: undefined,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.86,
-		gpqa: 0.727,
-		hle: 0.071,
+		mmluPro: undefined,
+		gpqa: undefined,
+		hle: undefined,
 		// Capabilities
 		contextWindow: 8192,
@@ -729,21 +611,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.0 Flash Thinking Experimental (Dec '24)",
 	},
-	"claude-4.5-sonnet-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 43,
-		normalizedScore: 61,
+	"gemini-2.5-flash-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 38.6,
-		mathIndex: 88,
+		codingIndex: 22.2,
+		mathIndex: 73.3,
 		// Academic benchmarks
-		mmluPro: 0.875,
-		gpqa: 0.834,
-		hle: 0.173,
+		mmluPro: 0.832,
+		gpqa: 0.79,
+		hle: 0.111,
 		// Capabilities
 		contextWindow: 8192,
@@ -751,21 +630,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash (Reasoning)",
 	},
-	"claude-2": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9.1,
-		normalizedScore: 13,
+	"gemini-1.5-flash-may-24": {
 		// AA specific benchmarks
-		codingIndex: 12.9,
+		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.486,
-		gpqa: 0.344,
-		hle: undefined,
+		mmluPro: 0.574,
+		gpqa: 0.324,
+		hle: 0.042,
 		// Capabilities
 		contextWindow: 8192,
@@ -773,21 +649,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 1.5 Flash (May '24)",
 	},
-	"mistral-large-2-nov-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 15.1,
-		normalizedScore: 22,
+	"gemini-2.5-flash-preview-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 13.8,
-		mathIndex: 14,
+		codingIndex: undefined,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.697,
-		gpqa: 0.486,
-		hle: 0.04,
+		mmluPro: 0.8,
+		gpqa: 0.698,
+		hle: 0.116,
 		// Capabilities
 		contextWindow: 8192,
@@ -795,21 +668,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash Preview (Reasoning)",
 	},
-	"mistral-large-2-jul-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 13,
-		normalizedScore: 19,
+	"gemini-2.5-flash-lite-preview-sep-25-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: 0,
+		codingIndex: 18.2,
+		mathIndex: 68.7,
 		// Academic benchmarks
-		mmluPro: 0.683,
-		gpqa: 0.472,
-		hle: 0.032,
+		mmluPro: 0.808,
+		gpqa: 0.709,
+		hle: 0.066,
 		// Capabilities
 		contextWindow: 8192,
@@ -817,21 +687,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash-Lite Preview (Sep '25) (Reasoning)",
 	},
-	"pixtral-large": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 14,
-		normalizedScore: 20,
+	"gemini-2.5-flash-preview-sep-25-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: 2.3,
+		codingIndex: 22.1,
+		mathIndex: 56.7,
 		// Academic benchmarks
-		mmluPro: 0.701,
-		gpqa: 0.505,
-		hle: 0.036,
+		mmluPro: 0.836,
+		gpqa: 0.766,
+		hle: 0.078,
 		// Capabilities
 		contextWindow: 8192,
@@ -839,21 +706,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash Preview (Sep '25) (Non-reasoning)",
 	},
-	"mistral-small-3": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12.7,
-		normalizedScore: 18,
+	"gemini-2.5-flash-preview-non-reasoning": {
 		// AA specific benchmarks
 		codingIndex: undefined,
-		mathIndex: 4.3,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.652,
-		gpqa: 0.462,
-		hle: 0.041,
+		mmluPro: 0.783,
+		gpqa: 0.594,
+		hle: 0.05,
 		// Capabilities
 		contextWindow: 8192,
@@ -861,21 +725,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash Preview (Non-reasoning)",
 	},
-	"mistral-small-sep-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 10.2,
-		normalizedScore: 15,
+	"gemini-2.5-pro-preview-mar-25": {
 		// AA specific benchmarks
-		codingIndex: undefined,
+		codingIndex: 46.7,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.529,
-		gpqa: 0.381,
-		hle: 0.043,
+		mmluPro: 0.858,
+		gpqa: 0.836,
+		hle: 0.171,
 		// Capabilities
 		contextWindow: 8192,
@@ -883,21 +744,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Pro Preview (Mar' 25)",
 	},
-	"mixtral-8x22b-instruct": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9.8,
-		normalizedScore: 14,
+	"gemini-1.0-pro": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.537,
-		gpqa: 0.332,
-		hle: 0.041,
+		mmluPro: 0.431,
+		gpqa: 0.277,
+		hle: 0.046,
 		// Capabilities
 		contextWindow: 8192,
@@ -905,21 +763,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 1.0 Pro",
 	},
-	"mistral-small-feb-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9,
-		normalizedScore: 13,
+	"gemini-2.5-flash-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 17.8,
+		mathIndex: 60.3,
 		// Academic benchmarks
-		mmluPro: 0.419,
-		gpqa: 0.302,
-		hle: 0.044,
+		mmluPro: 0.809,
+		gpqa: 0.683,
+		hle: 0.051,
 		// Capabilities
 		contextWindow: 8192,
@@ -927,21 +782,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash (Non-reasoning)",
 	},
-	"mistral-large-feb-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9.9,
-		normalizedScore: 14,
+	"gemini-2.5-flash-lite-preview-sep-25-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 14.5,
+		mathIndex: 46.7,
 		// Academic benchmarks
-		mmluPro: 0.515,
-		gpqa: 0.351,
-		hle: 0.034,
+		mmluPro: 0.796,
+		gpqa: 0.651,
+		hle: 0.046,
 		// Capabilities
 		contextWindow: 8192,
@@ -949,21 +801,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.5 Flash-Lite Preview (Sep '25) (Non-reasoning)",
 	},
-	"mixtral-8x7b-instruct": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 7.7,
-		normalizedScore: 11,
+	"gemini-3-flash-preview-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 37.8,
+		mathIndex: 55.7,
 		// Academic benchmarks
-		mmluPro: 0.387,
-		gpqa: 0.292,
-		hle: 0.045,
+		mmluPro: 0.882,
+		gpqa: 0.812,
+		hle: 0.141,
 		// Capabilities
 		contextWindow: 8192,
@@ -971,21 +820,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 3 Flash Preview (Non-reasoning)",
 	},
-	"mistral-7b-instruct": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 7.4,
-		normalizedScore: 11,
+	"gemini-2.0-flash-lite-feb-25": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.245,
-		gpqa: 0.177,
-		hle: 0.043,
+		mmluPro: 0.724,
+		gpqa: 0.535,
+		hle: 0.036,
 		// Capabilities
 		contextWindow: 8192,
@@ -993,21 +839,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 2.0 Flash-Lite (Feb '25)",
 	},
-	"mistral-small-3.1": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 14.5,
-		normalizedScore: 21,
+	"gemini-3-flash-preview-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 13.9,
-		mathIndex: 3.7,
+		codingIndex: 42.6,
+		mathIndex: 97,
 		// Academic benchmarks
-		mmluPro: 0.659,
-		gpqa: 0.454,
-		hle: 0.048,
+		mmluPro: 0.89,
+		gpqa: 0.898,
+		hle: 0.347,
 		// Capabilities
 		contextWindow: 8192,
@@ -1015,21 +858,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 3 Flash Preview (Reasoning)",
 	},
-	"mistral-medium-3": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 18.8,
-		normalizedScore: 27,
+	"gemini-3-pro-preview-low": {
 		// AA specific benchmarks
-		codingIndex: 13.6,
-		mathIndex: 30.3,
+		codingIndex: 39.4,
+		mathIndex: 86.7,
 		// Academic benchmarks
-		mmluPro: 0.76,
-		gpqa: 0.578,
-		hle: 0.043,
+		mmluPro: 0.895,
+		gpqa: 0.887,
+		hle: 0.276,
 		// Capabilities
 		contextWindow: 8192,
@@ -1037,21 +877,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Gemini 3 Pro Preview (low)",
 	},
-	"mistral-saba": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12.1,
-		normalizedScore: 17,
+	"palm-2": {
 		// AA specific benchmarks
-		codingIndex: undefined,
+		codingIndex: 4.6,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.611,
-		gpqa: 0.424,
-		hle: 0.041,
+		mmluPro: undefined,
+		gpqa: undefined,
+		hle: undefined,
 		// Capabilities
 		contextWindow: 8192,
@@ -1059,21 +896,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "PALM-2",
 	},
-	"mistral-small-3.2": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 15.1,
-		normalizedScore: 22,
+	"claude-3.5-sonnet-oct-24": {
 		// AA specific benchmarks
-		codingIndex: 13.3,
-		mathIndex: 27,
+		codingIndex: 30.2,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.681,
-		gpqa: 0.505,
-		hle: 0.043,
+		mmluPro: 0.772,
+		gpqa: 0.599,
+		hle: 0.039,
 		// Capabilities
 		contextWindow: 8192,
@@ -1081,21 +915,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3.5 Sonnet (Oct '24)",
 	},
-	"magistral-medium-1": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 18.8,
-		normalizedScore: 27,
+	"claude-3.5-sonnet-june-24": {
 		// AA specific benchmarks
-		codingIndex: 16,
-		mathIndex: 40.3,
+		codingIndex: 26,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.753,
-		gpqa: 0.679,
-		hle: 0.095,
+		mmluPro: 0.751,
+		gpqa: 0.56,
+		hle: 0.037,
 		// Capabilities
 		contextWindow: 8192,
@@ -1103,21 +934,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3.5 Sonnet (June '24)",
 	},
-	"devstral-medium": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 18.7,
-		normalizedScore: 27,
+	"claude-3-opus": {
 		// AA specific benchmarks
-		codingIndex: 15.9,
-		mathIndex: 4.7,
+		codingIndex: 19.5,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.708,
-		gpqa: 0.492,
-		hle: 0.038,
+		mmluPro: 0.696,
+		gpqa: 0.489,
+		hle: 0.031,
 		// Capabilities
 		contextWindow: 8192,
@@ -1125,21 +953,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3 Opus",
 	},
-	"magistral-small-1": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 16.8,
-		normalizedScore: 24,
+	"claude-3.5-haiku": {
 		// AA specific benchmarks
-		codingIndex: 11.1,
-		mathIndex: 41.3,
+		codingIndex: 10.7,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.746,
-		gpqa: 0.641,
-		hle: 0.072,
+		mmluPro: 0.634,
+		gpqa: 0.408,
+		hle: 0.035,
 		// Capabilities
 		contextWindow: 8192,
@@ -1147,21 +972,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3.5 Haiku",
 	},
-	"mistral-medium": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9,
-		normalizedScore: 13,
+	"claude-3-sonnet": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.491,
-		gpqa: 0.349,
-		hle: 0.034,
+		mmluPro: 0.579,
+		gpqa: 0.4,
+		hle: 0.038,
 		// Capabilities
 		contextWindow: 8192,
@@ -1169,21 +991,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3 Sonnet",
 	},
-	"devstral-small-jul-25": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 15.2,
-		normalizedScore: 22,
+	"claude-3-haiku": {
 		// AA specific benchmarks
-		codingIndex: 12.1,
-		mathIndex: 29.3,
+		codingIndex: 6.7,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.622,
-		gpqa: 0.414,
-		hle: 0.037,
+		mmluPro: undefined,
+		gpqa: 0.374,
+		hle: 0.039,
 		// Capabilities
 		contextWindow: 8192,
@@ -1191,21 +1010,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3 Haiku",
 	},
-	"devstral-small-may-25": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 18,
-		normalizedScore: 26,
+	"claude-instant": {
 		// AA specific benchmarks
-		codingIndex: 12.2,
+		codingIndex: 7.8,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.632,
-		gpqa: 0.434,
-		hle: 0.04,
+		mmluPro: 0.434,
+		gpqa: 0.33,
+		hle: 0.038,
 		// Capabilities
 		contextWindow: 8192,
@@ -1213,21 +1029,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude Instant",
 	},
-	"deepseek-r1-distill-qwen-32b": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 17.2,
-		normalizedScore: 25,
+	"claude-4.5-sonnet-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: 63,
+		codingIndex: 38.6,
+		mathIndex: 88,
 		// Academic benchmarks
-		mmluPro: 0.739,
-		gpqa: 0.615,
-		hle: 0.055,
+		mmluPro: 0.875,
+		gpqa: 0.834,
+		hle: 0.173,
 		// Capabilities
 		contextWindow: 8192,
@@ -1235,21 +1048,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4.5 Sonnet (Reasoning)",
 	},
-	"deepseek-v3-dec-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 16.5,
-		normalizedScore: 24,
+	"claude-4-sonnet-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 16.4,
-		mathIndex: 26,
+		codingIndex: 30.6,
+		mathIndex: 38,
 		// Academic benchmarks
-		mmluPro: 0.752,
-		gpqa: 0.557,
-		hle: 0.036,
+		mmluPro: 0.837,
+		gpqa: 0.683,
+		hle: 0.04,
 		// Capabilities
 		contextWindow: 8192,
@@ -1257,21 +1067,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4 Sonnet (Non-reasoning)",
 	},
-	"deepseek-r1-distill-qwen-14b": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 15.8,
-		normalizedScore: 23,
+	"claude-3.7-sonnet-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: 55.7,
+		codingIndex: 26.7,
+		mathIndex: 21,
 		// Academic benchmarks
-		mmluPro: 0.74,
-		gpqa: 0.484,
-		hle: 0.044,
+		mmluPro: 0.803,
+		gpqa: 0.656,
+		hle: 0.048,
 		// Capabilities
 		contextWindow: 8192,
@@ -1279,20 +1086,17 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3.7 Sonnet (Non-reasoning)",
 	},
-	"deepseek-v2.5-dec-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12.5,
-		normalizedScore: 18,
+	"claude-2.0": {
 		// AA specific benchmarks
-		codingIndex: undefined,
+		codingIndex: 12.9,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: undefined,
+		mmluPro: 0.486,
+		gpqa: 0.344,
 		hle: undefined,
 		// Capabilities
@@ -1301,13 +1105,10 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 2.0",
 	},
-	"deepseek-coder-v2": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 10.6,
-		normalizedScore: 15,
+	"claude-4.1-opus-non-reasoning": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
@@ -1323,21 +1124,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4.1 Opus (Non-reasoning)",
 	},
-	"deepseek-r1-distill-llama-8b": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12.1,
-		normalizedScore: 17,
+	"claude-4.1-opus-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: 41.3,
+		codingIndex: 36.5,
+		mathIndex: 80.3,
 		// Academic benchmarks
-		mmluPro: 0.543,
-		gpqa: 0.302,
-		hle: 0.042,
+		mmluPro: 0.88,
+		gpqa: 0.809,
+		hle: 0.119,
 		// Capabilities
 		contextWindow: 8192,
@@ -1345,21 +1143,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4.1 Opus (Reasoning)",
 	},
-	"deepseek-llm-67b-chat-v1": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 8.4,
-		normalizedScore: 12,
+	"claude-4.5-sonnet-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 33.5,
+		mathIndex: 37,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: undefined,
-		hle: undefined,
+		mmluPro: 0.86,
+		gpqa: 0.727,
+		hle: 0.071,
 		// Capabilities
 		contextWindow: 8192,
@@ -1367,21 +1162,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4.5 Sonnet (Non-reasoning)",
 	},
-	"deepseek-r1-distill-qwen-1.5b": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9.1,
-		normalizedScore: 13,
+	"claude-opus-4.6-adaptive-reasoning-max-effort": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: 22,
+		codingIndex: 48.1,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.269,
-		gpqa: 0.098,
-		hle: 0.033,
+		mmluPro: undefined,
+		gpqa: 0.896,
+		hle: 0.367,
 		// Capabilities
 		contextWindow: 8192,
@@ -1389,21 +1181,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude Opus 4.6 (Adaptive Reasoning, Max Effort)",
 	},
-	"deepseek-v3.1-terminus-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 28.5,
-		normalizedScore: 41,
+	"claude-opus-4.5-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 31.9,
-		mathIndex: 53.7,
+		codingIndex: 47.8,
+		mathIndex: 91.3,
 		// Academic benchmarks
-		mmluPro: 0.836,
-		gpqa: 0.751,
-		hle: 0.084,
+		mmluPro: 0.895,
+		gpqa: 0.866,
+		hle: 0.284,
 		// Capabilities
 		contextWindow: 8192,
@@ -1411,21 +1200,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude Opus 4.5 (Reasoning)",
 	},
-	"deepseek-v3.2-exp-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 32.9,
-		normalizedScore: 47,
+	"claude-3.7-sonnet-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 33.3,
-		mathIndex: 87.7,
+		codingIndex: 27.6,
+		mathIndex: 56.3,
 		// Academic benchmarks
-		mmluPro: 0.85,
-		gpqa: 0.797,
-		hle: 0.138,
+		mmluPro: 0.837,
+		gpqa: 0.772,
+		hle: 0.103,
 		// Capabilities
 		contextWindow: 8192,
@@ -1433,21 +1219,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 3.7 Sonnet (Reasoning)",
 	},
-	"deepseek-v3.1-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 27.7,
-		normalizedScore: 40,
+	"claude-opus-4.6-non-reasoning-high-effort": {
 		// AA specific benchmarks
-		codingIndex: 29.7,
-		mathIndex: 89.7,
+		codingIndex: 47.6,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.851,
-		gpqa: 0.779,
-		hle: 0.13,
+		mmluPro: undefined,
+		gpqa: 0.84,
+		hle: 0.186,
 		// Capabilities
 		contextWindow: 8192,
@@ -1455,21 +1238,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude Opus 4.6 (Non-reasoning, High Effort)",
 	},
-	"deepseek-v3.2-exp-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 28.4,
-		normalizedScore: 41,
+	"claude-4-opus-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 30,
-		mathIndex: 57.7,
+		codingIndex: undefined,
+		mathIndex: 36.3,
 		// Academic benchmarks
-		mmluPro: 0.836,
-		gpqa: 0.738,
-		hle: 0.086,
+		mmluPro: 0.86,
+		gpqa: 0.701,
+		hle: 0.059,
 		// Capabilities
 		contextWindow: 8192,
@@ -1477,21 +1257,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4 Opus (Non-reasoning)",
 	},
-	"deepseek-v3.1-terminus-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 33.9,
-		normalizedScore: 48,
+	"claude-opus-4.5-non-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 33.7,
-		mathIndex: 89.7,
+		codingIndex: 42.9,
+		mathIndex: 62.7,
 		// Academic benchmarks
-		mmluPro: 0.851,
-		gpqa: 0.792,
-		hle: 0.152,
+		mmluPro: 0.889,
+		gpqa: 0.81,
+		hle: 0.129,
 		// Capabilities
 		contextWindow: 8192,
@@ -1499,21 +1276,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude Opus 4.5 (Non-reasoning)",
 	},
-	"deepseek-v3-0324": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 22.3,
-		normalizedScore: 32,
+	"claude-4-sonnet-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 22,
-		mathIndex: 41,
+		codingIndex: 34.1,
+		mathIndex: 74.3,
 		// Academic benchmarks
-		mmluPro: 0.819,
-		gpqa: 0.655,
-		hle: 0.052,
+		mmluPro: 0.842,
+		gpqa: 0.777,
+		hle: 0.096,
 		// Capabilities
 		contextWindow: 8192,
@@ -1521,21 +1295,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4 Sonnet (Reasoning)",
 	},
-	"deepseek-r1-jan-25": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 18.8,
-		normalizedScore: 27,
+	"claude-4-opus-reasoning": {
 		// AA specific benchmarks
-		codingIndex: 15.9,
-		mathIndex: 68,
+		codingIndex: 34,
+		mathIndex: 73.3,
 		// Academic benchmarks
-		mmluPro: 0.844,
-		gpqa: 0.708,
-		hle: 0.093,
+		mmluPro: 0.873,
+		gpqa: 0.796,
+		hle: 0.117,
 		// Capabilities
 		contextWindow: 8192,
@@ -1543,21 +1314,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 4 Opus (Reasoning)",
 	},
-	"deepseek-v3.1-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 28.1,
-		normalizedScore: 40,
+	"claude-2.1": {
 		// AA specific benchmarks
-		codingIndex: 28.4,
-		mathIndex: 49.7,
+		codingIndex: 14,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.833,
-		gpqa: 0.735,
-		hle: 0.063,
+		mmluPro: 0.495,
+		gpqa: 0.319,
+		hle: 0.042,
 		// Capabilities
 		contextWindow: 8192,
@@ -1565,21 +1333,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Claude 2.1",
 	},
-	"deepseek-v2.5": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12.3,
-		normalizedScore: 18,
+	"mistral-large-2-nov-24": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 13.8,
+		mathIndex: 14,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: undefined,
-		hle: undefined,
+		mmluPro: 0.697,
+		gpqa: 0.486,
+		hle: 0.04,
 		// Capabilities
 		contextWindow: 8192,
@@ -1587,21 +1352,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Large 2 (Nov '24)",
 	},
-	"deepseek-v2-chat": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 9.1,
-		normalizedScore: 13,
+	"mistral-large-2-jul-24": {
 		// AA specific benchmarks
 		codingIndex: undefined,
-		mathIndex: undefined,
+		mathIndex: 0,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: undefined,
-		hle: undefined,
+		mmluPro: 0.683,
+		gpqa: 0.472,
+		hle: 0.032,
 		// Capabilities
 		contextWindow: 8192,
@@ -1609,21 +1371,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Large 2 (Jul '24)",
 	},
-	"deepseek-coder-v2-lite-instruct": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 8.5,
-		normalizedScore: 12,
+	"pixtral-large": {
 		// AA specific benchmarks
 		codingIndex: undefined,
-		mathIndex: undefined,
+		mathIndex: 2.3,
 		// Academic benchmarks
-		mmluPro: 0.429,
-		gpqa: 0.319,
-		hle: 0.053,
+		mmluPro: 0.701,
+		gpqa: 0.505,
+		hle: 0.036,
 		// Capabilities
 		contextWindow: 8192,
@@ -1631,21 +1390,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Pixtral Large",
 	},
-	sonar: {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 15.5,
-		normalizedScore: 22,
+	"mistral-small-3": {
 		// AA specific benchmarks
 		codingIndex: undefined,
-		mathIndex: undefined,
+		mathIndex: 4.3,
 		// Academic benchmarks
-		mmluPro: 0.689,
-		gpqa: 0.471,
-		hle: 0.073,
+		mmluPro: 0.652,
+		gpqa: 0.462,
+		hle: 0.041,
 		// Capabilities
 		contextWindow: 8192,
@@ -1653,21 +1409,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Small 3",
 	},
-	"sonar-reasoning-pro": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 24.6,
-		normalizedScore: 35,
+	"mistral-small-sep-24": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: undefined,
-		hle: undefined,
+		mmluPro: 0.529,
+		gpqa: 0.381,
+		hle: 0.043,
 		// Capabilities
 		contextWindow: 8192,
@@ -1675,21 +1428,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Small (Sep '24)",
 	},
-	"sonar-pro": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 15.2,
-		normalizedScore: 22,
+	"mixtral-8x22b-instruct": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.755,
-		gpqa: 0.578,
-		hle: 0.079,
+		mmluPro: 0.537,
+		gpqa: 0.332,
+		hle: 0.041,
 		// Capabilities
 		contextWindow: 8192,
@@ -1697,21 +1447,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mixtral 8x22B Instruct",
 	},
-	"sonar-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 17.9,
-		normalizedScore: 26,
+	"mistral-small-feb-24": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: 0.623,
-		hle: undefined,
+		mmluPro: 0.419,
+		gpqa: 0.302,
+		hle: 0.044,
 		// Capabilities
 		contextWindow: 8192,
@@ -1719,21 +1466,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Small (Feb '24)",
 	},
-	"grok-beta": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 13.3,
-		normalizedScore: 19,
+	"mistral-large-feb-24": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.703,
-		gpqa: 0.471,
-		hle: 0.047,
+		mmluPro: 0.515,
+		gpqa: 0.351,
+		hle: 0.034,
 		// Capabilities
 		contextWindow: 8192,
@@ -1741,21 +1485,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Large (Feb '24)",
 	},
-	"grok-4-fast-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 35.1,
-		normalizedScore: 50,
+	"mixtral-8x7b-instruct": {
 		// AA specific benchmarks
-		codingIndex: 27.4,
-		mathIndex: 89.7,
+		codingIndex: undefined,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.85,
-		gpqa: 0.847,
-		hle: 0.17,
+		mmluPro: 0.387,
+		gpqa: 0.292,
+		hle: 0.045,
 		// Capabilities
 		contextWindow: 8192,
@@ -1763,21 +1504,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mixtral 8x7B Instruct",
 	},
-	"grok-3-reasoning-beta": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 21.6,
-		normalizedScore: 31,
+	"mistral-7b-instruct": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: undefined,
-		gpqa: undefined,
-		hle: undefined,
+		mmluPro: 0.245,
+		gpqa: 0.177,
+		hle: 0.043,
 		// Capabilities
 		contextWindow: 8192,
@@ -1785,21 +1523,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral 7B Instruct",
 	},
-	"grok-3": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 25.2,
-		normalizedScore: 36,
+	"mistral-saba": {
 		// AA specific benchmarks
-		codingIndex: 19.8,
-		mathIndex: 58,
+		codingIndex: undefined,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.799,
-		gpqa: 0.693,
-		hle: 0.051,
+		mmluPro: 0.611,
+		gpqa: 0.424,
+		hle: 0.041,
 		// Capabilities
 		contextWindow: 8192,
@@ -1807,21 +1542,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Saba",
 	},
-	"grok-4": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 41.5,
-		normalizedScore: 59,
+	"mistral-small-3.2": {
 		// AA specific benchmarks
-		codingIndex: 40.5,
-		mathIndex: 92.7,
+		codingIndex: 13.3,
+		mathIndex: 27,
 		// Academic benchmarks
-		mmluPro: 0.866,
-		gpqa: 0.877,
-		hle: 0.239,
+		mmluPro: 0.681,
+		gpqa: 0.505,
+		hle: 0.043,
 		// Capabilities
 		contextWindow: 8192,
@@ -1829,21 +1561,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Small 3.2",
 	},
-	"grok-4.1-fast-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 23.6,
-		normalizedScore: 34,
+	"mistral-small-3.1": {
 		// AA specific benchmarks
-		codingIndex: 19.5,
-		mathIndex: 34.3,
+		codingIndex: 13.9,
+		mathIndex: 3.7,
 		// Academic benchmarks
-		mmluPro: 0.743,
-		gpqa: 0.637,
-		hle: 0.05,
+		mmluPro: 0.659,
+		gpqa: 0.454,
+		hle: 0.048,
 		// Capabilities
 		contextWindow: 8192,
@@ -1851,21 +1580,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Small 3.1",
 	},
-	"grok-4.1-fast-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 38.6,
-		normalizedScore: 55,
+	"mistral-medium-3": {
 		// AA specific benchmarks
-		codingIndex: 30.9,
-		mathIndex: 89.3,
+		codingIndex: 13.6,
+		mathIndex: 30.3,
 		// Academic benchmarks
-		mmluPro: 0.854,
-		gpqa: 0.853,
-		hle: 0.176,
+		mmluPro: 0.76,
+		gpqa: 0.578,
+		hle: 0.043,
 		// Capabilities
 		contextWindow: 8192,
@@ -1873,21 +1599,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Medium 3",
 	},
-	"grok-2-dec-24": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 13.9,
-		normalizedScore: 20,
+	"magistral-small-1": {
 		// AA specific benchmarks
-		codingIndex: undefined,
-		mathIndex: undefined,
+		codingIndex: 11.1,
+		mathIndex: 41.3,
 		// Academic benchmarks
-		mmluPro: 0.709,
-		gpqa: 0.51,
-		hle: 0.038,
+		mmluPro: 0.746,
+		gpqa: 0.641,
+		hle: 0.072,
 		// Capabilities
 		contextWindow: 8192,
@@ -1895,21 +1618,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Magistral Small 1",
 	},
-	"grok-4-fast-non-reasoning": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 23.1,
-		normalizedScore: 33,
+	"devstral-small-may-25": {
 		// AA specific benchmarks
-		codingIndex: 19,
-		mathIndex: 41.3,
+		codingIndex: 12.2,
+		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.73,
-		gpqa: 0.606,
-		hle: 0.05,
+		mmluPro: 0.632,
+		gpqa: 0.434,
+		hle: 0.04,
 		// Capabilities
 		contextWindow: 8192,
@@ -1917,21 +1637,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Devstral Small (May '25)",
 	},
-	"openchat-3.5-1210": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 8.3,
-		normalizedScore: 12,
+	"mistral-medium": {
 		// AA specific benchmarks
 		codingIndex: undefined,
 		mathIndex: undefined,
 		// Academic benchmarks
-		mmluPro: 0.31,
-		gpqa: 0.23,
-		hle: 0.048,
+		mmluPro: 0.491,
+		gpqa: 0.349,
+		hle: 0.034,
 		// Capabilities
 		contextWindow: 8192,
@@ -1939,21 +1656,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Mistral Medium",
 	},
-	"nova-pro": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 13.5,
-		normalizedScore: 19,
+	"devstral-small-jul-25": {
 		// AA specific benchmarks
-		codingIndex: 11,
-		mathIndex: 7,
+		codingIndex: 12.1,
+		mathIndex: 29.3,
 		// Academic benchmarks
-		mmluPro: 0.691,
-		gpqa: 0.499,
-		hle: 0.034,
+		mmluPro: 0.622,
+		gpqa: 0.414,
+		hle: 0.037,
 		// Capabilities
 		contextWindow: 8192,
@@ -1961,21 +1675,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Devstral Small (Jul '25)",
 	},
-	"nova-lite": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 12.7,
-		normalizedScore: 18,
+	"devstral-medium": {
 		// AA specific benchmarks
-		codingIndex: 5.1,
-		mathIndex: 7,
+		codingIndex: 15.9,
+		mathIndex: 4.7,
 		// Academic benchmarks
-		mmluPro: 0.59,
-		gpqa: 0.433,
-		hle: 0.046,
+		mmluPro: 0.708,
+		gpqa: 0.492,
+		hle: 0.038,
 		// Capabilities
 		contextWindow: 8192,
@@ -1983,21 +1694,18 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Devstral Medium",
 	},
-	"phi-3-mini-instruct-3.8b": {
-		// AA Intelligence Index (composite score)
-		intelligenceIndex: 10.1,
-		normalizedScore: 14,
+	"magistral-medium-1": {
 		// AA specific benchmarks
-		codingIndex: 3,
-		mathIndex: 0.3,
+		codingIndex: 16,
+		mathIndex: 40.3,
 		// Academic benchmarks
-		mmluPro: 0.435,
-		gpqa: 0.319,
-		hle: 0.044,
+		mmluPro: 0.753,
+		gpqa: 0.679,
+		hle: 0.095,
 		// Capabilities
 		contextWindow: 8192,
@@ -2005,6 +1713,7 @@ export const BENCHMARKS_CHUNK_3: Record<string, HardcodedBenchmark> = {
 		supportsVision: false,
 		// Metadata
-		lastUpdated: "2026-04-06",
+		lastUpdated: "2026-06-01",
+		originalModel: "Magistral Medium 1",
 	},
 };