npm - @mariozechner/pi-ai - Versions diffs - 0.5.44 → 0.5.45 - Mend

@mariozechner/pi-ai 0.5.44 → 0.5.45

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

package/dist/agent/agent-loop.d.ts +2 -2
package/dist/agent/agent-loop.d.ts.map +1 -1
package/dist/agent/agent-loop.js +18 -2
package/dist/agent/agent-loop.js.map +1 -1
package/dist/agent/index.d.ts +1 -1
package/dist/agent/index.d.ts.map +1 -1
package/dist/agent/index.js.map +1 -1
package/dist/agent/types.d.ts +6 -1
package/dist/agent/types.d.ts.map +1 -1
package/dist/agent/types.js.map +1 -1
package/dist/models.generated.d.ts +458 -16
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +532 -90
package/dist/models.generated.js.map +1 -1
package/dist/providers/anthropic.d.ts.map +1 -1
package/dist/providers/anthropic.js +9 -8
package/dist/providers/anthropic.js.map +1 -1
package/dist/providers/google.d.ts.map +1 -1
package/dist/providers/google.js +7 -6
package/dist/providers/google.js.map +1 -1
package/dist/providers/openai-completions.d.ts.map +1 -1
package/dist/providers/openai-completions.js +6 -5
package/dist/providers/openai-completions.js.map +1 -1
package/dist/providers/openai-responses.d.ts.map +1 -1
package/dist/providers/openai-responses.js +6 -5
package/dist/providers/openai-responses.js.map +1 -1
package/dist/utils/sanitize-unicode.d.ts +22 -0
package/dist/utils/sanitize-unicode.d.ts.map +1 -0
package/dist/utils/sanitize-unicode.js +26 -0
package/dist/utils/sanitize-unicode.js.map +1 -0
package/package.json +1 -1

package/dist/models.generated.js CHANGED Viewed

@@ -189,6 +189,142 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 4096,
         },
+        "claude-haiku-4-5-20251001": {
+            id: "claude-haiku-4-5-20251001",
+            name: "Claude Haiku 4.5",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1,
+                output: 5,
+                cacheRead: 0.1,
+                cacheWrite: 1.25,
+            },
+            contextWindow: 200000,
+            maxTokens: 64000,
+        },
+        "claude-sonnet-4-0": {
+            id: "claude-sonnet-4-0",
+            name: "Claude Sonnet 4",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
+            },
+            contextWindow: 200000,
+            maxTokens: 64000,
+        },
+        "claude-3-7-sonnet-latest": {
+            id: "claude-3-7-sonnet-latest",
+            name: "Claude Sonnet 3.7",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
+            },
+            contextWindow: 200000,
+            maxTokens: 64000,
+        },
+        "claude-sonnet-4-5": {
+            id: "claude-sonnet-4-5",
+            name: "Claude Sonnet 4.5",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
+            },
+            contextWindow: 200000,
+            maxTokens: 64000,
+        },
+        "claude-3-5-haiku-latest": {
+            id: "claude-3-5-haiku-latest",
+            name: "Claude Haiku 3.5",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.8,
+                output: 4,
+                cacheRead: 0.08,
+                cacheWrite: 1,
+            },
+            contextWindow: 200000,
+            maxTokens: 8192,
+        },
+        "claude-haiku-4-5": {
+            id: "claude-haiku-4-5",
+            name: "Claude Haiku 4.5",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1,
+                output: 5,
+                cacheRead: 0.1,
+                cacheWrite: 1.25,
+            },
+            contextWindow: 200000,
+            maxTokens: 64000,
+        },
+        "claude-opus-4-1": {
+            id: "claude-opus-4-1",
+            name: "Claude Opus 4.1",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 15,
+                output: 75,
+                cacheRead: 1.5,
+                cacheWrite: 18.75,
+            },
+            contextWindow: 200000,
+            maxTokens: 32000,
+        },
+        "claude-opus-4-0": {
+            id: "claude-opus-4-0",
+            name: "Claude Opus 4",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 15,
+                output: 75,
+                cacheRead: 1.5,
+                cacheWrite: 18.75,
+            },
+            contextWindow: 200000,
+            maxTokens: 32000,
+        },
     },
     google: {
         "gemini-2.5-flash-preview-05-20": {
@@ -251,9 +387,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.0375,
+                input: 0.3,
+                output: 2.5,
+                cacheRead: 0.075,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
@@ -361,6 +497,23 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
+        "gemini-live-2.5-flash": {
+            id: "gemini-live-2.5-flash",
+            name: "Gemini Live 2.5 Flash",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.5,
+                output: 2,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 8000,
+        },
         "gemini-2.5-flash-lite-preview-06-17": {
             id: "gemini-2.5-flash-lite-preview-06-17",
             name: "Gemini 2.5 Flash Lite Preview 06-17",
@@ -387,9 +540,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.0375,
+                input: 0.3,
+                output: 2.5,
+                cacheRead: 0.075,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
@@ -695,9 +848,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
+                input: 1.25,
+                output: 10,
+                cacheRead: 0.125,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
@@ -1648,6 +1801,159 @@ export const MODELS = {
         },
     },
     openrouter: {
+        "openrouter/andromeda-alpha": {
+            id: "openrouter/andromeda-alpha",
+            name: "Andromeda Alpha",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 128000,
+        },
+        "deepcogito/cogito-v2-preview-llama-405b": {
+            id: "deepcogito/cogito-v2-preview-llama-405b",
+            name: "Deep Cogito: Cogito V2 Preview Llama 405B",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 3.5,
+                output: 3.5,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 4096,
+        },
+        "qwen/qwen3-vl-8b-thinking": {
+            id: "qwen/qwen3-vl-8b-thinking",
+            name: "Qwen: Qwen3 VL 8B Thinking",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.18,
+                output: 2.0999999999999996,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 32768,
+        },
+        "qwen/qwen3-vl-8b-instruct": {
+            id: "qwen/qwen3-vl-8b-instruct",
+            name: "Qwen: Qwen3 VL 8B Instruct",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.08,
+                output: 0.5,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 32768,
+        },
+        "inclusionai/ring-1t": {
+            id: "inclusionai/ring-1t",
+            name: "inclusionAI: Ring 1T",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.5700000000000001,
+                output: 2.2800000000000002,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 131072,
+        },
+        "inclusionai/ling-1t": {
+            id: "inclusionai/ling-1t",
+            name: "inclusionAI: Ling-1T",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.39999999999999997,
+                output: 2,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 131072,
+        },
+        "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
+            id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
+            name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.09999999999999999,
+                output: 0.39999999999999997,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 4096,
+        },
+        "qwen/qwen3-vl-30b-a3b-thinking": {
+            id: "qwen/qwen3-vl-30b-a3b-thinking",
+            name: "Qwen: Qwen3 VL 30B A3B Thinking",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.19999999999999998,
+                output: 1,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 32768,
+        },
+        "qwen/qwen3-vl-30b-a3b-instruct": {
+            id: "qwen/qwen3-vl-30b-a3b-instruct",
+            name: "Qwen: Qwen3 VL 30B A3B Instruct",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.19999999999999998,
+                output: 0.7,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 32768,
+        },
         "z-ai/glm-4.6": {
             id: "z-ai/glm-4.6",
             name: "Z.AI: GLM 4.6",
@@ -1691,13 +1997,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.5,
-                output: 3.5,
+                input: 0.3,
+                output: 1.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 65536,
-            maxTokens: 65536,
+            contextWindow: 262144,
+            maxTokens: 262144,
         },
         "qwen/qwen3-vl-235b-a22b-instruct": {
             id: "qwen/qwen3-vl-235b-a22b-instruct",
@@ -1709,12 +2015,12 @@ export const MODELS = {
             input: ["text", "image"],
             cost: {
                 input: 0.3,
-                output: 1.5,
+                output: 1.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 32768,
+            contextWindow: 262144,
+            maxTokens: 262144,
         },
         "qwen/qwen3-max": {
             id: "qwen/qwen3-max",
@@ -1773,7 +2079,7 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0,
@@ -1827,13 +2133,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
-                output: 0.7999999999999999,
+                input: 0.14,
+                output: 1.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 4096,
         },
         "qwen/qwen3-next-80b-a3b-instruct": {
             id: "qwen/qwen3-next-80b-a3b-instruct",
@@ -1954,6 +2260,23 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 262144,
         },
+        "deepcogito/cogito-v2-preview-llama-70b": {
+            id: "deepcogito/cogito-v2-preview-llama-70b",
+            name: "Deep Cogito: Cogito V2 Preview Llama 70B",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.88,
+                output: 0.88,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 4096,
+        },
         "deepcogito/cogito-v2-preview-llama-109b-moe": {
             id: "deepcogito/cogito-v2-preview-llama-109b-moe",
             name: "Cogito V2 Preview Llama 109B",
@@ -2039,23 +2362,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
-        "deepseek/deepseek-chat-v3.1:free": {
-            id: "deepseek/deepseek-chat-v3.1:free",
-            name: "DeepSeek: DeepSeek V3.1 (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 163800,
-            maxTokens: 4096,
-        },
         "deepseek/deepseek-chat-v3.1": {
             id: "deepseek/deepseek-chat-v3.1",
             name: "DeepSeek: DeepSeek V3.1",
@@ -2065,13 +2371,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.19999999999999998,
-                output: 0.7999999999999999,
+                input: 0.27,
+                output: 1,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 163840,
-            maxTokens: 163840,
+            contextWindow: 131072,
+            maxTokens: 32768,
         },
         "mistralai/mistral-medium-3.1": {
             id: "mistralai/mistral-medium-3.1",
@@ -2090,6 +2396,40 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 4096,
         },
+        "baidu/ernie-4.5-21b-a3b": {
+            id: "baidu/ernie-4.5-21b-a3b",
+            name: "Baidu: ERNIE 4.5 21B A3B",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.07,
+                output: 0.28,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 120000,
+            maxTokens: 8000,
+        },
+        "baidu/ernie-4.5-vl-28b-a3b": {
+            id: "baidu/ernie-4.5-vl-28b-a3b",
+            name: "Baidu: ERNIE 4.5 VL 28B A3B",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.14,
+                output: 0.56,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 30000,
+            maxTokens: 8000,
+        },
         "z-ai/glm-4.5v": {
             id: "z-ai/glm-4.5v",
             name: "Z.AI: GLM 4.5V",
@@ -2101,7 +2441,7 @@ export const MODELS = {
             cost: {
                 input: 0.6,
                 output: 1.7999999999999998,
-                cacheRead: 0,
+                cacheRead: 0.11,
                 cacheWrite: 0,
             },
             contextWindow: 65536,
@@ -2202,7 +2542,7 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.35,
-                output: 1.55,
+                output: 1.5,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -2235,13 +2575,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.14,
-                output: 0.86,
+                input: 0.13,
+                output: 0.85,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 98304,
         },
         "qwen/qwen3-235b-a22b-thinking-2507": {
             id: "qwen/qwen3-235b-a22b-thinking-2507",
@@ -2291,8 +2631,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 4096,
+            contextWindow: 262000,
+            maxTokens: 262000,
         },
         "qwen/qwen3-coder": {
             id: "qwen/qwen3-coder",
@@ -2300,7 +2640,7 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.22,
@@ -2317,7 +2657,7 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.08,
@@ -2379,6 +2719,23 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4096,
         },
+        "tngtech/deepseek-r1t2-chimera": {
+            id: "tngtech/deepseek-r1t2-chimera",
+            name: "TNG: DeepSeek R1T2 Chimera",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.3,
+                output: 1.2,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 163840,
+            maxTokens: 163840,
+        },
         "inception/mercury": {
             id: "inception/mercury",
             name: "Inception: Mercury",
@@ -2439,8 +2796,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.3,
-                output: 1.6500000000000001,
+                input: 0.39999999999999997,
+                output: 2.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -2566,6 +2923,23 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4028,
         },
+        "nousresearch/deephermes-3-mistral-24b-preview": {
+            id: "nousresearch/deephermes-3-mistral-24b-preview",
+            name: "Nous: DeepHermes 3 Mistral 24B Preview",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.15,
+                output: 0.59,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 32768,
+        },
         "mistralai/mistral-medium-3": {
             id: "mistralai/mistral-medium-3",
             name: "Mistral: Mistral Medium 3",
@@ -2699,7 +3073,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
+            contextWindow: 40960,
             maxTokens: 4096,
         },
         "qwen/qwen3-235b-a22b": {
@@ -2810,7 +3184,7 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.24,
@@ -2855,39 +3229,39 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4096,
         },
-        "microsoft/phi-4-multimodal-instruct": {
-            id: "microsoft/phi-4-multimodal-instruct",
-            name: "Microsoft: Phi 4 Multimodal Instruct",
+        "qwen/qwq-32b": {
+            id: "qwen/qwq-32b",
+            name: "Qwen: QwQ 32B",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text", "image"],
+            reasoning: true,
+            input: ["text"],
             cost: {
-                input: 0.049999999999999996,
-                output: 0.09999999999999999,
+                input: 0.15,
+                output: 0.39999999999999997,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
+            contextWindow: 32768,
             maxTokens: 4096,
         },
-        "qwen/qwq-32b": {
-            id: "qwen/qwq-32b",
-            name: "Qwen: QwQ 32B",
+        "nousresearch/deephermes-3-llama-3-8b-preview": {
+            id: "nousresearch/deephermes-3-llama-3-8b-preview",
+            name: "Nous: DeepHermes 3 Llama 3 8B Preview",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
+            reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.15,
-                output: 0.39999999999999997,
+                input: 0.03,
+                output: 0.11,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 32768,
-            maxTokens: 4096,
+            contextWindow: 131072,
+            maxTokens: 131072,
         },
         "mistralai/mistral-saba": {
             id: "mistralai/mistral-saba",
@@ -2906,6 +3280,23 @@ export const MODELS = {
             contextWindow: 32768,
             maxTokens: 4096,
         },
+        "qwen/qwen-vl-max": {
+            id: "qwen/qwen-vl-max",
+            name: "Qwen: Qwen VL Max",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.7999999999999999,
+                output: 3.1999999999999997,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 8192,
+        },
         "qwen/qwen-turbo": {
             id: "qwen/qwen-turbo",
             name: "Qwen: Qwen-Turbo",
@@ -3056,8 +3447,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 65536,
-            maxTokens: 4096,
+            contextWindow: 131072,
+            maxTokens: 2048,
         },
         "meta-llama/llama-3.3-70b-instruct": {
             id: "meta-llama/llama-3.3-70b-instruct",
@@ -3068,13 +3459,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.04,
-                output: 0.12,
+                input: 0.13,
+                output: 0.38,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 16384,
         },
         "amazon/nova-lite-v1": {
             id: "amazon/nova-lite-v1",
@@ -3212,6 +3603,23 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4096,
         },
+        "qwen/qwen-2.5-7b-instruct": {
+            id: "qwen/qwen-2.5-7b-instruct",
+            name: "Qwen: Qwen2.5 7B Instruct",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.04,
+                output: 0.09999999999999999,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 16384,
+        },
         "nvidia/llama-3.1-nemotron-70b-instruct": {
             id: "nvidia/llama-3.1-nemotron-70b-instruct",
             name: "NVIDIA: Llama 3.1 Nemotron 70B Instruct",
@@ -3331,6 +3739,23 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4000,
         },
+        "sao10k/l3.1-euryale-70b": {
+            id: "sao10k/l3.1-euryale-70b",
+            name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.65,
+                output: 0.75,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 4096,
+        },
         "microsoft/phi-3.5-mini-128k-instruct": {
             id: "microsoft/phi-3.5-mini-128k-instruct",
             name: "Microsoft: Phi-3.5 Mini 128K Instruct",
@@ -3362,41 +3787,41 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 65000,
+            contextWindow: 65536,
             maxTokens: 4096,
         },
-        "meta-llama/llama-3.1-405b-instruct": {
-            id: "meta-llama/llama-3.1-405b-instruct",
-            name: "Meta: Llama 3.1 405B Instruct",
+        "meta-llama/llama-3.1-8b-instruct": {
+            id: "meta-llama/llama-3.1-8b-instruct",
+            name: "Meta: Llama 3.1 8B Instruct",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.7999999999999999,
-                output: 0.7999999999999999,
+                input: 0.02,
+                output: 0.03,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 32768,
+            contextWindow: 16384,
             maxTokens: 16384,
         },
-        "meta-llama/llama-3.1-8b-instruct": {
-            id: "meta-llama/llama-3.1-8b-instruct",
-            name: "Meta: Llama 3.1 8B Instruct",
+        "meta-llama/llama-3.1-405b-instruct": {
+            id: "meta-llama/llama-3.1-405b-instruct",
+            name: "Meta: Llama 3.1 405B Instruct",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.02,
-                output: 0.03,
+                input: 0.7999999999999999,
+                output: 0.7999999999999999,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 16384,
+            contextWindow: 32768,
             maxTokens: 16384,
         },
         "meta-llama/llama-3.1-70b-instruct": {
@@ -3433,6 +3858,23 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 16384,
         },
+        "sao10k/l3-euryale-70b": {
+            id: "sao10k/l3-euryale-70b",
+            name: "Sao10k: Llama 3 Euryale 70B v2.1",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 1.48,
+                output: 1.48,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 8192,
+            maxTokens: 8192,
+        },
         "mistralai/mistral-7b-instruct:free": {
             id: "mistralai/mistral-7b-instruct:free",
             name: "Mistral: Mistral 7B Instruct (free)",
@@ -3561,8 +4003,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.8999999999999999,
-                output: 0.8999999999999999,
+                input: 2,
+                output: 6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },