@mariozechner/pi-ai 0.70.6 → 0.71.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (65) hide show
  1. package/README.md +3 -30
  2. package/dist/env-api-keys.d.ts.map +1 -1
  3. package/dist/env-api-keys.js +3 -0
  4. package/dist/env-api-keys.js.map +1 -1
  5. package/dist/index.d.ts +1 -1
  6. package/dist/index.d.ts.map +1 -1
  7. package/dist/index.js.map +1 -1
  8. package/dist/models.d.ts +1 -1
  9. package/dist/models.d.ts.map +1 -1
  10. package/dist/models.generated.d.ts +1378 -551
  11. package/dist/models.generated.d.ts.map +1 -1
  12. package/dist/models.generated.js +1150 -449
  13. package/dist/models.generated.js.map +1 -1
  14. package/dist/models.js +3 -2
  15. package/dist/models.js.map +1 -1
  16. package/dist/providers/anthropic.d.ts.map +1 -1
  17. package/dist/providers/anthropic.js +38 -15
  18. package/dist/providers/anthropic.js.map +1 -1
  19. package/dist/providers/cloudflare.d.ts +9 -3
  20. package/dist/providers/cloudflare.d.ts.map +1 -1
  21. package/dist/providers/cloudflare.js +10 -3
  22. package/dist/providers/cloudflare.js.map +1 -1
  23. package/dist/providers/google-shared.d.ts +7 -2
  24. package/dist/providers/google-shared.d.ts.map +1 -1
  25. package/dist/providers/google-shared.js +4 -13
  26. package/dist/providers/google-shared.js.map +1 -1
  27. package/dist/providers/google-vertex.d.ts +1 -1
  28. package/dist/providers/google-vertex.d.ts.map +1 -1
  29. package/dist/providers/google-vertex.js.map +1 -1
  30. package/dist/providers/google.d.ts +1 -1
  31. package/dist/providers/google.d.ts.map +1 -1
  32. package/dist/providers/google.js.map +1 -1
  33. package/dist/providers/mistral.d.ts.map +1 -1
  34. package/dist/providers/mistral.js +1 -1
  35. package/dist/providers/mistral.js.map +1 -1
  36. package/dist/providers/openai-completions.d.ts.map +1 -1
  37. package/dist/providers/openai-completions.js +21 -7
  38. package/dist/providers/openai-completions.js.map +1 -1
  39. package/dist/providers/openai-responses.d.ts.map +1 -1
  40. package/dist/providers/openai-responses.js +10 -2
  41. package/dist/providers/openai-responses.js.map +1 -1
  42. package/dist/providers/register-builtins.d.ts +0 -3
  43. package/dist/providers/register-builtins.d.ts.map +1 -1
  44. package/dist/providers/register-builtins.js +0 -18
  45. package/dist/providers/register-builtins.js.map +1 -1
  46. package/dist/types.d.ts +3 -2
  47. package/dist/types.d.ts.map +1 -1
  48. package/dist/types.js.map +1 -1
  49. package/dist/utils/oauth/index.d.ts +0 -4
  50. package/dist/utils/oauth/index.d.ts.map +1 -1
  51. package/dist/utils/oauth/index.js +0 -10
  52. package/dist/utils/oauth/index.js.map +1 -1
  53. package/package.json +2 -6
  54. package/dist/providers/google-gemini-cli.d.ts +0 -74
  55. package/dist/providers/google-gemini-cli.d.ts.map +0 -1
  56. package/dist/providers/google-gemini-cli.js +0 -779
  57. package/dist/providers/google-gemini-cli.js.map +0 -1
  58. package/dist/utils/oauth/google-antigravity.d.ts +0 -26
  59. package/dist/utils/oauth/google-antigravity.d.ts.map +0 -1
  60. package/dist/utils/oauth/google-antigravity.js +0 -377
  61. package/dist/utils/oauth/google-antigravity.js.map +0 -1
  62. package/dist/utils/oauth/google-gemini-cli.d.ts +0 -26
  63. package/dist/utils/oauth/google-gemini-cli.d.ts.map +0 -1
  64. package/dist/utils/oauth/google-gemini-cli.js +0 -482
  65. package/dist/utils/oauth/google-gemini-cli.js.map +0 -1
@@ -2539,6 +2539,23 @@ export const MODELS = {
2539
2539
  contextWindow: 272000,
2540
2540
  maxTokens: 128000,
2541
2541
  },
2542
+ "gpt-5.5-pro": {
2543
+ id: "gpt-5.5-pro",
2544
+ name: "GPT-5.5 Pro",
2545
+ api: "azure-openai-responses",
2546
+ provider: "azure-openai-responses",
2547
+ baseUrl: "",
2548
+ reasoning: true,
2549
+ input: ["text", "image"],
2550
+ cost: {
2551
+ input: 30,
2552
+ output: 180,
2553
+ cacheRead: 0,
2554
+ cacheWrite: 0,
2555
+ },
2556
+ contextWindow: 1050000,
2557
+ maxTokens: 128000,
2558
+ },
2542
2559
  "o1": {
2543
2560
  id: "o1",
2544
2561
  name: "o1",
@@ -2703,47 +2720,648 @@ export const MODELS = {
2703
2720
  reasoning: false,
2704
2721
  input: ["text"],
2705
2722
  cost: {
2706
- input: 0.1,
2707
- output: 0.1,
2708
- cacheRead: 0,
2723
+ input: 0.1,
2724
+ output: 0.1,
2725
+ cacheRead: 0,
2726
+ cacheWrite: 0,
2727
+ },
2728
+ contextWindow: 32000,
2729
+ maxTokens: 8000,
2730
+ },
2731
+ "qwen-3-235b-a22b-instruct-2507": {
2732
+ id: "qwen-3-235b-a22b-instruct-2507",
2733
+ name: "Qwen 3 235B Instruct",
2734
+ api: "openai-completions",
2735
+ provider: "cerebras",
2736
+ baseUrl: "https://api.cerebras.ai/v1",
2737
+ reasoning: false,
2738
+ input: ["text"],
2739
+ cost: {
2740
+ input: 0.6,
2741
+ output: 1.2,
2742
+ cacheRead: 0,
2743
+ cacheWrite: 0,
2744
+ },
2745
+ contextWindow: 131000,
2746
+ maxTokens: 32000,
2747
+ },
2748
+ "zai-glm-4.7": {
2749
+ id: "zai-glm-4.7",
2750
+ name: "Z.AI GLM-4.7",
2751
+ api: "openai-completions",
2752
+ provider: "cerebras",
2753
+ baseUrl: "https://api.cerebras.ai/v1",
2754
+ reasoning: false,
2755
+ input: ["text"],
2756
+ cost: {
2757
+ input: 2.25,
2758
+ output: 2.75,
2759
+ cacheRead: 0,
2760
+ cacheWrite: 0,
2761
+ },
2762
+ contextWindow: 131072,
2763
+ maxTokens: 40000,
2764
+ },
2765
+ },
2766
+ "cloudflare-ai-gateway": {
2767
+ "claude-3-5-haiku": {
2768
+ id: "claude-3-5-haiku",
2769
+ name: "Claude Haiku 3.5 (latest)",
2770
+ api: "anthropic-messages",
2771
+ provider: "cloudflare-ai-gateway",
2772
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2773
+ reasoning: false,
2774
+ input: ["text", "image"],
2775
+ cost: {
2776
+ input: 0.8,
2777
+ output: 4,
2778
+ cacheRead: 0.08,
2779
+ cacheWrite: 1,
2780
+ },
2781
+ contextWindow: 200000,
2782
+ maxTokens: 8192,
2783
+ },
2784
+ "claude-3-haiku": {
2785
+ id: "claude-3-haiku",
2786
+ name: "Claude Haiku 3",
2787
+ api: "anthropic-messages",
2788
+ provider: "cloudflare-ai-gateway",
2789
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2790
+ reasoning: false,
2791
+ input: ["text", "image"],
2792
+ cost: {
2793
+ input: 0.25,
2794
+ output: 1.25,
2795
+ cacheRead: 0.03,
2796
+ cacheWrite: 0.3,
2797
+ },
2798
+ contextWindow: 200000,
2799
+ maxTokens: 4096,
2800
+ },
2801
+ "claude-3-opus": {
2802
+ id: "claude-3-opus",
2803
+ name: "Claude Opus 3",
2804
+ api: "anthropic-messages",
2805
+ provider: "cloudflare-ai-gateway",
2806
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2807
+ reasoning: false,
2808
+ input: ["text", "image"],
2809
+ cost: {
2810
+ input: 15,
2811
+ output: 75,
2812
+ cacheRead: 1.5,
2813
+ cacheWrite: 18.75,
2814
+ },
2815
+ contextWindow: 200000,
2816
+ maxTokens: 4096,
2817
+ },
2818
+ "claude-3-sonnet": {
2819
+ id: "claude-3-sonnet",
2820
+ name: "Claude Sonnet 3",
2821
+ api: "anthropic-messages",
2822
+ provider: "cloudflare-ai-gateway",
2823
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2824
+ reasoning: false,
2825
+ input: ["text", "image"],
2826
+ cost: {
2827
+ input: 3,
2828
+ output: 15,
2829
+ cacheRead: 0.3,
2830
+ cacheWrite: 0.3,
2831
+ },
2832
+ contextWindow: 200000,
2833
+ maxTokens: 4096,
2834
+ },
2835
+ "claude-3.5-haiku": {
2836
+ id: "claude-3.5-haiku",
2837
+ name: "Claude Haiku 3.5 (latest)",
2838
+ api: "anthropic-messages",
2839
+ provider: "cloudflare-ai-gateway",
2840
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2841
+ reasoning: false,
2842
+ input: ["text", "image"],
2843
+ cost: {
2844
+ input: 0.8,
2845
+ output: 4,
2846
+ cacheRead: 0.08,
2847
+ cacheWrite: 1,
2848
+ },
2849
+ contextWindow: 200000,
2850
+ maxTokens: 8192,
2851
+ },
2852
+ "claude-3.5-sonnet": {
2853
+ id: "claude-3.5-sonnet",
2854
+ name: "Claude Sonnet 3.5 v2",
2855
+ api: "anthropic-messages",
2856
+ provider: "cloudflare-ai-gateway",
2857
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2858
+ reasoning: false,
2859
+ input: ["text", "image"],
2860
+ cost: {
2861
+ input: 3,
2862
+ output: 15,
2863
+ cacheRead: 0.3,
2864
+ cacheWrite: 3.75,
2865
+ },
2866
+ contextWindow: 200000,
2867
+ maxTokens: 8192,
2868
+ },
2869
+ "claude-haiku-4-5": {
2870
+ id: "claude-haiku-4-5",
2871
+ name: "Claude Haiku 4.5 (latest)",
2872
+ api: "anthropic-messages",
2873
+ provider: "cloudflare-ai-gateway",
2874
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2875
+ reasoning: true,
2876
+ input: ["text", "image"],
2877
+ cost: {
2878
+ input: 1,
2879
+ output: 5,
2880
+ cacheRead: 0.1,
2881
+ cacheWrite: 1.25,
2882
+ },
2883
+ contextWindow: 200000,
2884
+ maxTokens: 64000,
2885
+ },
2886
+ "claude-opus-4": {
2887
+ id: "claude-opus-4",
2888
+ name: "Claude Opus 4 (latest)",
2889
+ api: "anthropic-messages",
2890
+ provider: "cloudflare-ai-gateway",
2891
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2892
+ reasoning: true,
2893
+ input: ["text", "image"],
2894
+ cost: {
2895
+ input: 15,
2896
+ output: 75,
2897
+ cacheRead: 1.5,
2898
+ cacheWrite: 18.75,
2899
+ },
2900
+ contextWindow: 200000,
2901
+ maxTokens: 32000,
2902
+ },
2903
+ "claude-opus-4-1": {
2904
+ id: "claude-opus-4-1",
2905
+ name: "Claude Opus 4.1 (latest)",
2906
+ api: "anthropic-messages",
2907
+ provider: "cloudflare-ai-gateway",
2908
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2909
+ reasoning: true,
2910
+ input: ["text", "image"],
2911
+ cost: {
2912
+ input: 15,
2913
+ output: 75,
2914
+ cacheRead: 1.5,
2915
+ cacheWrite: 18.75,
2916
+ },
2917
+ contextWindow: 200000,
2918
+ maxTokens: 32000,
2919
+ },
2920
+ "claude-opus-4-5": {
2921
+ id: "claude-opus-4-5",
2922
+ name: "Claude Opus 4.5 (latest)",
2923
+ api: "anthropic-messages",
2924
+ provider: "cloudflare-ai-gateway",
2925
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2926
+ reasoning: true,
2927
+ input: ["text", "image"],
2928
+ cost: {
2929
+ input: 5,
2930
+ output: 25,
2931
+ cacheRead: 0.5,
2932
+ cacheWrite: 6.25,
2933
+ },
2934
+ contextWindow: 200000,
2935
+ maxTokens: 64000,
2936
+ },
2937
+ "claude-opus-4-6": {
2938
+ id: "claude-opus-4-6",
2939
+ name: "Claude Opus 4.6 (latest)",
2940
+ api: "anthropic-messages",
2941
+ provider: "cloudflare-ai-gateway",
2942
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2943
+ reasoning: true,
2944
+ input: ["text", "image"],
2945
+ cost: {
2946
+ input: 5,
2947
+ output: 25,
2948
+ cacheRead: 0.5,
2949
+ cacheWrite: 6.25,
2950
+ },
2951
+ contextWindow: 1000000,
2952
+ maxTokens: 128000,
2953
+ },
2954
+ "claude-opus-4-7": {
2955
+ id: "claude-opus-4-7",
2956
+ name: "Claude Opus 4.7",
2957
+ api: "anthropic-messages",
2958
+ provider: "cloudflare-ai-gateway",
2959
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2960
+ reasoning: true,
2961
+ input: ["text", "image"],
2962
+ cost: {
2963
+ input: 5,
2964
+ output: 25,
2965
+ cacheRead: 0.5,
2966
+ cacheWrite: 6.25,
2967
+ },
2968
+ contextWindow: 1000000,
2969
+ maxTokens: 128000,
2970
+ },
2971
+ "claude-sonnet-4": {
2972
+ id: "claude-sonnet-4",
2973
+ name: "Claude Sonnet 4 (latest)",
2974
+ api: "anthropic-messages",
2975
+ provider: "cloudflare-ai-gateway",
2976
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2977
+ reasoning: true,
2978
+ input: ["text", "image"],
2979
+ cost: {
2980
+ input: 3,
2981
+ output: 15,
2982
+ cacheRead: 0.3,
2983
+ cacheWrite: 3.75,
2984
+ },
2985
+ contextWindow: 200000,
2986
+ maxTokens: 64000,
2987
+ },
2988
+ "claude-sonnet-4-5": {
2989
+ id: "claude-sonnet-4-5",
2990
+ name: "Claude Sonnet 4.5 (latest)",
2991
+ api: "anthropic-messages",
2992
+ provider: "cloudflare-ai-gateway",
2993
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2994
+ reasoning: true,
2995
+ input: ["text", "image"],
2996
+ cost: {
2997
+ input: 3,
2998
+ output: 15,
2999
+ cacheRead: 0.3,
3000
+ cacheWrite: 3.75,
3001
+ },
3002
+ contextWindow: 200000,
3003
+ maxTokens: 64000,
3004
+ },
3005
+ "claude-sonnet-4-6": {
3006
+ id: "claude-sonnet-4-6",
3007
+ name: "Claude Sonnet 4.6",
3008
+ api: "anthropic-messages",
3009
+ provider: "cloudflare-ai-gateway",
3010
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3011
+ reasoning: true,
3012
+ input: ["text", "image"],
3013
+ cost: {
3014
+ input: 3,
3015
+ output: 15,
3016
+ cacheRead: 0.3,
3017
+ cacheWrite: 3.75,
3018
+ },
3019
+ contextWindow: 1000000,
3020
+ maxTokens: 64000,
3021
+ },
3022
+ "gpt-4": {
3023
+ id: "gpt-4",
3024
+ name: "GPT-4",
3025
+ api: "openai-responses",
3026
+ provider: "cloudflare-ai-gateway",
3027
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3028
+ reasoning: false,
3029
+ input: ["text"],
3030
+ cost: {
3031
+ input: 30,
3032
+ output: 60,
3033
+ cacheRead: 0,
3034
+ cacheWrite: 0,
3035
+ },
3036
+ contextWindow: 8192,
3037
+ maxTokens: 8192,
3038
+ },
3039
+ "gpt-4-turbo": {
3040
+ id: "gpt-4-turbo",
3041
+ name: "GPT-4 Turbo",
3042
+ api: "openai-responses",
3043
+ provider: "cloudflare-ai-gateway",
3044
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3045
+ reasoning: false,
3046
+ input: ["text", "image"],
3047
+ cost: {
3048
+ input: 10,
3049
+ output: 30,
3050
+ cacheRead: 0,
3051
+ cacheWrite: 0,
3052
+ },
3053
+ contextWindow: 128000,
3054
+ maxTokens: 4096,
3055
+ },
3056
+ "gpt-4o": {
3057
+ id: "gpt-4o",
3058
+ name: "GPT-4o",
3059
+ api: "openai-responses",
3060
+ provider: "cloudflare-ai-gateway",
3061
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3062
+ reasoning: false,
3063
+ input: ["text", "image"],
3064
+ cost: {
3065
+ input: 2.5,
3066
+ output: 10,
3067
+ cacheRead: 1.25,
3068
+ cacheWrite: 0,
3069
+ },
3070
+ contextWindow: 128000,
3071
+ maxTokens: 16384,
3072
+ },
3073
+ "gpt-4o-mini": {
3074
+ id: "gpt-4o-mini",
3075
+ name: "GPT-4o mini",
3076
+ api: "openai-responses",
3077
+ provider: "cloudflare-ai-gateway",
3078
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3079
+ reasoning: false,
3080
+ input: ["text", "image"],
3081
+ cost: {
3082
+ input: 0.15,
3083
+ output: 0.6,
3084
+ cacheRead: 0.08,
3085
+ cacheWrite: 0,
3086
+ },
3087
+ contextWindow: 128000,
3088
+ maxTokens: 16384,
3089
+ },
3090
+ "gpt-5.1": {
3091
+ id: "gpt-5.1",
3092
+ name: "GPT-5.1",
3093
+ api: "openai-responses",
3094
+ provider: "cloudflare-ai-gateway",
3095
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3096
+ reasoning: true,
3097
+ input: ["text", "image"],
3098
+ cost: {
3099
+ input: 1.25,
3100
+ output: 10,
3101
+ cacheRead: 0.13,
3102
+ cacheWrite: 0,
3103
+ },
3104
+ contextWindow: 400000,
3105
+ maxTokens: 128000,
3106
+ },
3107
+ "gpt-5.1-codex": {
3108
+ id: "gpt-5.1-codex",
3109
+ name: "GPT-5.1 Codex",
3110
+ api: "openai-responses",
3111
+ provider: "cloudflare-ai-gateway",
3112
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3113
+ reasoning: true,
3114
+ input: ["text", "image"],
3115
+ cost: {
3116
+ input: 1.25,
3117
+ output: 10,
3118
+ cacheRead: 0.125,
3119
+ cacheWrite: 0,
3120
+ },
3121
+ contextWindow: 400000,
3122
+ maxTokens: 128000,
3123
+ },
3124
+ "gpt-5.2": {
3125
+ id: "gpt-5.2",
3126
+ name: "GPT-5.2",
3127
+ api: "openai-responses",
3128
+ provider: "cloudflare-ai-gateway",
3129
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3130
+ reasoning: true,
3131
+ input: ["text", "image"],
3132
+ cost: {
3133
+ input: 1.75,
3134
+ output: 14,
3135
+ cacheRead: 0.175,
3136
+ cacheWrite: 0,
3137
+ },
3138
+ contextWindow: 400000,
3139
+ maxTokens: 128000,
3140
+ },
3141
+ "gpt-5.2-codex": {
3142
+ id: "gpt-5.2-codex",
3143
+ name: "GPT-5.2 Codex",
3144
+ api: "openai-responses",
3145
+ provider: "cloudflare-ai-gateway",
3146
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3147
+ reasoning: true,
3148
+ input: ["text", "image"],
3149
+ cost: {
3150
+ input: 1.75,
3151
+ output: 14,
3152
+ cacheRead: 0.175,
3153
+ cacheWrite: 0,
3154
+ },
3155
+ contextWindow: 400000,
3156
+ maxTokens: 128000,
3157
+ },
3158
+ "gpt-5.3-codex": {
3159
+ id: "gpt-5.3-codex",
3160
+ name: "GPT-5.3 Codex",
3161
+ api: "openai-responses",
3162
+ provider: "cloudflare-ai-gateway",
3163
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3164
+ reasoning: true,
3165
+ input: ["text", "image"],
3166
+ cost: {
3167
+ input: 1.75,
3168
+ output: 14,
3169
+ cacheRead: 0.175,
3170
+ cacheWrite: 0,
3171
+ },
3172
+ contextWindow: 400000,
3173
+ maxTokens: 128000,
3174
+ },
3175
+ "gpt-5.4": {
3176
+ id: "gpt-5.4",
3177
+ name: "GPT-5.4",
3178
+ api: "openai-responses",
3179
+ provider: "cloudflare-ai-gateway",
3180
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3181
+ reasoning: true,
3182
+ input: ["text", "image"],
3183
+ cost: {
3184
+ input: 2.5,
3185
+ output: 15,
3186
+ cacheRead: 0.25,
3187
+ cacheWrite: 0,
3188
+ },
3189
+ contextWindow: 1050000,
3190
+ maxTokens: 128000,
3191
+ },
3192
+ "gpt-5.5": {
3193
+ id: "gpt-5.5",
3194
+ name: "GPT-5.5",
3195
+ api: "openai-responses",
3196
+ provider: "cloudflare-ai-gateway",
3197
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3198
+ reasoning: true,
3199
+ input: ["text", "image"],
3200
+ cost: {
3201
+ input: 5,
3202
+ output: 30,
3203
+ cacheRead: 0.5,
3204
+ cacheWrite: 0,
3205
+ },
3206
+ contextWindow: 1050000,
3207
+ maxTokens: 128000,
3208
+ },
3209
+ "o1": {
3210
+ id: "o1",
3211
+ name: "o1",
3212
+ api: "openai-responses",
3213
+ provider: "cloudflare-ai-gateway",
3214
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3215
+ reasoning: true,
3216
+ input: ["text", "image"],
3217
+ cost: {
3218
+ input: 15,
3219
+ output: 60,
3220
+ cacheRead: 7.5,
3221
+ cacheWrite: 0,
3222
+ },
3223
+ contextWindow: 200000,
3224
+ maxTokens: 100000,
3225
+ },
3226
+ "o3": {
3227
+ id: "o3",
3228
+ name: "o3",
3229
+ api: "openai-responses",
3230
+ provider: "cloudflare-ai-gateway",
3231
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3232
+ reasoning: true,
3233
+ input: ["text", "image"],
3234
+ cost: {
3235
+ input: 2,
3236
+ output: 8,
3237
+ cacheRead: 0.5,
3238
+ cacheWrite: 0,
3239
+ },
3240
+ contextWindow: 200000,
3241
+ maxTokens: 100000,
3242
+ },
3243
+ "o3-mini": {
3244
+ id: "o3-mini",
3245
+ name: "o3-mini",
3246
+ api: "openai-responses",
3247
+ provider: "cloudflare-ai-gateway",
3248
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3249
+ reasoning: true,
3250
+ input: ["text"],
3251
+ cost: {
3252
+ input: 1.1,
3253
+ output: 4.4,
3254
+ cacheRead: 0.55,
3255
+ cacheWrite: 0,
3256
+ },
3257
+ contextWindow: 200000,
3258
+ maxTokens: 100000,
3259
+ },
3260
+ "o3-pro": {
3261
+ id: "o3-pro",
3262
+ name: "o3-pro",
3263
+ api: "openai-responses",
3264
+ provider: "cloudflare-ai-gateway",
3265
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3266
+ reasoning: true,
3267
+ input: ["text", "image"],
3268
+ cost: {
3269
+ input: 20,
3270
+ output: 80,
3271
+ cacheRead: 0,
3272
+ cacheWrite: 0,
3273
+ },
3274
+ contextWindow: 200000,
3275
+ maxTokens: 100000,
3276
+ },
3277
+ "o4-mini": {
3278
+ id: "o4-mini",
3279
+ name: "o4-mini",
3280
+ api: "openai-responses",
3281
+ provider: "cloudflare-ai-gateway",
3282
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/openai",
3283
+ reasoning: true,
3284
+ input: ["text", "image"],
3285
+ cost: {
3286
+ input: 1.1,
3287
+ output: 4.4,
3288
+ cacheRead: 0.28,
3289
+ cacheWrite: 0,
3290
+ },
3291
+ contextWindow: 200000,
3292
+ maxTokens: 100000,
3293
+ },
3294
+ "workers-ai/@cf/moonshotai/kimi-k2.5": {
3295
+ id: "workers-ai/@cf/moonshotai/kimi-k2.5",
3296
+ name: "Kimi K2.5",
3297
+ api: "openai-completions",
3298
+ provider: "cloudflare-ai-gateway",
3299
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/compat",
3300
+ compat: { "sendSessionAffinityHeaders": true },
3301
+ reasoning: true,
3302
+ input: ["text", "image"],
3303
+ cost: {
3304
+ input: 0.6,
3305
+ output: 3,
3306
+ cacheRead: 0.1,
3307
+ cacheWrite: 0,
3308
+ },
3309
+ contextWindow: 256000,
3310
+ maxTokens: 256000,
3311
+ },
3312
+ "workers-ai/@cf/moonshotai/kimi-k2.6": {
3313
+ id: "workers-ai/@cf/moonshotai/kimi-k2.6",
3314
+ name: "Kimi K2.6",
3315
+ api: "openai-completions",
3316
+ provider: "cloudflare-ai-gateway",
3317
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/compat",
3318
+ compat: { "sendSessionAffinityHeaders": true },
3319
+ reasoning: true,
3320
+ input: ["text", "image"],
3321
+ cost: {
3322
+ input: 0.95,
3323
+ output: 4,
3324
+ cacheRead: 0.16,
2709
3325
  cacheWrite: 0,
2710
3326
  },
2711
- contextWindow: 32000,
2712
- maxTokens: 8000,
3327
+ contextWindow: 256000,
3328
+ maxTokens: 256000,
2713
3329
  },
2714
- "qwen-3-235b-a22b-instruct-2507": {
2715
- id: "qwen-3-235b-a22b-instruct-2507",
2716
- name: "Qwen 3 235B Instruct",
3330
+ "workers-ai/@cf/nvidia/nemotron-3-120b-a12b": {
3331
+ id: "workers-ai/@cf/nvidia/nemotron-3-120b-a12b",
3332
+ name: "Nemotron 3 Super 120B",
2717
3333
  api: "openai-completions",
2718
- provider: "cerebras",
2719
- baseUrl: "https://api.cerebras.ai/v1",
2720
- reasoning: false,
3334
+ provider: "cloudflare-ai-gateway",
3335
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/compat",
3336
+ compat: { "sendSessionAffinityHeaders": true },
3337
+ reasoning: true,
2721
3338
  input: ["text"],
2722
3339
  cost: {
2723
- input: 0.6,
2724
- output: 1.2,
3340
+ input: 0.5,
3341
+ output: 1.5,
2725
3342
  cacheRead: 0,
2726
3343
  cacheWrite: 0,
2727
3344
  },
2728
- contextWindow: 131000,
2729
- maxTokens: 32000,
3345
+ contextWindow: 256000,
3346
+ maxTokens: 256000,
2730
3347
  },
2731
- "zai-glm-4.7": {
2732
- id: "zai-glm-4.7",
2733
- name: "Z.AI GLM-4.7",
3348
+ "workers-ai/@cf/zai-org/glm-4.7-flash": {
3349
+ id: "workers-ai/@cf/zai-org/glm-4.7-flash",
3350
+ name: "GLM-4.7-Flash",
2734
3351
  api: "openai-completions",
2735
- provider: "cerebras",
2736
- baseUrl: "https://api.cerebras.ai/v1",
2737
- reasoning: false,
3352
+ provider: "cloudflare-ai-gateway",
3353
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/compat",
3354
+ compat: { "sendSessionAffinityHeaders": true },
3355
+ reasoning: true,
2738
3356
  input: ["text"],
2739
3357
  cost: {
2740
- input: 2.25,
2741
- output: 2.75,
3358
+ input: 0.06,
3359
+ output: 0.4,
2742
3360
  cacheRead: 0,
2743
3361
  cacheWrite: 0,
2744
3362
  },
2745
3363
  contextWindow: 131072,
2746
- maxTokens: 40000,
3364
+ maxTokens: 131072,
2747
3365
  },
2748
3366
  },
2749
3367
  "cloudflare-workers-ai": {
@@ -2905,7 +3523,7 @@ export const MODELS = {
2905
3523
  cost: {
2906
3524
  input: 0.14,
2907
3525
  output: 0.28,
2908
- cacheRead: 0.028,
3526
+ cacheRead: 0.0028,
2909
3527
  cacheWrite: 0,
2910
3528
  },
2911
3529
  contextWindow: 1000000,
@@ -2921,9 +3539,9 @@ export const MODELS = {
2921
3539
  reasoning: true,
2922
3540
  input: ["text"],
2923
3541
  cost: {
2924
- input: 1.74,
2925
- output: 3.48,
2926
- cacheRead: 0.145,
3542
+ input: 0.435,
3543
+ output: 0.87,
3544
+ cacheRead: 0.003625,
2927
3545
  cacheWrite: 0,
2928
3546
  },
2929
3547
  contextWindow: 1000000,
@@ -3239,7 +3857,7 @@ export const MODELS = {
3239
3857
  },
3240
3858
  "accounts/fireworks/routers/kimi-k2p5-turbo": {
3241
3859
  id: "accounts/fireworks/routers/kimi-k2p5-turbo",
3242
- name: "Kimi K2.5 Turbo (firepass)",
3860
+ name: "Kimi K2.5 Turbo",
3243
3861
  api: "anthropic-messages",
3244
3862
  provider: "fireworks",
3245
3863
  baseUrl: "https://api.fireworks.ai/inference",
@@ -4164,285 +4782,9 @@ export const MODELS = {
4164
4782
  "gemma-4-26b-a4b-it": {
4165
4783
  id: "gemma-4-26b-a4b-it",
4166
4784
  name: "Gemma 4 26B",
4167
- api: "google-generative-ai",
4168
- provider: "google",
4169
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4170
- reasoning: true,
4171
- input: ["text", "image"],
4172
- cost: {
4173
- input: 0,
4174
- output: 0,
4175
- cacheRead: 0,
4176
- cacheWrite: 0,
4177
- },
4178
- contextWindow: 256000,
4179
- maxTokens: 8192,
4180
- },
4181
- "gemma-4-31b-it": {
4182
- id: "gemma-4-31b-it",
4183
- name: "Gemma 4 31B",
4184
- api: "google-generative-ai",
4185
- provider: "google",
4186
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4187
- reasoning: true,
4188
- input: ["text", "image"],
4189
- cost: {
4190
- input: 0,
4191
- output: 0,
4192
- cacheRead: 0,
4193
- cacheWrite: 0,
4194
- },
4195
- contextWindow: 256000,
4196
- maxTokens: 8192,
4197
- },
4198
- },
4199
- "google-antigravity": {
4200
- "claude-opus-4-5-thinking": {
4201
- id: "claude-opus-4-5-thinking",
4202
- name: "Claude Opus 4.5 Thinking (Antigravity)",
4203
- api: "google-gemini-cli",
4204
- provider: "google-antigravity",
4205
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4206
- reasoning: true,
4207
- input: ["text", "image"],
4208
- cost: {
4209
- input: 5,
4210
- output: 25,
4211
- cacheRead: 0.5,
4212
- cacheWrite: 6.25,
4213
- },
4214
- contextWindow: 200000,
4215
- maxTokens: 64000,
4216
- },
4217
- "claude-opus-4-6-thinking": {
4218
- id: "claude-opus-4-6-thinking",
4219
- name: "Claude Opus 4.6 Thinking (Antigravity)",
4220
- api: "google-gemini-cli",
4221
- provider: "google-antigravity",
4222
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4223
- reasoning: true,
4224
- input: ["text", "image"],
4225
- cost: {
4226
- input: 5,
4227
- output: 25,
4228
- cacheRead: 0.5,
4229
- cacheWrite: 6.25,
4230
- },
4231
- contextWindow: 200000,
4232
- maxTokens: 128000,
4233
- },
4234
- "claude-sonnet-4-5": {
4235
- id: "claude-sonnet-4-5",
4236
- name: "Claude Sonnet 4.5 (Antigravity)",
4237
- api: "google-gemini-cli",
4238
- provider: "google-antigravity",
4239
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4240
- reasoning: false,
4241
- input: ["text", "image"],
4242
- cost: {
4243
- input: 3,
4244
- output: 15,
4245
- cacheRead: 0.3,
4246
- cacheWrite: 3.75,
4247
- },
4248
- contextWindow: 200000,
4249
- maxTokens: 64000,
4250
- },
4251
- "claude-sonnet-4-5-thinking": {
4252
- id: "claude-sonnet-4-5-thinking",
4253
- name: "Claude Sonnet 4.5 Thinking (Antigravity)",
4254
- api: "google-gemini-cli",
4255
- provider: "google-antigravity",
4256
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4257
- reasoning: true,
4258
- input: ["text", "image"],
4259
- cost: {
4260
- input: 3,
4261
- output: 15,
4262
- cacheRead: 0.3,
4263
- cacheWrite: 3.75,
4264
- },
4265
- contextWindow: 200000,
4266
- maxTokens: 64000,
4267
- },
4268
- "claude-sonnet-4-6": {
4269
- id: "claude-sonnet-4-6",
4270
- name: "Claude Sonnet 4.6 (Antigravity)",
4271
- api: "google-gemini-cli",
4272
- provider: "google-antigravity",
4273
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4274
- reasoning: true,
4275
- input: ["text", "image"],
4276
- cost: {
4277
- input: 3,
4278
- output: 15,
4279
- cacheRead: 0.3,
4280
- cacheWrite: 3.75,
4281
- },
4282
- contextWindow: 200000,
4283
- maxTokens: 64000,
4284
- },
4285
- "gemini-3-flash": {
4286
- id: "gemini-3-flash",
4287
- name: "Gemini 3 Flash (Antigravity)",
4288
- api: "google-gemini-cli",
4289
- provider: "google-antigravity",
4290
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4291
- reasoning: true,
4292
- input: ["text", "image"],
4293
- cost: {
4294
- input: 0.5,
4295
- output: 3,
4296
- cacheRead: 0.5,
4297
- cacheWrite: 0,
4298
- },
4299
- contextWindow: 1048576,
4300
- maxTokens: 65535,
4301
- },
4302
- "gemini-3.1-pro-high": {
4303
- id: "gemini-3.1-pro-high",
4304
- name: "Gemini 3.1 Pro High (Antigravity)",
4305
- api: "google-gemini-cli",
4306
- provider: "google-antigravity",
4307
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4308
- reasoning: true,
4309
- input: ["text", "image"],
4310
- cost: {
4311
- input: 2,
4312
- output: 12,
4313
- cacheRead: 0.2,
4314
- cacheWrite: 2.375,
4315
- },
4316
- contextWindow: 1048576,
4317
- maxTokens: 65535,
4318
- },
4319
- "gemini-3.1-pro-low": {
4320
- id: "gemini-3.1-pro-low",
4321
- name: "Gemini 3.1 Pro Low (Antigravity)",
4322
- api: "google-gemini-cli",
4323
- provider: "google-antigravity",
4324
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4325
- reasoning: true,
4326
- input: ["text", "image"],
4327
- cost: {
4328
- input: 2,
4329
- output: 12,
4330
- cacheRead: 0.2,
4331
- cacheWrite: 2.375,
4332
- },
4333
- contextWindow: 1048576,
4334
- maxTokens: 65535,
4335
- },
4336
- "gpt-oss-120b-medium": {
4337
- id: "gpt-oss-120b-medium",
4338
- name: "GPT-OSS 120B Medium (Antigravity)",
4339
- api: "google-gemini-cli",
4340
- provider: "google-antigravity",
4341
- baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4342
- reasoning: false,
4343
- input: ["text"],
4344
- cost: {
4345
- input: 0.09,
4346
- output: 0.36,
4347
- cacheRead: 0,
4348
- cacheWrite: 0,
4349
- },
4350
- contextWindow: 131072,
4351
- maxTokens: 32768,
4352
- },
4353
- },
4354
- "google-gemini-cli": {
4355
- "gemini-2.0-flash": {
4356
- id: "gemini-2.0-flash",
4357
- name: "Gemini 2.0 Flash (Cloud Code Assist)",
4358
- api: "google-gemini-cli",
4359
- provider: "google-gemini-cli",
4360
- baseUrl: "https://cloudcode-pa.googleapis.com",
4361
- reasoning: false,
4362
- input: ["text", "image"],
4363
- cost: {
4364
- input: 0,
4365
- output: 0,
4366
- cacheRead: 0,
4367
- cacheWrite: 0,
4368
- },
4369
- contextWindow: 1048576,
4370
- maxTokens: 8192,
4371
- },
4372
- "gemini-2.5-flash": {
4373
- id: "gemini-2.5-flash",
4374
- name: "Gemini 2.5 Flash (Cloud Code Assist)",
4375
- api: "google-gemini-cli",
4376
- provider: "google-gemini-cli",
4377
- baseUrl: "https://cloudcode-pa.googleapis.com",
4378
- reasoning: true,
4379
- input: ["text", "image"],
4380
- cost: {
4381
- input: 0,
4382
- output: 0,
4383
- cacheRead: 0,
4384
- cacheWrite: 0,
4385
- },
4386
- contextWindow: 1048576,
4387
- maxTokens: 65535,
4388
- },
4389
- "gemini-2.5-pro": {
4390
- id: "gemini-2.5-pro",
4391
- name: "Gemini 2.5 Pro (Cloud Code Assist)",
4392
- api: "google-gemini-cli",
4393
- provider: "google-gemini-cli",
4394
- baseUrl: "https://cloudcode-pa.googleapis.com",
4395
- reasoning: true,
4396
- input: ["text", "image"],
4397
- cost: {
4398
- input: 0,
4399
- output: 0,
4400
- cacheRead: 0,
4401
- cacheWrite: 0,
4402
- },
4403
- contextWindow: 1048576,
4404
- maxTokens: 65535,
4405
- },
4406
- "gemini-3-flash-preview": {
4407
- id: "gemini-3-flash-preview",
4408
- name: "Gemini 3 Flash Preview (Cloud Code Assist)",
4409
- api: "google-gemini-cli",
4410
- provider: "google-gemini-cli",
4411
- baseUrl: "https://cloudcode-pa.googleapis.com",
4412
- reasoning: true,
4413
- input: ["text", "image"],
4414
- cost: {
4415
- input: 0,
4416
- output: 0,
4417
- cacheRead: 0,
4418
- cacheWrite: 0,
4419
- },
4420
- contextWindow: 1048576,
4421
- maxTokens: 65535,
4422
- },
4423
- "gemini-3-pro-preview": {
4424
- id: "gemini-3-pro-preview",
4425
- name: "Gemini 3 Pro Preview (Cloud Code Assist)",
4426
- api: "google-gemini-cli",
4427
- provider: "google-gemini-cli",
4428
- baseUrl: "https://cloudcode-pa.googleapis.com",
4429
- reasoning: true,
4430
- input: ["text", "image"],
4431
- cost: {
4432
- input: 0,
4433
- output: 0,
4434
- cacheRead: 0,
4435
- cacheWrite: 0,
4436
- },
4437
- contextWindow: 1048576,
4438
- maxTokens: 65535,
4439
- },
4440
- "gemini-3.1-flash-lite-preview": {
4441
- id: "gemini-3.1-flash-lite-preview",
4442
- name: "Gemini 3.1 Flash Lite Preview (Cloud Code Assist)",
4443
- api: "google-gemini-cli",
4444
- provider: "google-gemini-cli",
4445
- baseUrl: "https://cloudcode-pa.googleapis.com",
4785
+ api: "google-generative-ai",
4786
+ provider: "google",
4787
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4446
4788
  reasoning: true,
4447
4789
  input: ["text", "image"],
4448
4790
  cost: {
@@ -4451,15 +4793,15 @@ export const MODELS = {
4451
4793
  cacheRead: 0,
4452
4794
  cacheWrite: 0,
4453
4795
  },
4454
- contextWindow: 1048576,
4455
- maxTokens: 65535,
4796
+ contextWindow: 256000,
4797
+ maxTokens: 8192,
4456
4798
  },
4457
- "gemini-3.1-pro-preview": {
4458
- id: "gemini-3.1-pro-preview",
4459
- name: "Gemini 3.1 Pro Preview (Cloud Code Assist)",
4460
- api: "google-gemini-cli",
4461
- provider: "google-gemini-cli",
4462
- baseUrl: "https://cloudcode-pa.googleapis.com",
4799
+ "gemma-4-31b-it": {
4800
+ id: "gemma-4-31b-it",
4801
+ name: "Gemma 4 31B",
4802
+ api: "google-generative-ai",
4803
+ provider: "google",
4804
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4463
4805
  reasoning: true,
4464
4806
  input: ["text", "image"],
4465
4807
  cost: {
@@ -4468,8 +4810,8 @@ export const MODELS = {
4468
4810
  cacheRead: 0,
4469
4811
  cacheWrite: 0,
4470
4812
  },
4471
- contextWindow: 1048576,
4472
- maxTokens: 65535,
4813
+ contextWindow: 256000,
4814
+ maxTokens: 8192,
4473
4815
  },
4474
4816
  },
4475
4817
  "google-vertex": {
@@ -5802,22 +6144,56 @@ export const MODELS = {
5802
6144
  contextWindow: 262144,
5803
6145
  maxTokens: 262144,
5804
6146
  },
6147
+ "mistral-medium-2604": {
6148
+ id: "mistral-medium-2604",
6149
+ name: "Mistral Medium 3.5",
6150
+ api: "mistral-conversations",
6151
+ provider: "mistral",
6152
+ baseUrl: "https://api.mistral.ai",
6153
+ reasoning: true,
6154
+ input: ["text", "image"],
6155
+ cost: {
6156
+ input: 1.5,
6157
+ output: 7.5,
6158
+ cacheRead: 0,
6159
+ cacheWrite: 0,
6160
+ },
6161
+ contextWindow: 262144,
6162
+ maxTokens: 262144,
6163
+ },
6164
+ "mistral-medium-3.5": {
6165
+ id: "mistral-medium-3.5",
6166
+ name: "Mistral Medium 3.5",
6167
+ api: "mistral-conversations",
6168
+ provider: "mistral",
6169
+ baseUrl: "https://api.mistral.ai",
6170
+ reasoning: true,
6171
+ input: ["text", "image"],
6172
+ cost: {
6173
+ input: 1.5,
6174
+ output: 7.5,
6175
+ cacheRead: 0,
6176
+ cacheWrite: 0,
6177
+ },
6178
+ contextWindow: 262144,
6179
+ maxTokens: 262144,
6180
+ },
5805
6181
  "mistral-medium-latest": {
5806
6182
  id: "mistral-medium-latest",
5807
6183
  name: "Mistral Medium (latest)",
5808
6184
  api: "mistral-conversations",
5809
6185
  provider: "mistral",
5810
6186
  baseUrl: "https://api.mistral.ai",
5811
- reasoning: false,
6187
+ reasoning: true,
5812
6188
  input: ["text", "image"],
5813
6189
  cost: {
5814
- input: 0.4,
5815
- output: 2,
6190
+ input: 1.5,
6191
+ output: 7.5,
5816
6192
  cacheRead: 0,
5817
6193
  cacheWrite: 0,
5818
6194
  },
5819
- contextWindow: 128000,
5820
- maxTokens: 16384,
6195
+ contextWindow: 262144,
6196
+ maxTokens: 262144,
5821
6197
  },
5822
6198
  "mistral-nemo": {
5823
6199
  id: "mistral-nemo",
@@ -5913,64 +6289,320 @@ export const MODELS = {
5913
6289
  reasoning: false,
5914
6290
  input: ["text"],
5915
6291
  cost: {
5916
- input: 2,
5917
- output: 6,
5918
- cacheRead: 0,
6292
+ input: 2,
6293
+ output: 6,
6294
+ cacheRead: 0,
6295
+ cacheWrite: 0,
6296
+ },
6297
+ contextWindow: 64000,
6298
+ maxTokens: 64000,
6299
+ },
6300
+ "open-mixtral-8x7b": {
6301
+ id: "open-mixtral-8x7b",
6302
+ name: "Mixtral 8x7B",
6303
+ api: "mistral-conversations",
6304
+ provider: "mistral",
6305
+ baseUrl: "https://api.mistral.ai",
6306
+ reasoning: false,
6307
+ input: ["text"],
6308
+ cost: {
6309
+ input: 0.7,
6310
+ output: 0.7,
6311
+ cacheRead: 0,
6312
+ cacheWrite: 0,
6313
+ },
6314
+ contextWindow: 32000,
6315
+ maxTokens: 32000,
6316
+ },
6317
+ "pixtral-12b": {
6318
+ id: "pixtral-12b",
6319
+ name: "Pixtral 12B",
6320
+ api: "mistral-conversations",
6321
+ provider: "mistral",
6322
+ baseUrl: "https://api.mistral.ai",
6323
+ reasoning: false,
6324
+ input: ["text", "image"],
6325
+ cost: {
6326
+ input: 0.15,
6327
+ output: 0.15,
6328
+ cacheRead: 0,
6329
+ cacheWrite: 0,
6330
+ },
6331
+ contextWindow: 128000,
6332
+ maxTokens: 128000,
6333
+ },
6334
+ "pixtral-large-latest": {
6335
+ id: "pixtral-large-latest",
6336
+ name: "Pixtral Large (latest)",
6337
+ api: "mistral-conversations",
6338
+ provider: "mistral",
6339
+ baseUrl: "https://api.mistral.ai",
6340
+ reasoning: false,
6341
+ input: ["text", "image"],
6342
+ cost: {
6343
+ input: 2,
6344
+ output: 6,
6345
+ cacheRead: 0,
6346
+ cacheWrite: 0,
6347
+ },
6348
+ contextWindow: 128000,
6349
+ maxTokens: 128000,
6350
+ },
6351
+ },
6352
+ "moonshotai": {
6353
+ "kimi-k2-0711-preview": {
6354
+ id: "kimi-k2-0711-preview",
6355
+ name: "Kimi K2 0711",
6356
+ api: "openai-completions",
6357
+ provider: "moonshotai",
6358
+ baseUrl: "https://api.moonshot.ai/v1",
6359
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6360
+ reasoning: false,
6361
+ input: ["text"],
6362
+ cost: {
6363
+ input: 0.6,
6364
+ output: 2.5,
6365
+ cacheRead: 0.15,
6366
+ cacheWrite: 0,
6367
+ },
6368
+ contextWindow: 131072,
6369
+ maxTokens: 16384,
6370
+ },
6371
+ "kimi-k2-0905-preview": {
6372
+ id: "kimi-k2-0905-preview",
6373
+ name: "Kimi K2 0905",
6374
+ api: "openai-completions",
6375
+ provider: "moonshotai",
6376
+ baseUrl: "https://api.moonshot.ai/v1",
6377
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6378
+ reasoning: false,
6379
+ input: ["text"],
6380
+ cost: {
6381
+ input: 0.6,
6382
+ output: 2.5,
6383
+ cacheRead: 0.15,
6384
+ cacheWrite: 0,
6385
+ },
6386
+ contextWindow: 262144,
6387
+ maxTokens: 262144,
6388
+ },
6389
+ "kimi-k2-thinking": {
6390
+ id: "kimi-k2-thinking",
6391
+ name: "Kimi K2 Thinking",
6392
+ api: "openai-completions",
6393
+ provider: "moonshotai",
6394
+ baseUrl: "https://api.moonshot.ai/v1",
6395
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6396
+ reasoning: true,
6397
+ input: ["text"],
6398
+ cost: {
6399
+ input: 0.6,
6400
+ output: 2.5,
6401
+ cacheRead: 0.15,
6402
+ cacheWrite: 0,
6403
+ },
6404
+ contextWindow: 262144,
6405
+ maxTokens: 262144,
6406
+ },
6407
+ "kimi-k2-thinking-turbo": {
6408
+ id: "kimi-k2-thinking-turbo",
6409
+ name: "Kimi K2 Thinking Turbo",
6410
+ api: "openai-completions",
6411
+ provider: "moonshotai",
6412
+ baseUrl: "https://api.moonshot.ai/v1",
6413
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6414
+ reasoning: true,
6415
+ input: ["text"],
6416
+ cost: {
6417
+ input: 1.15,
6418
+ output: 8,
6419
+ cacheRead: 0.15,
6420
+ cacheWrite: 0,
6421
+ },
6422
+ contextWindow: 262144,
6423
+ maxTokens: 262144,
6424
+ },
6425
+ "kimi-k2-turbo-preview": {
6426
+ id: "kimi-k2-turbo-preview",
6427
+ name: "Kimi K2 Turbo",
6428
+ api: "openai-completions",
6429
+ provider: "moonshotai",
6430
+ baseUrl: "https://api.moonshot.ai/v1",
6431
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6432
+ reasoning: false,
6433
+ input: ["text"],
6434
+ cost: {
6435
+ input: 2.4,
6436
+ output: 10,
6437
+ cacheRead: 0.6,
6438
+ cacheWrite: 0,
6439
+ },
6440
+ contextWindow: 262144,
6441
+ maxTokens: 262144,
6442
+ },
6443
+ "kimi-k2.5": {
6444
+ id: "kimi-k2.5",
6445
+ name: "Kimi K2.5",
6446
+ api: "openai-completions",
6447
+ provider: "moonshotai",
6448
+ baseUrl: "https://api.moonshot.ai/v1",
6449
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6450
+ reasoning: true,
6451
+ input: ["text", "image"],
6452
+ cost: {
6453
+ input: 0.6,
6454
+ output: 3,
6455
+ cacheRead: 0.1,
6456
+ cacheWrite: 0,
6457
+ },
6458
+ contextWindow: 262144,
6459
+ maxTokens: 262144,
6460
+ },
6461
+ "kimi-k2.6": {
6462
+ id: "kimi-k2.6",
6463
+ name: "Kimi K2.6",
6464
+ api: "openai-completions",
6465
+ provider: "moonshotai",
6466
+ baseUrl: "https://api.moonshot.ai/v1",
6467
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6468
+ reasoning: true,
6469
+ input: ["text", "image"],
6470
+ cost: {
6471
+ input: 0.95,
6472
+ output: 4,
6473
+ cacheRead: 0.16,
6474
+ cacheWrite: 0,
6475
+ },
6476
+ contextWindow: 262144,
6477
+ maxTokens: 262144,
6478
+ },
6479
+ },
6480
+ "moonshotai-cn": {
6481
+ "kimi-k2-0711-preview": {
6482
+ id: "kimi-k2-0711-preview",
6483
+ name: "Kimi K2 0711",
6484
+ api: "openai-completions",
6485
+ provider: "moonshotai-cn",
6486
+ baseUrl: "https://api.moonshot.cn/v1",
6487
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6488
+ reasoning: false,
6489
+ input: ["text"],
6490
+ cost: {
6491
+ input: 0.6,
6492
+ output: 2.5,
6493
+ cacheRead: 0.15,
6494
+ cacheWrite: 0,
6495
+ },
6496
+ contextWindow: 131072,
6497
+ maxTokens: 16384,
6498
+ },
6499
+ "kimi-k2-0905-preview": {
6500
+ id: "kimi-k2-0905-preview",
6501
+ name: "Kimi K2 0905",
6502
+ api: "openai-completions",
6503
+ provider: "moonshotai-cn",
6504
+ baseUrl: "https://api.moonshot.cn/v1",
6505
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6506
+ reasoning: false,
6507
+ input: ["text"],
6508
+ cost: {
6509
+ input: 0.6,
6510
+ output: 2.5,
6511
+ cacheRead: 0.15,
6512
+ cacheWrite: 0,
6513
+ },
6514
+ contextWindow: 262144,
6515
+ maxTokens: 262144,
6516
+ },
6517
+ "kimi-k2-thinking": {
6518
+ id: "kimi-k2-thinking",
6519
+ name: "Kimi K2 Thinking",
6520
+ api: "openai-completions",
6521
+ provider: "moonshotai-cn",
6522
+ baseUrl: "https://api.moonshot.cn/v1",
6523
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6524
+ reasoning: true,
6525
+ input: ["text"],
6526
+ cost: {
6527
+ input: 0.6,
6528
+ output: 2.5,
6529
+ cacheRead: 0.15,
6530
+ cacheWrite: 0,
6531
+ },
6532
+ contextWindow: 262144,
6533
+ maxTokens: 262144,
6534
+ },
6535
+ "kimi-k2-thinking-turbo": {
6536
+ id: "kimi-k2-thinking-turbo",
6537
+ name: "Kimi K2 Thinking Turbo",
6538
+ api: "openai-completions",
6539
+ provider: "moonshotai-cn",
6540
+ baseUrl: "https://api.moonshot.cn/v1",
6541
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6542
+ reasoning: true,
6543
+ input: ["text"],
6544
+ cost: {
6545
+ input: 1.15,
6546
+ output: 8,
6547
+ cacheRead: 0.15,
5919
6548
  cacheWrite: 0,
5920
6549
  },
5921
- contextWindow: 64000,
5922
- maxTokens: 64000,
6550
+ contextWindow: 262144,
6551
+ maxTokens: 262144,
5923
6552
  },
5924
- "open-mixtral-8x7b": {
5925
- id: "open-mixtral-8x7b",
5926
- name: "Mixtral 8x7B",
5927
- api: "mistral-conversations",
5928
- provider: "mistral",
5929
- baseUrl: "https://api.mistral.ai",
6553
+ "kimi-k2-turbo-preview": {
6554
+ id: "kimi-k2-turbo-preview",
6555
+ name: "Kimi K2 Turbo",
6556
+ api: "openai-completions",
6557
+ provider: "moonshotai-cn",
6558
+ baseUrl: "https://api.moonshot.cn/v1",
6559
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
5930
6560
  reasoning: false,
5931
6561
  input: ["text"],
5932
6562
  cost: {
5933
- input: 0.7,
5934
- output: 0.7,
5935
- cacheRead: 0,
6563
+ input: 2.4,
6564
+ output: 10,
6565
+ cacheRead: 0.6,
5936
6566
  cacheWrite: 0,
5937
6567
  },
5938
- contextWindow: 32000,
5939
- maxTokens: 32000,
6568
+ contextWindow: 262144,
6569
+ maxTokens: 262144,
5940
6570
  },
5941
- "pixtral-12b": {
5942
- id: "pixtral-12b",
5943
- name: "Pixtral 12B",
5944
- api: "mistral-conversations",
5945
- provider: "mistral",
5946
- baseUrl: "https://api.mistral.ai",
5947
- reasoning: false,
6571
+ "kimi-k2.5": {
6572
+ id: "kimi-k2.5",
6573
+ name: "Kimi K2.5",
6574
+ api: "openai-completions",
6575
+ provider: "moonshotai-cn",
6576
+ baseUrl: "https://api.moonshot.cn/v1",
6577
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6578
+ reasoning: true,
5948
6579
  input: ["text", "image"],
5949
6580
  cost: {
5950
- input: 0.15,
5951
- output: 0.15,
5952
- cacheRead: 0,
6581
+ input: 0.6,
6582
+ output: 3,
6583
+ cacheRead: 0.1,
5953
6584
  cacheWrite: 0,
5954
6585
  },
5955
- contextWindow: 128000,
5956
- maxTokens: 128000,
6586
+ contextWindow: 262144,
6587
+ maxTokens: 262144,
5957
6588
  },
5958
- "pixtral-large-latest": {
5959
- id: "pixtral-large-latest",
5960
- name: "Pixtral Large (latest)",
5961
- api: "mistral-conversations",
5962
- provider: "mistral",
5963
- baseUrl: "https://api.mistral.ai",
5964
- reasoning: false,
6589
+ "kimi-k2.6": {
6590
+ id: "kimi-k2.6",
6591
+ name: "Kimi K2.6",
6592
+ api: "openai-completions",
6593
+ provider: "moonshotai-cn",
6594
+ baseUrl: "https://api.moonshot.cn/v1",
6595
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6596
+ reasoning: true,
5965
6597
  input: ["text", "image"],
5966
6598
  cost: {
5967
- input: 2,
5968
- output: 6,
5969
- cacheRead: 0,
6599
+ input: 0.95,
6600
+ output: 4,
6601
+ cacheRead: 0.16,
5970
6602
  cacheWrite: 0,
5971
6603
  },
5972
- contextWindow: 128000,
5973
- maxTokens: 128000,
6604
+ contextWindow: 262144,
6605
+ maxTokens: 262144,
5974
6606
  },
5975
6607
  },
5976
6608
  "openai": {
@@ -6535,6 +7167,23 @@ export const MODELS = {
6535
7167
  contextWindow: 272000,
6536
7168
  maxTokens: 128000,
6537
7169
  },
7170
+ "gpt-5.5-pro": {
7171
+ id: "gpt-5.5-pro",
7172
+ name: "GPT-5.5 Pro",
7173
+ api: "openai-responses",
7174
+ provider: "openai",
7175
+ baseUrl: "https://api.openai.com/v1",
7176
+ reasoning: true,
7177
+ input: ["text", "image"],
7178
+ cost: {
7179
+ input: 30,
7180
+ output: 180,
7181
+ cacheRead: 0,
7182
+ cacheWrite: 0,
7183
+ },
7184
+ contextWindow: 1050000,
7185
+ maxTokens: 128000,
7186
+ },
6538
7187
  "o1": {
6539
7188
  id: "o1",
6540
7189
  name: "o1",
@@ -7389,23 +8038,6 @@ export const MODELS = {
7389
8038
  contextWindow: 262144,
7390
8039
  maxTokens: 65536,
7391
8040
  },
7392
- "ling-2.6-flash-free": {
7393
- id: "ling-2.6-flash-free",
7394
- name: "Ling 2.6 Flash Free",
7395
- api: "openai-completions",
7396
- provider: "opencode",
7397
- baseUrl: "https://opencode.ai/zen/v1",
7398
- reasoning: false,
7399
- input: ["text"],
7400
- cost: {
7401
- input: 0,
7402
- output: 0,
7403
- cacheRead: 0,
7404
- cacheWrite: 0,
7405
- },
7406
- contextWindow: 262100,
7407
- maxTokens: 32800,
7408
- },
7409
8041
  "minimax-m2.5": {
7410
8042
  id: "minimax-m2.5",
7411
8043
  name: "MiniMax M2.5",
@@ -7516,7 +8148,7 @@ export const MODELS = {
7516
8148
  api: "openai-completions",
7517
8149
  provider: "opencode-go",
7518
8150
  baseUrl: "https://opencode.ai/zen/go/v1",
7519
- compat: { "requiresReasoningContentOnAssistantMessages": true },
8151
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek", "reasoningEffortMap": { "minimal": "high", "low": "high", "medium": "high", "high": "high", "xhigh": "max" } },
7520
8152
  reasoning: true,
7521
8153
  input: ["text"],
7522
8154
  cost: {
@@ -7534,7 +8166,7 @@ export const MODELS = {
7534
8166
  api: "openai-completions",
7535
8167
  provider: "opencode-go",
7536
8168
  baseUrl: "https://opencode.ai/zen/go/v1",
7537
- compat: { "requiresReasoningContentOnAssistantMessages": true },
8169
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek", "reasoningEffortMap": { "minimal": "high", "low": "high", "medium": "high", "high": "high", "xhigh": "max" } },
7538
8170
  reasoning: true,
7539
8171
  input: ["text"],
7540
8172
  cost: {
@@ -8489,7 +9121,7 @@ export const MODELS = {
8489
9121
  api: "openai-completions",
8490
9122
  provider: "openrouter",
8491
9123
  baseUrl: "https://openrouter.ai/api/v1",
8492
- compat: { "requiresReasoningContentOnAssistantMessages": true },
9124
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "reasoningEffortMap": { "minimal": "high", "low": "high", "medium": "high", "high": "high", "xhigh": "max" } },
8493
9125
  reasoning: true,
8494
9126
  input: ["text"],
8495
9127
  cost: {
@@ -8507,7 +9139,7 @@ export const MODELS = {
8507
9139
  api: "openai-completions",
8508
9140
  provider: "openrouter",
8509
9141
  baseUrl: "https://openrouter.ai/api/v1",
8510
- compat: { "requiresReasoningContentOnAssistantMessages": true },
9142
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "reasoningEffortMap": { "minimal": "high", "low": "high", "medium": "high", "high": "high", "xhigh": "max" } },
8511
9143
  reasoning: true,
8512
9144
  input: ["text"],
8513
9145
  cost: {
@@ -8842,6 +9474,23 @@ export const MODELS = {
8842
9474
  contextWindow: 262144,
8843
9475
  maxTokens: 32768,
8844
9476
  },
9477
+ "ibm-granite/granite-4.1-8b": {
9478
+ id: "ibm-granite/granite-4.1-8b",
9479
+ name: "IBM: Granite 4.1 8B",
9480
+ api: "openai-completions",
9481
+ provider: "openrouter",
9482
+ baseUrl: "https://openrouter.ai/api/v1",
9483
+ reasoning: false,
9484
+ input: ["text"],
9485
+ cost: {
9486
+ input: 0.049999999999999996,
9487
+ output: 0.09999999999999999,
9488
+ cacheRead: 0.049999999999999996,
9489
+ cacheWrite: 0,
9490
+ },
9491
+ contextWindow: 131072,
9492
+ maxTokens: 131072,
9493
+ },
8845
9494
  "inception/mercury-2": {
8846
9495
  id: "inception/mercury-2",
8847
9496
  name: "Inception: Mercury 2",
@@ -8876,18 +9525,18 @@ export const MODELS = {
8876
9525
  contextWindow: 262144,
8877
9526
  maxTokens: 32768,
8878
9527
  },
8879
- "inclusionai/ling-2.6-flash:free": {
8880
- id: "inclusionai/ling-2.6-flash:free",
8881
- name: "inclusionAI: Ling-2.6-flash (free)",
9528
+ "inclusionai/ling-2.6-flash": {
9529
+ id: "inclusionai/ling-2.6-flash",
9530
+ name: "inclusionAI: Ling-2.6-flash",
8882
9531
  api: "openai-completions",
8883
9532
  provider: "openrouter",
8884
9533
  baseUrl: "https://openrouter.ai/api/v1",
8885
9534
  reasoning: false,
8886
9535
  input: ["text"],
8887
9536
  cost: {
8888
- input: 0,
8889
- output: 0,
8890
- cacheRead: 0,
9537
+ input: 0.08,
9538
+ output: 0.24,
9539
+ cacheRead: 0.016,
8891
9540
  cacheWrite: 0,
8892
9541
  },
8893
9542
  contextWindow: 262144,
@@ -9345,12 +9994,12 @@ export const MODELS = {
9345
9994
  input: ["text"],
9346
9995
  cost: {
9347
9996
  input: 0.02,
9348
- output: 0.04,
9997
+ output: 0.03,
9349
9998
  cacheRead: 0,
9350
9999
  cacheWrite: 0,
9351
10000
  },
9352
10001
  contextWindow: 131072,
9353
- maxTokens: 16384,
10002
+ maxTokens: 4096,
9354
10003
  },
9355
10004
  "mistralai/mistral-saba": {
9356
10005
  id: "mistralai/mistral-saba",
@@ -9403,23 +10052,6 @@ export const MODELS = {
9403
10052
  contextWindow: 128000,
9404
10053
  maxTokens: 16384,
9405
10054
  },
9406
- "mistralai/mistral-small-creative": {
9407
- id: "mistralai/mistral-small-creative",
9408
- name: "Mistral: Mistral Small Creative",
9409
- api: "openai-completions",
9410
- provider: "openrouter",
9411
- baseUrl: "https://openrouter.ai/api/v1",
9412
- reasoning: false,
9413
- input: ["text"],
9414
- cost: {
9415
- input: 0.09999999999999999,
9416
- output: 0.3,
9417
- cacheRead: 0.01,
9418
- cacheWrite: 0,
9419
- },
9420
- contextWindow: 32768,
9421
- maxTokens: 4096,
9422
- },
9423
10055
  "mistralai/mixtral-8x22b-instruct": {
9424
10056
  id: "mistralai/mixtral-8x22b-instruct",
9425
10057
  name: "Mistral: Mixtral 8x22B Instruct",
@@ -9565,13 +10197,13 @@ export const MODELS = {
9565
10197
  reasoning: true,
9566
10198
  input: ["text", "image"],
9567
10199
  cost: {
9568
- input: 0.7448,
9569
- output: 4.655,
9570
- cacheRead: 0.1463,
10200
+ input: 0.74,
10201
+ output: 3.49,
10202
+ cacheRead: 0.14,
9571
10203
  cacheWrite: 0,
9572
10204
  },
9573
- contextWindow: 256000,
9574
- maxTokens: 65536,
10205
+ contextWindow: 262142,
10206
+ maxTokens: 262142,
9575
10207
  },
9576
10208
  "nex-agi/deepseek-v3.1-nex-n1": {
9577
10209
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -10484,12 +11116,12 @@ export const MODELS = {
10484
11116
  input: ["text"],
10485
11117
  cost: {
10486
11118
  input: 0.039,
10487
- output: 0.19,
11119
+ output: 0.18,
10488
11120
  cacheRead: 0,
10489
11121
  cacheWrite: 0,
10490
11122
  },
10491
11123
  contextWindow: 131072,
10492
- maxTokens: 131072,
11124
+ maxTokens: 4096,
10493
11125
  },
10494
11126
  "openai/gpt-oss-120b:free": {
10495
11127
  id: "openai/gpt-oss-120b:free",
@@ -10746,6 +11378,23 @@ export const MODELS = {
10746
11378
  contextWindow: 200000,
10747
11379
  maxTokens: 4096,
10748
11380
  },
11381
+ "openrouter/owl-alpha": {
11382
+ id: "openrouter/owl-alpha",
11383
+ name: "Owl Alpha",
11384
+ api: "openai-completions",
11385
+ provider: "openrouter",
11386
+ baseUrl: "https://openrouter.ai/api/v1",
11387
+ reasoning: false,
11388
+ input: ["text"],
11389
+ cost: {
11390
+ input: 0,
11391
+ output: 0,
11392
+ cacheRead: 0,
11393
+ cacheWrite: 0,
11394
+ },
11395
+ contextWindow: 1048756,
11396
+ maxTokens: 262144,
11397
+ },
10749
11398
  "poolside/laguna-m.1:free": {
10750
11399
  id: "poolside/laguna-m.1:free",
10751
11400
  name: "Poolside: Laguna M.1 (free)",
@@ -11596,23 +12245,6 @@ export const MODELS = {
11596
12245
  contextWindow: 1000000,
11597
12246
  maxTokens: 65536,
11598
12247
  },
11599
- "qwen/qwq-32b": {
11600
- id: "qwen/qwq-32b",
11601
- name: "Qwen: QwQ 32B",
11602
- api: "openai-completions",
11603
- provider: "openrouter",
11604
- baseUrl: "https://openrouter.ai/api/v1",
11605
- reasoning: true,
11606
- input: ["text"],
11607
- cost: {
11608
- input: 0.15,
11609
- output: 0.58,
11610
- cacheRead: 0,
11611
- cacheWrite: 0,
11612
- },
11613
- contextWindow: 131072,
11614
- maxTokens: 131072,
11615
- },
11616
12248
  "rekaai/reka-edge": {
11617
12249
  id: "rekaai/reka-edge",
11618
12250
  name: "Reka Edge",
@@ -12336,13 +12968,13 @@ export const MODELS = {
12336
12968
  reasoning: true,
12337
12969
  input: ["text", "image"],
12338
12970
  cost: {
12339
- input: 0.7448,
12340
- output: 4.655,
12341
- cacheRead: 0.1463,
12971
+ input: 0.74,
12972
+ output: 3.49,
12973
+ cacheRead: 0.14,
12342
12974
  cacheWrite: 0,
12343
12975
  },
12344
- contextWindow: 256000,
12345
- maxTokens: 65536,
12976
+ contextWindow: 262142,
12977
+ maxTokens: 262142,
12346
12978
  },
12347
12979
  "~openai/gpt-latest": {
12348
12980
  id: "~openai/gpt-latest",
@@ -12467,20 +13099,20 @@ export const MODELS = {
12467
13099
  },
12468
13100
  "alibaba/qwen3-235b-a22b-thinking": {
12469
13101
  id: "alibaba/qwen3-235b-a22b-thinking",
12470
- name: "Qwen3 235B A22B Thinking 2507",
13102
+ name: "Qwen3 VL 235B A22B Thinking",
12471
13103
  api: "anthropic-messages",
12472
13104
  provider: "vercel-ai-gateway",
12473
13105
  baseUrl: "https://ai-gateway.vercel.sh",
12474
13106
  reasoning: true,
12475
13107
  input: ["text", "image"],
12476
13108
  cost: {
12477
- input: 0.22999999999999998,
12478
- output: 2.3,
12479
- cacheRead: 0.19999999999999998,
13109
+ input: 0.39999999999999997,
13110
+ output: 4,
13111
+ cacheRead: 0,
12480
13112
  cacheWrite: 0,
12481
13113
  },
12482
- contextWindow: 262114,
12483
- maxTokens: 262114,
13114
+ contextWindow: 131072,
13115
+ maxTokens: 32768,
12484
13116
  },
12485
13117
  "alibaba/qwen3-coder": {
12486
13118
  id: "alibaba/qwen3-coder",
@@ -12652,6 +13284,23 @@ export const MODELS = {
12652
13284
  contextWindow: 1000000,
12653
13285
  maxTokens: 64000,
12654
13286
  },
13287
+ "alibaba/qwen3.6-27b": {
13288
+ id: "alibaba/qwen3.6-27b",
13289
+ name: "Qwen 3.6 27B",
13290
+ api: "anthropic-messages",
13291
+ provider: "vercel-ai-gateway",
13292
+ baseUrl: "https://ai-gateway.vercel.sh",
13293
+ reasoning: true,
13294
+ input: ["text", "image"],
13295
+ cost: {
13296
+ input: 0.6,
13297
+ output: 3.5999999999999996,
13298
+ cacheRead: 0,
13299
+ cacheWrite: 0,
13300
+ },
13301
+ contextWindow: 256000,
13302
+ maxTokens: 256000,
13303
+ },
12655
13304
  "alibaba/qwen3.6-plus": {
12656
13305
  id: "alibaba/qwen3.6-plus",
12657
13306
  name: "Qwen 3.6 Plus",
@@ -13032,16 +13681,16 @@ export const MODELS = {
13032
13681
  api: "anthropic-messages",
13033
13682
  provider: "vercel-ai-gateway",
13034
13683
  baseUrl: "https://ai-gateway.vercel.sh",
13035
- reasoning: true,
13684
+ reasoning: false,
13036
13685
  input: ["text"],
13037
13686
  cost: {
13038
- input: 0.28,
13039
- output: 0.42,
13040
- cacheRead: 0.028,
13687
+ input: 0.62,
13688
+ output: 1.85,
13689
+ cacheRead: 0,
13041
13690
  cacheWrite: 0,
13042
13691
  },
13043
13692
  contextWindow: 128000,
13044
- maxTokens: 64000,
13693
+ maxTokens: 8000,
13045
13694
  },
13046
13695
  "deepseek/deepseek-v4-flash": {
13047
13696
  id: "deepseek/deepseek-v4-flash",
@@ -14879,6 +15528,40 @@ export const MODELS = {
14879
15528
  contextWindow: 1000000,
14880
15529
  maxTokens: 128000,
14881
15530
  },
15531
+ "xiaomi/mimo-v2.5": {
15532
+ id: "xiaomi/mimo-v2.5",
15533
+ name: "MiMo M2.5",
15534
+ api: "anthropic-messages",
15535
+ provider: "vercel-ai-gateway",
15536
+ baseUrl: "https://ai-gateway.vercel.sh",
15537
+ reasoning: true,
15538
+ input: ["text", "image"],
15539
+ cost: {
15540
+ input: 0.39999999999999997,
15541
+ output: 2,
15542
+ cacheRead: 0.08,
15543
+ cacheWrite: 0,
15544
+ },
15545
+ contextWindow: 1050000,
15546
+ maxTokens: 131100,
15547
+ },
15548
+ "xiaomi/mimo-v2.5-pro": {
15549
+ id: "xiaomi/mimo-v2.5-pro",
15550
+ name: "MiMo V2.5 Pro",
15551
+ api: "anthropic-messages",
15552
+ provider: "vercel-ai-gateway",
15553
+ baseUrl: "https://ai-gateway.vercel.sh",
15554
+ reasoning: true,
15555
+ input: ["text", "image"],
15556
+ cost: {
15557
+ input: 1,
15558
+ output: 3,
15559
+ cacheRead: 0.19999999999999998,
15560
+ cacheWrite: 0,
15561
+ },
15562
+ contextWindow: 1050000,
15563
+ maxTokens: 131000,
15564
+ },
14882
15565
  "zai/glm-4.5": {
14883
15566
  id: "zai/glm-4.5",
14884
15567
  name: "GLM-4.5",
@@ -15584,6 +16267,24 @@ export const MODELS = {
15584
16267
  contextWindow: 200000,
15585
16268
  maxTokens: 131072,
15586
16269
  },
16270
+ "glm-5v-turbo": {
16271
+ id: "glm-5v-turbo",
16272
+ name: "glm-5v-turbo",
16273
+ api: "openai-completions",
16274
+ provider: "zai",
16275
+ baseUrl: "https://api.z.ai/api/coding/paas/v4",
16276
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16277
+ reasoning: true,
16278
+ input: ["text", "image"],
16279
+ cost: {
16280
+ input: 0,
16281
+ output: 0,
16282
+ cacheRead: 0,
16283
+ cacheWrite: 0,
16284
+ },
16285
+ contextWindow: 200000,
16286
+ maxTokens: 131072,
16287
+ },
15587
16288
  },
15588
16289
  };
15589
16290
  //# sourceMappingURL=models.generated.js.map