@llmgateway/models 1.3.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -7,6 +7,7 @@ export const alibabaModels = [
7
7
  releasedAt: new Date("2025-09-05"),
8
8
  providers: [
9
9
  {
10
+ test: "skip",
10
11
  providerId: "alibaba",
11
12
  modelName: "qwen-max",
12
13
  inputPrice: 1.6 / 1e6,
@@ -29,6 +30,7 @@ export const alibabaModels = [
29
30
  releasedAt: new Date("2025-01-25"),
30
31
  providers: [
31
32
  {
33
+ test: "skip",
32
34
  providerId: "alibaba",
33
35
  modelName: "qwen-max-latest",
34
36
  inputPrice: 1.6 / 1e6,
@@ -55,6 +57,23 @@ export const alibabaModels = [
55
57
  modelName: "qwen-plus",
56
58
  inputPrice: 0.4 / 1e6,
57
59
  outputPrice: 1.2 / 1e6,
60
+ cachedInputPrice: 0.08 / 1e6,
61
+ pricingTiers: [
62
+ {
63
+ name: "Up to 256K",
64
+ upToTokens: 256000,
65
+ inputPrice: 0.4 / 1e6,
66
+ outputPrice: 1.2 / 1e6,
67
+ cachedInputPrice: 0.08 / 1e6,
68
+ },
69
+ {
70
+ name: "Over 256K",
71
+ upToTokens: Infinity,
72
+ inputPrice: 1.2 / 1e6,
73
+ outputPrice: 3.6 / 1e6,
74
+ cachedInputPrice: 0.24 / 1e6,
75
+ },
76
+ ],
58
77
  requestPrice: 0,
59
78
  contextSize: 131072,
60
79
  maxOutput: 32000,
@@ -77,6 +96,23 @@ export const alibabaModels = [
77
96
  modelName: "qwen-plus-latest",
78
97
  inputPrice: 0.4 / 1e6,
79
98
  outputPrice: 1.2 / 1e6,
99
+ cachedInputPrice: 0.08 / 1e6,
100
+ pricingTiers: [
101
+ {
102
+ name: "Up to 256K",
103
+ upToTokens: 256000,
104
+ inputPrice: 0.4 / 1e6,
105
+ outputPrice: 1.2 / 1e6,
106
+ cachedInputPrice: 0.08 / 1e6,
107
+ },
108
+ {
109
+ name: "Over 256K",
110
+ upToTokens: Infinity,
111
+ inputPrice: 1.2 / 1e6,
112
+ outputPrice: 3.6 / 1e6,
113
+ cachedInputPrice: 0.24 / 1e6,
114
+ },
115
+ ],
80
116
  requestPrice: 0,
81
117
  contextSize: 1000000,
82
118
  maxOutput: 32000,
@@ -99,6 +135,23 @@ export const alibabaModels = [
99
135
  modelName: "qwen-flash",
100
136
  inputPrice: 0.05 / 1e6,
101
137
  outputPrice: 0.4 / 1e6,
138
+ cachedInputPrice: 0.01 / 1e6,
139
+ pricingTiers: [
140
+ {
141
+ name: "Up to 256K",
142
+ upToTokens: 256000,
143
+ inputPrice: 0.05 / 1e6,
144
+ outputPrice: 0.4 / 1e6,
145
+ cachedInputPrice: 0.01 / 1e6,
146
+ },
147
+ {
148
+ name: "Over 256K",
149
+ upToTokens: Infinity,
150
+ inputPrice: 0.25 / 1e6,
151
+ outputPrice: 2.0 / 1e6,
152
+ cachedInputPrice: 0.05 / 1e6,
153
+ },
154
+ ],
102
155
  requestPrice: 0,
103
156
  contextSize: 1000000,
104
157
  maxOutput: 32000,
@@ -236,6 +289,20 @@ export const alibabaModels = [
236
289
  tools: true,
237
290
  jsonOutput: true,
238
291
  },
292
+ {
293
+ providerId: "novita",
294
+ modelName: "qwen/qwen3-235b-a22b-instruct-2507",
295
+ inputPrice: 0.09 / 1e6,
296
+ outputPrice: 0.58 / 1e6,
297
+ requestPrice: 0,
298
+ contextSize: 131072,
299
+ maxOutput: 16384,
300
+ reasoning: false,
301
+ streaming: true,
302
+ vision: false,
303
+ tools: true,
304
+ jsonOutput: true,
305
+ },
239
306
  ],
240
307
  },
241
308
  {
@@ -260,6 +327,43 @@ export const alibabaModels = [
260
327
  stability: "unstable",
261
328
  jsonOutput: true,
262
329
  },
330
+ {
331
+ providerId: "novita",
332
+ modelName: "qwen/qwen3-235b-a22b-thinking-2507",
333
+ inputPrice: 0.3 / 1e6,
334
+ outputPrice: 3 / 1e6,
335
+ requestPrice: 0,
336
+ contextSize: 131072,
337
+ maxOutput: 32768,
338
+ reasoning: false,
339
+ streaming: true,
340
+ vision: false,
341
+ tools: true,
342
+ jsonOutput: false,
343
+ },
344
+ ],
345
+ },
346
+ {
347
+ id: "qwen3-235b-a22b-fp8",
348
+ name: "Qwen3 235B A22B FP8",
349
+ description: "Qwen 3 235B MoE with FP8 quantization.",
350
+ family: "alibaba",
351
+ releasedAt: new Date("2025-04-28"),
352
+ providers: [
353
+ {
354
+ providerId: "novita",
355
+ modelName: "qwen/qwen3-235b-a22b-fp8",
356
+ inputPrice: 0.2 / 1e6,
357
+ outputPrice: 0.8 / 1e6,
358
+ requestPrice: 0,
359
+ contextSize: 40960,
360
+ maxOutput: 20000,
361
+ reasoning: false,
362
+ streaming: true,
363
+ vision: false,
364
+ tools: false,
365
+ jsonOutput: true,
366
+ },
263
367
  ],
264
368
  },
265
369
  {
@@ -498,6 +602,19 @@ export const alibabaModels = [
498
602
  tools: true,
499
603
  jsonOutput: true,
500
604
  },
605
+ {
606
+ providerId: "novita",
607
+ modelName: "qwen/qwen3-coder-480b-a35b-instruct",
608
+ inputPrice: 0.3 / 1e6,
609
+ outputPrice: 1.3 / 1e6,
610
+ requestPrice: 0,
611
+ contextSize: 262144,
612
+ maxOutput: 65536,
613
+ streaming: true,
614
+ vision: false,
615
+ tools: true,
616
+ jsonOutput: true,
617
+ },
501
618
  ],
502
619
  },
503
620
  {
@@ -520,6 +637,19 @@ export const alibabaModels = [
520
637
  tools: true,
521
638
  jsonOutput: true,
522
639
  },
640
+ {
641
+ providerId: "novita",
642
+ modelName: "qwen/qwen3-coder-30b-a3b-instruct",
643
+ inputPrice: 0.07 / 1e6,
644
+ outputPrice: 0.27 / 1e6,
645
+ requestPrice: 0,
646
+ contextSize: 160000,
647
+ maxOutput: 32768,
648
+ streaming: true,
649
+ vision: false,
650
+ tools: true,
651
+ jsonOutput: true,
652
+ },
523
653
  ],
524
654
  },
525
655
  {
@@ -634,6 +764,20 @@ export const alibabaModels = [
634
764
  tools: true,
635
765
  jsonOutput: false,
636
766
  },
767
+ {
768
+ providerId: "novita",
769
+ modelName: "qwen/qwen3-next-80b-a3b-thinking",
770
+ inputPrice: 0.15 / 1e6,
771
+ outputPrice: 1.5 / 1e6,
772
+ requestPrice: 0,
773
+ contextSize: 131072,
774
+ maxOutput: 32768,
775
+ reasoning: true,
776
+ streaming: true,
777
+ vision: false,
778
+ tools: true,
779
+ jsonOutput: false,
780
+ },
637
781
  ],
638
782
  },
639
783
  {
@@ -656,6 +800,19 @@ export const alibabaModels = [
656
800
  tools: true,
657
801
  jsonOutput: true,
658
802
  },
803
+ {
804
+ providerId: "novita",
805
+ modelName: "qwen/qwen3-next-80b-a3b-instruct",
806
+ inputPrice: 0.15 / 1e6,
807
+ outputPrice: 1.5 / 1e6,
808
+ requestPrice: 0,
809
+ contextSize: 131072,
810
+ maxOutput: 32768,
811
+ streaming: true,
812
+ vision: false,
813
+ tools: true,
814
+ jsonOutput: true,
815
+ },
659
816
  ],
660
817
  },
661
818
  {
@@ -682,6 +839,19 @@ export const alibabaModels = [
682
839
  tools: true,
683
840
  jsonOutput: true,
684
841
  },
842
+ {
843
+ providerId: "novita",
844
+ modelName: "qwen/qwen3-max",
845
+ inputPrice: 0.845 / 1e6,
846
+ outputPrice: 3.38 / 1e6,
847
+ requestPrice: 0,
848
+ contextSize: 262144,
849
+ maxOutput: 65536,
850
+ streaming: true,
851
+ vision: false,
852
+ tools: true,
853
+ jsonOutput: true,
854
+ },
685
855
  ],
686
856
  },
687
857
  {
@@ -707,6 +877,120 @@ export const alibabaModels = [
707
877
  },
708
878
  ],
709
879
  },
880
+ {
881
+ id: "qwen3-vl-30b-a3b-instruct",
882
+ name: "Qwen3 VL 30B A3B Instruct",
883
+ description: "Vision-language Qwen 3 MoE model, 30B size.",
884
+ family: "alibaba",
885
+ releasedAt: new Date("2025-10-05"),
886
+ providers: [
887
+ {
888
+ providerId: "novita",
889
+ modelName: "qwen/qwen3-vl-30b-a3b-instruct",
890
+ inputPrice: 0.2 / 1e6,
891
+ outputPrice: 0.7 / 1e6,
892
+ requestPrice: 0,
893
+ contextSize: 131072,
894
+ maxOutput: 32768,
895
+ streaming: true,
896
+ vision: true,
897
+ tools: true,
898
+ jsonOutput: false,
899
+ },
900
+ ],
901
+ },
902
+ {
903
+ id: "qwen3-vl-30b-a3b-thinking",
904
+ name: "Qwen3 VL 30B A3B Thinking",
905
+ description: "Vision-language Qwen 3 MoE with reasoning capabilities.",
906
+ family: "alibaba",
907
+ releasedAt: new Date("2025-10-11"),
908
+ providers: [
909
+ {
910
+ providerId: "novita",
911
+ modelName: "qwen/qwen3-vl-30b-a3b-thinking",
912
+ inputPrice: 0.2 / 1e6,
913
+ outputPrice: 1 / 1e6,
914
+ requestPrice: 0,
915
+ contextSize: 131072,
916
+ maxOutput: 32768,
917
+ reasoning: true,
918
+ streaming: true,
919
+ vision: true,
920
+ tools: true,
921
+ jsonOutput: true,
922
+ },
923
+ ],
924
+ },
925
+ {
926
+ id: "qwen3-32b-fp8",
927
+ name: "Qwen3 32B FP8",
928
+ description: "Qwen 3 32B with FP8 quantization.",
929
+ family: "alibaba",
930
+ releasedAt: new Date("2025-04-28"),
931
+ providers: [
932
+ {
933
+ providerId: "novita",
934
+ modelName: "qwen/qwen3-32b-fp8",
935
+ inputPrice: 0.1 / 1e6,
936
+ outputPrice: 0.45 / 1e6,
937
+ requestPrice: 0,
938
+ contextSize: 40960,
939
+ maxOutput: 20000,
940
+ reasoning: false,
941
+ streaming: true,
942
+ vision: false,
943
+ tools: false,
944
+ jsonOutput: false,
945
+ },
946
+ ],
947
+ },
948
+ {
949
+ id: "qwen3-30b-a3b-fp8",
950
+ name: "Qwen3 30B A3B FP8",
951
+ description: "Qwen 3 30B MoE with FP8 quantization.",
952
+ family: "alibaba",
953
+ releasedAt: new Date("2025-04-28"),
954
+ providers: [
955
+ {
956
+ providerId: "novita",
957
+ modelName: "qwen/qwen3-30b-a3b-fp8",
958
+ inputPrice: 0.09 / 1e6,
959
+ outputPrice: 0.45 / 1e6,
960
+ requestPrice: 0,
961
+ contextSize: 40960,
962
+ maxOutput: 20000,
963
+ reasoning: false,
964
+ streaming: true,
965
+ vision: false,
966
+ tools: false,
967
+ jsonOutput: false,
968
+ },
969
+ ],
970
+ },
971
+ {
972
+ id: "qwen3-4b-fp8",
973
+ name: "Qwen3 4B FP8",
974
+ description: "Lightweight Qwen 3 4B with FP8 quantization.",
975
+ family: "alibaba",
976
+ releasedAt: new Date("2025-04-28"),
977
+ providers: [
978
+ {
979
+ providerId: "novita",
980
+ modelName: "qwen/qwen3-4b-fp8",
981
+ inputPrice: 0.03 / 1e6,
982
+ outputPrice: 0.03 / 1e6,
983
+ requestPrice: 0,
984
+ contextSize: 128000,
985
+ maxOutput: 20000,
986
+ reasoning: false,
987
+ streaming: true,
988
+ vision: false,
989
+ tools: false,
990
+ jsonOutput: false,
991
+ },
992
+ ],
993
+ },
710
994
  {
711
995
  id: "qwen-image-plus",
712
996
  name: "Qwen Image Plus",
@@ -807,5 +1091,392 @@ export const alibabaModels = [
807
1091
  },
808
1092
  ],
809
1093
  },
1094
+ {
1095
+ id: "qwq-plus",
1096
+ name: "QwQ Plus",
1097
+ description: "Alibaba's reasoning model with enhanced math and code capabilities.",
1098
+ family: "alibaba",
1099
+ releasedAt: new Date("2025-03-06"),
1100
+ providers: [
1101
+ {
1102
+ providerId: "alibaba",
1103
+ modelName: "qwq-plus",
1104
+ inputPrice: 0.8 / 1e6,
1105
+ outputPrice: 2.4 / 1e6,
1106
+ requestPrice: 0,
1107
+ contextSize: 131072,
1108
+ maxOutput: 8192,
1109
+ reasoning: true,
1110
+ reasoningOutput: "omit",
1111
+ streaming: true,
1112
+ vision: false,
1113
+ tools: false,
1114
+ jsonOutput: false,
1115
+ },
1116
+ ],
1117
+ },
1118
+ {
1119
+ id: "qwen-coder-plus",
1120
+ name: "Qwen Coder Plus",
1121
+ description: "Alibaba's code-specialized model based on Qwen2.5.",
1122
+ family: "alibaba",
1123
+ releasedAt: new Date("2024-09-18"),
1124
+ providers: [
1125
+ {
1126
+ test: "skip",
1127
+ providerId: "alibaba",
1128
+ modelName: "qwen-coder-plus",
1129
+ inputPrice: 1.0 / 1e6,
1130
+ outputPrice: 5.0 / 1e6,
1131
+ requestPrice: 0,
1132
+ contextSize: 131072,
1133
+ maxOutput: 8192,
1134
+ streaming: true,
1135
+ vision: false,
1136
+ tools: true,
1137
+ jsonOutput: true,
1138
+ },
1139
+ ],
1140
+ },
1141
+ {
1142
+ id: "qwen3-coder-flash",
1143
+ name: "Qwen3 Coder Flash",
1144
+ description: "Fast, cost-effective Qwen 3 model for code generation.",
1145
+ family: "alibaba",
1146
+ releasedAt: new Date("2025-07-22"),
1147
+ providers: [
1148
+ {
1149
+ providerId: "alibaba",
1150
+ modelName: "qwen3-coder-flash",
1151
+ inputPrice: 0.3 / 1e6,
1152
+ outputPrice: 1.5 / 1e6,
1153
+ cachedInputPrice: 0.06 / 1e6,
1154
+ pricingTiers: [
1155
+ {
1156
+ name: "Up to 32K",
1157
+ upToTokens: 32000,
1158
+ inputPrice: 0.3 / 1e6,
1159
+ outputPrice: 1.5 / 1e6,
1160
+ cachedInputPrice: 0.06 / 1e6,
1161
+ },
1162
+ {
1163
+ name: "32K-128K",
1164
+ upToTokens: 128000,
1165
+ inputPrice: 0.5 / 1e6,
1166
+ outputPrice: 2.5 / 1e6,
1167
+ cachedInputPrice: 0.1 / 1e6,
1168
+ },
1169
+ {
1170
+ name: "128K-256K",
1171
+ upToTokens: 256000,
1172
+ inputPrice: 0.8 / 1e6,
1173
+ outputPrice: 4.0 / 1e6,
1174
+ cachedInputPrice: 0.16 / 1e6,
1175
+ },
1176
+ {
1177
+ name: "Over 256K",
1178
+ upToTokens: Infinity,
1179
+ inputPrice: 1.6 / 1e6,
1180
+ outputPrice: 9.6 / 1e6,
1181
+ cachedInputPrice: 0.32 / 1e6,
1182
+ },
1183
+ ],
1184
+ requestPrice: 0,
1185
+ contextSize: 1000000,
1186
+ maxOutput: 65536,
1187
+ streaming: true,
1188
+ vision: false,
1189
+ tools: true,
1190
+ jsonOutput: true,
1191
+ },
1192
+ ],
1193
+ },
1194
+ {
1195
+ id: "qwen3-vl-plus",
1196
+ name: "Qwen3 VL Plus",
1197
+ description: "Qwen 3 vision-language model with balanced performance.",
1198
+ family: "alibaba",
1199
+ releasedAt: new Date("2025-09-23"),
1200
+ providers: [
1201
+ {
1202
+ providerId: "alibaba",
1203
+ modelName: "qwen3-vl-plus",
1204
+ inputPrice: 0.2 / 1e6,
1205
+ outputPrice: 1.6 / 1e6,
1206
+ cachedInputPrice: 0.04 / 1e6,
1207
+ pricingTiers: [
1208
+ {
1209
+ name: "Up to 32K",
1210
+ upToTokens: 32000,
1211
+ inputPrice: 0.2 / 1e6,
1212
+ outputPrice: 1.6 / 1e6,
1213
+ cachedInputPrice: 0.04 / 1e6,
1214
+ },
1215
+ {
1216
+ name: "32K-128K",
1217
+ upToTokens: 128000,
1218
+ inputPrice: 0.3 / 1e6,
1219
+ outputPrice: 2.4 / 1e6,
1220
+ cachedInputPrice: 0.06 / 1e6,
1221
+ },
1222
+ {
1223
+ name: "Over 128K",
1224
+ upToTokens: Infinity,
1225
+ inputPrice: 0.6 / 1e6,
1226
+ outputPrice: 4.8 / 1e6,
1227
+ cachedInputPrice: 0.12 / 1e6,
1228
+ },
1229
+ ],
1230
+ requestPrice: 0,
1231
+ contextSize: 262144,
1232
+ maxOutput: 32768,
1233
+ streaming: true,
1234
+ vision: true,
1235
+ tools: false,
1236
+ jsonOutput: true,
1237
+ },
1238
+ ],
1239
+ },
1240
+ {
1241
+ id: "qwen3-vl-flash",
1242
+ name: "Qwen3 VL Flash",
1243
+ description: "Fast Qwen 3 vision-language model for quick image tasks.",
1244
+ family: "alibaba",
1245
+ releasedAt: new Date("2025-10-15"),
1246
+ providers: [
1247
+ {
1248
+ providerId: "alibaba",
1249
+ modelName: "qwen3-vl-flash",
1250
+ inputPrice: 0.05 / 1e6,
1251
+ outputPrice: 0.4 / 1e6,
1252
+ cachedInputPrice: 0.01 / 1e6,
1253
+ pricingTiers: [
1254
+ {
1255
+ name: "Up to 32K",
1256
+ upToTokens: 32000,
1257
+ inputPrice: 0.05 / 1e6,
1258
+ outputPrice: 0.4 / 1e6,
1259
+ cachedInputPrice: 0.01 / 1e6,
1260
+ },
1261
+ {
1262
+ name: "32K-128K",
1263
+ upToTokens: 128000,
1264
+ inputPrice: 0.075 / 1e6,
1265
+ outputPrice: 0.6 / 1e6,
1266
+ cachedInputPrice: 0.015 / 1e6,
1267
+ },
1268
+ {
1269
+ name: "Over 128K",
1270
+ upToTokens: Infinity,
1271
+ inputPrice: 0.12 / 1e6,
1272
+ outputPrice: 0.96 / 1e6,
1273
+ cachedInputPrice: 0.024 / 1e6,
1274
+ },
1275
+ ],
1276
+ requestPrice: 0,
1277
+ contextSize: 262144,
1278
+ maxOutput: 32768,
1279
+ streaming: true,
1280
+ vision: true,
1281
+ tools: true,
1282
+ jsonOutput: true,
1283
+ },
1284
+ ],
1285
+ },
1286
+ {
1287
+ id: "qwen3-vl-235b-a22b-instruct",
1288
+ name: "Qwen3 VL 235B A22B Instruct",
1289
+ description: "Large Qwen 3 MoE vision-language instruction model.",
1290
+ family: "alibaba",
1291
+ releasedAt: new Date("2025-09-23"),
1292
+ providers: [
1293
+ {
1294
+ providerId: "alibaba",
1295
+ modelName: "qwen3-vl-235b-a22b-instruct",
1296
+ inputPrice: 0.5 / 1e6,
1297
+ outputPrice: 2.0 / 1e6,
1298
+ requestPrice: 0,
1299
+ contextSize: 131072,
1300
+ maxOutput: 32768,
1301
+ streaming: true,
1302
+ vision: true,
1303
+ tools: true,
1304
+ jsonOutput: true,
1305
+ },
1306
+ {
1307
+ providerId: "novita",
1308
+ modelName: "qwen/qwen3-vl-235b-a22b-instruct",
1309
+ inputPrice: 0.3 / 1e6,
1310
+ outputPrice: 1.5 / 1e6,
1311
+ requestPrice: 0,
1312
+ contextSize: 131072,
1313
+ maxOutput: 32768,
1314
+ streaming: true,
1315
+ vision: true,
1316
+ tools: true,
1317
+ jsonOutput: true,
1318
+ },
1319
+ ],
1320
+ },
1321
+ {
1322
+ id: "qwen3-vl-235b-a22b-thinking",
1323
+ name: "Qwen3 VL 235B A22B Thinking",
1324
+ description: "Large Qwen 3 MoE vision-language model with reasoning capabilities.",
1325
+ family: "alibaba",
1326
+ releasedAt: new Date("2025-09-23"),
1327
+ providers: [
1328
+ {
1329
+ providerId: "alibaba",
1330
+ modelName: "qwen3-vl-235b-a22b-thinking",
1331
+ inputPrice: 0.5 / 1e6,
1332
+ outputPrice: 2.0 / 1e6,
1333
+ requestPrice: 0,
1334
+ contextSize: 131072,
1335
+ maxOutput: 32768,
1336
+ reasoning: true,
1337
+ reasoningOutput: "omit",
1338
+ streaming: true,
1339
+ vision: true,
1340
+ tools: false,
1341
+ jsonOutput: false,
1342
+ },
1343
+ {
1344
+ providerId: "novita",
1345
+ modelName: "qwen/qwen3-vl-235b-a22b-thinking",
1346
+ inputPrice: 0.98 / 1e6,
1347
+ outputPrice: 3.95 / 1e6,
1348
+ requestPrice: 0,
1349
+ contextSize: 131072,
1350
+ maxOutput: 32768,
1351
+ reasoning: true,
1352
+ streaming: true,
1353
+ vision: true,
1354
+ tools: false,
1355
+ jsonOutput: false,
1356
+ },
1357
+ ],
1358
+ },
1359
+ {
1360
+ id: "qwen2-5-vl-32b-instruct",
1361
+ name: "Qwen2.5 VL 32B Instruct",
1362
+ description: "Vision-language Qwen 2.5 model, 32B size.",
1363
+ family: "alibaba",
1364
+ releasedAt: new Date("2025-02-19"),
1365
+ providers: [
1366
+ {
1367
+ test: "skip",
1368
+ providerId: "alibaba",
1369
+ modelName: "qwen2.5-vl-32b-instruct",
1370
+ inputPrice: 1.4 / 1e6,
1371
+ outputPrice: 4.2 / 1e6,
1372
+ requestPrice: 0,
1373
+ contextSize: 131072,
1374
+ maxOutput: 32768,
1375
+ streaming: true,
1376
+ vision: true,
1377
+ tools: false,
1378
+ jsonOutput: true,
1379
+ },
1380
+ ],
1381
+ },
1382
+ {
1383
+ id: "qwen3-max-2026-01-23",
1384
+ name: "Qwen3 Max 2026-01-23",
1385
+ description: "Latest Qwen 3 flagship model with integrated thinking mode and tool support.",
1386
+ family: "alibaba",
1387
+ releasedAt: new Date("2026-01-23"),
1388
+ providers: [
1389
+ {
1390
+ test: "skip",
1391
+ providerId: "alibaba",
1392
+ modelName: "qwen3-max-2026-01-23",
1393
+ inputPrice: 1.2 / 1e6,
1394
+ outputPrice: 6.0 / 1e6,
1395
+ cachedInputPrice: 0.24 / 1e6,
1396
+ pricingTiers: [
1397
+ {
1398
+ name: "Up to 32K",
1399
+ upToTokens: 32000,
1400
+ inputPrice: 1.2 / 1e6,
1401
+ outputPrice: 6.0 / 1e6,
1402
+ cachedInputPrice: 0.24 / 1e6,
1403
+ },
1404
+ {
1405
+ name: "32K-128K",
1406
+ upToTokens: 128000,
1407
+ inputPrice: 2.4 / 1e6,
1408
+ outputPrice: 12.0 / 1e6,
1409
+ cachedInputPrice: 0.48 / 1e6,
1410
+ },
1411
+ {
1412
+ name: "Over 128K",
1413
+ upToTokens: Infinity,
1414
+ inputPrice: 3.0 / 1e6,
1415
+ outputPrice: 15.0 / 1e6,
1416
+ cachedInputPrice: 0.6 / 1e6,
1417
+ },
1418
+ ],
1419
+ requestPrice: 0,
1420
+ contextSize: 262144,
1421
+ maxOutput: 65536,
1422
+ reasoning: true,
1423
+ reasoningOutput: "omit",
1424
+ streaming: true,
1425
+ vision: true,
1426
+ tools: true,
1427
+ jsonOutput: true,
1428
+ },
1429
+ ],
1430
+ },
1431
+ {
1432
+ id: "qwen-image-edit-plus",
1433
+ name: "Qwen Image Edit Plus",
1434
+ description: "Alibaba's image editing model for modifying existing images.",
1435
+ family: "alibaba",
1436
+ output: ["text", "image"],
1437
+ releasedAt: new Date("2025-08-19"),
1438
+ providers: [
1439
+ {
1440
+ test: "skip",
1441
+ providerId: "alibaba",
1442
+ modelName: "qwen-image-edit-plus",
1443
+ inputPrice: 0,
1444
+ outputPrice: 0,
1445
+ requestPrice: 0.04,
1446
+ contextSize: 2000,
1447
+ maxOutput: 4096,
1448
+ streaming: false,
1449
+ vision: true,
1450
+ tools: false,
1451
+ jsonOutput: false,
1452
+ imageGenerations: true,
1453
+ },
1454
+ ],
1455
+ },
1456
+ {
1457
+ id: "qwen-image-edit-max",
1458
+ name: "Qwen Image Edit Max",
1459
+ description: "Alibaba's flagship image editing model for high-quality image modifications.",
1460
+ family: "alibaba",
1461
+ output: ["text", "image"],
1462
+ releasedAt: new Date("2026-01-16"),
1463
+ providers: [
1464
+ {
1465
+ test: "skip",
1466
+ providerId: "alibaba",
1467
+ modelName: "qwen-image-edit-max",
1468
+ inputPrice: 0,
1469
+ outputPrice: 0,
1470
+ requestPrice: 0.08,
1471
+ contextSize: 2000,
1472
+ maxOutput: 4096,
1473
+ streaming: false,
1474
+ vision: true,
1475
+ tools: false,
1476
+ jsonOutput: false,
1477
+ imageGenerations: true,
1478
+ },
1479
+ ],
1480
+ },
810
1481
  ];
811
1482
  //# sourceMappingURL=alibaba.js.map