@lobehub/chat 1.120.2 → 1.120.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,1046 @@
1
+ import { AIChatModelCard } from '../types/aiModel';
2
+
3
+ // https://studio.nebius.com/
4
+
5
/**
 * Chat model cards for the Nebius provider.
 *
 * Each entry lists the model `id`, a short `displayName` (without the
 * organization prefix), the owning `organization`, the context window size in
 * tokens, optional capability flags under `abilities`, and fixed-rate pricing
 * expressed per million input/output tokens.
 *
 * Only entries with `enabled: true` carry that flag; it is omitted everywhere
 * else. Two entries (Mistral-Nemo-Instruct-2407 and Gemma-2-2b-it) declare no
 * `abilities` at all.
 */
const nebiusChatModels: AIChatModelCard[] = [
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Kimi-K2-Instruct',
    id: 'moonshotai/Kimi-K2-Instruct',
    organization: 'moonshotai',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 2.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 262_144,
    // Display name omits the organization prefix, like every other entry in this list.
    displayName: 'Qwen3-Coder-480B-A35B-Instruct',
    id: 'Qwen/Qwen3-Coder-480B-A35B-Instruct',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 1.8, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'gpt-oss-120b',
    enabled: true,
    id: 'openai/gpt-oss-120b',
    organization: 'openai',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.15, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'gpt-oss-20b',
    id: 'openai/gpt-oss-20b',
    organization: 'openai',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.05, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.2, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'GLM-4.5',
    id: 'zai-org/GLM-4.5',
    organization: 'zai-org',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 2.2, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'GLM-4.5-Air',
    id: 'zai-org/GLM-4.5-Air',
    organization: 'zai-org',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.2, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 1.2, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 163_840,
    displayName: 'DeepSeek-R1-0528',
    id: 'deepseek-ai/DeepSeek-R1-0528',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.8, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 2.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 32_768,
    displayName: 'DeepSeek-R1-0528 (fast)',
    id: 'deepseek-ai/DeepSeek-R1-0528-fast',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 262_144,
    displayName: 'Qwen3-235B-A22B-Instruct-2507',
    id: 'Qwen/Qwen3-235B-A22B-Instruct-2507',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.2, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 40_960,
    displayName: 'Qwen3-235B-A22B',
    id: 'Qwen/Qwen3-235B-A22B',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.2, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 40_960,
    displayName: 'Qwen3-30B-A3B',
    id: 'Qwen/Qwen3-30B-A3B',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 40_960,
    displayName: 'Qwen3-30B-A3B (fast)',
    id: 'Qwen/Qwen3-30B-A3B-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.9, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 40_960,
    displayName: 'Qwen3-32B',
    id: 'Qwen/Qwen3-32B',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 40_960,
    displayName: 'Qwen3-32B (fast)',
    id: 'Qwen/Qwen3-32B-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.2, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 40_960,
    displayName: 'Qwen3-14B',
    id: 'Qwen/Qwen3-14B',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.08, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.24, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 40_960,
    displayName: 'Qwen3-4B (fast)',
    id: 'Qwen/Qwen3-4B-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.08, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.24, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Llama-3_1-Nemotron-Ultra-253B-v1',
    id: 'nvidia/Llama-3_1-Nemotron-Ultra-253B-v1',
    organization: 'nvidia',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 1.8, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 163_840,
    displayName: 'DeepSeek-V3-0324',
    id: 'deepseek-ai/DeepSeek-V3-0324',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 32_768,
    displayName: 'DeepSeek-V3-0324 (fast)',
    id: 'deepseek-ai/DeepSeek-V3-0324-fast',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 2.25, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 163_840,
    displayName: 'DeepSeek-V3',
    id: 'deepseek-ai/DeepSeek-V3',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 163_840,
    displayName: 'DeepSeek-R1',
    id: 'deepseek-ai/DeepSeek-R1',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.8, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 2.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      // Flagged as reasoning to match the regular DeepSeek-R1 entry and the
      // DeepSeek-R1-0528 (fast) entry, which both declare it.
      reasoning: true,
    },
    contextWindowTokens: 163_840,
    displayName: 'DeepSeek-R1 (fast)',
    id: 'deepseek-ai/DeepSeek-R1-fast',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Llama-3.3-70B-Instruct',
    id: 'meta-llama/Llama-3.3-70B-Instruct',
    organization: 'meta',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Llama-3.3-70B-Instruct (fast)',
    id: 'meta-llama/Llama-3.3-70B-Instruct-fast',
    organization: 'meta',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.25, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Meta-Llama-3.1-70B-Instruct',
    id: 'meta-llama/Meta-Llama-3.1-70B-Instruct',
    organization: 'meta',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Meta-Llama-3.1-8B-Instruct',
    id: 'meta-llama/Meta-Llama-3.1-8B-Instruct',
    organization: 'meta',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.02, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.06, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Meta-Llama-3.1-8B-Instruct (fast)',
    id: 'meta-llama/Meta-Llama-3.1-8B-Instruct-fast',
    organization: 'meta',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.03, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.09, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Meta-Llama-3.1-405B-Instruct',
    id: 'meta-llama/Meta-Llama-3.1-405B-Instruct',
    organization: 'meta',
    pricing: {
      units: [
        { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    contextWindowTokens: 128_000,
    displayName: 'Mistral-Nemo-Instruct-2407',
    id: 'mistralai/Mistral-Nemo-Instruct-2407',
    organization: 'mistralai',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.04, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.12, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 32_768,
    displayName: 'Qwen2.5-Coder-7B',
    id: 'Qwen/Qwen2.5-Coder-7B',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.01, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.03, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 32_768,
    displayName: 'Qwen2.5-Coder-7B (fast)',
    id: 'Qwen/Qwen2.5-Coder-7B-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.03, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.09, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Qwen2.5-Coder-32B-Instruct',
    id: 'Qwen/Qwen2.5-Coder-32B-Instruct',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.06, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.18, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Qwen2.5-Coder-32B-Instruct (fast)',
    id: 'Qwen/Qwen2.5-Coder-32B-Instruct-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    contextWindowTokens: 8192,
    displayName: 'Gemma-2-2b-it',
    id: 'google/gemma-2-2b-it',
    organization: 'google',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.02, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.06, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 8192,
    displayName: 'Gemma-2-9b-it (fast)',
    id: 'google/gemma-2-9b-it-fast',
    organization: 'google',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.03, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.09, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Qwen2.5-32B-Instruct',
    id: 'Qwen/Qwen2.5-32B-Instruct',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.06, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.2, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Qwen2.5-32B-Instruct (fast)',
    id: 'Qwen/Qwen2.5-32B-Instruct-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Qwen2.5-72B-Instruct',
    id: 'Qwen/Qwen2.5-72B-Instruct',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Qwen2.5-72B-Instruct (fast)',
    id: 'Qwen/Qwen2.5-72B-Instruct-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.25, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 8192,
    displayName: 'Llama3-OpenBioLLM-70B',
    id: 'aaditya/Llama3-OpenBioLLM-70B',
    organization: 'aaditya',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'QwQ-32B',
    id: 'Qwen/QwQ-32B',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.15, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.45, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'QwQ-32B (fast)',
    id: 'Qwen/QwQ-32B-fast',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 16_384,
    displayName: 'phi-4',
    id: 'microsoft/phi-4',
    organization: 'microsoft',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Hermes-3-Llama-3.1-405B',
    id: 'NousResearch/Hermes-3-Llama-405B',
    organization: 'NousResearch',
    pricing: {
      units: [
        { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Hermes-4-70B',
    id: 'NousResearch/Hermes-4-70B',
    organization: 'NousResearch',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Hermes-4-405B',
    id: 'NousResearch/Hermes-4-405B',
    organization: 'NousResearch',
    pricing: {
      units: [
        { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'DeepSeek-R1-Distill-Llama-70B',
    id: 'deepseek-ai/DeepSeek-R1-Distill-Llama-70B',
    organization: 'deepseek',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.25, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 128_000,
    displayName: 'Devstral-Small-2505',
    id: 'mistralai/Devstral-Small-2505',
    organization: 'mistralai',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.08, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.24, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Llama-3_3-Nemotron-Super-49B-v1',
    id: 'nvidia/Llama-3_3-Nemotron-Super-49B-v1',
    organization: 'nvidia',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      reasoning: true,
    },
    contextWindowTokens: 262_144,
    displayName: 'Qwen3-30B-A3B-Thinking-2507',
    id: 'Qwen/Qwen3-30B-A3B-Thinking-2507',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 262_144,
    displayName: 'Qwen3-30B-A3B-Instruct-2507',
    id: 'Qwen/Qwen3-30B-A3B-Instruct-2507',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 262_144,
    displayName: 'Qwen3-Coder-30B-A3B-Instruct',
    id: 'Qwen/Qwen3-Coder-30B-A3B-Instruct',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Meta-Llama-Guard-3-8B',
    id: 'meta-llama/Llama-Guard-3-8B',
    organization: 'meta',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.02, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.06, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      vision: true,
    },
    contextWindowTokens: 32_768,
    displayName: 'Qwen2-VL-72B-Instruct',
    id: 'Qwen/Qwen2-VL-72B-Instruct',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.13, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      vision: true,
    },
    contextWindowTokens: 131_072,
    displayName: 'Mistral-Small-3.1-24B-Instruct-2503',
    id: 'mistralai/Mistral-Small-3.1-24B-Instruct-2503',
    organization: 'mistralai',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.05, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.15, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      vision: true,
    },
    contextWindowTokens: 110_000,
    displayName: 'Gemma-3-27b-it',
    id: 'google/gemma-3-27b-it',
    organization: 'google',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.1, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      vision: true,
    },
    contextWindowTokens: 110_000,
    displayName: 'Gemma-3-27b-it (fast)',
    id: 'google/gemma-3-27b-it-fast',
    organization: 'google',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.2, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
  {
    abilities: {
      functionCall: true,
      vision: true,
    },
    contextWindowTokens: 32_000,
    displayName: 'Qwen2.5-VL-72B-Instruct',
    id: 'Qwen/Qwen2.5-VL-72B-Instruct',
    organization: 'Qwen',
    pricing: {
      units: [
        { name: 'textInput', rate: 0.25, strategy: 'fixed', unit: 'millionTokens' },
        { name: 'textOutput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
      ],
    },
    type: 'chat',
  },
];
954
+
955
+ // The models below are pending verification
956
+
957
+ // export const nebiusImageModels: AIImageModelCard[] = [
958
+ // {
959
+ // contextWindowTokens: 0,
960
+ // displayName: 'FLUX.1-dev',
961
+ // id: 'black-forest-labs/flux-dev',
962
+ // pricing: {
963
+ // units: [
964
+ // { name: 'imageGeneration', rate: 0.007, strategy: 'fixed', unit: 'image' },
965
+ // ],
966
+ // },
967
+ // type: 'image',
968
+ // },
969
+ // {
970
+ // contextWindowTokens: 0,
971
+ // displayName: 'FLUX.1-schnell',
972
+ // id: 'black-forest-labs/flux-schnell',
973
+ // pricing: {
974
+ // units: [
975
+ // { name: 'imageGeneration', rate: 0.0013, strategy: 'fixed', unit: 'image' },
976
+ // ],
977
+ // },
978
+ // type: 'image',
979
+ // },
980
+ // {
981
+ // contextWindowTokens: 0,
982
+ // displayName: 'Stable Diffusion XL 1.0',
983
+ // id: 'stability-ai/sdxl',
984
+ // pricing: {
985
+ // units: [
986
+ // { name: 'imageGeneration', rate: 0.003, strategy: 'fixed', unit: 'image' },
987
+ // ],
988
+ // },
989
+ // type: 'image',
990
+ // },
991
+ // ];
992
+
993
+ // export const nebiusEmbeddingModels: AIEmbeddingModelCard[] = [
994
+ // {
995
+ // contextWindowTokens: 32_768,
996
+ // displayName: 'BGE-ICL',
997
+ // id: 'BAAI/bge-en-icl',
998
+ // maxDimension: 3072,
999
+ // pricing: {
1000
+ // units: [
1001
+ // { name: 'textInput', rate: 0.01, strategy: 'fixed', unit: 'millionTokens' },
1002
+ // ],
1003
+ // },
1004
+ // type: 'embedding',
1005
+ // },
1006
+ // {
1007
+ // contextWindowTokens: 8192,
1008
+ // displayName: 'bge-multilingual-gemma2',
1009
+ // id: 'BAAI/bge-multilingual-gemma2',
1010
+ // maxDimension: 3072,
1011
+ // pricing: {
1012
+ // units: [
1013
+ // { name: 'textInput', rate: 0.01, strategy: 'fixed', unit: 'millionTokens' },
1014
+ // ],
1015
+ // },
1016
+ // type: 'embedding',
1017
+ // },
1018
+ // {
1019
+ // contextWindowTokens: 32_768,
1020
+ // displayName: 'e5-mistral-7b-instruct',
1021
+ // id: 'intfloat/e5-mistral-7b-instruct',
1022
+ // maxDimension: 1536,
1023
+ // pricing: {
1024
+ // units: [
1025
+ // { name: 'textInput', rate: 0.01, strategy: 'fixed', unit: 'millionTokens' },
1026
+ // ],
1027
+ // },
1028
+ // type: 'embedding',
1029
+ // },
1030
+ // {
1031
+ // contextWindowTokens: 40_960,
1032
+ // displayName: 'Qwen3-Embedding-8B',
1033
+ // id: 'Qwen/Qwen3-Embedding-8B',
1034
+ // maxDimension: 3072,
1035
+ // pricing: {
1036
+ // units: [
1037
+ // { name: 'textInput', rate: 0.01, strategy: 'fixed', unit: 'millionTokens' },
1038
+ // ],
1039
+ // },
1040
+ // type: 'embedding',
1041
+ // },
1042
+ // ];
1043
+
1044
/**
 * Every model card this module exposes, as a fresh array.
 * Currently this is a shallow copy of the chat model list only.
 */
const allModels = [...nebiusChatModels];

export { allModels };

export default allModels;