model-library 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- model_library/base/base.py +2 -0
- model_library/base/output.py +1 -0
- model_library/config/README.md +169 -0
- model_library/config/ai21labs_models.yaml +11 -11
- model_library/config/alibaba_models.yaml +21 -22
- model_library/config/all_models.json +4572 -2598
- model_library/config/amazon_models.yaml +100 -102
- model_library/config/anthropic_models.yaml +43 -52
- model_library/config/cohere_models.yaml +25 -24
- model_library/config/deepseek_models.yaml +28 -25
- model_library/config/dummy_model.yaml +9 -7
- model_library/config/fireworks_models.yaml +86 -56
- model_library/config/google_models.yaml +131 -126
- model_library/config/inception_models.yaml +6 -6
- model_library/config/kimi_models.yaml +13 -14
- model_library/config/minimax_models.yaml +37 -0
- model_library/config/mistral_models.yaml +85 -29
- model_library/config/openai_models.yaml +192 -150
- model_library/config/perplexity_models.yaml +8 -23
- model_library/config/together_models.yaml +115 -104
- model_library/config/xai_models.yaml +47 -79
- model_library/config/zai_models.yaml +23 -15
- model_library/exceptions.py +6 -15
- model_library/providers/amazon.py +32 -17
- model_library/providers/minimax.py +33 -0
- model_library/providers/mistral.py +10 -1
- model_library/providers/openai.py +2 -6
- model_library/register_models.py +36 -36
- model_library/registry_utils.py +18 -16
- model_library/utils.py +2 -2
- {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/METADATA +2 -2
- model_library-0.1.4.dist-info/RECORD +64 -0
- model_library-0.1.3.dist-info/RECORD +0 -61
- {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/WHEEL +0 -0
- {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/licenses/LICENSE +0 -0
- {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/top_level.txt +0 -0
|
@@ -2,7 +2,14 @@ base-config:
|
|
|
2
2
|
company: Google
|
|
3
3
|
documentation_url: https://ai.google.dev/gemini-api/docs/models
|
|
4
4
|
open_source: false
|
|
5
|
-
|
|
5
|
+
supports:
|
|
6
|
+
images: false
|
|
7
|
+
videos: false
|
|
8
|
+
files: false
|
|
9
|
+
batch: false
|
|
10
|
+
temperature: false
|
|
11
|
+
tools: false
|
|
12
|
+
metadata:
|
|
6
13
|
available_for_everyone: true
|
|
7
14
|
available_as_evaluator: false
|
|
8
15
|
ignored_for_cost: false
|
|
@@ -21,30 +28,25 @@ gemma-models:
|
|
|
21
28
|
use such as phones and tablets, capable of handling text, audio, and vision
|
|
22
29
|
inputs with efficient parameter caching techniques.
|
|
23
30
|
release_date: 2025-03-12
|
|
24
|
-
|
|
31
|
+
metadata:
|
|
25
32
|
deprecated: true
|
|
26
33
|
properties:
|
|
27
34
|
context_window: 131_072
|
|
28
|
-
|
|
35
|
+
max_tokens: 8_192
|
|
29
36
|
training_cutoff: "2023-09"
|
|
30
37
|
costs_per_million_token:
|
|
31
38
|
input: 0.00
|
|
32
39
|
output: 0.00
|
|
33
40
|
|
|
34
|
-
|
|
35
41
|
gemini-3-models:
|
|
36
42
|
base-config:
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
supports_videos: true
|
|
45
|
-
supports_tools: true
|
|
46
|
-
supports_batch_requests: true
|
|
47
|
-
supports_temperature: true
|
|
43
|
+
supports:
|
|
44
|
+
images: true
|
|
45
|
+
files: true
|
|
46
|
+
videos: true
|
|
47
|
+
tools: true
|
|
48
|
+
batch: true
|
|
49
|
+
temperature: true
|
|
48
50
|
costs_per_million_token:
|
|
49
51
|
cache:
|
|
50
52
|
read_discount: 0.1
|
|
@@ -58,41 +60,34 @@ gemini-3-models:
|
|
|
58
60
|
release_date: 2025-11-18
|
|
59
61
|
properties:
|
|
60
62
|
context_window: 1048576
|
|
61
|
-
|
|
63
|
+
max_tokens: 65536
|
|
62
64
|
training_cutoff: "2025-01"
|
|
63
65
|
reasoning_model: true
|
|
64
|
-
class_properties:
|
|
65
|
-
supports_images: true
|
|
66
|
-
supports_files: true
|
|
67
|
-
supports_videos: true
|
|
68
|
-
supports_tools: true
|
|
69
|
-
supports_batch_requests: true
|
|
70
|
-
supports_temperature: true
|
|
71
66
|
costs_per_million_token:
|
|
72
|
-
input: 2
|
|
73
|
-
output: 12
|
|
67
|
+
input: 2.0
|
|
68
|
+
output: 12.0
|
|
74
69
|
cache:
|
|
75
70
|
read: 0.20
|
|
76
71
|
context:
|
|
77
72
|
threshold: 200_000
|
|
78
|
-
input:
|
|
79
|
-
output:
|
|
73
|
+
input: 4.0
|
|
74
|
+
output: 18.0
|
|
80
75
|
cache:
|
|
81
76
|
read: 0.40
|
|
82
77
|
|
|
83
78
|
gemini-2.5-models:
|
|
84
79
|
base-config:
|
|
80
|
+
supports:
|
|
81
|
+
images: true
|
|
82
|
+
files: true
|
|
83
|
+
videos: true
|
|
84
|
+
tools: true
|
|
85
|
+
batch: true
|
|
86
|
+
temperature: true
|
|
85
87
|
properties:
|
|
86
88
|
context_window: 1_048_576
|
|
87
|
-
|
|
89
|
+
max_tokens: 8_192
|
|
88
90
|
training_cutoff: "2024-05"
|
|
89
|
-
class_properties:
|
|
90
|
-
supports_images: true
|
|
91
|
-
supports_files: true
|
|
92
|
-
supports_videos: true
|
|
93
|
-
supports_tools: true
|
|
94
|
-
supports_batch_requests: true
|
|
95
|
-
supports_temperature: true
|
|
96
91
|
costs_per_million_token:
|
|
97
92
|
cache:
|
|
98
93
|
read_discount: 0.1
|
|
@@ -107,12 +102,12 @@ gemini-2.5-models:
|
|
|
107
102
|
using multimodal inputs including audio, images, video, and PDFs with a context
|
|
108
103
|
window exceeding 1 million tokens.
|
|
109
104
|
release_date: 2025-07-17
|
|
105
|
+
metadata:
|
|
106
|
+
available_as_evaluator: true
|
|
110
107
|
properties:
|
|
111
108
|
context_window: 1_048_576
|
|
112
|
-
|
|
109
|
+
max_tokens: 65_536
|
|
113
110
|
reasoning_model: true
|
|
114
|
-
class_properties:
|
|
115
|
-
available_as_evaluator: true
|
|
116
111
|
costs_per_million_token:
|
|
117
112
|
input: 1.25
|
|
118
113
|
output: 10.0
|
|
@@ -132,12 +127,12 @@ gemini-2.5-models:
|
|
|
132
127
|
large scale processing with support for multiple modalities, a 1 million token
|
|
133
128
|
context window, and strong reasoning capabilities.
|
|
134
129
|
release_date: 2025-07-17
|
|
130
|
+
metadata:
|
|
131
|
+
available_as_evaluator: true
|
|
135
132
|
properties:
|
|
136
133
|
context_window: 1_048_576
|
|
137
|
-
|
|
134
|
+
max_tokens: 65_536
|
|
138
135
|
reasoning_model: false
|
|
139
|
-
class_properties:
|
|
140
|
-
available_as_evaluator: true
|
|
141
136
|
costs_per_million_token:
|
|
142
137
|
input: 0.30
|
|
143
138
|
output: 2.50
|
|
@@ -156,7 +151,7 @@ gemini-2.5-models:
|
|
|
156
151
|
release_date: 2025-09-25
|
|
157
152
|
properties:
|
|
158
153
|
context_window: 1_048_576
|
|
159
|
-
|
|
154
|
+
max_tokens: 65_535
|
|
160
155
|
reasoning_model: false
|
|
161
156
|
costs_per_million_token:
|
|
162
157
|
input: 0.30
|
|
@@ -177,7 +172,7 @@ gemini-2.5-models:
|
|
|
177
172
|
release_date: 2025-07-22
|
|
178
173
|
properties:
|
|
179
174
|
context_window: 1_048_576
|
|
180
|
-
|
|
175
|
+
max_tokens: 65_535
|
|
181
176
|
reasoning_model: false
|
|
182
177
|
costs_per_million_token:
|
|
183
178
|
input: 0.10
|
|
@@ -198,7 +193,7 @@ gemini-2.5-models:
|
|
|
198
193
|
release_date: 2025-09-25
|
|
199
194
|
properties:
|
|
200
195
|
context_window: 1_048_576
|
|
201
|
-
|
|
196
|
+
max_tokens: 65_535
|
|
202
197
|
reasoning_model: false
|
|
203
198
|
costs_per_million_token:
|
|
204
199
|
input: 0.10
|
|
@@ -217,12 +212,12 @@ gemini-2.5-models:
|
|
|
217
212
|
at scale, with support for text, images, video, and audio input modalities and
|
|
218
213
|
large context length.
|
|
219
214
|
release_date: 2025-06-17
|
|
215
|
+
metadata:
|
|
216
|
+
deprecated: true
|
|
220
217
|
properties:
|
|
221
218
|
context_window: 1_048_576
|
|
222
|
-
|
|
219
|
+
max_tokens: 65_535
|
|
223
220
|
reasoning_model: false
|
|
224
|
-
class_properties:
|
|
225
|
-
deprecated: true
|
|
226
221
|
costs_per_million_token:
|
|
227
222
|
input: 0.10
|
|
228
223
|
output: 0.40
|
|
@@ -240,13 +235,13 @@ gemini-2.5-models:
|
|
|
240
235
|
large scale processing with support for multiple modalities, a 1 million token
|
|
241
236
|
context window, and strong reasoning capabilities.
|
|
242
237
|
release_date: 2025-05-20
|
|
238
|
+
metadata:
|
|
239
|
+
deprecated: true
|
|
243
240
|
properties:
|
|
244
241
|
context_window: 1_048_576
|
|
245
|
-
|
|
242
|
+
max_tokens: 65_536
|
|
246
243
|
training_cutoff: "2025-01"
|
|
247
244
|
reasoning_model: false
|
|
248
|
-
class_properties:
|
|
249
|
-
deprecated: true
|
|
250
245
|
costs_per_million_token:
|
|
251
246
|
input: 0.15
|
|
252
247
|
output: 0.60
|
|
@@ -265,14 +260,15 @@ gemini-2.5-models:
|
|
|
265
260
|
using multimodal inputs including audio, images, video, and PDFs with a context
|
|
266
261
|
window exceeding 1 million tokens.
|
|
267
262
|
release_date: 2025-06-05
|
|
263
|
+
supports:
|
|
264
|
+
batch: false
|
|
265
|
+
metadata:
|
|
266
|
+
deprecated: true
|
|
268
267
|
properties:
|
|
269
268
|
context_window: 1_048_576
|
|
270
|
-
|
|
269
|
+
max_tokens: 65_536
|
|
271
270
|
training_cutoff: "2025-01"
|
|
272
271
|
reasoning_model: true
|
|
273
|
-
class_properties:
|
|
274
|
-
supports_batch_requests: false
|
|
275
|
-
deprecated: true
|
|
276
272
|
costs_per_million_token:
|
|
277
273
|
input: 1.25
|
|
278
274
|
output: 10.0
|
|
@@ -287,14 +283,14 @@ gemini-2.5-models:
|
|
|
287
283
|
using multimodal inputs including audio, images, video, and PDFs with a context
|
|
288
284
|
window exceeding 1 million tokens.
|
|
289
285
|
release_date: 2025-05-06
|
|
286
|
+
metadata:
|
|
287
|
+
available_for_everyone: false
|
|
288
|
+
deprecated: true
|
|
290
289
|
properties:
|
|
291
290
|
context_window: 1_048_576
|
|
292
|
-
|
|
291
|
+
max_tokens: 65_536
|
|
293
292
|
training_cutoff: "2025-01"
|
|
294
|
-
available_for_everyone: false
|
|
295
293
|
reasoning_model: true
|
|
296
|
-
class_properties:
|
|
297
|
-
deprecated: true
|
|
298
294
|
costs_per_million_token:
|
|
299
295
|
input: 1.25
|
|
300
296
|
output: 10.0
|
|
@@ -308,13 +304,13 @@ gemini-2.5-models:
|
|
|
308
304
|
large scale processing with support for multiple modalities, a 1 million token
|
|
309
305
|
context window, and strong reasoning capabilities.
|
|
310
306
|
release_date: 2025-04-17
|
|
307
|
+
metadata:
|
|
308
|
+
deprecated: true
|
|
311
309
|
properties:
|
|
312
310
|
context_window: 1_048_576
|
|
313
|
-
|
|
311
|
+
max_tokens: 65_536
|
|
314
312
|
training_cutoff: "2025-01"
|
|
315
313
|
reasoning_model: false
|
|
316
|
-
class_properties:
|
|
317
|
-
deprecated: true
|
|
318
314
|
costs_per_million_token:
|
|
319
315
|
input: 0.3
|
|
320
316
|
output: 2.5
|
|
@@ -333,14 +329,14 @@ gemini-2.5-models:
|
|
|
333
329
|
using multimodal inputs including audio, images, video, and PDFs with a context
|
|
334
330
|
window exceeding 1 million tokens.
|
|
335
331
|
release_date: 2025-03-25
|
|
332
|
+
metadata:
|
|
333
|
+
available_for_everyone: false
|
|
334
|
+
deprecated: true
|
|
336
335
|
properties:
|
|
337
336
|
context_window: 1_048_576
|
|
338
|
-
|
|
337
|
+
max_tokens: 65_536
|
|
339
338
|
training_cutoff: "2025-01"
|
|
340
|
-
available_for_everyone: false
|
|
341
339
|
reasoning_model: true
|
|
342
|
-
class_properties:
|
|
343
|
-
deprecated: true
|
|
344
340
|
costs_per_million_token:
|
|
345
341
|
input: 1.25
|
|
346
342
|
output: 10.0
|
|
@@ -355,14 +351,14 @@ gemini-2.5-models:
|
|
|
355
351
|
using multimodal inputs including audio, images, video, and PDFs with a context
|
|
356
352
|
window exceeding 1 million tokens.
|
|
357
353
|
release_date: 2025-04-05
|
|
354
|
+
metadata:
|
|
355
|
+
available_for_everyone: false
|
|
356
|
+
deprecated: true
|
|
358
357
|
properties:
|
|
359
358
|
context_window: 1_048_576
|
|
360
|
-
|
|
359
|
+
max_tokens: 65_536
|
|
361
360
|
training_cutoff: "2025-01"
|
|
362
|
-
available_for_everyone: false
|
|
363
361
|
reasoning_model: true
|
|
364
|
-
class_properties:
|
|
365
|
-
deprecated: true
|
|
366
362
|
costs_per_million_token:
|
|
367
363
|
input: 1.25
|
|
368
364
|
output: 10.0
|
|
@@ -371,12 +367,12 @@ gemini-2.5-models:
|
|
|
371
367
|
|
|
372
368
|
old-gemini-models:
|
|
373
369
|
base-config:
|
|
370
|
+
metadata:
|
|
371
|
+
deprecated: true
|
|
374
372
|
properties:
|
|
375
373
|
context_window: 2_097_152
|
|
376
|
-
|
|
374
|
+
max_tokens: 8_192
|
|
377
375
|
training_cutoff: "2024-05"
|
|
378
|
-
class_properties:
|
|
379
|
-
deprecated: true
|
|
380
376
|
costs_per_million_token:
|
|
381
377
|
cache:
|
|
382
378
|
read_discount: 0.25
|
|
@@ -388,17 +384,18 @@ old-gemini-models:
|
|
|
388
384
|
large context processing and multimodal inputs, with strengths in speed, native
|
|
389
385
|
tool use, and dataset comprehension.
|
|
390
386
|
release_date: 2025-02-05
|
|
387
|
+
supports:
|
|
388
|
+
images: true
|
|
389
|
+
files: true
|
|
390
|
+
videos: true
|
|
391
|
+
metadata:
|
|
392
|
+
available_for_everyone: false
|
|
393
|
+
deprecated: true
|
|
391
394
|
properties:
|
|
392
395
|
context_window: 2_097_152
|
|
393
|
-
|
|
396
|
+
max_tokens: 8_192
|
|
394
397
|
training_cutoff: "2024-06"
|
|
395
398
|
reasoning_model: true
|
|
396
|
-
available_for_everyone: false
|
|
397
|
-
class_properties:
|
|
398
|
-
deprecated: true
|
|
399
|
-
supports_images: true
|
|
400
|
-
supports_files: true
|
|
401
|
-
supports_videos: true
|
|
402
399
|
costs_per_million_token:
|
|
403
400
|
input: 1.25
|
|
404
401
|
output: 5.00
|
|
@@ -410,17 +407,18 @@ old-gemini-models:
|
|
|
410
407
|
reasoning and longer contextual memory in multimodal scenarios including text,
|
|
411
408
|
images, video, and audio.
|
|
412
409
|
release_date: 2025-01-21
|
|
410
|
+
supports:
|
|
411
|
+
images: true
|
|
412
|
+
files: true
|
|
413
|
+
videos: true
|
|
414
|
+
metadata:
|
|
415
|
+
available_for_everyone: false
|
|
416
|
+
deprecated: true
|
|
413
417
|
properties:
|
|
414
418
|
context_window: 1_048_576
|
|
415
|
-
|
|
419
|
+
max_tokens: 65_536
|
|
416
420
|
training_cutoff: "2024-05"
|
|
417
421
|
reasoning_model: true
|
|
418
|
-
available_for_everyone: false
|
|
419
|
-
class_properties:
|
|
420
|
-
deprecated: true
|
|
421
|
-
supports_images: true
|
|
422
|
-
supports_files: true
|
|
423
|
-
supports_videos: true
|
|
424
422
|
costs_per_million_token:
|
|
425
423
|
input: 0.10
|
|
426
424
|
output: 0.70
|
|
@@ -432,18 +430,19 @@ old-gemini-models:
|
|
|
432
430
|
with a 1 million token context window and support for text, image, video, and
|
|
433
431
|
audio inputs.
|
|
434
432
|
release_date: 2025-02-05
|
|
433
|
+
supports:
|
|
434
|
+
images: true
|
|
435
|
+
files: true
|
|
436
|
+
videos: true
|
|
435
437
|
properties:
|
|
436
|
-
properties: null
|
|
437
438
|
context_window: 1_048_576
|
|
438
|
-
|
|
439
|
+
max_tokens: 8_192
|
|
439
440
|
training_cutoff: "2024-08"
|
|
440
441
|
costs_per_million_token:
|
|
441
442
|
input: 0.10
|
|
442
443
|
output: 0.40
|
|
443
|
-
|
|
444
|
-
|
|
445
|
-
supports_files: true
|
|
446
|
-
supports_videos: true
|
|
444
|
+
cache:
|
|
445
|
+
read: 0.025
|
|
447
446
|
|
|
448
447
|
google/gemini-2.0-flash-exp:
|
|
449
448
|
label: Gemini 2.0 Flash Exp
|
|
@@ -451,15 +450,16 @@ old-gemini-models:
|
|
|
451
450
|
Gemini 2.0 Flash Experimental is a developer preview for advanced
|
|
452
451
|
use cases requiring extended context and multimodal reasoning capabilities.
|
|
453
452
|
release_date: 2024-12-11
|
|
453
|
+
supports:
|
|
454
|
+
images: true
|
|
455
|
+
files: true
|
|
456
|
+
videos: true
|
|
457
|
+
metadata:
|
|
458
|
+
deprecated: true
|
|
454
459
|
properties:
|
|
455
460
|
context_window: 1_048_576
|
|
456
|
-
|
|
461
|
+
max_tokens: 8_192
|
|
457
462
|
training_cutoff: "2024-05"
|
|
458
|
-
class_properties:
|
|
459
|
-
deprecated: true
|
|
460
|
-
supports_images: true
|
|
461
|
-
supports_files: true
|
|
462
|
-
supports_videos: true
|
|
463
463
|
costs_per_million_token:
|
|
464
464
|
input: 0.075
|
|
465
465
|
output: 0.30
|
|
@@ -470,15 +470,16 @@ old-gemini-models:
|
|
|
470
470
|
Gemini 1.5 Flash is an efficient and speedy version of Gemini 1.5
|
|
471
471
|
with support for multiple data types and large contexts.
|
|
472
472
|
release_date: 2024-09-24
|
|
473
|
+
supports:
|
|
474
|
+
images: true
|
|
475
|
+
files: true
|
|
476
|
+
videos: true
|
|
477
|
+
metadata:
|
|
478
|
+
deprecated: true
|
|
473
479
|
properties:
|
|
474
480
|
context_window: 1_048_576
|
|
475
|
-
|
|
481
|
+
max_tokens: 8_192
|
|
476
482
|
training_cutoff: "2024-05"
|
|
477
|
-
class_properties:
|
|
478
|
-
deprecated: true
|
|
479
|
-
supports_images: true
|
|
480
|
-
supports_files: true
|
|
481
|
-
supports_videos: true
|
|
482
483
|
costs_per_million_token:
|
|
483
484
|
input: 0.075
|
|
484
485
|
output: 0.30
|
|
@@ -489,15 +490,16 @@ old-gemini-models:
|
|
|
489
490
|
Gemini 1.5 Flash (early release) provides fast processing with vision
|
|
490
491
|
and audio capabilities along with text understanding.
|
|
491
492
|
release_date: 2024-05-24
|
|
493
|
+
supports:
|
|
494
|
+
images: true
|
|
495
|
+
files: true
|
|
496
|
+
videos: true
|
|
497
|
+
metadata:
|
|
498
|
+
deprecated: true
|
|
492
499
|
properties:
|
|
493
500
|
context_window: 1_048_576
|
|
494
|
-
|
|
501
|
+
max_tokens: 8_192
|
|
495
502
|
training_cutoff: "2023-11"
|
|
496
|
-
class_properties:
|
|
497
|
-
deprecated: true
|
|
498
|
-
supports_images: true
|
|
499
|
-
supports_files: true
|
|
500
|
-
supports_videos: true
|
|
501
503
|
costs_per_million_token:
|
|
502
504
|
input: 0.075
|
|
503
505
|
output: 0.30
|
|
@@ -508,15 +510,16 @@ old-gemini-models:
|
|
|
508
510
|
Gemini 1.5 Pro is a high-performance model with multimodal capabilities
|
|
509
511
|
useful for complex reasoning tasks and dataset analysis.
|
|
510
512
|
release_date: 2024-09-24
|
|
513
|
+
supports:
|
|
514
|
+
images: true
|
|
515
|
+
files: true
|
|
516
|
+
videos: true
|
|
517
|
+
metadata:
|
|
518
|
+
deprecated: true
|
|
511
519
|
properties:
|
|
512
520
|
context_window: 2_097_152
|
|
513
|
-
|
|
521
|
+
max_tokens: 8_192
|
|
514
522
|
training_cutoff: "2024-05"
|
|
515
|
-
class_properties:
|
|
516
|
-
deprecated: true
|
|
517
|
-
supports_images: true
|
|
518
|
-
supports_files: true
|
|
519
|
-
supports_videos: true
|
|
520
523
|
costs_per_million_token:
|
|
521
524
|
input: 1.25
|
|
522
525
|
output: 5.0
|
|
@@ -530,15 +533,16 @@ old-gemini-models:
|
|
|
530
533
|
Gemini 1.5 Pro (early release) supports multimodal inputs and advanced
|
|
531
534
|
reasoning on moderate context lengths.
|
|
532
535
|
release_date: 2024-05-24
|
|
536
|
+
supports:
|
|
537
|
+
images: true
|
|
538
|
+
files: true
|
|
539
|
+
videos: true
|
|
540
|
+
metadata:
|
|
541
|
+
deprecated: true
|
|
533
542
|
properties:
|
|
534
543
|
context_window: 1_048_576
|
|
535
|
-
|
|
544
|
+
max_tokens: 8_192
|
|
536
545
|
training_cutoff: "2023-11"
|
|
537
|
-
class_properties:
|
|
538
|
-
deprecated: true
|
|
539
|
-
supports_images: true
|
|
540
|
-
supports_files: true
|
|
541
|
-
supports_videos: true
|
|
542
546
|
costs_per_million_token:
|
|
543
547
|
input: 1.25
|
|
544
548
|
output: 5.0
|
|
@@ -549,13 +553,14 @@ old-gemini-models:
|
|
|
549
553
|
Gemini 1.0 Pro is an earlier generation multimodal model supporting
|
|
550
554
|
text, image, and audio inputs with foundational reasoning abilities.
|
|
551
555
|
release_date: 2024-02-14
|
|
556
|
+
supports:
|
|
557
|
+
images: false
|
|
558
|
+
metadata:
|
|
559
|
+
deprecated: true
|
|
552
560
|
properties:
|
|
553
561
|
context_window: 32_760
|
|
554
|
-
|
|
562
|
+
max_tokens: 8_192
|
|
555
563
|
training_cutoff: "2023-02"
|
|
556
|
-
class_properties:
|
|
557
|
-
supports_images: false
|
|
558
|
-
deprecated: true
|
|
559
564
|
costs_per_million_token:
|
|
560
565
|
input: 0.50
|
|
561
566
|
output: 1.50
|
|
@@ -2,11 +2,12 @@ base-config:
|
|
|
2
2
|
company: Inception
|
|
3
3
|
documentation_url: https://docs.inceptionlabs.ai/get-started/models
|
|
4
4
|
open_source: false
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
5
|
+
supports:
|
|
6
|
+
images: false
|
|
7
|
+
tools: true
|
|
8
|
+
files: false
|
|
9
|
+
metadata:
|
|
8
10
|
available_as_evaluator: false
|
|
9
|
-
supports_files: false
|
|
10
11
|
available_for_everyone: true
|
|
11
12
|
ignored_for_cost: false
|
|
12
13
|
|
|
@@ -17,8 +18,7 @@ inception-models:
|
|
|
17
18
|
properties:
|
|
18
19
|
reasoning_model: false
|
|
19
20
|
context_window: 128_000
|
|
20
|
-
|
|
21
|
-
max_output_tokens: 16_400 # number lifted from https://openrouter.ai/inception/mercury
|
|
21
|
+
max_tokens: 16_384 # rounded down
|
|
22
22
|
costs_per_million_token:
|
|
23
23
|
input: 0.25
|
|
24
24
|
output: 1
|
|
@@ -2,33 +2,32 @@ base-config:
|
|
|
2
2
|
company: Kimi
|
|
3
3
|
documentation_url: https://platform.moonshot.ai/docs
|
|
4
4
|
open_source: true
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
5
|
+
supports:
|
|
6
|
+
images: false
|
|
7
|
+
tools: true
|
|
8
|
+
files: false
|
|
9
|
+
metadata:
|
|
8
10
|
available_as_evaluator: false
|
|
9
|
-
supports_files: false
|
|
10
11
|
available_for_everyone: true
|
|
11
12
|
ignored_for_cost: false
|
|
12
13
|
|
|
13
14
|
kimi-k2-models:
|
|
14
|
-
|
|
15
15
|
kimi/kimi-k2-thinking:
|
|
16
16
|
label: Kimi K2 Thinking
|
|
17
17
|
release_date: 2025-11-06
|
|
18
18
|
properties:
|
|
19
19
|
reasoning_model: true
|
|
20
|
-
context_window:
|
|
21
|
-
|
|
20
|
+
context_window: 256_000
|
|
21
|
+
max_tokens: 32_000
|
|
22
22
|
default_parameters:
|
|
23
23
|
temperature: 1.0
|
|
24
|
-
max_output_tokens: 128_000
|
|
25
24
|
costs_per_million_token:
|
|
26
|
-
input: 0.
|
|
27
|
-
output: 2.
|
|
25
|
+
input: 0.6
|
|
26
|
+
output: 2.5
|
|
27
|
+
cache:
|
|
28
|
+
read: 0.15
|
|
28
29
|
alternative_keys:
|
|
29
30
|
- fireworks/kimi-k2-thinking:
|
|
30
31
|
costs_per_million_token:
|
|
31
|
-
input: 0.
|
|
32
|
-
output:
|
|
33
|
-
cache:
|
|
34
|
-
read_discount: 1
|
|
32
|
+
input: 0.6
|
|
33
|
+
output: 2.5
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
base-config:
|
|
2
|
+
company: MiniMax
|
|
3
|
+
documentation_url: https://platform.minimax.io/docs
|
|
4
|
+
open_source: true
|
|
5
|
+
supports:
|
|
6
|
+
images: false
|
|
7
|
+
files: false
|
|
8
|
+
tools: true
|
|
9
|
+
temperature: true
|
|
10
|
+
metadata:
|
|
11
|
+
available_as_evaluator: false
|
|
12
|
+
available_for_everyone: true
|
|
13
|
+
ignored_for_cost: false
|
|
14
|
+
properties:
|
|
15
|
+
reasoning_model: false
|
|
16
|
+
|
|
17
|
+
minimax-m2-models:
|
|
18
|
+
|
|
19
|
+
minimax/MiniMax-M2:
|
|
20
|
+
label: MiniMax-M2
|
|
21
|
+
description: MiniMax-M2 is a cost-efficient open-source model optimized for agentic applications and coding in particular.
|
|
22
|
+
release_date: 2025-10-26
|
|
23
|
+
properties:
|
|
24
|
+
context_window: 204_800
|
|
25
|
+
max_tokens: 131_000
|
|
26
|
+
reasoning_model: true
|
|
27
|
+
training_cutoff: null
|
|
28
|
+
default_parameters:
|
|
29
|
+
temperature: 1.0
|
|
30
|
+
top_p: 0.95
|
|
31
|
+
costs_per_million_token:
|
|
32
|
+
input: 0.30
|
|
33
|
+
output: 1.20
|
|
34
|
+
cache:
|
|
35
|
+
read: 0.03
|
|
36
|
+
write: 0.375
|
|
37
|
+
|