model-library: model_library-0.1.3-py3-none-any.whl → model_library-0.1.4-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (36):
  1. model_library/base/base.py +2 -0
  2. model_library/base/output.py +1 -0
  3. model_library/config/README.md +169 -0
  4. model_library/config/ai21labs_models.yaml +11 -11
  5. model_library/config/alibaba_models.yaml +21 -22
  6. model_library/config/all_models.json +4572 -2598
  7. model_library/config/amazon_models.yaml +100 -102
  8. model_library/config/anthropic_models.yaml +43 -52
  9. model_library/config/cohere_models.yaml +25 -24
  10. model_library/config/deepseek_models.yaml +28 -25
  11. model_library/config/dummy_model.yaml +9 -7
  12. model_library/config/fireworks_models.yaml +86 -56
  13. model_library/config/google_models.yaml +131 -126
  14. model_library/config/inception_models.yaml +6 -6
  15. model_library/config/kimi_models.yaml +13 -14
  16. model_library/config/minimax_models.yaml +37 -0
  17. model_library/config/mistral_models.yaml +85 -29
  18. model_library/config/openai_models.yaml +192 -150
  19. model_library/config/perplexity_models.yaml +8 -23
  20. model_library/config/together_models.yaml +115 -104
  21. model_library/config/xai_models.yaml +47 -79
  22. model_library/config/zai_models.yaml +23 -15
  23. model_library/exceptions.py +6 -15
  24. model_library/providers/amazon.py +32 -17
  25. model_library/providers/minimax.py +33 -0
  26. model_library/providers/mistral.py +10 -1
  27. model_library/providers/openai.py +2 -6
  28. model_library/register_models.py +36 -36
  29. model_library/registry_utils.py +18 -16
  30. model_library/utils.py +2 -2
  31. {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/METADATA +2 -2
  32. model_library-0.1.4.dist-info/RECORD +64 -0
  33. model_library-0.1.3.dist-info/RECORD +0 -61
  34. {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/WHEEL +0 -0
  35. {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/licenses/LICENSE +0 -0
  36. {model_library-0.1.3.dist-info → model_library-0.1.4.dist-info}/top_level.txt +0 -0
@@ -2,7 +2,14 @@ base-config:
2
2
  company: Google
3
3
  documentation_url: https://ai.google.dev/gemini-api/docs/models
4
4
  open_source: false
5
- class_properties:
5
+ supports:
6
+ images: false
7
+ videos: false
8
+ files: false
9
+ batch: false
10
+ temperature: false
11
+ tools: false
12
+ metadata:
6
13
  available_for_everyone: true
7
14
  available_as_evaluator: false
8
15
  ignored_for_cost: false
@@ -21,30 +28,25 @@ gemma-models:
21
28
  use such as phones and tablets, capable of handling text, audio, and vision
22
29
  inputs with efficient parameter caching techniques.
23
30
  release_date: 2025-03-12
24
- class_properties:
31
+ metadata:
25
32
  deprecated: true
26
33
  properties:
27
34
  context_window: 131_072
28
- max_token_output: 8_192
35
+ max_tokens: 8_192
29
36
  training_cutoff: "2023-09"
30
37
  costs_per_million_token:
31
38
  input: 0.00
32
39
  output: 0.00
33
40
 
34
-
35
41
  gemini-3-models:
36
42
  base-config:
37
- properties:
38
- context_window: 1_048_576
39
- max_token_output: 8_192
40
- training_cutoff: "2025-01"
41
- class_properties:
42
- supports_images: true
43
- supports_files: true
44
- supports_videos: true
45
- supports_tools: true
46
- supports_batch_requests: true
47
- supports_temperature: true
43
+ supports:
44
+ images: true
45
+ files: true
46
+ videos: true
47
+ tools: true
48
+ batch: true
49
+ temperature: true
48
50
  costs_per_million_token:
49
51
  cache:
50
52
  read_discount: 0.1
@@ -58,41 +60,34 @@ gemini-3-models:
58
60
  release_date: 2025-11-18
59
61
  properties:
60
62
  context_window: 1048576
61
- max_token_output: 65536
63
+ max_tokens: 65536
62
64
  training_cutoff: "2025-01"
63
65
  reasoning_model: true
64
- class_properties:
65
- supports_images: true
66
- supports_files: true
67
- supports_videos: true
68
- supports_tools: true
69
- supports_batch_requests: true
70
- supports_temperature: true
71
66
  costs_per_million_token:
72
- input: 2
73
- output: 12
67
+ input: 2.0
68
+ output: 12.0
74
69
  cache:
75
70
  read: 0.20
76
71
  context:
77
72
  threshold: 200_000
78
- input: 2.5
79
- output: 15.0
73
+ input: 4.0
74
+ output: 18.0
80
75
  cache:
81
76
  read: 0.40
82
77
 
83
78
  gemini-2.5-models:
84
79
  base-config:
80
+ supports:
81
+ images: true
82
+ files: true
83
+ videos: true
84
+ tools: true
85
+ batch: true
86
+ temperature: true
85
87
  properties:
86
88
  context_window: 1_048_576
87
- max_token_output: 8_192
89
+ max_tokens: 8_192
88
90
  training_cutoff: "2024-05"
89
- class_properties:
90
- supports_images: true
91
- supports_files: true
92
- supports_videos: true
93
- supports_tools: true
94
- supports_batch_requests: true
95
- supports_temperature: true
96
91
  costs_per_million_token:
97
92
  cache:
98
93
  read_discount: 0.1
@@ -107,12 +102,12 @@ gemini-2.5-models:
107
102
  using multimodal inputs including audio, images, video, and PDFs with a context
108
103
  window exceeding 1 million tokens.
109
104
  release_date: 2025-07-17
105
+ metadata:
106
+ available_as_evaluator: true
110
107
  properties:
111
108
  context_window: 1_048_576
112
- max_token_output: 65_536
109
+ max_tokens: 65_536
113
110
  reasoning_model: true
114
- class_properties:
115
- available_as_evaluator: true
116
111
  costs_per_million_token:
117
112
  input: 1.25
118
113
  output: 10.0
@@ -132,12 +127,12 @@ gemini-2.5-models:
132
127
  large scale processing with support for multiple modalities, a 1 million token
133
128
  context window, and strong reasoning capabilities.
134
129
  release_date: 2025-07-17
130
+ metadata:
131
+ available_as_evaluator: true
135
132
  properties:
136
133
  context_window: 1_048_576
137
- max_token_output: 65_536
134
+ max_tokens: 65_536
138
135
  reasoning_model: false
139
- class_properties:
140
- available_as_evaluator: true
141
136
  costs_per_million_token:
142
137
  input: 0.30
143
138
  output: 2.50
@@ -156,7 +151,7 @@ gemini-2.5-models:
156
151
  release_date: 2025-09-25
157
152
  properties:
158
153
  context_window: 1_048_576
159
- max_token_output: 65_535
154
+ max_tokens: 65_535
160
155
  reasoning_model: false
161
156
  costs_per_million_token:
162
157
  input: 0.30
@@ -177,7 +172,7 @@ gemini-2.5-models:
177
172
  release_date: 2025-07-22
178
173
  properties:
179
174
  context_window: 1_048_576
180
- max_token_output: 65_535
175
+ max_tokens: 65_535
181
176
  reasoning_model: false
182
177
  costs_per_million_token:
183
178
  input: 0.10
@@ -198,7 +193,7 @@ gemini-2.5-models:
198
193
  release_date: 2025-09-25
199
194
  properties:
200
195
  context_window: 1_048_576
201
- max_token_output: 65_535
196
+ max_tokens: 65_535
202
197
  reasoning_model: false
203
198
  costs_per_million_token:
204
199
  input: 0.10
@@ -217,12 +212,12 @@ gemini-2.5-models:
217
212
  at scale, with support for text, images, video, and audio input modalities and
218
213
  large context length.
219
214
  release_date: 2025-06-17
215
+ metadata:
216
+ deprecated: true
220
217
  properties:
221
218
  context_window: 1_048_576
222
- max_token_output: 65_535
219
+ max_tokens: 65_535
223
220
  reasoning_model: false
224
- class_properties:
225
- deprecated: true
226
221
  costs_per_million_token:
227
222
  input: 0.10
228
223
  output: 0.40
@@ -240,13 +235,13 @@ gemini-2.5-models:
240
235
  large scale processing with support for multiple modalities, a 1 million token
241
236
  context window, and strong reasoning capabilities.
242
237
  release_date: 2025-05-20
238
+ metadata:
239
+ deprecated: true
243
240
  properties:
244
241
  context_window: 1_048_576
245
- max_token_output: 65_536
242
+ max_tokens: 65_536
246
243
  training_cutoff: "2025-01"
247
244
  reasoning_model: false
248
- class_properties:
249
- deprecated: true
250
245
  costs_per_million_token:
251
246
  input: 0.15
252
247
  output: 0.60
@@ -265,14 +260,15 @@ gemini-2.5-models:
265
260
  using multimodal inputs including audio, images, video, and PDFs with a context
266
261
  window exceeding 1 million tokens.
267
262
  release_date: 2025-06-05
263
+ supports:
264
+ batch: false
265
+ metadata:
266
+ deprecated: true
268
267
  properties:
269
268
  context_window: 1_048_576
270
- max_token_output: 65_536
269
+ max_tokens: 65_536
271
270
  training_cutoff: "2025-01"
272
271
  reasoning_model: true
273
- class_properties:
274
- supports_batch_requests: false
275
- deprecated: true
276
272
  costs_per_million_token:
277
273
  input: 1.25
278
274
  output: 10.0
@@ -287,14 +283,14 @@ gemini-2.5-models:
287
283
  using multimodal inputs including audio, images, video, and PDFs with a context
288
284
  window exceeding 1 million tokens.
289
285
  release_date: 2025-05-06
286
+ metadata:
287
+ available_for_everyone: false
288
+ deprecated: true
290
289
  properties:
291
290
  context_window: 1_048_576
292
- max_token_output: 65_536
291
+ max_tokens: 65_536
293
292
  training_cutoff: "2025-01"
294
- available_for_everyone: false
295
293
  reasoning_model: true
296
- class_properties:
297
- deprecated: true
298
294
  costs_per_million_token:
299
295
  input: 1.25
300
296
  output: 10.0
@@ -308,13 +304,13 @@ gemini-2.5-models:
308
304
  large scale processing with support for multiple modalities, a 1 million token
309
305
  context window, and strong reasoning capabilities.
310
306
  release_date: 2025-04-17
307
+ metadata:
308
+ deprecated: true
311
309
  properties:
312
310
  context_window: 1_048_576
313
- max_token_output: 65_536
311
+ max_tokens: 65_536
314
312
  training_cutoff: "2025-01"
315
313
  reasoning_model: false
316
- class_properties:
317
- deprecated: true
318
314
  costs_per_million_token:
319
315
  input: 0.3
320
316
  output: 2.5
@@ -333,14 +329,14 @@ gemini-2.5-models:
333
329
  using multimodal inputs including audio, images, video, and PDFs with a context
334
330
  window exceeding 1 million tokens.
335
331
  release_date: 2025-03-25
332
+ metadata:
333
+ available_for_everyone: false
334
+ deprecated: true
336
335
  properties:
337
336
  context_window: 1_048_576
338
- max_token_output: 65_536
337
+ max_tokens: 65_536
339
338
  training_cutoff: "2025-01"
340
- available_for_everyone: false
341
339
  reasoning_model: true
342
- class_properties:
343
- deprecated: true
344
340
  costs_per_million_token:
345
341
  input: 1.25
346
342
  output: 10.0
@@ -355,14 +351,14 @@ gemini-2.5-models:
355
351
  using multimodal inputs including audio, images, video, and PDFs with a context
356
352
  window exceeding 1 million tokens.
357
353
  release_date: 2025-04-05
354
+ metadata:
355
+ available_for_everyone: false
356
+ deprecated: true
358
357
  properties:
359
358
  context_window: 1_048_576
360
- max_token_output: 65_536
359
+ max_tokens: 65_536
361
360
  training_cutoff: "2025-01"
362
- available_for_everyone: false
363
361
  reasoning_model: true
364
- class_properties:
365
- deprecated: true
366
362
  costs_per_million_token:
367
363
  input: 1.25
368
364
  output: 10.0
@@ -371,12 +367,12 @@ gemini-2.5-models:
371
367
 
372
368
  old-gemini-models:
373
369
  base-config:
370
+ metadata:
371
+ deprecated: true
374
372
  properties:
375
373
  context_window: 2_097_152
376
- max_token_output: 8_192
374
+ max_tokens: 8_192
377
375
  training_cutoff: "2024-05"
378
- class_properties:
379
- deprecated: true
380
376
  costs_per_million_token:
381
377
  cache:
382
378
  read_discount: 0.25
@@ -388,17 +384,18 @@ old-gemini-models:
388
384
  large context processing and multimodal inputs, with strengths in speed, native
389
385
  tool use, and dataset comprehension.
390
386
  release_date: 2025-02-05
387
+ supports:
388
+ images: true
389
+ files: true
390
+ videos: true
391
+ metadata:
392
+ available_for_everyone: false
393
+ deprecated: true
391
394
  properties:
392
395
  context_window: 2_097_152
393
- max_token_output: 8_192
396
+ max_tokens: 8_192
394
397
  training_cutoff: "2024-06"
395
398
  reasoning_model: true
396
- available_for_everyone: false
397
- class_properties:
398
- deprecated: true
399
- supports_images: true
400
- supports_files: true
401
- supports_videos: true
402
399
  costs_per_million_token:
403
400
  input: 1.25
404
401
  output: 5.00
@@ -410,17 +407,18 @@ old-gemini-models:
410
407
  reasoning and longer contextual memory in multimodal scenarios including text,
411
408
  images, video, and audio.
412
409
  release_date: 2025-01-21
410
+ supports:
411
+ images: true
412
+ files: true
413
+ videos: true
414
+ metadata:
415
+ available_for_everyone: false
416
+ deprecated: true
413
417
  properties:
414
418
  context_window: 1_048_576
415
- max_token_output: 65_536
419
+ max_tokens: 65_536
416
420
  training_cutoff: "2024-05"
417
421
  reasoning_model: true
418
- available_for_everyone: false
419
- class_properties:
420
- deprecated: true
421
- supports_images: true
422
- supports_files: true
423
- supports_videos: true
424
422
  costs_per_million_token:
425
423
  input: 0.10
426
424
  output: 0.70
@@ -432,18 +430,19 @@ old-gemini-models:
432
430
  with a 1 million token context window and support for text, image, video, and
433
431
  audio inputs.
434
432
  release_date: 2025-02-05
433
+ supports:
434
+ images: true
435
+ files: true
436
+ videos: true
435
437
  properties:
436
- properties: null
437
438
  context_window: 1_048_576
438
- max_token_output: 8_192
439
+ max_tokens: 8_192
439
440
  training_cutoff: "2024-08"
440
441
  costs_per_million_token:
441
442
  input: 0.10
442
443
  output: 0.40
443
- class_properties:
444
- supports_images: true
445
- supports_files: true
446
- supports_videos: true
444
+ cache:
445
+ read: 0.025
447
446
 
448
447
  google/gemini-2.0-flash-exp:
449
448
  label: Gemini 2.0 Flash Exp
@@ -451,15 +450,16 @@ old-gemini-models:
451
450
  Gemini 2.0 Flash Experimental is a developer preview for advanced
452
451
  use cases requiring extended context and multimodal reasoning capabilities.
453
452
  release_date: 2024-12-11
453
+ supports:
454
+ images: true
455
+ files: true
456
+ videos: true
457
+ metadata:
458
+ deprecated: true
454
459
  properties:
455
460
  context_window: 1_048_576
456
- max_token_output: 8_192
461
+ max_tokens: 8_192
457
462
  training_cutoff: "2024-05"
458
- class_properties:
459
- deprecated: true
460
- supports_images: true
461
- supports_files: true
462
- supports_videos: true
463
463
  costs_per_million_token:
464
464
  input: 0.075
465
465
  output: 0.30
@@ -470,15 +470,16 @@ old-gemini-models:
470
470
  Gemini 1.5 Flash is an efficient and speedy version of Gemini 1.5
471
471
  with support for multiple data types and large contexts.
472
472
  release_date: 2024-09-24
473
+ supports:
474
+ images: true
475
+ files: true
476
+ videos: true
477
+ metadata:
478
+ deprecated: true
473
479
  properties:
474
480
  context_window: 1_048_576
475
- max_token_output: 8_192
481
+ max_tokens: 8_192
476
482
  training_cutoff: "2024-05"
477
- class_properties:
478
- deprecated: true
479
- supports_images: true
480
- supports_files: true
481
- supports_videos: true
482
483
  costs_per_million_token:
483
484
  input: 0.075
484
485
  output: 0.30
@@ -489,15 +490,16 @@ old-gemini-models:
489
490
  Gemini 1.5 Flash (early release) provides fast processing with vision
490
491
  and audio capabilities along with text understanding.
491
492
  release_date: 2024-05-24
493
+ supports:
494
+ images: true
495
+ files: true
496
+ videos: true
497
+ metadata:
498
+ deprecated: true
492
499
  properties:
493
500
  context_window: 1_048_576
494
- max_token_output: 8_192
501
+ max_tokens: 8_192
495
502
  training_cutoff: "2023-11"
496
- class_properties:
497
- deprecated: true
498
- supports_images: true
499
- supports_files: true
500
- supports_videos: true
501
503
  costs_per_million_token:
502
504
  input: 0.075
503
505
  output: 0.30
@@ -508,15 +510,16 @@ old-gemini-models:
508
510
  Gemini 1.5 Pro is a high-performance model with multimodal capabilities
509
511
  useful for complex reasoning tasks and dataset analysis.
510
512
  release_date: 2024-09-24
513
+ supports:
514
+ images: true
515
+ files: true
516
+ videos: true
517
+ metadata:
518
+ deprecated: true
511
519
  properties:
512
520
  context_window: 2_097_152
513
- max_token_output: 8_192
521
+ max_tokens: 8_192
514
522
  training_cutoff: "2024-05"
515
- class_properties:
516
- deprecated: true
517
- supports_images: true
518
- supports_files: true
519
- supports_videos: true
520
523
  costs_per_million_token:
521
524
  input: 1.25
522
525
  output: 5.0
@@ -530,15 +533,16 @@ old-gemini-models:
530
533
  Gemini 1.5 Pro (early release) supports multimodal inputs and advanced
531
534
  reasoning on moderate context lengths.
532
535
  release_date: 2024-05-24
536
+ supports:
537
+ images: true
538
+ files: true
539
+ videos: true
540
+ metadata:
541
+ deprecated: true
533
542
  properties:
534
543
  context_window: 1_048_576
535
- max_token_output: 8_192
544
+ max_tokens: 8_192
536
545
  training_cutoff: "2023-11"
537
- class_properties:
538
- deprecated: true
539
- supports_images: true
540
- supports_files: true
541
- supports_videos: true
542
546
  costs_per_million_token:
543
547
  input: 1.25
544
548
  output: 5.0
@@ -549,13 +553,14 @@ old-gemini-models:
549
553
  Gemini 1.0 Pro is an earlier generation multimodal model supporting
550
554
  text, image, and audio inputs with foundational reasoning abilities.
551
555
  release_date: 2024-02-14
556
+ supports:
557
+ images: false
558
+ metadata:
559
+ deprecated: true
552
560
  properties:
553
561
  context_window: 32_760
554
- max_token_output: 8_192
562
+ max_tokens: 8_192
555
563
  training_cutoff: "2023-02"
556
- class_properties:
557
- supports_images: false
558
- deprecated: true
559
564
  costs_per_million_token:
560
565
  input: 0.50
561
566
  output: 1.50
@@ -2,11 +2,12 @@ base-config:
2
2
  company: Inception
3
3
  documentation_url: https://docs.inceptionlabs.ai/get-started/models
4
4
  open_source: false
5
- class_properties:
6
- supports_images: false
7
- supports_tools: true
5
+ supports:
6
+ images: false
7
+ tools: true
8
+ files: false
9
+ metadata:
8
10
  available_as_evaluator: false
9
- supports_files: false
10
11
  available_for_everyone: true
11
12
  ignored_for_cost: false
12
13
 
@@ -17,8 +18,7 @@ inception-models:
17
18
  properties:
18
19
  reasoning_model: false
19
20
  context_window: 128_000
20
- default_parameters:
21
- max_output_tokens: 16_400 # number lifted from https://openrouter.ai/inception/mercury
21
+ max_tokens: 16_384 # rounded down
22
22
  costs_per_million_token:
23
23
  input: 0.25
24
24
  output: 1
@@ -2,33 +2,32 @@ base-config:
2
2
  company: Kimi
3
3
  documentation_url: https://platform.moonshot.ai/docs
4
4
  open_source: true
5
- class_properties:
6
- supports_images: false
7
- supports_tools: true
5
+ supports:
6
+ images: false
7
+ tools: true
8
+ files: false
9
+ metadata:
8
10
  available_as_evaluator: false
9
- supports_files: false
10
11
  available_for_everyone: true
11
12
  ignored_for_cost: false
12
13
 
13
14
  kimi-k2-models:
14
-
15
15
  kimi/kimi-k2-thinking:
16
16
  label: Kimi K2 Thinking
17
17
  release_date: 2025-11-06
18
18
  properties:
19
19
  reasoning_model: true
20
- context_window: 128_000
21
- max_token_output: 128_000
20
+ context_window: 256_000
21
+ max_tokens: 32_000
22
22
  default_parameters:
23
23
  temperature: 1.0
24
- max_output_tokens: 128_000
25
24
  costs_per_million_token:
26
- input: 0.60
27
- output: 2.50
25
+ input: 0.6
26
+ output: 2.5
27
+ cache:
28
+ read: 0.15
28
29
  alternative_keys:
29
30
  - fireworks/kimi-k2-thinking:
30
31
  costs_per_million_token:
31
- input: 0.50
32
- output: 0.50
33
- cache:
34
- read_discount: 1
32
+ input: 0.6
33
+ output: 2.5
@@ -0,0 +1,37 @@
1
+ base-config:
2
+ company: MiniMax
3
+ documentation_url: https://platform.minimax.io/docs
4
+ open_source: true
5
+ supports:
6
+ images: false
7
+ files: false
8
+ tools: true
9
+ temperature: true
10
+ metadata:
11
+ available_as_evaluator: false
12
+ available_for_everyone: true
13
+ ignored_for_cost: false
14
+ properties:
15
+ reasoning_model: false
16
+
17
+ minimax-m2-models:
18
+
19
+ minimax/MiniMax-M2:
20
+ label: MiniMax-M2
21
+ description: MiniMax-M2 is a cost-efficient open-source model optimized for agentic applications and coding in particular.
22
+ release_date: 2025-10-26
23
+ properties:
24
+ context_window: 204_800
25
+ max_tokens: 131_000
26
+ reasoning_model: true
27
+ training_cutoff: null
28
+ default_parameters:
29
+ temperature: 1.0
30
+ top_p: 0.95
31
+ costs_per_million_token:
32
+ input: 0.30
33
+ output: 1.20
34
+ cache:
35
+ read: 0.03
36
+ write: 0.375
37
+