model-library 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- model_library/base/base.py +13 -6
- model_library/base/output.py +55 -0
- model_library/base/utils.py +3 -2
- model_library/config/README.md +169 -0
- model_library/config/ai21labs_models.yaml +11 -10
- model_library/config/alibaba_models.yaml +21 -22
- model_library/config/all_models.json +4708 -2471
- model_library/config/amazon_models.yaml +100 -102
- model_library/config/anthropic_models.yaml +59 -45
- model_library/config/cohere_models.yaml +25 -24
- model_library/config/deepseek_models.yaml +28 -25
- model_library/config/dummy_model.yaml +9 -7
- model_library/config/fireworks_models.yaml +86 -56
- model_library/config/google_models.yaml +156 -102
- model_library/config/inception_models.yaml +6 -6
- model_library/config/kimi_models.yaml +13 -14
- model_library/config/minimax_models.yaml +37 -0
- model_library/config/mistral_models.yaml +85 -29
- model_library/config/openai_models.yaml +192 -159
- model_library/config/perplexity_models.yaml +8 -23
- model_library/config/together_models.yaml +115 -103
- model_library/config/xai_models.yaml +85 -57
- model_library/config/zai_models.yaml +23 -15
- model_library/exceptions.py +12 -17
- model_library/file_utils.py +1 -1
- model_library/providers/amazon.py +32 -17
- model_library/providers/anthropic.py +2 -6
- model_library/providers/google/google.py +35 -29
- model_library/providers/minimax.py +33 -0
- model_library/providers/mistral.py +10 -1
- model_library/providers/openai.py +10 -8
- model_library/providers/together.py +18 -211
- model_library/register_models.py +36 -38
- model_library/registry_utils.py +18 -16
- model_library/utils.py +2 -2
- {model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/METADATA +3 -4
- model_library-0.1.4.dist-info/RECORD +64 -0
- model_library-0.1.2.dist-info/RECORD +0 -61
- {model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/WHEEL +0 -0
- {model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/licenses/LICENSE +0 -0
- {model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/top_level.txt +0 -0
|
@@ -1,12 +1,14 @@
|
|
|
1
1
|
base-config:
|
|
2
2
|
company: OpenAI
|
|
3
3
|
open_source: false
|
|
4
|
-
|
|
5
|
-
|
|
4
|
+
supports:
|
|
5
|
+
images: false
|
|
6
|
+
files: false
|
|
7
|
+
tools: true
|
|
8
|
+
batch: true
|
|
9
|
+
temperature: true
|
|
10
|
+
metadata:
|
|
6
11
|
available_as_evaluator: false
|
|
7
|
-
supports_files: false
|
|
8
|
-
supports_tools: true
|
|
9
|
-
supports_batch_requests: true
|
|
10
12
|
available_for_everyone: true
|
|
11
13
|
ignored_for_cost: false
|
|
12
14
|
properties:
|
|
@@ -17,21 +19,63 @@ base-config:
|
|
|
17
19
|
output_discount: 0.5
|
|
18
20
|
default_parameters:
|
|
19
21
|
reasoning_effort: "high"
|
|
20
|
-
|
|
21
22
|
gpt-5-models:
|
|
22
23
|
base-config:
|
|
23
24
|
documentation_url: ""
|
|
25
|
+
supports:
|
|
26
|
+
images: true
|
|
27
|
+
files: true
|
|
28
|
+
tools: true
|
|
29
|
+
temperature: false
|
|
30
|
+
metadata:
|
|
31
|
+
available_for_everyone: false
|
|
24
32
|
properties:
|
|
25
33
|
context_window: 400_000
|
|
26
|
-
|
|
34
|
+
max_tokens: 128_000
|
|
35
|
+
training_cutoff: "2024-09"
|
|
27
36
|
reasoning_model: true
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
37
|
+
|
|
38
|
+
openai/gpt-5.2-2025-12-11:
|
|
39
|
+
label: GPT 5.2
|
|
40
|
+
documentation_url: https://platform.openai.com/docs/models/gpt-5.2
|
|
41
|
+
description: GPT-5.2 is OpenAI's most advanced frontier model for everyday professional use and agentic tasks, with leading long-context reasoning, multi-step tool use, and vision capabilities.
|
|
42
|
+
release_date: 2025-12-11
|
|
43
|
+
properties:
|
|
44
|
+
context_window: 400_000
|
|
45
|
+
metadata:
|
|
46
|
+
available_as_evaluator: true
|
|
47
|
+
costs_per_million_token:
|
|
48
|
+
input: 1.75
|
|
49
|
+
output: 14
|
|
50
|
+
cache:
|
|
51
|
+
read: 0.175
|
|
52
|
+
default_parameters:
|
|
53
|
+
reasoning_effort: "xhigh"
|
|
54
|
+
alternative_keys:
|
|
55
|
+
- openai/gpt-5.2
|
|
56
|
+
|
|
57
|
+
openai/gpt-5.2-pro-2025-12-11:
|
|
58
|
+
label: GPT 5.2 Pro
|
|
59
|
+
documentation_url: https://platform.openai.com/docs/models/gpt-5.2-pro
|
|
60
|
+
description: GPT-5.2 Pro is a higher-compute version of GPT-5.2 designed for stronger, more consistent reasoning on complex tasks.
|
|
61
|
+
release_date: 2025-12-11
|
|
62
|
+
properties:
|
|
63
|
+
context_window: 400_000
|
|
64
|
+
costs_per_million_token:
|
|
65
|
+
input: 21
|
|
66
|
+
output: 168
|
|
67
|
+
alternative_keys:
|
|
68
|
+
- openai/gpt-5.2-pro
|
|
69
|
+
|
|
70
|
+
openai/gpt-5.1-codex-max:
|
|
71
|
+
label: GPT 5.1 Codex Max
|
|
72
|
+
release_date: 2025-12-04
|
|
73
|
+
description: OpenAI's frontier agentic coding model. Good at long-running coding tasks.
|
|
74
|
+
costs_per_million_token:
|
|
75
|
+
input: 1.25
|
|
76
|
+
output: 10.0
|
|
77
|
+
cache:
|
|
78
|
+
read: 0.125
|
|
35
79
|
openai/gpt-5.1-codex:
|
|
36
80
|
label: GPT 5.1 Codex
|
|
37
81
|
documentation_url: https://platform.openai.com/docs/models/gpt-5.1-codex
|
|
@@ -42,9 +86,6 @@ gpt-5-models:
|
|
|
42
86
|
output: 10.0
|
|
43
87
|
cache:
|
|
44
88
|
read: 0.125
|
|
45
|
-
default_parameters:
|
|
46
|
-
temperature: 1
|
|
47
|
-
max_output_tokens: 128_000
|
|
48
89
|
|
|
49
90
|
openai/gpt-5.1-codex-mini:
|
|
50
91
|
label: GPT 5.1 Codex Mini
|
|
@@ -56,9 +97,6 @@ gpt-5-models:
|
|
|
56
97
|
output: 2.00
|
|
57
98
|
cache:
|
|
58
99
|
read: 0.025
|
|
59
|
-
default_parameters:
|
|
60
|
-
temperature: 1
|
|
61
|
-
max_output_tokens: 128_000
|
|
62
100
|
|
|
63
101
|
openai/gpt-5-codex:
|
|
64
102
|
label: GPT 5 Codex
|
|
@@ -70,34 +108,19 @@ gpt-5-models:
|
|
|
70
108
|
output: 10.0
|
|
71
109
|
cache:
|
|
72
110
|
read: 0.125
|
|
73
|
-
properties:
|
|
74
|
-
training_cutoff: "2024-09"
|
|
75
|
-
class_properties:
|
|
76
|
-
available_as_evaluator: true
|
|
77
|
-
supports_images: true
|
|
78
|
-
default_parameters:
|
|
79
|
-
temperature: 1
|
|
80
|
-
max_output_tokens: 128_000
|
|
81
111
|
|
|
82
|
-
|
|
83
112
|
openai/gpt-5.1-2025-11-13:
|
|
84
113
|
label: GPT 5.1
|
|
85
114
|
documentation_url: https://platform.openai.com/docs/models/gpt-5.1
|
|
86
115
|
description: GPT-5.1 is OpenAI's flagship model for coding and agentic tasks with configurable reasoning and non-reasoning effort.
|
|
87
116
|
release_date: 2025-11-13
|
|
117
|
+
metadata:
|
|
118
|
+
available_as_evaluator: true
|
|
88
119
|
costs_per_million_token:
|
|
89
120
|
input: 1.25
|
|
90
121
|
output: 10
|
|
91
122
|
cache:
|
|
92
123
|
read: 0.125
|
|
93
|
-
properties:
|
|
94
|
-
training_cutoff: "2024-09"
|
|
95
|
-
class_properties:
|
|
96
|
-
available_as_evaluator: true
|
|
97
|
-
supports_images: true
|
|
98
|
-
default_parameters:
|
|
99
|
-
temperature: 1
|
|
100
|
-
max_output_tokens: 128_000
|
|
101
124
|
|
|
102
125
|
openai/gpt-5-2025-08-07:
|
|
103
126
|
label: GPT 5
|
|
@@ -111,12 +134,10 @@ gpt-5-models:
|
|
|
111
134
|
read: 0.125
|
|
112
135
|
properties:
|
|
113
136
|
training_cutoff: "2025-07"
|
|
114
|
-
|
|
137
|
+
supports:
|
|
138
|
+
images: true
|
|
139
|
+
metadata:
|
|
115
140
|
available_as_evaluator: true
|
|
116
|
-
supports_images: true
|
|
117
|
-
default_parameters:
|
|
118
|
-
temperature: 1
|
|
119
|
-
max_output_tokens: 128_000
|
|
120
141
|
alternative_keys:
|
|
121
142
|
- azure/gpt-5-2025-08-07
|
|
122
143
|
|
|
@@ -132,11 +153,6 @@ gpt-5-models:
|
|
|
132
153
|
read: 0.025
|
|
133
154
|
properties:
|
|
134
155
|
training_cutoff: "2024-05"
|
|
135
|
-
default_parameters:
|
|
136
|
-
temperature: 1
|
|
137
|
-
max_output_tokens: 128_000
|
|
138
|
-
class_properties:
|
|
139
|
-
supports_images: true
|
|
140
156
|
alternative_keys:
|
|
141
157
|
- azure/gpt-5-mini-2025-08-07
|
|
142
158
|
|
|
@@ -150,25 +166,19 @@ gpt-5-models:
|
|
|
150
166
|
output: 0.4
|
|
151
167
|
cache:
|
|
152
168
|
read: 0.005
|
|
153
|
-
properties:
|
|
154
|
-
training_cutoff: "2024-05"
|
|
155
|
-
default_parameters:
|
|
156
|
-
temperature: 1
|
|
157
|
-
max_output_tokens: 128_000
|
|
158
|
-
class_properties:
|
|
159
|
-
supports_images: true
|
|
160
169
|
alternative_keys:
|
|
161
170
|
- azure/gpt-5-nano-2025-08-07
|
|
162
171
|
|
|
163
172
|
o4-models:
|
|
164
173
|
base-config:
|
|
165
174
|
documentation_url: https://platform.openai.com/docs/models#o4
|
|
175
|
+
supports:
|
|
176
|
+
tools: true
|
|
177
|
+
temperature: false
|
|
178
|
+
metadata:
|
|
179
|
+
deprecated: true
|
|
166
180
|
properties:
|
|
167
181
|
reasoning_model: true
|
|
168
|
-
class_properties:
|
|
169
|
-
deprecated: true
|
|
170
|
-
supports_temperature: false
|
|
171
|
-
supports_tools: true
|
|
172
182
|
|
|
173
183
|
openai/o4-mini-2025-04-16:
|
|
174
184
|
label: o4 Mini
|
|
@@ -177,14 +187,15 @@ o4-models:
|
|
|
177
187
|
release_date: 2025-04-16
|
|
178
188
|
properties:
|
|
179
189
|
context_window: 200_000
|
|
180
|
-
|
|
190
|
+
max_tokens: 100_000
|
|
181
191
|
training_cutoff: "2024-05-31"
|
|
182
192
|
reasoning_model: true
|
|
183
|
-
|
|
193
|
+
supports:
|
|
194
|
+
images: true
|
|
195
|
+
temperature: false
|
|
196
|
+
metadata:
|
|
184
197
|
available_for_everyone: true
|
|
185
|
-
supports_temperature: false
|
|
186
198
|
deprecated: false
|
|
187
|
-
supports_images: true
|
|
188
199
|
costs_per_million_token:
|
|
189
200
|
input: 1.1
|
|
190
201
|
output: 4.4
|
|
@@ -197,12 +208,12 @@ gpt-4.1-models:
|
|
|
197
208
|
base-config:
|
|
198
209
|
documentation_url: https://platform.openai.com/docs/models/gpt-4.1
|
|
199
210
|
release_date: 2025-04-14
|
|
200
|
-
|
|
201
|
-
|
|
202
|
-
|
|
211
|
+
supports:
|
|
212
|
+
images: true
|
|
213
|
+
temperature: true
|
|
203
214
|
properties:
|
|
204
215
|
context_window: 1_047_576
|
|
205
|
-
|
|
216
|
+
max_tokens: 32_768
|
|
206
217
|
training_cutoff: "2024-05-31"
|
|
207
218
|
default_parameters:
|
|
208
219
|
temperature: 1
|
|
@@ -216,8 +227,8 @@ gpt-4.1-models:
|
|
|
216
227
|
cache:
|
|
217
228
|
read: 0.5
|
|
218
229
|
documentation_url: https://platform.openai.com/docs/models/gpt-4.1
|
|
219
|
-
|
|
220
|
-
|
|
230
|
+
supports:
|
|
231
|
+
images: true
|
|
221
232
|
alternative_keys:
|
|
222
233
|
- azure/gpt-4.1-2025-04-14
|
|
223
234
|
|
|
@@ -230,8 +241,8 @@ gpt-4.1-models:
|
|
|
230
241
|
cache:
|
|
231
242
|
read: 0.1
|
|
232
243
|
documentation_url: https://platform.openai.com/docs/models/gpt-4.1-mini
|
|
233
|
-
|
|
234
|
-
|
|
244
|
+
supports:
|
|
245
|
+
images: true
|
|
235
246
|
alternative_keys:
|
|
236
247
|
- azure/gpt-4.1-mini-2025-04-14
|
|
237
248
|
|
|
@@ -244,17 +255,18 @@ gpt-4.1-models:
|
|
|
244
255
|
cache:
|
|
245
256
|
read: 0.025
|
|
246
257
|
documentation_url: https://platform.openai.com/docs/models/gpt-4.1-nano
|
|
247
|
-
|
|
248
|
-
|
|
258
|
+
supports:
|
|
259
|
+
images: true
|
|
249
260
|
alternative_keys:
|
|
250
261
|
- azure/gpt-4.1-nano-2025-04-14
|
|
251
262
|
|
|
252
263
|
gpt-4.5-models:
|
|
253
264
|
base-config:
|
|
254
265
|
documentation_url: https://platform.openai.com/docs/models#gpt-4-5
|
|
255
|
-
|
|
266
|
+
supports:
|
|
267
|
+
images: true
|
|
268
|
+
metadata:
|
|
256
269
|
deprecated: true
|
|
257
|
-
supports_images: true
|
|
258
270
|
|
|
259
271
|
openai/gpt-4.5-preview-2025-02-27:
|
|
260
272
|
label: GPT 4.5 Preview
|
|
@@ -262,7 +274,7 @@ gpt-4.5-models:
|
|
|
262
274
|
release_date: 2025-02-27
|
|
263
275
|
properties:
|
|
264
276
|
context_window: 128_000
|
|
265
|
-
|
|
277
|
+
max_tokens: 16_384
|
|
266
278
|
training_cutoff: "2023-10"
|
|
267
279
|
costs_per_million_token:
|
|
268
280
|
input: 75
|
|
@@ -270,16 +282,16 @@ gpt-4.5-models:
|
|
|
270
282
|
cache:
|
|
271
283
|
read: 37.5
|
|
272
284
|
documentation_url: https://platform.openai.com/docs/models/gpt-4.5-preview
|
|
273
|
-
|
|
274
|
-
|
|
285
|
+
supports:
|
|
286
|
+
images: true
|
|
275
287
|
|
|
276
288
|
o3-models:
|
|
277
289
|
base-config:
|
|
278
290
|
documentation_url: https://platform.openai.com/docs/models#o3-mini
|
|
291
|
+
supports:
|
|
292
|
+
tools: true
|
|
279
293
|
properties:
|
|
280
294
|
reasoning_model: true
|
|
281
|
-
class_properties:
|
|
282
|
-
supports_tools: true
|
|
283
295
|
|
|
284
296
|
openai/o3-2025-04-16:
|
|
285
297
|
label: o3
|
|
@@ -288,13 +300,14 @@ o3-models:
|
|
|
288
300
|
release_date: 2025-04-16
|
|
289
301
|
properties:
|
|
290
302
|
context_window: 200_000
|
|
291
|
-
|
|
303
|
+
max_tokens: 100_000
|
|
292
304
|
training_cutoff: "2024-05-31"
|
|
293
305
|
reasoning_model: true
|
|
294
|
-
|
|
306
|
+
supports:
|
|
307
|
+
images: true
|
|
308
|
+
temperature: false
|
|
309
|
+
metadata:
|
|
295
310
|
available_for_everyone: true
|
|
296
|
-
supports_images: true
|
|
297
|
-
supports_temperature: false
|
|
298
311
|
costs_per_million_token:
|
|
299
312
|
input: 2
|
|
300
313
|
output: 8
|
|
@@ -309,7 +322,7 @@ o3-models:
|
|
|
309
322
|
release_date: 2025-01-31
|
|
310
323
|
properties:
|
|
311
324
|
context_window: 200_000
|
|
312
|
-
|
|
325
|
+
max_tokens: 100_000
|
|
313
326
|
training_cutoff: "2023-10"
|
|
314
327
|
reasoning_model: true
|
|
315
328
|
costs_per_million_token:
|
|
@@ -317,7 +330,7 @@ o3-models:
|
|
|
317
330
|
output: 4.4
|
|
318
331
|
cache:
|
|
319
332
|
read: 0.55
|
|
320
|
-
|
|
333
|
+
metadata:
|
|
321
334
|
available_for_everyone: false
|
|
322
335
|
documentation_url: https://platform.openai.com/docs/models/o3-mini
|
|
323
336
|
|
|
@@ -327,7 +340,7 @@ o3-models:
|
|
|
327
340
|
release_date: 2025-01-31
|
|
328
341
|
properties:
|
|
329
342
|
context_window: 200_000
|
|
330
|
-
|
|
343
|
+
max_tokens: 100_000
|
|
331
344
|
training_cutoff: "2023-10"
|
|
332
345
|
reasoning_model: true
|
|
333
346
|
costs_per_million_token:
|
|
@@ -335,9 +348,10 @@ o3-models:
|
|
|
335
348
|
output: 4.4
|
|
336
349
|
cache:
|
|
337
350
|
read: 0.55
|
|
338
|
-
|
|
351
|
+
supports:
|
|
352
|
+
temperature: false
|
|
353
|
+
metadata:
|
|
339
354
|
available_for_everyone: false
|
|
340
|
-
supports_temperature: false
|
|
341
355
|
documentation_url: https://platform.openai.com/docs/models/o3-mini
|
|
342
356
|
alternative_keys:
|
|
343
357
|
- azure/o3-mini-2025-01-31
|
|
@@ -348,7 +362,7 @@ o3-models:
|
|
|
348
362
|
release_date: 2025-06-10
|
|
349
363
|
properties:
|
|
350
364
|
context_window: 200_000
|
|
351
|
-
|
|
365
|
+
max_tokens: 100_000
|
|
352
366
|
training_cutoff: "2024-05-31"
|
|
353
367
|
reasoning_model: true
|
|
354
368
|
costs_per_million_token:
|
|
@@ -356,25 +370,26 @@ o3-models:
|
|
|
356
370
|
output: 80
|
|
357
371
|
cache:
|
|
358
372
|
read_discount: 1
|
|
359
|
-
|
|
373
|
+
supports:
|
|
374
|
+
images: true
|
|
375
|
+
temperature: false
|
|
376
|
+
metadata:
|
|
360
377
|
available_for_everyone: false
|
|
361
|
-
supports_images: true
|
|
362
|
-
supports_temperature: false
|
|
363
378
|
documentation_url: https://platform.openai.com/docs/models/o3-pro
|
|
364
379
|
|
|
365
380
|
deep-research-models:
|
|
366
381
|
base-config:
|
|
367
382
|
documentation_url: https://platform.openai.com/docs/deep-research
|
|
383
|
+
supports:
|
|
384
|
+
images: true
|
|
385
|
+
files: true
|
|
386
|
+
tools: true
|
|
387
|
+
temperature: false
|
|
368
388
|
properties:
|
|
369
389
|
context_window: 200_000
|
|
370
|
-
|
|
390
|
+
max_tokens: 100_000
|
|
371
391
|
training_cutoff: "2024-05-31"
|
|
372
392
|
reasoning_model: true
|
|
373
|
-
class_properties:
|
|
374
|
-
supports_temperature: false
|
|
375
|
-
supports_images: true
|
|
376
|
-
supports_files: true
|
|
377
|
-
supports_tools: true
|
|
378
393
|
provider_properties:
|
|
379
394
|
deep_research: true
|
|
380
395
|
|
|
@@ -389,9 +404,10 @@ deep-research-models:
|
|
|
389
404
|
output: 40
|
|
390
405
|
cache:
|
|
391
406
|
read: 2.5
|
|
392
|
-
|
|
407
|
+
supports:
|
|
408
|
+
images: true
|
|
409
|
+
metadata:
|
|
393
410
|
available_for_everyone: true
|
|
394
|
-
supports_images: true
|
|
395
411
|
documentation_url: https://platform.openai.com/docs/models/o3-deep-research
|
|
396
412
|
|
|
397
413
|
openai/o3-deep-research:
|
|
@@ -405,9 +421,10 @@ deep-research-models:
|
|
|
405
421
|
output: 40
|
|
406
422
|
cache:
|
|
407
423
|
read: 2.5
|
|
408
|
-
|
|
424
|
+
supports:
|
|
425
|
+
images: true
|
|
426
|
+
metadata:
|
|
409
427
|
available_for_everyone: true
|
|
410
|
-
supports_images: true
|
|
411
428
|
documentation_url: https://platform.openai.com/docs/models/o3-deep-research
|
|
412
429
|
|
|
413
430
|
openai/o4-mini-deep-research-2025-06-26:
|
|
@@ -419,9 +436,10 @@ deep-research-models:
|
|
|
419
436
|
output: 8
|
|
420
437
|
cache:
|
|
421
438
|
read: 0.5
|
|
422
|
-
|
|
439
|
+
supports:
|
|
440
|
+
images: true
|
|
441
|
+
metadata:
|
|
423
442
|
available_for_everyone: true
|
|
424
|
-
supports_images: true
|
|
425
443
|
documentation_url: https://platform.openai.com/docs/models/o4-mini-deep-research
|
|
426
444
|
|
|
427
445
|
openai/o4-mini-deep-research:
|
|
@@ -433,19 +451,21 @@ deep-research-models:
|
|
|
433
451
|
output: 8
|
|
434
452
|
cache:
|
|
435
453
|
read: 0.5
|
|
436
|
-
|
|
454
|
+
supports:
|
|
455
|
+
images: true
|
|
456
|
+
metadata:
|
|
437
457
|
available_for_everyone: true
|
|
438
|
-
supports_images: true
|
|
439
458
|
documentation_url: https://platform.openai.com/docs/models/o4-mini-deep-research
|
|
440
459
|
|
|
441
460
|
o1-models:
|
|
442
461
|
base-config:
|
|
443
462
|
documentation_url: https://platform.openai.com/docs/models#o1
|
|
463
|
+
supports:
|
|
464
|
+
temperature: false
|
|
465
|
+
metadata:
|
|
466
|
+
deprecated: true
|
|
444
467
|
properties:
|
|
445
468
|
reasoning_model: true
|
|
446
|
-
class_properties:
|
|
447
|
-
deprecated: true
|
|
448
|
-
supports_temperature: false
|
|
449
469
|
|
|
450
470
|
openai/o1-2024-12-17:
|
|
451
471
|
label: o1
|
|
@@ -453,7 +473,7 @@ o1-models:
|
|
|
453
473
|
release_date: 2024-12-17
|
|
454
474
|
properties:
|
|
455
475
|
context_window: 200_000
|
|
456
|
-
|
|
476
|
+
max_tokens: 100_000
|
|
457
477
|
training_cutoff: "2023-10"
|
|
458
478
|
reasoning_model: true
|
|
459
479
|
costs_per_million_token:
|
|
@@ -461,8 +481,9 @@ o1-models:
|
|
|
461
481
|
output: 60.0
|
|
462
482
|
cache:
|
|
463
483
|
read: 7.5
|
|
464
|
-
|
|
465
|
-
|
|
484
|
+
supports:
|
|
485
|
+
images: true
|
|
486
|
+
metadata:
|
|
466
487
|
available_for_everyone: false
|
|
467
488
|
deprecated: false
|
|
468
489
|
documentation_url: https://platform.openai.com/docs/models/o1
|
|
@@ -479,7 +500,7 @@ o1-models:
|
|
|
479
500
|
release_date: 2024-09-12
|
|
480
501
|
properties:
|
|
481
502
|
context_window: 128_000
|
|
482
|
-
|
|
503
|
+
max_tokens: 32_768
|
|
483
504
|
training_cutoff: "2023-10"
|
|
484
505
|
reasoning_model: true
|
|
485
506
|
costs_per_million_token:
|
|
@@ -487,9 +508,10 @@ o1-models:
|
|
|
487
508
|
output: 60.0
|
|
488
509
|
cache:
|
|
489
510
|
read: 7.5
|
|
490
|
-
|
|
511
|
+
supports:
|
|
512
|
+
temperature: false
|
|
513
|
+
metadata:
|
|
491
514
|
available_for_everyone: false
|
|
492
|
-
supports_temperature: false
|
|
493
515
|
documentation_url: https://platform.openai.com/docs/models/o1-preview
|
|
494
516
|
|
|
495
517
|
openai/o1-preview-2024-09-12:
|
|
@@ -498,7 +520,7 @@ o1-models:
|
|
|
498
520
|
release_date: 2024-09-12
|
|
499
521
|
properties:
|
|
500
522
|
context_window: 128_000
|
|
501
|
-
|
|
523
|
+
max_tokens: 32_768
|
|
502
524
|
training_cutoff: "2023-10"
|
|
503
525
|
reasoning_model: true
|
|
504
526
|
costs_per_million_token:
|
|
@@ -506,7 +528,7 @@ o1-models:
|
|
|
506
528
|
output: 60.0
|
|
507
529
|
cache:
|
|
508
530
|
read: 7.5
|
|
509
|
-
|
|
531
|
+
metadata:
|
|
510
532
|
available_for_everyone: false
|
|
511
533
|
documentation_url: https://platform.openai.com/docs/models/o1-preview
|
|
512
534
|
alternative_keys:
|
|
@@ -518,7 +540,7 @@ o1-models:
|
|
|
518
540
|
release_date: 2024-09-12
|
|
519
541
|
properties:
|
|
520
542
|
context_window: 128_000
|
|
521
|
-
|
|
543
|
+
max_tokens: 65_536
|
|
522
544
|
training_cutoff: "2023-10"
|
|
523
545
|
reasoning_model: true
|
|
524
546
|
costs_per_million_token:
|
|
@@ -526,7 +548,7 @@ o1-models:
|
|
|
526
548
|
output: 4.4
|
|
527
549
|
cache:
|
|
528
550
|
read: 0.55
|
|
529
|
-
|
|
551
|
+
metadata:
|
|
530
552
|
available_for_everyone: true
|
|
531
553
|
deprecated: true
|
|
532
554
|
documentation_url: https://platform.openai.com/docs/models/o1-mini
|
|
@@ -537,12 +559,12 @@ o1-models:
|
|
|
537
559
|
gpt-4o-models:
|
|
538
560
|
base-config:
|
|
539
561
|
documentation_url: https://platform.openai.com/docs/models#gpt-4o
|
|
562
|
+
supports:
|
|
563
|
+
temperature: true
|
|
540
564
|
properties:
|
|
541
565
|
context_window: 128_000
|
|
542
|
-
|
|
566
|
+
max_tokens: 16_384
|
|
543
567
|
training_cutoff: "2023-10"
|
|
544
|
-
class_properties:
|
|
545
|
-
supports_temperature: true
|
|
546
568
|
default_parameters:
|
|
547
569
|
temperature: 1
|
|
548
570
|
|
|
@@ -550,8 +572,9 @@ gpt-4o-models:
|
|
|
550
572
|
label: GPT 4o
|
|
551
573
|
description: GPT-4o is a fast, intelligent, flexible GPT model that accepts text and image inputs and produces text outputs.
|
|
552
574
|
release_date: 2024-08-06
|
|
553
|
-
|
|
554
|
-
|
|
575
|
+
supports:
|
|
576
|
+
images: true
|
|
577
|
+
metadata:
|
|
555
578
|
available_as_evaluator: true
|
|
556
579
|
costs_per_million_token:
|
|
557
580
|
input: 2.5
|
|
@@ -564,9 +587,10 @@ gpt-4o-models:
|
|
|
564
587
|
label: GPT 4o (2024-11-20)
|
|
565
588
|
description: GPT-4o is a fast, intelligent, flexible GPT model that accepts text and image inputs and produces text outputs.
|
|
566
589
|
release_date: 2024-11-20
|
|
567
|
-
|
|
568
|
-
|
|
569
|
-
|
|
590
|
+
supports:
|
|
591
|
+
images: true
|
|
592
|
+
batch: true
|
|
593
|
+
metadata:
|
|
570
594
|
available_as_evaluator: true
|
|
571
595
|
available_for_everyone: false
|
|
572
596
|
costs_per_million_token:
|
|
@@ -580,8 +604,9 @@ gpt-4o-models:
|
|
|
580
604
|
label: GPT 4o (2024-08-06)
|
|
581
605
|
description: GPT-4o is a fast, intelligent, flexible GPT model that accepts text and image inputs and produces text outputs.
|
|
582
606
|
release_date: 2024-08-06
|
|
583
|
-
|
|
584
|
-
|
|
607
|
+
supports:
|
|
608
|
+
images: true
|
|
609
|
+
metadata:
|
|
585
610
|
available_as_evaluator: true
|
|
586
611
|
available_for_everyone: false
|
|
587
612
|
costs_per_million_token:
|
|
@@ -595,8 +620,9 @@ gpt-4o-models:
|
|
|
595
620
|
label: GPT 4o (2024-05-13)
|
|
596
621
|
description: GPT-4o is a fast, intelligent, flexible GPT model that accepts text and image inputs and produces text outputs.
|
|
597
622
|
release_date: 2024-05-13
|
|
598
|
-
|
|
599
|
-
|
|
623
|
+
supports:
|
|
624
|
+
images: true
|
|
625
|
+
metadata:
|
|
600
626
|
available_for_everyone: false
|
|
601
627
|
costs_per_million_token:
|
|
602
628
|
input: 5.0
|
|
@@ -608,12 +634,12 @@ gpt-4o-models:
|
|
|
608
634
|
gpt-4o-mini-models:
|
|
609
635
|
base-config:
|
|
610
636
|
documentation_url: https://platform.openai.com/docs/models#gpt-4o-mini
|
|
637
|
+
supports:
|
|
638
|
+
temperature: true
|
|
611
639
|
properties:
|
|
612
640
|
context_window: 128_000
|
|
613
|
-
|
|
641
|
+
max_tokens: 16_384
|
|
614
642
|
training_cutoff: "2023-10"
|
|
615
|
-
class_properties:
|
|
616
|
-
supports_temperature: true
|
|
617
643
|
default_parameters:
|
|
618
644
|
temperature: 1
|
|
619
645
|
|
|
@@ -621,8 +647,9 @@ gpt-4o-mini-models:
|
|
|
621
647
|
label: GPT 4o Mini
|
|
622
648
|
description: GPT-4o mini is a fast, affordable small model for focused tasks that accepts text and image inputs and produces text outputs.
|
|
623
649
|
release_date: 2024-07-18
|
|
624
|
-
|
|
625
|
-
|
|
650
|
+
supports:
|
|
651
|
+
images: true
|
|
652
|
+
metadata:
|
|
626
653
|
available_as_evaluator: true
|
|
627
654
|
costs_per_million_token:
|
|
628
655
|
input: 0.15
|
|
@@ -635,8 +662,9 @@ gpt-4o-mini-models:
|
|
|
635
662
|
label: GPT 4o Mini
|
|
636
663
|
description: GPT-4o mini is a fast, affordable small model for focused tasks that accepts text and image inputs and produces text outputs.
|
|
637
664
|
release_date: 2024-07-18
|
|
638
|
-
|
|
639
|
-
|
|
665
|
+
supports:
|
|
666
|
+
images: true
|
|
667
|
+
metadata:
|
|
640
668
|
available_as_evaluator: true
|
|
641
669
|
available_for_everyone: false
|
|
642
670
|
costs_per_million_token:
|
|
@@ -651,14 +679,15 @@ gpt-4o-mini-models:
|
|
|
651
679
|
gpt-4-models:
|
|
652
680
|
base-config:
|
|
653
681
|
documentation_url: https://platform.openai.com/docs/models#gpt-4-turbo-and-gpt-4
|
|
682
|
+
supports:
|
|
683
|
+
temperature: true
|
|
684
|
+
metadata:
|
|
685
|
+
available_for_everyone: false
|
|
686
|
+
deprecated: true
|
|
654
687
|
properties:
|
|
655
688
|
context_window: 128_000
|
|
656
|
-
|
|
689
|
+
max_tokens: 4_096
|
|
657
690
|
training_cutoff: "2023-12"
|
|
658
|
-
class_properties:
|
|
659
|
-
available_for_everyone: false
|
|
660
|
-
deprecated: true
|
|
661
|
-
supports_temperature: true
|
|
662
691
|
default_parameters:
|
|
663
692
|
temperature: 1
|
|
664
693
|
|
|
@@ -666,11 +695,12 @@ gpt-4-models:
|
|
|
666
695
|
label: GPT 4 Turbo
|
|
667
696
|
description: GPT-4 Turbo is an older high-intelligence GPT model that accepts text and image inputs and produces text outputs.
|
|
668
697
|
release_date: 2024-04-09
|
|
669
|
-
|
|
698
|
+
supports:
|
|
699
|
+
images: true
|
|
700
|
+
metadata:
|
|
670
701
|
available_as_evaluator: true
|
|
671
702
|
available_for_everyone: false
|
|
672
703
|
deprecated: true
|
|
673
|
-
supports_images: true
|
|
674
704
|
costs_per_million_token:
|
|
675
705
|
input: 10
|
|
676
706
|
output: 30
|
|
@@ -686,8 +716,8 @@ gpt-4-models:
|
|
|
686
716
|
input: 10
|
|
687
717
|
output: 30
|
|
688
718
|
documentation_url: https://platform.openai.com/docs/models/gpt-4-turbo
|
|
689
|
-
|
|
690
|
-
|
|
719
|
+
supports:
|
|
720
|
+
images: true
|
|
691
721
|
alternative_keys:
|
|
692
722
|
- azure/gpt-4-turbo-2024-04-09
|
|
693
723
|
|
|
@@ -722,10 +752,11 @@ gpt-4-models:
|
|
|
722
752
|
label: GPT 4
|
|
723
753
|
description: GPT-4 is an older high-intelligence GPT model for text-only conversations.
|
|
724
754
|
release_date: 2023-06-13
|
|
725
|
-
|
|
755
|
+
metadata:
|
|
726
756
|
deprecated: true
|
|
757
|
+
properties:
|
|
727
758
|
context_window: 8_192
|
|
728
|
-
|
|
759
|
+
max_tokens: 8_192
|
|
729
760
|
training_cutoff: "2021-09"
|
|
730
761
|
costs_per_million_token:
|
|
731
762
|
input: 30
|
|
@@ -737,7 +768,7 @@ gpt-4-models:
|
|
|
737
768
|
label: GPT 4 (2023-06-13)
|
|
738
769
|
properties:
|
|
739
770
|
context_window: 8_192
|
|
740
|
-
|
|
771
|
+
max_tokens: 8_192
|
|
741
772
|
training_cutoff: "2021-09"
|
|
742
773
|
costs_per_million_token:
|
|
743
774
|
input: 30
|
|
@@ -749,7 +780,7 @@ gpt-4-models:
|
|
|
749
780
|
release_date: 2023-03-14
|
|
750
781
|
properties:
|
|
751
782
|
context_window: 8_192
|
|
752
|
-
|
|
783
|
+
max_tokens: 8_192
|
|
753
784
|
training_cutoff: "2021-09"
|
|
754
785
|
costs_per_million_token:
|
|
755
786
|
input: 30
|
|
@@ -758,14 +789,15 @@ gpt-4-models:
|
|
|
758
789
|
gpt-3.5-models:
|
|
759
790
|
base-config:
|
|
760
791
|
documentation_url: https://platform.openai.com/docs/models#gpt-3-5-turbo
|
|
792
|
+
supports:
|
|
793
|
+
temperature: true
|
|
794
|
+
metadata:
|
|
795
|
+
available_for_everyone: false
|
|
796
|
+
deprecated: true
|
|
761
797
|
properties:
|
|
762
798
|
context_window: 16_385
|
|
763
|
-
|
|
799
|
+
max_tokens: 4_096
|
|
764
800
|
training_cutoff: "2021-09"
|
|
765
|
-
class_properties:
|
|
766
|
-
available_for_everyone: false
|
|
767
|
-
deprecated: true
|
|
768
|
-
supports_temperature: true
|
|
769
801
|
default_parameters:
|
|
770
802
|
temperature: 1
|
|
771
803
|
|
|
@@ -773,7 +805,7 @@ gpt-3.5-models:
|
|
|
773
805
|
label: GPT 3.5
|
|
774
806
|
description: GPT-3.5 Turbo is a legacy text-only model for natural language and code conversations.
|
|
775
807
|
release_date: 2023-01-25
|
|
776
|
-
|
|
808
|
+
metadata:
|
|
777
809
|
available_for_everyone: true
|
|
778
810
|
costs_per_million_token:
|
|
779
811
|
input: 0.5
|
|
@@ -804,6 +836,7 @@ gpt-3.5-models:
|
|
|
804
836
|
release_date: 2022-11-06
|
|
805
837
|
properties:
|
|
806
838
|
context_window: 4_096
|
|
839
|
+
max_tokens: 4_096
|
|
807
840
|
costs_per_million_token:
|
|
808
841
|
input: 1.5
|
|
809
842
|
output: 2.0
|
|
@@ -819,9 +852,9 @@ databricks-models:
|
|
|
819
852
|
release_date: 2024-03-27
|
|
820
853
|
properties:
|
|
821
854
|
context_window: 32_768
|
|
822
|
-
|
|
855
|
+
max_tokens: 4_096
|
|
823
856
|
training_cutoff: "2023-12"
|
|
824
|
-
|
|
857
|
+
metadata:
|
|
825
858
|
available_for_everyone: false
|
|
826
859
|
deprecated: true
|
|
827
860
|
costs_per_million_token:
|