llm.rb 11.3.1 → 12.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (57) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +242 -1
  3. data/LICENSE +92 -17
  4. data/README.md +204 -623
  5. data/data/anthropic.json +433 -249
  6. data/data/bedrock.json +2097 -1055
  7. data/data/deepinfra.json +993 -0
  8. data/data/deepseek.json +53 -28
  9. data/data/google.json +389 -771
  10. data/data/openai.json +1053 -771
  11. data/data/xai.json +133 -292
  12. data/data/zai.json +249 -141
  13. data/lib/llm/active_record/acts_as_agent.rb +3 -41
  14. data/lib/llm/active_record/acts_as_llm.rb +18 -0
  15. data/lib/llm/active_record.rb +3 -3
  16. data/lib/llm/context.rb +9 -5
  17. data/lib/llm/contract/completion.rb +2 -2
  18. data/lib/llm/provider.rb +2 -2
  19. data/lib/llm/providers/deepinfra/audio.rb +66 -0
  20. data/lib/llm/providers/deepinfra/images.rb +90 -0
  21. data/lib/llm/providers/deepinfra/response_adapter.rb +36 -0
  22. data/lib/llm/providers/deepinfra.rb +100 -0
  23. data/lib/llm/providers/deepseek/images.rb +109 -0
  24. data/lib/llm/providers/deepseek/request_adapter.rb +32 -0
  25. data/lib/llm/providers/deepseek/response_adapter/image.rb +9 -0
  26. data/lib/llm/providers/deepseek/response_adapter.rb +29 -0
  27. data/lib/llm/providers/deepseek.rb +4 -2
  28. data/lib/llm/providers/google/request_adapter.rb +22 -5
  29. data/lib/llm/providers/google.rb +4 -4
  30. data/lib/llm/providers/openai/audio.rb +6 -2
  31. data/lib/llm/providers/openai/images.rb +9 -50
  32. data/lib/llm/providers/openai/request_adapter/respond.rb +38 -4
  33. data/lib/llm/providers/openai/response_adapter/audio.rb +5 -1
  34. data/lib/llm/providers/openai/response_adapter/completion.rb +1 -1
  35. data/lib/llm/providers/openai/response_adapter/image.rb +0 -4
  36. data/lib/llm/providers/openai/responses.rb +1 -0
  37. data/lib/llm/providers/openai/stream_parser.rb +5 -6
  38. data/lib/llm/providers/openai.rb +2 -2
  39. data/lib/llm/providers/xai/images.rb +49 -26
  40. data/lib/llm/providers/xai.rb +2 -2
  41. data/lib/llm/response.rb +10 -0
  42. data/lib/llm/schema/leaf.rb +7 -1
  43. data/lib/llm/schema/renderer.rb +121 -0
  44. data/lib/llm/schema.rb +30 -0
  45. data/lib/llm/sequel/agent.rb +2 -43
  46. data/lib/llm/sequel/plugin.rb +25 -7
  47. data/lib/llm/tracer/telemetry.rb +4 -6
  48. data/lib/llm/tracer.rb +9 -21
  49. data/lib/llm/transport/execution.rb +16 -1
  50. data/lib/llm/transport/net_http_adapter.rb +1 -1
  51. data/lib/llm/uridata.rb +16 -0
  52. data/lib/llm/version.rb +1 -1
  53. data/lib/llm.rb +9 -0
  54. data/llm.gemspec +5 -18
  55. data/resources/deepdive.md +798 -264
  56. metadata +15 -18
  57. data/lib/llm/tracer/langsmith.rb +0 -144
@@ -0,0 +1,993 @@
1
+ {
2
+ "id": "deepinfra",
3
+ "env": [
4
+ "DEEPINFRA_API_KEY"
5
+ ],
6
+ "npm": "@ai-sdk/deepinfra",
7
+ "name": "Deep Infra",
8
+ "doc": "https://deepinfra.com/models",
9
+ "models": {
10
+ "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": {
11
+ "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
12
+ "name": "Llama 4 Maverick 17B FP8",
13
+ "family": "llama",
14
+ "attachment": false,
15
+ "reasoning": false,
16
+ "tool_call": false,
17
+ "release_date": "2025-04-05",
18
+ "last_updated": "2025-04-05",
19
+ "modalities": {
20
+ "input": [
21
+ "text",
22
+ "image"
23
+ ],
24
+ "output": [
25
+ "text"
26
+ ]
27
+ },
28
+ "open_weights": true,
29
+ "limit": {
30
+ "context": 1048576,
31
+ "output": 16384
32
+ },
33
+ "cost": {
34
+ "input": 0.15,
35
+ "output": 0.6
36
+ }
37
+ },
38
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct": {
39
+ "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct",
40
+ "name": "Llama 4 Scout 17B",
41
+ "family": "llama",
42
+ "attachment": false,
43
+ "reasoning": false,
44
+ "tool_call": true,
45
+ "release_date": "2025-04-05",
46
+ "last_updated": "2025-04-05",
47
+ "modalities": {
48
+ "input": [
49
+ "text",
50
+ "image"
51
+ ],
52
+ "output": [
53
+ "text"
54
+ ]
55
+ },
56
+ "open_weights": true,
57
+ "limit": {
58
+ "context": 327680,
59
+ "output": 16384
60
+ },
61
+ "cost": {
62
+ "input": 0.1,
63
+ "output": 0.3
64
+ }
65
+ },
66
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
67
+ "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo",
68
+ "name": "Llama 3.3 70B Turbo",
69
+ "family": "llama",
70
+ "attachment": false,
71
+ "reasoning": false,
72
+ "tool_call": true,
73
+ "release_date": "2024-12-06",
74
+ "last_updated": "2024-12-06",
75
+ "modalities": {
76
+ "input": [
77
+ "text"
78
+ ],
79
+ "output": [
80
+ "text"
81
+ ]
82
+ },
83
+ "open_weights": true,
84
+ "limit": {
85
+ "context": 131072,
86
+ "output": 16384
87
+ },
88
+ "cost": {
89
+ "input": 0.1,
90
+ "output": 0.32
91
+ }
92
+ },
93
+ "moonshotai/Kimi-K2.6": {
94
+ "id": "moonshotai/Kimi-K2.6",
95
+ "name": "Kimi K2.6",
96
+ "family": "kimi-k2",
97
+ "attachment": true,
98
+ "reasoning": true,
99
+ "reasoning_options": [
100
+ {
101
+ "type": "toggle"
102
+ }
103
+ ],
104
+ "tool_call": true,
105
+ "interleaved": {
106
+ "field": "reasoning_content"
107
+ },
108
+ "structured_output": true,
109
+ "temperature": true,
110
+ "knowledge": "2024-04",
111
+ "release_date": "2026-04-21",
112
+ "last_updated": "2026-04-21",
113
+ "modalities": {
114
+ "input": [
115
+ "text",
116
+ "image",
117
+ "video"
118
+ ],
119
+ "output": [
120
+ "text"
121
+ ]
122
+ },
123
+ "open_weights": true,
124
+ "limit": {
125
+ "context": 262144,
126
+ "output": 16384
127
+ },
128
+ "cost": {
129
+ "input": 0.75,
130
+ "output": 3.5,
131
+ "cache_read": 0.15
132
+ }
133
+ },
134
+ "moonshotai/Kimi-K2.5": {
135
+ "id": "moonshotai/Kimi-K2.5",
136
+ "name": "Kimi K2.5",
137
+ "family": "kimi-k2",
138
+ "attachment": true,
139
+ "reasoning": true,
140
+ "reasoning_options": [
141
+ {
142
+ "type": "toggle"
143
+ }
144
+ ],
145
+ "tool_call": true,
146
+ "interleaved": {
147
+ "field": "reasoning_content"
148
+ },
149
+ "structured_output": true,
150
+ "temperature": true,
151
+ "knowledge": "2025-01",
152
+ "release_date": "2026-01-27",
153
+ "last_updated": "2026-01-27",
154
+ "modalities": {
155
+ "input": [
156
+ "text",
157
+ "image",
158
+ "video"
159
+ ],
160
+ "output": [
161
+ "text"
162
+ ]
163
+ },
164
+ "open_weights": true,
165
+ "limit": {
166
+ "context": 262144,
167
+ "output": 32768
168
+ },
169
+ "cost": {
170
+ "input": 0.45,
171
+ "output": 2.25,
172
+ "cache_read": 0.07
173
+ }
174
+ },
175
+ "google/gemma-4-31B-it": {
176
+ "id": "google/gemma-4-31B-it",
177
+ "name": "Gemma 4 31B IT",
178
+ "family": "gemma",
179
+ "attachment": true,
180
+ "reasoning": true,
181
+ "reasoning_options": [
182
+ {
183
+ "type": "toggle"
184
+ }
185
+ ],
186
+ "tool_call": true,
187
+ "structured_output": true,
188
+ "temperature": true,
189
+ "release_date": "2026-04-02",
190
+ "last_updated": "2026-04-02",
191
+ "modalities": {
192
+ "input": [
193
+ "text",
194
+ "image"
195
+ ],
196
+ "output": [
197
+ "text"
198
+ ]
199
+ },
200
+ "open_weights": true,
201
+ "limit": {
202
+ "context": 262144,
203
+ "output": 32768
204
+ },
205
+ "cost": {
206
+ "input": 0.13,
207
+ "output": 0.38
208
+ }
209
+ },
210
+ "google/gemma-4-26B-A4B-it": {
211
+ "id": "google/gemma-4-26B-A4B-it",
212
+ "name": "Gemma 4 26B A4B IT",
213
+ "family": "gemma",
214
+ "attachment": true,
215
+ "reasoning": true,
216
+ "reasoning_options": [
217
+ {
218
+ "type": "toggle"
219
+ }
220
+ ],
221
+ "tool_call": true,
222
+ "structured_output": true,
223
+ "temperature": true,
224
+ "release_date": "2026-04-02",
225
+ "last_updated": "2026-04-02",
226
+ "modalities": {
227
+ "input": [
228
+ "text",
229
+ "image"
230
+ ],
231
+ "output": [
232
+ "text"
233
+ ]
234
+ },
235
+ "open_weights": true,
236
+ "limit": {
237
+ "context": 262144,
238
+ "output": 32768
239
+ },
240
+ "cost": {
241
+ "input": 0.07,
242
+ "output": 0.34
243
+ }
244
+ },
245
+ "Qwen/Qwen3.6-35B-A3B": {
246
+ "id": "Qwen/Qwen3.6-35B-A3B",
247
+ "name": "Qwen3.6 35B A3B",
248
+ "family": "qwen",
249
+ "attachment": true,
250
+ "reasoning": true,
251
+ "reasoning_options": [],
252
+ "tool_call": true,
253
+ "temperature": true,
254
+ "release_date": "2026-04-01",
255
+ "last_updated": "2026-04-01",
256
+ "modalities": {
257
+ "input": [
258
+ "text",
259
+ "image",
260
+ "video"
261
+ ],
262
+ "output": [
263
+ "text"
264
+ ]
265
+ },
266
+ "open_weights": true,
267
+ "limit": {
268
+ "context": 262144,
269
+ "output": 81920
270
+ },
271
+ "cost": {
272
+ "input": 0.15,
273
+ "output": 0.95
274
+ }
275
+ },
276
+ "Qwen/Qwen3.5-397B-A17B": {
277
+ "id": "Qwen/Qwen3.5-397B-A17B",
278
+ "name": "Qwen 3.5 397B A17B",
279
+ "family": "qwen",
280
+ "attachment": true,
281
+ "reasoning": true,
282
+ "reasoning_options": [],
283
+ "tool_call": true,
284
+ "temperature": true,
285
+ "knowledge": "2025-01",
286
+ "release_date": "2026-02-01",
287
+ "last_updated": "2026-04-20",
288
+ "modalities": {
289
+ "input": [
290
+ "text",
291
+ "image",
292
+ "video"
293
+ ],
294
+ "output": [
295
+ "text"
296
+ ]
297
+ },
298
+ "open_weights": true,
299
+ "limit": {
300
+ "context": 262144,
301
+ "output": 81920
302
+ },
303
+ "cost": {
304
+ "input": 0.45,
305
+ "output": 3,
306
+ "cache_read": 0.22
307
+ }
308
+ },
309
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo": {
310
+ "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
311
+ "name": "Qwen3 Coder 480B A35B Instruct Turbo",
312
+ "family": "qwen",
313
+ "attachment": false,
314
+ "reasoning": false,
315
+ "tool_call": true,
316
+ "temperature": true,
317
+ "knowledge": "2025-04",
318
+ "release_date": "2025-07-23",
319
+ "last_updated": "2025-07-23",
320
+ "modalities": {
321
+ "input": [
322
+ "text"
323
+ ],
324
+ "output": [
325
+ "text"
326
+ ]
327
+ },
328
+ "open_weights": true,
329
+ "limit": {
330
+ "context": 262144,
331
+ "output": 66536
332
+ },
333
+ "cost": {
334
+ "input": 0.3,
335
+ "output": 1
336
+ }
337
+ },
338
+ "Qwen/Qwen3.5-35B-A3B": {
339
+ "id": "Qwen/Qwen3.5-35B-A3B",
340
+ "name": "Qwen 3.5 35B A3B",
341
+ "family": "qwen",
342
+ "attachment": true,
343
+ "reasoning": true,
344
+ "reasoning_options": [],
345
+ "tool_call": true,
346
+ "temperature": true,
347
+ "knowledge": "2025-01",
348
+ "release_date": "2026-02-01",
349
+ "last_updated": "2026-04-20",
350
+ "modalities": {
351
+ "input": [
352
+ "text",
353
+ "image",
354
+ "video"
355
+ ],
356
+ "output": [
357
+ "text"
358
+ ]
359
+ },
360
+ "open_weights": true,
361
+ "limit": {
362
+ "context": 262144,
363
+ "output": 81920
364
+ },
365
+ "cost": {
366
+ "input": 0.14,
367
+ "output": 1,
368
+ "cache_read": 0.05
369
+ }
370
+ },
371
+ "openai/gpt-oss-120b": {
372
+ "id": "openai/gpt-oss-120b",
373
+ "name": "GPT OSS 120B",
374
+ "family": "gpt-oss",
375
+ "attachment": false,
376
+ "reasoning": true,
377
+ "reasoning_options": [
378
+ {
379
+ "type": "effort",
380
+ "values": [
381
+ "low",
382
+ "medium",
383
+ "high"
384
+ ]
385
+ }
386
+ ],
387
+ "tool_call": true,
388
+ "temperature": true,
389
+ "release_date": "2025-08-05",
390
+ "last_updated": "2025-08-05",
391
+ "modalities": {
392
+ "input": [
393
+ "text"
394
+ ],
395
+ "output": [
396
+ "text"
397
+ ]
398
+ },
399
+ "open_weights": true,
400
+ "limit": {
401
+ "context": 131072,
402
+ "output": 16384
403
+ },
404
+ "cost": {
405
+ "input": 0.039,
406
+ "output": 0.19
407
+ }
408
+ },
409
+ "openai/gpt-oss-20b": {
410
+ "id": "openai/gpt-oss-20b",
411
+ "name": "GPT OSS 20B",
412
+ "family": "gpt-oss",
413
+ "attachment": false,
414
+ "reasoning": true,
415
+ "reasoning_options": [
416
+ {
417
+ "type": "effort",
418
+ "values": [
419
+ "low",
420
+ "medium",
421
+ "high"
422
+ ]
423
+ }
424
+ ],
425
+ "tool_call": true,
426
+ "temperature": true,
427
+ "release_date": "2025-08-05",
428
+ "last_updated": "2025-08-05",
429
+ "modalities": {
430
+ "input": [
431
+ "text"
432
+ ],
433
+ "output": [
434
+ "text"
435
+ ]
436
+ },
437
+ "open_weights": true,
438
+ "limit": {
439
+ "context": 131072,
440
+ "output": 16384
441
+ },
442
+ "cost": {
443
+ "input": 0.03,
444
+ "output": 0.14
445
+ }
446
+ },
447
+ "XiaomiMiMo/MiMo-V2.5": {
448
+ "id": "XiaomiMiMo/MiMo-V2.5",
449
+ "name": "MiMo-V2.5",
450
+ "family": "mimo",
451
+ "attachment": true,
452
+ "reasoning": true,
453
+ "reasoning_options": [
454
+ {
455
+ "type": "toggle"
456
+ }
457
+ ],
458
+ "tool_call": true,
459
+ "interleaved": {
460
+ "field": "reasoning_content"
461
+ },
462
+ "temperature": true,
463
+ "knowledge": "2024-12",
464
+ "release_date": "2026-04-22",
465
+ "last_updated": "2026-04-22",
466
+ "modalities": {
467
+ "input": [
468
+ "text",
469
+ "image",
470
+ "audio",
471
+ "video"
472
+ ],
473
+ "output": [
474
+ "text"
475
+ ]
476
+ },
477
+ "open_weights": true,
478
+ "limit": {
479
+ "context": 262144,
480
+ "output": 16384
481
+ },
482
+ "cost": {
483
+ "input": 0.4,
484
+ "output": 2,
485
+ "cache_read": 0.08,
486
+ "tiers": [
487
+ {
488
+ "input": 0.8,
489
+ "output": 4,
490
+ "cache_read": 0.16,
491
+ "tier": {
492
+ "type": "context",
493
+ "size": 256000
494
+ }
495
+ }
496
+ ],
497
+ "context_over_200k": {
498
+ "input": 0.8,
499
+ "output": 4,
500
+ "cache_read": 0.16
501
+ }
502
+ }
503
+ },
504
+ "XiaomiMiMo/MiMo-V2.5-Pro": {
505
+ "id": "XiaomiMiMo/MiMo-V2.5-Pro",
506
+ "name": "MiMo-V2.5-Pro",
507
+ "family": "mimo",
508
+ "attachment": false,
509
+ "reasoning": true,
510
+ "reasoning_options": [
511
+ {
512
+ "type": "toggle"
513
+ }
514
+ ],
515
+ "tool_call": true,
516
+ "interleaved": {
517
+ "field": "reasoning_content"
518
+ },
519
+ "temperature": true,
520
+ "knowledge": "2024-12",
521
+ "release_date": "2026-04-22",
522
+ "last_updated": "2026-04-22",
523
+ "modalities": {
524
+ "input": [
525
+ "text"
526
+ ],
527
+ "output": [
528
+ "text"
529
+ ]
530
+ },
531
+ "open_weights": true,
532
+ "limit": {
533
+ "context": 1048576,
534
+ "output": 16384
535
+ },
536
+ "cost": {
537
+ "input": 1,
538
+ "output": 3,
539
+ "cache_read": 0.2,
540
+ "tiers": [
541
+ {
542
+ "input": 2,
543
+ "output": 6,
544
+ "cache_read": 0.4,
545
+ "tier": {
546
+ "type": "context",
547
+ "size": 256000
548
+ }
549
+ }
550
+ ],
551
+ "context_over_200k": {
552
+ "input": 2,
553
+ "output": 6,
554
+ "cache_read": 0.4
555
+ }
556
+ }
557
+ },
558
+ "zai-org/GLM-4.7-Flash": {
559
+ "id": "zai-org/GLM-4.7-Flash",
560
+ "name": "GLM-4.7-Flash",
561
+ "family": "glm-flash",
562
+ "attachment": false,
563
+ "reasoning": true,
564
+ "reasoning_options": [],
565
+ "tool_call": true,
566
+ "interleaved": {
567
+ "field": "reasoning_content"
568
+ },
569
+ "temperature": true,
570
+ "knowledge": "2025-04",
571
+ "release_date": "2026-01-19",
572
+ "last_updated": "2026-01-19",
573
+ "modalities": {
574
+ "input": [
575
+ "text"
576
+ ],
577
+ "output": [
578
+ "text"
579
+ ]
580
+ },
581
+ "open_weights": true,
582
+ "limit": {
583
+ "context": 202752,
584
+ "output": 16384
585
+ },
586
+ "cost": {
587
+ "input": 0.06,
588
+ "output": 0.4
589
+ }
590
+ },
591
+ "zai-org/GLM-4.6": {
592
+ "id": "zai-org/GLM-4.6",
593
+ "name": "GLM-4.6",
594
+ "family": "glm",
595
+ "attachment": false,
596
+ "reasoning": true,
597
+ "reasoning_options": [
598
+ {
599
+ "type": "toggle"
600
+ }
601
+ ],
602
+ "tool_call": true,
603
+ "interleaved": {
604
+ "field": "reasoning_content"
605
+ },
606
+ "temperature": true,
607
+ "knowledge": "2025-04",
608
+ "release_date": "2025-09-30",
609
+ "last_updated": "2025-09-30",
610
+ "modalities": {
611
+ "input": [
612
+ "text"
613
+ ],
614
+ "output": [
615
+ "text"
616
+ ]
617
+ },
618
+ "open_weights": true,
619
+ "limit": {
620
+ "context": 202752,
621
+ "output": 131072
622
+ },
623
+ "cost": {
624
+ "input": 0.43,
625
+ "output": 1.74,
626
+ "cache_read": 0.08
627
+ }
628
+ },
629
+ "zai-org/GLM-5": {
630
+ "id": "zai-org/GLM-5",
631
+ "name": "GLM-5",
632
+ "family": "glm",
633
+ "attachment": false,
634
+ "reasoning": true,
635
+ "reasoning_options": [
636
+ {
637
+ "type": "toggle"
638
+ }
639
+ ],
640
+ "tool_call": true,
641
+ "interleaved": {
642
+ "field": "reasoning_content"
643
+ },
644
+ "temperature": true,
645
+ "knowledge": "2025-12",
646
+ "release_date": "2026-02-12",
647
+ "last_updated": "2026-02-12",
648
+ "modalities": {
649
+ "input": [
650
+ "text"
651
+ ],
652
+ "output": [
653
+ "text"
654
+ ]
655
+ },
656
+ "open_weights": true,
657
+ "limit": {
658
+ "context": 202752,
659
+ "output": 16384
660
+ },
661
+ "cost": {
662
+ "input": 0.6,
663
+ "output": 2.08,
664
+ "cache_read": 0.12
665
+ }
666
+ },
667
+ "zai-org/GLM-4.7": {
668
+ "id": "zai-org/GLM-4.7",
669
+ "name": "GLM-4.7",
670
+ "family": "glm",
671
+ "attachment": false,
672
+ "reasoning": true,
673
+ "reasoning_options": [
674
+ {
675
+ "type": "toggle"
676
+ }
677
+ ],
678
+ "tool_call": true,
679
+ "interleaved": {
680
+ "field": "reasoning_content"
681
+ },
682
+ "temperature": true,
683
+ "knowledge": "2025-04",
684
+ "release_date": "2025-12-22",
685
+ "last_updated": "2025-12-22",
686
+ "modalities": {
687
+ "input": [
688
+ "text"
689
+ ],
690
+ "output": [
691
+ "text"
692
+ ]
693
+ },
694
+ "open_weights": true,
695
+ "limit": {
696
+ "context": 202752,
697
+ "output": 16384
698
+ },
699
+ "cost": {
700
+ "input": 0.4,
701
+ "output": 1.75,
702
+ "cache_read": 0.08
703
+ }
704
+ },
705
+ "zai-org/GLM-5.2": {
706
+ "id": "zai-org/GLM-5.2",
707
+ "name": "GLM-5.2",
708
+ "family": "glm",
709
+ "attachment": false,
710
+ "reasoning": true,
711
+ "reasoning_options": [
712
+ {
713
+ "type": "toggle"
714
+ },
715
+ {
716
+ "type": "effort",
717
+ "values": [
718
+ "low",
719
+ "medium",
720
+ "high",
721
+ "xhigh"
722
+ ]
723
+ }
724
+ ],
725
+ "tool_call": true,
726
+ "interleaved": {
727
+ "field": "reasoning_content"
728
+ },
729
+ "structured_output": true,
730
+ "temperature": true,
731
+ "release_date": "2026-06-13",
732
+ "last_updated": "2026-06-13",
733
+ "modalities": {
734
+ "input": [
735
+ "text"
736
+ ],
737
+ "output": [
738
+ "text"
739
+ ]
740
+ },
741
+ "open_weights": true,
742
+ "limit": {
743
+ "context": 1048576,
744
+ "output": 32768
745
+ },
746
+ "cost": {
747
+ "input": 0.95,
748
+ "output": 3,
749
+ "cache_read": 0.18
750
+ }
751
+ },
752
+ "zai-org/GLM-5.1": {
753
+ "id": "zai-org/GLM-5.1",
754
+ "name": "GLM-5.1",
755
+ "family": "glm",
756
+ "attachment": false,
757
+ "reasoning": true,
758
+ "reasoning_options": [
759
+ {
760
+ "type": "toggle"
761
+ }
762
+ ],
763
+ "tool_call": true,
764
+ "interleaved": {
765
+ "field": "reasoning_content"
766
+ },
767
+ "structured_output": true,
768
+ "temperature": true,
769
+ "knowledge": "2025-04",
770
+ "release_date": "2026-04-07",
771
+ "last_updated": "2026-04-07",
772
+ "modalities": {
773
+ "input": [
774
+ "text"
775
+ ],
776
+ "output": [
777
+ "text"
778
+ ]
779
+ },
780
+ "open_weights": true,
781
+ "limit": {
782
+ "context": 202752,
783
+ "output": 16384
784
+ },
785
+ "cost": {
786
+ "input": 1.05,
787
+ "output": 3.5,
788
+ "cache_read": 0.205
789
+ }
790
+ },
791
+ "deepseek-ai/DeepSeek-R1-0528": {
792
+ "id": "deepseek-ai/DeepSeek-R1-0528",
793
+ "name": "DeepSeek-R1-0528",
794
+ "attachment": false,
795
+ "reasoning": true,
796
+ "reasoning_options": [],
797
+ "tool_call": true,
798
+ "interleaved": {
799
+ "field": "reasoning_content"
800
+ },
801
+ "temperature": true,
802
+ "knowledge": "2024-07",
803
+ "release_date": "2025-05-28",
804
+ "last_updated": "2025-05-28",
805
+ "modalities": {
806
+ "input": [
807
+ "text"
808
+ ],
809
+ "output": [
810
+ "text"
811
+ ]
812
+ },
813
+ "open_weights": false,
814
+ "limit": {
815
+ "context": 163840,
816
+ "output": 64000
817
+ },
818
+ "cost": {
819
+ "input": 0.5,
820
+ "output": 2.15,
821
+ "cache_read": 0.35
822
+ }
823
+ },
824
+ "deepseek-ai/DeepSeek-V4-Flash": {
825
+ "id": "deepseek-ai/DeepSeek-V4-Flash",
826
+ "name": "DeepSeek V4 Flash",
827
+ "family": "deepseek-flash",
828
+ "attachment": false,
829
+ "reasoning": true,
830
+ "reasoning_options": [
831
+ {
832
+ "type": "toggle"
833
+ },
834
+ {
835
+ "type": "effort",
836
+ "values": [
837
+ "low",
838
+ "medium",
839
+ "high",
840
+ "xhigh"
841
+ ]
842
+ }
843
+ ],
844
+ "tool_call": true,
845
+ "interleaved": {
846
+ "field": "reasoning_content"
847
+ },
848
+ "structured_output": true,
849
+ "temperature": true,
850
+ "knowledge": "2025-05",
851
+ "release_date": "2026-04-24",
852
+ "last_updated": "2026-04-24",
853
+ "modalities": {
854
+ "input": [
855
+ "text"
856
+ ],
857
+ "output": [
858
+ "text"
859
+ ]
860
+ },
861
+ "open_weights": true,
862
+ "limit": {
863
+ "context": 1048576,
864
+ "output": 16384
865
+ },
866
+ "cost": {
867
+ "input": 0.1,
868
+ "output": 0.2,
869
+ "cache_read": 0.02
870
+ }
871
+ },
872
+ "deepseek-ai/DeepSeek-V4-Pro": {
873
+ "id": "deepseek-ai/DeepSeek-V4-Pro",
874
+ "name": "DeepSeek V4 Pro",
875
+ "family": "deepseek-thinking",
876
+ "attachment": false,
877
+ "reasoning": true,
878
+ "reasoning_options": [
879
+ {
880
+ "type": "toggle"
881
+ },
882
+ {
883
+ "type": "effort",
884
+ "values": [
885
+ "low",
886
+ "medium",
887
+ "high",
888
+ "xhigh"
889
+ ]
890
+ }
891
+ ],
892
+ "tool_call": true,
893
+ "interleaved": {
894
+ "field": "reasoning_content"
895
+ },
896
+ "structured_output": true,
897
+ "temperature": true,
898
+ "knowledge": "2025-05",
899
+ "release_date": "2026-04-24",
900
+ "last_updated": "2026-04-24",
901
+ "modalities": {
902
+ "input": [
903
+ "text"
904
+ ],
905
+ "output": [
906
+ "text"
907
+ ]
908
+ },
909
+ "open_weights": true,
910
+ "limit": {
911
+ "context": 1048576,
912
+ "output": 16384
913
+ },
914
+ "cost": {
915
+ "input": 1.3,
916
+ "output": 2.6,
917
+ "cache_read": 0.1
918
+ }
919
+ },
920
+ "deepseek-ai/DeepSeek-V3.2": {
921
+ "id": "deepseek-ai/DeepSeek-V3.2",
922
+ "name": "DeepSeek-V3.2",
923
+ "attachment": false,
924
+ "reasoning": true,
925
+ "reasoning_options": [
926
+ {
927
+ "type": "toggle"
928
+ }
929
+ ],
930
+ "tool_call": true,
931
+ "interleaved": {
932
+ "field": "reasoning_content"
933
+ },
934
+ "temperature": true,
935
+ "knowledge": "2024-12",
936
+ "release_date": "2025-12-02",
937
+ "last_updated": "2025-12-02",
938
+ "modalities": {
939
+ "input": [
940
+ "text"
941
+ ],
942
+ "output": [
943
+ "text"
944
+ ]
945
+ },
946
+ "open_weights": false,
947
+ "limit": {
948
+ "context": 163840,
949
+ "output": 64000
950
+ },
951
+ "cost": {
952
+ "input": 0.26,
953
+ "output": 0.38,
954
+ "cache_read": 0.13
955
+ }
956
+ },
957
+ "MiniMaxAI/MiniMax-M2.5": {
958
+ "id": "MiniMaxAI/MiniMax-M2.5",
959
+ "name": "MiniMax M2.5",
960
+ "family": "minimax",
961
+ "attachment": false,
962
+ "reasoning": true,
963
+ "reasoning_options": [],
964
+ "tool_call": true,
965
+ "interleaved": {
966
+ "field": "reasoning_content"
967
+ },
968
+ "temperature": true,
969
+ "knowledge": "2025-06",
970
+ "release_date": "2026-02-12",
971
+ "last_updated": "2026-02-12",
972
+ "modalities": {
973
+ "input": [
974
+ "text"
975
+ ],
976
+ "output": [
977
+ "text"
978
+ ]
979
+ },
980
+ "open_weights": true,
981
+ "limit": {
982
+ "context": 196608,
983
+ "output": 131072
984
+ },
985
+ "cost": {
986
+ "input": 0.15,
987
+ "output": 1.15,
988
+ "cache_read": 0.03,
989
+ "cache_write": 0.375
990
+ }
991
+ }
992
+ }
993
+ }