@openinference/cli 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47) hide show
  1. package/data/models.json +1259 -0
  2. package/dist/chat-repl.d.ts +3 -0
  3. package/dist/chat-repl.d.ts.map +1 -0
  4. package/dist/chat-repl.js +35 -0
  5. package/dist/chat-repl.js.map +1 -0
  6. package/dist/chat.d.ts +9 -0
  7. package/dist/chat.d.ts.map +1 -0
  8. package/dist/chat.js +51 -0
  9. package/dist/chat.js.map +1 -0
  10. package/dist/config.d.ts +11 -0
  11. package/dist/config.d.ts.map +1 -0
  12. package/dist/config.js +32 -0
  13. package/dist/config.js.map +1 -0
  14. package/dist/data/models.json +1259 -0
  15. package/dist/hardware.d.ts +13 -0
  16. package/dist/hardware.d.ts.map +1 -0
  17. package/dist/hardware.js +61 -0
  18. package/dist/hardware.js.map +1 -0
  19. package/dist/index.d.ts +3 -0
  20. package/dist/index.d.ts.map +1 -0
  21. package/dist/index.js +153 -0
  22. package/dist/index.js.map +1 -0
  23. package/dist/ollama.d.ts +14 -0
  24. package/dist/ollama.d.ts.map +1 -0
  25. package/dist/ollama.js +189 -0
  26. package/dist/ollama.js.map +1 -0
  27. package/dist/prompt.d.ts +4 -0
  28. package/dist/prompt.d.ts.map +1 -0
  29. package/dist/prompt.js +44 -0
  30. package/dist/prompt.js.map +1 -0
  31. package/dist/recommend-run.d.ts +9 -0
  32. package/dist/recommend-run.d.ts.map +1 -0
  33. package/dist/recommend-run.js +34 -0
  34. package/dist/recommend-run.js.map +1 -0
  35. package/dist/recommend.d.ts +20 -0
  36. package/dist/recommend.d.ts.map +1 -0
  37. package/dist/recommend.js +71 -0
  38. package/dist/recommend.js.map +1 -0
  39. package/dist/setup.d.ts +13 -0
  40. package/dist/setup.d.ts.map +1 -0
  41. package/dist/setup.js +119 -0
  42. package/dist/setup.js.map +1 -0
  43. package/dist/start.d.ts +13 -0
  44. package/dist/start.d.ts.map +1 -0
  45. package/dist/start.js +32 -0
  46. package/dist/start.js.map +1 -0
  47. package/package.json +33 -0
@@ -0,0 +1,1259 @@
1
+ [
2
+ {
3
+ "id": "smollm2:135m",
4
+ "name": "SmolLM2 135M",
5
+ "ramGb": 0.4,
6
+ "sizeMb": 190,
7
+ "quality": 45,
8
+ "useCase": "classification, tags",
9
+ "verified": true
10
+ },
11
+ {
12
+ "id": "smollm2:360m",
13
+ "name": "SmolLM2 360M",
14
+ "ramGb": 0.5,
15
+ "sizeMb": 307,
16
+ "quality": 50,
17
+ "useCase": "light tasks",
18
+ "verified": true
19
+ },
20
+ {
21
+ "id": "qwen2.5:0.5b",
22
+ "name": "Qwen 2.5 0.5B",
23
+ "ramGb": 0.6,
24
+ "sizeMb": 380,
25
+ "quality": 52,
26
+ "useCase": "fast labels",
27
+ "verified": true
28
+ },
29
+ {
30
+ "id": "tinyllama",
31
+ "name": "TinyLlama 1.1B",
32
+ "ramGb": 1.1,
33
+ "sizeMb": 772,
34
+ "quality": 48,
35
+ "useCase": "tiny chat",
36
+ "verified": true
37
+ },
38
+ {
39
+ "id": "tinydolphin",
40
+ "name": "TinyDolphin 1.5B",
41
+ "ramGb": 1.3,
42
+ "sizeMb": 980,
43
+ "quality": 55,
44
+ "useCase": "uncensored small"
45
+ },
46
+ {
47
+ "id": "stablelm2:1.6b",
48
+ "name": "StableLM2 1.6B",
49
+ "ramGb": 1.4,
50
+ "sizeMb": 1032,
51
+ "quality": 54,
52
+ "useCase": "chat"
53
+ },
54
+ {
55
+ "id": "olmo2:1b",
56
+ "name": "OLMo 2 1B",
57
+ "ramGb": 1.1,
58
+ "sizeMb": 720,
59
+ "quality": 56,
60
+ "useCase": "research chat"
61
+ },
62
+ {
63
+ "id": "granite3-dense:2b",
64
+ "name": "Granite 3 Dense 2B",
65
+ "ramGb": 1.6,
66
+ "sizeMb": 1240,
67
+ "quality": 73,
68
+ "useCase": "enterprise chat"
69
+ },
70
+ {
71
+ "id": "gemma3:1b",
72
+ "name": "Gemma 3 1B",
73
+ "ramGb": 1.1,
74
+ "sizeMb": 720,
75
+ "quality": 68,
76
+ "useCase": "chat, general",
77
+ "verified": true
78
+ },
79
+ {
80
+ "id": "llama3.2:1b",
81
+ "name": "Llama 3.2 1B",
82
+ "ramGb": 1.1,
83
+ "sizeMb": 720,
84
+ "quality": 66,
85
+ "useCase": "instructions",
86
+ "verified": true
87
+ },
88
+ {
89
+ "id": "llama3.2:1b-instruct-q8_0",
90
+ "name": "Llama 3.2 1B Q8",
91
+ "ramGb": 1.1,
92
+ "sizeMb": 720,
93
+ "quality": 67,
94
+ "useCase": "precise small"
95
+ },
96
+ {
97
+ "id": "qwen2.5:1.5b",
98
+ "name": "Qwen 2.5 1.5B",
99
+ "ramGb": 1.3,
100
+ "sizeMb": 980,
101
+ "quality": 70,
102
+ "useCase": "JSON, chat",
103
+ "verified": true
104
+ },
105
+ {
106
+ "id": "deepseek-r1:1.5b",
107
+ "name": "DeepSeek R1 1.5B",
108
+ "ramGb": 1.3,
109
+ "sizeMb": 980,
110
+ "quality": 72,
111
+ "useCase": "reasoning",
112
+ "verified": true
113
+ },
114
+ {
115
+ "id": "phi3:mini",
116
+ "name": "Phi-3 Mini",
117
+ "ramGb": 2.5,
118
+ "sizeMb": 2176,
119
+ "quality": 74,
120
+ "useCase": "reasoning small",
121
+ "verified": true
122
+ },
123
+ {
124
+ "id": "gemma2:2b",
125
+ "name": "Gemma 2 2B",
126
+ "ramGb": 1.6,
127
+ "sizeMb": 1240,
128
+ "quality": 71,
129
+ "useCase": "chat",
130
+ "verified": true
131
+ },
132
+ {
133
+ "id": "smollm2:1.7b",
134
+ "name": "SmolLM2 1.7B",
135
+ "ramGb": 1.4,
136
+ "sizeMb": 1084,
137
+ "quality": 65,
138
+ "useCase": "efficient chat",
139
+ "verified": true
140
+ },
141
+ {
142
+ "id": "internlm2:1.8b",
143
+ "name": "InternLM2 1.8B",
144
+ "ramGb": 1.5,
145
+ "sizeMb": 1136,
146
+ "quality": 69,
147
+ "useCase": "multilingual"
148
+ },
149
+ {
150
+ "id": "yi:1.5b",
151
+ "name": "Yi 1.5B",
152
+ "ramGb": 1.3,
153
+ "sizeMb": 980,
154
+ "quality": 67,
155
+ "useCase": "bilingual chat"
156
+ },
157
+ {
158
+ "id": "qwen2:1.5b",
159
+ "name": "Qwen 2 1.5B",
160
+ "ramGb": 1.3,
161
+ "sizeMb": 980,
162
+ "quality": 66,
163
+ "useCase": "chat"
164
+ },
165
+ {
166
+ "id": "orca-mini",
167
+ "name": "Orca Mini 3B",
168
+ "ramGb": 2.1,
169
+ "sizeMb": 1760,
170
+ "quality": 58,
171
+ "useCase": "teaching small"
172
+ },
173
+ {
174
+ "id": "stablelm-zephyr:3b",
175
+ "name": "StableLM Zephyr 3B",
176
+ "ramGb": 2.1,
177
+ "sizeMb": 1760,
178
+ "quality": 68,
179
+ "useCase": "chat"
180
+ },
181
+ {
182
+ "id": "llama3.2:3b",
183
+ "name": "Llama 3.2 3B",
184
+ "ramGb": 2.1,
185
+ "sizeMb": 1760,
186
+ "quality": 76,
187
+ "useCase": "general",
188
+ "verified": true
189
+ },
190
+ {
191
+ "id": "qwen2.5:3b",
192
+ "name": "Qwen 2.5 3B",
193
+ "ramGb": 2.1,
194
+ "sizeMb": 1760,
195
+ "quality": 78,
196
+ "useCase": "coding, JSON",
197
+ "verified": true
198
+ },
199
+ {
200
+ "id": "phi3.5:latest",
201
+ "name": "Phi 3.5",
202
+ "ramGb": 2.5,
203
+ "sizeMb": 2176,
204
+ "quality": 74,
205
+ "useCase": "reasoning",
206
+ "verified": true
207
+ },
208
+ {
209
+ "id": "gemma3:4b",
210
+ "name": "Gemma 3 4B",
211
+ "ramGb": 2.9,
212
+ "sizeMb": 2280,
213
+ "quality": 80,
214
+ "useCase": "quality chat",
215
+ "verified": true
216
+ },
217
+ {
218
+ "id": "gemma3:4b-it-qat",
219
+ "name": "Gemma 3 4B QAT",
220
+ "ramGb": 2.9,
221
+ "sizeMb": 2280,
222
+ "quality": 81,
223
+ "useCase": "efficient 4B"
224
+ },
225
+ {
226
+ "id": "codestral:22b-v0.1-q4_0",
227
+ "name": "Codestral 22B Q4",
228
+ "ramGb": 12.6,
229
+ "sizeMb": 11640,
230
+ "quality": 88,
231
+ "useCase": "coding frontier"
232
+ },
233
+ {
234
+ "id": "codegemma:2b",
235
+ "name": "CodeGemma 2B",
236
+ "ramGb": 1.6,
237
+ "sizeMb": 1240,
238
+ "quality": 72,
239
+ "useCase": "code completion"
240
+ },
241
+ {
242
+ "id": "starcoder2:3b",
243
+ "name": "StarCoder2 3B",
244
+ "ramGb": 2.1,
245
+ "sizeMb": 1760,
246
+ "quality": 75,
247
+ "useCase": "code"
248
+ },
249
+ {
250
+ "id": "deepseek-coder:1.3b",
251
+ "name": "DeepSeek Coder 1.3B",
252
+ "ramGb": 1.2,
253
+ "sizeMb": 876,
254
+ "quality": 70,
255
+ "useCase": "code small"
256
+ },
257
+ {
258
+ "id": "wizardcoder:3b",
259
+ "name": "WizardCoder 3B",
260
+ "ramGb": 2.1,
261
+ "sizeMb": 1760,
262
+ "quality": 71,
263
+ "useCase": "code"
264
+ },
265
+ {
266
+ "id": "sqlcoder:7b",
267
+ "name": "SQLCoder 7B",
268
+ "ramGb": 4.5,
269
+ "sizeMb": 3840,
270
+ "quality": 79,
271
+ "useCase": "SQL"
272
+ },
273
+ {
274
+ "id": "llama3.2-vision:11b",
275
+ "name": "Llama 3.2 Vision 11B",
276
+ "ramGb": 6.9,
277
+ "sizeMb": 5920,
278
+ "quality": 82,
279
+ "useCase": "vision"
280
+ },
281
+ {
282
+ "id": "moondream:1.8b",
283
+ "name": "Moondream 1.8B",
284
+ "ramGb": 1.5,
285
+ "sizeMb": 1136,
286
+ "quality": 64,
287
+ "useCase": "vision small"
288
+ },
289
+ {
290
+ "id": "llava:7b",
291
+ "name": "LLaVA 7B",
292
+ "ramGb": 4.5,
293
+ "sizeMb": 3840,
294
+ "quality": 76,
295
+ "useCase": "vision chat"
296
+ },
297
+ {
298
+ "id": "bakllava:7b",
299
+ "name": "BakLLaVA 7B",
300
+ "ramGb": 4.5,
301
+ "sizeMb": 3840,
302
+ "quality": 75,
303
+ "useCase": "vision"
304
+ },
305
+ {
306
+ "id": "granite3-dense:8b",
307
+ "name": "Granite 3 Dense 8B",
308
+ "ramGb": 5,
309
+ "sizeMb": 4360,
310
+ "quality": 83,
311
+ "useCase": "enterprise"
312
+ },
313
+ {
314
+ "id": "falcon3:3b",
315
+ "name": "Falcon 3 3B",
316
+ "ramGb": 2.1,
317
+ "sizeMb": 1760,
318
+ "quality": 70,
319
+ "useCase": "chat"
320
+ },
321
+ {
322
+ "id": "openhermes:2.5-mistral-7b",
323
+ "name": "OpenHermes Mistral 7B",
324
+ "ramGb": 4.5,
325
+ "sizeMb": 3840,
326
+ "quality": 77,
327
+ "useCase": "chat tuned"
328
+ },
329
+ {
330
+ "id": "mistral:7b",
331
+ "name": "Mistral 7B",
332
+ "ramGb": 4.5,
333
+ "sizeMb": 3840,
334
+ "quality": 82,
335
+ "useCase": "general",
336
+ "verified": true
337
+ },
338
+ {
339
+ "id": "mistral:7b-instruct",
340
+ "name": "Mistral 7B Instruct",
341
+ "ramGb": 4.5,
342
+ "sizeMb": 3840,
343
+ "quality": 83,
344
+ "useCase": "instructions"
345
+ },
346
+ {
347
+ "id": "mistral-nemo:12b",
348
+ "name": "Mistral Nemo 12B",
349
+ "ramGb": 7.4,
350
+ "sizeMb": 6440,
351
+ "quality": 85,
352
+ "useCase": "long context",
353
+ "verified": true
354
+ },
355
+ {
356
+ "id": "llama3.1:8b",
357
+ "name": "Llama 3.1 8B",
358
+ "ramGb": 5,
359
+ "sizeMb": 4360,
360
+ "quality": 84,
361
+ "useCase": "general, tools",
362
+ "verified": true
363
+ },
364
+ {
365
+ "id": "llama3.1:8b-instruct-q4_K_M",
366
+ "name": "Llama 3.1 8B Q4",
367
+ "ramGb": 5,
368
+ "sizeMb": 4360,
369
+ "quality": 84,
370
+ "useCase": "general"
371
+ },
372
+ {
373
+ "id": "llama3.2:3b-instruct-q4_K_M",
374
+ "name": "Llama 3.2 3B Q4",
375
+ "ramGb": 2.1,
376
+ "sizeMb": 1760,
377
+ "quality": 76,
378
+ "useCase": "fast general"
379
+ },
380
+ {
381
+ "id": "llama3.3:70b",
382
+ "name": "Llama 3.3 70B",
383
+ "ramGb": 38.9,
384
+ "sizeMb": 36600,
385
+ "quality": 93,
386
+ "useCase": "frontier",
387
+ "verified": true
388
+ },
389
+ {
390
+ "id": "qwen2.5:7b",
391
+ "name": "Qwen 2.5 7B",
392
+ "ramGb": 4.5,
393
+ "sizeMb": 3840,
394
+ "quality": 86,
395
+ "useCase": "coding, chat",
396
+ "verified": true
397
+ },
398
+ {
399
+ "id": "qwen2.5:7b-instruct",
400
+ "name": "Qwen 2.5 7B Instruct",
401
+ "ramGb": 4.5,
402
+ "sizeMb": 3840,
403
+ "quality": 86,
404
+ "useCase": "chat"
405
+ },
406
+ {
407
+ "id": "qwen2.5-coder:7b",
408
+ "name": "Qwen 2.5 Coder 7B",
409
+ "ramGb": 4.5,
410
+ "sizeMb": 3840,
411
+ "quality": 87,
412
+ "useCase": "coding",
413
+ "verified": true
414
+ },
415
+ {
416
+ "id": "qwen2.5-coder:1.5b",
417
+ "name": "Qwen 2.5 Coder 1.5B",
418
+ "ramGb": 1.3,
419
+ "sizeMb": 980,
420
+ "quality": 74,
421
+ "useCase": "code small"
422
+ },
423
+ {
424
+ "id": "deepseek-r1:7b",
425
+ "name": "DeepSeek R1 7B",
426
+ "ramGb": 4.5,
427
+ "sizeMb": 3840,
428
+ "quality": 85,
429
+ "useCase": "reasoning",
430
+ "verified": true
431
+ },
432
+ {
433
+ "id": "deepseek-r1:8b",
434
+ "name": "DeepSeek R1 8B",
435
+ "ramGb": 5,
436
+ "sizeMb": 4360,
437
+ "quality": 86,
438
+ "useCase": "reasoning"
439
+ },
440
+ {
441
+ "id": "deepseek-coder:6.7b",
442
+ "name": "DeepSeek Coder 6.7B",
443
+ "ramGb": 4.3,
444
+ "sizeMb": 3684,
445
+ "quality": 84,
446
+ "useCase": "coding"
447
+ },
448
+ {
449
+ "id": "deepseek-coder-v2:16b",
450
+ "name": "DeepSeek Coder v2 16B",
451
+ "ramGb": 9.5,
452
+ "sizeMb": 8520,
453
+ "quality": 89,
454
+ "useCase": "coding large"
455
+ },
456
+ {
457
+ "id": "codellama:7b",
458
+ "name": "Code Llama 7B",
459
+ "ramGb": 4.5,
460
+ "sizeMb": 3840,
461
+ "quality": 83,
462
+ "useCase": "coding",
463
+ "verified": true
464
+ },
465
+ {
466
+ "id": "codellama:13b",
467
+ "name": "Code Llama 13B",
468
+ "ramGb": 8,
469
+ "sizeMb": 6960,
470
+ "quality": 86,
471
+ "useCase": "coding"
472
+ },
473
+ {
474
+ "id": "codellama:34b",
475
+ "name": "Code Llama 34B",
476
+ "ramGb": 20.2,
477
+ "sizeMb": 17880,
478
+ "quality": 90,
479
+ "useCase": "coding frontier"
480
+ },
481
+ {
482
+ "id": "neural-chat:7b",
483
+ "name": "Neural Chat 7B",
484
+ "ramGb": 4.5,
485
+ "sizeMb": 3840,
486
+ "quality": 79,
487
+ "useCase": "chat",
488
+ "verified": true
489
+ },
490
+ {
491
+ "id": "starling-lm:7b",
492
+ "name": "Starling 7B",
493
+ "ramGb": 4.5,
494
+ "sizeMb": 3840,
495
+ "quality": 81,
496
+ "useCase": "chat"
497
+ },
498
+ {
499
+ "id": "openchat:7b",
500
+ "name": "OpenChat 7B",
501
+ "ramGb": 4.5,
502
+ "sizeMb": 3840,
503
+ "quality": 80,
504
+ "useCase": "chat"
505
+ },
506
+ {
507
+ "id": "vicuna:7b",
508
+ "name": "Vicuna 7B",
509
+ "ramGb": 4.5,
510
+ "sizeMb": 3840,
511
+ "quality": 78,
512
+ "useCase": "chat"
513
+ },
514
+ {
515
+ "id": "wizardlm2:7b",
516
+ "name": "WizardLM2 7B",
517
+ "ramGb": 4.5,
518
+ "sizeMb": 3840,
519
+ "quality": 80,
520
+ "useCase": "instructions"
521
+ },
522
+ {
523
+ "id": "wizardlm2:8x22b",
524
+ "name": "WizardLM2 8x22B MoE",
525
+ "ramGb": 75.8,
526
+ "sizeMb": 73520,
527
+ "quality": 94,
528
+ "useCase": "MoE frontier"
529
+ },
530
+ {
531
+ "id": "nous-hermes2:7b",
532
+ "name": "Nous Hermes 2 7B",
533
+ "ramGb": 4.5,
534
+ "sizeMb": 3840,
535
+ "quality": 81,
536
+ "useCase": "chat"
537
+ },
538
+ {
539
+ "id": "nous-hermes2-mixtral:8x7b",
540
+ "name": "Nous Hermes Mixtral",
541
+ "ramGb": 26.9,
542
+ "sizeMb": 24640,
543
+ "quality": 90,
544
+ "useCase": "MoE chat"
545
+ },
546
+ {
547
+ "id": "dolphin-mistral:7b",
548
+ "name": "Dolphin Mistral 7B",
549
+ "ramGb": 4.5,
550
+ "sizeMb": 3840,
551
+ "quality": 79,
552
+ "useCase": "uncensored chat"
553
+ },
554
+ {
555
+ "id": "dolphin-llama3:8b",
556
+ "name": "Dolphin Llama 3 8B",
557
+ "ramGb": 5,
558
+ "sizeMb": 4360,
559
+ "quality": 80,
560
+ "useCase": "uncensored chat"
561
+ },
562
+ {
563
+ "id": "solar:10.7b",
564
+ "name": "Solar 10.7B",
565
+ "ramGb": 6.8,
566
+ "sizeMb": 5764,
567
+ "quality": 84,
568
+ "useCase": "depth-upscaled"
569
+ },
570
+ {
571
+ "id": "yi:6b",
572
+ "name": "Yi 6B",
573
+ "ramGb": 4,
574
+ "sizeMb": 3320,
575
+ "quality": 80,
576
+ "useCase": "bilingual"
577
+ },
578
+ {
579
+ "id": "yi:9b",
580
+ "name": "Yi 9B",
581
+ "ramGb": 5.5,
582
+ "sizeMb": 4880,
583
+ "quality": 83,
584
+ "useCase": "bilingual quality"
585
+ },
586
+ {
587
+ "id": "command-r7b",
588
+ "name": "Command R 7B",
589
+ "ramGb": 4.5,
590
+ "sizeMb": 3840,
591
+ "quality": 82,
592
+ "useCase": "RAG, tools"
593
+ },
594
+ {
595
+ "id": "command-r:35b",
596
+ "name": "Command R 35B",
597
+ "ramGb": 20.7,
598
+ "sizeMb": 18400,
599
+ "quality": 91,
600
+ "useCase": "RAG enterprise"
601
+ },
602
+ {
603
+ "id": "command-r-plus:104b",
604
+ "name": "Command R+ 104B",
605
+ "ramGb": 56.6,
606
+ "sizeMb": 54280,
607
+ "quality": 95,
608
+ "useCase": "frontier RAG"
609
+ },
610
+ {
611
+ "id": "granite3.1-dense:8b",
612
+ "name": "Granite 3.1 8B",
613
+ "ramGb": 5,
614
+ "sizeMb": 4360,
615
+ "quality": 84,
616
+ "useCase": "enterprise"
617
+ },
618
+ {
619
+ "id": "granite3.1-moe:1b",
620
+ "name": "Granite 3.1 MoE 1B",
621
+ "ramGb": 1.1,
622
+ "sizeMb": 720,
623
+ "quality": 70,
624
+ "useCase": "efficient MoE"
625
+ },
626
+ {
627
+ "id": "falcon:7b",
628
+ "name": "Falcon 7B",
629
+ "ramGb": 4.5,
630
+ "sizeMb": 3840,
631
+ "quality": 77,
632
+ "useCase": "general"
633
+ },
634
+ {
635
+ "id": "falcon2:11b",
636
+ "name": "Falcon 2 11B",
637
+ "ramGb": 6.9,
638
+ "sizeMb": 5920,
639
+ "quality": 82,
640
+ "useCase": "general"
641
+ },
642
+ {
643
+ "id": "zephyr:7b",
644
+ "name": "Zephyr 7B",
645
+ "ramGb": 4.5,
646
+ "sizeMb": 3840,
647
+ "quality": 80,
648
+ "useCase": "helpful chat",
649
+ "verified": true
650
+ },
651
+ {
652
+ "id": "orca2:7b",
653
+ "name": "Orca 2 7B",
654
+ "ramGb": 4.5,
655
+ "sizeMb": 3840,
656
+ "quality": 79,
657
+ "useCase": "reasoning"
658
+ },
659
+ {
660
+ "id": "orca2:13b",
661
+ "name": "Orca 2 13B",
662
+ "ramGb": 8,
663
+ "sizeMb": 6960,
664
+ "quality": 84,
665
+ "useCase": "reasoning"
666
+ },
667
+ {
668
+ "id": "wizard-vicuna-uncensored:7b",
669
+ "name": "Wizard Vicuna 7B",
670
+ "ramGb": 4.5,
671
+ "sizeMb": 3840,
672
+ "quality": 76,
673
+ "useCase": "uncensored"
674
+ },
675
+ {
676
+ "id": "everythinglm:13b",
677
+ "name": "EverythingLM 13B",
678
+ "ramGb": 8,
679
+ "sizeMb": 6960,
680
+ "quality": 78,
681
+ "useCase": "roleplay"
682
+ },
683
+ {
684
+ "id": "megadolphin:7b",
685
+ "name": "MegaDolphin 7B",
686
+ "ramGb": 4.5,
687
+ "sizeMb": 3840,
688
+ "quality": 77,
689
+ "useCase": "uncensored"
690
+ },
691
+ {
692
+ "id": "open-orca-platypus2:13b",
693
+ "name": "OpenOrca Platypus2 13B",
694
+ "ramGb": 8,
695
+ "sizeMb": 6960,
696
+ "quality": 80,
697
+ "useCase": "reasoning"
698
+ },
699
+ {
700
+ "id": "stable-beluga:7b",
701
+ "name": "Stable Beluga 7B",
702
+ "ramGb": 4.5,
703
+ "sizeMb": 3840,
704
+ "quality": 78,
705
+ "useCase": "chat"
706
+ },
707
+ {
708
+ "id": "stable-beluga:13b",
709
+ "name": "Stable Beluga 13B",
710
+ "ramGb": 8,
711
+ "sizeMb": 6960,
712
+ "quality": 81,
713
+ "useCase": "chat"
714
+ },
715
+ {
716
+ "id": "meditron:7b",
717
+ "name": "Meditron 7B",
718
+ "ramGb": 4.5,
719
+ "sizeMb": 3840,
720
+ "quality": 76,
721
+ "useCase": "medical"
722
+ },
723
+ {
724
+ "id": "medllama2:7b",
725
+ "name": "MedLlama2 7B",
726
+ "ramGb": 4.5,
727
+ "sizeMb": 3840,
728
+ "quality": 75,
729
+ "useCase": "medical"
730
+ },
731
+ {
732
+ "id": "biomistral:7b",
733
+ "name": "BioMistral 7B",
734
+ "ramGb": 4.5,
735
+ "sizeMb": 3840,
736
+ "quality": 77,
737
+ "useCase": "biomedical"
738
+ },
739
+ {
740
+ "id": "llama2:7b",
741
+ "name": "Llama 2 7B",
742
+ "ramGb": 4.5,
743
+ "sizeMb": 3840,
744
+ "quality": 72,
745
+ "useCase": "legacy general",
746
+ "verified": true
747
+ },
748
+ {
749
+ "id": "llama2:13b",
750
+ "name": "Llama 2 13B",
751
+ "ramGb": 8,
752
+ "sizeMb": 6960,
753
+ "quality": 78,
754
+ "useCase": "legacy general"
755
+ },
756
+ {
757
+ "id": "llama2:70b",
758
+ "name": "Llama 2 70B",
759
+ "ramGb": 38.9,
760
+ "sizeMb": 36600,
761
+ "quality": 90,
762
+ "useCase": "legacy frontier"
763
+ },
764
+ {
765
+ "id": "llama2-chinese:7b",
766
+ "name": "Llama 2 Chinese 7B",
767
+ "ramGb": 4.5,
768
+ "sizeMb": 3840,
769
+ "quality": 74,
770
+ "useCase": "chinese"
771
+ },
772
+ {
773
+ "id": "gemma:7b",
774
+ "name": "Gemma 7B",
775
+ "ramGb": 4.5,
776
+ "sizeMb": 3840,
777
+ "quality": 79,
778
+ "useCase": "google chat"
779
+ },
780
+ {
781
+ "id": "gemma2:9b",
782
+ "name": "Gemma 2 9B",
783
+ "ramGb": 5.5,
784
+ "sizeMb": 4880,
785
+ "quality": 84,
786
+ "useCase": "quality chat",
787
+ "verified": true
788
+ },
789
+ {
790
+ "id": "gemma2:27b",
791
+ "name": "Gemma 2 27B",
792
+ "ramGb": 15.2,
793
+ "sizeMb": 14240,
794
+ "quality": 91,
795
+ "useCase": "frontier chat"
796
+ },
797
+ {
798
+ "id": "gemma3:12b",
799
+ "name": "Gemma 3 12B",
800
+ "ramGb": 7.4,
801
+ "sizeMb": 6440,
802
+ "quality": 87,
803
+ "useCase": "multimodal text"
804
+ },
805
+ {
806
+ "id": "gemma3:27b",
807
+ "name": "Gemma 3 27B",
808
+ "ramGb": 15.2,
809
+ "sizeMb": 14240,
810
+ "quality": 92,
811
+ "useCase": "frontier"
812
+ },
813
+ {
814
+ "id": "phi4:14b",
815
+ "name": "Phi-4 14B",
816
+ "ramGb": 8.5,
817
+ "sizeMb": 7480,
818
+ "quality": 88,
819
+ "useCase": "reasoning"
820
+ },
821
+ {
822
+ "id": "marco-o1:7b",
823
+ "name": "Marco-o1 7B",
824
+ "ramGb": 4.5,
825
+ "sizeMb": 3840,
826
+ "quality": 82,
827
+ "useCase": "reasoning"
828
+ },
829
+ {
830
+ "id": "reflection:70b",
831
+ "name": "Reflection 70B",
832
+ "ramGb": 38.9,
833
+ "sizeMb": 36600,
834
+ "quality": 92,
835
+ "useCase": "self-correct"
836
+ },
837
+ {
838
+ "id": "athene-v2:72b",
839
+ "name": "Athene v2 72B",
840
+ "ramGb": 39.9,
841
+ "sizeMb": 37640,
842
+ "quality": 93,
843
+ "useCase": "agentic"
844
+ },
845
+ {
846
+ "id": "sailor2:8b",
847
+ "name": "Sailor2 8B",
848
+ "ramGb": 5,
849
+ "sizeMb": 4360,
850
+ "quality": 81,
851
+ "useCase": "multilingual sea"
852
+ },
853
+ {
854
+ "id": "exaone3.5:7.8b",
855
+ "name": "EXAONE 3.5 7.8B",
856
+ "ramGb": 4.9,
857
+ "sizeMb": 4256,
858
+ "quality": 83,
859
+ "useCase": "korean, english"
860
+ },
861
+ {
862
+ "id": "aya:23-8b",
863
+ "name": "Aya 23 8B",
864
+ "ramGb": 5,
865
+ "sizeMb": 4360,
866
+ "quality": 82,
867
+ "useCase": "multilingual"
868
+ },
869
+ {
870
+ "id": "aya:23-35b",
871
+ "name": "Aya 23 35B",
872
+ "ramGb": 20.7,
873
+ "sizeMb": 18400,
874
+ "quality": 90,
875
+ "useCase": "multilingual large"
876
+ },
877
+ {
878
+ "id": "nemotron-mini:4b",
879
+ "name": "Nemotron Mini 4B",
880
+ "ramGb": 2.9,
881
+ "sizeMb": 2280,
882
+ "quality": 76,
883
+ "useCase": "nvidia small"
884
+ },
885
+ {
886
+ "id": "nemotron:70b",
887
+ "name": "Nemotron 70B",
888
+ "ramGb": 38.9,
889
+ "sizeMb": 36600,
890
+ "quality": 92,
891
+ "useCase": "nvidia frontier"
892
+ },
893
+ {
894
+ "id": "snowflake-arctic-embed:335m",
895
+ "name": "Snowflake Arctic Embed",
896
+ "ramGb": 0.5,
897
+ "sizeMb": 294,
898
+ "quality": 58,
899
+ "useCase": "embeddings",
900
+ "kind": "embed"
901
+ },
902
+ {
903
+ "id": "nomic-embed-text",
904
+ "name": "Nomic Embed Text",
905
+ "ramGb": 0.4,
906
+ "sizeMb": 193,
907
+ "quality": 60,
908
+ "useCase": "embeddings",
909
+ "kind": "embed"
910
+ },
911
+ {
912
+ "id": "mxbai-embed-large",
913
+ "name": "MxBai Embed Large",
914
+ "ramGb": 0.5,
915
+ "sizeMb": 297,
916
+ "quality": 62,
917
+ "useCase": "embeddings",
918
+ "kind": "embed"
919
+ },
920
+ {
921
+ "id": "bge-large",
922
+ "name": "BGE Large",
923
+ "ramGb": 0.5,
924
+ "sizeMb": 297,
925
+ "quality": 61,
926
+ "useCase": "embeddings",
927
+ "kind": "embed"
928
+ },
929
+ {
930
+ "id": "all-minilm",
931
+ "name": "All-MiniLM",
932
+ "ramGb": 0.4,
933
+ "sizeMb": 162,
934
+ "quality": 55,
935
+ "useCase": "embeddings",
936
+ "kind": "embed"
937
+ },
938
+ {
939
+ "id": "qwen2.5:14b",
940
+ "name": "Qwen 2.5 14B",
941
+ "ramGb": 8.5,
942
+ "sizeMb": 7480,
943
+ "quality": 88,
944
+ "useCase": "reasoning",
945
+ "verified": true
946
+ },
947
+ {
948
+ "id": "qwen2.5:14b-instruct",
949
+ "name": "Qwen 2.5 14B Instruct",
950
+ "ramGb": 8.5,
951
+ "sizeMb": 7480,
952
+ "quality": 88,
953
+ "useCase": "chat"
954
+ },
955
+ {
956
+ "id": "qwen2.5:32b",
957
+ "name": "Qwen 2.5 32B",
958
+ "ramGb": 19.1,
959
+ "sizeMb": 16840,
960
+ "quality": 90,
961
+ "useCase": "frontier local"
962
+ },
963
+ {
964
+ "id": "qwen2.5:72b",
965
+ "name": "Qwen 2.5 72B",
966
+ "ramGb": 39.9,
967
+ "sizeMb": 37640,
968
+ "quality": 94,
969
+ "useCase": "frontier"
970
+ },
971
+ {
972
+ "id": "llama3.1:70b",
973
+ "name": "Llama 3.1 70B",
974
+ "ramGb": 38.9,
975
+ "sizeMb": 36600,
976
+ "quality": 92,
977
+ "useCase": "frontier"
978
+ },
979
+ {
980
+ "id": "llama3.1:70b-instruct-q4_K_M",
981
+ "name": "Llama 3.1 70B Q4",
982
+ "ramGb": 38.9,
983
+ "sizeMb": 36600,
984
+ "quality": 92,
985
+ "useCase": "frontier"
986
+ },
987
+ {
988
+ "id": "mixtral:8x7b",
989
+ "name": "Mixtral 8x7B MoE",
990
+ "ramGb": 26.9,
991
+ "sizeMb": 24640,
992
+ "quality": 91,
993
+ "useCase": "MoE quality"
994
+ },
995
+ {
996
+ "id": "mixtral:8x22b",
997
+ "name": "Mixtral 8x22B MoE",
998
+ "ramGb": 75.8,
999
+ "sizeMb": 73520,
1000
+ "quality": 95,
1001
+ "useCase": "MoE frontier"
1002
+ },
1003
+ {
1004
+ "id": "solar-pro:22b",
1005
+ "name": "Solar Pro 22B",
1006
+ "ramGb": 12.6,
1007
+ "sizeMb": 11640,
1008
+ "quality": 89,
1009
+ "useCase": "reasoning"
1010
+ },
1011
+ {
1012
+ "id": "dbrx:132b",
1013
+ "name": "DBRX 132B MoE",
1014
+ "ramGb": 71.1,
1015
+ "sizeMb": 68840,
1016
+ "quality": 96,
1017
+ "useCase": "enterprise MoE"
1018
+ },
1019
+ {
1020
+ "id": "internlm2:7b",
1021
+ "name": "InternLM2 7B",
1022
+ "ramGb": 4.5,
1023
+ "sizeMb": 3840,
1024
+ "quality": 82,
1025
+ "useCase": "multilingual"
1026
+ },
1027
+ {
1028
+ "id": "internlm2:20b",
1029
+ "name": "InternLM2 20B",
1030
+ "ramGb": 11.6,
1031
+ "sizeMb": 10600,
1032
+ "quality": 88,
1033
+ "useCase": "multilingual large"
1034
+ },
1035
+ {
1036
+ "id": "wizardlm:13b",
1037
+ "name": "WizardLM 13B",
1038
+ "ramGb": 8,
1039
+ "sizeMb": 6960,
1040
+ "quality": 80,
1041
+ "useCase": "instructions"
1042
+ },
1043
+ {
1044
+ "id": "nous-hermes2:10.7b",
1045
+ "name": "Nous Hermes 10.7B",
1046
+ "ramGb": 6.8,
1047
+ "sizeMb": 5764,
1048
+ "quality": 83,
1049
+ "useCase": "chat"
1050
+ },
1051
+ {
1052
+ "id": "starcoder2:7b",
1053
+ "name": "StarCoder2 7B",
1054
+ "ramGb": 4.5,
1055
+ "sizeMb": 3840,
1056
+ "quality": 82,
1057
+ "useCase": "code"
1058
+ },
1059
+ {
1060
+ "id": "starcoder2:15b",
1061
+ "name": "StarCoder2 15B",
1062
+ "ramGb": 9,
1063
+ "sizeMb": 8000,
1064
+ "quality": 86,
1065
+ "useCase": "code large"
1066
+ },
1067
+ {
1068
+ "id": "shieldgemma:9b",
1069
+ "name": "ShieldGemma 9B",
1070
+ "ramGb": 5.5,
1071
+ "sizeMb": 4880,
1072
+ "quality": 78,
1073
+ "useCase": "safety"
1074
+ },
1075
+ {
1076
+ "id": "mathstral:7b",
1077
+ "name": "Mathstral 7B",
1078
+ "ramGb": 4.5,
1079
+ "sizeMb": 3840,
1080
+ "quality": 84,
1081
+ "useCase": "math"
1082
+ },
1083
+ {
1084
+ "id": "llama3-groq-tool-use:8b",
1085
+ "name": "Llama 3 Groq Tool Use 8B",
1086
+ "ramGb": 5,
1087
+ "sizeMb": 4360,
1088
+ "quality": 85,
1089
+ "useCase": "tool calling"
1090
+ },
1091
+ {
1092
+ "id": "firefunction-v2:70b",
1093
+ "name": "Firefunction v2 70B",
1094
+ "ramGb": 38.9,
1095
+ "sizeMb": 36600,
1096
+ "quality": 91,
1097
+ "useCase": "function calling"
1098
+ },
1099
+ {
1100
+ "id": "granite3-moe:3b",
1101
+ "name": "Granite 3 MoE 3B",
1102
+ "ramGb": 2.1,
1103
+ "sizeMb": 1760,
1104
+ "quality": 77,
1105
+ "useCase": "efficient MoE"
1106
+ },
1107
+ {
1108
+ "id": "granite-code:8b",
1109
+ "name": "Granite Code 8B",
1110
+ "ramGb": 5,
1111
+ "sizeMb": 4360,
1112
+ "quality": 84,
1113
+ "useCase": "code enterprise"
1114
+ },
1115
+ {
1116
+ "id": "stable-code:3b",
1117
+ "name": "Stable Code 3B",
1118
+ "ramGb": 2.1,
1119
+ "sizeMb": 1760,
1120
+ "quality": 73,
1121
+ "useCase": "code"
1122
+ },
1123
+ {
1124
+ "id": "stablelm2:12b",
1125
+ "name": "StableLM2 12B",
1126
+ "ramGb": 7.4,
1127
+ "sizeMb": 6440,
1128
+ "quality": 82,
1129
+ "useCase": "chat"
1130
+ },
1131
+ {
1132
+ "id": "mpt:7b",
1133
+ "name": "MPT 7B",
1134
+ "ramGb": 4.5,
1135
+ "sizeMb": 3840,
1136
+ "quality": 74,
1137
+ "useCase": "legacy chat"
1138
+ },
1139
+ {
1140
+ "id": "mpt:30b",
1141
+ "name": "MPT 30B",
1142
+ "ramGb": 18.1,
1143
+ "sizeMb": 15800,
1144
+ "quality": 86,
1145
+ "useCase": "legacy large"
1146
+ },
1147
+ {
1148
+ "id": "yarn-mistral:7b-128k",
1149
+ "name": "Yarn Mistral 7B 128k",
1150
+ "ramGb": 4.5,
1151
+ "sizeMb": 3840,
1152
+ "quality": 81,
1153
+ "useCase": "long context"
1154
+ },
1155
+ {
1156
+ "id": "llama-pro:8b",
1157
+ "name": "Llama Pro 8B",
1158
+ "ramGb": 5,
1159
+ "sizeMb": 4360,
1160
+ "quality": 83,
1161
+ "useCase": "block expansion"
1162
+ },
1163
+ {
1164
+ "id": "openhermes:7b-mistral-v2.5",
1165
+ "name": "OpenHermes 7B v2.5",
1166
+ "ramGb": 4.5,
1167
+ "sizeMb": 3840,
1168
+ "quality": 80,
1169
+ "useCase": "chat"
1170
+ },
1171
+ {
1172
+ "id": "nous-capybara:7b",
1173
+ "name": "Nous Capybara 7B",
1174
+ "ramGb": 4.5,
1175
+ "sizeMb": 3840,
1176
+ "quality": 79,
1177
+ "useCase": "chat"
1178
+ },
1179
+ {
1180
+ "id": "neural-chat:7b-v3-3",
1181
+ "name": "Neural Chat 7B v3.3",
1182
+ "ramGb": 4.5,
1183
+ "sizeMb": 3840,
1184
+ "quality": 80,
1185
+ "useCase": "chat"
1186
+ },
1187
+ {
1188
+ "id": "wizard-math:7b",
1189
+ "name": "WizardMath 7B",
1190
+ "ramGb": 4.5,
1191
+ "sizeMb": 3840,
1192
+ "quality": 82,
1193
+ "useCase": "math"
1194
+ },
1195
+ {
1196
+ "id": "wizard-math:13b",
1197
+ "name": "WizardMath 13B",
1198
+ "ramGb": 8,
1199
+ "sizeMb": 6960,
1200
+ "quality": 85,
1201
+ "useCase": "math"
1202
+ },
1203
+ {
1204
+ "id": "deepseek-llm:7b",
1205
+ "name": "DeepSeek LLM 7B",
1206
+ "ramGb": 4.5,
1207
+ "sizeMb": 3840,
1208
+ "quality": 81,
1209
+ "useCase": "general"
1210
+ },
1211
+ {
1212
+ "id": "deepseek-llm:67b",
1213
+ "name": "DeepSeek LLM 67B",
1214
+ "ramGb": 37.3,
1215
+ "sizeMb": 35040,
1216
+ "quality": 91,
1217
+ "useCase": "frontier"
1218
+ },
1219
+ {
1220
+ "id": "qwen:7b",
1221
+ "name": "Qwen 7B",
1222
+ "ramGb": 4.5,
1223
+ "sizeMb": 3840,
1224
+ "quality": 78,
1225
+ "useCase": "legacy chat"
1226
+ },
1227
+ {
1228
+ "id": "qwen:14b",
1229
+ "name": "Qwen 14B",
1230
+ "ramGb": 8.5,
1231
+ "sizeMb": 7480,
1232
+ "quality": 84,
1233
+ "useCase": "legacy chat"
1234
+ },
1235
+ {
1236
+ "id": "qwen:72b",
1237
+ "name": "Qwen 72B",
1238
+ "ramGb": 39.9,
1239
+ "sizeMb": 37640,
1240
+ "quality": 92,
1241
+ "useCase": "legacy frontier"
1242
+ },
1243
+ {
1244
+ "id": "qwen2:7b",
1245
+ "name": "Qwen 2 7B",
1246
+ "ramGb": 4.5,
1247
+ "sizeMb": 3840,
1248
+ "quality": 82,
1249
+ "useCase": "chat"
1250
+ },
1251
+ {
1252
+ "id": "qwen2:72b",
1253
+ "name": "Qwen 2 72B",
1254
+ "ramGb": 39.9,
1255
+ "sizeMb": 37640,
1256
+ "quality": 93,
1257
+ "useCase": "frontier"
1258
+ }
1259
+ ]