@openinference/cli 1.0.2 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/data/models.json +153 -153
- package/dist/chat.d.ts +9 -0
- package/dist/chat.d.ts.map +1 -1
- package/dist/chat.js +60 -0
- package/dist/chat.js.map +1 -1
- package/dist/data/models.json +153 -153
- package/dist/index.js +17 -2
- package/dist/index.js.map +1 -1
- package/dist/ollama.d.ts +1 -0
- package/dist/ollama.d.ts.map +1 -1
- package/dist/ollama.js +8 -0
- package/dist/ollama.js.map +1 -1
- package/dist/recommend-run.js +1 -1
- package/dist/recommend-run.js.map +1 -1
- package/dist/recommend.d.ts +6 -2
- package/dist/recommend.d.ts.map +1 -1
- package/dist/recommend.js +41 -6
- package/dist/recommend.js.map +1 -1
- package/dist/setup.js +5 -5
- package/dist/setup.js.map +1 -1
- package/dist/shell.d.ts +6 -0
- package/dist/shell.d.ts.map +1 -0
- package/dist/shell.js +268 -0
- package/dist/shell.js.map +1 -0
- package/dist/version.d.ts +2 -0
- package/dist/version.d.ts.map +1 -0
- package/dist/version.js +20 -0
- package/dist/version.js.map +1 -0
- package/package.json +1 -1
package/data/models.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
{
|
|
3
3
|
"id": "smollm2:135m",
|
|
4
4
|
"name": "SmolLM2 135M",
|
|
5
|
-
"ramGb": 0.
|
|
5
|
+
"ramGb": 0.6,
|
|
6
6
|
"sizeMb": 190,
|
|
7
7
|
"quality": 45,
|
|
8
8
|
"useCase": "classification, tags",
|
|
@@ -14,7 +14,7 @@
|
|
|
14
14
|
{
|
|
15
15
|
"id": "smollm2:360m",
|
|
16
16
|
"name": "SmolLM2 360M",
|
|
17
|
-
"ramGb": 0.
|
|
17
|
+
"ramGb": 0.8,
|
|
18
18
|
"sizeMb": 307,
|
|
19
19
|
"quality": 50,
|
|
20
20
|
"useCase": "light tasks",
|
|
@@ -26,7 +26,7 @@
|
|
|
26
26
|
{
|
|
27
27
|
"id": "qwen2.5:0.5b",
|
|
28
28
|
"name": "Qwen 2.5 0.5B",
|
|
29
|
-
"ramGb": 0.
|
|
29
|
+
"ramGb": 0.9,
|
|
30
30
|
"sizeMb": 380,
|
|
31
31
|
"quality": 52,
|
|
32
32
|
"useCase": "fast labels",
|
|
@@ -38,7 +38,7 @@
|
|
|
38
38
|
{
|
|
39
39
|
"id": "tinyllama",
|
|
40
40
|
"name": "TinyLlama 1.1B",
|
|
41
|
-
"ramGb": 1.
|
|
41
|
+
"ramGb": 1.8,
|
|
42
42
|
"sizeMb": 772,
|
|
43
43
|
"quality": 48,
|
|
44
44
|
"useCase": "tiny chat",
|
|
@@ -51,7 +51,7 @@
|
|
|
51
51
|
{
|
|
52
52
|
"id": "tinydolphin",
|
|
53
53
|
"name": "TinyDolphin 1.5B",
|
|
54
|
-
"ramGb": 1
|
|
54
|
+
"ramGb": 2.1,
|
|
55
55
|
"sizeMb": 980,
|
|
56
56
|
"quality": 55,
|
|
57
57
|
"useCase": "uncensored small",
|
|
@@ -62,7 +62,7 @@
|
|
|
62
62
|
{
|
|
63
63
|
"id": "stablelm2:1.6b",
|
|
64
64
|
"name": "StableLM2 1.6B",
|
|
65
|
-
"ramGb":
|
|
65
|
+
"ramGb": 2.2,
|
|
66
66
|
"sizeMb": 1032,
|
|
67
67
|
"quality": 54,
|
|
68
68
|
"useCase": "chat",
|
|
@@ -74,7 +74,7 @@
|
|
|
74
74
|
{
|
|
75
75
|
"id": "olmo2:1b",
|
|
76
76
|
"name": "OLMo 2 1B",
|
|
77
|
-
"ramGb": 1.
|
|
77
|
+
"ramGb": 1.7,
|
|
78
78
|
"sizeMb": 720,
|
|
79
79
|
"quality": 56,
|
|
80
80
|
"useCase": "research chat",
|
|
@@ -87,7 +87,7 @@
|
|
|
87
87
|
{
|
|
88
88
|
"id": "granite3-dense:2b",
|
|
89
89
|
"name": "Granite 3 Dense 2B",
|
|
90
|
-
"ramGb":
|
|
90
|
+
"ramGb": 2.9,
|
|
91
91
|
"sizeMb": 1240,
|
|
92
92
|
"quality": 73,
|
|
93
93
|
"useCase": "enterprise chat",
|
|
@@ -99,7 +99,7 @@
|
|
|
99
99
|
{
|
|
100
100
|
"id": "gemma3:1b",
|
|
101
101
|
"name": "Gemma 3 1B",
|
|
102
|
-
"ramGb": 1.
|
|
102
|
+
"ramGb": 1.7,
|
|
103
103
|
"sizeMb": 720,
|
|
104
104
|
"quality": 68,
|
|
105
105
|
"useCase": "chat, general",
|
|
@@ -112,7 +112,7 @@
|
|
|
112
112
|
{
|
|
113
113
|
"id": "llama3.2:1b",
|
|
114
114
|
"name": "Llama 3.2 1B",
|
|
115
|
-
"ramGb": 1.
|
|
115
|
+
"ramGb": 1.7,
|
|
116
116
|
"sizeMb": 720,
|
|
117
117
|
"quality": 66,
|
|
118
118
|
"useCase": "instructions",
|
|
@@ -125,7 +125,7 @@
|
|
|
125
125
|
{
|
|
126
126
|
"id": "llama3.2:1b-instruct-q8_0",
|
|
127
127
|
"name": "Llama 3.2 1B Q8",
|
|
128
|
-
"ramGb": 1.
|
|
128
|
+
"ramGb": 1.7,
|
|
129
129
|
"sizeMb": 720,
|
|
130
130
|
"quality": 67,
|
|
131
131
|
"useCase": "precise small",
|
|
@@ -136,7 +136,7 @@
|
|
|
136
136
|
{
|
|
137
137
|
"id": "qwen2.5:1.5b",
|
|
138
138
|
"name": "Qwen 2.5 1.5B",
|
|
139
|
-
"ramGb": 1
|
|
139
|
+
"ramGb": 2.1,
|
|
140
140
|
"sizeMb": 980,
|
|
141
141
|
"quality": 70,
|
|
142
142
|
"useCase": "JSON, chat",
|
|
@@ -149,7 +149,7 @@
|
|
|
149
149
|
{
|
|
150
150
|
"id": "deepseek-r1:1.5b",
|
|
151
151
|
"name": "DeepSeek R1 1.5B",
|
|
152
|
-
"ramGb": 1
|
|
152
|
+
"ramGb": 2.1,
|
|
153
153
|
"sizeMb": 980,
|
|
154
154
|
"quality": 72,
|
|
155
155
|
"useCase": "reasoning",
|
|
@@ -161,7 +161,7 @@
|
|
|
161
161
|
{
|
|
162
162
|
"id": "phi3:mini",
|
|
163
163
|
"name": "Phi-3 Mini",
|
|
164
|
-
"ramGb": 2
|
|
164
|
+
"ramGb": 4.2,
|
|
165
165
|
"sizeMb": 2176,
|
|
166
166
|
"quality": 74,
|
|
167
167
|
"useCase": "reasoning small",
|
|
@@ -173,7 +173,7 @@
|
|
|
173
173
|
{
|
|
174
174
|
"id": "gemma2:2b",
|
|
175
175
|
"name": "Gemma 2 2B",
|
|
176
|
-
"ramGb":
|
|
176
|
+
"ramGb": 2.9,
|
|
177
177
|
"sizeMb": 1240,
|
|
178
178
|
"quality": 71,
|
|
179
179
|
"useCase": "chat",
|
|
@@ -186,7 +186,7 @@
|
|
|
186
186
|
{
|
|
187
187
|
"id": "smollm2:1.7b",
|
|
188
188
|
"name": "SmolLM2 1.7B",
|
|
189
|
-
"ramGb":
|
|
189
|
+
"ramGb": 2.2,
|
|
190
190
|
"sizeMb": 1084,
|
|
191
191
|
"quality": 65,
|
|
192
192
|
"useCase": "efficient chat",
|
|
@@ -199,7 +199,7 @@
|
|
|
199
199
|
{
|
|
200
200
|
"id": "internlm2:1.8b",
|
|
201
201
|
"name": "InternLM2 1.8B",
|
|
202
|
-
"ramGb":
|
|
202
|
+
"ramGb": 2.3,
|
|
203
203
|
"sizeMb": 1136,
|
|
204
204
|
"quality": 69,
|
|
205
205
|
"useCase": "multilingual",
|
|
@@ -210,7 +210,7 @@
|
|
|
210
210
|
{
|
|
211
211
|
"id": "yi:1.5b",
|
|
212
212
|
"name": "Yi 1.5B",
|
|
213
|
-
"ramGb": 1
|
|
213
|
+
"ramGb": 2.1,
|
|
214
214
|
"sizeMb": 980,
|
|
215
215
|
"quality": 67,
|
|
216
216
|
"useCase": "bilingual chat",
|
|
@@ -222,7 +222,7 @@
|
|
|
222
222
|
{
|
|
223
223
|
"id": "qwen2:1.5b",
|
|
224
224
|
"name": "Qwen 2 1.5B",
|
|
225
|
-
"ramGb": 1
|
|
225
|
+
"ramGb": 2.1,
|
|
226
226
|
"sizeMb": 980,
|
|
227
227
|
"quality": 66,
|
|
228
228
|
"useCase": "chat",
|
|
@@ -234,7 +234,7 @@
|
|
|
234
234
|
{
|
|
235
235
|
"id": "orca-mini",
|
|
236
236
|
"name": "Orca Mini 3B",
|
|
237
|
-
"ramGb":
|
|
237
|
+
"ramGb": 3.7,
|
|
238
238
|
"sizeMb": 1760,
|
|
239
239
|
"quality": 58,
|
|
240
240
|
"useCase": "teaching small",
|
|
@@ -245,7 +245,7 @@
|
|
|
245
245
|
{
|
|
246
246
|
"id": "stablelm-zephyr:3b",
|
|
247
247
|
"name": "StableLM Zephyr 3B",
|
|
248
|
-
"ramGb":
|
|
248
|
+
"ramGb": 3.7,
|
|
249
249
|
"sizeMb": 1760,
|
|
250
250
|
"quality": 68,
|
|
251
251
|
"useCase": "chat",
|
|
@@ -257,7 +257,7 @@
|
|
|
257
257
|
{
|
|
258
258
|
"id": "llama3.2:3b",
|
|
259
259
|
"name": "Llama 3.2 3B",
|
|
260
|
-
"ramGb":
|
|
260
|
+
"ramGb": 3.7,
|
|
261
261
|
"sizeMb": 1760,
|
|
262
262
|
"quality": 76,
|
|
263
263
|
"useCase": "general",
|
|
@@ -270,7 +270,7 @@
|
|
|
270
270
|
{
|
|
271
271
|
"id": "qwen2.5:3b",
|
|
272
272
|
"name": "Qwen 2.5 3B",
|
|
273
|
-
"ramGb":
|
|
273
|
+
"ramGb": 3.7,
|
|
274
274
|
"sizeMb": 1760,
|
|
275
275
|
"quality": 78,
|
|
276
276
|
"useCase": "coding, JSON",
|
|
@@ -282,7 +282,7 @@
|
|
|
282
282
|
{
|
|
283
283
|
"id": "phi3.5:latest",
|
|
284
284
|
"name": "Phi 3.5",
|
|
285
|
-
"ramGb": 2
|
|
285
|
+
"ramGb": 4.2,
|
|
286
286
|
"sizeMb": 2176,
|
|
287
287
|
"quality": 74,
|
|
288
288
|
"useCase": "reasoning",
|
|
@@ -294,7 +294,7 @@
|
|
|
294
294
|
{
|
|
295
295
|
"id": "gemma3:4b",
|
|
296
296
|
"name": "Gemma 3 4B",
|
|
297
|
-
"ramGb":
|
|
297
|
+
"ramGb": 5.1,
|
|
298
298
|
"sizeMb": 2280,
|
|
299
299
|
"quality": 80,
|
|
300
300
|
"useCase": "quality chat",
|
|
@@ -307,7 +307,7 @@
|
|
|
307
307
|
{
|
|
308
308
|
"id": "gemma3:4b-it-qat",
|
|
309
309
|
"name": "Gemma 3 4B QAT",
|
|
310
|
-
"ramGb":
|
|
310
|
+
"ramGb": 5.1,
|
|
311
311
|
"sizeMb": 2280,
|
|
312
312
|
"quality": 81,
|
|
313
313
|
"useCase": "efficient 4B",
|
|
@@ -318,7 +318,7 @@
|
|
|
318
318
|
{
|
|
319
319
|
"id": "codestral:22b-v0.1-q4_0",
|
|
320
320
|
"name": "Codestral 22B Q4",
|
|
321
|
-
"ramGb":
|
|
321
|
+
"ramGb": 19.3,
|
|
322
322
|
"sizeMb": 11640,
|
|
323
323
|
"quality": 88,
|
|
324
324
|
"useCase": "coding frontier",
|
|
@@ -329,7 +329,7 @@
|
|
|
329
329
|
{
|
|
330
330
|
"id": "codegemma:2b",
|
|
331
331
|
"name": "CodeGemma 2B",
|
|
332
|
-
"ramGb":
|
|
332
|
+
"ramGb": 2.9,
|
|
333
333
|
"sizeMb": 1240,
|
|
334
334
|
"quality": 72,
|
|
335
335
|
"useCase": "code completion",
|
|
@@ -340,7 +340,7 @@
|
|
|
340
340
|
{
|
|
341
341
|
"id": "starcoder2:3b",
|
|
342
342
|
"name": "StarCoder2 3B",
|
|
343
|
-
"ramGb":
|
|
343
|
+
"ramGb": 3.7,
|
|
344
344
|
"sizeMb": 1760,
|
|
345
345
|
"quality": 75,
|
|
346
346
|
"useCase": "code",
|
|
@@ -351,7 +351,7 @@
|
|
|
351
351
|
{
|
|
352
352
|
"id": "deepseek-coder:1.3b",
|
|
353
353
|
"name": "DeepSeek Coder 1.3B",
|
|
354
|
-
"ramGb": 1.
|
|
354
|
+
"ramGb": 1.9,
|
|
355
355
|
"sizeMb": 876,
|
|
356
356
|
"quality": 70,
|
|
357
357
|
"useCase": "code small",
|
|
@@ -362,7 +362,7 @@
|
|
|
362
362
|
{
|
|
363
363
|
"id": "wizardcoder:3b",
|
|
364
364
|
"name": "WizardCoder 3B",
|
|
365
|
-
"ramGb":
|
|
365
|
+
"ramGb": 3.7,
|
|
366
366
|
"sizeMb": 1760,
|
|
367
367
|
"quality": 71,
|
|
368
368
|
"useCase": "code",
|
|
@@ -373,7 +373,7 @@
|
|
|
373
373
|
{
|
|
374
374
|
"id": "sqlcoder:7b",
|
|
375
375
|
"name": "SQLCoder 7B",
|
|
376
|
-
"ramGb":
|
|
376
|
+
"ramGb": 7.2,
|
|
377
377
|
"sizeMb": 3840,
|
|
378
378
|
"quality": 79,
|
|
379
379
|
"useCase": "SQL",
|
|
@@ -384,7 +384,7 @@
|
|
|
384
384
|
{
|
|
385
385
|
"id": "llama3.2-vision:11b",
|
|
386
386
|
"name": "Llama 3.2 Vision 11B",
|
|
387
|
-
"ramGb":
|
|
387
|
+
"ramGb": 11.4,
|
|
388
388
|
"sizeMb": 5920,
|
|
389
389
|
"quality": 82,
|
|
390
390
|
"useCase": "vision",
|
|
@@ -395,7 +395,7 @@
|
|
|
395
395
|
{
|
|
396
396
|
"id": "moondream:1.8b",
|
|
397
397
|
"name": "Moondream 1.8B",
|
|
398
|
-
"ramGb":
|
|
398
|
+
"ramGb": 2.3,
|
|
399
399
|
"sizeMb": 1136,
|
|
400
400
|
"quality": 64,
|
|
401
401
|
"useCase": "vision small",
|
|
@@ -406,7 +406,7 @@
|
|
|
406
406
|
{
|
|
407
407
|
"id": "llava:7b",
|
|
408
408
|
"name": "LLaVA 7B",
|
|
409
|
-
"ramGb":
|
|
409
|
+
"ramGb": 7.2,
|
|
410
410
|
"sizeMb": 3840,
|
|
411
411
|
"quality": 76,
|
|
412
412
|
"useCase": "vision chat",
|
|
@@ -419,7 +419,7 @@
|
|
|
419
419
|
{
|
|
420
420
|
"id": "bakllava:7b",
|
|
421
421
|
"name": "BakLLaVA 7B",
|
|
422
|
-
"ramGb":
|
|
422
|
+
"ramGb": 7.2,
|
|
423
423
|
"sizeMb": 3840,
|
|
424
424
|
"quality": 75,
|
|
425
425
|
"useCase": "vision",
|
|
@@ -430,7 +430,7 @@
|
|
|
430
430
|
{
|
|
431
431
|
"id": "granite3-dense:8b",
|
|
432
432
|
"name": "Granite 3 Dense 8B",
|
|
433
|
-
"ramGb":
|
|
433
|
+
"ramGb": 8,
|
|
434
434
|
"sizeMb": 4360,
|
|
435
435
|
"quality": 83,
|
|
436
436
|
"useCase": "enterprise",
|
|
@@ -441,7 +441,7 @@
|
|
|
441
441
|
{
|
|
442
442
|
"id": "falcon3:3b",
|
|
443
443
|
"name": "Falcon 3 3B",
|
|
444
|
-
"ramGb":
|
|
444
|
+
"ramGb": 3.7,
|
|
445
445
|
"sizeMb": 1760,
|
|
446
446
|
"quality": 70,
|
|
447
447
|
"useCase": "chat",
|
|
@@ -453,7 +453,7 @@
|
|
|
453
453
|
{
|
|
454
454
|
"id": "openhermes:2.5-mistral-7b",
|
|
455
455
|
"name": "OpenHermes Mistral 7B",
|
|
456
|
-
"ramGb":
|
|
456
|
+
"ramGb": 7.2,
|
|
457
457
|
"sizeMb": 3840,
|
|
458
458
|
"quality": 77,
|
|
459
459
|
"useCase": "chat tuned",
|
|
@@ -465,7 +465,7 @@
|
|
|
465
465
|
{
|
|
466
466
|
"id": "mistral:7b",
|
|
467
467
|
"name": "Mistral 7B",
|
|
468
|
-
"ramGb":
|
|
468
|
+
"ramGb": 7.2,
|
|
469
469
|
"sizeMb": 3840,
|
|
470
470
|
"quality": 82,
|
|
471
471
|
"useCase": "general",
|
|
@@ -478,7 +478,7 @@
|
|
|
478
478
|
{
|
|
479
479
|
"id": "mistral:7b-instruct",
|
|
480
480
|
"name": "Mistral 7B Instruct",
|
|
481
|
-
"ramGb":
|
|
481
|
+
"ramGb": 7.2,
|
|
482
482
|
"sizeMb": 3840,
|
|
483
483
|
"quality": 83,
|
|
484
484
|
"useCase": "instructions",
|
|
@@ -490,7 +490,7 @@
|
|
|
490
490
|
{
|
|
491
491
|
"id": "mistral-nemo:12b",
|
|
492
492
|
"name": "Mistral Nemo 12B",
|
|
493
|
-
"ramGb":
|
|
493
|
+
"ramGb": 12.1,
|
|
494
494
|
"sizeMb": 6440,
|
|
495
495
|
"quality": 85,
|
|
496
496
|
"useCase": "long context",
|
|
@@ -502,7 +502,7 @@
|
|
|
502
502
|
{
|
|
503
503
|
"id": "llama3.1:8b",
|
|
504
504
|
"name": "Llama 3.1 8B",
|
|
505
|
-
"ramGb":
|
|
505
|
+
"ramGb": 8,
|
|
506
506
|
"sizeMb": 4360,
|
|
507
507
|
"quality": 84,
|
|
508
508
|
"useCase": "general, tools",
|
|
@@ -516,7 +516,7 @@
|
|
|
516
516
|
{
|
|
517
517
|
"id": "llama3.1:8b-instruct-q4_K_M",
|
|
518
518
|
"name": "Llama 3.1 8B Q4",
|
|
519
|
-
"ramGb":
|
|
519
|
+
"ramGb": 8,
|
|
520
520
|
"sizeMb": 4360,
|
|
521
521
|
"quality": 84,
|
|
522
522
|
"useCase": "general",
|
|
@@ -528,7 +528,7 @@
|
|
|
528
528
|
{
|
|
529
529
|
"id": "llama3.2:3b-instruct-q4_K_M",
|
|
530
530
|
"name": "Llama 3.2 3B Q4",
|
|
531
|
-
"ramGb":
|
|
531
|
+
"ramGb": 3.7,
|
|
532
532
|
"sizeMb": 1760,
|
|
533
533
|
"quality": 76,
|
|
534
534
|
"useCase": "fast general",
|
|
@@ -540,7 +540,7 @@
|
|
|
540
540
|
{
|
|
541
541
|
"id": "llama3.3:70b",
|
|
542
542
|
"name": "Llama 3.3 70B",
|
|
543
|
-
"ramGb":
|
|
543
|
+
"ramGb": 55.9,
|
|
544
544
|
"sizeMb": 36600,
|
|
545
545
|
"quality": 93,
|
|
546
546
|
"useCase": "frontier",
|
|
@@ -552,7 +552,7 @@
|
|
|
552
552
|
{
|
|
553
553
|
"id": "qwen2.5:7b",
|
|
554
554
|
"name": "Qwen 2.5 7B",
|
|
555
|
-
"ramGb":
|
|
555
|
+
"ramGb": 7.2,
|
|
556
556
|
"sizeMb": 3840,
|
|
557
557
|
"quality": 86,
|
|
558
558
|
"useCase": "coding, chat",
|
|
@@ -566,7 +566,7 @@
|
|
|
566
566
|
{
|
|
567
567
|
"id": "qwen2.5:7b-instruct",
|
|
568
568
|
"name": "Qwen 2.5 7B Instruct",
|
|
569
|
-
"ramGb":
|
|
569
|
+
"ramGb": 7.2,
|
|
570
570
|
"sizeMb": 3840,
|
|
571
571
|
"quality": 86,
|
|
572
572
|
"useCase": "chat",
|
|
@@ -578,7 +578,7 @@
|
|
|
578
578
|
{
|
|
579
579
|
"id": "qwen2.5-coder:7b",
|
|
580
580
|
"name": "Qwen 2.5 Coder 7B",
|
|
581
|
-
"ramGb":
|
|
581
|
+
"ramGb": 7.2,
|
|
582
582
|
"sizeMb": 3840,
|
|
583
583
|
"quality": 87,
|
|
584
584
|
"useCase": "coding",
|
|
@@ -590,7 +590,7 @@
|
|
|
590
590
|
{
|
|
591
591
|
"id": "qwen2.5-coder:1.5b",
|
|
592
592
|
"name": "Qwen 2.5 Coder 1.5B",
|
|
593
|
-
"ramGb": 1
|
|
593
|
+
"ramGb": 2.1,
|
|
594
594
|
"sizeMb": 980,
|
|
595
595
|
"quality": 74,
|
|
596
596
|
"useCase": "code small",
|
|
@@ -601,7 +601,7 @@
|
|
|
601
601
|
{
|
|
602
602
|
"id": "deepseek-r1:7b",
|
|
603
603
|
"name": "DeepSeek R1 7B",
|
|
604
|
-
"ramGb":
|
|
604
|
+
"ramGb": 7.2,
|
|
605
605
|
"sizeMb": 3840,
|
|
606
606
|
"quality": 85,
|
|
607
607
|
"useCase": "reasoning",
|
|
@@ -613,7 +613,7 @@
|
|
|
613
613
|
{
|
|
614
614
|
"id": "deepseek-r1:8b",
|
|
615
615
|
"name": "DeepSeek R1 8B",
|
|
616
|
-
"ramGb":
|
|
616
|
+
"ramGb": 8,
|
|
617
617
|
"sizeMb": 4360,
|
|
618
618
|
"quality": 86,
|
|
619
619
|
"useCase": "reasoning",
|
|
@@ -624,7 +624,7 @@
|
|
|
624
624
|
{
|
|
625
625
|
"id": "deepseek-coder:6.7b",
|
|
626
626
|
"name": "DeepSeek Coder 6.7B",
|
|
627
|
-
"ramGb":
|
|
627
|
+
"ramGb": 7,
|
|
628
628
|
"sizeMb": 3684,
|
|
629
629
|
"quality": 84,
|
|
630
630
|
"useCase": "coding",
|
|
@@ -635,7 +635,7 @@
|
|
|
635
635
|
{
|
|
636
636
|
"id": "deepseek-coder-v2:16b",
|
|
637
637
|
"name": "DeepSeek Coder v2 16B",
|
|
638
|
-
"ramGb":
|
|
638
|
+
"ramGb": 15,
|
|
639
639
|
"sizeMb": 8520,
|
|
640
640
|
"quality": 89,
|
|
641
641
|
"useCase": "coding large",
|
|
@@ -646,7 +646,7 @@
|
|
|
646
646
|
{
|
|
647
647
|
"id": "codellama:7b",
|
|
648
648
|
"name": "Code Llama 7B",
|
|
649
|
-
"ramGb":
|
|
649
|
+
"ramGb": 7.2,
|
|
650
650
|
"sizeMb": 3840,
|
|
651
651
|
"quality": 83,
|
|
652
652
|
"useCase": "coding",
|
|
@@ -658,7 +658,7 @@
|
|
|
658
658
|
{
|
|
659
659
|
"id": "codellama:13b",
|
|
660
660
|
"name": "Code Llama 13B",
|
|
661
|
-
"ramGb":
|
|
661
|
+
"ramGb": 12.9,
|
|
662
662
|
"sizeMb": 6960,
|
|
663
663
|
"quality": 86,
|
|
664
664
|
"useCase": "coding",
|
|
@@ -669,7 +669,7 @@
|
|
|
669
669
|
{
|
|
670
670
|
"id": "codellama:34b",
|
|
671
671
|
"name": "Code Llama 34B",
|
|
672
|
-
"ramGb":
|
|
672
|
+
"ramGb": 30,
|
|
673
673
|
"sizeMb": 17880,
|
|
674
674
|
"quality": 90,
|
|
675
675
|
"useCase": "coding frontier",
|
|
@@ -680,7 +680,7 @@
|
|
|
680
680
|
{
|
|
681
681
|
"id": "neural-chat:7b",
|
|
682
682
|
"name": "Neural Chat 7B",
|
|
683
|
-
"ramGb":
|
|
683
|
+
"ramGb": 7.2,
|
|
684
684
|
"sizeMb": 3840,
|
|
685
685
|
"quality": 79,
|
|
686
686
|
"useCase": "chat",
|
|
@@ -693,7 +693,7 @@
|
|
|
693
693
|
{
|
|
694
694
|
"id": "starling-lm:7b",
|
|
695
695
|
"name": "Starling 7B",
|
|
696
|
-
"ramGb":
|
|
696
|
+
"ramGb": 7.2,
|
|
697
697
|
"sizeMb": 3840,
|
|
698
698
|
"quality": 81,
|
|
699
699
|
"useCase": "chat",
|
|
@@ -705,7 +705,7 @@
|
|
|
705
705
|
{
|
|
706
706
|
"id": "openchat:7b",
|
|
707
707
|
"name": "OpenChat 7B",
|
|
708
|
-
"ramGb":
|
|
708
|
+
"ramGb": 7.2,
|
|
709
709
|
"sizeMb": 3840,
|
|
710
710
|
"quality": 80,
|
|
711
711
|
"useCase": "chat",
|
|
@@ -717,7 +717,7 @@
|
|
|
717
717
|
{
|
|
718
718
|
"id": "vicuna:7b",
|
|
719
719
|
"name": "Vicuna 7B",
|
|
720
|
-
"ramGb":
|
|
720
|
+
"ramGb": 7.2,
|
|
721
721
|
"sizeMb": 3840,
|
|
722
722
|
"quality": 78,
|
|
723
723
|
"useCase": "chat",
|
|
@@ -729,7 +729,7 @@
|
|
|
729
729
|
{
|
|
730
730
|
"id": "wizardlm2:7b",
|
|
731
731
|
"name": "WizardLM2 7B",
|
|
732
|
-
"ramGb":
|
|
732
|
+
"ramGb": 7.2,
|
|
733
733
|
"sizeMb": 3840,
|
|
734
734
|
"quality": 80,
|
|
735
735
|
"useCase": "instructions",
|
|
@@ -741,7 +741,7 @@
|
|
|
741
741
|
{
|
|
742
742
|
"id": "wizardlm2:8x22b",
|
|
743
743
|
"name": "WizardLM2 8x22B MoE",
|
|
744
|
-
"ramGb":
|
|
744
|
+
"ramGb": 107,
|
|
745
745
|
"sizeMb": 73520,
|
|
746
746
|
"quality": 94,
|
|
747
747
|
"useCase": "MoE frontier",
|
|
@@ -752,7 +752,7 @@
|
|
|
752
752
|
{
|
|
753
753
|
"id": "nous-hermes2:7b",
|
|
754
754
|
"name": "Nous Hermes 2 7B",
|
|
755
|
-
"ramGb":
|
|
755
|
+
"ramGb": 7.2,
|
|
756
756
|
"sizeMb": 3840,
|
|
757
757
|
"quality": 81,
|
|
758
758
|
"useCase": "chat",
|
|
@@ -764,7 +764,7 @@
|
|
|
764
764
|
{
|
|
765
765
|
"id": "nous-hermes2-mixtral:8x7b",
|
|
766
766
|
"name": "Nous Hermes Mixtral",
|
|
767
|
-
"ramGb":
|
|
767
|
+
"ramGb": 39.3,
|
|
768
768
|
"sizeMb": 24640,
|
|
769
769
|
"quality": 90,
|
|
770
770
|
"useCase": "MoE chat",
|
|
@@ -776,7 +776,7 @@
|
|
|
776
776
|
{
|
|
777
777
|
"id": "dolphin-mistral:7b",
|
|
778
778
|
"name": "Dolphin Mistral 7B",
|
|
779
|
-
"ramGb":
|
|
779
|
+
"ramGb": 7.2,
|
|
780
780
|
"sizeMb": 3840,
|
|
781
781
|
"quality": 79,
|
|
782
782
|
"useCase": "uncensored chat",
|
|
@@ -788,7 +788,7 @@
|
|
|
788
788
|
{
|
|
789
789
|
"id": "dolphin-llama3:8b",
|
|
790
790
|
"name": "Dolphin Llama 3 8B",
|
|
791
|
-
"ramGb":
|
|
791
|
+
"ramGb": 8,
|
|
792
792
|
"sizeMb": 4360,
|
|
793
793
|
"quality": 80,
|
|
794
794
|
"useCase": "uncensored chat",
|
|
@@ -800,7 +800,7 @@
|
|
|
800
800
|
{
|
|
801
801
|
"id": "solar:10.7b",
|
|
802
802
|
"name": "Solar 10.7B",
|
|
803
|
-
"ramGb":
|
|
803
|
+
"ramGb": 11.2,
|
|
804
804
|
"sizeMb": 5764,
|
|
805
805
|
"quality": 84,
|
|
806
806
|
"useCase": "depth-upscaled",
|
|
@@ -811,7 +811,7 @@
|
|
|
811
811
|
{
|
|
812
812
|
"id": "yi:6b",
|
|
813
813
|
"name": "Yi 6B",
|
|
814
|
-
"ramGb":
|
|
814
|
+
"ramGb": 6.5,
|
|
815
815
|
"sizeMb": 3320,
|
|
816
816
|
"quality": 80,
|
|
817
817
|
"useCase": "bilingual",
|
|
@@ -822,7 +822,7 @@
|
|
|
822
822
|
{
|
|
823
823
|
"id": "yi:9b",
|
|
824
824
|
"name": "Yi 9B",
|
|
825
|
-
"ramGb":
|
|
825
|
+
"ramGb": 8.7,
|
|
826
826
|
"sizeMb": 4880,
|
|
827
827
|
"quality": 83,
|
|
828
828
|
"useCase": "bilingual quality",
|
|
@@ -833,7 +833,7 @@
|
|
|
833
833
|
{
|
|
834
834
|
"id": "command-r7b",
|
|
835
835
|
"name": "Command R 7B",
|
|
836
|
-
"ramGb":
|
|
836
|
+
"ramGb": 7.2,
|
|
837
837
|
"sizeMb": 3840,
|
|
838
838
|
"quality": 82,
|
|
839
839
|
"useCase": "RAG, tools",
|
|
@@ -845,7 +845,7 @@
|
|
|
845
845
|
{
|
|
846
846
|
"id": "command-r:35b",
|
|
847
847
|
"name": "Command R 35B",
|
|
848
|
-
"ramGb":
|
|
848
|
+
"ramGb": 30.7,
|
|
849
849
|
"sizeMb": 18400,
|
|
850
850
|
"quality": 91,
|
|
851
851
|
"useCase": "RAG enterprise",
|
|
@@ -858,7 +858,7 @@
|
|
|
858
858
|
{
|
|
859
859
|
"id": "command-r-plus:104b",
|
|
860
860
|
"name": "Command R+ 104B",
|
|
861
|
-
"ramGb":
|
|
861
|
+
"ramGb": 80.4,
|
|
862
862
|
"sizeMb": 54280,
|
|
863
863
|
"quality": 95,
|
|
864
864
|
"useCase": "frontier RAG",
|
|
@@ -870,7 +870,7 @@
|
|
|
870
870
|
{
|
|
871
871
|
"id": "granite3.1-dense:8b",
|
|
872
872
|
"name": "Granite 3.1 8B",
|
|
873
|
-
"ramGb":
|
|
873
|
+
"ramGb": 8,
|
|
874
874
|
"sizeMb": 4360,
|
|
875
875
|
"quality": 84,
|
|
876
876
|
"useCase": "enterprise",
|
|
@@ -881,7 +881,7 @@
|
|
|
881
881
|
{
|
|
882
882
|
"id": "granite3.1-moe:1b",
|
|
883
883
|
"name": "Granite 3.1 MoE 1B",
|
|
884
|
-
"ramGb": 1.
|
|
884
|
+
"ramGb": 1.7,
|
|
885
885
|
"sizeMb": 720,
|
|
886
886
|
"quality": 70,
|
|
887
887
|
"useCase": "efficient MoE",
|
|
@@ -892,7 +892,7 @@
|
|
|
892
892
|
{
|
|
893
893
|
"id": "falcon:7b",
|
|
894
894
|
"name": "Falcon 7B",
|
|
895
|
-
"ramGb":
|
|
895
|
+
"ramGb": 7.2,
|
|
896
896
|
"sizeMb": 3840,
|
|
897
897
|
"quality": 77,
|
|
898
898
|
"useCase": "general",
|
|
@@ -904,7 +904,7 @@
|
|
|
904
904
|
{
|
|
905
905
|
"id": "falcon2:11b",
|
|
906
906
|
"name": "Falcon 2 11B",
|
|
907
|
-
"ramGb":
|
|
907
|
+
"ramGb": 11.4,
|
|
908
908
|
"sizeMb": 5920,
|
|
909
909
|
"quality": 82,
|
|
910
910
|
"useCase": "general",
|
|
@@ -916,7 +916,7 @@
|
|
|
916
916
|
{
|
|
917
917
|
"id": "zephyr:7b",
|
|
918
918
|
"name": "Zephyr 7B",
|
|
919
|
-
"ramGb":
|
|
919
|
+
"ramGb": 7.2,
|
|
920
920
|
"sizeMb": 3840,
|
|
921
921
|
"quality": 80,
|
|
922
922
|
"useCase": "helpful chat",
|
|
@@ -929,7 +929,7 @@
|
|
|
929
929
|
{
|
|
930
930
|
"id": "orca2:7b",
|
|
931
931
|
"name": "Orca 2 7B",
|
|
932
|
-
"ramGb":
|
|
932
|
+
"ramGb": 7.2,
|
|
933
933
|
"sizeMb": 3840,
|
|
934
934
|
"quality": 79,
|
|
935
935
|
"useCase": "reasoning",
|
|
@@ -940,7 +940,7 @@
|
|
|
940
940
|
{
|
|
941
941
|
"id": "orca2:13b",
|
|
942
942
|
"name": "Orca 2 13B",
|
|
943
|
-
"ramGb":
|
|
943
|
+
"ramGb": 12.9,
|
|
944
944
|
"sizeMb": 6960,
|
|
945
945
|
"quality": 84,
|
|
946
946
|
"useCase": "reasoning",
|
|
@@ -951,7 +951,7 @@
|
|
|
951
951
|
{
|
|
952
952
|
"id": "wizard-vicuna-uncensored:7b",
|
|
953
953
|
"name": "Wizard Vicuna 7B",
|
|
954
|
-
"ramGb":
|
|
954
|
+
"ramGb": 7.2,
|
|
955
955
|
"sizeMb": 3840,
|
|
956
956
|
"quality": 76,
|
|
957
957
|
"useCase": "uncensored",
|
|
@@ -962,7 +962,7 @@
|
|
|
962
962
|
{
|
|
963
963
|
"id": "everythinglm:13b",
|
|
964
964
|
"name": "EverythingLM 13B",
|
|
965
|
-
"ramGb":
|
|
965
|
+
"ramGb": 12.9,
|
|
966
966
|
"sizeMb": 6960,
|
|
967
967
|
"quality": 78,
|
|
968
968
|
"useCase": "roleplay",
|
|
@@ -973,7 +973,7 @@
|
|
|
973
973
|
{
|
|
974
974
|
"id": "megadolphin:7b",
|
|
975
975
|
"name": "MegaDolphin 7B",
|
|
976
|
-
"ramGb":
|
|
976
|
+
"ramGb": 7.2,
|
|
977
977
|
"sizeMb": 3840,
|
|
978
978
|
"quality": 77,
|
|
979
979
|
"useCase": "uncensored",
|
|
@@ -984,7 +984,7 @@
|
|
|
984
984
|
{
|
|
985
985
|
"id": "open-orca-platypus2:13b",
|
|
986
986
|
"name": "OpenOrca Platypus2 13B",
|
|
987
|
-
"ramGb":
|
|
987
|
+
"ramGb": 12.9,
|
|
988
988
|
"sizeMb": 6960,
|
|
989
989
|
"quality": 80,
|
|
990
990
|
"useCase": "reasoning",
|
|
@@ -995,7 +995,7 @@
|
|
|
995
995
|
{
|
|
996
996
|
"id": "stable-beluga:7b",
|
|
997
997
|
"name": "Stable Beluga 7B",
|
|
998
|
-
"ramGb":
|
|
998
|
+
"ramGb": 7.2,
|
|
999
999
|
"sizeMb": 3840,
|
|
1000
1000
|
"quality": 78,
|
|
1001
1001
|
"useCase": "chat",
|
|
@@ -1007,7 +1007,7 @@
|
|
|
1007
1007
|
{
|
|
1008
1008
|
"id": "stable-beluga:13b",
|
|
1009
1009
|
"name": "Stable Beluga 13B",
|
|
1010
|
-
"ramGb":
|
|
1010
|
+
"ramGb": 12.9,
|
|
1011
1011
|
"sizeMb": 6960,
|
|
1012
1012
|
"quality": 81,
|
|
1013
1013
|
"useCase": "chat",
|
|
@@ -1019,7 +1019,7 @@
|
|
|
1019
1019
|
{
|
|
1020
1020
|
"id": "meditron:7b",
|
|
1021
1021
|
"name": "Meditron 7B",
|
|
1022
|
-
"ramGb":
|
|
1022
|
+
"ramGb": 7.2,
|
|
1023
1023
|
"sizeMb": 3840,
|
|
1024
1024
|
"quality": 76,
|
|
1025
1025
|
"useCase": "medical",
|
|
@@ -1030,7 +1030,7 @@
|
|
|
1030
1030
|
{
|
|
1031
1031
|
"id": "medllama2:7b",
|
|
1032
1032
|
"name": "MedLlama2 7B",
|
|
1033
|
-
"ramGb":
|
|
1033
|
+
"ramGb": 7.2,
|
|
1034
1034
|
"sizeMb": 3840,
|
|
1035
1035
|
"quality": 75,
|
|
1036
1036
|
"useCase": "medical",
|
|
@@ -1041,7 +1041,7 @@
|
|
|
1041
1041
|
{
|
|
1042
1042
|
"id": "biomistral:7b",
|
|
1043
1043
|
"name": "BioMistral 7B",
|
|
1044
|
-
"ramGb":
|
|
1044
|
+
"ramGb": 7.2,
|
|
1045
1045
|
"sizeMb": 3840,
|
|
1046
1046
|
"quality": 77,
|
|
1047
1047
|
"useCase": "biomedical",
|
|
@@ -1052,7 +1052,7 @@
|
|
|
1052
1052
|
{
|
|
1053
1053
|
"id": "llama2:7b",
|
|
1054
1054
|
"name": "Llama 2 7B",
|
|
1055
|
-
"ramGb":
|
|
1055
|
+
"ramGb": 7.2,
|
|
1056
1056
|
"sizeMb": 3840,
|
|
1057
1057
|
"quality": 72,
|
|
1058
1058
|
"useCase": "legacy general",
|
|
@@ -1065,7 +1065,7 @@
|
|
|
1065
1065
|
{
|
|
1066
1066
|
"id": "llama2:13b",
|
|
1067
1067
|
"name": "Llama 2 13B",
|
|
1068
|
-
"ramGb":
|
|
1068
|
+
"ramGb": 12.9,
|
|
1069
1069
|
"sizeMb": 6960,
|
|
1070
1070
|
"quality": 78,
|
|
1071
1071
|
"useCase": "legacy general",
|
|
@@ -1077,7 +1077,7 @@
|
|
|
1077
1077
|
{
|
|
1078
1078
|
"id": "llama2:70b",
|
|
1079
1079
|
"name": "Llama 2 70B",
|
|
1080
|
-
"ramGb":
|
|
1080
|
+
"ramGb": 55.9,
|
|
1081
1081
|
"sizeMb": 36600,
|
|
1082
1082
|
"quality": 90,
|
|
1083
1083
|
"useCase": "legacy frontier",
|
|
@@ -1088,7 +1088,7 @@
|
|
|
1088
1088
|
{
|
|
1089
1089
|
"id": "llama2-chinese:7b",
|
|
1090
1090
|
"name": "Llama 2 Chinese 7B",
|
|
1091
|
-
"ramGb":
|
|
1091
|
+
"ramGb": 7.2,
|
|
1092
1092
|
"sizeMb": 3840,
|
|
1093
1093
|
"quality": 74,
|
|
1094
1094
|
"useCase": "chinese",
|
|
@@ -1099,7 +1099,7 @@
|
|
|
1099
1099
|
{
|
|
1100
1100
|
"id": "gemma:7b",
|
|
1101
1101
|
"name": "Gemma 7B",
|
|
1102
|
-
"ramGb":
|
|
1102
|
+
"ramGb": 7.2,
|
|
1103
1103
|
"sizeMb": 3840,
|
|
1104
1104
|
"quality": 79,
|
|
1105
1105
|
"useCase": "google chat",
|
|
@@ -1111,7 +1111,7 @@
|
|
|
1111
1111
|
{
|
|
1112
1112
|
"id": "gemma2:9b",
|
|
1113
1113
|
"name": "Gemma 2 9B",
|
|
1114
|
-
"ramGb":
|
|
1114
|
+
"ramGb": 8.7,
|
|
1115
1115
|
"sizeMb": 4880,
|
|
1116
1116
|
"quality": 84,
|
|
1117
1117
|
"useCase": "quality chat",
|
|
@@ -1124,7 +1124,7 @@
|
|
|
1124
1124
|
{
|
|
1125
1125
|
"id": "gemma2:27b",
|
|
1126
1126
|
"name": "Gemma 2 27B",
|
|
1127
|
-
"ramGb":
|
|
1127
|
+
"ramGb": 22.9,
|
|
1128
1128
|
"sizeMb": 14240,
|
|
1129
1129
|
"quality": 91,
|
|
1130
1130
|
"useCase": "frontier chat",
|
|
@@ -1136,7 +1136,7 @@
|
|
|
1136
1136
|
{
|
|
1137
1137
|
"id": "gemma3:12b",
|
|
1138
1138
|
"name": "Gemma 3 12B",
|
|
1139
|
-
"ramGb":
|
|
1139
|
+
"ramGb": 12.1,
|
|
1140
1140
|
"sizeMb": 6440,
|
|
1141
1141
|
"quality": 87,
|
|
1142
1142
|
"useCase": "multimodal text",
|
|
@@ -1147,7 +1147,7 @@
|
|
|
1147
1147
|
{
|
|
1148
1148
|
"id": "gemma3:27b",
|
|
1149
1149
|
"name": "Gemma 3 27B",
|
|
1150
|
-
"ramGb":
|
|
1150
|
+
"ramGb": 22.9,
|
|
1151
1151
|
"sizeMb": 14240,
|
|
1152
1152
|
"quality": 92,
|
|
1153
1153
|
"useCase": "frontier",
|
|
@@ -1158,7 +1158,7 @@
|
|
|
1158
1158
|
{
|
|
1159
1159
|
"id": "phi4:14b",
|
|
1160
1160
|
"name": "Phi-4 14B",
|
|
1161
|
-
"ramGb":
|
|
1161
|
+
"ramGb": 13.6,
|
|
1162
1162
|
"sizeMb": 7480,
|
|
1163
1163
|
"quality": 88,
|
|
1164
1164
|
"useCase": "reasoning",
|
|
@@ -1169,7 +1169,7 @@
|
|
|
1169
1169
|
{
|
|
1170
1170
|
"id": "marco-o1:7b",
|
|
1171
1171
|
"name": "Marco-o1 7B",
|
|
1172
|
-
"ramGb":
|
|
1172
|
+
"ramGb": 7.2,
|
|
1173
1173
|
"sizeMb": 3840,
|
|
1174
1174
|
"quality": 82,
|
|
1175
1175
|
"useCase": "reasoning",
|
|
@@ -1180,7 +1180,7 @@
|
|
|
1180
1180
|
{
|
|
1181
1181
|
"id": "reflection:70b",
|
|
1182
1182
|
"name": "Reflection 70B",
|
|
1183
|
-
"ramGb":
|
|
1183
|
+
"ramGb": 55.9,
|
|
1184
1184
|
"sizeMb": 36600,
|
|
1185
1185
|
"quality": 92,
|
|
1186
1186
|
"useCase": "self-correct",
|
|
@@ -1191,7 +1191,7 @@
|
|
|
1191
1191
|
{
|
|
1192
1192
|
"id": "athene-v2:72b",
|
|
1193
1193
|
"name": "Athene v2 72B",
|
|
1194
|
-
"ramGb":
|
|
1194
|
+
"ramGb": 57.3,
|
|
1195
1195
|
"sizeMb": 37640,
|
|
1196
1196
|
"quality": 93,
|
|
1197
1197
|
"useCase": "agentic",
|
|
@@ -1202,7 +1202,7 @@
|
|
|
1202
1202
|
{
|
|
1203
1203
|
"id": "sailor2:8b",
|
|
1204
1204
|
"name": "Sailor2 8B",
|
|
1205
|
-
"ramGb":
|
|
1205
|
+
"ramGb": 8,
|
|
1206
1206
|
"sizeMb": 4360,
|
|
1207
1207
|
"quality": 81,
|
|
1208
1208
|
"useCase": "multilingual sea",
|
|
@@ -1213,7 +1213,7 @@
|
|
|
1213
1213
|
{
|
|
1214
1214
|
"id": "exaone3.5:7.8b",
|
|
1215
1215
|
"name": "EXAONE 3.5 7.8B",
|
|
1216
|
-
"ramGb":
|
|
1216
|
+
"ramGb": 7.8,
|
|
1217
1217
|
"sizeMb": 4256,
|
|
1218
1218
|
"quality": 83,
|
|
1219
1219
|
"useCase": "korean, english",
|
|
@@ -1224,7 +1224,7 @@
|
|
|
1224
1224
|
{
|
|
1225
1225
|
"id": "aya:23-8b",
|
|
1226
1226
|
"name": "Aya 23 8B",
|
|
1227
|
-
"ramGb":
|
|
1227
|
+
"ramGb": 8,
|
|
1228
1228
|
"sizeMb": 4360,
|
|
1229
1229
|
"quality": 82,
|
|
1230
1230
|
"useCase": "multilingual",
|
|
@@ -1235,7 +1235,7 @@
|
|
|
1235
1235
|
{
|
|
1236
1236
|
"id": "aya:23-35b",
|
|
1237
1237
|
"name": "Aya 23 35B",
|
|
1238
|
-
"ramGb":
|
|
1238
|
+
"ramGb": 30.7,
|
|
1239
1239
|
"sizeMb": 18400,
|
|
1240
1240
|
"quality": 90,
|
|
1241
1241
|
"useCase": "multilingual large",
|
|
@@ -1246,7 +1246,7 @@
|
|
|
1246
1246
|
{
|
|
1247
1247
|
"id": "nemotron-mini:4b",
|
|
1248
1248
|
"name": "Nemotron Mini 4B",
|
|
1249
|
-
"ramGb":
|
|
1249
|
+
"ramGb": 5.1,
|
|
1250
1250
|
"sizeMb": 2280,
|
|
1251
1251
|
"quality": 76,
|
|
1252
1252
|
"useCase": "nvidia small",
|
|
@@ -1257,7 +1257,7 @@
|
|
|
1257
1257
|
{
|
|
1258
1258
|
"id": "nemotron:70b",
|
|
1259
1259
|
"name": "Nemotron 70B",
|
|
1260
|
-
"ramGb":
|
|
1260
|
+
"ramGb": 55.9,
|
|
1261
1261
|
"sizeMb": 36600,
|
|
1262
1262
|
"quality": 92,
|
|
1263
1263
|
"useCase": "nvidia frontier",
|
|
@@ -1268,7 +1268,7 @@
|
|
|
1268
1268
|
{
|
|
1269
1269
|
"id": "snowflake-arctic-embed:335m",
|
|
1270
1270
|
"name": "Snowflake Arctic Embed",
|
|
1271
|
-
"ramGb": 0.
|
|
1271
|
+
"ramGb": 0.8,
|
|
1272
1272
|
"sizeMb": 294,
|
|
1273
1273
|
"quality": 58,
|
|
1274
1274
|
"useCase": "embeddings",
|
|
@@ -1280,7 +1280,7 @@
|
|
|
1280
1280
|
{
|
|
1281
1281
|
"id": "nomic-embed-text",
|
|
1282
1282
|
"name": "Nomic Embed Text",
|
|
1283
|
-
"ramGb": 0.
|
|
1283
|
+
"ramGb": 0.7,
|
|
1284
1284
|
"sizeMb": 193,
|
|
1285
1285
|
"quality": 60,
|
|
1286
1286
|
"useCase": "embeddings",
|
|
@@ -1292,7 +1292,7 @@
|
|
|
1292
1292
|
{
|
|
1293
1293
|
"id": "mxbai-embed-large",
|
|
1294
1294
|
"name": "MxBai Embed Large",
|
|
1295
|
-
"ramGb": 0.
|
|
1295
|
+
"ramGb": 0.8,
|
|
1296
1296
|
"sizeMb": 297,
|
|
1297
1297
|
"quality": 62,
|
|
1298
1298
|
"useCase": "embeddings",
|
|
@@ -1304,7 +1304,7 @@
|
|
|
1304
1304
|
{
|
|
1305
1305
|
"id": "bge-large",
|
|
1306
1306
|
"name": "BGE Large",
|
|
1307
|
-
"ramGb": 0.
|
|
1307
|
+
"ramGb": 0.8,
|
|
1308
1308
|
"sizeMb": 297,
|
|
1309
1309
|
"quality": 61,
|
|
1310
1310
|
"useCase": "embeddings",
|
|
@@ -1316,7 +1316,7 @@
|
|
|
1316
1316
|
{
|
|
1317
1317
|
"id": "all-minilm",
|
|
1318
1318
|
"name": "All-MiniLM",
|
|
1319
|
-
"ramGb": 0.
|
|
1319
|
+
"ramGb": 0.6,
|
|
1320
1320
|
"sizeMb": 162,
|
|
1321
1321
|
"quality": 55,
|
|
1322
1322
|
"useCase": "embeddings",
|
|
@@ -1328,7 +1328,7 @@
|
|
|
1328
1328
|
{
|
|
1329
1329
|
"id": "qwen2.5:14b",
|
|
1330
1330
|
"name": "Qwen 2.5 14B",
|
|
1331
|
-
"ramGb":
|
|
1331
|
+
"ramGb": 13.6,
|
|
1332
1332
|
"sizeMb": 7480,
|
|
1333
1333
|
"quality": 88,
|
|
1334
1334
|
"useCase": "reasoning",
|
|
@@ -1340,7 +1340,7 @@
|
|
|
1340
1340
|
{
|
|
1341
1341
|
"id": "qwen2.5:14b-instruct",
|
|
1342
1342
|
"name": "Qwen 2.5 14B Instruct",
|
|
1343
|
-
"ramGb":
|
|
1343
|
+
"ramGb": 13.6,
|
|
1344
1344
|
"sizeMb": 7480,
|
|
1345
1345
|
"quality": 88,
|
|
1346
1346
|
"useCase": "chat",
|
|
@@ -1352,7 +1352,7 @@
|
|
|
1352
1352
|
{
|
|
1353
1353
|
"id": "qwen2.5:32b",
|
|
1354
1354
|
"name": "Qwen 2.5 32B",
|
|
1355
|
-
"ramGb":
|
|
1355
|
+
"ramGb": 28.5,
|
|
1356
1356
|
"sizeMb": 16840,
|
|
1357
1357
|
"quality": 90,
|
|
1358
1358
|
"useCase": "frontier local",
|
|
@@ -1363,7 +1363,7 @@
|
|
|
1363
1363
|
{
|
|
1364
1364
|
"id": "qwen2.5:72b",
|
|
1365
1365
|
"name": "Qwen 2.5 72B",
|
|
1366
|
-
"ramGb":
|
|
1366
|
+
"ramGb": 57.3,
|
|
1367
1367
|
"sizeMb": 37640,
|
|
1368
1368
|
"quality": 94,
|
|
1369
1369
|
"useCase": "frontier",
|
|
@@ -1374,7 +1374,7 @@
|
|
|
1374
1374
|
{
|
|
1375
1375
|
"id": "llama3.1:70b",
|
|
1376
1376
|
"name": "Llama 3.1 70B",
|
|
1377
|
-
"ramGb":
|
|
1377
|
+
"ramGb": 55.9,
|
|
1378
1378
|
"sizeMb": 36600,
|
|
1379
1379
|
"quality": 92,
|
|
1380
1380
|
"useCase": "frontier",
|
|
@@ -1385,7 +1385,7 @@
|
|
|
1385
1385
|
{
|
|
1386
1386
|
"id": "llama3.1:70b-instruct-q4_K_M",
|
|
1387
1387
|
"name": "Llama 3.1 70B Q4",
|
|
1388
|
-
"ramGb":
|
|
1388
|
+
"ramGb": 55.9,
|
|
1389
1389
|
"sizeMb": 36600,
|
|
1390
1390
|
"quality": 92,
|
|
1391
1391
|
"useCase": "frontier",
|
|
@@ -1396,7 +1396,7 @@
|
|
|
1396
1396
|
{
|
|
1397
1397
|
"id": "mixtral:8x7b",
|
|
1398
1398
|
"name": "Mixtral 8x7B MoE",
|
|
1399
|
-
"ramGb":
|
|
1399
|
+
"ramGb": 39.3,
|
|
1400
1400
|
"sizeMb": 24640,
|
|
1401
1401
|
"quality": 91,
|
|
1402
1402
|
"useCase": "MoE quality",
|
|
@@ -1407,7 +1407,7 @@
|
|
|
1407
1407
|
{
|
|
1408
1408
|
"id": "mixtral:8x22b",
|
|
1409
1409
|
"name": "Mixtral 8x22B MoE",
|
|
1410
|
-
"ramGb":
|
|
1410
|
+
"ramGb": 107,
|
|
1411
1411
|
"sizeMb": 73520,
|
|
1412
1412
|
"quality": 95,
|
|
1413
1413
|
"useCase": "MoE frontier",
|
|
@@ -1418,7 +1418,7 @@
|
|
|
1418
1418
|
{
|
|
1419
1419
|
"id": "solar-pro:22b",
|
|
1420
1420
|
"name": "Solar Pro 22B",
|
|
1421
|
-
"ramGb":
|
|
1421
|
+
"ramGb": 19.3,
|
|
1422
1422
|
"sizeMb": 11640,
|
|
1423
1423
|
"quality": 89,
|
|
1424
1424
|
"useCase": "reasoning",
|
|
@@ -1429,7 +1429,7 @@
|
|
|
1429
1429
|
{
|
|
1430
1430
|
"id": "dbrx:132b",
|
|
1431
1431
|
"name": "DBRX 132B MoE",
|
|
1432
|
-
"ramGb":
|
|
1432
|
+
"ramGb": 100.5,
|
|
1433
1433
|
"sizeMb": 68840,
|
|
1434
1434
|
"quality": 96,
|
|
1435
1435
|
"useCase": "enterprise MoE",
|
|
@@ -1440,7 +1440,7 @@
|
|
|
1440
1440
|
{
|
|
1441
1441
|
"id": "internlm2:7b",
|
|
1442
1442
|
"name": "InternLM2 7B",
|
|
1443
|
-
"ramGb":
|
|
1443
|
+
"ramGb": 7.2,
|
|
1444
1444
|
"sizeMb": 3840,
|
|
1445
1445
|
"quality": 82,
|
|
1446
1446
|
"useCase": "multilingual",
|
|
@@ -1451,7 +1451,7 @@
|
|
|
1451
1451
|
{
|
|
1452
1452
|
"id": "internlm2:20b",
|
|
1453
1453
|
"name": "InternLM2 20B",
|
|
1454
|
-
"ramGb":
|
|
1454
|
+
"ramGb": 17.9,
|
|
1455
1455
|
"sizeMb": 10600,
|
|
1456
1456
|
"quality": 88,
|
|
1457
1457
|
"useCase": "multilingual large",
|
|
@@ -1462,7 +1462,7 @@
|
|
|
1462
1462
|
{
|
|
1463
1463
|
"id": "wizardlm:13b",
|
|
1464
1464
|
"name": "WizardLM 13B",
|
|
1465
|
-
"ramGb":
|
|
1465
|
+
"ramGb": 12.9,
|
|
1466
1466
|
"sizeMb": 6960,
|
|
1467
1467
|
"quality": 80,
|
|
1468
1468
|
"useCase": "instructions",
|
|
@@ -1474,7 +1474,7 @@
|
|
|
1474
1474
|
{
|
|
1475
1475
|
"id": "nous-hermes2:10.7b",
|
|
1476
1476
|
"name": "Nous Hermes 10.7B",
|
|
1477
|
-
"ramGb":
|
|
1477
|
+
"ramGb": 11.2,
|
|
1478
1478
|
"sizeMb": 5764,
|
|
1479
1479
|
"quality": 83,
|
|
1480
1480
|
"useCase": "chat",
|
|
@@ -1486,7 +1486,7 @@
|
|
|
1486
1486
|
{
|
|
1487
1487
|
"id": "starcoder2:7b",
|
|
1488
1488
|
"name": "StarCoder2 7B",
|
|
1489
|
-
"ramGb":
|
|
1489
|
+
"ramGb": 7.2,
|
|
1490
1490
|
"sizeMb": 3840,
|
|
1491
1491
|
"quality": 82,
|
|
1492
1492
|
"useCase": "code",
|
|
@@ -1497,7 +1497,7 @@
|
|
|
1497
1497
|
{
|
|
1498
1498
|
"id": "starcoder2:15b",
|
|
1499
1499
|
"name": "StarCoder2 15B",
|
|
1500
|
-
"ramGb":
|
|
1500
|
+
"ramGb": 14.3,
|
|
1501
1501
|
"sizeMb": 8000,
|
|
1502
1502
|
"quality": 86,
|
|
1503
1503
|
"useCase": "code large",
|
|
@@ -1508,7 +1508,7 @@
|
|
|
1508
1508
|
{
|
|
1509
1509
|
"id": "shieldgemma:9b",
|
|
1510
1510
|
"name": "ShieldGemma 9B",
|
|
1511
|
-
"ramGb":
|
|
1511
|
+
"ramGb": 8.7,
|
|
1512
1512
|
"sizeMb": 4880,
|
|
1513
1513
|
"quality": 78,
|
|
1514
1514
|
"useCase": "safety",
|
|
@@ -1519,7 +1519,7 @@
|
|
|
1519
1519
|
{
|
|
1520
1520
|
"id": "mathstral:7b",
|
|
1521
1521
|
"name": "Mathstral 7B",
|
|
1522
|
-
"ramGb":
|
|
1522
|
+
"ramGb": 7.2,
|
|
1523
1523
|
"sizeMb": 3840,
|
|
1524
1524
|
"quality": 84,
|
|
1525
1525
|
"useCase": "math",
|
|
@@ -1530,7 +1530,7 @@
|
|
|
1530
1530
|
{
|
|
1531
1531
|
"id": "llama3-groq-tool-use:8b",
|
|
1532
1532
|
"name": "Llama 3 Groq Tool Use 8B",
|
|
1533
|
-
"ramGb":
|
|
1533
|
+
"ramGb": 8,
|
|
1534
1534
|
"sizeMb": 4360,
|
|
1535
1535
|
"quality": 85,
|
|
1536
1536
|
"useCase": "tool calling",
|
|
@@ -1541,7 +1541,7 @@
|
|
|
1541
1541
|
{
|
|
1542
1542
|
"id": "firefunction-v2:70b",
|
|
1543
1543
|
"name": "Firefunction v2 70B",
|
|
1544
|
-
"ramGb":
|
|
1544
|
+
"ramGb": 55.9,
|
|
1545
1545
|
"sizeMb": 36600,
|
|
1546
1546
|
"quality": 91,
|
|
1547
1547
|
"useCase": "function calling",
|
|
@@ -1552,7 +1552,7 @@
|
|
|
1552
1552
|
{
|
|
1553
1553
|
"id": "granite3-moe:3b",
|
|
1554
1554
|
"name": "Granite 3 MoE 3B",
|
|
1555
|
-
"ramGb":
|
|
1555
|
+
"ramGb": 3.7,
|
|
1556
1556
|
"sizeMb": 1760,
|
|
1557
1557
|
"quality": 77,
|
|
1558
1558
|
"useCase": "efficient MoE",
|
|
@@ -1563,7 +1563,7 @@
|
|
|
1563
1563
|
{
|
|
1564
1564
|
"id": "granite-code:8b",
|
|
1565
1565
|
"name": "Granite Code 8B",
|
|
1566
|
-
"ramGb":
|
|
1566
|
+
"ramGb": 8,
|
|
1567
1567
|
"sizeMb": 4360,
|
|
1568
1568
|
"quality": 84,
|
|
1569
1569
|
"useCase": "code enterprise",
|
|
@@ -1575,7 +1575,7 @@
|
|
|
1575
1575
|
{
|
|
1576
1576
|
"id": "stable-code:3b",
|
|
1577
1577
|
"name": "Stable Code 3B",
|
|
1578
|
-
"ramGb":
|
|
1578
|
+
"ramGb": 3.7,
|
|
1579
1579
|
"sizeMb": 1760,
|
|
1580
1580
|
"quality": 73,
|
|
1581
1581
|
"useCase": "code",
|
|
@@ -1586,7 +1586,7 @@
|
|
|
1586
1586
|
{
|
|
1587
1587
|
"id": "stablelm2:12b",
|
|
1588
1588
|
"name": "StableLM2 12B",
|
|
1589
|
-
"ramGb":
|
|
1589
|
+
"ramGb": 12.1,
|
|
1590
1590
|
"sizeMb": 6440,
|
|
1591
1591
|
"quality": 82,
|
|
1592
1592
|
"useCase": "chat",
|
|
@@ -1598,7 +1598,7 @@
|
|
|
1598
1598
|
{
|
|
1599
1599
|
"id": "mpt:7b",
|
|
1600
1600
|
"name": "MPT 7B",
|
|
1601
|
-
"ramGb":
|
|
1601
|
+
"ramGb": 7.2,
|
|
1602
1602
|
"sizeMb": 3840,
|
|
1603
1603
|
"quality": 74,
|
|
1604
1604
|
"useCase": "legacy chat",
|
|
@@ -1610,7 +1610,7 @@
|
|
|
1610
1610
|
{
|
|
1611
1611
|
"id": "mpt:30b",
|
|
1612
1612
|
"name": "MPT 30B",
|
|
1613
|
-
"ramGb":
|
|
1613
|
+
"ramGb": 27.1,
|
|
1614
1614
|
"sizeMb": 15800,
|
|
1615
1615
|
"quality": 86,
|
|
1616
1616
|
"useCase": "legacy large",
|
|
@@ -1621,7 +1621,7 @@
|
|
|
1621
1621
|
{
|
|
1622
1622
|
"id": "yarn-mistral:7b-128k",
|
|
1623
1623
|
"name": "Yarn Mistral 7B 128k",
|
|
1624
|
-
"ramGb":
|
|
1624
|
+
"ramGb": 7.2,
|
|
1625
1625
|
"sizeMb": 3840,
|
|
1626
1626
|
"quality": 81,
|
|
1627
1627
|
"useCase": "long context",
|
|
@@ -1632,7 +1632,7 @@
|
|
|
1632
1632
|
{
|
|
1633
1633
|
"id": "llama-pro:8b",
|
|
1634
1634
|
"name": "Llama Pro 8B",
|
|
1635
|
-
"ramGb":
|
|
1635
|
+
"ramGb": 8,
|
|
1636
1636
|
"sizeMb": 4360,
|
|
1637
1637
|
"quality": 83,
|
|
1638
1638
|
"useCase": "block expansion",
|
|
@@ -1643,7 +1643,7 @@
|
|
|
1643
1643
|
{
|
|
1644
1644
|
"id": "openhermes:7b-mistral-v2.5",
|
|
1645
1645
|
"name": "OpenHermes 7B v2.5",
|
|
1646
|
-
"ramGb":
|
|
1646
|
+
"ramGb": 7.2,
|
|
1647
1647
|
"sizeMb": 3840,
|
|
1648
1648
|
"quality": 80,
|
|
1649
1649
|
"useCase": "chat",
|
|
@@ -1655,7 +1655,7 @@
|
|
|
1655
1655
|
{
|
|
1656
1656
|
"id": "nous-capybara:7b",
|
|
1657
1657
|
"name": "Nous Capybara 7B",
|
|
1658
|
-
"ramGb":
|
|
1658
|
+
"ramGb": 7.2,
|
|
1659
1659
|
"sizeMb": 3840,
|
|
1660
1660
|
"quality": 79,
|
|
1661
1661
|
"useCase": "chat",
|
|
@@ -1667,7 +1667,7 @@
|
|
|
1667
1667
|
{
|
|
1668
1668
|
"id": "neural-chat:7b-v3-3",
|
|
1669
1669
|
"name": "Neural Chat 7B v3.3",
|
|
1670
|
-
"ramGb":
|
|
1670
|
+
"ramGb": 7.2,
|
|
1671
1671
|
"sizeMb": 3840,
|
|
1672
1672
|
"quality": 80,
|
|
1673
1673
|
"useCase": "chat",
|
|
@@ -1679,7 +1679,7 @@
|
|
|
1679
1679
|
{
|
|
1680
1680
|
"id": "wizard-math:7b",
|
|
1681
1681
|
"name": "WizardMath 7B",
|
|
1682
|
-
"ramGb":
|
|
1682
|
+
"ramGb": 7.2,
|
|
1683
1683
|
"sizeMb": 3840,
|
|
1684
1684
|
"quality": 82,
|
|
1685
1685
|
"useCase": "math",
|
|
@@ -1690,7 +1690,7 @@
|
|
|
1690
1690
|
{
|
|
1691
1691
|
"id": "wizard-math:13b",
|
|
1692
1692
|
"name": "WizardMath 13B",
|
|
1693
|
-
"ramGb":
|
|
1693
|
+
"ramGb": 12.9,
|
|
1694
1694
|
"sizeMb": 6960,
|
|
1695
1695
|
"quality": 85,
|
|
1696
1696
|
"useCase": "math",
|
|
@@ -1701,7 +1701,7 @@
|
|
|
1701
1701
|
{
|
|
1702
1702
|
"id": "deepseek-llm:7b",
|
|
1703
1703
|
"name": "DeepSeek LLM 7B",
|
|
1704
|
-
"ramGb":
|
|
1704
|
+
"ramGb": 7.2,
|
|
1705
1705
|
"sizeMb": 3840,
|
|
1706
1706
|
"quality": 81,
|
|
1707
1707
|
"useCase": "general",
|
|
@@ -1713,7 +1713,7 @@
|
|
|
1713
1713
|
{
|
|
1714
1714
|
"id": "deepseek-llm:67b",
|
|
1715
1715
|
"name": "DeepSeek LLM 67B",
|
|
1716
|
-
"ramGb":
|
|
1716
|
+
"ramGb": 53.7,
|
|
1717
1717
|
"sizeMb": 35040,
|
|
1718
1718
|
"quality": 91,
|
|
1719
1719
|
"useCase": "frontier",
|
|
@@ -1724,7 +1724,7 @@
|
|
|
1724
1724
|
{
|
|
1725
1725
|
"id": "qwen:7b",
|
|
1726
1726
|
"name": "Qwen 7B",
|
|
1727
|
-
"ramGb":
|
|
1727
|
+
"ramGb": 7.2,
|
|
1728
1728
|
"sizeMb": 3840,
|
|
1729
1729
|
"quality": 78,
|
|
1730
1730
|
"useCase": "legacy chat",
|
|
@@ -1736,7 +1736,7 @@
|
|
|
1736
1736
|
{
|
|
1737
1737
|
"id": "qwen:14b",
|
|
1738
1738
|
"name": "Qwen 14B",
|
|
1739
|
-
"ramGb":
|
|
1739
|
+
"ramGb": 13.6,
|
|
1740
1740
|
"sizeMb": 7480,
|
|
1741
1741
|
"quality": 84,
|
|
1742
1742
|
"useCase": "legacy chat",
|
|
@@ -1748,7 +1748,7 @@
|
|
|
1748
1748
|
{
|
|
1749
1749
|
"id": "qwen:72b",
|
|
1750
1750
|
"name": "Qwen 72B",
|
|
1751
|
-
"ramGb":
|
|
1751
|
+
"ramGb": 57.3,
|
|
1752
1752
|
"sizeMb": 37640,
|
|
1753
1753
|
"quality": 92,
|
|
1754
1754
|
"useCase": "legacy frontier",
|
|
@@ -1759,7 +1759,7 @@
|
|
|
1759
1759
|
{
|
|
1760
1760
|
"id": "qwen2:7b",
|
|
1761
1761
|
"name": "Qwen 2 7B",
|
|
1762
|
-
"ramGb":
|
|
1762
|
+
"ramGb": 7.2,
|
|
1763
1763
|
"sizeMb": 3840,
|
|
1764
1764
|
"quality": 82,
|
|
1765
1765
|
"useCase": "chat",
|
|
@@ -1771,7 +1771,7 @@
|
|
|
1771
1771
|
{
|
|
1772
1772
|
"id": "qwen2:72b",
|
|
1773
1773
|
"name": "Qwen 2 72B",
|
|
1774
|
-
"ramGb":
|
|
1774
|
+
"ramGb": 57.3,
|
|
1775
1775
|
"sizeMb": 37640,
|
|
1776
1776
|
"quality": 93,
|
|
1777
1777
|
"useCase": "frontier",
|