gpustack-runner 0.1.24.post1__py3-none-any.whl → 0.1.24.post3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gpustack_runner/_version.py +2 -2
- gpustack_runner/_version_appendix.py +1 -1
- gpustack_runner/cmds/images.py +2 -2
- gpustack_runner/runner.py.json +335 -49
- {gpustack_runner-0.1.24.post1.dist-info → gpustack_runner-0.1.24.post3.dist-info}/METADATA +28 -24
- {gpustack_runner-0.1.24.post1.dist-info → gpustack_runner-0.1.24.post3.dist-info}/RECORD +9 -9
- {gpustack_runner-0.1.24.post1.dist-info → gpustack_runner-0.1.24.post3.dist-info}/WHEEL +0 -0
- {gpustack_runner-0.1.24.post1.dist-info → gpustack_runner-0.1.24.post3.dist-info}/entry_points.txt +0 -0
- {gpustack_runner-0.1.24.post1.dist-info → gpustack_runner-0.1.24.post3.dist-info}/licenses/LICENSE +0 -0
gpustack_runner/_version.py
CHANGED
|
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
|
|
|
27
27
|
__commit_id__: COMMIT_ID
|
|
28
28
|
commit_id: COMMIT_ID
|
|
29
29
|
|
|
30
|
-
__version__ = version = '0.1.24.
|
|
31
|
-
__version_tuple__ = version_tuple = (0, 1, 24, '
|
|
30
|
+
__version__ = version = '0.1.24.post3'
|
|
31
|
+
__version_tuple__ = version_tuple = (0, 1, 24, 'post3')
|
|
32
32
|
try:
|
|
33
33
|
from ._version_appendix import git_commit
|
|
34
34
|
__commit_id__ = commit_id = git_commit
|
|
@@ -1 +1 @@
|
|
|
1
|
-
git_commit = "
|
|
1
|
+
git_commit = "dc41ed2"
|
gpustack_runner/cmds/images.py
CHANGED
|
@@ -464,7 +464,7 @@ class SaveImagesSubCommand(SubCommand):
|
|
|
464
464
|
# Submit tasks
|
|
465
465
|
for task_name, src_img, dst_file, dst_file_relative in saving_tasks:
|
|
466
466
|
if dst_file.exists():
|
|
467
|
-
print(f"{dst_file
|
|
467
|
+
print(f"✅ {dst_file} already exists, skipping save {src_img}.")
|
|
468
468
|
continue
|
|
469
469
|
dst_file.parent.mkdir(parents=True, exist_ok=True, mode=0o744)
|
|
470
470
|
|
|
@@ -976,7 +976,7 @@ class LoadImagesSubCommand(SubCommand):
|
|
|
976
976
|
load_parser.add_argument(
|
|
977
977
|
"input",
|
|
978
978
|
nargs=OPTIONAL,
|
|
979
|
-
help="Input directory to load images (default: current working directory)",
|
|
979
|
+
help="Input directory to load images from (default: current working directory)",
|
|
980
980
|
)
|
|
981
981
|
|
|
982
982
|
load_parser.set_defaults(func=LoadImagesSubCommand)
|
gpustack_runner/runner.py.json
CHANGED
|
@@ -1,35 +1,79 @@
|
|
|
1
1
|
[
|
|
2
2
|
{
|
|
3
3
|
"backend": "cann",
|
|
4
|
-
"backend_version": "8.
|
|
5
|
-
"original_backend_version": "8.
|
|
4
|
+
"backend_version": "8.5",
|
|
5
|
+
"original_backend_version": "8.5.0",
|
|
6
6
|
"backend_variant": "a3",
|
|
7
7
|
"service": "mindie",
|
|
8
|
-
"service_version": "2.
|
|
8
|
+
"service_version": "2.3.0",
|
|
9
9
|
"platform": "linux/amd64",
|
|
10
|
-
"docker_image": "gpustack/runner:cann8.
|
|
10
|
+
"docker_image": "gpustack/runner:cann8.5-a3-mindie2.3.0",
|
|
11
11
|
"deprecated": false
|
|
12
12
|
},
|
|
13
13
|
{
|
|
14
14
|
"backend": "cann",
|
|
15
|
-
"backend_version": "8.
|
|
16
|
-
"original_backend_version": "8.
|
|
15
|
+
"backend_version": "8.5",
|
|
16
|
+
"original_backend_version": "8.5.0",
|
|
17
17
|
"backend_variant": "a3",
|
|
18
18
|
"service": "mindie",
|
|
19
|
-
"service_version": "2.
|
|
19
|
+
"service_version": "2.3.0",
|
|
20
20
|
"platform": "linux/arm64",
|
|
21
|
-
"docker_image": "gpustack/runner:cann8.
|
|
21
|
+
"docker_image": "gpustack/runner:cann8.5-a3-mindie2.3.0",
|
|
22
22
|
"deprecated": false
|
|
23
23
|
},
|
|
24
24
|
{
|
|
25
25
|
"backend": "cann",
|
|
26
|
-
"backend_version": "8.
|
|
27
|
-
"original_backend_version": "8.
|
|
26
|
+
"backend_version": "8.5",
|
|
27
|
+
"original_backend_version": "8.5.0",
|
|
28
28
|
"backend_variant": "a3",
|
|
29
29
|
"service": "sglang",
|
|
30
|
-
"service_version": "0.5.
|
|
30
|
+
"service_version": "0.5.8",
|
|
31
31
|
"platform": "linux/arm64",
|
|
32
|
-
"docker_image": "gpustack/runner:cann8.
|
|
32
|
+
"docker_image": "gpustack/runner:cann8.5-a3-sglang0.5.8",
|
|
33
|
+
"deprecated": false
|
|
34
|
+
},
|
|
35
|
+
{
|
|
36
|
+
"backend": "cann",
|
|
37
|
+
"backend_version": "8.5",
|
|
38
|
+
"original_backend_version": "8.5.0",
|
|
39
|
+
"backend_variant": "a3",
|
|
40
|
+
"service": "vllm",
|
|
41
|
+
"service_version": "0.14.1",
|
|
42
|
+
"platform": "linux/amd64",
|
|
43
|
+
"docker_image": "gpustack/runner:cann8.5-a3-vllm0.14.1",
|
|
44
|
+
"deprecated": false
|
|
45
|
+
},
|
|
46
|
+
{
|
|
47
|
+
"backend": "cann",
|
|
48
|
+
"backend_version": "8.5",
|
|
49
|
+
"original_backend_version": "8.5.0",
|
|
50
|
+
"backend_variant": "a3",
|
|
51
|
+
"service": "vllm",
|
|
52
|
+
"service_version": "0.14.1",
|
|
53
|
+
"platform": "linux/arm64",
|
|
54
|
+
"docker_image": "gpustack/runner:cann8.5-a3-vllm0.14.1",
|
|
55
|
+
"deprecated": false
|
|
56
|
+
},
|
|
57
|
+
{
|
|
58
|
+
"backend": "cann",
|
|
59
|
+
"backend_version": "8.5",
|
|
60
|
+
"original_backend_version": "8.5.0",
|
|
61
|
+
"backend_variant": "a3",
|
|
62
|
+
"service": "vllm",
|
|
63
|
+
"service_version": "0.13.0",
|
|
64
|
+
"platform": "linux/amd64",
|
|
65
|
+
"docker_image": "gpustack/runner:cann8.5-a3-vllm0.13.0",
|
|
66
|
+
"deprecated": false
|
|
67
|
+
},
|
|
68
|
+
{
|
|
69
|
+
"backend": "cann",
|
|
70
|
+
"backend_version": "8.5",
|
|
71
|
+
"original_backend_version": "8.5.0",
|
|
72
|
+
"backend_variant": "a3",
|
|
73
|
+
"service": "vllm",
|
|
74
|
+
"service_version": "0.13.0",
|
|
75
|
+
"platform": "linux/arm64",
|
|
76
|
+
"docker_image": "gpustack/runner:cann8.5-a3-vllm0.13.0",
|
|
33
77
|
"deprecated": false
|
|
34
78
|
},
|
|
35
79
|
{
|
|
@@ -37,10 +81,21 @@
|
|
|
37
81
|
"backend_version": "8.3",
|
|
38
82
|
"original_backend_version": "8.3.rc2",
|
|
39
83
|
"backend_variant": "a3",
|
|
40
|
-
"service": "
|
|
41
|
-
"service_version": "
|
|
84
|
+
"service": "mindie",
|
|
85
|
+
"service_version": "2.2.rc1",
|
|
86
|
+
"platform": "linux/amd64",
|
|
87
|
+
"docker_image": "gpustack/runner:cann8.3-a3-mindie2.2.rc1",
|
|
88
|
+
"deprecated": false
|
|
89
|
+
},
|
|
90
|
+
{
|
|
91
|
+
"backend": "cann",
|
|
92
|
+
"backend_version": "8.3",
|
|
93
|
+
"original_backend_version": "8.3.rc2",
|
|
94
|
+
"backend_variant": "a3",
|
|
95
|
+
"service": "mindie",
|
|
96
|
+
"service_version": "2.2.rc1",
|
|
42
97
|
"platform": "linux/arm64",
|
|
43
|
-
"docker_image": "gpustack/runner:cann8.3-a3-
|
|
98
|
+
"docker_image": "gpustack/runner:cann8.3-a3-mindie2.2.rc1",
|
|
44
99
|
"deprecated": false
|
|
45
100
|
},
|
|
46
101
|
{
|
|
@@ -48,10 +103,10 @@
|
|
|
48
103
|
"backend_version": "8.3",
|
|
49
104
|
"original_backend_version": "8.3.rc2",
|
|
50
105
|
"backend_variant": "a3",
|
|
51
|
-
"service": "
|
|
52
|
-
"service_version": "0.
|
|
53
|
-
"platform": "linux/
|
|
54
|
-
"docker_image": "gpustack/runner:cann8.3-a3-
|
|
106
|
+
"service": "sglang",
|
|
107
|
+
"service_version": "0.5.7",
|
|
108
|
+
"platform": "linux/arm64",
|
|
109
|
+
"docker_image": "gpustack/runner:cann8.3-a3-sglang0.5.7",
|
|
55
110
|
"deprecated": false
|
|
56
111
|
},
|
|
57
112
|
{
|
|
@@ -59,10 +114,10 @@
|
|
|
59
114
|
"backend_version": "8.3",
|
|
60
115
|
"original_backend_version": "8.3.rc2",
|
|
61
116
|
"backend_variant": "a3",
|
|
62
|
-
"service": "
|
|
63
|
-
"service_version": "0.
|
|
117
|
+
"service": "sglang",
|
|
118
|
+
"service_version": "0.5.6.post2",
|
|
64
119
|
"platform": "linux/arm64",
|
|
65
|
-
"docker_image": "gpustack/runner:cann8.3-a3-
|
|
120
|
+
"docker_image": "gpustack/runner:cann8.3-a3-sglang0.5.6.post2",
|
|
66
121
|
"deprecated": false
|
|
67
122
|
},
|
|
68
123
|
{
|
|
@@ -206,7 +261,7 @@
|
|
|
206
261
|
"service_version": "0.10.1.1",
|
|
207
262
|
"platform": "linux/amd64",
|
|
208
263
|
"docker_image": "gpustack/runner:cann8.2-a3-vllm0.10.1.1",
|
|
209
|
-
"deprecated":
|
|
264
|
+
"deprecated": true
|
|
210
265
|
},
|
|
211
266
|
{
|
|
212
267
|
"backend": "cann",
|
|
@@ -217,6 +272,83 @@
|
|
|
217
272
|
"service_version": "0.10.1.1",
|
|
218
273
|
"platform": "linux/arm64",
|
|
219
274
|
"docker_image": "gpustack/runner:cann8.2-a3-vllm0.10.1.1",
|
|
275
|
+
"deprecated": true
|
|
276
|
+
},
|
|
277
|
+
{
|
|
278
|
+
"backend": "cann",
|
|
279
|
+
"backend_version": "8.5",
|
|
280
|
+
"original_backend_version": "8.5.0",
|
|
281
|
+
"backend_variant": "910b",
|
|
282
|
+
"service": "mindie",
|
|
283
|
+
"service_version": "2.3.0",
|
|
284
|
+
"platform": "linux/amd64",
|
|
285
|
+
"docker_image": "gpustack/runner:cann8.5-910b-mindie2.3.0",
|
|
286
|
+
"deprecated": false
|
|
287
|
+
},
|
|
288
|
+
{
|
|
289
|
+
"backend": "cann",
|
|
290
|
+
"backend_version": "8.5",
|
|
291
|
+
"original_backend_version": "8.5.0",
|
|
292
|
+
"backend_variant": "910b",
|
|
293
|
+
"service": "mindie",
|
|
294
|
+
"service_version": "2.3.0",
|
|
295
|
+
"platform": "linux/arm64",
|
|
296
|
+
"docker_image": "gpustack/runner:cann8.5-910b-mindie2.3.0",
|
|
297
|
+
"deprecated": false
|
|
298
|
+
},
|
|
299
|
+
{
|
|
300
|
+
"backend": "cann",
|
|
301
|
+
"backend_version": "8.5",
|
|
302
|
+
"original_backend_version": "8.5.0",
|
|
303
|
+
"backend_variant": "910b",
|
|
304
|
+
"service": "sglang",
|
|
305
|
+
"service_version": "0.5.8",
|
|
306
|
+
"platform": "linux/arm64",
|
|
307
|
+
"docker_image": "gpustack/runner:cann8.5-910b-sglang0.5.8",
|
|
308
|
+
"deprecated": false
|
|
309
|
+
},
|
|
310
|
+
{
|
|
311
|
+
"backend": "cann",
|
|
312
|
+
"backend_version": "8.5",
|
|
313
|
+
"original_backend_version": "8.5.0",
|
|
314
|
+
"backend_variant": "910b",
|
|
315
|
+
"service": "vllm",
|
|
316
|
+
"service_version": "0.14.1",
|
|
317
|
+
"platform": "linux/amd64",
|
|
318
|
+
"docker_image": "gpustack/runner:cann8.5-910b-vllm0.14.1",
|
|
319
|
+
"deprecated": false
|
|
320
|
+
},
|
|
321
|
+
{
|
|
322
|
+
"backend": "cann",
|
|
323
|
+
"backend_version": "8.5",
|
|
324
|
+
"original_backend_version": "8.5.0",
|
|
325
|
+
"backend_variant": "910b",
|
|
326
|
+
"service": "vllm",
|
|
327
|
+
"service_version": "0.14.1",
|
|
328
|
+
"platform": "linux/arm64",
|
|
329
|
+
"docker_image": "gpustack/runner:cann8.5-910b-vllm0.14.1",
|
|
330
|
+
"deprecated": false
|
|
331
|
+
},
|
|
332
|
+
{
|
|
333
|
+
"backend": "cann",
|
|
334
|
+
"backend_version": "8.5",
|
|
335
|
+
"original_backend_version": "8.5.0",
|
|
336
|
+
"backend_variant": "910b",
|
|
337
|
+
"service": "vllm",
|
|
338
|
+
"service_version": "0.13.0",
|
|
339
|
+
"platform": "linux/amd64",
|
|
340
|
+
"docker_image": "gpustack/runner:cann8.5-910b-vllm0.13.0",
|
|
341
|
+
"deprecated": false
|
|
342
|
+
},
|
|
343
|
+
{
|
|
344
|
+
"backend": "cann",
|
|
345
|
+
"backend_version": "8.5",
|
|
346
|
+
"original_backend_version": "8.5.0",
|
|
347
|
+
"backend_variant": "910b",
|
|
348
|
+
"service": "vllm",
|
|
349
|
+
"service_version": "0.13.0",
|
|
350
|
+
"platform": "linux/arm64",
|
|
351
|
+
"docker_image": "gpustack/runner:cann8.5-910b-vllm0.13.0",
|
|
220
352
|
"deprecated": false
|
|
221
353
|
},
|
|
222
354
|
{
|
|
@@ -263,28 +395,6 @@
|
|
|
263
395
|
"docker_image": "gpustack/runner:cann8.3-910b-sglang0.5.6.post2",
|
|
264
396
|
"deprecated": false
|
|
265
397
|
},
|
|
266
|
-
{
|
|
267
|
-
"backend": "cann",
|
|
268
|
-
"backend_version": "8.3",
|
|
269
|
-
"original_backend_version": "8.3.rc2",
|
|
270
|
-
"backend_variant": "910b",
|
|
271
|
-
"service": "vllm",
|
|
272
|
-
"service_version": "0.13.0",
|
|
273
|
-
"platform": "linux/amd64",
|
|
274
|
-
"docker_image": "gpustack/runner:cann8.3-910b-vllm0.13.0",
|
|
275
|
-
"deprecated": false
|
|
276
|
-
},
|
|
277
|
-
{
|
|
278
|
-
"backend": "cann",
|
|
279
|
-
"backend_version": "8.3",
|
|
280
|
-
"original_backend_version": "8.3.rc2",
|
|
281
|
-
"backend_variant": "910b",
|
|
282
|
-
"service": "vllm",
|
|
283
|
-
"service_version": "0.13.0",
|
|
284
|
-
"platform": "linux/arm64",
|
|
285
|
-
"docker_image": "gpustack/runner:cann8.3-910b-vllm0.13.0",
|
|
286
|
-
"deprecated": false
|
|
287
|
-
},
|
|
288
398
|
{
|
|
289
399
|
"backend": "cann",
|
|
290
400
|
"backend_version": "8.3",
|
|
@@ -448,7 +558,7 @@
|
|
|
448
558
|
"service_version": "0.10.1.1",
|
|
449
559
|
"platform": "linux/amd64",
|
|
450
560
|
"docker_image": "gpustack/runner:cann8.2-910b-vllm0.10.1.1",
|
|
451
|
-
"deprecated":
|
|
561
|
+
"deprecated": true
|
|
452
562
|
},
|
|
453
563
|
{
|
|
454
564
|
"backend": "cann",
|
|
@@ -459,7 +569,7 @@
|
|
|
459
569
|
"service_version": "0.10.1.1",
|
|
460
570
|
"platform": "linux/arm64",
|
|
461
571
|
"docker_image": "gpustack/runner:cann8.2-910b-vllm0.10.1.1",
|
|
462
|
-
"deprecated":
|
|
572
|
+
"deprecated": true
|
|
463
573
|
},
|
|
464
574
|
{
|
|
465
575
|
"backend": "cann",
|
|
@@ -514,7 +624,7 @@
|
|
|
514
624
|
"service_version": "0.9.1",
|
|
515
625
|
"platform": "linux/amd64",
|
|
516
626
|
"docker_image": "gpustack/runner:cann8.2-910b-vllm0.9.1",
|
|
517
|
-
"deprecated":
|
|
627
|
+
"deprecated": true
|
|
518
628
|
},
|
|
519
629
|
{
|
|
520
630
|
"backend": "cann",
|
|
@@ -525,6 +635,50 @@
|
|
|
525
635
|
"service_version": "0.9.1",
|
|
526
636
|
"platform": "linux/arm64",
|
|
527
637
|
"docker_image": "gpustack/runner:cann8.2-910b-vllm0.9.1",
|
|
638
|
+
"deprecated": true
|
|
639
|
+
},
|
|
640
|
+
{
|
|
641
|
+
"backend": "cann",
|
|
642
|
+
"backend_version": "8.5",
|
|
643
|
+
"original_backend_version": "8.5.0",
|
|
644
|
+
"backend_variant": "310p",
|
|
645
|
+
"service": "mindie",
|
|
646
|
+
"service_version": "2.3.0",
|
|
647
|
+
"platform": "linux/amd64",
|
|
648
|
+
"docker_image": "gpustack/runner:cann8.5-310p-mindie2.3.0",
|
|
649
|
+
"deprecated": false
|
|
650
|
+
},
|
|
651
|
+
{
|
|
652
|
+
"backend": "cann",
|
|
653
|
+
"backend_version": "8.5",
|
|
654
|
+
"original_backend_version": "8.5.0",
|
|
655
|
+
"backend_variant": "310p",
|
|
656
|
+
"service": "mindie",
|
|
657
|
+
"service_version": "2.3.0",
|
|
658
|
+
"platform": "linux/arm64",
|
|
659
|
+
"docker_image": "gpustack/runner:cann8.5-310p-mindie2.3.0",
|
|
660
|
+
"deprecated": false
|
|
661
|
+
},
|
|
662
|
+
{
|
|
663
|
+
"backend": "cann",
|
|
664
|
+
"backend_version": "8.5",
|
|
665
|
+
"original_backend_version": "8.5.0",
|
|
666
|
+
"backend_variant": "310p",
|
|
667
|
+
"service": "vllm",
|
|
668
|
+
"service_version": "0.14.1",
|
|
669
|
+
"platform": "linux/amd64",
|
|
670
|
+
"docker_image": "gpustack/runner:cann8.5-310p-vllm0.14.1",
|
|
671
|
+
"deprecated": false
|
|
672
|
+
},
|
|
673
|
+
{
|
|
674
|
+
"backend": "cann",
|
|
675
|
+
"backend_version": "8.5",
|
|
676
|
+
"original_backend_version": "8.5.0",
|
|
677
|
+
"backend_variant": "310p",
|
|
678
|
+
"service": "vllm",
|
|
679
|
+
"service_version": "0.14.1",
|
|
680
|
+
"platform": "linux/arm64",
|
|
681
|
+
"docker_image": "gpustack/runner:cann8.5-310p-vllm0.14.1",
|
|
528
682
|
"deprecated": false
|
|
529
683
|
},
|
|
530
684
|
{
|
|
@@ -648,6 +802,28 @@
|
|
|
648
802
|
"docker_image": "gpustack/runner:corex4.2-vllm0.8.3",
|
|
649
803
|
"deprecated": false
|
|
650
804
|
},
|
|
805
|
+
{
|
|
806
|
+
"backend": "cuda",
|
|
807
|
+
"backend_version": "12.9",
|
|
808
|
+
"original_backend_version": "12.9.1",
|
|
809
|
+
"backend_variant": "",
|
|
810
|
+
"service": "sglang",
|
|
811
|
+
"service_version": "0.5.8",
|
|
812
|
+
"platform": "linux/amd64",
|
|
813
|
+
"docker_image": "gpustack/runner:cuda12.9-sglang0.5.8",
|
|
814
|
+
"deprecated": false
|
|
815
|
+
},
|
|
816
|
+
{
|
|
817
|
+
"backend": "cuda",
|
|
818
|
+
"backend_version": "12.9",
|
|
819
|
+
"original_backend_version": "12.9.1",
|
|
820
|
+
"backend_variant": "",
|
|
821
|
+
"service": "sglang",
|
|
822
|
+
"service_version": "0.5.8",
|
|
823
|
+
"platform": "linux/arm64",
|
|
824
|
+
"docker_image": "gpustack/runner:cuda12.9-sglang0.5.8",
|
|
825
|
+
"deprecated": false
|
|
826
|
+
},
|
|
651
827
|
{
|
|
652
828
|
"backend": "cuda",
|
|
653
829
|
"backend_version": "12.9",
|
|
@@ -692,6 +868,28 @@
|
|
|
692
868
|
"docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
|
|
693
869
|
"deprecated": false
|
|
694
870
|
},
|
|
871
|
+
{
|
|
872
|
+
"backend": "cuda",
|
|
873
|
+
"backend_version": "12.9",
|
|
874
|
+
"original_backend_version": "12.9.1",
|
|
875
|
+
"backend_variant": "",
|
|
876
|
+
"service": "vllm",
|
|
877
|
+
"service_version": "0.14.1",
|
|
878
|
+
"platform": "linux/amd64",
|
|
879
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.14.1",
|
|
880
|
+
"deprecated": false
|
|
881
|
+
},
|
|
882
|
+
{
|
|
883
|
+
"backend": "cuda",
|
|
884
|
+
"backend_version": "12.9",
|
|
885
|
+
"original_backend_version": "12.9.1",
|
|
886
|
+
"backend_variant": "",
|
|
887
|
+
"service": "vllm",
|
|
888
|
+
"service_version": "0.14.1",
|
|
889
|
+
"platform": "linux/arm64",
|
|
890
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.14.1",
|
|
891
|
+
"deprecated": false
|
|
892
|
+
},
|
|
695
893
|
{
|
|
696
894
|
"backend": "cuda",
|
|
697
895
|
"backend_version": "12.9",
|
|
@@ -758,6 +956,28 @@
|
|
|
758
956
|
"docker_image": "gpustack/runner:cuda12.9-vllm0.11.2",
|
|
759
957
|
"deprecated": false
|
|
760
958
|
},
|
|
959
|
+
{
|
|
960
|
+
"backend": "cuda",
|
|
961
|
+
"backend_version": "12.8",
|
|
962
|
+
"original_backend_version": "12.8.1",
|
|
963
|
+
"backend_variant": "",
|
|
964
|
+
"service": "sglang",
|
|
965
|
+
"service_version": "0.5.8",
|
|
966
|
+
"platform": "linux/amd64",
|
|
967
|
+
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.8",
|
|
968
|
+
"deprecated": false
|
|
969
|
+
},
|
|
970
|
+
{
|
|
971
|
+
"backend": "cuda",
|
|
972
|
+
"backend_version": "12.8",
|
|
973
|
+
"original_backend_version": "12.8.1",
|
|
974
|
+
"backend_variant": "",
|
|
975
|
+
"service": "sglang",
|
|
976
|
+
"service_version": "0.5.8",
|
|
977
|
+
"platform": "linux/arm64",
|
|
978
|
+
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.8",
|
|
979
|
+
"deprecated": false
|
|
980
|
+
},
|
|
761
981
|
{
|
|
762
982
|
"backend": "cuda",
|
|
763
983
|
"backend_version": "12.8",
|
|
@@ -844,7 +1064,7 @@
|
|
|
844
1064
|
"service_version": "0.5.4.post3",
|
|
845
1065
|
"platform": "linux/amd64",
|
|
846
1066
|
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
|
|
847
|
-
"deprecated":
|
|
1067
|
+
"deprecated": true
|
|
848
1068
|
},
|
|
849
1069
|
{
|
|
850
1070
|
"backend": "cuda",
|
|
@@ -855,6 +1075,28 @@
|
|
|
855
1075
|
"service_version": "0.5.4.post3",
|
|
856
1076
|
"platform": "linux/arm64",
|
|
857
1077
|
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
|
|
1078
|
+
"deprecated": true
|
|
1079
|
+
},
|
|
1080
|
+
{
|
|
1081
|
+
"backend": "cuda",
|
|
1082
|
+
"backend_version": "12.8",
|
|
1083
|
+
"original_backend_version": "12.8.1",
|
|
1084
|
+
"backend_variant": "",
|
|
1085
|
+
"service": "vllm",
|
|
1086
|
+
"service_version": "0.14.1",
|
|
1087
|
+
"platform": "linux/amd64",
|
|
1088
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.14.1",
|
|
1089
|
+
"deprecated": false
|
|
1090
|
+
},
|
|
1091
|
+
{
|
|
1092
|
+
"backend": "cuda",
|
|
1093
|
+
"backend_version": "12.8",
|
|
1094
|
+
"original_backend_version": "12.8.1",
|
|
1095
|
+
"backend_variant": "",
|
|
1096
|
+
"service": "vllm",
|
|
1097
|
+
"service_version": "0.14.1",
|
|
1098
|
+
"platform": "linux/arm64",
|
|
1099
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.14.1",
|
|
858
1100
|
"deprecated": false
|
|
859
1101
|
},
|
|
860
1102
|
{
|
|
@@ -1055,6 +1297,28 @@
|
|
|
1055
1297
|
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
|
|
1056
1298
|
"deprecated": true
|
|
1057
1299
|
},
|
|
1300
|
+
{
|
|
1301
|
+
"backend": "cuda",
|
|
1302
|
+
"backend_version": "12.6",
|
|
1303
|
+
"original_backend_version": "12.6.3",
|
|
1304
|
+
"backend_variant": "",
|
|
1305
|
+
"service": "vllm",
|
|
1306
|
+
"service_version": "0.14.1",
|
|
1307
|
+
"platform": "linux/amd64",
|
|
1308
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.14.1",
|
|
1309
|
+
"deprecated": false
|
|
1310
|
+
},
|
|
1311
|
+
{
|
|
1312
|
+
"backend": "cuda",
|
|
1313
|
+
"backend_version": "12.6",
|
|
1314
|
+
"original_backend_version": "12.6.3",
|
|
1315
|
+
"backend_variant": "",
|
|
1316
|
+
"service": "vllm",
|
|
1317
|
+
"service_version": "0.14.1",
|
|
1318
|
+
"platform": "linux/arm64",
|
|
1319
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.14.1",
|
|
1320
|
+
"deprecated": false
|
|
1321
|
+
},
|
|
1058
1322
|
{
|
|
1059
1323
|
"backend": "cuda",
|
|
1060
1324
|
"backend_version": "12.6",
|
|
@@ -1418,6 +1682,28 @@
|
|
|
1418
1682
|
"docker_image": "gpustack/runner:hggc12.3-vllm0.11.1",
|
|
1419
1683
|
"deprecated": false
|
|
1420
1684
|
},
|
|
1685
|
+
{
|
|
1686
|
+
"backend": "maca",
|
|
1687
|
+
"backend_version": "3.3",
|
|
1688
|
+
"original_backend_version": "3.3.0",
|
|
1689
|
+
"backend_variant": "",
|
|
1690
|
+
"service": "sglang",
|
|
1691
|
+
"service_version": "0.5.6",
|
|
1692
|
+
"platform": "linux/amd64",
|
|
1693
|
+
"docker_image": "gpustack/runner:maca3.3-sglang0.5.6",
|
|
1694
|
+
"deprecated": false
|
|
1695
|
+
},
|
|
1696
|
+
{
|
|
1697
|
+
"backend": "maca",
|
|
1698
|
+
"backend_version": "3.3",
|
|
1699
|
+
"original_backend_version": "3.3.0",
|
|
1700
|
+
"backend_variant": "",
|
|
1701
|
+
"service": "vllm",
|
|
1702
|
+
"service_version": "0.11.2",
|
|
1703
|
+
"platform": "linux/amd64",
|
|
1704
|
+
"docker_image": "gpustack/runner:maca3.3-vllm0.11.2",
|
|
1705
|
+
"deprecated": false
|
|
1706
|
+
},
|
|
1421
1707
|
{
|
|
1422
1708
|
"backend": "maca",
|
|
1423
1709
|
"backend_version": "3.2",
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: gpustack-runner
|
|
3
|
-
Version: 0.1.24.
|
|
3
|
+
Version: 0.1.24.post3
|
|
4
4
|
Summary: GPUStack Runner is a library for registering runnable accelerated backends and services in GPUStack.
|
|
5
5
|
Project-URL: Homepage, https://github.com/gpustack/runner
|
|
6
6
|
Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
|
|
@@ -52,14 +52,17 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
52
52
|
vllm-ascend [#3316](https://github.com/vllm-project/vllm-ascend/issues/3316)
|
|
53
53
|
and [#2795](https://github.com/vllm-project/vllm-ascend/issues/2795).
|
|
54
54
|
|
|
55
|
-
| CANN Version <br/> (Variant) | MindIE | vLLM
|
|
56
|
-
|
|
57
|
-
| 8.
|
|
58
|
-
| 8.
|
|
59
|
-
| 8.
|
|
60
|
-
| 8.
|
|
61
|
-
| 8.
|
|
62
|
-
| 8.
|
|
55
|
+
| CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
|
|
56
|
+
|------------------------------|-----------|--------------------------------------------------------------------|------------------------|
|
|
57
|
+
| 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
|
|
58
|
+
| 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
|
|
59
|
+
| 8.5 (310P) | `2.3.0` | `0.14.1` | |
|
|
60
|
+
| 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
|
|
61
|
+
| 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
|
|
62
|
+
| 8.3 (310P) | `2.2.rc1` | | |
|
|
63
|
+
| 8.2 (A3/910C) | `2.1.rc2` | `0.10.2`, ~~`0.10.1.1`~~ | `0.5.2`, `0.5.1.post3` |
|
|
64
|
+
| 8.2 (910B) | `2.1.rc2` | `0.10.2`, ~~`0.10.1.1`~~, <br/>`0.10.0`, `0.9.2`, <br/>~~`0.9.1`~~ | `0.5.2`, `0.5.1.post3` |
|
|
65
|
+
| 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2` | |
|
|
63
66
|
|
|
64
67
|
### Iluvatar CoreX
|
|
65
68
|
|
|
@@ -77,11 +80,11 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
77
80
|
> - CUDA 12.6/12.4 supports Compute Capabilities:
|
|
78
81
|
`7.5 8.0+PTX 8.9 9.0+PTX`.
|
|
79
82
|
|
|
80
|
-
| CUDA Version <br/> (Variant) | vLLM
|
|
81
|
-
|
|
82
|
-
| 12.9 | `0.
|
|
83
|
-
| 12.8 | `0.
|
|
84
|
-
| 12.6 | `0.
|
|
83
|
+
| CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
|
|
84
|
+
|------------------------------|----------------------------------------------------------------|-----------------------------------------------------------------------------|----------|
|
|
85
|
+
| 12.9 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` | |
|
|
86
|
+
| 12.8 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, <br/>`0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3`, <br/>~~`0.5.4.post3`~~ | `0.0.21` |
|
|
87
|
+
| 12.6 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, <br/>`0.10.2` | | `0.0.21` |
|
|
85
88
|
|
|
86
89
|
### Hygon DTK
|
|
87
90
|
|
|
@@ -89,7 +92,7 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
89
92
|
|-----------------------------|----------------------------|
|
|
90
93
|
| 25.04 | `0.11.0`, `0.9.2`, `0.8.5` |
|
|
91
94
|
|
|
92
|
-
###
|
|
95
|
+
### T-Head HGGC
|
|
93
96
|
|
|
94
97
|
| HGGC Version <br/> (Variant) | vLLM | SGLang |
|
|
95
98
|
|------------------------------|----------|---------|
|
|
@@ -97,10 +100,11 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
97
100
|
|
|
98
101
|
### MetaX MACA
|
|
99
102
|
|
|
100
|
-
| MACA Version <br/> (Variant) | vLLM |
|
|
101
|
-
|
|
102
|
-
| 3.
|
|
103
|
-
| 3.
|
|
103
|
+
| MACA Version <br/> (Variant) | vLLM | SGLang |
|
|
104
|
+
|------------------------------|----------|---------|
|
|
105
|
+
| 3.3 | `0.11.2` | `0.5.6` |
|
|
106
|
+
| 3.2 | `0.10.2` | |
|
|
107
|
+
| 3.0 | `0.9.1` | |
|
|
104
108
|
|
|
105
109
|
### MThreads MUSA
|
|
106
110
|
|
|
@@ -118,16 +122,16 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
118
122
|
`gfx908 gfx90a gfx942 gfx1030 gfx1100`.
|
|
119
123
|
|
|
120
124
|
> [!WARNING]
|
|
121
|
-
> - ROCm 7.0 vLLM `0.11.2
|
|
125
|
+
> - ROCm 7.0 vLLM `0.11.2` reuses the official ROCm 6.4 PyTorch 2.9 wheel package rather than a ROCm
|
|
122
126
|
7.0-specific PyTorch build. Although vLLM `0.11.2` supports ROCm 7.0, `gfx1150/gfx1151` are not supported yet.
|
|
123
127
|
> - ROCm 6.4 vLLM `0.13.0` supports `gfx903 gfx90a gfx942` only.
|
|
124
128
|
> - ROCm 6.4 SGLang supports `gfx942` only.
|
|
125
129
|
> - ROCm 7.0 SGLang supports `gfx950` only.
|
|
126
130
|
|
|
127
|
-
| ROCm Version <br/> (Variant) | vLLM
|
|
128
|
-
|
|
129
|
-
| 7.0 |
|
|
130
|
-
| 6.4 |
|
|
131
|
+
| ROCm Version <br/> (Variant) | vLLM | SGLang |
|
|
132
|
+
|------------------------------|-------------------------------------------------|--------------------------------------------|
|
|
133
|
+
| 7.0 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` |
|
|
134
|
+
| 6.4 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3` |
|
|
131
135
|
|
|
132
136
|
## Directory Structure
|
|
133
137
|
|
|
@@ -1,17 +1,17 @@
|
|
|
1
1
|
gpustack_runner/__init__.py,sha256=ss8_wsk1oo13qFlP9usrXKX4ypHs1NZb2OVd6uFx5cc,715
|
|
2
2
|
gpustack_runner/__main__.py,sha256=uvpk9GtyJGtHaKM7DyM64N5mwehwpDD3v8ba6Yy8V3A,1364
|
|
3
3
|
gpustack_runner/__utils__.py,sha256=LSo0Iqxd5OjQFncVOYcqC8cncjtywf0qac31UPw7Ou4,4372
|
|
4
|
-
gpustack_runner/_version.py,sha256=
|
|
4
|
+
gpustack_runner/_version.py,sha256=kg14DjAgMOqC65Llz4O18tfum0uZJT0W8cU-i7Xc7Ik,792
|
|
5
5
|
gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
|
|
6
6
|
gpustack_runner/envs.py,sha256=Wm0GTIiDJIT1zEjLpaPZNLbOs23NNFc2Y6zZuRLlTKQ,3470
|
|
7
7
|
gpustack_runner/runner.py,sha256=Rk4nyHj7Bn7ibAdxspXpXplMgWVMsG9Jb7GV8sHk2Ig,26310
|
|
8
|
-
gpustack_runner/runner.py.json,sha256=
|
|
8
|
+
gpustack_runner/runner.py.json,sha256=kwdBxVCFNpThnRdT6dwogvK7ayV1vWF-ck2IA9EoKL4,53323
|
|
9
9
|
gpustack_runner/cmds/__init__.py,sha256=zjdv_OC674KAcitjiHrHbXnAwLtw8Ju3psW0IKFqPIg,471
|
|
10
10
|
gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
|
|
11
|
-
gpustack_runner/cmds/images.py,sha256=
|
|
12
|
-
gpustack_runner/_version_appendix.py,sha256=
|
|
13
|
-
gpustack_runner-0.1.24.
|
|
14
|
-
gpustack_runner-0.1.24.
|
|
15
|
-
gpustack_runner-0.1.24.
|
|
16
|
-
gpustack_runner-0.1.24.
|
|
17
|
-
gpustack_runner-0.1.24.
|
|
11
|
+
gpustack_runner/cmds/images.py,sha256=qkL862Xx6pcrLALhB8azMmtOAlIT-V5iGPHgSllnsPs,49029
|
|
12
|
+
gpustack_runner/_version_appendix.py,sha256=V2s_ow1zqn0fwyIASwO5DOQ8fRdLrVivPAAg5IskADw,23
|
|
13
|
+
gpustack_runner-0.1.24.post3.dist-info/METADATA,sha256=bo00AC5teijB1MlswDc-qZnQMcqgzJrIO_TKMQezECw,13093
|
|
14
|
+
gpustack_runner-0.1.24.post3.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
15
|
+
gpustack_runner-0.1.24.post3.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
|
|
16
|
+
gpustack_runner-0.1.24.post3.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
|
|
17
|
+
gpustack_runner-0.1.24.post3.dist-info/RECORD,,
|
|
File without changes
|
{gpustack_runner-0.1.24.post1.dist-info → gpustack_runner-0.1.24.post3.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{gpustack_runner-0.1.24.post1.dist-info → gpustack_runner-0.1.24.post3.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|