gpustack-runner 0.1.24.post1__py3-none-any.whl → 0.1.24.post3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
27
27
  __commit_id__: COMMIT_ID
28
28
  commit_id: COMMIT_ID
29
29
 
30
- __version__ = version = '0.1.24.post1'
31
- __version_tuple__ = version_tuple = (0, 1, 24, 'post1')
30
+ __version__ = version = '0.1.24.post3'
31
+ __version_tuple__ = version_tuple = (0, 1, 24, 'post3')
32
32
  try:
33
33
  from ._version_appendix import git_commit
34
34
  __commit_id__ = commit_id = git_commit
@@ -1 +1 @@
1
- git_commit = "ed41ee9"
1
+ git_commit = "dc41ed2"
@@ -464,7 +464,7 @@ class SaveImagesSubCommand(SubCommand):
464
464
  # Submit tasks
465
465
  for task_name, src_img, dst_file, dst_file_relative in saving_tasks:
466
466
  if dst_file.exists():
467
- print(f"{dst_file.name} already exists, skipping save {src_img}.")
467
+ print(f"{dst_file} already exists, skipping save {src_img}.")
468
468
  continue
469
469
  dst_file.parent.mkdir(parents=True, exist_ok=True, mode=0o744)
470
470
 
@@ -976,7 +976,7 @@ class LoadImagesSubCommand(SubCommand):
976
976
  load_parser.add_argument(
977
977
  "input",
978
978
  nargs=OPTIONAL,
979
- help="Input directory to load images (default: current working directory)",
979
+ help="Input directory to load images from (default: current working directory)",
980
980
  )
981
981
 
982
982
  load_parser.set_defaults(func=LoadImagesSubCommand)
@@ -1,35 +1,79 @@
1
1
  [
2
2
  {
3
3
  "backend": "cann",
4
- "backend_version": "8.3",
5
- "original_backend_version": "8.3.rc2",
4
+ "backend_version": "8.5",
5
+ "original_backend_version": "8.5.0",
6
6
  "backend_variant": "a3",
7
7
  "service": "mindie",
8
- "service_version": "2.2.rc1",
8
+ "service_version": "2.3.0",
9
9
  "platform": "linux/amd64",
10
- "docker_image": "gpustack/runner:cann8.3-a3-mindie2.2.rc1",
10
+ "docker_image": "gpustack/runner:cann8.5-a3-mindie2.3.0",
11
11
  "deprecated": false
12
12
  },
13
13
  {
14
14
  "backend": "cann",
15
- "backend_version": "8.3",
16
- "original_backend_version": "8.3.rc2",
15
+ "backend_version": "8.5",
16
+ "original_backend_version": "8.5.0",
17
17
  "backend_variant": "a3",
18
18
  "service": "mindie",
19
- "service_version": "2.2.rc1",
19
+ "service_version": "2.3.0",
20
20
  "platform": "linux/arm64",
21
- "docker_image": "gpustack/runner:cann8.3-a3-mindie2.2.rc1",
21
+ "docker_image": "gpustack/runner:cann8.5-a3-mindie2.3.0",
22
22
  "deprecated": false
23
23
  },
24
24
  {
25
25
  "backend": "cann",
26
- "backend_version": "8.3",
27
- "original_backend_version": "8.3.rc2",
26
+ "backend_version": "8.5",
27
+ "original_backend_version": "8.5.0",
28
28
  "backend_variant": "a3",
29
29
  "service": "sglang",
30
- "service_version": "0.5.7",
30
+ "service_version": "0.5.8",
31
31
  "platform": "linux/arm64",
32
- "docker_image": "gpustack/runner:cann8.3-a3-sglang0.5.7",
32
+ "docker_image": "gpustack/runner:cann8.5-a3-sglang0.5.8",
33
+ "deprecated": false
34
+ },
35
+ {
36
+ "backend": "cann",
37
+ "backend_version": "8.5",
38
+ "original_backend_version": "8.5.0",
39
+ "backend_variant": "a3",
40
+ "service": "vllm",
41
+ "service_version": "0.14.1",
42
+ "platform": "linux/amd64",
43
+ "docker_image": "gpustack/runner:cann8.5-a3-vllm0.14.1",
44
+ "deprecated": false
45
+ },
46
+ {
47
+ "backend": "cann",
48
+ "backend_version": "8.5",
49
+ "original_backend_version": "8.5.0",
50
+ "backend_variant": "a3",
51
+ "service": "vllm",
52
+ "service_version": "0.14.1",
53
+ "platform": "linux/arm64",
54
+ "docker_image": "gpustack/runner:cann8.5-a3-vllm0.14.1",
55
+ "deprecated": false
56
+ },
57
+ {
58
+ "backend": "cann",
59
+ "backend_version": "8.5",
60
+ "original_backend_version": "8.5.0",
61
+ "backend_variant": "a3",
62
+ "service": "vllm",
63
+ "service_version": "0.13.0",
64
+ "platform": "linux/amd64",
65
+ "docker_image": "gpustack/runner:cann8.5-a3-vllm0.13.0",
66
+ "deprecated": false
67
+ },
68
+ {
69
+ "backend": "cann",
70
+ "backend_version": "8.5",
71
+ "original_backend_version": "8.5.0",
72
+ "backend_variant": "a3",
73
+ "service": "vllm",
74
+ "service_version": "0.13.0",
75
+ "platform": "linux/arm64",
76
+ "docker_image": "gpustack/runner:cann8.5-a3-vllm0.13.0",
33
77
  "deprecated": false
34
78
  },
35
79
  {
@@ -37,10 +81,21 @@
37
81
  "backend_version": "8.3",
38
82
  "original_backend_version": "8.3.rc2",
39
83
  "backend_variant": "a3",
40
- "service": "sglang",
41
- "service_version": "0.5.6.post2",
84
+ "service": "mindie",
85
+ "service_version": "2.2.rc1",
86
+ "platform": "linux/amd64",
87
+ "docker_image": "gpustack/runner:cann8.3-a3-mindie2.2.rc1",
88
+ "deprecated": false
89
+ },
90
+ {
91
+ "backend": "cann",
92
+ "backend_version": "8.3",
93
+ "original_backend_version": "8.3.rc2",
94
+ "backend_variant": "a3",
95
+ "service": "mindie",
96
+ "service_version": "2.2.rc1",
42
97
  "platform": "linux/arm64",
43
- "docker_image": "gpustack/runner:cann8.3-a3-sglang0.5.6.post2",
98
+ "docker_image": "gpustack/runner:cann8.3-a3-mindie2.2.rc1",
44
99
  "deprecated": false
45
100
  },
46
101
  {
@@ -48,10 +103,10 @@
48
103
  "backend_version": "8.3",
49
104
  "original_backend_version": "8.3.rc2",
50
105
  "backend_variant": "a3",
51
- "service": "vllm",
52
- "service_version": "0.13.0",
53
- "platform": "linux/amd64",
54
- "docker_image": "gpustack/runner:cann8.3-a3-vllm0.13.0",
106
+ "service": "sglang",
107
+ "service_version": "0.5.7",
108
+ "platform": "linux/arm64",
109
+ "docker_image": "gpustack/runner:cann8.3-a3-sglang0.5.7",
55
110
  "deprecated": false
56
111
  },
57
112
  {
@@ -59,10 +114,10 @@
59
114
  "backend_version": "8.3",
60
115
  "original_backend_version": "8.3.rc2",
61
116
  "backend_variant": "a3",
62
- "service": "vllm",
63
- "service_version": "0.13.0",
117
+ "service": "sglang",
118
+ "service_version": "0.5.6.post2",
64
119
  "platform": "linux/arm64",
65
- "docker_image": "gpustack/runner:cann8.3-a3-vllm0.13.0",
120
+ "docker_image": "gpustack/runner:cann8.3-a3-sglang0.5.6.post2",
66
121
  "deprecated": false
67
122
  },
68
123
  {
@@ -206,7 +261,7 @@
206
261
  "service_version": "0.10.1.1",
207
262
  "platform": "linux/amd64",
208
263
  "docker_image": "gpustack/runner:cann8.2-a3-vllm0.10.1.1",
209
- "deprecated": false
264
+ "deprecated": true
210
265
  },
211
266
  {
212
267
  "backend": "cann",
@@ -217,6 +272,83 @@
217
272
  "service_version": "0.10.1.1",
218
273
  "platform": "linux/arm64",
219
274
  "docker_image": "gpustack/runner:cann8.2-a3-vllm0.10.1.1",
275
+ "deprecated": true
276
+ },
277
+ {
278
+ "backend": "cann",
279
+ "backend_version": "8.5",
280
+ "original_backend_version": "8.5.0",
281
+ "backend_variant": "910b",
282
+ "service": "mindie",
283
+ "service_version": "2.3.0",
284
+ "platform": "linux/amd64",
285
+ "docker_image": "gpustack/runner:cann8.5-910b-mindie2.3.0",
286
+ "deprecated": false
287
+ },
288
+ {
289
+ "backend": "cann",
290
+ "backend_version": "8.5",
291
+ "original_backend_version": "8.5.0",
292
+ "backend_variant": "910b",
293
+ "service": "mindie",
294
+ "service_version": "2.3.0",
295
+ "platform": "linux/arm64",
296
+ "docker_image": "gpustack/runner:cann8.5-910b-mindie2.3.0",
297
+ "deprecated": false
298
+ },
299
+ {
300
+ "backend": "cann",
301
+ "backend_version": "8.5",
302
+ "original_backend_version": "8.5.0",
303
+ "backend_variant": "910b",
304
+ "service": "sglang",
305
+ "service_version": "0.5.8",
306
+ "platform": "linux/arm64",
307
+ "docker_image": "gpustack/runner:cann8.5-910b-sglang0.5.8",
308
+ "deprecated": false
309
+ },
310
+ {
311
+ "backend": "cann",
312
+ "backend_version": "8.5",
313
+ "original_backend_version": "8.5.0",
314
+ "backend_variant": "910b",
315
+ "service": "vllm",
316
+ "service_version": "0.14.1",
317
+ "platform": "linux/amd64",
318
+ "docker_image": "gpustack/runner:cann8.5-910b-vllm0.14.1",
319
+ "deprecated": false
320
+ },
321
+ {
322
+ "backend": "cann",
323
+ "backend_version": "8.5",
324
+ "original_backend_version": "8.5.0",
325
+ "backend_variant": "910b",
326
+ "service": "vllm",
327
+ "service_version": "0.14.1",
328
+ "platform": "linux/arm64",
329
+ "docker_image": "gpustack/runner:cann8.5-910b-vllm0.14.1",
330
+ "deprecated": false
331
+ },
332
+ {
333
+ "backend": "cann",
334
+ "backend_version": "8.5",
335
+ "original_backend_version": "8.5.0",
336
+ "backend_variant": "910b",
337
+ "service": "vllm",
338
+ "service_version": "0.13.0",
339
+ "platform": "linux/amd64",
340
+ "docker_image": "gpustack/runner:cann8.5-910b-vllm0.13.0",
341
+ "deprecated": false
342
+ },
343
+ {
344
+ "backend": "cann",
345
+ "backend_version": "8.5",
346
+ "original_backend_version": "8.5.0",
347
+ "backend_variant": "910b",
348
+ "service": "vllm",
349
+ "service_version": "0.13.0",
350
+ "platform": "linux/arm64",
351
+ "docker_image": "gpustack/runner:cann8.5-910b-vllm0.13.0",
220
352
  "deprecated": false
221
353
  },
222
354
  {
@@ -263,28 +395,6 @@
263
395
  "docker_image": "gpustack/runner:cann8.3-910b-sglang0.5.6.post2",
264
396
  "deprecated": false
265
397
  },
266
- {
267
- "backend": "cann",
268
- "backend_version": "8.3",
269
- "original_backend_version": "8.3.rc2",
270
- "backend_variant": "910b",
271
- "service": "vllm",
272
- "service_version": "0.13.0",
273
- "platform": "linux/amd64",
274
- "docker_image": "gpustack/runner:cann8.3-910b-vllm0.13.0",
275
- "deprecated": false
276
- },
277
- {
278
- "backend": "cann",
279
- "backend_version": "8.3",
280
- "original_backend_version": "8.3.rc2",
281
- "backend_variant": "910b",
282
- "service": "vllm",
283
- "service_version": "0.13.0",
284
- "platform": "linux/arm64",
285
- "docker_image": "gpustack/runner:cann8.3-910b-vllm0.13.0",
286
- "deprecated": false
287
- },
288
398
  {
289
399
  "backend": "cann",
290
400
  "backend_version": "8.3",
@@ -448,7 +558,7 @@
448
558
  "service_version": "0.10.1.1",
449
559
  "platform": "linux/amd64",
450
560
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.10.1.1",
451
- "deprecated": false
561
+ "deprecated": true
452
562
  },
453
563
  {
454
564
  "backend": "cann",
@@ -459,7 +569,7 @@
459
569
  "service_version": "0.10.1.1",
460
570
  "platform": "linux/arm64",
461
571
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.10.1.1",
462
- "deprecated": false
572
+ "deprecated": true
463
573
  },
464
574
  {
465
575
  "backend": "cann",
@@ -514,7 +624,7 @@
514
624
  "service_version": "0.9.1",
515
625
  "platform": "linux/amd64",
516
626
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.9.1",
517
- "deprecated": false
627
+ "deprecated": true
518
628
  },
519
629
  {
520
630
  "backend": "cann",
@@ -525,6 +635,50 @@
525
635
  "service_version": "0.9.1",
526
636
  "platform": "linux/arm64",
527
637
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.9.1",
638
+ "deprecated": true
639
+ },
640
+ {
641
+ "backend": "cann",
642
+ "backend_version": "8.5",
643
+ "original_backend_version": "8.5.0",
644
+ "backend_variant": "310p",
645
+ "service": "mindie",
646
+ "service_version": "2.3.0",
647
+ "platform": "linux/amd64",
648
+ "docker_image": "gpustack/runner:cann8.5-310p-mindie2.3.0",
649
+ "deprecated": false
650
+ },
651
+ {
652
+ "backend": "cann",
653
+ "backend_version": "8.5",
654
+ "original_backend_version": "8.5.0",
655
+ "backend_variant": "310p",
656
+ "service": "mindie",
657
+ "service_version": "2.3.0",
658
+ "platform": "linux/arm64",
659
+ "docker_image": "gpustack/runner:cann8.5-310p-mindie2.3.0",
660
+ "deprecated": false
661
+ },
662
+ {
663
+ "backend": "cann",
664
+ "backend_version": "8.5",
665
+ "original_backend_version": "8.5.0",
666
+ "backend_variant": "310p",
667
+ "service": "vllm",
668
+ "service_version": "0.14.1",
669
+ "platform": "linux/amd64",
670
+ "docker_image": "gpustack/runner:cann8.5-310p-vllm0.14.1",
671
+ "deprecated": false
672
+ },
673
+ {
674
+ "backend": "cann",
675
+ "backend_version": "8.5",
676
+ "original_backend_version": "8.5.0",
677
+ "backend_variant": "310p",
678
+ "service": "vllm",
679
+ "service_version": "0.14.1",
680
+ "platform": "linux/arm64",
681
+ "docker_image": "gpustack/runner:cann8.5-310p-vllm0.14.1",
528
682
  "deprecated": false
529
683
  },
530
684
  {
@@ -648,6 +802,28 @@
648
802
  "docker_image": "gpustack/runner:corex4.2-vllm0.8.3",
649
803
  "deprecated": false
650
804
  },
805
+ {
806
+ "backend": "cuda",
807
+ "backend_version": "12.9",
808
+ "original_backend_version": "12.9.1",
809
+ "backend_variant": "",
810
+ "service": "sglang",
811
+ "service_version": "0.5.8",
812
+ "platform": "linux/amd64",
813
+ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.8",
814
+ "deprecated": false
815
+ },
816
+ {
817
+ "backend": "cuda",
818
+ "backend_version": "12.9",
819
+ "original_backend_version": "12.9.1",
820
+ "backend_variant": "",
821
+ "service": "sglang",
822
+ "service_version": "0.5.8",
823
+ "platform": "linux/arm64",
824
+ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.8",
825
+ "deprecated": false
826
+ },
651
827
  {
652
828
  "backend": "cuda",
653
829
  "backend_version": "12.9",
@@ -692,6 +868,28 @@
692
868
  "docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
693
869
  "deprecated": false
694
870
  },
871
+ {
872
+ "backend": "cuda",
873
+ "backend_version": "12.9",
874
+ "original_backend_version": "12.9.1",
875
+ "backend_variant": "",
876
+ "service": "vllm",
877
+ "service_version": "0.14.1",
878
+ "platform": "linux/amd64",
879
+ "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1",
880
+ "deprecated": false
881
+ },
882
+ {
883
+ "backend": "cuda",
884
+ "backend_version": "12.9",
885
+ "original_backend_version": "12.9.1",
886
+ "backend_variant": "",
887
+ "service": "vllm",
888
+ "service_version": "0.14.1",
889
+ "platform": "linux/arm64",
890
+ "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1",
891
+ "deprecated": false
892
+ },
695
893
  {
696
894
  "backend": "cuda",
697
895
  "backend_version": "12.9",
@@ -758,6 +956,28 @@
758
956
  "docker_image": "gpustack/runner:cuda12.9-vllm0.11.2",
759
957
  "deprecated": false
760
958
  },
959
+ {
960
+ "backend": "cuda",
961
+ "backend_version": "12.8",
962
+ "original_backend_version": "12.8.1",
963
+ "backend_variant": "",
964
+ "service": "sglang",
965
+ "service_version": "0.5.8",
966
+ "platform": "linux/amd64",
967
+ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.8",
968
+ "deprecated": false
969
+ },
970
+ {
971
+ "backend": "cuda",
972
+ "backend_version": "12.8",
973
+ "original_backend_version": "12.8.1",
974
+ "backend_variant": "",
975
+ "service": "sglang",
976
+ "service_version": "0.5.8",
977
+ "platform": "linux/arm64",
978
+ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.8",
979
+ "deprecated": false
980
+ },
761
981
  {
762
982
  "backend": "cuda",
763
983
  "backend_version": "12.8",
@@ -844,7 +1064,7 @@
844
1064
  "service_version": "0.5.4.post3",
845
1065
  "platform": "linux/amd64",
846
1066
  "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
847
- "deprecated": false
1067
+ "deprecated": true
848
1068
  },
849
1069
  {
850
1070
  "backend": "cuda",
@@ -855,6 +1075,28 @@
855
1075
  "service_version": "0.5.4.post3",
856
1076
  "platform": "linux/arm64",
857
1077
  "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
1078
+ "deprecated": true
1079
+ },
1080
+ {
1081
+ "backend": "cuda",
1082
+ "backend_version": "12.8",
1083
+ "original_backend_version": "12.8.1",
1084
+ "backend_variant": "",
1085
+ "service": "vllm",
1086
+ "service_version": "0.14.1",
1087
+ "platform": "linux/amd64",
1088
+ "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1",
1089
+ "deprecated": false
1090
+ },
1091
+ {
1092
+ "backend": "cuda",
1093
+ "backend_version": "12.8",
1094
+ "original_backend_version": "12.8.1",
1095
+ "backend_variant": "",
1096
+ "service": "vllm",
1097
+ "service_version": "0.14.1",
1098
+ "platform": "linux/arm64",
1099
+ "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1",
858
1100
  "deprecated": false
859
1101
  },
860
1102
  {
@@ -1055,6 +1297,28 @@
1055
1297
  "docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
1056
1298
  "deprecated": true
1057
1299
  },
1300
+ {
1301
+ "backend": "cuda",
1302
+ "backend_version": "12.6",
1303
+ "original_backend_version": "12.6.3",
1304
+ "backend_variant": "",
1305
+ "service": "vllm",
1306
+ "service_version": "0.14.1",
1307
+ "platform": "linux/amd64",
1308
+ "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1",
1309
+ "deprecated": false
1310
+ },
1311
+ {
1312
+ "backend": "cuda",
1313
+ "backend_version": "12.6",
1314
+ "original_backend_version": "12.6.3",
1315
+ "backend_variant": "",
1316
+ "service": "vllm",
1317
+ "service_version": "0.14.1",
1318
+ "platform": "linux/arm64",
1319
+ "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1",
1320
+ "deprecated": false
1321
+ },
1058
1322
  {
1059
1323
  "backend": "cuda",
1060
1324
  "backend_version": "12.6",
@@ -1418,6 +1682,28 @@
1418
1682
  "docker_image": "gpustack/runner:hggc12.3-vllm0.11.1",
1419
1683
  "deprecated": false
1420
1684
  },
1685
+ {
1686
+ "backend": "maca",
1687
+ "backend_version": "3.3",
1688
+ "original_backend_version": "3.3.0",
1689
+ "backend_variant": "",
1690
+ "service": "sglang",
1691
+ "service_version": "0.5.6",
1692
+ "platform": "linux/amd64",
1693
+ "docker_image": "gpustack/runner:maca3.3-sglang0.5.6",
1694
+ "deprecated": false
1695
+ },
1696
+ {
1697
+ "backend": "maca",
1698
+ "backend_version": "3.3",
1699
+ "original_backend_version": "3.3.0",
1700
+ "backend_variant": "",
1701
+ "service": "vllm",
1702
+ "service_version": "0.11.2",
1703
+ "platform": "linux/amd64",
1704
+ "docker_image": "gpustack/runner:maca3.3-vllm0.11.2",
1705
+ "deprecated": false
1706
+ },
1421
1707
  {
1422
1708
  "backend": "maca",
1423
1709
  "backend_version": "3.2",
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: gpustack-runner
3
- Version: 0.1.24.post1
3
+ Version: 0.1.24.post3
4
4
  Summary: GPUStack Runner is a library for registering runnable accelerated backends and services in GPUStack.
5
5
  Project-URL: Homepage, https://github.com/gpustack/runner
6
6
  Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
@@ -52,14 +52,17 @@ The following table lists the supported accelerated backends and their correspon
52
52
  vllm-ascend [#3316](https://github.com/vllm-project/vllm-ascend/issues/3316)
53
53
  and [#2795](https://github.com/vllm-project/vllm-ascend/issues/2795).
54
54
 
55
- | CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
56
- |------------------------------|-----------|------------------------------------------------------------|------------------------|
57
- | 8.3 (A3/910C) | `2.2.rc1` | `0.13.0`, `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
58
- | 8.3 (910B) | `2.2.rc1` | `0.13.0`, `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
59
- | 8.3 (310P) | `2.2.rc1` | | |
60
- | 8.2 (A3/910C) | `2.1.rc2` | `0.10.2`, `0.10.1.1` | `0.5.2`, `0.5.1.post3` |
61
- | 8.2 (910B) | `2.1.rc2` | `0.10.2`, `0.10.1.1`, <br/>`0.10.0`, `0.9.2`, <br/>`0.9.1` | `0.5.2`, `0.5.1.post3` |
62
- | 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2` | |
55
+ | CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
56
+ |------------------------------|-----------|--------------------------------------------------------------------|------------------------|
57
+ | 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
58
+ | 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
59
+ | 8.5 (310P) | `2.3.0` | `0.14.1` | |
60
+ | 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
61
+ | 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
62
+ | 8.3 (310P) | `2.2.rc1` | | |
63
+ | 8.2 (A3/910C) | `2.1.rc2` | `0.10.2`, ~~`0.10.1.1`~~ | `0.5.2`, `0.5.1.post3` |
64
+ | 8.2 (910B) | `2.1.rc2` | `0.10.2`, ~~`0.10.1.1`~~, <br/>`0.10.0`, `0.9.2`, <br/>~~`0.9.1`~~ | `0.5.2`, `0.5.1.post3` |
65
+ | 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2` | |
63
66
 
64
67
  ### Iluvatar CoreX
65
68
 
@@ -77,11 +80,11 @@ The following table lists the supported accelerated backends and their correspon
77
80
  > - CUDA 12.6/12.4 supports Compute Capabilities:
78
81
  `7.5 8.0+PTX 8.9 9.0+PTX`.
79
82
 
80
- | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
81
- |------------------------------|---------------------------------------------|-----------------------------------------------------------|----------|
82
- | 12.9 | `0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` | |
83
- | 12.8 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3`, `0.5.4.post3` | `0.0.21` |
84
- | 12.6 | `0.13.0`, `0.12.0`, <br/>`0.11.2`,`0.10.2` | | `0.0.21` |
83
+ | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
84
+ |------------------------------|----------------------------------------------------------------|-----------------------------------------------------------------------------|----------|
85
+ | 12.9 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` | |
86
+ | 12.8 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, <br/>`0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3`, <br/>~~`0.5.4.post3`~~ | `0.0.21` |
87
+ | 12.6 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, <br/>`0.10.2` | | `0.0.21` |
85
88
 
86
89
  ### Hygon DTK
87
90
 
@@ -89,7 +92,7 @@ The following table lists the supported accelerated backends and their correspon
89
92
  |-----------------------------|----------------------------|
90
93
  | 25.04 | `0.11.0`, `0.9.2`, `0.8.5` |
91
94
 
92
- ### THead HGGC
95
+ ### T-Head HGGC
93
96
 
94
97
  | HGGC Version <br/> (Variant) | vLLM | SGLang |
95
98
  |------------------------------|----------|---------|
@@ -97,10 +100,11 @@ The following table lists the supported accelerated backends and their correspon
97
100
 
98
101
  ### MetaX MACA
99
102
 
100
- | MACA Version <br/> (Variant) | vLLM |
101
- |------------------------------|----------|
102
- | 3.2 | `0.10.2` |
103
- | 3.0 | `0.9.1` |
103
+ | MACA Version <br/> (Variant) | vLLM | SGLang |
104
+ |------------------------------|----------|---------|
105
+ | 3.3 | `0.11.2` | `0.5.6` |
106
+ | 3.2 | `0.10.2` | |
107
+ | 3.0 | `0.9.1` | |
104
108
 
105
109
  ### MThreads MUSA
106
110
 
@@ -118,16 +122,16 @@ The following table lists the supported accelerated backends and their correspon
118
122
  `gfx908 gfx90a gfx942 gfx1030 gfx1100`.
119
123
 
120
124
  > [!WARNING]
121
- > - ROCm 7.0 vLLM `0.11.2/0.11.0` are reusing the official ROCm 6.4 PyTorch 2.9 wheel package rather than a ROCm
125
+ > - ROCm 7.0 vLLM `0.11.2` reuses the official ROCm 6.4 PyTorch 2.9 wheel package rather than a ROCm
122
126
  7.0-specific PyTorch build. Although vLLM `0.11.2` supports ROCm 7.0, `gfx1150/gfx1151` are not supported yet.
123
127
  > - ROCm 6.4 vLLM `0.13.0` supports `gfx908 gfx90a gfx942` only.
124
128
  > - ROCm 6.4 SGLang supports `gfx942` only.
125
129
  > - ROCm 7.0 SGLang supports `gfx950` only.
126
130
 
127
- | ROCm Version <br/> (Variant) | vLLM | SGLang |
128
- |------------------------------|---------------------------------------------|--------------------------------------------|
129
- | 7.0 | `0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` |
130
- | 6.4 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3` |
131
+ | ROCm Version <br/> (Variant) | vLLM | SGLang |
132
+ |------------------------------|-------------------------------------------------|--------------------------------------------|
133
+ | 7.0 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` |
134
+ | 6.4 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3` |
131
135
 
132
136
  ## Directory Structure
133
137
 
@@ -1,17 +1,17 @@
1
1
  gpustack_runner/__init__.py,sha256=ss8_wsk1oo13qFlP9usrXKX4ypHs1NZb2OVd6uFx5cc,715
2
2
  gpustack_runner/__main__.py,sha256=uvpk9GtyJGtHaKM7DyM64N5mwehwpDD3v8ba6Yy8V3A,1364
3
3
  gpustack_runner/__utils__.py,sha256=LSo0Iqxd5OjQFncVOYcqC8cncjtywf0qac31UPw7Ou4,4372
4
- gpustack_runner/_version.py,sha256=Ix4zhdok3sdfQ1mOI_tph_pbj5GmpJ04rohojJ2w17c,792
4
+ gpustack_runner/_version.py,sha256=kg14DjAgMOqC65Llz4O18tfum0uZJT0W8cU-i7Xc7Ik,792
5
5
  gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
6
6
  gpustack_runner/envs.py,sha256=Wm0GTIiDJIT1zEjLpaPZNLbOs23NNFc2Y6zZuRLlTKQ,3470
7
7
  gpustack_runner/runner.py,sha256=Rk4nyHj7Bn7ibAdxspXpXplMgWVMsG9Jb7GV8sHk2Ig,26310
8
- gpustack_runner/runner.py.json,sha256=rQEZrBRAQngUY9z2AntWTnnwjhTzZI_yywMxhjAAcAw,45403
8
+ gpustack_runner/runner.py.json,sha256=kwdBxVCFNpThnRdT6dwogvK7ayV1vWF-ck2IA9EoKL4,53323
9
9
  gpustack_runner/cmds/__init__.py,sha256=zjdv_OC674KAcitjiHrHbXnAwLtw8Ju3psW0IKFqPIg,471
10
10
  gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
11
- gpustack_runner/cmds/images.py,sha256=dH9gSoOpUCyjarfpJ1I7MSR98hYtGVsfcochcC3JqhI,49025
12
- gpustack_runner/_version_appendix.py,sha256=P3_fpwmk6qL5k6PhLsWQyJeGhOHfewu1ukL_vQh56KU,23
13
- gpustack_runner-0.1.24.post1.dist-info/METADATA,sha256=owCPWsrDOrEOZTrHTceS4yeMFOwvWkKmAdxNSyFvcgU,12323
14
- gpustack_runner-0.1.24.post1.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
15
- gpustack_runner-0.1.24.post1.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
16
- gpustack_runner-0.1.24.post1.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
17
- gpustack_runner-0.1.24.post1.dist-info/RECORD,,
11
+ gpustack_runner/cmds/images.py,sha256=qkL862Xx6pcrLALhB8azMmtOAlIT-V5iGPHgSllnsPs,49029
12
+ gpustack_runner/_version_appendix.py,sha256=V2s_ow1zqn0fwyIASwO5DOQ8fRdLrVivPAAg5IskADw,23
13
+ gpustack_runner-0.1.24.post3.dist-info/METADATA,sha256=bo00AC5teijB1MlswDc-qZnQMcqgzJrIO_TKMQezECw,13093
14
+ gpustack_runner-0.1.24.post3.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
15
+ gpustack_runner-0.1.24.post3.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
16
+ gpustack_runner-0.1.24.post3.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
17
+ gpustack_runner-0.1.24.post3.dist-info/RECORD,,