gpustack-runner 0.1.24.post2__py3-none-any.whl → 0.1.24.post3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
27
27
  __commit_id__: COMMIT_ID
28
28
  commit_id: COMMIT_ID
29
29
 
30
- __version__ = version = '0.1.24.post2'
31
- __version_tuple__ = version_tuple = (0, 1, 24, 'post2')
30
+ __version__ = version = '0.1.24.post3'
31
+ __version_tuple__ = version_tuple = (0, 1, 24, 'post3')
32
32
  try:
33
33
  from ._version_appendix import git_commit
34
34
  __commit_id__ = commit_id = git_commit
@@ -1 +1 @@
1
- git_commit = "62d75c6"
1
+ git_commit = "dc41ed2"
@@ -261,7 +261,7 @@
261
261
  "service_version": "0.10.1.1",
262
262
  "platform": "linux/amd64",
263
263
  "docker_image": "gpustack/runner:cann8.2-a3-vllm0.10.1.1",
264
- "deprecated": false
264
+ "deprecated": true
265
265
  },
266
266
  {
267
267
  "backend": "cann",
@@ -272,7 +272,7 @@
272
272
  "service_version": "0.10.1.1",
273
273
  "platform": "linux/arm64",
274
274
  "docker_image": "gpustack/runner:cann8.2-a3-vllm0.10.1.1",
275
- "deprecated": false
275
+ "deprecated": true
276
276
  },
277
277
  {
278
278
  "backend": "cann",
@@ -558,7 +558,7 @@
558
558
  "service_version": "0.10.1.1",
559
559
  "platform": "linux/amd64",
560
560
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.10.1.1",
561
- "deprecated": false
561
+ "deprecated": true
562
562
  },
563
563
  {
564
564
  "backend": "cann",
@@ -569,7 +569,7 @@
569
569
  "service_version": "0.10.1.1",
570
570
  "platform": "linux/arm64",
571
571
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.10.1.1",
572
- "deprecated": false
572
+ "deprecated": true
573
573
  },
574
574
  {
575
575
  "backend": "cann",
@@ -624,7 +624,7 @@
624
624
  "service_version": "0.9.1",
625
625
  "platform": "linux/amd64",
626
626
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.9.1",
627
- "deprecated": false
627
+ "deprecated": true
628
628
  },
629
629
  {
630
630
  "backend": "cann",
@@ -635,7 +635,7 @@
635
635
  "service_version": "0.9.1",
636
636
  "platform": "linux/arm64",
637
637
  "docker_image": "gpustack/runner:cann8.2-910b-vllm0.9.1",
638
- "deprecated": false
638
+ "deprecated": true
639
639
  },
640
640
  {
641
641
  "backend": "cann",
@@ -802,6 +802,28 @@
802
802
  "docker_image": "gpustack/runner:corex4.2-vllm0.8.3",
803
803
  "deprecated": false
804
804
  },
805
+ {
806
+ "backend": "cuda",
807
+ "backend_version": "12.9",
808
+ "original_backend_version": "12.9.1",
809
+ "backend_variant": "",
810
+ "service": "sglang",
811
+ "service_version": "0.5.8",
812
+ "platform": "linux/amd64",
813
+ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.8",
814
+ "deprecated": false
815
+ },
816
+ {
817
+ "backend": "cuda",
818
+ "backend_version": "12.9",
819
+ "original_backend_version": "12.9.1",
820
+ "backend_variant": "",
821
+ "service": "sglang",
822
+ "service_version": "0.5.8",
823
+ "platform": "linux/arm64",
824
+ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.8",
825
+ "deprecated": false
826
+ },
805
827
  {
806
828
  "backend": "cuda",
807
829
  "backend_version": "12.9",
@@ -846,6 +868,28 @@
846
868
  "docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
847
869
  "deprecated": false
848
870
  },
871
+ {
872
+ "backend": "cuda",
873
+ "backend_version": "12.9",
874
+ "original_backend_version": "12.9.1",
875
+ "backend_variant": "",
876
+ "service": "vllm",
877
+ "service_version": "0.14.1",
878
+ "platform": "linux/amd64",
879
+ "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1",
880
+ "deprecated": false
881
+ },
882
+ {
883
+ "backend": "cuda",
884
+ "backend_version": "12.9",
885
+ "original_backend_version": "12.9.1",
886
+ "backend_variant": "",
887
+ "service": "vllm",
888
+ "service_version": "0.14.1",
889
+ "platform": "linux/arm64",
890
+ "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1",
891
+ "deprecated": false
892
+ },
849
893
  {
850
894
  "backend": "cuda",
851
895
  "backend_version": "12.9",
@@ -912,6 +956,28 @@
912
956
  "docker_image": "gpustack/runner:cuda12.9-vllm0.11.2",
913
957
  "deprecated": false
914
958
  },
959
+ {
960
+ "backend": "cuda",
961
+ "backend_version": "12.8",
962
+ "original_backend_version": "12.8.1",
963
+ "backend_variant": "",
964
+ "service": "sglang",
965
+ "service_version": "0.5.8",
966
+ "platform": "linux/amd64",
967
+ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.8",
968
+ "deprecated": false
969
+ },
970
+ {
971
+ "backend": "cuda",
972
+ "backend_version": "12.8",
973
+ "original_backend_version": "12.8.1",
974
+ "backend_variant": "",
975
+ "service": "sglang",
976
+ "service_version": "0.5.8",
977
+ "platform": "linux/arm64",
978
+ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.8",
979
+ "deprecated": false
980
+ },
915
981
  {
916
982
  "backend": "cuda",
917
983
  "backend_version": "12.8",
@@ -998,7 +1064,7 @@
998
1064
  "service_version": "0.5.4.post3",
999
1065
  "platform": "linux/amd64",
1000
1066
  "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
1001
- "deprecated": false
1067
+ "deprecated": true
1002
1068
  },
1003
1069
  {
1004
1070
  "backend": "cuda",
@@ -1009,6 +1075,28 @@
1009
1075
  "service_version": "0.5.4.post3",
1010
1076
  "platform": "linux/arm64",
1011
1077
  "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
1078
+ "deprecated": true
1079
+ },
1080
+ {
1081
+ "backend": "cuda",
1082
+ "backend_version": "12.8",
1083
+ "original_backend_version": "12.8.1",
1084
+ "backend_variant": "",
1085
+ "service": "vllm",
1086
+ "service_version": "0.14.1",
1087
+ "platform": "linux/amd64",
1088
+ "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1",
1089
+ "deprecated": false
1090
+ },
1091
+ {
1092
+ "backend": "cuda",
1093
+ "backend_version": "12.8",
1094
+ "original_backend_version": "12.8.1",
1095
+ "backend_variant": "",
1096
+ "service": "vllm",
1097
+ "service_version": "0.14.1",
1098
+ "platform": "linux/arm64",
1099
+ "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1",
1012
1100
  "deprecated": false
1013
1101
  },
1014
1102
  {
@@ -1209,6 +1297,28 @@
1209
1297
  "docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
1210
1298
  "deprecated": true
1211
1299
  },
1300
+ {
1301
+ "backend": "cuda",
1302
+ "backend_version": "12.6",
1303
+ "original_backend_version": "12.6.3",
1304
+ "backend_variant": "",
1305
+ "service": "vllm",
1306
+ "service_version": "0.14.1",
1307
+ "platform": "linux/amd64",
1308
+ "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1",
1309
+ "deprecated": false
1310
+ },
1311
+ {
1312
+ "backend": "cuda",
1313
+ "backend_version": "12.6",
1314
+ "original_backend_version": "12.6.3",
1315
+ "backend_variant": "",
1316
+ "service": "vllm",
1317
+ "service_version": "0.14.1",
1318
+ "platform": "linux/arm64",
1319
+ "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1",
1320
+ "deprecated": false
1321
+ },
1212
1322
  {
1213
1323
  "backend": "cuda",
1214
1324
  "backend_version": "12.6",
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: gpustack-runner
3
- Version: 0.1.24.post2
3
+ Version: 0.1.24.post3
4
4
  Summary: GPUStack Runner is a library for registering runnable accelerated backends and services in GPUStack.
5
5
  Project-URL: Homepage, https://github.com/gpustack/runner
6
6
  Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
@@ -52,17 +52,17 @@ The following table lists the supported accelerated backends and their correspon
52
52
  vllm-ascend [#3316](https://github.com/vllm-project/vllm-ascend/issues/3316)
53
53
  and [#2795](https://github.com/vllm-project/vllm-ascend/issues/2795).
54
54
 
55
- | CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
56
- |------------------------------|-----------|------------------------------------------------------------|------------------------|
57
- | 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
58
- | 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
59
- | 8.5 (310P) | `2.3.0` | `0.14.1` | |
60
- | 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
61
- | 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
62
- | 8.3 (310P) | `2.2.rc1` | | |
63
- | 8.2 (A3/910C) | `2.1.rc2` | `0.10.2`, `0.10.1.1` | `0.5.2`, `0.5.1.post3` |
64
- | 8.2 (910B) | `2.1.rc2` | `0.10.2`, `0.10.1.1`, <br/>`0.10.0`, `0.9.2`, <br/>`0.9.1` | `0.5.2`, `0.5.1.post3` |
65
- | 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2` | |
55
+ | CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
56
+ |------------------------------|-----------|--------------------------------------------------------------------|------------------------|
57
+ | 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
58
+ | 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
59
+ | 8.5 (310P) | `2.3.0` | `0.14.1` | |
60
+ | 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
61
+ | 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
62
+ | 8.3 (310P) | `2.2.rc1` | | |
63
+ | 8.2 (A3/910C) | `2.1.rc2` | `0.10.2`, ~~`0.10.1.1`~~ | `0.5.2`, `0.5.1.post3` |
64
+ | 8.2 (910B) | `2.1.rc2` | `0.10.2`, ~~`0.10.1.1`~~, <br/>`0.10.0`, `0.9.2`, <br/>~~`0.9.1`~~ | `0.5.2`, `0.5.1.post3` |
65
+ | 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2` | |
66
66
 
67
67
  ### Iluvatar CoreX
68
68
 
@@ -80,11 +80,11 @@ The following table lists the supported accelerated backends and their correspon
80
80
  > - CUDA 12.6/12.4 supports Compute Capabilities:
81
81
  `7.5 8.0+PTX 8.9 9.0+PTX`.
82
82
 
83
- | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
84
- |------------------------------|---------------------------------------------|-----------------------------------------------------------|----------|
85
- | 12.9 | `0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` | |
86
- | 12.8 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3`, `0.5.4.post3` | `0.0.21` |
87
- | 12.6 | `0.13.0`, `0.12.0`, <br/>`0.11.2`,`0.10.2` | | `0.0.21` |
83
+ | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
84
+ |------------------------------|----------------------------------------------------------------|-----------------------------------------------------------------------------|----------|
85
+ | 12.9 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` | |
86
+ | 12.8 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, <br/>`0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3`, <br/>~~`0.5.4.post3`~~ | `0.0.21` |
87
+ | 12.6 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, <br/>`0.10.2` | | `0.0.21` |
88
88
 
89
89
  ### Hygon DTK
90
90
 
@@ -128,10 +128,10 @@ The following table lists the supported accelerated backends and their correspon
128
128
  > - ROCm 6.4 SGLang supports `gfx942` only.
129
129
  > - ROCm 7.0 SGLang supports `gfx950` only.
130
130
 
131
- | ROCm Version <br/> (Variant) | vLLM | SGLang |
132
- |------------------------------|---------------------------------------------|--------------------------------------------|
133
- | 7.0 | `0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` |
134
- | 6.4 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3` |
131
+ | ROCm Version <br/> (Variant) | vLLM | SGLang |
132
+ |------------------------------|-------------------------------------------------|--------------------------------------------|
133
+ | 7.0 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` |
134
+ | 6.4 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3` |
135
135
 
136
136
  ## Directory Structure
137
137
 
@@ -1,17 +1,17 @@
1
1
  gpustack_runner/__init__.py,sha256=ss8_wsk1oo13qFlP9usrXKX4ypHs1NZb2OVd6uFx5cc,715
2
2
  gpustack_runner/__main__.py,sha256=uvpk9GtyJGtHaKM7DyM64N5mwehwpDD3v8ba6Yy8V3A,1364
3
3
  gpustack_runner/__utils__.py,sha256=LSo0Iqxd5OjQFncVOYcqC8cncjtywf0qac31UPw7Ou4,4372
4
- gpustack_runner/_version.py,sha256=SigvJTYuRQZ32Z9cgZmeBjPHmNv3OPkdCkWmY-EdHtc,792
4
+ gpustack_runner/_version.py,sha256=kg14DjAgMOqC65Llz4O18tfum0uZJT0W8cU-i7Xc7Ik,792
5
5
  gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
6
6
  gpustack_runner/envs.py,sha256=Wm0GTIiDJIT1zEjLpaPZNLbOs23NNFc2Y6zZuRLlTKQ,3470
7
7
  gpustack_runner/runner.py,sha256=Rk4nyHj7Bn7ibAdxspXpXplMgWVMsG9Jb7GV8sHk2Ig,26310
8
- gpustack_runner/runner.py.json,sha256=PJ0Tc0cxlvn0qOHUYqiEYvCBO5p9P_zKGetE7sOslOc,50303
8
+ gpustack_runner/runner.py.json,sha256=kwdBxVCFNpThnRdT6dwogvK7ayV1vWF-ck2IA9EoKL4,53323
9
9
  gpustack_runner/cmds/__init__.py,sha256=zjdv_OC674KAcitjiHrHbXnAwLtw8Ju3psW0IKFqPIg,471
10
10
  gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
11
11
  gpustack_runner/cmds/images.py,sha256=qkL862Xx6pcrLALhB8azMmtOAlIT-V5iGPHgSllnsPs,49029
12
- gpustack_runner/_version_appendix.py,sha256=V3FyUmXPRZnROBj6MvdU2i0qBK2IazwbxkITbNVc7tQ,23
13
- gpustack_runner-0.1.24.post2.dist-info/METADATA,sha256=-Zmb7jAVyM7KjyoFUesulwabed6RUnX57XVEfO7oA0A,12804
14
- gpustack_runner-0.1.24.post2.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
15
- gpustack_runner-0.1.24.post2.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
16
- gpustack_runner-0.1.24.post2.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
17
- gpustack_runner-0.1.24.post2.dist-info/RECORD,,
12
+ gpustack_runner/_version_appendix.py,sha256=V2s_ow1zqn0fwyIASwO5DOQ8fRdLrVivPAAg5IskADw,23
13
+ gpustack_runner-0.1.24.post3.dist-info/METADATA,sha256=bo00AC5teijB1MlswDc-qZnQMcqgzJrIO_TKMQezECw,13093
14
+ gpustack_runner-0.1.24.post3.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
15
+ gpustack_runner-0.1.24.post3.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
16
+ gpustack_runner-0.1.24.post3.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
17
+ gpustack_runner-0.1.24.post3.dist-info/RECORD,,