gpustack-runner 0.1.24.post4__py3-none-any.whl → 0.1.25__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gpustack_runner/_version.py +2 -2
- gpustack_runner/_version_appendix.py +1 -1
- gpustack_runner/runner.py.json +88 -0
- {gpustack_runner-0.1.24.post4.dist-info → gpustack_runner-0.1.25.dist-info}/METADATA +21 -21
- {gpustack_runner-0.1.24.post4.dist-info → gpustack_runner-0.1.25.dist-info}/RECORD +8 -8
- {gpustack_runner-0.1.24.post4.dist-info → gpustack_runner-0.1.25.dist-info}/WHEEL +0 -0
- {gpustack_runner-0.1.24.post4.dist-info → gpustack_runner-0.1.25.dist-info}/entry_points.txt +0 -0
- {gpustack_runner-0.1.24.post4.dist-info → gpustack_runner-0.1.25.dist-info}/licenses/LICENSE +0 -0
gpustack_runner/_version.py
CHANGED
|
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
|
|
|
27
27
|
__commit_id__: COMMIT_ID
|
|
28
28
|
commit_id: COMMIT_ID
|
|
29
29
|
|
|
30
|
-
__version__ = version = '0.1.24.post4'
|
|
31
|
-
__version_tuple__ = version_tuple = (0, 1,
|
|
30
|
+
__version__ = version = '0.1.25'
|
|
31
|
+
__version_tuple__ = version_tuple = (0, 1, 25)
|
|
32
32
|
try:
|
|
33
33
|
from ._version_appendix import git_commit
|
|
34
34
|
__commit_id__ = commit_id = git_commit
|
|
@@ -1 +1 @@
|
|
|
1
|
-
git_commit = "
|
|
1
|
+
git_commit = "b005327"
|
gpustack_runner/runner.py.json
CHANGED
|
@@ -868,6 +868,28 @@
|
|
|
868
868
|
"docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
|
|
869
869
|
"deprecated": false
|
|
870
870
|
},
|
|
871
|
+
{
|
|
872
|
+
"backend": "cuda",
|
|
873
|
+
"backend_version": "12.9",
|
|
874
|
+
"original_backend_version": "12.9.1",
|
|
875
|
+
"backend_variant": "",
|
|
876
|
+
"service": "vllm",
|
|
877
|
+
"service_version": "0.15.0",
|
|
878
|
+
"platform": "linux/amd64",
|
|
879
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.15.0",
|
|
880
|
+
"deprecated": false
|
|
881
|
+
},
|
|
882
|
+
{
|
|
883
|
+
"backend": "cuda",
|
|
884
|
+
"backend_version": "12.9",
|
|
885
|
+
"original_backend_version": "12.9.1",
|
|
886
|
+
"backend_variant": "",
|
|
887
|
+
"service": "vllm",
|
|
888
|
+
"service_version": "0.15.0",
|
|
889
|
+
"platform": "linux/arm64",
|
|
890
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.15.0",
|
|
891
|
+
"deprecated": false
|
|
892
|
+
},
|
|
871
893
|
{
|
|
872
894
|
"backend": "cuda",
|
|
873
895
|
"backend_version": "12.9",
|
|
@@ -1077,6 +1099,28 @@
|
|
|
1077
1099
|
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
|
|
1078
1100
|
"deprecated": true
|
|
1079
1101
|
},
|
|
1102
|
+
{
|
|
1103
|
+
"backend": "cuda",
|
|
1104
|
+
"backend_version": "12.8",
|
|
1105
|
+
"original_backend_version": "12.8.1",
|
|
1106
|
+
"backend_variant": "",
|
|
1107
|
+
"service": "vllm",
|
|
1108
|
+
"service_version": "0.15.0",
|
|
1109
|
+
"platform": "linux/amd64",
|
|
1110
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.15.0",
|
|
1111
|
+
"deprecated": false
|
|
1112
|
+
},
|
|
1113
|
+
{
|
|
1114
|
+
"backend": "cuda",
|
|
1115
|
+
"backend_version": "12.8",
|
|
1116
|
+
"original_backend_version": "12.8.1",
|
|
1117
|
+
"backend_variant": "",
|
|
1118
|
+
"service": "vllm",
|
|
1119
|
+
"service_version": "0.15.0",
|
|
1120
|
+
"platform": "linux/arm64",
|
|
1121
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.15.0",
|
|
1122
|
+
"deprecated": false
|
|
1123
|
+
},
|
|
1080
1124
|
{
|
|
1081
1125
|
"backend": "cuda",
|
|
1082
1126
|
"backend_version": "12.8",
|
|
@@ -1297,6 +1341,28 @@
|
|
|
1297
1341
|
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
|
|
1298
1342
|
"deprecated": true
|
|
1299
1343
|
},
|
|
1344
|
+
{
|
|
1345
|
+
"backend": "cuda",
|
|
1346
|
+
"backend_version": "12.6",
|
|
1347
|
+
"original_backend_version": "12.6.3",
|
|
1348
|
+
"backend_variant": "",
|
|
1349
|
+
"service": "vllm",
|
|
1350
|
+
"service_version": "0.15.0",
|
|
1351
|
+
"platform": "linux/amd64",
|
|
1352
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.15.0",
|
|
1353
|
+
"deprecated": false
|
|
1354
|
+
},
|
|
1355
|
+
{
|
|
1356
|
+
"backend": "cuda",
|
|
1357
|
+
"backend_version": "12.6",
|
|
1358
|
+
"original_backend_version": "12.6.3",
|
|
1359
|
+
"backend_variant": "",
|
|
1360
|
+
"service": "vllm",
|
|
1361
|
+
"service_version": "0.15.0",
|
|
1362
|
+
"platform": "linux/arm64",
|
|
1363
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.15.0",
|
|
1364
|
+
"deprecated": false
|
|
1365
|
+
},
|
|
1300
1366
|
{
|
|
1301
1367
|
"backend": "cuda",
|
|
1302
1368
|
"backend_version": "12.6",
|
|
@@ -1781,6 +1847,17 @@
|
|
|
1781
1847
|
"docker_image": "gpustack/runner:rocm7.0-sglang0.5.6.post2",
|
|
1782
1848
|
"deprecated": false
|
|
1783
1849
|
},
|
|
1850
|
+
{
|
|
1851
|
+
"backend": "rocm",
|
|
1852
|
+
"backend_version": "7.0",
|
|
1853
|
+
"original_backend_version": "7.0.2",
|
|
1854
|
+
"backend_variant": "",
|
|
1855
|
+
"service": "vllm",
|
|
1856
|
+
"service_version": "0.15.0",
|
|
1857
|
+
"platform": "linux/amd64",
|
|
1858
|
+
"docker_image": "gpustack/runner:rocm7.0-vllm0.15.0",
|
|
1859
|
+
"deprecated": false
|
|
1860
|
+
},
|
|
1784
1861
|
{
|
|
1785
1862
|
"backend": "rocm",
|
|
1786
1863
|
"backend_version": "7.0",
|
|
@@ -1880,6 +1957,17 @@
|
|
|
1880
1957
|
"docker_image": "gpustack/runner:rocm6.4-sglang0.5.5.post3",
|
|
1881
1958
|
"deprecated": false
|
|
1882
1959
|
},
|
|
1960
|
+
{
|
|
1961
|
+
"backend": "rocm",
|
|
1962
|
+
"backend_version": "6.4",
|
|
1963
|
+
"original_backend_version": "6.4.4",
|
|
1964
|
+
"backend_variant": "",
|
|
1965
|
+
"service": "vllm",
|
|
1966
|
+
"service_version": "0.15.0",
|
|
1967
|
+
"platform": "linux/amd64",
|
|
1968
|
+
"docker_image": "gpustack/runner:rocm6.4-vllm0.15.0",
|
|
1969
|
+
"deprecated": false
|
|
1970
|
+
},
|
|
1883
1971
|
{
|
|
1884
1972
|
"backend": "rocm",
|
|
1885
1973
|
"backend_version": "6.4",
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: gpustack-runner
|
|
3
|
-
Version: 0.1.24.post4
|
|
3
|
+
Version: 0.1.25
|
|
4
4
|
Summary: GPUStack Runner is library for registering runnable accelerated backends and services in GPUStack.
|
|
5
5
|
Project-URL: Homepage, https://github.com/gpustack/runner
|
|
6
6
|
Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
|
|
@@ -52,17 +52,17 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
52
52
|
vllm-ascend [#3316](https://github.com/vllm-project/vllm-ascend/issues/3316)
|
|
53
53
|
and [#2795](https://github.com/vllm-project/vllm-ascend/issues/2795).
|
|
54
54
|
|
|
55
|
-
| CANN Version <br/> (Variant) | MindIE | vLLM
|
|
56
|
-
|
|
57
|
-
| 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0`
|
|
58
|
-
| 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0`
|
|
59
|
-
| 8.5 (310P) | `2.3.0` | `0.14.1`
|
|
60
|
-
| 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0`
|
|
61
|
-
| 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0`
|
|
62
|
-
| 8.3 (310P) | `2.2.rc1` |
|
|
63
|
-
| 8.2 (A3/910C) | `2.1.rc2` | `0.10.2
|
|
64
|
-
| 8.2 (910B) | `2.1.rc2` | `0.10.2`,
|
|
65
|
-
| 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2`
|
|
55
|
+
| CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
|
|
56
|
+
|------------------------------|-----------|-----------------------------------|------------------------|
|
|
57
|
+
| 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
|
|
58
|
+
| 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
|
|
59
|
+
| 8.5 (310P) | `2.3.0` | `0.14.1` | |
|
|
60
|
+
| 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
|
|
61
|
+
| 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
|
|
62
|
+
| 8.3 (310P) | `2.2.rc1` | | |
|
|
63
|
+
| 8.2 (A3/910C) | `2.1.rc2` | `0.10.2` | `0.5.2`, `0.5.1.post3` |
|
|
64
|
+
| 8.2 (910B) | `2.1.rc2` | `0.10.2`, `0.10.0`, <br/>`0.9.2` | `0.5.2`, `0.5.1.post3` |
|
|
65
|
+
| 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2` | |
|
|
66
66
|
|
|
67
67
|
### Iluvatar CoreX
|
|
68
68
|
|
|
@@ -80,11 +80,11 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
80
80
|
> - CUDA 12.6/12.4 supports Compute Capabilities:
|
|
81
81
|
`7.5 8.0+PTX 8.9 9.0+PTX`.
|
|
82
82
|
|
|
83
|
-
| CUDA Version <br/> (Variant) | vLLM
|
|
84
|
-
|
|
85
|
-
| 12.9 | `0.14.1`,
|
|
86
|
-
| 12.8 | `0.
|
|
87
|
-
| 12.6 | `0.
|
|
83
|
+
| CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
|
|
84
|
+
|------------------------------|----------------------------------------------------------------------|-----------------------------------------------------|----------|
|
|
85
|
+
| 12.9 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` | |
|
|
86
|
+
| 12.8 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3` | `0.0.21` |
|
|
87
|
+
| 12.6 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | | `0.0.21` |
|
|
88
88
|
|
|
89
89
|
### Hygon DTK
|
|
90
90
|
|
|
@@ -128,10 +128,10 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
128
128
|
> - ROCm 6.4 SGLang supports `gfx942` only.
|
|
129
129
|
> - ROCm 7.0 SGLang supports `gfx950` only.
|
|
130
130
|
|
|
131
|
-
| ROCm Version <br/> (Variant) | vLLM
|
|
132
|
-
|
|
133
|
-
| 7.0 | `0.14.1`,
|
|
134
|
-
| 6.4 | `0.14.1`,
|
|
131
|
+
| ROCm Version <br/> (Variant) | vLLM | SGLang |
|
|
132
|
+
|------------------------------|----------------------------------------------------------------------|-----------------------------------------------------|
|
|
133
|
+
| 7.0 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` |
|
|
134
|
+
| 6.4 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3` |
|
|
135
135
|
|
|
136
136
|
## Directory Structure
|
|
137
137
|
|
|
@@ -1,17 +1,17 @@
|
|
|
1
1
|
gpustack_runner/__init__.py,sha256=ss8_wsk1oo13qFlP9usrXKX4ypHs1NZb2OVd6uFx5cc,715
|
|
2
2
|
gpustack_runner/__main__.py,sha256=uvpk9GtyJGtHaKM7DyM64N5mwehwpDD3v8ba6Yy8V3A,1364
|
|
3
3
|
gpustack_runner/__utils__.py,sha256=LSo0Iqxd5OjQFncVOYcqC8cncjtywf0qac31UPw7Ou4,4372
|
|
4
|
-
gpustack_runner/_version.py,sha256=
|
|
4
|
+
gpustack_runner/_version.py,sha256=IYWLENHDtg-FYeQMOf-gTgfO-GgvV1sYU-LK3_0iuWs,777
|
|
5
5
|
gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
|
|
6
6
|
gpustack_runner/envs.py,sha256=Wm0GTIiDJIT1zEjLpaPZNLbOs23NNFc2Y6zZuRLlTKQ,3470
|
|
7
7
|
gpustack_runner/runner.py,sha256=Rk4nyHj7Bn7ibAdxspXpXplMgWVMsG9Jb7GV8sHk2Ig,26310
|
|
8
|
-
gpustack_runner/runner.py.json,sha256=
|
|
8
|
+
gpustack_runner/runner.py.json,sha256=JKQ_v5AqHAMpKqgpYJ_q_JDzZMvp22NTJ5YNZs9gNfg,56933
|
|
9
9
|
gpustack_runner/cmds/__init__.py,sha256=zjdv_OC674KAcitjiHrHbXnAwLtw8Ju3psW0IKFqPIg,471
|
|
10
10
|
gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
|
|
11
11
|
gpustack_runner/cmds/images.py,sha256=qkL862Xx6pcrLALhB8azMmtOAlIT-V5iGPHgSllnsPs,49029
|
|
12
|
-
gpustack_runner/_version_appendix.py,sha256=
|
|
13
|
-
gpustack_runner-0.1.
|
|
14
|
-
gpustack_runner-0.1.
|
|
15
|
-
gpustack_runner-0.1.
|
|
16
|
-
gpustack_runner-0.1.
|
|
17
|
-
gpustack_runner-0.1.
|
|
12
|
+
gpustack_runner/_version_appendix.py,sha256=YOoMwEs9RIGE46UmO14osF0y9CKc71HhOLIdBUpQxjQ,23
|
|
13
|
+
gpustack_runner-0.1.25.dist-info/METADATA,sha256=ObJexPdV4cthVPis6tTV57HmFCuoBrF9KRe1KnB6xmI,12754
|
|
14
|
+
gpustack_runner-0.1.25.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
15
|
+
gpustack_runner-0.1.25.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
|
|
16
|
+
gpustack_runner-0.1.25.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
|
|
17
|
+
gpustack_runner-0.1.25.dist-info/RECORD,,
|
|
File without changes
|
{gpustack_runner-0.1.24.post4.dist-info → gpustack_runner-0.1.25.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{gpustack_runner-0.1.24.post4.dist-info → gpustack_runner-0.1.25.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|