gpustack-runner 0.1.24.post3__py3-none-any.whl → 0.1.25__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gpustack_runner/_version.py +2 -2
- gpustack_runner/_version_appendix.py +1 -1
- gpustack_runner/runner.py.json +132 -0
- {gpustack_runner-0.1.24.post3.dist-info → gpustack_runner-0.1.25.dist-info}/METADATA +21 -21
- {gpustack_runner-0.1.24.post3.dist-info → gpustack_runner-0.1.25.dist-info}/RECORD +8 -8
- {gpustack_runner-0.1.24.post3.dist-info → gpustack_runner-0.1.25.dist-info}/WHEEL +0 -0
- {gpustack_runner-0.1.24.post3.dist-info → gpustack_runner-0.1.25.dist-info}/entry_points.txt +0 -0
- {gpustack_runner-0.1.24.post3.dist-info → gpustack_runner-0.1.25.dist-info}/licenses/LICENSE +0 -0
gpustack_runner/_version.py
CHANGED
|
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
|
|
|
27
27
|
__commit_id__: COMMIT_ID
|
|
28
28
|
commit_id: COMMIT_ID
|
|
29
29
|
|
|
30
|
-
__version__ = version = '0.1.24.post3'
|
|
31
|
-
__version_tuple__ = version_tuple = (0, 1, 24, 'post3')
|
|
30
|
+
__version__ = version = '0.1.25'
|
|
31
|
+
__version_tuple__ = version_tuple = (0, 1, 25)
|
|
32
32
|
try:
|
|
33
33
|
from ._version_appendix import git_commit
|
|
34
34
|
__commit_id__ = commit_id = git_commit
|
|
@@ -1 +1 @@
|
|
|
1
|
-
git_commit = "
|
|
1
|
+
git_commit = "b005327"
|
gpustack_runner/runner.py.json
CHANGED
|
@@ -868,6 +868,28 @@
|
|
|
868
868
|
"docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
|
|
869
869
|
"deprecated": false
|
|
870
870
|
},
|
|
871
|
+
{
|
|
872
|
+
"backend": "cuda",
|
|
873
|
+
"backend_version": "12.9",
|
|
874
|
+
"original_backend_version": "12.9.1",
|
|
875
|
+
"backend_variant": "",
|
|
876
|
+
"service": "vllm",
|
|
877
|
+
"service_version": "0.15.0",
|
|
878
|
+
"platform": "linux/amd64",
|
|
879
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.15.0",
|
|
880
|
+
"deprecated": false
|
|
881
|
+
},
|
|
882
|
+
{
|
|
883
|
+
"backend": "cuda",
|
|
884
|
+
"backend_version": "12.9",
|
|
885
|
+
"original_backend_version": "12.9.1",
|
|
886
|
+
"backend_variant": "",
|
|
887
|
+
"service": "vllm",
|
|
888
|
+
"service_version": "0.15.0",
|
|
889
|
+
"platform": "linux/arm64",
|
|
890
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.15.0",
|
|
891
|
+
"deprecated": false
|
|
892
|
+
},
|
|
871
893
|
{
|
|
872
894
|
"backend": "cuda",
|
|
873
895
|
"backend_version": "12.9",
|
|
@@ -1077,6 +1099,28 @@
|
|
|
1077
1099
|
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
|
|
1078
1100
|
"deprecated": true
|
|
1079
1101
|
},
|
|
1102
|
+
{
|
|
1103
|
+
"backend": "cuda",
|
|
1104
|
+
"backend_version": "12.8",
|
|
1105
|
+
"original_backend_version": "12.8.1",
|
|
1106
|
+
"backend_variant": "",
|
|
1107
|
+
"service": "vllm",
|
|
1108
|
+
"service_version": "0.15.0",
|
|
1109
|
+
"platform": "linux/amd64",
|
|
1110
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.15.0",
|
|
1111
|
+
"deprecated": false
|
|
1112
|
+
},
|
|
1113
|
+
{
|
|
1114
|
+
"backend": "cuda",
|
|
1115
|
+
"backend_version": "12.8",
|
|
1116
|
+
"original_backend_version": "12.8.1",
|
|
1117
|
+
"backend_variant": "",
|
|
1118
|
+
"service": "vllm",
|
|
1119
|
+
"service_version": "0.15.0",
|
|
1120
|
+
"platform": "linux/arm64",
|
|
1121
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.15.0",
|
|
1122
|
+
"deprecated": false
|
|
1123
|
+
},
|
|
1080
1124
|
{
|
|
1081
1125
|
"backend": "cuda",
|
|
1082
1126
|
"backend_version": "12.8",
|
|
@@ -1297,6 +1341,28 @@
|
|
|
1297
1341
|
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
|
|
1298
1342
|
"deprecated": true
|
|
1299
1343
|
},
|
|
1344
|
+
{
|
|
1345
|
+
"backend": "cuda",
|
|
1346
|
+
"backend_version": "12.6",
|
|
1347
|
+
"original_backend_version": "12.6.3",
|
|
1348
|
+
"backend_variant": "",
|
|
1349
|
+
"service": "vllm",
|
|
1350
|
+
"service_version": "0.15.0",
|
|
1351
|
+
"platform": "linux/amd64",
|
|
1352
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.15.0",
|
|
1353
|
+
"deprecated": false
|
|
1354
|
+
},
|
|
1355
|
+
{
|
|
1356
|
+
"backend": "cuda",
|
|
1357
|
+
"backend_version": "12.6",
|
|
1358
|
+
"original_backend_version": "12.6.3",
|
|
1359
|
+
"backend_variant": "",
|
|
1360
|
+
"service": "vllm",
|
|
1361
|
+
"service_version": "0.15.0",
|
|
1362
|
+
"platform": "linux/arm64",
|
|
1363
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.15.0",
|
|
1364
|
+
"deprecated": false
|
|
1365
|
+
},
|
|
1300
1366
|
{
|
|
1301
1367
|
"backend": "cuda",
|
|
1302
1368
|
"backend_version": "12.6",
|
|
@@ -1748,6 +1814,17 @@
|
|
|
1748
1814
|
"docker_image": "gpustack/runner:musa4.1-vllm0.9.2",
|
|
1749
1815
|
"deprecated": false
|
|
1750
1816
|
},
|
|
1817
|
+
{
|
|
1818
|
+
"backend": "rocm",
|
|
1819
|
+
"backend_version": "7.0",
|
|
1820
|
+
"original_backend_version": "7.0.2",
|
|
1821
|
+
"backend_variant": "",
|
|
1822
|
+
"service": "sglang",
|
|
1823
|
+
"service_version": "0.5.8",
|
|
1824
|
+
"platform": "linux/amd64",
|
|
1825
|
+
"docker_image": "gpustack/runner:rocm7.0-sglang0.5.8",
|
|
1826
|
+
"deprecated": false
|
|
1827
|
+
},
|
|
1751
1828
|
{
|
|
1752
1829
|
"backend": "rocm",
|
|
1753
1830
|
"backend_version": "7.0",
|
|
@@ -1770,6 +1847,28 @@
|
|
|
1770
1847
|
"docker_image": "gpustack/runner:rocm7.0-sglang0.5.6.post2",
|
|
1771
1848
|
"deprecated": false
|
|
1772
1849
|
},
|
|
1850
|
+
{
|
|
1851
|
+
"backend": "rocm",
|
|
1852
|
+
"backend_version": "7.0",
|
|
1853
|
+
"original_backend_version": "7.0.2",
|
|
1854
|
+
"backend_variant": "",
|
|
1855
|
+
"service": "vllm",
|
|
1856
|
+
"service_version": "0.15.0",
|
|
1857
|
+
"platform": "linux/amd64",
|
|
1858
|
+
"docker_image": "gpustack/runner:rocm7.0-vllm0.15.0",
|
|
1859
|
+
"deprecated": false
|
|
1860
|
+
},
|
|
1861
|
+
{
|
|
1862
|
+
"backend": "rocm",
|
|
1863
|
+
"backend_version": "7.0",
|
|
1864
|
+
"original_backend_version": "7.0.2",
|
|
1865
|
+
"backend_variant": "",
|
|
1866
|
+
"service": "vllm",
|
|
1867
|
+
"service_version": "0.14.1",
|
|
1868
|
+
"platform": "linux/amd64",
|
|
1869
|
+
"docker_image": "gpustack/runner:rocm7.0-vllm0.14.1",
|
|
1870
|
+
"deprecated": false
|
|
1871
|
+
},
|
|
1773
1872
|
{
|
|
1774
1873
|
"backend": "rocm",
|
|
1775
1874
|
"backend_version": "7.0",
|
|
@@ -1814,6 +1913,17 @@
|
|
|
1814
1913
|
"docker_image": "gpustack/runner:rocm7.0-vllm0.11.0",
|
|
1815
1914
|
"deprecated": true
|
|
1816
1915
|
},
|
|
1916
|
+
{
|
|
1917
|
+
"backend": "rocm",
|
|
1918
|
+
"backend_version": "6.4",
|
|
1919
|
+
"original_backend_version": "6.4.4",
|
|
1920
|
+
"backend_variant": "",
|
|
1921
|
+
"service": "sglang",
|
|
1922
|
+
"service_version": "0.5.8",
|
|
1923
|
+
"platform": "linux/amd64",
|
|
1924
|
+
"docker_image": "gpustack/runner:rocm6.4-sglang0.5.8",
|
|
1925
|
+
"deprecated": false
|
|
1926
|
+
},
|
|
1817
1927
|
{
|
|
1818
1928
|
"backend": "rocm",
|
|
1819
1929
|
"backend_version": "6.4",
|
|
@@ -1847,6 +1957,28 @@
|
|
|
1847
1957
|
"docker_image": "gpustack/runner:rocm6.4-sglang0.5.5.post3",
|
|
1848
1958
|
"deprecated": false
|
|
1849
1959
|
},
|
|
1960
|
+
{
|
|
1961
|
+
"backend": "rocm",
|
|
1962
|
+
"backend_version": "6.4",
|
|
1963
|
+
"original_backend_version": "6.4.4",
|
|
1964
|
+
"backend_variant": "",
|
|
1965
|
+
"service": "vllm",
|
|
1966
|
+
"service_version": "0.15.0",
|
|
1967
|
+
"platform": "linux/amd64",
|
|
1968
|
+
"docker_image": "gpustack/runner:rocm6.4-vllm0.15.0",
|
|
1969
|
+
"deprecated": false
|
|
1970
|
+
},
|
|
1971
|
+
{
|
|
1972
|
+
"backend": "rocm",
|
|
1973
|
+
"backend_version": "6.4",
|
|
1974
|
+
"original_backend_version": "6.4.4",
|
|
1975
|
+
"backend_variant": "",
|
|
1976
|
+
"service": "vllm",
|
|
1977
|
+
"service_version": "0.14.1",
|
|
1978
|
+
"platform": "linux/amd64",
|
|
1979
|
+
"docker_image": "gpustack/runner:rocm6.4-vllm0.14.1",
|
|
1980
|
+
"deprecated": false
|
|
1981
|
+
},
|
|
1850
1982
|
{
|
|
1851
1983
|
"backend": "rocm",
|
|
1852
1984
|
"backend_version": "6.4",
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: gpustack-runner
|
|
3
|
-
Version: 0.1.24.post3
|
|
3
|
+
Version: 0.1.25
|
|
4
4
|
Summary: GPUStack Runner is library for registering runnable accelerated backends and services in GPUStack.
|
|
5
5
|
Project-URL: Homepage, https://github.com/gpustack/runner
|
|
6
6
|
Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
|
|
@@ -52,17 +52,17 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
52
52
|
vllm-ascend [#3316](https://github.com/vllm-project/vllm-ascend/issues/3316)
|
|
53
53
|
and [#2795](https://github.com/vllm-project/vllm-ascend/issues/2795).
|
|
54
54
|
|
|
55
|
-
| CANN Version <br/> (Variant) | MindIE | vLLM
|
|
56
|
-
|
|
57
|
-
| 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0`
|
|
58
|
-
| 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0`
|
|
59
|
-
| 8.5 (310P) | `2.3.0` | `0.14.1`
|
|
60
|
-
| 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0`
|
|
61
|
-
| 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0`
|
|
62
|
-
| 8.3 (310P) | `2.2.rc1` |
|
|
63
|
-
| 8.2 (A3/910C) | `2.1.rc2` | `0.10.2
|
|
64
|
-
| 8.2 (910B) | `2.1.rc2` | `0.10.2`,
|
|
65
|
-
| 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2`
|
|
55
|
+
| CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
|
|
56
|
+
|------------------------------|-----------|-----------------------------------|------------------------|
|
|
57
|
+
| 8.5 (A3/910C) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
|
|
58
|
+
| 8.5 (910B) | `2.3.0` | `0.14.1`, `0.13.0` | `0.5.8` |
|
|
59
|
+
| 8.5 (310P) | `2.3.0` | `0.14.1` | |
|
|
60
|
+
| 8.3 (A3/910C) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
|
|
61
|
+
| 8.3 (910B) | `2.2.rc1` | `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
|
|
62
|
+
| 8.3 (310P) | `2.2.rc1` | | |
|
|
63
|
+
| 8.2 (A3/910C) | `2.1.rc2` | `0.10.2` | `0.5.2`, `0.5.1.post3` |
|
|
64
|
+
| 8.2 (910B) | `2.1.rc2` | `0.10.2`, `0.10.0`, <br/>`0.9.2` | `0.5.2`, `0.5.1.post3` |
|
|
65
|
+
| 8.2 (310P) | `2.1.rc2` | `0.10.0`, `0.9.2` | |
|
|
66
66
|
|
|
67
67
|
### Iluvatar CoreX
|
|
68
68
|
|
|
@@ -80,11 +80,11 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
80
80
|
> - CUDA 12.6/12.4 supports Compute Capabilities:
|
|
81
81
|
`7.5 8.0+PTX 8.9 9.0+PTX`.
|
|
82
82
|
|
|
83
|
-
| CUDA Version <br/> (Variant) | vLLM
|
|
84
|
-
|
|
85
|
-
| 12.9 | `0.14.1`,
|
|
86
|
-
| 12.8 | `0.
|
|
87
|
-
| 12.6 | `0.
|
|
83
|
+
| CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
|
|
84
|
+
|------------------------------|----------------------------------------------------------------------|-----------------------------------------------------|----------|
|
|
85
|
+
| 12.9 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` | |
|
|
86
|
+
| 12.8 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3` | `0.0.21` |
|
|
87
|
+
| 12.6 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | | `0.0.21` |
|
|
88
88
|
|
|
89
89
|
### Hygon DTK
|
|
90
90
|
|
|
@@ -128,10 +128,10 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
128
128
|
> - ROCm 6.4 SGLang supports `gfx942` only.
|
|
129
129
|
> - ROCm 7.0 SGLang supports `gfx950` only.
|
|
130
130
|
|
|
131
|
-
| ROCm Version <br/> (Variant) | vLLM
|
|
132
|
-
|
|
133
|
-
| 7.0 |
|
|
134
|
-
| 6.4 |
|
|
131
|
+
| ROCm Version <br/> (Variant) | vLLM | SGLang |
|
|
132
|
+
|------------------------------|----------------------------------------------------------------------|-----------------------------------------------------|
|
|
133
|
+
| 7.0 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` |
|
|
134
|
+
| 6.4 | `0.15.0`, `0.14.1`, <br/>`0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3` |
|
|
135
135
|
|
|
136
136
|
## Directory Structure
|
|
137
137
|
|
|
@@ -1,17 +1,17 @@
|
|
|
1
1
|
gpustack_runner/__init__.py,sha256=ss8_wsk1oo13qFlP9usrXKX4ypHs1NZb2OVd6uFx5cc,715
|
|
2
2
|
gpustack_runner/__main__.py,sha256=uvpk9GtyJGtHaKM7DyM64N5mwehwpDD3v8ba6Yy8V3A,1364
|
|
3
3
|
gpustack_runner/__utils__.py,sha256=LSo0Iqxd5OjQFncVOYcqC8cncjtywf0qac31UPw7Ou4,4372
|
|
4
|
-
gpustack_runner/_version.py,sha256=
|
|
4
|
+
gpustack_runner/_version.py,sha256=IYWLENHDtg-FYeQMOf-gTgfO-GgvV1sYU-LK3_0iuWs,777
|
|
5
5
|
gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
|
|
6
6
|
gpustack_runner/envs.py,sha256=Wm0GTIiDJIT1zEjLpaPZNLbOs23NNFc2Y6zZuRLlTKQ,3470
|
|
7
7
|
gpustack_runner/runner.py,sha256=Rk4nyHj7Bn7ibAdxspXpXplMgWVMsG9Jb7GV8sHk2Ig,26310
|
|
8
|
-
gpustack_runner/runner.py.json,sha256=
|
|
8
|
+
gpustack_runner/runner.py.json,sha256=JKQ_v5AqHAMpKqgpYJ_q_JDzZMvp22NTJ5YNZs9gNfg,56933
|
|
9
9
|
gpustack_runner/cmds/__init__.py,sha256=zjdv_OC674KAcitjiHrHbXnAwLtw8Ju3psW0IKFqPIg,471
|
|
10
10
|
gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
|
|
11
11
|
gpustack_runner/cmds/images.py,sha256=qkL862Xx6pcrLALhB8azMmtOAlIT-V5iGPHgSllnsPs,49029
|
|
12
|
-
gpustack_runner/_version_appendix.py,sha256=
|
|
13
|
-
gpustack_runner-0.1.
|
|
14
|
-
gpustack_runner-0.1.
|
|
15
|
-
gpustack_runner-0.1.
|
|
16
|
-
gpustack_runner-0.1.
|
|
17
|
-
gpustack_runner-0.1.
|
|
12
|
+
gpustack_runner/_version_appendix.py,sha256=YOoMwEs9RIGE46UmO14osF0y9CKc71HhOLIdBUpQxjQ,23
|
|
13
|
+
gpustack_runner-0.1.25.dist-info/METADATA,sha256=ObJexPdV4cthVPis6tTV57HmFCuoBrF9KRe1KnB6xmI,12754
|
|
14
|
+
gpustack_runner-0.1.25.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
15
|
+
gpustack_runner-0.1.25.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
|
|
16
|
+
gpustack_runner-0.1.25.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
|
|
17
|
+
gpustack_runner-0.1.25.dist-info/RECORD,,
|
|
File without changes
|
{gpustack_runner-0.1.24.post3.dist-info → gpustack_runner-0.1.25.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{gpustack_runner-0.1.24.post3.dist-info → gpustack_runner-0.1.25.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|