gpustack-runner 0.1.22.post2__py3-none-any.whl → 0.1.22.post3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gpustack_runner/_version.py +2 -2
- gpustack_runner/_version_appendix.py +1 -1
- gpustack_runner/runner.py.json +88 -0
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post3.dist-info}/METADATA +13 -12
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post3.dist-info}/RECORD +8 -8
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post3.dist-info}/WHEEL +0 -0
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post3.dist-info}/entry_points.txt +0 -0
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post3.dist-info}/licenses/LICENSE +0 -0
gpustack_runner/_version.py
CHANGED
|
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
|
|
|
27
27
|
__commit_id__: COMMIT_ID
|
|
28
28
|
commit_id: COMMIT_ID
|
|
29
29
|
|
|
30
|
-
__version__ = version = '0.1.22.post2'
|
|
31
|
-
__version_tuple__ = version_tuple = (0, 1, 22, 'post2')
|
|
30
|
+
__version__ = version = '0.1.22.post3'
|
|
31
|
+
__version_tuple__ = version_tuple = (0, 1, 22, 'post3')
|
|
32
32
|
try:
|
|
33
33
|
from ._version_appendix import git_commit
|
|
34
34
|
__commit_id__ = commit_id = git_commit
|
|
@@ -1 +1 @@
|
|
|
1
|
-
git_commit = "
|
|
1
|
+
git_commit = "c9f91c3"
|
gpustack_runner/runner.py.json
CHANGED
|
@@ -604,6 +604,28 @@
|
|
|
604
604
|
"docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
|
|
605
605
|
"deprecated": false
|
|
606
606
|
},
|
|
607
|
+
{
|
|
608
|
+
"backend": "cuda",
|
|
609
|
+
"backend_version": "12.9",
|
|
610
|
+
"original_backend_version": "12.9.1",
|
|
611
|
+
"backend_variant": "",
|
|
612
|
+
"service": "vllm",
|
|
613
|
+
"service_version": "0.13.0",
|
|
614
|
+
"platform": "linux/amd64",
|
|
615
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.13.0",
|
|
616
|
+
"deprecated": false
|
|
617
|
+
},
|
|
618
|
+
{
|
|
619
|
+
"backend": "cuda",
|
|
620
|
+
"backend_version": "12.9",
|
|
621
|
+
"original_backend_version": "12.9.1",
|
|
622
|
+
"backend_variant": "",
|
|
623
|
+
"service": "vllm",
|
|
624
|
+
"service_version": "0.13.0",
|
|
625
|
+
"platform": "linux/arm64",
|
|
626
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.13.0",
|
|
627
|
+
"deprecated": false
|
|
628
|
+
},
|
|
607
629
|
{
|
|
608
630
|
"backend": "cuda",
|
|
609
631
|
"backend_version": "12.9",
|
|
@@ -725,6 +747,28 @@
|
|
|
725
747
|
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
|
|
726
748
|
"deprecated": false
|
|
727
749
|
},
|
|
750
|
+
{
|
|
751
|
+
"backend": "cuda",
|
|
752
|
+
"backend_version": "12.8",
|
|
753
|
+
"original_backend_version": "12.8.1",
|
|
754
|
+
"backend_variant": "",
|
|
755
|
+
"service": "vllm",
|
|
756
|
+
"service_version": "0.13.0",
|
|
757
|
+
"platform": "linux/amd64",
|
|
758
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.13.0",
|
|
759
|
+
"deprecated": false
|
|
760
|
+
},
|
|
761
|
+
{
|
|
762
|
+
"backend": "cuda",
|
|
763
|
+
"backend_version": "12.8",
|
|
764
|
+
"original_backend_version": "12.8.1",
|
|
765
|
+
"backend_variant": "",
|
|
766
|
+
"service": "vllm",
|
|
767
|
+
"service_version": "0.13.0",
|
|
768
|
+
"platform": "linux/arm64",
|
|
769
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.13.0",
|
|
770
|
+
"deprecated": false
|
|
771
|
+
},
|
|
728
772
|
{
|
|
729
773
|
"backend": "cuda",
|
|
730
774
|
"backend_version": "12.8",
|
|
@@ -879,6 +923,28 @@
|
|
|
879
923
|
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
|
|
880
924
|
"deprecated": false
|
|
881
925
|
},
|
|
926
|
+
{
|
|
927
|
+
"backend": "cuda",
|
|
928
|
+
"backend_version": "12.6",
|
|
929
|
+
"original_backend_version": "12.6.3",
|
|
930
|
+
"backend_variant": "",
|
|
931
|
+
"service": "vllm",
|
|
932
|
+
"service_version": "0.13.0",
|
|
933
|
+
"platform": "linux/amd64",
|
|
934
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.13.0",
|
|
935
|
+
"deprecated": false
|
|
936
|
+
},
|
|
937
|
+
{
|
|
938
|
+
"backend": "cuda",
|
|
939
|
+
"backend_version": "12.6",
|
|
940
|
+
"original_backend_version": "12.6.3",
|
|
941
|
+
"backend_variant": "",
|
|
942
|
+
"service": "vllm",
|
|
943
|
+
"service_version": "0.13.0",
|
|
944
|
+
"platform": "linux/arm64",
|
|
945
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.13.0",
|
|
946
|
+
"deprecated": false
|
|
947
|
+
},
|
|
882
948
|
{
|
|
883
949
|
"backend": "cuda",
|
|
884
950
|
"backend_version": "12.6",
|
|
@@ -1198,6 +1264,17 @@
|
|
|
1198
1264
|
"docker_image": "gpustack/runner:rocm7.0-sglang0.5.6.post2",
|
|
1199
1265
|
"deprecated": false
|
|
1200
1266
|
},
|
|
1267
|
+
{
|
|
1268
|
+
"backend": "rocm",
|
|
1269
|
+
"backend_version": "7.0",
|
|
1270
|
+
"original_backend_version": "7.0.2",
|
|
1271
|
+
"backend_variant": "",
|
|
1272
|
+
"service": "vllm",
|
|
1273
|
+
"service_version": "0.13.0",
|
|
1274
|
+
"platform": "linux/amd64",
|
|
1275
|
+
"docker_image": "gpustack/runner:rocm7.0-vllm0.13.0",
|
|
1276
|
+
"deprecated": false
|
|
1277
|
+
},
|
|
1201
1278
|
{
|
|
1202
1279
|
"backend": "rocm",
|
|
1203
1280
|
"backend_version": "7.0",
|
|
@@ -1253,6 +1330,17 @@
|
|
|
1253
1330
|
"docker_image": "gpustack/runner:rocm6.4-sglang0.5.5.post3",
|
|
1254
1331
|
"deprecated": false
|
|
1255
1332
|
},
|
|
1333
|
+
{
|
|
1334
|
+
"backend": "rocm",
|
|
1335
|
+
"backend_version": "6.4",
|
|
1336
|
+
"original_backend_version": "6.4.4",
|
|
1337
|
+
"backend_variant": "",
|
|
1338
|
+
"service": "vllm",
|
|
1339
|
+
"service_version": "0.13.0",
|
|
1340
|
+
"platform": "linux/amd64",
|
|
1341
|
+
"docker_image": "gpustack/runner:rocm6.4-vllm0.13.0",
|
|
1342
|
+
"deprecated": false
|
|
1343
|
+
},
|
|
1256
1344
|
{
|
|
1257
1345
|
"backend": "rocm",
|
|
1258
1346
|
"backend_version": "6.4",
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: gpustack-runner
|
|
3
|
-
Version: 0.1.22.post2
|
|
3
|
+
Version: 0.1.22.post3
|
|
4
4
|
Summary: GPUStack Runner is library for registering runnable accelerated backends and services in GPUStack.
|
|
5
5
|
Project-URL: Homepage, https://github.com/gpustack/runner
|
|
6
6
|
Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
|
|
@@ -86,12 +86,12 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
86
86
|
> - Applied [Qwen2.5 VL patched](https://github.com/gpustack/gpustack/issues/3606) to vLLM 0.11.2.
|
|
87
87
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
88
88
|
|
|
89
|
-
| CUDA Version <br/> (Variant) | vLLM
|
|
90
|
-
|
|
91
|
-
| 12.9 | `0.12.0`, **`0.11.2`** | `0.5.6.post2` | |
|
|
92
|
-
| 12.8 | `0.12.0`, **`0.11.2`**, <br/>`0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | `0.5.6.post2`, `0.5.5.post3`, <br/>`0.5.5`, `0.5.4.post3` | `0.0.20` |
|
|
93
|
-
| 12.6 | `0.12.0`, **`0.11.2`**, <br/>`0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | `0.5.6.post2` | `0.0.20` |
|
|
94
|
-
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0`
|
|
89
|
+
| CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
|
|
90
|
+
|------------------------------|--------------------------------------------------------------------------------------|-----------------------------------------------------------|----------|
|
|
91
|
+
| 12.9 | `0.13.0`, `0.12.0`, **`0.11.2`** | `0.5.6.post2` | |
|
|
92
|
+
| 12.8 | `0.13.0`, `0.12.0`, **`0.11.2`**, <br/>`0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | `0.5.6.post2`, `0.5.5.post3`, <br/>`0.5.5`, `0.5.4.post3` | `0.0.20` |
|
|
93
|
+
| 12.6 | `0.13.0`, `0.12.0`, **`0.11.2`**, <br/>`0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | `0.5.6.post2` | `0.0.20` |
|
|
94
|
+
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | | `0.0.20` |
|
|
95
95
|
|
|
96
96
|
### Hygon DTK
|
|
97
97
|
|
|
@@ -118,16 +118,17 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
118
118
|
> - ROCm 7.0 vLLM `0.11.2/0.11.0` are reusing the official ROCm 6.4 PyTorch 2.9 wheel package rather than a ROCm
|
|
119
119
|
7.0 specific PyTorch build. Although supports ROCm 7.0 in vLLM `0.11.2/0.11.0`, `gfx1150/gfx1151` are not supported yet.
|
|
120
120
|
> - SGLang supports `gfx942` only.
|
|
121
|
+
> - ROCm 6.4 vLLM `0.13.0` supports `gfx903 gfx90a gfx942` only.
|
|
121
122
|
|
|
122
123
|
> [!IMPORTANT]
|
|
123
124
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
124
125
|
> - Applied [petit-kernel package](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L728) to vLLM 0.11.2 and SGLang 0.5.5.post3.
|
|
125
126
|
|
|
126
|
-
| ROCm Version <br/> (Variant) | vLLM
|
|
127
|
-
|
|
128
|
-
| 7.0 | `0.12.0`, **`0.11.2`**, <br/> `0.11.0` | `0.5.6.post2` |
|
|
129
|
-
| 6.4 | `0.12.0`, **`0.11.2`**, <br/> `0.10.2` | `0.5.6.post2`, **`0.5.5.post3`** |
|
|
130
|
-
| 6.3 | `0.10.1.1`, `0.10.0`
|
|
127
|
+
| ROCm Version <br/> (Variant) | vLLM | SGLang |
|
|
128
|
+
|------------------------------|--------------------------------------------------|----------------------------------|
|
|
129
|
+
| 7.0 | `0.13.0`, `0.12.0`, **`0.11.2`**, <br/> `0.11.0` | `0.5.6.post2` |
|
|
130
|
+
| 6.4 | `0.13.0`, `0.12.0`, **`0.11.2`**, <br/> `0.10.2` | `0.5.6.post2`, **`0.5.5.post3`** |
|
|
131
|
+
| 6.3 | `0.10.1.1`, `0.10.0` | |
|
|
131
132
|
|
|
132
133
|
## Directory Structure
|
|
133
134
|
|
|
@@ -1,15 +1,15 @@
|
|
|
1
1
|
gpustack_runner/__init__.py,sha256=0_0jsxo1xjLtHTOIEU0_-A1qFEANzsVw-uXGjcILDwk,530
|
|
2
2
|
gpustack_runner/__main__.py,sha256=wtcp9lwMkaXGbQkuOY08EQhKfIHcTLSjMdnj2W3UGwk,1285
|
|
3
|
-
gpustack_runner/_version.py,sha256=
|
|
3
|
+
gpustack_runner/_version.py,sha256=yMQuvIXXVIrEIokaGWmpbjbyBqb1f3fBWlIy53iYTJs,792
|
|
4
4
|
gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
|
|
5
5
|
gpustack_runner/runner.py,sha256=GA7vy4xxaN63cFoc7_Ecft4mV5uYJe_DkQKkR1Htz3o,25881
|
|
6
|
-
gpustack_runner/runner.py.json,sha256=
|
|
6
|
+
gpustack_runner/runner.py.json,sha256=u5qDrFaiWaMgTbT6sS9tUEkI6zbR41yO1PU8QCVYT1o,39041
|
|
7
7
|
gpustack_runner/cmds/__init__.py,sha256=Os8FdvqNjLYiVn_jnDo7rFEtAeVLJJI1odKHEqWF-Fw,417
|
|
8
8
|
gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
|
|
9
9
|
gpustack_runner/cmds/images.py,sha256=cFYRCpAdGltYmwkaPmSD7ZFtjlySOTcn4vPTmnUgYwE,38070
|
|
10
|
-
gpustack_runner/_version_appendix.py,sha256=
|
|
11
|
-
gpustack_runner-0.1.22.
|
|
12
|
-
gpustack_runner-0.1.22.
|
|
13
|
-
gpustack_runner-0.1.22.
|
|
14
|
-
gpustack_runner-0.1.22.
|
|
15
|
-
gpustack_runner-0.1.22.
|
|
10
|
+
gpustack_runner/_version_appendix.py,sha256=R9iEnnU0bPP8QLeXZ7sar1vcpPEhr9X3W8R3sQFP-e4,23
|
|
11
|
+
gpustack_runner-0.1.22.post3.dist-info/METADATA,sha256=6iOpRZwepSxVaUf4iIifswJ-OZmJZAwetaK05ZtRM-A,13351
|
|
12
|
+
gpustack_runner-0.1.22.post3.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
13
|
+
gpustack_runner-0.1.22.post3.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
|
|
14
|
+
gpustack_runner-0.1.22.post3.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
|
|
15
|
+
gpustack_runner-0.1.22.post3.dist-info/RECORD,,
|
|
File without changes
|
{gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post3.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post3.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|