gpustack-runner 0.1.22.post2__py3-none-any.whl → 0.1.22.post4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gpustack_runner/_version.py +2 -2
- gpustack_runner/_version_appendix.py +1 -1
- gpustack_runner/runner.py.json +132 -0
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post4.dist-info}/METADATA +13 -12
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post4.dist-info}/RECORD +8 -8
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post4.dist-info}/WHEEL +0 -0
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post4.dist-info}/entry_points.txt +0 -0
- {gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post4.dist-info}/licenses/LICENSE +0 -0
gpustack_runner/_version.py
CHANGED
|
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
|
|
|
27
27
|
__commit_id__: COMMIT_ID
|
|
28
28
|
commit_id: COMMIT_ID
|
|
29
29
|
|
|
30
|
-
__version__ = version = '0.1.22.post2'
|
|
31
|
-
__version_tuple__ = version_tuple = (0, 1, 22, 'post2')
|
|
30
|
+
__version__ = version = '0.1.22.post4'
|
|
31
|
+
__version_tuple__ = version_tuple = (0, 1, 22, 'post4')
|
|
32
32
|
try:
|
|
33
33
|
from ._version_appendix import git_commit
|
|
34
34
|
__commit_id__ = commit_id = git_commit
|
|
@@ -1 +1 @@
|
|
|
1
|
-
git_commit = "
|
|
1
|
+
git_commit = "f3f4d02"
|
gpustack_runner/runner.py.json
CHANGED
|
@@ -604,6 +604,28 @@
|
|
|
604
604
|
"docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
|
|
605
605
|
"deprecated": false
|
|
606
606
|
},
|
|
607
|
+
{
|
|
608
|
+
"backend": "cuda",
|
|
609
|
+
"backend_version": "12.9",
|
|
610
|
+
"original_backend_version": "12.9.1",
|
|
611
|
+
"backend_variant": "",
|
|
612
|
+
"service": "vllm",
|
|
613
|
+
"service_version": "0.13.0",
|
|
614
|
+
"platform": "linux/amd64",
|
|
615
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.13.0",
|
|
616
|
+
"deprecated": false
|
|
617
|
+
},
|
|
618
|
+
{
|
|
619
|
+
"backend": "cuda",
|
|
620
|
+
"backend_version": "12.9",
|
|
621
|
+
"original_backend_version": "12.9.1",
|
|
622
|
+
"backend_variant": "",
|
|
623
|
+
"service": "vllm",
|
|
624
|
+
"service_version": "0.13.0",
|
|
625
|
+
"platform": "linux/arm64",
|
|
626
|
+
"docker_image": "gpustack/runner:cuda12.9-vllm0.13.0",
|
|
627
|
+
"deprecated": false
|
|
628
|
+
},
|
|
607
629
|
{
|
|
608
630
|
"backend": "cuda",
|
|
609
631
|
"backend_version": "12.9",
|
|
@@ -725,6 +747,28 @@
|
|
|
725
747
|
"docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
|
|
726
748
|
"deprecated": false
|
|
727
749
|
},
|
|
750
|
+
{
|
|
751
|
+
"backend": "cuda",
|
|
752
|
+
"backend_version": "12.8",
|
|
753
|
+
"original_backend_version": "12.8.1",
|
|
754
|
+
"backend_variant": "",
|
|
755
|
+
"service": "vllm",
|
|
756
|
+
"service_version": "0.13.0",
|
|
757
|
+
"platform": "linux/amd64",
|
|
758
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.13.0",
|
|
759
|
+
"deprecated": false
|
|
760
|
+
},
|
|
761
|
+
{
|
|
762
|
+
"backend": "cuda",
|
|
763
|
+
"backend_version": "12.8",
|
|
764
|
+
"original_backend_version": "12.8.1",
|
|
765
|
+
"backend_variant": "",
|
|
766
|
+
"service": "vllm",
|
|
767
|
+
"service_version": "0.13.0",
|
|
768
|
+
"platform": "linux/arm64",
|
|
769
|
+
"docker_image": "gpustack/runner:cuda12.8-vllm0.13.0",
|
|
770
|
+
"deprecated": false
|
|
771
|
+
},
|
|
728
772
|
{
|
|
729
773
|
"backend": "cuda",
|
|
730
774
|
"backend_version": "12.8",
|
|
@@ -857,6 +901,28 @@
|
|
|
857
901
|
"docker_image": "gpustack/runner:cuda12.8-vllm0.10.0",
|
|
858
902
|
"deprecated": false
|
|
859
903
|
},
|
|
904
|
+
{
|
|
905
|
+
"backend": "cuda",
|
|
906
|
+
"backend_version": "12.8",
|
|
907
|
+
"original_backend_version": "12.8.1",
|
|
908
|
+
"backend_variant": "",
|
|
909
|
+
"service": "voxbox",
|
|
910
|
+
"service_version": "0.0.21",
|
|
911
|
+
"platform": "linux/amd64",
|
|
912
|
+
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
|
|
913
|
+
"deprecated": false
|
|
914
|
+
},
|
|
915
|
+
{
|
|
916
|
+
"backend": "cuda",
|
|
917
|
+
"backend_version": "12.8",
|
|
918
|
+
"original_backend_version": "12.8.1",
|
|
919
|
+
"backend_variant": "",
|
|
920
|
+
"service": "voxbox",
|
|
921
|
+
"service_version": "0.0.21",
|
|
922
|
+
"platform": "linux/arm64",
|
|
923
|
+
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
|
|
924
|
+
"deprecated": false
|
|
925
|
+
},
|
|
860
926
|
{
|
|
861
927
|
"backend": "cuda",
|
|
862
928
|
"backend_version": "12.8",
|
|
@@ -879,6 +945,28 @@
|
|
|
879
945
|
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
|
|
880
946
|
"deprecated": false
|
|
881
947
|
},
|
|
948
|
+
{
|
|
949
|
+
"backend": "cuda",
|
|
950
|
+
"backend_version": "12.6",
|
|
951
|
+
"original_backend_version": "12.6.3",
|
|
952
|
+
"backend_variant": "",
|
|
953
|
+
"service": "vllm",
|
|
954
|
+
"service_version": "0.13.0",
|
|
955
|
+
"platform": "linux/amd64",
|
|
956
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.13.0",
|
|
957
|
+
"deprecated": false
|
|
958
|
+
},
|
|
959
|
+
{
|
|
960
|
+
"backend": "cuda",
|
|
961
|
+
"backend_version": "12.6",
|
|
962
|
+
"original_backend_version": "12.6.3",
|
|
963
|
+
"backend_variant": "",
|
|
964
|
+
"service": "vllm",
|
|
965
|
+
"service_version": "0.13.0",
|
|
966
|
+
"platform": "linux/arm64",
|
|
967
|
+
"docker_image": "gpustack/runner:cuda12.6-vllm0.13.0",
|
|
968
|
+
"deprecated": false
|
|
969
|
+
},
|
|
882
970
|
{
|
|
883
971
|
"backend": "cuda",
|
|
884
972
|
"backend_version": "12.6",
|
|
@@ -1011,6 +1099,28 @@
|
|
|
1011
1099
|
"docker_image": "gpustack/runner:cuda12.6-vllm0.10.0",
|
|
1012
1100
|
"deprecated": false
|
|
1013
1101
|
},
|
|
1102
|
+
{
|
|
1103
|
+
"backend": "cuda",
|
|
1104
|
+
"backend_version": "12.6",
|
|
1105
|
+
"original_backend_version": "12.6.3",
|
|
1106
|
+
"backend_variant": "",
|
|
1107
|
+
"service": "voxbox",
|
|
1108
|
+
"service_version": "0.0.21",
|
|
1109
|
+
"platform": "linux/amd64",
|
|
1110
|
+
"docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
|
|
1111
|
+
"deprecated": false
|
|
1112
|
+
},
|
|
1113
|
+
{
|
|
1114
|
+
"backend": "cuda",
|
|
1115
|
+
"backend_version": "12.6",
|
|
1116
|
+
"original_backend_version": "12.6.3",
|
|
1117
|
+
"backend_variant": "",
|
|
1118
|
+
"service": "voxbox",
|
|
1119
|
+
"service_version": "0.0.21",
|
|
1120
|
+
"platform": "linux/arm64",
|
|
1121
|
+
"docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
|
|
1122
|
+
"deprecated": false
|
|
1123
|
+
},
|
|
1014
1124
|
{
|
|
1015
1125
|
"backend": "cuda",
|
|
1016
1126
|
"backend_version": "12.6",
|
|
@@ -1198,6 +1308,17 @@
|
|
|
1198
1308
|
"docker_image": "gpustack/runner:rocm7.0-sglang0.5.6.post2",
|
|
1199
1309
|
"deprecated": false
|
|
1200
1310
|
},
|
|
1311
|
+
{
|
|
1312
|
+
"backend": "rocm",
|
|
1313
|
+
"backend_version": "7.0",
|
|
1314
|
+
"original_backend_version": "7.0.2",
|
|
1315
|
+
"backend_variant": "",
|
|
1316
|
+
"service": "vllm",
|
|
1317
|
+
"service_version": "0.13.0",
|
|
1318
|
+
"platform": "linux/amd64",
|
|
1319
|
+
"docker_image": "gpustack/runner:rocm7.0-vllm0.13.0",
|
|
1320
|
+
"deprecated": false
|
|
1321
|
+
},
|
|
1201
1322
|
{
|
|
1202
1323
|
"backend": "rocm",
|
|
1203
1324
|
"backend_version": "7.0",
|
|
@@ -1253,6 +1374,17 @@
|
|
|
1253
1374
|
"docker_image": "gpustack/runner:rocm6.4-sglang0.5.5.post3",
|
|
1254
1375
|
"deprecated": false
|
|
1255
1376
|
},
|
|
1377
|
+
{
|
|
1378
|
+
"backend": "rocm",
|
|
1379
|
+
"backend_version": "6.4",
|
|
1380
|
+
"original_backend_version": "6.4.4",
|
|
1381
|
+
"backend_variant": "",
|
|
1382
|
+
"service": "vllm",
|
|
1383
|
+
"service_version": "0.13.0",
|
|
1384
|
+
"platform": "linux/amd64",
|
|
1385
|
+
"docker_image": "gpustack/runner:rocm6.4-vllm0.13.0",
|
|
1386
|
+
"deprecated": false
|
|
1387
|
+
},
|
|
1256
1388
|
{
|
|
1257
1389
|
"backend": "rocm",
|
|
1258
1390
|
"backend_version": "6.4",
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: gpustack-runner
|
|
3
|
-
Version: 0.1.22.post2
|
|
3
|
+
Version: 0.1.22.post4
|
|
4
4
|
Summary: GPUStack Runner is library for registering runnable accelerated backends and services in GPUStack.
|
|
5
5
|
Project-URL: Homepage, https://github.com/gpustack/runner
|
|
6
6
|
Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
|
|
@@ -86,12 +86,12 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
86
86
|
> - Applied [Qwen2.5 VL patched](https://github.com/gpustack/gpustack/issues/3606) to vLLM 0.11.2.
|
|
87
87
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
88
88
|
|
|
89
|
-
| CUDA Version <br/> (Variant) | vLLM
|
|
90
|
-
|
|
91
|
-
| 12.9 | `0.12.0`,
|
|
92
|
-
| 12.8 | `0.12.0`,
|
|
93
|
-
| 12.6 | `0.12.0`,
|
|
94
|
-
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0`
|
|
89
|
+
| CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
|
|
90
|
+
|------------------------------|-------------------------------------------------------------------------------------------|-----------------------------------------------------------|--------------------|
|
|
91
|
+
| 12.9 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`** | `0.5.6.post2` | |
|
|
92
|
+
| 12.8 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2`, `0.5.5.post3`, <br/>`0.5.5`, `0.5.4.post3` | `0.0.21`, `0.0.20` |
|
|
93
|
+
| 12.6 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2` | `0.0.21`, `0.0.20` |
|
|
94
|
+
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | | `0.0.20` |
|
|
95
95
|
|
|
96
96
|
### Hygon DTK
|
|
97
97
|
|
|
@@ -118,16 +118,17 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
118
118
|
> - ROCm 7.0 vLLM `0.11.2/0.11.0` are reusing the official ROCm 6.4 PyTorch 2.9 wheel package rather than a ROCm
|
|
119
119
|
7.0 specific PyTorch build. Although supports ROCm 7.0 in vLLM `0.11.2/0.11.0`, `gfx1150/gfx1151` are not supported yet.
|
|
120
120
|
> - SGLang supports `gfx942` only.
|
|
121
|
+
> - ROCm 6.4 vLLM `0.13.0` supports `gfx903 gfx90a gfx942` only.
|
|
121
122
|
|
|
122
123
|
> [!IMPORTANT]
|
|
123
124
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
124
125
|
> - Applied [petit-kernel package](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L728) to vLLM 0.11.2 and SGLang 0.5.5.post3.
|
|
125
126
|
|
|
126
|
-
| ROCm Version <br/> (Variant) | vLLM
|
|
127
|
-
|
|
128
|
-
| 7.0 | `0.12.0`,
|
|
129
|
-
| 6.4 | `0.12.0`,
|
|
130
|
-
| 6.3 | `0.10.1.1`, `0.10.0`
|
|
127
|
+
| ROCm Version <br/> (Variant) | vLLM | SGLang |
|
|
128
|
+
|------------------------------|-------------------------------------------------|----------------------------------|
|
|
129
|
+
| 7.0 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0` | `0.5.6.post2` |
|
|
130
|
+
| 6.4 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.10.2` | `0.5.6.post2`, **`0.5.5.post3`** |
|
|
131
|
+
| 6.3 | `0.10.1.1`, `0.10.0` | |
|
|
131
132
|
|
|
132
133
|
## Directory Structure
|
|
133
134
|
|
|
@@ -1,15 +1,15 @@
|
|
|
1
1
|
gpustack_runner/__init__.py,sha256=0_0jsxo1xjLtHTOIEU0_-A1qFEANzsVw-uXGjcILDwk,530
|
|
2
2
|
gpustack_runner/__main__.py,sha256=wtcp9lwMkaXGbQkuOY08EQhKfIHcTLSjMdnj2W3UGwk,1285
|
|
3
|
-
gpustack_runner/_version.py,sha256=
|
|
3
|
+
gpustack_runner/_version.py,sha256=Uo5gbkPte64mZ6Lli6u4vxJKezjCqo4IDrSelelU37g,792
|
|
4
4
|
gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
|
|
5
5
|
gpustack_runner/runner.py,sha256=GA7vy4xxaN63cFoc7_Ecft4mV5uYJe_DkQKkR1Htz3o,25881
|
|
6
|
-
gpustack_runner/runner.py.json,sha256=
|
|
6
|
+
gpustack_runner/runner.py.json,sha256=cwWroAmmvF1H9mT1tOPmWAZESKeclUd67EqOEBlCvs0,40265
|
|
7
7
|
gpustack_runner/cmds/__init__.py,sha256=Os8FdvqNjLYiVn_jnDo7rFEtAeVLJJI1odKHEqWF-Fw,417
|
|
8
8
|
gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
|
|
9
9
|
gpustack_runner/cmds/images.py,sha256=cFYRCpAdGltYmwkaPmSD7ZFtjlySOTcn4vPTmnUgYwE,38070
|
|
10
|
-
gpustack_runner/_version_appendix.py,sha256=
|
|
11
|
-
gpustack_runner-0.1.22.
|
|
12
|
-
gpustack_runner-0.1.22.
|
|
13
|
-
gpustack_runner-0.1.22.
|
|
14
|
-
gpustack_runner-0.1.22.
|
|
15
|
-
gpustack_runner-0.1.22.
|
|
10
|
+
gpustack_runner/_version_appendix.py,sha256=AE3f-puqLLOMhjdFlFuVpzA08xMz64uAy3mgO5-nf6I,23
|
|
11
|
+
gpustack_runner-0.1.22.post4.dist-info/METADATA,sha256=xQiljvJ5FPHgqZEgW2dNvoplsOMNiOQ9mdyETO0pQME,13436
|
|
12
|
+
gpustack_runner-0.1.22.post4.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
13
|
+
gpustack_runner-0.1.22.post4.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
|
|
14
|
+
gpustack_runner-0.1.22.post4.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
|
|
15
|
+
gpustack_runner-0.1.22.post4.dist-info/RECORD,,
|
|
File without changes
|
{gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post4.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{gpustack_runner-0.1.22.post2.dist-info → gpustack_runner-0.1.22.post4.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|