gpustack-runner 0.1.22.post2__py3-none-any.whl → 0.1.22.post4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
27
27
  __commit_id__: COMMIT_ID
28
28
  commit_id: COMMIT_ID
29
29
 
30
- __version__ = version = '0.1.22.post2'
31
- __version_tuple__ = version_tuple = (0, 1, 22, 'post2')
30
+ __version__ = version = '0.1.22.post4'
31
+ __version_tuple__ = version_tuple = (0, 1, 22, 'post4')
32
32
  try:
33
33
  from ._version_appendix import git_commit
34
34
  __commit_id__ = commit_id = git_commit
@@ -1 +1 @@
1
- git_commit = "457b969"
1
+ git_commit = "f3f4d02"
@@ -604,6 +604,28 @@
604
604
  "docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2",
605
605
  "deprecated": false
606
606
  },
607
+ {
608
+ "backend": "cuda",
609
+ "backend_version": "12.9",
610
+ "original_backend_version": "12.9.1",
611
+ "backend_variant": "",
612
+ "service": "vllm",
613
+ "service_version": "0.13.0",
614
+ "platform": "linux/amd64",
615
+ "docker_image": "gpustack/runner:cuda12.9-vllm0.13.0",
616
+ "deprecated": false
617
+ },
618
+ {
619
+ "backend": "cuda",
620
+ "backend_version": "12.9",
621
+ "original_backend_version": "12.9.1",
622
+ "backend_variant": "",
623
+ "service": "vllm",
624
+ "service_version": "0.13.0",
625
+ "platform": "linux/arm64",
626
+ "docker_image": "gpustack/runner:cuda12.9-vllm0.13.0",
627
+ "deprecated": false
628
+ },
607
629
  {
608
630
  "backend": "cuda",
609
631
  "backend_version": "12.9",
@@ -725,6 +747,28 @@
725
747
  "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3",
726
748
  "deprecated": false
727
749
  },
750
+ {
751
+ "backend": "cuda",
752
+ "backend_version": "12.8",
753
+ "original_backend_version": "12.8.1",
754
+ "backend_variant": "",
755
+ "service": "vllm",
756
+ "service_version": "0.13.0",
757
+ "platform": "linux/amd64",
758
+ "docker_image": "gpustack/runner:cuda12.8-vllm0.13.0",
759
+ "deprecated": false
760
+ },
761
+ {
762
+ "backend": "cuda",
763
+ "backend_version": "12.8",
764
+ "original_backend_version": "12.8.1",
765
+ "backend_variant": "",
766
+ "service": "vllm",
767
+ "service_version": "0.13.0",
768
+ "platform": "linux/arm64",
769
+ "docker_image": "gpustack/runner:cuda12.8-vllm0.13.0",
770
+ "deprecated": false
771
+ },
728
772
  {
729
773
  "backend": "cuda",
730
774
  "backend_version": "12.8",
@@ -857,6 +901,28 @@
857
901
  "docker_image": "gpustack/runner:cuda12.8-vllm0.10.0",
858
902
  "deprecated": false
859
903
  },
904
+ {
905
+ "backend": "cuda",
906
+ "backend_version": "12.8",
907
+ "original_backend_version": "12.8.1",
908
+ "backend_variant": "",
909
+ "service": "voxbox",
910
+ "service_version": "0.0.21",
911
+ "platform": "linux/amd64",
912
+ "docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
913
+ "deprecated": false
914
+ },
915
+ {
916
+ "backend": "cuda",
917
+ "backend_version": "12.8",
918
+ "original_backend_version": "12.8.1",
919
+ "backend_variant": "",
920
+ "service": "voxbox",
921
+ "service_version": "0.0.21",
922
+ "platform": "linux/arm64",
923
+ "docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
924
+ "deprecated": false
925
+ },
860
926
  {
861
927
  "backend": "cuda",
862
928
  "backend_version": "12.8",
@@ -879,6 +945,28 @@
879
945
  "docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20",
880
946
  "deprecated": false
881
947
  },
948
+ {
949
+ "backend": "cuda",
950
+ "backend_version": "12.6",
951
+ "original_backend_version": "12.6.3",
952
+ "backend_variant": "",
953
+ "service": "vllm",
954
+ "service_version": "0.13.0",
955
+ "platform": "linux/amd64",
956
+ "docker_image": "gpustack/runner:cuda12.6-vllm0.13.0",
957
+ "deprecated": false
958
+ },
959
+ {
960
+ "backend": "cuda",
961
+ "backend_version": "12.6",
962
+ "original_backend_version": "12.6.3",
963
+ "backend_variant": "",
964
+ "service": "vllm",
965
+ "service_version": "0.13.0",
966
+ "platform": "linux/arm64",
967
+ "docker_image": "gpustack/runner:cuda12.6-vllm0.13.0",
968
+ "deprecated": false
969
+ },
882
970
  {
883
971
  "backend": "cuda",
884
972
  "backend_version": "12.6",
@@ -1011,6 +1099,28 @@
1011
1099
  "docker_image": "gpustack/runner:cuda12.6-vllm0.10.0",
1012
1100
  "deprecated": false
1013
1101
  },
1102
+ {
1103
+ "backend": "cuda",
1104
+ "backend_version": "12.6",
1105
+ "original_backend_version": "12.6.3",
1106
+ "backend_variant": "",
1107
+ "service": "voxbox",
1108
+ "service_version": "0.0.21",
1109
+ "platform": "linux/amd64",
1110
+ "docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
1111
+ "deprecated": false
1112
+ },
1113
+ {
1114
+ "backend": "cuda",
1115
+ "backend_version": "12.6",
1116
+ "original_backend_version": "12.6.3",
1117
+ "backend_variant": "",
1118
+ "service": "voxbox",
1119
+ "service_version": "0.0.21",
1120
+ "platform": "linux/arm64",
1121
+ "docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
1122
+ "deprecated": false
1123
+ },
1014
1124
  {
1015
1125
  "backend": "cuda",
1016
1126
  "backend_version": "12.6",
@@ -1198,6 +1308,17 @@
1198
1308
  "docker_image": "gpustack/runner:rocm7.0-sglang0.5.6.post2",
1199
1309
  "deprecated": false
1200
1310
  },
1311
+ {
1312
+ "backend": "rocm",
1313
+ "backend_version": "7.0",
1314
+ "original_backend_version": "7.0.2",
1315
+ "backend_variant": "",
1316
+ "service": "vllm",
1317
+ "service_version": "0.13.0",
1318
+ "platform": "linux/amd64",
1319
+ "docker_image": "gpustack/runner:rocm7.0-vllm0.13.0",
1320
+ "deprecated": false
1321
+ },
1201
1322
  {
1202
1323
  "backend": "rocm",
1203
1324
  "backend_version": "7.0",
@@ -1253,6 +1374,17 @@
1253
1374
  "docker_image": "gpustack/runner:rocm6.4-sglang0.5.5.post3",
1254
1375
  "deprecated": false
1255
1376
  },
1377
+ {
1378
+ "backend": "rocm",
1379
+ "backend_version": "6.4",
1380
+ "original_backend_version": "6.4.4",
1381
+ "backend_variant": "",
1382
+ "service": "vllm",
1383
+ "service_version": "0.13.0",
1384
+ "platform": "linux/amd64",
1385
+ "docker_image": "gpustack/runner:rocm6.4-vllm0.13.0",
1386
+ "deprecated": false
1387
+ },
1256
1388
  {
1257
1389
  "backend": "rocm",
1258
1390
  "backend_version": "6.4",
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: gpustack-runner
3
- Version: 0.1.22.post2
3
+ Version: 0.1.22.post4
4
4
  Summary: GPUStack Runner is a library for registering runnable accelerated backends and services in GPUStack.
5
5
  Project-URL: Homepage, https://github.com/gpustack/runner
6
6
  Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
@@ -86,12 +86,12 @@ The following table lists the supported accelerated backends and their correspon
86
86
  > - Applied the [Qwen2.5 VL patch](https://github.com/gpustack/gpustack/issues/3606) to vLLM 0.11.2.
87
87
  > - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
88
88
 
89
- | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
90
- |------------------------------|----------------------------------------------------------------------------|-----------------------------------------------------------|----------|
91
- | 12.9 | `0.12.0`, **`0.11.2`** | `0.5.6.post2` | |
92
- | 12.8 | `0.12.0`, **`0.11.2`**, <br/>`0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | `0.5.6.post2`, `0.5.5.post3`, <br/>`0.5.5`, `0.5.4.post3` | `0.0.20` |
93
- | 12.6 | `0.12.0`, **`0.11.2`**, <br/>`0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | `0.5.6.post2` | `0.0.20` |
94
- | 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | | `0.0.20` |
89
+ | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
90
+ |------------------------------|-------------------------------------------------------------------------------------------|-----------------------------------------------------------|--------------------|
91
+ | 12.9 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`** | `0.5.6.post2` | |
92
+ | 12.8 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2`, `0.5.5.post3`, <br/>`0.5.5`, `0.5.4.post3` | `0.0.21`, `0.0.20` |
93
+ | 12.6 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2` | `0.0.21`, `0.0.20` |
94
+ | 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | | `0.0.20` |
95
95
 
96
96
  ### Hygon DTK
97
97
 
@@ -118,16 +118,17 @@ The following table lists the supported accelerated backends and their correspon
118
118
  > - ROCm 7.0 vLLM `0.11.2/0.11.0` are reusing the official ROCm 6.4 PyTorch 2.9 wheel package rather than a ROCm
119
119
  7.0-specific PyTorch build. Although vLLM `0.11.2/0.11.0` supports ROCm 7.0, `gfx1150/gfx1151` are not supported yet.
120
120
  > - SGLang supports `gfx942` only.
121
+ > - ROCm 6.4 vLLM `0.13.0` supports `gfx903 gfx90a gfx942` only.
121
122
 
122
123
  > [!IMPORTANT]
123
124
  > - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
124
125
  > - Applied [petit-kernel package](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L728) to vLLM 0.11.2 and SGLang 0.5.5.post3.
125
126
 
126
- | ROCm Version <br/> (Variant) | vLLM | SGLang |
127
- |------------------------------|----------------------------------------|----------------------------------|
128
- | 7.0 | `0.12.0`, **`0.11.2`**, <br/> `0.11.0` | `0.5.6.post2` |
129
- | 6.4 | `0.12.0`, **`0.11.2`**, <br/> `0.10.2` | `0.5.6.post2`, **`0.5.5.post3`** |
130
- | 6.3 | `0.10.1.1`, `0.10.0` | |
127
+ | ROCm Version <br/> (Variant) | vLLM | SGLang |
128
+ |------------------------------|-------------------------------------------------|----------------------------------|
129
+ | 7.0 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0` | `0.5.6.post2` |
130
+ | 6.4 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.10.2` | `0.5.6.post2`, **`0.5.5.post3`** |
131
+ | 6.3 | `0.10.1.1`, `0.10.0` | |
131
132
 
132
133
  ## Directory Structure
133
134
 
@@ -1,15 +1,15 @@
1
1
  gpustack_runner/__init__.py,sha256=0_0jsxo1xjLtHTOIEU0_-A1qFEANzsVw-uXGjcILDwk,530
2
2
  gpustack_runner/__main__.py,sha256=wtcp9lwMkaXGbQkuOY08EQhKfIHcTLSjMdnj2W3UGwk,1285
3
- gpustack_runner/_version.py,sha256=LIZgKDndjY7aBblOIWVBp1kX7REnWumpt3NiKrySvD0,792
3
+ gpustack_runner/_version.py,sha256=Uo5gbkPte64mZ6Lli6u4vxJKezjCqo4IDrSelelU37g,792
4
4
  gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
5
5
  gpustack_runner/runner.py,sha256=GA7vy4xxaN63cFoc7_Ecft4mV5uYJe_DkQKkR1Htz3o,25881
6
- gpustack_runner/runner.py.json,sha256=L3C0vShTvyT0Dd-w7QCrXgpK5at5_6txVzcruALqdto,36631
6
+ gpustack_runner/runner.py.json,sha256=cwWroAmmvF1H9mT1tOPmWAZESKeclUd67EqOEBlCvs0,40265
7
7
  gpustack_runner/cmds/__init__.py,sha256=Os8FdvqNjLYiVn_jnDo7rFEtAeVLJJI1odKHEqWF-Fw,417
8
8
  gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
9
9
  gpustack_runner/cmds/images.py,sha256=cFYRCpAdGltYmwkaPmSD7ZFtjlySOTcn4vPTmnUgYwE,38070
10
- gpustack_runner/_version_appendix.py,sha256=XKK-W1kMdR03nZKV9G_voKhXTk0-OL-q4t4RaELHYE8,23
11
- gpustack_runner-0.1.22.post2.dist-info/METADATA,sha256=Z427l0rI4YNnAStdhzVOu-rl9hpCfjtPKgtjjPiCE98,13176
12
- gpustack_runner-0.1.22.post2.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
13
- gpustack_runner-0.1.22.post2.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
14
- gpustack_runner-0.1.22.post2.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
15
- gpustack_runner-0.1.22.post2.dist-info/RECORD,,
10
+ gpustack_runner/_version_appendix.py,sha256=AE3f-puqLLOMhjdFlFuVpzA08xMz64uAy3mgO5-nf6I,23
11
+ gpustack_runner-0.1.22.post4.dist-info/METADATA,sha256=xQiljvJ5FPHgqZEgW2dNvoplsOMNiOQ9mdyETO0pQME,13436
12
+ gpustack_runner-0.1.22.post4.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
13
+ gpustack_runner-0.1.22.post4.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
14
+ gpustack_runner-0.1.22.post4.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
15
+ gpustack_runner-0.1.22.post4.dist-info/RECORD,,