gpustack-runner 0.1.23__py3-none-any.whl → 0.1.23.post2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
27
27
  __commit_id__: COMMIT_ID
28
28
  commit_id: COMMIT_ID
29
29
 
30
- __version__ = version = '0.1.23'
31
- __version_tuple__ = version_tuple = (0, 1, 23)
30
+ __version__ = version = '0.1.23.post2'
31
+ __version_tuple__ = version_tuple = (0, 1, 23, 'post2')
32
32
  try:
33
33
  from ._version_appendix import git_commit
34
34
  __commit_id__ = commit_id = git_commit
@@ -1 +1 @@
1
- git_commit = "60fcf6e"
1
+ git_commit = "6d771e2"
@@ -17,7 +17,7 @@ from typing import TYPE_CHECKING
17
17
  import requests
18
18
  from dataclasses_json import dataclass_json
19
19
 
20
- from gpustack_runner import BackendRunners, list_backend_runners
20
+ from gpustack_runner import BackendRunners, envs, list_backend_runners
21
21
 
22
22
  from .__types__ import SubCommand
23
23
 
@@ -1094,6 +1094,9 @@ def list_images(**kwargs) -> list[PlatformedImage]:
1094
1094
  name = img.name
1095
1095
  if not name:
1096
1096
  continue
1097
+ if namespace := envs.GPUSTACK_RUNNER_DEFAULT_IMAGE_NAMESPACE:
1098
+ name = name.replace("gpustack/", f"{namespace}/")
1099
+ img.name = name
1097
1100
  if name not in image_names_index:
1098
1101
  image_names_index[name] = len(images)
1099
1102
  images.append(img)
gpustack_runner/envs.py CHANGED
@@ -9,7 +9,7 @@ if TYPE_CHECKING:
9
9
 
10
10
  # Global
11
11
 
12
- GPUSTACK_RUNNER_DEFAULT_NAMESPACE: str | None = None
12
+ GPUSTACK_RUNNER_DEFAULT_IMAGE_NAMESPACE: str | None = None
13
13
  """
14
14
  Namespace for default runner images.
15
15
  If not set, it should be "gpustack".
@@ -19,11 +19,12 @@ if TYPE_CHECKING:
19
19
 
20
20
  variables: dict[str, Callable[[], Any]] = {
21
21
  # Global
22
- "GPUSTACK_RUNNER_DEFAULT_NAMESPACE": lambda: trim_str(
22
+ "GPUSTACK_RUNNER_DEFAULT_IMAGE_NAMESPACE": lambda: trim_str(
23
23
  getenvs(
24
24
  keys=[
25
- "GPUSTACK_RUNNER_DEFAULT_NAMESPACE",
26
- "GPUSTACK_RUNTIME_DEPLOY_DEFAULT_NAMESPACE", ## Compatible with gpustack/gpustack_runtime.
25
+ "GPUSTACK_RUNNER_DEFAULT_IMAGE_NAMESPACE",
26
+ ## Compatible with gpustack/gpustack_runtime.
27
+ "GPUSTACK_RUNTIME_DEPLOY_DEFAULT_IMAGE_NAMESPACE",
27
28
  ],
28
29
  ),
29
30
  ),
gpustack_runner/runner.py CHANGED
@@ -239,7 +239,7 @@ def list_runners(**kwargs) -> Runners | list[dict]:
239
239
  json_list = json.load(f)
240
240
  runners = []
241
241
  for item in json_list:
242
- if namespace := envs.GPUSTACK_RUNNER_DEFAULT_NAMESPACE:
242
+ if namespace := envs.GPUSTACK_RUNNER_DEFAULT_IMAGE_NAMESPACE:
243
243
  docker_image = item["docker_image"]
244
244
  docker_image = docker_image.replace("gpustack/", f"{namespace}/")
245
245
  item["docker_image"] = docker_image
@@ -21,6 +21,17 @@
21
21
  "docker_image": "gpustack/runner:cann8.3-a3-mindie2.2.rc1",
22
22
  "deprecated": false
23
23
  },
24
+ {
25
+ "backend": "cann",
26
+ "backend_version": "8.3",
27
+ "original_backend_version": "8.3.rc2",
28
+ "backend_variant": "a3",
29
+ "service": "sglang",
30
+ "service_version": "0.5.7",
31
+ "platform": "linux/arm64",
32
+ "docker_image": "gpustack/runner:cann8.3-a3-sglang0.5.7",
33
+ "deprecated": false
34
+ },
24
35
  {
25
36
  "backend": "cann",
26
37
  "backend_version": "8.3",
@@ -230,6 +241,17 @@
230
241
  "docker_image": "gpustack/runner:cann8.3-910b-mindie2.2.rc1",
231
242
  "deprecated": false
232
243
  },
244
+ {
245
+ "backend": "cann",
246
+ "backend_version": "8.3",
247
+ "original_backend_version": "8.3.rc2",
248
+ "backend_variant": "910b",
249
+ "service": "sglang",
250
+ "service_version": "0.5.7",
251
+ "platform": "linux/arm64",
252
+ "docker_image": "gpustack/runner:cann8.3-910b-sglang0.5.7",
253
+ "deprecated": false
254
+ },
233
255
  {
234
256
  "backend": "cann",
235
257
  "backend_version": "8.3",
@@ -626,6 +648,28 @@
626
648
  "docker_image": "gpustack/runner:corex4.2-vllm0.8.3",
627
649
  "deprecated": false
628
650
  },
651
+ {
652
+ "backend": "cuda",
653
+ "backend_version": "12.9",
654
+ "original_backend_version": "12.9.1",
655
+ "backend_variant": "",
656
+ "service": "sglang",
657
+ "service_version": "0.5.7",
658
+ "platform": "linux/amd64",
659
+ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.7",
660
+ "deprecated": false
661
+ },
662
+ {
663
+ "backend": "cuda",
664
+ "backend_version": "12.9",
665
+ "original_backend_version": "12.9.1",
666
+ "backend_variant": "",
667
+ "service": "sglang",
668
+ "service_version": "0.5.7",
669
+ "platform": "linux/arm64",
670
+ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.7",
671
+ "deprecated": false
672
+ },
629
673
  {
630
674
  "backend": "cuda",
631
675
  "backend_version": "12.9",
@@ -714,6 +758,28 @@
714
758
  "docker_image": "gpustack/runner:cuda12.9-vllm0.11.2",
715
759
  "deprecated": false
716
760
  },
761
+ {
762
+ "backend": "cuda",
763
+ "backend_version": "12.8",
764
+ "original_backend_version": "12.8.1",
765
+ "backend_variant": "",
766
+ "service": "sglang",
767
+ "service_version": "0.5.7",
768
+ "platform": "linux/amd64",
769
+ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.7",
770
+ "deprecated": false
771
+ },
772
+ {
773
+ "backend": "cuda",
774
+ "backend_version": "12.8",
775
+ "original_backend_version": "12.8.1",
776
+ "backend_variant": "",
777
+ "service": "sglang",
778
+ "service_version": "0.5.7",
779
+ "platform": "linux/arm64",
780
+ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.7",
781
+ "deprecated": false
782
+ },
717
783
  {
718
784
  "backend": "cuda",
719
785
  "backend_version": "12.8",
@@ -1341,6 +1407,17 @@
1341
1407
  "docker_image": "gpustack/runner:maca3.0-vllm0.9.1",
1342
1408
  "deprecated": false
1343
1409
  },
1410
+ {
1411
+ "backend": "rocm",
1412
+ "backend_version": "7.0",
1413
+ "original_backend_version": "7.0.2",
1414
+ "backend_variant": "",
1415
+ "service": "sglang",
1416
+ "service_version": "0.5.7",
1417
+ "platform": "linux/amd64",
1418
+ "docker_image": "gpustack/runner:rocm7.0-sglang0.5.7",
1419
+ "deprecated": false
1420
+ },
1344
1421
  {
1345
1422
  "backend": "rocm",
1346
1423
  "backend_version": "7.0",
@@ -1396,6 +1473,17 @@
1396
1473
  "docker_image": "gpustack/runner:rocm7.0-vllm0.11.0",
1397
1474
  "deprecated": true
1398
1475
  },
1476
+ {
1477
+ "backend": "rocm",
1478
+ "backend_version": "6.4",
1479
+ "original_backend_version": "6.4.4",
1480
+ "backend_variant": "",
1481
+ "service": "sglang",
1482
+ "service_version": "0.5.7",
1483
+ "platform": "linux/amd64",
1484
+ "docker_image": "gpustack/runner:rocm6.4-sglang0.5.7",
1485
+ "deprecated": false
1486
+ },
1399
1487
  {
1400
1488
  "backend": "rocm",
1401
1489
  "backend_version": "6.4",
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: gpustack-runner
3
- Version: 0.1.23
3
+ Version: 0.1.23.post2
4
4
  Summary: GPUStack Runner is a library for registering runnable accelerated backends and services in GPUStack.
5
5
  Project-URL: Homepage, https://github.com/gpustack/runner
6
6
  Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
@@ -58,8 +58,8 @@ The following table lists the supported accelerated backends and their correspon
58
58
 
59
59
  | CANN Version <br/> (Variant) | MindIE | vLLM | SGLang |
60
60
  |------------------------------|--------------------------|------------------------------------------------------------|------------------------|
61
- | 8.3 (A3/910C) | `2.2.rc1` | `0.13.0`, `0.12.0`, `0.11.0` | `0.5.6.post2` |
62
- | 8.3 (910B) | `2.2.rc1` | `0.13.0`, `0.12.0`, `0.11.0` | `0.5.6.post2` |
61
+ | 8.3 (A3/910C) | `2.2.rc1` | `0.13.0`, `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
62
+ | 8.3 (910B) | `2.2.rc1` | `0.13.0`, `0.12.0`, `0.11.0` | `0.5.7`, `0.5.6.post2` |
63
63
  | 8.3 (310P) | `2.2.rc1` | | |
64
64
  | 8.2 (A3/910C) | `2.1.rc2` | `0.10.2`, `0.10.1.1` | `0.5.2`, `0.5.1.post3` |
65
65
  | 8.2 (910B) | `2.1.rc2`, ~~`2.1.rc1`~~ | `0.10.2`, `0.10.1.1`, <br/>`0.10.0`, `0.9.2`, <br/>`0.9.1` | `0.5.2`, `0.5.1.post3` |
@@ -88,12 +88,12 @@ The following table lists the supported accelerated backends and their correspon
88
88
  > - CUDA 12.6/12.4 supports Compute Capabilities:
89
89
  `7.5 8.0+PTX 8.9 9.0+PTX`.
90
90
 
91
- | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
92
- |------------------------------|---------------------------------------------------------------------------------------------------|---------------------------------------------------------------|------------------------|
93
- | 12.9 | `0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.6.post2` | |
94
- | 12.8 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, ~~`0.11.0`~~, <br/>`0.10.2`, ~~`0.10.1.1`~~, <br/>~~`0.10.0`~~ | `0.5.6.post2`, `0.5.5.post3`, <br/>~~`0.5.5`~~, `0.5.4.post3` | `0.0.21`, ~~`0.0.20`~~ |
95
- | 12.6 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, ~~`0.11.0`~~, <br/>`0.10.2`, ~~`0.10.1.1`~~, <br/>~~`0.10.0`~~ | `0.5.6.post2` | `0.0.21`, ~~`0.0.20`~~ |
96
- | 12.4 | ~~`0.11.0`~~, ~~`0.10.2`~~, <br/>~~`0.10.1.1`~~, ~~`0.10.0`~~ | | ~~`0.0.20`~~ |
91
+ | CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
92
+ |------------------------------|---------------------------------------------------------------------------------------------------|------------------------------------------------------------------------|------------------------|
93
+ | 12.9 | `0.13.0`, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` | |
94
+ | 12.8 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, ~~`0.11.0`~~, <br/>`0.10.2`, ~~`0.10.1.1`~~, <br/>~~`0.10.0`~~ | `0.5.7`, `0.5.6.post2`, `0.5.5.post3`, <br/>~~`0.5.5`~~, `0.5.4.post3` | `0.0.21`, ~~`0.0.20`~~ |
95
+ | 12.6 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, ~~`0.11.0`~~, <br/>`0.10.2`, ~~`0.10.1.1`~~, <br/>~~`0.10.0`~~ | | `0.0.21`, ~~`0.0.20`~~ |
96
+ | 12.4 | ~~`0.11.0`~~, ~~`0.10.2`~~, <br/>~~`0.10.1.1`~~, ~~`0.10.0`~~ | | ~~`0.0.20`~~ |
97
97
 
98
98
  ### Hygon DTK
99
99
 
@@ -112,8 +112,8 @@ The following table lists the supported accelerated backends and their correspon
112
112
 
113
113
  > [!CAUTION]
114
114
  > Since v0.1.23:
115
- > Deprecated all services for ROCm 6.3.
116
- > Deprecated vLLM `0.11.0`.
115
+ > - Deprecated all services for ROCm 6.3.
116
+ > - Deprecated vLLM `0.11.0`.
117
117
 
118
118
  > [!NOTE]
119
119
  > - ROCm 7.0 supports LLVM targets:
@@ -128,11 +128,11 @@ The following table lists the supported accelerated backends and their correspon
128
128
  > - ROCm 6.4 SGLang supports `gfx942` only.
129
129
  > - ROCm 7.0 SGLang supports `gfx950` only.
130
130
 
131
- | ROCm Version <br/> (Variant) | vLLM | SGLang |
132
- |------------------------------|-------------------------------------------------|------------------------------|
133
- | 7.0 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, ~~`0.11.0`~~ | `0.5.6.post2` |
134
- | 6.4 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.6.post2`, `0.5.5.post3` |
135
- | 6.3 | ~~`0.10.1.1`~~, ~~`0.10.0`~~ | |
131
+ | ROCm Version <br/> (Variant) | vLLM | SGLang |
132
+ |------------------------------|-------------------------------------------------|---------------------------------------|
133
+ | 7.0 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, ~~`0.11.0`~~ | `0.5.7`, `0.5.6.post2` |
134
+ | 6.4 | `0.13.0`, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, `0.5.5.post3` |
135
+ | 6.3 | ~~`0.10.1.1`~~, ~~`0.10.0`~~ | |
136
136
 
137
137
  ## Directory Structure
138
138
 
@@ -0,0 +1,16 @@
1
+ gpustack_runner/__init__.py,sha256=0_0jsxo1xjLtHTOIEU0_-A1qFEANzsVw-uXGjcILDwk,530
2
+ gpustack_runner/__main__.py,sha256=wtcp9lwMkaXGbQkuOY08EQhKfIHcTLSjMdnj2W3UGwk,1285
3
+ gpustack_runner/_version.py,sha256=NCM7WiXV--O7WpmrZyz6RSt8dfOM9XgSzFH_4T36QEA,792
4
+ gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
5
+ gpustack_runner/envs.py,sha256=KdRlhBAuluPXaLi_1TAoZsBjSIg78TKo2n2p67VpFUQ,2669
6
+ gpustack_runner/runner.py,sha256=gbr69aab21ZJ1iVLvK5M2ql1UeRXQmhmh3-x5DBLsfs,26154
7
+ gpustack_runner/runner.py.json,sha256=73LUrvctwiZLxZD99CoOPKPHCI6cD4qQE4zTtmWrS_I,43900
8
+ gpustack_runner/cmds/__init__.py,sha256=Os8FdvqNjLYiVn_jnDo7rFEtAeVLJJI1odKHEqWF-Fw,417
9
+ gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
10
+ gpustack_runner/cmds/images.py,sha256=76PhBP9KLkCUkyLkYQk4mvnctKzm8WJbVdW34ByE72M,38372
11
+ gpustack_runner/_version_appendix.py,sha256=KdhQh8fb2BZ6pZ-UewzDmtSgGRxfyOHxDGN6mUYIjTA,23
12
+ gpustack_runner-0.1.23.post2.dist-info/METADATA,sha256=HIn9Fveuy4JhloUnIv15c80w0FWIRh6fM7xsyHBN7DA,12967
13
+ gpustack_runner-0.1.23.post2.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
14
+ gpustack_runner-0.1.23.post2.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
15
+ gpustack_runner-0.1.23.post2.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
16
+ gpustack_runner-0.1.23.post2.dist-info/RECORD,,
@@ -1,16 +0,0 @@
1
- gpustack_runner/__init__.py,sha256=0_0jsxo1xjLtHTOIEU0_-A1qFEANzsVw-uXGjcILDwk,530
2
- gpustack_runner/__main__.py,sha256=wtcp9lwMkaXGbQkuOY08EQhKfIHcTLSjMdnj2W3UGwk,1285
3
- gpustack_runner/_version.py,sha256=K62qjl2rYPWyHlip9dUMtefmyJJ6D7jByOIPNGERJAo,777
4
- gpustack_runner/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
5
- gpustack_runner/envs.py,sha256=zxnUw42fLRZxGmcg9amVIU6SvoeXDGejcqBRggLHkVE,2630
6
- gpustack_runner/runner.py,sha256=YOaTDFQyOfF3rza6llIM_qWsMdeXyp43oXzNM1JutyQ,26148
7
- gpustack_runner/runner.py.json,sha256=So5CUA7iPG8TvLKRrtqD3p5c2WEKSKdifXPLmyNn3aI,41462
8
- gpustack_runner/cmds/__init__.py,sha256=Os8FdvqNjLYiVn_jnDo7rFEtAeVLJJI1odKHEqWF-Fw,417
9
- gpustack_runner/cmds/__types__.py,sha256=7C4kQM0EHPD8WpJpTo6kh9rEdkrYALcLQ-GAzMMsqV8,789
10
- gpustack_runner/cmds/images.py,sha256=ZbimSOqC1DRiEOl434MDugAgZ_1b66xYbpI9AUbZDxk,38194
11
- gpustack_runner/_version_appendix.py,sha256=qDsJqPC7KSnVxuj64wzviBnNEX3UXxL0YUJIn8v6Nts,23
12
- gpustack_runner-0.1.23.dist-info/METADATA,sha256=vN7evuTwPXLM5VzKvky7sQ5KYtHBaPgCEIhlKUXdkDs,12858
13
- gpustack_runner-0.1.23.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
14
- gpustack_runner-0.1.23.dist-info/entry_points.txt,sha256=M1Dxl6cY0kIgf2I4pPsV-_kU6BAtjj93spmsXAdwW3s,66
15
- gpustack_runner-0.1.23.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
16
- gpustack_runner-0.1.23.dist-info/RECORD,,