gpustack-runner 0.1.22.post3__tar.gz → 0.1.22.post4__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/PKG-INFO +12 -12
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/README.md +11 -11
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/_version.py +2 -2
- gpustack_runner-0.1.22.post4/gpustack_runner/_version_appendix.py +1 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/runner.py.json +44 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/cuda/Dockerfile +1 -1
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/matrix.yaml +0 -1
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json +44 -0
- gpustack_runner-0.1.22.post3/gpustack_runner/_version_appendix.py +0 -1
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/.codespelldict +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/.codespellrc +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/.gitattributes +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/.gitignore +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/.pre-commit-config.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/.python-version +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/LICENSE +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/Makefile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/docs/index.md +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/docs/modules/gpustack_runner.md +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/__init__.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/__main__.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/_version.pyi +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/cmds/__init__.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/cmds/__types__.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/cmds/images.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/runner.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/hatch.toml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/mkdocs.yml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251020_vllm_install_lmcache/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251020_vllm_install_lmcache/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251020_vllm_install_lmcache/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251020_vllm_install_lmcache/rocm/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251022_vllm_install_ray_client/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251022_vllm_install_ray_client/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251022_vllm_install_ray_client/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251022_vllm_install_ray_client/rocm/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251022_vllm_install_ray_default/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251022_vllm_install_ray_default/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251022_vllm_install_ray_default/rocm/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251024_vllm_install_nvidia_hpcx/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251024_vllm_install_nvidia_hpcx/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251024_vllm_reinstall_lmcache/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251024_vllm_reinstall_lmcache/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251029_vllm_reinstall_ray/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251029_vllm_reinstall_ray/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251103_mindie_refresh_entrypoint/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251103_mindie_refresh_entrypoint/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251105_vllm_polish_nvidia_hpcx/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251105_vllm_polish_nvidia_hpcx/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251106_vllm_install_ep_kernel/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251106_vllm_install_ep_kernel/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251107_vllm_reinstall_lmcache/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251107_vllm_reinstall_lmcache/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251110_sglang_install_diffusion/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251110_sglang_install_diffusion/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251110_sglang_install_flashattn/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251110_sglang_install_flashattn/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251125_mindie_install_posix_ipc/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251125_mindie_install_posix_ipc/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251201_vllm_patch_qwen2_5_vl/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251201_vllm_patch_qwen2_5_vl/cuda/patches/vllm_001_disable_flashatten_in_qwen2_5_vl.patch +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251201_vllm_patch_qwen2_5_vl/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251209_mindie_install_av/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251209_mindie_install_av/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251213_mindie_patch_minicpm_qwen2_v2/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251213_mindie_patch_minicpm_qwen2_v2/cann/patches.zip +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251213_mindie_patch_minicpm_qwen2_v2/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251213_sglang_patch_server_args/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251213_sglang_patch_server_args/cuda/patches/sglang_001_fix_server_args.patch +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251213_sglang_patch_server_args/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251214_cuda_several_patches/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251214_cuda_several_patches/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251215_cann_several_patches/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251215_cann_several_patches/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251216_sglang_uninstall_runai_model_streamer/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251216_sglang_uninstall_runai_model_streamer/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251219_rocm_install_petit_kernel/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251219_rocm_install_petit_kernel/rocm/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251219_vllm_install_audio_extra/cuda/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251219_vllm_install_audio_extra/matrix.yaml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/20251219_vllm_install_audio_extra/rocm/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/README.md +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/cann/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/cann/mindie-atb-models_2.2.rc1_linux-amd64_py3.11_torch2.1.0-abi0.tar.gz +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/cann/mindie-atb-models_2.2.rc1_linux-arm64_py3.11_torch2.1.0-abi0.tar.gz +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/cann/patches/mindie.zip +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/corex/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/discard_runner.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/dtk/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/expand_matrix.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/maca/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/merge_runner.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/prune_runner.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/rocm/Dockerfile +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/rocm/patches/sglang_001_wrong_vram.patch +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pyproject.toml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pytest.ini +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/ruff.toml +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/fixtures/__init__.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/fixtures/test_docker_image.json +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/fixtures/test_list_backend_runners.json +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/fixtures/test_list_runners_by_prefix.json +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/fixtures/test_list_service_runners.json +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/test_runner.py +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/activate +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_current_date_time.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_get_temperature.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_get_weather.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_square_of_number.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_square_root_of_number.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_where_am_i.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/run_runner.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/run_runner_cluster.sh +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/uv.lock +0 -0
- {gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/uv.toml +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: gpustack-runner
|
|
3
|
-
Version: 0.1.22.post3
|
|
3
|
+
Version: 0.1.22.post4
|
|
4
4
|
Summary: GPUStack Runner is library for registering runnable accelerated backends and services in GPUStack.
|
|
5
5
|
Project-URL: Homepage, https://github.com/gpustack/runner
|
|
6
6
|
Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
|
|
@@ -86,12 +86,12 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
86
86
|
> - Applied [Qwen2.5 VL patched](https://github.com/gpustack/gpustack/issues/3606) to vLLM 0.11.2.
|
|
87
87
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
88
88
|
|
|
89
|
-
| CUDA Version <br/> (Variant) | vLLM
|
|
90
|
-
|
|
91
|
-
| 12.9 | `0.13.0`, `0.12.0`,
|
|
92
|
-
| 12.8 | `0.13.0`, `0.12.0`,
|
|
93
|
-
| 12.6 | `0.13.0`, `0.12.0`,
|
|
94
|
-
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0`
|
|
89
|
+
| CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
|
|
90
|
+
|------------------------------|-------------------------------------------------------------------------------------------|-----------------------------------------------------------|--------------------|
|
|
91
|
+
| 12.9 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`** | `0.5.6.post2` | |
|
|
92
|
+
| 12.8 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2`, `0.5.5.post3`, <br/>`0.5.5`, `0.5.4.post3` | `0.0.21`, `0.0.20` |
|
|
93
|
+
| 12.6 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2` | `0.0.21`, `0.0.20` |
|
|
94
|
+
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | | `0.0.20` |
|
|
95
95
|
|
|
96
96
|
### Hygon DTK
|
|
97
97
|
|
|
@@ -124,11 +124,11 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
124
124
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
125
125
|
> - Applied [petit-kernel package](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L728) to vLLM 0.11.2 and SGLang 0.5.5.post3.
|
|
126
126
|
|
|
127
|
-
| ROCm Version <br/> (Variant) | vLLM
|
|
128
|
-
|
|
129
|
-
| 7.0 | `0.13.0`, `0.12.0`,
|
|
130
|
-
| 6.4 | `0.13.0`, `0.12.0`,
|
|
131
|
-
| 6.3 | `0.10.1.1`, `0.10.0`
|
|
127
|
+
| ROCm Version <br/> (Variant) | vLLM | SGLang |
|
|
128
|
+
|------------------------------|-------------------------------------------------|----------------------------------|
|
|
129
|
+
| 7.0 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0` | `0.5.6.post2` |
|
|
130
|
+
| 6.4 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.10.2` | `0.5.6.post2`, **`0.5.5.post3`** |
|
|
131
|
+
| 6.3 | `0.10.1.1`, `0.10.0` | |
|
|
132
132
|
|
|
133
133
|
## Directory Structure
|
|
134
134
|
|
|
@@ -66,12 +66,12 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
66
66
|
> - Applied [Qwen2.5 VL patched](https://github.com/gpustack/gpustack/issues/3606) to vLLM 0.11.2.
|
|
67
67
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
68
68
|
|
|
69
|
-
| CUDA Version <br/> (Variant) | vLLM
|
|
70
|
-
|
|
71
|
-
| 12.9 | `0.13.0`, `0.12.0`,
|
|
72
|
-
| 12.8 | `0.13.0`, `0.12.0`,
|
|
73
|
-
| 12.6 | `0.13.0`, `0.12.0`,
|
|
74
|
-
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0`
|
|
69
|
+
| CUDA Version <br/> (Variant) | vLLM | SGLang | VoxBox |
|
|
70
|
+
|------------------------------|-------------------------------------------------------------------------------------------|-----------------------------------------------------------|--------------------|
|
|
71
|
+
| 12.9 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`** | `0.5.6.post2` | |
|
|
72
|
+
| 12.8 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2`, `0.5.5.post3`, <br/>`0.5.5`, `0.5.4.post3` | `0.0.21`, `0.0.20` |
|
|
73
|
+
| 12.6 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0`, <br/>`0.10.2`, `0.10.1.1`, <br/>`0.10.0` | `0.5.6.post2` | `0.0.21`, `0.0.20` |
|
|
74
|
+
| 12.4 | `0.11.0`, `0.10.2`, <br/>`0.10.1.1`, `0.10.0` | | `0.0.20` |
|
|
75
75
|
|
|
76
76
|
### Hygon DTK
|
|
77
77
|
|
|
@@ -104,11 +104,11 @@ The following table lists the supported accelerated backends and their correspon
|
|
|
104
104
|
> - Applied [vLLM[audio] packages](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L720-L724) to vLLM 0.11.2.
|
|
105
105
|
> - Applied [petit-kernel package](https://github.com/vllm-project/vllm/blob/275de34170654274616082721348b7edd9741d32/setup.py#L728) to vLLM 0.11.2 and SGLang 0.5.5.post3.
|
|
106
106
|
|
|
107
|
-
| ROCm Version <br/> (Variant) | vLLM
|
|
108
|
-
|
|
109
|
-
| 7.0 | `0.13.0`, `0.12.0`,
|
|
110
|
-
| 6.4 | `0.13.0`, `0.12.0`,
|
|
111
|
-
| 6.3 | `0.10.1.1`, `0.10.0`
|
|
107
|
+
| ROCm Version <br/> (Variant) | vLLM | SGLang |
|
|
108
|
+
|------------------------------|-------------------------------------------------|----------------------------------|
|
|
109
|
+
| 7.0 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.11.0` | `0.5.6.post2` |
|
|
110
|
+
| 6.4 | `0.13.0`, `0.12.0`, <br/>**`0.11.2`**, `0.10.2` | `0.5.6.post2`, **`0.5.5.post3`** |
|
|
111
|
+
| 6.3 | `0.10.1.1`, `0.10.0` | |
|
|
112
112
|
|
|
113
113
|
## Directory Structure
|
|
114
114
|
|
|
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
|
|
|
27
27
|
__commit_id__: COMMIT_ID
|
|
28
28
|
commit_id: COMMIT_ID
|
|
29
29
|
|
|
30
|
-
__version__ = version = '0.1.22.post3'
|
|
31
|
-
__version_tuple__ = version_tuple = (0, 1, 22, 'post3')
|
|
30
|
+
__version__ = version = '0.1.22.post4'
|
|
31
|
+
__version_tuple__ = version_tuple = (0, 1, 22, 'post4')
|
|
32
32
|
try:
|
|
33
33
|
from ._version_appendix import git_commit
|
|
34
34
|
__commit_id__ = commit_id = git_commit
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
git_commit = "f3f4d02"
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/runner.py.json
RENAMED
|
@@ -901,6 +901,28 @@
|
|
|
901
901
|
"docker_image": "gpustack/runner:cuda12.8-vllm0.10.0",
|
|
902
902
|
"deprecated": false
|
|
903
903
|
},
|
|
904
|
+
{
|
|
905
|
+
"backend": "cuda",
|
|
906
|
+
"backend_version": "12.8",
|
|
907
|
+
"original_backend_version": "12.8.1",
|
|
908
|
+
"backend_variant": "",
|
|
909
|
+
"service": "voxbox",
|
|
910
|
+
"service_version": "0.0.21",
|
|
911
|
+
"platform": "linux/amd64",
|
|
912
|
+
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
|
|
913
|
+
"deprecated": false
|
|
914
|
+
},
|
|
915
|
+
{
|
|
916
|
+
"backend": "cuda",
|
|
917
|
+
"backend_version": "12.8",
|
|
918
|
+
"original_backend_version": "12.8.1",
|
|
919
|
+
"backend_variant": "",
|
|
920
|
+
"service": "voxbox",
|
|
921
|
+
"service_version": "0.0.21",
|
|
922
|
+
"platform": "linux/arm64",
|
|
923
|
+
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
|
|
924
|
+
"deprecated": false
|
|
925
|
+
},
|
|
904
926
|
{
|
|
905
927
|
"backend": "cuda",
|
|
906
928
|
"backend_version": "12.8",
|
|
@@ -1077,6 +1099,28 @@
|
|
|
1077
1099
|
"docker_image": "gpustack/runner:cuda12.6-vllm0.10.0",
|
|
1078
1100
|
"deprecated": false
|
|
1079
1101
|
},
|
|
1102
|
+
{
|
|
1103
|
+
"backend": "cuda",
|
|
1104
|
+
"backend_version": "12.6",
|
|
1105
|
+
"original_backend_version": "12.6.3",
|
|
1106
|
+
"backend_variant": "",
|
|
1107
|
+
"service": "voxbox",
|
|
1108
|
+
"service_version": "0.0.21",
|
|
1109
|
+
"platform": "linux/amd64",
|
|
1110
|
+
"docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
|
|
1111
|
+
"deprecated": false
|
|
1112
|
+
},
|
|
1113
|
+
{
|
|
1114
|
+
"backend": "cuda",
|
|
1115
|
+
"backend_version": "12.6",
|
|
1116
|
+
"original_backend_version": "12.6.3",
|
|
1117
|
+
"backend_variant": "",
|
|
1118
|
+
"service": "voxbox",
|
|
1119
|
+
"service_version": "0.0.21",
|
|
1120
|
+
"platform": "linux/arm64",
|
|
1121
|
+
"docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
|
|
1122
|
+
"deprecated": false
|
|
1123
|
+
},
|
|
1080
1124
|
{
|
|
1081
1125
|
"backend": "cuda",
|
|
1082
1126
|
"backend_version": "12.6",
|
|
@@ -95,7 +95,7 @@ ARG CMAKE_MAX_JOBS
|
|
|
95
95
|
ARG CUDA_VERSION=12.9.1
|
|
96
96
|
ARG CUDA_ARCHS
|
|
97
97
|
ARG VOXBOX_BASE_IMAGE=gpustack/runner:cuda${CUDA_VERSION}-python${PYTHON_VERSION}
|
|
98
|
-
ARG VOXBOX_VERSION=0.0.20
|
|
98
|
+
ARG VOXBOX_VERSION=0.0.21
|
|
99
99
|
ARG VOXBOX_TORCH_VERSION=2.7.1
|
|
100
100
|
ARG VOXBOX_TORCH_CUDA_VERSION=${CUDA_VERSION}
|
|
101
101
|
ARG VLLM_BASE_IMAGE=gpustack/runner:cuda${CUDA_VERSION}-python${PYTHON_VERSION}
|
|
@@ -923,6 +923,28 @@
|
|
|
923
923
|
"docker_image": "gpustack/runner:cuda12.8-vllm0.10.0",
|
|
924
924
|
"deprecated": false
|
|
925
925
|
},
|
|
926
|
+
{
|
|
927
|
+
"backend": "cuda",
|
|
928
|
+
"backend_version": "12.8",
|
|
929
|
+
"original_backend_version": "12.8.1",
|
|
930
|
+
"backend_variant": "",
|
|
931
|
+
"service": "voxbox",
|
|
932
|
+
"service_version": "0.0.21",
|
|
933
|
+
"platform": "linux/amd64",
|
|
934
|
+
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
|
|
935
|
+
"deprecated": false
|
|
936
|
+
},
|
|
937
|
+
{
|
|
938
|
+
"backend": "cuda",
|
|
939
|
+
"backend_version": "12.8",
|
|
940
|
+
"original_backend_version": "12.8.1",
|
|
941
|
+
"backend_variant": "",
|
|
942
|
+
"service": "voxbox",
|
|
943
|
+
"service_version": "0.0.21",
|
|
944
|
+
"platform": "linux/arm64",
|
|
945
|
+
"docker_image": "gpustack/runner:cuda12.8-voxbox0.0.21",
|
|
946
|
+
"deprecated": false
|
|
947
|
+
},
|
|
926
948
|
{
|
|
927
949
|
"backend": "cuda",
|
|
928
950
|
"backend_version": "12.8",
|
|
@@ -1099,6 +1121,28 @@
|
|
|
1099
1121
|
"docker_image": "gpustack/runner:cuda12.6-vllm0.10.0",
|
|
1100
1122
|
"deprecated": false
|
|
1101
1123
|
},
|
|
1124
|
+
{
|
|
1125
|
+
"backend": "cuda",
|
|
1126
|
+
"backend_version": "12.6",
|
|
1127
|
+
"original_backend_version": "12.6.3",
|
|
1128
|
+
"backend_variant": "",
|
|
1129
|
+
"service": "voxbox",
|
|
1130
|
+
"service_version": "0.0.21",
|
|
1131
|
+
"platform": "linux/amd64",
|
|
1132
|
+
"docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
|
|
1133
|
+
"deprecated": false
|
|
1134
|
+
},
|
|
1135
|
+
{
|
|
1136
|
+
"backend": "cuda",
|
|
1137
|
+
"backend_version": "12.6",
|
|
1138
|
+
"original_backend_version": "12.6.3",
|
|
1139
|
+
"backend_variant": "",
|
|
1140
|
+
"service": "voxbox",
|
|
1141
|
+
"service_version": "0.0.21",
|
|
1142
|
+
"platform": "linux/arm64",
|
|
1143
|
+
"docker_image": "gpustack/runner:cuda12.6-voxbox0.0.21",
|
|
1144
|
+
"deprecated": false
|
|
1145
|
+
},
|
|
1102
1146
|
{
|
|
1103
1147
|
"backend": "cuda",
|
|
1104
1148
|
"backend_version": "12.6",
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
git_commit = "c9f91c3"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/docs/modules/gpustack_runner.md
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/cmds/__init__.py
RENAMED
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/cmds/__types__.py
RENAMED
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/gpustack_runner/cmds/images.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/pack/.post_operation/README.md
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tests/gpustack_runner/test_runner.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_current_date_time.sh
RENAMED
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_get_temperature.sh
RENAMED
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_get_weather.sh
RENAMED
|
File without changes
|
{gpustack_runner-0.1.22.post3 → gpustack_runner-0.1.22.post4}/tools/chat_tool_square_of_number.sh
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|