gpustack-runner 0.1.24.post3__tar.gz → 0.1.24.post4__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (145)
  1. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/PKG-INFO +5 -5
  2. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/README.md +4 -4
  3. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/_version.py +2 -2
  4. gpustack_runner-0.1.24.post4/gpustack_runner/_version_appendix.py +1 -0
  5. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/runner.py.json +44 -0
  6. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/cann/Dockerfile +15 -2
  7. gpustack_runner-0.1.24.post4/pack/cann/patches/vllm_omni/001_wrong_patch.patch +13 -0
  8. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/cuda/Dockerfile +14 -2
  9. gpustack_runner-0.1.24.post4/pack/cuda/patches/vllm_omni/001_wrong_patch.patch +13 -0
  10. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/rocm/Dockerfile +21 -3
  11. gpustack_runner-0.1.24.post4/pack/rocm/patches/vllm_omni/001_wrong_patch.patch +13 -0
  12. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json +44 -0
  13. gpustack_runner-0.1.24.post3/gpustack_runner/_version_appendix.py +0 -1
  14. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/.codespelldict +0 -0
  15. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/.codespellrc +0 -0
  16. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/.gitattributes +0 -0
  17. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/.gitignore +0 -0
  18. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/.pre-commit-config.yaml +0 -0
  19. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/.python-version +0 -0
  20. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/LICENSE +0 -0
  21. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/Makefile +0 -0
  22. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/docs/index.md +0 -0
  23. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/docs/modules/gpustack_runner.md +0 -0
  24. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/__init__.py +0 -0
  25. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/__main__.py +0 -0
  26. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/__utils__.py +0 -0
  27. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/_version.pyi +0 -0
  28. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/cmds/__init__.py +0 -0
  29. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/cmds/__types__.py +0 -0
  30. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/cmds/images.py +0 -0
  31. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/envs.py +0 -0
  32. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/gpustack_runner/runner.py +0 -0
  33. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/hatch.toml +0 -0
  34. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/mkdocs.yml +0 -0
  35. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251020_vllm_install_lmcache/cann/Dockerfile +0 -0
  36. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251020_vllm_install_lmcache/cuda/Dockerfile +0 -0
  37. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251020_vllm_install_lmcache/matrix.yaml +0 -0
  38. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251020_vllm_install_lmcache/rocm/Dockerfile +0 -0
  39. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251022_vllm_install_ray_client/cann/Dockerfile +0 -0
  40. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251022_vllm_install_ray_client/cuda/Dockerfile +0 -0
  41. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251022_vllm_install_ray_client/matrix.yaml +0 -0
  42. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251022_vllm_install_ray_client/rocm/Dockerfile +0 -0
  43. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251022_vllm_install_ray_default/cuda/Dockerfile +0 -0
  44. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251022_vllm_install_ray_default/matrix.yaml +0 -0
  45. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251022_vllm_install_ray_default/rocm/Dockerfile +0 -0
  46. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251024_vllm_install_nvidia_hpcx/cuda/Dockerfile +0 -0
  47. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251024_vllm_install_nvidia_hpcx/matrix.yaml +0 -0
  48. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251024_vllm_reinstall_lmcache/cuda/Dockerfile +0 -0
  49. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251024_vllm_reinstall_lmcache/matrix.yaml +0 -0
  50. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251029_vllm_reinstall_ray/cann/Dockerfile +0 -0
  51. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251029_vllm_reinstall_ray/matrix.yaml +0 -0
  52. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251103_mindie_refresh_entrypoint/cann/Dockerfile +0 -0
  53. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251103_mindie_refresh_entrypoint/matrix.yaml +0 -0
  54. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251105_vllm_polish_nvidia_hpcx/cuda/Dockerfile +0 -0
  55. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251105_vllm_polish_nvidia_hpcx/matrix.yaml +0 -0
  56. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251106_vllm_install_ep_kernel/cuda/Dockerfile +0 -0
  57. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251106_vllm_install_ep_kernel/matrix.yaml +0 -0
  58. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251107_vllm_reinstall_lmcache/cuda/Dockerfile +0 -0
  59. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251107_vllm_reinstall_lmcache/matrix.yaml +0 -0
  60. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251110_sglang_install_diffusion/cuda/Dockerfile +0 -0
  61. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251110_sglang_install_diffusion/matrix.yaml +0 -0
  62. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251110_sglang_install_flashattn/cuda/Dockerfile +0 -0
  63. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251110_sglang_install_flashattn/matrix.yaml +0 -0
  64. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251125_mindie_install_posix_ipc/cann/Dockerfile +0 -0
  65. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251125_mindie_install_posix_ipc/matrix.yaml +0 -0
  66. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251201_vllm_patch_qwen2_5_vl/cuda/Dockerfile +0 -0
  67. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251201_vllm_patch_qwen2_5_vl/cuda/patches/vllm_001_disable_flashatten_in_qwen2_5_vl.patch +0 -0
  68. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251201_vllm_patch_qwen2_5_vl/matrix.yaml +0 -0
  69. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251209_mindie_install_av/cann/Dockerfile +0 -0
  70. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251209_mindie_install_av/matrix.yaml +0 -0
  71. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251213_mindie_patch_minicpm_qwen2_v2/cann/Dockerfile +0 -0
  72. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251213_mindie_patch_minicpm_qwen2_v2/cann/patches.zip +0 -0
  73. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251213_mindie_patch_minicpm_qwen2_v2/matrix.yaml +0 -0
  74. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251213_sglang_patch_server_args/cuda/Dockerfile +0 -0
  75. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251213_sglang_patch_server_args/cuda/patches/sglang_001_fix_server_args.patch +0 -0
  76. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251213_sglang_patch_server_args/matrix.yaml +0 -0
  77. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251214_cuda_several_patches/cuda/Dockerfile +0 -0
  78. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251214_cuda_several_patches/matrix.yaml +0 -0
  79. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251215_cann_several_patches/cann/Dockerfile +0 -0
  80. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251215_cann_several_patches/matrix.yaml +0 -0
  81. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251216_sglang_uninstall_runai_model_streamer/cuda/Dockerfile +0 -0
  82. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251216_sglang_uninstall_runai_model_streamer/matrix.yaml +0 -0
  83. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251219_rocm_install_petit_kernel/matrix.yaml +0 -0
  84. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251219_rocm_install_petit_kernel/rocm/Dockerfile +0 -0
  85. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251219_vllm_install_audio_extra/cuda/Dockerfile +0 -0
  86. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251219_vllm_install_audio_extra/matrix.yaml +0 -0
  87. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251219_vllm_install_audio_extra/rocm/Dockerfile +0 -0
  88. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251224_mindie_patch_atb_config/cann/Dockerfile +0 -0
  89. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20251224_mindie_patch_atb_config/matrix.yaml +0 -0
  90. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260105_vllm_install_omni/cann/Dockerfile +0 -0
  91. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260105_vllm_install_omni/cuda/Dockerfile +0 -0
  92. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260105_vllm_install_omni/matrix.yaml +0 -0
  93. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260105_vllm_install_omni/rocm/Dockerfile +0 -0
  94. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260129_sglang_reinstall_kernel/cann/Dockerfile +0 -0
  95. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260129_sglang_reinstall_kernel/matrix.yaml +0 -0
  96. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260129_vllm_patch_dp/cuda/Dockerfile +0 -0
  97. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260129_vllm_patch_dp/cuda/patches/vllm_001_wrong_dp_ray.patch +0 -0
  98. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260129_vllm_patch_dp/matrix.yaml +0 -0
  99. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260129_vllm_patch_dp/rocm/Dockerfile +0 -0
  100. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/20260129_vllm_patch_dp/rocm/patches/vllm_001_wrong_dp_ray.patch +0 -0
  101. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/.post_operation/README.md +0 -0
  102. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/cann/mindie-atb-models_2.3.0_linux-amd64_py3.11_torch2.1.0-abi0.tar.gz +0 -0
  103. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/cann/mindie-atb-models_2.3.0_linux-arm64_py3.11_torch2.1.0-abi0.tar.gz +0 -0
  104. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/cann/patches/mindie.zip +0 -0
  105. /gpustack_runner-0.1.24.post3/pack/cann/patches/vllm_001_wrong_dp_ray.patch → /gpustack_runner-0.1.24.post4/pack/cann/patches/vllm/001_wrong_dp_ray.patch +0 -0
  106. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/corex/Dockerfile +0 -0
  107. /gpustack_runner-0.1.24.post3/pack/cuda/patches/vllm_001_wrong_dp_ray.patch → /gpustack_runner-0.1.24.post4/pack/cuda/patches/vllm/001_wrong_dp_ray.patch +0 -0
  108. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/discard_runner.sh +0 -0
  109. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/dtk/Dockerfile +0 -0
  110. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/expand_matrix.sh +0 -0
  111. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/hggc/Dockerfile +0 -0
  112. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/maca/Dockerfile +0 -0
  113. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/matrix.yaml +0 -0
  114. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/merge_runner.sh +0 -0
  115. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/musa/Dockerfile +0 -0
  116. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/prune_runner.sh +0 -0
  117. /gpustack_runner-0.1.24.post3/pack/rocm/patches/sglang_001_wrong_vram.patch → /gpustack_runner-0.1.24.post4/pack/rocm/patches/sglang/001_wrong_vram.patch +0 -0
  118. /gpustack_runner-0.1.24.post3/pack/rocm/patches/vllm_001_wrong_dp_ray.patch → /gpustack_runner-0.1.24.post4/pack/rocm/patches/vllm/001_wrong_dp_ray.patch +0 -0
  119. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/squash_expand_matrix.sh +0 -0
  120. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pack/squash_image.sh +0 -0
  121. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pyproject.toml +0 -0
  122. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/pytest.ini +0 -0
  123. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/ruff.toml +0 -0
  124. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/__init__.py +0 -0
  125. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_docker_image.json +0 -0
  126. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_list_backend_runners.json +0 -0
  127. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_list_runners_by_prefix.json +0 -0
  128. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_list_service_runners.json +0 -0
  129. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_merge_image.json +0 -0
  130. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_replace_image_with.json +0 -0
  131. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/fixtures/test_split_image.json +0 -0
  132. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/test_runner.py +0 -0
  133. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tests/gpustack_runner/test_utils.py +0 -0
  134. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/activate +0 -0
  135. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/chat.sh +0 -0
  136. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/chat_tool_current_date_time.sh +0 -0
  137. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/chat_tool_get_temperature.sh +0 -0
  138. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/chat_tool_get_weather.sh +0 -0
  139. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/chat_tool_square_of_number.sh +0 -0
  140. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/chat_tool_square_root_of_number.sh +0 -0
  141. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/chat_tool_where_am_i.sh +0 -0
  142. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/run_runner.sh +0 -0
  143. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/tools/run_runner_cluster.sh +0 -0
  144. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/uv.lock +0 -0
  145. {gpustack_runner-0.1.24.post3 → gpustack_runner-0.1.24.post4}/uv.toml +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: gpustack-runner
3
- Version: 0.1.24.post3
3
+ Version: 0.1.24.post4
4
4
  Summary: GPUStack Runner is library for registering runnable accelerated backends and services in GPUStack.
5
5
  Project-URL: Homepage, https://github.com/gpustack/runner
6
6
  Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
@@ -128,10 +128,10 @@ The following table lists the supported accelerated backends and their correspon
128
128
  > - ROCm 6.4 SGLang supports `gfx942` only.
129
129
  > - ROCm 7.0 SGLang supports `gfx950` only.
130
130
 
131
- | ROCm Version <br/> (Variant) | vLLM | SGLang |
132
- |------------------------------|-------------------------------------------------|--------------------------------------------|
133
- | 7.0 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` |
134
- | 6.4 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3` |
131
+ | ROCm Version <br/> (Variant) | vLLM | SGLang |
132
+ |------------------------------|-----------------------------------------------------------|-----------------------------------------------------|
133
+ | 7.0 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` |
134
+ | 6.4 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, `0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3` |
135
135
 
136
136
  ## Directory Structure
137
137
 
@@ -108,10 +108,10 @@ The following table lists the supported accelerated backends and their correspon
108
108
  > - ROCm 6.4 SGLang supports `gfx942` only.
109
109
  > - ROCm 7.0 SGLang supports `gfx950` only.
110
110
 
111
- | ROCm Version <br/> (Variant) | vLLM | SGLang |
112
- |------------------------------|-------------------------------------------------|--------------------------------------------|
113
- | 7.0 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2` | `0.5.7`, `0.5.6.post2` |
114
- | 6.4 | **`0.13.0`**, `0.12.0`, <br/>`0.11.2`, `0.10.2` | `0.5.7`, `0.5.6.post2`, <br/>`0.5.5.post3` |
111
+ | ROCm Version <br/> (Variant) | vLLM | SGLang |
112
+ |------------------------------|-----------------------------------------------------------|-----------------------------------------------------|
113
+ | 7.0 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2` |
114
+ | 6.4 | `0.14.1`, **`0.13.0`**, <br/>`0.12.0`, `0.11.2`, `0.10.2` | `0.5.8`, `0.5.7`, <br/>`0.5.6.post2`, `0.5.5.post3` |
115
115
 
116
116
  ## Directory Structure
117
117
 
@@ -27,8 +27,8 @@ version_tuple: VERSION_TUPLE
27
27
  __commit_id__: COMMIT_ID
28
28
  commit_id: COMMIT_ID
29
29
 
30
- __version__ = version = '0.1.24.post3'
31
- __version_tuple__ = version_tuple = (0, 1, 24, 'post3')
30
+ __version__ = version = '0.1.24.post4'
31
+ __version_tuple__ = version_tuple = (0, 1, 24, 'post4')
32
32
  try:
33
33
  from ._version_appendix import git_commit
34
34
  __commit_id__ = commit_id = git_commit
@@ -0,0 +1 @@
1
+ git_commit = "907c39c"
@@ -1748,6 +1748,17 @@
1748
1748
  "docker_image": "gpustack/runner:musa4.1-vllm0.9.2",
1749
1749
  "deprecated": false
1750
1750
  },
1751
+ {
1752
+ "backend": "rocm",
1753
+ "backend_version": "7.0",
1754
+ "original_backend_version": "7.0.2",
1755
+ "backend_variant": "",
1756
+ "service": "sglang",
1757
+ "service_version": "0.5.8",
1758
+ "platform": "linux/amd64",
1759
+ "docker_image": "gpustack/runner:rocm7.0-sglang0.5.8",
1760
+ "deprecated": false
1761
+ },
1751
1762
  {
1752
1763
  "backend": "rocm",
1753
1764
  "backend_version": "7.0",
@@ -1770,6 +1781,17 @@
1770
1781
  "docker_image": "gpustack/runner:rocm7.0-sglang0.5.6.post2",
1771
1782
  "deprecated": false
1772
1783
  },
1784
+ {
1785
+ "backend": "rocm",
1786
+ "backend_version": "7.0",
1787
+ "original_backend_version": "7.0.2",
1788
+ "backend_variant": "",
1789
+ "service": "vllm",
1790
+ "service_version": "0.14.1",
1791
+ "platform": "linux/amd64",
1792
+ "docker_image": "gpustack/runner:rocm7.0-vllm0.14.1",
1793
+ "deprecated": false
1794
+ },
1773
1795
  {
1774
1796
  "backend": "rocm",
1775
1797
  "backend_version": "7.0",
@@ -1814,6 +1836,17 @@
1814
1836
  "docker_image": "gpustack/runner:rocm7.0-vllm0.11.0",
1815
1837
  "deprecated": true
1816
1838
  },
1839
+ {
1840
+ "backend": "rocm",
1841
+ "backend_version": "6.4",
1842
+ "original_backend_version": "6.4.4",
1843
+ "backend_variant": "",
1844
+ "service": "sglang",
1845
+ "service_version": "0.5.8",
1846
+ "platform": "linux/amd64",
1847
+ "docker_image": "gpustack/runner:rocm6.4-sglang0.5.8",
1848
+ "deprecated": false
1849
+ },
1817
1850
  {
1818
1851
  "backend": "rocm",
1819
1852
  "backend_version": "6.4",
@@ -1847,6 +1880,17 @@
1847
1880
  "docker_image": "gpustack/runner:rocm6.4-sglang0.5.5.post3",
1848
1881
  "deprecated": false
1849
1882
  },
1883
+ {
1884
+ "backend": "rocm",
1885
+ "backend_version": "6.4",
1886
+ "original_backend_version": "6.4.4",
1887
+ "backend_variant": "",
1888
+ "service": "vllm",
1889
+ "service_version": "0.14.1",
1890
+ "platform": "linux/amd64",
1891
+ "docker_image": "gpustack/runner:rocm6.4-vllm0.14.1",
1892
+ "deprecated": false
1893
+ },
1850
1894
  {
1851
1895
  "backend": "rocm",
1852
1896
  "backend_version": "6.4",
@@ -59,7 +59,7 @@ ARG VLLM_VERSION=0.14.1
59
59
  ARG VLLM_ASCEND_VERSION=0.14.0rc1
60
60
  ARG VLLM_TORCH_VERSION=2.9.0
61
61
  ARG VLLM_MOONCAKE_VERSION=0.3.7.post2
62
- ARG VLLM_OMNI_COMMIT=e8aa32b
62
+ ARG VLLM_OMNI_COMMIT=b11d436
63
63
  ARG SGLANG_BASE_IMAGE=gpustack/runner:cann${CANN_VERSION}-${CANN_ARCHS}-python${PYTHON_VERSION}
64
64
  ARG SGLANG_VERSION=0.5.8
65
65
  ARG SGLANG_TORCH_VERSION=2.8.0
@@ -865,6 +865,15 @@ RUN --mount=type=bind,from=vllm-build-omni,source=/,target=/omni,rw <<EOF
865
865
  uv pip install --no-build-isolation \
866
866
  /omni/workspace/*.whl
867
867
 
868
+ # Dependencies
869
+ uv pip uninstall onnxruntime || true
870
+ cat <<EOT >/tmp/requirements.txt
871
+ onnxruntime-cann
872
+ sox
873
+ EOT
874
+ uv pip install \
875
+ -r /tmp/requirements.txt
876
+
868
877
  # Cleanup
869
878
  rm -rf /var/tmp/* \
870
879
  && rm -rf /tmp/*
@@ -956,7 +965,11 @@ RUN --mount=type=bind,target=/workspace,rw <<EOF
956
965
 
957
966
  tree -hs /workspace/patches
958
967
  pushd $(pip show vllm | grep Location: | cut -d" " -f 2) \
959
- && patch -p1 < /workspace/patches/vllm_*.patch
968
+ && patch -p1 < /workspace/patches/vllm/*.patch
969
+ if pip show vllm_omni > /dev/null 2>&1; then \
970
+ pushd $(pip show vllm_omni | grep Location: | cut -d" " -f 2) \
971
+ && patch -p1 < /workspace/patches/vllm_omni/*.patch; \
972
+ fi
960
973
  EOF
961
974
 
962
975
  ## Entrypoint
@@ -0,0 +1,13 @@
1
+ diff --git a/vllm_omni/patch.py b/vllm_omni/patch.py
2
+ index 687ff51..6b67924 100644
3
+ --- a/vllm_omni/patch.py
4
+ +++ b/vllm_omni/patch.py
5
+ @@ -19,6 +19,8 @@ for module_name, module in sys.modules.items():
6
+ # only do patch on module of vllm, pass others
7
+ if "vllm" not in module_name:
8
+ continue
9
+ + if "--omni" not in sys.argv:
10
+ + continue
11
+ if hasattr(module, "EngineCoreOutput") and module.EngineCoreOutput == _OriginalEngineCoreOutput:
12
+ module.EngineCoreOutput = OmniEngineCoreOutput
13
+ if hasattr(module, "EngineCoreOutputs") and module.EngineCoreOutputs == _OriginalEngineCoreOutputs:
@@ -116,7 +116,7 @@ ARG VLLM_FLASHINFER_VERSION=0.6.1
116
116
  ARG VLLM_FLASHATTENTION_VERSION=2.8.3
117
117
  ARG VLLM_LMCACHE_VERSION=0.3.12
118
118
  ARG VLLM_MOONCAKE_VERSION=0.3.8.post1
119
- ARG VLLM_OMNI_COMMIT=e8aa32b
119
+ ARG VLLM_OMNI_COMMIT=2c294a7
120
120
  ARG SGLANG_BASE_IMAGE=vllm
121
121
  ARG SGLANG_VERSION=0.5.8
122
122
  ARG SGLANG_BUILD_BASE_IMAGE=vllm-build
@@ -1357,6 +1357,14 @@ RUN --mount=type=bind,from=vllm-build-omni,source=/,target=/omni,rw <<EOF
1357
1357
  uv pip install --no-build-isolation \
1358
1358
  /omni/workspace/*.whl
1359
1359
 
1360
+ # Dependencies
1361
+ cat <<EOT >/tmp/requirements.txt
1362
+ onnxruntime
1363
+ sox
1364
+ EOT
1365
+ uv pip install \
1366
+ -r /tmp/requirements.txt
1367
+
1360
1368
  # Cleanup
1361
1369
  rm -rf /var/tmp/* \
1362
1370
  && rm -rf /tmp/*
@@ -1551,7 +1559,11 @@ RUN --mount=type=bind,target=/workspace,rw <<EOF
1551
1559
 
1552
1560
  tree -hs /workspace/patches
1553
1561
  pushd $(pip show vllm | grep Location: | cut -d" " -f 2) \
1554
- && patch -p1 < /workspace/patches/vllm_*.patch
1562
+ && patch -p1 < /workspace/patches/vllm/*.patch
1563
+ if pip show vllm_omni > /dev/null 2>&1; then \
1564
+ pushd $(pip show vllm_omni | grep Location: | cut -d" " -f 2) \
1565
+ && patch -p1 < /workspace/patches/vllm_omni/*.patch; \
1566
+ fi
1555
1567
  EOF
1556
1568
 
1557
1569
  ## Entrypoint
@@ -0,0 +1,13 @@
1
+ diff --git a/vllm_omni/patch.py b/vllm_omni/patch.py
2
+ index 687ff51..6b67924 100644
3
+ --- a/vllm_omni/patch.py
4
+ +++ b/vllm_omni/patch.py
5
+ @@ -19,6 +19,8 @@ for module_name, module in sys.modules.items():
6
+ # only do patch on module of vllm, pass others
7
+ if "vllm" not in module_name:
8
+ continue
9
+ + if "--omni" not in sys.argv:
10
+ + continue
11
+ if hasattr(module, "EngineCoreOutput") and module.EngineCoreOutput == _OriginalEngineCoreOutput:
12
+ module.EngineCoreOutput = OmniEngineCoreOutput
13
+ if hasattr(module, "EngineCoreOutputs") and module.EngineCoreOutputs == _OriginalEngineCoreOutputs:
@@ -84,7 +84,7 @@ ARG VLLM_FLASHATTENTION_VERSION=2.8.3
84
84
  ARG VLLM_AITER_VERSION=0.1.8
85
85
  ARG VLLM_LMCACHE_VERSION=0.3.12
86
86
  ARG VLLM_MOONCAKE_VERSION=0.3.8.post1
87
- ARG VLLM_OMNI_COMMIT=e8aa32b
87
+ ARG VLLM_OMNI_COMMIT=2c294a7
88
88
  ARG SGLANG_BASE_IMAGE=vllm
89
89
  ARG SGLANG_VERSION=0.5.8
90
90
  ARG SGLANG_BUILD_BASE_IMAGE=vllm-build
@@ -724,6 +724,11 @@ RUN --mount=type=bind,from=vllm-build-flashattention,source=/,target=/flashatten
724
724
  --depth 1 --branch v${VLLM_VERSION} --single-branch \
725
725
  https://github.com/vllm-project/vllm.git vllm
726
726
  pushd /tmp/vllm \
727
+ && sed -i "s/\"torch ==.*\"/\"torch\"/g" /tmp/vllm/pyproject.toml \
728
+ && sed -i "s/\"torch==.*\"/\"torch\"/g" /tmp/vllm/requirements/rocm-build.txt \
729
+ && sed -i "s/\"torchvision==.*\"/\"torchvision\"/g" /tmp/vllm/requirements/rocm-build.txt \
730
+ && sed -i "s/\"torchaudio==.*\"/\"torchaudio\"/g" /tmp/vllm/requirements/rocm-build.txt \
731
+ && sed -i "s/\"triton==.*\"/\"triton\"/g" /tmp/vllm/requirements/rocm-build.txt \
727
732
  && uv pip install protobuf>=6.33.2 grpcio-tools>=1.76.0 \
728
733
  && VLLM_TARGET_DEVICE="rocm" python -v -m build --no-isolation --wheel \
729
734
  && tree -hs /tmp/vllm/dist \
@@ -1079,6 +1084,15 @@ RUN --mount=type=bind,from=vllm-build-omni,source=/,target=/omni,rw <<EOF
1079
1084
  uv pip install --no-build-isolation \
1080
1085
  /omni/workspace/*.whl
1081
1086
 
1087
+ # Dependencies
1088
+ uv pip uninstall onnxruntime || true
1089
+ cat <<EOT >/tmp/requirements.txt
1090
+ onnxruntime-rocm
1091
+ sox
1092
+ EOT
1093
+ uv pip install \
1094
+ -r /tmp/requirements.txt
1095
+
1082
1096
  # Cleanup
1083
1097
  rm -rf /var/tmp/* \
1084
1098
  && rm -rf /tmp/*
@@ -1236,7 +1250,11 @@ RUN --mount=type=bind,target=/workspace,rw <<EOF
1236
1250
 
1237
1251
  tree -hs /workspace/patches
1238
1252
  pushd $(pip show vllm | grep Location: | cut -d" " -f 2) \
1239
- && patch -p1 < /workspace/patches/vllm_*.patch
1253
+ && patch -p1 < /workspace/patches/vllm/*.patch
1254
+ if pip show vllm_omni > /dev/null 2>&1; then \
1255
+ pushd $(pip show vllm_omni | grep Location: | cut -d" " -f 2) \
1256
+ && patch -p1 < /workspace/patches/vllm_omni/*.patch; \
1257
+ fi
1240
1258
  EOF
1241
1259
 
1242
1260
  ## Entrypoint
@@ -1537,7 +1555,7 @@ RUN --mount=type=bind,target=/workspace,rw <<EOF
1537
1555
 
1538
1556
  tree -hs /workspace/patches
1539
1557
  pushd $(pip show sglang | grep Location: | cut -d" " -f 2) \
1540
- && patch -p1 < /workspace/patches/sglang_*.patch
1558
+ && patch -p1 < /workspace/patches/sglang/*.patch
1541
1559
  EOF
1542
1560
 
1543
1561
  ## Entrypoint
@@ -0,0 +1,13 @@
1
+ diff --git a/vllm_omni/patch.py b/vllm_omni/patch.py
2
+ index 687ff51..6b67924 100644
3
+ --- a/vllm_omni/patch.py
4
+ +++ b/vllm_omni/patch.py
5
+ @@ -19,6 +19,8 @@ for module_name, module in sys.modules.items():
6
+ # only do patch on module of vllm, pass others
7
+ if "vllm" not in module_name:
8
+ continue
9
+ + if "--omni" not in sys.argv:
10
+ + continue
11
+ if hasattr(module, "EngineCoreOutput") and module.EngineCoreOutput == _OriginalEngineCoreOutput:
12
+ module.EngineCoreOutput = OmniEngineCoreOutput
13
+ if hasattr(module, "EngineCoreOutputs") and module.EngineCoreOutputs == _OriginalEngineCoreOutputs:
@@ -1810,6 +1810,17 @@
1810
1810
  "backend": "rocm"
1811
1811
  },
1812
1812
  [
1813
+ {
1814
+ "backend": "rocm",
1815
+ "backend_version": "7.0",
1816
+ "original_backend_version": "7.0.2",
1817
+ "backend_variant": "",
1818
+ "service": "sglang",
1819
+ "service_version": "0.5.8",
1820
+ "platform": "linux/amd64",
1821
+ "docker_image": "gpustack/runner:rocm7.0-sglang0.5.8",
1822
+ "deprecated": false
1823
+ },
1813
1824
  {
1814
1825
  "backend": "rocm",
1815
1826
  "backend_version": "7.0",
@@ -1832,6 +1843,17 @@
1832
1843
  "docker_image": "gpustack/runner:rocm7.0-sglang0.5.6.post2",
1833
1844
  "deprecated": false
1834
1845
  },
1846
+ {
1847
+ "backend": "rocm",
1848
+ "backend_version": "7.0",
1849
+ "original_backend_version": "7.0.2",
1850
+ "backend_variant": "",
1851
+ "service": "vllm",
1852
+ "service_version": "0.14.1",
1853
+ "platform": "linux/amd64",
1854
+ "docker_image": "gpustack/runner:rocm7.0-vllm0.14.1",
1855
+ "deprecated": false
1856
+ },
1835
1857
  {
1836
1858
  "backend": "rocm",
1837
1859
  "backend_version": "7.0",
@@ -1876,6 +1898,17 @@
1876
1898
  "docker_image": "gpustack/runner:rocm7.0-vllm0.11.0",
1877
1899
  "deprecated": true
1878
1900
  },
1901
+ {
1902
+ "backend": "rocm",
1903
+ "backend_version": "6.4",
1904
+ "original_backend_version": "6.4.4",
1905
+ "backend_variant": "",
1906
+ "service": "sglang",
1907
+ "service_version": "0.5.8",
1908
+ "platform": "linux/amd64",
1909
+ "docker_image": "gpustack/runner:rocm6.4-sglang0.5.8",
1910
+ "deprecated": false
1911
+ },
1879
1912
  {
1880
1913
  "backend": "rocm",
1881
1914
  "backend_version": "6.4",
@@ -1909,6 +1942,17 @@
1909
1942
  "docker_image": "gpustack/runner:rocm6.4-sglang0.5.5.post3",
1910
1943
  "deprecated": false
1911
1944
  },
1945
+ {
1946
+ "backend": "rocm",
1947
+ "backend_version": "6.4",
1948
+ "original_backend_version": "6.4.4",
1949
+ "backend_variant": "",
1950
+ "service": "vllm",
1951
+ "service_version": "0.14.1",
1952
+ "platform": "linux/amd64",
1953
+ "docker_image": "gpustack/runner:rocm6.4-vllm0.14.1",
1954
+ "deprecated": false
1955
+ },
1912
1956
  {
1913
1957
  "backend": "rocm",
1914
1958
  "backend_version": "6.4",
@@ -1 +0,0 @@
1
- git_commit = "dc41ed2"