PyPI - gpustack-runtime - Versions diffs - 0.1.40.post1__py3-none-any.whl → 0.1.41__py3-none-any.whl - Mend

gpustack-runtime 0.1.40.post1__py3-none-any.whl → 0.1.41__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (66) hide show

gpustack_runtime/__init__.py +1 -1
gpustack_runtime/__main__.py +5 -3
gpustack_runtime/_version.py +2 -2
gpustack_runtime/_version_appendix.py +1 -1
gpustack_runtime/cmds/__init__.py +5 -3
gpustack_runtime/cmds/__types__.py +1 -1
gpustack_runtime/cmds/deployer.py +140 -18
gpustack_runtime/cmds/detector.py +1 -1
gpustack_runtime/cmds/images.py +1 -1
gpustack_runtime/deployer/__init__.py +28 -2
gpustack_runtime/deployer/__patches__.py +1 -1
gpustack_runtime/deployer/__types__.py +2 -1
gpustack_runtime/deployer/__utils__.py +2 -2
gpustack_runtime/deployer/cdi/__init__.py +85 -5
gpustack_runtime/deployer/cdi/__types__.py +92 -29
gpustack_runtime/deployer/cdi/__utils__.py +178 -0
gpustack_runtime/deployer/cdi/amd.py +146 -0
gpustack_runtime/deployer/cdi/ascend.py +164 -0
gpustack_runtime/deployer/cdi/hygon.py +147 -0
gpustack_runtime/deployer/cdi/iluvatar.py +136 -0
gpustack_runtime/deployer/cdi/metax.py +148 -0
gpustack_runtime/deployer/cdi/thead.py +57 -23
gpustack_runtime/deployer/docker.py +9 -8
gpustack_runtime/deployer/k8s/deviceplugin/__init__.py +240 -0
gpustack_runtime/deployer/k8s/deviceplugin/__types__.py +131 -0
gpustack_runtime/deployer/k8s/deviceplugin/plugin.py +586 -0
gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/__init__.py +3 -0
gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api.proto +212 -0
gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api_pb2.py +86 -0
gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api_pb2.pyi +168 -0
gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api_pb2_grpc.py +358 -0
gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/constants.py +34 -0
gpustack_runtime/deployer/kuberentes.py +37 -4
gpustack_runtime/deployer/podman.py +9 -8
gpustack_runtime/detector/__init__.py +42 -5
gpustack_runtime/detector/__types__.py +8 -24
gpustack_runtime/detector/__utils__.py +46 -39
gpustack_runtime/detector/amd.py +55 -66
gpustack_runtime/detector/ascend.py +29 -41
gpustack_runtime/detector/cambricon.py +3 -3
gpustack_runtime/detector/hygon.py +21 -49
gpustack_runtime/detector/iluvatar.py +44 -60
gpustack_runtime/detector/metax.py +54 -37
gpustack_runtime/detector/mthreads.py +74 -36
gpustack_runtime/detector/nvidia.py +130 -93
gpustack_runtime/detector/pyacl/__init__.py +1 -1
gpustack_runtime/detector/pyamdgpu/__init__.py +1 -1
gpustack_runtime/detector/pyamdsmi/__init__.py +1 -1
gpustack_runtime/detector/pycuda/__init__.py +1 -1
gpustack_runtime/detector/pydcmi/__init__.py +1 -1
gpustack_runtime/detector/pyhsa/__init__.py +1 -1
gpustack_runtime/detector/pymxsml/__init__.py +1553 -1
gpustack_runtime/detector/pyrocmcore/__init__.py +1 -1
gpustack_runtime/detector/pyrocmsmi/__init__.py +1 -1
gpustack_runtime/detector/thead.py +41 -60
gpustack_runtime/envs.py +104 -12
gpustack_runtime/logging.py +6 -2
{gpustack_runtime-0.1.40.post1.dist-info → gpustack_runtime-0.1.41.dist-info}/METADATA +6 -1
gpustack_runtime-0.1.41.dist-info/RECORD +67 -0
gpustack_runtime/detector/pymxsml/mxsml.py +0 -1580
gpustack_runtime/detector/pymxsml/mxsml_extension.py +0 -816
gpustack_runtime/detector/pymxsml/mxsml_mcm.py +0 -476
gpustack_runtime-0.1.40.post1.dist-info/RECORD +0 -55
{gpustack_runtime-0.1.40.post1.dist-info → gpustack_runtime-0.1.41.dist-info}/WHEEL +0 -0
{gpustack_runtime-0.1.40.post1.dist-info → gpustack_runtime-0.1.41.dist-info}/entry_points.txt +0 -0
{gpustack_runtime-0.1.40.post1.dist-info → gpustack_runtime-0.1.41.dist-info}/licenses/LICENSE +0 -0

gpustack_runtime/detector/pyrocmcore/__init__.py CHANGED Viewed

@@ -1,4 +1,4 @@
-from __future__ import annotations
+from __future__ import annotations as __future_annotations__
 import os
 import sys

gpustack_runtime/detector/pyrocmsmi/__init__.py CHANGED Viewed

@@ -3,7 +3,7 @@
 # https://github.com/ROCm/rocm_smi_lib/blob/rocm-6.2.4/python_smi_tools/rsmiBindings.py,
 # https://rocm.docs.amd.com/projects/rocm_smi_lib/en/latest/doxygen/html/rocm__smi_8h_source.html,
 # https://rocm.docs.amd.com/projects/rocm_smi_lib/en/latest/doxygen/html/rocm__smi_8h.html.
-from __future__ import annotations
+from __future__ import annotations as __future_annotations__
 import os
 import sys

gpustack_runtime/detector/thead.py CHANGED Viewed

@@ -1,4 +1,4 @@
-from __future__ import annotations
+from __future__ import annotations as __future_annotations__
 import contextlib
 import logging
@@ -22,7 +22,6 @@ from .__utils__ import (
     bitmask_to_str,
     byte_to_mebibyte,
     get_brief_version,
-    get_device_files,
     get_numa_node_by_bdf,
     get_numa_nodeset_size,
     get_pci_devices,
@@ -40,7 +39,7 @@ class THeadDetector(Detector):
     """
     @staticmethod
-    @lru_cache
+    @lru_cache(maxsize=1)
     def is_supported() -> bool:
         """
         Check if the T-Head detector is supported.
@@ -69,7 +68,7 @@ class THeadDetector(Detector):
         return supported
     @staticmethod
-    @lru_cache
+    @lru_cache(maxsize=1)
     def detect_pci_devices() -> dict[str, PCIDevice]:
         # See https://pcisig.com/membership/member-companies?combine=Alibaba.
         pci_devs = get_pci_devices(vendor="0x1ded")
@@ -121,17 +120,23 @@ class THeadDetector(Detector):
                 )
             dev_count = pyhgml.hgmlDeviceGetCount()
-            dev_files = None
             for dev_idx in range(dev_count):
                 dev = pyhgml.hgmlDeviceGetHandleByIndex(dev_idx)
                 dev_cc_t = pyhgml.hgmlDeviceGetHggcComputeCapability(dev)
                 dev_cc = ".".join(map(str, dev_cc_t))
-                dev_bdf = None
-                with contextlib.suppress(pyhgml.HGMLError):
-                    dev_pci_info = pyhgml.hgmlDeviceGetPciInfo(dev)
-                    dev_bdf = str(dev_pci_info.busIdLegacy).lower()
+                dev_pci_info = pyhgml.hgmlDeviceGetPciInfo(dev)
+                dev_bdf = str(dev_pci_info.busIdLegacy).lower()
+                dev_numa = get_numa_node_by_bdf(dev_bdf)
+                if not dev_numa:
+                    dev_node_affinity = pyhgml.hgmlDeviceGetMemoryAffinity(
+                        dev,
+                        get_numa_nodeset_size(),
+                        pyhgml.HGML_AFFINITY_SCOPE_NODE,
+                    )
+                    dev_numa = bitmask_to_str(list(dev_node_affinity))
                 dev_mig_mode = pyhgml.HGML_DEVICE_MIG_DISABLE
                 with contextlib.suppress(pyhgml.HGMLError):
@@ -142,14 +147,7 @@ class THeadDetector(Detector):
                 if dev_mig_mode == pyhgml.HGML_DEVICE_MIG_DISABLE:
                     dev_index = dev_idx
                     if envs.GPUSTACK_RUNTIME_DETECT_PHYSICAL_INDEX_PRIORITY:
-                        if dev_files is None:
-                            dev_files = get_device_files(
-                                pattern=r"alixpu_ppu(?P<number>\d+)",
-                            )
-                        if len(dev_files) >= dev_count:
-                            dev_file = dev_files[dev_idx]
-                            if dev_file.number is not None:
-                                dev_index = dev_file.number
+                        dev_index = pyhgml.hgmlDeviceGetMinorNumber(dev)
                     dev_name = pyhgml.hgmlDeviceGetName(dev)
@@ -204,12 +202,9 @@ class THeadDetector(Detector):
                     dev_appendix = {
                         "vgpu": dev_is_vgpu,
+                        "bdf": dev_bdf,
+                        "numa": dev_numa,
                     }
-                    if dev_bdf:
-                        dev_appendix["bdf"] = dev_bdf
-                    if dev_links_state := _get_links_state(dev):
-                        dev_appendix.update(dev_links_state)
                     ret.append(
                         Device(
@@ -273,9 +268,9 @@ class THeadDetector(Detector):
                     mdev_appendix = {
                         "vgpu": True,
+                        "bdf": dev_bdf,
+                        "numa": dev_numa,
                     }
-                    if dev_bdf:
-                        mdev_appendix["bdf"] = dev_bdf
                     mdev_gi_id = pyhgml.hgmlDeviceGetGpuInstanceId(mdev)
                     mdev_appendix["gpu_instance_id"] = mdev_gi_id
@@ -403,36 +398,24 @@ class THeadDetector(Detector):
             for i, dev_i in enumerate(devices):
                 dev_i_handle = pyhgml.hgmlDeviceGetHandleByUUID(dev_i.uuid)
-                # Get affinity with PCIe BDF if possible.
-                if dev_i_bdf := dev_i.appendix.get("bdf", ""):
-                    ret.devices_numa_affinities[i] = get_numa_node_by_bdf(
-                        dev_i_bdf,
-                    )
-                    ret.devices_cpu_affinities[i] = map_numa_node_to_cpu_affinity(
-                        ret.devices_numa_affinities[i],
-                    )
-                # Otherwise, get affinity via IXML.
-                if not ret.devices_cpu_affinities[i]:
-                    # Get NUMA affinity.
-                    try:
-                        dev_i_memset = pyhgml.hgmlDeviceGetMemoryAffinity(
-                            dev_i_handle,
-                            get_numa_nodeset_size(),
-                            pyhgml.HGML_AFFINITY_SCOPE_NODE,
-                        )
-                        ret.devices_numa_affinities[i] = bitmask_to_str(
-                            list(dev_i_memset),
-                        )
-                    except pyhgml.HGMLError:
-                        debug_log_exception(
-                            logger,
-                            "Failed to get NUMA affinity for device %d",
-                            dev_i.index,
-                        )
-                    # Get CPU affinity.
-                    ret.devices_cpu_affinities[i] = map_numa_node_to_cpu_affinity(
-                        ret.devices_numa_affinities[i],
-                    )
+                # Get NUMA and CPU affinities.
+                ret.devices_numa_affinities[i] = dev_i.appendix.get("numa", "")
+                ret.devices_cpu_affinities[i] = map_numa_node_to_cpu_affinity(
+                    ret.devices_numa_affinities[i],
+                )
+                # Get links state if applicable.
+                if dev_i_links_state := _get_links_state(dev_i_handle):
+                    ret.appendices[i].update(dev_i_links_state)
+                    # In practice, if a card has an active *Link,
+                    # then other cards in the same machine should be interconnected with it through the *Link.
+                    if dev_i_links_state.get("links_active_count", 0) > 0:
+                        for j, dev_j in enumerate(devices):
+                            if dev_i.index == dev_j.index:
+                                continue
+                            ret.devices_distances[i][j] = TopologyDistanceEnum.LINK
+                            ret.devices_distances[j][i] = TopologyDistanceEnum.LINK
+                        continue
                 # Get distances to other devices.
                 for j, dev_j in enumerate(devices):
@@ -447,8 +430,6 @@ class THeadDetector(Detector):
                             dev_i_handle,
                             dev_j_handle,
                         )
-                        if dev_i.appendix.get("links_state", 0) > 0:
-                            distance = TopologyDistanceEnum.LINK
                     except pyhgml.HGMLError:
                         debug_log_exception(
                             logger,
@@ -459,9 +440,6 @@ class THeadDetector(Detector):
                     ret.devices_distances[i][j] = distance
                     ret.devices_distances[j][i] = distance
-        except pyhgml.HGMLError:
-            debug_log_exception(logger, "Failed to fetch topology")
-            raise
         except Exception:
             debug_log_exception(logger, "Failed to process topology fetching")
             raise
@@ -621,17 +599,20 @@ def _get_links_state(
         return None
     dev_links_state = 0
+    dev_links_active_count = 0
     try:
         for link_idx in range(int(dev_links_count)):
             dev_link_state = pyhgml.hgmlDeviceGetIcnLinkState(dev, link_idx)
             if dev_link_state:
-                dev_links_state |= 1 << (link_idx + 1)
+                dev_links_state |= 1 << link_idx
+                dev_links_active_count += 1
     except pyhgml.HGMLError:
         debug_log_warning(logger, "Failed to get ICNLink link state")
     return {
         "links_count": dev_links_count,
         "links_state": dev_links_state,
+        "links_active_count": dev_links_active_count,
     }

gpustack_runtime/envs.py CHANGED Viewed

@@ -1,4 +1,4 @@
-from __future__ import annotations
+from __future__ import annotations as __future_annotations__
 import contextlib
 import os
@@ -147,11 +147,6 @@ if TYPE_CHECKING:
     """
     Label prefix for the deployer.
     """
-    GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_GENERATE: bool = True
-    """
-    During deployment, enable automatic generation of Container Device Interface (CDI) specifications
-    for detected devices.
-    """
     GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_DIRECTORY: Path | None = None
     """
     During deployment, path of directory containing Container Device Interface (CDI) specifications,
@@ -248,6 +243,15 @@ if TYPE_CHECKING:
     `Env`: Injects resources using standard environment variable, based on `GPUSTACK_RUNTIME_DEPLOY_RESOURCE_KEY_MAP_RUNTIME_VISIBLE_DEVICES`.
     `CDI`: Injects resources using CDI, based on `GPUSTACK_RUNTIME_DEPLOY_RESOURCE_KEY_MAP_CDI`.
     """
+    GPUSTACK_RUNTIME_DOCKER_CDI_SPECS_GENERATE: bool = True
+    """
+    Generate CDI specifications during deployment when using CDI resource injection policy,
+    requires `GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_DIRECTORY` to be existed.
+    Works only when `GPUSTACK_RUNTIME_DOCKER_RESOURCE_INJECTION_POLICY` is set to `CDI`.
+    Using internal knowledge to generate the CDI specifications for deployer,
+    if the output file conflicts with other tools generating CDI specifications(e.g., NVIDIA Container Toolkit),
+    please disable this and remove the output file manually.
+    """
     ## Kubernetes
     GPUSTACK_RUNTIME_KUBERNETES_NODE_NAME: str | None = None
     """
@@ -274,6 +278,33 @@ if TYPE_CHECKING:
     """
     Deletion propagation policy for Kubernetes resources (e.g., Foreground, Background, Orphan).
     """
+    GPUSTACK_RUNTIME_KUBERNETES_RESOURCE_INJECTION_POLICY: str | None = None
+    """
+    Resource injection policy for the Kubernetes deployer (e.g., Env, KDP).
+    `Env`: Injects resources using standard environment variable, depends on underlying Container Toolkit, based on `GPUSTACK_RUNTIME_DEPLOY_RESOURCE_KEY_MAP_RUNTIME_VISIBLE_DEVICES`.
+    `KDP`: Injects resources using Kubernetes Device Plugin, based on `GPUSTACK_RUNTIME_DEPLOY_RESOURCE_KEY_MAP_CDI`.
+    """
+    GPUSTACK_RUNTIME_KUBERNETES_KDP_PER_DEVICE_MAX_ALLOCATIONS: int | None = None
+    """
+    Maximum allocations for one device in Kubernetes Device Plugin.
+    If not set, it should be 10.
+    """
+    GPUSTACK_RUNTIME_KUBERNETES_KDP_DEVICE_ALLOCATION_POLICY: str | None = None
+    """
+    Device allocation policy for the Kubernetes Device Plugin (e.g., CDI, Env, Opaque).
+    `CDI`: Allocates devices using generated CDI specifications, making it easy to debug and troubleshoot; requires `GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_DIRECTORY` to exist.
+    `Env`: Allocates devices using runtime-visible environment variables; requires Container Toolkit support.
+    `Opaque`: Uses internal logic for allocation, which is convenient for deployment but difficult to troubleshoot.
+    """
+    GPUSTACK_RUNTIME_KUBERNETES_KDP_CDI_SPECS_GENERATE: bool = True
+    """
+    Generate CDI specifications during deployment,
+    requires `GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_DIRECTORY` to be existed.
+    Works only when `GPUSTACK_RUNTIME_KUBERNETES_KDP_DEVICE_ALLOCATION_POLICY` is set to `CDI`.
+    Using internal knowledge to generate the CDI specifications for deployer,
+    if the output file conflicts with other tools generating CDI specifications(e.g., NVIDIA Container Toolkit),
+    please disable this and remove the output file manually.
+    """
     ## Podman
     GPUSTACK_RUNTIME_PODMAN_HOST: str | None = None
     """
@@ -308,6 +339,15 @@ if TYPE_CHECKING:
     Mute the original healthcheck of the container in Podman.
     Default is same as `GPUSTACK_RUNTIME_DOCKER_MUTE_ORIGINAL_HEALTHCHECK`.
     """
+    GPUSTACK_RUNTIME_PODMAN_CDI_SPECS_GENERATE: bool = True
+    """
+    Generate CDI specifications during deployment,
+    requires `GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_DIRECTORY` to be existed.
+    Using internal knowledge to generate the CDI specifications for deployer,
+    if the output file conflicts with other tools generating CDI specifications(e.g., NVIDIA Container Toolkit),
+    please disable this and remove the output file manually.
+    Default is same as `GPUSTACK_RUNTIME_DOCKER_CDI_SPECS_GENERATE`.
+    """
 # --8<-- [start:env-vars-definition]
@@ -479,12 +519,6 @@ variables: dict[str, Callable[[], Any]] = {
         "GPUSTACK_RUNTIME_DEPLOY_LABEL_PREFIX",
         "runtime.gpustack.ai",
     ),
-    "GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_GENERATE": lambda: to_bool(
-        getenv(
-            "GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_GENERATE",
-            "1",
-        ),
-    ),
     "GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_DIRECTORY": lambda: mkdir_path(
         getenv(
             "GPUSTACK_RUNTIME_DEPLOY_CDI_SPECS_DIRECTORY",
@@ -608,6 +642,13 @@ variables: dict[str, Callable[[], Any]] = {
         options=["Env", "CDI"],
         default="Env",
     ),
+    "GPUSTACK_RUNTIME_DOCKER_CDI_SPECS_GENERATE": lambda: ternary(
+        lambda: (
+            getenv("GPUSTACK_RUNTIME_DOCKER_RESOURCE_INJECTION_POLICY", "Env") == "Env"
+        ),
+        lambda: False,
+        lambda: to_bool(getenv("GPUSTACK_RUNTIME_DOCKER_CDI_SPECS_GENERATE", "1")),
+    ),
     ## Kubernetes
     "GPUSTACK_RUNTIME_KUBERNETES_NODE_NAME": lambda: getenv(
         "GPUSTACK_RUNTIME_KUBERNETES_NODE_NAME",
@@ -640,6 +681,46 @@ variables: dict[str, Callable[[], Any]] = {
         options=["Foreground", "Background", "Orphan"],
         default="Foreground",
     ),
+    "GPUSTACK_RUNTIME_KUBERNETES_RESOURCE_INJECTION_POLICY": lambda: choice(
+        getenv(
+            "GPUSTACK_RUNTIME_KUBERNETES_RESOURCE_INJECTION_POLICY",
+        ),
+        options=["Env", "KDP"],
+        default="Env",
+    ),
+    "GPUSTACK_RUNTIME_KUBERNETES_KDP_PER_DEVICE_MAX_ALLOCATIONS": lambda: to_int(
+        getenv(
+            "GPUSTACK_RUNTIME_KUBERNETES_KDP_PER_DEVICE_MAX_ALLOCATIONS",
+            "10",
+        ),
+    ),
+    "GPUSTACK_RUNTIME_KUBERNETES_KDP_DEVICE_ALLOCATION_POLICY": lambda: choice(
+        getenv(
+            "GPUSTACK_RUNTIME_KUBERNETES_KDP_DEVICE_ALLOCATION_POLICY",
+        ),
+        options=["CDI", "Env", "Opaque"],
+        default="CDI",
+    ),
+    "GPUSTACK_RUNTIME_KUBERNETES_KDP_CDI_SPECS_GENERATE": lambda: ternary(
+        lambda: (
+            getenv("GPUSTACK_RUNTIME_KUBERNETES_RESOURCE_INJECTION_POLICY", "Env")
+            == "Env"
+        ),
+        lambda: False,
+        lambda: ternary(
+            lambda: (
+                getenv(
+                    "GPUSTACK_RUNTIME_KUBERNETES_KDP_DEVICE_ALLOCATION_POLICY",
+                    "Opaque",
+                )
+                == "Opaque"
+            ),
+            lambda: False,
+            lambda: to_bool(
+                getenv("GPUSTACK_RUNTIME_KUBERNETES_KDP_CDI_SPECS_GENERATE", "1"),
+            ),
+        ),
+    ),
     ## Podman
     "GPUSTACK_RUNTIME_PODMAN_HOST": lambda: trim_str(
         getenvs(
@@ -697,8 +778,19 @@ variables: dict[str, Callable[[], Any]] = {
             "1",
         ),
     ),
+    "GPUSTACK_RUNTIME_PODMAN_CDI_SPECS_GENERATE": lambda: to_bool(
+        getenvs(
+            [
+                "GPUSTACK_RUNTIME_PODMAN_CDI_SPECS_GENERATE",
+                # Fallback to Docker's setting.
+                "GPUSTACK_RUNTIME_DOCKER_CDI_SPECS_GENERATE",
+            ],
+            "1",
+        ),
+    ),
 }
 # --8<-- [end:env-vars-definition]

gpustack_runtime/logging.py CHANGED Viewed

@@ -1,5 +1,5 @@
 # Borrowed from https://github.com/libp2p/py-libp2p/blob/main/libp2p/utils/logging.py.
-from __future__ import annotations
+from __future__ import annotations as __future_annotations__
 import atexit
 import logging
@@ -133,7 +133,11 @@ def setup_logging():
             module_logger.propagate = False
     # Configure 3rd-party loggers, set slightly higher level than package level
-    for _3rd in ["docker", "kubernetes"]:
+    for _3rd in [
+        "docker",
+        "kubernetes",
+        "grpc",
+    ]:
         _3rd_logger = logging.getLogger(_3rd)
         _3rd_logger.handlers.clear()
         _3rd_logger.addHandler(queue_handler)

{gpustack_runtime-0.1.40.post1.dist-info → gpustack_runtime-0.1.41.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: gpustack-runtime
-Version: 0.1.40.post1
+Version: 0.1.41
 Summary: GPUStack Runtime is library for detecting GPU resources and launching GPU workloads.
 Project-URL: Homepage, https://github.com/gpustack/runtime
 Project-URL: Bug Tracker, https://github.com/gpustack/gpustack/issues
@@ -14,14 +14,19 @@ Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: 3.13
 Requires-Python: >=3.10
 Requires-Dist: argcomplete>=3.6.3
+Requires-Dist: cachetools>=5.5.2
 Requires-Dist: docker>=7.1.0
 Requires-Dist: gpustack-runner>=0.1.24.post1
+Requires-Dist: grpc-interceptor>=0.15.4
+Requires-Dist: grpcio>=1.76.0
 Requires-Dist: kubernetes>=33.1.0
 Requires-Dist: mthreads-ml-py>=2.2.10
 Requires-Dist: nvidia-ml-py>=13.580.65
 Requires-Dist: podman==5.6.0
+Requires-Dist: protobuf>=5.28.3
 Requires-Dist: pyyaml
 Requires-Dist: tqdm
+Requires-Dist: types-protobuf>=6.32.1.20251210
 Description-Content-Type: text/markdown
 # GPUStack Runtime

gpustack_runtime-0.1.41.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,67 @@
+gpustack_runtime/__init__.py,sha256=Xw_PVWneitx-8QmW6sJQeymj6zVbEgEndGhIB_km6TI,186
+gpustack_runtime/__main__.py,sha256=O9yJKcN7vg0Ppgc13qesxHwST2wkH3ccOkTQXPWHnNA,3939
+gpustack_runtime/_version.py,sha256=3VyVzUi8Smv4sZH0Q9rdGQXWEqqoTm7L84ArFLnPqZM,777
+gpustack_runtime/_version.pyi,sha256=A42NoSgcqEXVy2OeNm4LXC9CbyonbooYrSUBlPm2lGY,156
+gpustack_runtime/envs.py,sha256=cprrZ-c4owsRLq7M__DlfpK6Ob9zbqMzRGVOsPTMJX0,38583
+gpustack_runtime/logging.py,sha256=wMPriPpOuVsuClsjMh0qwEPQKyJiJa89ggdDjqkk7i0,6934
+gpustack_runtime/cmds/__init__.py,sha256=-_X2O2lBn6KcdLGUzhL3lEjQC4_cwA36fvWDnFAgtVM,1382
+gpustack_runtime/cmds/__types__.py,sha256=TBnUWUqzTkDtJnsMv363kdw-H8fOf-XQYbOvrmQif-M,815
+gpustack_runtime/cmds/deployer.py,sha256=KvhPhU6ZW-UV6vLykI5adKI1ThgVFFJqWaII3n4OhL8,32846
+gpustack_runtime/cmds/detector.py,sha256=AALcoqCiNuwYucKBnyj7r5ScOWc_BSzAhHR2C0QbEHE,8750
+gpustack_runtime/cmds/images.py,sha256=7tb-D3G4yqLPkbS9aSuWI1bD3DYK8BLbPbgqac56blI,594
+gpustack_runtime/deployer/__init__.py,sha256=impMrmvkMjuCBthsn3QUz3LuwpmmNAymHJKJ2o6SZoc,16249
+gpustack_runtime/deployer/__patches__.py,sha256=cTBge8BT6IsY5MzETKY3kN28k3igYfNj7pcpgDzfDzw,17849
+gpustack_runtime/deployer/__types__.py,sha256=PgIWogHOvHKsHoeBjmKFEEM3JrKck89Mmnwlfx01BbE,72248
+gpustack_runtime/deployer/__utils__.py,sha256=paQu2M1UeoSfQPsiskmAqJSiln-8qwibTssEoWFMLec,21109
+gpustack_runtime/deployer/docker.py,sha256=bOaXbTnaalbO42FlyWR1Ha26Y30LGWPzWKPV5Q-Nk7g,85039
+gpustack_runtime/deployer/kuberentes.py,sha256=2M0RgsR1TlzkZ2QsElKZulftUnUMipYQPeQKKSm_Alo,89387
+gpustack_runtime/deployer/podman.py,sha256=_qdbsTezacRmiXa3n04OUPUsgVy1pSFgJSKxous4s14,82156
+gpustack_runtime/deployer/cdi/__init__.py,sha256=y5fFNLhlrVhWzW-GTazT7xXBukHkBQ0DGfncKqKpBzk,3986
+gpustack_runtime/deployer/cdi/__types__.py,sha256=04DKvcogk7OoHS7TU2Bmht3VVMu7iOEBWTEOvxpHt4w,18399
+gpustack_runtime/deployer/cdi/__utils__.py,sha256=cgqub-TQkXEjujlcQC4hJpignmmgxN5Yq9Rn6Z-TAh8,3866
+gpustack_runtime/deployer/cdi/amd.py,sha256=-eq_SOlC56VX2QscZXvnoeffWSRindhr8zFZmaIcKrE,4082
+gpustack_runtime/deployer/cdi/ascend.py,sha256=lDs75a9--c0lM34xfJqu-_QbfWNFrf4zE-GXPKReBe4,4538
+gpustack_runtime/deployer/cdi/hygon.py,sha256=h6-vQfv03sgxYjMJAf_JOMq9cHFPaNjK1YbUYIiSXck,4117
+gpustack_runtime/deployer/cdi/iluvatar.py,sha256=6nNECZpU5IPP6-5l-O1rzU-ib-WcuwKvDg7ZV__1NE4,3650
+gpustack_runtime/deployer/cdi/metax.py,sha256=tmJBvr-n9pERAp-dXsa54qv6xmxt0rJoJwY36TFdoWk,4143
+gpustack_runtime/deployer/cdi/thead.py,sha256=SvIDKNYZx7FwMPTTxyJ2RRjlr9LXLN8BUYCUhidmiQk,3671
+gpustack_runtime/deployer/k8s/deviceplugin/__init__.py,sha256=RTQfArfX3FmS9lXKTwoWnb2gyqTIiDhRHEGe7MPxLzE,8040
+gpustack_runtime/deployer/k8s/deviceplugin/__types__.py,sha256=QaswnGns_hqMdVPeryDqmyhJrAHu_pfAlIC_25NHp4k,3057
+gpustack_runtime/deployer/k8s/deviceplugin/plugin.py,sha256=ktQ44wdNJNnv0Fn-TAnTQN0Jq5ZSqRA09WV407CrPvc,17931
+gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/__init__.py,sha256=3rOYmgDIIJ4idEtwgnumGStH7PaK-J7EYrOnLa9A-8o,118
+gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api.proto,sha256=rmB8RDe4LN5FCVkQ608uS-pl32mk5tt6iGe-g2lKtPs,7919
+gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api_pb2.py,sha256=DzmeyfwekwE0U0dK6WfwX1NQYLEr2mFa1hdaUTxt2f8,8404
+gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api_pb2.pyi,sha256=lq1dbSgBYqJ7zyGfoKKHCyfr6R5vcCGzJxteeyQpbuI,8232
+gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/api_pb2_grpc.py,sha256=GM6EyCEFeyOjL0XOCisbcHurRoLKqKDUI5obsUyTxpE,17446
+gpustack_runtime/deployer/k8s/types/kubelet/deviceplugin/v1beta1/constants.py,sha256=tpNk3e_cvY67C9RwVsdTNl75YuNXBgsn53fSJIzeTR4,828
+gpustack_runtime/detector/__init__.py,sha256=9i6KOd3Qp_BmnSyPURlOBHlHJMSInqlDTh1kpAbs4_U,8104
+gpustack_runtime/detector/__types__.py,sha256=tiYbxPD6gV5wS79K3d2dUzy6btJl4QcsgunyxtJ240E,13162
+gpustack_runtime/detector/__utils__.py,sha256=QdLWXwsU1_EMxXG5Y29psqnttWJyXWMphHDjiC_6Byc,25153
+gpustack_runtime/detector/amd.py,sha256=qh86xGhPJRIXwiKaHmeyIrsxchUDRpyggR6yc0cLuKw,17553
+gpustack_runtime/detector/ascend.py,sha256=E6YPoREI5r2HZIegUaQb0XwC3Qau1mnkNeCRbgtlE5k,17992
+gpustack_runtime/detector/cambricon.py,sha256=GzXlS4et8zape0rr19d1EwSV9cfFEmHgaElTVMjR3IY,3947
+gpustack_runtime/detector/hygon.py,sha256=R4I8h66YHJC00iAtDJhBX772VMKUdZ8nleRXZFPUt3Q,12299
+gpustack_runtime/detector/iluvatar.py,sha256=bqciqjYE_tIxBg2PSOlIzH3WcFYBgTDjfN6nT90LSGg,10206
+gpustack_runtime/detector/metax.py,sha256=W4NSZD7Kf5431B63UBpYnKIk2Jz1SutEpwXkwgYfmfE,10374
+gpustack_runtime/detector/mthreads.py,sha256=GcElUIMvU5C6P4Fx_X_kSOsJps8WZ47tkZ2B2MJZmk4,12131
+gpustack_runtime/detector/nvidia.py,sha256=xdvoMdNx943on5fd_mI3WI_85kMY-0dYm5NU3vqXb9M,33400
+gpustack_runtime/detector/thead.py,sha256=43TGPq78FulpYBUeEMVxDTY-0X3ve2FsX4Hsd0Lswy0,25561
+gpustack_runtime/detector/pyacl/__init__.py,sha256=UQjaBxP7nJNyzr08N8_lH-5wPtnFmUY9pyQhs6vIChU,16232
+gpustack_runtime/detector/pyamdgpu/__init__.py,sha256=x-UO07EpKEgfTLmXQOD6j9f6kibuvDC7riQFof3YGdw,8617
+gpustack_runtime/detector/pyamdsmi/__init__.py,sha256=800-khq2w6HLgXM12RkhcdvXBGeAJ4s1_TWJyHebCMk,955
+gpustack_runtime/detector/pycuda/__init__.py,sha256=p-Na5eBjdsFGXPHCEEUfFj5TQFjPxPQGV0i4oU6ywBA,16922
+gpustack_runtime/detector/pydcmi/__init__.py,sha256=zCeImelWgbPDn51dJgp3LlCK-uGOuHmmPGiOsyYB3cI,37264
+gpustack_runtime/detector/pyhgml/__init__.py,sha256=Yp9s-QhHS4ck7Iq9kd4v6a4BruyJQcuOTYlyYSmnOgI,182896
+gpustack_runtime/detector/pyhgml/libhgml.so,sha256=BPzGVBpzrMX1tSvbXddq8Q0Qhi8w-No2JXX8sRxTioI,2101640
+gpustack_runtime/detector/pyhgml/libuki.so,sha256=EE6v1vIYYT4FSDMMm9rSfAqwrwIPFD-4_6KtP51lSps,702352
+gpustack_runtime/detector/pyhsa/__init__.py,sha256=4DuGnBBMUVOCPa6vTx3XT5mffGrKk6M6CYbUWBoMTJ0,15792
+gpustack_runtime/detector/pyixml/__init__.py,sha256=6ss_Dyl8lIT4WrKpfwmQqzBmg4Bxi38vg_eey_wsSY0,162681
+gpustack_runtime/detector/pymxsml/__init__.py,sha256=YxfNHq7TWd7CpNroP45BGXhcWNpY_sXgVzNGtx68DII,45409
+gpustack_runtime/detector/pyrocmcore/__init__.py,sha256=rgwIdPS-7GG7_5luRMR1XG9QyNM3lJh5ryD7kfZqpWg,2523
+gpustack_runtime/detector/pyrocmsmi/__init__.py,sha256=ACwRtJWVIuJ4NTcBJxk0zrVb_qtDOMkApMdbJoag5g0,11906
+gpustack_runtime/_version_appendix.py,sha256=C8KJWDWnWAHNEMYzKYXyeA2PTIO31o7aTAhQlRkmhUA,23
+gpustack_runtime-0.1.41.dist-info/METADATA,sha256=RDItHofAkys1Iqn6uwI03D6nqq-QrrMOcaJ43Iu2XH4,2358
+gpustack_runtime-0.1.41.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
+gpustack_runtime-0.1.41.dist-info/entry_points.txt,sha256=bBO_61GxP6dIT74uZwbSDgW5Vt2pTePUS3CgjUJkUgg,68
+gpustack_runtime-0.1.41.dist-info/licenses/LICENSE,sha256=OiPibowBvB-NHV3TP_NOj18XNBlXcshXZFMpa3uvKVE,10362
+gpustack_runtime-0.1.41.dist-info/RECORD,,

gpustack-runtime 0.1.40.post1__py3-none-any.whl → 0.1.41__py3-none-any.whl

gpustack-runtime 0.1.40.post1__py3-none-any.whl → 0.1.41__py3-none-any.whl