PyPI - mate-runtime-cuda - Versions diffs - 0.1.0__tar.gz - Mend

mate-runtime-cuda 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10) hide show

mate_runtime_cuda-0.1.0/.gitignore +30 -0
mate_runtime_cuda-0.1.0/PKG-INFO +15 -0
mate_runtime_cuda-0.1.0/README.md +19 -0
mate_runtime_cuda-0.1.0/pyproject.toml +41 -0
mate_runtime_cuda-0.1.0/src/mate_runtime_cuda/__init__.py +28 -0
mate_runtime_cuda-0.1.0/src/mate_runtime_cuda/_detect.py +85 -0
mate_runtime_cuda-0.1.0/src/mate_runtime_cuda/_names.py +95 -0
mate_runtime_cuda-0.1.0/tests/__init__.py +0 -0
mate_runtime_cuda-0.1.0/tests/fixtures.py +11 -0
mate_runtime_cuda-0.1.0/tests/test_detect.py +136 -0

mate_runtime_cuda-0.1.0/.gitignore ADDED Viewed

@@ -0,0 +1,30 @@
+# Python
+.venv/
+__pycache__/
+*.py[cod]
+*.egg-info/
+dist/
+build/
+.pytest_cache/
+# uv
+uv.lock
+# Node / Cloudflare Worker
+worker/node_modules/
+worker/.wrangler/
+worker/dist/
+# Results (local benchmark output)
+results/
+# Secrets / local config
+.env
+*.env.local
+# OS
+.DS_Store
+Thumbs.db
+# Internal planning notes
+BENCH_NOTES.md

mate_runtime_cuda-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,15 @@
+Metadata-Version: 2.4
+Name: mate-runtime-cuda
+Version: 0.1.0
+Summary: NVIDIA CUDA runtime plugin for mate-bench
+Project-URL: Homepage, https://github.com/T0nd3/mate-bench
+Project-URL: Repository, https://github.com/T0nd3/mate-bench
+Author-email: Benjamin Fäuster <benjamin.faeuster@web.de>
+License: MIT
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Topic :: System :: Benchmark
+Requires-Python: >=3.11
+Requires-Dist: mate-bench<0.2,>=0.1

mate_runtime_cuda-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,19 @@
+# mate-runtime-cuda
+NVIDIA CUDA runtime plugin for [mate-bench](https://github.com/T0nd3/mate-bench).
+Detects the GPU name, chip codename, VRAM size, CUDA version and driver version by querying `nvidia-smi`.
+```bash
+pip install mate-bench mate-runtime-cuda
+mate list-runtimes
+```
+## Requirements
+- NVIDIA GPU with drivers installed (`nvidia-smi` must be in PATH)
+- CUDA 11.x or newer
+## Supported GPUs
+Pascal (GTX 10xx) through Blackwell (RTX 50xx), including data centre GPUs (A100, H100, V100).

mate_runtime_cuda-0.1.0/pyproject.toml ADDED Viewed

@@ -0,0 +1,41 @@
+[project]
+name = "mate-runtime-cuda"
+version = "0.1.0"
+description = "NVIDIA CUDA runtime plugin for mate-bench"
+requires-python = ">=3.11"
+license = {text = "MIT"}
+authors = [{name = "Benjamin Fäuster", email = "benjamin.faeuster@web.de"}]
+classifiers = [
+    "License :: OSI Approved :: MIT License",
+    "Programming Language :: Python :: 3",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
+    "Topic :: System :: Benchmark",
+]
+dependencies = [
+    "mate-bench>=0.1,<0.2",
+]
+[project.urls]
+Homepage = "https://github.com/T0nd3/mate-bench"
+Repository = "https://github.com/T0nd3/mate-bench"
+[project.entry-points."mate_bench.runtime"]
+cuda = "mate_runtime_cuda:CudaRuntime"
+[tool.mate-bench]
+requires_mate_bench = ">=0.1,<0.2"
+api_version = 1
+[dependency-groups]
+dev = ["pytest>=8.0", "ruff>=0.4"]
+[tool.pytest.ini_options]
+markers = ["integration: requires an NVIDIA GPU with CUDA drivers"]
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+[tool.hatch.build.targets.wheel]
+packages = ["src/mate_runtime_cuda"]

mate_runtime_cuda-0.1.0/src/mate_runtime_cuda/__init__.py ADDED Viewed

@@ -0,0 +1,28 @@
+from __future__ import annotations
+from typing import Any
+from mate_bench.plugin import PluginManifest
+from ._detect import GpuInfo, is_cuda_available, query_gpu
+class CudaRuntime:
+    """mate-bench runtime plugin that describes NVIDIA GPUs.
+    All detection work is delegated to ``is_cuda_available`` and ``query_gpu``
+    from the sibling ``_detect`` module.
+    """
+    name = "cuda"
+    manifest = PluginManifest(requires_mate_bench=">=0.1,<0.2", api_version=1)
+    def is_available(self) -> bool:
+        """Return the result of ``is_cuda_available()`` unchanged."""
+        available = is_cuda_available()
+        return available
+    def gpu_info(self, index: int = 0) -> dict[str, Any]:
+        """Describe the GPU at ``index`` as a flat dictionary.
+        Exceptions raised by ``query_gpu`` propagate to the caller.
+        """
+        gpu: GpuInfo = query_gpu(index)
+        details: dict[str, Any] = {"gpu_vendor": "nvidia"}
+        details["gpu_name"] = gpu.name
+        details["gpu_chip"] = gpu.chip
+        details["vram_gb"] = gpu.vram_gb
+        details["runtime"] = gpu.cuda_version
+        details["driver"] = gpu.driver_version
+        # Underscore-prefixed keys carry the raw name and the "known model" flag.
+        details["_gpu_name_raw"] = gpu.name_raw
+        details["_gpu_name_known"] = gpu.name_known
+        return details

mate_runtime_cuda-0.1.0/src/mate_runtime_cuda/_detect.py ADDED Viewed

@@ -0,0 +1,85 @@
+from __future__ import annotations
+import re
+import subprocess
+from dataclasses import dataclass
+from ._names import chip_from_name, normalize
+@dataclass
+class GpuInfo:
+    """One GPU as described by nvidia-smi plus the derived name/chip data.
+    Fields:
+        chip: die codename, e.g. "AD102"
+        name: normalized display name, e.g. "RTX 4090"
+        name_raw: name exactly as reported by nvidia-smi,
+            e.g. "NVIDIA GeForce RTX 4090"
+        name_known: False for an unknown model, which is stored raw and flagged
+        vram_gb: total video memory in GB
+        cuda_version: e.g. "CUDA 12.4"
+        driver_version: e.g. "550.54.15"
+    """
+    chip: str
+    name: str
+    name_raw: str
+    name_known: bool
+    vram_gb: float
+    cuda_version: str
+    driver_version: str
+def is_cuda_available() -> bool:
+    """Return True when ``nvidia-smi -L`` lists at least one GPU.
+    Returns False when nvidia-smi cannot be run (``_run`` then yields "") or
+    when its output contains no ``GPU <n>: ...`` entry.
+    """
+    listing = _run(["nvidia-smi", "-L"])
+    # Look for an actual device line instead of "any output": text that is not
+    # a device listing (e.g. a diagnostic message) must not count as a GPU.
+    return any(line.lstrip().startswith("GPU ") for line in listing.splitlines())
+def query_gpu(index: int = 0) -> GpuInfo:
+    """Query GPU info for the given device index via nvidia-smi.
+    Args:
+        index: zero-based position of the GPU in nvidia-smi's output.
+    Returns:
+        A ``GpuInfo`` holding the normalized name, chip codename, VRAM in GB
+        (reported MiB / 1024, rounded to one decimal), CUDA version and
+        driver version.
+    Raises:
+        RuntimeError: nvidia-smi produced no output, or produced a line that
+            does not contain all requested columns.
+        IndexError: ``index`` is negative or not below the number of GPUs.
+    """
+    fields = ["name", "memory.total", "driver_version", "cuda_version"]
+    # NOTE(review): confirm that every targeted driver accepts ``cuda_version``
+    # as a --query-gpu field (see ``nvidia-smi --help-query-gpu``).
+    rows = _query_smi(fields, units=False)
+    if not rows:
+        raise RuntimeError("No NVIDIA GPU found. Are the drivers installed?")
+    # If the output is not the requested CSV (for example a diagnostic message),
+    # surface it instead of failing later with "list index out of range".
+    malformed = [row for row in rows if len(row) < len(fields)]
+    if malformed:
+        raise RuntimeError(f"Unexpected nvidia-smi output: {','.join(malformed[0]).strip()!r}")
+    # A negative index would otherwise silently wrap around to the last GPU.
+    if not 0 <= index < len(rows):
+        raise IndexError(f"GPU index {index} out of range ({len(rows)} GPUs found)")
+    row = rows[index]
+    raw_name = row[0].strip()
+    vram_mib = _parse_float(row[1])
+    driver = row[2].strip()
+    cuda = row[3].strip()
+    name, name_known = normalize(raw_name)
+    chip, chip_known = chip_from_name(name)
+    if not chip_known:
+        chip = name  # fall back to display name as chip key
+    return GpuInfo(
+        chip=chip,
+        name=name,
+        name_raw=raw_name,
+        # Only flagged as known when the name also resolved to a chip codename.
+        name_known=name_known and chip_known,
+        vram_gb=round(vram_mib / 1024, 1),
+        cuda_version=f"CUDA {cuda}" if cuda else "CUDA unknown",
+        driver_version=driver or "unknown",
+    )
+# ── internal helpers ──────────────────────────────────────────────────────────
+def _run(cmd: list[str], timeout: int = 10) -> str:
+    """Execute ``cmd`` and hand back its captured stdout as text.
+    Best-effort helper: if the executable is missing, another ``OSError``
+    occurs, or the command runs longer than ``timeout`` seconds, "" is
+    returned. The exit status is not inspected.
+    """
+    try:
+        completed = subprocess.run(cmd, capture_output=True, text=True, timeout=timeout)
+    except (subprocess.TimeoutExpired, OSError):
+        # FileNotFoundError is an OSError subclass, so it is covered here too.
+        return ""
+    return completed.stdout
+def _query_smi(fields: list[str], units: bool = False) -> list[list[str]]:
+    """Run ``nvidia-smi --query-gpu`` for ``fields`` and split the CSV reply.
+    Returns one list per non-blank output line, produced by splitting that
+    line on ","; cells are not stripped and may keep surrounding whitespace.
+    An empty or whitespace-only reply gives []. With ``units=False`` the
+    ``nounits`` option is appended to the output format.
+    """
+    fmt = "--format=csv,noheader"
+    if not units:
+        fmt += ",nounits"
+    query = "--query-gpu=" + ",".join(fields)
+    output = _run(["nvidia-smi", query, fmt]).strip()
+    if not output:
+        return []
+    rows: list[list[str]] = []
+    for line in output.splitlines():
+        if line.strip():
+            rows.append(line.split(","))
+    return rows
+def _parse_float(s: str) -> float:
+    """Return the first decimal number found in ``s``, or 0.0 if there is none.
+    Only a well-formed number is extracted (digits with an optional fractional
+    part, or a leading-dot fraction), so inputs such as "." or "1.2.3" no
+    longer make ``float()`` raise ``ValueError``.
+    """
+    # A bare character class like [\d.]+ would also capture "." or "1.2.3".
+    m = re.search(r"\d+(?:\.\d*)?|\.\d+", s)
+    return float(m.group()) if m else 0.0

mate_runtime_cuda-0.1.0/src/mate_runtime_cuda/_names.py ADDED Viewed

@@ -0,0 +1,95 @@
+from __future__ import annotations
+import re
+# (substring to match in normalized name, chip codename)
+# Ordered from most specific to least specific.
+# chip_from_name() returns the first entry whose substring occurs in the name,
+# so a longer key (e.g. "RTX 4070 Ti Super") must come before the shorter keys
+# it contains ("RTX 4070 Ti", "RTX 4070").
+_GPU_CHIP_MAP: list[tuple[str, str]] = [
+    # Blackwell — RTX 50xx
+    ("RTX 5090", "GB202"),
+    ("RTX 5080", "GB203"),
+    ("RTX 5070 Ti", "GB203"),
+    ("RTX 5070", "GB205"),
+    ("RTX 5060 Ti", "GB206"),
+    ("RTX 5060", "GB206"),
+    # Ada Lovelace — RTX 40xx + professional
+    ("RTX 6000 Ada", "AD102"),
+    ("RTX 4090", "AD102"),
+    ("RTX 4080 Super", "AD103"),
+    ("RTX 4080", "AD103"),
+    ("RTX 4070 Ti Super", "AD103"),
+    ("RTX 4070 Ti", "AD104"),
+    ("RTX 4070 Super", "AD104"),
+    ("RTX 4070", "AD104"),
+    ("RTX 4500 Ada", "AD104"),
+    ("RTX 4000 Ada", "AD104"),
+    ("RTX 4060 Ti", "AD106"),
+    ("RTX 4060", "AD107"),
+    # Hopper
+    # NOTE(review): "GH200" looks like a product name rather than a die
+    # codename — confirm whether H200 should map to "GH100" like H100.
+    ("H200", "GH200"),
+    ("H100", "GH100"),
+    # Ampere — data centre
+    ("A100", "GA100"),
+    ("A800", "GA100"),
+    ("RTX A6000", "GA102"),
+    ("RTX A5000", "GA102"),
+    ("RTX A4000", "GA104"),
+    ("RTX A3000", "GA104"),
+    ("RTX A2000", "GA106"),
+    # Ampere — RTX 30xx
+    ("RTX 3090 Ti", "GA102"),
+    ("RTX 3090", "GA102"),
+    ("RTX 3080 Ti", "GA102"),
+    ("RTX 3080", "GA102"),
+    ("RTX 3070 Ti", "GA104"),
+    ("RTX 3070", "GA104"),
+    ("RTX 3060 Ti", "GA104"),
+    ("RTX 3060", "GA106"),
+    ("RTX 3050", "GA107"),
+    # Volta
+    ("Titan V", "GV100"),
+    ("V100", "GV100"),
+    # Turing — RTX 20xx
+    ("RTX 2080 Ti", "TU102"),
+    ("RTX 2080 Super", "TU104"),
+    ("RTX 2080", "TU104"),
+    ("RTX 2070 Super", "TU104"),
+    ("RTX 2070", "TU106"),
+    ("RTX 2060 Super", "TU106"),
+    ("RTX 2060", "TU106"),
+    # Turing — GTX 16xx
+    ("GTX 1660 Ti", "TU116"),
+    ("GTX 1660 Super", "TU116"),
+    ("GTX 1660", "TU116"),
+    ("GTX 1650 Super", "TU116"),
+    ("GTX 1650", "TU117"),
+    # Pascal — GTX 10xx
+    ("Titan Xp", "GP102"),
+    ("GTX 1080 Ti", "GP102"),
+    ("GTX 1080", "GP104"),
+    ("GTX 1070 Ti", "GP104"),
+    ("GTX 1070", "GP104"),
+    ("GTX 1060", "GP106"),
+    ("GTX 1050 Ti", "GP107"),
+    ("GTX 1050", "GP107"),
+]
+# Matches, at the start of the string only and case-insensitively, an optional
+# "NVIDIA " followed by an optional "GeForce ", "Tesla " or "Quadro " word.
+_STRIP_PREFIX = re.compile(r"^(?:NVIDIA\s+)?(?:GeForce\s+|Tesla\s+|Quadro\s+)?", re.IGNORECASE)
+def normalize(raw: str) -> tuple[str, bool]:
+    """Return (display_name, is_known_chip) for a raw GPU name.
+    The display name is ``raw`` with the leading vendor/product-line words
+    matched by ``_STRIP_PREFIX`` removed and surrounding whitespace trimmed.
+    The flag is whatever ``chip_from_name`` reports for that display name.
+    """
+    without_prefix = _STRIP_PREFIX.sub("", raw)
+    display = without_prefix.strip()
+    # Only the "known" half of the lookup is needed here; the codename is dropped.
+    known = chip_from_name(display)[1]
+    return display, known
+def chip_from_name(normalized: str) -> tuple[str, bool]:
+    """Return (chip_codename, is_known) for a normalized GPU name.
+    The name is matched case-insensitively against each ``_GPU_CHIP_MAP`` key
+    in table order and the first hit wins. A key only matches when it is not
+    immediately followed by another digit, so "RTX A1000" is not mistaken for
+    an "A100". When nothing matches, the input itself is returned together
+    with ``False``.
+    """
+    for substring, chip in _GPU_CHIP_MAP:
+        # (?!\d): the model number must end here, e.g. reject "A100" in "A1000".
+        if re.search(re.escape(substring) + r"(?!\d)", normalized, re.IGNORECASE):
+            return chip, True
+    return normalized, False

mate_runtime_cuda-0.1.0/tests/__init__.py ADDED Viewed

File without changes

mate_runtime_cuda-0.1.0/tests/fixtures.py ADDED Viewed

@@ -0,0 +1,11 @@
+# Canned nvidia-smi outputs imported by tests/test_detect.py.
+# nvidia-smi --query-gpu=name,memory.total,driver_version,cuda_version --format=csv,noheader,nounits
+# Columns, in order: name, memory.total, driver_version, cuda_version.
+SMI_RTX4090 = "NVIDIA GeForce RTX 4090, 24564, 550.54.15, 12.4"
+SMI_RTX3080 = "NVIDIA GeForce RTX 3080, 10240, 535.183.01, 12.2"
+SMI_A100 = "NVIDIA A100-SXM4-80GB, 81920, 520.61.05, 11.8"
+# A name that matches no chip-map entry, for the "unknown model" path.
+SMI_UNKNOWN = "NVIDIA SomeUnknownGPU, 8192, 550.54.15, 12.4"
+# No output at all.
+SMI_EMPTY = ""
+# nvidia-smi -L
+SMI_LIST_RTX4090 = "GPU 0: NVIDIA GeForce RTX 4090 (UUID: GPU-abc123)\n"
+SMI_LIST_EMPTY = ""

mate_runtime_cuda-0.1.0/tests/test_detect.py ADDED Viewed

@@ -0,0 +1,136 @@
+from __future__ import annotations
+from unittest.mock import patch
+import pytest
+from mate_runtime_cuda._detect import _query_smi, is_cuda_available, query_gpu
+from mate_runtime_cuda._names import chip_from_name, normalize
+from .fixtures import (
+    SMI_A100,
+    SMI_EMPTY,
+    SMI_LIST_EMPTY,
+    SMI_LIST_RTX4090,
+    SMI_RTX3080,
+    SMI_RTX4090,
+    SMI_UNKNOWN,
+)
+# ── is_cuda_available ─────────────────────────────────────────────────────────
+class TestIsCudaAvailable:
+    """is_cuda_available() with the ``_run`` subprocess helper patched out."""
+    def test_available_when_smi_returns_output(self):
+        # A listing containing one GPU entry must be reported as available.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_LIST_RTX4090):
+            assert is_cuda_available() is True
+    def test_unavailable_when_smi_empty(self):
+        # Empty output must be reported as unavailable.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_LIST_EMPTY):
+            assert is_cuda_available() is False
+# ── _query_smi ────────────────────────────────────────────────────────────────
+class TestQuerySmi:
+    """_query_smi() row parsing, with ``_run`` patched to return fixture text."""
+    def test_parses_rtx4090_row(self):
+        # One output line yields one row; the first cell holds the GPU name.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_RTX4090):
+            rows = _query_smi(["name", "memory.total", "driver_version", "cuda_version"])
+        assert len(rows) == 1
+        assert "RTX 4090" in rows[0][0]
+    def test_empty_returns_empty_list(self):
+        # No output at all yields an empty list rather than an empty row.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_EMPTY):
+            assert _query_smi(["name"]) == []
+# ── query_gpu ─────────────────────────────────────────────────────────────────
+class TestQueryGpu:
+    """query_gpu() end to end, with ``_run`` patched to return fixture text."""
+    def test_rtx4090(self):
+        # Checks every GpuInfo field; 24564 MiB / 1024 rounds to 24.0 GB.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_RTX4090):
+            info = query_gpu(0)
+        assert info.chip == "AD102"
+        assert info.name == "RTX 4090"
+        assert info.name_raw == "NVIDIA GeForce RTX 4090"
+        assert info.name_known is True
+        assert info.vram_gb == 24.0
+        assert info.cuda_version == "CUDA 12.4"
+        assert info.driver_version == "550.54.15"
+    def test_rtx3080(self):
+        # 10240 MiB / 1024 is exactly 10.0 GB.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_RTX3080):
+            info = query_gpu(0)
+        assert info.chip == "GA102"
+        assert info.name == "RTX 3080"
+        assert info.vram_gb == 10.0
+    def test_a100(self):
+        # The raw name carries a "-SXM4-80GB" suffix but still resolves to GA100.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_A100):
+            info = query_gpu(0)
+        assert info.chip == "GA100"
+        assert info.vram_gb == 80.0
+    def test_unknown_gpu_not_known(self):
+        # An unmapped model keeps its prefix-stripped name and is flagged unknown.
+        with patch("mate_runtime_cuda._detect._run", return_value=SMI_UNKNOWN):
+            info = query_gpu(0)
+        assert info.name_known is False
+        assert info.name == "SomeUnknownGPU"
+    def test_no_gpu_raises(self):
+        # Empty nvidia-smi output must raise RuntimeError with the documented message.
+        with (
+            patch("mate_runtime_cuda._detect._run", return_value=SMI_EMPTY),
+            pytest.raises(RuntimeError, match="No NVIDIA GPU found"),
+        ):
+            query_gpu(0)
+    def test_index_out_of_range_raises(self):
+        # Only one GPU row is available, so index 1 is out of range.
+        with (
+            patch("mate_runtime_cuda._detect._run", return_value=SMI_RTX4090),
+            pytest.raises(IndexError),
+        ):
+            query_gpu(1)
+# ── normalize & chip_from_name ────────────────────────────────────────────────
+class TestNormalize:
+    """normalize() prefix stripping and chip_from_name() codename lookup."""
+    @pytest.mark.parametrize(
+        "raw, expected_name",
+        [
+            ("NVIDIA GeForce RTX 4090", "RTX 4090"),
+            ("NVIDIA GeForce RTX 3080", "RTX 3080"),
+            ("NVIDIA A100-SXM4-80GB", "A100-SXM4-80GB"),
+            ("NVIDIA GeForce GTX 1080 Ti", "GTX 1080 Ti"),
+            ("NVIDIA GeForce RTX 2080 Ti", "RTX 2080 Ti"),
+        ],
+    )
+    def test_strips_prefix(self, raw, expected_name):
+        # Only the leading "NVIDIA"/"GeForce" words are removed; suffixes stay.
+        name, _ = normalize(raw)
+        assert name == expected_name
+    @pytest.mark.parametrize(
+        "raw, expected_chip",
+        [
+            ("NVIDIA GeForce RTX 4090", "AD102"),
+            ("NVIDIA GeForce RTX 3090", "GA102"),
+            ("NVIDIA GeForce RTX 3080", "GA102"),
+            ("NVIDIA GeForce RTX 3070", "GA104"),
+            ("NVIDIA GeForce RTX 2080 Ti", "TU102"),
+            ("NVIDIA GeForce GTX 1080 Ti", "GP102"),
+            ("NVIDIA H100", "GH100"),
+            ("NVIDIA A100-SXM4-80GB", "GA100"),
+        ],
+    )
+    def test_known_chips(self, raw, expected_chip):
+        # Normalize first, then look up the codename for the stripped name.
+        name, _ = normalize(raw)
+        chip, known = chip_from_name(name)
+        assert chip == expected_chip
+        assert known is True
+    def test_unknown_chip(self):
+        # A name matching no map entry is reported as not known.
+        _, known = normalize("NVIDIA Futuristic GPU XYZ")
+        assert known is False