vec-inf 0.5.0__py3-none-any.whl → 0.6.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,178 @@
1
+ """Class for generating SLURM scripts to run vLLM servers.
2
+
3
+ This module provides functionality to generate SLURM scripts for running vLLM servers
4
+ in both single-node and multi-node configurations.
5
+ """
6
+
7
+ from datetime import datetime
8
+ from pathlib import Path
9
+ from typing import Any
10
+
11
+ from vec_inf.client._client_vars import (
12
+ SLURM_JOB_CONFIG_ARGS,
13
+ SLURM_SCRIPT_TEMPLATE,
14
+ )
15
+
16
+
17
class SlurmScriptGenerator:
    """Generate SLURM batch scripts that launch vLLM servers.

    Supports single-node and multi-node deployments and two virtualization
    environments (a Python venv or a Singularity container), assembling the
    script from the shared ``SLURM_SCRIPT_TEMPLATE`` fragments.

    Parameters
    ----------
    params : dict[str, Any]
        Configuration parameters for the SLURM script. Contains settings for
        job configuration, model parameters, and virtualization environment.
    """

    def __init__(self, params: dict[str, Any]):
        """Store the configuration and derive convenience attributes.

        Parameters
        ----------
        params : dict[str, Any]
            Configuration parameters for the SLURM script.
        """
        self.params = params
        # Multi-node mode changes both the shebang and the server setup.
        self.is_multinode = int(self.params["num_nodes"]) > 1
        self.use_singularity = self.params["venv"] == "singularity"
        binds = self.params.get("bind", "")
        # Pre-render the extra --bind flag once; empty/missing binds add nothing.
        self.additional_binds = f" --bind {binds}" if binds else binds
        self.model_weights_path = str(
            Path(params["model_weights_parent_dir"], params["model_name"])
        )

    def _generate_script_content(self) -> str:
        """Assemble the complete SLURM script.

        Returns
        -------
        str
            The complete SLURM script as a string.
        """
        sections = [
            self._generate_shebang(),
            self._generate_server_setup(),
            self._generate_launch_cmd(),
        ]
        return "\n".join(sections)

    def _generate_shebang(self) -> str:
        """Build the #SBATCH header from the configured job options.

        Returns
        -------
        str
            SLURM shebang containing job specifications.
        """
        header = [SLURM_SCRIPT_TEMPLATE["shebang"]["base"]]
        # Only emit #SBATCH lines for options the caller actually set.
        header += [
            f"#SBATCH --{arg}={self.params[key]}"
            for arg, key in SLURM_JOB_CONFIG_ARGS.items()
            if self.params.get(key)
        ]
        if self.is_multinode:
            header.extend(SLURM_SCRIPT_TEMPLATE["shebang"]["multinode"])
        return "\n".join(header)

    def _generate_server_setup(self) -> str:
        """Build the server-initialization section of the script.

        Covers optional Singularity setup, environment variables, Ray
        initialization for multi-node runs, vLLM port discovery, and the
        JSON status file.

        Returns
        -------
        str
            Server initialization script content.
        """
        parts = ["\n"]
        if self.use_singularity:
            parts.append("\n".join(SLURM_SCRIPT_TEMPLATE["singularity_setup"]))
        parts.append("\n".join(SLURM_SCRIPT_TEMPLATE["env_vars"]))
        parts.append(
            SLURM_SCRIPT_TEMPLATE["imports"].format(src_dir=self.params["src_dir"])
        )
        if self.is_multinode:
            setup = "\n".join(SLURM_SCRIPT_TEMPLATE["server_setup"]["multinode"])
            if self.use_singularity:
                # The multinode template carries a placeholder where the
                # singularity invocation must be spliced in.
                singularity_cmd = SLURM_SCRIPT_TEMPLATE["singularity_command"].format(
                    model_weights_path=self.model_weights_path,
                    additional_binds=self.additional_binds,
                )
                setup = setup.replace("SINGULARITY_PLACEHOLDER", singularity_cmd)
        else:
            setup = "\n".join(SLURM_SCRIPT_TEMPLATE["server_setup"]["single_node"])
        parts.append(setup)
        parts.append("\n".join(SLURM_SCRIPT_TEMPLATE["find_vllm_port"]))
        parts.append(
            "\n".join(SLURM_SCRIPT_TEMPLATE["write_to_json"]).format(
                log_dir=self.params["log_dir"],
                model_name=self.params["model_name"],
            )
        )
        return "\n".join(parts)

    def _generate_launch_cmd(self) -> str:
        """Build the vLLM server launch command.

        Handles both virtualization environments: a Singularity invocation
        prefix or a venv activation line.

        Returns
        -------
        str
            Server launch command.
        """
        cmd = ["\n"]
        if self.use_singularity:
            singularity_cmd = SLURM_SCRIPT_TEMPLATE["singularity_command"].format(
                model_weights_path=self.model_weights_path,
                additional_binds=self.additional_binds,
            )
            cmd.append(singularity_cmd + " \\")
        else:
            cmd.append(
                SLURM_SCRIPT_TEMPLATE["activate_venv"].format(venv=self.params["venv"])
            )
        cmd.append(
            "\n".join(SLURM_SCRIPT_TEMPLATE["launch_cmd"]).format(
                model_weights_path=self.model_weights_path,
                model_name=self.params["model_name"],
            )
        )

        # Boolean args become bare flags, everything else "flag value".
        # NOTE(review): a False boolean still emits its flag — presumably
        # vllm_args only ever contains enabled flags; confirm upstream.
        for arg, value in self.params["vllm_args"].items():
            if isinstance(value, bool):
                cmd.append(f" {arg} \\")
            else:
                cmd.append(f" {arg} {value} \\")
        return "\n".join(cmd)

    def write_to_log_dir(self) -> Path:
        """Write the generated SLURM script to the log directory.

        Creates a timestamped script file in the configured log directory.

        Returns
        -------
        Path
            Path to the generated SLURM script file.
        """
        stamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        target = (
            Path(self.params["log_dir"])
            / f"launch_{self.params['model_name']}_{stamp}.slurm"
        )
        target.write_text(self._generate_script_content())
        return target
@@ -0,0 +1,287 @@
1
+ """Utility functions shared between CLI and API.
2
+
3
+ This module provides utility functions for managing SLURM jobs, server status checks,
4
+ and configuration handling for the vector inference package.
5
+ """
6
+
7
+ import json
8
+ import os
9
+ import subprocess
10
+ import warnings
11
+ from pathlib import Path
12
+ from typing import Any, Optional, Union, cast
13
+
14
+ import requests
15
+ import yaml
16
+
17
+ from vec_inf.client._client_vars import MODEL_READY_SIGNATURE
18
+ from vec_inf.client.config import ModelConfig
19
+ from vec_inf.client.models import ModelStatus
20
+ from vec_inf.client.slurm_vars import CACHED_CONFIG
21
+
22
+
23
def run_bash_command(command: str) -> tuple[str, str]:
    """Run *command* through the shell and capture its output.

    Parameters
    ----------
    command : str
        The bash command to execute

    Returns
    -------
    tuple[str, str]
        A tuple containing (stdout, stderr) from the command execution
    """
    # Context manager guarantees the pipes are closed once we have the output.
    with subprocess.Popen(
        command,
        shell=True,
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE,
        text=True,
    ) as proc:
        stdout, stderr = proc.communicate()
    return stdout, stderr
40
+
41
+
42
def read_slurm_log(
    slurm_job_name: str,
    slurm_job_id: int,
    slurm_log_type: str,
    log_dir: Optional[Union[str, Path]],
) -> Union[list[str], str, dict[str, str]]:
    """Read the slurm log file.

    Parameters
    ----------
    slurm_job_name : str
        Name of the SLURM job
    slurm_job_id : int
        ID of the SLURM job
    slurm_log_type : str
        Type of log file to read ('out', 'err', or 'json')
    log_dir : Optional[Union[str, Path]]
        Directory containing log files, if None uses default location

    Returns
    -------
    Union[list[str], str, dict[str, str]]
        Contents of the log file:
        - list[str] for 'out' and 'err' logs
        - dict[str, str] for 'json' logs
        - str for error messages if file not found
    """
    if not log_dir:
        # Default log directory
        models_dir = Path.home() / ".vec-inf-logs"
        # Fix: previously a missing default directory raised an uncaught
        # FileNotFoundError from iterdir(); now it falls through to the
        # "LOG DIR NOT FOUND" return below.
        if models_dir.is_dir():
            # Iterate over all dirs in models_dir, sorted by dir name length
            # in descending order so the most specific prefix matches first.
            for directory in sorted(
                (d for d in models_dir.iterdir() if d.is_dir()),
                key=lambda d: len(d.name),
                reverse=True,
            ):
                if directory.name in slurm_job_name:
                    log_dir = directory
                    break
    else:
        log_dir = Path(log_dir)

    # If log_dir is still not set, then didn't find the log dir at default location
    if not log_dir:
        return "LOG DIR NOT FOUND"

    # Built outside the try block so the except handler can always reference it.
    file_path = (
        Path(log_dir)
        / f"{slurm_job_name}.{slurm_job_id}"
        / f"{slurm_job_name}.{slurm_job_id}.{slurm_log_type}"
    )
    try:
        if slurm_log_type == "json":
            with file_path.open("r") as file:
                json_content: dict[str, str] = json.load(file)
                return json_content
        with file_path.open("r") as file:
            return file.readlines()
    except FileNotFoundError:
        return f"LOG FILE NOT FOUND: {file_path}"
103
+
104
+
105
def is_server_running(
    slurm_job_name: str, slurm_job_id: int, log_dir: Optional[str]
) -> Union[str, ModelStatus, tuple[ModelStatus, str]]:
    """Check if a model is ready to serve requests.

    Parameters
    ----------
    slurm_job_name : str
        Name of the SLURM job
    slurm_job_id : int
        ID of the SLURM job
    log_dir : Optional[str]
        Directory containing log files

    Returns
    -------
    Union[str, ModelStatus, tuple[ModelStatus, str]]
        - str: Error message if logs cannot be read
        - ModelStatus: Current status of the server
        - tuple[ModelStatus, str]: Status and error message if server failed
    """
    log_lines = read_slurm_log(slurm_job_name, slurm_job_id, "err", log_dir)
    # read_slurm_log signals failure with a plain error string.
    if isinstance(log_lines, str):
        return log_lines

    status: Union[str, ModelStatus, tuple[ModelStatus, str]] = ModelStatus.LAUNCHING

    # Later lines win: a ready signature after an earlier error still
    # yields "RUNNING", matching the scan order of the original.
    for line in log_lines:
        if "error" in line.lower():
            status = (ModelStatus.FAILED, line.strip("\n"))
        if MODEL_READY_SIGNATURE in line:
            status = "RUNNING"

    return status
139
+
140
+
141
def get_base_url(slurm_job_name: str, slurm_job_id: int, log_dir: Optional[str]) -> str:
    """Get the base URL of a model.

    Parameters
    ----------
    slurm_job_name : str
        Name of the SLURM job
    slurm_job_id : int
        ID of the SLURM job
    log_dir : Optional[str]
        Directory containing log files

    Returns
    -------
    str
        Base URL of the model server or error message if not found
    """
    log_content = read_slurm_log(slurm_job_name, slurm_job_id, "json", log_dir)
    # A plain string means the log could not be read; pass it through.
    if isinstance(log_content, str):
        return log_content

    json_log = cast(dict[str, str], log_content)
    # Empty or missing address both fall back to the sentinel message.
    return json_log.get("server_address") or "URL NOT FOUND"
164
+
165
+
166
def model_health_check(
    slurm_job_name: str, slurm_job_id: int, log_dir: Optional[str]
) -> tuple[ModelStatus, Union[str, int]]:
    """Check the health of a running model on the cluster.

    Parameters
    ----------
    slurm_job_name : str
        Name of the SLURM job
    slurm_job_id : int
        ID of the SLURM job
    log_dir : Optional[str]
        Directory containing log files

    Returns
    -------
    tuple[ModelStatus, Union[str, int]]
        Tuple containing:
        - ModelStatus: Current status of the model
        - Union[str, int]: Either HTTP status code or error message
    """
    base_url = get_base_url(slurm_job_name, slurm_job_id, log_dir)
    if not base_url.startswith("http"):
        return (ModelStatus.FAILED, base_url)

    # Fix: only rewrite the trailing "/v1" path segment. The previous
    # blanket replace("v1", "health") corrupted URLs whose host or port
    # happened to contain "v1".
    trimmed = base_url.rstrip("/")
    if trimmed.endswith("/v1"):
        health_check_url = trimmed[: -len("v1")] + "health"
    else:
        # Fallback for unexpected URL shapes, preserving the old behavior.
        health_check_url = base_url.replace("v1", "health")

    try:
        # Fix: a timeout prevents a status check from hanging forever on an
        # unresponsive server; Timeout is a RequestException and is caught below.
        response = requests.get(health_check_url, timeout=30)
        # Check if the request was successful
        if response.status_code == 200:
            return (ModelStatus.READY, response.status_code)
        return (ModelStatus.FAILED, response.status_code)
    except requests.exceptions.RequestException as e:
        return (ModelStatus.FAILED, str(e))
200
+
201
+
202
def load_config() -> list[ModelConfig]:
    """Load the model configuration.

    Loads configuration from default and user-specified paths, merging them
    if both exist. User configuration takes precedence over default values.

    Returns
    -------
    list[ModelConfig]
        List of validated model configurations

    Notes
    -----
    Configuration is loaded from:
    1. Default path: package's config/models.yaml
    2. User path: specified by VEC_INF_CONFIG environment variable

    If user configuration exists, it will be merged with default configuration,
    with user values taking precedence for overlapping fields.
    """
    # Prefer the cached config; otherwise fall back to the packaged file.
    if CACHED_CONFIG.exists():
        default_path = CACHED_CONFIG
    else:
        default_path = Path(__file__).resolve().parent.parent / "config" / "models.yaml"

    with open(default_path) as f:
        config: dict[str, Any] = yaml.safe_load(f) or {}

    user_path = os.getenv("VEC_INF_CONFIG")
    if user_path:
        user_path_obj = Path(user_path)
        if user_path_obj.exists():
            with open(user_path_obj) as f:
                user_config = yaml.safe_load(f) or {}
            # Merge per model: user fields override default fields, and
            # models unknown to the default config are added wholesale.
            models = config.setdefault("models", {})
            for name, data in user_config.get("models", {}).items():
                if name in models:
                    models[name].update(data)
                else:
                    models[name] = data
        else:
            warnings.warn(
                f"WARNING: Could not find user config: {user_path}, revert to default config located at {default_path}",
                UserWarning,
                stacklevel=2,
            )

    return [
        ModelConfig(model_name=name, **model_data)
        for name, model_data in config.get("models", {}).items()
    ]
254
+
255
+
256
def parse_launch_output(output: str) -> tuple[str, dict[str, str]]:
    """Parse output from model launch command.

    Parameters
    ----------
    output : str
        Raw output from the launch command

    Returns
    -------
    tuple[str, dict[str, str]]
        Tuple containing:
        - str: SLURM job ID
        - dict[str, str]: Dictionary of parsed configuration parameters

    Notes
    -----
    Extracts the SLURM job ID and configuration parameters from the launch
    command output. Configuration parameters are parsed from key-value pairs
    in the output text.
    """
    # The job ID is the last whitespace-separated token of the output
    # (the trailing word of sbatch's "Submitted batch job <id>" line).
    slurm_job_id = output.split(" ")[-1].strip().strip("\n")

    # Everything except the final two lines (submission message and the
    # trailing blank) is treated as "Key: value" configuration output.
    config_dict: dict[str, str] = {}
    for line in output.split("\n")[:-2]:
        key, sep, value = line.partition(": ")
        if sep:
            config_dict[key.lower().replace(" ", "_")] = value

    return slurm_job_id, config_dict