PyPI - aissemble-inference-deploy - Versions diffs - 1.5.0rc3__py3-none-any.whl - Mend

aissemble-inference-deploy 1.5.0rc3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

aissemble_inference_deploy/__init__.py ADDED Viewed

@@ -0,0 +1,38 @@
+###
+# #%L
+# aiSSEMBLE::Open Inference Protocol::Modules::deploy
+# %%
+# Copyright (C) 2024 Booz Allen Hamilton Inc.
+# %%
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# #L%
+###
+"""
+aiSSEMBLE OIP Deploy - Deployment tooling for OIP-compatible models.
+This module provides CLI tooling to generate deployment configurations
+for any OIP-compatible model across multiple deployment targets:
+- Local (MLServer)
+- Docker
+- Kubernetes (vanilla)
+- KServe (serverless)
+Custom generators can be added via the 'inference.generators' entry point group.
+"""
+# Package version string.
+# NOTE(review): this wheel is tagged 1.5.0rc3 but the string below reads
+# "1.5.0.dev" - confirm whether it is meant to be rewritten at build time.
+__version__ = "1.5.0.dev"
+# Re-export the core names so they can be imported from the package root.
+from .generators.base import Generator, ModelInfo
+from .registry import GeneratorRegistry
+# Names exposed by ``from aissemble_inference_deploy import *``.
+__all__ = ["Generator", "GeneratorRegistry", "ModelInfo", "__version__"]

aissemble_inference_deploy/cli.py ADDED Viewed

@@ -0,0 +1,278 @@
+###
+# #%L
+# aiSSEMBLE::Open Inference Protocol::Deploy
+# %%
+# Copyright (C) 2024 Booz Allen Hamilton Inc.
+# %%
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# #L%
+###
+"""
+CLI commands for inference-deploy.
+Provides the `inference deploy` command group for generating deployment configurations.
+Generators are discovered via entry points, allowing custom generators to be
+installed as separate packages.
+"""
+from datetime import datetime, timezone
+from pathlib import Path
+import click
+from . import __version__
+from .config import DeployConfig
+from .registry import GeneratorRegistry
+def get_registry() -> GeneratorRegistry:
+    """Get the generator registry instance."""
+    return GeneratorRegistry.instance()
+@click.group()
+@click.version_option(version=__version__)
+def main():
+    """Inference deployment tooling - generate deployment configs for OIP-compatible models."""
+    pass
+@main.group()
+def deploy():
+    """Generate and manage deployment configurations."""
+    pass
+@deploy.command("init")
+@click.option(
+    "--target",
+    "-t",
+    multiple=True,
+    default=None,
+    help="Deployment target(s) to generate configs for. Use 'all' for all targets.",
+)
+@click.option(
+    "--model-dir",
+    "-m",
+    type=click.Path(exists=True, path_type=Path),
+    default=None,
+    help="Path to models directory (default: ./models)",
+)
+@click.option(
+    "--output-dir",
+    "-o",
+    type=click.Path(path_type=Path),
+    default=None,
+    help="Output directory for generated configs (default: ./deploy)",
+)
+@click.option(
+    "--project-dir",
+    "-p",
+    type=click.Path(exists=True, path_type=Path),
+    default=None,
+    help="Project root directory (default: current directory)",
+)
+def init(
+    target: tuple[str, ...] | None,
+    model_dir: Path | None,
+    output_dir: Path | None,
+    project_dir: Path | None,
+):
+    """Initialize deployment configurations for your models.
+    Generates deployment configs in the deploy/ directory for the specified
+    target(s). Use --target all to generate for all available targets.
+    Generators are discovered via entry points, so custom generators can be
+    installed as separate packages.
+    Examples:
+        inference deploy init --target local
+        inference deploy init --target docker --target kubernetes
+        inference deploy init --target all
+    """
+    registry = get_registry()
+    available = registry.list_available()
+    if not available:
+        click.echo("Error: No generators found. Install a generator package or check")
+        click.echo("that aissemble-inference-deploy is installed correctly.")
+        raise SystemExit(1)
+    # Default to 'local' if available, otherwise first available
+    if target is None or len(target) == 0:
+        if "local" in available:
+            targets = ["local"]
+        else:
+            targets = [available[0]]
+    else:
+        targets = list(target)
+    # Expand 'all' to all available targets
+    if "all" in targets:
+        targets = available
+    # Kubernetes depends on Docker - auto-include if not present
+    if "kubernetes" in targets and "docker" not in targets:
+        click.echo("Note: Adding 'docker' target (required by kubernetes)")
+        targets.insert(0, "docker")
+    # KServe depends on Docker - auto-include if not present
+    if "kserve" in targets and "docker" not in targets:
+        click.echo("Note: Adding 'docker' target (required by kserve)")
+        targets.insert(0, "docker")
+    # Validate targets
+    for t in targets:
+        if t not in available and t != "all":
+            click.echo(f"Error: Unknown target '{t}'")
+            click.echo(f"Available targets: {', '.join(available)}")
+            raise SystemExit(1)
+    project_dir = project_dir or Path.cwd()
+    output_dir = output_dir or project_dir / "deploy"
+    # Check if running from wrong directory (inside deploy/)
+    cwd = Path.cwd()
+    if cwd.name == "deploy" and project_dir == cwd:
+        click.echo(
+            "Error: It looks like you're running from inside a deploy/ directory."
+        )
+        click.echo(
+            "Please run from your project root (where pyproject.toml and models/ are)."
+        )
+        click.echo()
+        click.echo("Example:")
+        click.echo("  cd /path/to/your-project")
+        click.echo("  inference deploy init --target docker")
+        raise SystemExit(1)
+    # Check for project root indicators
+    has_pyproject = (project_dir / "pyproject.toml").exists()
+    has_models = (project_dir / "models").exists()
+    if not has_pyproject and not has_models:
+        click.echo(
+            f"Warning: No pyproject.toml or models/ directory found in {project_dir}"
+        )
+        click.echo("Are you running from your project root?")
+        click.echo()
+        if not click.confirm("Continue anyway?"):
+            raise SystemExit(1)
+    # Load or create config
+    config_path = output_dir / ".inference-deploy.yaml"
+    config = DeployConfig.load(config_path)
+    config.generator_version = __version__
+    config.generated_at = datetime.now(timezone.utc).isoformat()
+    click.echo(f"Generating deployment configs in {output_dir}")
+    click.echo(f"Targets: {', '.join(targets)}")
+    click.echo()
+    all_generated_files = []
+    for target_name in targets:
+        generator_cls = registry.get(target_name)
+        if generator_cls is None:
+            click.echo(f"  [{target_name}] Error: Generator not found")
+            continue
+        generator = generator_cls(project_dir, output_dir)
+        # Detect models
+        models_path = model_dir or project_dir / "models"
+        models = generator.detect_models(models_path)
+        if not models:
+            click.echo(f"  [{target_name}] Warning: No models found in {models_path}")
+        else:
+            model_names = ", ".join(m.name for m in models)
+            click.echo(f"  [{target_name}] Found models: {model_names}")
+        # Generate configs
+        generated_files = generator.generate(models)
+        all_generated_files.extend(generated_files)
+        for file_path in generated_files:
+            config.add_file(file_path, target_name, output_dir)
+            rel_path = file_path.relative_to(output_dir)
+            click.echo(f"  [{target_name}] Generated: {rel_path}")
+        if target_name not in config.targets:
+            config.targets.append(target_name)
+    # Save config
+    config.save(config_path)
+    click.echo()
+    click.echo(f"Config saved to {config_path.relative_to(project_dir)}")
+    # Print next steps
+    click.echo()
+    click.echo("Next steps:")
+    if "local" in targets:
+        click.echo("  Local:  cd deploy/local && ./run-mlserver.sh")
+    if "kubernetes" in targets:
+        # Kubernetes workflow: build image, then deploy
+        click.echo("  K8s:    cd deploy/docker && docker-compose build")
+        click.echo("          kubectl apply -k deploy/kubernetes/overlays/dev")
+    elif "docker" in targets:
+        # Docker-only workflow: build and run
+        click.echo("  Docker: cd deploy/docker && docker-compose up --build")
+    if "kserve" in targets:
+        click.echo("  KServe: kubectl apply -f deploy/kserve/serving-runtime.yaml")
+        click.echo("          kubectl apply -f deploy/kserve/inference-service.yaml")
+@deploy.command("list-targets")
+def list_targets():
+    """List available deployment targets.
+    Generators are discovered via entry points. Install additional generator
+    packages to add more targets.
+    """
+    registry = get_registry()
+    available = registry.list_available()
+    if not available:
+        click.echo("No generators found.")
+        click.echo()
+        click.echo(
+            "Install a generator package or check that aissemble-inference-deploy"
+        )
+        click.echo("is installed correctly.")
+        return
+    click.echo("Available deployment targets:")
+    click.echo()
+    for name in available:
+        generator_cls = registry.get(name)
+        # Get description from docstring if available
+        doc = generator_cls.__doc__ if generator_cls else None
+        if doc:
+            # Get first line of docstring
+            desc = doc.strip().split("\n")[0]
+            click.echo(f"  {name:15} - {desc}")
+        else:
+            click.echo(f"  {name}")
+    click.echo()
+    click.echo(
+        "Custom generators can be added via the 'inference.generators' entry point."
+    )
+# Invoke the root click group when this module is executed as a script.
+if __name__ == "__main__":
+    main()

aissemble_inference_deploy/config.py ADDED Viewed

@@ -0,0 +1,182 @@
+###
+# #%L
+# aiSSEMBLE::Open Inference Protocol::Deploy
+# %%
+# Copyright (C) 2024 Booz Allen Hamilton Inc.
+# %%
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# #L%
+###
+"""
+Configuration management for inference-deploy.
+Manages the .inference-deploy.yaml file that tracks generated configs,
+versions, and checksums for update/merge functionality.
+"""
+import hashlib
+import re
+import sys
+from dataclasses import dataclass, field
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Any
+import yaml
+@dataclass
+class GeneratedFile:
+    """Tracks a single generated file."""
+    path: str
+    checksum: str
+    generator: str
+    generated_at: str
+    def __post_init__(self):
+        """Validate checksum format."""
+        if not re.match(r"^[a-f0-9]{64}$", self.checksum):
+            raise ValueError(
+                f"Invalid checksum format (expected SHA256 hex): {self.checksum}"
+            )
+@dataclass
+class DeployConfig:
+    """Configuration stored in .inference-deploy.yaml."""
+    version: str = "1.0"
+    generator_version: str = ""
+    generated_at: str = ""
+    targets: list[str] = field(default_factory=list)
+    files: list[GeneratedFile] = field(default_factory=list)
+    @classmethod
+    def load(cls, path: Path) -> "DeployConfig":
+        """
+        Load config from a YAML file.
+        Args:
+            path: Path to .inference-deploy.yaml file
+        Returns:
+            DeployConfig instance
+        Raises:
+            ValueError: If YAML is malformed
+        """
+        if not path.exists():
+            return cls()
+        try:
+            content = path.read_text(encoding="utf-8")
+            data = yaml.safe_load(content)
+        except yaml.YAMLError as e:
+            raise ValueError(f"Invalid YAML in {path}: {e}")
+        except OSError as e:
+            raise ValueError(f"Cannot read {path}: {e}")
+        if data is None:
+            return cls()
+        if not isinstance(data, dict):
+            raise ValueError(f"Expected dict in {path}, got {type(data).__name__}")
+        # Validate and load files with proper error handling
+        files = []
+        for file_data in data.get("files", []):
+            if not isinstance(file_data, dict):
+                print(
+                    f"Warning: Skipping invalid file entry (not a dict): {file_data}",
+                    file=sys.stderr,
+                )
+                continue
+            try:
+                files.append(GeneratedFile(**file_data))
+            except TypeError as e:
+                print(
+                    f"Warning: Skipping invalid file entry: {e}",
+                    file=sys.stderr,
+                )
+            except ValueError as e:
+                print(
+                    f"Warning: Skipping file entry with invalid checksum: {e}",
+                    file=sys.stderr,
+                )
+        return cls(
+            version=str(data.get("version", "1.0")),
+            generator_version=str(data.get("generator_version", "")),
+            generated_at=str(data.get("generated_at", "")),
+            targets=list(data.get("targets", [])),
+            files=files,
+        )
+    def save(self, path: Path) -> None:
+        """Save config to a YAML file."""
+        data: dict[str, Any] = {
+            "version": self.version,
+            "generator_version": self.generator_version,
+            "generated_at": self.generated_at,
+            "targets": self.targets,
+            "files": [
+                {
+                    "path": f.path,
+                    "checksum": f.checksum,
+                    "generator": f.generator,
+                    "generated_at": f.generated_at,
+                }
+                for f in self.files
+            ],
+        }
+        path.parent.mkdir(parents=True, exist_ok=True)
+        path.write_text(
+            yaml.dump(data, default_flow_style=False, sort_keys=False),
+            encoding="utf-8",
+        )
+    def add_file(self, path: Path, generator: str, base_dir: Path) -> None:
+        """Add or update a tracked file."""
+        rel_path = str(path.relative_to(base_dir))
+        checksum = compute_checksum(path)
+        now = datetime.now(timezone.utc).isoformat()
+        # Update existing or add new
+        for f in self.files:
+            if f.path == rel_path:
+                f.checksum = checksum
+                f.generated_at = now
+                return
+        self.files.append(
+            GeneratedFile(
+                path=rel_path,
+                checksum=checksum,
+                generator=generator,
+                generated_at=now,
+            )
+        )
+    def get_file(self, rel_path: str) -> GeneratedFile | None:
+        """Get a tracked file by its relative path."""
+        for f in self.files:
+            if f.path == rel_path:
+                return f
+        return None
+def compute_checksum(path: Path) -> str:
+    """Compute SHA256 checksum of a file."""
+    return hashlib.sha256(path.read_bytes()).hexdigest()

aissemble_inference_deploy/generators/__init__.py ADDED Viewed

@@ -0,0 +1,36 @@
+###
+# #%L
+# aiSSEMBLE::Open Inference Protocol::Modules::deploy
+# %%
+# Copyright (C) 2024 Booz Allen Hamilton Inc.
+# %%
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# #L%
+###
+"""
+Deployment config generators for different targets.
+"""
+from .base import Generator
+from .docker import DockerGenerator
+from .kserve import KServeGenerator
+from .kubernetes import KubernetesGenerator
+from .local import LocalGenerator
+# Names exposed by ``from <this package> import *``: every class imported
+# from the sibling modules above.
+__all__ = [
+    "Generator",
+    "DockerGenerator",
+    "KServeGenerator",
+    "KubernetesGenerator",
+    "LocalGenerator",
+]