PyPI - dayhoff-tools - Versions diffs - 1.1.10__py3-none-any.whl → 1.13.12__py3-none-any.whl - Mend

dayhoff-tools 1.1.10__py3-none-any.whl → 1.13.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

dayhoff_tools/__init__.py +10 -0
dayhoff_tools/cli/cloud_commands.py +179 -43
dayhoff_tools/cli/engine1/__init__.py +323 -0
dayhoff_tools/cli/engine1/engine_core.py +703 -0
dayhoff_tools/cli/engine1/engine_lifecycle.py +136 -0
dayhoff_tools/cli/engine1/engine_maintenance.py +431 -0
dayhoff_tools/cli/engine1/engine_management.py +505 -0
dayhoff_tools/cli/engine1/shared.py +501 -0
dayhoff_tools/cli/engine1/studio_commands.py +825 -0
dayhoff_tools/cli/engines_studios/__init__.py +6 -0
dayhoff_tools/cli/engines_studios/api_client.py +351 -0
dayhoff_tools/cli/engines_studios/auth.py +144 -0
dayhoff_tools/cli/engines_studios/engine-studio-cli.md +1230 -0
dayhoff_tools/cli/engines_studios/engine_commands.py +1151 -0
dayhoff_tools/cli/engines_studios/progress.py +260 -0
dayhoff_tools/cli/engines_studios/simulators/cli-simulators.md +151 -0
dayhoff_tools/cli/engines_studios/simulators/demo.sh +75 -0
dayhoff_tools/cli/engines_studios/simulators/engine_list_simulator.py +319 -0
dayhoff_tools/cli/engines_studios/simulators/engine_status_simulator.py +369 -0
dayhoff_tools/cli/engines_studios/simulators/idle_status_simulator.py +476 -0
dayhoff_tools/cli/engines_studios/simulators/simulator_utils.py +180 -0
dayhoff_tools/cli/engines_studios/simulators/studio_list_simulator.py +374 -0
dayhoff_tools/cli/engines_studios/simulators/studio_status_simulator.py +164 -0
dayhoff_tools/cli/engines_studios/studio_commands.py +755 -0
dayhoff_tools/cli/main.py +106 -7
dayhoff_tools/cli/utility_commands.py +896 -179
dayhoff_tools/deployment/base.py +70 -6
dayhoff_tools/deployment/deploy_aws.py +165 -25
dayhoff_tools/deployment/deploy_gcp.py +78 -5
dayhoff_tools/deployment/deploy_utils.py +20 -7
dayhoff_tools/deployment/job_runner.py +9 -4
dayhoff_tools/deployment/processors.py +230 -418
dayhoff_tools/deployment/swarm.py +47 -12
dayhoff_tools/embedders.py +28 -26
dayhoff_tools/fasta.py +181 -64
dayhoff_tools/warehouse.py +268 -1
{dayhoff_tools-1.1.10.dist-info → dayhoff_tools-1.13.12.dist-info}/METADATA +20 -5
dayhoff_tools-1.13.12.dist-info/RECORD +54 -0
{dayhoff_tools-1.1.10.dist-info → dayhoff_tools-1.13.12.dist-info}/WHEEL +1 -1
dayhoff_tools-1.1.10.dist-info/RECORD +0 -32
{dayhoff_tools-1.1.10.dist-info → dayhoff_tools-1.13.12.dist-info}/entry_points.txt +0 -0

dayhoff_tools/cli/engines_studios/__init__.py ADDED Viewed

@@ -0,0 +1,6 @@
+"""Engine and Studio CLI commands."""
+from .engine_commands import engine_cli
+from .studio_commands import studio_cli
+__all__ = ["engine_cli", "studio_cli"]

dayhoff_tools/cli/engines_studios/api_client.py ADDED Viewed

@@ -0,0 +1,351 @@
+"""API client for Studio Manager API."""
+import os
+from typing import Any, Dict, Optional
+import boto3
+import click
+import requests
+from botocore.exceptions import ClientError, NoCredentialsError, TokenRetrievalError
+class StudioManagerClient:
+    """Client for Studio Manager API v2."""
+    def __init__(self, api_url: Optional[str] = None, environment: str = "dev"):
+        """Initialize the client and resolve the API base URL.
+        The URL is taken from, in order: the ``api_url`` argument, the
+        ``STUDIO_MANAGER_API_URL`` environment variable, and finally the SSM
+        parameter ``/{environment}/studio-manager/api-url``.
+        Args:
+            api_url: Optional API URL; when given, no environment or SSM lookup is done
+            environment: Environment name (dev, sand, prod)
+        Raises:
+            click.ClickException: If authentication fails or API URL cannot be fetched
+        """
+        # The error messages below tell the user to set STUDIO_MANAGER_API_URL
+        # to bypass SSM, so that override has to be honored here; an explicit
+        # argument still wins over the environment variable.
+        self.api_url = api_url or os.environ.get("STUDIO_MANAGER_API_URL")
+        self.environment = environment
+        if not self.api_url:
+            # Fetch from SSM Parameter Store
+            param_name = f"/{environment}/studio-manager/api-url"
+            try:
+                ssm = boto3.client("ssm")
+                param = ssm.get_parameter(Name=param_name)
+                self.api_url = param["Parameter"]["Value"]
+            except NoCredentialsError as e:
+                raise click.ClickException(
+                    f"✗ Not authenticated to AWS\n\n"
+                    f"Cannot fetch API URL from {param_name}\n\n"
+                    f"Please authenticate:\n"
+                    f"  dh aws login --profile <profile-name>"
+                ) from e
+            except TokenRetrievalError as e:
+                # SSO token retrieval errors - most common case for expired SSO sessions
+                error_msg = str(e)
+                if "Token has expired" in error_msg and "refresh failed" in error_msg:
+                    raise click.ClickException(
+                        f"✗ AWS SSO token has expired\n\n"
+                        f"Cannot fetch API URL from {param_name}\n\n"
+                        f"Please refresh your AWS SSO session:\n"
+                        f"  dh aws login --profile <profile-name>"
+                    ) from e
+                # Other token retrieval errors
+                raise click.ClickException(
+                    f"✗ AWS SSO token error\n\n"
+                    f"Cannot fetch API URL from {param_name}\n\n"
+                    f"Error: {error_msg}\n\n"
+                    f"Please refresh your AWS SSO session:\n"
+                    f"  dh aws login --profile <profile-name>"
+                ) from e
+            except ClientError as e:
+                error_code = e.response.get("Error", {}).get("Code", "")
+                error_msg = str(e)
+                # SSO token error - checked first because the generic "expired"
+                # test below would also match it and give a less specific hint
+                if "Token has expired" in error_msg and "refresh failed" in error_msg:
+                    raise click.ClickException(
+                        f"✗ AWS SSO token has expired\n\n"
+                        f"Cannot fetch API URL from {param_name}\n\n"
+                        f"Please refresh your AWS SSO session:\n"
+                        f"  dh aws login --profile <profile-name>"
+                    ) from e
+                # Auth/token errors (generic)
+                if "ExpiredToken" in error_code or "expired" in error_msg.lower():
+                    raise click.ClickException(
+                        f"✗ AWS credentials have expired\n\n"
+                        f"Cannot fetch API URL from {param_name}\n\n"
+                        f"Please refresh your credentials:\n"
+                        f"  dh aws login --profile <profile-name>"
+                    ) from e
+                # Parameter not found
+                if error_code == "ParameterNotFound":
+                    raise click.ClickException(
+                        f"✗ API URL parameter not found: {param_name}\n\n"
+                        f"This usually means the infrastructure is not deployed in the '{environment}' environment.\n\n"
+                        f"Try:\n"
+                        f"  • Check if the environment name is correct (--env {environment})\n"
+                        f"  • Verify the infrastructure is deployed\n"
+                        f"  • Contact your admin if you're unsure"
+                    ) from e
+                # Generic error
+                raise click.ClickException(
+                    f"✗ Could not fetch API URL from {param_name}\n\n"
+                    f"Error: {error_msg}\n\n"
+                    f"Set STUDIO_MANAGER_API_URL environment variable to bypass SSM lookup"
+                ) from e
+            except Exception as e:
+                # Last-resort boundary: surface anything unexpected as a CLI error
+                raise click.ClickException(
+                    f"✗ Unexpected error fetching API URL from {param_name}\n\n"
+                    f"Error: {e}\n\n"
+                    f"Set STUDIO_MANAGER_API_URL environment variable to bypass SSM lookup"
+                ) from e
+    def _request(self, method: str, path: str, **kwargs) -> Dict[str, Any]:
+        """Make an HTTP request to the API and return the decoded JSON body.
+        Args:
+            method: HTTP method
+            path: API path, appended verbatim to ``self.api_url``
+            **kwargs: Additional arguments for ``requests.request``; an explicit
+                ``timeout`` overrides the default applied here
+        Returns:
+            Response JSON, or an empty dict when a successful response has no body
+        Raises:
+            RuntimeError: If the response status is an error (``response.ok`` is
+                false); the message is the API's ``error`` field when present,
+                otherwise the raw body or ``HTTP <status>``
+        """
+        # requests waits indefinitely unless a timeout is given, which would
+        # hang the CLI on an unresponsive endpoint. Values are (connect, read)
+        # seconds; callers with slower operations can pass their own timeout.
+        kwargs.setdefault("timeout", (10, 120))
+        url = f"{self.api_url}{path}"
+        response = requests.request(method, url, **kwargs)
+        if not response.ok:
+            fallback = response.text or f"HTTP {response.status_code}"
+            try:
+                error_body = response.json()
+            except ValueError:
+                # Body is not JSON (e.g. an HTML gateway error page)
+                error_body = None
+            error_message = None
+            if isinstance(error_body, dict):
+                error_message = error_body.get("error")
+            # Never raise with an empty message: fall back to body text/status
+            raise RuntimeError(error_message or fallback)
+        if not response.content:
+            # A successful reply with no body would make .json() raise
+            return {}
+        return response.json()
+    # Engine operations
+    def list_engines(self) -> Dict[str, Any]:
+        """List all engines.
+        Returns:
+            Parsed JSON body of ``GET /engines``.
+        Raises:
+            RuntimeError: If the API responds with an error status.
+        """
+        return self._request("GET", "/engines")
+    def get_engine_readiness(self, engine_id: str) -> Dict[str, Any]:
+        """Get engine readiness status with progress.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``GET /engines/{engine_id}/readiness``.
+        Raises:
+            RuntimeError: If the API responds with an error status.
+        """
+        return self._request("GET", f"/engines/{engine_id}/readiness")
+    def get_engine_status(self, engine_id: str) -> Dict[str, Any]:
+        """Get comprehensive engine status including idle state.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``GET /engines/{engine_id}``.
+        Raises:
+            RuntimeError: If the API responds with an error status.
+        """
+        return self._request("GET", f"/engines/{engine_id}")
+    def launch_engine(
+        self,
+        name: str,
+        user: str,
+        engine_type: str,
+        boot_disk_size: Optional[int] = None,
+    ) -> Dict[str, Any]:
+        """Request a new engine via ``POST /engines``.
+        Args:
+            name: Name for the new engine.
+            user: Owner of the engine.
+            engine_type: Engine type sent to the API as ``engine_type``.
+            boot_disk_size: Optional boot disk size; only sent when truthy.
+        Returns:
+            Parsed JSON body of the API response.
+        """
+        # A falsy size (None or 0) is left out so the API applies its default.
+        disk_fields = {"boot_disk_size": boot_disk_size} if boot_disk_size else {}
+        request_body = {
+            "name": name,
+            "user": user,
+            "engine_type": engine_type,
+            **disk_fields,
+        }
+        return self._request("POST", "/engines", json=request_body)
+    def terminate_engine(self, engine_id: str) -> Dict[str, Any]:
+        """Terminate an engine.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``DELETE /engines/{engine_id}``.
+        """
+        return self._request("DELETE", f"/engines/{engine_id}")
+    def start_engine(self, engine_id: str) -> Dict[str, Any]:
+        """Start a stopped engine.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``POST /engines/{engine_id}/start``.
+        """
+        return self._request("POST", f"/engines/{engine_id}/start")
+    def stop_engine(self, engine_id: str) -> Dict[str, Any]:
+        """Stop a running engine.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``POST /engines/{engine_id}/stop``.
+        """
+        return self._request("POST", f"/engines/{engine_id}/stop")
+    def resize_engine(
+        self, engine_id: str, size_gb: int, online: bool = False
+    ) -> Dict[str, Any]:
+        """Resize engine boot disk.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+            size_gb: Requested size, sent as ``size_gb`` in the JSON body.
+            online: Sent as ``online`` in the JSON body; defaults to False.
+        Returns:
+            Parsed JSON body of ``POST /engines/{engine_id}/resize``.
+        """
+        return self._request(
+            "POST",
+            f"/engines/{engine_id}/resize",
+            json={"size_gb": size_gb, "online": online},
+        )
+    def set_coffee(self, engine_id: str, duration: str) -> Dict[str, Any]:
+        """Set coffee lock (keep-alive) for engine.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+            duration: Lock duration, passed through unchanged as ``duration``.
+        Returns:
+            Parsed JSON body of ``POST /engines/{engine_id}/coffee``.
+        """
+        return self._request(
+            "POST", f"/engines/{engine_id}/coffee", json={"duration": duration}
+        )
+    def cancel_coffee(self, engine_id: str) -> Dict[str, Any]:
+        """Cancel coffee lock for engine.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``DELETE /engines/{engine_id}/coffee``.
+        """
+        return self._request("DELETE", f"/engines/{engine_id}/coffee")
+    def update_idle_settings(
+        self, engine_id: str, timeout: Optional[str] = None, slack: Optional[str] = None
+    ) -> Dict[str, Any]:
+        """Patch the idle detector settings of an engine.
+        Args:
+            engine_id: Engine identifier, interpolated into the request path.
+            timeout: New ``timeout`` value; omitted from the request when falsy.
+            slack: New ``slack`` value; omitted from the request when falsy.
+        Returns:
+            Parsed JSON body of ``PATCH /engines/{engine_id}/idle-settings``.
+        """
+        requested = (("timeout", timeout), ("slack", slack))
+        # Only settings the caller actually supplied are sent to the API.
+        changes = {field: value for field, value in requested if value}
+        endpoint = f"/engines/{engine_id}/idle-settings"
+        return self._request("PATCH", endpoint, json=changes)
+    # Studio operations
+    def list_studios(self) -> Dict[str, Any]:
+        """List all studios.
+        Returns:
+            Parsed JSON body of ``GET /studios``.
+        """
+        return self._request("GET", "/studios")
+    def get_studio(self, studio_id: str) -> Dict[str, Any]:
+        """Get studio information.
+        Args:
+            studio_id: Studio identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``GET /studios/{studio_id}``.
+        """
+        return self._request("GET", f"/studios/{studio_id}")
+    def create_studio(self, user: str, size_gb: int = 100) -> Dict[str, Any]:
+        """Create a new studio.
+        Args:
+            user: Owner of the studio, sent as ``user`` in the JSON body.
+            size_gb: Requested size, sent as ``size_gb``; defaults to 100.
+        Returns:
+            Parsed JSON body of ``POST /studios``.
+        """
+        return self._request(
+            "POST", "/studios", json={"user": user, "size_gb": size_gb}
+        )
+    def delete_studio(self, studio_id: str) -> Dict[str, Any]:
+        """Delete a studio.
+        Args:
+            studio_id: Studio identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``DELETE /studios/{studio_id}``.
+        """
+        return self._request("DELETE", f"/studios/{studio_id}")
+    def resize_studio(self, studio_id: str, size_gb: int) -> Dict[str, Any]:
+        """Resize a studio volume.
+        Args:
+            studio_id: Studio identifier, interpolated into the request path.
+            size_gb: Requested size, sent as ``size_gb`` in the JSON body.
+        Returns:
+            Parsed JSON body of ``POST /studios/{studio_id}/resize``.
+        """
+        return self._request(
+            "POST", f"/studios/{studio_id}/resize", json={"size_gb": size_gb}
+        )
+    def reset_studio(self, studio_id: str) -> Dict[str, Any]:
+        """Reset a stuck studio to available status.
+        Args:
+            studio_id: Studio identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``POST /studios/{studio_id}/reset``.
+        """
+        return self._request("POST", f"/studios/{studio_id}/reset")
+    # Attachment operations
+    def attach_studio(
+        self, studio_id: str, engine_id: str, user: str
+    ) -> Dict[str, Any]:
+        """Initiate studio attachment.
+        Args:
+            studio_id: Studio identifier, interpolated into the request path.
+            engine_id: Target engine, sent as ``engine_id`` in the JSON body.
+            user: Sent as ``user`` in the JSON body.
+        Returns:
+            Parsed JSON body of ``POST /studios/{studio_id}/attach``.
+        """
+        return self._request(
+            "POST",
+            f"/studios/{studio_id}/attach",
+            json={"engine_id": engine_id, "user": user},
+        )
+    def detach_studio(self, studio_id: str) -> Dict[str, Any]:
+        """Detach a studio.
+        Args:
+            studio_id: Studio identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``POST /studios/{studio_id}/detach``.
+        """
+        return self._request("POST", f"/studios/{studio_id}/detach")
+    def get_attachment_progress(self, operation_id: str) -> Dict[str, Any]:
+        """Get attachment operation progress.
+        Args:
+            operation_id: Operation identifier, interpolated into the request path.
+        Returns:
+            Parsed JSON body of ``GET /operations/{operation_id}``.
+        """
+        return self._request("GET", f"/operations/{operation_id}")
+    # Helper methods
+    def check_instance_status(self, instance_id: str) -> Dict[str, Any]:
+        """Report an EC2 instance's state together with its status checks.
+        Args:
+            instance_id: EC2 instance ID
+        Returns:
+            On success, a dict with:
+                - state: Instance state name as reported by EC2
+                - instance_status: Instance status check, "initializing" when
+                  EC2 returns no status entry yet, None when not running
+                - system_status: System status check, same conventions
+                - reachable: True only if both checks are "ok"
+            On failure, ``{"error": <message>}`` (no reservations returned, or
+            a botocore ``ClientError``).
+        """
+        def snapshot(state, instance_check, system_check, reachable=False):
+            # Single place that fixes the shape of the success payload.
+            return {
+                "state": state,
+                "instance_status": instance_check,
+                "system_status": system_check,
+                "reachable": reachable,
+            }
+        ec2 = boto3.client("ec2")
+        try:
+            reservations = ec2.describe_instances(InstanceIds=[instance_id])[
+                "Reservations"
+            ]
+            if not reservations:
+                return {"error": "Instance not found"}
+            state = reservations[0]["Instances"][0]["State"]["Name"]
+            # Status checks are only queried once the instance is running
+            if state != "running":
+                return snapshot(state, None, None)
+            checks = ec2.describe_instance_status(
+                InstanceIds=[instance_id],
+                IncludeAllInstances=False,  # Only get running instances
+            )["InstanceStatuses"]
+            if not checks:
+                # No status entry yet - treated as still initializing
+                return snapshot(state, "initializing", "initializing")
+            instance_check = checks[0]["InstanceStatus"]["Status"]
+            system_check = checks[0]["SystemStatus"]["Status"]
+            both_ok = instance_check == "ok" and system_check == "ok"
+            return snapshot(state, instance_check, system_check, both_ok)
+        except ClientError as e:
+            return {"error": str(e)}
+    def get_engine_by_name(self, name: str) -> Optional[Dict[str, Any]]:
+        """Look up an engine by its exact name.
+        Args:
+            name: Engine name to match against each engine's ``name`` field
+        Returns:
+            The first matching engine dict from ``list_engines()``, or None
+        """
+        listing = self.list_engines().get("engines", [])
+        # First match wins; the generator stops scanning as soon as it is found.
+        return next((entry for entry in listing if entry["name"] == name), None)
+    def get_my_studio(self) -> Optional[Dict[str, Any]]:
+        """Return the studio owned by the current AWS identity.
+        Returns:
+            The first studio from ``list_studios()`` whose ``user`` equals the
+            name returned by ``get_aws_username()``, or None
+        Raises:
+            RuntimeError: If not authenticated to AWS
+        """
+        from .auth import get_aws_username
+        # Resolve the identity first so an auth failure surfaces before any API call.
+        owner = get_aws_username()
+        listing = self.list_studios().get("studios", [])
+        return next((entry for entry in listing if entry["user"] == owner), None)

dayhoff_tools/cli/engines_studios/auth.py ADDED Viewed

@@ -0,0 +1,144 @@
+"""AWS authentication and identity helpers."""
+import boto3
+import click
+from botocore.exceptions import ClientError, NoCredentialsError, TokenRetrievalError
+def detect_aws_environment() -> str:
+    """Map the caller's AWS account ID to an environment name.
+    Returns:
+        Environment name: "dev", "sand", or "prod"
+    Raises:
+        click.ClickException: If the STS identity call fails or the account
+            ID is not one of the known accounts
+    """
+    try:
+        account_id = boto3.client("sts").get_caller_identity()["Account"]
+    except (NoCredentialsError, ClientError, TokenRetrievalError) as e:
+        raise click.ClickException(
+            "✗ Could not detect AWS environment\n\n"
+            "Please authenticate first or specify --env explicitly:\n"
+            "  dh aws login --profile <profile-name>"
+        ) from e
+    # Map account IDs to environments (from aws_config)
+    known_accounts = {
+        "074735440724": "dev",
+        "006207983460": "sand",
+        "011117009798": "prod",
+    }
+    env = known_accounts.get(account_id)
+    if env:
+        return env
+    raise click.ClickException(
+        f"✗ Unknown AWS account: {account_id}\n\n"
+        f"This account is not recognized as dev, sand, or prod.\n"
+        f"Please specify --env explicitly."
+    )
+def check_aws_auth() -> None:
+    """Verify AWS credentials up front with an STS identity call.
+    Intended to run before other AWS API calls so that a missing or expired
+    login produces one clear, actionable message.
+    Raises:
+        click.ClickException: If the identity call fails, with instructions
+            matching the failure (no credentials, expired SSO token, expired
+            credentials, or a generic authentication error)
+    """
+    sso_expired_text = (
+        "✗ AWS SSO token has expired\n\n"
+        "Please refresh your AWS SSO session:\n"
+        "  dh aws login --profile <profile-name>"
+    )
+    def sso_session_expired(detail: str) -> bool:
+        # Both markers must be present in the error text for the SSO-expiry case.
+        return "Token has expired" in detail and "refresh failed" in detail
+    try:
+        boto3.client("sts").get_caller_identity()
+    except NoCredentialsError:
+        raise click.ClickException(
+            "✗ Not authenticated to AWS\n\n"
+            "Please authenticate using one of these methods:\n"
+            "  • dh aws login --profile <profile-name>\n"
+            "  • aws sso login --profile <profile-name>\n"
+            "  • export AWS_PROFILE=<profile-name> && aws sso login"
+        )
+    except TokenRetrievalError as e:
+        # Raised while retrieving the SSO token itself
+        detail = str(e)
+        if sso_session_expired(detail):
+            raise click.ClickException(sso_expired_text)
+        raise click.ClickException(
+            f"✗ AWS SSO token error\n\n"
+            f"Error: {detail}\n\n"
+            f"Please refresh your AWS SSO session:\n"
+            f"  dh aws login --profile <profile-name>"
+        )
+    except ClientError as e:
+        code = e.response.get("Error", {}).get("Code", "")
+        detail = str(e)
+        # Most specific case first: the generic "expired" test would match it too
+        if sso_session_expired(detail):
+            raise click.ClickException(sso_expired_text)
+        if "ExpiredToken" in code or "expired" in detail.lower():
+            raise click.ClickException(
+                "✗ AWS credentials have expired\n\n"
+                "Please refresh your credentials:\n"
+                "  dh aws login --profile <profile-name>"
+            )
+        # Anything else is reported as a generic authentication failure
+        raise click.ClickException(
+            f"✗ AWS authentication error\n\n"
+            f"Error: {detail}\n\n"
+            f"Try refreshing your credentials:\n"
+            f"  dh aws login --profile <profile-name>"
+        )
+def get_aws_username() -> str:
+    """Derive a username from the AWS STS caller identity.
+    For an assumed-role ARN the username is the last ``/``-separated component;
+    otherwise it is the last ``:``-separated component of ``UserId``.
+    Returns:
+        Username from AWS identity
+    Raises:
+        RuntimeError: If not authenticated to AWS
+    """
+    try:
+        identity = boto3.client("sts").get_caller_identity()
+        arn = identity["Arn"]
+        # Assumed-role ARN format:
+        # arn:aws:sts::123456789012:assumed-role/AWSReservedSSO_DeveloperAccess_xxxx/username
+        if "assumed-role" in arn:
+            source, separator = arn, "/"
+        else:
+            # Other auth methods - use last part of UserId
+            source, separator = identity["UserId"], ":"
+        return source.split(separator)[-1]
+    except (NoCredentialsError, ClientError, TokenRetrievalError) as e:
+        raise RuntimeError(
+            "Not authenticated to AWS. " "Run: dh aws login --profile <profile-name>"
+        ) from e

dayhoff-tools 1.1.10__py3-none-any.whl → 1.13.12__py3-none-any.whl

dayhoff-tools 1.1.10__py3-none-any.whl → 1.13.12__py3-none-any.whl