PyPI - tetra-rp - Versions diffs - 0.6.0__py3-none-any.whl → 0.24.0__py3-none-any.whl - Mend

tetra-rp 0.6.0__py3-none-any.whl → 0.24.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (97) hide show

tetra_rp/__init__.py +109 -19
tetra_rp/cli/commands/__init__.py +1 -0
tetra_rp/cli/commands/apps.py +143 -0
tetra_rp/cli/commands/build.py +1082 -0
tetra_rp/cli/commands/build_utils/__init__.py +1 -0
tetra_rp/cli/commands/build_utils/handler_generator.py +176 -0
tetra_rp/cli/commands/build_utils/lb_handler_generator.py +309 -0
tetra_rp/cli/commands/build_utils/manifest.py +430 -0
tetra_rp/cli/commands/build_utils/mothership_handler_generator.py +75 -0
tetra_rp/cli/commands/build_utils/scanner.py +596 -0
tetra_rp/cli/commands/deploy.py +580 -0
tetra_rp/cli/commands/init.py +123 -0
tetra_rp/cli/commands/resource.py +108 -0
tetra_rp/cli/commands/run.py +296 -0
tetra_rp/cli/commands/test_mothership.py +458 -0
tetra_rp/cli/commands/undeploy.py +533 -0
tetra_rp/cli/main.py +97 -0
tetra_rp/cli/utils/__init__.py +1 -0
tetra_rp/cli/utils/app.py +15 -0
tetra_rp/cli/utils/conda.py +127 -0
tetra_rp/cli/utils/deployment.py +530 -0
tetra_rp/cli/utils/ignore.py +143 -0
tetra_rp/cli/utils/skeleton.py +184 -0
tetra_rp/cli/utils/skeleton_template/.env.example +4 -0
tetra_rp/cli/utils/skeleton_template/.flashignore +40 -0
tetra_rp/cli/utils/skeleton_template/.gitignore +44 -0
tetra_rp/cli/utils/skeleton_template/README.md +263 -0
tetra_rp/cli/utils/skeleton_template/main.py +44 -0
tetra_rp/cli/utils/skeleton_template/mothership.py +55 -0
tetra_rp/cli/utils/skeleton_template/pyproject.toml +58 -0
tetra_rp/cli/utils/skeleton_template/requirements.txt +1 -0
tetra_rp/cli/utils/skeleton_template/workers/__init__.py +0 -0
tetra_rp/cli/utils/skeleton_template/workers/cpu/__init__.py +19 -0
tetra_rp/cli/utils/skeleton_template/workers/cpu/endpoint.py +36 -0
tetra_rp/cli/utils/skeleton_template/workers/gpu/__init__.py +19 -0
tetra_rp/cli/utils/skeleton_template/workers/gpu/endpoint.py +61 -0
tetra_rp/client.py +136 -33
tetra_rp/config.py +29 -0
tetra_rp/core/api/runpod.py +591 -39
tetra_rp/core/deployment.py +232 -0
tetra_rp/core/discovery.py +425 -0
tetra_rp/core/exceptions.py +50 -0
tetra_rp/core/resources/__init__.py +27 -9
tetra_rp/core/resources/app.py +738 -0
tetra_rp/core/resources/base.py +139 -4
tetra_rp/core/resources/constants.py +21 -0
tetra_rp/core/resources/cpu.py +115 -13
tetra_rp/core/resources/gpu.py +182 -16
tetra_rp/core/resources/live_serverless.py +153 -16
tetra_rp/core/resources/load_balancer_sls_resource.py +440 -0
tetra_rp/core/resources/network_volume.py +126 -31
tetra_rp/core/resources/resource_manager.py +436 -35
tetra_rp/core/resources/serverless.py +537 -120
tetra_rp/core/resources/serverless_cpu.py +201 -0
tetra_rp/core/resources/template.py +1 -59
tetra_rp/core/utils/constants.py +10 -0
tetra_rp/core/utils/file_lock.py +260 -0
tetra_rp/core/utils/http.py +67 -0
tetra_rp/core/utils/lru_cache.py +75 -0
tetra_rp/core/utils/singleton.py +36 -1
tetra_rp/core/validation.py +44 -0
tetra_rp/execute_class.py +301 -0
tetra_rp/protos/remote_execution.py +98 -9
tetra_rp/runtime/__init__.py +1 -0
tetra_rp/runtime/circuit_breaker.py +274 -0
tetra_rp/runtime/config.py +12 -0
tetra_rp/runtime/exceptions.py +49 -0
tetra_rp/runtime/generic_handler.py +206 -0
tetra_rp/runtime/lb_handler.py +189 -0
tetra_rp/runtime/load_balancer.py +160 -0
tetra_rp/runtime/manifest_fetcher.py +192 -0
tetra_rp/runtime/metrics.py +325 -0
tetra_rp/runtime/models.py +73 -0
tetra_rp/runtime/mothership_provisioner.py +512 -0
tetra_rp/runtime/production_wrapper.py +266 -0
tetra_rp/runtime/reliability_config.py +149 -0
tetra_rp/runtime/retry_manager.py +118 -0
tetra_rp/runtime/serialization.py +124 -0
tetra_rp/runtime/service_registry.py +346 -0
tetra_rp/runtime/state_manager_client.py +248 -0
tetra_rp/stubs/live_serverless.py +35 -17
tetra_rp/stubs/load_balancer_sls.py +357 -0
tetra_rp/stubs/registry.py +145 -19
{tetra_rp-0.6.0.dist-info → tetra_rp-0.24.0.dist-info}/METADATA +398 -60
tetra_rp-0.24.0.dist-info/RECORD +99 -0
{tetra_rp-0.6.0.dist-info → tetra_rp-0.24.0.dist-info}/WHEEL +1 -1
tetra_rp-0.24.0.dist-info/entry_points.txt +2 -0
tetra_rp/core/pool/cluster_manager.py +0 -177
tetra_rp/core/pool/dataclass.py +0 -18
tetra_rp/core/pool/ex.py +0 -38
tetra_rp/core/pool/job.py +0 -22
tetra_rp/core/pool/worker.py +0 -19
tetra_rp/core/resources/utils.py +0 -50
tetra_rp/core/utils/json.py +0 -33
tetra_rp-0.6.0.dist-info/RECORD +0 -39
/tetra_rp/{core/pool → cli}/__init__.py +0 -0
{tetra_rp-0.6.0.dist-info → tetra_rp-0.24.0.dist-info}/top_level.txt +0 -0

tetra_rp/cli/commands/resource.py ADDED Viewed

@@ -0,0 +1,108 @@
+"""Resource management commands."""
+import time
+import typer
+from rich.console import Console
+from rich.table import Table
+from rich.panel import Panel
+from rich.live import Live
+from ...core.resources.resource_manager import ResourceManager
+console = Console()
+def report_command(
+    live: bool = typer.Option(False, "--live", "-l", help="Live updating status"),
+    refresh: int = typer.Option(
+        2, "--refresh", "-r", help="Refresh interval for live mode"
+    ),
+):
+    """Show resource status dashboard."""
+    resource_manager = ResourceManager()
+    if live:
+        try:
+            with Live(
+                generate_resource_table(resource_manager),
+                console=console,
+                refresh_per_second=1 / refresh,
+                screen=True,
+            ) as live_display:
+                while True:
+                    time.sleep(refresh)
+                    live_display.update(generate_resource_table(resource_manager))
+        except KeyboardInterrupt:
+            console.print("\n📊 Live monitoring stopped")
+    else:
+        table = generate_resource_table(resource_manager)
+        console.print(table)
+def generate_resource_table(resource_manager: ResourceManager) -> Panel:
+    """Generate a formatted table of resources."""
+    resources = resource_manager._resources
+    if not resources:
+        return Panel(
+            "📊 No resources currently tracked\n\n"
+            "Resources will appear here after running your Tetra applications.",
+            title="Resource Status Report",
+            expand=False,
+        )
+    table = Table(title="Resource Status Report")
+    table.add_column("Resource ID", style="cyan", no_wrap=True)
+    table.add_column("Status", justify="center")
+    table.add_column("Type", style="magenta")
+    table.add_column("URL", style="blue")
+    table.add_column("Health", justify="center")
+    active_count = 0
+    error_count = 0
+    for uid, resource in resources.items():
+        # Determine status
+        try:
+            is_deployed = resource.is_deployed()
+            if is_deployed:
+                status = "🟢 Active"
+                active_count += 1
+            else:
+                status = "🔴 Inactive"
+                error_count += 1
+        except Exception:
+            status = "🟡 Unknown"
+        # Get resource info
+        resource_type = resource.__class__.__name__
+        try:
+            url = resource.url if hasattr(resource, "url") else "N/A"
+        except Exception:
+            url = "N/A"
+        # Health check (simplified for now)
+        health = "✓" if status == "🟢 Active" else "✗"
+        table.add_row(
+            uid[:20] + "..." if len(uid) > 20 else uid,
+            status,
+            resource_type,
+            url,
+            health,
+        )
+    # Summary
+    total = len(resources)
+    idle_count = total - active_count - error_count
+    summary = f"Total: {total} resources ({active_count} active"
+    if idle_count > 0:
+        summary += f", {idle_count} idle"
+    if error_count > 0:
+        summary += f", {error_count} error"
+    summary += ")"
+    return Panel(table, subtitle=summary, expand=False)

tetra_rp/cli/commands/run.py ADDED Viewed

@@ -0,0 +1,296 @@
+"""Run Flash development server."""
+import logging
+import os
+import signal
+import subprocess
+import sys
+from pathlib import Path
+from typing import Optional
+import questionary
+import typer
+from rich.console import Console
+logger = logging.getLogger(__name__)
+console = Console()
+def run_command(
+    host: str = typer.Option(
+        "localhost",
+        "--host",
+        envvar="FLASH_HOST",
+        help="Host to bind to (env: FLASH_HOST)",
+    ),
+    port: int = typer.Option(
+        8888,
+        "--port",
+        "-p",
+        envvar="FLASH_PORT",
+        help="Port to bind to (env: FLASH_PORT)",
+    ),
+    reload: bool = typer.Option(
+        True, "--reload/--no-reload", help="Enable auto-reload"
+    ),
+    auto_provision: bool = typer.Option(
+        False,
+        "--auto-provision",
+        help="Auto-provision deployable resources on startup",
+    ),
+):
+    """Run Flash development server with uvicorn."""
+    # Discover entry point
+    entry_point = discover_entry_point()
+    if not entry_point:
+        console.print("[red]Error:[/red] No entry point found")
+        console.print("Create main.py with a FastAPI app")
+        raise typer.Exit(1)
+    # Check if entry point has FastAPI app
+    app_location = check_fastapi_app(entry_point)
+    if not app_location:
+        console.print(f"[red]Error:[/red] No FastAPI app found in {entry_point}")
+        console.print("Make sure your main.py contains: app = FastAPI()")
+        raise typer.Exit(1)
+    # Set flag for all flash run sessions to ensure both auto-provisioned
+    # and on-the-fly provisioned resources get the live- prefix
+    if not _is_reload():
+        os.environ["FLASH_IS_LIVE_PROVISIONING"] = "true"
+    # Auto-provision resources if flag is set and not a reload
+    if auto_provision and not _is_reload():
+        try:
+            resources = _discover_resources(entry_point)
+            if resources:
+                # If many resources found, ask for confirmation
+                if len(resources) > 5:
+                    if not _confirm_large_provisioning(resources):
+                        console.print("[yellow]Auto-provisioning cancelled[/yellow]\n")
+                    else:
+                        _provision_resources(resources)
+                else:
+                    _provision_resources(resources)
+        except Exception as e:
+            logger.error("Auto-provisioning failed", exc_info=True)
+            console.print(
+                f"[yellow]Warning:[/yellow] Resource provisioning failed: {e}"
+            )
+            console.print(
+                "[yellow]Note:[/yellow] Resources will be deployed on-demand when first called"
+            )
+    console.print("\n[green]Starting Flash Server[/green]")
+    console.print(f"Entry point: [bold]{app_location}[/bold]")
+    console.print(f"Server: [bold]http://{host}:{port}[/bold]")
+    console.print(f"Auto-reload: [bold]{'enabled' if reload else 'disabled'}[/bold]")
+    console.print("\nPress CTRL+C to stop\n")
+    # Build uvicorn command
+    cmd = [
+        sys.executable,
+        "-m",
+        "uvicorn",
+        app_location,
+        "--host",
+        host,
+        "--port",
+        str(port),
+        "--log-level",
+        "warning",
+    ]
+    if reload:
+        cmd.append("--reload")
+    # Run uvicorn with proper process group handling
+    process = None
+    try:
+        # Create new process group to ensure all child processes can be killed together
+        # On Unix systems, use process group; on Windows, CREATE_NEW_PROCESS_GROUP
+        if sys.platform == "win32":
+            process = subprocess.Popen(
+                cmd, creationflags=subprocess.CREATE_NEW_PROCESS_GROUP
+            )
+        else:
+            process = subprocess.Popen(cmd, preexec_fn=os.setsid)
+        # Wait for process to complete
+        process.wait()
+    except KeyboardInterrupt:
+        console.print("\n[yellow]Stopping server and cleaning up processes...[/yellow]")
+        # Kill the entire process group to ensure all child processes are terminated
+        if process:
+            try:
+                if sys.platform == "win32":
+                    # Windows: terminate the process
+                    process.terminate()
+                else:
+                    # Unix: kill entire process group
+                    os.killpg(os.getpgid(process.pid), signal.SIGTERM)
+                # Wait briefly for graceful shutdown
+                try:
+                    process.wait(timeout=2)
+                except subprocess.TimeoutExpired:
+                    # Force kill if didn't terminate gracefully
+                    if sys.platform == "win32":
+                        process.kill()
+                    else:
+                        os.killpg(os.getpgid(process.pid), signal.SIGKILL)
+                    process.wait()
+            except (ProcessLookupError, OSError):
+                # Process already terminated
+                pass
+        console.print("[green]Server stopped[/green]")
+        raise typer.Exit(0)
+    except Exception as e:
+        console.print(f"[red]Error:[/red] {e}")
+        if process:
+            try:
+                if sys.platform == "win32":
+                    process.terminate()
+                else:
+                    os.killpg(os.getpgid(process.pid), signal.SIGTERM)
+            except (ProcessLookupError, OSError):
+                pass
+        raise typer.Exit(1)
+def discover_entry_point() -> Optional[str]:
+    """Discover the main entry point file."""
+    candidates = ["main.py", "app.py", "server.py"]
+    for candidate in candidates:
+        if Path(candidate).exists():
+            return candidate
+    return None
+def check_fastapi_app(entry_point: str) -> Optional[str]:
+    """
+    Check if entry point has a FastAPI app and return the app location.
+    Returns:
+        App location in format "module:app" or None
+    """
+    try:
+        # Read the file
+        content = Path(entry_point).read_text()
+        # Check for FastAPI app
+        if "app = FastAPI(" in content or "app=FastAPI(" in content:
+            # Extract module name from file path
+            module = entry_point.replace(".py", "").replace("/", ".")
+            return f"{module}:app"
+        return None
+    except Exception:
+        return None
+def _is_reload() -> bool:
+    """Check if running in uvicorn reload subprocess.
+    Returns:
+        True if running in a reload subprocess
+    """
+    return "UVICORN_RELOADER_PID" in os.environ
+def _discover_resources(entry_point: str):
+    """Discover deployable resources in entry point.
+    Args:
+        entry_point: Path to entry point file
+    Returns:
+        List of discovered DeployableResource instances
+    """
+    from ...core.discovery import ResourceDiscovery
+    try:
+        discovery = ResourceDiscovery(entry_point, max_depth=2)
+        resources = discovery.discover()
+        # Debug: Log what was discovered
+        if resources:
+            console.print(f"\n[dim]Discovered {len(resources)} resource(s):[/dim]")
+            for res in resources:
+                res_name = getattr(res, "name", "Unknown")
+                res_type = res.__class__.__name__
+                console.print(f"  [dim]• {res_name} ({res_type})[/dim]")
+            console.print()
+        return resources
+    except Exception as e:
+        console.print(f"[yellow]Warning:[/yellow] Resource discovery failed: {e}")
+        return []
+def _confirm_large_provisioning(resources) -> bool:
+    """Show resources and prompt user for confirmation.
+    Args:
+        resources: List of resources to provision
+    Returns:
+        True if user confirms, False otherwise
+    """
+    try:
+        console.print(
+            f"\n[yellow]Found {len(resources)} resources to provision:[/yellow]"
+        )
+        for resource in resources:
+            name = getattr(resource, "name", "Unknown")
+            resource_type = resource.__class__.__name__
+            console.print(f"  • {name} ({resource_type})")
+        console.print()
+        confirmed = questionary.confirm(
+            "This may take several minutes. Do you want to proceed?"
+        ).ask()
+        return confirmed if confirmed is not None else False
+    except (KeyboardInterrupt, EOFError):
+        console.print("\n[yellow]Cancelled[/yellow]")
+        return False
+    except Exception as e:
+        console.print(f"[yellow]Warning:[/yellow] Confirmation failed: {e}")
+        return False
+def _provision_resources(resources):
+    """Provision resources and wait for completion.
+    Args:
+        resources: List of resources to provision
+    """
+    import asyncio
+    from ...core.deployment import DeploymentOrchestrator
+    try:
+        console.print(f"\n[bold]Provisioning {len(resources)} resource(s)...[/bold]")
+        orchestrator = DeploymentOrchestrator(max_concurrent=3)
+        # Run provisioning with progress shown
+        loop = asyncio.new_event_loop()
+        asyncio.set_event_loop(loop)
+        loop.run_until_complete(orchestrator.deploy_all(resources, show_progress=True))
+        loop.close()
+    except Exception as e:
+        console.print(f"[yellow]Warning:[/yellow] Provisioning failed: {e}")

tetra-rp 0.6.0__py3-none-any.whl → 0.24.0__py3-none-any.whl

tetra-rp 0.6.0__py3-none-any.whl → 0.24.0__py3-none-any.whl