PyPI - truss - Versions diffs - 0.10.0rc1__py3-none-any.whl → 0.60.0__py3-none-any.whl - Mend - Supply Chain Defender

truss 0.10.0rc1__py3-none-any.whl → 0.60.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of truss might be problematic. Click here for more details.

Files changed (362) hide show

truss/cli/cli.py CHANGED Viewed

@@ -3,29 +3,62 @@ import json
 import logging
 import os
 import sys
+import time
+import warnings
 from functools import wraps
 from pathlib import Path
-from typing import Callable, Optional
+from typing import Callable, List, Optional, Tuple, Union
 import rich
+import rich.live
+import rich.logging
+import rich.spinner
+import rich.table
+import rich.traceback
 import rich_click as click
 import truss
-from truss.cli.console import console
-from truss.cli.create import ask_name
+from InquirerPy import inquirer
+from rich import progress
+from rich.console import Console
+from truss.base.constants import (
+    PRODUCTION_ENVIRONMENT_NAME,
+    TRTLLM_MIN_MEMORY_REQUEST_GI,
+)
+from truss.base.errors import RemoteNetworkError
+from truss.base.trt_llm_config import TrussTRTLLMQuantizationType
+from truss.base.truss_config import Build, ModelServer
+from truss.cli.remote_cli import (
+    inquire_model_name,
+    inquire_remote_config,
+    inquire_remote_name,
+)
 from truss.remote.baseten.core import (
+    ACTIVE_STATUS,
+    DEPLOYING_STATUSES,
     ModelId,
     ModelIdentifier,
     ModelName,
     ModelVersionId,
 )
 from truss.remote.baseten.service import BasetenService
-from truss.remote.remote_cli import inquire_model_name, inquire_remote_name
+from truss.remote.baseten.utils.status import get_displayable_status
 from truss.remote.remote_factory import USER_TRUSSRC_PATH, RemoteFactory
-from truss.truss_config import Build, ModelServer
-from truss.truss_handle import TrussHandle
-logging.basicConfig(level=logging.INFO)
+from truss.trt_llm.config_checks import (
+    is_missing_secrets_for_trt_llm_builder,
+    memory_updated_for_trt_llm_builder,
+    uses_trt_llm_builder,
+)
+from truss.truss_handle.build import cleanup as _cleanup
+from truss.truss_handle.build import init_directory as _init
+from truss.truss_handle.build import load
+from truss.util import docker
+from truss.util.log_utils import LogInterceptor
+# Register custom two-frame emoji spinners in rich's spinner table. The keys are the
+# spinner names that `_create_chains_table` passes to `rich.spinner.Spinner`.
+rich.spinner.SPINNERS["deploying"] = {"interval": 500, "frames": ["👾 ", " 👾"]}
+rich.spinner.SPINNERS["building"] = {"interval": 500, "frames": ["🛠️ ", " 🛠️"]}
+rich.spinner.SPINNERS["loading"] = {"interval": 500, "frames": ["⏱️ ", " ⏱️"]}
+rich.spinner.SPINNERS["active"] = {"interval": 500, "frames": ["💚 ", " 💚"]}
+rich.spinner.SPINNERS["failed"] = {"interval": 500, "frames": ["😤 ", " 😤"]}
 click.rich_click.COMMAND_GROUPS = {
     "truss": [
@@ -33,26 +66,31 @@ click.rich_click.COMMAND_GROUPS = {
             "name": "Main usage",
             "commands": ["init", "push", "watch", "predict"],
             "table_styles": {  # type: ignore
-                "row_styles": ["green"],
+                "row_styles": ["green"]
             },
         },
         {
             "name": "Advanced Usage",
             "commands": ["image", "container", "cleanup"],
             "table_styles": {  # type: ignore
-                "row_styles": ["yellow"],
+                "row_styles": ["yellow"]
+            },
+        },
+        {
+            "name": "Chains",
+            "commands": ["chains"],
+            "table_styles": {  # type: ignore
+                "row_styles": ["red"]
             },
         },
     ]
 }
+console = Console()
-def echo_output(f: Callable[..., object]):
-    @wraps(f)
-    def wrapper(*args, **kwargs):
-        click.echo(f(*args, **kwargs))
+error_console = Console(stderr=True, style="bold red")
-    return wrapper
+is_humanfriendly_log_level = True
 def error_handling(f: Callable[..., object]):
@@ -63,11 +101,74 @@ def error_handling(f: Callable[..., object]):
         except click.UsageError as e:
             raise e  # You can re-raise the exception or handle it different
         except Exception as e:
-            click.secho(f"ERROR: {e}", fg="red")
+            if is_humanfriendly_log_level:
+                console.print(
+                    f"[bold red]ERROR {type(e).__name__}[/bold red]: {e}",
+                    highlight=True,
+                )
+            else:
+                console.print_exception(show_locals=True)
     return wrapper
+# Default `--log` choice. `_set_logging_level` compares against it to pick the terse
+# rich handler (no time, level or path columns).
+_HUMANFRIENDLY_LOG_LEVEL = "humanfriendly"
+# Accepted `--log` values (long names and one-letter aliases) mapped to stdlib
+# `logging` levels. The human-friendly choice maps to INFO.
+_log_level_str_to_level = {
+    _HUMANFRIENDLY_LOG_LEVEL: logging.INFO,
+    "W": logging.WARNING,
+    "WARNING": logging.WARNING,
+    "I": logging.INFO,
+    "INFO": logging.INFO,
+    "D": logging.DEBUG,
+    "DEBUG": logging.DEBUG,
+}
+def _set_logging_level(log_level: Union[str, int]) -> None:
+    """Configures the root logger with a single rich handler.
+    Args:
+        log_level: A key of `_log_level_str_to_level` or a numeric `logging` level.
+    Raises:
+        KeyError: If `log_level` is a string that is not a known key.
+    """
+    # Declared up front: the assignment in the `else` branch rebinds the module flag.
+    global is_humanfriendly_log_level
+    if isinstance(log_level, str):
+        level = _log_level_str_to_level[log_level]
+    else:
+        level = log_level
+    root_logger = logging.getLogger()
+    root_logger.setLevel(level)
+    if log_level == _HUMANFRIENDLY_LOG_LEVEL:
+        rich_handler = rich.logging.RichHandler(
+            show_time=False, show_level=False, show_path=False
+        )
+    else:
+        # Rich handler adds time, levels, file location etc.
+        rich_handler = rich.logging.RichHandler()
+        is_humanfriendly_log_level = False
+    root_logger.handlers = []  # Clear existing handlers
+    root_logger.addHandler(rich_handler)
+    # Enable deprecation warnings raised in this module.
+    # Raw string: the same pattern as before, without the invalid `\.` escape.
+    warnings.filterwarnings(
+        "default", category=DeprecationWarning, module=r"^truss\.cli\b"
+    )
+def log_level_option(f):
+    """Decorator that adds a `--log` option to a click command.
+    The selected value is applied through the option callback and is not passed on
+    to the decorated function (`expose_value=False`).
+    """
+    def _apply_log_level(ctx, param, value):
+        _set_logging_level(value)
+        return value
+    choices = click.Choice(list(_log_level_str_to_level), case_sensitive=False)
+    add_log_option = click.option(
+        "--log",
+        default=_HUMANFRIENDLY_LOG_LEVEL,
+        expose_value=False,
+        help="Customizes logging.",
+        type=choices,
+        callback=_apply_log_level,
+    )
+    return add_log_option(f)
+def _format_link(text: str) -> str:
+    """Wraps `text` in rich `[link=...]` markup whose target is `text` itself."""
+    return "[link={0}]{0}[/link]".format(text)
 def print_help() -> None:
     ctx = click.get_current_context()
     click.echo(ctx.get_help())
@@ -76,6 +177,7 @@ def print_help() -> None:
 @click.group(name="truss", invoke_without_command=True)  # type: ignore
 @click.pass_context
 @click.version_option(truss.version())
+@log_level_option
 def truss_cli(ctx) -> None:
     """truss: The simplest way to serve models in production"""
     if not ctx.invoked_subcommand:
@@ -85,13 +187,11 @@ def truss_cli(ctx) -> None:
 @click.group()
 def container():
     """Subcommands for truss container"""
-    pass
 @click.group()
 def image():
     """Subcommands for truss image"""
-    pass
 @truss_cli.command()
@@ -103,23 +203,36 @@ def image():
     default=ModelServer.TrussServer.value,
     type=click.Choice([server.value for server in ModelServer]),
 )
+@click.option("-n", "--name", type=click.STRING)
+@click.option(
+    "--python-config/--no-python-config",
+    type=bool,
+    default=False,
+    help="Uses the code first tooling to build models.",
+)
+@log_level_option
 @error_handling
-def init(target_directory, backend) -> None:
+def init(target_directory, backend, name, python_config) -> None:
     """Create a new truss.
     TARGET_DIRECTORY: A Truss is created in this directory
     """
     if os.path.isdir(target_directory):
         raise click.ClickException(
-            f'Error: Directory "{target_directory}" already exists and cannot be overwritten.'
+            f"Error: Directory `{target_directory}` already exists "
+            "and cannot be overwritten."
         )
     tr_path = Path(target_directory)
     build_config = Build(model_server=ModelServer[backend])
-    model_name = ask_name()
-    truss.init(
+    if name:
+        model_name = name
+    else:
+        model_name = inquire_model_name()
+    _init(
         target_directory=target_directory,
         build_config=build_config,
         model_name=model_name,
+        python_config=python_config,
     )
     click.echo(f"Truss {model_name} was created in {tr_path.absolute()}")
@@ -127,6 +240,7 @@ def init(target_directory, backend) -> None:
 @image.command()  # type: ignore
 @click.argument("build_dir")
 @click.argument("target_directory", required=False)
+@log_level_option
 @error_handling
 def build_context(build_dir, target_directory: str) -> None:
     """
@@ -143,9 +257,16 @@ def build_context(build_dir, target_directory: str) -> None:
 @image.command()  # type: ignore
 @click.argument("target_directory", required=False)
 @click.argument("build_dir", required=False)
-@error_handling
 @click.option("--tag", help="Docker image tag")
-def build(target_directory: str, build_dir: Path, tag) -> None:
+@click.option(
+    "--use_host_network",
+    is_flag=True,
+    default=False,
+    help="Use host network for docker build",
+)
+@log_level_option
+@error_handling
+def build(target_directory: str, build_dir: Path, tag, use_host_network) -> None:
     """
     Builds the docker image for a Truss.
@@ -156,6 +277,9 @@ def build(target_directory: str, build_dir: Path, tag) -> None:
     tr = _get_truss_from_directory(target_directory=target_directory)
     if build_dir:
         build_dir = Path(build_dir)
+    if use_host_network:
+        tr.build_serving_docker_image(build_dir=build_dir, tag=tag, network="host")
+        return
     tr.build_serving_docker_image(build_dir=build_dir, tag=tag)
@@ -168,13 +292,16 @@ def build(target_directory: str, build_dir: Path, tag) -> None:
     "--attach", is_flag=True, default=False, help="Flag for attaching the process"
 )
 @click.option(
-    "--cache/--no-cache",
+    "--use_host_network",
     is_flag=True,
-    default=True,
-    help="Flag for caching build or not",
+    default=False,
+    help="Use host network for docker build",
 )
+@log_level_option
 @error_handling
-def run(target_directory: str, build_dir: Path, tag, port, attach, cache) -> None:
+def run(
+    target_directory: str, build_dir: Path, tag, port, attach, use_host_network
+) -> None:
     """
     Runs the docker image for a Truss.
@@ -190,38 +317,74 @@ def run(target_directory: str, build_dir: Path, tag, port, attach, cache) -> Non
         click.confirm(
             f"Container already exists at {urls}. Are you sure you want to continue?"
         )
-    tr.docker_run(
-        build_dir=build_dir, tag=tag, local_port=port, detach=not attach, cache=cache
-    )
+    if use_host_network:
+        tr.docker_run(
+            build_dir=build_dir,
+            tag=tag,
+            local_port=port,
+            detach=not attach,
+            network="host",
+        )
+        return
+    tr.docker_run(build_dir=build_dir, tag=tag, local_port=port, detach=not attach)
 @truss_cli.command()
-@click.argument("target_directory", required=False, default=os.getcwd())
 @click.option(
-    "--remote",
+    "--api-key",
     type=str,
     required=False,
     help="Name of the remote in .trussrc to patch changes to",
 )
+@error_handling
+def login(api_key: Optional[str]):
+    from truss.api import login
+    if not api_key:
+        remote_config = inquire_remote_config()
+        RemoteFactory.update_remote_config(remote_config)
+    else:
+        login(api_key)
+@truss_cli.command()
 @click.option(
-    "--logs",
-    is_flag=True,
-    show_default=True,
-    default=False,
-    help="Automatically open remote logs tab",
+    "--remote",
+    type=str,
+    required=False,
+    help="Name of the remote in .trussrc to check whoami.",
 )
 @error_handling
-def watch(
-    target_directory: str,
-    remote: str,
-    logs: bool,
-) -> None:
+def whoami(remote: Optional[str]):
+    """
+    Shows user information and exit.
+    """
+    # Imported locally; inside this function the name refers to the API helper,
+    # not to this CLI command.
+    from truss.api import whoami
+    if not remote:
+        remote = inquire_remote_name(RemoteFactory.get_available_config_names())
+    user = whoami(remote)
+    # Prints `<workspace>\<email>`. The backslash is escaped explicitly because `\{`
+    # is an invalid escape sequence.
+    console.print(f"{user.workspace_name}\\{user.user_email}")
+@truss_cli.command()
+@click.argument("target_directory", required=False, default=os.getcwd())
+@click.option(
+    "--remote",
+    type=str,
+    required=False,
+    help="Name of the remote in .trussrc to patch changes to",
+)
+@log_level_option
+@error_handling
+def watch(target_directory: str, remote: str) -> None:
     """
     Seamless remote development with truss
     TARGET_DIRECTORY: A Truss directory. If none, use current directory.
     """
     # TODO: ensure that provider support draft
     if not remote:
         remote = inquire_remote_name(RemoteFactory.get_available_config_names())
@@ -231,16 +394,456 @@ def watch(
     tr = _get_truss_from_directory(target_directory=target_directory)
     model_name = tr.spec.config.model_name
     if not model_name:
-        rich.print(
+        console.print(
             "🧐 NoneType model_name provided in config.yaml. "
             "Please check that you have the correct model name in your config file."
         )
         sys.exit(1)
     service = remote_provider.get_service(model_identifier=ModelName(model_name))
-    logs_url = remote_provider.get_remote_logs_url(service)
-    rich.print(f"🪵  View logs for your deployment at {logs_url}")
-    remote_provider.sync_truss_to_dev_version_by_name(model_name, target_directory)
+    console.print(
+        f"🪵  View logs for your deployment at {_format_link(service.logs_url)}"
+    )
+    if not os.path.isfile(target_directory):
+        remote_provider.sync_truss_to_dev_version_by_name(
+            model_name, target_directory, console, error_console
+        )
+    else:
+        # These imports are delayed, to handle pydantic v1 envs gracefully.
+        from truss_chains.deployment import deployment_client
+        deployment_client.watch_model(
+            source=Path(target_directory),
+            model_name=model_name,
+            remote_provider=remote_provider,
+            console=console,
+            error_console=error_console,
+        )
+# Chains Stuff #########################################################################
+# Click group that the chains subcommands below attach to via `@chains.command`.
+@click.group()
+def chains():
+    """Subcommands for truss chains"""
+def _make_chains_curl_snippet(run_remote_url: str, environment: Optional[str]) -> str:
+    """Builds a `curl` command line for invoking a chain.
+    If `environment` is given and the URL contains "deployment", everything from that
+    marker on is replaced by `environments/<environment>/run_remote`.
+    """
+    if environment and "deployment" in run_remote_url:
+        url_prefix = run_remote_url[: run_remote_url.index("deployment")]
+        run_remote_url = url_prefix + f"environments/{environment}/run_remote"
+    return (
+        f"curl -X POST '{run_remote_url}' \\\n"
+        '    -H "Authorization: Api-Key $BASETEN_API_KEY" \\\n'
+        "    -d '<JSON_INPUT>'"
+    )
+def _create_chains_table(service) -> Tuple[rich.table.Table, List[str]]:
+    """Creates a status table similar to:
+                                          ⛓️   ItestChain - Chain  ⛓️
+                         🌐 Status page: https://app.baseten.co/chains/p7qrm93v/overview
+    ╭──────────────────────┬──────────────────────────────┬─────────────────────────────────────────────╮
+    │ Status               │ Chainlet                     │ Logs URL                                   │
+    ├──────────────────────┼──────────────────────────────┼────────────────────────────────────────────┤
+    │ 🛠️  BUILDING         │ ItestChain (entrypoint)      │ https://app.baseten.co/chains/.../logs/... │
+    ├──────────────────────┼──────────────────────────────┼────────────────────────────────────────────┤
+    │ 👾  DEPLOYING        │ GENERATE_DATA (internal)     │ https://app.baseten.co/chains/.../logs/... │
+    │ 👾  DEPLOYING        │ SplitTextFailOnce (internal) │ https://app.baseten.co/chains/.../logs/... │
+    │ 👾  DEPLOYING        │ TextReplicator (internal)    │ https://app.baseten.co/chains/.../logs/... │
+    │ 🛠️  BUILDING         │ TextToNum (internal)         │ https://app.baseten.co/chains/.../logs/... │
+    ╰──────────────────────┴──────────────────────────────┴────────────────────────────────────────────╯
+    Returns the table together with the displayable status of every chainlet in row
+    order (entrypoint first, then the remaining chainlets sorted by name).
+    """
+    title = (
+        f"⛓️   {service.name} - Chain  ⛓️\n\n "
+        f"🌐 Status page: {_format_link(service.status_page_url)}"
+    )
+    table = rich.table.Table(
+        show_header=True,
+        header_style="bold yellow",
+        title=title,
+        box=rich.table.box.ROUNDED,
+        border_style="blue",
+    )
+    table.add_column("Status", style="dim", min_width=20)
+    table.add_column("Chainlet", min_width=20)
+    table.add_column("Logs URL")
+    statuses = []
+    # Materialize once: the infos are traversed twice below, which would silently
+    # drop rows if `get_info()` ever returned a one-shot iterator.
+    chainlet_infos = list(service.get_info())
+    # Organize chainlets s.t. entrypoint is first.
+    # NOTE: `next` raises `StopIteration` if no chainlet is flagged as entrypoint.
+    entrypoint = next(x for x in chainlet_infos if x.is_entrypoint)
+    sorted_chainlets = sorted(
+        (x for x in chainlet_infos if not x.is_entrypoint), key=lambda x: x.name
+    )
+    for chainlet in [entrypoint] + sorted_chainlets:
+        displayable_status = get_displayable_status(chainlet.status)
+        # Pick one of the custom spinners registered at module level.
+        if displayable_status == ACTIVE_STATUS:
+            spinner_name = "active"
+        elif displayable_status in DEPLOYING_STATUSES:
+            if displayable_status == "BUILDING":
+                spinner_name = "building"
+            elif displayable_status == "LOADING":
+                spinner_name = "loading"
+            else:
+                spinner_name = "deploying"
+        else:
+            # Anything that is neither active nor deploying is shown as failed.
+            spinner_name = "failed"
+        spinner = rich.spinner.Spinner(spinner_name, text=displayable_status)
+        if chainlet.is_entrypoint:
+            display_name = f"{chainlet.name} (entrypoint)"
+        else:
+            display_name = f"{chainlet.name} (internal)"
+        table.add_row(spinner, display_name, _format_link(chainlet.logs_url))
+        # Add section divider after entrypoint, entrypoint must be first.
+        if chainlet.is_entrypoint:
+            table.add_section()
+        statuses.append(displayable_status)
+    return table, statuses
+@chains.command(name="push")  # type: ignore
+@click.argument("source", type=Path, required=True)
+@click.argument("entrypoint", type=str, required=False)
+@click.option(
+    "--name",
+    type=str,
+    required=False,
+    help="Name of the chain to be deployed, if not given, the entrypoint name is used.",
+)
+@click.option(
+    "--publish/--no-publish",
+    type=bool,
+    default=False,
+    help="Create chainlets as published deployments.",
+)
+@click.option(
+    "--promote/--no-promote",
+    type=bool,
+    default=False,
+    help="Replace production chainlets with newly deployed chainlets.",
+)
+@click.option(
+    "--environment",
+    type=str,
+    required=False,
+    help=(
+        "Deploy the chain as a published deployment to the specified environment. "
+        "If specified, --publish is implied and the supplied value of --promote will be ignored."
+    ),
+)
+@click.option(
+    "--wait/--no-wait",
+    type=bool,
+    default=True,
+    help="Wait until all chainlets are ready (or deployment failed).",
+)
+@click.option(
+    "--watch/--no-watch",
+    type=bool,
+    default=False,
+    help=(
+        "Watches the chains source code and applies live patches. Using this option "
+        "will wait for the chain to be deployed (i.e. `--wait` flag is applied), "
+        "before starting to watch for changes. This option requires the deployment "
+        "to be a development deployment (i.e. `--no-promote` and `--no-publish`)."
+    ),
+)
+@click.option(
+    "--dryrun",
+    type=bool,
+    default=False,
+    is_flag=True,
+    help="Produces only generated files, but doesn't deploy anything.",
+)
+@click.option(
+    "--remote",
+    type=str,
+    required=False,
+    help="Name of the remote in .trussrc to push to.",
+)
+@click.option(
+    "--experimental-watch-chainlet-names",
+    type=str,
+    required=False,
+    help=(
+        "Runs `watch`, but only applies patches to specified chainlets. The option is "
+        "a comma-separated list of chainlet (display) names. This option can give "
+        "faster dev loops, but also lead to inconsistent deployments. Use with caution "
+        "and refer to docs."
+    ),
+)
+@log_level_option
+@error_handling
+def push_chain(
+    source: Path,
+    entrypoint: Optional[str],
+    name: Optional[str],
+    publish: bool,
+    promote: bool,
+    wait: bool,
+    watch: bool,
+    dryrun: bool,
+    remote: Optional[str],
+    environment: Optional[str],
+    experimental_watch_chainlet_names: Optional[str],
+) -> None:
+    """
+    Deploys a chain remotely.
+    SOURCE: Path to a python file that contains the entrypoint chainlet.
+    ENTRYPOINT: Class name of the entrypoint chainlet in source file. May be omitted
+    if a chainlet definition in SOURCE is tagged with `@chains.mark_entrypoint`.
+    """
+    # These imports are delayed, to handle pydantic v1 envs gracefully.
+    from truss_chains import definitions as chains_def
+    from truss_chains import framework
+    from truss_chains.deployment import deployment_client
+    # Restricting watch to specific chainlets implies watching.
+    if experimental_watch_chainlet_names:
+        watch = True
+    if watch:
+        if publish or promote:
+            raise ValueError(
+                "When using `--watch`, the deployment cannot be published or promoted."
+            )
+        if not wait:
+            console.print(
+                "`--watch` is used. Will wait for deployment before watching files."
+            )
+            wait = True
+    if promote and environment:
+        promote_warning = (
+            "`promote` flag and `environment` flag were both specified. "
+            "Ignoring the value of `promote`."
+        )
+        console.print(promote_warning, style="yellow")
+    if not remote:
+        remote = inquire_remote_name(RemoteFactory.get_available_config_names())
+    with framework.ChainletImporter.import_target(source, entrypoint) as entrypoint_cls:
+        # Name precedence: explicit `--name`, then chain metadata, then display name.
+        chain_name = (
+            name or entrypoint_cls.meta_data.chain_name or entrypoint_cls.display_name
+        )
+        options = chains_def.PushOptionsBaseten.create(
+            chain_name=chain_name,
+            promote=promote,
+            publish=publish,
+            only_generate_trusses=dryrun,
+            remote=remote,
+            environment=environment,
+        )
+        service = deployment_client.push(
+            entrypoint_cls, options, progress_bar=progress.Progress
+        )
+    # A dry run only generates files; there is no service to report on.
+    if dryrun:
+        return
+    assert isinstance(service, deployment_client.BasetenChainService)
+    curl_snippet = _make_chains_curl_snippet(
+        service.run_remote_url, options.environment
+    )
+    table, statuses = _create_chains_table(service)
+    status_check_wait_sec = 2
+    if wait:
+        num_services = len(statuses)
+        success = False
+        num_failed = 0
+        # Logging interferes with live display (even when using richHandler)
+        # -> capture logs and print later.
+        with LogInterceptor() as log_interceptor, rich.live.Live(
+            table, console=console, refresh_per_second=4
+        ) as live:
+            # Poll until every chainlet is active or at least one has left the
+            # active/deploying states.
+            while True:
+                table, statuses = _create_chains_table(service)
+                live.update(table)
+                num_active = sum(s == ACTIVE_STATUS for s in statuses)
+                num_deploying = sum(s in DEPLOYING_STATUSES for s in statuses)
+                if num_active == num_services:
+                    success = True
+                    break
+                elif num_failed := num_services - num_active - num_deploying:
+                    break
+                time.sleep(status_check_wait_sec)
+            intercepted_logs = log_interceptor.get_logs()
+        # Prints must be outside `Live` context.
+        if intercepted_logs:
+            console.print("Logs intercepted during waiting:", style="blue")
+            for log in intercepted_logs:
+                console.print(f"\t{log}")
+        if success:
+            deploy_success_text = "Deployment succeeded."
+            if environment:
+                deploy_success_text = (
+                    "Your chain has been deployed into "
+                    f"the {options.environment} environment."
+                )
+            console.print(deploy_success_text, style="bold green")
+            console.print(f"You can run the chain with:\n{curl_snippet}")
+            if watch:  # Note that this command will print a startup message.
+                if experimental_watch_chainlet_names:
+                    included_chainlets = [
+                        x.strip() for x in experimental_watch_chainlet_names.split(",")
+                    ]
+                else:
+                    included_chainlets = None
+                deployment_client.watch(
+                    source,
+                    entrypoint,
+                    name,
+                    remote,
+                    console,
+                    error_console,
+                    show_stack_trace=not is_humanfriendly_log_level,
+                    included_chainlets=included_chainlets,
+                )
+        else:
+            console.print(f"Deployment failed ({num_failed} failures).", style="red")
+    else:
+        # Not waiting: show a one-off snapshot of the statuses.
+        console.print(table)
+        console.print(
+            "Once all chainlets are deployed, "
+            f"you can run the chain with:\n\n{curl_snippet}"
+        )
+@chains.command(name="watch")  # type: ignore
+@click.argument("source", type=Path, required=True)
+@click.argument("entrypoint", type=str, required=False)
+@click.option(
+    "--name",
+    type=str,
+    required=False,
+    help="Name of the chain to be deployed, if not given, the entrypoint name is used.",
+)
+@click.option(
+    "--remote",
+    type=str,
+    required=False,
+    help="Name of the remote in .trussrc to push to.",
+)
+@click.option(
+    "--experimental-chainlet-names",
+    type=str,
+    required=False,
+    help=(
+        "Runs `watch`, but only applies patches to specified chainlets. The option is "
+        "a comma-separated list of chainlet (display) names. This option can give "
+        "faster dev loops, but also lead to inconsistent deployments. Use with caution "
+        "and refer to docs."
+    ),
+)
+@log_level_option
+@error_handling
+def watch_chains(
+    source: Path,
+    entrypoint: Optional[str],
+    name: Optional[str],
+    remote: Optional[str],
+    experimental_chainlet_names: Optional[str],
+) -> None:
+    """
+    Watches the chains source code and applies live patches to a development deployment.
+    The development deployment must have been deployed before running this command.
+    SOURCE: Path to a python file that contains the entrypoint chainlet.
+    ENTRYPOINT: Class name of the entrypoint chainlet in source file. May be omitted
+    if a chainlet definition in SOURCE is tagged with `@chains.mark_entrypoint`.
+    """
+    # Deferred import so that pydantic v1 environments are handled gracefully.
+    from truss_chains.deployment import deployment_client
+    # Ask interactively for a remote when none was passed.
+    remote = remote or inquire_remote_name(
+        RemoteFactory.get_available_config_names()
+    )
+    # `None` means no restriction; otherwise a list of stripped chainlet names.
+    included_chainlets = (
+        [chainlet_name.strip() for chainlet_name in experimental_chainlet_names.split(",")]
+        if experimental_chainlet_names
+        else None
+    )
+    deployment_client.watch(
+        source,
+        entrypoint,
+        name,
+        remote,
+        console,
+        error_console,
+        show_stack_trace=not is_humanfriendly_log_level,
+        included_chainlets=included_chainlets,
+    )
+@chains.command(name="init")  # type: ignore
+@click.argument("directory", type=Path, required=False)
+@log_level_option
+@error_handling
+def init_chain(directory: Optional[Path]) -> None:
+    """
+    Initializes a chains project directory.
+    DIRECTORY: A name of new or existing directory to create the chain in,
+      it must be empty. If not specified, the current directory is used.
+    """
+    if not directory:
+        directory = Path.cwd()
+    # An existing target must be an empty directory; a missing one is created.
+    if directory.exists():
+        if not directory.is_dir():
+            raise ValueError(f"The path {directory} must be a directory.")
+        if any(directory.iterdir()):
+            raise ValueError(f"Directory {directory} must be empty.")
+    else:
+        directory.mkdir()
+    filename = inquirer.text(
+        qmark="",
+        message="Enter the python file name for the chain.",
+        default="my_chain.py",
+    ).execute()
+    filepath = directory / str(filename).strip()
+    console.print(f"Creating and populating {filepath}...\n")
+    source_code = _load_example_chainlet_code()
+    filepath.write_text(source_code)
+    # Printed as one string: separate positional arguments would be joined with a
+    # space and indent the first bullet. The hint names `push`, the subcommand that
+    # is registered on the `chains` group.
+    console.print(
+        "Next steps:\n"
+        f"💻 Run [bold green]`python {filepath}`[/bold green] for local debug "
+        "execution.\n"
+        f"🚢 Run [bold green]`truss chains push {filepath}`[/bold green] "
+        "to deploy the chain to Baseten.\n"
+    )
+def _load_example_chainlet_code() -> str:
+    """Returns the source text of the bundled reference chainlet module."""
+    try:
+        from truss_chains.reference_code import reference_chainlet as example_module
+    except Exception as e:
+        # A faulty example would surface here as a validation error on import.
+        raise Exception("Failed to load starter code. Please notify support.") from e
+    return Path(example_module.__file__).read_text()
+# End Chains Stuff #####################################################################
 def _extract_and_validate_model_identifier(
@@ -315,7 +918,10 @@ def _extract_request_data(data: Optional[str], file: Optional[Path]):
     "--model-version",
     type=str,
     required=False,
-    help="[DEPRECATED] Use --model-deployment instead, this will be removed in future release. ID of model deployment",
+    help=(
+        "[DEPRECATED] Use --model-deployment instead, this will be  "
+        "removed in future release. ID of model deployment"
+    ),
 )
 @click.option(
     "--model-deployment",
@@ -323,13 +929,8 @@ def _extract_request_data(data: Optional[str], file: Optional[Path]):
     required=False,
     help="ID of model deployment to call",
 )
-@click.option(
-    "--model",
-    type=str,
-    required=False,
-    help="ID of model to call",
-)
-@echo_output
+@click.option("--model", type=str, required=False, help="ID of model to call")
+@log_level_option
 def predict(
     target_directory: str,
     remote: str,
@@ -356,7 +957,8 @@ def predict(
     if model_version:
         console.print(
-            "[DEPRECATED] --model-version is deprecated, use --model-deployment instead.",
+            "[DEPRECATED] --model-version is deprecated, "
+            "use --model-deployment instead.",
             style="yellow",
         )
         model_deployment = model_version
@@ -376,7 +978,7 @@ def predict(
     # Log deployment ID for Baseten models.
     if isinstance(service, BasetenService):
-        rich.print(
+        console.print(
             f"Calling predict on {'[cyan]development[/cyan] ' if service.is_draft else ''}"
             f"deployment ID {service.model_version_id}..."
         )
@@ -386,7 +988,40 @@ def predict(
         for chunk in result:
             click.echo(chunk, nl=False)
         return
-    rich.print_json(data=result)
+    console.print_json(data=result)
+@truss_cli.command()
+@click.argument("script", required=True)
+@click.argument("target_directory", required=False, default=os.getcwd())
+def run_python(script, target_directory):
+    # Runs SCRIPT through the truss's `run_python_script`, echoes the container
+    # output (stderr entries in red) and exits with the container's wait result.
+    # Kept as a comment: a docstring would become the command's help text.
+    script_path = Path(script)
+    truss_dir = Path(target_directory)
+    if not script_path.exists():
+        raise click.BadParameter(
+            f"File {script} does not exist. Please provide a valid file."
+        )
+    if not truss_dir.exists():
+        raise click.BadParameter(f"Directory {target_directory} does not exist.")
+    if not (truss_dir / "config.yaml").exists():
+        raise click.BadParameter(
+            f"Directory {target_directory} does not contain a valid Truss."
+        )
+    tr = _get_truss_from_directory(target_directory=target_directory)
+    container = tr.run_python_script(script_path)
+    for entry in container.logs():
+        # Each entry is indexed as (stream name, raw bytes).
+        echo_style = {"fg": "red"} if entry[0] == "stderr" else {}
+        click.secho(entry[1].decode("utf-8", "replace"), nl=False, **echo_style)
+    sys.exit(container.wait())
 @truss_cli.command()
@@ -422,6 +1057,15 @@ def predict(
         "after deploy completes."
     ),
 )
+@click.option(
+    "--environment",
+    type=str,
+    required=False,
+    help=(
+        "Push the truss as a published deployment to the specified environment."
+        "If specified, --publish is implied and the supplied value of --promote will be ignored."
+    ),
+)
 @click.option(
     "--preserve-previous-production-deployment",
     type=bool,
@@ -429,9 +1073,9 @@ def predict(
     required=False,
     default=False,
     help=(
-        "Preserve the previous production deployment's autoscaling setting. When not specified, "
-        "the previous production deployment will be updated to allow it to scale to zero. "
-        "Can only be use in combination with --promote option"
+        "Preserve the previous production deployment's autoscaling setting. When "
+        "not specified, the previous production deployment will be updated to allow "
+        "it to scale to zero. Can only be use in combination with --promote option."
     ),
 )
 @click.option(
@@ -440,7 +1084,15 @@ def predict(
     is_flag=True,
     required=False,
     default=False,
-    help="Trust truss with hosted secrets.",
+    help="[DEPRECATED]Trust truss with hosted secrets.",
+)
+@click.option(
+    "--disable-truss-download",
+    type=bool,
+    is_flag=True,
+    required=False,
+    default=False,
+    help="Disable downloading the truss directory from the UI.",
 )
 @click.option(
     "--deployment-name",
@@ -448,19 +1100,41 @@ def predict(
     required=False,
     help=(
         "Name of the deployment created by the push. Can only be "
-        "used in combination with --publish or --promote."
+        "used in combination with `--publish` or `--promote`."
     ),
 )
+@click.option(
+    "--wait/--no-wait",
+    type=bool,
+    is_flag=True,
+    required=False,
+    default=False,
+    help="Wait for the deployment to complete before returning.",
+)
+@click.option(
+    "--timeout-seconds",
+    type=int,
+    required=False,
+    help=(
+        "Maximum time to wait for deployment to complete in seconds. Without "
+        "specifying, the command will not complete until the deployment is complete."
+    ),
+)
+@log_level_option
 @error_handling
 def push(
     target_directory: str,
     remote: str,
-    model_name: Optional[str],
+    model_name: str,
     publish: bool = False,
     trusted: bool = False,
+    disable_truss_download: bool = False,
     promote: bool = False,
     preserve_previous_production_deployment: bool = False,
     deployment_name: Optional[str] = None,
+    wait: bool = False,
+    timeout_seconds: Optional[int] = None,
+    environment: Optional[str] = None,
 ) -> None:
     """
     Pushes a truss to a TrussRemote.
@@ -472,27 +1146,72 @@ def push(
         remote = inquire_remote_name(RemoteFactory.get_available_config_names())
     remote_provider = RemoteFactory.create(remote=remote)
     tr = _get_truss_from_directory(target_directory=target_directory)
     model_name = model_name or tr.spec.config.model_name
     if not model_name:
         model_name = inquire_model_name()
+    if promote and environment:
+        promote_warning = "`promote` flag and `environment` flag were both specified. Ignoring the value of `promote`"
+        console.print(promote_warning, style="yellow")
+    if promote and not environment:
+        environment = PRODUCTION_ENVIRONMENT_NAME
     # Write model name to config if it's not already there
     if model_name != tr.spec.config.model_name:
         tr.spec.config.model_name = model_name
         tr.spec.config.write_to_yaml_file(tr.spec.config_path, verbose=False)
+    # Log a warning if using --trusted.
+    if trusted:
+        trusted_deprecation_notice = (
+            "[DEPRECATED] `--trusted` option is deprecated and no longer needed"
+        )
+        console.print(trusted_deprecation_notice, style="yellow")
+    # trt-llm engine builder checks
+    if uses_trt_llm_builder(tr):
+        if not publish:
+            live_reload_disabled_text = "Development mode is currently not supported for trusses using TRT-LLM build flow, push as a published model using --publish"
+            console.print(live_reload_disabled_text, style="red")
+            sys.exit(1)
+        if is_missing_secrets_for_trt_llm_builder(tr):
+            missing_token_text = (
+                "`hf_access_token` must be provided in secrets to build a gated model. "
+                "Please see https://docs.baseten.co/deploy/guides/private-model for configuration instructions."
+            )
+            console.print(missing_token_text, style="red")
+            sys.exit(1)
+        if memory_updated_for_trt_llm_builder(tr):
+            console.print(
+                f"Automatically increasing memory for trt-llm builder to {TRTLLM_MIN_MEMORY_REQUEST_GI}Gi."
+            )
+        for trt_llm_build_config in tr.spec.config.parsed_trt_llm_build_configs:
+            if (
+                trt_llm_build_config.quantization_type
+                in [TrussTRTLLMQuantizationType.FP8, TrussTRTLLMQuantizationType.FP8_KV]
+                and not trt_llm_build_config.num_builder_gpus
+            ):
+                fp8_and_num_builder_gpus_text = (
+                    "Warning: build specifies FP8 quantization but does not explicitly specify number of build GPUs. "
+                    "GPU memory required at build time may be significantly more than that required at inference time due to FP8 quantization, which can result in OOM failures during the engine build phase."
+                    "`num_builder_gpus` can be used to specify the number of GPUs to use at build time."
+                )
+                console.print(fp8_and_num_builder_gpus_text, style="yellow")
     # TODO(Abu): This needs to be refactored to be more generic
     service = remote_provider.push(
         tr,
-        model_name,
+        model_name=model_name,
         publish=publish,
-        trusted=trusted,
+        trusted=True,
         promote=promote,
         preserve_previous_prod_deployment=preserve_previous_production_deployment,
         deployment_name=deployment_name,
+        environment=environment,
+        disable_truss_download=disable_truss_download,
+        progress_bar=progress.Progress,
     )  # type: ignore
     click.echo(f"✨ Model {model_name} was successfully pushed ✨")
@@ -500,7 +1219,7 @@ def push(
     if service.is_draft:
         draft_model_text = """
 |---------------------------------------------------------------------------------------|
-| Your model has been deployed as a development model. Development models allow you to  |
+| Your model is deploying as a development model. Development models allow you to  |
 | iterate quickly during the deployment process.                                        |
 |                                                                                       |
 | When you are ready to publish your deployed model as a new deployment,                |
@@ -512,21 +1231,48 @@ def push(
         click.echo(draft_model_text)
-    # Log a warning if using secrets without --trusted.
-    # TODO(helen): this could be moved to a separate function that includes more config checks.
-    if tr.spec.config.secrets and not trusted:
-        not_trusted_text = """Warning: your Truss has secrets but was not pushed with --trusted.
-Please push with --trusted to grant access to secrets.
-"""
-        console.print(not_trusted_text, style="red")
-    if promote:
-        promotion_text = """Your Truss has been deployed as a production model. After it successfully deploys,
-it will become the next production deployment of your model."""
+    if environment:
+        promotion_text = (
+            f"Your Truss has been deployed into the {environment} environment. After it successfully "
+            f"deploys, it will become the next {environment} deployment of your model."
+        )
         console.print(promotion_text, style="green")
-    logs_url = remote_provider.get_remote_logs_url(service)  # type: ignore[attr-defined]
-    rich.print(f"🪵  View logs for your deployment at {logs_url}")
+    console.print(
+        f"🪵  View logs for your deployment at {_format_link(service.logs_url)}"
+    )
+    if wait:
+        start_time = time.time()
+        with console.status("[bold green]Deploying...") as status:
+            try:
+                # Poll for the deployment status until it reaches either ACTIVE
+                # or a non-deploying status (in which case the deployment has failed).
+                for deployment_status in service.poll_deployment_status():
+                    if (
+                        timeout_seconds is not None
+                        and time.time() - start_time > timeout_seconds
+                    ):
+                        console.print("Deployment timed out.", style="red")
+                        sys.exit(1)
+                    status.update(
+                        f"[bold green]Deploying...Current Status: {deployment_status}"
+                    )
+                    if deployment_status == ACTIVE_STATUS:
+                        console.print("Deployment succeeded.", style="bold green")
+                        return
+                    if deployment_status not in DEPLOYING_STATUSES:
+                        console.print(
+                            f"Deployment failed with status {deployment_status}.",
+                            style="red",
+                        )
+                        sys.exit(1)
+            except RemoteNetworkError:
+                console.print("Deployment failed: Could not reach remote.", style="red")
+                sys.exit(1)
 @truss_cli.command()
@@ -576,8 +1322,8 @@ def kill(target_directory: str) -> None:
 @container.command()  # type: ignore
 def kill_all() -> None:
-    "Kills all truss containers that are not manually persisted"
-    truss.kill_all()
+    """Kills all truss containers that are not manually persisted."""
+    # Thin wrapper: all of the work is delegated to docker.kill_all().
+    docker.kill_all()
 @truss_cli.command()
@@ -590,18 +1336,25 @@ def cleanup() -> None:
     such as for building docker images. This command clears
     that data to free up disk space.
     """
-    truss.build.cleanup()
+    _cleanup()
-def _get_truss_from_directory(target_directory: Optional[str] = None) -> TrussHandle:
+def _get_truss_from_directory(target_directory: Optional[str] = None):
     """Gets Truss from directory. If none, use the current directory"""
     if target_directory is None:
         target_directory = os.getcwd()
-    return truss.load(target_directory)
+    # Any path that is not an existing regular file is passed to load()
+    # unchanged.
+    if not os.path.isfile(target_directory):
+        return load(target_directory)
+    # Otherwise the path is a file: it is handed to the chains code generator,
+    # and the result (named truss_dir) is loaded in its place.
+    # These imports are delayed, to handle pydantic v1 envs gracefully.
+    from truss_chains.deployment import code_gen
+    truss_dir = code_gen.gen_truss_model_from_source(Path(target_directory))
+    return load(truss_dir)
 truss_cli.add_command(container)
 truss_cli.add_command(image)
+# Register `chains` on the top-level CLI next to `container` and `image`.
+truss_cli.add_command(chains)
+# Only invoke the CLI when this module is executed directly as a script.
 if __name__ == "__main__":
     truss_cli()