PyPI - flyteplugins-wandb - Versions diffs - 2.0.0b52__py3-none-any.whl - Mend

flyteplugins-wandb 2.0.0b52__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

flyteplugins/wandb/__init__.py +493 -0
flyteplugins/wandb/_context.py +381 -0
flyteplugins/wandb/_decorator.py +417 -0
flyteplugins/wandb/_link.py +149 -0
flyteplugins_wandb-2.0.0b52.dist-info/METADATA +34 -0
flyteplugins_wandb-2.0.0b52.dist-info/RECORD +8 -0
flyteplugins_wandb-2.0.0b52.dist-info/WHEEL +5 -0
flyteplugins_wandb-2.0.0b52.dist-info/top_level.txt +1 -0

flyteplugins/wandb/_decorator.py ADDED Viewed

@@ -0,0 +1,417 @@
+import functools
+import logging
+from contextlib import contextmanager
+from dataclasses import asdict
+from inspect import iscoroutinefunction
+from typing import Any, Callable, Optional, TypeVar, cast
+import flyte
+from flyte._task import AsyncFunctionTaskTemplate
+import wandb
+from ._context import RunMode, get_wandb_context, get_wandb_sweep_context
+from ._link import Wandb, WandbSweep
+logger = logging.getLogger(__name__)
+F = TypeVar("F", bound=Callable[..., Any])
+def _build_init_kwargs() -> dict[str, Any]:
+    """Build wandb.init() kwargs from current context config."""
+    context_config = get_wandb_context()
+    if context_config:
+        config_dict = asdict(context_config)
+        extra_kwargs = config_dict.pop("kwargs", None) or {}
+        # Remove Flyte-specific fields that shouldn't be passed to wandb.init()
+        config_dict.pop("run_mode", None)
+        config_dict.pop("download_logs", None)
+        # Filter out None values
+        filtered_config = {k: v for k, v in config_dict.items() if v is not None}
+        return {**extra_kwargs, **filtered_config}
+    return {}
+@contextmanager
+def _wandb_run(
+    run_mode: RunMode = "auto",
+    func: bool = False,
+    **decorator_kwargs,
+):
+    """
+    Context manager for wandb run lifecycle.
+    Initializes wandb.init() when the context is entered.
+    The initialized run is available via get_wandb_run().
+    """
+    # Try to get Flyte context
+    ctx = flyte.ctx()
+    # This enables @wandb_init to work in wandb.agent() callbacks (sweep objectives)
+    if func and ctx is None:
+        # Use config from decorator params (no lazy init for fallback mode)
+        run = wandb.init(**decorator_kwargs)
+        try:
+            yield run
+        finally:
+            run.finish()
+        return
+    elif func and ctx:
+        raise RuntimeError(
+            "@wandb_init cannot be applied to traces. Traces can access the parent's wandb run via get_wandb_run()."
+        )
+    # Save existing state to restore later
+    saved_run_id = ctx.custom_context.get("_wandb_run_id")
+    saved_run = ctx.data.get("_wandb_run")
+    # Build init kwargs from context
+    context_init_kwargs = _build_init_kwargs()
+    init_kwargs = {**context_init_kwargs, **decorator_kwargs}
+    # Check if this is a trace accessing parent's run
+    run = ctx.data.get("_wandb_run")
+    if run:
+        # This is a trace - yield existing run without initializing
+        try:
+            yield run
+        finally:
+            pass  # Don't clean up - parent owns this run
+        return
+    # Get current action name for run ID generation
+    current_action = ctx.action.name
+    # Determine if we should reuse parent's run
+    should_reuse = False
+    if run_mode == "shared":
+        should_reuse = True
+    elif run_mode == "auto":
+        should_reuse = bool(saved_run_id)
+    # Determine run ID
+    if "id" not in init_kwargs or init_kwargs["id"] is None:
+        if should_reuse:
+            if not saved_run_id:
+                raise RuntimeError("Cannot reuse parent run: no parent run ID found")
+            init_kwargs["id"] = saved_run_id
+        else:
+            init_kwargs["id"] = f"{ctx.action.run_name}-{current_action}"
+    # Configure reinit parameter (only for local mode)
+    # In remote/shared mode, wandb handles run creation/joining automatically
+    if flyte.ctx().mode == "local":
+        if should_reuse:
+            if "reinit" not in init_kwargs:
+                init_kwargs["reinit"] = "return_previous"
+        else:
+            init_kwargs["reinit"] = "create_new"
+    # Configure remote mode settings
+    if flyte.ctx().mode == "remote":
+        is_primary = not should_reuse
+        existing_settings = init_kwargs.get("settings", {})
+        shared_config = {
+            "mode": "shared",
+            "x_primary": is_primary,
+            "x_label": current_action,
+        }
+        if not is_primary:
+            shared_config["x_update_finish_state"] = False
+        init_kwargs["settings"] = wandb.Settings(**{**existing_settings, **shared_config})
+    # Initialize wandb
+    run = wandb.init(**init_kwargs)
+    # Store run ID in custom_context (shared with child tasks and accessible to links)
+    ctx.custom_context["_wandb_run_id"] = run.id
+    # Store run object in ctx.data (task-local only and accessible to traces)
+    ctx.data["_wandb_run"] = run
+    try:
+        yield run
+    finally:
+        # Determine if this is a primary run
+        is_primary_run = run_mode == "new" or (run_mode == "auto" and saved_run_id is None)
+        if run:
+            # Different cleanup logic for local vs remote mode
+            should_finish = False
+            if flyte.ctx().mode == "remote":
+                # In remote/shared mode, always call run.finish() to flush data
+                # For secondary tasks, x_update_finish_state=False prevents actually finishing
+                # For primary tasks, this properly finishes the run
+                should_finish = True
+            elif is_primary_run:
+                # In local mode, only primary tasks should call run.finish()
+                # Secondary tasks reuse the parent's run object, so they must not finish it
+                should_finish = True
+            if should_finish:
+                try:
+                    run.finish(exit_code=0)
+                except Exception:
+                    try:
+                        run.finish(exit_code=1)
+                    except Exception:
+                        pass
+                    raise
+        # Restore run ID
+        if saved_run_id is not None:
+            ctx.custom_context["_wandb_run_id"] = saved_run_id
+        else:
+            ctx.custom_context.pop("_wandb_run_id", None)
+        # Restore run object
+        if saved_run is not None:
+            ctx.data["_wandb_run"] = saved_run
+        else:
+            ctx.data.pop("_wandb_run", None)
+def wandb_init(
+    _func: Optional[F] = None,
+    *,
+    run_mode: RunMode = "auto",
+    download_logs: Optional[bool] = None,
+    project: Optional[str] = None,
+    entity: Optional[str] = None,
+    **kwargs,
+) -> F:
+    """
+    Decorator to automatically initialize wandb for Flyte tasks and wandb sweep objectives.
+    Args:
+        run_mode: Controls whether to create a new W&B run or share an existing one:
+            1. "auto" (default): Creates new run if no parent run exists, otherwise shares parent's run
+            2. "new": Always creates a new wandb run with a unique ID
+            3. "shared": Always shares the parent's run ID (useful for child tasks)
+        download_logs: If `True`, downloads wandb run files after task completes
+            and shows them as a trace output in the Flyte UI. If None, uses
+            the value from `wandb_config()` context if set.
+        project: W&B project name (overrides context config if provided)
+        entity: W&B entity/team name (overrides context config if provided)
+        **kwargs: Additional `wandb.init()` parameters (tags, config, mode, etc.)
+    Decorator Order:
+        For tasks, @wandb_init must be the outermost decorator:
+        @wandb_init
+        @env.task
+        async def my_task():
+            ...
+    This decorator:
+    1. Initializes wandb when the context manager is entered
+    2. Auto-generates unique run ID from Flyte action context if not provided
+    3. Makes the run available via get_wandb_run()
+    4. Automatically adds a W&B link to the task in the Flyte UI
+    5. Automatically finishes the run after completion
+    6. Optionally downloads run logs as a trace output (if download_logs=True)
+    """
+    def decorator(func: F) -> F:
+        # Build decorator kwargs dict to pass to _wandb_run
+        decorator_kwargs = {}
+        if project is not None:
+            decorator_kwargs["project"] = project
+        if entity is not None:
+            decorator_kwargs["entity"] = entity
+        decorator_kwargs.update(kwargs)
+        # Check if it's a Flyte task (AsyncFunctionTaskTemplate)
+        if isinstance(func, AsyncFunctionTaskTemplate):
+            # Create a Wandb link
+            # Even if run_mode="shared", we still add a link - it will point to the parent's run
+            wandb_link = Wandb(project=project, entity=entity, run_mode=run_mode)
+            # Get existing links from the task and add wandb link
+            existing_links = getattr(func, "links", ())
+            # Use override to properly add the link to the task
+            func = func.override(links=(*existing_links, wandb_link))
+            # Wrap the task's execute method with wandb_run
+            original_execute = func.execute
+            async def wrapped_execute(*args, **exec_kwargs):
+                with _wandb_run(run_mode=run_mode, **decorator_kwargs) as run:
+                    result = await original_execute(*args, **exec_kwargs)
+                # After run finishes, optionally download logs
+                should_download = download_logs
+                if should_download is None:
+                    # Check context config
+                    ctx_config = get_wandb_context()
+                    should_download = ctx_config.download_logs if ctx_config else False
+                if should_download and run:
+                    from . import download_wandb_run_logs
+                    await download_wandb_run_logs(run.id)
+                return result
+            func.execute = wrapped_execute
+            return cast(F, func)
+        # Regular function
+        else:
+            if iscoroutinefunction(func):
+                @functools.wraps(func)
+                async def async_wrapper(*args, **wrapper_kwargs):
+                    with _wandb_run(run_mode=run_mode, func=True, **decorator_kwargs):
+                        return await func(*args, **wrapper_kwargs)
+                return cast(F, async_wrapper)
+            else:
+                @functools.wraps(func)
+                def sync_wrapper(*args, **wrapper_kwargs):
+                    with _wandb_run(run_mode=run_mode, func=True, **decorator_kwargs):
+                        return func(*args, **wrapper_kwargs)
+                return cast(F, sync_wrapper)
+    if _func is None:
+        return decorator
+    return decorator(_func)
+@contextmanager
+def _create_sweep(project: Optional[str] = None, entity: Optional[str] = None, **decorator_kwargs):
+    """Context manager for wandb sweep creation."""
+    ctx = flyte.ctx()
+    # Check if a sweep already exists in context - reuse it instead of creating new
+    existing_sweep_id = ctx.custom_context.get("_wandb_sweep_id")
+    if existing_sweep_id:
+        yield existing_sweep_id
+        return
+    # Get sweep config from context
+    sweep_config = get_wandb_sweep_context()
+    if not sweep_config:
+        raise RuntimeError(
+            "No wandb sweep config found. Use wandb_sweep_config() "
+            "with flyte.with_runcontext() or as a context manager."
+        )
+    # Get wandb config for project/entity (fallback)
+    wandb_config = get_wandb_context()
+    # Priority: decorator kwargs > sweep config > wandb config
+    project = project or sweep_config.project or (wandb_config.project if wandb_config else None)
+    entity = entity or sweep_config.entity or (wandb_config.entity if wandb_config else None)
+    prior_runs = sweep_config.prior_runs or []
+    # Get sweep config dict
+    sweep_dict = sweep_config.to_sweep_config()
+    # Generate deterministic sweep name if not provided
+    if "name" not in sweep_dict or sweep_dict["name"] is None:
+        sweep_dict["name"] = f"{ctx.action.run_name}-{ctx.action.name}"
+    # Create the sweep
+    sweep_id = wandb.sweep(
+        sweep=sweep_dict,
+        project=project,
+        entity=entity,
+        prior_runs=prior_runs,
+        **decorator_kwargs,
+    )
+    # Store sweep_id in context (accessible to links)
+    ctx.custom_context["_wandb_sweep_id"] = sweep_id
+    try:
+        yield sweep_id
+    finally:
+        # Clean up sweep_id from context
+        ctx.custom_context.pop("_wandb_sweep_id", None)
+def wandb_sweep(
+    _func: Optional[F] = None,
+    *,
+    project: Optional[str] = None,
+    entity: Optional[str] = None,
+    download_logs: Optional[bool] = None,
+    **kwargs,
+) -> F:
+    """
+    Decorator to create a wandb sweep and make `sweep_id` available.
+    This decorator:
+    1. Creates a wandb sweep using config from context
+    2. Makes `sweep_id` available via `get_wandb_sweep_id()`
+    3. Automatically adds a W&B sweep link to the task
+    4. Optionally downloads all sweep run logs as a trace output (if `download_logs=True`)
+    Args:
+        project: W&B project name (overrides context config if provided)
+        entity: W&B entity/team name (overrides context config if provided)
+        download_logs: if `True`, downloads all sweep run files after task completes
+            and shows them as a trace output in the Flyte UI. If None, uses
+            the value from wandb_sweep_config() context if set.
+        **kwargs: additional `wandb.sweep()` parameters
+    Decorator Order:
+        For tasks, @wandb_sweep must be the outermost decorator:
+        @wandb_sweep
+        @env.task
+        async def my_task():
+            ...
+    """
+    def decorator(func: F) -> F:
+        # Check if it's a Flyte task (AsyncFunctionTaskTemplate)
+        if isinstance(func, AsyncFunctionTaskTemplate):
+            # Create a WandbSweep link
+            wandb_sweep_link = WandbSweep()
+            # Get existing links from the task and add wandb sweep link
+            existing_links = getattr(func, "links", ())
+            # Use override to properly add the link to the task
+            func = func.override(links=(*existing_links, wandb_sweep_link))
+            original_execute = func.execute
+            async def wrapped_execute(*args, **exec_kwargs):
+                with _create_sweep(project=project, entity=entity, **kwargs) as sweep_id:
+                    result = await original_execute(*args, **exec_kwargs)
+                # After sweep finishes, optionally download logs
+                should_download = download_logs
+                if should_download is None:
+                    # Check context config
+                    sweep_config = get_wandb_sweep_context()
+                    should_download = sweep_config.download_logs if sweep_config else False
+                if should_download and sweep_id:
+                    from . import download_wandb_sweep_logs
+                    await download_wandb_sweep_logs(sweep_id)
+                return result
+            func.execute = wrapped_execute
+            return cast(F, func)
+        else:
+            raise RuntimeError("@wandb_sweep can only be used with Flyte tasks.")
+    if _func is None:
+        return decorator
+    return decorator(_func)

flyteplugins/wandb/_link.py ADDED Viewed

@@ -0,0 +1,149 @@
+from dataclasses import dataclass
+from typing import Dict, Optional
+from flyte import Link
+from ._context import RunMode
+@dataclass
+class Wandb(Link):
+    """
+    Generates a Weights & Biases run link.
+    Args:
+        host: Base W&B host URL
+        project: W&B project name (overrides context config if provided)
+        entity: W&B entity/team name (overrides context config if provided)
+        run_mode: Controls whether to create a new W&B run or share an existing one:
+            1. "auto" (default): Creates new run if no parent run exists, otherwise shares parent's run
+            2. "new": Always creates a new wandb run with a unique ID
+            3. "shared": Always shares the parent's run ID (useful for child tasks)
+        id: Optional W&B run ID (overrides context config if provided)
+        name: Link name in the Flyte UI
+    """
+    host: str = "https://wandb.ai"
+    project: Optional[str] = None
+    entity: Optional[str] = None
+    run_mode: RunMode = "auto"
+    id: Optional[str] = None
+    name: str = "Weights & Biases"
+    def get_link(
+        self,
+        run_name: str,
+        project: str,
+        domain: str,
+        context: Dict[str, str],
+        parent_action_name: str,
+        action_name: str,
+        pod_name: str,
+        **kwargs,
+    ) -> str:
+        # Get project and entity from decorator values or context
+        wandb_project = self.project
+        wandb_entity = self.entity
+        wandb_run_id = None
+        user_provided_id = self.id  # Prioritize ID provided at link creation time
+        run_mode = self.run_mode  # Defaults to "auto"
+        if context:
+            # Try to get from context if not provided at decoration time
+            if not wandb_project:
+                wandb_project = context.get("wandb_project")
+            if not wandb_entity:
+                wandb_entity = context.get("wandb_entity")
+            # Get parent's run ID if available (set by parent task)
+            parent_run_id = context.get("_wandb_run_id")
+            # Check if user provided a custom run ID in wandb_config (lower priority than self.id)
+            if not user_provided_id:
+                user_provided_id = context.get("wandb_id")
+        else:
+            parent_run_id = None
+        # If we don't have project/entity, we can't create a valid link
+        if not wandb_project or not wandb_entity:
+            return self.host
+        # Determine run ID based on run_mode setting
+        if run_mode == "new":
+            # Always create new run - use user-provided ID if available, otherwise generate
+            wandb_run_id = user_provided_id or f"{run_name}-{action_name}"
+        elif run_mode == "shared":
+            # Always reuse parent's run
+            if parent_run_id:
+                wandb_run_id = parent_run_id
+            else:
+                # Can't generate link without parent run ID
+                return f"{self.host}/{wandb_entity}/{wandb_project}"
+        else:  # run_mode == "auto"
+            # Use parent's run if available, otherwise create new
+            if parent_run_id:
+                wandb_run_id = parent_run_id
+            else:
+                wandb_run_id = user_provided_id or f"{run_name}-{action_name}"
+        return f"{self.host}/{wandb_entity}/{wandb_project}/runs/{wandb_run_id}"
+@dataclass
+class WandbSweep(Link):
+    """
+    Generates a Weights & Biases Sweep link.
+    Args:
+        host: Base W&B host URL
+        project: W&B project name (overrides context config if provided)
+        entity: W&B entity/team name (overrides context config if provided)
+        id: Optional W&B sweep ID (overrides context config if provided)
+        name: Link name in the Flyte UI
+    """
+    host: str = "https://wandb.ai"
+    project: Optional[str] = None
+    entity: Optional[str] = None
+    id: Optional[str] = None
+    name: str = "Weights & Biases Sweep"
+    def get_link(
+        self,
+        run_name: str,
+        project: str,
+        domain: str,
+        context: Dict[str, str],
+        parent_action_name: str,
+        action_name: str,
+        pod_name: str,
+        **kwargs,
+    ) -> str:
+        # Get project and entity from decorator values or context
+        wandb_project = self.project
+        wandb_entity = self.entity
+        sweep_id = self.id  # Prioritize ID provided at link creation time
+        if context:
+            # Try to get from context config if not provided at decoration time
+            if not wandb_project:
+                wandb_project = context.get("wandb_project")
+            if not wandb_entity:
+                wandb_entity = context.get("wandb_entity")
+            # Try to get the sweep_id from context if not provided at link creation
+            # Child tasks inherit this from the parent that created the sweep
+            if not sweep_id:
+                sweep_id = context.get("_wandb_sweep_id")
+        # If we don't have project/entity, return base URL
+        if not wandb_project or not wandb_entity:
+            return self.host
+        # If we have a sweep_id, link to specific sweep
+        if sweep_id:
+            return f"{self.host}/{wandb_entity}/{wandb_project}/sweeps/{sweep_id}"
+        # No sweep_id: link to the project's sweeps list page
+        return f"{self.host}/{wandb_entity}/{wandb_project}/sweeps"

flyteplugins_wandb-2.0.0b52.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,34 @@
+Metadata-Version: 2.4
+Name: flyteplugins-wandb
+Version: 2.0.0b52
+Summary: Weights & Biases plugin for Flyte
+Author: Flyte Contributors
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown
+Requires-Dist: wandb
+Requires-Dist: flyte
+# Weights & Biases Plugin
+- Tasks decorated with `@wandb_init` or `@wandb_sweep` automatically get W&B links in the Flyte UI that point directly to the corresponding W&B runs or sweeps. Links retrieve project/entity from decorator parameters or context configuration (from `with_runcontext`).
+- `@wandb_init` and `@wandb_sweep` must be the **outermost decorators** (applied after `@env.task`). For example:
+  ```python
+  @wandb_init
+  @env.task
+  def my_task():
+      ...
+  ```
+- By default (`run_mode="auto"`), child tasks automatically reuse their parent's W&B run if one exists, or create a new run if they're top-level tasks. You can override this with `run_mode="new"` (always create new) or `run_mode="shared"` (always reuse parent).
+- `@wandb_init` should be applied to tasks (not traces). Traces can access the parent task's W&B run via `get_wandb_run()`. `@wandb_init` can also be applied to regular Python functions for use in `wandb.agent()` sweep callbacks.
+- The wandb run can be accessed via `get_wandb_run()`, which returns the run object or `None` if not within a `@wandb_init` decorated task.
+- When using `run_mode="shared"` or `run_mode="auto"` (with a parent run), child tasks reuse the parent's run ID. Configuration from `wandb_config()` is merged with decorator parameters.
+- `wandb_config` can be used to pass configuration to tasks enclosed within the context manager and can also be provided via `with_runcontext`.
+- When the context manager exits, the configuration falls back to the parent task's config.
+- Arguments passed to `wandb_init` decorator are available only within the current task and traces and are not propagated to child tasks (use `wandb_config` for child tasks).
+- At most 20 sweep agents can be launched at a time: https://docs.wandb.ai/models/sweeps/existing-project#3-launch-agents.
+- `@wandb_sweep` creates a W&B sweep and adds a sweep link to the decorated task. The sweep ID is available via `get_wandb_sweep_id()`. For the parent task that creates the sweep, the link points to the project's sweeps list page. For child tasks, the link points to the specific sweep (they inherit the `sweep_id` from the parent's context).
+- The objective function passed to `wandb.agent()` should be a vanilla Python function decorated with `@wandb_init`, which initializes the run. Inside the objective, access the run via `wandb.run`, because the Flyte context is not available during the objective function call.
+- Set `download_logs=True` in `wandb_config` or `@wandb_init` to download W&B run logs after task completion. The I/O of this download functionality is traced by Flyte's `@flyte.trace`.
+- Set `download_logs=True` in `wandb_sweep_config` or `@wandb_sweep` to download W&B sweep logs after task completion. The I/O of this download functionality is traced by Flyte's `@flyte.trace`.

flyteplugins_wandb-2.0.0b52.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,8 @@
+flyteplugins/wandb/__init__.py,sha256=D5gqDOIy6ePcE2tcbNVsp9ZzxZKC6Qmd-6eHxNX3L88,15881
+flyteplugins/wandb/_context.py,sha256=va_TlRhSW-QBbHhvKmIAggsLw5VFAq4gXMIu7n5ZKSA,12746
+flyteplugins/wandb/_decorator.py,sha256=HenEVJI7kmDMQdHo6jDy3vXvjxT89CCYRBCR2CuGE3s,14785
+flyteplugins/wandb/_link.py,sha256=tEzfW06GPsVMECGAnEhwNzCI2h0d0UnJHMqso6t8Pnw,5319
+flyteplugins_wandb-2.0.0b52.dist-info/METADATA,sha256=oOQOpcjQa99Iy-bhYuop9KtFktttFzNzNYj4yQvUjBc,3058
+flyteplugins_wandb-2.0.0b52.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+flyteplugins_wandb-2.0.0b52.dist-info/top_level.txt,sha256=cgd779rPu9EsvdtuYgUxNHHgElaQvPn74KhB5XSeMBE,13
+flyteplugins_wandb-2.0.0b52.dist-info/RECORD,,

flyteplugins_wandb-2.0.0b52.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,5 @@
+Wheel-Version: 1.0
+Generator: setuptools (80.10.2)
+Root-Is-Purelib: true
+Tag: py3-none-any

flyteplugins_wandb-2.0.0b52.dist-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ flyteplugins