PyPI - wandb - Versions diffs - 0.13.11__py3-none-any.whl → 0.14.0__py3-none-any.whl - Mend

wandb 0.13.11__py3-none-any.whl → 0.14.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41)

wandb/__init__.py +1 -1
wandb/apis/importers/__init__.py +4 -0
wandb/apis/importers/base.py +312 -0
wandb/apis/importers/mlflow.py +113 -0
wandb/apis/internal.py +9 -0
wandb/apis/public.py +0 -2
wandb/cli/cli.py +100 -72
wandb/docker/__init__.py +33 -5
wandb/proto/v3/wandb_telemetry_pb2.py +10 -10
wandb/proto/v4/wandb_telemetry_pb2.py +10 -10
wandb/sdk/internal/internal_api.py +85 -9
wandb/sdk/launch/_project_spec.py +45 -55
wandb/sdk/launch/agent/agent.py +80 -18
wandb/sdk/launch/builder/build.py +16 -74
wandb/sdk/launch/builder/docker_builder.py +36 -8
wandb/sdk/launch/builder/kaniko_builder.py +78 -37
wandb/sdk/launch/builder/templates/_wandb_bootstrap.py +68 -18
wandb/sdk/launch/environment/aws_environment.py +4 -0
wandb/sdk/launch/launch.py +1 -6
wandb/sdk/launch/launch_add.py +0 -5
wandb/sdk/launch/registry/abstract.py +12 -0
wandb/sdk/launch/registry/elastic_container_registry.py +31 -1
wandb/sdk/launch/registry/google_artifact_registry.py +32 -0
wandb/sdk/launch/registry/local_registry.py +15 -1
wandb/sdk/launch/runner/abstract.py +0 -14
wandb/sdk/launch/runner/kubernetes_runner.py +25 -19
wandb/sdk/launch/runner/local_container.py +7 -8
wandb/sdk/launch/runner/local_process.py +0 -3
wandb/sdk/launch/runner/sagemaker_runner.py +0 -3
wandb/sdk/launch/runner/vertex_runner.py +0 -2
wandb/sdk/launch/sweeps/scheduler.py +39 -10
wandb/sdk/launch/utils.py +52 -4
wandb/sdk/wandb_run.py +3 -10
wandb/sync/sync.py +1 -0
wandb/util.py +1 -0
{wandb-0.13.11.dist-info → wandb-0.14.0.dist-info}/METADATA +1 -1
{wandb-0.13.11.dist-info → wandb-0.14.0.dist-info}/RECORD +41 -38
{wandb-0.13.11.dist-info → wandb-0.14.0.dist-info}/WHEEL +1 -1
{wandb-0.13.11.dist-info → wandb-0.14.0.dist-info}/LICENSE +0 -0
{wandb-0.13.11.dist-info → wandb-0.14.0.dist-info}/entry_points.txt +0 -0
{wandb-0.13.11.dist-info → wandb-0.14.0.dist-info}/top_level.txt +0 -0

wandb/__init__.py CHANGED Viewed

@@ -11,7 +11,7 @@ For scripts and interactive notebooks, see https://github.com/wandb/examples.
 For reference documentation, see https://docs.wandb.com/ref/python.
 """
-__version__ = "0.13.11"
+__version__ = "0.14.0"
 # Used with pypi checks and other messages related to pip
 _wandb_module = "wandb"

wandb/apis/importers/__init__.py ADDED Viewed

@@ -0,0 +1,4 @@
+from wandb.util import get_module
+if get_module("mlflow"):
+    from .mlflow import MlflowImporter, MlflowRun  # noqa: F401

wandb/apis/importers/base.py ADDED Viewed

@@ -0,0 +1,312 @@
+import json
+import platform
+from abc import ABC, abstractmethod
+from concurrent.futures import ProcessPoolExecutor, as_completed
+from contextlib import contextmanager
+from typing import Any, Dict, Iterable, List, Optional, Tuple
+from tqdm.auto import tqdm
+import wandb
+from wandb.proto import wandb_internal_pb2 as pb
+from wandb.proto import wandb_telemetry_pb2 as telem_pb
+from wandb.sdk.interface.interface import file_policy_to_enum
+from wandb.sdk.interface.interface_queue import InterfaceQueue
+from wandb.sdk.internal.sender import SendManager
+Name = str
+Path = str
+def coalesce(*arg: Any) -> Any:
+    """Return the first non-none value in the list of arguments.  Similar to ?? in C#."""
+    return next((a for a in arg if a is not None), None)
+@contextmanager
+def send_manager(root_dir):
+    sm = SendManager.setup(root_dir, resume=False)
+    try:
+        yield sm
+    finally:
+        # flush any remaining records
+        while sm:
+            data = next(sm)
+            sm.send(data)
+        sm.finish()
+class ImporterRun:
+    def __init__(self) -> None:
+        self.interface = InterfaceQueue()
+        self.run_dir = f"./wandb-importer/{self.run_id()}"
+    def run_id(self) -> str:
+        _id = wandb.util.generate_id()
+        wandb.termwarn(f"`run_id` not specified.  Autogenerating id: {_id}")
+        return _id
+    def entity(self) -> str:
+        _entity = "unspecified-entity"
+        wandb.termwarn(f"`entity` not specified.  Defaulting to: {_entity}")
+        return _entity
+    def project(self) -> str:
+        _project = "unspecified-project"
+        wandb.termwarn(f"`project` not specified.  Defaulting to: {_project}")
+        return _project
+    def config(self) -> Dict[str, Any]:
+        return {}
+    def summary(self) -> Dict[str, float]:
+        return {}
+    def metrics(self) -> List[Dict[str, float]]:
+        """Metrics for the run.
+        We expect metrics in this shape:
+        [
+            {'metric1': 1, 'metric2': 1, '_step': 0},
+            {'metric1': 2, 'metric2': 4, '_step': 1},
+            {'metric1': 3, 'metric2': 9, '_step': 2},
+            ...
+        ]
+        You can also submit metrics in this shape:
+        [
+            {'metric1': 1, '_step': 0},
+            {'metric2': 1, '_step': 0},
+            {'metric1': 2, '_step': 1},
+            {'metric2': 4, '_step': 1},
+            ...
+        ]
+        """
+        return []
+    def run_group(self) -> Optional[str]:
+        ...
+    def job_type(self) -> Optional[str]:
+        ...
+    def display_name(self) -> str:
+        return self.run_id()
+    def notes(self) -> Optional[str]:
+        ...
+    def tags(self) -> Optional[List[str]]:
+        ...
+    def artifacts(self) -> Optional[Iterable[Tuple[Name, Path]]]:
+        ...
+    def os_version(self) -> Optional[str]:
+        ...
+    def python_version(self) -> Optional[str]:
+        ...
+    def cuda_version(self) -> Optional[str]:
+        ...
+    def program(self) -> Optional[str]:
+        ...
+    def host(self) -> Optional[str]:
+        ...
+    def username(self) -> Optional[str]:
+        ...
+    def executable(self) -> Optional[str]:
+        ...
+    def gpus_used(self) -> Optional[str]:
+        ...
+    def cpus_used(self) -> Optional[int]:  # can we get the model?
+        ...
+    def memory_used(self) -> Optional[int]:
+        ...
+    def runtime(self) -> Optional[int]:
+        ...
+    def start_time(self) -> Optional[int]:
+        ...
+    def _make_run_record(self) -> pb.Record:
+        run = pb.RunRecord()
+        run.run_id = self.run_id()
+        run.entity = self.entity()
+        run.project = self.project()
+        run.display_name = coalesce(self.display_name())
+        run.notes = coalesce(self.notes(), "")
+        run.tags.extend(coalesce(self.tags(), list()))
+        # run.start_time.FromMilliseconds(self.start_time())
+        # run.runtime = self.runtime()
+        run_group = self.run_group()
+        if run_group is not None:
+            run.run_group = run_group
+        self.interface._make_config(
+            data=self.config(),
+            obj=run.config,
+        )  # is there a better way?
+        return self.interface._make_record(run=run)
+    def _make_summary_record(self) -> pb.Record:
+        d: dict = {
+            **self.summary(),
+            "_runtime": self.runtime(),  # quirk of runtime -- it has to be here!
+            # '_timestamp': self.start_time()/1000,
+        }
+        summary = self.interface._make_summary_from_dict(d)
+        return self.interface._make_record(summary=summary)
+    def _make_history_records(self) -> Iterable[pb.Record]:
+        for _, metrics in enumerate(self.metrics()):
+            history = pb.HistoryRecord()
+            for k, v in metrics.items():
+                item = history.item.add()
+                item.key = k
+                item.value_json = json.dumps(v)
+            yield self.interface._make_record(history=history)
+    def _make_files_record(self, files_dict) -> pb.Record:
+        # when making the metadata file, it captures most things correctly
+        # but notably it doesn't capture the start time!
+        files_record = pb.FilesRecord()
+        for path, policy in files_dict["files"]:
+            f = files_record.files.add()
+            f.path = path
+            f.policy = file_policy_to_enum(policy)  # is this always "end"?
+        return self.interface._make_record(files=files_record)
+    def _make_metadata_files_record(self) -> pb.Record:
+        self._make_metadata_file(self.run_dir)
+        return self._make_files_record(
+            {"files": [[f"{self.run_dir}/files/wandb-metadata.json", "end"]]}
+        )
+    def _make_artifact_record(self) -> pb.Record:
+        art = wandb.Artifact(self.display_name(), "imported-artifacts")
+        artifacts = self.artifacts()
+        if artifacts is not None:
+            for name, path in artifacts:
+                art.add_file(path, name)
+        proto = self.interface._make_artifact(art)
+        proto.run_id = self.run_id()
+        proto.project = self.project()
+        proto.entity = self.entity()
+        proto.user_created = False
+        proto.use_after_commit = False
+        proto.finalize = True
+        for tag in ["latest", "imported"]:
+            proto.aliases.append(tag)
+        return self.interface._make_record(artifact=proto)
+    def _make_telem_record(self) -> pb.Record:
+        feature = telem_pb.Feature()
+        feature.importer_mlflow = True
+        telem = telem_pb.TelemetryRecord()
+        telem.feature.CopyFrom(feature)
+        telem.python_version = platform.python_version()  # importer's python version
+        telem.cli_version = wandb.__version__
+        return self.interface._make_record(telemetry=telem)
+    def _make_metadata_file(self, run_dir: str) -> None:
+        missing_text = "MLFlow did not capture this info."
+        d = {}
+        if self.os_version() is not None:
+            d["os"] = self.os_version()
+        else:
+            d["os"] = missing_text
+        if self.python_version() is not None:
+            d["python"] = self.python_version()
+        else:
+            d["python"] = missing_text
+        if self.program() is not None:
+            d["program"] = self.program()
+        else:
+            d["program"] = missing_text
+        if self.cuda_version() is not None:
+            d["cuda"] = self.cuda_version()
+        if self.host() is not None:
+            d["host"] = self.host()
+        if self.username() is not None:
+            d["username"] = self.username()
+        if self.executable() is not None:
+            d["executable"] = self.executable()
+        gpus_used = self.gpus_used()
+        if gpus_used is not None:
+            d["gpu_devices"] = json.dumps(gpus_used)
+            d["gpu_count"] = json.dumps(len(gpus_used))
+        cpus_used = self.cpus_used()
+        if cpus_used is not None:
+            d["cpu_count"] = json.dumps(self.cpus_used())
+        mem_used = self.memory_used()
+        if mem_used is not None:
+            d["memory"] = json.dumps({"total": self.memory_used()})
+        with open(f"{run_dir}/files/wandb-metadata.json", "w") as f:
+            f.write(json.dumps(d))
+class Importer(ABC):
+    @abstractmethod
+    def download_all_runs(self) -> Iterable[ImporterRun]:
+        ...
+    def import_all(self, overrides: Optional[Dict[str, Any]] = None) -> None:
+        for run in tqdm(self.download_all_runs(), desc="Sending runs"):
+            self.import_one(run, overrides)
+    def import_all_parallel(
+        self, overrides: Optional[Dict[str, Any]] = None, **pool_kwargs: Any
+    ) -> None:
+        runs = list(self.download_all_runs())
+        with tqdm(total=len(runs)) as pbar:
+            with ProcessPoolExecutor(**pool_kwargs) as exc:
+                futures = {
+                    exc.submit(self.import_one, run, overrides=overrides): run
+                    for run in runs
+                }
+                for future in as_completed(futures):
+                    run = futures[future]
+                    pbar.update(1)
+                    pbar.set_description(
+                        f"Imported Run: {run.run_group()} {run.display_name()}"
+                    )
+    def import_one(
+        self,
+        run: ImporterRun,
+        overrides: Optional[Dict[str, Any]] = None,
+    ) -> None:
+        # does this need to be here for pmap?
+        if overrides:
+            for k, v in overrides.items():
+                # `lambda: v` won't work!
+                # https://stackoverflow.com/questions/10802002/why-deepcopy-doesnt-create-new-references-to-lambda-function
+                setattr(run, k, lambda v=v: v)
+        self._import_one(run)
+    def _import_one(self, run: ImporterRun) -> None:
+        with send_manager(run.run_dir) as sm:
+            sm.send(run._make_run_record())
+            sm.send(run._make_summary_record())
+            sm.send(run._make_metadata_files_record())
+            for history_record in run._make_history_records():
+                sm.send(history_record)
+            if run.artifacts() is not None:
+                sm.send(run._make_artifact_record())
+            sm.send(run._make_telem_record())

wandb/apis/importers/mlflow.py ADDED Viewed

@@ -0,0 +1,113 @@
+from typing import Any, Dict, Iterable, Optional
+from wandb.util import get_module
+from .base import Importer, ImporterRun
+mlflow = get_module(
+    "mlflow",
+    required="To use the MlflowImporter, please install mlflow: `pip install mlflow`",
+)
+class MlflowRun(ImporterRun):
+    def __init__(self, run, mlflow_client):
+        self.run = run
+        self.mlflow_client = mlflow_client
+        super().__init__()
+    def run_id(self):
+        return self.run.info.run_id
+    def entity(self):
+        return self.run.info.user_id
+    def project(self):
+        return "imported-from-mlflow"
+    def config(self):
+        return self.run.data.params
+    def summary(self):
+        return self.run.data.metrics
+    def metrics(self):
+        def wandbify(metrics):
+            for step, t in enumerate(metrics):
+                d = {m.key: m.value for m in t}
+                d["_step"] = step
+                yield d
+        metrics = [
+            self.mlflow_client.get_metric_history(self.run.info.run_id, k)
+            for k in self.run.data.metrics.keys()
+        ]
+        metrics = zip(*metrics)  # transpose
+        return wandbify(metrics)
+        # Alternate: Might be slower but use less mem
+        # Can't make this a generator.  See mlflow get_metric_history internals
+        # https://github.com/mlflow/mlflow/blob/master/mlflow/tracking/_tracking_service/client.py#L74-L93
+        # for k in self.run.data.metrics.keys():
+        #     history = self.mlflow_client.get_metric_history(self.run.info.run_id, k)
+        #     yield wandbify(history)
+    def run_group(self):
+        # this is nesting?  Parent at `run.info.tags.get("mlflow.parentRunId")`
+        return f"Experiment {self.run.info.experiment_id}"
+    def job_type(self):
+        # Is this the right approach?
+        return f"User {self.run.info.user_id}"
+    def display_name(self):
+        return self.run.info.run_name
+    def notes(self):
+        return self.run.data.tags.get("mlflow.note.content")
+    def tags(self):
+        return {
+            k: v for k, v in self.run.data.tags.items() if not k.startswith("mlflow.")
+        }
+    def start_time(self):
+        return self.run.info.start_time // 1000
+    def runtime(self):
+        return self.run.info.end_time // 1_000 - self.start_time()
+    def git(self):
+        ...
+    def artifacts(self):
+        for f in self.mlflow_client.list_artifacts(self.run.info.run_id):
+            dir_path = mlflow.artifacts.download_artifacts(run_id=self.run.info.run_id)
+            full_path = dir_path + f.path
+            yield (f.path, full_path)
+class MlflowImporter(Importer):
+    def __init__(
+        self, mlflow_tracking_uri, mlflow_registry_uri=None, wandb_base_url=None
+    ) -> None:
+        super().__init__()
+        self.mlflow_tracking_uri = mlflow_tracking_uri
+        mlflow.set_tracking_uri(self.mlflow_tracking_uri)
+        if mlflow_registry_uri:
+            mlflow.set_registry_uri(mlflow_registry_uri)
+        self.mlflow_client = mlflow.tracking.MlflowClient(mlflow_tracking_uri)
+    def import_one(
+        self,
+        run: ImporterRun,
+        overrides: Optional[Dict[str, Any]] = None,
+    ) -> None:
+        mlflow.set_tracking_uri(self.mlflow_tracking_uri)
+        super().import_one(run, overrides)
+    def download_all_runs(self) -> Iterable[MlflowRun]:
+        for exp in self.mlflow_client.search_experiments():
+            for run in self.mlflow_client.search_runs(exp.experiment_id):
+                yield MlflowRun(run, self.mlflow_client)

wandb/apis/internal.py CHANGED Viewed

@@ -161,6 +161,9 @@ class Api:
     def get_run_state(self, *args, **kwargs):
         return self.api.get_run_state(*args, **kwargs)
+    def entity_is_team(self, *args, **kwargs):
+        return self.api.entity_is_team(*args, **kwargs)
     def get_project_run_queues(self, *args, **kwargs):
         return self.api.get_project_run_queues(*args, **kwargs)
@@ -182,6 +185,12 @@ class Api:
     def launch_agent_introspection(self, *args, **kwargs):
         return self.api.launch_agent_introspection(*args, **kwargs)
+    def fail_run_queue_item_introspection(self, *args, **kwargs):
+        return self.api.fail_run_queue_item_introspection(*args, **kwargs)
+    def fail_run_queue_item(self, *args, **kwargs):
+        return self.api.fail_run_queue_item(*args, **kwargs)
     def get_launch_agent(self, *args, **kwargs):
         return self.api.get_launch_agent(*args, **kwargs)

wandb/apis/public.py CHANGED Viewed

@@ -5562,7 +5562,6 @@ class Job:
         queue=None,
         resource="local-container",
         resource_args=None,
-        cuda=False,
         project_queue=None,
     ):
         from wandb.sdk.launch import launch_add
@@ -5589,6 +5588,5 @@ class Job:
             resource=resource,
             project_queue=project_queue,
             resource_args=resource_args,
-            cuda=cuda,
         )
         return queued_run

wandb 0.13.11__py3-none-any.whl → 0.14.0__py3-none-any.whl

wandb 0.13.11__py3-none-any.whl → 0.14.0__py3-none-any.whl