PyPI - wandb - Versions diffs - 0.13.10__py3-none-any.whl → 0.14.0__py3-none-any.whl - Mend

wandb 0.13.10__py3-none-any.whl → 0.14.0__py3-none-any.whl

Files changed (228) hide show

wandb/__init__.py +2 -3
wandb/apis/__init__.py +1 -3
wandb/apis/importers/__init__.py +4 -0
wandb/apis/importers/base.py +312 -0
wandb/apis/importers/mlflow.py +113 -0
wandb/apis/internal.py +29 -2
wandb/apis/normalize.py +6 -5
wandb/apis/public.py +163 -180
wandb/apis/reports/_templates.py +6 -12
wandb/apis/reports/report.py +1 -1
wandb/apis/reports/runset.py +1 -3
wandb/apis/reports/util.py +12 -10
wandb/beta/workflows.py +57 -34
wandb/catboost/__init__.py +1 -2
wandb/cli/cli.py +215 -133
wandb/data_types.py +63 -56
wandb/docker/__init__.py +78 -16
wandb/docker/auth.py +21 -22
wandb/env.py +0 -1
wandb/errors/__init__.py +8 -116
wandb/errors/term.py +1 -1
wandb/fastai/__init__.py +1 -2
wandb/filesync/dir_watcher.py +8 -5
wandb/filesync/step_prepare.py +76 -75
wandb/filesync/step_upload.py +1 -2
wandb/integration/catboost/__init__.py +1 -3
wandb/integration/catboost/catboost.py +8 -14
wandb/integration/fastai/__init__.py +7 -13
wandb/integration/gym/__init__.py +35 -4
wandb/integration/keras/__init__.py +3 -3
wandb/integration/keras/callbacks/metrics_logger.py +9 -8
wandb/integration/keras/callbacks/model_checkpoint.py +9 -9
wandb/integration/keras/callbacks/tables_builder.py +31 -19
wandb/integration/kfp/kfp_patch.py +20 -17
wandb/integration/kfp/wandb_logging.py +1 -2
wandb/integration/lightgbm/__init__.py +21 -19
wandb/integration/prodigy/prodigy.py +6 -7
wandb/integration/sacred/__init__.py +9 -12
wandb/integration/sagemaker/__init__.py +1 -3
wandb/integration/sagemaker/auth.py +0 -1
wandb/integration/sagemaker/config.py +1 -1
wandb/integration/sagemaker/resources.py +1 -1
wandb/integration/sb3/sb3.py +8 -4
wandb/integration/tensorboard/__init__.py +1 -3
wandb/integration/tensorboard/log.py +8 -8
wandb/integration/tensorboard/monkeypatch.py +11 -9
wandb/integration/tensorflow/__init__.py +1 -3
wandb/integration/xgboost/__init__.py +4 -6
wandb/integration/yolov8/__init__.py +7 -0
wandb/integration/yolov8/yolov8.py +250 -0
wandb/jupyter.py +31 -35
wandb/lightgbm/__init__.py +1 -2
wandb/old/settings.py +2 -2
wandb/plot/bar.py +1 -2
wandb/plot/confusion_matrix.py +1 -3
wandb/plot/histogram.py +1 -2
wandb/plot/line.py +1 -2
wandb/plot/line_series.py +4 -4
wandb/plot/pr_curve.py +17 -20
wandb/plot/roc_curve.py +1 -3
wandb/plot/scatter.py +1 -2
wandb/proto/v3/wandb_server_pb2.py +85 -39
wandb/proto/v3/wandb_telemetry_pb2.py +10 -10
wandb/proto/v4/wandb_server_pb2.py +51 -39
wandb/proto/v4/wandb_telemetry_pb2.py +10 -10
wandb/sdk/__init__.py +1 -3
wandb/sdk/backend/backend.py +1 -1
wandb/sdk/data_types/_dtypes.py +38 -30
wandb/sdk/data_types/base_types/json_metadata.py +1 -3
wandb/sdk/data_types/base_types/media.py +17 -17
wandb/sdk/data_types/base_types/wb_value.py +33 -26
wandb/sdk/data_types/helper_types/bounding_boxes_2d.py +91 -125
wandb/sdk/data_types/helper_types/classes.py +1 -1
wandb/sdk/data_types/helper_types/image_mask.py +12 -12
wandb/sdk/data_types/histogram.py +5 -4
wandb/sdk/data_types/html.py +1 -2
wandb/sdk/data_types/image.py +11 -11
wandb/sdk/data_types/molecule.py +3 -6
wandb/sdk/data_types/object_3d.py +1 -2
wandb/sdk/data_types/plotly.py +1 -2
wandb/sdk/data_types/saved_model.py +10 -8
wandb/sdk/data_types/video.py +1 -1
wandb/sdk/integration_utils/data_logging.py +5 -5
wandb/sdk/interface/artifacts.py +288 -266
wandb/sdk/interface/interface.py +2 -3
wandb/sdk/interface/interface_grpc.py +1 -1
wandb/sdk/interface/interface_queue.py +1 -1
wandb/sdk/interface/interface_relay.py +1 -1
wandb/sdk/interface/interface_shared.py +1 -2
wandb/sdk/interface/interface_sock.py +1 -1
wandb/sdk/interface/message_future.py +1 -1
wandb/sdk/interface/message_future_poll.py +1 -1
wandb/sdk/interface/router.py +1 -1
wandb/sdk/interface/router_queue.py +1 -1
wandb/sdk/interface/router_relay.py +1 -1
wandb/sdk/interface/router_sock.py +1 -1
wandb/sdk/interface/summary_record.py +1 -1
wandb/sdk/internal/artifacts.py +1 -1
wandb/sdk/internal/datastore.py +2 -3
wandb/sdk/internal/file_pusher.py +5 -3
wandb/sdk/internal/file_stream.py +22 -19
wandb/sdk/internal/handler.py +5 -4
wandb/sdk/internal/internal.py +1 -1
wandb/sdk/internal/internal_api.py +115 -55
wandb/sdk/internal/job_builder.py +1 -3
wandb/sdk/internal/profiler.py +1 -1
wandb/sdk/internal/progress.py +4 -6
wandb/sdk/internal/sample.py +1 -3
wandb/sdk/internal/sender.py +28 -16
wandb/sdk/internal/settings_static.py +5 -5
wandb/sdk/internal/system/assets/__init__.py +1 -0
wandb/sdk/internal/system/assets/cpu.py +3 -9
wandb/sdk/internal/system/assets/disk.py +2 -4
wandb/sdk/internal/system/assets/gpu.py +6 -18
wandb/sdk/internal/system/assets/gpu_apple.py +2 -4
wandb/sdk/internal/system/assets/interfaces.py +50 -22
wandb/sdk/internal/system/assets/ipu.py +1 -3
wandb/sdk/internal/system/assets/memory.py +7 -13
wandb/sdk/internal/system/assets/network.py +4 -8
wandb/sdk/internal/system/assets/open_metrics.py +283 -0
wandb/sdk/internal/system/assets/tpu.py +1 -4
wandb/sdk/internal/system/assets/trainium.py +26 -14
wandb/sdk/internal/system/system_info.py +2 -3
wandb/sdk/internal/system/system_monitor.py +52 -20
wandb/sdk/internal/tb_watcher.py +12 -13
wandb/sdk/launch/_project_spec.py +54 -65
wandb/sdk/launch/agent/agent.py +374 -90
wandb/sdk/launch/builder/abstract.py +61 -7
wandb/sdk/launch/builder/build.py +81 -110
wandb/sdk/launch/builder/docker_builder.py +181 -0
wandb/sdk/launch/builder/kaniko_builder.py +419 -0
wandb/sdk/launch/builder/noop.py +31 -12
wandb/sdk/launch/builder/templates/_wandb_bootstrap.py +70 -20
wandb/sdk/launch/environment/abstract.py +28 -0
wandb/sdk/launch/environment/aws_environment.py +276 -0
wandb/sdk/launch/environment/gcp_environment.py +271 -0
wandb/sdk/launch/environment/local_environment.py +65 -0
wandb/sdk/launch/github_reference.py +3 -8
wandb/sdk/launch/launch.py +38 -29
wandb/sdk/launch/launch_add.py +6 -8
wandb/sdk/launch/loader.py +230 -0
wandb/sdk/launch/registry/abstract.py +54 -0
wandb/sdk/launch/registry/elastic_container_registry.py +163 -0
wandb/sdk/launch/registry/google_artifact_registry.py +203 -0
wandb/sdk/launch/registry/local_registry.py +62 -0
wandb/sdk/launch/runner/abstract.py +1 -16
wandb/sdk/launch/runner/{kubernetes.py → kubernetes_runner.py} +83 -95
wandb/sdk/launch/runner/local_container.py +46 -22
wandb/sdk/launch/runner/local_process.py +1 -4
wandb/sdk/launch/runner/{aws.py → sagemaker_runner.py} +53 -212
wandb/sdk/launch/runner/{gcp_vertex.py → vertex_runner.py} +38 -55
wandb/sdk/launch/sweeps/__init__.py +3 -2
wandb/sdk/launch/sweeps/scheduler.py +132 -39
wandb/sdk/launch/sweeps/scheduler_sweep.py +80 -89
wandb/sdk/launch/utils.py +101 -30
wandb/sdk/launch/wandb_reference.py +2 -7
wandb/sdk/lib/_settings_toposort_generate.py +166 -0
wandb/sdk/lib/_settings_toposort_generated.py +201 -0
wandb/sdk/lib/apikey.py +2 -4
wandb/sdk/lib/config_util.py +4 -1
wandb/sdk/lib/console.py +1 -3
wandb/sdk/lib/deprecate.py +3 -3
wandb/sdk/lib/file_stream_utils.py +7 -5
wandb/sdk/lib/filenames.py +1 -1
wandb/sdk/lib/filesystem.py +61 -5
wandb/sdk/lib/git.py +1 -3
wandb/sdk/lib/import_hooks.py +4 -7
wandb/sdk/lib/ipython.py +8 -5
wandb/sdk/lib/lazyloader.py +1 -3
wandb/sdk/lib/mailbox.py +14 -4
wandb/sdk/lib/proto_util.py +10 -5
wandb/sdk/lib/redirect.py +15 -22
wandb/sdk/lib/reporting.py +1 -3
wandb/sdk/lib/retry.py +4 -5
wandb/sdk/lib/runid.py +1 -3
wandb/sdk/lib/server.py +15 -9
wandb/sdk/lib/sock_client.py +1 -1
wandb/sdk/lib/sparkline.py +1 -1
wandb/sdk/lib/wburls.py +1 -1
wandb/sdk/service/port_file.py +1 -2
wandb/sdk/service/service.py +36 -13
wandb/sdk/service/service_base.py +12 -1
wandb/sdk/verify/verify.py +5 -7
wandb/sdk/wandb_artifacts.py +142 -177
wandb/sdk/wandb_config.py +5 -8
wandb/sdk/wandb_helper.py +1 -1
wandb/sdk/wandb_init.py +24 -13
wandb/sdk/wandb_login.py +9 -9
wandb/sdk/wandb_manager.py +39 -4
wandb/sdk/wandb_metric.py +2 -6
wandb/sdk/wandb_require.py +4 -15
wandb/sdk/wandb_require_helpers.py +1 -9
wandb/sdk/wandb_run.py +95 -141
wandb/sdk/wandb_save.py +1 -3
wandb/sdk/wandb_settings.py +149 -54
wandb/sdk/wandb_setup.py +66 -46
wandb/sdk/wandb_summary.py +13 -10
wandb/sdk/wandb_sweep.py +6 -7
wandb/sdk/wandb_watch.py +1 -1
wandb/sklearn/calculate/confusion_matrix.py +1 -1
wandb/sklearn/calculate/learning_curve.py +1 -1
wandb/sklearn/calculate/summary_metrics.py +1 -3
wandb/sklearn/plot/__init__.py +1 -1
wandb/sklearn/plot/classifier.py +27 -18
wandb/sklearn/plot/clusterer.py +4 -5
wandb/sklearn/plot/regressor.py +4 -4
wandb/sklearn/plot/shared.py +2 -2
wandb/sync/__init__.py +1 -3
wandb/sync/sync.py +4 -5
wandb/testing/relay.py +11 -10
wandb/trigger.py +1 -1
wandb/util.py +106 -81
wandb/viz.py +4 -4
wandb/wandb_agent.py +50 -50
wandb/wandb_controller.py +2 -3
wandb/wandb_run.py +1 -2
wandb/wandb_torch.py +1 -1
wandb/xgboost/__init__.py +1 -2
{wandb-0.13.10.dist-info → wandb-0.14.0.dist-info}/METADATA +6 -2
{wandb-0.13.10.dist-info → wandb-0.14.0.dist-info}/RECORD +224 -209
{wandb-0.13.10.dist-info → wandb-0.14.0.dist-info}/WHEEL +1 -1
wandb/sdk/launch/builder/docker.py +0 -80
wandb/sdk/launch/builder/kaniko.py +0 -393
wandb/sdk/launch/builder/loader.py +0 -32
wandb/sdk/launch/runner/loader.py +0 -50
{wandb-0.13.10.dist-info → wandb-0.14.0.dist-info}/LICENSE +0 -0
{wandb-0.13.10.dist-info → wandb-0.14.0.dist-info}/entry_points.txt +0 -0
{wandb-0.13.10.dist-info → wandb-0.14.0.dist-info}/top_level.txt +0 -0

wandb/__init__.py CHANGED Viewed

@@ -5,13 +5,13 @@ The most commonly used functions/objects are:
   - wandb.config — track hyperparameters and metadata
   - wandb.log — log metrics and media over time within your training loop
-For guides and examples, see https://docs.wandb.com/guides.
+For guides and examples, see https://docs.wandb.ai.
 For scripts and interactive notebooks, see https://github.com/wandb/examples.
 For reference documentation, see https://docs.wandb.com/ref/python.
 """
-__version__ = "0.13.10"
+__version__ = "0.14.0"
 # Used with pypi checks and other messages related to pip
 _wandb_module = "wandb"
@@ -193,7 +193,6 @@ if wandb_sdk.lib.ipython.in_jupyter():
     load_ipython_extension(get_ipython())
-wandb.require("service")
 __all__ = [
     "__version__",

wandb/apis/__init__.py CHANGED Viewed

@@ -1,6 +1,4 @@
-"""
-api.
-"""
+"""api."""
 from typing import Callable

wandb/apis/importers/__init__.py ADDED Viewed

@@ -0,0 +1,4 @@
+from wandb.util import get_module
+if get_module("mlflow"):
+    from .mlflow import MlflowImporter, MlflowRun  # noqa: F401

wandb/apis/importers/base.py ADDED Viewed

@@ -0,0 +1,312 @@
+import json
+import platform
+from abc import ABC, abstractmethod
+from concurrent.futures import ProcessPoolExecutor, as_completed
+from contextlib import contextmanager
+from typing import Any, Dict, Iterable, List, Optional, Tuple
+from tqdm.auto import tqdm
+import wandb
+from wandb.proto import wandb_internal_pb2 as pb
+from wandb.proto import wandb_telemetry_pb2 as telem_pb
+from wandb.sdk.interface.interface import file_policy_to_enum
+from wandb.sdk.interface.interface_queue import InterfaceQueue
+from wandb.sdk.internal.sender import SendManager
+Name = str
+Path = str
+def coalesce(*arg: Any) -> Any:
+    """Return the first non-none value in the list of arguments.  Similar to ?? in C#."""
+    return next((a for a in arg if a is not None), None)
+@contextmanager
+def send_manager(root_dir):
+    sm = SendManager.setup(root_dir, resume=False)
+    try:
+        yield sm
+    finally:
+        # flush any remaining records
+        while sm:
+            data = next(sm)
+            sm.send(data)
+        sm.finish()
+class ImporterRun:
+    def __init__(self) -> None:
+        self.interface = InterfaceQueue()
+        self.run_dir = f"./wandb-importer/{self.run_id()}"
+    def run_id(self) -> str:
+        _id = wandb.util.generate_id()
+        wandb.termwarn(f"`run_id` not specified.  Autogenerating id: {_id}")
+        return _id
+    def entity(self) -> str:
+        _entity = "unspecified-entity"
+        wandb.termwarn(f"`entity` not specified.  Defaulting to: {_entity}")
+        return _entity
+    def project(self) -> str:
+        _project = "unspecified-project"
+        wandb.termwarn(f"`project` not specified.  Defaulting to: {_project}")
+        return _project
+    def config(self) -> Dict[str, Any]:
+        return {}
+    def summary(self) -> Dict[str, float]:
+        return {}
+    def metrics(self) -> List[Dict[str, float]]:
+        """Metrics for the run.
+        We expect metrics in this shape:
+        [
+            {'metric1': 1, 'metric2': 1, '_step': 0},
+            {'metric1': 2, 'metric2': 4, '_step': 1},
+            {'metric1': 3, 'metric2': 9, '_step': 2},
+            ...
+        ]
+        You can also submit metrics in this shape:
+        [
+            {'metric1': 1, '_step': 0},
+            {'metric2': 1, '_step': 0},
+            {'metric1': 2, '_step': 1},
+            {'metric2': 4, '_step': 1},
+            ...
+        ]
+        """
+        return []
+    def run_group(self) -> Optional[str]:
+        ...
+    def job_type(self) -> Optional[str]:
+        ...
+    def display_name(self) -> str:
+        return self.run_id()
+    def notes(self) -> Optional[str]:
+        ...
+    def tags(self) -> Optional[List[str]]:
+        ...
+    def artifacts(self) -> Optional[Iterable[Tuple[Name, Path]]]:
+        ...
+    def os_version(self) -> Optional[str]:
+        ...
+    def python_version(self) -> Optional[str]:
+        ...
+    def cuda_version(self) -> Optional[str]:
+        ...
+    def program(self) -> Optional[str]:
+        ...
+    def host(self) -> Optional[str]:
+        ...
+    def username(self) -> Optional[str]:
+        ...
+    def executable(self) -> Optional[str]:
+        ...
+    def gpus_used(self) -> Optional[str]:
+        ...
+    def cpus_used(self) -> Optional[int]:  # can we get the model?
+        ...
+    def memory_used(self) -> Optional[int]:
+        ...
+    def runtime(self) -> Optional[int]:
+        ...
+    def start_time(self) -> Optional[int]:
+        ...
+    def _make_run_record(self) -> pb.Record:
+        run = pb.RunRecord()
+        run.run_id = self.run_id()
+        run.entity = self.entity()
+        run.project = self.project()
+        run.display_name = coalesce(self.display_name())
+        run.notes = coalesce(self.notes(), "")
+        run.tags.extend(coalesce(self.tags(), list()))
+        # run.start_time.FromMilliseconds(self.start_time())
+        # run.runtime = self.runtime()
+        run_group = self.run_group()
+        if run_group is not None:
+            run.run_group = run_group
+        self.interface._make_config(
+            data=self.config(),
+            obj=run.config,
+        )  # is there a better way?
+        return self.interface._make_record(run=run)
+    def _make_summary_record(self) -> pb.Record:
+        d: dict = {
+            **self.summary(),
+            "_runtime": self.runtime(),  # quirk of runtime -- it has to be here!
+            # '_timestamp': self.start_time()/1000,
+        }
+        summary = self.interface._make_summary_from_dict(d)
+        return self.interface._make_record(summary=summary)
+    def _make_history_records(self) -> Iterable[pb.Record]:
+        for _, metrics in enumerate(self.metrics()):
+            history = pb.HistoryRecord()
+            for k, v in metrics.items():
+                item = history.item.add()
+                item.key = k
+                item.value_json = json.dumps(v)
+            yield self.interface._make_record(history=history)
+    def _make_files_record(self, files_dict) -> pb.Record:
+        # when making the metadata file, it captures most things correctly
+        # but notably it doesn't capture the start time!
+        files_record = pb.FilesRecord()
+        for path, policy in files_dict["files"]:
+            f = files_record.files.add()
+            f.path = path
+            f.policy = file_policy_to_enum(policy)  # is this always "end"?
+        return self.interface._make_record(files=files_record)
+    def _make_metadata_files_record(self) -> pb.Record:
+        self._make_metadata_file(self.run_dir)
+        return self._make_files_record(
+            {"files": [[f"{self.run_dir}/files/wandb-metadata.json", "end"]]}
+        )
+    def _make_artifact_record(self) -> pb.Record:
+        art = wandb.Artifact(self.display_name(), "imported-artifacts")
+        artifacts = self.artifacts()
+        if artifacts is not None:
+            for name, path in artifacts:
+                art.add_file(path, name)
+        proto = self.interface._make_artifact(art)
+        proto.run_id = self.run_id()
+        proto.project = self.project()
+        proto.entity = self.entity()
+        proto.user_created = False
+        proto.use_after_commit = False
+        proto.finalize = True
+        for tag in ["latest", "imported"]:
+            proto.aliases.append(tag)
+        return self.interface._make_record(artifact=proto)
+    def _make_telem_record(self) -> pb.Record:
+        feature = telem_pb.Feature()
+        feature.importer_mlflow = True
+        telem = telem_pb.TelemetryRecord()
+        telem.feature.CopyFrom(feature)
+        telem.python_version = platform.python_version()  # importer's python version
+        telem.cli_version = wandb.__version__
+        return self.interface._make_record(telemetry=telem)
+    def _make_metadata_file(self, run_dir: str) -> None:
+        missing_text = "MLFlow did not capture this info."
+        d = {}
+        if self.os_version() is not None:
+            d["os"] = self.os_version()
+        else:
+            d["os"] = missing_text
+        if self.python_version() is not None:
+            d["python"] = self.python_version()
+        else:
+            d["python"] = missing_text
+        if self.program() is not None:
+            d["program"] = self.program()
+        else:
+            d["program"] = missing_text
+        if self.cuda_version() is not None:
+            d["cuda"] = self.cuda_version()
+        if self.host() is not None:
+            d["host"] = self.host()
+        if self.username() is not None:
+            d["username"] = self.username()
+        if self.executable() is not None:
+            d["executable"] = self.executable()
+        gpus_used = self.gpus_used()
+        if gpus_used is not None:
+            d["gpu_devices"] = json.dumps(gpus_used)
+            d["gpu_count"] = json.dumps(len(gpus_used))
+        cpus_used = self.cpus_used()
+        if cpus_used is not None:
+            d["cpu_count"] = json.dumps(self.cpus_used())
+        mem_used = self.memory_used()
+        if mem_used is not None:
+            d["memory"] = json.dumps({"total": self.memory_used()})
+        with open(f"{run_dir}/files/wandb-metadata.json", "w") as f:
+            f.write(json.dumps(d))
+class Importer(ABC):
+    @abstractmethod
+    def download_all_runs(self) -> Iterable[ImporterRun]:
+        ...
+    def import_all(self, overrides: Optional[Dict[str, Any]] = None) -> None:
+        for run in tqdm(self.download_all_runs(), desc="Sending runs"):
+            self.import_one(run, overrides)
+    def import_all_parallel(
+        self, overrides: Optional[Dict[str, Any]] = None, **pool_kwargs: Any
+    ) -> None:
+        runs = list(self.download_all_runs())
+        with tqdm(total=len(runs)) as pbar:
+            with ProcessPoolExecutor(**pool_kwargs) as exc:
+                futures = {
+                    exc.submit(self.import_one, run, overrides=overrides): run
+                    for run in runs
+                }
+                for future in as_completed(futures):
+                    run = futures[future]
+                    pbar.update(1)
+                    pbar.set_description(
+                        f"Imported Run: {run.run_group()} {run.display_name()}"
+                    )
+    def import_one(
+        self,
+        run: ImporterRun,
+        overrides: Optional[Dict[str, Any]] = None,
+    ) -> None:
+        # does this need to be here for pmap?
+        if overrides:
+            for k, v in overrides.items():
+                # `lambda: v` won't work!
+                # https://stackoverflow.com/questions/10802002/why-deepcopy-doesnt-create-new-references-to-lambda-function
+                setattr(run, k, lambda v=v: v)
+        self._import_one(run)
+    def _import_one(self, run: ImporterRun) -> None:
+        with send_manager(run.run_dir) as sm:
+            sm.send(run._make_run_record())
+            sm.send(run._make_summary_record())
+            sm.send(run._make_metadata_files_record())
+            for history_record in run._make_history_records():
+                sm.send(history_record)
+            if run.artifacts() is not None:
+                sm.send(run._make_artifact_record())
+            sm.send(run._make_telem_record())

wandb/apis/importers/mlflow.py ADDED Viewed

@@ -0,0 +1,113 @@
+from typing import Any, Dict, Iterable, Optional
+from wandb.util import get_module
+from .base import Importer, ImporterRun
+mlflow = get_module(
+    "mlflow",
+    required="To use the MlflowImporter, please install mlflow: `pip install mlflow`",
+)
+class MlflowRun(ImporterRun):
+    def __init__(self, run, mlflow_client):
+        self.run = run
+        self.mlflow_client = mlflow_client
+        super().__init__()
+    def run_id(self):
+        return self.run.info.run_id
+    def entity(self):
+        return self.run.info.user_id
+    def project(self):
+        return "imported-from-mlflow"
+    def config(self):
+        return self.run.data.params
+    def summary(self):
+        return self.run.data.metrics
+    def metrics(self):
+        def wandbify(metrics):
+            for step, t in enumerate(metrics):
+                d = {m.key: m.value for m in t}
+                d["_step"] = step
+                yield d
+        metrics = [
+            self.mlflow_client.get_metric_history(self.run.info.run_id, k)
+            for k in self.run.data.metrics.keys()
+        ]
+        metrics = zip(*metrics)  # transpose
+        return wandbify(metrics)
+        # Alternate: Might be slower but use less mem
+        # Can't make this a generator.  See mlflow get_metric_history internals
+        # https://github.com/mlflow/mlflow/blob/master/mlflow/tracking/_tracking_service/client.py#L74-L93
+        # for k in self.run.data.metrics.keys():
+        #     history = self.mlflow_client.get_metric_history(self.run.info.run_id, k)
+        #     yield wandbify(history)
+    def run_group(self):
+        # this is nesting?  Parent at `run.info.tags.get("mlflow.parentRunId")`
+        return f"Experiment {self.run.info.experiment_id}"
+    def job_type(self):
+        # Is this the right approach?
+        return f"User {self.run.info.user_id}"
+    def display_name(self):
+        return self.run.info.run_name
+    def notes(self):
+        return self.run.data.tags.get("mlflow.note.content")
+    def tags(self):
+        return {
+            k: v for k, v in self.run.data.tags.items() if not k.startswith("mlflow.")
+        }
+    def start_time(self):
+        return self.run.info.start_time // 1000
+    def runtime(self):
+        return self.run.info.end_time // 1_000 - self.start_time()
+    def git(self):
+        ...
+    def artifacts(self):
+        for f in self.mlflow_client.list_artifacts(self.run.info.run_id):
+            dir_path = mlflow.artifacts.download_artifacts(run_id=self.run.info.run_id)
+            full_path = dir_path + f.path
+            yield (f.path, full_path)
+class MlflowImporter(Importer):
+    def __init__(
+        self, mlflow_tracking_uri, mlflow_registry_uri=None, wandb_base_url=None
+    ) -> None:
+        super().__init__()
+        self.mlflow_tracking_uri = mlflow_tracking_uri
+        mlflow.set_tracking_uri(self.mlflow_tracking_uri)
+        if mlflow_registry_uri:
+            mlflow.set_registry_uri(mlflow_registry_uri)
+        self.mlflow_client = mlflow.tracking.MlflowClient(mlflow_tracking_uri)
+    def import_one(
+        self,
+        run: ImporterRun,
+        overrides: Optional[Dict[str, Any]] = None,
+    ) -> None:
+        mlflow.set_tracking_uri(self.mlflow_tracking_uri)
+        super().import_one(run, overrides)
+    def download_all_runs(self) -> Iterable[MlflowRun]:
+        for exp in self.mlflow_client.search_experiments():
+            for run in self.mlflow_client.search_runs(exp.experiment_id):
+                yield MlflowRun(run, self.mlflow_client)

wandb/apis/internal.py CHANGED Viewed

@@ -2,14 +2,32 @@ from wandb.sdk.internal.internal_api import Api as InternalApi
 class Api:
-    """Internal proxy to the official internal API.  Eventually these methods
-    should likely be moved to PublicApi"""
+    """Internal proxy to the official internal API."""
+    # TODO: Move these methods to PublicApi.
     def __init__(self, *args, **kwargs):
         self._api_args = args
         self._api_kwargs = kwargs
         self._api = None
+    def __getstate__(self):
+        """Use for serializing.
+        self._api is not serializable, so it's dropped
+        """
+        state = self.__dict__.copy()
+        del state["_api"]
+        return state
+    def __setstate__(self, state):
+        """Used for deserializing.
+        Don't need to set self._api because it's constructed when needed.
+        """
+        self.__dict__.update(state)
+        self._api = None
     @property
     def api(self):
         # This is a property in order to delay construction of Internal API
@@ -143,6 +161,9 @@ class Api:
     def get_run_state(self, *args, **kwargs):
         return self.api.get_run_state(*args, **kwargs)
+    def entity_is_team(self, *args, **kwargs):
+        return self.api.entity_is_team(*args, **kwargs)
     def get_project_run_queues(self, *args, **kwargs):
         return self.api.get_project_run_queues(*args, **kwargs)
@@ -164,6 +185,12 @@ class Api:
     def launch_agent_introspection(self, *args, **kwargs):
         return self.api.launch_agent_introspection(*args, **kwargs)
+    def fail_run_queue_item_introspection(self, *args, **kwargs):
+        return self.api.fail_run_queue_item_introspection(*args, **kwargs)
+    def fail_run_queue_item(self, *args, **kwargs):
+        return self.api.fail_run_queue_item(*args, **kwargs)
     def get_launch_agent(self, *args, **kwargs):
         return self.api.get_launch_agent(*args, **kwargs)

wandb/apis/normalize.py CHANGED Viewed

@@ -1,6 +1,4 @@
-"""
-normalize.
-"""
+"""normalize."""
 import ast
 import sys
@@ -11,13 +9,14 @@ import requests
 from wandb_gql.client import RetryError
 from wandb import env
-from wandb.errors import CommError, ContextCancelledError
+from wandb.errors import CommError
+from wandb.sdk.lib.mailbox import ContextCancelledError
 _F = TypeVar("_F", bound=Callable)
 def normalize_exceptions(func: _F) -> _F:
-    """Function decorator for catching common errors and re-raising as wandb.Error"""
+    """Function decorator for catching common errors and re-raising as wandb.Error."""
     @wraps(func)
     def wrapper(*args, **kwargs):
@@ -48,6 +47,8 @@ def normalize_exceptions(func: _F) -> _F:
                 raise CommError(message, err.last_exception).with_traceback(
                     sys.exc_info()[2]
                 )
+        except CommError as err:
+            raise err
         except Exception as err:
             # gql raises server errors with dict's as strings...
             if len(err.args) > 0:

wandb 0.13.10__py3-none-any.whl → 0.14.0__py3-none-any.whl

wandb 0.13.10__py3-none-any.whl → 0.14.0__py3-none-any.whl