PyPI - wandb - Versions diffs - 0.16.3__py3-none-any.whl → 0.16.5__py3-none-any.whl - Mend

wandb 0.16.3__py3-none-any.whl → 0.16.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (90) hide show

wandb/__init__.py +2 -2
wandb/agents/pyagent.py +1 -1
wandb/apis/importers/__init__.py +1 -4
wandb/apis/importers/internals/internal.py +386 -0
wandb/apis/importers/internals/protocols.py +125 -0
wandb/apis/importers/internals/util.py +78 -0
wandb/apis/importers/mlflow.py +125 -88
wandb/apis/importers/validation.py +108 -0
wandb/apis/importers/wandb.py +1604 -0
wandb/apis/public/api.py +7 -10
wandb/apis/public/artifacts.py +38 -0
wandb/apis/public/files.py +11 -2
wandb/apis/reports/v2/__init__.py +0 -19
wandb/apis/reports/v2/expr_parsing.py +0 -1
wandb/apis/reports/v2/interface.py +15 -18
wandb/apis/reports/v2/internal.py +12 -45
wandb/cli/cli.py +52 -55
wandb/integration/gym/__init__.py +2 -1
wandb/integration/keras/callbacks/model_checkpoint.py +1 -1
wandb/integration/keras/keras.py +6 -4
wandb/integration/kfp/kfp_patch.py +2 -2
wandb/integration/openai/fine_tuning.py +1 -2
wandb/integration/ultralytics/callback.py +0 -1
wandb/proto/v3/wandb_internal_pb2.py +332 -312
wandb/proto/v3/wandb_settings_pb2.py +13 -3
wandb/proto/v3/wandb_telemetry_pb2.py +10 -10
wandb/proto/v4/wandb_internal_pb2.py +316 -312
wandb/proto/v4/wandb_settings_pb2.py +5 -3
wandb/proto/v4/wandb_telemetry_pb2.py +10 -10
wandb/sdk/artifacts/artifact.py +75 -31
wandb/sdk/artifacts/artifact_manifest.py +5 -2
wandb/sdk/artifacts/artifact_manifest_entry.py +6 -1
wandb/sdk/artifacts/artifact_manifests/artifact_manifest_v1.py +8 -2
wandb/sdk/artifacts/artifact_saver.py +19 -47
wandb/sdk/artifacts/storage_handler.py +2 -1
wandb/sdk/artifacts/storage_policies/wandb_storage_policy.py +22 -9
wandb/sdk/artifacts/storage_policy.py +4 -1
wandb/sdk/data_types/base_types/wb_value.py +1 -1
wandb/sdk/data_types/image.py +2 -2
wandb/sdk/interface/interface.py +49 -13
wandb/sdk/interface/interface_shared.py +17 -11
wandb/sdk/internal/file_stream.py +20 -1
wandb/sdk/internal/handler.py +1 -4
wandb/sdk/internal/internal_api.py +3 -1
wandb/sdk/internal/job_builder.py +49 -19
wandb/sdk/internal/profiler.py +1 -1
wandb/sdk/internal/sender.py +96 -124
wandb/sdk/internal/sender_config.py +197 -0
wandb/sdk/internal/settings_static.py +9 -0
wandb/sdk/internal/system/system_info.py +5 -3
wandb/sdk/internal/update.py +1 -1
wandb/sdk/launch/_launch.py +3 -3
wandb/sdk/launch/_launch_add.py +28 -29
wandb/sdk/launch/_project_spec.py +148 -136
wandb/sdk/launch/agent/agent.py +3 -7
wandb/sdk/launch/agent/config.py +0 -27
wandb/sdk/launch/builder/build.py +54 -28
wandb/sdk/launch/builder/docker_builder.py +4 -15
wandb/sdk/launch/builder/kaniko_builder.py +72 -45
wandb/sdk/launch/create_job.py +6 -40
wandb/sdk/launch/loader.py +10 -0
wandb/sdk/launch/registry/anon.py +29 -0
wandb/sdk/launch/registry/local_registry.py +4 -1
wandb/sdk/launch/runner/kubernetes_runner.py +20 -2
wandb/sdk/launch/runner/local_container.py +15 -10
wandb/sdk/launch/runner/sagemaker_runner.py +1 -1
wandb/sdk/launch/sweeps/scheduler.py +11 -3
wandb/sdk/launch/utils.py +14 -0
wandb/sdk/lib/__init__.py +2 -5
wandb/sdk/lib/_settings_toposort_generated.py +4 -1
wandb/sdk/lib/apikey.py +0 -5
wandb/sdk/lib/config_util.py +0 -31
wandb/sdk/lib/filesystem.py +11 -1
wandb/sdk/lib/run_moment.py +72 -0
wandb/sdk/service/service.py +7 -2
wandb/sdk/service/streams.py +1 -6
wandb/sdk/verify/verify.py +2 -1
wandb/sdk/wandb_init.py +12 -1
wandb/sdk/wandb_login.py +43 -26
wandb/sdk/wandb_run.py +164 -110
wandb/sdk/wandb_settings.py +58 -16
wandb/testing/relay.py +5 -6
wandb/util.py +50 -7
{wandb-0.16.3.dist-info → wandb-0.16.5.dist-info}/METADATA +8 -1
{wandb-0.16.3.dist-info → wandb-0.16.5.dist-info}/RECORD +89 -82
{wandb-0.16.3.dist-info → wandb-0.16.5.dist-info}/WHEEL +1 -1
wandb/apis/importers/base.py +0 -400
{wandb-0.16.3.dist-info → wandb-0.16.5.dist-info}/LICENSE +0 -0
{wandb-0.16.3.dist-info → wandb-0.16.5.dist-info}/entry_points.txt +0 -0
{wandb-0.16.3.dist-info → wandb-0.16.5.dist-info}/top_level.txt +0 -0

wandb/sdk/wandb_run.py CHANGED Viewed

@@ -6,6 +6,7 @@ import json
 import logging
 import numbers
 import os
+import pathlib
 import re
 import sys
 import threading
@@ -42,7 +43,6 @@ from wandb.apis import internal, public
 from wandb.apis.internal import Api
 from wandb.apis.public import Api as PublicApi
 from wandb.proto.wandb_internal_pb2 import (
-    JobInfoResponse,
     MetricRecord,
     PollExitResponse,
     Result,
@@ -531,7 +531,6 @@ class Run:
     _check_version: Optional["CheckVersionResponse"]
     _sampled_history: Optional["SampledHistoryResponse"]
     _final_summary: Optional["GetSummaryResponse"]
-    _job_info: Optional["JobInfoResponse"]
     _poll_exit_handle: Optional[MailboxHandle]
     _poll_exit_response: Optional[PollExitResponse]
     _server_info_response: Optional[ServerInfoResponse]
@@ -642,7 +641,6 @@ class Run:
         self._server_info_response = None
         self._internal_messages_response = None
         self._poll_exit_handle = None
-        self._job_info = None
         # Initialize telemetry object
         self._telemetry_obj = telemetry.TelemetryRecord()
@@ -673,6 +671,12 @@ class Run:
                 os.path.join("code", self._settings.program_relpath)
             )
+        if self._settings.fork_from is not None:
+            config[wandb_key]["branch_point"] = {
+                "run_id": self._settings.fork_from.run,
+                "step": self._settings.fork_from.value,
+            }
         self._config._update(config, ignore_locked=True)
         if sweep_config:
@@ -734,7 +738,7 @@ class Run:
             and self._settings.launch_config_path
             and os.path.exists(self._settings.launch_config_path)
         ):
-            self._save(self._settings.launch_config_path)
+            self.save(self._settings.launch_config_path)
             with open(self._settings.launch_config_path) as fp:
                 launch_config = json.loads(fp.read())
             if launch_config.get("overrides", {}).get("artifacts") is not None:
@@ -1385,6 +1389,8 @@ class Run:
     @_run_decorator._noop_on_finish()
     def _summary_update_callback(self, summary_record: SummaryRecord) -> None:
+        with telemetry.context(run=self) as tel:
+            tel.feature.set_summary = True
         if self._backend and self._backend.interface:
             self._backend.interface.publish_summary(summary_record)
@@ -1811,6 +1817,10 @@ class Run:
             ValueError: if invalid data is passed
         """
+        if step is not None:
+            with telemetry.context(run=self) as tel:
+                tel.feature.set_step_log = True
         if sync is not None:
             deprecate.deprecate(
                 field_name=deprecate.Deprecated.run__log_sync,
@@ -1831,20 +1841,53 @@ class Run:
     @_run_decorator._attach
     def save(
         self,
-        glob_str: Optional[str] = None,
-        base_path: Optional[str] = None,
+        glob_str: Optional[Union[str, os.PathLike]] = None,
+        base_path: Optional[Union[str, os.PathLike]] = None,
         policy: "PolicyName" = "live",
     ) -> Union[bool, List[str]]:
-        """Ensure all files matching `glob_str` are synced to wandb with the policy specified.
+        """Sync one or more files to W&B.
+        Relative paths are relative to the current working directory.
+        A Unix glob, such as "myfiles/*", is expanded at the time `save` is
+        called regardless of the `policy`. In particular, new files are not
+        picked up automatically.
+        A `base_path` may be provided to control the directory structure of
+        uploaded files. It should be a prefix of `glob_str`, and the directory
+        structure beneath it is preserved. It's best understood through
+        examples:
+        ```
+        wandb.save("these/are/myfiles/*")
+        # => Saves files in a "these/are/myfiles/" folder in the run.
+        wandb.save("these/are/myfiles/*", base_path="these")
+        # => Saves files in an "are/myfiles/" folder in the run.
+        wandb.save("/User/username/Documents/run123/*.txt")
+        # => Saves files in a "run123/" folder in the run.
+        wandb.save("/User/username/Documents/run123/*.txt", base_path="/User")
+        # => Saves files in a "username/Documents/run123/" folder in the run.
+        wandb.save("files/*/saveme.txt")
+        # => Saves each "saveme.txt" file in an appropriate subdirectory
+        # of "files/".
+        ```
         Arguments:
-            glob_str: (string) a relative or absolute path to a unix glob or regular
-                path.  If this isn't specified the method is a noop.
-            base_path: (string) the base path to run the glob relative to
-            policy: (string) one of `live`, `now`, or `end`
-                - live: upload the file as it changes, overwriting the previous version
-                - now: upload the file once now
-                - end: only upload file when the run ends
+            glob_str: A relative or absolute path or Unix glob.
+            base_path: A path to use to infer a directory structure; see examples.
+            policy: One of `live`, `now`, or `end`.
+                * live: upload the file as it changes, overwriting the previous version
+                * now: upload the file once now
+                * end: upload file when the run ends
+        Returns:
+            Paths to the symlinks created for the matched files.
+            For historical reasons, this may return a boolean in legacy code.
         """
         if glob_str is None:
             # noop for historical reasons, run.save() may be called in legacy code
@@ -1857,77 +1900,116 @@ class Run:
             )
             return True
-        return self._save(glob_str, base_path, policy)
+        if isinstance(glob_str, bytes):
+            # Preserved for backward compatibility: allow bytes inputs.
+            glob_str = glob_str.decode("utf-8")
+        if isinstance(glob_str, str) and (
+            glob_str.startswith("gs://") or glob_str.startswith("s3://")
+        ):
+            # Provide a better error message for a common misuse.
+            wandb.termlog(f"{glob_str} is a cloud storage url, can't save file to W&B.")
+            return []
+        glob_path = pathlib.Path(glob_str)
+        if base_path is not None:
+            base_path = pathlib.Path(base_path)
+        elif not glob_path.is_absolute():
+            base_path = pathlib.Path(".")
+        else:
+            # Absolute glob paths with no base path get special handling.
+            wandb.termwarn(
+                "Saving files without folders. If you want to preserve "
+                "subdirectories pass base_path to wandb.save, i.e. "
+                'wandb.save("/mnt/folder/file.h5", base_path="/mnt")',
+                repeat=False,
+            )
+            base_path = glob_path.resolve().parent.parent
-    def _save(
-        self,
-        glob_str: Optional[str] = None,
-        base_path: Optional[str] = None,
-        policy: "PolicyName" = "live",
-    ) -> Union[bool, List[str]]:
         if policy not in ("live", "end", "now"):
             raise ValueError(
-                'Only "live" "end" and "now" policies are currently supported.'
+                'Only "live", "end" and "now" policies are currently supported.'
             )
-        if isinstance(glob_str, bytes):
-            glob_str = glob_str.decode("utf-8")
-        if not isinstance(glob_str, str):
-            raise ValueError("Must call wandb.save(glob_str) with glob_str a str")
-        if base_path is None:
-            if os.path.isabs(glob_str):
-                base_path = os.path.dirname(glob_str)
-                wandb.termwarn(
-                    "Saving files without folders. If you want to preserve "
-                    "sub directories pass base_path to wandb.save, i.e. "
-                    'wandb.save("/mnt/folder/file.h5", base_path="/mnt")',
-                    repeat=False,
-                )
-            else:
-                base_path = "."
-        wandb_glob_str = GlobStr(os.path.relpath(glob_str, base_path))
-        if ".." + os.sep in wandb_glob_str:
-            raise ValueError("globs can't walk above base_path")
+        resolved_glob_path = glob_path.resolve()
+        resolved_base_path = base_path.resolve()
+        return self._save(
+            resolved_glob_path,
+            resolved_base_path,
+            policy,
+        )
+    def _save(
+        self,
+        glob_path: pathlib.Path,
+        base_path: pathlib.Path,
+        policy: "PolicyName",
+    ) -> List[str]:
+        # Can't use is_relative_to() because that's added in Python 3.9,
+        # but we support down to Python 3.7.
+        if not str(glob_path).startswith(str(base_path)):
+            raise ValueError("Glob may not walk above the base path")
+        if glob_path == base_path:
+            raise ValueError("Glob cannot be the same as the base path")
+        relative_glob = glob_path.relative_to(base_path)
+        if relative_glob.parts[0] == "*":
+            raise ValueError("Glob may not start with '*' relative to the base path")
+        relative_glob_str = GlobStr(str(relative_glob))
         with telemetry.context(run=self) as tel:
             tel.feature.save = True
-        if glob_str.startswith("gs://") or glob_str.startswith("s3://"):
-            wandb.termlog(
-                "%s is a cloud storage url, can't save file to wandb." % glob_str
-            )
-            return []
-        files = glob.glob(os.path.join(self._settings.files_dir, wandb_glob_str))
-        warn = False
-        if len(files) == 0 and "*" in wandb_glob_str:
-            warn = True
-        for path in glob.glob(glob_str):
-            file_name = os.path.relpath(path, base_path)
-            abs_path = os.path.abspath(path)
-            wandb_path = os.path.join(self._settings.files_dir, file_name)
-            filesystem.mkdir_exists_ok(os.path.dirname(wandb_path))
-            # We overwrite symlinks because namespaces can change in Tensorboard
-            if os.path.islink(wandb_path) and abs_path != os.readlink(wandb_path):
-                os.remove(wandb_path)
-                os.symlink(abs_path, wandb_path)
-            elif not os.path.exists(wandb_path):
-                os.symlink(abs_path, wandb_path)
-            files.append(wandb_path)
-        if warn:
-            file_str = "%i file" % len(files)
-            if len(files) > 1:
+        # Paths to the symlinks created for the globbed files.
+        wandb_files = [
+            str(path)
+            for path in pathlib.Path(
+                self._settings.files_dir,
+            ).glob(relative_glob_str)
+        ]
+        had_symlinked_files = len(wandb_files) > 0
+        is_star_glob = "*" in relative_glob_str
+        # The base_path may itself be a glob, so we can't do
+        #     base_path.glob(relative_glob_str)
+        for path_str in glob.glob(str(base_path / relative_glob_str)):
+            path = pathlib.Path(path_str).absolute()
+            # We can't use relative_to() because base_path may be a glob.
+            saved_path = pathlib.Path(*path.parts[len(base_path.parts) :])
+            wandb_path = pathlib.Path(self._settings.files_dir, saved_path)
+            wandb_files.append(str(wandb_path))
+            wandb_path.parent.mkdir(parents=True, exist_ok=True)
+            # Delete the symlink if it exists.
+            try:
+                wandb_path.unlink()
+            except FileNotFoundError:
+                # In Python 3.8, we would pass missing_ok=True, but as of now
+                # we support down to Python 3.7.
+                pass
+            wandb_path.symlink_to(path)
+        # Inform users that new files aren't detected automatically.
+        if not had_symlinked_files and is_star_glob:
+            file_str = f"{len(wandb_files)} file"
+            if len(wandb_files) > 1:
                 file_str += "s"
             wandb.termwarn(
-                (
-                    "Symlinked %s into the W&B run directory, "
-                    "call wandb.save again to sync new files."
-                )
-                % file_str
+                f"Symlinked {file_str} into the W&B run directory, "
+                "call wandb.save again to sync new files."
             )
-        files_dict: FilesDict = dict(files=[(wandb_glob_str, policy)])
+        files_dict: FilesDict = {"files": [(relative_glob_str, policy)]}
         if self._backend and self._backend.interface:
             self._backend.interface.publish_files(files_dict)
-        return files
+        return wandb_files
     @_run_decorator._attach
     def restore(
@@ -2286,14 +2368,12 @@ class Run:
         if self._settings._save_requirements:
             if self._backend and self._backend.interface:
-                import pkg_resources
+                from wandb.util import working_set
                 logger.debug(
                     "Saving list of pip packages installed into the current environment"
                 )
-                self._backend.interface.publish_python_packages(
-                    pkg_resources.working_set
-                )
+                self._backend.interface.publish_python_packages(working_set())
         if self._backend and self._backend.interface and not self._settings._offline:
             self._run_status_checker = RunStatusChecker(
@@ -2353,11 +2433,9 @@ class Run:
                 os.remove(self._settings.resume_fname)
     def _make_job_source_reqs(self) -> Tuple[List[str], Dict[str, Any], Dict[str, Any]]:
-        import pkg_resources
+        from wandb.util import working_set
-        installed_packages_list = sorted(
-            f"{d.key}=={d.version}" for d in iter(pkg_resources.working_set)
-        )
+        installed_packages_list = sorted(f"{d.key}=={d.version}" for d in working_set())
         input_types = TypeRegistry.type_of(self.config.as_dict()).to_json()
         output_types = TypeRegistry.type_of(self.summary._as_dict()).to_json()
@@ -2428,8 +2506,6 @@ class Run:
         else:
             return artifact
-    # Add a recurring callback (probe) to poll the backend process
-    # for its status using the "poll_exit" message.
     def _on_probe_exit(self, probe_handle: MailboxProbe) -> None:
         handle = probe_handle.get_mailbox_handle()
         if handle:
@@ -2441,8 +2517,6 @@ class Run:
         handle = self._backend.interface.deliver_poll_exit()
         probe_handle.set_mailbox_handle(handle)
-    # Handles the progress message from the backend process and prints
-    # the current status to the terminal footer
     def _on_progress_exit(self, progress_handle: MailboxProgress) -> None:
         probe_handles = progress_handle.get_probe_handles()
         assert probe_handles and len(probe_handles) == 1
@@ -2493,7 +2567,6 @@ class Run:
         sampled_history_handle = (
             self._backend.interface.deliver_request_sampled_history()
         )
-        job_info_handle = self._backend.interface.deliver_request_job_info()
         result = server_info_handle.wait(timeout=-1)
         assert result
@@ -2507,10 +2580,6 @@ class Run:
         assert result
         self._final_summary = result.response.get_summary_response
-        result = job_info_handle.wait(timeout=-1)
-        assert result
-        self._job_info = result.response.job_info_response
         if self._backend:
             self._backend.cleanup()
@@ -2533,7 +2602,6 @@ class Run:
             server_info_response=self._server_info_response,
             check_version_response=self._check_version,
             internal_messages_response=self._internal_messages_response,
-            job_info=self._job_info,
             reporter=self._reporter,
             quiet=self._quiet,
             settings=self._settings,
@@ -2730,9 +2798,6 @@ class Run:
         if self._backend and self._backend.interface:
             if artifact.is_draft() and not artifact._is_draft_save_started():
                 artifact = self._log_artifact(artifact)
-            # artifact logging is async, wait until the artifact is committed
-            # before trying to link it
-            artifact.wait()
             if not self._settings._offline:
                 self._backend.interface.publish_link_artifact(
                     self,
@@ -2769,7 +2834,6 @@ class Run:
                 can be in the following forms:
                     - name:version
                     - name:alias
-                    - digest
                 You can also pass an Artifact object created by calling `wandb.Artifact`
             type: (str, optional) The type of artifact to use.
             aliases: (list, optional) Aliases to apply to this artifact
@@ -3034,7 +3098,7 @@ class Run:
         self._assert_can_log_artifact(artifact)
         if self._backend and self._backend.interface:
             if not self._settings._offline:
-                handle = self._backend.interface.deliver_artifact(
+                future = self._backend.interface.communicate_artifact(
                     self,
                     artifact,
                     aliases,
@@ -3043,9 +3107,7 @@ class Run:
                     is_user_created=is_user_created,
                     use_after_commit=use_after_commit,
                 )
-                handle.add_probe(self._on_probe_exit)
-                handle.add_progress(self._on_progress_exit)
-                artifact._set_save_handle(handle, self._public_api().client)
+                artifact._set_save_future(future, self._public_api().client)
             else:
                 self._backend.interface.publish_artifact(
                     self,
@@ -3199,7 +3261,6 @@ class Run:
                 can be in the following forms:
                     - model_artifact_name:version
                     - model_artifact_name:alias
-                    - model_artifact_name:digest.
         Examples:
             ```python
@@ -3524,7 +3585,7 @@ class Run:
         if settings._offline or settings.silent:
             return
-        run_url = settings.run_url
+        workspace_url = f"{settings.run_url}/workspace"
         project_url = settings.project_url
         sweep_url = settings.sweep_url
@@ -3535,7 +3596,7 @@ class Run:
         if printer._html:
             if not wandb.jupyter.maybe_display():
-                run_line = f"<strong>{printer.link(run_url, run_name)}</strong>"
+                run_line = f"<strong>{printer.link(workspace_url, run_name)}</strong>"
                 project_line, sweep_line = "", ""
                 # TODO(settings): make settings the source of truth
@@ -3567,7 +3628,7 @@ class Run:
                     f'{printer.emoji("broom")} View sweep at {printer.link(sweep_url)}'
                 )
         printer.display(
-            f'{printer.emoji("rocket")} View run at {printer.link(run_url)}',
+            f'{printer.emoji("rocket")} View run at {printer.link(workspace_url)}',
         )
         # TODO(settings) use `wandb_settings` (if self.settings.anonymous == "true":)
@@ -3591,7 +3652,6 @@ class Run:
         server_info_response: Optional[ServerInfoResponse] = None,
         check_version_response: Optional["CheckVersionResponse"] = None,
         internal_messages_response: Optional["InternalMessagesResponse"] = None,
-        job_info: Optional["JobInfoResponse"] = None,
         reporter: Optional[Reporter] = None,
         quiet: Optional[bool] = None,
         *,
@@ -3608,7 +3668,6 @@ class Run:
         Run._footer_sync_info(
             poll_exit_response=poll_exit_response,
-            job_info=job_info,
             quiet=quiet,
             settings=settings,
             printer=printer,
@@ -3793,7 +3852,6 @@ class Run:
     @staticmethod
     def _footer_sync_info(
         poll_exit_response: Optional[PollExitResponse] = None,
-        job_info: Optional["JobInfoResponse"] = None,
         quiet: Optional[bool] = None,
         *,
         settings: "Settings",
@@ -3813,14 +3871,10 @@ class Run:
         else:
             info = []
             if settings.run_name and settings.run_url:
+                run_workspace = f"{settings.run_url}/workspace"
                 info = [
-                    f"{printer.emoji('rocket')} View run {printer.name(settings.run_name)} at: {printer.link(settings.run_url)}"
+                    f"{printer.emoji('rocket')} View run {printer.name(settings.run_name)} at: {printer.link(run_workspace)}"
                 ]
-            if job_info and job_info.version and job_info.sequenceId:
-                link = f"{settings.project_url}/jobs/{job_info.sequenceId}/version_details/{job_info.version}"
-                info.append(
-                    f"{printer.emoji('lightning')} View job at {printer.link(link)}",
-                )
             if poll_exit_response and poll_exit_response.file_counts:
                 logger.info("logging synced files")
                 file_counts = poll_exit_response.file_counts

wandb/sdk/wandb_settings.py CHANGED Viewed

@@ -45,6 +45,7 @@ from wandb.proto import wandb_settings_pb2
 from wandb.sdk.internal.system.env_probe_helpers import is_aws_lambda
 from wandb.sdk.lib import filesystem
 from wandb.sdk.lib._settings_toposort_generated import SETTINGS_TOPOLOGICALLY_SORTED
+from wandb.sdk.lib.run_moment import RunMoment
 from wandb.sdk.wandb_setup import _EarlyLogger
 from .lib import apikey
@@ -160,6 +161,14 @@ def _get_program() -> Optional[str]:
         return None
+def _runmoment_preprocessor(val: Any) -> Optional[RunMoment]:
+    if isinstance(val, RunMoment) or val is None:
+        return val
+    elif isinstance(val, str):
+        return RunMoment.from_uri(val)
+    raise UsageError(f"Could not parse value {val} as a RunMoment.")
 def _get_program_relpath(
     program: str, root: Optional[str] = None, _logger: Optional[_EarlyLogger] = None
 ) -> Optional[str]:
@@ -291,13 +300,14 @@ class SettingsData:
     _aws_lambda: bool
     _async_upload_concurrency_limit: int
     _cli_only_mode: bool  # Avoid running any code specific for runs
+    _code_path_local: str
     _colab: bool
     # _config_dict: Config
     _cuda: str
     _disable_meta: bool  # Do not collect system metadata
     _disable_service: (
-        bool
-    )  # Disable wandb-service, spin up internal process the old way
+        bool  # Disable wandb-service, spin up internal process the old way
+    )
     _disable_setproctitle: bool  # Do not use setproctitle on internal process
     _disable_stats: bool  # Do not collect system metrics
     _disable_viewer: bool  # Prevent early viewer query
@@ -354,20 +364,18 @@ class SettingsData:
     _stats_sample_rate_seconds: float
     _stats_samples_to_average: int
     _stats_join_assets: (
-        bool
-    )  # join metrics from different assets before sending to backend
+        bool  # join metrics from different assets before sending to backend
+    )
     _stats_neuron_monitor_config_path: (
-        str
-    )  # path to place config file for neuron-monitor (AWS Trainium)
+        str  # path to place config file for neuron-monitor (AWS Trainium)
+    )
     _stats_open_metrics_endpoints: Mapping[str, str]  # open metrics endpoint names/urls
     # open metrics filters in one of the two formats:
     # - {"metric regex pattern, including endpoint name as prefix": {"label": "label value regex pattern"}}
     # - ("metric regex pattern 1", "metric regex pattern 2", ...)
     _stats_open_metrics_filters: Union[Sequence[str], Mapping[str, Mapping[str, str]]]
     _stats_disk_paths: Sequence[str]  # paths to monitor disk usage
-    _stats_buffer_size: (
-        int
-    )  # number of consolidated samples to buffer before flushing, available in run obj
+    _stats_buffer_size: int  # number of consolidated samples to buffer before flushing, available in run obj
     _tmp_code_dir: str
     _tracelog: str
     _unsaved_keys: Sequence[str]
@@ -392,6 +400,7 @@ class SettingsData:
     entity: str
     files_dir: str
     force: bool
+    fork_from: Optional[RunMoment]
     git_commit: str
     git_remote: str
     git_remote_url: str
@@ -619,6 +628,10 @@ class Settings(SettingsData):
                 "hook": lambda _: is_aws_lambda(),
                 "auto_hook": True,
             },
+            _code_path_local={
+                "hook": lambda _: _get_program_relpath(self.program),
+                "auto_hook": True,
+            },
             _colab={
                 "hook": lambda _: "google.colab" in sys.modules,
                 "auto_hook": True,
@@ -800,6 +813,10 @@ class Settings(SettingsData):
                 ),
             },
             force={"preprocessor": _str_as_bool},
+            fork_from={
+                "value": None,
+                "preprocessor": _runmoment_preprocessor,
+            },
             git_remote={"value": "origin"},
             heartbeat_seconds={"value": 30},
             ignore_globs={
@@ -1570,6 +1587,14 @@ class Settings(SettingsData):
                 for key, value in v.items():
                     # we only support dicts with string values for now
                     mapping.value[key] = value
+            elif isinstance(v, RunMoment):
+                getattr(settings, k).CopyFrom(
+                    wandb_settings_pb2.RunMoment(
+                        run=v.run,
+                        value=v.value,
+                        metric=v.metric,
+                    )
+                )
             elif v is None:
                 # None is the default value for all settings, so we don't need to set it,
                 # i.e. None means that the value was not set.
@@ -1892,16 +1917,33 @@ class Settings(SettingsData):
                 f.write(json.dumps({"run_id": self.run_id}))
     def _apply_login(
-        self, login_settings: Dict[str, Any], _logger: Optional[_EarlyLogger] = None
+        self,
+        login_settings: Dict[str, Any],
+        _logger: Optional[_EarlyLogger] = None,
     ) -> None:
-        param_map = dict(key="api_key", host="base_url", timeout="login_timeout")
+        key_map = {
+            "key": "api_key",
+            "host": "base_url",
+            "timeout": "login_timeout",
+        }
+        # Rename keys and keep only the non-None values.
+        #
+        # The input keys are parameters to wandb.login(), but we use different
+        # names for some of them in Settings.
         login_settings = {
-            param_map.get(k, k): v for k, v in login_settings.items() if v is not None
+            key_map.get(key, key): value
+            for key, value in login_settings.items()
+            if value is not None
         }
-        if login_settings:
-            if _logger:
-                _logger.info(f"Applying login settings: {_redact_dict(login_settings)}")
-            self.update(login_settings, source=Source.LOGIN)
+        if _logger:
+            _logger.info(f"Applying login settings: {_redact_dict(login_settings)}")
+        self.update(
+            login_settings,
+            source=Source.LOGIN,
+        )
     def _apply_run_start(self, run_start_settings: Dict[str, Any]) -> None:
         # This dictionary maps from the "run message dict" to relevant fields in settings

wandb 0.16.3__py3-none-any.whl → 0.16.5__py3-none-any.whl

wandb 0.16.3__py3-none-any.whl → 0.16.5__py3-none-any.whl