PyPI - wandb - Versions diffs - 0.19.6rc4__py3-none-win_amd64.whl → 0.19.8__py3-none-win_amd64.whl - Mend

wandb 0.19.6rc4__py3-none-win_amd64.whl → 0.19.8__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (82)

wandb/__init__.py +1 -1
wandb/__init__.pyi +56 -6
wandb/apis/public/_generated/__init__.py +21 -0
wandb/apis/public/_generated/base.py +128 -0
wandb/apis/public/_generated/enums.py +4 -0
wandb/apis/public/_generated/input_types.py +4 -0
wandb/apis/public/_generated/operations.py +15 -0
wandb/apis/public/_generated/server_features_query.py +27 -0
wandb/apis/public/_generated/typing_compat.py +14 -0
wandb/apis/public/api.py +192 -6
wandb/apis/public/artifacts.py +13 -45
wandb/apis/public/registries.py +573 -0
wandb/apis/public/utils.py +36 -0
wandb/bin/gpu_stats.exe +0 -0
wandb/bin/wandb-core +0 -0
wandb/cli/cli.py +11 -20
wandb/data_types.py +1 -1
wandb/env.py +10 -0
wandb/filesync/dir_watcher.py +2 -1
wandb/proto/v3/wandb_internal_pb2.py +243 -222
wandb/proto/v3/wandb_server_pb2.py +4 -4
wandb/proto/v3/wandb_settings_pb2.py +2 -2
wandb/proto/v3/wandb_telemetry_pb2.py +10 -10
wandb/proto/v4/wandb_internal_pb2.py +226 -222
wandb/proto/v4/wandb_server_pb2.py +4 -4
wandb/proto/v4/wandb_settings_pb2.py +2 -2
wandb/proto/v4/wandb_telemetry_pb2.py +10 -10
wandb/proto/v5/wandb_internal_pb2.py +226 -222
wandb/proto/v5/wandb_server_pb2.py +4 -4
wandb/proto/v5/wandb_settings_pb2.py +2 -2
wandb/proto/v5/wandb_telemetry_pb2.py +10 -10
wandb/sdk/artifacts/_graphql_fragments.py +126 -0
wandb/sdk/artifacts/artifact.py +51 -95
wandb/sdk/backend/backend.py +17 -6
wandb/sdk/data_types/helper_types/bounding_boxes_2d.py +14 -6
wandb/sdk/data_types/helper_types/image_mask.py +12 -6
wandb/sdk/data_types/saved_model.py +35 -46
wandb/sdk/data_types/video.py +7 -16
wandb/sdk/interface/interface.py +87 -49
wandb/sdk/interface/interface_queue.py +5 -15
wandb/sdk/interface/interface_relay.py +7 -22
wandb/sdk/interface/interface_shared.py +65 -136
wandb/sdk/interface/interface_sock.py +3 -21
wandb/sdk/interface/router.py +42 -68
wandb/sdk/interface/router_queue.py +13 -11
wandb/sdk/interface/router_relay.py +26 -13
wandb/sdk/interface/router_sock.py +12 -16
wandb/sdk/internal/handler.py +4 -3
wandb/sdk/internal/internal_api.py +12 -1
wandb/sdk/internal/sender.py +3 -19
wandb/sdk/lib/apikey.py +87 -26
wandb/sdk/lib/asyncio_compat.py +210 -0
wandb/sdk/lib/console_capture.py +172 -0
wandb/sdk/lib/progress.py +78 -16
wandb/sdk/lib/redirect.py +102 -76
wandb/sdk/lib/service_connection.py +37 -17
wandb/sdk/lib/sock_client.py +6 -56
wandb/sdk/mailbox/__init__.py +23 -0
wandb/sdk/mailbox/mailbox.py +135 -0
wandb/sdk/mailbox/mailbox_handle.py +127 -0
wandb/sdk/mailbox/response_handle.py +167 -0
wandb/sdk/mailbox/wait_with_progress.py +135 -0
wandb/sdk/service/server_sock.py +9 -3
wandb/sdk/service/streams.py +75 -78
wandb/sdk/verify/verify.py +54 -2
wandb/sdk/wandb_init.py +72 -75
wandb/sdk/wandb_login.py +7 -4
wandb/sdk/wandb_metadata.py +65 -34
wandb/sdk/wandb_require.py +14 -8
wandb/sdk/wandb_run.py +90 -97
wandb/sdk/wandb_settings.py +10 -4
wandb/sdk/wandb_setup.py +19 -8
wandb/sdk/wandb_sync.py +2 -10
wandb/util.py +3 -1
{wandb-0.19.6rc4.dist-info → wandb-0.19.8.dist-info}/METADATA +2 -2
{wandb-0.19.6rc4.dist-info → wandb-0.19.8.dist-info}/RECORD +79 -66
wandb/sdk/interface/message_future.py +0 -27
wandb/sdk/interface/message_future_poll.py +0 -50
wandb/sdk/lib/mailbox.py +0 -442
{wandb-0.19.6rc4.dist-info → wandb-0.19.8.dist-info}/WHEEL +0 -0
{wandb-0.19.6rc4.dist-info → wandb-0.19.8.dist-info}/entry_points.txt +0 -0
{wandb-0.19.6rc4.dist-info → wandb-0.19.8.dist-info}/licenses/LICENSE +0 -0

wandb/sdk/service/streams.py CHANGED Viewed

@@ -8,34 +8,27 @@ StreamMux: Container for dictionary of stream threads per runid
 from __future__ import annotations
+import asyncio
 import functools
-import multiprocessing
 import queue
 import threading
 import time
 from threading import Event
-from typing import Any, Callable
+from typing import Any, Callable, NoReturn
 import psutil
 import wandb
 import wandb.util
 from wandb.proto import wandb_internal_pb2 as pb
+from wandb.sdk.interface.interface_relay import InterfaceRelay
+from wandb.sdk.interface.router_relay import MessageRelayRouter
 from wandb.sdk.internal.settings_static import SettingsStatic
+from wandb.sdk.lib import asyncio_compat, progress
 from wandb.sdk.lib import printer as printerlib
-from wandb.sdk.lib import progress
-from wandb.sdk.lib.mailbox import (
-    Mailbox,
-    MailboxProbe,
-    MailboxProgress,
-    MailboxProgressAll,
-)
+from wandb.sdk.mailbox import Mailbox, MailboxHandle, wait_all_with_progress
 from wandb.sdk.wandb_run import Run
-from ..interface.interface_relay import InterfaceRelay
-# from wandb.sdk.wandb_settings import Settings
 class StreamThread(threading.Thread):
     """Class to running internal process as a thread."""
@@ -61,19 +54,22 @@ class StreamRecord:
     _settings: SettingsStatic
     _started: bool
-    def __init__(self, settings: SettingsStatic, mailbox: Mailbox) -> None:
+    def __init__(self, settings: SettingsStatic) -> None:
         self._started = False
-        self._mailbox = mailbox
+        self._mailbox = Mailbox()
         self._record_q = queue.Queue()
         self._result_q = queue.Queue()
         self._relay_q = queue.Queue()
-        process = multiprocessing.current_process()
+        self._router = MessageRelayRouter(
+            request_queue=self._record_q,
+            response_queue=self._result_q,
+            relay_queue=self._relay_q,
+            mailbox=self._mailbox,
+        )
         self._iface = InterfaceRelay(
             record_q=self._record_q,
             result_q=self._result_q,
             relay_q=self._relay_q,
-            process=process,
-            process_check=False,
             mailbox=self._mailbox,
         )
         self._settings = settings
@@ -84,10 +80,11 @@ class StreamRecord:
         self._wait_thread_active()
     def _wait_thread_active(self) -> None:
-        self._iface.deliver_status().wait(timeout=-1)
+        self._iface.deliver_status().wait_or(timeout=None)
     def join(self) -> None:
         self._iface.join()
+        self._router.join()
         if self._thread:
             self._thread.join()
@@ -141,7 +138,6 @@ class StreamMux:
     _action_q: queue.Queue[StreamAction]
     _stopped: Event
     _pid_checked_ts: float | None
-    _mailbox: Mailbox
     def __init__(self) -> None:
         self._streams_lock = threading.Lock()
@@ -151,8 +147,6 @@ class StreamMux:
         self._stopped = Event()
         self._action_q = queue.Queue()
         self._pid_checked_ts = None
-        self._mailbox = Mailbox()
-        self._mailbox.enable_keepalive()
     def _get_stopped_event(self) -> Event:
         # TODO: clean this up, there should be a better way to abstract this
@@ -209,7 +203,7 @@ class StreamMux:
             return stream
     def _process_add(self, action: StreamAction) -> None:
-        stream = StreamRecord(action._data, mailbox=self._mailbox)
+        stream = StreamRecord(action._data)
         # run_id = action.stream_id  # will want to fix if a streamid != runid
         settings = action._data
         thread = StreamThread(
@@ -247,41 +241,51 @@ class StreamMux:
                 stream.drop()
                 stream.join()
-    def _on_probe_exit(self, probe_handle: MailboxProbe, stream: StreamRecord) -> None:
-        handle = probe_handle.get_mailbox_handle()
-        if handle:
-            result = handle.wait(timeout=0, release=False)
-            if not result:
-                return
-            probe_handle.set_probe_result(result)
-        handle = stream.interface.deliver_poll_exit()
-        probe_handle.set_mailbox_handle(handle)
-    def _on_progress_exit(self, progress_handle: MailboxProgress) -> None:
-        pass
-    def _on_progress_exit_all(
+    async def _finish_all_progress(
         self,
         progress_printer: progress.ProgressPrinter,
-        progress_all_handle: MailboxProgressAll,
+        streams_to_watch: dict[str, StreamRecord],
     ) -> None:
-        probe_handles: list[MailboxProbe] = []
-        progress_handles = progress_all_handle.get_progress_handles()
-        for progress_handle in progress_handles:
-            probe_handles.extend(progress_handle.get_probe_handles())
-        assert probe_handles
-        if self._check_orphaned():
-            self._stopped.set()
-        poll_exit_responses: list[pb.PollExitResponse] = []
-        for probe_handle in probe_handles:
-            result = probe_handle.get_probe_result()
-            if result:
-                poll_exit_responses.append(result.response.poll_exit_response)
-        progress_printer.update(poll_exit_responses)
+        """Poll the streams and display statistics about them.
+        This never returns and must be cancelled.
+        Args:
+            progress_printer: Printer to use for displaying finish progress.
+            streams_to_watch: Streams to poll for finish progress.
+        """
+        results: dict[str, pb.Result | None] = {}
+        async def loop_poll_stream(
+            stream_id: str,
+            stream: StreamRecord,
+        ) -> NoReturn:
+            while True:
+                start_time = time.monotonic()
+                handle = stream.interface.deliver_poll_exit()
+                results[stream_id] = await handle.wait_async(timeout=None)
+                elapsed_time = time.monotonic() - start_time
+                if elapsed_time < 1:
+                    await asyncio.sleep(1 - elapsed_time)
+        async def loop_update_printer() -> NoReturn:
+            while True:
+                poll_exit_responses: list[pb.PollExitResponse] = []
+                for result in results.values():
+                    if not result or not result.response:
+                        continue
+                    if poll_exit_response := result.response.poll_exit_response:
+                        poll_exit_responses.append(poll_exit_response)
+                progress_printer.update(poll_exit_responses)
+                await asyncio.sleep(1)
+        async with asyncio_compat.open_task_group() as task_group:
+            for stream_id, stream in streams_to_watch.items():
+                task_group.start_soon(loop_poll_stream(stream_id, stream))
+            task_group.start_soon(loop_update_printer())
     def _finish_all(self, streams: dict[str, StreamRecord], exit_code: int) -> None:
         if not streams:
@@ -291,7 +295,7 @@ class StreamMux:
         # fixme: for now we have a single printer for all streams,
         # and jupyter is disabled if at least single stream's setting set `_jupyter` to false
-        exit_handles = []
+        exit_handles: list[MailboxHandle[pb.Result]] = []
         # only finish started streams, non started streams failed early
         started_streams: dict[str, StreamRecord] = {}
@@ -302,27 +306,24 @@ class StreamMux:
         for stream in started_streams.values():
             handle = stream.interface.deliver_exit(exit_code)
-            handle.add_progress(self._on_progress_exit)
-            handle.add_probe(functools.partial(self._on_probe_exit, stream=stream))
             exit_handles.append(handle)
-            # this message is confusing, we should remove it
-            # Run._footer_exit_status_info(
-            #     exit_code, settings=stream._settings, printer=printer  # type: ignore
-            # )
-        with progress.progress_printer(printer) as progress_printer:
+        with progress.progress_printer(
+            printer,
+            default_text="Finishing up...",
+        ) as progress_printer:
             # todo: should we wait for the max timeout (?) of all exit handles or just wait forever?
             # timeout = max(stream._settings._exit_timeout for stream in streams.values())
-            got_result = self._mailbox.wait_all(
-                handles=exit_handles,
-                timeout=-1,
-                on_progress_all=functools.partial(
-                    self._on_progress_exit_all,
+            wait_all_with_progress(
+                exit_handles,
+                timeout=None,
+                progress_after=1,
+                display_progress=functools.partial(
+                    self._finish_all_progress,
                     progress_printer,
+                    started_streams,
                 ),
             )
-            assert got_result
         # These could be done in parallel in the future
         for _sid, stream in started_streams.items():
@@ -332,20 +333,16 @@ class StreamMux:
             sampled_history_handle = stream.interface.deliver_request_sampled_history()
             internal_messages_handle = stream.interface.deliver_internal_messages()
-            result = internal_messages_handle.wait(timeout=-1)
-            assert result
+            result = internal_messages_handle.wait_or(timeout=None)
             internal_messages_response = result.response.internal_messages_response
-            result = poll_exit_handle.wait(timeout=-1)
-            assert result
+            result = poll_exit_handle.wait_or(timeout=None)
             poll_exit_response = result.response.poll_exit_response
-            result = sampled_history_handle.wait(timeout=-1)
-            assert result
+            result = sampled_history_handle.wait_or(timeout=None)
             sampled_history = result.response.sampled_history_response
-            result = final_summary_handle.wait(timeout=-1)
-            assert result
+            result = final_summary_handle.wait_or(timeout=None)
             final_summary = result.response.get_summary_response
             Run._footer(

wandb/sdk/verify/verify.py CHANGED Viewed

@@ -1,6 +1,8 @@
 """Utilities for wandb verify."""
+import contextlib
 import getpass
+import io
 import os
 import time
 from functools import partial
@@ -163,8 +165,8 @@ def check_run(api: Api) -> bool:
         )
         print_results(failed_test_strings, False)
         return False
-    for key, value in prev_run.config.items():
-        if config[key] != value:
+    for key, value in config.items():
+        if prev_run.config.get(key) != value:
             failed_test_strings.append(
                 "Read config values don't match run config. Contact W&B for support."
             )
@@ -486,6 +488,56 @@ def check_wandb_version(api: Api) -> None:
     print_results(fail_string, warning)
+def check_sweeps(api: Api) -> bool:
+    print("Checking sweep creation and agent execution".ljust(72, "."), end="")  # noqa: T201
+    failed_test_strings: List[str] = []
+    sweep_config = {
+        "method": "random",
+        "metric": {"goal": "minimize", "name": "score"},
+        "parameters": {
+            "x": {"values": [0.01, 0.05, 0.1]},
+            "y": {"values": [1, 2, 3]},
+        },
+        "name": "verify_sweep",
+    }
+    try:
+        with contextlib.redirect_stdout(io.StringIO()):
+            sweep_id = wandb.sweep(
+                sweep=sweep_config, project=PROJECT_NAME, entity=api.default_entity
+            )
+    except Exception as e:
+        failed_test_strings.append(f"Failed to create sweep: {e}")
+        print_results(failed_test_strings, False)
+        return False
+    if not sweep_id:
+        failed_test_strings.append("Sweep creation returned an invalid ID.")
+        print_results(failed_test_strings, False)
+        return False
+    try:
+        def objective(config):
+            score = config.x**3 + config.y
+            return score
+        def main():
+            with wandb.init(project=PROJECT_NAME) as run:
+                score = objective(run.config)
+                run.log({"score": score})
+        wandb.agent(sweep_id, function=main, count=10)
+    except Exception as e:
+        failed_test_strings.append(f"Failed to run sweep agent: {e}")
+        print_results(failed_test_strings, False)
+        return False
+    print_results(failed_test_strings, False)
+    return len(failed_test_strings) == 0
 def retry_fn(fn: Callable) -> Any:
     ini_time = time.time()
     res = None

wandb/sdk/wandb_init.py CHANGED Viewed

@@ -34,7 +34,7 @@ from wandb.errors import CommError, Error, UsageError
 from wandb.errors.links import url_registry
 from wandb.errors.util import ProtobufErrorHandler
 from wandb.integration import sagemaker
-from wandb.sdk.lib import runid
+from wandb.sdk.lib import progress, runid
 from wandb.sdk.lib.paths import StrPath
 from wandb.util import _is_artifact_representation
@@ -42,7 +42,7 @@ from . import wandb_login, wandb_setup
 from .backend.backend import Backend
 from .lib import SummaryDisabled, filesystem, module, paths, printer, telemetry
 from .lib.deprecate import Deprecated, deprecate
-from .lib.mailbox import Mailbox, MailboxProgress
+from .mailbox import wait_with_progress
 from .wandb_helper import parse_config
 from .wandb_run import Run, TeardownHook, TeardownStage
 from .wandb_settings import Settings
@@ -293,6 +293,16 @@ class _WandbInit:
         settings.x_start_time = time.time()
+        # In shared mode, generate a unique label if not provided.
+        # The label is used to distinguish between system metrics and console logs
+        # from different writers to the same run.
+        if settings._shared and not settings.x_label:
+            # TODO: If executed in a known distributed environment (e.g. Ray or SLURM),
+            #   use the env vars to generate a label (e.g. SLURM_JOB_ID or RANK)
+            prefix = settings.host or ""
+            label = runid.generate_id()
+            settings.x_label = f"{prefix}-{label}" if prefix else label
         return settings
     def _load_autoresume_run_id(self, resume_file: pathlib.Path) -> str | None:
@@ -672,11 +682,11 @@ class _WandbInit:
         drun._Run__metadata = wandb.sdk.wandb_metadata.Metadata()
         # methods
-        drun.log = lambda data, *_, **__: drun.summary.update(data)  # type: ignore
-        drun.finish = lambda *_, **__: module.unset_globals()  # type: ignore
-        drun.join = drun.finish  # type: ignore
-        drun.define_metric = lambda *_, **__: wandb.sdk.wandb_metric.Metric("dummy")  # type: ignore
-        drun.save = lambda *_, **__: False  # type: ignore
+        drun.log = lambda data, *_, **__: drun.summary.update(data)  # type: ignore[method-assign]
+        drun.finish = lambda *_, **__: module.unset_globals()  # type: ignore[method-assign]
+        drun.join = drun.finish  # type: ignore[method-assign]
+        drun.define_metric = lambda *_, **__: wandb.sdk.wandb_metric.Metric("dummy")  # type: ignore[method-assign]
+        drun.save = lambda *_, **__: False  # type: ignore[method-assign]
         for symbol in (
             "alert",
             "finish_artifact",
@@ -723,7 +733,7 @@ class _WandbInit:
             def __call__(self, *args: Any, **kwargs: Any) -> _ChainableNoOp:
                 return _ChainableNoOp()
-        drun.log_artifact = _ChainableNoOpField()
+        drun.log_artifact = _ChainableNoOpField()  # type: ignore[method-assign]
         # attributes
         drun._start_time = time.time()
         drun._starting_step = 0
@@ -747,11 +757,6 @@ class _WandbInit:
         )
         return drun
-    def _on_progress_init(self, handle: MailboxProgress) -> None:
-        line = "Waiting for wandb.init()...\r"
-        percent_done = handle.percent_done
-        self.printer.progress_update(line, percent_done=percent_done)
     def init(self, settings: Settings, config: _ConfigParts) -> Run:  # noqa: C901
         self._logger.info("calling init triggers")
         trigger.call("on_init")
@@ -763,28 +768,18 @@ class _WandbInit:
             f"\nconfig: {config.base_no_artifacts}"
         )
-        if (
-            settings.reinit or (settings._jupyter and settings.reinit is not False)
-        ) and len(self._wl._global_run_stack) > 0:
-            if len(self._wl._global_run_stack) > 1:
-                wandb.termwarn(
-                    "Launching multiple wandb runs using Python's threading"
-                    " module is not well-supported."
-                    " Please use multiprocessing instead."
-                    " Finishing previous run before initializing another."
-                )
-            latest_run = self._wl._global_run_stack[-1]
-            self._logger.info(f"found existing run on stack: {latest_run.id}")
-            latest_run.finish()
-        elif wandb.run is not None and os.getpid() == wandb.run._init_pid:
-            self._logger.info("wandb.init() called when a run is still active")
+        if wandb.run is not None and os.getpid() == wandb.run._init_pid:
+            if settings.reinit:
+                self._logger.info(f"finishing previous run: {wandb.run.id}")
+                wandb.run.finish()
+            else:
+                self._logger.info("wandb.init() called while a run is active")
-            # NOTE: Updates telemetry on the pre-existing run.
-            with telemetry.context() as tel:
-                tel.feature.init_return_run = True
+                # NOTE: Updates telemetry on the pre-existing run.
+                with telemetry.context() as tel:
+                    tel.feature.init_return_run = True
-            return wandb.run
+                return wandb.run
         self._logger.info("starting backend")
@@ -798,12 +793,7 @@ class _WandbInit:
         else:
             service = None
-        mailbox = Mailbox()
-        backend = Backend(
-            settings=settings,
-            service=service,
-            mailbox=mailbox,
-        )
+        backend = Backend(settings=settings, service=service)
         backend.ensure_launched()
         self._logger.info("backend started and connected")
@@ -905,7 +895,6 @@ class _WandbInit:
         run._set_teardown_hooks(self._teardown_hooks)
         assert backend.interface
-        mailbox.enable_keepalive()
         backend.interface.publish_header()
         # Using GitRepo() blocks & can be slow, depending on user's current git setup.
@@ -921,16 +910,6 @@ class _WandbInit:
             )
         error: wandb.Error | None = None
-        # In shared mode, generate a unique label if not provided.
-        # The label is used to distinguish between system metrics and console logs
-        # from different writers to the same run.
-        if settings._shared and not settings.x_label:
-            # TODO: If executed in a known distributed environment (e.g. Ray or SLURM),
-            #   use the env vars to generate a label (e.g. SLURM_JOB_ID or RANK)
-            prefix = settings.host or ""
-            label = runid.generate_id()
-            settings.x_label = f"{prefix}-{label}" if prefix else label
         timeout = settings.init_timeout
         self._logger.info(
@@ -938,11 +917,18 @@ class _WandbInit:
         )
         run_init_handle = backend.interface.deliver_run(run)
-        result = run_init_handle.wait(
-            timeout=timeout,
-            on_progress=self._on_progress_init,
-            cancel=True,
-        )
+        async def display_init_message() -> None:
+            assert backend.interface
+            with progress.progress_printer(
+                self.printer,
+                default_text="Waiting for wandb.init()...",
+            ) as progress_printer:
+                await progress.loop_printing_operation_stats(
+                    progress_printer,
+                    backend.interface,
+                )
         # Raise an error if deliver_run failed.
         #
@@ -951,8 +937,16 @@ class _WandbInit:
         #
         # TODO: Remove try-except once x_disable_service is removed.
         try:
-            if not result or not result.run_result:
-                run_init_handle._cancel()
+            try:
+                result = wait_with_progress(
+                    run_init_handle,
+                    timeout=timeout,
+                    progress_after=1,
+                    display_progress=display_init_message,
+                )
+            except TimeoutError:
+                run_init_handle.cancel(backend.interface)
                 # This may either be an issue with the W&B server (a CommError)
                 # or a bug in the SDK (an Error). We cannot distinguish between
@@ -963,6 +957,8 @@ class _WandbInit:
                     " setting: `wandb.init(settings=wandb.Settings(init_timeout=120))`."
                 )
+            assert result.run_result
             if error := ProtobufErrorHandler.to_exception(result.run_result.error):
                 raise error
@@ -1004,13 +1000,13 @@ class _WandbInit:
         assert backend.interface
         run_start_handle = backend.interface.deliver_run_start(run)
-        # TODO: add progress to let user know we are doing something
-        run_start_result = run_start_handle.wait(timeout=30)
-        if run_start_result is None:
-            run_start_handle.abandon()
+        try:
+            # TODO: add progress to let user know we are doing something
+            run_start_handle.wait_or(timeout=30)
+        except TimeoutError:
+            pass
         assert self._wl is not None
-        self._wl._global_run_stack.append(run)
         self.run = run
         run._handle_launch_artifact_overrides()
@@ -1084,8 +1080,7 @@ def _attach(
     )
     # TODO: consolidate this codepath with wandb.init()
-    mailbox = Mailbox()
-    backend = Backend(settings=settings, service=service, mailbox=mailbox)
+    backend = Backend(settings=settings, service=service)
     backend.ensure_launched()
     logger.info("attach backend started and connected")
@@ -1097,14 +1092,13 @@ def _attach(
     run._set_backend(backend)
     assert backend.interface
-    mailbox.enable_keepalive()
     attach_handle = backend.interface.deliver_attach(attach_id)
-    # TODO: add progress to let user know we are doing something
-    attach_result = attach_handle.wait(timeout=30)
-    if not attach_result:
-        attach_handle.abandon()
+    try:
+        # TODO: add progress to let user know we are doing something
+        attach_result = attach_handle.wait_or(timeout=30)
+    except TimeoutError:
         raise UsageError("Timeout attaching to run")
     attach_response = attach_result.response.attach_response
     if attach_response.error and attach_response.error.message:
         raise UsageError(f"Failed to attach to run: {attach_response.error.message}")
@@ -1222,10 +1216,10 @@ def init(  # noqa: C901
             on the system, such as checking the git root or the current program
             file. If we can't infer the project name, the project will default to
             `"uncategorized"`.
-        dir: An absolute path to the directory where metadata and downloaded
-            files will be stored. When calling `download()` on an artifact, files
-            will be saved to this directory. If not specified, this defaults to
-            the `./wandb` directory.
+        dir: The absolute path to the directory where experiment logs and
+            metadata files are stored. If not specified, this defaults
+            to the `./wandb` directory. Note that this does not affect the
+            location where artifacts are stored when calling `download()`.
         id: A unique identifier for this run, used for resuming. It must be unique
             within the project and cannot be reused once a run is deleted. The
             identifier must not contain any of the following special characters:
@@ -1426,7 +1420,7 @@ def init(  # noqa: C901
     wl: wandb_setup._WandbSetup | None = None
     try:
-        wl = wandb.setup()
+        wl = wandb_setup._setup(start_service=False)
         wi = _WandbInit(wl, init_telemetry)
@@ -1468,6 +1462,9 @@ def init(  # noqa: C901
             _monkeypatch_tensorboard()
             init_telemetry.feature.tensorboard_sync = True
+        if run_settings.x_server_side_derived_summary:
+            init_telemetry.feature.server_side_derived_summary = True
         return wi.init(run_settings, run_config)
     except KeyboardInterrupt as e:

wandb/sdk/wandb_login.py CHANGED Viewed

@@ -162,8 +162,8 @@ class _WandbLogin:
             repeat=False,
         )
-    def configure_api_key(self, key: str) -> None:
-        """Saves the API key and updates the the global setup object."""
+    def try_save_api_key(self, key: str) -> None:
+        """Saves the API key to disk for future use."""
         if self._settings._notebook and not self._settings.silent:
             wandb.termwarn(
                 "If you're specifying your api key in code, ensure this "
@@ -172,7 +172,10 @@ class _WandbLogin:
                 "`wandb login` from the command line."
             )
         if key:
-            apikey.write_key(self._settings, key)
+            try:
+                apikey.write_key(self._settings, key)
+            except apikey.WriteNetrcError as e:
+                wandb.termwarn(str(e))
     def update_session(
         self,
@@ -305,7 +308,7 @@ def _login(
         wlogin._verify_login(key)
     if not key_is_pre_configured:
-        wlogin.configure_api_key(key)
+        wlogin.try_save_api_key(key)
         wlogin.update_session(key, status=key_status)
         wlogin._update_global_anonymous_setting()