PyPI - wandb - Versions diffs - 0.16.5__py3-none-any.whl → 0.17.0rc1__py3-none-any.whl - Mend

wandb 0.16.5__py3-none-any.whl → 0.17.0rc1__py3-none-any.whl

Files changed (141) hide show

package_readme.md +95 -0
wandb/__init__.py +2 -2
wandb/agents/pyagent.py +0 -1
wandb/analytics/sentry.py +2 -1
wandb/apis/importers/internals/protocols.py +30 -56
wandb/apis/importers/mlflow.py +13 -26
wandb/apis/importers/wandb.py +8 -14
wandb/apis/public/api.py +1 -0
wandb/apis/public/artifacts.py +1 -0
wandb/apis/public/files.py +1 -0
wandb/apis/public/history.py +1 -0
wandb/apis/public/jobs.py +1 -0
wandb/apis/public/projects.py +1 -0
wandb/apis/public/reports.py +1 -0
wandb/apis/public/runs.py +1 -0
wandb/apis/public/sweeps.py +1 -0
wandb/apis/public/teams.py +1 -0
wandb/apis/public/users.py +1 -0
wandb/apis/reports/v1/_blocks.py +2 -6
wandb/apis/reports/v2/gql.py +1 -0
wandb/apis/reports/v2/interface.py +3 -4
wandb/apis/reports/v2/internal.py +5 -8
wandb/cli/cli.py +7 -4
wandb/data_types.py +3 -3
wandb/env.py +35 -5
wandb/errors/__init__.py +5 -0
wandb/integration/catboost/catboost.py +1 -1
wandb/integration/fastai/__init__.py +1 -0
wandb/integration/keras/__init__.py +1 -0
wandb/integration/keras/keras.py +6 -6
wandb/integration/langchain/wandb_tracer.py +1 -0
wandb/integration/lightning/fabric/logger.py +1 -3
wandb/integration/metaflow/metaflow.py +41 -6
wandb/integration/openai/fine_tuning.py +77 -40
wandb/keras/__init__.py +1 -0
wandb/proto/v3/wandb_internal_pb2.py +364 -332
wandb/proto/v3/wandb_settings_pb2.py +2 -2
wandb/proto/v4/wandb_internal_pb2.py +322 -316
wandb/proto/v4/wandb_settings_pb2.py +2 -2
wandb/proto/wandb_internal_codegen.py +0 -25
wandb/sdk/artifacts/artifact.py +41 -13
wandb/sdk/artifacts/artifact_download_logger.py +1 -0
wandb/sdk/artifacts/artifact_file_cache.py +18 -4
wandb/sdk/artifacts/artifact_instance_cache.py +1 -0
wandb/sdk/artifacts/artifact_manifest.py +1 -0
wandb/sdk/artifacts/artifact_manifest_entry.py +1 -0
wandb/sdk/artifacts/artifact_manifests/artifact_manifest_v1.py +1 -0
wandb/sdk/artifacts/artifact_saver.py +21 -21
wandb/sdk/artifacts/artifact_state.py +1 -0
wandb/sdk/artifacts/artifact_ttl.py +1 -0
wandb/sdk/artifacts/exceptions.py +1 -0
wandb/sdk/artifacts/storage_handlers/azure_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/gcs_handler.py +13 -18
wandb/sdk/artifacts/storage_handlers/http_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/local_file_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/multi_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/s3_handler.py +5 -3
wandb/sdk/artifacts/storage_handlers/tracking_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/wb_artifact_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/wb_local_artifact_handler.py +1 -0
wandb/sdk/artifacts/storage_policies/wandb_storage_policy.py +1 -0
wandb/sdk/artifacts/storage_policy.py +1 -0
wandb/sdk/data_types/base_types/media.py +3 -6
wandb/sdk/data_types/helper_types/bounding_boxes_2d.py +3 -1
wandb/sdk/integration_utils/auto_logging.py +5 -6
wandb/sdk/integration_utils/data_logging.py +5 -1
wandb/sdk/interface/interface.py +72 -37
wandb/sdk/interface/interface_shared.py +7 -13
wandb/sdk/internal/datastore.py +1 -1
wandb/sdk/internal/handler.py +18 -2
wandb/sdk/internal/internal.py +0 -1
wandb/sdk/internal/internal_util.py +0 -1
wandb/sdk/internal/job_builder.py +4 -3
wandb/sdk/internal/profiler.py +1 -0
wandb/sdk/internal/run.py +1 -0
wandb/sdk/internal/sender.py +1 -1
wandb/sdk/internal/system/assets/gpu_amd.py +44 -44
wandb/sdk/internal/system/assets/gpu_apple.py +56 -11
wandb/sdk/internal/system/assets/interfaces.py +6 -8
wandb/sdk/internal/system/assets/open_metrics.py +2 -2
wandb/sdk/internal/system/assets/trainium.py +1 -3
wandb/sdk/launch/_launch.py +5 -0
wandb/sdk/launch/_project_spec.py +10 -23
wandb/sdk/launch/agent/agent.py +81 -37
wandb/sdk/launch/agent/config.py +80 -11
wandb/sdk/launch/builder/abstract.py +1 -0
wandb/sdk/launch/builder/build.py +28 -1
wandb/sdk/launch/builder/docker_builder.py +1 -0
wandb/sdk/launch/builder/kaniko_builder.py +149 -134
wandb/sdk/launch/builder/noop.py +1 -0
wandb/sdk/launch/create_job.py +61 -48
wandb/sdk/launch/environment/abstract.py +1 -0
wandb/sdk/launch/environment/gcp_environment.py +1 -0
wandb/sdk/launch/environment/local_environment.py +1 -0
wandb/sdk/launch/loader.py +1 -0
wandb/sdk/launch/registry/abstract.py +1 -0
wandb/sdk/launch/registry/azure_container_registry.py +1 -0
wandb/sdk/launch/registry/elastic_container_registry.py +1 -0
wandb/sdk/launch/registry/google_artifact_registry.py +1 -0
wandb/sdk/launch/registry/local_registry.py +1 -0
wandb/sdk/launch/runner/abstract.py +1 -0
wandb/sdk/launch/runner/kubernetes_monitor.py +4 -1
wandb/sdk/launch/runner/kubernetes_runner.py +4 -3
wandb/sdk/launch/runner/sagemaker_runner.py +11 -10
wandb/sdk/launch/sweeps/scheduler.py +4 -1
wandb/sdk/launch/sweeps/scheduler_sweep.py +1 -0
wandb/sdk/launch/sweeps/utils.py +1 -1
wandb/sdk/launch/utils.py +21 -3
wandb/sdk/lib/_settings_toposort_generated.py +1 -0
wandb/sdk/lib/fsm.py +8 -12
wandb/sdk/lib/gitlib.py +4 -4
wandb/sdk/lib/lazyloader.py +0 -1
wandb/sdk/lib/proto_util.py +1 -1
wandb/sdk/lib/retry.py +3 -2
wandb/sdk/lib/run_moment.py +7 -1
wandb/sdk/service/service.py +17 -15
wandb/sdk/verify/verify.py +2 -1
wandb/sdk/wandb_init.py +2 -8
wandb/sdk/wandb_manager.py +2 -2
wandb/sdk/wandb_require.py +5 -0
wandb/sdk/wandb_run.py +64 -46
wandb/sdk/wandb_settings.py +2 -1
wandb/sklearn/__init__.py +1 -0
wandb/sklearn/plot/__init__.py +1 -0
wandb/sklearn/plot/classifier.py +1 -0
wandb/sklearn/plot/clusterer.py +1 -0
wandb/sklearn/plot/regressor.py +1 -0
wandb/sklearn/plot/shared.py +1 -0
wandb/sklearn/utils.py +1 -0
wandb/testing/relay.py +4 -4
wandb/trigger.py +1 -0
wandb/util.py +40 -17
wandb/wandb_controller.py +0 -1
wandb/wandb_torch.py +1 -2
{wandb-0.16.5.dist-info → wandb-0.17.0rc1.dist-info}/METADATA +68 -69
{wandb-0.16.5.dist-info → wandb-0.17.0rc1.dist-info}/RECORD +139 -140
{wandb-0.16.5.dist-info → wandb-0.17.0rc1.dist-info}/WHEEL +1 -2
wandb/bin/apple_gpu_stats +0 -0
wandb-0.16.5.dist-info/top_level.txt +0 -1
{wandb-0.16.5.dist-info → wandb-0.17.0rc1.dist-info}/entry_points.txt +0 -0
{wandb-0.16.5.dist-info → wandb-0.17.0rc1.dist-info/licenses}/LICENSE +0 -0

wandb/sdk/launch/_project_spec.py CHANGED Viewed

@@ -2,6 +2,7 @@
 Arguments can come from a launch spec or call to wandb launch.
 """
 import enum
 import logging
 import os
@@ -14,6 +15,7 @@ import wandb.docker as docker
 from wandb.apis.internal import Api
 from wandb.errors import CommError
 from wandb.sdk.launch import utils
+from wandb.sdk.launch.utils import get_entrypoint_file
 from wandb.sdk.lib.runid import generate_id
 from .errors import LaunchError
@@ -119,6 +121,7 @@ class LaunchProject:
         self.override_args: List[str] = overrides.get("args", [])
         self.override_config: Dict[str, Any] = overrides.get("run_config", {})
         self.override_artifacts: Dict[str, Any] = overrides.get("artifacts", {})
+        self.override_files: Dict[str, Any] = overrides.get("files", {})
         self.override_entrypoint: Optional[EntryPoint] = None
         self.override_dockerfile: Optional[str] = overrides.get("dockerfile")
         self.deps_type: Optional[str] = None
@@ -127,15 +130,15 @@ class LaunchProject:
         self._queue_name: Optional[str] = None
         self._queue_entity: Optional[str] = None
         self._run_queue_item_id: Optional[str] = None
-        self._entry_point: Optional[
-            EntryPoint
-        ] = None  # todo: keep multiple entrypoint support?
+        self._entry_point: Optional[EntryPoint] = (
+            None  # todo: keep multiple entrypoint support?
+        )
         override_entrypoint = overrides.get("entry_point")
         if override_entrypoint:
             _logger.info("Adding override entry point")
             self.override_entrypoint = EntryPoint(
-                name=_get_entrypoint_file(override_entrypoint),
+                name=get_entrypoint_file(override_entrypoint),
                 command=override_entrypoint,
             )
@@ -536,24 +539,6 @@ class LaunchProject:
                 self.git_version = branch_name
-def _get_entrypoint_file(entrypoint: List[str]) -> Optional[str]:
-    """Get the entrypoint file from the given command.
-    Args:
-        entrypoint (List[str]): List of command and arguments.
-    Returns:
-        Optional[str]: The entrypoint file if found, otherwise None.
-    """
-    if not entrypoint:
-        return None
-    if entrypoint[0].endswith(".py") or entrypoint[0].endswith(".sh"):
-        return entrypoint[0]
-    if len(entrypoint) < 2:
-        return None
-    return entrypoint[1]
 class EntryPoint:
     """An entry point into a wandb launch specification."""
@@ -570,7 +555,9 @@ class EntryPoint:
     def update_entrypoint_path(self, new_path: str) -> None:
         """Updates the entrypoint path to a new path."""
-        if len(self.command) == 2 and self.command[0] in ["python", "bash"]:
+        if len(self.command) == 2 and (
+            self.command[0].startswith("python") or self.command[0] == "bash"
+        ):
             self.command[1] = new_path

wandb/sdk/launch/agent/agent.py CHANGED Viewed

@@ -1,4 +1,5 @@
 """Implementation of launch agent."""
 import asyncio
 import logging
 import os
@@ -45,7 +46,10 @@ MAX_RESUME_COUNT = 5
 RUN_INFO_GRACE_PERIOD = 60
-MAX_WAIT_RUN_STOPPED = 60
+DEFAULT_STOPPED_RUN_TIMEOUT = 60
+DEFAULT_PRINT_INTERVAL = 5 * 60
+VERBOSE_PRINT_INTERVAL = 20
 _env_timeout = os.environ.get("WANDB_LAUNCH_START_TIMEOUT")
 if _env_timeout:
@@ -105,30 +109,29 @@ def _max_from_config(
     return max_from_config
-def _is_scheduler_job(run_spec: Dict[str, Any]) -> bool:
-    """Determine whether a job/runSpec is a sweep scheduler."""
-    if not run_spec:
-        _logger.debug("Recieved runSpec in _is_scheduler_job that was empty")
+class InternalAgentLogger:
+    def __init__(self, verbosity=0):
+        self._print_to_terminal = verbosity >= 2
-    if run_spec.get("uri") != Scheduler.PLACEHOLDER_URI:
-        return False
-    if run_spec.get("resource") == "local-process":
-        # Any job pushed to a run queue that has a scheduler uri is
-        # allowed to use local-process
-        if run_spec.get("job"):
-            return True
+    def error(self, message: str):
+        if self._print_to_terminal:
+            wandb.termerror(f"{LOG_PREFIX}{message}")
+        _logger.error(f"{LOG_PREFIX}{message}")
-        # If a scheduler is local-process and run through CLI, also
-        #    confirm command is in format: [wandb scheduler <sweep>]
-        cmd = run_spec.get("overrides", {}).get("entry_point", [])
-        if len(cmd) < 3:
-            return False
+    def warn(self, message: str):
+        if self._print_to_terminal:
+            wandb.termwarn(f"{LOG_PREFIX}{message}")
+        _logger.warn(f"{LOG_PREFIX}{message}")
-        if cmd[:2] != ["wandb", "scheduler"]:
-            return False
+    def info(self, message: str):
+        if self._print_to_terminal:
+            wandb.termlog(f"{LOG_PREFIX}{message}")
+        _logger.info(f"{LOG_PREFIX}{message}")
-    return True
+    def debug(self, message: str):
+        if self._print_to_terminal:
+            wandb.termlog(f"{LOG_PREFIX}{message}")
+        _logger.debug(f"{LOG_PREFIX}{message}")
 class LaunchAgent:
@@ -184,7 +187,13 @@ class LaunchAgent:
         self._max_jobs = _max_from_config(config, "max_jobs")
         self._max_schedulers = _max_from_config(config, "max_schedulers")
         self._secure_mode = config.get("secure_mode", False)
+        self._verbosity = config.get("verbosity", 0)
+        self._internal_logger = InternalAgentLogger(verbosity=self._verbosity)
+        self._last_status_print_time = 0.0
         self.default_config: Dict[str, Any] = config
+        self._stopped_run_timeout = config.get(
+            "stopped_run_timeout", DEFAULT_STOPPED_RUN_TIMEOUT
+        )
         # Get agent version from env var if present, otherwise wandb version
         self.version: str = "wandb@" + wandb.__version__
@@ -228,6 +237,33 @@ class LaunchAgent:
         self._name = agent_response["name"]
         self._init_agent_run()
+    def _is_scheduler_job(self, run_spec: Dict[str, Any]) -> bool:
+        """Determine whether a job/runSpec is a sweep scheduler."""
+        if not run_spec:
+            self._internal_logger.debug(
+                "Recieved runSpec in _is_scheduler_job that was empty"
+            )
+        if run_spec.get("uri") != Scheduler.PLACEHOLDER_URI:
+            return False
+        if run_spec.get("resource") == "local-process":
+            # Any job pushed to a run queue that has a scheduler uri is
+            # allowed to use local-process
+            if run_spec.get("job"):
+                return True
+            # If a scheduler is local-process and run through CLI, also
+            #    confirm command is in format: [wandb scheduler <sweep>]
+            cmd = run_spec.get("overrides", {}).get("entry_point", [])
+            if len(cmd) < 3:
+                return False
+            if cmd[:2] != ["wandb", "scheduler"]:
+                return False
+        return True
     async def fail_run_queue_item(
         self,
         run_queue_item_id: str,
@@ -298,6 +334,7 @@ class LaunchAgent:
     def print_status(self) -> None:
         """Prints the current status of the agent."""
+        self._last_status_print_time = time.time()
         output_str = "agent "
         if self._name:
             output_str += f"{self._name} "
@@ -344,8 +381,8 @@ class LaunchAgent:
             if run_state.lower() != "pending":
                 return True
         except CommError:
-            _logger.info(
-                f"Run {entity}/{project}/{run_id} with rqi id: {rqi_id} did not have associated run"
+            self._internal_logger.info(
+                f"Run {entity}/{project}/{run_id} with rqi id: {rqi_id} did not have associated run",
             )
         return False
@@ -361,8 +398,8 @@ class LaunchAgent:
             job_and_run_status.entity is not None
             and job_and_run_status.entity != self._entity
         ):
-            _logger.info(
-                "Skipping check for completed run status because run is on a different entity than agent"
+            self._internal_logger.info(
+                "Skipping check for completed run status because run is on a different entity than agent",
             )
         elif exception is not None:
             tb_str = traceback.format_exception(
@@ -378,8 +415,8 @@ class LaunchAgent:
                 fnames,
             )
         elif job_and_run_status.project is None or job_and_run_status.run_id is None:
-            _logger.error(
-                f"called finish_thread_id on thread whose tracker has no project or run id. RunQueueItemID: {job_and_run_status.run_queue_item_id}"
+            self._internal_logger.info(
+                f"called finish_thread_id on thread whose tracker has no project or run id. RunQueueItemID: {job_and_run_status.run_queue_item_id}",
             )
             wandb.termerror(
                 "Missing project or run id on thread called finish thread id"
@@ -430,7 +467,9 @@ class LaunchAgent:
                     job_and_run_status.run_queue_item_id, _msg, "run", fnames
                 )
         else:
-            _logger.info(f"Finish thread id {thread_id} had no exception and no run")
+            self._internal_logger.info(
+                f"Finish thread id {thread_id} had no exception and no run"
+            )
             wandb._sentry.exception(
                 "launch agent called finish thread id on thread without run or exception"
             )
@@ -458,7 +497,7 @@ class LaunchAgent:
         await self.update_status(AGENT_RUNNING)
         # parse job
-        _logger.info("Parsing launch spec")
+        self._internal_logger.info("Parsing launch spec")
         launch_spec = job["runSpec"]
         # Abort if this job attempts to override secure mode
@@ -511,6 +550,10 @@ class LaunchAgent:
             KeyboardInterrupt: if the agent is requested to stop.
         """
         self.print_status()
+        if self._verbosity == 0:
+            print_interval = DEFAULT_PRINT_INTERVAL
+        else:
+            print_interval = VERBOSE_PRINT_INTERVAL
         try:
             while True:
                 job = None
@@ -532,7 +575,7 @@ class LaunchAgent:
                             file_saver = RunQueueItemFileSaver(
                                 self._wandb_run, job["runQueueItemId"]
                             )
-                            if _is_scheduler_job(job.get("runSpec", {})):
+                            if self._is_scheduler_job(job.get("runSpec", {})):
                                 # If job is a scheduler, and we are already at the cap, ignore,
                                 #    don't ack, and it will be pushed back onto the queue in 1 min
                                 if self.num_running_schedulers >= self._max_schedulers:
@@ -567,6 +610,7 @@ class LaunchAgent:
                         await self.update_status(AGENT_POLLING)
                     else:
                         await self.update_status(AGENT_RUNNING)
+                if time.time() - self._last_status_print_time > print_interval:
                     self.print_status()
                 if self.num_running_jobs == self._max_jobs or job is None:
@@ -634,14 +678,14 @@ class LaunchAgent:
         await self.check_sweep_state(launch_spec, api)
         job_tracker.update_run_info(project)
-        _logger.info("Fetching and validating project...")
+        self._internal_logger.info("Fetching and validating project...")
         project.fetch_and_validate_project()
-        _logger.info("Fetching resource...")
+        self._internal_logger.info("Fetching resource...")
         resource = launch_spec.get("resource") or "local-container"
         backend_config: Dict[str, Any] = {
             PROJECT_SYNCHRONOUS: False,  # agent always runs async
         }
-        _logger.info("Loading backend")
+        self._internal_logger.info("Loading backend")
         override_build_config = launch_spec.get("builder")
         _, build_config, registry_config = construct_agent_configs(
@@ -661,13 +705,13 @@ class LaunchAgent:
             assert entrypoint is not None
             image_uri = await builder.build_image(project, entrypoint, job_tracker)
-        _logger.info("Backend loaded...")
+        self._internal_logger.info("Backend loaded...")
         if isinstance(backend, LocalProcessRunner):
             run = await backend.run(project, image_uri)
         else:
             assert image_uri
             run = await backend.run(project, image_uri)
-        if _is_scheduler_job(launch_spec):
+        if self._is_scheduler_job(launch_spec):
             with self._jobs_lock:
                 self._jobs[thread_id].is_scheduler = True
             wandb.termlog(
@@ -700,7 +744,7 @@ class LaunchAgent:
                 if stopped_time is None:
                     stopped_time = time.time()
                 else:
-                    if time.time() - stopped_time > MAX_WAIT_RUN_STOPPED:
+                    if time.time() - stopped_time > self._stopped_run_timeout:
                         await run.cancel()
             await asyncio.sleep(AGENT_POLLING_INTERVAL)
@@ -720,7 +764,7 @@ class LaunchAgent:
                     project=launch_spec["project"],
                 )
             except Exception as e:
-                _logger.debug(f"Fetch sweep state error: {e}")
+                self._internal_logger.debug(f"Fetch sweep state error: {e}")
                 state = None
             if state != "RUNNING" and state != "PAUSED":

wandb/sdk/launch/agent/config.py CHANGED Viewed

@@ -80,17 +80,7 @@ class RegistryConfig(BaseModel):
     @validator("uri")  # type: ignore
     @classmethod
     def validate_uri(cls, uri: str) -> str:
-        for regex in [
-            GCP_ARTIFACT_REGISTRY_URI_REGEX,
-            AZURE_CONTAINER_REGISTRY_URI_REGEX,
-            ELASTIC_CONTAINER_REGISTRY_URI_REGEX,
-        ]:
-            if regex.match(uri):
-                return uri
-        raise ValueError(
-            "Invalid uri. URI must be a repository URI for an "
-            "ECR, ACR, or GCP Artifact Registry."
-        )
+        return validate_registry_uri(uri)
 class EnvironmentConfig(BaseModel):
@@ -186,6 +176,14 @@ class BuilderConfig(BaseModel):
         """Right now there are no required fields for docker builds."""
         return values
+    @validator("destination")  # type: ignore
+    @classmethod
+    def validate_destination(cls, destination: Optional[str]) -> Optional[str]:
+        """Validate that the destination is a valid container registry URI."""
+        if destination is None:
+            return None
+        return validate_registry_uri(destination)
 class AgentConfig(BaseModel):
     """Configuration for the Launch agent."""
@@ -225,6 +223,77 @@ class AgentConfig(BaseModel):
         None,
         description="The builder to use.",
     )
+    verbosity: Optional[int] = Field(
+        0,
+        description="How verbose to print, 0 = default, 1 = verbose, 2 = very verbose",
+    )
+    stopped_run_timeout: Optional[int] = Field(
+        60,
+        description="How many seconds to wait after receiving the stop command before forcibly cancelling a run.",
+    )
     class Config:
         extra = "forbid"
+def validate_registry_uri(uri: str) -> str:
+    """Validate that the registry URI is a valid container registry URI.
+    The URI should resolve to an image name in a container registry. The recognized
+    formats are for ECR, ACR, and GCP Artifact Registry. If the URI does not match
+    any of these formats, a warning is printed indicating the registry type is not
+    recognized and the agent can't guarantee that images can be pushed.
+    If the format is recognized but does not resolve to an image name, an
+    error is raised. For example, if the URI is an ECR URI but does not include
+    an image name or includes a tag as well as an image name, an error is raised.
+    """
+    tag_msg = (
+        "Destination for built images may not include a tag, but the URI provided "
+        "includes the suffix '{tag}'. Please remove the tag and try again. The agent "
+        "will automatically tag each image with a unique hash of the source code."
+    )
+    if uri.startswith("https://"):
+        uri = uri[8:]
+    match = GCP_ARTIFACT_REGISTRY_URI_REGEX.match(uri)
+    if match:
+        if match.group("tag"):
+            raise ValueError(tag_msg.format(tag=match.group("tag")))
+        if not match.group("image_name"):
+            raise ValueError(
+                "An image name must be specified in the URI for a GCP Artifact Registry. "
+                "Please provide a uri with the format "
+                "'https://<region>-docker.pkg.dev/<project>/<repository>/<image>'."
+            )
+        return uri
+    match = AZURE_CONTAINER_REGISTRY_URI_REGEX.match(uri)
+    if match:
+        if match.group("tag"):
+            raise ValueError(tag_msg.format(tag=match.group("tag")))
+        if not match.group("repository"):
+            raise ValueError(
+                "A repository name must be specified in the URI for an "
+                "Azure Container Registry. Please provide a uri with the format "
+                "'https://<registry-name>.azurecr.io/<repository>'."
+            )
+        return uri
+    match = ELASTIC_CONTAINER_REGISTRY_URI_REGEX.match(uri)
+    if match:
+        if match.group("tag"):
+            raise ValueError(tag_msg.format(tag=match.group("tag")))
+        if not match.group("repository"):
+            raise ValueError(
+                "A repository name must be specified in the URI for an "
+                "Elastic Container Registry. Please provide a uri with the format "
+                "'https://<account-id>.dkr.ecr.<region>.amazonaws.com/<repository>'."
+            )
+        return uri
+    wandb.termwarn(
+        f"Unable to recognize registry type in URI {uri}. You are responsible "
+        "for ensuring the agent can push images to this registry."
+    )
+    return uri

wandb/sdk/launch/builder/abstract.py CHANGED Viewed

@@ -1,4 +1,5 @@
 """Abstract plugin class defining the interface needed to build container images for W&B Launch."""
 from abc import ABC, abstractmethod
 from typing import TYPE_CHECKING, Any, Dict, Optional

wandb/sdk/launch/builder/build.py CHANGED Viewed

@@ -237,7 +237,11 @@ def get_base_setup(
     CPU version is built on python, Accelerator version is built on user provided.
     """
-    python_base_image = f"python:{py_version}-buster"
+    minor = int(py_version.split(".")[1])
+    if minor < 12:
+        python_base_image = f"python:{py_version}-buster"
+    else:
+        python_base_image = f"python:{py_version}-bookworm"
     if launch_project.accelerator_base_image:
         _logger.info(
             f"Using accelerator base image: {launch_project.accelerator_base_image}"
@@ -311,6 +315,11 @@ def get_env_vars_dict(
     _inject_wandb_config_env_vars(
         launch_project.override_config, env_vars, max_env_length
     )
+    _inject_file_overrides_env_vars(
+        launch_project.override_files, env_vars, max_env_length
+    )
     artifacts = {}
     # if we're spinning up a launch process from a job
     # we should tell the run to use that artifact
@@ -677,3 +686,21 @@ def _inject_wandb_config_env_vars(
     ]
     config_chunks_dict = {f"WANDB_CONFIG_{i}": chunk for i, chunk in enumerate(chunks)}
     env_dict.update(config_chunks_dict)
+def _inject_file_overrides_env_vars(
+    overrides: Dict[str, Any], env_dict: Dict[str, Any], maximum_env_length: int
+) -> None:
+    str_overrides = json.dumps(overrides)
+    if len(str_overrides) <= maximum_env_length:
+        env_dict["WANDB_LAUNCH_FILE_OVERRIDES"] = str_overrides
+        return
+    chunks = [
+        str_overrides[i : i + maximum_env_length]
+        for i in range(0, len(str_overrides), maximum_env_length)
+    ]
+    overrides_chunks_dict = {
+        f"WANDB_LAUNCH_FILE_OVERRIDES_{i}": chunk for i, chunk in enumerate(chunks)
+    }
+    env_dict.update(overrides_chunks_dict)

wandb/sdk/launch/builder/docker_builder.py CHANGED Viewed

@@ -1,4 +1,5 @@
 """Implementation of the docker builder."""
 import logging
 import os
 from typing import Any, Dict, Optional

wandb 0.16.5__py3-none-any.whl → 0.17.0rc1__py3-none-any.whl

wandb 0.16.5__py3-none-any.whl → 0.17.0rc1__py3-none-any.whl