PyPI - wandb - Versions diffs - 0.16.6__py3-none-any.whl → 0.17.0__py3-none-any.whl - Mend

wandb 0.16.6-py3-none-any.whl → 0.17.0-py3-none-any.whl

Files changed (193) hide show

package_readme.md +95 -0
wandb/__init__.py +2 -3
wandb/agents/pyagent.py +0 -1
wandb/analytics/sentry.py +2 -1
wandb/apis/importers/internals/internal.py +0 -1
wandb/apis/importers/internals/protocols.py +30 -56
wandb/apis/importers/mlflow.py +13 -26
wandb/apis/importers/wandb.py +8 -14
wandb/apis/internal.py +0 -3
wandb/apis/public/api.py +55 -3
wandb/apis/public/artifacts.py +1 -0
wandb/apis/public/files.py +1 -0
wandb/apis/public/history.py +1 -0
wandb/apis/public/jobs.py +17 -4
wandb/apis/public/projects.py +1 -0
wandb/apis/public/reports.py +1 -0
wandb/apis/public/runs.py +15 -17
wandb/apis/public/sweeps.py +1 -0
wandb/apis/public/teams.py +1 -0
wandb/apis/public/users.py +1 -0
wandb/apis/reports/v1/_blocks.py +3 -7
wandb/apis/reports/v2/gql.py +1 -0
wandb/apis/reports/v2/interface.py +3 -4
wandb/apis/reports/v2/internal.py +5 -8
wandb/cli/cli.py +92 -22
wandb/data_types.py +9 -6
wandb/docker/__init__.py +1 -1
wandb/env.py +38 -8
wandb/errors/__init__.py +5 -0
wandb/errors/term.py +10 -2
wandb/filesync/step_checksum.py +1 -4
wandb/filesync/step_prepare.py +4 -24
wandb/filesync/step_upload.py +4 -106
wandb/filesync/upload_job.py +0 -76
wandb/integration/catboost/catboost.py +1 -1
wandb/integration/fastai/__init__.py +1 -0
wandb/integration/huggingface/resolver.py +2 -2
wandb/integration/keras/__init__.py +1 -0
wandb/integration/keras/callbacks/metrics_logger.py +1 -1
wandb/integration/keras/keras.py +7 -7
wandb/integration/langchain/wandb_tracer.py +1 -0
wandb/integration/lightning/fabric/logger.py +1 -3
wandb/integration/metaflow/metaflow.py +41 -6
wandb/integration/openai/fine_tuning.py +3 -3
wandb/integration/prodigy/prodigy.py +1 -1
wandb/old/summary.py +1 -1
wandb/plot/confusion_matrix.py +1 -1
wandb/plot/pr_curve.py +2 -1
wandb/plot/roc_curve.py +2 -1
wandb/{plots → plot}/utils.py +13 -25
wandb/proto/v3/wandb_internal_pb2.py +364 -332
wandb/proto/v3/wandb_settings_pb2.py +2 -2
wandb/proto/v3/wandb_telemetry_pb2.py +10 -10
wandb/proto/v4/wandb_internal_pb2.py +322 -316
wandb/proto/v4/wandb_settings_pb2.py +2 -2
wandb/proto/v4/wandb_telemetry_pb2.py +10 -10
wandb/proto/wandb_deprecated.py +7 -1
wandb/proto/wandb_internal_codegen.py +3 -29
wandb/sdk/artifacts/artifact.py +26 -11
wandb/sdk/artifacts/artifact_download_logger.py +1 -0
wandb/sdk/artifacts/artifact_file_cache.py +18 -4
wandb/sdk/artifacts/artifact_instance_cache.py +1 -0
wandb/sdk/artifacts/artifact_manifest.py +1 -0
wandb/sdk/artifacts/artifact_manifest_entry.py +7 -3
wandb/sdk/artifacts/artifact_manifests/artifact_manifest_v1.py +1 -0
wandb/sdk/artifacts/artifact_saver.py +2 -8
wandb/sdk/artifacts/artifact_state.py +1 -0
wandb/sdk/artifacts/artifact_ttl.py +1 -0
wandb/sdk/artifacts/exceptions.py +1 -0
wandb/sdk/artifacts/storage_handlers/azure_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/gcs_handler.py +13 -18
wandb/sdk/artifacts/storage_handlers/http_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/local_file_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/multi_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/s3_handler.py +5 -3
wandb/sdk/artifacts/storage_handlers/tracking_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/wb_artifact_handler.py +1 -0
wandb/sdk/artifacts/storage_handlers/wb_local_artifact_handler.py +1 -0
wandb/sdk/artifacts/storage_policies/wandb_storage_policy.py +3 -42
wandb/sdk/artifacts/storage_policy.py +2 -12
wandb/sdk/data_types/_dtypes.py +8 -8
wandb/sdk/data_types/base_types/media.py +3 -6
wandb/sdk/data_types/helper_types/bounding_boxes_2d.py +3 -1
wandb/sdk/data_types/image.py +1 -1
wandb/sdk/data_types/video.py +1 -1
wandb/sdk/integration_utils/auto_logging.py +5 -6
wandb/sdk/integration_utils/data_logging.py +10 -6
wandb/sdk/interface/interface.py +68 -32
wandb/sdk/interface/interface_shared.py +7 -13
wandb/sdk/internal/datastore.py +1 -1
wandb/sdk/internal/file_pusher.py +2 -5
wandb/sdk/internal/file_stream.py +5 -18
wandb/sdk/internal/handler.py +18 -2
wandb/sdk/internal/internal.py +0 -1
wandb/sdk/internal/internal_api.py +1 -129
wandb/sdk/internal/internal_util.py +0 -1
wandb/sdk/internal/job_builder.py +159 -45
wandb/sdk/internal/profiler.py +1 -0
wandb/sdk/internal/progress.py +0 -28
wandb/sdk/internal/run.py +1 -0
wandb/sdk/internal/sender.py +1 -2
wandb/sdk/internal/system/assets/gpu_amd.py +44 -44
wandb/sdk/internal/system/assets/gpu_apple.py +56 -11
wandb/sdk/internal/system/assets/interfaces.py +6 -8
wandb/sdk/internal/system/assets/open_metrics.py +2 -2
wandb/sdk/internal/system/assets/trainium.py +1 -3
wandb/sdk/launch/__init__.py +9 -1
wandb/sdk/launch/_launch.py +4 -24
wandb/sdk/launch/_launch_add.py +1 -3
wandb/sdk/launch/_project_spec.py +186 -224
wandb/sdk/launch/agent/agent.py +37 -13
wandb/sdk/launch/agent/config.py +72 -14
wandb/sdk/launch/builder/abstract.py +69 -1
wandb/sdk/launch/builder/build.py +156 -555
wandb/sdk/launch/builder/context_manager.py +235 -0
wandb/sdk/launch/builder/docker_builder.py +8 -23
wandb/sdk/launch/builder/kaniko_builder.py +12 -25
wandb/sdk/launch/builder/noop.py +1 -0
wandb/sdk/launch/builder/templates/dockerfile.py +92 -0
wandb/sdk/launch/create_job.py +47 -37
wandb/sdk/launch/environment/abstract.py +1 -0
wandb/sdk/launch/environment/gcp_environment.py +1 -0
wandb/sdk/launch/environment/local_environment.py +1 -0
wandb/sdk/launch/inputs/files.py +148 -0
wandb/sdk/launch/inputs/internal.py +217 -0
wandb/sdk/launch/inputs/manage.py +95 -0
wandb/sdk/launch/loader.py +1 -0
wandb/sdk/launch/registry/abstract.py +1 -0
wandb/sdk/launch/registry/azure_container_registry.py +1 -0
wandb/sdk/launch/registry/elastic_container_registry.py +1 -0
wandb/sdk/launch/registry/google_artifact_registry.py +2 -1
wandb/sdk/launch/registry/local_registry.py +1 -0
wandb/sdk/launch/runner/abstract.py +1 -0
wandb/sdk/launch/runner/kubernetes_monitor.py +1 -0
wandb/sdk/launch/runner/kubernetes_runner.py +9 -10
wandb/sdk/launch/runner/local_container.py +2 -3
wandb/sdk/launch/runner/local_process.py +8 -29
wandb/sdk/launch/runner/sagemaker_runner.py +21 -20
wandb/sdk/launch/runner/vertex_runner.py +8 -7
wandb/sdk/launch/sweeps/scheduler.py +4 -3
wandb/sdk/launch/sweeps/scheduler_sweep.py +2 -1
wandb/sdk/launch/sweeps/utils.py +3 -3
wandb/sdk/launch/utils.py +15 -140
wandb/sdk/lib/_settings_toposort_generated.py +0 -5
wandb/sdk/lib/fsm.py +8 -12
wandb/sdk/lib/gitlib.py +4 -4
wandb/sdk/lib/import_hooks.py +1 -1
wandb/sdk/lib/lazyloader.py +0 -1
wandb/sdk/lib/proto_util.py +23 -2
wandb/sdk/lib/redirect.py +19 -14
wandb/sdk/lib/retry.py +3 -2
wandb/sdk/lib/tracelog.py +1 -1
wandb/sdk/service/service.py +19 -16
wandb/sdk/verify/verify.py +2 -1
wandb/sdk/wandb_init.py +14 -55
wandb/sdk/wandb_manager.py +2 -2
wandb/sdk/wandb_require.py +5 -0
wandb/sdk/wandb_run.py +114 -56
wandb/sdk/wandb_settings.py +0 -48
wandb/sdk/wandb_setup.py +1 -1
wandb/sklearn/__init__.py +1 -0
wandb/sklearn/plot/__init__.py +1 -0
wandb/sklearn/plot/classifier.py +11 -12
wandb/sklearn/plot/clusterer.py +2 -1
wandb/sklearn/plot/regressor.py +1 -0
wandb/sklearn/plot/shared.py +1 -0
wandb/sklearn/utils.py +1 -0
wandb/testing/relay.py +4 -4
wandb/trigger.py +1 -0
wandb/util.py +67 -54
wandb/wandb_controller.py +2 -3
wandb/wandb_torch.py +1 -2
{wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/METADATA +67 -70
{wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/RECORD +177 -187
{wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/WHEEL +1 -2
wandb/bin/apple_gpu_stats +0 -0
wandb/catboost/__init__.py +0 -9
wandb/fastai/__init__.py +0 -9
wandb/keras/__init__.py +0 -18
wandb/lightgbm/__init__.py +0 -9
wandb/plots/__init__.py +0 -6
wandb/plots/explain_text.py +0 -36
wandb/plots/heatmap.py +0 -81
wandb/plots/named_entity.py +0 -43
wandb/plots/part_of_speech.py +0 -50
wandb/plots/plot_definitions.py +0 -768
wandb/plots/precision_recall.py +0 -121
wandb/plots/roc.py +0 -103
wandb/sacred/__init__.py +0 -3
wandb/xgboost/__init__.py +0 -9
wandb-0.16.6.dist-info/top_level.txt +0 -1
{wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/entry_points.txt +0 -0
{wandb-0.16.6.dist-info → wandb-0.17.0.dist-info/licenses}/LICENSE +0 -0

wandb/sdk/launch/_project_spec.py CHANGED Viewed

@@ -2,18 +2,20 @@
 Arguments can come from a launch spec or call to wandb launch.
 """
 import enum
+import json
 import logging
 import os
 import tempfile
 from copy import deepcopy
 from typing import TYPE_CHECKING, Any, Dict, List, Optional, cast
+from six.moves import shlex_quote
 import wandb
-import wandb.docker as docker
 from wandb.apis.internal import Api
 from wandb.errors import CommError
-from wandb.sdk.launch import utils
 from wandb.sdk.launch.utils import get_entrypoint_file
 from wandb.sdk.lib.runid import generate_id
@@ -33,15 +35,18 @@ IMAGE_TAG_MAX_LENGTH = 32
 class LaunchSource(enum.IntEnum):
-    WANDB: int = 1
-    GIT: int = 2
-    LOCAL: int = 3
-    DOCKER: int = 4
-    JOB: int = 5
+    """Enumeration of possible sources for a launch project.
+    Attributes:
+        DOCKER: Source is a Docker image. This can happen if a user runs
+            `wandb launch -d <docker-image>`.
+        JOB: Source is a job. This is the standard case.
+        SCHEDULER: Source is a wandb sweep scheduler command.
+    """
-class EntrypointDefaults(List[str]):
-    PYTHON = ["python", "main.py"]
+    DOCKER: int = 1
+    JOB: int = 2
+    SCHEDULER: int = 3
 class LaunchProject:
@@ -60,8 +65,16 @@ class LaunchProject:
     This class is stateful and certain methods can only be called after
     `LaunchProject.fetch_and_validate_project()` has been called.
+    Notes on the entrypoint:
+    - The entrypoint is the command that will be run inside the container.
+    - The LaunchProject stores two entrypoints
+        - The job entrypoint is the entrypoint specified in the job's config.
+        - The override entrypoint is the entrypoint specified in the launch spec.
+    - The override entrypoint takes precedence over the job entrypoint.
     """
+    # This init is way too long, and there are too many attributes on this sucker.
     def __init__(
         self,
         uri: Optional[str],
@@ -79,9 +92,6 @@ class LaunchProject:
         run_id: Optional[str],
         sweep_id: Optional[str] = None,
     ):
-        if uri is not None and utils.is_bare_wandb_uri(uri):
-            uri = api.settings("base_url") + uri
-            _logger.info(f"{LOG_PREFIX}Updating uri with base uri: {uri}")
         self.uri = uri
         self.job = job
         if job is not None:
@@ -105,74 +115,57 @@ class LaunchProject:
         self.accelerator_base_image: Optional[str] = resource_args_build.get(
             "accelerator", {}
         ).get("base_image") or resource_args_build.get("cuda", {}).get("base_image")
-        self._base_image: Optional[str] = launch_spec.get("base_image")
         self.docker_image: Optional[str] = docker_config.get(
             "docker_image"
         ) or launch_spec.get("image_uri")
-        uid = RESOURCE_UID_MAP.get(resource, 1000)
-        if self._base_image:
-            uid = docker.get_image_uid(self._base_image)
-            _logger.info(f"{LOG_PREFIX}Retrieved base image uid {uid}")
-        self.docker_user_id: int = docker_config.get("user_id", uid)
-        self.git_version: Optional[str] = git_info.get("version")
-        self.git_repo: Optional[str] = git_info.get("repo")
-        self.overrides = overrides
-        self.override_args: List[str] = overrides.get("args", [])
-        self.override_config: Dict[str, Any] = overrides.get("run_config", {})
-        self.override_artifacts: Dict[str, Any] = overrides.get("artifacts", {})
-        self.override_entrypoint: Optional[EntryPoint] = None
-        self.override_dockerfile: Optional[str] = overrides.get("dockerfile")
+        self.docker_user_id = docker_config.get("user_id", 1000)
+        self._entry_point: Optional[EntryPoint] = (
+            None  # todo: keep multiple entrypoint support?
+        )
+        self.init_overrides(overrides)
+        self.init_source()
+        self.init_git(git_info)
         self.deps_type: Optional[str] = None
         self._runtime: Optional[str] = None
         self.run_id = run_id or generate_id()
         self._queue_name: Optional[str] = None
         self._queue_entity: Optional[str] = None
         self._run_queue_item_id: Optional[str] = None
-        self._entry_point: Optional[
-            EntryPoint
-        ] = None  # todo: keep multiple entrypoint support?
-        override_entrypoint = overrides.get("entry_point")
-        if override_entrypoint:
-            _logger.info("Adding override entry point")
-            self.override_entrypoint = EntryPoint(
-                name=get_entrypoint_file(override_entrypoint),
-                command=override_entrypoint,
-            )
+        self._job_dockerfile: Optional[str] = None
+        self._job_build_context: Optional[str] = None
-        if overrides.get("sweep_id") is not None:
-            _logger.info("Adding override sweep id")
-            self.sweep_id = overrides["sweep_id"]
+    def init_source(self) -> None:
         if self.docker_image is not None:
             self.source = LaunchSource.DOCKER
             self.project_dir = None
         elif self.job is not None:
             self.source = LaunchSource.JOB
             self.project_dir = tempfile.mkdtemp()
-        elif self.uri is not None and utils._is_wandb_uri(self.uri):
-            _logger.info(f"URI {self.uri} indicates a wandb uri")
-            self.source = LaunchSource.WANDB
-            self.project_dir = tempfile.mkdtemp()
-        elif self.uri is not None and utils._is_git_uri(self.uri):
-            _logger.info(f"URI {self.uri} indicates a git uri")
-            self.source = LaunchSource.GIT
-            self.project_dir = tempfile.mkdtemp()
-        elif self.uri is not None and "placeholder-" in self.uri:
-            wandb.termlog(
-                f"{LOG_PREFIX}Launch received placeholder URI, replacing with local path."
+        if self.uri and self.uri.startswith("placeholder"):
+            self.source = LaunchSource.SCHEDULER
+            self.project_dir = os.getcwd()
+            self._entry_point = self.override_entrypoint
+    def init_git(self, git_info: Dict[str, str]) -> None:
+        self.git_version = git_info.get("version")
+        self.git_repo = git_info.get("repo")
+    def init_overrides(self, overrides: Dict[str, Any]) -> None:
+        """Initialize override attributes for a launch project."""
+        self.overrides = overrides
+        self.override_args: List[str] = overrides.get("args", [])
+        self.override_config: Dict[str, Any] = overrides.get("run_config", {})
+        self.override_artifacts: Dict[str, Any] = overrides.get("artifacts", {})
+        self.override_files: Dict[str, Any] = overrides.get("files", {})
+        self.override_entrypoint: Optional[EntryPoint] = None
+        self.override_dockerfile: Optional[str] = overrides.get("dockerfile")
+        override_entrypoint = overrides.get("entry_point")
+        if override_entrypoint:
+            _logger.info("Adding override entry point")
+            self.override_entrypoint = EntryPoint(
+                name=get_entrypoint_file(override_entrypoint),
+                command=override_entrypoint,
             )
-            self.uri = os.getcwd()
-            self.source = LaunchSource.LOCAL
-            self.project_dir = self.uri
-        else:
-            _logger.info(f"URI {self.uri} indicates a local uri")
-            # assume local
-            if self.uri is not None and not os.path.exists(self.uri):
-                raise LaunchError(
-                    "Assumed URI supplied is a local path but path is not valid"
-                )
-            self.source = LaunchSource.LOCAL
-            self.project_dir = self.uri
     def __repr__(self) -> str:
         """String representation of LaunchProject."""
@@ -211,6 +204,20 @@ class LaunchProject:
             launch_spec.get("sweep_id", {}),
         )
+    @property
+    def job_dockerfile(self) -> Optional[str]:
+        return self._job_dockerfile
+    @property
+    def job_build_context(self) -> Optional[str]:
+        return self._job_build_context
+    def set_job_dockerfile(self, dockerfile: str) -> None:
+        self._job_dockerfile = dockerfile
+    def set_job_build_context(self, build_context: str) -> None:
+        self._job_build_context = build_context
     @property
     def image_name(self) -> str:
         if self.docker_image is not None:
@@ -274,7 +281,7 @@ class LaunchProject:
             image (str): The image name to fill in for ${wandb-image}.
         Returns:
-            None
+            Dict[str, Any]: The resource args with all macros filled in.
         """
         update_dict = {
             "project_name": self.target_project,
@@ -324,8 +331,8 @@ class LaunchProject:
         self._docker_image = value
         self._ensure_not_docker_image_and_local_process()
-    def get_single_entry_point(self) -> Optional["EntryPoint"]:
-        """Returns the first entrypoint for the project, or None if no entry point was provided because a docker image was provided."""
+    def get_job_entry_point(self) -> Optional["EntryPoint"]:
+        """Returns the job entrypoint for the project."""
         # assuming project only has 1 entry point, pull that out
         # tmp fn until we figure out if we want to support multiple entry points or not
         if not self._entry_point:
@@ -336,8 +343,8 @@ class LaunchProject:
             return None
         return self._entry_point
-    def set_entry_point(self, command: List[str]) -> "EntryPoint":
-        """Add an entry point to the project."""
+    def set_job_entry_point(self, command: List[str]) -> "EntryPoint":
+        """Set job entrypoint for the project."""
         assert (
             self._entry_point is None
         ), "Cannot set entry point twice. Use LaunchProject.override_entrypoint"
@@ -358,51 +365,23 @@ class LaunchProject:
         """
         if self.source == LaunchSource.DOCKER:
             return
-        if self.source == LaunchSource.LOCAL:
-            if not self._entry_point:
-                wandb.termlog(
-                    f"{LOG_PREFIX}Entry point for repo not specified, defaulting to `python main.py`"
-                )
-                self.set_entry_point(EntrypointDefaults.PYTHON)
         elif self.source == LaunchSource.JOB:
             self._fetch_job()
-        else:
-            self._fetch_project_local(internal_api=self.api)
         assert self.project_dir is not None
-        # this prioritizes pip, and we don't support any cases where both are present conda projects when uploaded to
-        # wandb become pip projects via requirements.frozen.txt, wandb doesn't preserve conda envs
-        if os.path.exists(
-            os.path.join(self.project_dir, "requirements.txt")
-        ) or os.path.exists(os.path.join(self.project_dir, "requirements.frozen.txt")):
-            self.deps_type = "pip"
-        elif os.path.exists(os.path.join(self.project_dir, "environment.yml")):
-            self.deps_type = "conda"
+    # Let's make sure we document this very clearly.
     def get_image_source_string(self) -> str:
         """Returns a unique string identifying the source of an image."""
-        if self.source == LaunchSource.LOCAL:
-            # TODO: more correct to get a hash of local uri contents
-            assert isinstance(self.uri, str)
-            return self.uri
-        elif self.source == LaunchSource.JOB:
+        if self.source == LaunchSource.JOB:
             assert self._job_artifact is not None
             return f"{self._job_artifact.name}:v{self._job_artifact.version}"
-        elif self.source == LaunchSource.GIT:
-            assert isinstance(self.uri, str)
-            ret = self.uri
-            if self.git_version:
-                ret += self.git_version
-            return ret
-        elif self.source == LaunchSource.WANDB:
-            assert isinstance(self.uri, str)
-            return self.uri
         elif self.source == LaunchSource.DOCKER:
             assert isinstance(self.docker_image, str)
-            _logger.debug("")
             return self.docker_image
         else:
-            raise LaunchError("Unknown source type when determing image source string")
+            raise LaunchError(
+                "Unknown source type when determining image source string"
+            )
     def _ensure_not_docker_image_and_local_process(self) -> None:
         """Ensure that docker image is not specified with local-process resource runner.
@@ -430,111 +409,84 @@ class LaunchProject:
             raise LaunchError(
                 f"Error accessing job {self.job}: {msg} on {public_api.settings.get('base_url')}"
             )
-        job.configure_launch_project(self)
+        job.configure_launch_project(self)  # Why is this a method of the job?
         self._job_artifact = job._job_artifact
-    def _fetch_project_local(self, internal_api: Api) -> None:
-        """Fetch a project (either wandb run or git repo) into a local directory, returning the path to the local project directory."""
-        # these asserts are all guaranteed to pass, but are required by mypy
-        assert self.source != LaunchSource.LOCAL and self.source != LaunchSource.JOB
-        assert isinstance(self.uri, str)
-        assert self.project_dir is not None
-        _logger.info("Fetching project locally...")
-        if utils._is_wandb_uri(self.uri):
-            source_entity, source_project, source_run_name = utils.parse_wandb_uri(
-                self.uri
-            )
-            run_info = utils.fetch_wandb_project_run_info(
-                source_entity, source_project, source_run_name, internal_api
-            )
-            program_name = run_info.get("codePath") or run_info["program"]
-            self.python_version = run_info.get("python", "3")
-            downloaded_code_artifact = utils.check_and_download_code_artifacts(
-                source_entity,
-                source_project,
-                source_run_name,
-                internal_api,
-                self.project_dir,
-            )
-            if not downloaded_code_artifact:
-                if not run_info["git"]:
-                    raise LaunchError(
-                        "Reproducing a run requires either an associated git repo or a code artifact logged with `run.log_code()`"
-                    )
-                branch_name = utils._fetch_git_repo(
-                    self.project_dir,
-                    run_info["git"]["remote"],
-                    run_info["git"]["commit"],
-                )
-                if self.git_version is None:
-                    self.git_version = branch_name
-                patch = utils.fetch_project_diff(
-                    source_entity, source_project, source_run_name, internal_api
-                )
-                if patch:
-                    utils.apply_patch(patch, self.project_dir)
-                # For cases where the entry point wasn't checked into git
-                if not os.path.exists(os.path.join(self.project_dir, program_name)):
-                    downloaded_entrypoint = utils.download_entry_point(
-                        source_entity,
-                        source_project,
-                        source_run_name,
-                        internal_api,
-                        program_name,
-                        self.project_dir,
-                    )
-                    if not downloaded_entrypoint:
-                        raise LaunchError(
-                            f"Entrypoint file: {program_name} does not exist, "
-                            "and could not be downloaded. Please specify the entrypoint for this run."
-                        )
-            if (
-                "_session_history.ipynb" in os.listdir(self.project_dir)
-                or ".ipynb" in program_name
-            ):
-                program_name = utils.convert_jupyter_notebook_to_script(
-                    program_name, self.project_dir
-                )
+    def get_env_vars_dict(self, api: Api, max_env_length: int) -> Dict[str, str]:
+        """Generate environment variables for the project.
-            # Download any frozen requirements
-            utils.download_wandb_python_deps(
-                source_entity,
-                source_project,
-                source_run_name,
-                internal_api,
-                self.project_dir,
-            )
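+        Arguments:
+        api: Api whose settings supply the base URL and the default API key.
+        max_env_length: Maximum length of a single config or file-override
+            environment variable value; longer values are split into chunks.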
-            if not self._entry_point:
-                _, ext = os.path.splitext(program_name)
-                if ext == ".py":
-                    entry_point = ["python", program_name]
-                elif ext == ".sh":
-                    command = os.environ.get("SHELL", "bash")
-                    entry_point = [command, program_name]
-                else:
-                    raise LaunchError(f"Unsupported entrypoint: {program_name}")
-                self.set_entry_point(entry_point)
-            if not self.override_args:
-                self.override_args = run_info["args"]
-        else:
-            assert utils._GIT_URI_REGEX.match(self.uri), (
-                "Non-wandb URI %s should be a Git URI" % self.uri
-            )
-            if not self._entry_point:
-                wandb.termlog(
-                    f"{LOG_PREFIX}Entry point for repo not specified, defaulting to python main.py"
-                )
-                self.set_entry_point(EntrypointDefaults.PYTHON)
-            branch_name = utils._fetch_git_repo(
-                self.project_dir, self.uri, self.git_version
-            )
-            if self.git_version is None:
-                self.git_version = branch_name
+        Returns:
+            Dictionary of environment variables.
+        """
+        env_vars = {}
+        env_vars["WANDB_BASE_URL"] = api.settings("base_url")
+        override_api_key = self.launch_spec.get("_wandb_api_key")
+        env_vars["WANDB_API_KEY"] = override_api_key or api.api_key
+        if self.target_project:
+            env_vars["WANDB_PROJECT"] = self.target_project
+        env_vars["WANDB_ENTITY"] = self.target_entity
+        env_vars["WANDB_LAUNCH"] = "True"
+        env_vars["WANDB_RUN_ID"] = self.run_id
+        if self.docker_image:
+            env_vars["WANDB_DOCKER"] = self.docker_image
+        if self.name is not None:
+            env_vars["WANDB_NAME"] = self.name
+        if "author" in self.launch_spec and not override_api_key:
+            env_vars["WANDB_USERNAME"] = self.launch_spec["author"]
+        if self.sweep_id:
+            env_vars["WANDB_SWEEP_ID"] = self.sweep_id
+        if self.launch_spec.get("_resume_count", 0) > 0:
+            env_vars["WANDB_RESUME"] = "allow"
+        if self.queue_name:
+            env_vars[wandb.env.LAUNCH_QUEUE_NAME] = self.queue_name
+        if self.queue_entity:
+            env_vars[wandb.env.LAUNCH_QUEUE_ENTITY] = self.queue_entity
+        if self.run_queue_item_id:
+            env_vars[wandb.env.LAUNCH_TRACE_ID] = self.run_queue_item_id
+        _inject_wandb_config_env_vars(self.override_config, env_vars, max_env_length)
+        _inject_file_overrides_env_vars(self.override_files, env_vars, max_env_length)
+        artifacts = {}
+        # if we're spinning up a launch process from a job
+        # we should tell the run to use that artifact
+        if self.job:
+            artifacts = {wandb.util.LAUNCH_JOB_ARTIFACT_SLOT_NAME: self.job}
+        env_vars["WANDB_ARTIFACTS"] = json.dumps(
+            {**artifacts, **self.override_artifacts}
+        )
+        return env_vars
+    def parse_existing_requirements(self) -> str:
+        import pkg_resources
+        requirements_line = ""
+        assert self.project_dir is not None
+        base_requirements = os.path.join(self.project_dir, "requirements.txt")
+        if os.path.exists(base_requirements):
+            include_only = set()
+            with open(base_requirements) as f:
+                iter = pkg_resources.parse_requirements(f)
+                while True:
+                    try:
+                        pkg = next(iter)
+                        if hasattr(pkg, "name"):
+                            name = pkg.name.lower()
+                        else:
+                            name = str(pkg)
+                        include_only.add(shlex_quote(name))
+                    except StopIteration:
+                        break
+                    # Different versions of pkg_resources throw different errors
+                    # just catch them all and ignore packages we can't parse
+                    except Exception as e:
+                        _logger.warn(f"Unable to parse requirements.txt: {e}")
+                        continue
+            requirements_line += "WANDB_ONLY_INCLUDE={} ".format(",".join(include_only))
+        return requirements_line
 class EntryPoint:
@@ -544,13 +496,6 @@ class EntryPoint:
         self.name = name
         self.command = command
-    def compute_command(self, user_parameters: Optional[List[str]]) -> List[str]:
-        """Converts user parameter dictionary to a string."""
-        ret = self.command
-        if user_parameters:
-            return ret + user_parameters
-        return ret
     def update_entrypoint_path(self, new_path: str) -> None:
         """Updates the entrypoint path to a new path."""
         if len(self.command) == 2 and (
@@ -559,18 +504,35 @@ class EntryPoint:
             self.command[1] = new_path
-def get_entry_point_command(
-    entry_point: Optional["EntryPoint"], parameters: List[str]
-) -> List[str]:
-    """Returns the shell command to execute in order to run the specified entry point.
-    Arguments:
-    entry_point: Entry point to run
-    parameters: Parameters (dictionary) for the entry point command
-    Returns:
-        List of strings representing the shell command to be executed
-    """
-    if entry_point is None:
-        return []
-    return entry_point.compute_command(parameters)
+def _inject_wandb_config_env_vars(
+    config: Dict[str, Any], env_dict: Dict[str, Any], maximum_env_length: int
+) -> None:
+    str_config = json.dumps(config)
+    if len(str_config) <= maximum_env_length:
+        env_dict["WANDB_CONFIG"] = str_config
+        return
+    chunks = [
+        str_config[i : i + maximum_env_length]
+        for i in range(0, len(str_config), maximum_env_length)
+    ]
+    config_chunks_dict = {f"WANDB_CONFIG_{i}": chunk for i, chunk in enumerate(chunks)}
+    env_dict.update(config_chunks_dict)
+def _inject_file_overrides_env_vars(
+    overrides: Dict[str, Any], env_dict: Dict[str, Any], maximum_env_length: int
+) -> None:
+    str_overrides = json.dumps(overrides)
+    if len(str_overrides) <= maximum_env_length:
+        env_dict["WANDB_LAUNCH_FILE_OVERRIDES"] = str_overrides
+        return
+    chunks = [
+        str_overrides[i : i + maximum_env_length]
+        for i in range(0, len(str_overrides), maximum_env_length)
+    ]
+    overrides_chunks_dict = {
+        f"WANDB_LAUNCH_FILE_OVERRIDES_{i}": chunk for i, chunk in enumerate(chunks)
+    }
+    env_dict.update(overrides_chunks_dict)

wandb/sdk/launch/agent/agent.py CHANGED Viewed

@@ -1,4 +1,5 @@
 """Implementation of launch agent."""
 import asyncio
 import logging
 import os
@@ -8,7 +9,9 @@ import time
 import traceback
 from dataclasses import dataclass
 from multiprocessing import Event
-from typing import Any, Dict, List, Optional, Union
+from typing import Any, Dict, List, Optional, Tuple, Union
+import yaml
 import wandb
 from wandb.apis.internal import Api
@@ -17,11 +20,11 @@ from wandb.sdk.launch._launch_add import launch_add
 from wandb.sdk.launch.runner.local_container import LocalSubmittedRun
 from wandb.sdk.launch.runner.local_process import LocalProcessRunner
 from wandb.sdk.launch.sweeps.scheduler import Scheduler
+from wandb.sdk.launch.utils import LAUNCH_CONFIG_FILE, resolve_build_and_registry_config
 from wandb.sdk.lib import runid
 from .. import loader
 from .._project_spec import LaunchProject
-from ..builder.build import construct_agent_configs
 from ..errors import LaunchDockerError, LaunchError
 from ..utils import (
     LAUNCH_DEFAULT_PROJECT,
@@ -133,6 +136,31 @@ class InternalAgentLogger:
         _logger.debug(f"{LOG_PREFIX}{message}")
+def construct_agent_configs(
+    launch_config: Optional[Dict] = None,
+    build_config: Optional[Dict] = None,
+) -> Tuple[Optional[Dict[str, Any]], Dict[str, Any], Dict[str, Any]]:
+    registry_config = None
+    environment_config = None
+    if launch_config is not None:
+        build_config = launch_config.get("builder")
+        registry_config = launch_config.get("registry")
+    default_launch_config = None
+    if os.path.exists(os.path.expanduser(LAUNCH_CONFIG_FILE)):
+        with open(os.path.expanduser(LAUNCH_CONFIG_FILE)) as f:
+            default_launch_config = (
+                yaml.safe_load(f) or {}
+            )  # In case the config is empty, we want it to be {} instead of None.
+        environment_config = default_launch_config.get("environment")
+    build_config, registry_config = resolve_build_and_registry_config(
+        default_launch_config, build_config, registry_config
+    )
+    return environment_config, build_config, registry_config
 class LaunchAgent:
     """Launch agent class which polls run given run queues and launches runs for wandb launch."""
@@ -172,7 +200,7 @@ class LaunchAgent:
             config: Config dictionary for the agent.
         """
         self._entity = config["entity"]
-        self._project = config.get("project", LAUNCH_DEFAULT_PROJECT)
+        self._project = LAUNCH_DEFAULT_PROJECT
         self._api = api
         self._base_url = self._api.settings().get("base_url")
         self._ticks = 0
@@ -240,7 +268,7 @@ class LaunchAgent:
         """Determine whether a job/runSpec is a sweep scheduler."""
         if not run_spec:
             self._internal_logger.debug(
-                "Recieved runSpec in _is_scheduler_job that was empty"
+                "Received runSpec in _is_scheduler_job that was empty"
             )
         if run_spec.get("uri") != Scheduler.PLACEHOLDER_URI:
@@ -276,6 +304,8 @@ class LaunchAgent:
     def _init_agent_run(self) -> None:
         # TODO: has it been long enough that all backends support agents?
+        self._wandb_run = None
         if self.gorilla_supports_agents:
             settings = wandb.Settings(silent=True, disable_git=True)
             self._wandb_run = wandb.init(
@@ -285,8 +315,6 @@ class LaunchAgent:
                 id=self._name,
                 job_type=HIDDEN_AGENT_RUN_TYPE,
             )
-        else:
-            self._wandb_run = None
     @property
     def thread_ids(self) -> List[int]:
@@ -338,10 +366,7 @@ class LaunchAgent:
         if self._name:
             output_str += f"{self._name} "
         if self.num_running_jobs < self._max_jobs:
-            output_str += "polling on "
-            if self._project != LAUNCH_DEFAULT_PROJECT:
-                output_str += f"project {self._project}, "
-            output_str += f"queues {','.join(self._queues)}, "
+            output_str += f"polling on queues {','.join(self._queues)}, "
         output_str += (
             f"running {self.num_running_jobs} out of a maximum of {self._max_jobs} jobs"
         )
@@ -433,7 +458,6 @@ class LaunchAgent:
             # We retry for 60 seconds with an exponential backoff in case
             # upsert run is taking a while.
             logs = None
-            start_time = time.time()
             interval = 1
             while True:
                 called_init = self._check_run_exists_and_inited(
@@ -442,7 +466,7 @@ class LaunchAgent:
                     job_and_run_status.run_id,
                     job_and_run_status.run_queue_item_id,
                 )
-                if called_init or time.time() - start_time > RUN_INFO_GRACE_PERIOD:
+                if called_init or interval > RUN_INFO_GRACE_PERIOD:
                     break
                 if not called_init:
                     # Fetch the logs now if we don't get run info on the
@@ -691,7 +715,7 @@ class LaunchAgent:
             default_config, override_build_config
         )
         image_uri = project.docker_image
-        entrypoint = project.get_single_entry_point()
+        entrypoint = project.get_job_entry_point()
         environment = loader.environment_from_config(
             default_config.get("environment", {})
         )

wandb 0.16.6__py3-none-any.whl → 0.17.0__py3-none-any.whl

wandb 0.16.6__py3-none-any.whl → 0.17.0__py3-none-any.whl