wandb 0.16.6__py3-none-any.whl → 0.17.0__py3-none-any.whl
- package_readme.md +95 -0
- wandb/__init__.py +2 -3
- wandb/agents/pyagent.py +0 -1
- wandb/analytics/sentry.py +2 -1
- wandb/apis/importers/internals/internal.py +0 -1
- wandb/apis/importers/internals/protocols.py +30 -56
- wandb/apis/importers/mlflow.py +13 -26
- wandb/apis/importers/wandb.py +8 -14
- wandb/apis/internal.py +0 -3
- wandb/apis/public/api.py +55 -3
- wandb/apis/public/artifacts.py +1 -0
- wandb/apis/public/files.py +1 -0
- wandb/apis/public/history.py +1 -0
- wandb/apis/public/jobs.py +17 -4
- wandb/apis/public/projects.py +1 -0
- wandb/apis/public/reports.py +1 -0
- wandb/apis/public/runs.py +15 -17
- wandb/apis/public/sweeps.py +1 -0
- wandb/apis/public/teams.py +1 -0
- wandb/apis/public/users.py +1 -0
- wandb/apis/reports/v1/_blocks.py +3 -7
- wandb/apis/reports/v2/gql.py +1 -0
- wandb/apis/reports/v2/interface.py +3 -4
- wandb/apis/reports/v2/internal.py +5 -8
- wandb/cli/cli.py +92 -22
- wandb/data_types.py +9 -6
- wandb/docker/__init__.py +1 -1
- wandb/env.py +38 -8
- wandb/errors/__init__.py +5 -0
- wandb/errors/term.py +10 -2
- wandb/filesync/step_checksum.py +1 -4
- wandb/filesync/step_prepare.py +4 -24
- wandb/filesync/step_upload.py +4 -106
- wandb/filesync/upload_job.py +0 -76
- wandb/integration/catboost/catboost.py +1 -1
- wandb/integration/fastai/__init__.py +1 -0
- wandb/integration/huggingface/resolver.py +2 -2
- wandb/integration/keras/__init__.py +1 -0
- wandb/integration/keras/callbacks/metrics_logger.py +1 -1
- wandb/integration/keras/keras.py +7 -7
- wandb/integration/langchain/wandb_tracer.py +1 -0
- wandb/integration/lightning/fabric/logger.py +1 -3
- wandb/integration/metaflow/metaflow.py +41 -6
- wandb/integration/openai/fine_tuning.py +3 -3
- wandb/integration/prodigy/prodigy.py +1 -1
- wandb/old/summary.py +1 -1
- wandb/plot/confusion_matrix.py +1 -1
- wandb/plot/pr_curve.py +2 -1
- wandb/plot/roc_curve.py +2 -1
- wandb/{plots → plot}/utils.py +13 -25
- wandb/proto/v3/wandb_internal_pb2.py +364 -332
- wandb/proto/v3/wandb_settings_pb2.py +2 -2
- wandb/proto/v3/wandb_telemetry_pb2.py +10 -10
- wandb/proto/v4/wandb_internal_pb2.py +322 -316
- wandb/proto/v4/wandb_settings_pb2.py +2 -2
- wandb/proto/v4/wandb_telemetry_pb2.py +10 -10
- wandb/proto/wandb_deprecated.py +7 -1
- wandb/proto/wandb_internal_codegen.py +3 -29
- wandb/sdk/artifacts/artifact.py +26 -11
- wandb/sdk/artifacts/artifact_download_logger.py +1 -0
- wandb/sdk/artifacts/artifact_file_cache.py +18 -4
- wandb/sdk/artifacts/artifact_instance_cache.py +1 -0
- wandb/sdk/artifacts/artifact_manifest.py +1 -0
- wandb/sdk/artifacts/artifact_manifest_entry.py +7 -3
- wandb/sdk/artifacts/artifact_manifests/artifact_manifest_v1.py +1 -0
- wandb/sdk/artifacts/artifact_saver.py +2 -8
- wandb/sdk/artifacts/artifact_state.py +1 -0
- wandb/sdk/artifacts/artifact_ttl.py +1 -0
- wandb/sdk/artifacts/exceptions.py +1 -0
- wandb/sdk/artifacts/storage_handlers/azure_handler.py +1 -0
- wandb/sdk/artifacts/storage_handlers/gcs_handler.py +13 -18
- wandb/sdk/artifacts/storage_handlers/http_handler.py +1 -0
- wandb/sdk/artifacts/storage_handlers/local_file_handler.py +1 -0
- wandb/sdk/artifacts/storage_handlers/multi_handler.py +1 -0
- wandb/sdk/artifacts/storage_handlers/s3_handler.py +5 -3
- wandb/sdk/artifacts/storage_handlers/tracking_handler.py +1 -0
- wandb/sdk/artifacts/storage_handlers/wb_artifact_handler.py +1 -0
- wandb/sdk/artifacts/storage_handlers/wb_local_artifact_handler.py +1 -0
- wandb/sdk/artifacts/storage_policies/wandb_storage_policy.py +3 -42
- wandb/sdk/artifacts/storage_policy.py +2 -12
- wandb/sdk/data_types/_dtypes.py +8 -8
- wandb/sdk/data_types/base_types/media.py +3 -6
- wandb/sdk/data_types/helper_types/bounding_boxes_2d.py +3 -1
- wandb/sdk/data_types/image.py +1 -1
- wandb/sdk/data_types/video.py +1 -1
- wandb/sdk/integration_utils/auto_logging.py +5 -6
- wandb/sdk/integration_utils/data_logging.py +10 -6
- wandb/sdk/interface/interface.py +68 -32
- wandb/sdk/interface/interface_shared.py +7 -13
- wandb/sdk/internal/datastore.py +1 -1
- wandb/sdk/internal/file_pusher.py +2 -5
- wandb/sdk/internal/file_stream.py +5 -18
- wandb/sdk/internal/handler.py +18 -2
- wandb/sdk/internal/internal.py +0 -1
- wandb/sdk/internal/internal_api.py +1 -129
- wandb/sdk/internal/internal_util.py +0 -1
- wandb/sdk/internal/job_builder.py +159 -45
- wandb/sdk/internal/profiler.py +1 -0
- wandb/sdk/internal/progress.py +0 -28
- wandb/sdk/internal/run.py +1 -0
- wandb/sdk/internal/sender.py +1 -2
- wandb/sdk/internal/system/assets/gpu_amd.py +44 -44
- wandb/sdk/internal/system/assets/gpu_apple.py +56 -11
- wandb/sdk/internal/system/assets/interfaces.py +6 -8
- wandb/sdk/internal/system/assets/open_metrics.py +2 -2
- wandb/sdk/internal/system/assets/trainium.py +1 -3
- wandb/sdk/launch/__init__.py +9 -1
- wandb/sdk/launch/_launch.py +4 -24
- wandb/sdk/launch/_launch_add.py +1 -3
- wandb/sdk/launch/_project_spec.py +186 -224
- wandb/sdk/launch/agent/agent.py +37 -13
- wandb/sdk/launch/agent/config.py +72 -14
- wandb/sdk/launch/builder/abstract.py +69 -1
- wandb/sdk/launch/builder/build.py +156 -555
- wandb/sdk/launch/builder/context_manager.py +235 -0
- wandb/sdk/launch/builder/docker_builder.py +8 -23
- wandb/sdk/launch/builder/kaniko_builder.py +12 -25
- wandb/sdk/launch/builder/noop.py +1 -0
- wandb/sdk/launch/builder/templates/dockerfile.py +92 -0
- wandb/sdk/launch/create_job.py +47 -37
- wandb/sdk/launch/environment/abstract.py +1 -0
- wandb/sdk/launch/environment/gcp_environment.py +1 -0
- wandb/sdk/launch/environment/local_environment.py +1 -0
- wandb/sdk/launch/inputs/files.py +148 -0
- wandb/sdk/launch/inputs/internal.py +217 -0
- wandb/sdk/launch/inputs/manage.py +95 -0
- wandb/sdk/launch/loader.py +1 -0
- wandb/sdk/launch/registry/abstract.py +1 -0
- wandb/sdk/launch/registry/azure_container_registry.py +1 -0
- wandb/sdk/launch/registry/elastic_container_registry.py +1 -0
- wandb/sdk/launch/registry/google_artifact_registry.py +2 -1
- wandb/sdk/launch/registry/local_registry.py +1 -0
- wandb/sdk/launch/runner/abstract.py +1 -0
- wandb/sdk/launch/runner/kubernetes_monitor.py +1 -0
- wandb/sdk/launch/runner/kubernetes_runner.py +9 -10
- wandb/sdk/launch/runner/local_container.py +2 -3
- wandb/sdk/launch/runner/local_process.py +8 -29
- wandb/sdk/launch/runner/sagemaker_runner.py +21 -20
- wandb/sdk/launch/runner/vertex_runner.py +8 -7
- wandb/sdk/launch/sweeps/scheduler.py +4 -3
- wandb/sdk/launch/sweeps/scheduler_sweep.py +2 -1
- wandb/sdk/launch/sweeps/utils.py +3 -3
- wandb/sdk/launch/utils.py +15 -140
- wandb/sdk/lib/_settings_toposort_generated.py +0 -5
- wandb/sdk/lib/fsm.py +8 -12
- wandb/sdk/lib/gitlib.py +4 -4
- wandb/sdk/lib/import_hooks.py +1 -1
- wandb/sdk/lib/lazyloader.py +0 -1
- wandb/sdk/lib/proto_util.py +23 -2
- wandb/sdk/lib/redirect.py +19 -14
- wandb/sdk/lib/retry.py +3 -2
- wandb/sdk/lib/tracelog.py +1 -1
- wandb/sdk/service/service.py +19 -16
- wandb/sdk/verify/verify.py +2 -1
- wandb/sdk/wandb_init.py +14 -55
- wandb/sdk/wandb_manager.py +2 -2
- wandb/sdk/wandb_require.py +5 -0
- wandb/sdk/wandb_run.py +114 -56
- wandb/sdk/wandb_settings.py +0 -48
- wandb/sdk/wandb_setup.py +1 -1
- wandb/sklearn/__init__.py +1 -0
- wandb/sklearn/plot/__init__.py +1 -0
- wandb/sklearn/plot/classifier.py +11 -12
- wandb/sklearn/plot/clusterer.py +2 -1
- wandb/sklearn/plot/regressor.py +1 -0
- wandb/sklearn/plot/shared.py +1 -0
- wandb/sklearn/utils.py +1 -0
- wandb/testing/relay.py +4 -4
- wandb/trigger.py +1 -0
- wandb/util.py +67 -54
- wandb/wandb_controller.py +2 -3
- wandb/wandb_torch.py +1 -2
- {wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/METADATA +67 -70
- {wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/RECORD +177 -187
- {wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/WHEEL +1 -2
- wandb/bin/apple_gpu_stats +0 -0
- wandb/catboost/__init__.py +0 -9
- wandb/fastai/__init__.py +0 -9
- wandb/keras/__init__.py +0 -18
- wandb/lightgbm/__init__.py +0 -9
- wandb/plots/__init__.py +0 -6
- wandb/plots/explain_text.py +0 -36
- wandb/plots/heatmap.py +0 -81
- wandb/plots/named_entity.py +0 -43
- wandb/plots/part_of_speech.py +0 -50
- wandb/plots/plot_definitions.py +0 -768
- wandb/plots/precision_recall.py +0 -121
- wandb/plots/roc.py +0 -103
- wandb/sacred/__init__.py +0 -3
- wandb/xgboost/__init__.py +0 -9
- wandb-0.16.6.dist-info/top_level.txt +0 -1
- {wandb-0.16.6.dist-info → wandb-0.17.0.dist-info}/entry_points.txt +0 -0
- {wandb-0.16.6.dist-info → wandb-0.17.0.dist-info/licenses}/LICENSE +0 -0
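A note on the removed top-level shim packages listed above (wandb/keras, wandb/catboost, wandb/fastai, wandb/lightgbm, wandb/xgboost, wandb/plots, wandb/sacred): the corresponding integrations live under wandb.integration.*, so imports that relied on the shims would move there. A hedged migration sketch; verify the exact exported symbols against the 0.17.0 package:

# Before (0.16.x), via the removed top-level shim:
#   from wandb.keras import WandbCallback
# After (0.17.0), import from the integration package instead (assumed to
# export the same callback classes as the old shim):
from wandb.integration.keras import WandbCallback, WandbMetricsLogger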
wandb/sdk/artifacts/storage_policies/wandb_storage_policy.py
CHANGED
@@ -1,4 +1,5 @@
 """WandB storage policy."""
+
 import hashlib
 import math
 import os
@@ -262,7 +263,7 @@ class WandbStoragePolicy(StoragePolicy):
             return math.ceil(file_size / S3_MAX_PART_NUMBERS)
         return default_chunk_size
 
-    def store_file_sync(
+    def store_file(
         self,
         artifact_id: str,
         artifact_manifest_id: str,
@@ -300,7 +301,7 @@ class WandbStoragePolicy(StoragePolicy):
             hex_digests[part_number] = hex_digest
             part_number += 1
 
-        resp = preparer.prepare_sync(
+        resp = preparer.prepare(
            {
                "artifactID": artifact_id,
                "artifactManifestID": artifact_manifest_id,
@@ -346,46 +347,6 @@ class WandbStoragePolicy(StoragePolicy):
 
         return False
 
-    async def store_file_async(
-        self,
-        artifact_id: str,
-        artifact_manifest_id: str,
-        entry: "ArtifactManifestEntry",
-        preparer: "StepPrepare",
-        progress_callback: Optional["progress.ProgressFn"] = None,
-    ) -> bool:
-        """Async equivalent to `store_file_sync`."""
-        resp = await preparer.prepare_async(
-            {
-                "artifactID": artifact_id,
-                "artifactManifestID": artifact_manifest_id,
-                "name": entry.path,
-                "md5": entry.digest,
-            }
-        )
-
-        entry.birth_artifact_id = resp.birth_artifact_id
-        if resp.upload_url is None:
-            return True
-        if entry.local_path is None:
-            return False
-
-        with open(entry.local_path, "rb") as file:
-            # This fails if we don't send the first byte before the signed URL expires.
-            await self._api.upload_file_retry_async(
-                resp.upload_url,
-                file,
-                progress_callback,
-                extra_headers={
-                    header.split(":", 1)[0]: header.split(":", 1)[1]
-                    for header in (resp.upload_headers or {})
-                },
-            )
-
-        self._write_cache(entry)
-
-        return False
-
     def _write_cache(self, entry: "ArtifactManifestEntry") -> None:
         if entry.local_path is None:
             return
wandb/sdk/artifacts/storage_policy.py
CHANGED
@@ -1,4 +1,5 @@
 """Storage policy."""
+
 from typing import TYPE_CHECKING, Dict, Optional, Sequence, Type, Union
 
 from wandb.sdk.internal.internal_api import Api as InternalApi
@@ -42,17 +43,7 @@ class StoragePolicy:
     ) -> FilePathStr:
         raise NotImplementedError
 
-    def store_file_sync(
-        self,
-        artifact_id: str,
-        artifact_manifest_id: str,
-        entry: "ArtifactManifestEntry",
-        preparer: "StepPrepare",
-        progress_callback: Optional["ProgressFn"] = None,
-    ) -> bool:
-        raise NotImplementedError
-
-    async def store_file_async(
+    def store_file(
         self,
         artifact_id: str,
         artifact_manifest_id: str,
@@ -60,7 +51,6 @@ class StoragePolicy:
         preparer: "StepPrepare",
         progress_callback: Optional["ProgressFn"] = None,
     ) -> bool:
-        """Async equivalent to `store_file_sync`."""
         raise NotImplementedError
 
     def store_reference(
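With the synchronous and asynchronous upload paths collapsed into a single hook, a custom policy would now override only store_file. A minimal sketch using the signature shown above; MyPolicy and its no-op body are hypothetical and not part of the package:

from typing import Optional

from wandb.sdk.artifacts.storage_policy import StoragePolicy


class MyPolicy(StoragePolicy):
    def store_file(
        self,
        artifact_id: str,
        artifact_manifest_id: str,
        entry: "ArtifactManifestEntry",
        preparer: "StepPrepare",
        progress_callback: Optional["ProgressFn"] = None,
    ) -> bool:
        # Mirroring the removed built-in implementation above: True signals the
        # file was deduplicated server-side (no upload needed), False signals
        # the entry was uploaded.
        return False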
wandb/sdk/data_types/_dtypes.py
CHANGED
@@ -14,7 +14,7 @@ np = get_module("numpy") # intentionally not required
 if t.TYPE_CHECKING:
     from wandb.sdk.artifacts.artifact import Artifact
 
-ConvertableToType = t.Union["Type", t.Type["Type"], type, t.Any]
+ConvertibleToType = t.Union["Type", t.Type["Type"], type, t.Any]
 
 
 class TypeRegistry:
@@ -84,7 +84,7 @@ class TypeRegistry:
         return _type.from_json(json_dict, artifact)
 
     @staticmethod
-    def type_from_dtype(dtype: ConvertableToType) -> "Type":
+    def type_from_dtype(dtype: ConvertibleToType) -> "Type":
         # The dtype is already an instance of Type
         if isinstance(dtype, Type):
             wbtype: Type = dtype
@@ -528,7 +528,7 @@ class UnionType(Type):
 
     def __init__(
         self,
-        allowed_types: t.Optional[t.Sequence[ConvertableToType]] = None,
+        allowed_types: t.Optional[t.Sequence[ConvertibleToType]] = None,
     ):
         assert allowed_types is None or (allowed_types.__class__ == list)
         if allowed_types is None:
@@ -576,7 +576,7 @@ class UnionType(Type):
         return "{}".format(" or ".join([str(t) for t in self.params["allowed_types"]]))
 
 
-def OptionalType(dtype: ConvertableToType) -> UnionType:  # noqa: N802
+def OptionalType(dtype: ConvertibleToType) -> UnionType:  # noqa: N802
     """Function that mimics the Type class API for constructing an "Optional Type".
 
     This is just a Union[wb_type, NoneType].
@@ -591,14 +591,14 @@ def OptionalType(dtype: ConvertableToType) -> UnionType: # noqa: N802
 
 
 class ListType(Type):
-    """A list of homogenous types."""
+    """A list of homogeneous types."""
 
     name = "list"
     types: t.ClassVar[t.List[type]] = [list, tuple, set, frozenset]
 
     def __init__(
         self,
-        element_type: t.Optional[ConvertableToType] = None,
+        element_type: t.Optional[ConvertibleToType] = None,
         length: t.Optional[int] = None,
     ):
         if element_type is None:
@@ -691,7 +691,7 @@ class ListType(Type):
 
 
 class NDArrayType(Type):
-    """Represents a list of homogenous types."""
+    """Represents a list of homogeneous types."""
 
     name = "ndarray"
     types: t.ClassVar[t.List[type]] = []  # will manually add type if np is available
@@ -786,7 +786,7 @@ class TypedDictType(Type):
 
     def __init__(
         self,
-        type_map: t.Optional[t.Dict[str, ConvertableToType]] = None,
+        type_map: t.Optional[t.Dict[str, ConvertibleToType]] = None,
     ):
         if type_map is None:
             type_map = {}
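The renamed alias covers W&B Type instances, Type subclasses, and plain Python types alike, which is what lets helpers such as type_from_dtype, OptionalType, and ListType accept any of them. A small illustrative sketch; note _dtypes is an internal module, so the import path is an assumption and the values are only examples:

from wandb.sdk.data_types._dtypes import ListType, OptionalType, TypeRegistry

maybe_number = OptionalType(int)              # per the docstring: Union[wb_type, NoneType]
string_list = ListType(str)                   # "a list of homogeneous types"
from_plain = TypeRegistry.type_from_dtype(float)  # plain Python types are ConvertibleToType too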
wandb/sdk/data_types/base_types/media.py
CHANGED
@@ -177,9 +177,7 @@ class Media(WBValue):
             json_obj["_latest_artifact_path"] = artifact_entry_latest_url
 
         if artifact_entry_url is None or self.is_bound():
-            assert (
-                self.is_bound()
-            ), "Value of type {} must be bound to a run with bind_to_run() before being serialized to JSON.".format(
+            assert self.is_bound(), "Value of type {} must be bound to a run with bind_to_run() before being serialized to JSON.".format(
                 type(self).__name__
             )
 
@@ -221,8 +219,7 @@ class Media(WBValue):
 
         # if not, check to see if there is a source artifact for this object
         if (
-            self._artifact_source
-            is not None
+            self._artifact_source is not None
             # and self._artifact_source.artifact != artifact
         ):
             default_root = self._artifact_source.artifact._default_root()
@@ -292,7 +289,7 @@ class BatchableMedia(Media):
 
 
 def _numpy_arrays_to_lists(
-    payload: Union[dict, Sequence, "np.ndarray"]
+    payload: Union[dict, Sequence, "np.ndarray"],
 ) -> Union[Sequence, dict, str, int, float, bool]:
     # Casts all numpy arrays to lists so we don't convert them to histograms, primarily for Plotly
 
wandb/sdk/data_types/helper_types/bounding_boxes_2d.py
CHANGED
@@ -231,8 +231,10 @@ class BoundingBoxes2D(JSONMetadata):
 
         for box in boxes:
             # Required arguments
-            error_str = "Each box must contain a position with: middle, width, and height or \
+            error_str = (
+                "Each box must contain a position with: middle, width, and height or \
                 \nminX, maxX, minY, maxY."
+            )
             if "position" not in box:
                 raise TypeError(error_str)
             else:
wandb/sdk/data_types/image.py
CHANGED
@@ -167,7 +167,7 @@ class Image(BatchableMedia):
         self._file_type = None
 
         # Allows the user to pass an Image object as the first parameter and have a perfect copy,
-        # only overriding additional
+        # only overriding additional metadata passed in. If this pattern is compelling, we can generalize.
         if isinstance(data_or_path, Image):
             self._initialize_from_wbimage(data_or_path)
         elif isinstance(data_or_path, str):
wandb/sdk/data_types/video.py
CHANGED
@@ -24,7 +24,7 @@ if TYPE_CHECKING: # pragma: no cover
 # https://github.com/wandb/wandb/issues/3472
 #
 # Essentially, the issue is that moviepy's write_gif function fails to close
-# the open write / file
+# the open write / file descriptor returned from `imageio.save`. The following
 # function is a simplified copy of the function in the moviepy source code.
 # See https://github.com/Zulko/moviepy/blob/7e3e8bb1b739eb6d1c0784b0cb2594b587b93b39/moviepy/video/io/gif_writers.py#L428
 #
wandb/sdk/integration_utils/auto_logging.py
CHANGED
@@ -27,11 +27,11 @@ V = TypeVar("V")
 
 
 class Response(Protocol[K, V]):
-    def __getitem__(self, key: K) -> V:
-        ...  # pragma: no cover
+    def __getitem__(self, key: K) -> V: ...  # pragma: no cover
 
-    def get(self, key: K, default: Optional[V] = None) -> Optional[V]:
-        ...  # pragma: no cover
+    def get(
+        self, key: K, default: Optional[V] = None
+    ) -> Optional[V]: ...  # pragma: no cover
 
 
 class ArgumentResponseResolver(Protocol):
@@ -42,8 +42,7 @@ class ArgumentResponseResolver(Protocol):
         response: Response,
         start_time: float,
         time_elapsed: float,
-    ) -> Optional[Dict[str, Any]]:
-        ...  # pragma: no cover
+    ) -> Optional[Dict[str, Any]]: ...  # pragma: no cover
 
 
 class PatchAPI:
wandb/sdk/integration_utils/data_logging.py
CHANGED
@@ -78,7 +78,7 @@ class ValidationDataLogger:
             Defaults to `"wb_validation_data"`.
         artifact_type: The artifact type to use for the validation data.
             Defaults to `"validation_dataset"`.
-        class_labels: Optional list of
+        class_labels: Optional list of labels to use in the inferred
             processors. If the model's `target` or `output` is inferred to be a class,
             we will attempt to map the class to these labels. Defaults to `None`.
         infer_missing_processors: Determines if processors are inferred if
@@ -262,7 +262,7 @@ def _infer_single_example_keyed_processor(
     ):
         np = wandb.util.get_module(
             "numpy",
-            required="
+            required="Inferring processors require numpy",
         )
         # Assume these are logits
         class_names = class_labels_table.get_column("label")
@@ -291,13 +291,17 @@ def _infer_single_example_keyed_processor(
     ):
         # assume this is a class
         if class_labels_table is not None:
-            processors["class"] =
+            processors["class"] = (
+                lambda n, d, p: class_labels_table.index_ref(d[0])
+                if d[0] < len(class_labels_table.data)
+                else d[0]
+            )  # type: ignore
         else:
             processors["val"] = lambda n, d, p: d[0]
     elif len(shape) == 1:
         np = wandb.util.get_module(
             "numpy",
-            required="
+            required="Inferring processors require numpy",
         )
         # This could be anything
         if shape[0] <= 10:
@@ -350,7 +354,7 @@ def _infer_validation_row_processor(
     input_col_name: str = "input",
     target_col_name: str = "target",
 ) -> Callable:
-    """Infers the
+    """Infers the composite processor for the validation data."""
     single_processors = {}
     if isinstance(example_input, dict):
         for key in example_input:
@@ -427,7 +431,7 @@ def _infer_prediction_row_processor(
     input_col_name: str = "input",
     output_col_name: str = "output",
 ) -> Callable:
-    """Infers the
+    """Infers the composite processor for the prediction output data."""
     single_processors = {}
 
     if isinstance(example_prediction, dict):
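The inferred "class" processor above maps a single predicted index to a label reference when the index is in range and otherwise passes the raw value through. A standalone sketch of that behavior; labels is a hypothetical stand-in for class_labels_table, and the real processor returns a table reference rather than a string:

labels = ["cat", "dog", "bird"]

def class_processor(name, row, probabilities):
    # row[0] is the predicted class index for this example
    return labels[row[0]] if row[0] < len(labels) else row[0]

print(class_processor("output", [1], None))  # -> "dog"
print(class_processor("output", [7], None))  # -> 7 (out of range, passed through)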
wandb/sdk/interface/interface.py
CHANGED
@@ -387,18 +387,30 @@ class InterfaceBase:
     def _make_partial_source_str(
         source: Any, job_info: Dict[str, Any], metadata: Dict[str, Any]
     ) -> str:
-        """Construct use_artifact.partial.source_info.
+        """Construct use_artifact.partial.source_info.source as str."""
         source_type = job_info.get("source_type", "").strip()
         if source_type == "artifact":
             info_source = job_info.get("source", {})
             source.artifact.artifact = info_source.get("artifact", "")
             source.artifact.entrypoint.extend(info_source.get("entrypoint", []))
             source.artifact.notebook = info_source.get("notebook", False)
+            build_context = info_source.get("build_context")
+            if build_context:
+                source.artifact.build_context = build_context
+            dockerfile = info_source.get("dockerfile")
+            if dockerfile:
+                source.artifact.dockerfile = dockerfile
         elif source_type == "repo":
             source.git.git_info.remote = metadata.get("git", {}).get("remote", "")
             source.git.git_info.commit = metadata.get("git", {}).get("commit", "")
             source.git.entrypoint.extend(metadata.get("entrypoint", []))
             source.git.notebook = metadata.get("notebook", False)
+            build_context = metadata.get("build_context")
+            if build_context:
+                source.git.build_context = build_context
+            dockerfile = metadata.get("dockerfile")
+            if dockerfile:
+                source.git.dockerfile = dockerfile
         elif source_type == "image":
             source.image.image = metadata.get("docker", "")
         else:
@@ -424,7 +436,7 @@ class InterfaceBase:
             job_info=job_info,
             metadata=metadata,
         )
-        use_artifact.partial.source_info.source.ParseFromString(src_str)
+        use_artifact.partial.source_info.source.ParseFromString(src_str)  # type: ignore[arg-type]
 
         return use_artifact
 
@@ -516,11 +528,15 @@ class InterfaceBase:
         artifact_id: str,
         download_root: str,
         allow_missing_references: bool,
+        skip_cache: bool,
+        path_prefix: Optional[str],
     ) -> MailboxHandle:
         download_artifact = pb.DownloadArtifactRequest()
         download_artifact.artifact_id = artifact_id
         download_artifact.download_root = download_root
         download_artifact.allow_missing_references = allow_missing_references
+        download_artifact.skip_cache = skip_cache
+        download_artifact.path_prefix = path_prefix or ""
         resp = self._deliver_download_artifact(download_artifact)
         return resp
 
@@ -729,6 +745,56 @@ class InterfaceBase:
     def _publish_keepalive(self, keepalive: pb.KeepaliveRequest) -> None:
         raise NotImplementedError
 
+    def publish_job_input(
+        self,
+        include_paths: List[List[str]],
+        exclude_paths: List[List[str]],
+        run_config: bool = False,
+        file_path: str = "",
+    ):
+        """Publishes a request to add inputs to the job.
+
+        If run_config is True, the wandb.config will be added as a job input.
+        If file_path is provided, the file at file_path will be added as a job
+        input.
+
+        The paths provided as arguments are sequences of dictionary keys that
+        specify a path within the wandb.config. If a path is included, the
+        corresponding field will be treated as a job input. If a path is
+        excluded, the corresponding field will not be treated as a job input.
+
+        Args:
+            include_paths: paths within config to include as job inputs.
+            exclude_paths: paths within config to exclude as job inputs.
+            run_config: bool indicating whether wandb.config is the input source.
+            file_path: path to file to include as a job input.
+        """
+        if run_config and file_path:
+            raise ValueError(
+                "run_config and file_path are mutually exclusive arguments."
+            )
+        request = pb.JobInputRequest()
+        include_records = [pb.JobInputPath(path=path) for path in include_paths]
+        exclude_records = [pb.JobInputPath(path=path) for path in exclude_paths]
+        request.include_paths.extend(include_records)
+        request.exclude_paths.extend(exclude_records)
+        source = pb.JobInputSource(
+            run_config=pb.JobInputSource.RunConfigSource(),
+        )
+        if run_config:
+            source.run_config.CopyFrom(pb.JobInputSource.RunConfigSource())
+        else:
+            source.file.CopyFrom(
+                pb.JobInputSource.ConfigFileSource(path=file_path),
+            )
+        request.input_source.CopyFrom(source)
+
+        return self._publish_job_input(request)
+
+    @abstractmethod
+    def _publish_job_input(self, request: pb.JobInputRequest) -> MailboxHandle:
+        raise NotImplementedError
+
     def join(self) -> None:
         # Drop indicates that the internal process has already been shutdown
         if self._drop:
@@ -779,36 +845,6 @@ class InterfaceBase:
         run_start.run.CopyFrom(run_pb)
         return self._deliver_run_start(run_start)
 
-    def publish_launch_wandb_config_parameters(
-        self, include_paths: List[List[str]], exclude_paths: List[List[str]]
-    ):
-        """Tells the internal process to treat wandb.config fields as job inputs.
-
-        The paths provided as arguments are sequences of dictionary keys that
-        specify a path within the wandb.config. If a path is included, the
-        corresponding field will be treated as a job input. If a path is
-        excluded, the corresponding field will not be treated as a job input.
-
-        Args:
-            include_paths: paths within config to include as job inputs.
-            exclude_paths: paths within config to exclude as job inputs.
-
-        Returns:
-            None
-        """
-        config_parameters = pb.LaunchWandbConfigParametersRecord()
-        include_records = [pb.ConfigFilterPath(path=path) for path in include_paths]
-        exclude_records = [pb.ConfigFilterPath(path=path) for path in exclude_paths]
-        config_parameters.include_paths.extend(include_records)
-        config_parameters.exclude_paths.extend(exclude_records)
-        return self._publish_launch_wandb_config_parameters(config_parameters)
-
-    @abstractmethod
-    def _publish_launch_wandb_config_parameters(
-        self, config_parameters: pb.LaunchWandbConfigParametersRecord
-    ) -> None:
-        raise NotImplementedError
-
     @abstractmethod
     def _deliver_run_start(self, run_start: pb.RunStartRequest) -> MailboxHandle:
         raise NotImplementedError
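publish_job_input replaces the launch-specific publish_launch_wandb_config_parameters shown removed above and adds a file-based input source. A hedged usage sketch against an interface instance (obtaining one, for example from a run's internal backend, is outside this diff, and the config paths are made up):

# Mark everything under wandb.config["trainer"] as a job input, except the
# nested credentials entry; run_config=True selects wandb.config as the source.
interface.publish_job_input(
    include_paths=[["trainer"]],
    exclude_paths=[["trainer", "api_key"]],
    run_config=True,
)

# Alternatively, declare a config file as the input source instead.
interface.publish_job_input(
    include_paths=[],
    exclude_paths=[],
    file_path="configs/train.yaml",
)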
wandb/sdk/interface/interface_shared.py
CHANGED
@@ -100,6 +100,10 @@ class InterfaceShared(InterfaceBase):
         rec = self._make_record(telemetry=telem)
         self._publish(rec)
 
+    def _publish_job_input(self, job_input: pb.JobInputRequest) -> MailboxHandle:
+        record = self._make_request(job_input=job_input)
+        return self._deliver_record(record)
+
     def _make_stats(self, stats_dict: dict) -> pb.StatsRecord:
         stats = pb.StatsRecord()
         stats.stats_type = pb.StatsRecord.StatsType.SYSTEM
@@ -147,6 +151,7 @@ class InterfaceShared(InterfaceBase):
         telemetry_record: Optional[pb.TelemetryRecordRequest] = None,
         get_system_metrics: Optional[pb.GetSystemMetricsRequest] = None,
         python_packages: Optional[pb.PythonPackagesRequest] = None,
+        job_input: Optional[pb.JobInputRequest] = None,
     ) -> pb.Record:
         request = pb.Request()
         if login:
@@ -207,6 +212,8 @@ class InterfaceShared(InterfaceBase):
             request.sync.CopyFrom(sync)
         elif python_packages:
             request.python_packages.CopyFrom(python_packages)
+        elif job_input:
+            request.job_input.CopyFrom(job_input)
         else:
             raise Exception("Invalid request")
         record = self._make_record(request=request)
@@ -239,9 +246,6 @@ class InterfaceShared(InterfaceBase):
         use_artifact: Optional[pb.UseArtifactRecord] = None,
         output: Optional[pb.OutputRecord] = None,
         output_raw: Optional[pb.OutputRawRecord] = None,
-        launch_wandb_config_parameters: Optional[
-            pb.LaunchWandbConfigParametersRecord
-        ] = None,
     ) -> pb.Record:
         record = pb.Record()
         if run:
@@ -286,8 +290,6 @@ class InterfaceShared(InterfaceBase):
             record.output.CopyFrom(output)
         elif output_raw:
             record.output_raw.CopyFrom(output_raw)
-        elif launch_wandb_config_parameters:
-            record.wandb_config_parameters.CopyFrom(launch_wandb_config_parameters)
         else:
             raise Exception("Invalid record")
         return record
@@ -417,14 +419,6 @@ class InterfaceShared(InterfaceBase):
         rec = self._make_record(alert=proto_alert)
         self._publish(rec)
 
-    def _publish_launch_wandb_config_parameters(
-        self, launch_wandb_config_parameters: pb.LaunchWandbConfigParametersRecord
-    ) -> None:
-        rec = self._make_record(
-            launch_wandb_config_parameters=launch_wandb_config_parameters
-        )
-        self._publish(rec)
-
     def _communicate_status(
         self, status: pb.StatusRequest
     ) -> Optional[pb.StatusResponse]:
wandb/sdk/internal/datastore.py
CHANGED
wandb/sdk/internal/file_pusher.py
CHANGED
@@ -14,7 +14,7 @@ from wandb.sdk.lib.paths import LogicalPath
 
 if TYPE_CHECKING:
     from wandb.sdk.artifacts.artifact_manifest import ArtifactManifest
-    from wandb.sdk.artifacts.artifact_saver import SaveFn, SaveFnAsync
+    from wandb.sdk.artifacts.artifact_saver import SaveFn
     from wandb.sdk.internal import file_stream, internal_api
     from wandb.sdk.internal.settings_static import SettingsStatic
 
@@ -148,11 +148,8 @@ class FilePusher:
         manifest: "ArtifactManifest",
         artifact_id: str,
         save_fn: "SaveFn",
-        save_fn_async: "SaveFnAsync",
     ) -> None:
-        event = step_checksum.RequestStoreManifestFiles(
-            manifest, artifact_id, save_fn, save_fn_async
-        )
+        event = step_checksum.RequestStoreManifestFiles(manifest, artifact_id, save_fn)
         self._incoming_queue.put(event)
 
     def commit_artifact(
wandb/sdk/internal/file_stream.py
CHANGED
@@ -1,4 +1,3 @@
-import base64
 import functools
 import itertools
 import json
@@ -53,7 +52,7 @@ logger = logging.getLogger(__name__)
 
 class Chunk(NamedTuple):
     filename: str
-    data:
+    data: str
 
 
 class DefaultFilePolicy:
@@ -227,7 +226,7 @@ class CRDedupeFilePolicy(DefaultFilePolicy):
             prefix += token + " "
         return prefix, rest
 
-    def process_chunks(self, chunks: List) -> List["ProcessedChunk"]:
+    def process_chunks(self, chunks: List[Chunk]) -> List["ProcessedChunk"]:
        r"""Process chunks.
 
         Args:
@@ -300,18 +299,6 @@ class CRDedupeFilePolicy(DefaultFilePolicy):
         return ret
 
 
-class BinaryFilePolicy(DefaultFilePolicy):
-    def __init__(self) -> None:
-        super().__init__()
-        self._offset: int = 0
-
-    def process_chunks(self, chunks: List[Chunk]) -> "ProcessedBinaryChunk":
-        data = b"".join([c.data for c in chunks])
-        enc = base64.b64encode(data).decode("ascii")
-        self._offset += len(data)
-        return {"offset": self._offset, "content": enc, "encoding": "base64"}
-
-
 class FileStreamApi:
     """Pushes chunks of files to our streaming endpoint.
 
@@ -585,12 +572,12 @@ class FileStreamApi:
     def enqueue_preempting(self) -> None:
         self._queue.put(self.Preempting())
 
-    def push(self, filename: str, data:
+    def push(self, filename: str, data: str) -> None:
         """Push a chunk of a file to the streaming endpoint.
 
         Arguments:
-            filename: Name of file
-            data:
+            filename: Name of file to append to.
+            data: Text to append to the file.
         """
         self._queue.put(Chunk(filename, data))
 
wandb/sdk/internal/handler.py
CHANGED
@@ -50,6 +50,18 @@ SummaryDict = Dict[str, Any]
 
 logger = logging.getLogger(__name__)
 
+# Update (March 5, 2024): Since ~2020/2021, when constructing the summary
+# object, we had replaced the artifact path for media types with the latest
+# artifact path. The primary purpose of this was to support live updating of
+# media objects in the UI (since the default artifact path was fully qualified
+# and would not update). However, in March of 2024, a bug was discovered with
+# this approach which causes this path to be incorrect in cases where the media
+# object is logged to another artifact before being logged to the run. Setting
+# this to `False` disables this copy behavior. The impact is that users will
+# need to refresh to see updates. Ironically, this updating behavior is not
+# currently supported in the UI, so the impact of this change is minimal.
+REPLACE_SUMMARY_ART_PATH_WITH_LATEST = False
+
 
 def _dict_nested_set(target: Dict[str, Any], key_list: Sequence[str], v: Any) -> None:
     # recurse down the dictionary structure:
@@ -371,7 +383,11 @@ class HandleManager:
             updated = True
             return updated
         # If the dict is a media object, update the pointer to the latest alias
-        elif isinstance(v, dict) and handler_util.metric_is_wandb_dict(v):
+        elif (
+            REPLACE_SUMMARY_ART_PATH_WITH_LATEST
+            and isinstance(v, dict)
+            and handler_util.metric_is_wandb_dict(v)
+        ):
             if "_latest_artifact_path" in v and "artifact_path" in v:
                 # TODO: Make non-destructive?
                 v["artifact_path"] = v["_latest_artifact_path"]
@@ -381,7 +397,7 @@ class HandleManager:
     def _update_summary_media_objects(self, v: Dict[str, Any]) -> Dict[str, Any]:
         # For now, non-recursive - just top level
         for nk, nv in v.items():
-            if (
+            if REPLACE_SUMMARY_ART_PATH_WITH_LATEST and (
                 isinstance(nv, dict)
                 and handler_util.metric_is_wandb_dict(nv)
                 and "_latest_artifact_path" in nv