PyPI - xpk - Versions diffs - 1.0.0__py3-none-any.whl → 1.1.0__py3-none-any.whl - Mend

xpk 1.0.0__py3-none-any.whl → 1.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (57)

xpk/commands/cluster.py +29 -30
xpk/commands/cluster_gcluster.py +19 -14
xpk/commands/cluster_test.py +1 -21
xpk/commands/common.py +39 -6
xpk/commands/common_test.py +170 -0
xpk/commands/info.py +9 -5
xpk/commands/inspector.py +33 -4
xpk/commands/inspector_test.py +142 -0
xpk/commands/workload.py +22 -8
xpk/commands/workload_test.py +70 -3
xpk/core/blueprint/blueprint_generator.py +19 -8
xpk/core/blueprint/testing/data/a3_ultra.yaml +3 -1
xpk/core/blueprint/testing/data/a4.yaml +3 -1
xpk/core/capacity.py +37 -17
xpk/core/capacity_test.py +66 -1
xpk/core/cluster.py +10 -10
xpk/core/cluster_private.py +3 -3
xpk/core/cluster_test.py +29 -2
xpk/core/docker_container.py +31 -24
xpk/core/docker_manager.py +4 -4
xpk/core/docker_resources.py +4 -1
xpk/core/kueue_manager.py +6 -8
xpk/core/kueue_manager_test.py +4 -5
xpk/core/nap.py +14 -3
xpk/core/nodepool.py +46 -13
xpk/core/nodepool_test.py +143 -8
xpk/core/remote_state/fuse_remote_state.py +1 -1
xpk/core/scheduling.py +4 -1
xpk/core/scheduling_test.py +1 -1
xpk/core/system_characteristics.py +6 -0
xpk/core/telemetry.py +11 -1
xpk/core/telemetry_test.py +39 -0
xpk/core/testing/commands_tester.py +26 -0
xpk/core/testing/commands_tester_test.py +20 -1
xpk/core/workload_decorators/rdma_decorator.py +9 -0
xpk/parser/cluster.py +11 -1
xpk/parser/cluster_test.py +59 -1
xpk/parser/common.py +11 -0
xpk/parser/storage.py +3 -3
xpk/utils/console.py +1 -1
xpk/utils/feature_flags.py +7 -3
{xpk-1.0.0.dist-info → xpk-1.1.0.dist-info}/METADATA +37 -21
{xpk-1.0.0.dist-info → xpk-1.1.0.dist-info}/RECORD +47 -54
xpk-1.1.0.dist-info/top_level.txt +1 -0
integration/README.md +0 -19
integration/__init__.py +0 -15
integration/docker_manager_test.py +0 -102
integration/gcluster_a3mega_test.py +0 -215
integration/gcluster_a3ultra_test.py +0 -187
integration/gcluster_a4_test.py +0 -187
integration/gcluster_test.py +0 -107
xpk/utils/user_input.py +0 -48
xpk/utils/user_input_test.py +0 -92
xpk-1.0.0.dist-info/top_level.txt +0 -2
{xpk-1.0.0.dist-info → xpk-1.1.0.dist-info}/WHEEL +0 -0
{xpk-1.0.0.dist-info → xpk-1.1.0.dist-info}/entry_points.txt +0 -0
{xpk-1.0.0.dist-info → xpk-1.1.0.dist-info}/licenses/LICENSE +0 -0

xpk/core/scheduling.py CHANGED Viewed

@@ -33,8 +33,11 @@ from .system_characteristics import (
 from packaging.version import Version
 _SUB_SLICING_MINIMUM_KUEUE_VERSION = Version('0.13.0')
-_SUPER_SLICING_MINIMUM_KUEUE_VERSION = Version('0.14.0')
+_SUPER_SLICING_MINIMUM_KUEUE_VERSION = Version('0.15.2')
 _SUPER_SLICING_MAX_TOPOLOGY = (16, 24, 24)
+ONE_TO_ONE_REPLICA_NODE_POOL_ASSIGNMENT_ANNOTATION = (
+    'alpha.jobset.sigs.k8s.io/exclusive-topology: cloud.google.com/gke-nodepool'
+)
 class WorkloadScheduling(Enum):

xpk/core/scheduling_test.py CHANGED Viewed

@@ -208,7 +208,7 @@ SUPER_SLICING_CASE = SchedulingTestCase(
     cluster_system=_get_system_characteristics_or_die('tpu7x-4x4x4'),
     # 5 4x4x4 cubes:
     resources_config_map={'tpu7x-128': str(64 // 4 * 5)},
-    kueue_version='0.14.0',
+    kueue_version='0.15.2',
     super_slicing_feature_enabled=True,
     super_slicing_topology_set=True,
     num_slices=1,

xpk/core/system_characteristics.py CHANGED Viewed

@@ -131,6 +131,8 @@ class SystemCharacteristics:
     supports_super_slicing: Whether the Super-slicing feature is supported.
     requires_workload_policy: A boolean indicating if a GCE resource
       workload policy is required. This is automatically set to True for GPUs.
+    parallel_containers: The number of containers running on a single VM.
   """
   topology: str
@@ -146,6 +148,7 @@ class SystemCharacteristics:
   docker_platform: DockerPlatform
   requires_workload_policy: bool = False
   gpu_config: Optional[GpuConfig] = None
+  parallel_containers: int = 1
   def __post_init__(self):
     if self.accelerator_type == AcceleratorType.GPU:
@@ -239,6 +242,7 @@ def get_tpu_system_characteristics_map(
     default_topologies: set[str] | None = None,
     sub_slicing_topologies: set[str] | None = None,
     super_slicing_topologies: set[str] | None = None,
+    parallel_containers: int = 1,
 ) -> dict[str, SystemCharacteristics]:
   system_characteristics_map = {}
   default_topologies = default_topologies or set()
@@ -263,6 +267,7 @@ def get_tpu_system_characteristics_map(
         supports_super_slicing=topology in super_slicing_topologies,
         supports_accelerator_network_profile=supports_accelerator_network_profile,
         docker_platform=docker_platform,
+        parallel_containers=parallel_containers,
     )
     system_characteristics_map[f'{prefix}-{topology}'] = system
     if (
@@ -544,6 +549,7 @@ UserFacingNameToSystemCharacteristics = {
         tpu_type_requires_workload_policy=True,
         supports_accelerator_network_profile=False,
         docker_platform=AMD_PLATFORM,
+        parallel_containers=2,
         supported_topologies=generate_tpu_topologies(max_cubes=144),
         super_slicing_topologies=set(['4x4x4']),
         default_topologies=set([

xpk/core/telemetry.py CHANGED Viewed

@@ -30,7 +30,7 @@ from dataclasses import dataclass
 from .config import get_config, CLIENT_ID_KEY, SEND_TELEMETRY_KEY, __version__ as xpk_version
 from ..utils.execution_context import is_dry_run
 from ..utils.user_agent import get_user_agent
-from ..utils.feature_flags import FeatureFlags
+from ..utils.feature_flags import FeatureFlags, is_tester
 def should_send_telemetry():
@@ -114,6 +114,8 @@ def _clearcut_flush(file_path: str) -> None:
 class MetricsEventMetadataKey(Enum):
+  """Represents available metadata keys."""
   SESSION_ID = "XPK_SESSION_ID"
   DRY_RUN = "XPK_DRY_RUN"
   PYTHON_VERSION = "XPK_PYTHON_VERSION"
@@ -125,6 +127,7 @@ class MetricsEventMetadataKey(Enum):
   RUNNING_AS_PIP = "XPK_RUNNING_AS_PIP"
   RUNNING_FROM_SOURCE = "XPK_RUNNING_FROM_SOURCE"
   LATENCY_SECONDS = "XPK_LATENCY_SECONDS"
+  TESTER = "XPK_TESTER"
 @dataclass
@@ -230,6 +233,9 @@ def _get_base_event_metadata() -> dict[MetricsEventMetadataKey, str]:
       MetricsEventMetadataKey.RUNNING_FROM_SOURCE: str(
           _is_running_from_source()
       ).lower(),
+      MetricsEventMetadataKey.TESTER: str(
+          is_tester() or _is_trash_execution()
+      ).lower(),
   }
@@ -241,6 +247,10 @@ def _get_base_concord_event() -> dict[str, str]:
   }
+def _is_trash_execution() -> bool:
+  return os.getenv("TELEMETRY_TRASH_EXECUTION") == "true"
 def _is_running_as_pip() -> bool:
   return os.path.basename(sys.argv[0]) == "xpk"

xpk/core/telemetry_test.py CHANGED Viewed

@@ -30,7 +30,9 @@ def setup_mocks(mocker: MockerFixture):
   mocker.patch('time.time', side_effect=itertools.count())
   mocker.patch('platform.python_version', return_value='99.99.99')
   mocker.patch('os.path.basename', return_value='xpk.py')
+  mocker.patch('os.getenv', return_value='false')
   mocker.patch('os.path.abspath', return_value='/home/xpk_user')
+  mocker.patch('xpk.core.telemetry.is_tester', return_value=False)
   set_dry_run(False)
   get_config().set(CLIENT_ID_KEY, 'client_id')
   yield
@@ -76,6 +78,7 @@ def test_metrics_collector_logs_start_event_correctly():
           {'key': 'XPK_PYTHON_VERSION', 'value': '99.99.99'},
           {'key': 'XPK_RUNNING_AS_PIP', 'value': 'false'},
           {'key': 'XPK_RUNNING_FROM_SOURCE', 'value': 'true'},
+          {'key': 'XPK_TESTER', 'value': 'false'},
           {'key': 'XPK_COMMAND', 'value': 'test'},
           {'key': 'XPK_LATENCY_SECONDS', 'value': '0'},
       ],
@@ -107,6 +110,7 @@ def test_metrics_collector_logs_complete_event_correctly():
           {'key': 'XPK_PYTHON_VERSION', 'value': '99.99.99'},
           {'key': 'XPK_RUNNING_AS_PIP', 'value': 'false'},
           {'key': 'XPK_RUNNING_FROM_SOURCE', 'value': 'true'},
+          {'key': 'XPK_TESTER', 'value': 'false'},
           {'key': 'XPK_EXIT_CODE', 'value': '2'},
           {'key': 'XPK_LATENCY_SECONDS', 'value': '0'},
       ],
@@ -131,6 +135,7 @@ def test_metrics_collector_logs_custom_event_correctly():
           {'key': 'XPK_PYTHON_VERSION', 'value': '99.99.99'},
           {'key': 'XPK_RUNNING_AS_PIP', 'value': 'false'},
           {'key': 'XPK_RUNNING_FROM_SOURCE', 'value': 'true'},
+          {'key': 'XPK_TESTER', 'value': 'false'},
           {'key': 'XPK_PROVISIONING_MODE', 'value': 'flex'},
           {'key': 'XPK_LATENCY_SECONDS', 'value': '0'},
       ],
@@ -219,6 +224,40 @@ def test_metrics_collectors_logs_correct_running_from_source_value(
   assert _get_metadata_value(payload, 'XPK_RUNNING_FROM_SOURCE') == expected
+@pytest.mark.parametrize(
+    argnames='tester,expected',
+    argvalues=[
+        (True, 'true'),
+        (False, 'false'),
+    ],
+)
+def test_metrics_collectors_logs_correct_tester_value_for_is_tester_variable(
+    tester: bool, expected: str, mocker: MockerFixture
+):
+  mocker.patch('xpk.core.telemetry.is_tester', return_value=tester)
+  MetricsCollector.log_start(command='test')
+  payload = MetricsCollector.flush()
+  assert _get_metadata_value(payload, 'XPK_TESTER') == expected
+@pytest.mark.parametrize(
+    argnames='trash_execution,expected',
+    argvalues=[
+        ('true', 'true'),
+        ('false', 'false'),
+        ('', 'false'),
+        (None, 'false'),
+    ],
+)
+def test_metrics_collectors_logs_correct_tester_value_for_trash_variable(
+    trash_execution: str, expected: str, mocker: MockerFixture
+):
+  mocker.patch('os.getenv', return_value=trash_execution)
+  MetricsCollector.log_start(command='test')
+  payload = MetricsCollector.flush()
+  assert _get_metadata_value(payload, 'XPK_TESTER') == expected
 def _get_metadata_value(payload_str: str, key: str) -> str | None:
   payload = json.loads(payload_str)
   metadata = json.loads(payload['log_event'][0]['source_extension_json'])[

xpk/core/testing/commands_tester.py CHANGED Viewed

@@ -17,6 +17,8 @@ limitations under the License.
 import re
 from pytest_mock import MockerFixture
+from ..commands import FailedCommand
 class CommandsTester:
   """Tester class useful for mocking and asserting command runs."""
@@ -27,6 +29,7 @@ class CommandsTester:
       run_command_for_value_path: str | None = None,
       run_command_with_updates_path: str | None = None,
       run_command_with_updates_retry_path: str | None = None,
+      run_command_batch_path: str | None = None,
   ):
     self.__results: dict[re.Pattern, tuple[int, str]] = {}
     self.commands_history: list[str] = []
@@ -45,6 +48,11 @@ class CommandsTester:
           run_command_with_updates_retry_path,
           wraps=self.__fake_run_command_with_updates_retry,
       )
+    if run_command_batch_path:
+      mocker.patch(
+          run_command_batch_path,
+          wraps=self.__fake_run_command_batch,
+      )
   def set_result_for_command(
       self, result: tuple[int, str], *command_parts: str
@@ -111,6 +119,24 @@ class CommandsTester:
   ) -> tuple[int, str]:
     return self.__common_fake_run_command(command, (0, dry_run_return_val))
+  def __fake_run_command_batch(
+      self,
+      commands: list[str],
+      jobname: str,
+      per_command_name: list[str],
+      output_logs: list[str],
+  ) -> FailedCommand | None:
+    for i, command in enumerate(commands):
+      result = self.__common_fake_run_command(command, (0, ""))[0]
+      if result != 0:
+        return FailedCommand(
+            return_code=result,
+            name=per_command_name[i],
+            command=command,
+            logfile=output_logs[i],
+        )
+    return None
   # pylint: enable=unused-argument
   def __common_fake_run_command(

xpk/core/testing/commands_tester_test.py CHANGED Viewed

@@ -17,7 +17,7 @@ limitations under the License.
 import pytest
 from pytest_mock import MockerFixture
-from xpk.core.commands import run_command_for_value, run_command_with_updates_retry
+from xpk.core.commands import run_command_for_value, run_command_with_updates_retry, run_command_batch
 from xpk.core.testing.commands_tester import CommandsTester
@@ -31,6 +31,9 @@ def mock_commands(mocker: MockerFixture) -> CommandsTester:
       run_command_with_updates_retry_path=(
           "xpk.core.testing.commands_tester_test.run_command_with_updates_retry"
       ),
+      run_command_batch_path=(
+          "xpk.core.testing.commands_tester_test.run_command_batch"
+      ),
   )
@@ -54,6 +57,22 @@ def test_run_command_with_updates_retry_default_result(
   mock_commands.assert_command_run("cmd", "bar")
+def test_run_command_batch_default_result(
+    mock_commands: CommandsTester,
+):
+  result = run_command_batch(
+      commands=["cmd1 foo bar", "cmd2 foo bar"],
+      jobname="Test command",
+      per_command_name=["cmd1", "cmd2"],
+      output_logs=["log1", "log2"],
+  )
+  assert result is None
+  mock_commands.assert_command_run("foo bar", times=2)
+  mock_commands.assert_command_run("cmd1")
+  mock_commands.assert_command_run("cmd2")
 def test_set_result_for_command(mock_commands: CommandsTester):
   mock_commands.set_result_for_command((17, "Error!"), "cmd", "--err")

xpk/core/workload_decorators/rdma_decorator.py CHANGED Viewed

@@ -84,6 +84,12 @@ def add_volumes(job_manifest):
   volumes.append(
       {'name': 'gib', 'hostPath': {'path': '/home/kubernetes/bin/gib'}}
   )
+  volumes.append({
+      'name': 'dshm',
+      'emptyDir': {
+          'medium': 'Memory',
+      },
+  })
 def add_tolerations(job_manifest):
@@ -111,3 +117,6 @@ def update_gpu_containers(job_manifest):
       container['volumeMounts'].append(
           {'name': 'gib', 'mountPath': '/usr/local/gib'}
       )
+      container['volumeMounts'].append(
+          {'name': 'dshm', 'mountPath': '/dev/shm'}
+      )

xpk/parser/cluster.py CHANGED Viewed

@@ -338,7 +338,10 @@ def set_cluster_create_ray_parser(cluster_create_ray_parser: ArgumentParser):
   add_resource_limits(cluster_create_resource_limits)
   cluster_create_ray_parser.set_defaults(
-      func=cluster_create_ray_cluster, sub_slicing=False, super_slicing=False
+      func=cluster_create_ray_cluster,
+      sub_slicing=False,
+      super_slicing=False,
+      num_cubes=None,
   )
@@ -503,6 +506,13 @@ def set_cluster_adapt_parser(cluster_adapt_parser: ArgumentParser):
   )
   add_driver_arguments(cluster_adapt_optional_arguments)
   add_shared_arguments(cluster_adapt_optional_arguments)
+  add_resource_limits(cluster_adapt_optional_arguments)
+  if FeatureFlags.SUB_SLICING_ENABLED:
+    add_cluster_create_sub_slicing_arguments(cluster_adapt_optional_arguments)
+  if FeatureFlags.SUPER_SLICING_ENABLED:
+    add_cluster_create_super_slicing_arguments(cluster_adapt_optional_arguments)
   cluster_adapt_capacity_arguments = cluster_adapt_parser.add_argument_group(
       'Capacity Arguments', 'Arguments related to capacity for cluster create.'

xpk/parser/cluster_test.py CHANGED Viewed

@@ -15,8 +15,8 @@ limitations under the License.
 """
 import argparse
-from xpk.parser.cluster import set_cluster_create_parser, set_cluster_create_pathways_parser, set_cluster_create_ray_parser
 import pytest
+from xpk.parser.cluster import set_cluster_create_parser, set_cluster_create_pathways_parser, set_cluster_create_ray_parser, set_cluster_adapt_parser
 from ..utils.feature_flags import FeatureFlags
@@ -261,3 +261,61 @@ def test_cluster_create_num_slices_has_no_default_if_superslicing_feature():
   )
   assert args.num_slices is None
+def test_cluster_adapt_sub_slicing_is_hidden_with_flag_off():
+  FeatureFlags.SUB_SLICING_ENABLED = False
+  parser = argparse.ArgumentParser()
+  set_cluster_adapt_parser(parser)
+  help_str = parser.format_help()
+  assert "--sub-slicing" not in help_str
+def test_cluster_adapt_sub_slicing_is_shown_with_flag_on():
+  FeatureFlags.SUB_SLICING_ENABLED = True
+  parser = argparse.ArgumentParser()
+  set_cluster_adapt_parser(parser)
+  help_str = parser.format_help()
+  assert "--sub-slicing" in help_str
+def test_cluster_adapt_super_slicing_is_hidden_with_flag_off():
+  FeatureFlags.SUPER_SLICING_ENABLED = False
+  parser = argparse.ArgumentParser()
+  set_cluster_adapt_parser(parser)
+  help_str = parser.format_help()
+  assert "--super-slicing" not in help_str
+def test_cluster_adapt_super_slicing_is_shown_with_flag_on():
+  FeatureFlags.SUPER_SLICING_ENABLED = True
+  parser = argparse.ArgumentParser()
+  set_cluster_adapt_parser(parser)
+  help_str = parser.format_help()
+  assert "--super-slicing" in help_str
+def test_cluster_adapt_memory_limit_is_shown():
+  parser = argparse.ArgumentParser()
+  set_cluster_adapt_parser(parser)
+  help_str = parser.format_help()
+  assert "--memory-limit" in help_str
+def test_cluster_adapt_cpu_limit_is_shown():
+  parser = argparse.ArgumentParser()
+  set_cluster_adapt_parser(parser)
+  help_str = parser.format_help()
+  assert "--cpu-limit" in help_str

xpk/parser/common.py CHANGED Viewed

@@ -83,6 +83,17 @@ def add_shared_arguments(
       help='GCE project name, defaults to "gcloud config project."',
       required=required,
   )
+  custom_parser_or_group.add_argument(
+      '--project-number',
+      type=str,
+      default=None,
+      help=(
+          'GCE project number. If provided, skips the Cloud Resource Manager'
+          ' API call to translate project ID to project number. Useful when'
+          ' the API is not enabled or you lack permissions.'
+      ),
+      required=False,
+  )
   custom_parser_or_group.add_argument(
       '--zone',
       type=str,

xpk/parser/storage.py CHANGED Viewed

@@ -127,7 +127,7 @@ def add_storage_attach_parser(
       type=str,
       help=(
           '(optional) Name of the bucket. If not set, then the "name" parameter'
-          ' is infered as a bucket name.'
+          ' is inferred as a bucket name.'
       ),
   )
   gcsfuse_args.add_argument(
@@ -165,7 +165,7 @@ def add_storage_attach_parser(
       type=str,
       help=(
           '(optional) Name of the filestore instance. If not set, then the'
-          ' "name" parameter is infered as an instance name.'
+          ' "name" parameter is inferred as an instance name.'
       ),
   )
@@ -238,7 +238,7 @@ def add_storage_create_parser(storage_subcommands_parser: Subcommands) -> None:
       type=str,
       help=(
           '(optional) Name of the filestore instance. If not set, then the'
-          ' "name" parameter is infered as an instance name.'
+          ' "name" parameter is inferred as an instance name.'
       ),
   )
   opt_args.add_argument(

xpk/utils/console.py CHANGED Viewed

@@ -51,7 +51,7 @@ def ask_for_user_consent(
     question: str, default_option: Literal["Y", "N"] = "N"
 ) -> bool:
   """Prompts user with the given question, asking for a yes/no answer and returns a relevant boolean.
-  Important: immediatelly returns `True` in quiet mode!
+  Important: immediately returns `True` in quiet mode!
   Example prompt for `question='Continue?'`: `[XPK] Continue? (y/N): `.

xpk/utils/feature_flags.py CHANGED Viewed

@@ -17,20 +17,24 @@ limitations under the License.
 import os
+def is_tester() -> bool:
+  """Returns true if user is a tester."""
+  return os.getenv("XPK_TESTER", "").lower() == "true"
 def _get_boolean_flag(flag: str, default: bool) -> bool:
   experiment_value = os.getenv(flag, "").lower()
   if experiment_value in ["true", "false"]:
     return experiment_value == "true"
-  xpk_tester = os.getenv("XPK_TESTER", "").lower() == "true"
-  return xpk_tester or default
+  return is_tester() or default
 class _FeatureFlags:
   SUB_SLICING_ENABLED = _get_boolean_flag("SUB_SLICING_ENABLED", default=False)
   TELEMETRY_ENABLED = _get_boolean_flag("TELEMETRY_ENABLED", default=True)
   SUPER_SLICING_ENABLED = _get_boolean_flag(
-      "SUPER_SLICING_ENABLED", default=False
+      "SUPER_SLICING_ENABLED", default=True
   )

{xpk-1.0.0.dist-info → xpk-1.1.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: xpk
-Version: 1.0.0
+Version: 1.1.0
 Summary: xpk helps Cloud developers to orchestrate training jobs on accelerators on GKE.
 Author-email: XPK team <xpk-code-reviewers@google.com>
 License: Apache-2.0
@@ -93,28 +93,41 @@ XPK supports a variety of hardware accelerators.
 XPK also supports the following [Google Cloud Storage solutions](./docs/usage/storage.md):
-| Storage Type                               | Documentation                                                                            |
-|--------------------------------------------|------------------------------------------------------------------------------------------|
-| Cloud Storage FUSE                         | [docs](./docs/usage/storage.md#fuse)                                                     |
-| Filestore                                  | [docs](./docs/usage/storage.md#filestore)                                                |
-| Parallelstore                              | [docs](./docs/usage/storage.md#parallelstore)                                            |
-| Block storage (Persistent Disk, Hyperdisk) | [docs](./docs/usage/storage.md#block-storage-persistent-disk-hyperdisk)                  |
+| Storage Type                               | Documentation                                                           |
+| ------------------------------------------ | ----------------------------------------------------------------------- |
+| Cloud Storage FUSE                         | [docs](./docs/usage/storage.md#fuse)                                    |
+| Filestore                                  | [docs](./docs/usage/storage.md#filestore)                               |
+| Parallelstore                              | [docs](./docs/usage/storage.md#parallelstore)                           |
+| Block storage (Persistent Disk, Hyperdisk) | [docs](./docs/usage/storage.md#block-storage-persistent-disk-hyperdisk) |
 # Documentation
-* [Permissions](./docs/permissions.md)
-* [Installation](./docs/installation.md)
-* Usage:
-  * [Clusters](./docs/usage/clusters.md)
-    * [GPU](./docs/usage/gpu.md)
-    * [CPU](./docs/usage/cpu.md)
-    * [Autoprovisioning](./docs/usage/autoprovisioning.md)
-  * [Workloads](./docs/usage/workloads.md)
-    * [Docker](./docs/usage/docker.md)
-  * [Storage](./docs/usage/storage.md)
-  * [Advanced](./docs/usage/advanced.md)
-  * [Inspector](./docs/usage/inspector.md)
-* [Troubleshooting](./docs/troubleshooting.md)
+- [Permissions](./docs/permissions.md)
+- [Installation](./docs/installation.md)
+- Usage:
+  - [Clusters](./docs/usage/clusters.md)
+    - [GPU](./docs/usage/gpu.md)
+    - [CPU](./docs/usage/cpu.md)
+    - [Autoprovisioning](./docs/usage/autoprovisioning.md)
+  - [Workloads](./docs/usage/workloads.md)
+    - [Docker](./docs/usage/docker.md)
+  - [Storage](./docs/usage/storage.md)
+  - [Advanced](./docs/usage/advanced.md)
+  - [Inspector](./docs/usage/inspector.md)
+- [Troubleshooting](./docs/troubleshooting.md)
+# Dependencies
+| Dependency                                                                                                   | When used                   |
+| ------------------------------------------------------------------------------------------------------------ | --------------------------- |
+| [Google Cloud SDK (gcloud)](https://cloud.google.com/sdk/docs/install)                                       | _always_                    |
+| [kubectl](https://cloud.google.com/kubernetes-engine/docs/how-to/cluster-access-for-kubectl#install_kubectl) | _always_                    |
+| [ClusterToolkit](https://github.com/GoogleCloudPlatform/cluster-toolkit)                                     | Provisioning GPU clusters   |
+| [Kueue](https://github.com/kubernetes-sigs/kueue)                                                            | Scheduling workloads        |
+| [JobSet](https://github.com/kubernetes-sigs/jobset)                                                          | Workload creation           |
+| [Docker](https://docs.docker.com/engine/install/)                                                            | Building workload container |
+| [CoreDNS](https://github.com/coredns/deployment/tree/master/kubernetes)                                      | Cluster set up              |
+| [PathwaysJob](https://github.com/google/pathways-job)                                                        | Running Pathways workloads  |
 # Privacy notice
@@ -129,11 +142,14 @@ XPK telemetry overall is handled in accordance with the [Google Privacy Policy](
 you use XPK to interact with or utilize GCP Services, your information is handled in accordance with the
 [Google Cloud Privacy Notice](https://cloud.google.com/terms/cloud-privacy-notice).
 # Contributing
 Please read [`contributing.md`](./docs/contributing.md) for details on our code of conduct, and the process for submitting pull requests to us.
+# Get involved
+We'd love to hear from you! If you have questions or want to discuss ideas, join us on [GitHub Discussions](https://github.com/AI-Hypercomputer/xpk/discussions). Found a bug or have a feature request? Please let us know on [GitHub Issues](https://github.com/AI-Hypercomputer/xpk/issues).
 # License
 This project is licensed under the Apache License 2.0 - see the [`LICENSE`](./LICENSE) file for details

xpk 1.0.0__py3-none-any.whl → 1.1.0__py3-none-any.whl

xpk 1.0.0__py3-none-any.whl → 1.1.0__py3-none-any.whl