PyPI - xpk - Versions diffs - 0.12.0__py3-none-any.whl → 0.14.0__py3-none-any.whl - Mend

xpk 0.12.0__py3-none-any.whl → 0.14.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (68)

xpk/commands/batch.py +17 -10
xpk/commands/cluster.py +137 -123
xpk/commands/cluster_gcluster.py +77 -14
xpk/commands/cluster_gcluster_test.py +177 -0
xpk/commands/common.py +13 -27
xpk/commands/info.py +11 -9
xpk/commands/inspector.py +22 -11
xpk/commands/job.py +53 -9
xpk/commands/kind.py +38 -40
xpk/commands/kjob_common.py +4 -4
xpk/commands/run.py +9 -2
xpk/commands/shell.py +13 -10
xpk/commands/storage.py +26 -2
xpk/commands/version.py +0 -4
xpk/commands/workload.py +58 -30
xpk/core/blueprint/blueprint_generator.py +4 -40
xpk/core/blueprint/blueprint_test.py +0 -6
xpk/core/capacity.py +6 -5
xpk/core/cluster.py +96 -195
xpk/core/cluster_private.py +9 -12
xpk/core/commands.py +21 -25
xpk/core/config.py +1 -1
xpk/core/docker_image.py +17 -9
xpk/core/docker_resources.py +9 -4
xpk/core/gcloud_context.py +26 -2
xpk/core/gcloud_context_test.py +96 -0
xpk/core/gcluster_manager.py +0 -3
xpk/core/jobset.py +5 -8
xpk/core/kjob.py +19 -29
xpk/core/kueue_manager.py +383 -0
xpk/core/kueue_manager_test.py +542 -0
xpk/core/monitoring.py +1 -1
xpk/core/nap.py +11 -16
xpk/core/network.py +18 -19
xpk/core/nodepool.py +65 -71
xpk/core/nodepool_test.py +198 -1
xpk/core/pathways.py +9 -5
xpk/core/ray.py +11 -15
xpk/core/resources.py +15 -10
xpk/core/scheduling.py +23 -1
xpk/core/scheduling_test.py +31 -0
xpk/core/system_characteristics.py +335 -229
xpk/core/vertex.py +1 -1
xpk/core/workload.py +7 -8
xpk/main.py +3 -2
xpk/parser/cluster.py +50 -0
xpk/parser/cluster_test.py +66 -0
xpk/parser/common.py +11 -0
xpk/parser/workload.py +62 -25
xpk/parser/workload_test.py +82 -0
xpk/utils/execution_context.py +28 -0
xpk/utils/feature_flags.py +28 -0
xpk/utils/file.py +25 -10
xpk/utils/kueue.py +20 -0
xpk/utils/network.py +4 -0
xpk/utils/templates.py +2 -0
xpk/utils/topology.py +37 -0
xpk/utils/topology_test.py +43 -0
xpk/utils/validation.py +79 -55
xpk/utils/validation_test.py +37 -0
{xpk-0.12.0.dist-info → xpk-0.14.0.dist-info}/METADATA +6 -1
xpk-0.14.0.dist-info/RECORD +112 -0
xpk/core/kueue.py +0 -545
xpk-0.12.0.dist-info/RECORD +0 -100
{xpk-0.12.0.dist-info → xpk-0.14.0.dist-info}/WHEEL +0 -0
{xpk-0.12.0.dist-info → xpk-0.14.0.dist-info}/entry_points.txt +0 -0
{xpk-0.12.0.dist-info → xpk-0.14.0.dist-info}/licenses/LICENSE +0 -0
{xpk-0.12.0.dist-info → xpk-0.14.0.dist-info}/top_level.txt +0 -0

xpk/core/commands.py CHANGED Viewed

@@ -18,14 +18,14 @@ import datetime
 import subprocess
 import sys
 import time
-from argparse import Namespace
 from ..utils.objects import chunks
 from ..utils.file import make_tmp_files, write_tmp_file
 from ..utils.console import xpk_print
+from ..utils.execution_context import is_dry_run
-def run_commands(commands, jobname, per_command_name, batch=10, dry_run=False):
+def run_commands(commands, jobname, per_command_name, batch=10):
   """Run commands in groups of `batch`.
   Args:
@@ -33,7 +33,6 @@ def run_commands(commands, jobname, per_command_name, batch=10, dry_run=False):
     jobname: the name of the job.
     per_command_name: list of command names.
     batch: number of commands to run in parallel.
-    dry_run: enables dry_run if set to true.
   Returns:
     0 if successful and 1 otherwise.
@@ -46,7 +45,7 @@ def run_commands(commands, jobname, per_command_name, batch=10, dry_run=False):
       f'Breaking up a total of {len(commands)} commands into'
       f' {len(commands_batched)} batches'
   )
-  if dry_run:
+  if is_dry_run():
     xpk_print('Pretending all the jobs succeeded')
     return 0
@@ -78,14 +77,13 @@ def run_command_batch(commands, jobname, per_command_name, output_logs):
     The max return code and a list of all the return codes.
   """
+  files = [open(f, 'w', encoding='utf-8') for f in output_logs]
   children = []
   start_time = datetime.datetime.now()
-  for i, command in enumerate(commands):
+  for command, file in zip(commands, files):
     children.append(
         # subprocess managed by list pylint: disable=consider-using-with
-        subprocess.Popen(
-            command, stdout=output_logs[i], stderr=output_logs[i], shell=True
-        )
+        subprocess.Popen(command, stdout=file, stderr=file, shell=True)
     )
   while True:
@@ -99,7 +97,7 @@ def run_command_batch(commands, jobname, per_command_name, output_logs):
       slow_worker_text = per_command_name[slow_worker_index]
       slow_str = (
           f', task {slow_worker_text} still working, logfile'
-          f' {output_logs[slow_worker_index].name}'
+          f' {output_logs[slow_worker_index]}'
       )
     else:
       slow_str = ''
@@ -116,7 +114,7 @@ def run_command_batch(commands, jobname, per_command_name, output_logs):
       )
       xpk_print(
           f'Failure is {per_command_name[failing_index]}'
-          f' and logfile {output_logs[failing_index].name}'
+          f' and logfile {output_logs[failing_index]}'
       )
       for child in children:
         child.terminate()
@@ -126,18 +124,21 @@ def run_command_batch(commands, jobname, per_command_name, output_logs):
       break
     time.sleep(1)
+  for file in files:
+    file.close()
   return max_returncode, returncodes
 def run_command_with_updates_retry(
-    command, task, args, verbose=True, num_retry_attempts=5, wait_seconds=10
+    command, task, verbose=True, num_retry_attempts=5, wait_seconds=10
 ) -> int:
   """Generic run commands function with updates and retry logic.
   Args:
     command: command to execute
     task: user-facing name of the task
-    args: user provided arguments for running the command.
     verbose: shows stdout and stderr if set to true. Set to True by default.
     num_retry_attempts: number of attempts to retry the command.
         This has a default value in the function arguments.
@@ -157,23 +158,22 @@ def run_command_with_updates_retry(
       time.sleep(wait_seconds)
     i += 1
     xpk_print(f'Try {i}: {task}')
-    return_code = run_command_with_updates(command, task, args, verbose=verbose)
+    return_code = run_command_with_updates(command, task, verbose=verbose)
   return return_code
-def run_command_with_updates(command, task, global_args, verbose=True) -> int:
+def run_command_with_updates(command, task, verbose=True) -> int:
   """Generic run commands function with updates.
   Args:
     command: command to execute
     task: user-facing name of the task
-    global_args: user provided arguments for running the command.
     verbose: shows stdout and stderr if set to true. Set to True by default.
   Returns:
     0 if successful and 1 otherwise.
   """
-  if global_args.dry_run:
+  if is_dry_run():
     xpk_print(
         f'Task: `{task}` is implemented by the following command'
         ' not running since it is a dry run.'
@@ -223,7 +223,6 @@ def run_command_with_updates(command, task, global_args, verbose=True) -> int:
 def run_command_for_value(
     command,
     task,
-    global_args,
     dry_run_return_val='0',
     print_timer=False,
     hide_error=False,
@@ -236,7 +235,6 @@ def run_command_for_value(
   Args:
     command: user provided command to run.
     task: user provided task name for running the command.
-    global_args: user provided arguments for running the command.
     dry_run_return_val: return value of this command for dry run.
     print_timer: print out the time the command is running.
     hide_error: hide the error from the command output upon success.
@@ -246,7 +244,7 @@ def run_command_for_value(
     int: return_code, default is 0
     str: return_val, default is '0'
   """
-  if global_args is not None and global_args.dry_run:
+  if is_dry_run():
     xpk_print(
         f'Task: `{task}` is implemented by the following command'
         ' not running since it is a dry run.'
@@ -302,7 +300,6 @@ def run_command_for_value(
 def run_command_with_full_controls(
     command: str,
     task: str,
-    global_args: Namespace,
     instructions: str | None = None,
 ) -> int:
   """Run command in current shell with system out, in and error handles. Wait
@@ -311,13 +308,12 @@ def run_command_with_full_controls(
   Args:
     command: command to execute
     task: user-facing name of the task
-    global_args: user provided arguments for running the command.
     verbose: shows stdout and stderr if set to true. Set to True by default.
   Returns:
     0 if successful and 1 otherwise.
   """
-  if global_args.dry_run:
+  if is_dry_run():
     xpk_print(
         f'Task: `{task}` is implemented by the following command'
         ' not running since it is a dry run.'
@@ -349,8 +345,8 @@ def run_command_with_full_controls(
   return return_code
-def run_kubectl_apply(yml_string: str, task: str, args: Namespace) -> int:
+def run_kubectl_apply(yml_string: str, task: str) -> int:
   tmp = write_tmp_file(yml_string)
-  command = f'kubectl apply -f {str(tmp.file.name)}'
-  err_code = run_command_with_updates(command, task, args)
+  command = f'kubectl apply -f {str(tmp)}'
+  err_code = run_command_with_updates(command, task)
   return err_code

xpk/core/config.py CHANGED Viewed

@@ -22,7 +22,7 @@ from ..utils import file
 from ..utils.console import xpk_print
 # This is the version for XPK PyPI package
-__version__ = 'v0.12.0'
+__version__ = 'v0.14.0'
 XPK_CURRENT_VERSION = __version__
 XPK_CONFIG_FILE = os.path.expanduser('~/.config/xpk/config.yaml')

xpk/core/docker_image.py CHANGED Viewed

@@ -21,6 +21,7 @@ import string
 from ..utils.console import xpk_exit, xpk_print
 from ..utils.file import write_tmp_file
+from ..utils.execution_context import is_dry_run
 from .commands import run_command_with_updates
 DEFAULT_DOCKER_IMAGE = 'python:3.10'
@@ -48,7 +49,7 @@ def validate_docker_image(docker_image, args) -> int:
       f'gcloud container images describe {docker_image} --project {project}'
   )
   return_code = run_command_with_updates(
-      command, 'Validate Docker Image', args, verbose=False
+      command, 'Validate Docker Image', verbose=False
   )
   if return_code != 0:
     xpk_print(
@@ -75,7 +76,9 @@ def build_docker_image_from_base_image(args, verbose=True) -> tuple[int, str]:
   """
   # Pick a name for the docker image.
-  docker_image_prefix = os.getenv('USER', 'unknown')
+  docker_image_prefix = (
+      'dry-run' if is_dry_run() else os.getenv('USER', 'unknown')
+  )
   docker_name = f'{docker_image_prefix}-runner'
   script_dir_dockerfile = """FROM {base_docker_image}
@@ -94,14 +97,13 @@ def build_docker_image_from_base_image(args, verbose=True) -> tuple[int, str]:
   )
   tmp = write_tmp_file(docker_file)
   docker_build_command = (
-      f'docker buildx build --platform={PLATFORM} -f {str(tmp.file.name)} -t'
+      f'docker buildx build --platform={PLATFORM} -f {str(tmp)} -t'
       f' {docker_name} {args.script_dir}'
   )
   xpk_print(f'Building {args.script_dir} into docker image.')
   return_code = run_command_with_updates(
       docker_build_command,
       'Building script_dir into docker image',
-      args,
       verbose=verbose,
   )
   if return_code != 0:
@@ -114,10 +116,16 @@ def build_docker_image_from_base_image(args, verbose=True) -> tuple[int, str]:
   # Pick a randomly generated `tag_length` character docker tag.
   tag_length = 4
-  tag_random_prefix = ''.join(
-      random.choices(string.ascii_lowercase, k=tag_length)
+  tag_random_prefix = (
+      'prefix'
+      if is_dry_run()
+      else ''.join(random.choices(string.ascii_lowercase, k=tag_length))
+  )
+  tag_datetime = (
+      'current'
+      if is_dry_run()
+      else datetime.datetime.now().strftime('%Y-%m-%d-%H-%M-%S')
   )
-  tag_datetime = datetime.datetime.now().strftime('%Y-%m-%d-%H-%M-%S')
   tag_name = f'{tag_random_prefix}-{tag_datetime}'
   cloud_docker_image = f'gcr.io/{args.project}/{docker_name}:{tag_name}'
   xpk_print(f'Adding Docker Image: {cloud_docker_image} to {args.project}')
@@ -125,7 +133,7 @@ def build_docker_image_from_base_image(args, verbose=True) -> tuple[int, str]:
   # Tag the docker image.
   tag_docker_image_command = f'docker tag {docker_name} {cloud_docker_image}'
   return_code = run_command_with_updates(
-      tag_docker_image_command, 'Tag Docker Image', args, verbose=verbose
+      tag_docker_image_command, 'Tag Docker Image', verbose=verbose
   )
   if return_code != 0:
     xpk_print(
@@ -138,7 +146,7 @@ def build_docker_image_from_base_image(args, verbose=True) -> tuple[int, str]:
   # Upload image to Artifact Registry.
   upload_docker_image_command = f'docker push {cloud_docker_image}'
   return_code = run_command_with_updates(
-      upload_docker_image_command, 'Upload Docker Image', args, verbose=verbose
+      upload_docker_image_command, 'Upload Docker Image', verbose=verbose
   )
   if return_code != 0:
     xpk_print(

xpk/core/docker_resources.py CHANGED Viewed

@@ -20,6 +20,7 @@ from .capacity import H100_DEVICE_TYPE, H100_MEGA_DEVICE_TYPE, H200_DEVICE_TYPE
 from .cluster import setup_k8s_env
 from .storage import GCS_FUSE_TYPE, GCP_FILESTORE_TYPE, PARALLELSTORE_TYPE, GCE_PD_TYPE, LUSTRE_TYPE, Storage, get_storages_to_mount
 from .system_characteristics import AcceleratorType, SystemCharacteristics
+from ..utils.execution_context import is_dry_run
 def get_main_container_resources(
@@ -272,8 +273,10 @@ def get_volumes(args, system: SystemCharacteristics) -> str:
               - name: shared-data
               """
-  storages: list[Storage] = get_storages_to_mount(
-      setup_k8s_env(args), args.storage
+  storages: list[Storage] = (
+      []
+      if is_dry_run()
+      else get_storages_to_mount(setup_k8s_env(args), args.storage)
   )
   for storage in storages:
     if storage.type in {
@@ -325,8 +328,10 @@ def get_volume_mounts(args, system: SystemCharacteristics) -> str:
   elif system.accelerator_type == AcceleratorType['GPU']:
     volume_mount_yaml = ''
-  storages: list[Storage] = get_storages_to_mount(
-      setup_k8s_env(args), args.storage
+  storages: list[Storage] = (
+      []
+      if is_dry_run()
+      else get_storages_to_mount(setup_k8s_env(args), args.storage)
   )
   for storage in storages:
     if storage.type in {

xpk/core/gcloud_context.py CHANGED Viewed

@@ -18,8 +18,9 @@ import subprocess
 import sys
 from dataclasses import dataclass
-from ..utils.console import xpk_print
+from ..utils.console import xpk_print, xpk_exit
 from .commands import run_command_for_value
+from functools import lru_cache
 def get_project():
@@ -85,9 +86,33 @@ def zone_to_region(zone: str) -> str:
      The region name.
   """
   zone_terms = zone.split('-')
+  if len(zone_terms) != 2 and len(zone_terms) != 3:
+    raise ValueError(f'Invalid zone name: {zone}')
   return zone_terms[0] + '-' + zone_terms[1]
+@lru_cache()
+def get_cluster_location(project: str, name: str, zone: str) -> str:
+  """Helper function to resolve location for a given cluster"""
+  return_code, result = run_command_for_value(
+      command=(
+          'gcloud container clusters list '
+          f'--project={project} '
+          f'--filter=name={name} '
+          '--format="value(location)"'
+      ),
+      task='Find cluster region or zone',
+      dry_run_return_val=zone_to_region(zone),
+  )
+  if return_code != 0:
+    xpk_print('Error: Unable to determine cluster region or zone')
+    xpk_exit(return_code)
+  regions = result.strip().splitlines()
+  return zone if zone in regions else zone_to_region(zone)
 @dataclass
 class GkeServerConfig:
   """Stores the valid gke versions based on gcloud recommendations."""
@@ -139,7 +164,6 @@ def get_gke_server_config(args) -> tuple[int, GkeServerConfig | None]:
     return_code, cmd_output = run_command_for_value(
         command,
         command_description,
-        args,
         hide_error=True,
     )
     if return_code != 0:

xpk/core/gcloud_context_test.py ADDED Viewed

@@ -0,0 +1,96 @@
+"""
+Copyright 2025 Google LLC
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+     https://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+import pytest
+from .gcloud_context import get_cluster_location, zone_to_region
+def test_zone_to_region_raises_when_zone_is_invalid():
+  with pytest.raises(ValueError):
+    zone_to_region("us")
+def test_zone_to_region_returns_region_when_region_given():
+  assert zone_to_region("us-central1") == "us-central1"
+def test_zone_to_region_returns_region_when_zone_is_valid():
+  assert zone_to_region("us-central1-a") == "us-central1"
+def test_get_cluster_location_returns_cluster_region_when_cluster_is_regional(
+    mocker,
+):
+  mocker.patch(
+      "xpk.core.gcloud_context.run_command_for_value",
+      return_value=(0, "us-central1"),
+  )
+  result = get_cluster_location(
+      project="project1", name="name1", zone="us-central1-a"
+  )
+  assert result == "us-central1"
+def test_get_cluster_location_returns_cluster_zone_when_both_regional_and_zonal_clusters_exist(
+    mocker,
+):
+  mocker.patch(
+      "xpk.core.gcloud_context.run_command_for_value",
+      return_value=(0, "us-central1\nus-central1-a"),
+  )
+  result = get_cluster_location(
+      project="project2", name="name2", zone="us-central1-a"
+  )
+  assert result == "us-central1-a"
+def test_get_cluster_location_returns_given_zone_converted_to_region_when_cluster_is_not_found(
+    mocker,
+):
+  mocker.patch(
+      "xpk.core.gcloud_context.run_command_for_value", return_value=(0, "")
+  )
+  result = get_cluster_location(
+      project="project3", name="name3", zone="us-central1-a"
+  )
+  assert result == "us-central1"
+def test_get_cluster_location_caches_previous_command_result(mocker):
+  mock = mocker.patch(
+      "xpk.core.gcloud_context.run_command_for_value", return_value=(0, "")
+  )
+  get_cluster_location(project="project4", name="name4", zone="us-central1-a")
+  assert mock.call_count == 1
+def test_get_cluster_location_invokes_command_for_different_input_args(mocker):
+  mock = mocker.patch(
+      "xpk.core.gcloud_context.run_command_for_value", return_value=(0, "")
+  )
+  get_cluster_location(project="project5", name="name5", zone="us-central1-a")
+  get_cluster_location(project="project6", name="name6", zone="us-central1-a")
+  assert mock.call_count == 2

xpk/core/gcluster_manager.py CHANGED Viewed

@@ -27,9 +27,6 @@ blueprint_file_name = 'xpk_blueprint.yaml'
 deployment_module = '/out/xpk-deployment'
 a3_utils_dir_name = 'a3-mega-xpk'
 config_map_repo_path = 'src/xpk/blueprints/a3-mega-xpk/config-map.yaml.tftpl'
-kueue_config_repo_path = (
-    'src/xpk/blueprints/a3-mega-xpk/kueue-xpk-configuration.yaml.tftpl'
-)
 class GclusterManager:

xpk/core/jobset.py CHANGED Viewed

@@ -18,7 +18,7 @@ import math
 from ..utils.console import xpk_exit, xpk_print
 from ..utils.file import write_tmp_file
-from ..core.kueue import (
+from ..core.kueue_manager import (
     MEMORY_SIZE_PER_VM,
     MIN_MEMORY_LIMIT_SIZE,
 )
@@ -110,19 +110,16 @@ spec:
 """
-def update_jobset_resources_if_necessary(args):
+def update_jobset_resources_if_necessary():
   """Update the jobset manifest to increase the resources for the jobset controller manager.
-  Args:
-    args: user provided arguments for running the command.
   Returns:
     0 if successful and 1 otherwise.
   """
   # Get total number of nodes
   cmd_total_node_num = 'kubectl get node --no-headers | wc -l'
   return_code, out = run_command_for_value(
-      cmd_total_node_num, 'Count total nodes', args
+      cmd_total_node_num, 'Count total nodes'
   )
   if return_code != 0:
     xpk_exit(1)
@@ -134,10 +131,10 @@ def update_jobset_resources_if_necessary(args):
       memory_limit_size=new_memory_limit,
   )
   tmp = write_tmp_file(yml_string)
-  command = f'kubectl apply -f {str(tmp.file.name)}'
+  command = f'kubectl apply -f {str(tmp)}'
   task = 'Updating jobset Controller Manager resources'
-  return_code = run_command_with_updates_retry(command, task, args)
+  return_code = run_command_with_updates_retry(command, task)
   if return_code != 0:
     xpk_print(f'{task} returned ERROR {return_code}')
   return return_code

xpk/core/kjob.py CHANGED Viewed

@@ -23,6 +23,7 @@ from kubernetes.client import ApiClient
 from kubernetes.client.rest import ApiException
 from ..utils import templates
+from ..utils.execution_context import is_dry_run
 from ..utils.console import xpk_exit, xpk_print
 from .capacity import H100_DEVICE_TYPE, H100_MEGA_DEVICE_TYPE, H200_DEVICE_TYPE
 from .cluster import DEFAULT_NAMESPACE, XPK_SA, setup_k8s_env
@@ -166,8 +167,8 @@ Kueue_TAS_annotation = "kueue.x-k8s.io/podset-preferred-topology=cloud.google.co
 default_interface_annotation = "networking.gke.io/default-interface=eth0"
-def get_a4_pod_template_annotations(args) -> tuple[str, str]:
-  sub_networks = get_cluster_subnetworks(args)
+def get_a4_pod_template_annotations() -> tuple[str, str]:
+  sub_networks = get_cluster_subnetworks()
   interfaces_key, interfaces_value = rdma_decorator.get_interfaces_entry(
       sub_networks
   )
@@ -178,8 +179,8 @@ def get_a4_pod_template_annotations(args) -> tuple[str, str]:
   )
-def get_a3ultra_pod_template_annotations(args: Namespace) -> tuple[str, str]:
-  sub_networks = get_cluster_subnetworks(args)
+def get_a3ultra_pod_template_annotations() -> tuple[str, str]:
+  sub_networks = get_cluster_subnetworks()
   interfaces_key, interfaces_value = rdma_decorator.get_interfaces_entry(
       sub_networks
   )
@@ -190,11 +191,9 @@ def get_a3ultra_pod_template_annotations(args: Namespace) -> tuple[str, str]:
   )
-def get_a3mega_pod_template_annotations(
-    args: Namespace,
-) -> tuple[str, str, str]:
+def get_a3mega_pod_template_annotations() -> tuple[str, str, str]:
   """Adds or updates annotations in the Pod template."""
-  sub_networks = get_cluster_subnetworks(args)
+  sub_networks = get_cluster_subnetworks()
   tcpxo_deamon_key, tcpxo_deamon_paths = get_tcpxo_deamon_entry()
   interfaces_key, interfaces_value = tcpxo_decorator.get_interfaces_entry(
       sub_networks
@@ -204,16 +203,14 @@ def get_a3mega_pod_template_annotations(
   return tcpxo, interfaces, default_interface_annotation
-def verify_kjob_installed(args: Namespace) -> int:
+def verify_kjob_installed() -> int:
   """Check if kjob is installed. If not provide user with proper communicate and exit.
-  Args:
-    args - user provided arguments.
   Returns:
     error code > if kjob not installed, otherwise 0
   """
   command = "kubectl-kjob help"
   task = "Verify kjob installation "
-  verify_kjob_installed_code, _ = run_command_for_value(command, task, args)
+  verify_kjob_installed_code, _ = run_command_for_value(command, task)
   if verify_kjob_installed_code == 0:
     xpk_print("kjob found")
@@ -245,9 +242,7 @@ def get_pod_template_interactive_command() -> str:
   return pod_command
-def create_app_profile_instance(
-    args: Namespace, volume_bundles: list[str]
-) -> int:
+def create_app_profile_instance(volume_bundles: list[str]) -> int:
   """Create new AppProfile instance on cluster with default settings.
   Args:
@@ -263,7 +258,6 @@ def create_app_profile_instance(
           volume_bundles=volume_bundles,
       ),
       task="Creating AppProfile",
-      args=args,
   )
@@ -331,15 +325,12 @@ def create_job_template_instance(
   return run_kubectl_apply(
       yml_string,
       task="Creating JobTemplate",
-      args=args,
   )
-def create_pod_template_instance(args: Namespace, service_account: str) -> int:
+def create_pod_template_instance(service_account: str) -> int:
   """Create new PodTemplate instance on cluster with default settings.
-  Args:
-    args - user provided arguments
   Returns:
     exit_code > 0 if creating PodTemplate fails, 0 otherwise
   """
@@ -361,15 +352,16 @@ def create_pod_template_instance(args: Namespace, service_account: str) -> int:
           service_account=service_account,
       ),
       task="Creating PodTemplate",
-      args=args,
   )
 def prepare_kjob(args: Namespace) -> int:
   system = get_cluster_system_characteristics(args)
-  k8s_api_client = setup_k8s_env(args)
-  storages = get_auto_mount_storages(k8s_api_client)
+  storages = []
+  if not is_dry_run():
+    k8s_api_client = setup_k8s_env(args)
+    storages = get_auto_mount_storages(k8s_api_client)
   service_account = ""
   if len(storages) > 0:
@@ -378,29 +370,27 @@ def prepare_kjob(args: Namespace) -> int:
   job_err_code = create_job_template_instance(args, system, service_account)
   if job_err_code > 0:
     return job_err_code
-  pod_err_code = create_pod_template_instance(args, service_account)
+  pod_err_code = create_pod_template_instance(service_account)
   if pod_err_code > 0:
     return pod_err_code
   volume_bundles = [item.name for item in storages]
-  return create_app_profile_instance(args, volume_bundles)
+  return create_app_profile_instance(volume_bundles)
-def apply_kjob_crds(args: Namespace) -> int:
+def apply_kjob_crds() -> int:
   """Apply kjob CRDs on cluster.
   This function install kjob CRDs files from kjobctl printcrds.
   It creates all neccessary kjob CRDs.
-  Args:
-    args - user provided arguments
   Returns:
     None
   """
   command = "kubectl kjob printcrds | kubectl apply --server-side -f -"
   task = "Create kjob CRDs on cluster"
-  return_code = run_command_with_updates(command, task, args)
+  return_code = run_command_with_updates(command, task)
   if return_code != 0:
     xpk_print(f"{task} returned ERROR {return_code}")
     return return_code

xpk 0.12.0__py3-none-any.whl → 0.14.0__py3-none-any.whl

xpk 0.12.0__py3-none-any.whl → 0.14.0__py3-none-any.whl