xpk 1.1.1__tar.gz → 1.1.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (258)
  1. {xpk-1.1.1/src/xpk.egg-info → xpk-1.1.2}/PKG-INFO +1 -1
  2. {xpk-1.1.1 → xpk-1.1.2}/recipes/Workload_create_super-slicing.md +3 -3
  3. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/docker_container.py +3 -1
  4. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/docker_resources.py +5 -5
  5. {xpk-1.1.1 → xpk-1.1.2/src/xpk.egg-info}/PKG-INFO +1 -1
  6. {xpk-1.1.1 → xpk-1.1.2}/.dockerignore +0 -0
  7. {xpk-1.1.1 → xpk-1.1.2}/.github/CODEOWNERS +0 -0
  8. {xpk-1.1.1 → xpk-1.1.2}/.github/PULL_REQUEST_TEMPLATE.md +0 -0
  9. {xpk-1.1.1 → xpk-1.1.2}/.github/actions/install-kueue/action.yml +0 -0
  10. {xpk-1.1.1 → xpk-1.1.2}/.github/actions/setup-test-env/action.yml +0 -0
  11. {xpk-1.1.1 → xpk-1.1.2}/.github/release.yaml +0 -0
  12. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/README.md +0 -0
  13. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/build_tests.yaml +0 -0
  14. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/build_wheels.yaml +0 -0
  15. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/cleanup.yaml +0 -0
  16. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/gemini-dispatch.yml +0 -0
  17. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/gemini-invoke.yml +0 -0
  18. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/gemini-review.yml +0 -0
  19. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/gemini-scheduled-triage.yml +0 -0
  20. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/gemini-triage.yml +0 -0
  21. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/integration_basic_cluster_create.yaml +0 -0
  22. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/integration_gpu_cluster_create.yaml +0 -0
  23. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/integration_pathways_cluster_create.yaml +0 -0
  24. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/integration_ray_cluster_create.yaml +0 -0
  25. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/integration_storage_tests.yaml +0 -0
  26. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/label-validation.yaml +0 -0
  27. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/nightly_tests.yaml +0 -0
  28. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/periodic_release.yaml +0 -0
  29. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/release_branch_versioning.yaml +0 -0
  30. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/reusable_build_scripts.yaml +0 -0
  31. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/reusable_build_wheel.yaml +0 -0
  32. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/reusable_goldens.yaml +0 -0
  33. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/reusable_lint_and_format.yml +0 -0
  34. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/reusable_storage_create.yaml +0 -0
  35. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/reusable_storage_delete.yaml +0 -0
  36. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/reusable_unit_tests.yaml +0 -0
  37. {xpk-1.1.1 → xpk-1.1.2}/.github/workflows/stale.yaml +0 -0
  38. {xpk-1.1.1 → xpk-1.1.2}/.gitignore +0 -0
  39. {xpk-1.1.1 → xpk-1.1.2}/.pre-commit-config.yaml +0 -0
  40. {xpk-1.1.1 → xpk-1.1.2}/LICENSE +0 -0
  41. {xpk-1.1.1 → xpk-1.1.2}/Makefile +0 -0
  42. {xpk-1.1.1 → xpk-1.1.2}/README.md +0 -0
  43. {xpk-1.1.1 → xpk-1.1.2}/backoff_retry.sh +0 -0
  44. {xpk-1.1.1 → xpk-1.1.2}/data/Dockerfile +0 -0
  45. {xpk-1.1.1 → xpk-1.1.2}/docs/code-of-conduct.md +0 -0
  46. {xpk-1.1.1 → xpk-1.1.2}/docs/contributing.md +0 -0
  47. {xpk-1.1.1 → xpk-1.1.2}/docs/installation.md +0 -0
  48. {xpk-1.1.1 → xpk-1.1.2}/docs/permissions.md +0 -0
  49. {xpk-1.1.1 → xpk-1.1.2}/docs/testing.md +0 -0
  50. {xpk-1.1.1 → xpk-1.1.2}/docs/troubleshooting.md +0 -0
  51. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/advanced.md +0 -0
  52. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/autoprovisioning.md +0 -0
  53. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/clusters.md +0 -0
  54. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/cpu.md +0 -0
  55. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/docker.md +0 -0
  56. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/gpu.md +0 -0
  57. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/inspector.md +0 -0
  58. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/storage.md +0 -0
  59. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/tpu7x/recipes/flex_filestore_recipe.md +0 -0
  60. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/tpu7x/recipes/flex_lustre_recipe.md +0 -0
  61. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/tpu7x/recipes/reservation_gcs_bucket_recipe.md +0 -0
  62. {xpk-1.1.1 → xpk-1.1.2}/docs/usage/workloads.md +0 -0
  63. {xpk-1.1.1 → xpk-1.1.2}/examples/fake_training.py +0 -0
  64. {xpk-1.1.1 → xpk-1.1.2}/examples/llama-3.1-finetuning/check_cuda.sh +0 -0
  65. {xpk-1.1.1 → xpk-1.1.2}/examples/llama-3.1-finetuning/requirements.txt +0 -0
  66. {xpk-1.1.1 → xpk-1.1.2}/examples/llama-3.1-finetuning/train.py +0 -0
  67. {xpk-1.1.1 → xpk-1.1.2}/examples/llama-3.1-finetuning/train.slurm +0 -0
  68. {xpk-1.1.1 → xpk-1.1.2}/examples/llama-3.1-finetuning/training_data.jsonl +0 -0
  69. {xpk-1.1.1 → xpk-1.1.2}/examples/nccl/nccl-a3mega.sh +0 -0
  70. {xpk-1.1.1 → xpk-1.1.2}/examples/nccl/nccl-a3ultra.sh +0 -0
  71. {xpk-1.1.1 → xpk-1.1.2}/examples/nccl/nccl.md +0 -0
  72. {xpk-1.1.1 → xpk-1.1.2}/examples/storage/filestore-manifest-attach.yaml +0 -0
  73. {xpk-1.1.1 → xpk-1.1.2}/examples/storage/gcsfuse-manifest.yaml +0 -0
  74. {xpk-1.1.1 → xpk-1.1.2}/examples/storage/lustre-manifest-attach.yaml +0 -0
  75. {xpk-1.1.1 → xpk-1.1.2}/examples/storage/parallelstore-manifest-attach.yaml +0 -0
  76. {xpk-1.1.1 → xpk-1.1.2}/examples/storage/pd-manifest-attach.yaml +0 -0
  77. {xpk-1.1.1 → xpk-1.1.2}/pylintrc +0 -0
  78. {xpk-1.1.1 → xpk-1.1.2}/pyproject.toml +0 -0
  79. {xpk-1.1.1 → xpk-1.1.2}/recipes/Basic_cluster_adapt.md +0 -0
  80. {xpk-1.1.1 → xpk-1.1.2}/recipes/Basic_cluster_create.md +0 -0
  81. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_RayCluster.md +0 -0
  82. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_for_multi-host_nodepool.md +0 -0
  83. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_for_single-host_nodepool.md +0 -0
  84. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_private.md +0 -0
  85. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_sub-slicing.md +0 -0
  86. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_super-slicing.md +0 -0
  87. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_with_CPU_and_memory_limits_above_capacity.md +0 -0
  88. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_with_CPU_and_memory_limits_below_capacity.md +0 -0
  89. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_with_Managed_Lustre_driver.md +0 -0
  90. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_with_Managed_Lustre_driver_and_legacy_port.md +0 -0
  91. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_with_gb200-4.md +0 -0
  92. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_create_with_shared_reservation.md +0 -0
  93. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_delete.md +0 -0
  94. {xpk-1.1.1 → xpk-1.1.2}/recipes/Cluster_delete_force.md +0 -0
  95. {xpk-1.1.1 → xpk-1.1.2}/recipes/NAP_cluster-create.md +0 -0
  96. {xpk-1.1.1 → xpk-1.1.2}/recipes/NAP_cluster-create_with_pathways.md +0 -0
  97. {xpk-1.1.1 → xpk-1.1.2}/recipes/Storage_list.md +0 -0
  98. {xpk-1.1.1 → xpk-1.1.2}/recipes/Workload_create.md +0 -0
  99. {xpk-1.1.1 → xpk-1.1.2}/recipes/Workload_create_pathways.md +0 -0
  100. {xpk-1.1.1 → xpk-1.1.2}/recipes/Workload_create_sub-slicing.md +0 -0
  101. {xpk-1.1.1 → xpk-1.1.2}/recipes/Workload_create_with_output-manifest-file.md +0 -0
  102. {xpk-1.1.1 → xpk-1.1.2}/recipes/Workload_delete.md +0 -0
  103. {xpk-1.1.1 → xpk-1.1.2}/recipes/Workload_list.md +0 -0
  104. {xpk-1.1.1 → xpk-1.1.2}/recipes/comprehensive-demo.md +0 -0
  105. {xpk-1.1.1 → xpk-1.1.2}/setup.cfg +0 -0
  106. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/__init__.py +0 -0
  107. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/api/__init__.py +0 -0
  108. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/api/storage_crd.yaml +0 -0
  109. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a3mega/config-map.yaml.tftpl +0 -0
  110. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a3mega/storage_crd.yaml +0 -0
  111. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a3ultra/config-map.yaml.tftpl +0 -0
  112. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a3ultra/mlgru-disable.yaml +0 -0
  113. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a3ultra/nccl-installer.yaml +0 -0
  114. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a3ultra/storage_crd.yaml +0 -0
  115. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a4/config-map.yaml.tftpl +0 -0
  116. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a4/nccl-rdma-installer-a4.yaml +0 -0
  117. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/blueprints/a4/storage_crd.yaml +0 -0
  118. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/__init__.py +0 -0
  119. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/cluster.py +0 -0
  120. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/cluster_gcluster.py +0 -0
  121. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/cluster_gcluster_test.py +0 -0
  122. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/cluster_test.py +0 -0
  123. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/common.py +0 -0
  124. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/common_test.py +0 -0
  125. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/config.py +0 -0
  126. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/info.py +0 -0
  127. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/inspector.py +0 -0
  128. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/inspector_test.py +0 -0
  129. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/managed_ml_diagnostics.py +0 -0
  130. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/managed_ml_diagnostics_test.py +0 -0
  131. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/storage.py +0 -0
  132. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/version.py +0 -0
  133. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/workload.py +0 -0
  134. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/commands/workload_test.py +0 -0
  135. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/__init__.py +0 -0
  136. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/__init__.py +0 -0
  137. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/blueprint_definitions.py +0 -0
  138. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/blueprint_generator.py +0 -0
  139. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/blueprint_test.py +0 -0
  140. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/testing/__init__.py +0 -0
  141. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/testing/data/a3_mega.yaml +0 -0
  142. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/testing/data/a3_mega_spot.yaml +0 -0
  143. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/testing/data/a3_ultra.yaml +0 -0
  144. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/blueprint/testing/data/a4.yaml +0 -0
  145. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/capacity.py +0 -0
  146. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/capacity_test.py +0 -0
  147. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/cluster.py +0 -0
  148. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/cluster_private.py +0 -0
  149. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/cluster_test.py +0 -0
  150. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/commands.py +0 -0
  151. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/config.py +0 -0
  152. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/config_test.py +0 -0
  153. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/docker_image.py +0 -0
  154. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/docker_manager.py +0 -0
  155. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/filestore.py +0 -0
  156. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/gcloud_context.py +0 -0
  157. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/gcloud_context_test.py +0 -0
  158. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/gcluster_manager.py +0 -0
  159. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/gcsfuse.py +0 -0
  160. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/jobset.py +0 -0
  161. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/kueue_manager.py +0 -0
  162. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/kueue_manager_test.py +0 -0
  163. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/monitoring.py +0 -0
  164. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/mtc.py +0 -0
  165. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/nap.py +0 -0
  166. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/network.py +0 -0
  167. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/nodepool.py +0 -0
  168. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/nodepool_test.py +0 -0
  169. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/pathways.py +0 -0
  170. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/pathways_test.py +0 -0
  171. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/ray.py +0 -0
  172. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/remote_state/__init__.py +0 -0
  173. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/remote_state/fuse_remote_state.py +0 -0
  174. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/remote_state/remote_state_client.py +0 -0
  175. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/resources.py +0 -0
  176. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/scheduling.py +0 -0
  177. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/scheduling_test.py +0 -0
  178. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/storage.py +0 -0
  179. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/system_characteristics.py +0 -0
  180. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/system_characteristics_test.py +0 -0
  181. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/telemetry.py +0 -0
  182. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/telemetry_test.py +0 -0
  183. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/testing/__init__.py +0 -0
  184. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/testing/commands_tester.py +0 -0
  185. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/testing/commands_tester_test.py +0 -0
  186. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/updates.py +0 -0
  187. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/updates_test.py +0 -0
  188. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/vertex.py +0 -0
  189. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload.py +0 -0
  190. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload_decorators/__init__.py +0 -0
  191. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload_decorators/rdma_decorator.py +0 -0
  192. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload_decorators/storage_decorator.py +0 -0
  193. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload_decorators/tcpx_decorator.py +0 -0
  194. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload_decorators/tcpx_decorator_test.py +0 -0
  195. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload_decorators/tcpxo_decorator.py +0 -0
  196. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/core/workload_test.py +0 -0
  197. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/main.py +0 -0
  198. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/__init__.py +0 -0
  199. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/cluster.py +0 -0
  200. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/cluster_test.py +0 -0
  201. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/common.py +0 -0
  202. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/common_test.py +0 -0
  203. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/config.py +0 -0
  204. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/core.py +0 -0
  205. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/info.py +0 -0
  206. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/inspector.py +0 -0
  207. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/storage.py +0 -0
  208. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/storage_test.py +0 -0
  209. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/validators.py +0 -0
  210. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/version.py +0 -0
  211. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/workload.py +0 -0
  212. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/parser/workload_test.py +0 -0
  213. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/telemetry_uploader.py +0 -0
  214. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/__init__.py +0 -0
  215. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/arm_gpu_workload_crate.yaml.j2 +0 -0
  216. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/cluster_preheat.yaml.j2 +0 -0
  217. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/filestore-pv.yaml +0 -0
  218. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/filestore-pvc.yaml +0 -0
  219. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/filestore-sc.yaml +0 -0
  220. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/fuse-pv.yaml +0 -0
  221. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/fuse-pvc.yaml +0 -0
  222. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/kueue_config.yaml.j2 +0 -0
  223. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/kueue_gke_default_topology.yaml.j2 +0 -0
  224. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/kueue_sub_slicing_topology.yaml.j2 +0 -0
  225. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/kueue_super_slicing_topology.yaml.j2 +0 -0
  226. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/mtc-cpc.yaml +0 -0
  227. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/templates/storage.yaml +0 -0
  228. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/__init__.py +0 -0
  229. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/console.py +0 -0
  230. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/console_test.py +0 -0
  231. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/execution_context.py +0 -0
  232. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/feature_flags.py +0 -0
  233. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/file.py +0 -0
  234. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/gcs_utils.py +0 -0
  235. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/kubectl.py +0 -0
  236. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/kueue.py +0 -0
  237. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/network.py +0 -0
  238. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/objects.py +0 -0
  239. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/templates.py +0 -0
  240. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/topology.py +0 -0
  241. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/topology_test.py +0 -0
  242. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/user_agent.py +0 -0
  243. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/user_agent_test.py +0 -0
  244. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/validation.py +0 -0
  245. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/validation_test.py +0 -0
  246. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/versions.py +0 -0
  247. {xpk-1.1.1 → xpk-1.1.2}/src/xpk/utils/yaml.py +0 -0
  248. {xpk-1.1.1 → xpk-1.1.2}/src/xpk.egg-info/SOURCES.txt +0 -0
  249. {xpk-1.1.1 → xpk-1.1.2}/src/xpk.egg-info/dependency_links.txt +0 -0
  250. {xpk-1.1.1 → xpk-1.1.2}/src/xpk.egg-info/entry_points.txt +0 -0
  251. {xpk-1.1.1 → xpk-1.1.2}/src/xpk.egg-info/requires.txt +0 -0
  252. {xpk-1.1.1 → xpk-1.1.2}/src/xpk.egg-info/top_level.txt +0 -0
  253. {xpk-1.1.1 → xpk-1.1.2}/tools/install-gke-auth-plugin.sh +0 -0
  254. {xpk-1.1.1 → xpk-1.1.2}/tools/install-xpk.sh +0 -0
  255. {xpk-1.1.1 → xpk-1.1.2}/tools/recipes.py +0 -0
  256. {xpk-1.1.1 → xpk-1.1.2}/xpk-large-scale-guide.sh +0 -0
  257. {xpk-1.1.1 → xpk-1.1.2}/xpk-notebooks.md +0 -0
  258. {xpk-1.1.1 → xpk-1.1.2}/xpk.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: xpk
3
- Version: 1.1.1
3
+ Version: 1.1.2
4
4
  Summary: xpk helps Cloud developers to orchestrate training jobs on accelerators on GKE.
5
5
  Author-email: XPK team <xpk-code-reviewers@google.com>
6
6
  License: Apache-2.0
@@ -47,7 +47,7 @@ docker buildx build --platform=linux/amd64 -f 4b6736a12db8ea0f78ce793fd0d4ee0c94
47
47
  docker tag dry-run-runner gcr.io/golden-project/dry-run-runner:prefix-current
48
48
  [XPK] Task: `Upload Docker Image` is implemented by the following command not running since it is a dry run.
49
49
  docker push gcr.io/golden-project/dry-run-runner:prefix-current
50
- [XPK] Temp file (2eed164577b237a7b764f6adf46b9c249551c2200e440ef0f696c53dfb2d1cb5) content:
50
+ [XPK] Temp file (2c5ab381c0d643f8512a07d296d411413080ec652c15e8c676fd58435de5a327) content:
51
51
  apiVersion: jobset.x-k8s.io/v1alpha2
52
52
  kind: JobSet
53
53
  metadata:
@@ -136,7 +136,7 @@ spec:
136
136
  exit $EXIT_CODE
137
137
  resources:
138
138
  limits:
139
- google.com/tpu: 2
139
+ google.com/tpu: 4
140
140
 
141
141
  volumeMounts:
142
142
  - mountPath: /dev/shm
@@ -156,7 +156,7 @@ spec:
156
156
 
157
157
 
158
158
  [XPK] Task: `Creating Workload` is implemented by the following command not running since it is a dry run.
159
- kubectl apply -f 2eed164577b237a7b764f6adf46b9c249551c2200e440ef0f696c53dfb2d1cb5
159
+ kubectl apply -f 2c5ab381c0d643f8512a07d296d411413080ec652c15e8c676fd58435de5a327
160
160
  [XPK] Task: `GKE Dashboard List` is implemented by the following command not running since it is a dry run.
161
161
  gcloud monitoring dashboards list --project=golden-project --filter="displayName:'GKE - TPU Monitoring Dashboard'" --format="value(name)" --verbosity=error
162
162
  [XPK] Check statistics and outlier mode of GKE metrics here: https://console.cloud.google.com/monitoring/dashboards/builder/0?project=golden-project&f.rlabel.cluster_name.ClusterName=golden-cluster. To view the metric data for your workload, select golden-workload from the JobName filter on the dashboard.
@@ -181,7 +181,9 @@ def get_main_container(
181
181
  tpu_stacktrace_terminate_command=tpu_stacktrace_terminate_command,
182
182
  gpu_workload_terminate_command=gpu_workload_terminate_command,
183
183
  xpk_internal_commands=xpk_internal_commands,
184
- resources=get_main_container_resources(args, system, resource_type),
184
+ resources=get_main_container_resources(
185
+ args, system, resource_type, parallel_containers
186
+ ),
185
187
  volume_mounts=volume_mounts,
186
188
  )
187
189
  )
@@ -23,7 +23,10 @@ from ..utils.execution_context import is_dry_run
23
23
 
24
24
 
25
25
  def get_main_container_resources(
26
- args, system: SystemCharacteristics, resource_type
26
+ args,
27
+ system: SystemCharacteristics,
28
+ resource_type: str,
29
+ parallel_containers: int,
27
30
  ) -> str:
28
31
  """Resources for the main container.
29
32
  Args:
@@ -53,10 +56,7 @@ def get_main_container_resources(
53
56
  offset_vCPUs = int(system.chips_per_vm) * 0.95
54
57
  return f'{resource_type}: {offset_vCPUs}'
55
58
 
56
- return (
57
- f'{resource_type}:'
58
- f' {int(system.chips_per_vm / system.parallel_containers)}'
59
- )
59
+ return f'{resource_type}: {int(system.chips_per_vm / parallel_containers)}'
60
60
 
61
61
 
62
62
  def get_env_container(args, system: SystemCharacteristics) -> str:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: xpk
3
- Version: 1.1.1
3
+ Version: 1.1.2
4
4
  Summary: xpk helps Cloud developers to orchestrate training jobs on accelerators on GKE.
5
5
  Author-email: XPK team <xpk-code-reviewers@google.com>
6
6
  License: Apache-2.0
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes