gpu-dev 0.5.0__tar.gz → 0.5.1__tar.gz
This diff compares the contents of two publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/PKG-INFO +1 -1
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev.egg-info/PKG-INFO +1 -1
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/cli.py +5 -5
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/interactive.py +1 -1
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/reservations.py +1 -1
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/pyproject.toml +1 -1
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/eks.tf +2 -2
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/reservation_processor/index.py +3 -3
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda.tf +2 -2
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/main.tf +3 -3
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/.github/workflows/no-gitlinks.yml +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/.github/workflows/publish.yml +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/.gitignore +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/CLAUDE.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/PROGRESS.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/PR_DESCRIPTION.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/TODO.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/admin/README.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/admin/generate_stats.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/admin/requirements.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/README.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/ZERO_CONFIG_SETUP.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev.egg-info/SOURCES.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev.egg-info/dependency_links.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev.egg-info/entry_points.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev.egg-info/requires.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev.egg-info/top_level.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/__init__.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/auth.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/config.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/disks.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/name_generator.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/gpu_dev_cli/ssh_proxy.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/gpu-dev-cli/minimal-iam-policy.json +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/cli-tools/scripts/clear_stale_disk_locks.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/docs/USER_GUIDE.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/docs/devgpu-features.html +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/docs/docker-mark-blue.svg +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/docs/icons8-cursor-ai.svg +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/post.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/setup.cfg +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/.claude/skills/deploy.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/.terraform.lock.hcl +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/README.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/alb.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/availability.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/backend.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/.dockerignore +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/Dockerfile +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/backup-dotfiles +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/bash_profile +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/bashrc +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/bashrc_ext +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/build-with-efa.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/dotfiles-shutdown-handler +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/list-dotfile-versions +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/motd_script +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/nproc_wrapper +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/profile +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/restore-dotfiles +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/restore-dotfiles-version +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/setup-dotfiles-persistence +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/shell_env +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/ssh_config +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/zprofile +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/zshrc +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker/zshrc_ext +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker-build.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker-example/Dockerfile +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/docker-example/hello.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/ecr.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/efs.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/expiry.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/git-cache.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/kubernetes.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/availability_updater/index.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/availability_updater/requirements.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/migration/tag_largest_snapshots.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/reservation_expiry/index.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/reservation_expiry/requirements.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/reservation_processor/buildkit_job.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/reservation_processor/requirements.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/__init__.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/alb_utils.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/dns_utils.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/k8s_client.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/k8s_resource_tracker.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/requirements.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/snapshot_utils.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/migrations/backfill_snapshot_contents.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/migrations/backfill_snapshot_contents.py.bak +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/migrations/check_snapshots.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/migrations/migrate_disks_to_named.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/migrations/run_backfill.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/monitoring.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/outputs.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/pyproject.toml +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/queue.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/route53.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/s3-disk-contents.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/scripts/CLEANUP_GUIDE.md +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/scripts/detect_empty_volumes.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/scripts/ec2_avail_probe.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/scripts/inspect_user_data.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/ssh-proxy/Dockerfile +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/ssh-proxy/proxy.py +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/ssh-proxy/requirements.txt +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/ssh-proxy-service.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/ssh-proxy.tf +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/switch-to.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/templates/al2023-cpu-user-data.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/templates/al2023-user-data.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/templates/user-data-self-managed.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/templates/user-data.sh +0 -0
- {gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/variables.tf +0 -0
|
@@ -498,9 +498,9 @@ def main(ctx: click.Context) -> None:
|
|
|
498
498
|
"--gpu-type",
|
|
499
499
|
"-t",
|
|
500
500
|
type=click.Choice(
|
|
501
|
-
["b200", "h200", "h100", "a100", "
|
|
501
|
+
["b200", "h200", "h100", "a100", "rtxpro6000", "a10g", "t4", "l4", "t4-small", "cpu-arm", "cpu-x86"], case_sensitive=False
|
|
502
502
|
),
|
|
503
|
-
help="GPU type to reserve (b200/h200/h100/a100/
|
|
503
|
+
help="GPU type to reserve (b200/h200/h100/a100/rtxpro6000/a10g/t4/l4/t4-small/cpu-arm/cpu-x86)",
|
|
504
504
|
)
|
|
505
505
|
@click.option(
|
|
506
506
|
"--hours",
|
|
@@ -652,7 +652,7 @@ def reserve(
|
|
|
652
652
|
"t4": {"max_gpus": 4, "instance_type": "g4dn.12xlarge"},
|
|
653
653
|
"l4": {"max_gpus": 4, "instance_type": "g6.12xlarge"},
|
|
654
654
|
"a10g": {"max_gpus": 4, "instance_type": "g5.12xlarge"},
|
|
655
|
-
"
|
|
655
|
+
"rtxpro6000": {"max_gpus": 4, "instance_type": "g7e.24xlarge"},
|
|
656
656
|
"t4-small": {"max_gpus": 1, "instance_type": "g4dn.xlarge"},
|
|
657
657
|
"a100": {"max_gpus": 8, "instance_type": "p4d.24xlarge"},
|
|
658
658
|
"h100": {"max_gpus": 8, "instance_type": "p5.48xlarge"},
|
|
@@ -2398,7 +2398,7 @@ def _show_availability() -> None:
|
|
|
2398
2398
|
"a100": "Ampere (sm80)",
|
|
2399
2399
|
"a10g": "Ampere (sm80)",
|
|
2400
2400
|
"l4": "Ada Lovelace (sm89)",
|
|
2401
|
-
"
|
|
2401
|
+
"rtxpro6000": "Blackwell (sm120)",
|
|
2402
2402
|
"t4": "Turing (sm75)",
|
|
2403
2403
|
"cpu-x86": "CPU (x86_64)",
|
|
2404
2404
|
"cpu-arm": "CPU (arm64)",
|
|
@@ -2547,7 +2547,7 @@ def _show_availability_watch(interval: int) -> None:
|
|
|
2547
2547
|
"a100": "Ampere (sm80)",
|
|
2548
2548
|
"a10g": "Ampere (sm80)",
|
|
2549
2549
|
"l4": "Ada Lovelace (sm89)",
|
|
2550
|
-
"
|
|
2550
|
+
"rtxpro6000": "Blackwell (sm120)",
|
|
2551
2551
|
"t4": "Turing (sm75)",
|
|
2552
2552
|
"cpu-x86": "CPU (x86_64)",
|
|
2553
2553
|
"cpu-arm": "CPU (arm64)",
|
|
@@ -153,7 +153,7 @@ def select_gpu_count_interactive(gpu_type: str, max_gpus: int) -> Optional[int]:
|
|
|
153
153
|
# CPU instances don't have GPUs, but we still need a "count" for nodes
|
|
154
154
|
valid_counts = [0] # 0 GPUs for CPU-only instances
|
|
155
155
|
multinode_counts = [] # No multinode for CPU instances
|
|
156
|
-
elif gpu_type in ["t4", "l4", "a10g", "
|
|
156
|
+
elif gpu_type in ["t4", "l4", "a10g", "rtxpro6000"]:
|
|
157
157
|
valid_counts = [1, 2, 4]
|
|
158
158
|
# Add multinode options
|
|
159
159
|
multinode_counts = [8, 12, 16, 20, 24] # multiples of 4
|
|
@@ -535,7 +535,7 @@ class ReservationManager:
|
|
|
535
535
|
"t4": {"max_gpus": 4},
|
|
536
536
|
"l4": {"max_gpus": 4},
|
|
537
537
|
"a10g": {"max_gpus": 4},
|
|
538
|
-
"
|
|
538
|
+
"rtxpro6000": {"max_gpus": 4},
|
|
539
539
|
"t4-small": {"max_gpus": 1},
|
|
540
540
|
"g5g": {"max_gpus": 2},
|
|
541
541
|
"a100": {"max_gpus": 8},
|
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
|
4
4
|
|
|
5
5
|
[project]
|
|
6
6
|
name = "gpu-dev"
|
|
7
|
-
version = "0.5.
|
|
7
|
+
version = "0.5.1"
|
|
8
8
|
description = "CLI tool for PyTorch GPU developer server reservations"
|
|
9
9
|
authors = [{name = "PyTorch Team"}]
|
|
10
10
|
readme = "cli-tools/gpu-dev-cli/README.md"
|
|
@@ -184,8 +184,8 @@ locals {
|
|
|
184
184
|
"t4" = "t4"
|
|
185
185
|
"t4-az2" = "t4" # Both t4 and t4-az2 should be labeled as "t4" in Kubernetes
|
|
186
186
|
"l4" = "l4"
|
|
187
|
-
"a10g"
|
|
188
|
-
"
|
|
187
|
+
"a10g" = "a10g"
|
|
188
|
+
"rtxpro6000" = "rtxpro6000"
|
|
189
189
|
"h100" = "h100"
|
|
190
190
|
"h200" = "h200"
|
|
191
191
|
"b200" = "b200"
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/reservation_processor/index.py
RENAMED
|
@@ -66,7 +66,7 @@ GPU_CONFIG = {
|
|
|
66
66
|
"t4": {"instance_type": "g4dn.12xlarge", "max_gpus": 4, "cpus": 48, "memory_gb": 192, "efa_count": 0},
|
|
67
67
|
"l4": {"instance_type": "g6.12xlarge", "max_gpus": 4, "cpus": 48, "memory_gb": 192, "efa_count": 1},
|
|
68
68
|
"a10g": {"instance_type": "g5.12xlarge", "max_gpus": 4, "cpus": 48, "memory_gb": 192, "efa_count": 1},
|
|
69
|
-
"
|
|
69
|
+
"rtxpro6000": {"instance_type": "g7e.24xlarge", "max_gpus": 4, "cpus": 96, "memory_gb": 1024, "efa_count": 2},
|
|
70
70
|
"t4-small": {"instance_type": "g4dn.2xlarge", "max_gpus": 1, "cpus": 8, "memory_gb": 32, "efa_count": 0},
|
|
71
71
|
"g5g": {"instance_type": "g5g.2xlarge", "max_gpus": 2, "cpus": 8, "memory_gb": 32, "efa_count": 0},
|
|
72
72
|
"a100": {"instance_type": "p4d.24xlarge", "max_gpus": 8, "cpus": 96, "memory_gb": 1152, "efa_count": 4},
|
|
@@ -2151,7 +2151,7 @@ def validate_reservation_request(request: dict[str, Any]) -> tuple[bool, str]:
|
|
|
2151
2151
|
gpu_type = request.get("gpu_type", "")
|
|
2152
2152
|
|
|
2153
2153
|
# Validate GPU type
|
|
2154
|
-
valid_gpu_types = ["t4", "l4", "a10g", "
|
|
2154
|
+
valid_gpu_types = ["t4", "l4", "a10g", "rtxpro6000", "t4-small", "a100",
|
|
2155
2155
|
"h100", "h200", "b200", "cpu-arm", "cpu-x86"]
|
|
2156
2156
|
if gpu_type not in valid_gpu_types:
|
|
2157
2157
|
error_msg = f"Invalid GPU type: {gpu_type}. Must be one of: {', '.join(valid_gpu_types)}"
|
|
@@ -2382,7 +2382,7 @@ def update_gpu_availability_table(
|
|
|
2382
2382
|
"t4": {"gpus_per_instance": 4},
|
|
2383
2383
|
"l4": {"gpus_per_instance": 4},
|
|
2384
2384
|
"a10g": {"gpus_per_instance": 4},
|
|
2385
|
-
"
|
|
2385
|
+
"rtxpro6000": {"gpus_per_instance": 4},
|
|
2386
2386
|
"a100": {"gpus_per_instance": 8},
|
|
2387
2387
|
"h100": {"gpus_per_instance": 8},
|
|
2388
2388
|
"h200": {"gpus_per_instance": 8},
|
|
@@ -180,8 +180,8 @@ resource "aws_lambda_function" "reservation_processor" {
|
|
|
180
180
|
HOSTED_ZONE_ID = local.effective_domain_name != "" ? local.hosted_zone_id : ""
|
|
181
181
|
SSH_DOMAIN_MAPPINGS_TABLE = local.effective_domain_name != "" ? aws_dynamodb_table.ssh_domain_mappings.name : ""
|
|
182
182
|
SSL_CERTIFICATE_ARN = local.effective_domain_name != "" ? aws_acm_certificate.wildcard[0].arn : ""
|
|
183
|
-
LAMBDA_VERSION = "0.5.
|
|
184
|
-
MIN_CLI_VERSION = "0.5.
|
|
183
|
+
LAMBDA_VERSION = "0.5.1"
|
|
184
|
+
MIN_CLI_VERSION = "0.5.1"
|
|
185
185
|
DISK_CONTENTS_BUCKET = aws_s3_bucket.disk_contents.bucket
|
|
186
186
|
OPERATIONS_TABLE = aws_dynamodb_table.operations.name
|
|
187
187
|
}, local.alb_env_vars)
|
|
@@ -207,7 +207,7 @@ locals {
|
|
|
207
207
|
architecture = "x86_64"
|
|
208
208
|
efa_network_cards = 1
|
|
209
209
|
}
|
|
210
|
-
"
|
|
210
|
+
"rtxpro6000" = {
|
|
211
211
|
instance_type = "g7e.24xlarge"
|
|
212
212
|
instance_types = null
|
|
213
213
|
instance_count = 2
|
|
@@ -302,8 +302,8 @@ locals {
|
|
|
302
302
|
a100 = "primary"
|
|
303
303
|
t4 = "primary"
|
|
304
304
|
l4 = "secondary"
|
|
305
|
-
a10g
|
|
306
|
-
|
|
305
|
+
a10g = "secondary"
|
|
306
|
+
rtxpro6000 = "secondary"
|
|
307
307
|
"cpu-arm" = "primary"
|
|
308
308
|
"cpu-x86" = "primary"
|
|
309
309
|
}
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/availability_updater/index.py
RENAMED
|
File without changes
|
|
File without changes
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/migration/tag_largest_snapshots.py
RENAMED
|
File without changes
|
|
File without changes
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/reservation_expiry/requirements.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/lambda/shared/k8s_resource_tracker.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/migrations/backfill_snapshot_contents.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/migrations/migrate_disks_to_named.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{gpu_dev-0.5.0 → gpu_dev-0.5.1}/terraform-gpu-devservers/templates/user-data-self-managed.sh
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|