@aws/ml-container-creator 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (143)
  1. package/LICENSE +202 -0
  2. package/LICENSE-THIRD-PARTY +68620 -0
  3. package/NOTICE +2 -0
  4. package/README.md +106 -0
  5. package/bin/cli.js +365 -0
  6. package/config/defaults.json +32 -0
  7. package/config/presets/transformers-djl.json +26 -0
  8. package/config/presets/transformers-gpu.json +24 -0
  9. package/config/presets/transformers-lmi.json +27 -0
  10. package/package.json +129 -0
  11. package/servers/README.md +419 -0
  12. package/servers/base-image-picker/catalogs/model-servers.json +1191 -0
  13. package/servers/base-image-picker/catalogs/python-slim.json +38 -0
  14. package/servers/base-image-picker/catalogs/triton-backends.json +51 -0
  15. package/servers/base-image-picker/catalogs/triton.json +38 -0
  16. package/servers/base-image-picker/index.js +495 -0
  17. package/servers/base-image-picker/manifest.json +17 -0
  18. package/servers/base-image-picker/package.json +15 -0
  19. package/servers/hyperpod-cluster-picker/LICENSE +202 -0
  20. package/servers/hyperpod-cluster-picker/index.js +424 -0
  21. package/servers/hyperpod-cluster-picker/manifest.json +14 -0
  22. package/servers/hyperpod-cluster-picker/package.json +17 -0
  23. package/servers/instance-recommender/LICENSE +202 -0
  24. package/servers/instance-recommender/catalogs/instances.json +852 -0
  25. package/servers/instance-recommender/index.js +284 -0
  26. package/servers/instance-recommender/manifest.json +16 -0
  27. package/servers/instance-recommender/package.json +15 -0
  28. package/servers/lib/LICENSE +202 -0
  29. package/servers/lib/bedrock-client.js +160 -0
  30. package/servers/lib/custom-validators.js +46 -0
  31. package/servers/lib/dynamic-resolver.js +36 -0
  32. package/servers/lib/package.json +11 -0
  33. package/servers/lib/schemas/image-catalog.schema.json +185 -0
  34. package/servers/lib/schemas/instances.schema.json +124 -0
  35. package/servers/lib/schemas/manifest.schema.json +64 -0
  36. package/servers/lib/schemas/model-catalog.schema.json +91 -0
  37. package/servers/lib/schemas/regions.schema.json +26 -0
  38. package/servers/lib/schemas/triton-backends.schema.json +51 -0
  39. package/servers/model-picker/catalogs/jumpstart-public.json +66 -0
  40. package/servers/model-picker/catalogs/popular-diffusors.json +88 -0
  41. package/servers/model-picker/catalogs/popular-transformers.json +226 -0
  42. package/servers/model-picker/index.js +1693 -0
  43. package/servers/model-picker/manifest.json +18 -0
  44. package/servers/model-picker/package.json +20 -0
  45. package/servers/region-picker/LICENSE +202 -0
  46. package/servers/region-picker/catalogs/regions.json +263 -0
  47. package/servers/region-picker/index.js +230 -0
  48. package/servers/region-picker/manifest.json +16 -0
  49. package/servers/region-picker/package.json +15 -0
  50. package/src/app.js +1007 -0
  51. package/src/copy-tpl.js +77 -0
  52. package/src/lib/accelerator-validator.js +39 -0
  53. package/src/lib/asset-manager.js +385 -0
  54. package/src/lib/aws-profile-parser.js +181 -0
  55. package/src/lib/bootstrap-command-handler.js +1647 -0
  56. package/src/lib/bootstrap-config.js +238 -0
  57. package/src/lib/ci-register-helpers.js +124 -0
  58. package/src/lib/ci-report-helpers.js +158 -0
  59. package/src/lib/ci-stage-helpers.js +268 -0
  60. package/src/lib/cli-handler.js +529 -0
  61. package/src/lib/comment-generator.js +544 -0
  62. package/src/lib/community-reports-validator.js +91 -0
  63. package/src/lib/config-manager.js +2106 -0
  64. package/src/lib/configuration-exporter.js +204 -0
  65. package/src/lib/configuration-manager.js +695 -0
  66. package/src/lib/configuration-matcher.js +221 -0
  67. package/src/lib/cpu-validator.js +36 -0
  68. package/src/lib/cuda-validator.js +57 -0
  69. package/src/lib/deployment-config-resolver.js +103 -0
  70. package/src/lib/deployment-entry-schema.js +125 -0
  71. package/src/lib/deployment-registry.js +598 -0
  72. package/src/lib/docker-introspection-validator.js +51 -0
  73. package/src/lib/engine-prefix-resolver.js +60 -0
  74. package/src/lib/huggingface-client.js +172 -0
  75. package/src/lib/key-value-parser.js +37 -0
  76. package/src/lib/known-flags-validator.js +200 -0
  77. package/src/lib/manifest-cli.js +280 -0
  78. package/src/lib/mcp-client.js +303 -0
  79. package/src/lib/mcp-command-handler.js +532 -0
  80. package/src/lib/neuron-validator.js +80 -0
  81. package/src/lib/parameter-schema-validator.js +284 -0
  82. package/src/lib/prompt-runner.js +1349 -0
  83. package/src/lib/prompts.js +1138 -0
  84. package/src/lib/registry-command-handler.js +519 -0
  85. package/src/lib/registry-loader.js +198 -0
  86. package/src/lib/rocm-validator.js +80 -0
  87. package/src/lib/schema-validator.js +157 -0
  88. package/src/lib/sensitive-redactor.js +59 -0
  89. package/src/lib/template-engine.js +156 -0
  90. package/src/lib/template-manager.js +341 -0
  91. package/src/lib/validation-engine.js +314 -0
  92. package/src/prompt-adapter.js +63 -0
  93. package/templates/Dockerfile +300 -0
  94. package/templates/IAM_PERMISSIONS.md +84 -0
  95. package/templates/MIGRATION.md +488 -0
  96. package/templates/PROJECT_README.md +439 -0
  97. package/templates/TEMPLATE_SYSTEM.md +243 -0
  98. package/templates/buildspec.yml +64 -0
  99. package/templates/code/chat_template.jinja +1 -0
  100. package/templates/code/flask/gunicorn_config.py +35 -0
  101. package/templates/code/flask/wsgi.py +10 -0
  102. package/templates/code/model_handler.py +387 -0
  103. package/templates/code/serve +300 -0
  104. package/templates/code/serve.py +175 -0
  105. package/templates/code/serving.properties +105 -0
  106. package/templates/code/start_server.py +39 -0
  107. package/templates/code/start_server.sh +39 -0
  108. package/templates/diffusors/Dockerfile +72 -0
  109. package/templates/diffusors/patch_image_api.py +35 -0
  110. package/templates/diffusors/serve +115 -0
  111. package/templates/diffusors/start_server.sh +114 -0
  112. package/templates/do/.gitkeep +1 -0
  113. package/templates/do/README.md +541 -0
  114. package/templates/do/build +83 -0
  115. package/templates/do/ci +681 -0
  116. package/templates/do/clean +811 -0
  117. package/templates/do/config +260 -0
  118. package/templates/do/deploy +1560 -0
  119. package/templates/do/export +306 -0
  120. package/templates/do/logs +319 -0
  121. package/templates/do/manifest +12 -0
  122. package/templates/do/push +119 -0
  123. package/templates/do/register +580 -0
  124. package/templates/do/run +113 -0
  125. package/templates/do/submit +417 -0
  126. package/templates/do/test +1147 -0
  127. package/templates/hyperpod/configmap.yaml +24 -0
  128. package/templates/hyperpod/deployment.yaml +71 -0
  129. package/templates/hyperpod/pvc.yaml +42 -0
  130. package/templates/hyperpod/service.yaml +17 -0
  131. package/templates/nginx-diffusors.conf +74 -0
  132. package/templates/nginx-predictors.conf +47 -0
  133. package/templates/nginx-tensorrt.conf +74 -0
  134. package/templates/requirements.txt +61 -0
  135. package/templates/sample_model/test_inference.py +123 -0
  136. package/templates/sample_model/train_abalone.py +252 -0
  137. package/templates/test/test_endpoint.sh +79 -0
  138. package/templates/test/test_local_image.sh +80 -0
  139. package/templates/test/test_model_handler.py +180 -0
  140. package/templates/triton/Dockerfile +128 -0
  141. package/templates/triton/config.pbtxt +163 -0
  142. package/templates/triton/model.py +130 -0
  143. package/templates/triton/requirements.txt +11 -0
@@ -0,0 +1,852 @@
1
+ {
2
+ "catalog": {
3
+ "ml.c5.2xlarge": {
4
+ "category": "cpu",
5
+ "gpus": 0,
6
+ "vcpus": 8,
7
+ "memGb": 16,
8
+ "accelerator": "",
9
+ "cudaVersions": null,
10
+ "tags": [
11
+ "compute",
12
+ "cpu",
13
+ "high-cpu"
14
+ ],
15
+ "family": "c5",
16
+ "acceleratorType": "cpu",
17
+ "hardware": "None",
18
+ "gpuArchitecture": "None",
19
+ "defaultCudaVersion": null,
20
+ "notes": ""
21
+ },
22
+ "ml.c5.xlarge": {
23
+ "category": "cpu",
24
+ "gpus": 0,
25
+ "vcpus": 4,
26
+ "memGb": 8,
27
+ "accelerator": "",
28
+ "cudaVersions": null,
29
+ "tags": [
30
+ "compute",
31
+ "cpu",
32
+ "cost-effective"
33
+ ],
34
+ "family": "c5",
35
+ "acceleratorType": "cpu",
36
+ "hardware": "None",
37
+ "gpuArchitecture": "None",
38
+ "defaultCudaVersion": null,
39
+ "notes": ""
40
+ },
41
+ "ml.g4dn.12xlarge": {
42
+ "category": "gpu",
43
+ "gpus": 4,
44
+ "vcpus": 48,
45
+ "memGb": 192,
46
+ "accelerator": "4x T4 64GB",
47
+ "cudaVersions": [
48
+ "11.4",
49
+ "11.8"
50
+ ],
51
+ "tags": [
52
+ "gpu",
53
+ "multi-gpu",
54
+ "t4",
55
+ "cuda-11"
56
+ ],
57
+ "family": "g4dn",
58
+ "acceleratorType": "cuda",
59
+ "hardware": "NVIDIA T4",
60
+ "gpuArchitecture": "Turing",
61
+ "defaultCudaVersion": "11.8",
62
+ "notes": "4x NVIDIA T4 GPUs (64GB total). Multi-GPU for tensor parallelism"
63
+ },
64
+ "ml.g4dn.16xlarge": {
65
+ "category": "gpu",
66
+ "gpus": 1,
67
+ "vcpus": 64,
68
+ "memGb": 256,
69
+ "accelerator": "T4 16GB",
70
+ "cudaVersions": [
71
+ "11.4",
72
+ "11.8"
73
+ ],
74
+ "tags": [
75
+ "gpu",
76
+ "single-gpu",
77
+ "t4",
78
+ "cuda-11"
79
+ ],
80
+ "family": "g4dn",
81
+ "acceleratorType": "cuda",
82
+ "hardware": "NVIDIA T4",
83
+ "gpuArchitecture": "Turing",
84
+ "defaultCudaVersion": "11.8",
85
+ "notes": "1x NVIDIA T4 GPU (16GB). Very high CPU/memory ratio"
86
+ },
87
+ "ml.g4dn.2xlarge": {
88
+ "category": "gpu",
89
+ "gpus": 1,
90
+ "vcpus": 8,
91
+ "memGb": 32,
92
+ "accelerator": "T4 16GB",
93
+ "cudaVersions": [
94
+ "11.4",
95
+ "11.8"
96
+ ],
97
+ "tags": [
98
+ "gpu",
99
+ "single-gpu",
100
+ "budget",
101
+ "cost-effective",
102
+ "inference",
103
+ "t4",
104
+ "cuda-11"
105
+ ],
106
+ "family": "g4dn",
107
+ "acceleratorType": "cuda",
108
+ "hardware": "NVIDIA T4",
109
+ "gpuArchitecture": "Turing",
110
+ "defaultCudaVersion": "11.8",
111
+ "notes": "1x NVIDIA T4 GPU (16GB). Better CPU/memory for preprocessing"
112
+ },
113
+ "ml.g4dn.4xlarge": {
114
+ "category": "gpu",
115
+ "gpus": 1,
116
+ "vcpus": 16,
117
+ "memGb": 64,
118
+ "accelerator": "T4 16GB",
119
+ "cudaVersions": [
120
+ "11.4",
121
+ "11.8"
122
+ ],
123
+ "tags": [
124
+ "gpu",
125
+ "single-gpu",
126
+ "t4",
127
+ "cuda-11"
128
+ ],
129
+ "family": "g4dn",
130
+ "acceleratorType": "cuda",
131
+ "hardware": "NVIDIA T4",
132
+ "gpuArchitecture": "Turing",
133
+ "defaultCudaVersion": "11.8",
134
+ "notes": "1x NVIDIA T4 GPU (16GB). High CPU/memory ratio"
135
+ },
136
+ "ml.g4dn.8xlarge": {
137
+ "category": "gpu",
138
+ "gpus": 1,
139
+ "vcpus": 32,
140
+ "memGb": 128,
141
+ "accelerator": "T4 16GB",
142
+ "cudaVersions": [
143
+ "11.4",
144
+ "11.8"
145
+ ],
146
+ "tags": [
147
+ "gpu",
148
+ "single-gpu",
149
+ "t4",
150
+ "cuda-11"
151
+ ],
152
+ "family": "g4dn",
153
+ "acceleratorType": "cuda",
154
+ "hardware": "NVIDIA T4",
155
+ "gpuArchitecture": "Turing",
156
+ "defaultCudaVersion": "11.8",
157
+ "notes": "1x NVIDIA T4 GPU (16GB). Maximum CPU/memory for single GPU"
158
+ },
159
+ "ml.g4dn.xlarge": {
160
+ "category": "gpu",
161
+ "gpus": 1,
162
+ "vcpus": 4,
163
+ "memGb": 16,
164
+ "accelerator": "T4 16GB",
165
+ "cudaVersions": [
166
+ "11.4",
167
+ "11.8"
168
+ ],
169
+ "tags": [
170
+ "gpu",
171
+ "single-gpu",
172
+ "budget",
173
+ "cost-effective",
174
+ "inference",
175
+ "t4",
176
+ "cuda-11"
177
+ ],
178
+ "family": "g4dn",
179
+ "acceleratorType": "cuda",
180
+ "hardware": "NVIDIA T4",
181
+ "gpuArchitecture": "Turing",
182
+ "defaultCudaVersion": "11.8",
183
+ "notes": "1x NVIDIA T4 GPU (16GB). Cost-effective for smaller models"
184
+ },
185
+ "ml.g5.12xlarge": {
186
+ "category": "gpu",
187
+ "gpus": 4,
188
+ "vcpus": 48,
189
+ "memGb": 192,
190
+ "accelerator": "4x A10G 96GB",
191
+ "cudaVersions": [
192
+ "11.8",
193
+ "12.1",
194
+ "12.2"
195
+ ],
196
+ "tags": [
197
+ "gpu",
198
+ "multi-gpu",
199
+ "large",
200
+ "a10g",
201
+ "parallel",
202
+ "cuda-11",
203
+ "cuda-12"
204
+ ],
205
+ "family": "g5",
206
+ "acceleratorType": "cuda",
207
+ "hardware": "NVIDIA A10G",
208
+ "gpuArchitecture": "Ampere",
209
+ "defaultCudaVersion": "12.1",
210
+ "notes": "4x NVIDIA A10G GPUs (96GB total). Good for tensor parallelism"
211
+ },
212
+ "ml.g5.16xlarge": {
213
+ "category": "gpu",
214
+ "gpus": 1,
215
+ "vcpus": 64,
216
+ "memGb": 256,
217
+ "accelerator": "A10G 24GB",
218
+ "cudaVersions": [
219
+ "11.8",
220
+ "12.1",
221
+ "12.2"
222
+ ],
223
+ "tags": [
224
+ "gpu",
225
+ "single-gpu",
226
+ "a10g",
227
+ "cuda-11",
228
+ "cuda-12"
229
+ ],
230
+ "family": "g5",
231
+ "acceleratorType": "cuda",
232
+ "hardware": "NVIDIA A10G",
233
+ "gpuArchitecture": "Ampere",
234
+ "defaultCudaVersion": "12.1",
235
+ "notes": "1x NVIDIA A10G GPU (24GB). Very high CPU/memory ratio"
236
+ },
237
+ "ml.g5.24xlarge": {
238
+ "category": "gpu",
239
+ "gpus": 4,
240
+ "vcpus": 96,
241
+ "memGb": 384,
242
+ "accelerator": "4x A10G 96GB",
243
+ "cudaVersions": [
244
+ "11.8",
245
+ "12.1",
246
+ "12.2"
247
+ ],
248
+ "tags": [
249
+ "gpu",
250
+ "multi-gpu",
251
+ "a10g",
252
+ "cuda-11",
253
+ "cuda-12"
254
+ ],
255
+ "family": "g5",
256
+ "acceleratorType": "cuda",
257
+ "hardware": "NVIDIA A10G",
258
+ "gpuArchitecture": "Ampere",
259
+ "defaultCudaVersion": "12.1",
260
+ "notes": "4x NVIDIA A10G GPUs (96GB total). High CPU/memory with multi-GPU"
261
+ },
262
+ "ml.g5.2xlarge": {
263
+ "category": "gpu",
264
+ "gpus": 1,
265
+ "vcpus": 8,
266
+ "memGb": 32,
267
+ "accelerator": "A10G 24GB",
268
+ "cudaVersions": [
269
+ "11.8",
270
+ "12.1",
271
+ "12.2"
272
+ ],
273
+ "tags": [
274
+ "gpu",
275
+ "single-gpu",
276
+ "inference",
277
+ "a10g",
278
+ "cuda-11",
279
+ "cuda-12"
280
+ ],
281
+ "family": "g5",
282
+ "acceleratorType": "cuda",
283
+ "hardware": "NVIDIA A10G",
284
+ "gpuArchitecture": "Ampere",
285
+ "defaultCudaVersion": "12.1",
286
+ "notes": "1x NVIDIA A10G GPU (24GB). Better CPU/memory for preprocessing"
287
+ },
288
+ "ml.g5.48xlarge": {
289
+ "category": "gpu",
290
+ "gpus": 8,
291
+ "vcpus": 192,
292
+ "memGb": 768,
293
+ "accelerator": "8x A10G 192GB",
294
+ "cudaVersions": [
295
+ "11.8",
296
+ "12.1",
297
+ "12.2"
298
+ ],
299
+ "tags": [
300
+ "gpu",
301
+ "multi-gpu",
302
+ "a10g",
303
+ "cuda-11",
304
+ "cuda-12"
305
+ ],
306
+ "family": "g5",
307
+ "acceleratorType": "cuda",
308
+ "hardware": "NVIDIA A10G",
309
+ "gpuArchitecture": "Ampere",
310
+ "defaultCudaVersion": "12.1",
311
+ "notes": "8x NVIDIA A10G GPUs (192GB total). Maximum multi-GPU configuration"
312
+ },
313
+ "ml.g5.4xlarge": {
314
+ "category": "gpu",
315
+ "gpus": 1,
316
+ "vcpus": 16,
317
+ "memGb": 64,
318
+ "accelerator": "A10G 24GB",
319
+ "cudaVersions": [
320
+ "11.8",
321
+ "12.1",
322
+ "12.2"
323
+ ],
324
+ "tags": [
325
+ "gpu",
326
+ "single-gpu",
327
+ "large",
328
+ "a10g",
329
+ "cuda-11",
330
+ "cuda-12"
331
+ ],
332
+ "family": "g5",
333
+ "acceleratorType": "cuda",
334
+ "hardware": "NVIDIA A10G",
335
+ "gpuArchitecture": "Ampere",
336
+ "defaultCudaVersion": "12.1",
337
+ "notes": "1x NVIDIA A10G GPU (24GB). High CPU/memory for complex preprocessing"
338
+ },
339
+ "ml.g5.8xlarge": {
340
+ "category": "gpu",
341
+ "gpus": 1,
342
+ "vcpus": 32,
343
+ "memGb": 128,
344
+ "accelerator": "A10G 24GB",
345
+ "cudaVersions": [
346
+ "11.8",
347
+ "12.1",
348
+ "12.2"
349
+ ],
350
+ "tags": [
351
+ "gpu",
352
+ "single-gpu",
353
+ "a10g",
354
+ "cuda-11",
355
+ "cuda-12"
356
+ ],
357
+ "family": "g5",
358
+ "acceleratorType": "cuda",
359
+ "hardware": "NVIDIA A10G",
360
+ "gpuArchitecture": "Ampere",
361
+ "defaultCudaVersion": "12.1",
362
+ "notes": "1x NVIDIA A10G GPU (24GB). Maximum CPU/memory for single GPU"
363
+ },
364
+ "ml.g5.xlarge": {
365
+ "category": "gpu",
366
+ "gpus": 1,
367
+ "vcpus": 4,
368
+ "memGb": 16,
369
+ "accelerator": "A10G 24GB",
370
+ "cudaVersions": [
371
+ "11.8",
372
+ "12.1",
373
+ "12.2"
374
+ ],
375
+ "tags": [
376
+ "gpu",
377
+ "single-gpu",
378
+ "inference",
379
+ "a10g",
380
+ "cuda-11",
381
+ "cuda-12"
382
+ ],
383
+ "family": "g5",
384
+ "acceleratorType": "cuda",
385
+ "hardware": "NVIDIA A10G",
386
+ "gpuArchitecture": "Ampere",
387
+ "defaultCudaVersion": "12.1",
388
+ "notes": "1x NVIDIA A10G GPU (24GB). Good for small to medium models"
389
+ },
390
+ "ml.g6.12xlarge": {
391
+ "category": "gpu",
392
+ "gpus": 4,
393
+ "vcpus": 48,
394
+ "memGb": 192,
395
+ "accelerator": "4x L4 96GB",
396
+ "cudaVersions": [
397
+ "12.1",
398
+ "12.2",
399
+ "12.4"
400
+ ],
401
+ "tags": [
402
+ "gpu",
403
+ "multi-gpu",
404
+ "large",
405
+ "l4",
406
+ "newer",
407
+ "parallel",
408
+ "cuda-12"
409
+ ],
410
+ "family": "g6",
411
+ "acceleratorType": "cuda",
412
+ "hardware": "NVIDIA L4",
413
+ "gpuArchitecture": "Ada Lovelace",
414
+ "defaultCudaVersion": "12.2",
415
+ "notes": "Multi-GPU (newer)"
416
+ },
417
+ "ml.g6.2xlarge": {
418
+ "category": "gpu",
419
+ "gpus": 1,
420
+ "vcpus": 8,
421
+ "memGb": 32,
422
+ "accelerator": "L4 24GB",
423
+ "cudaVersions": [
424
+ "12.1",
425
+ "12.2",
426
+ "12.4"
427
+ ],
428
+ "tags": [
429
+ "gpu",
430
+ "single-gpu",
431
+ "inference",
432
+ "l4",
433
+ "newer",
434
+ "cuda-12"
435
+ ],
436
+ "family": "g6",
437
+ "acceleratorType": "cuda",
438
+ "hardware": "NVIDIA L4",
439
+ "gpuArchitecture": "Ada Lovelace",
440
+ "defaultCudaVersion": "12.2",
441
+ "notes": "Medium GPU (newer)"
442
+ },
443
+ "ml.g6.xlarge": {
444
+ "category": "gpu",
445
+ "gpus": 1,
446
+ "vcpus": 4,
447
+ "memGb": 16,
448
+ "accelerator": "L4 24GB",
449
+ "cudaVersions": [
450
+ "12.1",
451
+ "12.2",
452
+ "12.4"
453
+ ],
454
+ "tags": [
455
+ "gpu",
456
+ "single-gpu",
457
+ "inference",
458
+ "l4",
459
+ "newer",
460
+ "cuda-12"
461
+ ],
462
+ "family": "g6",
463
+ "acceleratorType": "cuda",
464
+ "hardware": "NVIDIA L4",
465
+ "gpuArchitecture": "Ada Lovelace",
466
+ "defaultCudaVersion": "12.2",
467
+ "notes": "Small GPU (newer)"
468
+ },
469
+ "ml.inf2.24xlarge": {
470
+ "category": "gpu",
471
+ "gpus": 6,
472
+ "vcpus": 96,
473
+ "memGb": 384,
474
+ "accelerator": "6x Inferentia2",
475
+ "cudaVersions": [
476
+ "2.15.0",
477
+ "2.16.0",
478
+ "2.17.0"
479
+ ],
480
+ "tags": [
481
+ "gpu",
482
+ "multi-gpu",
483
+ "inferentia2",
484
+ "neuron"
485
+ ],
486
+ "family": "inf2",
487
+ "acceleratorType": "neuron",
488
+ "hardware": "AWS Inferentia2",
489
+ "gpuArchitecture": "Inferentia2",
490
+ "defaultCudaVersion": "2.16.0",
491
+ "notes": "6x Inferentia2 chips. Multi-chip for large models"
492
+ },
493
+ "ml.inf2.48xlarge": {
494
+ "category": "gpu",
495
+ "gpus": 12,
496
+ "vcpus": 192,
497
+ "memGb": 768,
498
+ "accelerator": "12x Inferentia2",
499
+ "cudaVersions": [
500
+ "2.15.0",
501
+ "2.16.0",
502
+ "2.17.0"
503
+ ],
504
+ "tags": [
505
+ "gpu",
506
+ "multi-gpu",
507
+ "inferentia2",
508
+ "neuron"
509
+ ],
510
+ "family": "inf2",
511
+ "acceleratorType": "neuron",
512
+ "hardware": "AWS Inferentia2",
513
+ "gpuArchitecture": "Inferentia2",
514
+ "defaultCudaVersion": "2.16.0",
515
+ "notes": "12x Inferentia2 chips. Maximum multi-chip configuration"
516
+ },
517
+ "ml.inf2.8xlarge": {
518
+ "category": "gpu",
519
+ "gpus": 1,
520
+ "vcpus": 32,
521
+ "memGb": 128,
522
+ "accelerator": "Inferentia2",
523
+ "cudaVersions": [
524
+ "2.15.0",
525
+ "2.16.0",
526
+ "2.17.0"
527
+ ],
528
+ "tags": [
529
+ "gpu",
530
+ "single-gpu",
531
+ "inferentia2",
532
+ "neuron"
533
+ ],
534
+ "family": "inf2",
535
+ "acceleratorType": "neuron",
536
+ "hardware": "AWS Inferentia2",
537
+ "gpuArchitecture": "Inferentia2",
538
+ "defaultCudaVersion": "2.16.0",
539
+ "notes": "1x Inferentia2 chip. Higher CPU/memory for preprocessing"
540
+ },
541
+ "ml.inf2.xlarge": {
542
+ "category": "gpu",
543
+ "gpus": 1,
544
+ "vcpus": 4,
545
+ "memGb": 16,
546
+ "accelerator": "Inferentia2",
547
+ "cudaVersions": [
548
+ "2.15.0",
549
+ "2.16.0",
550
+ "2.17.0"
551
+ ],
552
+ "tags": [
553
+ "gpu",
554
+ "single-gpu",
555
+ "inferentia2",
556
+ "neuron"
557
+ ],
558
+ "family": "inf2",
559
+ "acceleratorType": "neuron",
560
+ "hardware": "AWS Inferentia2",
561
+ "gpuArchitecture": "Inferentia2",
562
+ "defaultCudaVersion": "2.16.0",
563
+ "notes": "1x Inferentia2 chip. Cost-effective for transformer inference"
564
+ },
565
+ "ml.m5.2xlarge": {
566
+ "category": "cpu",
567
+ "gpus": 0,
568
+ "vcpus": 8,
569
+ "memGb": 32,
570
+ "accelerator": "",
571
+ "cudaVersions": null,
572
+ "tags": [
573
+ "large",
574
+ "cpu",
575
+ "general",
576
+ "high-memory"
577
+ ],
578
+ "family": "m5",
579
+ "acceleratorType": "cpu",
580
+ "hardware": "None",
581
+ "gpuArchitecture": "None",
582
+ "defaultCudaVersion": null,
583
+ "notes": "Large CPU workloads"
584
+ },
585
+ "ml.m5.4xlarge": {
586
+ "category": "cpu",
587
+ "gpus": 0,
588
+ "vcpus": 16,
589
+ "memGb": 64,
590
+ "accelerator": "",
591
+ "cudaVersions": null,
592
+ "tags": [
593
+ "xlarge",
594
+ "cpu",
595
+ "general",
596
+ "high-memory",
597
+ "high-cpu"
598
+ ],
599
+ "family": "m5",
600
+ "acceleratorType": "cpu",
601
+ "hardware": "None",
602
+ "gpuArchitecture": "None",
603
+ "defaultCudaVersion": null,
604
+ "notes": "XL CPU workloads"
605
+ },
606
+ "ml.m5.large": {
607
+ "category": "cpu",
608
+ "gpus": 0,
609
+ "vcpus": 2,
610
+ "memGb": 8,
611
+ "accelerator": "",
612
+ "cudaVersions": null,
613
+ "tags": [
614
+ "small",
615
+ "cpu",
616
+ "general",
617
+ "cheap",
618
+ "cost-effective",
619
+ "budget"
620
+ ],
621
+ "family": "m5",
622
+ "acceleratorType": "cpu",
623
+ "hardware": "None",
624
+ "gpuArchitecture": "None",
625
+ "defaultCudaVersion": null,
626
+ "notes": "Small CPU workloads"
627
+ },
628
+ "ml.m5.xlarge": {
629
+ "category": "cpu",
630
+ "gpus": 0,
631
+ "vcpus": 4,
632
+ "memGb": 16,
633
+ "accelerator": "",
634
+ "cudaVersions": null,
635
+ "tags": [
636
+ "medium",
637
+ "cpu",
638
+ "general",
639
+ "cost-effective"
640
+ ],
641
+ "family": "m5",
642
+ "acceleratorType": "cpu",
643
+ "hardware": "None",
644
+ "gpuArchitecture": "None",
645
+ "defaultCudaVersion": null,
646
+ "notes": "Medium CPU workloads"
647
+ },
648
+ "ml.p3.16xlarge": {
649
+ "category": "gpu",
650
+ "gpus": 8,
651
+ "vcpus": 64,
652
+ "memGb": 488,
653
+ "accelerator": "8x V100 128GB",
654
+ "cudaVersions": [
655
+ "11.0",
656
+ "11.4",
657
+ "11.8"
658
+ ],
659
+ "tags": [
660
+ "gpu",
661
+ "multi-gpu",
662
+ "v100",
663
+ "cuda-11"
664
+ ],
665
+ "family": "p3",
666
+ "acceleratorType": "cuda",
667
+ "hardware": "NVIDIA V100",
668
+ "gpuArchitecture": "Volta",
669
+ "defaultCudaVersion": "11.8",
670
+ "notes": "8x NVIDIA V100 GPUs (128GB total). Maximum multi-GPU configuration"
671
+ },
672
+ "ml.p3.2xlarge": {
673
+ "category": "gpu",
674
+ "gpus": 1,
675
+ "vcpus": 8,
676
+ "memGb": 61,
677
+ "accelerator": "V100 16GB",
678
+ "cudaVersions": [
679
+ "11.0",
680
+ "11.4",
681
+ "11.8"
682
+ ],
683
+ "tags": [
684
+ "gpu",
685
+ "single-gpu",
686
+ "high-performance",
687
+ "training",
688
+ "v100",
689
+ "cuda-11"
690
+ ],
691
+ "family": "p3",
692
+ "acceleratorType": "cuda",
693
+ "hardware": "NVIDIA V100",
694
+ "gpuArchitecture": "Volta",
695
+ "defaultCudaVersion": "11.8",
696
+ "notes": "1x NVIDIA V100 GPU (16GB). High-performance for training and inference"
697
+ },
698
+ "ml.p3.8xlarge": {
699
+ "category": "gpu",
700
+ "gpus": 4,
701
+ "vcpus": 32,
702
+ "memGb": 244,
703
+ "accelerator": "4x V100 64GB",
704
+ "cudaVersions": [
705
+ "11.0",
706
+ "11.4",
707
+ "11.8"
708
+ ],
709
+ "tags": [
710
+ "gpu",
711
+ "multi-gpu",
712
+ "high-performance",
713
+ "training",
714
+ "v100",
715
+ "parallel",
716
+ "cuda-11"
717
+ ],
718
+ "family": "p3",
719
+ "acceleratorType": "cuda",
720
+ "hardware": "NVIDIA V100",
721
+ "gpuArchitecture": "Volta",
722
+ "defaultCudaVersion": "11.8",
723
+ "notes": "4x NVIDIA V100 GPUs (64GB total). Multi-GPU for large models"
724
+ },
725
+ "ml.r5.large": {
726
+ "category": "cpu",
727
+ "gpus": 0,
728
+ "vcpus": 2,
729
+ "memGb": 16,
730
+ "accelerator": "",
731
+ "cudaVersions": null,
732
+ "tags": [
733
+ "memory",
734
+ "cpu",
735
+ "high-memory"
736
+ ],
737
+ "family": "r5",
738
+ "acceleratorType": "cpu",
739
+ "hardware": "None",
740
+ "gpuArchitecture": "None",
741
+ "defaultCudaVersion": null,
742
+ "notes": ""
743
+ },
744
+ "ml.r5.xlarge": {
745
+ "category": "cpu",
746
+ "gpus": 0,
747
+ "vcpus": 4,
748
+ "memGb": 32,
749
+ "accelerator": "",
750
+ "cudaVersions": null,
751
+ "tags": [
752
+ "memory",
753
+ "cpu",
754
+ "high-memory"
755
+ ],
756
+ "family": "r5",
757
+ "acceleratorType": "cpu",
758
+ "hardware": "None",
759
+ "gpuArchitecture": "None",
760
+ "defaultCudaVersion": null,
761
+ "notes": ""
762
+ },
763
+ "ml.trn1.2xlarge": {
764
+ "category": "gpu",
765
+ "gpus": 1,
766
+ "vcpus": 8,
767
+ "memGb": 32,
768
+ "accelerator": "Trainium",
769
+ "cudaVersions": [
770
+ "2.15.0",
771
+ "2.16.0",
772
+ "2.17.0"
773
+ ],
774
+ "tags": [
775
+ "gpu",
776
+ "single-gpu",
777
+ "trainium",
778
+ "neuron"
779
+ ],
780
+ "family": "trn1",
781
+ "acceleratorType": "neuron",
782
+ "hardware": "AWS Trainium",
783
+ "gpuArchitecture": "Trainium1",
784
+ "defaultCudaVersion": "2.16.0",
785
+ "notes": "1x Trainium chip. Optimized for training, also supports inference"
786
+ },
787
+ "ml.trn1.32xlarge": {
788
+ "category": "gpu",
789
+ "gpus": 16,
790
+ "vcpus": 128,
791
+ "memGb": 512,
792
+ "accelerator": "16x Trainium",
793
+ "cudaVersions": [
794
+ "2.15.0",
795
+ "2.16.0",
796
+ "2.17.0"
797
+ ],
798
+ "tags": [
799
+ "gpu",
800
+ "multi-gpu",
801
+ "trainium",
802
+ "neuron"
803
+ ],
804
+ "family": "trn1",
805
+ "acceleratorType": "neuron",
806
+ "hardware": "AWS Trainium",
807
+ "gpuArchitecture": "Trainium1",
808
+ "defaultCudaVersion": "2.16.0",
809
+ "notes": "16x Trainium chips. Maximum multi-chip for large-scale training/inference"
810
+ }
811
+ },
812
+ "recommendations": {
813
+ "cpu": [
814
+ "ml.m5.large",
815
+ "ml.m5.xlarge",
816
+ "ml.m5.2xlarge",
817
+ "ml.m5.4xlarge",
818
+ "ml.c5.xlarge",
819
+ "ml.c5.2xlarge",
820
+ "ml.r5.large",
821
+ "ml.r5.xlarge"
822
+ ],
823
+ "gpu": [
824
+ "ml.g4dn.xlarge",
825
+ "ml.g4dn.2xlarge",
826
+ "ml.g5.xlarge",
827
+ "ml.g5.2xlarge",
828
+ "ml.g5.4xlarge",
829
+ "ml.p3.2xlarge",
830
+ "ml.g5.12xlarge",
831
+ "ml.g6.xlarge",
832
+ "ml.g6.2xlarge",
833
+ "ml.g6.12xlarge",
834
+ "ml.p3.8xlarge",
835
+ "ml.g5.8xlarge",
836
+ "ml.g5.16xlarge",
837
+ "ml.g5.24xlarge",
838
+ "ml.g5.48xlarge",
839
+ "ml.g4dn.4xlarge",
840
+ "ml.g4dn.8xlarge",
841
+ "ml.g4dn.12xlarge",
842
+ "ml.g4dn.16xlarge",
843
+ "ml.p3.16xlarge",
844
+ "ml.inf2.xlarge",
845
+ "ml.inf2.8xlarge",
846
+ "ml.inf2.24xlarge",
847
+ "ml.inf2.48xlarge",
848
+ "ml.trn1.2xlarge",
849
+ "ml.trn1.32xlarge"
850
+ ]
851
+ }
852
+ }