npm - @aws/ml-container-creator - Versions diffs - 0.9.1 → 0.10.0 - Mend

@aws/ml-container-creator 0.9.1 → 0.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32) hide show

package/config/parameter-schema-v2.json +2065 -0
package/package.json +4 -4
package/servers/lib/catalogs/jumpstart-public.json +101 -16
package/servers/lib/catalogs/models.json +182 -26
package/src/app.js +1 -389
package/src/lib/bootstrap-command-handler.js +75 -1078
package/src/lib/bootstrap-profile-manager.js +634 -0
package/src/lib/bootstrap-provisioners.js +421 -0
package/src/lib/config-loader.js +405 -0
package/src/lib/config-manager.js +59 -1685
package/src/lib/config-mcp-client.js +118 -0
package/src/lib/config-validator.js +634 -0
package/src/lib/cuda-resolver.js +140 -0
package/src/lib/e2e-catalog-validator.js +251 -3
package/src/lib/e2e-ci-recorder.js +103 -0
package/src/lib/generated/cli-options.js +8 -4
package/src/lib/generated/parameter-matrix.js +671 -0
package/src/lib/generated/validation-rules.js +2 -2
package/src/lib/marketplace-flow.js +276 -0
package/src/lib/mcp-query-runner.js +768 -0
package/src/lib/parameter-schema-validator.js +62 -18
package/src/lib/prompt-runner.js +41 -1504
package/src/lib/prompts/feature-prompts.js +172 -0
package/src/lib/prompts/index.js +48 -0
package/src/lib/prompts/infrastructure-prompts.js +690 -0
package/src/lib/prompts/model-prompts.js +552 -0
package/src/lib/prompts/project-prompts.js +70 -0
package/src/lib/prompts.js +2 -1446
package/src/lib/registry-command-handler.js +135 -3
package/src/lib/secrets-prompt-runner.js +251 -0
package/src/lib/template-variable-resolver.js +398 -0
package/config/parameter-schema.json +0 -88

package/config/parameter-schema-v2.json ADDED Viewed

@@ -0,0 +1,2065 @@
+{
+    "$schema": "https://json-schema.org/draft/2020-12/schema",
+    "schemaVersion": "2.0.0",
+    "_comment": "Single source of truth for all MCC parameters. Drives CLI, validation, prompts, widget, and tests.",
+    "parameters": {
+        "projectName": {
+            "type": "string",
+            "description": "Name for the generated project",
+            "cliFlag": "--project-name",
+            "cliArgName": "name",
+            "envVar": "ML_PROJECT_NAME",
+            "templateVar": "projectName",
+            "configKey": "projectName",
+            "default": null,
+            "validation": {
+                "pattern": "^[a-z0-9][a-z0-9-]*[a-z0-9]$",
+                "minLength": 2,
+                "maxLength": 63
+            },
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "model-server",
+                "inputType": "text",
+                "placeholder": "my-project"
+            },
+            "prompt": {
+                "message": "Project name?",
+                "type": "input"
+            },
+            "deprecated": false,
+            "since": "0.1.0"
+        },
+        "deploymentConfig": {
+            "type": "enum",
+            "description": "Deployment configuration (e.g. http-flask, transformers-vllm, triton-fil)",
+            "cliFlag": "--deployment-config",
+            "cliArgName": "config",
+            "envVar": "ML_DEPLOYMENT_CONFIG",
+            "templateVar": "deploymentConfig",
+            "configKey": "deploymentConfig",
+            "default": null,
+            "validation": {
+                "enum": [
+                    "http-flask",
+                    "http-fastapi",
+                    "transformers-vllm",
+                    "transformers-sglang",
+                    "transformers-tensorrt-llm",
+                    "transformers-lmi",
+                    "transformers-djl",
+                    "triton-fil",
+                    "triton-onnxruntime",
+                    "triton-tensorflow",
+                    "triton-pytorch",
+                    "triton-vllm",
+                    "triton-tensorrtllm",
+                    "triton-python",
+                    "diffusors-vllm-omni",
+                    "marketplace"
+                ]
+            },
+            "phase": "model",
+            "group": "model",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "model-server",
+                "inputType": "select"
+            },
+            "prompt": {
+                "message": "Deployment configuration?",
+                "type": "list"
+            },
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "modelName": {
+            "type": "string",
+            "description": "Model identifier (hf-org/model, s3://..., registry://..., marketplace://...)",
+            "cliFlag": "--model-name",
+            "cliArgName": "name",
+            "envVar": "ML_MODEL_NAME",
+            "templateVar": "modelName",
+            "configKey": "modelName",
+            "default": null,
+            "validation": {
+                "minLength": 1
+            },
+            "phase": "model",
+            "group": "model",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": {
+                "section": "model-server",
+                "inputType": "text",
+                "datalist": "models",
+                "placeholder": "e.g. meta-llama/Llama-3.1-8B-Instruct"
+            },
+            "prompt": {
+                "message": "Model name or path?",
+                "type": "input"
+            },
+            "deprecated": false,
+            "since": "0.3.0"
+        },
+        "deploymentTarget": {
+            "type": "enum",
+            "description": "Deployment target (managed-inference, realtime-inference, async-inference, batch-transform, hyperpod-eks)",
+            "cliFlag": "--deployment-target",
+            "cliArgName": "target",
+            "envVar": "ML_DEPLOYMENT_TARGET",
+            "templateVar": "deploymentTarget",
+            "configKey": "deploymentTarget",
+            "default": "realtime-inference",
+            "validation": {
+                "enum": [
+                    "managed-inference",
+                    "realtime-inference",
+                    "async-inference",
+                    "batch-transform",
+                    "hyperpod-eks"
+                ]
+            },
+            "phase": "infrastructure",
+            "group": "infrastructure",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "infrastructure",
+                "inputType": "select"
+            },
+            "prompt": {
+                "message": "Deployment target?",
+                "type": "list"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "instanceType": {
+            "type": "string",
+            "description": "SageMaker instance type (e.g. ml.g5.xlarge, ml.m5.large)",
+            "cliFlag": "--instance-type",
+            "cliArgName": "type",
+            "envVar": "ML_INSTANCE_TYPE",
+            "templateVar": "instanceType",
+            "configKey": "instanceType",
+            "default": null,
+            "validation": {
+                "pattern": "^ml\\.[a-z0-9]+\\.[a-z0-9]+$"
+            },
+            "phase": "infrastructure",
+            "group": "infrastructure",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference",
+                    "async-inference",
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "infrastructure",
+                "inputType": "text",
+                "datalist": "instances",
+                "placeholder": "e.g. ml.g5.2xlarge"
+            },
+            "prompt": {
+                "message": "Instance type?",
+                "type": "input",
+                "when": "deploymentTarget !== 'hyperpod-eks'"
+            },
+            "deprecated": false,
+            "since": "0.1.0"
+        },
+        "icGpuCount": {
+            "type": "integer",
+            "description": "GPUs allocated to the inference component",
+            "cliFlag": "--ic-gpu-count",
+            "cliArgName": "n",
+            "envVar": "ML_IC_GPU_COUNT",
+            "templateVar": "icGpuCount",
+            "configKey": "icGpuCount",
+            "default": null,
+            "validation": {
+                "min": 0,
+                "max": 8
+            },
+            "phase": "infrastructure",
+            "group": "inference-component",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "infrastructure",
+                "inputType": "number",
+                "placeholder": "auto"
+            },
+            "prompt": null,
+            "serverMapping": {
+                "icConfVar": "IC_GPU_COUNT"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "icCopyCount": {
+            "type": "integer",
+            "description": "Number of inference component copies",
+            "cliFlag": "--ic-copy-count",
+            "cliArgName": "n",
+            "envVar": "ML_IC_COPY_COUNT",
+            "templateVar": "icCopyCount",
+            "configKey": "icCopyCount",
+            "default": 1,
+            "validation": {
+                "min": 0,
+                "max": 100
+            },
+            "phase": "infrastructure",
+            "group": "inference-component",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "infrastructure",
+                "inputType": "number",
+                "placeholder": "1"
+            },
+            "prompt": null,
+            "serverMapping": {
+                "icConfVar": "IC_COPY_COUNT"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "icMemorySize": {
+            "type": "integer",
+            "description": "Memory in MB for the inference component",
+            "cliFlag": "--ic-memory-size",
+            "cliArgName": "mb",
+            "envVar": "ML_IC_MEMORY_SIZE",
+            "templateVar": "icMemorySize",
+            "configKey": "icMemorySize",
+            "default": null,
+            "validation": {
+                "min": 128,
+                "max": 3145728
+            },
+            "phase": "infrastructure",
+            "group": "inference-component",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "infrastructure",
+                "inputType": "number",
+                "placeholder": "1024"
+            },
+            "prompt": null,
+            "serverMapping": {
+                "icConfVar": "IC_MIN_MEMORY_MB"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "enableLora": {
+            "type": "boolean",
+            "description": "Enable LoRA adapter serving",
+            "cliFlag": "--enable-lora",
+            "cliArgName": null,
+            "envVar": "ML_ENABLE_LORA",
+            "templateVar": "enableLora",
+            "configKey": "enableLora",
+            "default": false,
+            "validation": {},
+            "phase": "features",
+            "group": "lora",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "checkbox"
+            },
+            "prompt": {
+                "message": "Enable LoRA adapter serving?",
+                "type": "confirm",
+                "when": "architecture === 'transformers' && ['vllm','sglang','djl'].includes(modelServer)"
+            },
+            "serverMapping": {
+                "envVar": "VLLM_ENABLE_LORA",
+                "booleanFlag": true
+            },
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "maxLoras": {
+            "type": "integer",
+            "description": "Maximum concurrent LoRA adapters in GPU memory",
+            "cliFlag": "--max-loras",
+            "cliArgName": "n",
+            "envVar": "ML_MAX_LORAS",
+            "templateVar": "maxLoras",
+            "configKey": "maxLoras",
+            "default": 30,
+            "validation": {
+                "min": 1,
+                "max": 256
+            },
+            "phase": "features",
+            "group": "lora",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "number",
+                "placeholder": "30"
+            },
+            "prompt": {
+                "message": "Max concurrent LoRA adapters?",
+                "type": "number",
+                "when": "enableLora === true"
+            },
+            "serverMapping": {
+                "envVar": "VLLM_MAX_LORAS"
+            },
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "maxLoraRank": {
+            "type": "integer",
+            "description": "Maximum LoRA rank",
+            "cliFlag": "--max-lora-rank",
+            "cliArgName": "n",
+            "envVar": "ML_MAX_LORA_RANK",
+            "templateVar": "maxLoraRank",
+            "configKey": "maxLoraRank",
+            "default": 64,
+            "validation": {
+                "min": 8,
+                "max": 512
+            },
+            "phase": "features",
+            "group": "lora",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "number",
+                "placeholder": "64"
+            },
+            "prompt": {
+                "message": "Max LoRA rank?",
+                "type": "number",
+                "when": "enableLora === true"
+            },
+            "serverMapping": {
+                "envVar": "VLLM_MAX_LORA_RANK"
+            },
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "includeBenchmark": {
+            "type": "boolean",
+            "description": "Include SageMaker AI Benchmarking",
+            "cliFlag": "--include-benchmark",
+            "cliArgName": null,
+            "envVar": "ML_INCLUDE_BENCHMARK",
+            "templateVar": "includeBenchmark",
+            "configKey": "includeBenchmark",
+            "default": false,
+            "validation": {},
+            "phase": "features",
+            "group": "benchmark",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "checkbox"
+            },
+            "prompt": {
+                "message": "Include benchmarking?",
+                "type": "confirm",
+                "when": "['transformers','diffusors'].includes(architecture)"
+            },
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "benchmarkConcurrency": {
+            "type": "integer",
+            "description": "Benchmark concurrent requests",
+            "cliFlag": "--benchmark-concurrency",
+            "cliArgName": "n",
+            "envVar": null,
+            "templateVar": "benchmarkConcurrency",
+            "configKey": "benchmarkConcurrency",
+            "default": 10,
+            "validation": {
+                "min": 1,
+                "max": 1000
+            },
+            "phase": "features",
+            "group": "benchmark",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "number",
+                "placeholder": "10"
+            },
+            "prompt": {
+                "message": "Benchmark concurrency?",
+                "type": "number",
+                "when": "includeBenchmark === true"
+            },
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "benchmarkInputTokens": {
+            "type": "integer",
+            "description": "Benchmark mean input tokens",
+            "cliFlag": "--benchmark-input-tokens",
+            "cliArgName": "n",
+            "envVar": null,
+            "templateVar": "benchmarkInputTokensMean",
+            "configKey": "benchmarkInputTokensMean",
+            "default": 550,
+            "validation": {
+                "min": 1,
+                "max": 128000
+            },
+            "phase": "features",
+            "group": "benchmark",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "number",
+                "placeholder": "550"
+            },
+            "prompt": {
+                "message": "Mean input tokens?",
+                "type": "number",
+                "when": "includeBenchmark === true"
+            },
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "benchmarkOutputTokens": {
+            "type": "integer",
+            "description": "Benchmark mean output tokens",
+            "cliFlag": "--benchmark-output-tokens",
+            "cliArgName": "n",
+            "envVar": null,
+            "templateVar": "benchmarkOutputTokensMean",
+            "configKey": "benchmarkOutputTokensMean",
+            "default": 150,
+            "validation": {
+                "min": 1,
+                "max": 128000
+            },
+            "phase": "features",
+            "group": "benchmark",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "number",
+                "placeholder": "150"
+            },
+            "prompt": {
+                "message": "Mean output tokens?",
+                "type": "number",
+                "when": "includeBenchmark === true"
+            },
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "benchmarkStreaming": {
+            "type": "boolean",
+            "description": "Enable streaming in benchmark",
+            "cliFlag": "--benchmark-streaming",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": "benchmarkStreaming",
+            "configKey": "benchmarkStreaming",
+            "default": true,
+            "validation": {},
+            "phase": "features",
+            "group": "benchmark",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": {
+                "section": "features",
+                "inputType": "checkbox"
+            },
+            "prompt": {
+                "message": "Enable streaming in benchmark?",
+                "type": "confirm",
+                "when": "includeBenchmark === true"
+            },
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "benchmarkRequestCount": {
+            "type": "integer",
+            "description": "Total number of benchmark requests to send",
+            "cliFlag": "--benchmark-request-count",
+            "cliArgName": "n",
+            "envVar": null,
+            "templateVar": "benchmarkRequestCount",
+            "configKey": "benchmarkRequestCount",
+            "default": null,
+            "validation": {
+                "min": 1
+            },
+            "phase": "features",
+            "group": "benchmark",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "benchmarkS3OutputPath": {
+            "type": "string",
+            "description": "S3 URI for benchmark results output",
+            "cliFlag": "--benchmark-s3-output-path",
+            "cliArgName": "path",
+            "envVar": "ML_BENCHMARK_S3_OUTPUT_PATH",
+            "templateVar": "benchmarkS3OutputPath",
+            "configKey": "benchmarkS3OutputPath",
+            "default": null,
+            "validation": {
+                "pattern": "^s3://"
+            },
+            "phase": "features",
+            "group": "benchmark",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "skipPrompts": {
+            "type": "boolean",
+            "description": "Skip interactive prompts and use configuration from other sources",
+            "cliFlag": "--skip-prompts",
+            "cliArgName": null,
+            "envVar": "MCC_SKIP_PROMPTS",
+            "templateVar": null,
+            "configKey": "skipPrompts",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "autoPrompt": {
+            "type": "boolean",
+            "description": "Fill defaults, prompt only for missing required values",
+            "cliFlag": "--auto-prompt",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "autoPrompt",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "config": {
+            "type": "string",
+            "description": "Path to JSON configuration file",
+            "cliFlag": "--config",
+            "cliArgName": "path",
+            "envVar": null,
+            "templateVar": null,
+            "configKey": null,
+            "default": null,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "projectDir": {
+            "type": "string",
+            "description": "Output directory path",
+            "cliFlag": "--project-dir",
+            "cliArgName": "dir",
+            "envVar": "ML_PROJECT_DIR",
+            "templateVar": null,
+            "configKey": "projectDir",
+            "default": null,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.3.0"
+        },
+        "force": {
+            "type": "boolean",
+            "description": "Overwrite existing output directory without prompting",
+            "cliFlag": "--force",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "force",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.3.0"
+        },
+        "framework": {
+            "type": "enum",
+            "description": "ML framework",
+            "cliFlag": "--framework",
+            "cliArgName": "framework",
+            "envVar": null,
+            "templateVar": "framework",
+            "configKey": "framework",
+            "default": null,
+            "validation": {
+                "enum": [
+                    "sklearn",
+                    "xgboost",
+                    "tensorflow",
+                    "transformers"
+                ]
+            },
+            "phase": "model",
+            "group": "model",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": true,
+            "replacedBy": "deploymentConfig",
+            "since": "0.1.0"
+        },
+        "modelFormat": {
+            "type": "string",
+            "description": "Model serialization format (pkl, joblib, json, model, ubj, keras, h5, SavedModel)",
+            "cliFlag": "--model-format",
+            "cliArgName": "format",
+            "envVar": "ML_MODEL_FORMAT",
+            "templateVar": "modelFormat",
+            "configKey": "modelFormat",
+            "default": null,
+            "validation": {
+                "enum": [
+                    "pkl",
+                    "joblib",
+                    "json",
+                    "model",
+                    "ubj",
+                    "keras",
+                    "h5",
+                    "SavedModel"
+                ]
+            },
+            "phase": "model",
+            "group": "model",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "http"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "Model format?",
+                "type": "list",
+                "when": "architecture === 'http'"
+            },
+            "deprecated": false,
+            "since": "0.1.0"
+        },
+        "modelServer": {
+            "type": "enum",
+            "description": "Model server",
+            "cliFlag": "--model-server",
+            "cliArgName": "server",
+            "envVar": null,
+            "templateVar": "modelServer",
+            "configKey": "modelServer",
+            "default": null,
+            "validation": {
+                "enum": [
+                    "flask",
+                    "fastapi",
+                    "vllm",
+                    "sglang"
+                ]
+            },
+            "phase": "model",
+            "group": "model",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": true,
+            "replacedBy": "deploymentConfig",
+            "since": "0.1.0"
+        },
+        "baseImage": {
+            "type": "string",
+            "description": "Base container image for Dockerfile",
+            "cliFlag": "--base-image",
+            "cliArgName": "image",
+            "envVar": "ML_BASE_IMAGE",
+            "templateVar": "baseImage",
+            "configKey": "baseImage",
+            "default": null,
+            "validation": {},
+            "phase": "build",
+            "group": "build",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.3.0"
+        },
+        "region": {
+            "type": "string",
+            "description": "AWS region",
+            "cliFlag": "--region",
+            "cliArgName": "region",
+            "envVar": "ML_REGION",
+            "templateVar": "awsRegion",
+            "configKey": "region",
+            "default": "us-east-1",
+            "validation": {
+                "pattern": "^[a-z]{2}-[a-z]+-\\d+$"
+            },
+            "phase": "infrastructure",
+            "group": "infrastructure",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "AWS region?",
+                "type": "input"
+            },
+            "deprecated": false,
+            "since": "0.1.0"
+        },
+        "roleArn": {
+            "type": "string",
+            "description": "IAM role ARN for SageMaker execution",
+            "cliFlag": "--role-arn",
+            "cliArgName": "arn",
+            "envVar": "ML_ROLE_ARN",
+            "templateVar": "roleArn",
+            "configKey": "roleArn",
+            "default": null,
+            "validation": {
+                "pattern": "^arn:aws:iam::"
+            },
+            "phase": "infrastructure",
+            "group": "infrastructure",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.3.0"
+        },
+        "buildTarget": {
+            "type": "string",
+            "description": "Build target (codebuild)",
+            "cliFlag": "--build-target",
+            "cliArgName": "target",
+            "envVar": "ML_BUILD_TARGET",
+            "templateVar": "buildTarget",
+            "configKey": "buildTarget",
+            "default": "codebuild",
+            "validation": {
+                "enum": [
+                    "codebuild"
+                ]
+            },
+            "phase": "build",
+            "group": "build",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "codebuildComputeType": {
+            "type": "string",
+            "description": "CodeBuild compute type (SMALL, MEDIUM, LARGE, or BUILD_GENERAL1_SMALL/MEDIUM/LARGE/2XLARGE)",
+            "cliFlag": "--codebuild-compute-type",
+            "cliArgName": "type",
+            "envVar": "ML_CODEBUILD_COMPUTE_TYPE",
+            "templateVar": "codebuildComputeType",
+            "configKey": "codebuildComputeType",
+            "default": "BUILD_GENERAL1_LARGE",
+            "validation": {
+                "enum": [
+                    "SMALL",
+                    "MEDIUM",
+                    "LARGE",
+                    "BUILD_GENERAL1_SMALL",
+                    "BUILD_GENERAL1_MEDIUM",
+                    "BUILD_GENERAL1_LARGE",
+                    "BUILD_GENERAL1_2XLARGE"
+                ]
+            },
+            "phase": "build",
+            "group": "build",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "hfToken": {
+            "type": "string",
+            "description": "HuggingFace token (or $HF_TOKEN for env var reference)",
+            "cliFlag": "--hf-token",
+            "cliArgName": "token",
+            "envVar": null,
+            "templateVar": "hfToken",
+            "configKey": "hfToken",
+            "default": null,
+            "validation": {},
+            "phase": "auth",
+            "group": "auth",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "sensitive": true,
+            "deprecated": false,
+            "since": "0.3.0"
+        },
+        "hfTokenArn": {
+            "type": "string",
+            "description": "HuggingFace token ARN from Secrets Manager",
+            "cliFlag": "--hf-token-arn",
+            "cliArgName": "arn",
+            "envVar": "ML_HF_TOKEN_ARN",
+            "templateVar": "hfTokenArn",
+            "configKey": "hfTokenArn",
+            "default": null,
+            "validation": {
+                "pattern": "^arn:aws:secretsmanager:"
+            },
+            "phase": "auth",
+            "group": "auth",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "transformers",
+                    "diffusors"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "ngcToken": {
+            "type": "string",
+            "description": "NVIDIA NGC token (or $NGC_API_KEY for env var reference)",
+            "cliFlag": "--ngc-token",
+            "cliArgName": "token",
+            "envVar": null,
+            "templateVar": "ngcToken",
+            "configKey": "ngcToken",
+            "default": null,
+            "validation": {},
+            "phase": "auth",
+            "group": "auth",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "transformers"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "sensitive": true,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "ngcTokenArn": {
+            "type": "string",
+            "description": "NVIDIA NGC token ARN from Secrets Manager",
+            "cliFlag": "--ngc-token-arn",
+            "cliArgName": "arn",
+            "envVar": "ML_NGC_TOKEN_ARN",
+            "templateVar": "ngcTokenArn",
+            "configKey": "ngcTokenArn",
+            "default": null,
+            "validation": {
+                "pattern": "^arn:aws:secretsmanager:"
+            },
+            "phase": "auth",
+            "group": "auth",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "transformers"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "endpointInitialInstanceCount": {
+            "type": "integer",
+            "description": "Number of instances for the endpoint",
+            "cliFlag": "--endpoint-initial-instance-count",
+            "cliArgName": "n",
+            "envVar": "ML_ENDPOINT_INSTANCE_COUNT",
+            "templateVar": "endpointInitialInstanceCount",
+            "configKey": "endpointInitialInstanceCount",
+            "default": 1,
+            "validation": {
+                "min": 1,
+                "max": 100
+            },
+            "phase": "infrastructure",
+            "group": "endpoint",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "endpointDataCapturePercent": {
+            "type": "integer",
+            "description": "Data capture percentage for monitoring, 0-100",
+            "cliFlag": "--endpoint-data-capture-percent",
+            "cliArgName": "pct",
+            "envVar": null,
+            "templateVar": "endpointDataCapturePercent",
+            "configKey": "endpointDataCapturePercent",
+            "default": 0,
+            "validation": {
+                "min": 0,
+                "max": 100
+            },
+            "phase": "infrastructure",
+            "group": "endpoint",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "endpointVariantName": {
+            "type": "string",
+            "description": "Production variant name",
+            "cliFlag": "--endpoint-variant-name",
+            "cliArgName": "name",
+            "envVar": null,
+            "templateVar": "endpointVariantName",
+            "configKey": "endpointVariantName",
+            "default": "AllTraffic",
+            "validation": {
+                "pattern": "^[a-zA-Z0-9]([\\w-]{0,62}[a-zA-Z0-9])?$"
+            },
+            "phase": "infrastructure",
+            "group": "endpoint",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "endpointVolumeSize": {
+            "type": "integer",
+            "description": "ML storage volume size in GB",
+            "cliFlag": "--endpoint-volume-size",
+            "cliArgName": "gb",
+            "envVar": null,
+            "templateVar": "endpointVolumeSize",
+            "configKey": "endpointVolumeSize",
+            "default": null,
+            "validation": {
+                "min": 1,
+                "max": 16384
+            },
+            "phase": "infrastructure",
+            "group": "endpoint",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "icCpuCount": {
+            "type": "number",
+            "description": "vCPUs allocated to the inference component",
+            "cliFlag": "--ic-cpu-count",
+            "cliArgName": "n",
+            "envVar": "ML_IC_CPU_COUNT",
+            "templateVar": "icCpuCount",
+            "configKey": "icCpuCount",
+            "default": null,
+            "validation": {
+                "min": 0.25,
+                "max": 768
+            },
+            "phase": "infrastructure",
+            "group": "inference-component",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "icModelWeight": {
+            "type": "number",
+            "description": "Traffic routing weight, 0-1",
+            "cliFlag": "--ic-model-weight",
+            "cliArgName": "weight",
+            "envVar": null,
+            "templateVar": "icModelWeight",
+            "configKey": "icModelWeight",
+            "default": 1,
+            "validation": {
+                "min": 0,
+                "max": 1
+            },
+            "phase": "infrastructure",
+            "group": "inference-component",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "managed-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "asyncS3OutputPath": {
+            "type": "string",
+            "description": "S3 output path for async results",
+            "cliFlag": "--async-s3-output-path",
+            "cliArgName": "path",
+            "envVar": "ML_ASYNC_S3_OUTPUT_PATH",
+            "templateVar": "asyncS3OutputPath",
+            "configKey": "asyncS3OutputPath",
+            "default": null,
+            "validation": {
+                "pattern": "^s3://"
+            },
+            "phase": "infrastructure",
+            "group": "async",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "async-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "S3 output path for async results?",
+                "type": "input",
+                "when": "deploymentTarget === 'async-inference'"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "asyncSnsSuccessTopic": {
+            "type": "string",
+            "description": "SNS topic ARN for success notifications",
+            "cliFlag": "--async-sns-success-topic",
+            "cliArgName": "arn",
+            "envVar": null,
+            "templateVar": "asyncSnsSuccessTopic",
+            "configKey": "asyncSnsSuccessTopic",
+            "default": null,
+            "validation": {
+                "pattern": "^arn:aws:sns:"
+            },
+            "phase": "infrastructure",
+            "group": "async",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "async-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "asyncSnsErrorTopic": {
+            "type": "string",
+            "description": "SNS topic ARN for error notifications",
+            "cliFlag": "--async-sns-error-topic",
+            "cliArgName": "arn",
+            "envVar": null,
+            "templateVar": "asyncSnsErrorTopic",
+            "configKey": "asyncSnsErrorTopic",
+            "default": null,
+            "validation": {
+                "pattern": "^arn:aws:sns:"
+            },
+            "phase": "infrastructure",
+            "group": "async",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "async-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "asyncMaxConcurrent": {
+            "type": "integer",
+            "description": "Max concurrent invocations per instance",
+            "cliFlag": "--async-max-concurrent",
+            "cliArgName": "n",
+            "envVar": null,
+            "templateVar": "asyncMaxConcurrent",
+            "configKey": "asyncMaxConcurrent",
+            "default": 1,
+            "validation": {
+                "min": 1,
+                "max": 100
+            },
+            "phase": "infrastructure",
+            "group": "async",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "async-inference"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchInputPath": {
+            "type": "string",
+            "description": "S3 input path for batch data",
+            "cliFlag": "--batch-input-path",
+            "cliArgName": "path",
+            "envVar": "ML_BATCH_INPUT_PATH",
+            "templateVar": "batchInputPath",
+            "configKey": "batchInputPath",
+            "default": null,
+            "validation": {
+                "pattern": "^s3://"
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "S3 input path?",
+                "type": "input",
+                "when": "deploymentTarget === 'batch-transform'"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchOutputPath": {
+            "type": "string",
+            "description": "S3 output path for batch results",
+            "cliFlag": "--batch-output-path",
+            "cliArgName": "path",
+            "envVar": "ML_BATCH_OUTPUT_PATH",
+            "templateVar": "batchOutputPath",
+            "configKey": "batchOutputPath",
+            "default": null,
+            "validation": {
+                "pattern": "^s3://"
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "S3 output path?",
+                "type": "input",
+                "when": "deploymentTarget === 'batch-transform'"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchInstanceCount": {
+            "type": "integer",
+            "description": "Number of batch instances",
+            "cliFlag": "--batch-instance-count",
+            "cliArgName": "n",
+            "envVar": null,
+            "templateVar": "batchInstanceCount",
+            "configKey": "batchInstanceCount",
+            "default": 1,
+            "validation": {
+                "min": 1,
+                "max": 100
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchSplitType": {
+            "type": "enum",
+            "description": "Input split type: Line, RecordIO, None",
+            "cliFlag": "--batch-split-type",
+            "cliArgName": "type",
+            "envVar": null,
+            "templateVar": "batchSplitType",
+            "configKey": "batchSplitType",
+            "default": "Line",
+            "validation": {
+                "enum": [
+                    "Line",
+                    "RecordIO",
+                    "None"
+                ]
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchStrategy": {
+            "type": "enum",
+            "description": "Batch strategy: MultiRecord, SingleRecord",
+            "cliFlag": "--batch-strategy",
+            "cliArgName": "strategy",
+            "envVar": null,
+            "templateVar": "batchStrategy",
+            "configKey": "batchStrategy",
+            "default": "MultiRecord",
+            "validation": {
+                "enum": [
+                    "MultiRecord",
+                    "SingleRecord"
+                ]
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchJoinSource": {
+            "type": "enum",
+            "description": "Join source: Input, None",
+            "cliFlag": "--batch-join-source",
+            "cliArgName": "source",
+            "envVar": null,
+            "templateVar": "batchJoinSource",
+            "configKey": "batchJoinSource",
+            "default": "None",
+            "validation": {
+                "enum": [
+                    "Input",
+                    "None"
+                ]
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchMaxConcurrent": {
+            "type": "integer",
+            "description": "Max concurrent transforms per instance",
+            "cliFlag": "--batch-max-concurrent",
+            "cliArgName": "n",
+            "envVar": null,
+            "templateVar": "batchMaxConcurrent",
+            "configKey": "batchMaxConcurrent",
+            "default": 1,
+            "validation": {
+                "min": 1
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "batchMaxPayload": {
+            "type": "integer",
+            "description": "Max payload size in MB, 0-100",
+            "cliFlag": "--batch-max-payload",
+            "cliArgName": "mb",
+            "envVar": null,
+            "templateVar": "batchMaxPayload",
+            "configKey": "batchMaxPayload",
+            "default": 6,
+            "validation": {
+                "min": 0,
+                "max": 100
+            },
+            "phase": "infrastructure",
+            "group": "batch",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "batch-transform"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "hyperpodCluster": {
+            "type": "string",
+            "description": "HyperPod EKS cluster name",
+            "cliFlag": "--hyperpod-cluster",
+            "cliArgName": "name",
+            "envVar": "ML_HYPERPOD_CLUSTER",
+            "templateVar": "hyperPodCluster",
+            "configKey": "hyperpodCluster",
+            "default": null,
+            "validation": {},
+            "phase": "infrastructure",
+            "group": "hyperpod",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "hyperpod-eks"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "HyperPod cluster name?",
+                "type": "input",
+                "when": "deploymentTarget === 'hyperpod-eks'"
+            },
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "hyperpodNamespace": {
+            "type": "string",
+            "description": "Kubernetes namespace",
+            "cliFlag": "--hyperpod-namespace",
+            "cliArgName": "ns",
+            "envVar": "ML_HYPERPOD_NAMESPACE",
+            "templateVar": "hyperPodNamespace",
+            "configKey": "hyperpodNamespace",
+            "default": "default",
+            "validation": {},
+            "phase": "infrastructure",
+            "group": "hyperpod",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "hyperpod-eks"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "hyperpodReplicas": {
+            "type": "integer",
+            "description": "Number of replicas",
+            "cliFlag": "--hyperpod-replicas",
+            "cliArgName": "count",
+            "envVar": null,
+            "templateVar": "hyperPodReplicas",
+            "configKey": "hyperpodReplicas",
+            "default": 1,
+            "validation": {
+                "min": 1
+            },
+            "phase": "infrastructure",
+            "group": "hyperpod",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "hyperpod-eks"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "fsxVolumeHandle": {
+            "type": "string",
+            "description": "FSx for Lustre volume handle",
+            "cliFlag": "--fsx-volume-handle",
+            "cliArgName": "handle",
+            "envVar": "ML_FSX_VOLUME_HANDLE",
+            "templateVar": "fsxVolumeHandle",
+            "configKey": "fsxVolumeHandle",
+            "default": null,
+            "validation": {},
+            "phase": "infrastructure",
+            "group": "hyperpod",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "hyperpod-eks"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.4.0"
+        },
+        "modelEnv": {
+            "type": "string",
+            "description": "Model env var, repeatable (e.g. VLLM_TENSOR_PARALLEL_SIZE=4)",
+            "cliFlag": "--model-env",
+            "cliArgName": "KEY=VALUE",
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "modelEnv",
+            "default": [],
+            "validation": {},
+            "phase": "features",
+            "group": "model",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "env-vars",
+                "inputType": "repeatable-kv"
+            },
+            "prompt": null,
+            "repeatable": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "serverEnv": {
+            "type": "string",
+            "description": "Server env var, repeatable (e.g. SGLANG_MEM_FRACTION=0.9)",
+            "cliFlag": "--server-env",
+            "cliArgName": "KEY=VALUE",
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "serverEnv",
+            "default": [],
+            "validation": {},
+            "phase": "features",
+            "group": "model",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": {
+                "section": "env-vars",
+                "inputType": "repeatable-kv"
+            },
+            "prompt": null,
+            "repeatable": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "includeSample": {
+            "type": "boolean",
+            "description": "Include sample model code",
+            "cliFlag": "--include-sample",
+            "cliArgName": null,
+            "envVar": "ML_INCLUDE_SAMPLE",
+            "templateVar": "includeSampleModel",
+            "configKey": "includeSample",
+            "default": true,
+            "validation": {},
+            "phase": "features",
+            "group": "testing",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "http"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "Include sample model?",
+                "type": "confirm",
+                "when": "architecture === 'http'"
+            },
+            "deprecated": false,
+            "since": "0.1.0"
+        },
+        "includeTesting": {
+            "type": "boolean",
+            "description": "Include test suite",
+            "cliFlag": "--include-testing",
+            "cliArgName": null,
+            "envVar": "ML_INCLUDE_TESTING",
+            "templateVar": "includeTesting",
+            "configKey": "includeTesting",
+            "default": true,
+            "validation": {},
+            "phase": "features",
+            "group": "testing",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": {
+                "message": "Include test suite?",
+                "type": "confirm"
+            },
+            "deprecated": false,
+            "since": "0.1.0"
+        },
+        "testTypes": {
+            "type": "string",
+            "description": "Comma-separated test types",
+            "cliFlag": "--test-types",
+            "cliArgName": "types",
+            "envVar": "ML_TEST_TYPES",
+            "templateVar": "testTypes",
+            "configKey": "testTypes",
+            "default": null,
+            "validation": {},
+            "phase": "features",
+            "group": "testing",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "deprecated": false,
+            "since": "0.1.0"
+        },
+        "smart": {
+            "type": "boolean",
+            "description": "Enable smart mode (live AWS API calls for MCP servers)",
+            "cliFlag": "--smart",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "smart",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "discover": {
+            "type": "boolean",
+            "description": "Enable discovery mode for MCP servers",
+            "cliFlag": "--discover",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "discover",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "noValidate": {
+            "type": "boolean",
+            "description": "Skip parameter validation",
+            "cliFlag": "--no-validate",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "noValidate",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.5.0"
+        },
+        "validateEnvVars": {
+            "type": "boolean",
+            "description": "Validate environment variables against schema",
+            "cliFlag": "--validate-env-vars",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "validateEnvVars",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "validateWithDocker": {
+            "type": "boolean",
+            "description": "Validate that the Dockerfile builds successfully",
+            "cliFlag": "--validate-with-docker",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "validateWithDocker",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.6.0"
+        },
+        "offline": {
+            "type": "boolean",
+            "description": "Run in offline mode (no network calls)",
+            "cliFlag": "--offline",
+            "cliArgName": null,
+            "envVar": null,
+            "templateVar": null,
+            "configKey": "offline",
+            "default": false,
+            "validation": {},
+            "phase": "project",
+            "group": "project",
+            "appliesTo": {
+                "deploymentTargets": [
+                    "*"
+                ],
+                "architectures": [
+                    "*"
+                ]
+            },
+            "widget": null,
+            "prompt": null,
+            "cliBehavior": true,
+            "deprecated": false,
+            "since": "0.6.0"
+        }
+    }
+}