npm - @aws/ml-container-creator - Versions diffs - 0.10.0 → 0.12.1 - Mend

@aws/ml-container-creator 0.10.0 → 0.12.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (90)

package/LICENSE-THIRD-PARTY +9304 -0
package/bin/cli.js +2 -0
package/config/bootstrap-e2e-stack.json +341 -0
package/config/bootstrap-stack.json +40 -3
package/config/parameter-schema-v2.json +33 -22
package/config/tune-catalog.json +1781 -0
package/infra/ci-harness/buildspec.yml +1 -0
package/infra/ci-harness/lambda/path-prover/brain.ts +306 -0
package/infra/ci-harness/lambda/path-prover/write-results.ts +152 -0
package/infra/ci-harness/lib/ci-harness-stack.ts +851 -7
package/infra/ci-harness/state-machines/path-prover.asl.json +496 -0
package/package.json +53 -67
package/servers/base-image-picker/index.js +121 -121
package/servers/e2e-status/index.js +297 -0
package/servers/e2e-status/manifest.json +14 -0
package/servers/e2e-status/package.json +15 -0
package/servers/endpoint-picker/LICENSE +202 -0
package/servers/endpoint-picker/index.js +536 -0
package/servers/endpoint-picker/manifest.json +14 -0
package/servers/endpoint-picker/package.json +18 -0
package/servers/hyperpod-cluster-picker/index.js +125 -125
package/servers/instance-sizer/index.js +166 -153
package/servers/instance-sizer/lib/instance-ranker.js +120 -76
package/servers/instance-sizer/lib/model-resolver.js +61 -61
package/servers/instance-sizer/lib/quota-resolver.js +113 -113
package/servers/instance-sizer/lib/vram-estimator.js +31 -31
package/servers/lib/bedrock-client.js +38 -38
package/servers/lib/catalogs/instances.json +27 -0
package/servers/lib/catalogs/model-servers.json +201 -3
package/servers/lib/custom-validators.js +13 -13
package/servers/lib/dynamic-resolver.js +4 -4
package/servers/marketplace-picker/index.js +342 -0
package/servers/marketplace-picker/manifest.json +14 -0
package/servers/marketplace-picker/package.json +18 -0
package/servers/model-picker/index.js +382 -382
package/servers/region-picker/index.js +56 -56
package/servers/workload-picker/LICENSE +202 -0
package/servers/workload-picker/catalogs/workload-profiles.json +67 -0
package/servers/workload-picker/index.js +171 -0
package/servers/workload-picker/manifest.json +16 -0
package/servers/workload-picker/package.json +16 -0
package/src/app.js +12 -3
package/src/lib/bootstrap-command-handler.js +609 -15
package/src/lib/bootstrap-config.js +36 -0
package/src/lib/bootstrap-profile-manager.js +48 -41
package/src/lib/ci-register-helpers.js +74 -0
package/src/lib/config-loader.js +3 -0
package/src/lib/config-manager.js +7 -0
package/src/lib/config-validator.js +1 -1
package/src/lib/cuda-resolver.js +17 -8
package/src/lib/generated/cli-options.js +319 -314
package/src/lib/generated/parameter-matrix.js +672 -661
package/src/lib/generated/validation-rules.js +76 -72
package/src/lib/path-prover-brain.js +664 -0
package/src/lib/prompts/infrastructure-prompts.js +2 -2
package/src/lib/prompts/model-prompts.js +6 -0
package/src/lib/prompts/project-prompts.js +12 -0
package/src/lib/secrets-prompt-runner.js +4 -0
package/src/lib/template-manager.js +1 -1
package/src/lib/template-variable-resolver.js +87 -1
package/src/lib/tune-catalog-validator.js +37 -4
package/templates/Dockerfile +9 -0
package/templates/code/adapter_sidecar.py +444 -0
package/templates/code/serve +6 -0
package/templates/code/serve.d/vllm.ejs +1 -1
package/templates/do/.benchmark_writer.py +1476 -0
package/templates/do/.tune_helper.py +982 -57
package/templates/do/__pycache__/.benchmark_writer.cpython-312.pyc +0 -0
package/templates/do/adapter +154 -0
package/templates/do/benchmark +639 -85
package/templates/do/build +5 -0
package/templates/do/clean.d/async-inference.ejs +5 -0
package/templates/do/clean.d/batch-transform.ejs +5 -0
package/templates/do/clean.d/hyperpod-eks.ejs +5 -0
package/templates/do/clean.d/managed-inference.ejs +5 -0
package/templates/do/config +115 -45
package/templates/do/deploy.d/async-inference.ejs +30 -3
package/templates/do/deploy.d/batch-transform.ejs +29 -3
package/templates/do/deploy.d/hyperpod-eks.ejs +4 -0
package/templates/do/deploy.d/managed-inference.ejs +216 -14
package/templates/do/lib/endpoint-config.sh +1 -1
package/templates/do/lib/profile.sh +44 -0
package/templates/do/optimize +106 -37
package/templates/do/push +5 -0
package/templates/do/register +94 -0
package/templates/do/stage +567 -0
package/templates/do/submit +7 -0
package/templates/do/test +14 -0
package/templates/do/tune +382 -59
package/templates/do/validate +44 -4

package/src/lib/generated/validation-rules.js CHANGED

@@ -1,202 +1,206 @@
 // AUTO-GENERATED by scripts/codegen-validator.js — DO NOT EDIT
 // Source: config/parameter-schema-v2.json
-// Generated: 2026-05-23T12:02:19.548Z
+// Generated: 2026-06-12T22:03:00.468Z
 /**
  * Validation rules derived from parameter-schema-v2.json.
  * Each key maps to a function that returns null (valid) or an error string.
  */
 export const validationRules = {
-    "projectName": (value) => {
-        if (value.length < 2) return `projectName must be at least 2 characters`;
-        if (value.length > 63) return `projectName must be at most 63 characters`;
-        if (!new RegExp("^[a-z0-9][a-z0-9-]*[a-z0-9]$").test(value)) return `projectName does not match required pattern`;
+    'projectName': (value) => {
+        if (value.length < 2) return 'projectName must be at least 2 characters';
+        if (value.length > 63) return 'projectName must be at most 63 characters';
+        if (!new RegExp('^[a-z0-9][a-z0-9-]*[a-z0-9]$').test(value)) return 'projectName does not match required pattern';
         return null;
     },
-    "deploymentConfig": (value) => {
-        if (!["http-flask","http-fastapi","transformers-vllm","transformers-sglang","transformers-tensorrt-llm","transformers-lmi","transformers-djl","triton-fil","triton-onnxruntime","triton-tensorflow","triton-pytorch","triton-vllm","triton-tensorrtllm","triton-python","diffusors-vllm-omni","marketplace"].includes(value)) return `Invalid value "${value}" for deploymentConfig. Valid: http-flask, http-fastapi, transformers-vllm, transformers-sglang, transformers-tensorrt-llm, transformers-lmi, transformers-djl, triton-fil, triton-onnxruntime, triton-tensorflow, triton-pytorch, triton-vllm, triton-tensorrtllm, triton-python, diffusors-vllm-omni, marketplace`;
+    'deploymentConfig': (value) => {
+        if (!['http-flask','http-fastapi','transformers-vllm','transformers-sglang','transformers-tensorrt-llm','transformers-lmi','transformers-djl','triton-fil','triton-onnxruntime','triton-tensorflow','triton-pytorch','triton-vllm','triton-tensorrtllm','triton-python','diffusors-vllm-omni','marketplace'].includes(value)) return `Invalid value "${value}" for deploymentConfig. Valid: http-flask, http-fastapi, transformers-vllm, transformers-sglang, transformers-tensorrt-llm, transformers-lmi, transformers-djl, triton-fil, triton-onnxruntime, triton-tensorflow, triton-pytorch, triton-vllm, triton-tensorrtllm, triton-python, diffusors-vllm-omni, marketplace`;
         return null;
     },
-    "modelName": (value) => {
-        if (value.length < 1) return `modelName must be at least 1 characters`;
+    'modelName': (value) => {
+        if (value.length < 1) return 'modelName must be at least 1 characters';
         return null;
     },
-    "deploymentTarget": (value) => {
-        if (!["managed-inference","realtime-inference","async-inference","batch-transform","hyperpod-eks"].includes(value)) return `Invalid value "${value}" for deploymentTarget. Valid: managed-inference, realtime-inference, async-inference, batch-transform, hyperpod-eks`;
+    'deploymentTarget': (value) => {
+        if (!['managed-inference','realtime-inference','async-inference','batch-transform','hyperpod-eks'].includes(value)) return `Invalid value "${value}" for deploymentTarget. Valid: managed-inference, realtime-inference, async-inference, batch-transform, hyperpod-eks`;
         return null;
     },
-    "instanceType": (value) => {
-        if (!new RegExp("^ml\\.[a-z0-9]+\\.[a-z0-9]+$").test(value)) return `instanceType does not match required pattern`;
+    'instanceType': (value) => {
+        if (!new RegExp('^ml\\.[a-z0-9-]+\\.[a-z0-9]+$').test(value)) return 'instanceType does not match required pattern';
         return null;
     },
-    "icGpuCount": (value) => {
+    'icGpuCount': (value) => {
         if (value < 0) return `icGpuCount must be >= 0, got ${value}`;
         if (value > 8) return `icGpuCount must be <= 8, got ${value}`;
         return null;
     },
-    "icCopyCount": (value) => {
+    'icCopyCount': (value) => {
         if (value < 0) return `icCopyCount must be >= 0, got ${value}`;
         if (value > 100) return `icCopyCount must be <= 100, got ${value}`;
         return null;
     },
-    "icMemorySize": (value) => {
+    'icMemorySize': (value) => {
         if (value < 128) return `icMemorySize must be >= 128, got ${value}`;
         if (value > 3145728) return `icMemorySize must be <= 3145728, got ${value}`;
         return null;
     },
-    "maxLoras": (value) => {
+    'maxLoras': (value) => {
         if (value < 1) return `maxLoras must be >= 1, got ${value}`;
         if (value > 256) return `maxLoras must be <= 256, got ${value}`;
         return null;
     },
-    "maxLoraRank": (value) => {
+    'maxLoraRank': (value) => {
         if (value < 8) return `maxLoraRank must be >= 8, got ${value}`;
         if (value > 512) return `maxLoraRank must be <= 512, got ${value}`;
         return null;
     },
-    "benchmarkConcurrency": (value) => {
+    'benchmarkConcurrency': (value) => {
         if (value < 1) return `benchmarkConcurrency must be >= 1, got ${value}`;
         if (value > 1000) return `benchmarkConcurrency must be <= 1000, got ${value}`;
         return null;
     },
-    "benchmarkInputTokens": (value) => {
+    'benchmarkInputTokens': (value) => {
         if (value < 1) return `benchmarkInputTokens must be >= 1, got ${value}`;
         if (value > 128000) return `benchmarkInputTokens must be <= 128000, got ${value}`;
         return null;
     },
-    "benchmarkOutputTokens": (value) => {
+    'benchmarkOutputTokens': (value) => {
         if (value < 1) return `benchmarkOutputTokens must be >= 1, got ${value}`;
         if (value > 128000) return `benchmarkOutputTokens must be <= 128000, got ${value}`;
         return null;
     },
-    "benchmarkRequestCount": (value) => {
+    'benchmarkRequestCount': (value) => {
         if (value < 1) return `benchmarkRequestCount must be >= 1, got ${value}`;
         return null;
     },
-    "benchmarkS3OutputPath": (value) => {
-        if (!new RegExp("^s3://").test(value)) return `benchmarkS3OutputPath does not match required pattern`;
+    'benchmarkS3OutputPath': (value) => {
+        if (!new RegExp('^s3://').test(value)) return 'benchmarkS3OutputPath does not match required pattern';
         return null;
     },
-    "framework": (value) => {
-        if (!["sklearn","xgboost","tensorflow","transformers"].includes(value)) return `Invalid value "${value}" for framework. Valid: sklearn, xgboost, tensorflow, transformers`;
+    'framework': (value) => {
+        if (!['sklearn','xgboost','tensorflow','transformers'].includes(value)) return `Invalid value "${value}" for framework. Valid: sklearn, xgboost, tensorflow, transformers`;
         return null;
     },
-    "modelFormat": (value) => {
-        if (!["pkl","joblib","json","model","ubj","keras","h5","SavedModel"].includes(value)) return `Invalid value "${value}" for modelFormat. Valid: pkl, joblib, json, model, ubj, keras, h5, SavedModel`;
+    'modelFormat': (value) => {
+        if (!['pkl','joblib','json','model','ubj','keras','h5','SavedModel'].includes(value)) return `Invalid value "${value}" for modelFormat. Valid: pkl, joblib, json, model, ubj, keras, h5, SavedModel`;
         return null;
     },
-    "modelServer": (value) => {
-        if (!["flask","fastapi","vllm","sglang"].includes(value)) return `Invalid value "${value}" for modelServer. Valid: flask, fastapi, vllm, sglang`;
+    'modelServer': (value) => {
+        if (!['flask','fastapi','vllm','sglang'].includes(value)) return `Invalid value "${value}" for modelServer. Valid: flask, fastapi, vllm, sglang`;
         return null;
     },
-    "region": (value) => {
-        if (!new RegExp("^[a-z]{2}-[a-z]+-\\d+$").test(value)) return `region does not match required pattern`;
+    'region': (value) => {
+        if (!new RegExp('^[a-z]{2}-[a-z]+-\\d+$').test(value)) return 'region does not match required pattern';
         return null;
     },
-    "roleArn": (value) => {
-        if (!new RegExp("^arn:aws:iam::").test(value)) return `roleArn does not match required pattern`;
+    'roleArn': (value) => {
+        if (!new RegExp('^arn:aws:iam::').test(value)) return 'roleArn does not match required pattern';
         return null;
     },
-    "buildTarget": (value) => {
-        if (!["codebuild"].includes(value)) return `Invalid value "${value}" for buildTarget. Valid: codebuild`;
+    'buildTarget': (value) => {
+        if (!['codebuild'].includes(value)) return `Invalid value "${value}" for buildTarget. Valid: codebuild`;
         return null;
     },
-    "codebuildComputeType": (value) => {
-        if (!["SMALL","MEDIUM","LARGE","BUILD_GENERAL1_SMALL","BUILD_GENERAL1_MEDIUM","BUILD_GENERAL1_LARGE","BUILD_GENERAL1_2XLARGE"].includes(value)) return `Invalid value "${value}" for codebuildComputeType. Valid: SMALL, MEDIUM, LARGE, BUILD_GENERAL1_SMALL, BUILD_GENERAL1_MEDIUM, BUILD_GENERAL1_LARGE, BUILD_GENERAL1_2XLARGE`;
+    'codebuildComputeType': (value) => {
+        if (!['SMALL','MEDIUM','LARGE','BUILD_GENERAL1_SMALL','BUILD_GENERAL1_MEDIUM','BUILD_GENERAL1_LARGE','BUILD_GENERAL1_2XLARGE'].includes(value)) return `Invalid value "${value}" for codebuildComputeType. Valid: SMALL, MEDIUM, LARGE, BUILD_GENERAL1_SMALL, BUILD_GENERAL1_MEDIUM, BUILD_GENERAL1_LARGE, BUILD_GENERAL1_2XLARGE`;
         return null;
     },
-    "hfTokenArn": (value) => {
-        if (!new RegExp("^arn:aws:secretsmanager:").test(value)) return `hfTokenArn does not match required pattern`;
+    'hfTokenArn': (value) => {
+        if (!new RegExp('^arn:aws:secretsmanager:').test(value)) return 'hfTokenArn does not match required pattern';
         return null;
     },
-    "ngcTokenArn": (value) => {
-        if (!new RegExp("^arn:aws:secretsmanager:").test(value)) return `ngcTokenArn does not match required pattern`;
+    'ngcTokenArn': (value) => {
+        if (!new RegExp('^arn:aws:secretsmanager:').test(value)) return 'ngcTokenArn does not match required pattern';
         return null;
     },
-    "endpointInitialInstanceCount": (value) => {
+    'endpointInitialInstanceCount': (value) => {
         if (value < 1) return `endpointInitialInstanceCount must be >= 1, got ${value}`;
         if (value > 100) return `endpointInitialInstanceCount must be <= 100, got ${value}`;
         return null;
     },
-    "endpointDataCapturePercent": (value) => {
+    'endpointDataCapturePercent': (value) => {
         if (value < 0) return `endpointDataCapturePercent must be >= 0, got ${value}`;
         if (value > 100) return `endpointDataCapturePercent must be <= 100, got ${value}`;
         return null;
     },
-    "endpointVariantName": (value) => {
-        if (!new RegExp("^[a-zA-Z0-9]([\\w-]{0,62}[a-zA-Z0-9])?$").test(value)) return `endpointVariantName does not match required pattern`;
+    'endpointVariantName': (value) => {
+        if (!new RegExp('^[a-zA-Z0-9]([\\w-]{0,62}[a-zA-Z0-9])?$').test(value)) return 'endpointVariantName does not match required pattern';
         return null;
     },
-    "endpointVolumeSize": (value) => {
+    'endpointVolumeSize': (value) => {
         if (value < 1) return `endpointVolumeSize must be >= 1, got ${value}`;
         if (value > 16384) return `endpointVolumeSize must be <= 16384, got ${value}`;
         return null;
     },
-    "icCpuCount": (value) => {
+    'capacityReservationArn': (value) => {
+        if (!new RegExp('^arn:aws:sagemaker:').test(value)) return 'capacityReservationArn does not match required pattern';
+        return null;
+    },
+    'icCpuCount': (value) => {
         if (value < 0.25) return `icCpuCount must be >= 0.25, got ${value}`;
         if (value > 768) return `icCpuCount must be <= 768, got ${value}`;
         return null;
     },
-    "icModelWeight": (value) => {
+    'icModelWeight': (value) => {
         if (value < 0) return `icModelWeight must be >= 0, got ${value}`;
         if (value > 1) return `icModelWeight must be <= 1, got ${value}`;
         return null;
     },
-    "asyncS3OutputPath": (value) => {
-        if (!new RegExp("^s3://").test(value)) return `asyncS3OutputPath does not match required pattern`;
+    'asyncS3OutputPath': (value) => {
+        if (!new RegExp('^s3://').test(value)) return 'asyncS3OutputPath does not match required pattern';
         return null;
     },
-    "asyncSnsSuccessTopic": (value) => {
-        if (!new RegExp("^arn:aws:sns:").test(value)) return `asyncSnsSuccessTopic does not match required pattern`;
+    'asyncSnsSuccessTopic': (value) => {
+        if (!new RegExp('^arn:aws:sns:').test(value)) return 'asyncSnsSuccessTopic does not match required pattern';
         return null;
     },
-    "asyncSnsErrorTopic": (value) => {
-        if (!new RegExp("^arn:aws:sns:").test(value)) return `asyncSnsErrorTopic does not match required pattern`;
+    'asyncSnsErrorTopic': (value) => {
+        if (!new RegExp('^arn:aws:sns:').test(value)) return 'asyncSnsErrorTopic does not match required pattern';
         return null;
     },
-    "asyncMaxConcurrent": (value) => {
+    'asyncMaxConcurrent': (value) => {
         if (value < 1) return `asyncMaxConcurrent must be >= 1, got ${value}`;
         if (value > 100) return `asyncMaxConcurrent must be <= 100, got ${value}`;
         return null;
     },
-    "batchInputPath": (value) => {
-        if (!new RegExp("^s3://").test(value)) return `batchInputPath does not match required pattern`;
+    'batchInputPath': (value) => {
+        if (!new RegExp('^s3://').test(value)) return 'batchInputPath does not match required pattern';
         return null;
     },
-    "batchOutputPath": (value) => {
-        if (!new RegExp("^s3://").test(value)) return `batchOutputPath does not match required pattern`;
+    'batchOutputPath': (value) => {
+        if (!new RegExp('^s3://').test(value)) return 'batchOutputPath does not match required pattern';
         return null;
     },
-    "batchInstanceCount": (value) => {
+    'batchInstanceCount': (value) => {
         if (value < 1) return `batchInstanceCount must be >= 1, got ${value}`;
         if (value > 100) return `batchInstanceCount must be <= 100, got ${value}`;
         return null;
     },
-    "batchSplitType": (value) => {
-        if (!["Line","RecordIO","None"].includes(value)) return `Invalid value "${value}" for batchSplitType. Valid: Line, RecordIO, None`;
+    'batchSplitType': (value) => {
+        if (!['Line','RecordIO','None'].includes(value)) return `Invalid value "${value}" for batchSplitType. Valid: Line, RecordIO, None`;
         return null;
     },
-    "batchStrategy": (value) => {
-        if (!["MultiRecord","SingleRecord"].includes(value)) return `Invalid value "${value}" for batchStrategy. Valid: MultiRecord, SingleRecord`;
+    'batchStrategy': (value) => {
+        if (!['MultiRecord','SingleRecord'].includes(value)) return `Invalid value "${value}" for batchStrategy. Valid: MultiRecord, SingleRecord`;
         return null;
     },
-    "batchJoinSource": (value) => {
-        if (!["Input","None"].includes(value)) return `Invalid value "${value}" for batchJoinSource. Valid: Input, None`;
+    'batchJoinSource': (value) => {
+        if (!['Input','None'].includes(value)) return `Invalid value "${value}" for batchJoinSource. Valid: Input, None`;
         return null;
     },
-    "batchMaxConcurrent": (value) => {
+    'batchMaxConcurrent': (value) => {
         if (value < 1) return `batchMaxConcurrent must be >= 1, got ${value}`;
         return null;
     },
-    "batchMaxPayload": (value) => {
+    'batchMaxPayload': (value) => {
         if (value < 0) return `batchMaxPayload must be >= 0, got ${value}`;
         if (value > 100) return `batchMaxPayload must be <= 100, got ${value}`;
         return null;
     },
-    "hyperpodReplicas": (value) => {
+    'hyperpodReplicas': (value) => {
         if (value < 1) return `hyperpodReplicas must be >= 1, got ${value}`;
         return null;
-    },
+    }
 };
-// 43 parameters have validation rules
+// 44 parameters have validation rules