npm - @aws/ml-container-creator - Versions diffs - 0.2.1 → 0.2.3 - Mend

@aws/ml-container-creator 0.2.1 → 0.2.3

This diff shows the contents of publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (36)

package/bin/cli.js +88 -86
package/config/bootstrap-stack.json +211 -0
package/config/parameter-schema.json +88 -0
package/infra/ci-harness/bin/ci-harness.ts +26 -0
package/infra/ci-harness/buildspec.yml +352 -0
package/infra/ci-harness/cdk.json +27 -0
package/infra/ci-harness/lambda/scanner/index.ts +199 -0
package/infra/ci-harness/lib/ci-harness-stack.ts +609 -0
package/infra/ci-harness/package-lock.json +3979 -0
package/infra/ci-harness/package.json +32 -0
package/infra/ci-harness/tsconfig.json +38 -0
package/package.json +13 -3
package/src/app.js +318 -318
package/src/copy-tpl.js +19 -19
package/src/lib/asset-manager.js +74 -74
package/src/lib/aws-profile-parser.js +45 -45
package/src/lib/bootstrap-command-handler.js +560 -547
package/src/lib/bootstrap-config.js +45 -45
package/src/lib/ci-register-helpers.js +19 -19
package/src/lib/ci-report-helpers.js +37 -37
package/src/lib/ci-stage-helpers.js +49 -49
package/src/lib/comment-generator.js +4 -4
package/src/lib/config-manager.js +105 -105
package/src/lib/deployment-config-resolver.js +10 -10
package/src/lib/deployment-registry.js +153 -153
package/src/lib/engine-prefix-resolver.js +8 -8
package/src/lib/key-value-parser.js +6 -6
package/src/lib/manifest-cli.js +108 -108
package/src/lib/prompt-runner.js +224 -224
package/src/lib/prompts.js +121 -121
package/src/lib/registry-command-handler.js +174 -174
package/src/lib/registry-loader.js +52 -52
package/src/lib/sensitive-redactor.js +9 -9
package/src/lib/template-engine.js +1 -1
package/src/lib/template-manager.js +62 -62
package/src/prompt-adapter.js +18 -18

package/src/lib/prompts.js CHANGED Viewed

@@ -35,7 +35,7 @@ function loadInstanceTypeRegistry() {
                     ? entry.accelerator || entry.hardware
                     : 'None',
                 useCase: entry.notes || entry.tags?.join(', ') || '',
-                category: entry.category || 'cpu',
+                category: entry.category || 'cpu'
             };
         }
         return registry;
@@ -192,8 +192,8 @@ const enginePrompts = [
             { name: 'TensorFlow', value: 'tensorflow' }
         ],
         when: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            return architecture === 'http'
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            return architecture === 'http';
         }
     }
 ];
@@ -245,75 +245,75 @@ const modelFormatPrompts = [
         message: 'In which format is your model serialized?',
         choices: (answers) => {
             // Derive architecture from deploymentConfig
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // For http architecture, use engine to determine formats
             if (architecture === 'http') {
-                const engine = answers.engine
+                const engine = answers.engine;
                 const formatMap = {
                     'xgboost': ['json', 'model', 'ubj'],
                     'sklearn': ['pkl', 'joblib'],
                     'tensorflow': ['keras', 'h5', 'SavedModel']
-                }
-                return formatMap[engine] || []
+                };
+                return formatMap[engine] || [];
             }
             // For triton architecture, use backend-specific formats
             if (architecture === 'triton') {
                 // FIL backend has multiple format choices
                 if (backend === 'fil') {
-                    return ['xgboost_json', 'xgboost_ubj', 'lightgbm_txt']
+                    return ['xgboost_json', 'xgboost_ubj', 'lightgbm_txt'];
                 }
                 // Python backend has multiple format choices
                 if (backend === 'python') {
-                    return ['pkl', 'joblib', 'custom']
+                    return ['pkl', 'joblib', 'custom'];
                 }
                 // Other Triton backends have auto-set formats (handled in when clause)
-                return []
+                return [];
             }
             // Legacy support for old format (should not be reached with new configs)
-            const framework = answers.framework || architecture
+            const framework = answers.framework || architecture;
             const formatMap = {
                 'xgboost': ['json', 'model', 'ubj'],
                 'sklearn': ['pkl', 'joblib'],
                 'tensorflow': ['keras', 'h5', 'SavedModel']
-            }
-            return formatMap[framework] || []
+            };
+            return formatMap[framework] || [];
         },
         when: answers => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // Skip for transformers (they use HF Hub)
             if (architecture === 'transformers') {
-                return false
+                return false;
             }
             // Skip for diffusors (they use HF Hub)
             if (architecture === 'diffusors') {
-                return false
+                return false;
             }
             // For http architecture, always show
             if (architecture === 'http') {
-                return true
+                return true;
             }
             // For triton architecture, only show for backends with multiple format choices
             if (architecture === 'triton') {
                 // FIL and Python backends have multiple format choices
                 if (backend === 'fil' || backend === 'python') {
-                    return true
+                    return true;
                 }
                 // Other backends have auto-set formats
-                return false
+                return false;
             }
             // Legacy support
-            const framework = answers.framework || architecture
-            return framework !== 'transformers'
+            const framework = answers.framework || architecture;
+            return framework !== 'transformers';
         }
     },
     {
@@ -323,55 +323,55 @@ const modelFormatPrompts = [
         choices: (answers) => {
             // Use MCP model-picker choices when available
             if (answers._mcpModelChoices && answers._mcpModelChoices.length > 0) {
-                return [...answers._mcpModelChoices, 'Custom (enter manually)']
+                return [...answers._mcpModelChoices, 'Custom (enter manually)'];
             }
             // Fallback to hardcoded defaults based on architecture
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
             if (architecture === 'diffusors') {
                 return [
                     'stabilityai/stable-diffusion-3.5-medium',
                     'black-forest-labs/FLUX.1-schnell',
                     'black-forest-labs/FLUX.1-dev',
                     'Custom (enter manually)'
-                ]
+                ];
             }
             return [
                 'openai/gpt-oss-20b',
                 'meta-llama/Llama-3.2-3B-Instruct',
                 'meta-llama/Llama-3.2-1B-Instruct',
                 'Custom (enter manually)'
-            ]
+            ];
         },
         default: (answers) => {
             if (answers._mcpModelChoices && answers._mcpModelChoices.length > 0) {
-                return answers._mcpModelChoices[0]
+                return answers._mcpModelChoices[0];
             }
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
             if (architecture === 'diffusors') {
-                return 'stabilityai/stable-diffusion-3.5-medium'
+                return 'stabilityai/stable-diffusion-3.5-medium';
             }
-            return 'openai/gpt-oss-20b'
+            return 'openai/gpt-oss-20b';
         },
         when: answers => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // Show for transformers architecture
             if (architecture === 'transformers') {
-                return true
+                return true;
             }
             // Show for diffusors architecture (reuse HuggingFace model selection)
             if (architecture === 'diffusors') {
-                return true
+                return true;
             }
             // Show for Triton LLM backends (vllm, tensorrtllm)
             if (architecture === 'triton' && (backend === 'vllm' || backend === 'tensorrtllm')) {
-                return true
+                return true;
             }
-            return false
+            return false;
         }
     },
     {
@@ -380,34 +380,34 @@ const modelFormatPrompts = [
         message: 'Enter the model path:',
         validate: (input) => {
             if (!input || input.trim() === '') {
-                return 'Model name is required'
+                return 'Model name is required';
             }
             // Basic validation - must contain a slash (org/model, hub/model, s3://path, etc.)
             if (!input.includes('/')) {
-                return 'Please use the full model path (e.g., microsoft/DialoGPT-medium, jumpstart-hub://my-hub/my-model)'
+                return 'Please use the full model path (e.g., microsoft/DialoGPT-medium, jumpstart-hub://my-hub/my-model)';
             }
-            return true
+            return true;
         },
         when: answers => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // Show for transformers with custom model selection
             if (architecture === 'transformers' && answers.modelName === 'Custom (enter manually)') {
-                return true
+                return true;
             }
             // Show for diffusors with custom model selection
             if (architecture === 'diffusors' && answers.modelName === 'Custom (enter manually)') {
-                return true
+                return true;
             }
             // Show for Triton LLM backends with custom model selection
             if (architecture === 'triton' && (backend === 'vllm' || backend === 'tensorrtllm') && answers.modelName === 'Custom (enter manually)') {
-                return true
+                return true;
             }
-            return false
+            return false;
         }
     }
 ];
@@ -433,8 +433,8 @@ const modelLoadStrategyPrompts = [
         ],
         default: 'runtime',
         when: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            return architecture === 'transformers' || architecture === 'diffusors'
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            return architecture === 'transformers' || architecture === 'diffusors';
         }
     }
 ];
@@ -476,58 +476,58 @@ const hfTokenPrompts = [
         name: 'hfToken',
         message: 'HuggingFace token (enter token, "$HF_TOKEN" for env var, or leave empty):',
         when: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // Prompt for transformers architecture
-            const isTransformers = architecture === 'transformers'
+            const isTransformers = architecture === 'transformers';
             // Prompt for diffusors architecture (uses HuggingFace Hub)
-            const isDiffusors = architecture === 'diffusors'
+            const isDiffusors = architecture === 'diffusors';
             // Prompt for Triton LLM backends (vllm, tensorrtllm)
             // Requirements: 9.1, 9.2
-            const isTritonLlm = architecture === 'triton' && (backend === 'vllm' || backend === 'tensorrtllm')
+            const isTritonLlm = architecture === 'triton' && (backend === 'vllm' || backend === 'tensorrtllm');
             if (!isTransformers && !isDiffusors && !isTritonLlm) {
-                return false
+                return false;
             }
             // Skip HF token prompt for non-HuggingFace model sources
             // (S3, JumpStart, Private Hub, Registry models don't need HF auth)
-            const modelSource = answers.modelSource
+            const modelSource = answers.modelSource;
             if (modelSource && modelSource !== 'huggingface') {
-                return false
+                return false;
             }
             // Display security warning before prompting
-            console.log('\n🔐 HuggingFace Authentication')
-            console.log('   Many models (e.g. Llama, Mistral) are gated and require a token.')
-            console.log('⚠️  Security Note: The token will be baked into the Docker image.')
-            console.log('   Anyone with access to the image can extract the token using \'docker inspect\'.')
-            console.log('   For CI/CD pipelines, use "$HF_TOKEN" to reference an environment variable.')
-            console.log('   This keeps the token out of the image and allows rotation without rebuilding.\n')
+            console.log('\n🔐 HuggingFace Authentication');
+            console.log('   Many models (e.g. Llama, Mistral) are gated and require a token.');
+            console.log('⚠️  Security Note: The token will be baked into the Docker image.');
+            console.log('   Anyone with access to the image can extract the token using \'docker inspect\'.');
+            console.log('   For CI/CD pipelines, use "$HF_TOKEN" to reference an environment variable.');
+            console.log('   This keeps the token out of the image and allows rotation without rebuilding.\n');
-            return true
+            return true;
         },
         validate: (input) => {
             // Empty is valid (not all models require auth)
             if (!input || input.trim() === '') {
-                return true
+                return true;
             }
             // $HF_TOKEN reference is valid
             if (input.trim() === '$HF_TOKEN') {
-                return true
+                return true;
             }
             // Direct token should start with hf_ (warning only, not blocking)
             if (!input.startsWith('hf_')) {
-                console.warn('\n⚠️  Warning: HuggingFace tokens typically start with "hf_"')
-                console.warn('   If this is intentional, you can ignore this warning.')
+                console.warn('\n⚠️  Warning: HuggingFace tokens typically start with "hf_"');
+                console.warn('   If this is intentional, you can ignore this warning.');
             }
-            return true // Always return true (non-blocking validation)
+            return true; // Always return true (non-blocking validation)
         }
     }
 ];
@@ -538,42 +538,42 @@ const ngcApiKeyPrompts = [
         name: 'ngcApiKey',
         message: 'NVIDIA NGC API key (enter key, "$NGC_API_KEY" for env var, or leave empty):',
         when: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // Never prompt for NGC key for Triton configs (public images)
             // Requirements: 9.2
             if (architecture === 'triton') {
-                return false
+                return false;
             }
             // Never prompt for NGC key for diffusors configs (public Docker Hub images)
             if (architecture === 'diffusors') {
-                return false
+                return false;
             }
             // Only prompt for transformers-tensorrt-llm
             if (architecture === 'transformers' && backend === 'tensorrt-llm') {
-                console.log('\n🔐 NVIDIA NGC Authentication')
-                console.log('   TensorRT-LLM base images are hosted on NVIDIA NGC and require an API key.')
-                console.log('   1. Create account at: https://ngc.nvidia.com/')
-                console.log('   2. Generate API key in account settings')
-                console.log('   For CI/CD pipelines, use "$NGC_API_KEY" to reference an environment variable.\n')
-                return true
+                console.log('\n🔐 NVIDIA NGC Authentication');
+                console.log('   TensorRT-LLM base images are hosted on NVIDIA NGC and require an API key.');
+                console.log('   1. Create account at: https://ngc.nvidia.com/');
+                console.log('   2. Generate API key in account settings');
+                console.log('   For CI/CD pipelines, use "$NGC_API_KEY" to reference an environment variable.\n');
+                return true;
             }
-            return false
+            return false;
         },
         validate: (input) => {
             if (!input || input.trim() === '') {
-                return true
+                return true;
             }
             if (input.trim() === '$NGC_API_KEY') {
-                return true
+                return true;
             }
-            return true
+            return true;
         }
     }
 ];
@@ -585,31 +585,31 @@ const modulePrompts = [
         message: 'Include sample Abalone classifier?',
         default: false,
         when: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // Never for transformers
             if (architecture === 'transformers') {
-                return false
+                return false;
             }
             // Never for diffusors (diffusion models cannot be trained inline)
             if (architecture === 'diffusors') {
-                return false
+                return false;
             }
             // For Triton, check if backend supports sample model
             if (architecture === 'triton') {
                 // Triton LLM backends don't support sample model
                 if (backend === 'vllm' || backend === 'tensorrtllm' || backend === 'pytorch') {
-                    return false
+                    return false;
                 }
                 // Other Triton backends support sample model
-                return true
+                return true;
             }
             // For http architecture, always show
-            return true
+            return true;
         }
     },
     {
@@ -617,31 +617,31 @@ const modulePrompts = [
         name: 'testTypes',
         message: 'Test type?',
         choices: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             // Transformers and Triton LLM backends only support hosted endpoint tests
             if (architecture === 'transformers') {
-                return ['hosted-model-endpoint']
+                return ['hosted-model-endpoint'];
             }
             if (architecture === 'triton' && (backend === 'vllm' || backend === 'tensorrtllm')) {
-                return ['hosted-model-endpoint']
+                return ['hosted-model-endpoint'];
             }
-            return ['local-model-cli', 'local-model-server', 'hosted-model-endpoint']
+            return ['local-model-cli', 'local-model-server', 'hosted-model-endpoint'];
         },
         default: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
-            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-')
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
+            const backend = answers.backend || answers.deploymentConfig?.split('-').slice(1).join('-');
             if (architecture === 'transformers') {
-                return ['hosted-model-endpoint']
+                return ['hosted-model-endpoint'];
             }
             if (architecture === 'triton' && (backend === 'vllm' || backend === 'tensorrtllm')) {
-                return ['hosted-model-endpoint']
+                return ['hosted-model-endpoint'];
             }
-            return ['local-model-cli', 'local-model-server', 'hosted-model-endpoint']
+            return ['local-model-cli', 'local-model-server', 'hosted-model-endpoint'];
         }
     }
 ];
@@ -662,13 +662,13 @@ const infraRegionAndTargetPrompts = [
         message: 'Target AWS region?',
         choices: (answers) => {
             // If a bootstrap profile set a region, include it in choices
-            const bootstrapRegion = answers._bootstrapRegion
-            const choices = ['us-east-1']
+            const bootstrapRegion = answers._bootstrapRegion;
+            const choices = ['us-east-1'];
             if (bootstrapRegion && bootstrapRegion !== 'us-east-1') {
-                choices.unshift({ name: `${bootstrapRegion} (from bootstrap profile)`, value: bootstrapRegion })
+                choices.unshift({ name: `${bootstrapRegion} (from bootstrap profile)`, value: bootstrapRegion });
             }
-            choices.push({ name: 'Custom...', value: 'custom' })
-            return choices
+            choices.push({ name: 'Custom...', value: 'custom' });
+            return choices;
         },
         default: (answers) => answers._bootstrapRegion || 'us-east-1'
     },
@@ -1045,16 +1045,16 @@ const destinationPrompts = [
  */
 function formatImageChoices(entries, isTransformer) {
     return entries.map(entry => {
-        const cuda = entry.labels.cuda_version || '-'
-        const python = entry.labels.python_version || '-'
-        const date = entry.created.slice(0, 10)
+        const cuda = entry.labels.cuda_version || '-';
+        const python = entry.labels.python_version || '-';
+        const date = entry.created.slice(0, 10);
         const name = isTransformer
             ? `${entry.repository.padEnd(30)} ${entry.tag.padEnd(16)} ${entry.architecture.padEnd(7)} ${cuda.padEnd(6)} ${python.padEnd(8)} ${date}`
-            : `${entry.repository.padEnd(30)} ${entry.tag.padEnd(16)} ${entry.architecture.padEnd(7)} ${python.padEnd(8)} ${date}`
+            : `${entry.repository.padEnd(30)} ${entry.tag.padEnd(16)} ${entry.architecture.padEnd(7)} ${python.padEnd(8)} ${date}`;
-        return { name, value: entry.image }
-    })
+        return { name, value: entry.image };
+    });
 }
 /**
@@ -1068,12 +1068,12 @@ const baseImageSearchPrompts = [
         message: '🔌 Search for a Python base image (e.g. "3.11", "3.10", or leave empty for all):',
         default: '',
         when: (answers) => {
-            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0]
+            const architecture = answers.architecture || answers.deploymentConfig?.split('-')[0];
             // Skip for transformers (uses model-server images) and triton (uses NGC images)
-            return architecture !== 'transformers' && architecture !== 'triton'
+            return architecture !== 'transformers' && architecture !== 'triton';
         }
     }
-]
+];
 /**
  * Base image selection prompt (all frameworks)
@@ -1085,11 +1085,11 @@ const baseImagePrompts = [
         name: 'baseImage',
         message: 'Select base container image:',
         choices: (answers) => {
-            const mcpChoices = answers._mcpBaseImageChoices || []
-            return [...mcpChoices, { name: 'Custom (enter your own)', value: 'custom' }]
+            const mcpChoices = answers._mcpBaseImageChoices || [];
+            return [...mcpChoices, { name: 'Custom (enter your own)', value: 'custom' }];
         },
         when: (answers) => {
-            return answers._mcpBaseImageChoices && answers._mcpBaseImageChoices.length > 0
+            return answers._mcpBaseImageChoices && answers._mcpBaseImageChoices.length > 0;
         }
     },
     {
@@ -1098,17 +1098,17 @@ const baseImagePrompts = [
         message: 'Enter custom base container image (e.g. myrepo/myimage:v1):',
         validate: (input) => {
             if (!input || input.trim() === '') {
-                return 'Base image is required'
+                return 'Base image is required';
             }
-            const pattern = /^[a-zA-Z0-9][a-zA-Z0-9._\-\/]*(:[a-zA-Z0-9._\-]+)?$/
+            const pattern = /^[a-zA-Z0-9][a-zA-Z0-9._\-/]*(:[a-zA-Z0-9._-]+)?$/;
             if (!pattern.test(input.trim())) {
-                return 'Invalid image format. Expected: [registry/]repository[:tag]'
+                return 'Invalid image format. Expected: [registry/]repository[:tag]';
             }
-            return true
+            return true;
         },
         when: (answers) => answers.baseImage === 'custom'
     }
-]
+];
 export {
     deploymentConfigPrompts,