npm - @aws/ml-container-creator - Versions diffs - 0.8.0 → 0.9.1 - Mend

@aws/ml-container-creator 0.8.0 → 0.9.1

This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

package/LICENSE-THIRD-PARTY +50760 -16218
package/bin/cli.js +31 -137
package/package.json +7 -2
package/servers/lib/catalogs/instances.json +52 -1275
package/servers/lib/catalogs/models.json +0 -132
package/servers/lib/catalogs/popular-diffusors.json +1 -110
package/src/app.js +29 -2
package/src/lib/config-manager.js +17 -0
package/src/lib/generated/cli-options.js +467 -0
package/src/lib/generated/validation-rules.js +202 -0
package/src/lib/mcp-client.js +16 -1
package/src/lib/mcp-command-handler.js +10 -2
package/src/lib/prompt-runner.js +16 -2
package/src/lib/train-config-parser.js +136 -0
package/src/lib/train-config-persistence.js +143 -0
package/src/lib/train-config-validator.js +112 -0
package/src/lib/train-feedback.js +46 -0
package/src/lib/train-idempotency.js +97 -0
package/src/lib/train-request-builder.js +120 -0
package/templates/code/serve +5 -134
package/templates/code/serve.d/lmi.ejs +19 -0
package/templates/code/serve.d/sglang.ejs +47 -0
package/templates/code/serve.d/tensorrt-llm.ejs +53 -0
package/templates/code/serve.d/vllm.ejs +48 -0
package/templates/do/.train_build_request.py +141 -0
package/templates/do/.train_poll_parser.py +135 -0
package/templates/do/.train_status_parser.py +187 -0
package/templates/do/clean +1 -1387
package/templates/do/clean.d/async-inference.ejs +508 -0
package/templates/do/clean.d/batch-transform.ejs +512 -0
package/templates/do/clean.d/hyperpod-eks.ejs +481 -0
package/templates/do/clean.d/managed-inference.ejs +1043 -0
package/templates/do/deploy +1 -1766
package/templates/do/deploy.d/async-inference.ejs +501 -0
package/templates/do/deploy.d/batch-transform.ejs +529 -0
package/templates/do/deploy.d/hyperpod-eks.ejs +339 -0
package/templates/do/deploy.d/managed-inference.ejs +726 -0
package/templates/do/lib/feedback.sh +41 -0
package/templates/do/train +786 -0
package/templates/do/training/config.yaml +140 -0
package/templates/do/training/train.py +463 -0

package/servers/lib/catalogs/models.json CHANGED Viewed

@@ -555,98 +555,6 @@
             "text-generation"
         ]
     },
-    "stabilityai/stable-diffusion-3.5-medium": {
-        "family": "stable-diffusion-3",
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "stable-diffusion"
-        ],
-        "architecture": "StableDiffusion3Pipeline",
-        "profiles": {
-            "default": {
-                "displayName": "SD3.5 Medium",
-                "envVars": {}
-            }
-        },
-        "notes": "Stable Diffusion 3.5 medium model. Supported natively by vLLM-Omni StableDiffusion3Pipeline.",
-        "chatTemplate": null,
-        "frameworkCompatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validationLevel": "experimental",
-        "modelType": "diffusor",
-        "tasks": [
-            "text-to-image"
-        ]
-    },
-    "black-forest-labs/FLUX.1-dev": {
-        "family": "flux",
-        "gated": true,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "flux"
-        ],
-        "architecture": "FluxPipeline",
-        "profiles": {
-            "default": {
-                "displayName": "FLUX.1 Dev",
-                "envVars": {}
-            }
-        },
-        "notes": "FLUX.1-dev high-quality generation model. Uses dual text encoders (CLIP + T5) and FlowMatchEuler scheduler. Requires significant VRAM.",
-        "chatTemplate": null,
-        "frameworkCompatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validationLevel": "experimental",
-        "modelType": "diffusor",
-        "tasks": [
-            "text-to-image"
-        ]
-    },
-    "black-forest-labs/FLUX.1-schnell": {
-        "family": "flux",
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "flux"
-        ],
-        "architecture": "FluxPipeline",
-        "notes": "FLUX.1-schnell fast generation model. Fewer denoising steps for faster inference at slightly lower quality",
-        "chatTemplate": null,
-        "frameworkCompatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validationLevel": "experimental",
-        "modelType": "diffusor",
-        "tasks": [
-            "text-to-image"
-        ]
-    },
-    "Wan-AI/Wan2.1-T2V-14B-Diffusers": {
-        "family": "wan",
-        "gated": false,
-        "tags": [
-            "video-generation",
-            "diffusion",
-            "wan"
-        ],
-        "architecture": "WanPipeline",
-        "notes": "Wan2.1 text-to-video 14B model (diffusers format). Requires multi-GPU instance (ml.g5.12xlarge or larger). Must use the -Diffusers variant — the base Wan2.1-T2V-14B repo lacks model_index.json required by vLLM-Omni",
-        "chatTemplate": null,
-        "frameworkCompatibility": {
-            "vllm-omni": ">=0.16.0"
-        },
-        "validationLevel": "experimental",
-        "modelType": "diffusor",
-        "tasks": [
-            "text-to-video"
-        ]
-    },
     "meta-llama/Llama-3*": {
         "family": "llama-3",
         "gated": true,
@@ -731,45 +639,5 @@
         "tasks": [
             "text-generation"
         ]
-    },
-    "stabilityai/stable-diffusion-*": {
-        "family": "stable-diffusion",
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "stable-diffusion"
-        ],
-        "architecture": null,
-        "notes": "Fallback for Stable Diffusion variants not explicitly listed",
-        "chatTemplate": null,
-        "frameworkCompatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validationLevel": "experimental",
-        "modelType": "diffusor",
-        "tasks": [
-            "text-to-image"
-        ]
-    },
-    "black-forest-labs/FLUX*": {
-        "family": "flux",
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "flux"
-        ],
-        "architecture": null,
-        "notes": "Fallback for FLUX model variants not explicitly listed",
-        "chatTemplate": null,
-        "frameworkCompatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validationLevel": "experimental",
-        "modelType": "diffusor",
-        "tasks": [
-            "text-to-image"
-        ]
     }
 }

package/servers/lib/catalogs/popular-diffusors.json CHANGED Viewed

@@ -1,110 +1 @@
-{
-    "stabilityai/stable-diffusion-3.5-medium": {
-        "family": "stable-diffusion-3",
-        "chat_template": null,
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "stable-diffusion"
-        ],
-        "architecture": "StableDiffusion3Pipeline",
-        "framework_compatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validation_level": "experimental",
-        "profiles": {
-            "default": {
-                "displayName": "SD3.5 Medium",
-                "envVars": {}
-            }
-        },
-        "notes": "Stable Diffusion 3.5 medium model. Supported natively by vLLM-Omni StableDiffusion3Pipeline."
-    },
-    "black-forest-labs/FLUX.1-dev": {
-        "family": "flux",
-        "chat_template": null,
-        "gated": true,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "flux"
-        ],
-        "architecture": "FluxPipeline",
-        "framework_compatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validation_level": "experimental",
-        "profiles": {
-            "default": {
-                "displayName": "FLUX.1 Dev",
-                "envVars": {}
-            }
-        },
-        "notes": "FLUX.1-dev high-quality generation model. Uses dual text encoders (CLIP + T5) and FlowMatchEuler scheduler. Requires significant VRAM."
-    },
-    "black-forest-labs/FLUX.1-schnell": {
-        "family": "flux",
-        "chat_template": null,
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "flux"
-        ],
-        "architecture": "FluxPipeline",
-        "framework_compatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validation_level": "experimental",
-        "notes": "FLUX.1-schnell fast generation model. Fewer denoising steps for faster inference at slightly lower quality"
-    },
-    "Wan-AI/Wan2.1-T2V-14B-Diffusers": {
-        "family": "wan",
-        "chat_template": null,
-        "gated": false,
-        "tags": [
-            "video-generation",
-            "diffusion",
-            "wan"
-        ],
-        "architecture": "WanPipeline",
-        "framework_compatibility": {
-            "vllm-omni": ">=0.16.0"
-        },
-        "validation_level": "experimental",
-        "notes": "Wan2.1 text-to-video 14B model (diffusers format). Requires multi-GPU instance (ml.g5.12xlarge or larger). Must use the -Diffusers variant — the base Wan2.1-T2V-14B repo lacks model_index.json required by vLLM-Omni"
-    },
-    "stabilityai/stable-diffusion-*": {
-        "family": "stable-diffusion",
-        "chat_template": null,
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "stable-diffusion"
-        ],
-        "architecture": null,
-        "framework_compatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validation_level": "experimental",
-        "notes": "Fallback for Stable Diffusion variants not explicitly listed"
-    },
-    "black-forest-labs/FLUX*": {
-        "family": "flux",
-        "chat_template": null,
-        "gated": false,
-        "tags": [
-            "image-generation",
-            "diffusion",
-            "flux"
-        ],
-        "architecture": null,
-        "framework_compatibility": {
-            "vllm-omni": ">=0.14.0"
-        },
-        "validation_level": "experimental",
-        "notes": "Fallback for FLUX model variants not explicitly listed"
-    }
-}
+{}

package/src/app.js CHANGED Viewed

@@ -296,6 +296,11 @@ export async function writeProject(templateDir, destDir, answers, registryConfig
     // Build ignore patterns
     const ignorePatterns = [];
+    // EJS partials — included by templates at render time, not copied to output
+    ignorePatterns.push('**/serve.d/**');
+    ignorePatterns.push('**/deploy.d/**');
+    ignorePatterns.push('**/clean.d/**');
     if (answers.deploymentTarget !== 'hyperpod-eks') {
         ignorePatterns.push('**/hyperpod/**');
     }
@@ -349,11 +354,27 @@ export async function writeProject(templateDir, destDir, answers, registryConfig
     }
     // Exclude tune files when framework is NOT transformers OR deploymentTarget is batch-transform
-    if (architecture !== 'transformers' || answers.deploymentTarget === 'batch-transform') {
+    const tuneIncluded = architecture === 'transformers' && answers.deploymentTarget !== 'batch-transform';
+    if (!tuneIncluded) {
         ignorePatterns.push('**/do/tune');
         ignorePatterns.push('**/do/.tune_helper.py');
     }
+    // Exclude train files when deploymentTarget is batch-transform
+    const trainIncluded = answers.deploymentTarget !== 'batch-transform';
+    if (!trainIncluded) {
+        ignorePatterns.push('**/do/train');
+        ignorePatterns.push('**/do/.train_build_request.py');
+        ignorePatterns.push('**/do/.train_status_parser.py');
+        ignorePatterns.push('**/do/.train_poll_parser.py');
+        ignorePatterns.push('**/do/training/**');
+    }
+    // Exclude feedback.sh when neither tune nor train is included
+    if (!tuneIncluded && !trainIncluded) {
+        ignorePatterns.push('**/do/lib/feedback.sh');
+    }
     // Exclude do/test when hosted-model-endpoint is not selected
     const testTypes = answers.testTypes || [];
     if (!testTypes.includes('hosted-model-endpoint')) {
@@ -371,6 +392,11 @@ export async function writeProject(templateDir, destDir, answers, registryConfig
         ignorePatterns.push('**/do/adapters/**');
         ignorePatterns.push('**/do/tune');
         ignorePatterns.push('**/do/.tune_helper.py');
+        ignorePatterns.push('**/do/train');
+        ignorePatterns.push('**/do/.train_build_request.py');
+        ignorePatterns.push('**/do/.train_status_parser.py');
+        ignorePatterns.push('**/do/.train_poll_parser.py');
+        ignorePatterns.push('**/do/training/**');
         ignorePatterns.push('**/do/add-ic');
         ignorePatterns.push('**/do/run');
         ignorePatterns.push('**/sample_model/**');
@@ -1177,7 +1203,8 @@ function _setExecutablePermissions(destDir, answers = {}) {
         'do/status',
         'do/add-ic',
         'do/adapter',
-        'do/tune'
+        'do/tune',
+        'do/train'
     ];
     const shellScripts = architecture === 'marketplace' ? marketplaceScripts : defaultScripts;

package/src/lib/config-manager.js CHANGED Viewed

@@ -26,6 +26,7 @@ import DeploymentConfigResolver from './deployment-config-resolver.js';
 import BootstrapConfig from './bootstrap-config.js';
 import { parseKeyValue } from './key-value-parser.js';
 import ParameterSchemaValidator from './parameter-schema-validator.js';
+import { validationRules } from './generated/validation-rules.js';
 const __configMgrFilename = fileURLToPath(import.meta.url);
 const __configMgrDir = dirname(__configMgrFilename);
@@ -2261,6 +2262,22 @@ export default class ConfigManager {
      * @private
      */
     _validateParameterValue(parameter, value, context = {}) {
+        // First pass: schema-derived validation rules (type, range, pattern, enum)
+        // Skip deprecated params — they have relaxed validation handled by the switch below
+        const schemaRule = validationRules[parameter];
+        if (schemaRule && value !== null && value !== undefined) {
+            // Don't apply strict enum validation to internally-derived values
+            // The switch statement below handles context-dependent validation
+            const skipSchemaValidation = ['framework', 'modelServer', 'deploymentConfig'].includes(parameter);
+            if (!skipSchemaValidation) {
+                const error = schemaRule(value);
+                if (error) {
+                    throw new ValidationError(error, parameter, value);
+                }
+            }
+        }
+        // Second pass: context-dependent validations that require runtime state
         const supportedOptions = this._getSupportedOptions();
         switch (parameter) {