@aws/ml-container-creator 0.7.1 → 0.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE-THIRD-PARTY +50760 -16218
- package/bin/cli.js +1 -1
- package/infra/ci-harness/buildspec.yml +4 -0
- package/package.json +3 -1
- package/servers/lib/catalogs/instances.json +52 -1275
- package/servers/lib/catalogs/model-servers.json +80 -0
- package/servers/lib/catalogs/models.json +0 -132
- package/servers/lib/catalogs/popular-diffusors.json +1 -110
- package/servers/model-picker/index.js +27 -16
- package/src/app.js +113 -23
- package/src/lib/cli-handler.js +1 -1
- package/src/lib/config-manager.js +39 -2
- package/src/lib/cross-cutting-checker.js +146 -33
- package/src/lib/deployment-config-resolver.js +10 -4
- package/src/lib/e2e-bootstrap.js +227 -0
- package/src/lib/e2e-catalog-validator.js +103 -0
- package/src/lib/e2e-quota-validator.js +135 -0
- package/src/lib/mcp-client.js +16 -1
- package/src/lib/mcp-command-handler.js +10 -2
- package/src/lib/prompt-runner.js +306 -24
- package/src/lib/prompts.js +9 -3
- package/src/lib/template-manager.js +10 -4
- package/src/lib/train-config-parser.js +136 -0
- package/src/lib/train-config-persistence.js +143 -0
- package/src/lib/train-config-validator.js +112 -0
- package/src/lib/train-feedback.js +46 -0
- package/src/lib/train-idempotency.js +97 -0
- package/src/lib/train-request-builder.js +120 -0
- package/src/lib/tune-catalog-validator.js +5 -5
- package/templates/code/serve +2 -2
- package/templates/code/serving.properties +2 -2
- package/templates/diffusors/serve +3 -3
- package/templates/do/.train_build_request.py +141 -0
- package/templates/do/.train_poll_parser.py +135 -0
- package/templates/do/.train_status_parser.py +187 -0
- package/templates/do/.tune_helper.py +2 -2
- package/templates/do/lib/feedback.sh +41 -0
- package/templates/do/register +8 -2
- package/templates/do/test +5 -5
- package/templates/do/train +786 -0
- package/templates/do/training/config.yaml +140 -0
- package/templates/do/training/train.py +463 -0
- package/templates/do/tune +2 -2
- package/templates/marketplace/config +118 -0
- package/templates/marketplace/deploy +890 -0
- package/templates/marketplace/test +453 -0
package/templates/do/test
CHANGED
|
@@ -103,9 +103,9 @@ case "${FRAMEWORK}" in
|
|
|
103
103
|
case "${MODEL_SERVER}" in
|
|
104
104
|
vllm|sglang)
|
|
105
105
|
# OpenAI-compatible chat completions format
|
|
106
|
-
# For S3/
|
|
106
|
+
# For S3/registry models, vLLM registers the model under the local path
|
|
107
107
|
VLLM_MODEL_NAME="${MODEL_NAME}"
|
|
108
|
-
if [[ "${MODEL_NAME}" ==
|
|
108
|
+
if [[ "${MODEL_NAME}" == s3://* ]] || [[ "${MODEL_NAME}" == /opt/ml/* ]]; then
|
|
109
109
|
VLLM_MODEL_NAME="/opt/ml/model"
|
|
110
110
|
fi
|
|
111
111
|
TEST_PAYLOAD='{"model": "'"${VLLM_MODEL_NAME}"'", "messages": [{"role": "user", "content": "What is machine learning?"}], "max_tokens": 50, "temperature": 0.7}'
|
|
@@ -431,7 +431,7 @@ case "${FRAMEWORK}" in
|
|
|
431
431
|
case "${MODEL_SERVER}" in
|
|
432
432
|
vllm|sglang)
|
|
433
433
|
VLLM_MODEL_NAME="${MODEL_NAME}"
|
|
434
|
-
if [[ "${MODEL_NAME}" ==
|
|
434
|
+
if [[ "${MODEL_NAME}" == s3://* ]] || [[ "${MODEL_NAME}" == /opt/ml/* ]]; then
|
|
435
435
|
VLLM_MODEL_NAME="/opt/ml/model"
|
|
436
436
|
fi
|
|
437
437
|
TEST_PAYLOAD='{"model": "'"${VLLM_MODEL_NAME}"'", "messages": [{"role": "user", "content": "What is machine learning?"}], "max_tokens": 50, "temperature": 0.7}'
|
|
@@ -808,7 +808,7 @@ case "${FRAMEWORK}" in
|
|
|
808
808
|
vllm|sglang)
|
|
809
809
|
# OpenAI-compatible chat completions format
|
|
810
810
|
VLLM_MODEL_NAME="${MODEL_NAME}"
|
|
811
|
-
if [[ "${MODEL_NAME}" ==
|
|
811
|
+
if [[ "${MODEL_NAME}" == s3://* ]] || [[ "${MODEL_NAME}" == /opt/ml/* ]]; then
|
|
812
812
|
VLLM_MODEL_NAME="/opt/ml/model"
|
|
813
813
|
fi
|
|
814
814
|
TEST_PAYLOAD='{"model": "'"${VLLM_MODEL_NAME}"'", "messages": [{"role": "user", "content": "What is machine learning?"}], "max_tokens": 50, "temperature": 0.7}'
|
|
@@ -1095,7 +1095,7 @@ case "${FRAMEWORK}" in
|
|
|
1095
1095
|
case "${MODEL_SERVER}" in
|
|
1096
1096
|
vllm|sglang)
|
|
1097
1097
|
VLLM_MODEL_NAME="${MODEL_NAME}"
|
|
1098
|
-
if [[ "${MODEL_NAME}" ==
|
|
1098
|
+
if [[ "${MODEL_NAME}" == s3://* ]] || [[ "${MODEL_NAME}" == /opt/ml/* ]]; then
|
|
1099
1099
|
VLLM_MODEL_NAME="/opt/ml/model"
|
|
1100
1100
|
fi
|
|
1101
1101
|
TEST_PAYLOAD='{"model": "'"${VLLM_MODEL_NAME}"'", "messages": [{"role": "user", "content": "What is machine learning?"}], "max_tokens": 50, "temperature": 0.7}'
|