npm - @aws/ml-container-creator - Versions diffs - 0.10.3 → 0.13.3 - Mend

@aws/ml-container-creator 0.10.3 → 0.13.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (40)

package/config/parameter-schema-v2.json +28 -1
package/infra/ci-harness/lib/ci-harness-stack.ts +50 -36
package/package.json +14 -5
package/servers/instance-sizer/index.js +30 -17
package/servers/instance-sizer/lib/instance-ranker.js +44 -0
package/servers/lib/catalogs/instances.json +27 -0
package/src/app.js +22 -1
package/src/lib/bootstrap-command-handler.js +32 -3
package/src/lib/config-validator.js +1 -1
package/src/lib/generated/cli-options.js +7 -2
package/src/lib/generated/parameter-matrix.js +16 -5
package/src/lib/generated/validation-rules.js +7 -3
package/src/lib/path-prover-brain.js +58 -1
package/src/lib/prompts/infrastructure-prompts.js +2 -2
package/src/lib/prompts/model-prompts.js +6 -0
package/src/lib/prove-pipeline-executor.js +294 -0
package/src/lib/secrets-prompt-runner.js +4 -0
package/src/lib/template-manager.js +1 -1
package/src/lib/template-variable-resolver.js +62 -0
package/templates/do/README.md +37 -0
package/templates/do/adapter +8 -0
package/templates/do/build +8 -0
package/templates/do/clean.d/async-inference.ejs +8 -0
package/templates/do/clean.d/batch-transform.ejs +8 -0
package/templates/do/clean.d/hyperpod-eks.ejs +8 -0
package/templates/do/clean.d/managed-inference.ejs +8 -0
package/templates/do/config +12 -45
package/templates/do/deploy.d/async-inference.ejs +33 -3
package/templates/do/deploy.d/batch-transform.ejs +32 -3
package/templates/do/deploy.d/hyperpod-eks.ejs +7 -0
package/templates/do/deploy.d/managed-inference.ejs +27 -3
package/templates/do/lib/endpoint-config.sh +1 -1
package/templates/do/lib/profile.sh +44 -0
package/templates/do/lib/staged-assets.sh +217 -0
package/templates/do/push +8 -0
package/templates/do/register +8 -0
package/templates/do/stage +569 -0
package/templates/do/submit +10 -0
package/templates/do/test +1 -0
package/templates/do/tune +7 -0

package/templates/do/config CHANGED

@@ -13,23 +13,23 @@ export MODEL_SERVER="<%= modelServer %>"
 # AWS configuration
 export AWS_REGION=${AWS_REGION:-<%= awsRegion %>}
-export ECR_REPOSITORY_NAME="ml-container-creator"
+# ── Profile-resolved values (from ~/.ml-container-creator/config.json) ────
+# ECR_REPOSITORY_NAME, ROLE_ARN, ADAPTER_S3_BUCKET — see do/lib/profile.sh
 <% if (typeof enableLora !== 'undefined' && enableLora) { %>
 # LoRA adapter serving
 export ENABLE_LORA=true
-export ADAPTER_S3_BUCKET="mlcc-adapters-$(aws sts get-caller-identity --query Account --output text 2>/dev/null || echo 'UNKNOWN')-${AWS_REGION}"
 <% } else if (framework === 'transformers' || framework === 'diffusors') { %>
 # LoRA adapter serving (uncomment to enable)
 # export ENABLE_LORA=true
-# export ADAPTER_S3_BUCKET="mlcc-adapters-$(aws sts get-caller-identity --query Account --output text 2>/dev/null || echo 'UNKNOWN')-${AWS_REGION}"
 <% } %>
 # Build configuration — WHERE the Docker image gets built
 export BUILD_TARGET="<%= buildTarget %>"
 <% if (buildTarget === 'codebuild') { %>
 export CODEBUILD_COMPUTE_TYPE="<%= codebuildComputeType %>"
-export CODEBUILD_PROJECT_NAME="${PROJECT_NAME}-build-$(date +%Y%m%d)"
+# CODEBUILD_PROJECT_NAME — derived in do/submit at runtime
 <% } %>
 # Deployment configuration — WHERE the model runs
@@ -83,26 +83,9 @@ export INFERENCE_AMI_VERSION="<%= inferenceAmiVersion %>"
 <% } %>
 # Async-specific configuration
-# Resolve AWS account ID at runtime for default resource names
-ACCOUNT_ID=$(aws sts get-caller-identity --query Account --output text 2>/dev/null || echo "UNKNOWN")
-<% if (asyncS3OutputPath) { %>
-export ASYNC_S3_OUTPUT_PATH="<%= asyncS3OutputPath %>"
-<% } else { %>
-export ASYNC_S3_OUTPUT_PATH="s3://mlcc-async-${ACCOUNT_ID}-${AWS_REGION}/${PROJECT_NAME}/output/"
-<% } %>
-<% if (asyncSnsSuccessTopic) { %>
-export ASYNC_SNS_SUCCESS_TOPIC="<%= asyncSnsSuccessTopic %>"
-<% } else { %>
-export ASYNC_SNS_SUCCESS_TOPIC="arn:aws:sns:${AWS_REGION}:${ACCOUNT_ID}:ml-container-creator-${PROJECT_NAME}-async-success"
-<% } %>
-<% if (asyncSnsErrorTopic) { %>
-export ASYNC_SNS_ERROR_TOPIC="<%= asyncSnsErrorTopic %>"
-<% } else { %>
-export ASYNC_SNS_ERROR_TOPIC="arn:aws:sns:${AWS_REGION}:${ACCOUNT_ID}:ml-container-creator-${PROJECT_NAME}-async-error"
-<% } %>
+# ── Profile-resolved values (from ~/.ml-container-creator/config.json) ────
+# ASYNC_S3_OUTPUT_PATH, ASYNC_SNS_SUCCESS_TOPIC, ASYNC_SNS_ERROR_TOPIC — see do/lib/profile.sh
+# ACCOUNT_ID — derived inline in consuming scripts (do/deploy.d/async-inference)
 <% if (asyncMaxConcurrentInvocations) { %>
 export ASYNC_MAX_CONCURRENT_INVOCATIONS="<%= asyncMaxConcurrentInvocations %>"
@@ -129,19 +112,10 @@ export FSX_VOLUME_HANDLE="<%= fsxVolumeHandle %>"
 # SageMaker Batch Transform configuration
 export INSTANCE_TYPE="<%= instanceType %>"
-# Resolve AWS account ID at runtime for default resource names
-ACCOUNT_ID=$(aws sts get-caller-identity --query Account --output text 2>/dev/null || echo "UNKNOWN")
+# ── Profile-resolved values (from ~/.ml-container-creator/config.json) ────
+# BATCH_INPUT_PATH, BATCH_OUTPUT_PATH — see do/lib/profile.sh
+# ACCOUNT_ID — derived inline in consuming scripts (do/deploy.d/batch-transform)
-<% if (batchInputPath) { %>
-export BATCH_INPUT_PATH="<%= batchInputPath %>"
-<% } else { %>
-export BATCH_INPUT_PATH="s3://mlcc-batch-${ACCOUNT_ID}-${AWS_REGION}/${PROJECT_NAME}/input/"
-<% } %>
-<% if (batchOutputPath) { %>
-export BATCH_OUTPUT_PATH="<%= batchOutputPath %>"
-<% } else { %>
-export BATCH_OUTPUT_PATH="s3://mlcc-batch-${ACCOUNT_ID}-${AWS_REGION}/${PROJECT_NAME}/output/"
-<% } %>
 export BATCH_INSTANCE_COUNT="<%= batchInstanceCount %>"
 export BATCH_SPLIT_TYPE="<%= batchSplitType %>"
 export BATCH_STRATEGY="<%= batchStrategy %>"
@@ -256,6 +230,8 @@ export NGC_API_KEY="<%= ngcApiKey %>"
 <% if (deploymentTarget !== 'batch-transform') { %>
 # Managed Model Customization (do/tune)
+# ── Profile-resolved values (from ~/.ml-container-creator/config.json) ────
+# TUNE_S3_BUCKET — see do/lib/profile.sh
 export TUNE_SUPPORTED=<%= (typeof tuneSupported !== 'undefined' && tuneSupported) ? 'true' : 'false' %>
 <% if (typeof tuneSupported !== 'undefined' && tuneSupported) { %>
 <% if (typeof tuneModelId !== 'undefined' && tuneModelId) { %>
@@ -270,7 +246,6 @@ export TUNE_MODEL_ID="<%= tuneModelId %>"
 # export TUNE_MODEL_ID=""
 <% } %>
 <% } %>
-export TUNE_S3_BUCKET="mlcc-tune-$(aws sts get-caller-identity --query Account --output text 2>/dev/null || echo 'UNKNOWN')-${AWS_REGION}"
 # MLflow App ARN for experiment tracking (set by bootstrap, or override manually)
 # export MLFLOW_APP_ARN=""
 <% } %>
@@ -296,13 +271,6 @@ export MODEL_FORMAT="<%= modelFormat %>"
 # export MODEL_FORMAT=""
 <% } %>
-<% if (roleArn) { %>
-export ROLE_ARN="<%= roleArn %>"
-<% } else { %>
-# IAM execution role for SageMaker (uncomment to override bootstrap role)
-# export ROLE_ARN=""
-<% } %>
 <% if (typeof includeBenchmark !== 'undefined' && includeBenchmark) { %>
 # SageMaker AI Benchmarking configuration
 export BENCHMARK_CONCURRENCY="<%= benchmarkConcurrency %>"
@@ -353,7 +321,6 @@ export BASE_IMAGE=${BASE_IMAGE:-<%= baseImage || '' %>}
 <% if ((deploymentTarget === 'realtime-inference' && !(typeof existingEndpointName !== 'undefined' && existingEndpointName)) || deploymentTarget === 'async-inference' || deploymentTarget === 'batch-transform') { %>
 export INSTANCE_TYPE=${INSTANCE_TYPE:-<%= instanceType %>}
 <% } %>
-export ECR_REPOSITORY_NAME=${ECR_REPOSITORY_NAME:-ml-container-creator}
 # Print configuration summary
 echo "⚙️  Configuration loaded"

package/templates/do/deploy.d/async-inference.ejs CHANGED

@@ -38,6 +38,21 @@ done
 # Source configuration
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 source "${SCRIPT_DIR}/config"
+source "${SCRIPT_DIR}/lib/profile.sh"
+# ── Profile-resolved variables (env var > profile > default) ──────────────────
+# Disable unbound-variable checking for associative array access (bash 3.2 compat)
+set +u
+ROLE_ARN="${ROLE_ARN:-${_PROFILE[roleArn]:-}}"
+ECR_REPOSITORY_NAME="${ECR_REPOSITORY_NAME:-${_PROFILE[ecrRepositoryName]:-ml-container-creator}}"
+export AWS_REGION="${AWS_REGION:-${_PROFILE[awsRegion]:-us-east-1}}"
+# Async-specific derived variables
+_ASYNC_BUCKET="${_PROFILE[asyncS3Bucket]:-mlcc-async-${_PROFILE[accountId]:-unknown}-${_PROFILE[awsRegion]:-us-east-1}}"
+ASYNC_S3_OUTPUT_PATH="${ASYNC_S3_OUTPUT_PATH:-s3://${_ASYNC_BUCKET}/${PROJECT_NAME}/output/}"
+ASYNC_SNS_SUCCESS_TOPIC="${ASYNC_SNS_SUCCESS_TOPIC:-arn:aws:sns:${_PROFILE[awsRegion]:-us-east-1}:${_PROFILE[accountId]:-unknown}:ml-container-creator-${PROJECT_NAME}-async-success}"
+ASYNC_SNS_ERROR_TOPIC="${ASYNC_SNS_ERROR_TOPIC:-arn:aws:sns:${_PROFILE[awsRegion]:-us-east-1}:${_PROFILE[accountId]:-unknown}:ml-container-creator-${PROJECT_NAME}-async-error}"
+set -u
 echo "🚀 Deploying to AWS"
 echo "   Project: ${PROJECT_NAME}"
@@ -137,16 +152,31 @@ source "${SCRIPT_DIR}/lib/wait.sh"
 # Resolve container secrets (HF_TOKEN, NGC_API_KEY)
 resolve_secrets
+<% if (typeof serverEnvVars !== 'undefined' && serverEnvVars && Object.keys(serverEnvVars).length > 0) { %>
+# ============================================================
+# Inject server environment variables into container Environment
+# ============================================================
+<% Object.keys(serverEnvVars).forEach(function(key) { %>
+if [ -n "${<%= key %>:-}" ]; then
+    if [ -n "${CONTAINER_ENV_JSON}" ]; then
+        CONTAINER_ENV_JSON="${CONTAINER_ENV_JSON},\"<%= key %>\":\"${<%= key %>}\""
+    else
+        CONTAINER_ENV_JSON="\"<%= key %>\":\"${<%= key %>}\""
+    fi
+fi
+<% }); %>
+<% } %>
 # Validate execution role ARN
 if [ -z "${ROLE_ARN:-}" ]; then
-    echo "❌ Execution role ARN not provided"
+    echo "❌ ROLE_ARN is not set."
+    echo "   Run 'ml-container-creator bootstrap' to configure your profile,"
+    echo "   or set ROLE_ARN as an environment variable."
     echo ""
     echo "Usage:"
     echo "  export ROLE_ARN=arn:aws:iam::ACCOUNT_ID:role/YOUR_ROLE"
     echo "  ./do/deploy"
     echo ""
-    echo "Or set ROLE_ARN in do/config"
-    echo ""
     echo "The execution role must have permissions for:"
     echo "  • SageMaker model and endpoint management"
     echo "  • ECR image access"

package/templates/do/deploy.d/batch-transform.ejs CHANGED

@@ -38,6 +38,20 @@ done
 # Source configuration
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 source "${SCRIPT_DIR}/config"
+source "${SCRIPT_DIR}/lib/profile.sh"
+# ── Profile-resolved variables (env var > profile > default) ──────────────────
+# Disable unbound-variable checking for associative array access (bash 3.2 compat)
+set +u
+ROLE_ARN="${ROLE_ARN:-${_PROFILE[roleArn]:-}}"
+ECR_REPOSITORY_NAME="${ECR_REPOSITORY_NAME:-${_PROFILE[ecrRepositoryName]:-ml-container-creator}}"
+export AWS_REGION="${AWS_REGION:-${_PROFILE[awsRegion]:-us-east-1}}"
+# Batch-specific derived variables
+_BATCH_BUCKET="${_PROFILE[batchS3Bucket]:-mlcc-batch-${_PROFILE[accountId]:-unknown}-${_PROFILE[awsRegion]:-us-east-1}}"
+BATCH_INPUT_PATH="${BATCH_INPUT_PATH:-s3://${_BATCH_BUCKET}/${PROJECT_NAME}/input/}"
+BATCH_OUTPUT_PATH="${BATCH_OUTPUT_PATH:-s3://${_BATCH_BUCKET}/${PROJECT_NAME}/output/}"
+set -u
 echo "🚀 Deploying to AWS"
 echo "   Project: ${PROJECT_NAME}"
@@ -135,16 +149,31 @@ source "${SCRIPT_DIR}/lib/wait.sh"
 # Resolve container secrets (HF_TOKEN, NGC_API_KEY)
 resolve_secrets
+<% if (typeof serverEnvVars !== 'undefined' && serverEnvVars && Object.keys(serverEnvVars).length > 0) { %>
+# ============================================================
+# Inject server environment variables into container Environment
+# ============================================================
+<% Object.keys(serverEnvVars).forEach(function(key) { %>
+if [ -n "${<%= key %>:-}" ]; then
+    if [ -n "${CONTAINER_ENV_JSON}" ]; then
+        CONTAINER_ENV_JSON="${CONTAINER_ENV_JSON},\"<%= key %>\":\"${<%= key %>}\""
+    else
+        CONTAINER_ENV_JSON="\"<%= key %>\":\"${<%= key %>}\""
+    fi
+fi
+<% }); %>
+<% } %>
 # Validate execution role ARN
 if [ -z "${ROLE_ARN:-}" ]; then
-    echo "❌ Execution role ARN not provided"
+    echo "❌ ROLE_ARN is not set."
+    echo "   Run 'ml-container-creator bootstrap' to configure your profile,"
+    echo "   or set ROLE_ARN as an environment variable."
     echo ""
     echo "Usage:"
     echo "  export ROLE_ARN=arn:aws:iam::ACCOUNT_ID:role/YOUR_ROLE"
     echo "  ./do/deploy"
     echo ""
-    echo "Or set ROLE_ARN in do/config"
-    echo ""
     echo "The execution role must have permissions for:"
     echo "  • SageMaker model and transform job management"
     echo "  • ECR image access"

package/templates/do/deploy.d/hyperpod-eks.ejs CHANGED

@@ -38,6 +38,13 @@ done
 # Source configuration
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 source "${SCRIPT_DIR}/config"
+source "${SCRIPT_DIR}/lib/profile.sh"
+# ── Profile-resolved variables (env var > profile > default) ──────────────────
+# Disable unbound-variable checking for associative array access (bash 3.2 compat)
+set +u
+export AWS_REGION="${AWS_REGION:-${_PROFILE[awsRegion]:-us-east-1}}"
+set -u
 echo "🚀 Deploying to AWS"
 echo "   Project: ${PROJECT_NAME}"

package/templates/do/deploy.d/managed-inference.ejs CHANGED

@@ -211,6 +211,15 @@ _ci_handle_existing_endpoint() {
 # Source configuration
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 source "${SCRIPT_DIR}/config"
+source "${SCRIPT_DIR}/lib/profile.sh"
+# ── Profile-resolved variables (env var > profile > default) ──────────────────
+# Disable unbound-variable checking for associative array access (bash 3.2 compat)
+set +u
+ROLE_ARN="${ROLE_ARN:-${_PROFILE[roleArn]:-}}"
+ECR_REPOSITORY_NAME="${ECR_REPOSITORY_NAME:-${_PROFILE[ecrRepositoryName]:-ml-container-creator}}"
+export AWS_REGION="${AWS_REGION:-${_PROFILE[awsRegion]:-us-east-1}}"
+set -u
 echo "🚀 Deploying to AWS"
 echo "   Project: ${PROJECT_NAME}"
@@ -307,14 +316,14 @@ source "${SCRIPT_DIR}/lib/inference-component.sh"
 # Validate execution role ARN
 if [ -z "${ROLE_ARN:-}" ]; then
-    echo "❌ Execution role ARN not provided"
+    echo "❌ ROLE_ARN is not set."
+    echo "   Run 'ml-container-creator bootstrap' to configure your profile,"
+    echo "   or set ROLE_ARN as an environment variable."
     echo ""
     echo "Usage:"
     echo "  export ROLE_ARN=arn:aws:iam::ACCOUNT_ID:role/YOUR_ROLE"
     echo "  ./do/deploy"
     echo ""
-    echo "Or set ROLE_ARN in do/config"
-    echo ""
     echo "The execution role must have permissions for:"
     echo "  • SageMaker endpoint and inference component management"
     echo "  • ECR image access"
@@ -350,6 +359,21 @@ fi
 # Resolve container secrets (HF_TOKEN, NGC_API_KEY)
 resolve_secrets
+<% if (typeof serverEnvVars !== 'undefined' && serverEnvVars && Object.keys(serverEnvVars).length > 0) { %>
+# ============================================================
+# Inject server environment variables into container Environment
+# ============================================================
+<% Object.keys(serverEnvVars).forEach(function(key) { %>
+if [ -n "${<%= key %>:-}" ]; then
+    if [ -n "${CONTAINER_ENV_JSON}" ]; then
+        CONTAINER_ENV_JSON="${CONTAINER_ENV_JSON},\"<%= key %>\":\"${<%= key %>}\""
+    else
+        CONTAINER_ENV_JSON="\"<%= key %>\":\"${<%= key %>}\""
+    fi
+fi
+<% }); %>
+<% } %>
 # ============================================================
 # CI-Mode: Idempotent deployment check (runs before normal idempotency)
 # ============================================================

package/templates/do/lib/endpoint-config.sh CHANGED

@@ -165,7 +165,7 @@ create_endpoint_config() {
         # Optional: capacity reservation
         if [ -n "${CAPACITY_RESERVATION_ARN:-}" ]; then
             variant_json="${variant_json},\"CapacityReservationConfig\":{\"CapacityReservationPreference\":\"capacity-reservations-only\",\"MlReservationArn\":\"${CAPACITY_RESERVATION_ARN}\"}"
-            echo "   ⚠️  Capacity reservation (experimental): ${CAPACITY_RESERVATION_ARN}"
+            echo "   ✓ Capacity reservation: ${CAPACITY_RESERVATION_ARN}"
         fi
         variant_json="${variant_json}}]"

package/templates/do/lib/profile.sh ADDED

@@ -0,0 +1,44 @@
+#!/usr/bin/env bash
+# Profile loader — reads active bootstrap profile into _PROFILE[] associative array.
+# Source this file after do/config. Values provide defaults; explicit env vars take precedence.
+#
+# Requires bash 4+ for associative array support.
+# macOS ships with bash 3.2 — install bash 4+ via Homebrew: brew install bash
+#
+# Expected keys in _PROFILE:
+#   awsRegion, accountId, awsProfile, roleArn, ecrRepositoryName,
+#   benchmarkS3Bucket, ciBenchmarkResultsBucket, asyncS3Bucket, batchS3Bucket,
+#   ciTableName, ciInfraProvisioned
+# Temporarily disable unbound variable checking for profile loading
+# (keys may not exist in the profile config, and declare -A behavior
+# varies across bash versions with set -u)
+set +u 2>/dev/null || true
+declare -A _PROFILE 2>/dev/null || true
+if command -v python3 &>/dev/null; then
+    _PROFILE_RAW=$(python3 -c "
+import json, os
+try:
+    with open(os.path.expanduser('~/.ml-container-creator/config.json')) as f:
+        c = json.load(f)
+    p = c['profiles'][c['activeProfile']]
+    # Output as KEY=VALUE lines (simple, no JSON parsing in bash)
+    for k, v in p.items():
+        if isinstance(v, (str, int, float, bool)):
+            print(f'{k}={v}')
+except:
+    pass
+" 2>/dev/null) || _PROFILE_RAW=""
+    if [ -n "${_PROFILE_RAW}" ]; then
+        while IFS='=' read -r key value; do
+            [ -n "${key}" ] && _PROFILE["${key}"]="${value}"
+        done <<< "${_PROFILE_RAW}"
+    fi
+fi
+# NOTE: set -u is NOT re-enabled here. The caller is responsible for managing
+# their own shell options. Re-enabling set -u would cause "unbound variable"
+# errors when accessing _PROFILE keys on bash versions where empty associative
+# arrays are treated as unset (bash 5.x on some platforms).

package/templates/do/lib/staged-assets.sh ADDED

@@ -0,0 +1,217 @@
+# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Shared helper: read/write the .mlcc/staged-assets.json tracking file.
+# Sourced by do/stage, do/submit, and other lifecycle scripts.
+#
+# ─── Schema (.mlcc/staged-assets.json) ───────────────────────────────────────
+#
+# {
+#   "version": "1",
+#   "models": {
+#     "<ic-name>": {
+#       "source":     "<HuggingFace model ID, e.g. google/gemma-4-31B-it>",
+#       "staged_uri": "<S3 URI with trailing slash>",
+#       "staged_at":  "<ISO 8601 timestamp>",
+#       "region":     "<AWS region where the model was staged>",
+#       "size_gb":    <numeric size in GB>
+#     }
+#   },
+#   "adapters": {}
+# }
+#
+# Notes:
+#   - "version" is for forward-compatible schema evolution (start at "1")
+#   - "models" is keyed by IC name; use "default" for single-model projects
+#   - "adapters" is reserved for future LoRA adapter staging (BL-122)
+#   - This file is git-ignored (.mlcc/ contains account-specific URIs)
+#   - The file SHALL NOT be created unless a valid staging operation completes
+# ──────────────────────────────────────────────────────────────────────────────
+# Path to the staged-assets file (relative to project root)
+STAGED_ASSETS_DIR=".mlcc"
+STAGED_ASSETS_FILE="${STAGED_ASSETS_DIR}/staged-assets.json"
+# _staged_assets_has_jq()
+#   Check if jq is available on the system.
+#   Returns 0 if available, 1 if not.
+_staged_assets_has_jq() {
+    command -v jq &>/dev/null
+}
+# _staged_assets_warn_no_jq()
+#   Print a one-time warning when jq is not available.
+_staged_assets_warn_no_jq() {
+    if [ -z "${_STAGED_ASSETS_JQ_WARNED:-}" ]; then
+        echo "⚠️  jq not found — using fallback parser (install jq for full functionality)" >&2
+        _STAGED_ASSETS_JQ_WARNED=1
+    fi
+}
+# staged_assets_read_model_uri()
+#   Read the staged S3 URI for the default model from the staged-assets file.
+#   Echoes the S3 URI if found, or an empty string if not available.
+#
+#   Uses jq when available; falls back to grep/sed extraction.
+#
+#   Arguments: none
+#   Output:    S3 URI string (stdout) or empty string
+staged_assets_read_model_uri() {
+    local uri=""
+    # No file → empty string
+    if [ ! -f "${STAGED_ASSETS_FILE}" ]; then
+        echo ""
+        return 0
+    fi
+    if _staged_assets_has_jq; then
+        uri=$(jq -r '.models.default.staged_uri // empty' "${STAGED_ASSETS_FILE}" 2>/dev/null) || uri=""
+    else
+        _staged_assets_warn_no_jq
+        # Fallback: grep/sed extraction for the staged_uri field within the default model block
+        # This handles the common single-model case reliably
+        uri=$(grep -A 5 '"default"' "${STAGED_ASSETS_FILE}" 2>/dev/null \
+            | grep '"staged_uri"' \
+            | sed 's/.*"staged_uri"[[:space:]]*:[[:space:]]*"\([^"]*\)".*/\1/' \
+            | head -1) || uri=""
+    fi
+    echo "${uri}"
+}
+# staged_assets_write_model()
+#   Create or update the staged-assets file with model staging information.
+#   Creates the .mlcc directory if it does not exist.
+#
+#   Arguments:
+#     $1 - source:   HuggingFace model ID (e.g. "google/gemma-4-31B-it")
+#     $2 - uri:      S3 URI where the model was staged (with trailing slash)
+#     $3 - region:   AWS region where the model was staged
+#     $4 - size_gb:  Total size of the staged model in GB (numeric)
+staged_assets_write_model() {
+    local source="$1"
+    local uri="$2"
+    local region="$3"
+    local size_gb="$4"
+    local timestamp
+    timestamp=$(date -u +%Y-%m-%dT%H:%M:%SZ)
+    # Ensure the .mlcc directory exists
+    mkdir -p "${STAGED_ASSETS_DIR}"
+    if _staged_assets_has_jq; then
+        if [ -f "${STAGED_ASSETS_FILE}" ]; then
+            # Update existing file — merge the new model entry
+            local tmp_file="${STAGED_ASSETS_FILE}.tmp"
+            jq --arg source "${source}" \
+               --arg uri "${uri}" \
+               --arg ts "${timestamp}" \
+               --arg region "${region}" \
+               --argjson size "${size_gb}" \
+               '.models.default = {
+                   "source": $source,
+                   "staged_uri": $uri,
+                   "staged_at": $ts,
+                   "region": $region,
+                   "size_gb": $size
+               }' "${STAGED_ASSETS_FILE}" > "${tmp_file}" && mv "${tmp_file}" "${STAGED_ASSETS_FILE}"
+        else
+            # Create new file from scratch
+            jq -n --arg source "${source}" \
+                  --arg uri "${uri}" \
+                  --arg ts "${timestamp}" \
+                  --arg region "${region}" \
+                  --argjson size "${size_gb}" \
+                  '{
+                      "version": "1",
+                      "models": {
+                          "default": {
+                              "source": $source,
+                              "staged_uri": $uri,
+                              "staged_at": $ts,
+                              "region": $region,
+                              "size_gb": $size
+                          }
+                      },
+                      "adapters": {}
+                  }' > "${STAGED_ASSETS_FILE}"
+        fi
+    else
+        _staged_assets_warn_no_jq
+        # Fallback: write the JSON directly (create-only, no merge support without jq)
+        cat > "${STAGED_ASSETS_FILE}" << EOF
+{
+  "version": "1",
+  "models": {
+    "default": {
+      "source": "${source}",
+      "staged_uri": "${uri}",
+      "staged_at": "${timestamp}",
+      "region": "${region}",
+      "size_gb": ${size_gb}
+    }
+  },
+  "adapters": {}
+}
+EOF
+    fi
+}
+# staged_assets_status()
+#   Print a human-readable table of all staged assets.
+#   Shows models and adapters with their source, URI, region, size, and timestamp.
+#
+#   Arguments: none
+#   Output:    formatted table to stdout
+staged_assets_status() {
+    if [ ! -f "${STAGED_ASSETS_FILE}" ]; then
+        echo "No staged assets found."
+        echo "  Run do/stage to stage model weights to S3."
+        return 0
+    fi
+    echo "Staged Assets (.mlcc/staged-assets.json)"
+    echo "─────────────────────────────────────────────────────────────────"
+    if _staged_assets_has_jq; then
+        # Print models section
+        local model_count
+        model_count=$(jq -r '.models | length' "${STAGED_ASSETS_FILE}" 2>/dev/null) || model_count=0
+        if [ "${model_count}" -gt 0 ]; then
+            echo ""
+            echo "  Models:"
+            echo "  ┌──────────────┬─────────────────────────────────┬──────────────────────────────────────────────────────┬────────────┬─────────┐"
+            printf "  │ %-12s │ %-31s │ %-52s │ %-10s │ %-7s │\n" "IC Name" "Source" "S3 URI" "Region" "Size"
+            echo "  ├──────────────┼─────────────────────────────────┼──────────────────────────────────────────────────────┼────────────┼─────────┤"
+            jq -r '.models | to_entries[] | "\(.key)\t\(.value.source)\t\(.value.staged_uri)\t\(.value.region)\t\(.value.size_gb)"' "${STAGED_ASSETS_FILE}" 2>/dev/null | \
+            while IFS=$'\t' read -r ic_name source staged_uri region size_gb; do
+                printf "  │ %-12s │ %-31s │ %-52s │ %-10s │ %5s GB│\n" \
+                    "${ic_name}" "${source}" "${staged_uri}" "${region}" "${size_gb}"
+            done
+            echo "  └──────────────┴─────────────────────────────────┴──────────────────────────────────────────────────────┴────────────┴─────────┘"
+        fi
+        # Print adapters section (future — show placeholder if empty)
+        local adapter_count
+        adapter_count=$(jq -r '.adapters | length' "${STAGED_ASSETS_FILE}" 2>/dev/null) || adapter_count=0
+        if [ "${adapter_count}" -gt 0 ]; then
+            echo ""
+            echo "  Adapters:"
+            jq -r '.adapters | to_entries[] | "    \(.key): \(.value.staged_uri // "not staged")"' "${STAGED_ASSETS_FILE}" 2>/dev/null
+        fi
+    else
+        _staged_assets_warn_no_jq
+        # Fallback: basic display without jq
+        echo ""
+        echo "  Raw contents:"
+        echo ""
+        cat "${STAGED_ASSETS_FILE}"
+    fi
+    echo ""
+}

package/templates/do/push CHANGED

@@ -9,6 +9,14 @@ set -o pipefail
 # Source configuration
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 source "${SCRIPT_DIR}/config"
+source "${SCRIPT_DIR}/lib/profile.sh"
+# ── Profile-resolved variables (env var > profile > default) ──────────────────
+# Disable unbound-variable checking for associative array access (bash 3.2 compat)
+set +u
+ECR_REPOSITORY_NAME="${ECR_REPOSITORY_NAME:-${_PROFILE[ecrRepositoryName]:-ml-container-creator}}"
+export AWS_REGION="${AWS_REGION:-${_PROFILE[awsRegion]:-us-east-1}}"
+set -u
 echo "🚀 Pushing Docker image to Amazon ECR"
 echo "   Project: ${PROJECT_NAME}"

package/templates/do/register CHANGED

@@ -9,6 +9,14 @@ set -o pipefail
 # Source configuration
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 source "${SCRIPT_DIR}/config"
+source "${SCRIPT_DIR}/lib/profile.sh"
+# ── Profile-resolved variables (env var > profile > default) ──────────────────
+# Disable unbound-variable checking for associative array access (bash 3.2 compat)
+set +u
+ROLE_ARN="${ROLE_ARN:-${_PROFILE[roleArn]:-}}"
+ECR_REPOSITORY_NAME="${ECR_REPOSITORY_NAME:-${_PROFILE[ecrRepositoryName]:-ml-container-creator}}"
+set -u
 # ============================================================
 # Register deployment to the deployment registry