npm - @pennyfarthing/core - Versions diffs - 7.4.1 → 7.6.0 - Mend

@pennyfarthing/core 7.4.1 → 7.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (127) hide show

package/pennyfarthing-dist/scripts/theme/compute-theme-tiers.js ADDED Viewed

@@ -0,0 +1,492 @@
+#!/usr/bin/env node
+/**
+ * compute-theme-tiers.js - Compute tier rankings from job-fair results
+ *
+ * Reads all summary.yaml files from internal/results/job-fair/
+ * For each theme, extracts character×role scores from the matrix
+ * Normalizes across formats, then computes delta vs baseline
+ * Assigns tier based on overall performance vs control baseline
+ *
+ * KEY DESIGN DECISIONS:
+ * 1. Normalizes dev roles: averages dev-codegen + dev-debug into synthetic "dev"
+ *    to enable fair comparison across old 4-role and new 6-role formats.
+ *    Final comparison uses: dev, reviewer, sm, tea (4 roles)
+ * 2. Uses the MOST COMPLETE run for each theme (most matrix entries),
+ *    not the most recent. This prevents incomplete runs from overriding good data.
+ *
+ * Tier criteria (calibrated for actual delta distribution):
+ *   S: delta >= +7  (elite - top performers)
+ *   A: delta >= +5  (excellent - strong positive)
+ *   B: delta >= +3  (strong - solid performers)
+ *   C: delta >= +1  (good - above average)
+ *   D: delta < +1   (average/below)
+ *   U: no data      (unbenchmarked)
+ *
+ * Usage:
+ *   compute-theme-tiers.js [--dry-run] [--verbose] [--min-entries N]
+ */
+import { execFileSync, execSync } from 'child_process';
+import { readdirSync, readFileSync, writeFileSync, existsSync } from 'fs';
+import { join, dirname, basename } from 'path';
+import { fileURLToPath } from 'url';
+const __filename = fileURLToPath(import.meta.url); // path of this module, derived from its module URL
+const __dirname = dirname(__filename); // directory containing this script
+const PROJECT_ROOT = join(__dirname, '..', '..'); // two directory levels above this script
+const JOB_FAIR_DIR = join(PROJECT_ROOT, '..', 'internal', 'results', 'job-fair'); // one level above PROJECT_ROOT; scanned by findSummaryFiles
+const THEMES_DIR = join(PROJECT_ROOT, 'personas', 'themes'); // <theme>.yaml files read and rewritten by updateThemeTier
+// Default for --min-entries: main() skips runs with fewer matrix entries as incomplete
+const DEFAULT_MIN_ENTRIES = 20;
+// Normalized roles for fair comparison across old (4-role) and new (6-role) formats:
+//   - Old format: dev, reviewer, sm, tea
+//   - New format: architect, dev-codegen, dev-debug, reviewer, sm, tea
+//
+// Strategy: fold dev-codegen + dev-debug into a synthetic "dev" score, giving us
+// 4 comparable roles: dev, reviewer, sm, tea (other roles such as architect are ignored)
+const NORMALIZED_ROLES = new Set(['dev', 'reviewer', 'sm', 'tea']);
+const DEV_SUBROLES = ['dev-codegen', 'dev-debug']; // roles folded into the synthetic "dev" role
+// Tier thresholds: inclusive lower bounds on the mean delta, tested by assignTier from S down to C
+const TIER_THRESHOLDS = {
+  S: 7,    // delta >= +7  (elite - top performers)
+  A: 5,    // delta >= +5  (excellent - strong positive)
+  B: 3,    // delta >= +3  (strong - solid performers)
+  C: 1,    // delta >= +1  (good - above average)
+  // D has no entry: assignTier returns it for any delta below the C threshold
+};
+function parseArgs(argv) {
+  const args = {
+    dryRun: false,
+    verbose: false,
+    minEntries: DEFAULT_MIN_ENTRIES,
+  };
+  let i = 2;
+  while (i < argv.length) {
+    const arg = argv[i];
+    switch (arg) {
+      case '--dry-run':
+        args.dryRun = true;
+        break;
+      case '--verbose':
+        args.verbose = true;
+        break;
+      case '--min-entries':
+        args.minEntries = parseInt(argv[++i], 10);
+        break;
+      case '--help':
+      case '-h':
+        showUsage();
+        process.exit(0);
+    }
+    i++;
+  }
+  return args;
+}
+function showUsage() {
+  console.log(`Usage: compute-theme-tiers.js [OPTIONS]
+Options:
+  --dry-run           Output changes without writing to theme files
+  --verbose           Show detailed output including skipped runs
+  --min-entries N     Minimum matrix entries for a run to be complete (default: ${DEFAULT_MIN_ENTRIES})
+  --help, -h          Show this help message
+Normalization:
+  Averages dev-codegen + dev-debug into synthetic "dev" score.
+  Final comparison uses 4 roles: dev, reviewer, sm, tea.
+Tier Criteria (based on mean delta from control on common roles):
+  S: delta >= +7    (elite - top performers)
+  A: delta >= +5    (excellent - strong positive)
+  B: delta >= +3    (strong - solid performers)
+  C: delta >= +1    (good - above average)
+  D: delta < +1     (average/below)
+  U: no data        (unbenchmarked)`);
+}
+/**
+ * Extract YAML field using yq
+ */
+function yqGet(filePath, field) {
+  try {
+    const result = execSync(`yq -r '${field}' "${filePath}"`, {
+      encoding: 'utf-8',
+      stdio: ['pipe', 'pipe', 'pipe'],
+    }).trim();
+    return result === 'null' ? null : result;
+  } catch {
+    return null;
+  }
+}
+/**
+ * Parse baselines from summary.yaml
+ * Returns: { role: { mean, std, n } }
+ */
+function parseBaselines(filePath) {
+  try {
+    const raw = execSync(`yq -o=json '.baselines' "${filePath}"`, {
+      encoding: 'utf-8',
+      stdio: ['pipe', 'pipe', 'pipe'],
+    });
+    return JSON.parse(raw);
+  } catch {
+    return null;
+  }
+}
+/**
+ * Count matrix entries by grep (handles duplicate YAML keys)
+ * Counts lines matching "mean:" within the matrix section
+ */
+function countMatrixEntries(filePath) {
+  try {
+    // Count "mean:" lines after "matrix:" line, excluding baselines section
+    const result = execSync(
+      `awk '/^matrix:/,0 { if (/mean:/) count++ } END { print count }' "${filePath}"`,
+      { encoding: 'utf-8', stdio: ['pipe', 'pipe', 'pipe'] }
+    ).trim();
+    return parseInt(result, 10) || 0;
+  } catch {
+    return 0;
+  }
+}
+/**
+ * Extract all scores from matrix section using yq (handles duplicate keys)
+ * Returns: [{ character, role, mean, n }]
+ */
+function parseMatrixScores(filePath) {
+  try {
+    // Use yq to iterate through matrix entries - handles duplicates
+    const raw = execSync(
+      `yq '.matrix | to_entries | .[] | .key as $char | .value | to_entries | .[] | [$char, .key, .value.mean, .value.n] | @csv' "${filePath}"`,
+      { encoding: 'utf-8', stdio: ['pipe', 'pipe', 'pipe'] }
+    );
+    const scores = [];
+    for (const line of raw.trim().split('\n')) {
+      if (!line) continue;
+      // Parse CSV: character,role,mean,n (unquoted or quoted)
+      // Handle both: death,dev,70.00,1 and "death","dev",70.00,1
+      const parts = line.split(',');
+      if (parts.length >= 4) {
+        const character = parts[0].replace(/^"|"$/g, '');
+        const role = parts[1].replace(/^"|"$/g, '');
+        const mean = parseFloat(parts[2]);
+        const n = parseInt(parts[3], 10);
+        if (!isNaN(mean) && !isNaN(n)) {
+          scores.push({ character, role, mean, n });
+        }
+      }
+    }
+    return scores;
+  } catch {
+    return [];
+  }
+}
+/**
+ * Normalize baselines: average dev-codegen + dev-debug into synthetic "dev"
+ */
+function normalizeBaselines(baselines) {
+  if (!baselines) return null;
+  const normalized = { ...baselines };
+  // If we have dev-codegen and dev-debug but no dev, create synthetic dev
+  if (!normalized.dev && normalized['dev-codegen'] && normalized['dev-debug']) {
+    const codegen = normalized['dev-codegen'];
+    const debug = normalized['dev-debug'];
+    normalized.dev = {
+      mean: (codegen.mean + debug.mean) / 2,
+      std: Math.sqrt((codegen.std ** 2 + debug.std ** 2) / 2), // pooled std approximation
+      n: codegen.n + debug.n,
+    };
+  }
+  return normalized;
+}
+/**
+ * Compute delta vs baselines for a job-fair run
+ * Returns: { meanDelta, meanScore, nRoles, roleDeltas }
+ *
+ * Normalizes dev-codegen + dev-debug into synthetic "dev" for fair comparison
+ * across old (4-role) and new (6-role) benchmark formats.
+ */
+function computeDeltas(baselines, matrixScores) {
+  if (!baselines || !matrixScores || matrixScores.length === 0) return null;
+  // Normalize baselines (average dev-codegen + dev-debug into dev)
+  const normalizedBaselines = normalizeBaselines(baselines);
+  // Aggregate scores by role
+  // First pass: collect raw scores including dev subroles
+  const rawScores = {};
+  for (const { role, mean } of matrixScores) {
+    if (typeof mean !== 'number') continue;
+    if (!rawScores[role]) {
+      rawScores[role] = { sum: 0, count: 0 };
+    }
+    rawScores[role].sum += mean;
+    rawScores[role].count++;
+  }
+  // Second pass: normalize dev subroles into synthetic "dev"
+  const roleScores = {};
+  for (const [role, scores] of Object.entries(rawScores)) {
+    if (DEV_SUBROLES.includes(role)) {
+      // Accumulate dev subroles into synthetic "dev"
+      if (!roleScores.dev) {
+        roleScores.dev = { sum: 0, count: 0 };
+      }
+      roleScores.dev.sum += scores.sum;
+      roleScores.dev.count += scores.count;
+    } else if (NORMALIZED_ROLES.has(role)) {
+      roleScores[role] = scores;
+    }
+    // Skip roles not in NORMALIZED_ROLES (e.g., architect)
+  }
+  // Compute deltas vs normalized baselines
+  const roleDeltas = {};
+  let totalDelta = 0;
+  let totalScore = 0;
+  let nRoles = 0;
+  for (const [role, scores] of Object.entries(roleScores)) {
+    const baseline = normalizedBaselines[role];
+    if (!baseline || typeof baseline.mean !== 'number') continue;
+    const roleMean = scores.sum / scores.count;
+    const delta = roleMean - baseline.mean;
+    roleDeltas[role] = {
+      mean: roleMean,
+      baseline: baseline.mean,
+      delta,
+      n: scores.count,
+    };
+    totalDelta += delta;
+    totalScore += roleMean;
+    nRoles++;
+  }
+  if (nRoles === 0) return null;
+  return {
+    meanDelta: totalDelta / nRoles,
+    meanScore: totalScore / nRoles,
+    nRoles,
+    roleDeltas,
+  };
+}
+/**
+ * Assign tier based on mean delta
+ */
+function assignTier(meanDelta) {
+  if (meanDelta >= TIER_THRESHOLDS.S) return 'S';
+  if (meanDelta >= TIER_THRESHOLDS.A) return 'A';
+  if (meanDelta >= TIER_THRESHOLDS.B) return 'B';
+  if (meanDelta >= TIER_THRESHOLDS.C) return 'C';
+  return 'D';
+}
+/**
+ * Find all job-fair summary files
+ */
+function findSummaryFiles() {
+  if (!existsSync(JOB_FAIR_DIR)) {
+    console.error(`Error: Job fair directory not found: ${JOB_FAIR_DIR}`);
+    process.exit(1);
+  }
+  const files = [];
+  for (const entry of readdirSync(JOB_FAIR_DIR, { withFileTypes: true })) {
+    if (!entry.isDirectory()) continue;
+    const summaryPath = join(JOB_FAIR_DIR, entry.name, 'summary.yaml');
+    if (existsSync(summaryPath)) {
+      files.push({
+        path: summaryPath,
+        runName: entry.name,
+      });
+    }
+  }
+  return files.sort((a, b) => a.runName.localeCompare(b.runName));
+}
+/**
+ * Update tier in theme file
+ */
+function updateThemeTier(themeName, newTier, dryRun) {
+  const themeFile = join(THEMES_DIR, `${themeName}.yaml`);
+  if (!existsSync(themeFile)) {
+    return { updated: false, reason: 'file not found' };
+  }
+  const content = readFileSync(themeFile, 'utf-8');
+  const tierMatch = content.match(/^(\s+tier:\s*)(\S+)/m);
+  if (!tierMatch) {
+    return { updated: false, reason: 'no tier field', currentTier: 'U' };
+  }
+  const currentTier = tierMatch[2];
+  if (currentTier === newTier) {
+    return { updated: false, reason: 'unchanged', currentTier };
+  }
+  if (!dryRun) {
+    const newContent = content.replace(/^(\s+tier:\s*)\S+/m, `$1${newTier}`);
+    writeFileSync(themeFile, newContent);
+  }
+  return { updated: true, currentTier, newTier };
+}
+/**
+ * Main execution
+ */
+function main() {
+  const args = parseArgs(process.argv);
+  if (args.dryRun) {
+    console.log('DRY RUN - no changes will be made\n');
+  }
+  console.log('Configuration:');
+  console.log(`  Minimum entries for complete run: ${args.minEntries}`);
+  console.log(`  Normalized roles: ${[...NORMALIZED_ROLES].join(', ')}`);
+  console.log(`  Dev subroles (averaged): ${DEV_SUBROLES.join(' + ')} → dev`);
+  console.log(`  Job fair directory: ${JOB_FAIR_DIR}`);
+  console.log('');
+  // Find all summary files
+  const summaryFiles = findSummaryFiles();
+  console.log(`Scanning ${summaryFiles.length} job-fair runs...\n`);
+  // Process each run and collect best run per theme
+  const themeRuns = {}; // theme -> { bestRun, entries, data }
+  const skippedRuns = [];
+  for (const { path, runName } of summaryFiles) {
+    const theme = yqGet(path, '.theme');
+    if (!theme) continue;
+    const entries = countMatrixEntries(path);
+    // Skip incomplete runs
+    if (entries < args.minEntries) {
+      skippedRuns.push({ theme, runName, entries, reason: 'incomplete' });
+      continue;
+    }
+    const baselines = parseBaselines(path);
+    const matrixScores = parseMatrixScores(path);
+    const deltas = computeDeltas(baselines, matrixScores);
+    if (!deltas) {
+      skippedRuns.push({ theme, runName, entries, reason: 'no valid deltas' });
+      continue;
+    }
+    // Keep the most complete run for each theme
+    if (!themeRuns[theme] || entries > themeRuns[theme].entries) {
+      themeRuns[theme] = {
+        runName,
+        entries,
+        ...deltas,
+      };
+    }
+  }
+  // Show skipped runs in verbose mode
+  if (args.verbose && skippedRuns.length > 0) {
+    console.log('Skipped Runs (incomplete or invalid):');
+    for (const { theme, runName, entries, reason } of skippedRuns) {
+      console.log(`  ${theme}: ${runName} (${entries} entries) - ${reason}`);
+    }
+    console.log('');
+  }
+  // Sort themes by delta (best first)
+  const sortedThemes = Object.entries(themeRuns)
+    .map(([theme, data]) => ({ theme, ...data }))
+    .sort((a, b) => b.meanDelta - a.meanDelta);
+  // Print results
+  console.log('Theme Performance Summary');
+  console.log('='.repeat(70));
+  console.log('');
+  console.log(
+    'Theme'.padEnd(28) +
+    'Entries'.padStart(8) +
+    'Mean'.padStart(8) +
+    'Delta'.padStart(10) +
+    'Tier'.padStart(6) +
+    (args.verbose ? '  Source Run' : '')
+  );
+  console.log('-'.repeat(70));
+  let updated = 0;
+  let unchanged = 0;
+  const tierCounts = { S: 0, A: 0, B: 0, C: 0, D: 0 };
+  for (const { theme, runName, entries, meanScore, meanDelta } of sortedThemes) {
+    const tier = assignTier(meanDelta);
+    tierCounts[tier]++;
+    const deltaStr = (meanDelta >= 0 ? '+' : '') + meanDelta.toFixed(2);
+    console.log(
+      theme.padEnd(28) +
+      entries.toString().padStart(8) +
+      meanScore.toFixed(2).padStart(8) +
+      deltaStr.padStart(10) +
+      tier.padStart(6) +
+      (args.verbose ? `  ${runName}` : '')
+    );
+    // Update theme file
+    const result = updateThemeTier(theme, tier, args.dryRun);
+    if (result.updated) {
+      updated++;
+      if (args.verbose) {
+        console.log(`  → Updated: ${result.currentTier} → ${result.newTier}`);
+      }
+    } else {
+      unchanged++;
+    }
+  }
+  console.log('');
+  console.log('Tier Distribution:');
+  for (const tier of ['S', 'A', 'B', 'C', 'D']) {
+    console.log(`  ${tier}: ${tierCounts[tier]} themes`);
+  }
+  // Count unbenchmarked themes
+  const allThemes = readdirSync(THEMES_DIR)
+    .filter(f => f.endsWith('.yaml'))
+    .map(f => f.replace('.yaml', ''));
+  const benchmarkedThemes = new Set(Object.keys(themeRuns));
+  const unbenchmarked = allThemes.filter(t => !benchmarkedThemes.has(t));
+  console.log(`  U: ${unbenchmarked.length} themes (unbenchmarked)`);
+  if (args.verbose && unbenchmarked.length > 0) {
+    console.log(`     ${unbenchmarked.slice(0, 10).join(', ')}${unbenchmarked.length > 10 ? '...' : ''}`);
+  }
+  console.log('');
+  console.log(`Summary: ${updated} updated, ${unchanged} unchanged`);
+}
+main();

package/pennyfarthing-dist/scripts/theme/compute-theme-tiers.sh CHANGED Viewed

@@ -1,203 +1,11 @@
-#!/usr/bin/env bash
-# compute-theme-tiers.sh - Compute tier rankings from job-fair results and update theme files
+#!/bin/bash
+# compute-theme-tiers.sh - Shell wrapper for compute-theme-tiers.js
+# Computes tier rankings from job-fair results and updates theme files
 #
-# Usage: compute-theme-tiers.sh [--dry-run] [--verbose]
+# Uses the MOST COMPLETE run for each theme (most matrix entries),
+# not the most recent. This prevents incomplete runs from overriding good data.
 #
-# Reads all summary.yaml files from internal/results/job-fair/
-# For each theme, extracts all character×role scores from the matrix
-# Computes delta vs baseline for each role, then averages across all roles
-# Assigns tier based on overall performance vs control baseline
-#
-# Tier criteria (based on mean delta from control):
-#   S: delta >= +10 (elite - consistently beats control)
-#   A: delta >= 0   (excellent - matches or beats control)
-#   B: delta >= -10 (strong - slightly below control)
-#   C: delta >= -20 (good - notably below control)
-#   D: delta < -20  (below average)
-#   U: no data      (unbenchmarked)
-set -euo pipefail
-SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
-PROJECT_ROOT="$(cd "$SCRIPT_DIR/../.." && pwd)"
-JOB_FAIR_DIR="$PROJECT_ROOT/internal/results/job-fair"
-THEMES_DIR="$PROJECT_ROOT/pennyfarthing-dist/personas/themes"
-DRY_RUN=false
-VERBOSE=false
-for arg in "$@"; do
-    case $arg in
-        --dry-run) DRY_RUN=true ;;
-        --verbose) VERBOSE=true ;;
-    esac
-done
-if [[ "$DRY_RUN" == "true" ]]; then
-    echo "DRY RUN - no changes will be made"
-    echo ""
-fi
-# Check dependencies
-if ! command -v yq &> /dev/null; then
-    echo "Error: yq is required but not installed"
-    exit 1
-fi
-# Temporary files for aggregation
-THEME_DATA=$(mktemp)
-THEME_AGG=$(mktemp)
-trap "rm -f $THEME_DATA $THEME_AGG" EXIT
-# Process all job-fair summary.yaml files
-# Extract theme name, compute mean score and delta vs baselines
-echo "Scanning job-fair results..."
-find "$JOB_FAIR_DIR" -name "summary.yaml" -type f | while read -r f; do
-    theme=$(yq '.theme' "$f" 2>/dev/null | grep -v "^null$" || true)
-    [[ -z "$theme" ]] && continue
-    # Extract baselines as "role:mean" pairs
-    baselines=$(yq '.baselines | to_entries | .[] | .key + ":" + (.value.mean | tostring)' "$f" 2>/dev/null || true)
-    [[ -z "$baselines" ]] && continue
-    # Extract all matrix scores as "role:mean" pairs (flatten character dimension)
-    # Matrix format: character: { role: {mean: X, n: Y} }
-    scores=$(yq '.matrix | to_entries | .[] | .value | to_entries | .[] | .key + ":" + (.value.mean | tostring)' "$f" 2>/dev/null || true)
-    [[ -z "$scores" ]] && continue
-    # Use awk to compute per-role averages and deltas, then overall mean
-    echo "$theme" "$(echo "$baselines" | tr '\n' '|')" "$(echo "$scores" | tr '\n' '|')"
-done | awk '
-{
-    theme = $1
-    # Parse baselines (field 2)
-    n_base = split($2, base_pairs, "|")
-    for (i = 1; i <= n_base; i++) {
-        if (base_pairs[i] == "") continue
-        split(base_pairs[i], kv, ":")
-        baseline[kv[1]] = kv[2]
-    }
-    # Parse scores (field 3) and accumulate by role
-    delete role_sum
-    delete role_count
-    n_scores = split($3, score_pairs, "|")
-    for (i = 1; i <= n_scores; i++) {
-        if (score_pairs[i] == "") continue
-        split(score_pairs[i], kv, ":")
-        role = kv[1]
-        score = kv[2]
-        role_sum[role] += score
-        role_count[role]++
-    }
-    # Compute delta for each role, then average
-    total_delta = 0
-    total_score = 0
-    n_roles = 0
-    for (role in role_sum) {
-        role_mean = role_sum[role] / role_count[role]
-        if (role in baseline) {
-            delta = role_mean - baseline[role]
-            total_delta += delta
-            total_score += role_mean
-            n_roles++
-        }
-    }
-    if (n_roles > 0) {
-        mean_delta = total_delta / n_roles
-        mean_score = total_score / n_roles
-        print theme, n_scores, mean_score, mean_delta
-    }
-}
-' > "$THEME_DATA"
-summary_count=$(wc -l < "$THEME_DATA" | tr -d ' ')
-echo "Found $summary_count themes with job-fair results"
-echo ""
-# Aggregate by theme (in case multiple job-fair runs exist for same theme)
-# Take the most recent (last) result for each theme
-awk '
-{
-    theme = $1
-    n = $2
-    score = $3
-    delta = $4
-    # Keep last occurrence (most recent)
-    data[theme] = n "|" score "|" delta
-}
-END {
-    for (theme in data) {
-        split(data[theme], parts, "|")
-        n = parts[1]
-        score = parts[2]
-        delta = parts[3]
-        # Assign tier based on mean delta
-        if (delta >= 10) tier = "S"
-        else if (delta >= 0) tier = "A"
-        else if (delta >= -10) tier = "B"
-        else if (delta >= -20) tier = "C"
-        else tier = "D"
-        printf "%s|%d|%.2f|%.2f|%s\n", theme, n, score, delta, tier
-    }
-}
-' "$THEME_DATA" | sort -t'|' -k4 -rn > "$THEME_AGG"
-# Print results
-echo "Theme Performance Summary"
-echo "========================="
-echo ""
-printf "%-25s %6s %8s %8s %4s\n" "Theme" "Runs" "Mean" "Delta" "Tier"
-printf "%-25s %6s %8s %8s %4s\n" "-------------------------" "------" "--------" "--------" "----"
-updated=0
-unchanged=0
-while IFS='|' read -r theme n score delta tier; do
-    printf "%-25s %6d %8.2f %+8.2f %4s\n" "$theme" "$n" "$score" "$delta" "$tier"
-    # Update theme file
-    theme_file="$THEMES_DIR/${theme}.yaml"
-    if [[ -f "$theme_file" ]]; then
-        current_tier=$(grep -E "^  tier:" "$theme_file" 2>/dev/null | sed 's/.*tier:[[:space:]]*//' || echo "U")
-        if [[ "$current_tier" != "$tier" ]]; then
-            if [[ "$DRY_RUN" == "true" ]]; then
-                [[ "$VERBOSE" == "true" ]] && echo "  Would update: $current_tier → $tier"
-            else
-                sed -i '' "s/^  tier:.*/  tier: $tier/" "$theme_file"
-                [[ "$VERBOSE" == "true" ]] && echo "  Updated: $current_tier → $tier"
-            fi
-            updated=$((updated + 1))
-        else
-            unchanged=$((unchanged + 1))
-        fi
-    else
-        [[ "$VERBOSE" == "true" ]] && echo "  Warning: No theme file for $theme"
-    fi
-done < "$THEME_AGG"
-echo ""
-# Count themes by tier
-echo "Tier Distribution:"
-for t in S A B C D; do
-    count=$(grep -c "|$t$" "$THEME_AGG" 2>/dev/null || echo 0)
-    echo "  $t: $count themes"
-done
-# Count unbenchmarked themes
-benchmarked=$(wc -l < "$THEME_AGG" | tr -d ' ')
-total_themes=$(ls "$THEMES_DIR"/*.yaml 2>/dev/null | wc -l | tr -d ' ')
-unbenchmarked=$((total_themes - benchmarked))
-echo "  U: $unbenchmarked themes (unbenchmarked)"
+# All logic is implemented in compute-theme-tiers.js (Node.js)
-echo ""
-echo "Summary: $updated updated, $unchanged unchanged"
+# Resolve the directory holding this wrapper. Abort if that fails, so node is
+# never started against "/compute-theme-tiers.js" with an empty SCRIPT_DIR.
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)" || exit 1
+# exec replaces the shell, so node's exit status becomes the wrapper's.
+exec node "$SCRIPT_DIR/compute-theme-tiers.js" "$@"