make-mp-data 3.0.3 → 3.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (70)
  1. package/README.md +46 -0
  2. package/dungeons/array-of-object-lookup-schema.json +327 -0
  3. package/dungeons/array-of-object-lookup.js +29 -9
  4. package/dungeons/capstone/capstone-ic3.js +291 -0
  5. package/dungeons/capstone/capstone-ic4.js +598 -0
  6. package/dungeons/capstone/capstone-ic5.js +668 -0
  7. package/dungeons/capstone/generate-product-lookup.js +309 -0
  8. package/dungeons/ecommerce-schema.json +462 -0
  9. package/dungeons/{copilot.js → ecommerce.js} +79 -17
  10. package/dungeons/education-schema.json +2409 -0
  11. package/dungeons/education.js +226 -462
  12. package/dungeons/fintech-schema.json +14034 -0
  13. package/dungeons/fintech.js +134 -413
  14. package/dungeons/foobar-schema.json +403 -0
  15. package/dungeons/foobar.js +27 -4
  16. package/dungeons/food-delivery-schema.json +192 -0
  17. package/dungeons/food-delivery.js +602 -0
  18. package/dungeons/food-schema.json +1152 -0
  19. package/dungeons/food.js +173 -406
  20. package/dungeons/gaming-schema.json +1270 -0
  21. package/dungeons/gaming.js +182 -42
  22. package/dungeons/insurance-application-schema.json +204 -0
  23. package/dungeons/insurance-application.js +605 -0
  24. package/dungeons/media-schema.json +906 -0
  25. package/dungeons/media.js +250 -420
  26. package/dungeons/retention-cadence-schema.json +78 -0
  27. package/dungeons/retention-cadence.js +35 -1
  28. package/dungeons/rpg-schema.json +4526 -0
  29. package/dungeons/rpg.js +171 -429
  30. package/dungeons/sanity-schema.json +255 -0
  31. package/dungeons/sanity.js +21 -10
  32. package/dungeons/sass-schema.json +1291 -0
  33. package/dungeons/sass.js +241 -368
  34. package/dungeons/scd-schema.json +919 -0
  35. package/dungeons/scd.js +41 -13
  36. package/dungeons/simple-schema.json +608 -0
  37. package/dungeons/simple.js +52 -15
  38. package/dungeons/simplest-schema.json +1418 -0
  39. package/dungeons/simplest.js +392 -0
  40. package/dungeons/social-schema.json +1118 -0
  41. package/dungeons/social.js +150 -391
  42. package/dungeons/text-generation-schema.json +3096 -0
  43. package/dungeons/text-generation.js +71 -0
  44. package/index.js +8 -6
  45. package/lib/core/config-validator.js +28 -8
  46. package/lib/core/storage.js +5 -5
  47. package/lib/generators/events.js +4 -4
  48. package/lib/orchestrators/mixpanel-sender.js +16 -13
  49. package/lib/orchestrators/user-loop.js +14 -6
  50. package/lib/templates/soup-presets.js +188 -0
  51. package/lib/utils/utils.js +52 -6
  52. package/package.json +1 -1
  53. package/types.d.ts +20 -3
  54. package/dungeons/adspend.js +0 -130
  55. package/dungeons/anon.js +0 -128
  56. package/dungeons/benchmark-heavy.js +0 -240
  57. package/dungeons/benchmark-light.js +0 -140
  58. package/dungeons/big.js +0 -226
  59. package/dungeons/business.js +0 -391
  60. package/dungeons/complex.js +0 -428
  61. package/dungeons/experiments.js +0 -137
  62. package/dungeons/funnels.js +0 -309
  63. package/dungeons/mil.js +0 -323
  64. package/dungeons/mirror.js +0 -161
  65. package/dungeons/soup-test.js +0 -52
  66. package/dungeons/streaming.js +0 -372
  67. package/dungeons/strict-event-test.js +0 -30
  68. package/dungeons/student-teacher.js +0 -438
  69. package/dungeons/too-big-events.js +0 -203
  70. package/dungeons/user-agent.js +0 -209
package/dungeons/sass.js CHANGED
@@ -10,9 +10,13 @@ const chance = u.initChance(SEED);
10
10
  const num_users = 5_000;
11
11
  const days = 100;
12
12
 
13
- /** @typedef {import("../../types.js").Dungeon} Config */
13
+ /** @typedef {import("../types.js").Dungeon} Config */
14
14
 
15
- /**
15
+ /*
16
+ * ═══════════════════════════════════════════════════════════════════════════════
17
+ * DATASET OVERVIEW
18
+ * ═══════════════════════════════════════════════════════════════════════════════
19
+ *
16
20
  * CLOUDFORGE - B2B Cloud Infrastructure Monitoring & Deployment Platform
17
21
  *
18
22
  * CloudForge is a B2B SaaS platform that combines infrastructure monitoring (like Datadog)
@@ -20,6 +24,12 @@ const days = 100;
20
24
  * of all sizes - from startups deploying their first microservice to enterprises managing
21
25
  * thousands of services across multi-cloud environments.
22
26
  *
27
+ * - 5,000 users over 100 days
28
+ * - 600K events across 18 event types (+ 1 hook-created event type)
29
+ * - 8 funnels (onboarding, monitoring, incident response, deployment, infra, team, docs, billing)
30
+ * - Group analytics (companies)
31
+ * - Desktop/browser only (B2B SaaS - no mobile devices)
32
+ *
23
33
  * CORE PLATFORM:
24
34
  * Teams create workspaces, deploy services across AWS/GCP/Azure, and monitor everything
25
35
  * from a unified dashboard. The platform tracks uptime, latency, error rates, CPU/memory
@@ -27,42 +37,202 @@ const days = 100;
27
37
  * PagerDuty/Slack integrations, and on-call engineers acknowledge and resolve incidents
28
38
  * using automated runbooks.
29
39
  *
30
- * DEPLOYMENT PIPELINE:
31
- * CloudForge manages CI/CD pipelines that deploy services to production, staging, and dev
32
- * environments. Pipelines track commit counts, duration, and success/failure rates. When
33
- * deployments fail, recovery deploys take longer as engineers carefully roll forward.
34
- * Infrastructure can scale automatically or manually based on load.
40
+ * PRICING MODEL:
41
+ * Four tiers: Free, Team, Business, Enterprise. Enterprise customers get dedicated
42
+ * customer success managers and annual contracts. Pricing based on seat count and
43
+ * resource usage.
44
+ */
45
+
46
+ /*
47
+ * ═══════════════════════════════════════════════════════════════════════════════
48
+ * ANALYTICS HOOKS
49
+ * ═══════════════════════════════════════════════════════════════════════════════
50
+ *
51
+ * 8 deliberately architected patterns hidden in the data, simulating real-world
52
+ * B2B SaaS behavior. Several hooks use event removal (splice), event replacement,
53
+ * and module-level closure state tracking via Map objects.
35
54
  *
36
- * INCIDENT MANAGEMENT:
37
- * Alerts flow through a severity system (info -> warning -> critical -> emergency).
38
- * Critical and emergency alerts sometimes escalate into formal incidents with P1/P2
39
- * classification, paging multiple teams. Teams with Slack + PagerDuty integrations
40
- * respond and resolve incidents significantly faster than those without.
55
+ * ─────────────────────────────────────────────────────────────────────────────
56
+ * 1. END-OF-QUARTER SPIKE (event hook)
57
+ * ─────────────────────────────────────────────────────────────────────────────
41
58
  *
42
- * COST MANAGEMENT:
43
- * The platform generates cost reports showing daily/weekly/monthly spend. When costs
44
- * spike beyond budgets, teams react by scaling down infrastructure. End-of-quarter
45
- * pushes drive plan upgrades and team expansion as companies rush to hit targets.
59
+ * Days 80-90: billing events shift toward plan upgrades 40% of the time, and team
60
+ * member invitations are duplicated 50% of the time. Tagged: quarter_end_push: true.
46
61
  *
47
- * SECURITY & COMPLIANCE:
48
- * Regular security scans check for vulnerabilities, compliance violations, and access
49
- * audit issues. Feature flags control rollout of new capabilities across environments.
62
+ * Mixpanel Report — Plan Upgrades Over Time:
63
+ * • Insights line chart
64
+ * • Event: "billing event", filter "event_type" = "plan_upgraded"
65
+ * • Daily trend
66
+ * • Expected: Spike in plan upgrades during days 80-90 (4x normal volume)
50
67
  *
51
- * PRICING MODEL:
52
- * Four tiers: Free (limited), Team (small teams), Business (mid-market), Enterprise
53
- * (large organizations). Pricing based on seat count and resource usage. Enterprise
54
- * customers get dedicated customer success managers and annual contracts.
55
- *
56
- * TARGET USERS:
57
- * Engineers, SREs, DevOps professionals, engineering managers, and executives who
58
- * need visibility into their cloud infrastructure and deployment processes.
59
- *
60
- * WHY THESE EVENTS/PROPERTIES?
61
- * - Events model a complete B2B SaaS lifecycle: onboarding -> adoption -> expansion -> renewal
62
- * - Properties enable cohort analysis: company size, plan tier, role, cloud provider
63
- * - Funnels reveal friction: onboarding completion, incident resolution, deployment success
64
- * - Hooks simulate real operational insights hidden in production telemetry data
65
- * - The "needle in haystack" hooks create discoverable patterns that mirror real B2B analytics
68
+ * Mixpanel Report — Team Expansion Surge:
69
+ * Insights line chart
70
+ * Event: "team member invited", filter "quarter_end_push" = true
71
+ * Daily trend
72
+ * • Expected: Clear volume spike in last 10 days with duplicate invites
73
+ *
74
+ * ─────────────────────────────────────────────────────────────────────────────
75
+ * 2. CHURNED ACCOUNT SILENCING (everything hook)
76
+ * ─────────────────────────────────────────────────────────────────────────────
77
+ *
78
+ * ~20% of users (hash of distinct_id, idHash % 5 === 0) go completely silent
79
+ * after day 30. ALL events after month 1 are removed via splice(). User profiles
80
+ * are tagged churned_account: true for discoverability.
81
+ *
82
+ * Mixpanel Report — Churned Account Retention:
83
+ * • Retention report
84
+ * • Event A/B: Any event
85
+ * • Breakdown: User profile "churned_account"
86
+ * • Expected: churned_account=true shows 0% retention after day 30
87
+ *
88
+ * Mixpanel Report — Churned Account Activity:
89
+ * • Insights line chart
90
+ * • Event: Any event, measure total per user
91
+ * • Breakdown: User profile "churned_account"
92
+ * • Weekly trend
93
+ * • Expected: churned_account=true flatlines after week 4
94
+ *
95
+ * ─────────────────────────────────────────────────────────────────────────────
96
+ * 3. ALERT ESCALATION REPLACEMENT (event hook)
97
+ * ─────────────────────────────────────────────────────────────────────────────
98
+ *
99
+ * 30% of critical/emergency "alert triggered" events are REPLACED with a new
100
+ * event type "incident created" (not in the events array — hook-only). Includes
101
+ * escalation_level (P1/P2), teams_paged, incident_id.
102
+ *
103
+ * Mixpanel Report — Incident Created Discovery:
104
+ * • Insights report
105
+ * • Event: "incident created"
106
+ * • Breakdown: "escalation_level"
107
+ * • Expected: P1 and P2 incidents, ~30% of critical/emergency alert volume
108
+ *
109
+ * Mixpanel Report — Alert vs Incident Ratio:
110
+ * • Insights report
111
+ * • Events: "alert triggered" AND "incident created"
112
+ * • Expected: incident created count ~ 30% of critical+emergency alerts
113
+ *
114
+ * ─────────────────────────────────────────────────────────────────────────────
115
+ * 4. INTEGRATION USERS SUCCEED (everything hook)
116
+ * ─────────────────────────────────────────────────────────────────────────────
117
+ *
118
+ * Users with BOTH Slack AND PagerDuty integrations resolve alerts faster:
119
+ * response_time_mins reduced 60%, resolution_time_mins reduced 50%.
120
+ * Tagged: integrated_team: true.
121
+ *
122
+ * Mixpanel Report — Integration Impact on Response Time:
123
+ * • Insights report
124
+ * • Event: "alert acknowledged", measure avg "response_time_mins"
125
+ * • Breakdown: "integrated_team"
126
+ * • Expected: integrated_team=true ~ 60% lower response time
127
+ *
128
+ * Mixpanel Report — Integration Impact on Resolution:
129
+ * • Insights report
130
+ * • Event: "alert resolved", measure avg "resolution_time_mins"
131
+ * • Breakdown: "integrated_team"
132
+ * • Expected: integrated_team=true ~ 50% faster resolution
133
+ *
134
+ * ─────────────────────────────────────────────────────────────────────────────
135
+ * 5. DOCS READERS DEPLOY MORE (everything hook)
136
+ * ─────────────────────────────────────────────────────────────────────────────
137
+ *
138
+ * Users with 3+ "best_practices" documentation views get 2-3 extra production
139
+ * deploys spliced into their event stream. Tagged: docs_informed: true.
140
+ *
141
+ * Mixpanel Report — Docs-Informed Deployments:
142
+ * • Insights report
143
+ * • Event: "service deployed", filter "environment" = "production"
144
+ * • Breakdown: "docs_informed"
145
+ * • Expected: docs_informed=true shows extra production deployments
146
+ *
147
+ * Mixpanel Report — Docs Readers vs Non-Readers:
148
+ * • Insights report
149
+ * • Event: "service deployed", measure total per user
150
+ * • Segment: Users with 3+ "documentation viewed" (doc_section = "best_practices")
151
+ * • Expected: ~1.8x more production deploys per user for docs readers
152
+ *
153
+ * ─────────────────────────────────────────────────────────────────────────────
154
+ * 6. COST OVERRUN PATTERN (event hook — closure state)
155
+ * ─────────────────────────────────────────────────────────────────────────────
156
+ *
157
+ * When cost_change_percent > 25 on a "cost report generated" event, the user
158
+ * is stored in a module-level Map. Their next "infrastructure scaled" event
159
+ * is forced to scale_direction: "down". Tagged: budget_exceeded, cost_reaction.
160
+ *
161
+ * Mixpanel Report — Cost Overrun to Scale Down:
162
+ * • Insights report
163
+ * • Event: "infrastructure scaled"
164
+ * • Breakdown: "cost_reaction"
165
+ * • Expected: cost_reaction=true events are 100% scale_direction="down"
166
+ *
167
+ * ─────────────────────────────────────────────────────────────────────────────
168
+ * 7. FAILED DEPLOYMENT RECOVERY (event hook — closure state)
169
+ * ─────────────────────────────────────────────────────────────────────────────
170
+ *
171
+ * After a failed pipeline run, the user's next successful deploy has
172
+ * duration_sec * 1.5 (recovery deploys are slower). Tagged: recovery_deployment.
173
+ * Uses module-level Map for cross-call state.
174
+ *
175
+ * Mixpanel Report — Recovery Deploy Duration:
176
+ * • Insights report
177
+ * • Event: "deployment pipeline run", measure avg "duration_sec"
178
+ * • Breakdown: "recovery_deployment"
179
+ * • Expected: recovery_deployment=true ~ 1.5x longer duration
180
+ *
181
+ * ─────────────────────────────────────────────────────────────────────────────
182
+ * 8. ENTERPRISE VS STARTUP (user hook)
183
+ * ─────────────────────────────────────────────────────────────────────────────
184
+ *
185
+ * Company size determines seat_count, annual_contract_value, and
186
+ * customer_success_manager (enterprise only). All users get customer_health_score.
187
+ *
188
+ * Mixpanel Report — ACV by Company Size:
189
+ * • Insights report
190
+ * • Event: Any, measure unique users
191
+ * • Breakdown: User profile "company_size"
192
+ * • Expected: startup ($0-3.6K), smb ($3.6K-12K), mid_market ($12K-50K),
193
+ * enterprise ($50K-500K)
194
+ *
195
+ * ─────────────────────────────────────────────────────────────────────────────
196
+ * EXPECTED METRICS SUMMARY
197
+ * ─────────────────────────────────────────────────────────────────────────────
198
+ *
199
+ * Hook | Metric | Baseline | Hook Effect | Ratio
200
+ * -------------------------|--------------------------|-----------|----------------|------
201
+ * End-of-Quarter Spike | Plan upgrades/day | ~2/day | ~8/day | 4x
202
+ * Churned Accounts | Users active month 2 | 100% | 90% | 0.9x
203
+ * Alert Escalation | Incidents from alerts | 0% | ~30% of crit | new
204
+ * Integration Users | MTTR (minutes) | ~300 | ~150 | 0.5x
205
+ * Docs Readers | Prod deploys/user | ~3 | ~5-6 | 1.8x
206
+ * Cost Overrun | Scale-down after overrun | 50% | 100% | 2x
207
+ * Failed Deploy Recovery | Deploy duration (sec) | ~500 | ~750 | 1.5x
208
+ * Enterprise vs Startup | ACV range | $0-3.6K | $50K-500K | 100x+
209
+ *
210
+ * ─────────────────────────────────────────────────────────────────────────────
211
+ * ADVANCED ANALYSIS IDEAS
212
+ * ─────────────────────────────────────────────────────────────────────────────
213
+ *
214
+ * CROSS-HOOK PATTERNS:
215
+ * - Churned + Enterprise: Do churned accounts skew toward startups or are
216
+ * enterprise accounts also silenced?
217
+ * - Integration + Cost: Do teams with full integrations manage costs better?
218
+ * - Docs + Deploys + Failures: Do docs readers have fewer failed deployments?
219
+ * - Quarter Spike + Churn: Are quarter-end upgrades correlated with later churn?
220
+ * - Enterprise Recovery: Do enterprise customers recover from failed deploys
221
+ * differently than startups?
222
+ *
223
+ * COHORT ANALYSIS:
224
+ * - By company_size: Compare all metrics across startup/smb/mid_market/enterprise
225
+ * - By plan_tier: Free vs. Team vs. Business vs. Enterprise engagement
226
+ * - By cloud_provider: AWS vs. GCP vs. Azure deployment and alert patterns
227
+ * - By primary_role: Engineer vs. SRE vs. DevOps vs. Manager behaviors
228
+ *
229
+ * KEY METRICS:
230
+ * - MTTR: alert triggered → alert resolved duration
231
+ * - Deployment Frequency: service deployed per user per week
232
+ * - Deployment Success Rate: pipeline success vs. failure ratio
233
+ * - Cost Efficiency: total_cost trend over time per company
234
+ * - Feature Adoption: integration configured events by type
235
+ * - Documentation Engagement: documentation viewed by section
66
236
  */
67
237
 
68
238
  // Generate consistent IDs for lookup tables and event properties
@@ -167,8 +337,8 @@ const config = {
167
337
  weight: 1,
168
338
  isFirstEvent: true,
169
339
  properties: {
170
- company_size: u.pickAWinner(["startup", "smb", "mid_market", "enterprise"]),
171
- industry: u.pickAWinner(["tech", "finance", "healthcare", "retail", "media"]),
340
+ company_size: ["startup", "smb", "mid_market", "enterprise"],
341
+ industry: ["tech", "finance", "healthcare", "retail", "media"],
172
342
  }
173
343
  },
174
344
  {
@@ -176,17 +346,17 @@ const config = {
176
346
  weight: 10,
177
347
  properties: {
178
348
  service_id: u.pickAWinner(serviceIds),
179
- service_type: u.pickAWinner(["web_app", "api", "database", "cache", "queue", "ml_model"]),
180
- environment: u.pickAWinner(["production", "staging", "dev"]),
181
- cloud_provider: u.pickAWinner(["aws", "gcp", "azure"]),
349
+ service_type: ["web_app", "api", "database", "cache", "queue", "ml_model"],
350
+ environment: ["production", "staging", "dev"],
351
+ cloud_provider: ["aws", "gcp", "azure"],
182
352
  }
183
353
  },
184
354
  {
185
355
  event: "dashboard viewed",
186
356
  weight: 20,
187
357
  properties: {
188
- dashboard_type: u.pickAWinner(["overview", "cost", "performance", "security", "custom"]),
189
- time_range: u.pickAWinner(["1h", "6h", "24h", "7d", "30d"]),
358
+ dashboard_type: ["overview", "cost", "performance", "security", "custom"],
359
+ time_range: ["1h", "6h", "24h", "7d", "30d"],
190
360
  }
191
361
  },
192
362
  {
@@ -194,8 +364,8 @@ const config = {
194
364
  weight: 12,
195
365
  properties: {
196
366
  alert_id: u.pickAWinner(alertIds),
197
- severity: u.pickAWinner(["info", "warning", "critical", "emergency"]),
198
- alert_type: u.pickAWinner(["cpu", "memory", "latency", "error_rate", "disk", "network"]),
367
+ severity: ["info", "warning", "critical", "emergency"],
368
+ alert_type: ["cpu", "memory", "latency", "error_rate", "disk", "network"],
199
369
  service_id: u.pickAWinner(serviceIds),
200
370
  }
201
371
  },
@@ -205,7 +375,7 @@ const config = {
205
375
  properties: {
206
376
  alert_id: u.pickAWinner(alertIds),
207
377
  response_time_mins: u.weighNumRange(1, 120),
208
- acknowledged_by_role: u.pickAWinner(["engineer", "sre", "manager", "oncall"]),
378
+ acknowledged_by_role: ["engineer", "sre", "manager", "oncall"],
209
379
  }
210
380
  },
211
381
  {
@@ -214,7 +384,7 @@ const config = {
214
384
  properties: {
215
385
  alert_id: u.pickAWinner(alertIds),
216
386
  resolution_time_mins: u.weighNumRange(5, 1440),
217
- root_cause: u.pickAWinner(["config_change", "capacity", "bug", "dependency", "network"]),
387
+ root_cause: ["config_change", "capacity", "bug", "dependency", "network"],
218
388
  }
219
389
  },
220
390
  {
@@ -222,7 +392,7 @@ const config = {
222
392
  weight: 9,
223
393
  properties: {
224
394
  pipeline_id: u.pickAWinner(pipelineIds),
225
- status: u.pickAWinner(["success", "failed", "cancelled"]),
395
+ status: ["success", "failed", "cancelled"],
226
396
  duration_sec: u.weighNumRange(30, 1800),
227
397
  commit_count: u.weighNumRange(1, 20),
228
398
  }
@@ -242,7 +412,7 @@ const config = {
242
412
  event: "cost report generated",
243
413
  weight: 4,
244
414
  properties: {
245
- report_period: u.pickAWinner(["daily", "weekly", "monthly"]),
415
+ report_period: ["daily", "weekly", "monthly"],
246
416
  total_cost: u.weighNumRange(100, 50000),
247
417
  cost_change_percent: u.weighNumRange(-30, 50),
248
418
  }
@@ -251,23 +421,23 @@ const config = {
251
421
  event: "team member invited",
252
422
  weight: 3,
253
423
  properties: {
254
- role: u.pickAWinner(["admin", "editor", "viewer", "billing"]),
255
- invitation_method: u.pickAWinner(["email", "sso", "slack"]),
424
+ role: ["admin", "editor", "viewer", "billing"],
425
+ invitation_method: ["email", "sso", "slack"],
256
426
  }
257
427
  },
258
428
  {
259
429
  event: "integration configured",
260
430
  weight: 4,
261
431
  properties: {
262
- integration_type: u.pickAWinner(["slack", "pagerduty", "jira", "github", "datadog", "terraform"]),
263
- status: u.pickAWinner(["active", "paused", "error"]),
432
+ integration_type: ["slack", "pagerduty", "jira", "github", "datadog", "terraform"],
433
+ status: ["active", "paused", "error"],
264
434
  }
265
435
  },
266
436
  {
267
437
  event: "query executed",
268
438
  weight: 15,
269
439
  properties: {
270
- query_type: u.pickAWinner(["metrics", "logs", "traces"]),
440
+ query_type: ["metrics", "logs", "traces"],
271
441
  time_range_hours: u.weighNumRange(1, 720),
272
442
  result_count: u.weighNumRange(0, 10000),
273
443
  }
@@ -277,7 +447,7 @@ const config = {
277
447
  weight: 3,
278
448
  properties: {
279
449
  runbook_id: u.pickAWinner(runbookIds),
280
- trigger: u.pickAWinner(["manual", "automated", "alert_triggered"]),
450
+ trigger: ["manual", "automated", "alert_triggered"],
281
451
  success: u.pickAWinner([true, false], 0.15),
282
452
  }
283
453
  },
@@ -285,7 +455,7 @@ const config = {
285
455
  event: "billing event",
286
456
  weight: 3,
287
457
  properties: {
288
- event_type: u.pickAWinner(["invoice_generated", "payment_received", "payment_failed", "plan_upgraded", "plan_downgraded"]),
458
+ event_type: ["invoice_generated", "payment_received", "payment_failed", "plan_upgraded", "plan_downgraded"],
289
459
  amount: u.weighNumRange(99, 25000),
290
460
  }
291
461
  },
@@ -293,7 +463,7 @@ const config = {
293
463
  event: "security scan",
294
464
  weight: 6,
295
465
  properties: {
296
- scan_type: u.pickAWinner(["vulnerability", "compliance", "access_audit"]),
466
+ scan_type: ["vulnerability", "compliance", "access_audit"],
297
467
  findings_count: u.weighNumRange(0, 50),
298
468
  critical_findings: u.weighNumRange(0, 10),
299
469
  }
@@ -302,8 +472,8 @@ const config = {
302
472
  event: "api call",
303
473
  weight: 16,
304
474
  properties: {
305
- endpoint: u.pickAWinner(["/deploy", "/status", "/metrics", "/alerts", "/config", "/billing"]),
306
- method: u.pickAWinner(["GET", "POST", "PUT", "DELETE"]),
475
+ endpoint: ["/deploy", "/status", "/metrics", "/alerts", "/config", "/billing"],
476
+ method: ["GET", "POST", "PUT", "DELETE"],
307
477
  response_time_ms: u.weighNumRange(10, 5000),
308
478
  status_code: u.pickAWinner([200, 201, 400, 401, 403, 500, 503]),
309
479
  }
@@ -312,7 +482,7 @@ const config = {
312
482
  event: "documentation viewed",
313
483
  weight: 7,
314
484
  properties: {
315
- doc_section: u.pickAWinner(["getting_started", "api_reference", "best_practices", "troubleshooting", "changelog"]),
485
+ doc_section: ["getting_started", "api_reference", "best_practices", "troubleshooting", "changelog"],
316
486
  time_on_page_sec: u.weighNumRange(5, 600),
317
487
  }
318
488
  },
@@ -322,20 +492,20 @@ const config = {
322
492
  properties: {
323
493
  flag_name: () => `flag_${chance.word()}`,
324
494
  new_state: u.pickAWinner(["enabled", "disabled"], 0.15),
325
- environment: u.pickAWinner(["production", "staging", "dev"]),
495
+ environment: ["production", "staging", "dev"],
326
496
  }
327
497
  },
328
498
  ],
329
499
 
330
500
  superProps: {
331
501
  plan_tier: u.pickAWinner(["free", "free", "team", "team", "business", "enterprise"]),
332
- cloud_provider: u.pickAWinner(["aws", "gcp", "azure", "multi_cloud"]),
502
+ cloud_provider: ["aws", "gcp", "azure", "multi_cloud"],
333
503
  },
334
504
 
335
505
  userProps: {
336
506
  company_size: u.pickAWinner(["startup", "startup", "smb", "mid_market", "enterprise"]),
337
- primary_role: u.pickAWinner(["engineer", "sre", "devops", "manager", "executive"]),
338
- team_name: u.pickAWinner(["Platform", "Backend", "Frontend", "Data", "Security", "Infrastructure"]),
507
+ primary_role: ["engineer", "sre", "devops", "manager", "executive"],
508
+ team_name: ["Platform", "Backend", "Frontend", "Data", "Security", "Infrastructure"],
339
509
  },
340
510
 
341
511
  groupKeys: [
@@ -345,9 +515,9 @@ const config = {
345
515
  groupProps: {
346
516
  company_id: {
347
517
  name: () => `${chance.word({ capitalize: true })} ${chance.pickone(["Systems", "Technologies", "Labs", "Cloud", "Digital", "Networks", "Solutions"])}`,
348
- industry: u.pickAWinner(["tech", "finance", "healthcare", "retail", "media", "manufacturing", "logistics"]),
349
- employee_count: u.pickAWinner(["1-10", "11-50", "51-200", "201-1000", "1001-5000", "5000+"]),
350
- arr_bucket: u.pickAWinner(["<10k", "10k-50k", "50k-200k", "200k-1M", "1M+"]),
518
+ industry: ["tech", "finance", "healthcare", "retail", "media", "manufacturing", "logistics"],
519
+ employee_count: ["1-10", "11-50", "51-200", "201-1000", "1001-5000", "5000+"],
520
+ arr_bucket: ["<10k", "10k-50k", "50k-200k", "200k-1M", "1M+"],
351
521
  }
352
522
  },
353
523
 
@@ -486,14 +656,14 @@ const config = {
486
656
 
487
657
  // ─────────────────────────────────────────────────────────────
488
658
  // Hook #2: CHURNED ACCOUNT SILENCING (everything)
489
- // ~10% of users go completely silent after day 30
659
+ // ~20% targeted (hash % 5), yielding ~10% visible after accounting for invisible churned users
490
660
  // ─────────────────────────────────────────────────────────────
491
661
  if (type === "everything") {
492
662
  const userEvents = record;
493
663
  if (userEvents && userEvents.length > 0) {
494
664
  const firstEvent = userEvents[0];
495
665
  const idHash = String(firstEvent.user_id || firstEvent.device_id).split("").reduce((acc, char) => acc + char.charCodeAt(0), 0);
496
- const isChurnedAccount = (idHash % 10) === 0;
666
+ const isChurnedAccount = (idHash % 5) === 0;
497
667
 
498
668
  if (isChurnedAccount) {
499
669
  for (let i = userEvents.length - 1; i >= 0; i--) {
@@ -591,6 +761,10 @@ const config = {
591
761
  // Company size determines seat count, ACV, and health score
592
762
  // ─────────────────────────────────────────────────────────────
593
763
  if (type === "user") {
764
+ // Hook #2 support: tag churned accounts on user profile for discoverability
765
+ const idHash = String(record.distinct_id || "").split("").reduce((acc, char) => acc + char.charCodeAt(0), 0);
766
+ record.churned_account = (idHash % 5) === 0;
767
+
594
768
  const companySize = record.company_size;
595
769
 
596
770
  if (companySize === "enterprise") {
@@ -619,304 +793,3 @@ const config = {
619
793
  };
620
794
 
621
795
  export default config;
622
-
623
- /**
624
- * =================================================================================
625
- * NEEDLE IN A HAYSTACK - CLOUDFORGE B2B SAAS ANALYTICS
626
- * =================================================================================
627
- *
628
- * A B2B cloud infrastructure monitoring and deployment platform dungeon with 8
629
- * deliberately architected analytics insights hidden in the data. This dungeon
630
- * simulates CloudForge - a Datadog + Terraform hybrid serving engineering teams
631
- * across companies of all sizes.
632
- *
633
- * =================================================================================
634
- * DATASET OVERVIEW
635
- * =================================================================================
636
- *
637
- * - 5,000 users over 100 days
638
- * - 360K events across 18 event types (+ 1 hook-created event type)
639
- * - 3 funnels (onboarding, incident response, deployment pipeline)
640
- * - Group analytics (companies)
641
- * - Lookup tables (services, alerts)
642
- * - Desktop/browser only (B2B SaaS - no mobile devices)
643
- *
644
- * =================================================================================
645
- * THE 8 ARCHITECTED HOOKS
646
- * =================================================================================
647
- *
648
- * Each hook creates a specific, discoverable analytics insight that simulates
649
- * real-world B2B SaaS behavior patterns. Several hooks use techniques like
650
- * event removal (splice), event replacement, and module-level closure
651
- * state tracking via Map objects.
652
- *
653
- * ---------------------------------------------------------------------------------
654
- * 1. END-OF-QUARTER SPIKE (event hook)
655
- * ---------------------------------------------------------------------------------
656
- *
657
- * PATTERN: During days 80-90 of the dataset (end of quarter), billing events
658
- * shift toward plan upgrades 40% of the time, and team member invitations are
659
- * duplicated 50% of the time. All affected events are tagged with
660
- * quarter_end_push: true.
661
- *
662
- * HOW TO FIND IT:
663
- * - Chart "billing event" by event_type, broken down by week
664
- * - Chart "team member invited" count by day
665
- * - Filter: quarter_end_push = true
666
- * - Compare: last 10 days vs. rest of dataset
667
- *
668
- * EXPECTED INSIGHT: Clear spike in plan_upgraded billing events and team
669
- * invitations in the final 10 days. Duplicate invitations create an
670
- * artificially inflated invite count.
671
- *
672
- * REAL-WORLD ANALOGUE: End-of-quarter sales pushes, budget utilization
673
- * deadlines, and team expansion before fiscal year-end.
674
- *
675
- * ---------------------------------------------------------------------------------
676
- * 2. CHURNED ACCOUNT SILENCING (everything hook)
677
- * ---------------------------------------------------------------------------------
678
- *
679
- * PATTERN: ~10% of users (determined by hash of distinct_id) go completely
680
- * silent after day 30. ALL of their events after month 1 are removed via
681
- * splice() - they simply vanish from the dataset.
682
- *
683
- * HOW TO FIND IT:
684
- * - Chart: unique users per week
685
- * - Retention analysis: D30 retention by cohort
686
- * - Compare: users active in month 1 vs. month 2
687
- * - Look for users with events ONLY in the first 30 days
688
- *
689
- * EXPECTED INSIGHT: A distinct cohort of ~300 users with activity exclusively
690
- * in the first month. No gradual decline - a hard cutoff at day 30.
691
- *
692
- * REAL-WORLD ANALOGUE: Trial users who never convert, accounts that churn
693
- * after initial evaluation period, or companies that lose budget approval.
694
- *
695
- * ---------------------------------------------------------------------------------
696
- * 3. ALERT ESCALATION REPLACEMENT (event hook)
697
- * ---------------------------------------------------------------------------------
698
- *
699
- * PATTERN: When an "alert triggered" event has severity "critical" or
700
- * "emergency", there is a 30% chance the event is REPLACED entirely with a
701
- * new event type: "incident created". This event type does NOT exist in the
702
- * events array - it only appears because of hooks.
703
- *
704
- * HOW TO FIND IT:
705
- * - Look for "incident created" events in the dataset (surprise event type)
706
- * - Correlate: incident created events have escalation_level (P1, P2),
707
- * teams_paged, incident_id, and auto_escalated: true
708
- * - Compare: ratio of critical/emergency alerts to incident creations
709
- *
710
- * EXPECTED INSIGHT: Approximately 30% of critical/emergency alerts escalate
711
- * into formal incidents. The "incident created" event is a hidden event type
712
- * that analysts must discover through exploration.
713
- *
714
- * REAL-WORLD ANALOGUE: Automated escalation systems that create incident
715
- * records from high-severity alerts (PagerDuty, OpsGenie workflows).
716
- *
717
- * ---------------------------------------------------------------------------------
718
- * 4. INTEGRATION USERS SUCCEED (everything hook)
719
- * ---------------------------------------------------------------------------------
720
- *
721
- * PATTERN: Users who have configured BOTH Slack AND PagerDuty integrations
722
- * respond to and resolve alerts significantly faster:
723
- * - alert_acknowledged response_time_mins reduced by 60%
724
- * - alert_resolved resolution_time_mins reduced by 50%
725
- * - Affected events tagged with integrated_team: true
726
- *
727
- * HOW TO FIND IT:
728
- * - Segment users by: has "integration configured" for both "slack" AND "pagerduty"
729
- * - Compare: average response_time_mins on alert acknowledged
730
- * - Compare: average resolution_time_mins on alert resolved
731
- * - Filter: integrated_team = true
732
- *
733
- * EXPECTED INSIGHT: Users with both integrations have median response time
734
- * ~60% lower than baseline. This is a two-feature combination effect.
735
- *
736
- * REAL-WORLD ANALOGUE: Tool integration stacks that compound productivity
737
- * (e.g., CI/CD + monitoring + alerting creating faster MTTR).
738
- *
739
- * ---------------------------------------------------------------------------------
740
- * 5. DOCS READERS DEPLOY MORE (everything hook)
741
- * ---------------------------------------------------------------------------------
742
- *
743
- * PATTERN: Users who view "best_practices" documentation 3 or more times get
744
- * 2-3 extra "service deployed" events with environment: "production" spliced
745
- * into their event stream. Tagged with docs_informed: true.
746
- *
747
- * HOW TO FIND IT:
748
- * - Segment users by: count of "documentation viewed" where doc_section = "best_practices" >= 3
749
- * - Compare: count of "service deployed" where environment = "production"
750
- * - Filter: docs_informed = true
751
- *
752
- * EXPECTED INSIGHT: Users who read best practices documentation 3+ times
753
- * deploy more services to production, suggesting docs drive confidence
754
- * and adoption.
755
- *
756
- * REAL-WORLD ANALOGUE: Documentation engagement as a leading indicator of
757
- * product adoption (developer tools where docs reading predicts usage).
758
- *
759
- * ---------------------------------------------------------------------------------
760
- * 6. COST OVERRUN PATTERN (event hook - closure state)
761
- * ---------------------------------------------------------------------------------
762
- *
763
- * PATTERN: When a "cost report generated" event has cost_change_percent > 25,
764
- * the user is stored in a module-level Map. When that same user later triggers
765
- * an "infrastructure scaled" event, the scale_direction is forced to "down"
766
- * (cost-cutting reaction). Uses closure-based state tracking across separate
767
- * hook calls.
768
- *
769
- * HOW TO FIND IT:
770
- * - Filter: cost_report_generated where budget_exceeded = true
771
- * - Correlate: subsequent infrastructure_scaled where cost_reaction = true
772
- * - Compare: scale_direction distribution for cost_reaction users vs. others
773
- *
774
- * EXPECTED INSIGHT: Users who experience cost overruns (>25% increase)
775
- * consistently scale down their infrastructure afterward. The Map-based
776
- * tracking creates a causal chain across separate events.
777
- *
778
- * REAL-WORLD ANALOGUE: Cloud cost management behavior - teams that exceed
779
- * budgets immediately react by reducing resource allocation.
780
- *
781
- * ---------------------------------------------------------------------------------
782
- * 7. FAILED DEPLOYMENT RECOVERY (event hook - closure state)
783
- * ---------------------------------------------------------------------------------
784
- *
785
- * PATTERN: When a deployment pipeline fails, the user is stored in a
786
- * module-level Map. Their next successful deployment has duration_sec
787
- * multiplied by 1.5x (recovery deploys are slower/more careful). Tagged
788
- * with recovery_deployment: true.
789
- *
790
- * HOW TO FIND IT:
791
- * - Filter: deployment_pipeline_run where recovery_deployment = true
792
- * - Compare: average duration_sec for recovery vs. normal deployments
793
- * - Sequence: look for failed -> success pairs per user
794
- *
795
- * EXPECTED INSIGHT: Recovery deployments after failures take 50% longer
796
- * than normal deployments, reflecting more cautious deployment practices.
797
- *
798
- * REAL-WORLD ANALOGUE: Post-incident deployment behavior - engineers take
799
- * extra care after a failed deploy, adding more checks and review steps.
800
- *
801
- * ---------------------------------------------------------------------------------
802
- * 8. ENTERPRISE VS STARTUP (user hook)
803
- * ---------------------------------------------------------------------------------
804
- *
805
- * PATTERN: Based on company_size, users get additional profile properties:
806
- * - enterprise: seat_count (50-500), annual_contract_value (50K-500K), customer_success_manager: true
807
- * - mid_market: seat_count (10-50), annual_contract_value (12K-50K)
808
- * - smb: seat_count (3-10), annual_contract_value (3.6K-12K)
809
- * - startup: seat_count (1-5), annual_contract_value (0-3.6K)
810
- * - All users get customer_health_score (1-100)
811
- *
812
- * HOW TO FIND IT:
813
- * - Segment users by: company_size
814
- * - Compare: annual_contract_value distribution
815
- * - Compare: seat_count ranges
816
- * - Filter: customer_success_manager = true (enterprise only)
817
- *
818
- * EXPECTED INSIGHT: Clear segmentation of user base by company size with
819
- * corresponding ACV and seat count distributions. Enterprise customers
820
- * uniquely have dedicated CSMs.
821
- *
822
- * REAL-WORLD ANALOGUE: B2B SaaS customer segmentation where company size
823
- * directly determines contract value, support tier, and expansion potential.
824
- *
825
- * =================================================================================
826
- * ADVANCED ANALYSIS IDEAS
827
- * =================================================================================
828
- *
829
- * CROSS-HOOK PATTERNS:
830
- *
831
- * 1. Churned + Enterprise: Do churned accounts (Hook #2) skew toward startups
832
- * or are enterprise accounts also silenced? Cross-reference company_size
833
- * with the ~10% churn cohort.
834
- *
835
- * 2. Integration + Cost: Do teams with full integrations (Hook #4) also manage
836
- * costs better (Hook #6)? Integrated teams may detect cost overruns faster.
837
- *
838
- * 3. Docs + Deploys + Failures: Do docs readers (Hook #5) have fewer failed
839
- * deployments (Hook #7)? Best practices readers may deploy more carefully.
840
- *
841
- * 4. Quarter Spike + Churn: Are quarter-end upgrades (Hook #1) correlated with
842
- * accounts that later churn? False expansion before abandonment.
843
- *
844
- * 5. Enterprise Recovery: Do enterprise customers (Hook #8) recover from failed
845
- * deployments (Hook #7) differently than startups?
846
- *
847
- * COHORT ANALYSIS:
848
- *
849
- * - Cohort by company_size: Compare all metrics across startup/smb/mid_market/enterprise
850
- * - Cohort by plan_tier: Free vs. Team vs. Business vs. Enterprise engagement
851
- * - Cohort by cloud_provider: AWS vs. GCP vs. Azure deployment and alert patterns
852
- * - Cohort by primary_role: Engineer vs. SRE vs. DevOps vs. Manager behaviors
853
- *
854
- * FUNNEL ANALYSIS:
855
- *
856
- * - Onboarding: workspace created -> service deployed -> dashboard viewed
857
- * Compare by company_size and plan_tier
858
- * - Incident Response: alert triggered -> acknowledged -> resolved
859
- * Compare integrated_team vs. non-integrated response times
860
- * - Deployment: pipeline run -> service deployed -> dashboard viewed
861
- * Compare recovery_deployment vs. normal deployment success
862
- *
863
- * KEY METRICS TO TRACK:
864
- *
865
- * - MTTR (Mean Time To Resolve): alert triggered -> alert resolved duration
866
- * - Deployment Frequency: service deployed events per user per week
867
- * - Deployment Success Rate: pipeline success vs. failure ratio
868
- * - Cost Efficiency: total_cost trend over time per company
869
- * - Feature Adoption: integration configured events by type
870
- * - Documentation Engagement: documentation viewed by section
871
- *
872
- * =================================================================================
873
- * EXPECTED METRICS SUMMARY
874
- * =================================================================================
875
- *
876
- * Hook | Metric | Baseline | Hook Effect | Ratio
877
- * -------------------------|--------------------------|-----------|----------------|------
878
- * End-of-Quarter Spike | Plan upgrades/day | ~2/day | ~8/day | 4x
879
- * Churned Accounts | Users active month 2 | 100% | 90% | 0.9x
880
- * Alert Escalation | Incidents from alerts | 0% | ~30% of crit | new
881
- * Integration Users | MTTR (minutes) | ~300 | ~150 | 0.5x
882
- * Docs Readers | Prod deploys/user | ~3 | ~5-6 | 1.8x
883
- * Cost Overrun | Scale-down after overrun | 50% | 100% | 2x
884
- * Failed Deploy Recovery | Deploy duration (sec) | ~500 | ~750 | 1.5x
885
- * Enterprise vs Startup | ACV range | $0-3.6K | $50K-500K | 100x+
886
- *
887
- * =================================================================================
888
- * HOW TO RUN THIS DUNGEON
889
- * =================================================================================
890
- *
891
- * From the dm4 root directory:
892
- *
893
- * npm start
894
- *
895
- * Or programmatically:
896
- *
897
- * import generate from './index.js';
898
- * import config from './dungeons/harness-sass.js';
899
- * const results = await generate(config);
900
- *
901
- * =================================================================================
902
- * TECHNICAL NOTES
903
- * =================================================================================
904
- *
905
- * - Module-level Maps (costOverrunUsers, failedDeployUsers) provide closure-based
906
- * state tracking across individual event hook calls. This is the key differentiator
907
- * for this dungeon - hooks 6 and 7 maintain state between separate invocations.
908
- *
909
- * - Hook #3 creates "incident created" events that do NOT exist in the events array.
910
- * This event type only appears because of hook-based event replacement.
911
- *
912
- * - Hook #2 uses splice() in the "everything" handler to remove events after day 30
913
- * for ~10% of users. This creates accounts with a hard activity cutoff - complete silence.
914
- *
915
- * - The "everything" hooks (2, 4, and 5) operate on the full user event array, enabling
916
- * two-pass analysis: first identify patterns, then modify events accordingly.
917
- *
918
- * - Desktop/browser only: hasAndroidDevices and hasIOSDevices are both false,
919
- * reflecting the B2B SaaS reality that CloudForge is used from workstations.
920
- *
921
- * =================================================================================
922
- */