npm - @elizaos/training - Versions diffs - 2.0.0-alpha.13 → 2.0.0-alpha.15 - Mend

@elizaos/training 2.0.0-alpha.13 → 2.0.0-alpha.15

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87)

package/package.json +2 -2
package/research-output/training-runs/training-run-1773726941205.json +38 -0
package/scripts/rank_trajectories.ts +0 -1
package/scripts/run_task_benchmark.ts +4 -11
package/src/adapter.ts +96 -49
package/src/archetypes/ArchetypeConfigService.ts +188 -185
package/src/archetypes/derive-archetype.ts +47 -47
package/src/archetypes/index.ts +2 -2
package/src/benchmark/ArchetypeMatchupBenchmark.ts +70 -70
package/src/benchmark/BenchmarkChartGenerator.ts +70 -69
package/src/benchmark/BenchmarkDataGenerator.ts +136 -136
package/src/benchmark/BenchmarkDataViewer.ts +32 -30
package/src/benchmark/BenchmarkHistoryService.ts +13 -12
package/src/benchmark/BenchmarkRunner.ts +87 -83
package/src/benchmark/BenchmarkValidator.ts +48 -46
package/src/benchmark/FastEvalRunner.ts +17 -16
package/src/benchmark/MetricsValidator.ts +20 -21
package/src/benchmark/MetricsVisualizer.ts +92 -85
package/src/benchmark/ModelBenchmarkService.ts +90 -82
package/src/benchmark/ModelRegistry.ts +44 -44
package/src/benchmark/RulerBenchmarkIntegration.ts +24 -24
package/src/benchmark/SimulationA2AInterface.ts +118 -118
package/src/benchmark/SimulationEngine.ts +51 -51
package/src/benchmark/TaskRunner.ts +87 -79
package/src/benchmark/__tests__/BenchmarkRunner.test.ts +80 -80
package/src/benchmark/__tests__/HeadToHead.test.ts +26 -26
package/src/benchmark/index.ts +27 -27
package/src/benchmark/parseSimulationMetrics.ts +32 -32
package/src/benchmark/simulation-types.ts +10 -10
package/src/dependencies.ts +34 -34
package/src/generation/TrajectoryGenerator.ts +39 -37
package/src/generation/index.ts +1 -1
package/src/huggingface/HuggingFaceDatasetUploader.ts +72 -72
package/src/huggingface/HuggingFaceIntegrationService.ts +59 -53
package/src/huggingface/HuggingFaceModelUploader.ts +60 -59
package/src/huggingface/index.ts +6 -6
package/src/huggingface/shared/HuggingFaceUploadUtil.ts +32 -32
package/src/index.ts +27 -27
package/src/init-training.ts +6 -6
package/src/metrics/TrajectoryMetricsExtractor.ts +70 -71
package/src/metrics/__tests__/TrajectoryMetricsExtractor.test.ts +182 -182
package/src/metrics/index.ts +2 -2
package/src/rubrics/__tests__/index.test.ts +73 -73
package/src/rubrics/ass-kisser.ts +6 -6
package/src/rubrics/degen.ts +6 -6
package/src/rubrics/goody-twoshoes.ts +6 -6
package/src/rubrics/index.ts +50 -50
package/src/rubrics/information-trader.ts +6 -6
package/src/rubrics/infosec.ts +6 -6
package/src/rubrics/liar.ts +6 -6
package/src/rubrics/perps-trader.ts +6 -6
package/src/rubrics/researcher.ts +6 -6
package/src/rubrics/scammer.ts +6 -6
package/src/rubrics/social-butterfly.ts +7 -7
package/src/rubrics/super-predictor.ts +6 -6
package/src/rubrics/trader.ts +5 -5
package/src/scoring/ArchetypeScoringService.ts +56 -54
package/src/scoring/JudgePromptBuilder.ts +96 -96
package/src/scoring/LLMJudgeCache.ts +26 -23
package/src/scoring/index.ts +3 -3
package/src/training/AutomationPipeline.ts +149 -140
package/src/training/BenchmarkService.ts +49 -45
package/src/training/ConfigValidator.ts +38 -32
package/src/training/MarketOutcomesTracker.ts +22 -12
package/src/training/ModelDeployer.ts +15 -15
package/src/training/ModelFetcher.ts +7 -7
package/src/training/ModelSelectionService.ts +32 -32
package/src/training/ModelUsageVerifier.ts +31 -24
package/src/training/MultiModelOrchestrator.ts +44 -44
package/src/training/RLModelConfig.ts +57 -57
package/src/training/RewardBackpropagationService.ts +18 -17
package/src/training/RulerScoringService.ts +73 -72
package/src/training/TrainingMonitor.ts +29 -29
package/src/training/TrajectoryRecorder.ts +25 -27
package/src/training/__tests__/TrajectoryRecorder.test.ts +105 -105
package/src/training/index.ts +36 -36
package/src/training/logRLConfig.ts +7 -7
package/src/training/pipeline.ts +13 -16
package/src/training/storage/ModelStorageService.ts +32 -32
package/src/training/storage/TrainingDataArchiver.ts +21 -21
package/src/training/storage/index.ts +2 -2
package/src/training/types.ts +6 -6
package/src/training/window-utils.ts +14 -14
package/src/utils/index.ts +7 -7
package/src/utils/logger.ts +5 -5
package/src/utils/snowflake.ts +1 -1
package/src/utils/synthetic-detector.ts +7 -7

package/src/archetypes/derive-archetype.ts CHANGED Viewed

@@ -7,7 +7,7 @@
  * @packageDocumentation
  */
-import { getAvailableArchetypes, normalizeArchetype } from '../rubrics';
+import { getAvailableArchetypes, normalizeArchetype } from "../rubrics";
 /**
  * NPC characteristics used for archetype derivation
@@ -29,28 +29,28 @@ export interface NPCCharacteristics {
  */
 const ROLE_TO_ARCHETYPE: Record<string, string> = {
   // High-reliability roles → ethical archetypes
-  insider: 'information-trader',
-  expert: 'researcher',
-  whistleblower: 'goody-twoshoes',
-  analyst: 'researcher',
+  insider: "information-trader",
+  expert: "researcher",
+  whistleblower: "goody-twoshoes",
+  analyst: "researcher",
   // Media/content roles
-  journalist: 'social-butterfly',
-  reporter: 'social-butterfly',
-  influencer: 'social-butterfly',
+  journalist: "social-butterfly",
+  reporter: "social-butterfly",
+  influencer: "social-butterfly",
   // Low-reliability roles → deceptive archetypes
-  deceiver: 'scammer',
-  politician: 'liar',
-  conspiracy: 'liar',
+  deceiver: "scammer",
+  politician: "liar",
+  conspiracy: "liar",
   // Trading-focused roles
-  trader: 'trader',
-  investor: 'trader',
-  speculator: 'degen',
+  trader: "trader",
+  investor: "trader",
+  speculator: "degen",
   // Default fallback
-  unknown: 'trader',
+  unknown: "trader",
 };
 /**
@@ -64,57 +64,57 @@ const PERSONALITY_KEYWORDS: Array<{
 }> = [
   // High priority - distinctive personalities
   {
-    keywords: ['manipulative', 'deceptive', 'cunning', 'unethical'],
-    archetype: 'scammer',
+    keywords: ["manipulative", "deceptive", "cunning", "unethical"],
+    archetype: "scammer",
     priority: 10,
   },
   {
-    keywords: ['reckless', 'impulsive', 'yolo', 'fomo', 'aggressive'],
-    archetype: 'degen',
+    keywords: ["reckless", "impulsive", "yolo", "fomo", "aggressive"],
+    archetype: "degen",
     priority: 10,
   },
   {
-    keywords: ['honest', 'ethical', 'helpful', 'transparent', 'altruistic'],
-    archetype: 'goody-twoshoes',
+    keywords: ["honest", "ethical", "helpful", "transparent", "altruistic"],
+    archetype: "goody-twoshoes",
     priority: 10,
   },
   {
-    keywords: ['thorough', 'meticulous', 'analytical', 'data-driven'],
-    archetype: 'researcher',
+    keywords: ["thorough", "meticulous", "analytical", "data-driven"],
+    archetype: "researcher",
     priority: 8,
   },
   // Medium priority - trading styles
   {
-    keywords: ['disciplined', 'methodical', 'patient', 'risk-averse'],
-    archetype: 'trader',
+    keywords: ["disciplined", "methodical", "patient", "risk-averse"],
+    archetype: "trader",
     priority: 5,
   },
   {
-    keywords: ['social', 'networker', 'outgoing', 'community'],
-    archetype: 'social-butterfly',
+    keywords: ["social", "networker", "outgoing", "community"],
+    archetype: "social-butterfly",
     priority: 5,
   },
   {
-    keywords: ['flattering', 'agreeable', 'sycophantic', 'pleasing'],
-    archetype: 'ass-kisser',
+    keywords: ["flattering", "agreeable", "sycophantic", "pleasing"],
+    archetype: "ass-kisser",
     priority: 5,
   },
   // Low priority - general
   {
-    keywords: ['suspicious', 'secretive', 'paranoid', 'security'],
-    archetype: 'infosec',
+    keywords: ["suspicious", "secretive", "paranoid", "security"],
+    archetype: "infosec",
     priority: 3,
   },
   {
-    keywords: ['leverage', 'perpetual', 'futures', 'derivatives'],
-    archetype: 'perps-trader',
+    keywords: ["leverage", "perpetual", "futures", "derivatives"],
+    archetype: "perps-trader",
     priority: 3,
   },
   {
-    keywords: ['prediction', 'forecast', 'oracle', 'prophet'],
-    archetype: 'super-predictor',
+    keywords: ["prediction", "forecast", "oracle", "prophet"],
+    archetype: "super-predictor",
     priority: 3,
   },
 ];
@@ -155,7 +155,7 @@ export function deriveArchetype(npc: NPCCharacteristics): string {
     npc.willingToLie === true
   ) {
     // Confirmed deceptive: low reliability + actively willing to lie
-    return 'scammer';
+    return "scammer";
   }
   // Note: High reliability is factored into personality analysis below, not used as an override.
@@ -168,7 +168,7 @@ export function deriveArchetype(npc: NPCCharacteristics): string {
     for (const mapping of PERSONALITY_KEYWORDS) {
       const matchCount = mapping.keywords.filter((keyword) =>
-        personalityLower.includes(keyword)
+        personalityLower.includes(keyword),
       ).length;
       if (matchCount > 0) {
@@ -190,19 +190,19 @@ export function deriveArchetype(npc: NPCCharacteristics): string {
   // 4. Check domain for trading specialization
   if (npc.domain && npc.domain.length > 0) {
     const domains = npc.domain.map((d) => d.toLowerCase());
-    if (domains.includes('trading') || domains.includes('finance')) {
-      return 'trader';
+    if (domains.includes("trading") || domains.includes("finance")) {
+      return "trader";
     }
-    if (domains.includes('technology') || domains.includes('tech')) {
-      return 'researcher';
+    if (domains.includes("technology") || domains.includes("tech")) {
+      return "researcher";
     }
-    if (domains.includes('media') || domains.includes('social')) {
-      return 'social-butterfly';
+    if (domains.includes("media") || domains.includes("social")) {
+      return "social-butterfly";
     }
   }
   // 5. Default fallback
-  return 'trader';
+  return "trader";
 }
 /**
@@ -218,7 +218,7 @@ export type ArchetypeResolver = (npcId: string) => string;
  * @returns Function that resolves archetype from NPC ID
  */
 export function createArchetypeResolver(
-  npcs: NPCCharacteristics[]
+  npcs: NPCCharacteristics[],
 ): ArchetypeResolver {
   const archetypeMap = new Map<string, string>();
@@ -227,7 +227,7 @@ export function createArchetypeResolver(
   }
   return (npcId: string): string => {
-    return archetypeMap.get(npcId) ?? 'trader';
+    return archetypeMap.get(npcId) ?? "trader";
   };
 }
@@ -237,7 +237,7 @@ export function createArchetypeResolver(
  */
 export function getRoleArchetype(role: string): string {
   const normalized = role.toLowerCase().trim();
-  return ROLE_TO_ARCHETYPE[normalized] ?? 'trader';
+  return ROLE_TO_ARCHETYPE[normalized] ?? "trader";
 }
 /**

package/src/archetypes/index.ts CHANGED Viewed

@@ -10,7 +10,7 @@ export {
   ArchetypeConfigService,
   type ArchetypeTraits,
   archetypeConfigService,
-} from './ArchetypeConfigService';
+} from "./ArchetypeConfigService";
 export {
   type ArchetypeResolver,
@@ -19,4 +19,4 @@ export {
   getRoleArchetype,
   getValidArchetypes,
   type NPCCharacteristics,
-} from './derive-archetype';
+} from "./derive-archetype";

package/src/benchmark/ArchetypeMatchupBenchmark.ts CHANGED Viewed

@@ -12,18 +12,18 @@
 import {
   type ArchetypeConfig,
   ArchetypeConfigService,
-} from '../archetypes/ArchetypeConfigService';
+} from "../archetypes/ArchetypeConfigService";
 import {
   createMultiModelOrchestrator,
   type MultiModelOrchestrator,
-} from '../training/MultiModelOrchestrator';
-import { logger } from '../utils/logger';
+} from "../training/MultiModelOrchestrator";
+import { logger } from "../utils/logger";
 import {
   type BenchmarkConfig,
   BenchmarkDataGenerator,
   type BenchmarkGameSnapshot,
   type Tick,
-} from './BenchmarkDataGenerator';
+} from "./BenchmarkDataGenerator";
 /**
  * Individual agent in the matchup simulation
@@ -95,7 +95,7 @@ export interface MatchupBenchmarkResult {
   headToHead: ArchetypeVsResult[];
   /** Market condition during benchmark */
-  marketCondition: 'bull' | 'bear' | 'volatile' | 'stable';
+  marketCondition: "bull" | "bear" | "volatile" | "stable";
   /** Insights derived from the matchup */
   insights: string[];
@@ -106,7 +106,7 @@ export interface MatchupBenchmarkResult {
  */
 export interface MatchupBenchmarkConfig {
   /** Archetypes to include in matchup (or 'all' for all archetypes) */
-  archetypes: string[] | 'all';
+  archetypes: string[] | "all";
   /** Number of agents per archetype */
   agentsPerArchetype: number;
@@ -118,7 +118,7 @@ export interface MatchupBenchmarkConfig {
   ticksPerRound: number;
   /** Market conditions to test */
-  marketConditions: Array<'bull' | 'bear' | 'volatile' | 'stable'>;
+  marketConditions: Array<"bull" | "bear" | "volatile" | "stable">;
   /** Available VRAM for model loading */
   availableVramGb: number;
@@ -140,7 +140,7 @@ export class ArchetypeMatchupBenchmark {
    * Get all archetypes to benchmark
    */
   private getArchetypes(): string[] {
-    if (this.config.archetypes === 'all') {
+    if (this.config.archetypes === "all") {
       return ArchetypeConfigService.getAvailableArchetypes();
     }
     return this.config.archetypes;
@@ -173,7 +173,7 @@ export class ArchetypeMatchupBenchmark {
    * Market condition affects seed to create different scenarios
    */
   private async generateBenchmarkData(
-    condition: 'bull' | 'bear' | 'volatile' | 'stable'
+    condition: "bull" | "bear" | "volatile" | "stable",
   ): Promise<BenchmarkGameSnapshot> {
     // Convert ticks to duration minutes (assuming 1 tick per second)
     const durationMinutes = Math.ceil(this.config.ticksPerRound / 60);
@@ -190,8 +190,8 @@ export class ArchetypeMatchupBenchmark {
     const benchmarkConfig: BenchmarkConfig = {
       durationMinutes,
       tickInterval: 1,
-      numPredictionMarkets: condition === 'volatile' ? 8 : 5,
-      numPerpetualMarkets: condition === 'volatile' ? 5 : 3,
+      numPredictionMarkets: condition === "volatile" ? 8 : 5,
+      numPerpetualMarkets: condition === "volatile" ? 5 : 3,
       numAgents: 10,
       seed: baseSeed + (Date.now() % 1000), // Semi-reproducible
     };
@@ -206,18 +206,18 @@ export class ArchetypeMatchupBenchmark {
   private async simulateRound(
     agents: MatchupAgent[],
     snapshot: BenchmarkGameSnapshot,
-    roundNumber: number
+    roundNumber: number,
   ): Promise<MatchupAgentResult[]> {
     const results: MatchupAgentResult[] = [];
     logger.info(
       `Simulating round ${roundNumber} with ${agents.length} agents`,
       { archetypes: [...new Set(agents.map((a) => a.archetype))] },
-      'ArchetypeMatchupBenchmark'
+      "ArchetypeMatchupBenchmark",
     );
     // Check if we should use real inference or simulation
-    const useRealInference = process.env.USE_REAL_INFERENCE === 'true';
+    const useRealInference = process.env.USE_REAL_INFERENCE === "true";
     if (useRealInference) {
       // Use real model inference via the orchestrator
@@ -247,7 +247,7 @@ export class ArchetypeMatchupBenchmark {
    */
   private async runAgentWithRealModel(
     agent: MatchupAgent,
-    snapshot: BenchmarkGameSnapshot
+    snapshot: BenchmarkGameSnapshot,
   ): Promise<MatchupAgentResult> {
     let totalPnl = 0;
     let totalTrades = 0;
@@ -275,20 +275,20 @@ export class ArchetypeMatchupBenchmark {
       // Parse the decision and simulate outcome
       const decision = this.parseAgentDecision(response.response);
-      if (decision.action === 'trade') {
+      if (decision.action === "trade") {
         totalTrades++;
         // Simulate trade outcome based on market conditions
         const marketTrend = this.getMarketTrend(tick);
         const isCorrectDirection =
-          (decision.direction === 'long' && marketTrend > 0) ||
-          (decision.direction === 'short' && marketTrend < 0);
+          (decision.direction === "long" && marketTrend > 0) ||
+          (decision.direction === "short" && marketTrend < 0);
         if (isCorrectDirection) {
           wins++;
           totalPnl += Math.abs(marketTrend) * 100 * (decision.confidence || 1);
         } else {
           totalPnl -= Math.abs(marketTrend) * 50 * (decision.confidence || 1);
         }
-      } else if (decision.action === 'post') {
+      } else if (decision.action === "post") {
         postsCreated++;
       }
     }
@@ -326,7 +326,7 @@ export class ArchetypeMatchupBenchmark {
     // Extract market prices from perpetual markets
     const marketPrices = Object.fromEntries(
-      state.perpetualMarkets.map((m) => [m.ticker, m.price])
+      state.perpetualMarkets.map((m) => [m.ticker, m.price]),
     );
     // Recent posts can serve as "news"
@@ -352,8 +352,8 @@ Respond with a JSON object containing:
    * Parse agent decision from model response
    */
   private parseAgentDecision(response: string): {
-    action: 'trade' | 'post' | 'observe';
-    direction?: 'long' | 'short';
+    action: "trade" | "post" | "observe";
+    direction?: "long" | "short";
     confidence?: number;
   } {
     try {
@@ -362,7 +362,7 @@ Respond with a JSON object containing:
       if (jsonMatch) {
         const parsed = JSON.parse(jsonMatch[0]);
         return {
-          action: parsed.action || 'observe',
+          action: parsed.action || "observe",
           direction: parsed.direction,
           confidence: parsed.confidence || 0.5,
         };
@@ -373,25 +373,25 @@ Respond with a JSON object containing:
     // Default behavior based on response content
     if (
-      response.toLowerCase().includes('trade') ||
-      response.toLowerCase().includes('buy') ||
-      response.toLowerCase().includes('sell')
+      response.toLowerCase().includes("trade") ||
+      response.toLowerCase().includes("buy") ||
+      response.toLowerCase().includes("sell")
     ) {
       return {
-        action: 'trade',
-        direction: response.toLowerCase().includes('short') ? 'short' : 'long',
+        action: "trade",
+        direction: response.toLowerCase().includes("short") ? "short" : "long",
         confidence: 0.5,
       };
     }
     if (
-      response.toLowerCase().includes('post') ||
-      response.toLowerCase().includes('share')
+      response.toLowerCase().includes("post") ||
+      response.toLowerCase().includes("share")
     ) {
-      return { action: 'post' };
+      return { action: "post" };
     }
-    return { action: 'observe' };
+    return { action: "observe" };
   }
   /**
@@ -403,7 +403,7 @@ Respond with a JSON object containing:
     if (state.perpetualMarkets.length === 0) return 0;
     const prices = Object.fromEntries(
-      state.perpetualMarkets.map((m) => [m.ticker, m.price])
+      state.perpetualMarkets.map((m) => [m.ticker, m.price]),
     );
     // Calculate average price change
@@ -422,7 +422,7 @@ Respond with a JSON object containing:
    */
   private simulateAgentPerformance(
     agent: MatchupAgent,
-    snapshot: BenchmarkGameSnapshot
+    snapshot: BenchmarkGameSnapshot,
   ): MatchupAgentResult {
     const config = agent.config;
     const tickCount = snapshot.ticks.length;
@@ -465,7 +465,7 @@ Respond with a JSON object containing:
    * Calculate head-to-head results between archetypes
    */
   private calculateHeadToHead(
-    allResults: MatchupAgentResult[][]
+    allResults: MatchupAgentResult[][],
   ): ArchetypeVsResult[] {
     const archetypes = this.getArchetypes();
     const headToHead: ArchetypeVsResult[] = [];
@@ -484,10 +484,10 @@ Respond with a JSON object containing:
         // Compare performance in each round
         for (const roundResults of allResults) {
           const arch1Results = roundResults.filter(
-            (r) => r.archetype === arch1
+            (r) => r.archetype === arch1,
           );
           const arch2Results = roundResults.filter(
-            (r) => r.archetype === arch2
+            (r) => r.archetype === arch2,
           );
           if (arch1Results.length === 0 || arch2Results.length === 0) continue;
@@ -532,8 +532,8 @@ Respond with a JSON object containing:
    * Calculate overall archetype rankings
    */
   private calculateRankings(
-    allResults: MatchupAgentResult[][]
-  ): MatchupBenchmarkResult['archetypeRankings'] {
+    allResults: MatchupAgentResult[][],
+  ): MatchupBenchmarkResult["archetypeRankings"] {
     const archetypes = this.getArchetypes();
     const rankings: Map<
       string,
@@ -593,9 +593,9 @@ Respond with a JSON object containing:
    * Generate insights from the matchup results
    */
   private generateInsights(
-    rankings: MatchupBenchmarkResult['archetypeRankings'],
+    rankings: MatchupBenchmarkResult["archetypeRankings"],
     headToHead: ArchetypeVsResult[],
-    marketCondition: string
+    marketCondition: string,
   ): string[] {
     const insights: string[] = [];
@@ -603,7 +603,7 @@ Respond with a JSON object containing:
     const topRanking = rankings[0];
     if (topRanking) {
       insights.push(
-        `${topRanking.archetype} performed best in ${marketCondition} conditions with avg rank ${topRanking.avgRank.toFixed(2)}`
+        `${topRanking.archetype} performed best in ${marketCondition} conditions with avg rank ${topRanking.avgRank.toFixed(2)}`,
       );
     }
@@ -611,11 +611,11 @@ Respond with a JSON object containing:
     for (const h2h of headToHead) {
       if (h2h.winRate1 >= 0.7) {
         insights.push(
-          `${h2h.archetype1} dominates ${h2h.archetype2} (${(h2h.winRate1 * 100).toFixed(0)}% win rate)`
+          `${h2h.archetype1} dominates ${h2h.archetype2} (${(h2h.winRate1 * 100).toFixed(0)}% win rate)`,
         );
       } else if (h2h.winRate2 >= 0.7) {
         insights.push(
-          `${h2h.archetype2} dominates ${h2h.archetype1} (${(h2h.winRate2 * 100).toFixed(0)}% win rate)`
+          `${h2h.archetype2} dominates ${h2h.archetype1} (${(h2h.winRate2 * 100).toFixed(0)}% win rate)`,
         );
       }
     }
@@ -657,9 +657,9 @@ Respond with a JSON object containing:
         if (bWins) {
           for (const c of bWins) {
             const cWins = wins.get(c);
-            if (cWins && cWins.has(a)) {
+            if (cWins?.has(a)) {
               insights.push(
-                `Counter triangle found: ${a} → ${b} → ${c} → ${a}`
+                `Counter triangle found: ${a} → ${b} → ${c} → ${a}`,
               );
             }
           }
@@ -678,14 +678,14 @@ Respond with a JSON object containing:
     const results: MatchupBenchmarkResult[] = [];
     logger.info(
-      'Starting Archetype Matchup Benchmark',
+      "Starting Archetype Matchup Benchmark",
       {
         archetypes: this.getArchetypes(),
         agentsPerArchetype: this.config.agentsPerArchetype,
         rounds: this.config.rounds,
         conditions: this.config.marketConditions,
       },
-      'ArchetypeMatchupBenchmark'
+      "ArchetypeMatchupBenchmark",
     );
     const agents = this.createAgents();
@@ -694,7 +694,7 @@ Respond with a JSON object containing:
       logger.info(
         `Testing in ${condition} market conditions`,
         {},
-        'ArchetypeMatchupBenchmark'
+        "ArchetypeMatchupBenchmark",
       );
       const allRoundResults: MatchupAgentResult[][] = [];
@@ -704,7 +704,7 @@ Respond with a JSON object containing:
         const roundResults = await this.simulateRound(
           agents,
           snapshot,
-          round + 1
+          round + 1,
         );
         allRoundResults.push(roundResults);
       }
@@ -734,7 +734,7 @@ Respond with a JSON object containing:
           topArchetype: rankings[0]?.archetype,
           avgPnl: rankings[0]?.avgPnl.toFixed(2),
         },
-        'ArchetypeMatchupBenchmark'
+        "ArchetypeMatchupBenchmark",
       );
     }
@@ -743,13 +743,13 @@ Respond with a JSON object containing:
     const totalDuration = Date.now() - startTime;
     logger.info(
-      'Archetype Matchup Benchmark complete',
+      "Archetype Matchup Benchmark complete",
       {
         totalDurationMs: totalDuration,
         conditionsTested: this.config.marketConditions.length,
         totalRounds: this.config.rounds * this.config.marketConditions.length,
       },
-      'ArchetypeMatchupBenchmark'
+      "ArchetypeMatchupBenchmark",
     );
     return results;
@@ -760,49 +760,49 @@ Respond with a JSON object containing:
    */
   static generateReport(results: MatchupBenchmarkResult[]): string {
     const lines: string[] = [];
-    lines.push('# Archetype Matchup Benchmark Report\n');
+    lines.push("# Archetype Matchup Benchmark Report\n");
     for (const result of results) {
       lines.push(
-        `## ${result.marketCondition.toUpperCase()} Market Conditions\n`
+        `## ${result.marketCondition.toUpperCase()} Market Conditions\n`,
       );
       // Rankings table
-      lines.push('### Overall Rankings\n');
-      lines.push('| Rank | Archetype | Avg PnL | Win Rate |');
-      lines.push('|------|-----------|---------|----------|');
+      lines.push("### Overall Rankings\n");
+      lines.push("| Rank | Archetype | Avg PnL | Win Rate |");
+      lines.push("|------|-----------|---------|----------|");
       for (const ranking of result.archetypeRankings) {
         lines.push(
-          `| ${ranking.avgRank.toFixed(1)} | ${ranking.archetype} | ${ranking.avgPnl.toFixed(2)} | ${(ranking.winRate * 100).toFixed(1)}% |`
+          `| ${ranking.avgRank.toFixed(1)} | ${ranking.archetype} | ${ranking.avgPnl.toFixed(2)} | ${(ranking.winRate * 100).toFixed(1)}% |`,
         );
       }
-      lines.push('');
+      lines.push("");
       // Head-to-head table
-      lines.push('### Head-to-Head Results\n');
-      lines.push('| Matchup | Winner | Win Rate |');
-      lines.push('|---------|--------|----------|');
+      lines.push("### Head-to-Head Results\n");
+      lines.push("| Matchup | Winner | Win Rate |");
+      lines.push("|---------|--------|----------|");
       for (const h2h of result.headToHead) {
         const winner =
           h2h.winRate1 > h2h.winRate2 ? h2h.archetype1 : h2h.archetype2;
         const winRate = Math.max(h2h.winRate1, h2h.winRate2);
         lines.push(
-          `| ${h2h.archetype1} vs ${h2h.archetype2} | ${winner} | ${(winRate * 100).toFixed(1)}% |`
+          `| ${h2h.archetype1} vs ${h2h.archetype2} | ${winner} | ${(winRate * 100).toFixed(1)}% |`,
         );
       }
-      lines.push('');
+      lines.push("");
       // Insights
       if (result.insights.length > 0) {
-        lines.push('### Key Insights\n');
+        lines.push("### Key Insights\n");
         for (const insight of result.insights) {
           lines.push(`- ${insight}`);
         }
-        lines.push('');
+        lines.push("");
       }
     }
-    return lines.join('\n');
+    return lines.join("\n");
   }
 }
@@ -813,11 +813,11 @@ export async function runQuickMatchupBenchmark(): Promise<
   MatchupBenchmarkResult[]
 > {
   const benchmark = new ArchetypeMatchupBenchmark({
-    archetypes: 'all',
+    archetypes: "all",
     agentsPerArchetype: 2,
     rounds: 5,
     ticksPerRound: 100,
-    marketConditions: ['bull', 'bear', 'volatile', 'stable'],
+    marketConditions: ["bull", "bear", "volatile", "stable"],
     availableVramGb: 16,
   });