npm - @peakinfer/cli - Versions diffs - 1.0.133 - Mend

@peakinfer/cli 1.0.133

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (367) hide show

package/.claude/settings.local.json +8 -0
package/.env.example +6 -0
package/.github/workflows/peakinfer.yml +64 -0
package/CHANGELOG.md +31 -0
package/LICENSE +190 -0
package/README.md +335 -0
package/data/inferencemax.json +274 -0
package/dist/agent-analyzer.d.ts +45 -0
package/dist/agent-analyzer.d.ts.map +1 -0
package/dist/agent-analyzer.js +374 -0
package/dist/agent-analyzer.js.map +1 -0
package/dist/agent.d.ts +76 -0
package/dist/agent.d.ts.map +1 -0
package/dist/agent.js +965 -0
package/dist/agent.js.map +1 -0
package/dist/agents/correlation-analyzer.d.ts +34 -0
package/dist/agents/correlation-analyzer.d.ts.map +1 -0
package/dist/agents/correlation-analyzer.js +261 -0
package/dist/agents/correlation-analyzer.js.map +1 -0
package/dist/agents/index.d.ts +91 -0
package/dist/agents/index.d.ts.map +1 -0
package/dist/agents/index.js +111 -0
package/dist/agents/index.js.map +1 -0
package/dist/agents/runtime-analyzer.d.ts +38 -0
package/dist/agents/runtime-analyzer.d.ts.map +1 -0
package/dist/agents/runtime-analyzer.js +244 -0
package/dist/agents/runtime-analyzer.js.map +1 -0
package/dist/analysis-types.d.ts +500 -0
package/dist/analysis-types.d.ts.map +1 -0
package/dist/analysis-types.js +11 -0
package/dist/analysis-types.js.map +1 -0
package/dist/analytics.d.ts +25 -0
package/dist/analytics.d.ts.map +1 -0
package/dist/analytics.js +94 -0
package/dist/analytics.js.map +1 -0
package/dist/analyzer.d.ts +48 -0
package/dist/analyzer.d.ts.map +1 -0
package/dist/analyzer.js +547 -0
package/dist/analyzer.js.map +1 -0
package/dist/artifacts.d.ts +44 -0
package/dist/artifacts.d.ts.map +1 -0
package/dist/artifacts.js +165 -0
package/dist/artifacts.js.map +1 -0
package/dist/benchmarks/index.d.ts +88 -0
package/dist/benchmarks/index.d.ts.map +1 -0
package/dist/benchmarks/index.js +205 -0
package/dist/benchmarks/index.js.map +1 -0
package/dist/cli.d.ts +3 -0
package/dist/cli.d.ts.map +1 -0
package/dist/cli.js +427 -0
package/dist/cli.js.map +1 -0
package/dist/commands/ci.d.ts +19 -0
package/dist/commands/ci.d.ts.map +1 -0
package/dist/commands/ci.js +253 -0
package/dist/commands/ci.js.map +1 -0
package/dist/commands/config.d.ts +16 -0
package/dist/commands/config.d.ts.map +1 -0
package/dist/commands/config.js +249 -0
package/dist/commands/config.js.map +1 -0
package/dist/commands/demo.d.ts +15 -0
package/dist/commands/demo.d.ts.map +1 -0
package/dist/commands/demo.js +106 -0
package/dist/commands/demo.js.map +1 -0
package/dist/commands/export.d.ts +14 -0
package/dist/commands/export.d.ts.map +1 -0
package/dist/commands/export.js +209 -0
package/dist/commands/export.js.map +1 -0
package/dist/commands/history.d.ts +15 -0
package/dist/commands/history.d.ts.map +1 -0
package/dist/commands/history.js +389 -0
package/dist/commands/history.js.map +1 -0
package/dist/commands/template.d.ts +14 -0
package/dist/commands/template.d.ts.map +1 -0
package/dist/commands/template.js +341 -0
package/dist/commands/template.js.map +1 -0
package/dist/commands/validate-map.d.ts +12 -0
package/dist/commands/validate-map.d.ts.map +1 -0
package/dist/commands/validate-map.js +274 -0
package/dist/commands/validate-map.js.map +1 -0
package/dist/commands/whatif.d.ts +17 -0
package/dist/commands/whatif.d.ts.map +1 -0
package/dist/commands/whatif.js +206 -0
package/dist/commands/whatif.js.map +1 -0
package/dist/comparison.d.ts +38 -0
package/dist/comparison.d.ts.map +1 -0
package/dist/comparison.js +223 -0
package/dist/comparison.js.map +1 -0
package/dist/config.d.ts +42 -0
package/dist/config.d.ts.map +1 -0
package/dist/config.js +158 -0
package/dist/config.js.map +1 -0
package/dist/connectors/helicone.d.ts +9 -0
package/dist/connectors/helicone.d.ts.map +1 -0
package/dist/connectors/helicone.js +106 -0
package/dist/connectors/helicone.js.map +1 -0
package/dist/connectors/index.d.ts +37 -0
package/dist/connectors/index.d.ts.map +1 -0
package/dist/connectors/index.js +65 -0
package/dist/connectors/index.js.map +1 -0
package/dist/connectors/langsmith.d.ts +9 -0
package/dist/connectors/langsmith.d.ts.map +1 -0
package/dist/connectors/langsmith.js +122 -0
package/dist/connectors/langsmith.js.map +1 -0
package/dist/connectors/types.d.ts +83 -0
package/dist/connectors/types.d.ts.map +1 -0
package/dist/connectors/types.js +98 -0
package/dist/connectors/types.js.map +1 -0
package/dist/cost-estimator.d.ts +46 -0
package/dist/cost-estimator.d.ts.map +1 -0
package/dist/cost-estimator.js +104 -0
package/dist/cost-estimator.js.map +1 -0
package/dist/costs.d.ts +57 -0
package/dist/costs.d.ts.map +1 -0
package/dist/costs.js +251 -0
package/dist/costs.js.map +1 -0
package/dist/counterfactuals.d.ts +29 -0
package/dist/counterfactuals.d.ts.map +1 -0
package/dist/counterfactuals.js +448 -0
package/dist/counterfactuals.js.map +1 -0
package/dist/enhancement-prompts.d.ts +41 -0
package/dist/enhancement-prompts.d.ts.map +1 -0
package/dist/enhancement-prompts.js +88 -0
package/dist/enhancement-prompts.js.map +1 -0
package/dist/envelopes.d.ts +20 -0
package/dist/envelopes.d.ts.map +1 -0
package/dist/envelopes.js +790 -0
package/dist/envelopes.js.map +1 -0
package/dist/format-normalizer.d.ts +71 -0
package/dist/format-normalizer.d.ts.map +1 -0
package/dist/format-normalizer.js +1331 -0
package/dist/format-normalizer.js.map +1 -0
package/dist/history.d.ts +79 -0
package/dist/history.d.ts.map +1 -0
package/dist/history.js +313 -0
package/dist/history.js.map +1 -0
package/dist/html.d.ts +11 -0
package/dist/html.d.ts.map +1 -0
package/dist/html.js +463 -0
package/dist/html.js.map +1 -0
package/dist/impact.d.ts +42 -0
package/dist/impact.d.ts.map +1 -0
package/dist/impact.js +443 -0
package/dist/impact.js.map +1 -0
package/dist/index.d.ts +26 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +34 -0
package/dist/index.js.map +1 -0
package/dist/insights.d.ts +5 -0
package/dist/insights.d.ts.map +1 -0
package/dist/insights.js +271 -0
package/dist/insights.js.map +1 -0
package/dist/joiner.d.ts +9 -0
package/dist/joiner.d.ts.map +1 -0
package/dist/joiner.js +247 -0
package/dist/joiner.js.map +1 -0
package/dist/orchestrator.d.ts +34 -0
package/dist/orchestrator.d.ts.map +1 -0
package/dist/orchestrator.js +827 -0
package/dist/orchestrator.js.map +1 -0
package/dist/pdf.d.ts +26 -0
package/dist/pdf.d.ts.map +1 -0
package/dist/pdf.js +84 -0
package/dist/pdf.js.map +1 -0
package/dist/prediction.d.ts +33 -0
package/dist/prediction.d.ts.map +1 -0
package/dist/prediction.js +316 -0
package/dist/prediction.js.map +1 -0
package/dist/prompts/loader.d.ts +38 -0
package/dist/prompts/loader.d.ts.map +1 -0
package/dist/prompts/loader.js +60 -0
package/dist/prompts/loader.js.map +1 -0
package/dist/renderer.d.ts +64 -0
package/dist/renderer.d.ts.map +1 -0
package/dist/renderer.js +923 -0
package/dist/renderer.js.map +1 -0
package/dist/runid.d.ts +57 -0
package/dist/runid.d.ts.map +1 -0
package/dist/runid.js +199 -0
package/dist/runid.js.map +1 -0
package/dist/runtime.d.ts +29 -0
package/dist/runtime.d.ts.map +1 -0
package/dist/runtime.js +366 -0
package/dist/runtime.js.map +1 -0
package/dist/scanner.d.ts +11 -0
package/dist/scanner.d.ts.map +1 -0
package/dist/scanner.js +426 -0
package/dist/scanner.js.map +1 -0
package/dist/templates.d.ts +120 -0
package/dist/templates.d.ts.map +1 -0
package/dist/templates.js +429 -0
package/dist/templates.js.map +1 -0
package/dist/tools/index.d.ts +153 -0
package/dist/tools/index.d.ts.map +1 -0
package/dist/tools/index.js +177 -0
package/dist/tools/index.js.map +1 -0
package/dist/types.d.ts +3647 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +703 -0
package/dist/types.js.map +1 -0
package/dist/version.d.ts +7 -0
package/dist/version.d.ts.map +1 -0
package/dist/version.js +23 -0
package/dist/version.js.map +1 -0
package/docs/demo-guide.md +423 -0
package/docs/events-format.md +295 -0
package/docs/inferencemap-spec.md +344 -0
package/docs/migration-v2.md +293 -0
package/fixtures/demo/precomputed.json +142 -0
package/fixtures/demo-project/README.md +52 -0
package/fixtures/demo-project/ai-service.ts +65 -0
package/fixtures/demo-project/sample-events.jsonl +15 -0
package/fixtures/demo-project/src/ai-service.ts +128 -0
package/fixtures/demo-project/src/llm-client.ts +155 -0
package/package.json +65 -0
package/prompts/agent-analyzer.yaml +47 -0
package/prompts/ci-gate.yaml +98 -0
package/prompts/correlation-analyzer.yaml +178 -0
package/prompts/format-normalizer.yaml +46 -0
package/prompts/peak-performance.yaml +180 -0
package/prompts/pr-comment.yaml +111 -0
package/prompts/runtime-analyzer.yaml +189 -0
package/prompts/unified-analyzer.yaml +241 -0
package/schemas/inference-map.v0.1.json +215 -0
package/scripts/benchmark.ts +394 -0
package/scripts/demo-v1.5.sh +158 -0
package/scripts/sync-from-site.sh +197 -0
package/scripts/validate-sync.sh +178 -0
package/src/agent-analyzer.ts +481 -0
package/src/agent.ts +1232 -0
package/src/agents/correlation-analyzer.ts +353 -0
package/src/agents/index.ts +235 -0
package/src/agents/runtime-analyzer.ts +343 -0
package/src/analysis-types.ts +558 -0
package/src/analytics.ts +100 -0
package/src/analyzer.ts +692 -0
package/src/artifacts.ts +218 -0
package/src/benchmarks/index.ts +309 -0
package/src/cli.ts +503 -0
package/src/commands/ci.ts +336 -0
package/src/commands/config.ts +288 -0
package/src/commands/demo.ts +175 -0
package/src/commands/export.ts +297 -0
package/src/commands/history.ts +425 -0
package/src/commands/template.ts +385 -0
package/src/commands/validate-map.ts +324 -0
package/src/commands/whatif.ts +272 -0
package/src/comparison.ts +283 -0
package/src/config.ts +188 -0
package/src/connectors/helicone.ts +164 -0
package/src/connectors/index.ts +93 -0
package/src/connectors/langsmith.ts +179 -0
package/src/connectors/types.ts +180 -0
package/src/cost-estimator.ts +146 -0
package/src/costs.ts +347 -0
package/src/counterfactuals.ts +516 -0
package/src/enhancement-prompts.ts +118 -0
package/src/envelopes.ts +814 -0
package/src/format-normalizer.ts +1486 -0
package/src/history.ts +400 -0
package/src/html.ts +512 -0
package/src/impact.ts +522 -0
package/src/index.ts +83 -0
package/src/insights.ts +341 -0
package/src/joiner.ts +289 -0
package/src/orchestrator.ts +1015 -0
package/src/pdf.ts +110 -0
package/src/prediction.ts +392 -0
package/src/prompts/loader.ts +88 -0
package/src/renderer.ts +1045 -0
package/src/runid.ts +261 -0
package/src/runtime.ts +450 -0
package/src/scanner.ts +508 -0
package/src/templates.ts +561 -0
package/src/tools/index.ts +214 -0
package/src/types.ts +873 -0
package/src/version.ts +24 -0
package/templates/context-accumulation.yaml +23 -0
package/templates/cost-concentration.yaml +20 -0
package/templates/dead-code.yaml +20 -0
package/templates/latency-explainer.yaml +23 -0
package/templates/optimizations/ab-testing-framework.yaml +74 -0
package/templates/optimizations/api-gateway-optimization.yaml +81 -0
package/templates/optimizations/api-model-routing-strategy.yaml +126 -0
package/templates/optimizations/auto-scaling-optimization.yaml +85 -0
package/templates/optimizations/batch-utilization-diagnostic.yaml +142 -0
package/templates/optimizations/comprehensive-apm.yaml +76 -0
package/templates/optimizations/context-window-optimization.yaml +91 -0
package/templates/optimizations/cost-sensitive-batch-processing.yaml +77 -0
package/templates/optimizations/distributed-training-optimization.yaml +77 -0
package/templates/optimizations/document-analysis-edge.yaml +77 -0
package/templates/optimizations/document-pipeline-optimization.yaml +78 -0
package/templates/optimizations/domain-specific-distillation.yaml +78 -0
package/templates/optimizations/error-handling-optimization.yaml +76 -0
package/templates/optimizations/gptq-4bit-quantization.yaml +96 -0
package/templates/optimizations/long-context-memory-management.yaml +78 -0
package/templates/optimizations/max-tokens-optimization.yaml +76 -0
package/templates/optimizations/memory-bandwidth-optimization.yaml +73 -0
package/templates/optimizations/multi-framework-resilience.yaml +75 -0
package/templates/optimizations/multi-tenant-optimization.yaml +75 -0
package/templates/optimizations/prompt-caching-optimization.yaml +143 -0
package/templates/optimizations/pytorch-to-onnx-migration.yaml +109 -0
package/templates/optimizations/quality-monitoring.yaml +74 -0
package/templates/optimizations/realtime-budget-controls.yaml +74 -0
package/templates/optimizations/realtime-latency-optimization.yaml +74 -0
package/templates/optimizations/sglang-concurrency-optimization.yaml +78 -0
package/templates/optimizations/smart-model-routing.yaml +96 -0
package/templates/optimizations/streaming-batch-selection.yaml +167 -0
package/templates/optimizations/system-prompt-optimization.yaml +75 -0
package/templates/optimizations/tensorrt-llm-performance.yaml +77 -0
package/templates/optimizations/vllm-high-throughput-optimization.yaml +93 -0
package/templates/optimizations/vllm-migration-memory-bound.yaml +78 -0
package/templates/overpowered-extraction.yaml +32 -0
package/templates/overpowered-model.yaml +31 -0
package/templates/prompt-bloat.yaml +24 -0
package/templates/retry-explosion.yaml +28 -0
package/templates/schema/insight.schema.json +113 -0
package/templates/schema/optimization.schema.json +180 -0
package/templates/streaming-drift.yaml +30 -0
package/templates/throughput-gap.yaml +21 -0
package/templates/token-underutilization.yaml +28 -0
package/templates/untested-fallback.yaml +21 -0
package/tests/accuracy/drift-detection.test.ts +184 -0
package/tests/accuracy/false-positives.test.ts +166 -0
package/tests/accuracy/templates.test.ts +205 -0
package/tests/action/commands.test.ts +125 -0
package/tests/action/comments.test.ts +347 -0
package/tests/cli.test.ts +203 -0
package/tests/comparison.test.ts +309 -0
package/tests/correlation-analyzer.test.ts +534 -0
package/tests/counterfactuals.test.ts +347 -0
package/tests/fixtures/events/missing-id.jsonl +1 -0
package/tests/fixtures/events/missing-input.jsonl +1 -0
package/tests/fixtures/events/missing-latency.jsonl +1 -0
package/tests/fixtures/events/missing-model.jsonl +1 -0
package/tests/fixtures/events/missing-output.jsonl +1 -0
package/tests/fixtures/events/missing-provider.jsonl +1 -0
package/tests/fixtures/events/missing-ts.jsonl +1 -0
package/tests/fixtures/events/valid.csv +3 -0
package/tests/fixtures/events/valid.json +1 -0
package/tests/fixtures/events/valid.jsonl +2 -0
package/tests/fixtures/events/with-callsite.jsonl +1 -0
package/tests/fixtures/events/with-intent.jsonl +1 -0
package/tests/fixtures/events/wrong-type.jsonl +1 -0
package/tests/fixtures/repos/empty/.gitkeep +0 -0
package/tests/fixtures/repos/hybrid-router/router.py +35 -0
package/tests/fixtures/repos/saas-anthropic/agent.ts +27 -0
package/tests/fixtures/repos/saas-openai/assistant.js +33 -0
package/tests/fixtures/repos/saas-openai/client.py +26 -0
package/tests/fixtures/repos/self-hosted-vllm/inference.py +22 -0
package/tests/github-action.test.ts +292 -0
package/tests/insights.test.ts +878 -0
package/tests/joiner.test.ts +168 -0
package/tests/performance/action-latency.test.ts +132 -0
package/tests/performance/benchmark.test.ts +189 -0
package/tests/performance/cli-latency.test.ts +102 -0
package/tests/pr-comment.test.ts +313 -0
package/tests/prediction.test.ts +296 -0
package/tests/runtime-analyzer.test.ts +375 -0
package/tests/runtime.test.ts +205 -0
package/tests/scanner.test.ts +122 -0
package/tests/template-conformance.test.ts +526 -0
package/tests/unit/cost-calculator.test.ts +303 -0
package/tests/unit/credits.test.ts +180 -0
package/tests/unit/inference-map.test.ts +276 -0
package/tests/unit/schema.test.ts +300 -0
package/tsconfig.json +20 -0
package/vitest.config.ts +14 -0

package/src/agent.ts ADDED Viewed

@@ -0,0 +1,1232 @@
+import { existsSync, statSync, readFileSync, writeFileSync } from 'fs';
+import { resolve } from 'path';
+import type { ExecutionPlan, PlannedTask, TaskResult, ScanResult, Callsite, InferenceEvent, JoinedOutput, Insight, RuntimeSummary, InferenceMap, ImpactEstimate, EnrichedCallsite } from './types.js';
+import { scan } from './scanner.js';
+import { analyze, type LLMInsight } from './analyzer.js';
+import { parseEvents, aggregate } from './runtime.js';
+import { join } from './joiner.js';
+import { loadTemplates, getDefaultPrompt, type AnalysisPrompt } from './templates.js';
+import { evaluate } from './insights.js';
+import { ENVELOPES } from './envelopes.js';
+import { loadPricing } from './costs.js';
+import { saveArtifacts, checkResumable, loadArtifacts, generateRunId, type ArtifactData } from './artifacts.js';
+import { generateHTML } from './html.js';
+import { generatePDF } from './pdf.js';
+import { VERSION } from './version.js';
+import { enrichInsightsWithImpact, generateImpactSummary, type ImpactSummary } from './impact.js';
+import { saveRun, getLatestRun, loadRun, type AnalysisData } from './history.js';
+import { compareSnapshots, formatComparisonSummary, type AnalysisSnapshot } from './comparison.js';
+import { generatePredictions } from './prediction.js';
+import { generateCounterfactuals } from './counterfactuals.js';
+import type { ComparisonResult, PredictionResult, CounterfactualResult } from './types.js';
+// Agent SDK pattern (DESIGN.md v2.0 Section 2.1, Patterns v0.2)
+import {
+  DiscoveryAgent,
+  AnalyzerAgent,
+  JoinerAgent,
+  InsightAgent,
+  RuntimeAnalyzerAgent,
+  CorrelationAnalyzerAgent,
+  StaticAnalysisOrchestrator,
+  type StaticAnalysisOutput,
+  type PerformanceProfile,
+} from './agents/index.js';
+import { getPricingContext } from './costs.js';
+// =============================================================================
+// HELPERS
+// =============================================================================
+/**
+ * Create synthetic enriched inference points from runtime events for insight evaluation.
+ * Groups events by provider:model and computes usage statistics.
+ * This enables runtime-only analysis to benefit from template-based insights.
+ *
+ * @param events - Runtime inference events to aggregate.
+ * @returns One synthetic callsite per distinct provider/model pair, in first-seen order
+ *          (an empty array when `events` is empty).
+ */
+function createSyntheticCallsitesFromEvents(events: InferenceEvent[]): EnrichedCallsite[] {
+  // Group events by provider:model. Each group remembers the provider and model of its
+  // first event so they never have to be parsed back out of the key: model identifiers
+  // can themselves contain ':' (e.g. "llama3:8b"), and splitting the key on ':' would
+  // silently truncate them.
+  const groups = new Map<string, { provider: string; model: string; events: InferenceEvent[] }>();
+  for (const event of events) {
+    const key = `${event.provider}:${event.model}`;
+    let group = groups.get(key);
+    if (!group) {
+      group = { provider: event.provider, model: event.model, events: [] };
+      groups.set(key, group);
+    }
+    group.events.push(event);
+  }
+  // Convert each group to a synthetic enriched inference point
+  const callsites: EnrichedCallsite[] = [];
+  let id = 1;
+  for (const { provider, model, events: groupEvents } of groups.values()) {
+    // Compute usage stats
+    const calls = groupEvents.length;
+    const tokens_in = groupEvents.reduce((sum, e) => sum + e.input_tokens, 0);
+    const tokens_out = groupEvents.reduce((sum, e) => sum + e.output_tokens, 0);
+    // Percentiles are read straight from the ascending-sorted latencies (no interpolation)
+    const latencies = groupEvents.map(e => e.latency_ms).sort((a, b) => a - b);
+    const p50Index = Math.floor(latencies.length * 0.5);
+    const p95Index = Math.floor(latencies.length * 0.95);
+    const p99Index = Math.floor(latencies.length * 0.99);
+    callsites.push({
+      id: `runtime-${id++}`,
+      file: 'runtime',  // Synthetic location
+      line: 0,
+      provider: provider as EnrichedCallsite['provider'],
+      model,
+      framework: null,
+      runtime: null,
+      // A pattern counts as present when at least one event in the group shows it
+      patterns: {
+        streaming: groupEvents.some(e => e.streaming === true),
+        batching: groupEvents.some(e => e.batch_id !== undefined),
+        caching: groupEvents.some(e => e.cached === true),
+        retries: groupEvents.some(e => (e.retry_count || 0) > 0),
+        fallback: groupEvents.some(e => e.fallback_used === true),
+      },
+      confidence: 1.0,
+      usage: {
+        calls,
+        tokens_in,
+        tokens_out,
+        latency_p50: latencies[p50Index] || 0,
+        latency_p95: latencies[p95Index] || latencies[p50Index] || 0,
+        latency_p99: latencies[p99Index] || latencies[p95Index] || latencies[p50Index] || 0,
+      },
+    });
+  }
+  return callsites;
+}
+/**
+ * Convert StaticAnalysisOutput to LLM insights for display.
+ * Maps optimizations from all dimensions (cost, latency, throughput, reliability) to insights,
+ * then appends one insight per reliability anti-pattern found in the performance profiles.
+ *
+ * @param analysis - Static analysis output; `all_optimizations` and `performance_profiles` are read.
+ * @returns Insights in input order: optimizations first, reliability anti-patterns second.
+ */
+function convertPerformanceToInsights(analysis: StaticAnalysisOutput): Array<{
+  severity: 'critical' | 'warning' | 'info';
+  category: string;
+  headline: string;
+  evidence: string;
+  location?: string;
+  recommendation: string;
+  impact?: {
+    layer: string;
+    impactType: string;
+    estimatedImpactPercent: number;
+    effort: string;
+  };
+}> {
+  // Lookup tables and the percentage pattern are loop-invariant, so build them once per call
+  const categoryMap: Record<string, string> = {
+    cost: 'Cost Optimization',
+    latency: 'Latency Optimization',
+    throughput: 'Throughput Optimization',
+    reliability: 'Reliability Improvement',
+  };
+  const impactTypeMap: Record<string, string> = {
+    cost: 'cost',
+    latency: 'latency',
+    throughput: 'throughput',
+    reliability: 'improvement',
+  };
+  // Accepts an optional fractional part so "12.5% savings" yields 12.5 instead of
+  // matching only the trailing "5%"
+  const impactPercentPattern = /(\d+(?:\.\d+)?)\s*%/;
+  // Used when the impact text carries no percentage figure
+  const defaultImpactPercent = 20;
+  // Element type is taken from the declared return type so the shape is written only once
+  const insights: ReturnType<typeof convertPerformanceToInsights> = [];
+  // Convert all optimizations to insights
+  for (const opt of analysis.all_optimizations) {
+    // 'critical' and 'high' priorities both surface as critical; anything unrecognised is info
+    const severity = opt.priority === 'critical' || opt.priority === 'high' ? 'critical' :
+                     opt.priority === 'medium' ? 'warning' : 'info';
+    // Parse impact percentage from the impact string (e.g., "90% savings" or "50% improvement")
+    const impactMatch = opt.impact.match(impactPercentPattern);
+    const impactPercent = impactMatch ? Number.parseFloat(impactMatch[1]) : defaultImpactPercent;
+    insights.push({
+      severity,
+      // Unknown dimensions fall back to the raw dimension name
+      category: categoryMap[opt.dimension] || opt.dimension,
+      headline: opt.description,
+      evidence: `${opt.type}: ${opt.impact}`,
+      location: `${opt.file}:${opt.line}`,
+      recommendation: opt.description,
+      impact: {
+        layer: opt.dimension,
+        impactType: impactTypeMap[opt.dimension] || 'improvement',
+        estimatedImpactPercent: impactPercent,
+        effort: opt.effort,
+      },
+    });
+  }
+  // Add reliability anti-pattern insights
+  for (const profile of analysis.performance_profiles) {
+    for (const antiPattern of profile.reliability?.anti_patterns ?? []) {
+      const severity = antiPattern.severity === 'high' ? 'critical' :
+                      antiPattern.severity === 'medium' ? 'warning' : 'info';
+      insights.push({
+        severity,
+        category: 'Reliability Issue',
+        headline: antiPattern.pattern,
+        evidence: antiPattern.description,
+        location: antiPattern.location,
+        recommendation: `Fix: ${antiPattern.pattern}`,
+        impact: {
+          layer: 'reliability',
+          impactType: 'improvement',
+          // Fixed estimates: 40 for high-severity anti-patterns, 20 for everything else
+          estimatedImpactPercent: antiPattern.severity === 'high' ? 40 : 20,
+          effort: 'low',
+        },
+      });
+    }
+  }
+  return insights;
+}
+// =============================================================================
+// TYPES
+// =============================================================================
+/**
+ * Options for one analysis run; consumed by `detectMode()` and `plan()`.
+ */
+export interface AgentOptions {
+  path: string;                   // Directory to analyze, or an events file (.jsonl/.ndjson/.json/.csv)
+  events?: string;                // Separate runtime events file (the --events option)
+  eventsUrl?: string;             // URL to fetch runtime events
+  html?: boolean;                 // Adds the "Generate HTML report" task to the plan
+  pdf?: boolean;                  // Adds the "Generate PDF report" task to the plan
+  open?: boolean;                 // NOTE(review): presumably opens the generated report; usage not visible here
+  out?: string;                   // Write output to file
+  offline?: boolean;              // Part of the inputs used to derive the run ID; NOTE(review): full effect not visible here
+  verbose?: boolean;              // NOTE(review): presumably enables verbose output; usage not visible here
+  noCache?: boolean; // Force fresh analysis, ignore cached runs
+  // Format detection options (PRD §6.4)
+  formatHint?: string;            // User-specified format type
+  fieldHints?: Record<string, string>; // User-specified field mappings
+  lenient?: boolean;              // Accept low-confidence mappings
+  strict?: boolean;               // Fail on missing fields
+  redact?: boolean;               // Redact code snippets from artifacts
+  // History options (v1.5)
+  noHistory?: boolean;            // Skip saving run to history
+  compare?: boolean;              // Compare with previous run
+  compareRunId?: string;          // Specific run ID to compare with
+  predict?: boolean;              // Generate deploy-time predictions
+  targetP95?: number;             // Target p95 latency for budget calculation
+}
+// Progress phases - Julie Zhou aligned (DD Section 6.4)
+// The closed set of phase names that a ProgressData update may report.
+export type ProgressPhase = 'scanning' | 'analyzing' | 'profiling' | 'parsing' | 'correlating' | 'generating';
+/**
+ * Payload passed to `AgentCallbacks.onProgress`.
+ * Only `phase` is required; the remaining fields are optional detail.
+ */
+export interface ProgressData {
+  phase: ProgressPhase; // Which phase this update belongs to
+  detail?: string; // e.g., "847 files" or "23 inference points"
+  percent?: number; // 0-100 for progress bar
+  currentFile?: string; // current file being analyzed
+}
+/**
+ * Optional hooks a caller can supply to observe a run.
+ * Every member is optional. NOTE(review): the call sites are outside this view, so the
+ * timing described for the uncommented hooks is inferred from their names and signatures.
+ */
+export interface AgentCallbacks {
+  onPlanReady?: (plan: ExecutionPlan) => void; // Receives the execution plan
+  onTaskStart?: (task: PlannedTask) => void; // Receives a planned task (presumably just before it runs)
+  onTaskComplete?: (task: PlannedTask, result: TaskResult) => void; // Receives a task together with its result
+  onProgress?: (data: ProgressData) => void; // User-meaningful progress
+  onComplete?: (results: AgentResults) => void; // Receives the final AgentResults
+  onError?: (error: Error) => void; // Receives an Error (presumably when the run fails)
+  onResumed?: (runId: string) => void; // Called when resuming from cache
+  onPartial?: (warnings: string[]) => void; // Called for partial results
+}
+/**
+ * Result object handed to `AgentCallbacks.onComplete`.
+ * Only `mode`, `runId`, `resumed` and `insights` are always present; every other
+ * field is optional.
+ */
+export interface AgentResults {
+  mode: 'static' | 'runtime' | 'combined'; // Same three values that detectMode() returns
+  runId: string;
+  resumed: boolean; // NOTE(review): presumably true when results were loaded from cached artifacts
+  scanResult?: ScanResult;
+  callsites?: Callsite[];
+  events?: InferenceEvent[];
+  runtimeSummary?: RuntimeSummary;
+  joined?: JoinedOutput;
+  insights: Insight[];
+  impactSummary?: ImpactSummary; // Stack-ranked impact analysis
+  inferenceMap?: InferenceMap;
+  staticAnalysis?: StaticAnalysisOutput; // 6-agent performance profiling
+  comparison?: ComparisonResult; // v1.5: Historical comparison
+  prediction?: PredictionResult; // v1.5: Deploy-time predictions
+  counterfactuals?: CounterfactualResult; // v1.5: What-if optimization scenarios
+  htmlPath?: string; // NOTE(review): presumably the location of the generated HTML report
+  pdfPath?: string; // NOTE(review): presumably the location of the generated PDF report
+  warnings?: string[]; // Partial state warnings
+}
+// =============================================================================
+// AGENT CONTEXT
+// =============================================================================
+/**
+ * Module-private working state for a run (not exported).
+ * Carries the caller's options plus most of the fields that appear on AgentResults,
+ * and additionally `llmInsights` and the rendered `htmlContent`.
+ * NOTE(review): how tasks read and write this object is outside this view.
+ */
+interface AgentContext {
+  opts: AgentOptions; // The options the run was started with
+  runId: string;
+  resumed: boolean;
+  scanResult?: ScanResult;
+  callsites?: Callsite[];
+  events?: InferenceEvent[];
+  runtimeSummary?: RuntimeSummary;
+  joined?: JoinedOutput;
+  insights?: Insight[];
+  llmInsights?: LLMInsight[]; // Phase 1: LLM-generated semantic insights
+  impactSummary?: ImpactSummary; // Stack-ranked impact analysis
+  inferenceMap?: InferenceMap;
+  staticAnalysis?: StaticAnalysisOutput; // 6-agent performance profiling
+  comparison?: ComparisonResult; // v1.5: Historical comparison result
+  prediction?: PredictionResult; // v1.5: Deploy-time predictions
+  counterfactuals?: CounterfactualResult; // v1.5: What-if scenarios
+  htmlContent?: string; // HTML report as a string (AgentResults exposes an htmlPath instead)
+  pdfPath?: string;
+  warnings: string[]; // Track partial state warnings
+}
+// =============================================================================
+// PASS 1: PLAN
+// =============================================================================
+/**
+ * Decide which analysis mode a run uses, from what `opts.path` points at and whether a
+ * separate events file was supplied via `opts.events`.
+ *
+ * - `combined`: `opts.events` is set, whatever `opts.path` is.
+ * - `runtime`: no `opts.events`, and `opts.path` has an events extension
+ *   (.jsonl, .ndjson, .json, .csv; case-insensitive) and is not a directory.
+ * - `static`: everything else, including a directory whose name merely ends in one of
+ *   those extensions.
+ *
+ * NOTE(review): `opts.eventsUrl` is not consulted here; confirm that is intended.
+ *
+ * @param opts - Run options; only `path` and `events` are read.
+ * @returns The mode for this run.
+ */
+function detectMode(opts: AgentOptions): 'static' | 'runtime' | 'combined' {
+  // A separate events file always means code and runtime data are analysed together
+  if (opts.events) {
+    return 'combined';
+  }
+  // Check if the main path is an events file (case-insensitive for robustness)
+  const pathLower = opts.path.toLowerCase();
+  const hasEventsExtension = ['.jsonl', '.ndjson', '.json', '.csv'].some(ext => pathLower.endsWith(ext));
+  // The extension alone is not enough: a directory named e.g. "data.json" has to be
+  // scanned as code. That case used to fall through to 'combined' with no events at all.
+  if (hasEventsExtension && !isDirectory(opts.path)) {
+    return 'runtime';
+  }
+  return 'static';
+}
+/**
+ * Report whether `path` names an existing directory.
+ * A missing path, or any error raised while checking it, yields `false`.
+ */
+function isDirectory(path: string): boolean {
+  try {
+    if (!existsSync(path)) {
+      return false;
+    }
+    const stats = statSync(path);
+    return stats.isDirectory();
+  } catch {
+    // Failures while checking are reported as "not a directory" rather than thrown
+    return false;
+  }
+}
+/**
+ * Download runtime events from `url` and return the response body as text.
+ *
+ * @param url - Location of the events payload.
+ * @returns The raw response body.
+ * @throws Error when the response status is not OK; the message includes the URL,
+ *         status code and status text.
+ */
+async function fetchEventsFromUrl(url: string): Promise<string> {
+  const res = await fetch(url);
+  if (res.ok) {
+    return res.text();
+  }
+  const { status, statusText } = res;
+  throw new Error(`Failed to fetch events from ${url}: ${status} ${statusText}`);
+}
+/**
+ * Return value of `plan()`.
+ */
+export interface PlanResult {
+  plan: ExecutionPlan; // The execution plan for the run
+  runId: string; // Run identifier (plan() derives one from its inputs via generateRunId)
+  canResume: boolean; // NOTE(review): presumably whether cached results can be reused; confirm against plan()'s return
+  runDir: string; // NOTE(review): presumably the directory holding this run's artifacts; not visible here
+}
+export function plan(opts: AgentOptions): PlanResult {
+  const tasks: PlannedTask[] = [];
+  let id = 1;
+  const mode = detectMode(opts);
+  const pathIsDirectory = isDirectory(opts.path);
+  // Generate run ID and check resumability
+  const inputs = {
+    repoRoot: isDirectory(opts.path) ? opts.path : undefined,
+    eventsPath: opts.events || (isDirectory(opts.path) ? undefined : opts.path),
+    offline: opts.offline,
+  };
+  const runId = generateRunId(inputs);
+  const resumeCheck = checkResumable(inputs);
+  const shouldResume = !opts.noCache && resumeCheck.canResume;
+  // If we can resume, skip analysis tasks
+  if (!shouldResume) {
+    // Always load pricing first
+    tasks.push({
+      id: id++,
+      type: 'scan', // Reusing for pricing load
+      description: 'Load pricing data',
+    });
+    // Only add static analysis tasks if path is a directory AND mode requires it
+    if ((mode === 'static' || mode === 'combined') && pathIsDirectory) {
+      tasks.push({
+        id: id++,
+        type: 'scan',
+        description: 'Scan repository',
+      });
+      // Unified analysis: discovery + profiling in single LLM call
+      tasks.push({
+        id: id++,
+        type: 'analyze',
+        description: 'Analyze and profile inference points',
+        depends_on: [id - 1],
+      });
+    }
+    if (mode === 'runtime' || mode === 'combined') {
+      tasks.push({
+        id: id++,
+        type: 'parse_events',
+        description: 'Parse runtime events',
+      });
+      // NEW: LLM-based runtime analysis for ALL modes with runtime data (Patterns v0.2)
+      tasks.push({
+        id: id++,
+        type: 'analyze', // Reuse 'analyze' type for runtime LLM analysis
+        description: 'Analyze runtime patterns',
+        depends_on: [id - 1],
+      });
+    }
+    if (mode === 'combined') {
+      tasks.push({
+        id: id++,
+        type: 'join',
+        description: 'Correlate static + runtime',
+      });
+      // NEW: LLM-based correlation analysis (Patterns v0.2)
+      tasks.push({
+        id: id++,
+        type: 'join', // Reuse 'join' type for correlation analysis
+        description: 'Analyze code-runtime drift',
+        depends_on: [id - 1],
+      });
+    }
+    tasks.push({
+      id: id++,
+      type: 'load_templates',
+      description: 'Load insight templates',
+    });
+    tasks.push({
+      id: id++,
+      type: 'generate_insights',
+      description: 'Generate findings',
+    });
+    // v1.5: Compare with previous run if requested
+    if (opts.compare) {
+      tasks.push({
+        id: id++,
+        type: 'compare',
+        description: 'Compare with previous run',
+      });
+    }
+    // v1.5: Generate deploy-time predictions if requested
+    if (opts.predict) {
+      tasks.push({
+        id: id++,
+        type: 'predict',
+        description: 'Generate latency predictions',
+      });
+    }
+    // v1.5: Always generate counterfactual insights (show optimization opportunities)
+    tasks.push({
+      id: id++,
+      type: 'counterfactuals',
+      description: 'Identify optimization opportunities',
+    });
+    if (opts.html) {
+      tasks.push({
+        id: id++,
+        type: 'generate_html',
+        description: 'Generate HTML report',
+      });
+    }
+    if (opts.pdf) {
+      tasks.push({
+        id: id++,
+        type: 'generate_pdf',
+        description: 'Generate PDF report',
+      });
+    }
+    tasks.push({
+      id: id++,
+      type: 'save_artifacts',
+      description: 'Save artifacts',
+    });
+    // v1.5: Save to history for comparison/prediction (unless --no-history)
+    if (!opts.noHistory) {
+      tasks.push({
+        id: id++,
+        type: 'save_history',
+        description: 'Save to history',
+      });
+    }
+  } else {
+    // Resuming - just need to load cached artifacts
+    tasks.push({
+      id: id++,
+      type: 'scan', // Reusing for load cached
+      description: 'Load cached results',
+    });
+    // Always generate HTML if requested, even when resuming
+    if (opts.html) {
+      tasks.push({
+        id: id++,
+        type: 'generate_html',
+        description: 'Generate HTML report',
+      });
+    }
+    if (opts.pdf) {
+      tasks.push({
+        id: id++,
+        type: 'generate_pdf',
+        description: 'Generate PDF report',
+      });
+    }
+    if (opts.html || opts.pdf) {
+      tasks.push({
+        id: id++,
+        type: 'save_artifacts',
+        description: 'Save artifacts',
+      });
+    }
+  }
+  return {
+    plan: { mode, tasks },
+    runId,
+    canResume: shouldResume,
+    runDir: resumeCheck.runDir,
+  };
+}
+// =============================================================================
+// PASS 2: EXECUTE
+// =============================================================================
+/**
+ * Executes one planned task, reading its inputs from and storing its outputs on `ctx`.
+ *
+ * Dispatch is two-level. Several task types are reused for more than one job, so after
+ * switching on `task.type` the `scan`, `analyze` and `join` cases branch again on the exact
+ * `task.description` string. Those strings are therefore part of the contract with the
+ * planner and must not be reworded on one side only.
+ *
+ * Failure handling differs per task:
+ * - `analyze`, `parse_events` and the drift half of `join` catch their own errors, push a
+ *   message onto `ctx.warnings` and leave the context in a usable (possibly empty) state.
+ * - The remaining cases throw when a prerequisite is missing; the caller decides whether
+ *   that aborts the run.
+ *
+ * @param task - Task to run; `type` and `description` select the branch.
+ * @param ctx - Mutable run context shared by all tasks of a run.
+ * @param templates - Insight templates, handed to the insight agent in `generate_insights`.
+ * @param runDir - Directory of a previous run; only read by the "Load cached results" task.
+ * @param onProgress - Optional sink for progress updates.
+ * @throws Error when a required input (scan result, callsites/events, inference map,
+ *   HTML content) is missing, or when the path to scan is not a directory.
+ */
+async function executeTask(
+  task: PlannedTask,
+  ctx: AgentContext,
+  templates: Awaited<ReturnType<typeof loadTemplates>>,
+  runDir?: string,
+  onProgress?: (data: ProgressData) => void
+): Promise<void> {
+  switch (task.type) {
+    case 'scan':
+      if (task.description === 'Load pricing data') {
+        await loadPricing();
+      } else if (task.description === 'Load cached results') {
+        // Resume from cache: repopulate the context from a previous run's artifacts.
+        // Without a runDir this branch does nothing.
+        if (runDir) {
+          const cached = loadArtifacts(runDir);
+          ctx.inferenceMap = cached.inferenceMap;
+          ctx.insights = cached.insights;
+          ctx.joined = cached.joined;
+          ctx.runtimeSummary = cached.runtime;
+          if (cached.inferenceMap) {
+            ctx.callsites = cached.inferenceMap.callsites;
+          }
+          if (cached.insights && cached.insights.length > 0) {
+            ctx.impactSummary = generateImpactSummary(cached.insights);
+          }
+        }
+      } else {
+        // Validate that path is a directory before attempting to scan
+        if (!isDirectory(ctx.opts.path)) {
+          const lowerPath = ctx.opts.path.toLowerCase();
+          const looksLikeEventsFile = ['.jsonl', '.ndjson', '.json', '.csv'].some(suffix => lowerPath.endsWith(suffix));
+          if (looksLikeEventsFile) {
+            throw new Error(`Cannot scan file "${ctx.opts.path}" as a codebase. This looks like an events file - try 'peakinfer analyze ${ctx.opts.path}' for runtime analysis.`);
+          }
+          throw new Error(`Expected directory for static analysis, got file: ${ctx.opts.path}`);
+        }
+        // Agent SDK pattern: DiscoveryAgent with constrained tools (Glob/Grep/Read)
+        const discoveryResult = await DiscoveryAgent.execute({ root: ctx.opts.path });
+        ctx.scanResult = discoveryResult.result.scanResult;
+        const fileCount = ctx.scanResult?.files.length ?? 0;
+        onProgress?.({ phase: 'scanning', detail: `${fileCount} files` });
+      }
+      break;
+    case 'analyze':
+      // Handle static code analysis, runtime pattern analysis, AND performance profiling
+      if (task.description === 'Analyze runtime patterns') {
+        // LLM-based runtime analysis (Patterns v0.2)
+        if (!ctx.events || !ctx.runtimeSummary) {
+          ctx.warnings.push('Runtime analysis skipped: no events parsed');
+          break;
+        }
+        try {
+          // Get pricing context for models in the data
+          const models = Object.keys(ctx.runtimeSummary.byModel);
+          const pricingContext = getPricingContext(models);
+          // Emit progress: starting runtime pattern analysis
+          onProgress?.({ phase: 'analyzing', detail: `analyzing ${ctx.events.length} runtime events...` });
+          const runtimeResult = await RuntimeAnalyzerAgent.execute({
+            events: ctx.events,
+            runtimeSummary: ctx.runtimeSummary,
+            pricingContext,
+          });
+          // Appended (not assigned) so insights from an earlier static pass are kept
+          const runtimeInsights = runtimeResult.result.insights.map(i => ({
+            ...i,
+            source: 'llm' as const,
+          }));
+          ctx.llmInsights = [...(ctx.llmInsights || []), ...runtimeInsights as LLMInsight[]];
+          onProgress?.({ phase: 'analyzing', detail: `${runtimeResult.result.insights.length} runtime insights` });
+        } catch (error) {
+          ctx.warnings.push(`Runtime analysis warning: ${error instanceof Error ? error.message : String(error)}`);
+        }
+      } else if (task.description === 'Analyze and profile inference points') {
+        // UNIFIED: Discovery + Profiling in single LLM call
+        if (!ctx.scanResult) throw new Error('Scan result required');
+        try {
+          const scanRoot = ctx.scanResult.root;
+          // Read all source files (no artificial limit - process all candidates).
+          // Files that cannot be read are dropped rather than failing the task.
+          const filesToAnalyze = ctx.scanResult.files
+            .map(f => {
+              const fullPath = resolve(scanRoot, f.path);
+              try {
+                return {
+                  path: fullPath,
+                  content: readFileSync(fullPath, 'utf-8'),
+                  language: f.language,
+                };
+              } catch {
+                return null;
+              }
+            })
+            .filter((f): f is { path: string; content: string; language: string } => f !== null);
+          if (filesToAnalyze.length === 0) {
+            ctx.warnings.push('Analysis skipped: no source files available');
+            ctx.callsites = [];
+            ctx.llmInsights = [];
+            break;
+          }
+          // Run unified analysis (discovery + profiling in one LLM call)
+          // Pass progress callback for per-file progress updates
+          const orchestrator = new StaticAnalysisOrchestrator();
+          ctx.staticAnalysis = await orchestrator.analyze(
+            { files: filesToAnalyze },
+            (progressData) => {
+              // Forward progress to renderer with percent for progress bar
+              onProgress?.({
+                phase: 'analyzing',
+                percent: progressData.percent,
+                currentFile: progressData.currentFile,
+                detail: `${progressData.completed}/${progressData.total} files`,
+              });
+            }
+          );
+          // Extract callsites from unified analysis for rest of pipeline
+          const callsitesFromAnalysis: Callsite[] = [];
+          for (const profile of ctx.staticAnalysis.performance_profiles) {
+            callsitesFromAnalysis.push({
+              id: profile.inference_point_id,
+              // Strip the scan root so the stored path is relative to it
+              file: profile.file.replace(scanRoot + '/', '').replace(scanRoot, ''),
+              line: profile.line,
+              provider: profile.provider as Callsite['provider'],
+              model: profile.model ?? null,
+              framework: null,
+              runtime: null,
+              patterns: {},
+              confidence: 0.9,
+            });
+          }
+          ctx.callsites = callsitesFromAnalysis;
+          // Convert performance profiles to insights
+          const performanceInsights = convertPerformanceToInsights(ctx.staticAnalysis);
+          ctx.llmInsights = performanceInsights as LLMInsight[];
+          // Build inference map
+          let promptMeta: MapMetadata = { llmUsed: true };
+          try {
+            const prompt = getDefaultPrompt();
+            promptMeta.promptId = prompt.id;
+            promptMeta.promptVersion = prompt.version;
+          } catch {
+            // Prompt not found, use defaults
+          }
+          ctx.inferenceMap = buildInferenceMap(ctx.opts.path, ctx.callsites, promptMeta);
+          onProgress?.({
+            phase: 'profiling',
+            detail: `${ctx.staticAnalysis.summary.total_optimizations} optimizations found`,
+          });
+        } catch (error) {
+          // Partial state: keep going with an empty map so later tasks still have one
+          ctx.warnings.push(`Analysis warning: ${error instanceof Error ? error.message : String(error)}`);
+          ctx.callsites = [];
+          ctx.llmInsights = [];
+          ctx.inferenceMap = buildInferenceMap(ctx.opts.path, [], { llmUsed: false });
+        }
+      } else if (task.description === 'Profile performance') {
+        // Legacy: Skip - now handled by unified analysis above
+        break;
+      } else {
+        // Original static code analysis
+        if (!ctx.scanResult) throw new Error('Scan result required');
+        try {
+          // Agent SDK pattern: AnalyzerAgent with tool-limited semantic analysis
+          // Pass progress callback for visual progress bar during LLM analysis
+          const analyzerResult = await AnalyzerAgent.execute({
+            scanResult: ctx.scanResult,
+            onProgress: onProgress ? (data) => {
+              onProgress({ phase: 'analyzing', percent: data.percent, currentFile: data.currentFile });
+            } : undefined,
+          });
+          ctx.callsites = analyzerResult.result.callsites;
+          ctx.llmInsights = analyzerResult.result.llmInsights as LLMInsight[];
+          // Get prompt metadata for report
+          let promptMeta: MapMetadata = { llmUsed: ctx.llmInsights.length > 0 };
+          try {
+            const prompt = getDefaultPrompt();
+            promptMeta.promptId = prompt.id;
+            promptMeta.promptVersion = prompt.version;
+          } catch {
+            // Prompt not found, use defaults
+          }
+          ctx.inferenceMap = buildInferenceMap(ctx.opts.path, ctx.callsites, promptMeta);
+          onProgress?.({ phase: 'analyzing', detail: `${ctx.callsites.length} inference points` });
+        } catch (error) {
+          // Partial state: analysis failed but we can continue
+          ctx.warnings.push(`Analysis warning: ${error instanceof Error ? error.message : String(error)}`);
+          ctx.callsites = [];
+          ctx.llmInsights = [];
+          ctx.inferenceMap = buildInferenceMap(ctx.opts.path, [], { llmUsed: false });
+        }
+      }
+      break;
+    case 'parse_events': {
+      try {
+        // Build normalization options from CLI flags (PRD §6.4)
+        const normalizationOptions = {
+          format_hint: ctx.opts.formatHint as import('./types.js').FormatType | undefined,
+          field_hints: ctx.opts.fieldHints,
+          lenient: ctx.opts.lenient,
+          strict: ctx.opts.strict,
+          codebase_context: ctx.scanResult, // Pass codebase context for smarter normalization
+        };
+        // Handle --events-url: fetch from URL first
+        if (ctx.opts.eventsUrl) {
+          const eventsContent = await fetchEventsFromUrl(ctx.opts.eventsUrl);
+          // parseEvents() is given a file path, so the download is staged in a temp file.
+          const { mkdirSync, rmSync } = await import('node:fs');
+          const tempDir = '.peakinfer';
+          const tempPath = `${tempDir}/.tmp_events.jsonl`;
+          // Nothing in this function guarantees the directory exists yet; without this
+          // the write fails with ENOENT and the events are lost behind a warning.
+          mkdirSync(tempDir, { recursive: true });
+          writeFileSync(tempPath, eventsContent);
+          try {
+            ctx.events = await parseEvents(tempPath, normalizationOptions);
+          } finally {
+            // Best-effort cleanup: a failed delete must not discard parsed events
+            try {
+              rmSync(tempPath, { force: true });
+            } catch {
+              // Ignore - the file is overwritten by the next run anyway
+            }
+          }
+        } else {
+          const eventsPath = ctx.opts.events || ctx.opts.path;
+          ctx.events = await parseEvents(eventsPath, normalizationOptions);
+        }
+        ctx.runtimeSummary = aggregate(ctx.events);
+        // Emit progress with event count
+        onProgress?.({ phase: 'parsing', detail: `${ctx.events.length} events` });
+      } catch (error) {
+        // Partial state: event parsing failed
+        ctx.warnings.push(`Events parsing warning: ${error instanceof Error ? error.message : String(error)}`);
+        ctx.events = [];
+      }
+      break;
+    }
+    case 'join':
+      // Handle both basic join AND LLM-based correlation analysis
+      if (task.description === 'Analyze code-runtime drift') {
+        // LLM-based correlation analysis (Patterns v0.2)
+        if (!ctx.callsites || !ctx.events || !ctx.runtimeSummary) {
+          ctx.warnings.push('Correlation analysis skipped: missing callsites or events');
+          break;
+        }
+        try {
+          // Emit progress: starting drift detection analysis
+          onProgress?.({ phase: 'correlating', detail: 'detecting code-runtime drift...' });
+          const correlationResult = await CorrelationAnalyzerAgent.execute({
+            callsites: ctx.callsites,
+            events: ctx.events,
+            runtimeSummary: ctx.runtimeSummary,
+          });
+          // Merge correlation insights
+          const correlationInsights = correlationResult.result.insights.map(i => ({
+            ...i,
+            source: 'llm' as const,
+          }));
+          ctx.llmInsights = [...(ctx.llmInsights || []), ...correlationInsights as LLMInsight[]];
+          // Update drift signals in joined output (only if the basic join produced one)
+          if (ctx.joined) {
+            ctx.joined.drift = [
+              ...ctx.joined.drift,
+              ...correlationResult.result.driftSignals,
+            ];
+          }
+          onProgress?.({
+            phase: 'correlating',
+            detail: `alignment: ${Math.round(correlationResult.result.alignmentScore * 100)}%`,
+          });
+        } catch (error) {
+          ctx.warnings.push(`Correlation analysis warning: ${error instanceof Error ? error.message : String(error)}`);
+        }
+      } else {
+        // Original basic join
+        if (!ctx.callsites || !ctx.events) throw new Error('Callsites and events required');
+        // Agent SDK pattern: JoinerAgent correlates static + runtime
+        const joinerResult = await JoinerAgent.execute({ callsites: ctx.callsites, events: ctx.events });
+        ctx.joined = joinerResult.result.joined;
+        onProgress?.({
+          phase: 'correlating',
+          detail: `${ctx.joined.callsites.filter(c => 'usage' in c && c.usage).length} matched`,
+        });
+      }
+      break;
+    case 'load_templates':
+      // Templates are passed in by the caller; nothing to do here
+      break;
+    case 'generate_insights': {
+      // Agent SDK pattern: InsightAgent evaluates templates
+      // Input preference: joined output, then static callsites, then callsites
+      // synthesized from events (runtime-only mode), then an empty list.
+      let data: { callsites: Callsite[] } | JoinedOutput;
+      if (ctx.joined) {
+        data = ctx.joined;
+      } else if (ctx.callsites && ctx.callsites.length > 0) {
+        data = { callsites: ctx.callsites };
+      } else if (ctx.events && ctx.events.length > 0) {
+        // Runtime-only mode: create synthetic enriched inference points from events
+        data = { callsites: createSyntheticCallsitesFromEvents(ctx.events) };
+      } else {
+        data = { callsites: [] };
+      }
+      const insightResult = await InsightAgent.execute({ data, templates });
+      const templateInsights = insightResult.result.insights;
+      // Convert LLM insights to Insight format, preserving any LLM-provided impact estimates
+      const llmFormattedInsights: Insight[] = (ctx.llmInsights || []).map(llmInsight => ({
+        id: `llm_${Date.now()}_${Math.random().toString(36).slice(2, 8)}`,
+        severity: llmInsight.severity,
+        category: llmInsight.category,
+        headline: llmInsight.headline,
+        evidence: llmInsight.evidence,
+        location: llmInsight.location,
+        recommendation: llmInsight.recommendation,
+        source: 'llm' as const, // Mark as LLM-generated
+        // Preserve LLM-provided impact estimates if present
+        impact: llmInsight.impact ? {
+          layer: llmInsight.impact.layer,
+          impactType: llmInsight.impact.impactType,
+          estimatedImpactPercent: llmInsight.impact.estimatedImpactPercent,
+          effort: llmInsight.impact.effort,
+          confidence: 0.8, // Fixed confidence assigned to LLM-provided estimates
+        } : undefined,
+      }));
+      // Combine: LLM semantic insights first (phase 1), then template pattern insights (phase 2)
+      const combinedInsights = [...llmFormattedInsights, ...templateInsights];
+      // Enrich all insights with impact estimates (fills in missing ones)
+      ctx.insights = enrichInsightsWithImpact(combinedInsights);
+      // Generate stack-ranked impact summary
+      ctx.impactSummary = generateImpactSummary(ctx.insights);
+      // Emit progress with insight count
+      onProgress?.({ phase: 'generating', detail: `${ctx.insights.length} findings` });
+      break;
+    }
+    case 'generate_html':
+      if (!ctx.inferenceMap) throw new Error('InferenceMap required for HTML');
+      ctx.htmlContent = generateHTML({
+        inferenceMap: ctx.inferenceMap,
+        insights: ctx.insights || [],
+        joined: ctx.joined,
+        runtime: ctx.runtimeSummary,
+      });
+      break;
+    case 'generate_pdf': {
+      // The PDF is rendered from the HTML report, so that task must have run first
+      if (!ctx.htmlContent) throw new Error('HTML content required for PDF');
+      // Generate human-friendly PDF filename
+      const pdfPath = `.peakinfer/${reportProjectSlug(ctx)}_peakinfer_report.pdf`;
+      await generatePDF(ctx.htmlContent, pdfPath);
+      ctx.pdfPath = pdfPath;
+      break;
+    }
+    case 'save_artifacts': {
+      // opts.path is either the repository root or, for runtime-only runs, the events file
+      const pathIsDirectory = isDirectory(ctx.opts.path);
+      const inputs = {
+        repoRoot: pathIsDirectory ? ctx.opts.path : undefined,
+        eventsPath: ctx.opts.events || (pathIsDirectory ? undefined : ctx.opts.path),
+        offline: ctx.opts.offline,
+      };
+      saveArtifacts(
+        {
+          inferenceMap: ctx.inferenceMap,
+          insights: ctx.insights,
+          joined: ctx.joined,
+          runtime: ctx.runtimeSummary,
+          html: ctx.htmlContent,
+        },
+        '.peakinfer',
+        {
+          runId: ctx.runId,
+          inputs,
+          // Project name for human-friendly report naming
+          projectName: reportProjectName(ctx),
+        }
+      );
+      break;
+    }
+    case 'save_history': {
+      // v1.5: Save run to history for comparison/prediction features
+      // The mode is inferred from what the run actually produced, not from the plan
+      const mode = ctx.joined ? 'combined' : (ctx.events?.length ? 'runtime' : 'static');
+      // Prepare analysis data for history storage
+      const historyData: AnalysisData = {
+        inferenceMap: ctx.inferenceMap,
+        insights: ctx.insights,
+        joined: ctx.joined,
+        runtime: ctx.runtimeSummary,
+      };
+      saveRun({
+        path: ctx.opts.path,
+        analysisType: mode,
+        data: historyData,
+        // Human-friendly HTML path, recorded only when a report was generated
+        htmlPath: ctx.htmlContent ? `.peakinfer/${reportProjectSlug(ctx)}_peakinfer_report.html` : undefined,
+        pdfPath: ctx.pdfPath,
+      });
+      break;
+    }
+    case 'compare': {
+      // v1.5: Compare with previous run
+      // Build current snapshot
+      const currentSnapshot: AnalysisSnapshot = {
+        runId: ctx.runId,
+        timestamp: new Date().toISOString(),
+        callsites: ctx.callsites || [],
+        insights: ctx.insights,
+      };
+      // Get baseline (specific run or latest)
+      let baselineRun;
+      if (ctx.opts.compareRunId) {
+        baselineRun = loadRun(ctx.opts.compareRunId);
+        if (!baselineRun) {
+          ctx.warnings.push(`Comparison skipped: run ${ctx.opts.compareRunId} not found`);
+          break;
+        }
+      } else {
+        baselineRun = getLatestRun(ctx.opts.path);
+        if (!baselineRun) {
+          ctx.warnings.push('Comparison skipped: no previous runs found');
+          break;
+        }
+      }
+      // Build baseline snapshot
+      const baselineSnapshot: AnalysisSnapshot = {
+        runId: baselineRun.manifest.runId,
+        timestamp: baselineRun.manifest.timestamp,
+        callsites: baselineRun.data.inferenceMap?.callsites || [],
+        insights: baselineRun.data.insights,
+      };
+      // Perform comparison
+      ctx.comparison = compareSnapshots(baselineSnapshot, currentSnapshot);
+      onProgress?.({ phase: 'generating', detail: `compared with ${baselineRun.manifest.runId.slice(0, 8)}` });
+      break;
+    }
+    case 'predict': {
+      // v1.5: Generate deploy-time latency predictions
+      if (!ctx.inferenceMap) {
+        ctx.warnings.push('Prediction skipped: no inference map available');
+        break;
+      }
+      // Generate predictions based on inference points
+      const predictionResult = generatePredictions(
+        ctx.inferenceMap,
+        0, // Historical run count (can be enhanced later with actual history)
+        { targetP95: ctx.opts.targetP95 }
+      );
+      ctx.prediction = predictionResult;
+      // Log summary for progress
+      const riskCount = predictionResult.summary.highRiskCount + predictionResult.summary.mediumRiskCount;
+      onProgress?.({
+        phase: 'generating',
+        detail: `${predictionResult.predictions.length} predictions, ${riskCount} at risk`,
+      });
+      break;
+    }
+    case 'counterfactuals': {
+      // v1.5: Generate what-if optimization scenarios
+      if (!ctx.inferenceMap) {
+        ctx.warnings.push('Counterfactuals skipped: no inference map available');
+        break;
+      }
+      // Generate counterfactual insights
+      const counterfactualResult = generateCounterfactuals(ctx.inferenceMap);
+      ctx.counterfactuals = counterfactualResult;
+      // Log summary for progress
+      onProgress?.({
+        phase: 'generating',
+        detail: `${counterfactualResult.summary.totalOpportunities} optimization opportunities`,
+      });
+      break;
+    }
+  }
+}
+/**
+ * Last path segment of the analyzed project, used to name report files.
+ * Prefers the absolute path recorded in the inference map and falls back to the
+ * path given on the command line; yields 'project' when no segment is left.
+ */
+function reportProjectName(ctx: AgentContext): string {
+  const absolutePath = ctx.inferenceMap?.metadata?.absolutePath || ctx.opts.path;
+  return absolutePath.split('/').filter(Boolean).pop() || 'project';
+}
+/**
+ * File-name-safe form of the project name: lower-cased, runs of characters outside
+ * [a-z0-9] collapsed to '_', leading/trailing '_' trimmed, at most 50 characters.
+ */
+function reportProjectSlug(ctx: AgentContext): string {
+  return reportProjectName(ctx).toLowerCase().replace(/[^a-z0-9]+/g, '_').replace(/^_+|_+$/g, '').substring(0, 50);
+}
+interface MapMetadata { // Optional provenance handed to buildInferenceMap(); every field may be omitted
+  promptId?: string; // Id of the analysis prompt; buildInferenceMap() substitutes 'peak-performance' when unset
+  promptVersion?: string; // Version of that prompt, copied into the map metadata unchanged
+  llmUsed?: boolean; // When truthy the map records llmProvider 'anthropic' and a model id; otherwise 'none'
+}
+/**
+ * Assembles the InferenceMap document for a set of callsites.
+ *
+ * Besides copying the callsites through, it derives the summary section: the distinct
+ * non-empty providers and models, and for each pattern name the number of callsites on
+ * which that pattern is truthy.
+ *
+ * @param root - Analyzed path as given by the user; also stored resolved to an absolute path.
+ * @param callsites - Callsites to include; an empty array yields an empty but valid map.
+ * @param metadata - Optional prompt/LLM provenance; defaults to no provenance.
+ * @returns A freshly built map stamped with the current time.
+ */
+function buildInferenceMap(
+  root: string,
+  callsites: Callsite[],
+  metadata: MapMetadata = {}
+): InferenceMap {
+  const providers = [...new Set(callsites.map(c => c.provider).filter(Boolean))] as string[];
+  const models = [...new Set(callsites.map(c => c.model).filter(Boolean))] as string[];
+  const patternCounts: Record<string, number> = {};
+  for (const cs of callsites) {
+    // Callsites come from analyzer output and may lack a `patterns` object; treat that as
+    // "no patterns" instead of letting Object.entries() throw and sink the whole map.
+    for (const [pattern, enabled] of Object.entries(cs.patterns ?? {})) {
+      if (enabled) {
+        patternCounts[pattern] = (patternCounts[pattern] || 0) + 1;
+      }
+    }
+  }
+  return {
+    version: '0.1',  // InferenceMap schema version (not CLI version)
+    root,
+    generatedAt: new Date().toISOString(),
+    metadata: {
+      absolutePath: resolve(root),
+      promptId: metadata.promptId || 'peak-performance',
+      promptVersion: metadata.promptVersion,
+      templatesVersion: VERSION,  // CLI version for audit trail
+      // Provider and model are fixed values here, reported only when an LLM was used
+      llmProvider: metadata.llmUsed ? 'anthropic' : 'none',
+      llmModel: metadata.llmUsed ? 'claude-sonnet-4-20250514' : undefined,
+    },
+    summary: {
+      totalCallsites: callsites.length,
+      providers,
+      models,
+      patterns: patternCounts,
+    },
+    callsites,
+  };
+}
+// =============================================================================
+// PUBLIC API
+// =============================================================================
+/**
+ * Public entry point of the agent: plans a run, executes the planned tasks in order and
+ * reports lifecycle events through the optional callbacks.
+ */
+export class Agent {
+  private callbacks: AgentCallbacks;
+  /**
+   * @param callbacks - Lifecycle hooks; each hook is optional and is skipped when absent.
+   */
+  constructor(callbacks: AgentCallbacks = {}) {
+    this.callbacks = callbacks;
+  }
+  /**
+   * Plans and executes one analysis run.
+   *
+   * Tasks run sequentially against a shared context. A failing task is reported through
+   * `onTaskComplete` with status 'failed'; only a failing `scan` task (other than
+   * "Load cached results") aborts the run, every other failure leaves the run going with
+   * whatever state was produced so far.
+   *
+   * @param opts - Run options; `opts.out`, when set, is the path the JSON export is written to.
+   * @returns The aggregated results of the run, also passed to `onComplete`.
+   * @throws The original error of a failed critical `scan` task; errors from writing
+   *   `opts.out` and errors thrown by callbacks also propagate.
+   */
+  async run(opts: AgentOptions): Promise<AgentResults> {
+    const planResult = plan(opts);
+    const { plan: executionPlan, runId, canResume, runDir } = planResult;
+    // Notify if resuming from cache
+    if (canResume) {
+      this.callbacks.onResumed?.(runId);
+    }
+    this.callbacks.onPlanReady?.(executionPlan);
+    const ctx: AgentContext = {
+      opts,
+      runId,
+      resumed: canResume,
+      warnings: [],
+    };
+    // Load templates once (not needed if resuming)
+    const templates = canResume ? [] : await loadTemplates({ offline: opts.offline });
+    for (const task of executionPlan.tasks) {
+      this.callbacks.onTaskStart?.(task);
+      const startTime = Date.now();
+      // Only the task itself runs inside the try: an exception thrown by a callback must
+      // not be mistaken for a task failure (and must not trigger a second notification).
+      let failed = false;
+      let failure: unknown;
+      try {
+        await executeTask(task, ctx, templates, runDir, this.callbacks.onProgress);
+      } catch (error) {
+        failed = true;
+        failure = error;
+      }
+      const result: TaskResult = failed
+        ? {
+            taskId: task.id,
+            status: 'failed',
+            error: failure instanceof Error ? failure.message : String(failure),
+            durationMs: Date.now() - startTime,
+          }
+        : {
+            taskId: task.id,
+            status: 'success',
+            durationMs: Date.now() - startTime,
+          };
+      this.callbacks.onTaskComplete?.(task, result);
+      // Critical tasks abort execution only if not partial-safe; everything else
+      // (analyze, parse_events, ...) may fail and leave partial state behind.
+      if (failed && task.type === 'scan' && task.description !== 'Load cached results') {
+        throw failure;
+      }
+    }
+    // Notify if there were warnings (partial state)
+    if (ctx.warnings.length > 0) {
+      this.callbacks.onPartial?.(ctx.warnings);
+    }
+    // Generate human-friendly report filename (only reported when HTML was produced)
+    const absolutePath = ctx.inferenceMap?.metadata?.absolutePath || opts.path;
+    const projectName = absolutePath.split('/').filter(Boolean).pop() || 'project';
+    const projectSlug = projectName.toLowerCase().replace(/[^a-z0-9]+/g, '_').replace(/^_+|_+$/g, '').substring(0, 50);
+    const reportFileName = ctx.htmlContent
+      ? `.peakinfer/${projectSlug}_peakinfer_report.html`
+      : undefined;
+    const agentResults: AgentResults = {
+      mode: executionPlan.mode,
+      runId,
+      resumed: canResume,
+      scanResult: ctx.scanResult,
+      callsites: ctx.callsites,
+      events: ctx.events,
+      runtimeSummary: ctx.runtimeSummary,
+      joined: ctx.joined,
+      insights: ctx.insights || [],
+      impactSummary: ctx.impactSummary,
+      inferenceMap: ctx.inferenceMap,
+      staticAnalysis: ctx.staticAnalysis,
+      comparison: ctx.comparison, // v1.5: Historical comparison
+      prediction: ctx.prediction, // v1.5: Deploy-time predictions
+      counterfactuals: ctx.counterfactuals, // v1.5: What-if scenarios
+      htmlPath: reportFileName,
+      pdfPath: ctx.pdfPath,
+      warnings: ctx.warnings.length > 0 ? ctx.warnings : undefined,
+    };
+    // Handle --out: write output to file
+    if (opts.out) {
+      const outputData = {
+        schema: 'peakinfer-analysis',
+        version: '1.0',  // Analysis export format version
+        cliVersion: VERSION,
+        mode: agentResults.mode,
+        runId: agentResults.runId,
+        timestamp: new Date().toISOString(),
+        inferenceMap: agentResults.inferenceMap,
+        insights: agentResults.insights,
+        impactSummary: agentResults.impactSummary,
+        comparison: agentResults.comparison,
+        prediction: agentResults.prediction,
+        counterfactuals: agentResults.counterfactuals,
+        runtimeSummary: agentResults.runtimeSummary,
+      };
+      writeFileSync(opts.out, JSON.stringify(outputData, null, 2));
+    }
+    this.callbacks.onComplete?.(agentResults);
+    return agentResults;
+  }
+}