@peakinfer/cli 1.0.133

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (367)
  1. package/.claude/settings.local.json +8 -0
  2. package/.env.example +6 -0
  3. package/.github/workflows/peakinfer.yml +64 -0
  4. package/CHANGELOG.md +31 -0
  5. package/LICENSE +190 -0
  6. package/README.md +335 -0
  7. package/data/inferencemax.json +274 -0
  8. package/dist/agent-analyzer.d.ts +45 -0
  9. package/dist/agent-analyzer.d.ts.map +1 -0
  10. package/dist/agent-analyzer.js +374 -0
  11. package/dist/agent-analyzer.js.map +1 -0
  12. package/dist/agent.d.ts +76 -0
  13. package/dist/agent.d.ts.map +1 -0
  14. package/dist/agent.js +965 -0
  15. package/dist/agent.js.map +1 -0
  16. package/dist/agents/correlation-analyzer.d.ts +34 -0
  17. package/dist/agents/correlation-analyzer.d.ts.map +1 -0
  18. package/dist/agents/correlation-analyzer.js +261 -0
  19. package/dist/agents/correlation-analyzer.js.map +1 -0
  20. package/dist/agents/index.d.ts +91 -0
  21. package/dist/agents/index.d.ts.map +1 -0
  22. package/dist/agents/index.js +111 -0
  23. package/dist/agents/index.js.map +1 -0
  24. package/dist/agents/runtime-analyzer.d.ts +38 -0
  25. package/dist/agents/runtime-analyzer.d.ts.map +1 -0
  26. package/dist/agents/runtime-analyzer.js +244 -0
  27. package/dist/agents/runtime-analyzer.js.map +1 -0
  28. package/dist/analysis-types.d.ts +500 -0
  29. package/dist/analysis-types.d.ts.map +1 -0
  30. package/dist/analysis-types.js +11 -0
  31. package/dist/analysis-types.js.map +1 -0
  32. package/dist/analytics.d.ts +25 -0
  33. package/dist/analytics.d.ts.map +1 -0
  34. package/dist/analytics.js +94 -0
  35. package/dist/analytics.js.map +1 -0
  36. package/dist/analyzer.d.ts +48 -0
  37. package/dist/analyzer.d.ts.map +1 -0
  38. package/dist/analyzer.js +547 -0
  39. package/dist/analyzer.js.map +1 -0
  40. package/dist/artifacts.d.ts +44 -0
  41. package/dist/artifacts.d.ts.map +1 -0
  42. package/dist/artifacts.js +165 -0
  43. package/dist/artifacts.js.map +1 -0
  44. package/dist/benchmarks/index.d.ts +88 -0
  45. package/dist/benchmarks/index.d.ts.map +1 -0
  46. package/dist/benchmarks/index.js +205 -0
  47. package/dist/benchmarks/index.js.map +1 -0
  48. package/dist/cli.d.ts +3 -0
  49. package/dist/cli.d.ts.map +1 -0
  50. package/dist/cli.js +427 -0
  51. package/dist/cli.js.map +1 -0
  52. package/dist/commands/ci.d.ts +19 -0
  53. package/dist/commands/ci.d.ts.map +1 -0
  54. package/dist/commands/ci.js +253 -0
  55. package/dist/commands/ci.js.map +1 -0
  56. package/dist/commands/config.d.ts +16 -0
  57. package/dist/commands/config.d.ts.map +1 -0
  58. package/dist/commands/config.js +249 -0
  59. package/dist/commands/config.js.map +1 -0
  60. package/dist/commands/demo.d.ts +15 -0
  61. package/dist/commands/demo.d.ts.map +1 -0
  62. package/dist/commands/demo.js +106 -0
  63. package/dist/commands/demo.js.map +1 -0
  64. package/dist/commands/export.d.ts +14 -0
  65. package/dist/commands/export.d.ts.map +1 -0
  66. package/dist/commands/export.js +209 -0
  67. package/dist/commands/export.js.map +1 -0
  68. package/dist/commands/history.d.ts +15 -0
  69. package/dist/commands/history.d.ts.map +1 -0
  70. package/dist/commands/history.js +389 -0
  71. package/dist/commands/history.js.map +1 -0
  72. package/dist/commands/template.d.ts +14 -0
  73. package/dist/commands/template.d.ts.map +1 -0
  74. package/dist/commands/template.js +341 -0
  75. package/dist/commands/template.js.map +1 -0
  76. package/dist/commands/validate-map.d.ts +12 -0
  77. package/dist/commands/validate-map.d.ts.map +1 -0
  78. package/dist/commands/validate-map.js +274 -0
  79. package/dist/commands/validate-map.js.map +1 -0
  80. package/dist/commands/whatif.d.ts +17 -0
  81. package/dist/commands/whatif.d.ts.map +1 -0
  82. package/dist/commands/whatif.js +206 -0
  83. package/dist/commands/whatif.js.map +1 -0
  84. package/dist/comparison.d.ts +38 -0
  85. package/dist/comparison.d.ts.map +1 -0
  86. package/dist/comparison.js +223 -0
  87. package/dist/comparison.js.map +1 -0
  88. package/dist/config.d.ts +42 -0
  89. package/dist/config.d.ts.map +1 -0
  90. package/dist/config.js +158 -0
  91. package/dist/config.js.map +1 -0
  92. package/dist/connectors/helicone.d.ts +9 -0
  93. package/dist/connectors/helicone.d.ts.map +1 -0
  94. package/dist/connectors/helicone.js +106 -0
  95. package/dist/connectors/helicone.js.map +1 -0
  96. package/dist/connectors/index.d.ts +37 -0
  97. package/dist/connectors/index.d.ts.map +1 -0
  98. package/dist/connectors/index.js +65 -0
  99. package/dist/connectors/index.js.map +1 -0
  100. package/dist/connectors/langsmith.d.ts +9 -0
  101. package/dist/connectors/langsmith.d.ts.map +1 -0
  102. package/dist/connectors/langsmith.js +122 -0
  103. package/dist/connectors/langsmith.js.map +1 -0
  104. package/dist/connectors/types.d.ts +83 -0
  105. package/dist/connectors/types.d.ts.map +1 -0
  106. package/dist/connectors/types.js +98 -0
  107. package/dist/connectors/types.js.map +1 -0
  108. package/dist/cost-estimator.d.ts +46 -0
  109. package/dist/cost-estimator.d.ts.map +1 -0
  110. package/dist/cost-estimator.js +104 -0
  111. package/dist/cost-estimator.js.map +1 -0
  112. package/dist/costs.d.ts +57 -0
  113. package/dist/costs.d.ts.map +1 -0
  114. package/dist/costs.js +251 -0
  115. package/dist/costs.js.map +1 -0
  116. package/dist/counterfactuals.d.ts +29 -0
  117. package/dist/counterfactuals.d.ts.map +1 -0
  118. package/dist/counterfactuals.js +448 -0
  119. package/dist/counterfactuals.js.map +1 -0
  120. package/dist/enhancement-prompts.d.ts +41 -0
  121. package/dist/enhancement-prompts.d.ts.map +1 -0
  122. package/dist/enhancement-prompts.js +88 -0
  123. package/dist/enhancement-prompts.js.map +1 -0
  124. package/dist/envelopes.d.ts +20 -0
  125. package/dist/envelopes.d.ts.map +1 -0
  126. package/dist/envelopes.js +790 -0
  127. package/dist/envelopes.js.map +1 -0
  128. package/dist/format-normalizer.d.ts +71 -0
  129. package/dist/format-normalizer.d.ts.map +1 -0
  130. package/dist/format-normalizer.js +1331 -0
  131. package/dist/format-normalizer.js.map +1 -0
  132. package/dist/history.d.ts +79 -0
  133. package/dist/history.d.ts.map +1 -0
  134. package/dist/history.js +313 -0
  135. package/dist/history.js.map +1 -0
  136. package/dist/html.d.ts +11 -0
  137. package/dist/html.d.ts.map +1 -0
  138. package/dist/html.js +463 -0
  139. package/dist/html.js.map +1 -0
  140. package/dist/impact.d.ts +42 -0
  141. package/dist/impact.d.ts.map +1 -0
  142. package/dist/impact.js +443 -0
  143. package/dist/impact.js.map +1 -0
  144. package/dist/index.d.ts +26 -0
  145. package/dist/index.d.ts.map +1 -0
  146. package/dist/index.js +34 -0
  147. package/dist/index.js.map +1 -0
  148. package/dist/insights.d.ts +5 -0
  149. package/dist/insights.d.ts.map +1 -0
  150. package/dist/insights.js +271 -0
  151. package/dist/insights.js.map +1 -0
  152. package/dist/joiner.d.ts +9 -0
  153. package/dist/joiner.d.ts.map +1 -0
  154. package/dist/joiner.js +247 -0
  155. package/dist/joiner.js.map +1 -0
  156. package/dist/orchestrator.d.ts +34 -0
  157. package/dist/orchestrator.d.ts.map +1 -0
  158. package/dist/orchestrator.js +827 -0
  159. package/dist/orchestrator.js.map +1 -0
  160. package/dist/pdf.d.ts +26 -0
  161. package/dist/pdf.d.ts.map +1 -0
  162. package/dist/pdf.js +84 -0
  163. package/dist/pdf.js.map +1 -0
  164. package/dist/prediction.d.ts +33 -0
  165. package/dist/prediction.d.ts.map +1 -0
  166. package/dist/prediction.js +316 -0
  167. package/dist/prediction.js.map +1 -0
  168. package/dist/prompts/loader.d.ts +38 -0
  169. package/dist/prompts/loader.d.ts.map +1 -0
  170. package/dist/prompts/loader.js +60 -0
  171. package/dist/prompts/loader.js.map +1 -0
  172. package/dist/renderer.d.ts +64 -0
  173. package/dist/renderer.d.ts.map +1 -0
  174. package/dist/renderer.js +923 -0
  175. package/dist/renderer.js.map +1 -0
  176. package/dist/runid.d.ts +57 -0
  177. package/dist/runid.d.ts.map +1 -0
  178. package/dist/runid.js +199 -0
  179. package/dist/runid.js.map +1 -0
  180. package/dist/runtime.d.ts +29 -0
  181. package/dist/runtime.d.ts.map +1 -0
  182. package/dist/runtime.js +366 -0
  183. package/dist/runtime.js.map +1 -0
  184. package/dist/scanner.d.ts +11 -0
  185. package/dist/scanner.d.ts.map +1 -0
  186. package/dist/scanner.js +426 -0
  187. package/dist/scanner.js.map +1 -0
  188. package/dist/templates.d.ts +120 -0
  189. package/dist/templates.d.ts.map +1 -0
  190. package/dist/templates.js +429 -0
  191. package/dist/templates.js.map +1 -0
  192. package/dist/tools/index.d.ts +153 -0
  193. package/dist/tools/index.d.ts.map +1 -0
  194. package/dist/tools/index.js +177 -0
  195. package/dist/tools/index.js.map +1 -0
  196. package/dist/types.d.ts +3647 -0
  197. package/dist/types.d.ts.map +1 -0
  198. package/dist/types.js +703 -0
  199. package/dist/types.js.map +1 -0
  200. package/dist/version.d.ts +7 -0
  201. package/dist/version.d.ts.map +1 -0
  202. package/dist/version.js +23 -0
  203. package/dist/version.js.map +1 -0
  204. package/docs/demo-guide.md +423 -0
  205. package/docs/events-format.md +295 -0
  206. package/docs/inferencemap-spec.md +344 -0
  207. package/docs/migration-v2.md +293 -0
  208. package/fixtures/demo/precomputed.json +142 -0
  209. package/fixtures/demo-project/README.md +52 -0
  210. package/fixtures/demo-project/ai-service.ts +65 -0
  211. package/fixtures/demo-project/sample-events.jsonl +15 -0
  212. package/fixtures/demo-project/src/ai-service.ts +128 -0
  213. package/fixtures/demo-project/src/llm-client.ts +155 -0
  214. package/package.json +65 -0
  215. package/prompts/agent-analyzer.yaml +47 -0
  216. package/prompts/ci-gate.yaml +98 -0
  217. package/prompts/correlation-analyzer.yaml +178 -0
  218. package/prompts/format-normalizer.yaml +46 -0
  219. package/prompts/peak-performance.yaml +180 -0
  220. package/prompts/pr-comment.yaml +111 -0
  221. package/prompts/runtime-analyzer.yaml +189 -0
  222. package/prompts/unified-analyzer.yaml +241 -0
  223. package/schemas/inference-map.v0.1.json +215 -0
  224. package/scripts/benchmark.ts +394 -0
  225. package/scripts/demo-v1.5.sh +158 -0
  226. package/scripts/sync-from-site.sh +197 -0
  227. package/scripts/validate-sync.sh +178 -0
  228. package/src/agent-analyzer.ts +481 -0
  229. package/src/agent.ts +1232 -0
  230. package/src/agents/correlation-analyzer.ts +353 -0
  231. package/src/agents/index.ts +235 -0
  232. package/src/agents/runtime-analyzer.ts +343 -0
  233. package/src/analysis-types.ts +558 -0
  234. package/src/analytics.ts +100 -0
  235. package/src/analyzer.ts +692 -0
  236. package/src/artifacts.ts +218 -0
  237. package/src/benchmarks/index.ts +309 -0
  238. package/src/cli.ts +503 -0
  239. package/src/commands/ci.ts +336 -0
  240. package/src/commands/config.ts +288 -0
  241. package/src/commands/demo.ts +175 -0
  242. package/src/commands/export.ts +297 -0
  243. package/src/commands/history.ts +425 -0
  244. package/src/commands/template.ts +385 -0
  245. package/src/commands/validate-map.ts +324 -0
  246. package/src/commands/whatif.ts +272 -0
  247. package/src/comparison.ts +283 -0
  248. package/src/config.ts +188 -0
  249. package/src/connectors/helicone.ts +164 -0
  250. package/src/connectors/index.ts +93 -0
  251. package/src/connectors/langsmith.ts +179 -0
  252. package/src/connectors/types.ts +180 -0
  253. package/src/cost-estimator.ts +146 -0
  254. package/src/costs.ts +347 -0
  255. package/src/counterfactuals.ts +516 -0
  256. package/src/enhancement-prompts.ts +118 -0
  257. package/src/envelopes.ts +814 -0
  258. package/src/format-normalizer.ts +1486 -0
  259. package/src/history.ts +400 -0
  260. package/src/html.ts +512 -0
  261. package/src/impact.ts +522 -0
  262. package/src/index.ts +83 -0
  263. package/src/insights.ts +341 -0
  264. package/src/joiner.ts +289 -0
  265. package/src/orchestrator.ts +1015 -0
  266. package/src/pdf.ts +110 -0
  267. package/src/prediction.ts +392 -0
  268. package/src/prompts/loader.ts +88 -0
  269. package/src/renderer.ts +1045 -0
  270. package/src/runid.ts +261 -0
  271. package/src/runtime.ts +450 -0
  272. package/src/scanner.ts +508 -0
  273. package/src/templates.ts +561 -0
  274. package/src/tools/index.ts +214 -0
  275. package/src/types.ts +873 -0
  276. package/src/version.ts +24 -0
  277. package/templates/context-accumulation.yaml +23 -0
  278. package/templates/cost-concentration.yaml +20 -0
  279. package/templates/dead-code.yaml +20 -0
  280. package/templates/latency-explainer.yaml +23 -0
  281. package/templates/optimizations/ab-testing-framework.yaml +74 -0
  282. package/templates/optimizations/api-gateway-optimization.yaml +81 -0
  283. package/templates/optimizations/api-model-routing-strategy.yaml +126 -0
  284. package/templates/optimizations/auto-scaling-optimization.yaml +85 -0
  285. package/templates/optimizations/batch-utilization-diagnostic.yaml +142 -0
  286. package/templates/optimizations/comprehensive-apm.yaml +76 -0
  287. package/templates/optimizations/context-window-optimization.yaml +91 -0
  288. package/templates/optimizations/cost-sensitive-batch-processing.yaml +77 -0
  289. package/templates/optimizations/distributed-training-optimization.yaml +77 -0
  290. package/templates/optimizations/document-analysis-edge.yaml +77 -0
  291. package/templates/optimizations/document-pipeline-optimization.yaml +78 -0
  292. package/templates/optimizations/domain-specific-distillation.yaml +78 -0
  293. package/templates/optimizations/error-handling-optimization.yaml +76 -0
  294. package/templates/optimizations/gptq-4bit-quantization.yaml +96 -0
  295. package/templates/optimizations/long-context-memory-management.yaml +78 -0
  296. package/templates/optimizations/max-tokens-optimization.yaml +76 -0
  297. package/templates/optimizations/memory-bandwidth-optimization.yaml +73 -0
  298. package/templates/optimizations/multi-framework-resilience.yaml +75 -0
  299. package/templates/optimizations/multi-tenant-optimization.yaml +75 -0
  300. package/templates/optimizations/prompt-caching-optimization.yaml +143 -0
  301. package/templates/optimizations/pytorch-to-onnx-migration.yaml +109 -0
  302. package/templates/optimizations/quality-monitoring.yaml +74 -0
  303. package/templates/optimizations/realtime-budget-controls.yaml +74 -0
  304. package/templates/optimizations/realtime-latency-optimization.yaml +74 -0
  305. package/templates/optimizations/sglang-concurrency-optimization.yaml +78 -0
  306. package/templates/optimizations/smart-model-routing.yaml +96 -0
  307. package/templates/optimizations/streaming-batch-selection.yaml +167 -0
  308. package/templates/optimizations/system-prompt-optimization.yaml +75 -0
  309. package/templates/optimizations/tensorrt-llm-performance.yaml +77 -0
  310. package/templates/optimizations/vllm-high-throughput-optimization.yaml +93 -0
  311. package/templates/optimizations/vllm-migration-memory-bound.yaml +78 -0
  312. package/templates/overpowered-extraction.yaml +32 -0
  313. package/templates/overpowered-model.yaml +31 -0
  314. package/templates/prompt-bloat.yaml +24 -0
  315. package/templates/retry-explosion.yaml +28 -0
  316. package/templates/schema/insight.schema.json +113 -0
  317. package/templates/schema/optimization.schema.json +180 -0
  318. package/templates/streaming-drift.yaml +30 -0
  319. package/templates/throughput-gap.yaml +21 -0
  320. package/templates/token-underutilization.yaml +28 -0
  321. package/templates/untested-fallback.yaml +21 -0
  322. package/tests/accuracy/drift-detection.test.ts +184 -0
  323. package/tests/accuracy/false-positives.test.ts +166 -0
  324. package/tests/accuracy/templates.test.ts +205 -0
  325. package/tests/action/commands.test.ts +125 -0
  326. package/tests/action/comments.test.ts +347 -0
  327. package/tests/cli.test.ts +203 -0
  328. package/tests/comparison.test.ts +309 -0
  329. package/tests/correlation-analyzer.test.ts +534 -0
  330. package/tests/counterfactuals.test.ts +347 -0
  331. package/tests/fixtures/events/missing-id.jsonl +1 -0
  332. package/tests/fixtures/events/missing-input.jsonl +1 -0
  333. package/tests/fixtures/events/missing-latency.jsonl +1 -0
  334. package/tests/fixtures/events/missing-model.jsonl +1 -0
  335. package/tests/fixtures/events/missing-output.jsonl +1 -0
  336. package/tests/fixtures/events/missing-provider.jsonl +1 -0
  337. package/tests/fixtures/events/missing-ts.jsonl +1 -0
  338. package/tests/fixtures/events/valid.csv +3 -0
  339. package/tests/fixtures/events/valid.json +1 -0
  340. package/tests/fixtures/events/valid.jsonl +2 -0
  341. package/tests/fixtures/events/with-callsite.jsonl +1 -0
  342. package/tests/fixtures/events/with-intent.jsonl +1 -0
  343. package/tests/fixtures/events/wrong-type.jsonl +1 -0
  344. package/tests/fixtures/repos/empty/.gitkeep +0 -0
  345. package/tests/fixtures/repos/hybrid-router/router.py +35 -0
  346. package/tests/fixtures/repos/saas-anthropic/agent.ts +27 -0
  347. package/tests/fixtures/repos/saas-openai/assistant.js +33 -0
  348. package/tests/fixtures/repos/saas-openai/client.py +26 -0
  349. package/tests/fixtures/repos/self-hosted-vllm/inference.py +22 -0
  350. package/tests/github-action.test.ts +292 -0
  351. package/tests/insights.test.ts +878 -0
  352. package/tests/joiner.test.ts +168 -0
  353. package/tests/performance/action-latency.test.ts +132 -0
  354. package/tests/performance/benchmark.test.ts +189 -0
  355. package/tests/performance/cli-latency.test.ts +102 -0
  356. package/tests/pr-comment.test.ts +313 -0
  357. package/tests/prediction.test.ts +296 -0
  358. package/tests/runtime-analyzer.test.ts +375 -0
  359. package/tests/runtime.test.ts +205 -0
  360. package/tests/scanner.test.ts +122 -0
  361. package/tests/template-conformance.test.ts +526 -0
  362. package/tests/unit/cost-calculator.test.ts +303 -0
  363. package/tests/unit/credits.test.ts +180 -0
  364. package/tests/unit/inference-map.test.ts +276 -0
  365. package/tests/unit/schema.test.ts +300 -0
  366. package/tsconfig.json +20 -0
  367. package/vitest.config.ts +14 -0
@@ -0,0 +1,692 @@
1
+ import { readFileSync } from 'fs';
2
+ import { join } from 'path';
3
+ import { query } from '@anthropic-ai/claude-agent-sdk';
4
+ import type { SDKMessage } from '@anthropic-ai/claude-agent-sdk';
5
+ import type { ScanResult, Callsite, Patterns, Provider } from './types.js';
6
+ import { createHash } from 'crypto';
7
+ import { loadPrompt, getDefaultPrompt, loadConfig, getConfiguredMode, isCascadeEnabled, type AnalysisPrompt } from './templates.js';
8
+ import { analyzeWithAgent, convertAgentCallsites } from './agent-analyzer.js';
9
+
10
+ // =============================================================================
11
+ // CONSTANTS
12
+ // =============================================================================
13
+
14
// Process files in small batches so the progress callback fires often and the
// UI advances smoothly during long LLM calls.
const LLM_BATCH_SIZE = 2;
// Max chars per file to send to the LLM (enforced by truncateContent).
const MAX_CONTEXT_CHARS = 4000;
16
+
17
// Fallback regex patterns (used when LLM unavailable).
// Keyed by canonical provider id; a context/file matching ANY pattern in a
// value array is attributed to that provider. Entries are tried in insertion
// order and the first match wins (see detectProviderRegex), so order matters
// for ambiguous files (e.g. azure wrappers that also mention "openai").
const PROVIDER_PATTERNS: Record<string, RegExp[]> = {
  openai: [/openai/i, /\.chat\.completions\.create/, /\.embeddings\.create/, /from\s+['"]openai['"]/],
  anthropic: [/anthropic/i, /\.messages\.create/, /from\s+['"]@anthropic-ai/],
  google: [/google\.generative/i, /genai\./, /from\s+['"]@google\/generative/],
  together: [/together/i, /Together\s*\(/, /from\s+['"]together/],
  fireworks: [/fireworks/i, /Fireworks\s*\(/],
  groq: [/groq/i, /Groq\s*\(/],
  mistral: [/mistral/i, /Mistral\s*\(/],
  cohere: [/cohere/i, /Cohere\s*\(/],
  replicate: [/replicate/i, /Replicate\s*\(/],
  aws_bedrock: [/bedrock/i, /BedrockRuntime/],
  azure: [/azure.*openai/i, /AzureOpenAI/],
  vllm: [/vllm/i, /from\s+vllm/],
  sglang: [/sglang/i, /SGLang/],
  ollama: [/ollama/i, /Ollama\s*\(/],
};
34
+
35
// Framework detection patterns (regex fallback). Tried in insertion order;
// the first framework with any matching pattern wins (see detectFrameworkRegex).
const FRAMEWORK_PATTERNS: Record<string, RegExp[]> = {
  dspy: [/import\s+dspy/, /from\s+dspy/, /dspy\.Predict/, /dspy\.ChainOfThought/, /dspy\.LM\(/],
  langchain: [/from\s+langchain/, /import\s+langchain/, /ChatOpenAI\(/, /LLMChain\(/],
  llamaindex: [/from\s+llama_index/, /import\s+llama_index/, /llama_index\.llms/],
};
41
+
42
// Patterns that capture a model name in group 1 (regex fallback).
// Tried in order; the first pattern with a non-empty capture wins
// (see detectModelRegex).
const MODEL_PATTERNS: RegExp[] = [
  /model\s*[=:]\s*['"]([^'"]+)['"]/i,
  /model_name\s*[=:]\s*['"]([^'"]+)['"]/i,
  /modelId\s*[=:]\s*['"]([^'"]+)['"]/i,
  // DSPy-style: dspy.LM("openai/gpt-4o-mini") or dspy.LM("anthropic/claude-3-5-sonnet")
  // — the optional non-capturing group strips the "provider/" prefix.
  /dspy\.LM\s*\(\s*['"](?:[\w-]+\/)?([^'"]+)['"]/i,
  // Embeddings models (model kwarg inside an embeddings.create(...) call)
  /embeddings\.create\([^)]*model\s*[=:]\s*['"]([^'"]+)['"]/i,
];
51
+
52
// Heuristic signals for each Patterns flag; a flag is considered present when
// any of its regexes matches the callsite context (regex fallback path).
const PATTERN_DETECTORS: Record<keyof Patterns, RegExp[]> = {
  streaming: [/stream\s*[=:]\s*true/i, /\.stream\s*\(/, /for\s+await\s*\(/],
  batching: [/batch/i, /Promise\.all/, /\.map\s*\(\s*async/],
  retries: [/retry/i, /max_retries/i, /backoff/i],
  caching: [/cache/i, /memoize/i, /redis/i],
  fallback: [/fallback/i, /\.catch\s*\(/, /except\s*:/],
};
59
+
60
+ // =============================================================================
61
+ // TYPES
62
+ // =============================================================================
63
+
64
/**
 * A single LLM API callsite as reported by the model-based analysis pass.
 * Mirrors the JSON schema requested in the analysis prompt.
 */
interface LLMCallsite {
  /** Line number of the inference call itself (not client initialization);
   *  matched against the scanner's candidate lines when mapping back to files. */
  line: number;
  /** Canonical provider id (e.g. 'openai'), or null when undetermined. */
  provider: string | null;
  /** Exact model name as written in the code, or null when undetermined. */
  model: string | null;
  /** Orchestration framework (langchain, llamaindex, dspy), or null. */
  framework: string | null;
  /** Usage-pattern flags the model observed around the call. */
  patterns: {
    streaming?: boolean;
    batching?: boolean;
    retries?: boolean;
    caching?: boolean;
    fallback?: boolean;
  };
  /** Model self-reported confidence, 0.0 to 1.0. */
  confidence: number;
  /** Brief model-provided justification for the detection. */
  reasoning: string;
}
79
+
80
// LLM-generated impact estimate (v1.8: 6-layer architecture)
/**
 * Estimated impact of acting on an insight, attributed to one layer of the
 * inference stack.
 */
export interface LLMImpactEstimate {
  /** Stack layer the optimization applies to. */
  layer: 'application' | 'api' | 'gateway' | 'runtime' | 'model' | 'hardware';
  /** Dimension the estimate applies to. */
  impactType: 'cost' | 'latency' | 'throughput';
  /** Expected improvement in percent (model-estimated, not measured). */
  estimatedImpactPercent: number;
  /** Rough implementation effort. */
  effort: 'low' | 'medium' | 'high';
}
87
+
88
// LLM-generated semantic insight (exported for use by agent)
/**
 * A single issue or observation produced by the analysis pass.
 * Severity/category values may arrive in non-canonical spellings from the
 * model and are coerced onto these unions by normalizeInsight before use.
 */
export interface LLMInsight {
  severity: 'critical' | 'warning' | 'info';
  category: 'cost' | 'latency' | 'reliability' | 'waste' | 'security' | 'best-practice' | 'throughput';
  /** One-line summary of the finding. */
  headline: string;
  /** Supporting detail grounded in the analyzed code. */
  evidence: string;
  location: string; // file:line
  /** Optional suggested remediation. */
  recommendation?: string;
  impact?: LLMImpactEstimate; // LLM-generated impact estimate
}
98
+
99
/**
 * Shape of the single JSON object the analysis prompt instructs the model to
 * return (see getStaticAnalysisPrompt); parsed from the reply in analyzewithLLM.
 */
interface LLMAnalysisResult {
  callsites: LLMCallsite[];
  insights: LLMInsight[];
}
103
+
104
/** Options controlling how the analysis pass runs. */
interface AnalyzeOptions {
  /** Use LLM-based analysis (regex patterns are the fallback when unavailable). */
  useLLM?: boolean;
  useAgent?: boolean; // Use agent-based analysis with tool use (Opus 4.5) for better accuracy
  /** Emit extra diagnostic output. */
  verbose?: boolean;
  promptId?: string; // ID of the analysis prompt to use (defaults to 'peak-performance')
  onProgress?: (data: { percent: number; currentFile?: string }) => void; // Progress callback
}
111
+
112
+ // =============================================================================
113
+ // HELPERS
114
+ // =============================================================================
115
+
116
+ function generateCallsiteId(file: string, line: number): string {
117
+ const hash = createHash('sha256')
118
+ .update(`${file}:${line}`)
119
+ .digest('hex')
120
+ .slice(0, 8);
121
+ return `cs_${hash}`;
122
+ }
123
+
124
+ function extractContext(content: string, line: number, windowSize: number = 10): string {
125
+ const lines = content.split('\n');
126
+ const start = Math.max(0, line - windowSize);
127
+ const end = Math.min(lines.length, line + windowSize);
128
+ return lines.slice(start, end).join('\n');
129
+ }
130
+
131
+ function truncateContent(content: string): string {
132
+ if (content.length <= MAX_CONTEXT_CHARS) return content;
133
+ return content.slice(0, MAX_CONTEXT_CHARS) + '\n// ... truncated ...';
134
+ }
135
+
136
+ // =============================================================================
137
+ // LLM ANALYSIS (Claude Agent SDK)
138
+ // =============================================================================
139
+
140
+ /**
141
+ * Extract text content from Claude Agent SDK messages
142
+ */
143
+ function extractTextFromMessages(messages: SDKMessage[]): string {
144
+ let text = '';
145
+ for (const msg of messages) {
146
+ if (msg.type === 'assistant' && msg.message?.content) {
147
+ for (const block of msg.message.content) {
148
+ if (block.type === 'text') {
149
+ text += block.text;
150
+ }
151
+ }
152
+ }
153
+ }
154
+ return text;
155
+ }
156
+
157
// Legacy static analysis prompt (hardcoded fallback)
// NOTE: Primary analysis now uses unified-analyzer.yaml via StaticAnalysisOrchestrator
/**
 * Build the hardcoded fallback prompt for the LLM static-analysis pass.
 *
 * The prompt demands a single JSON object with `callsites` and `insights`
 * arrays; the caller extracts the first {...} span from the reply and
 * JSON.parses it, so the prompt insists on JSON-only output and on the exact
 * enum spellings consumed downstream (see normalizeInsight for coercion of
 * near-miss values).
 *
 * NOTE(review): the category list in this prompt omits 'throughput', which
 * LLMInsight allows — presumably intentional for this legacy prompt; confirm.
 */
function getStaticAnalysisPrompt(): string {
  return `You are an expert at analyzing code to identify LLM inference usage and potential issues.

Analyze the following code and:

## PART 1: Identify LLM Usage
For each LLM API call, extract:
- line: The EXACT line number where the inference call is made (not client initialization)
- provider: MUST be one of: openai, anthropic, google, together, fireworks, groq, mistral, cohere, replicate, aws_bedrock, azure, vllm, sglang, ollama, unknown
- model: The EXACT model name as specified in the code (e.g., "gpt-4o", "gpt-4o-mini", "claude-3-5-sonnet-20241022", "text-embedding-3-small")
- framework: langchain, llamaindex, dspy, or null
- patterns: streaming, batching, retries, caching, fallback (true/false)
- confidence: 0.0 to 1.0
- reasoning: Brief explanation

CRITICAL RULES FOR MODEL EXTRACTION:
1. Look at the model= parameter in the SAME function call
2. If model is a variable, trace it to find the string value
3. For embeddings calls, use the embedding model name (e.g., "text-embedding-3-small"), NOT a chat model
4. For DSPy: look at dspy.LM("provider/model") or dspy.context(lm=...) to find the model
5. Return the FULL model name exactly as written (e.g., "gpt-4o-mini" not "gpt-4")

CRITICAL: DO NOT flag these as callsites:
- Client initialization: openai.OpenAI(), anthropic.Anthropic(), etc.
- Import statements
- Type annotations or comments
- Variable assignments without actual API calls

## PART 2: Generate Insights
Identify potential issues, anti-patterns, or improvements.

IMPORTANT - Use these EXACT values:
- severity: MUST be one of: "critical", "warning", "info"
- category: MUST be one of: "cost", "latency", "reliability", "waste", "security", "best-practice"

Issues to look for:
- Missing error handling for LLM calls (reliability)
- Hardcoded API keys or secrets (security)
- Inefficient patterns - no batching, no streaming (latency)
- Model selection issues - overpowered model for simple tasks (cost)
- Missing retries for production code (reliability)
- Cost optimization opportunities (cost)

Return ONLY valid JSON:
{
"callsites": [
{
"line": 42,
"provider": "openai",
"model": "gpt-4o",
"framework": null,
"patterns": {"streaming": true, "batching": false, "retries": true, "caching": false, "fallback": true},
"confidence": 0.95,
"reasoning": "Direct OpenAI API call"
}
],
"insights": [
{
"severity": "warning",
"category": "reliability",
"headline": "No retry logic for LLM call",
"evidence": "The API call at line 42 has no retry handling - LLM APIs can fail transiently",
"location": "src/chat.py:42",
"recommendation": "Add exponential backoff retry logic"
}
]
}

If no issues found, return empty arrays: {"callsites": [], "insights": []}`;
}
229
+
230
/** Aggregated result of analyzewithLLM across all batches. */
interface LLMAnalysisOutput {
  /** Detected callsites grouped by source-file path. */
  callsitesByFile: Map<string, LLMCallsite[]>;
  /** All insights from every batch, normalized to canonical values. */
  insights: LLMInsight[];
}
234
+
235
+ // Normalize LLM insights to valid values
236
+ function normalizeInsight(insight: LLMInsight): LLMInsight {
237
+ // Normalize severity
238
+ const severityMap: Record<string, 'critical' | 'warning' | 'info'> = {
239
+ error: 'critical',
240
+ high: 'critical',
241
+ medium: 'warning',
242
+ low: 'info',
243
+ };
244
+ const severity = severityMap[insight.severity] || insight.severity;
245
+
246
+ // Normalize category
247
+ const categoryMap: Record<string, 'cost' | 'latency' | 'reliability' | 'waste' | 'security' | 'best-practice'> = {
248
+ cost_optimization: 'cost',
249
+ performance: 'latency',
250
+ efficiency: 'waste',
251
+ error_handling: 'reliability',
252
+ 'error-handling': 'reliability',
253
+ };
254
+ const category = categoryMap[insight.category] || insight.category;
255
+
256
+ return {
257
+ ...insight,
258
+ severity: severity as 'critical' | 'warning' | 'info',
259
+ category: category as 'cost' | 'latency' | 'reliability' | 'waste' | 'security' | 'best-practice',
260
+ };
261
+ }
262
+
263
/**
 * LLM pass of static analysis: sends candidate files to the Claude Agent SDK
 * in batches of LLM_BATCH_SIZE, parses the JSON reply, and aggregates
 * callsites per file plus normalized insights.
 *
 * Failures are non-fatal: a batch whose SDK call or JSON parse throws is
 * simply skipped (the caller falls back to regex detection for it), and only
 * the first error is logged to keep output calm.
 *
 * @param files          Candidate files with the scanner's candidate line numbers.
 * @param analysisPrompt Instructions prepended to the batched file contents.
 * @param onProgress     Optional callback fired before and after each batch.
 */
async function analyzewithLLM(
  files: Array<{ path: string; content: string; candidateLines: number[] }>,
  analysisPrompt: string,
  onProgress?: (data: { percent: number; currentFile?: string }) => void
): Promise<LLMAnalysisOutput> {
  const callsitesByFile = new Map<string, LLMCallsite[]>();
  const allInsights: LLMInsight[] = [];
  const totalFiles = files.length;
  let llmErrorLogged = false; // Only log LLM errors once to avoid noise

  // Process in batches. (An empty `files` array skips the loop entirely, so
  // the percent computations below never divide by zero.)
  for (let i = 0; i < files.length; i += LLM_BATCH_SIZE) {
    const batch = files.slice(i, i + LLM_BATCH_SIZE);
    const currentFile = batch[0]?.path;

    // Show progress bar BEFORE processing (visible during LLM call)
    const percentBefore = Math.floor((i / totalFiles) * 100);
    onProgress?.({ percent: percentBefore, currentFile });

    // Concatenate every file in the batch into one prompt body, each tagged
    // with its path and candidate lines so the model can attribute findings.
    const fileContents = batch.map(f => {
      const truncated = truncateContent(f.content);
      return `=== FILE: ${f.path} ===\nCandidate lines: ${f.candidateLines.join(', ')}\n\n${truncated}`;
    }).join('\n\n');

    try {
      // Use Claude Agent SDK query() function
      const agentQuery = query({
        prompt: `${analysisPrompt}\n\n${fileContents}`,
        options: {
          model: 'claude-sonnet-4-20250514',
          tools: [], // no tool use in this pass — plain text completion
          permissionMode: 'plan',
          cwd: process.cwd(),
        },
      });

      // Collect all messages from the async generator
      const messages: SDKMessage[] = [];
      for await (const message of agentQuery) {
        messages.push(message);
      }

      // Extract text content from messages, then take the widest {...} span —
      // the prompt instructs the model to return ONLY a single JSON object.
      const text = extractTextFromMessages(messages);
      const jsonMatch = text.match(/\{[\s\S]*\}/);

      if (jsonMatch) {
        const parsed = JSON.parse(jsonMatch[0]) as LLMAnalysisResult;

        // Map callsites back to files: attribute each callsite to the first
        // batch file whose candidate lines contain its line number.
        // NOTE(review): if two files in the same batch share a candidate line
        // number, the callsite is credited to the first file only — confirm
        // this is acceptable for the current LLM_BATCH_SIZE of 2.
        for (const callsite of parsed.callsites) {
          for (const file of batch) {
            if (file.candidateLines.includes(callsite.line)) {
              const existing = callsitesByFile.get(file.path) || [];
              existing.push(callsite);
              callsitesByFile.set(file.path, existing);
              break;
            }
          }
        }

        // Collect insights (normalized to valid values)
        if (parsed.insights && Array.isArray(parsed.insights)) {
          allInsights.push(...parsed.insights.map(normalizeInsight));
        }
      }
    } catch (error) {
      // Continue with regex fallback for this batch.
      // Only log once to avoid noisy output (Julie Zhou: calm, not alarming)
      if (!llmErrorLogged) {
        llmErrorLogged = true;
        const errMsg = error instanceof Error ? error.message : String(error);
        // Extract just the error type for cleaner output
        const shortErr = errMsg.includes('authentication_error') ? 'invalid API key'
          : errMsg.includes('rate_limit') ? 'rate limited'
          : 'API error';
        console.warn(`[analyzer] Claude Agent SDK unavailable (${shortErr}), using pattern matching`);
      }
    }

    // Report progress AFTER batch completes
    const processedFiles = Math.min(i + LLM_BATCH_SIZE, totalFiles);
    const percentAfter = Math.floor((processedFiles / totalFiles) * 100);
    onProgress?.({ percent: percentAfter, currentFile });
  }

  return { callsitesByFile, insights: allInsights };
}
351
+
352
+ // =============================================================================
353
+ // REGEX FALLBACK
354
+ // =============================================================================
355
+
356
+ function detectProviderRegex(context: string, fileContent: string): string | undefined {
357
+ for (const [provider, patterns] of Object.entries(PROVIDER_PATTERNS)) {
358
+ for (const pattern of patterns) {
359
+ if (pattern.test(context) || pattern.test(fileContent)) {
360
+ return provider;
361
+ }
362
+ }
363
+ }
364
+ return undefined;
365
+ }
366
+
367
+ function detectFrameworkRegex(context: string, fileContent: string): string | null {
368
+ for (const [framework, patterns] of Object.entries(FRAMEWORK_PATTERNS)) {
369
+ for (const pattern of patterns) {
370
+ if (pattern.test(context) || pattern.test(fileContent)) {
371
+ return framework;
372
+ }
373
+ }
374
+ }
375
+ return null;
376
+ }
377
+
378
+ function detectModelRegex(context: string): string | undefined {
379
+ for (const pattern of MODEL_PATTERNS) {
380
+ const match = context.match(pattern);
381
+ if (match && match[1]) {
382
+ return match[1];
383
+ }
384
+ }
385
+ return undefined;
386
+ }
387
+
388
+ function detectPatternsRegex(context: string): Patterns {
389
+ const patterns: Patterns = {};
390
+
391
+ for (const [pattern, regexes] of Object.entries(PATTERN_DETECTORS)) {
392
+ for (const regex of regexes) {
393
+ if (regex.test(context)) {
394
+ patterns[pattern as keyof Patterns] = true;
395
+ break;
396
+ }
397
+ }
398
+ }
399
+
400
+ return patterns;
401
+ }
402
+
403
+ function calculateConfidence(
404
+ hasProvider: boolean,
405
+ hasModel: boolean,
406
+ patternCount: number
407
+ ): number {
408
+ let confidence = 0.3;
409
+ if (hasProvider) confidence += 0.3;
410
+ if (hasModel) confidence += 0.25;
411
+ if (patternCount > 0) confidence += 0.05 * Math.min(patternCount, 3);
412
+ return Math.min(confidence, 1.0);
413
+ }
414
+
415
+ // =============================================================================
416
+ // PUBLIC API
417
+ // =============================================================================
418
+
419
/**
 * Result of analyzing scan results.
 *
 * - `callsites`: one enriched entry per analyzable candidate line, carrying
 *   provider/model/framework/pattern metadata and a confidence score
 *   (LLM-derived when available, regex-derived otherwise).
 * - `insights`: semantic insights produced by LLM analysis (phase 1);
 *   empty when only the regex fallback ran.
 */
export interface AnalyzeResult {
  callsites: Callsite[];
  insights: LLMInsight[];
}
426
+
427
+ /**
428
+ * Analyze scan results to extract semantic information from callsites.
429
+ * Uses LLM for semantic analysis when ANTHROPIC_API_KEY is available,
430
+ * falls back to regex patterns otherwise.
431
+ *
432
+ * Returns both callsites AND LLM-generated semantic insights (phase 1).
433
+ * Template-based insights are generated separately (phase 2).
434
+ */
435
+ export async function analyze(
436
+ scanResult: ScanResult,
437
+ options: AnalyzeOptions = {}
438
+ ): Promise<AnalyzeResult> {
439
+ // Load config and determine analysis mode
440
+ const config = loadConfig();
441
+ const configuredMode = getConfiguredMode();
442
+ const cascadeEnabled = isCascadeEnabled();
443
+
444
+ // Options can override config, but config provides defaults
445
+ const {
446
+ useLLM = configuredMode === 'llm' || (configuredMode === 'agent' && cascadeEnabled),
447
+ useAgent = configuredMode === 'agent',
448
+ verbose = config.agent.verbose,
449
+ promptId,
450
+ onProgress
451
+ } = options;
452
+
453
+ if (verbose) {
454
+ console.log(`[analyzer] Mode: ${configuredMode}, Cascade: ${cascadeEnabled}`);
455
+ }
456
+
457
+ // First preference: Agent-based analysis (most accurate)
458
+ if (useAgent && process.env.ANTHROPIC_API_KEY) {
459
+ try {
460
+ if (verbose) {
461
+ console.log('[analyzer] Using agent-based analysis');
462
+ }
463
+ const agentResult = await analyzeWithAgent(scanResult, { verbose });
464
+ return {
465
+ callsites: convertAgentCallsites(agentResult.callsites),
466
+ insights: agentResult.insights as LLMInsight[],
467
+ };
468
+ } catch (error) {
469
+ if (cascadeEnabled) {
470
+ console.warn('[analyzer] Agent analysis failed, falling back to LLM/regex:', error);
471
+ // Fall through to LLM or regex analysis
472
+ } else {
473
+ throw error; // Don't cascade, re-throw
474
+ }
475
+ }
476
+ }
477
+
478
+ // Second preference: Single-prompt LLM analysis
479
+ // Third preference: Regex-only analysis (when useLLM=false or no API key)
480
+
481
+ const callsites: Callsite[] = [];
482
+ const llmInsights: LLMInsight[] = [];
483
+ const fileContents = new Map<string, string>();
484
+
485
+ // Load analysis prompt (from YAML config or fallback)
486
+ let analysisPromptText = getStaticAnalysisPrompt(); // Load from YAML or fallback
487
+ if (promptId) {
488
+ const customPrompt = loadPrompt(promptId);
489
+ if (customPrompt) {
490
+ analysisPromptText = customPrompt.prompt;
491
+ } else {
492
+ console.warn(`[analyzer] Prompt '${promptId}' not found, using default`);
493
+ }
494
+ } else {
495
+ // Try to load default peak-performance prompt
496
+ try {
497
+ const defaultPrompt = getDefaultPrompt();
498
+ analysisPromptText = defaultPrompt.prompt;
499
+ } catch {
500
+ // Use hardcoded fallback if prompts directory doesn't exist
501
+ }
502
+ }
503
+
504
+ // Read file contents
505
+ for (const file of scanResult.files) {
506
+ try {
507
+ const absPath = join(scanResult.root, file.path);
508
+ fileContents.set(file.path, readFileSync(absPath, 'utf-8'));
509
+ } catch {
510
+ continue;
511
+ }
512
+ }
513
+
514
+ // Group candidates by file
515
+ const candidatesByFile = new Map<string, number[]>();
516
+ for (const candidate of scanResult.candidates) {
517
+ const existing = candidatesByFile.get(candidate.file) || [];
518
+ existing.push(candidate.line);
519
+ candidatesByFile.set(candidate.file, existing);
520
+ }
521
+
522
+ // Try LLM analysis if API key available (Claude Agent SDK uses env var)
523
+ let llmOutput: LLMAnalysisOutput | null = null;
524
+
525
+ if (useLLM && process.env.ANTHROPIC_API_KEY) {
526
+ try {
527
+ const filesToAnalyze = Array.from(candidatesByFile.entries())
528
+ .filter(([path]) => fileContents.has(path))
529
+ .map(([path, lines]) => ({
530
+ path,
531
+ content: fileContents.get(path)!,
532
+ candidateLines: lines,
533
+ }));
534
+
535
+ if (filesToAnalyze.length > 0) {
536
+ llmOutput = await analyzewithLLM(filesToAnalyze, analysisPromptText, onProgress);
537
+ // Collect LLM-generated insights (phase 1)
538
+ llmInsights.push(...llmOutput.insights);
539
+ }
540
+ } catch (error) {
541
+ console.warn('[analyzer] Claude Agent SDK initialization failed, using regex fallback');
542
+ }
543
+ }
544
+
545
+ // Process each candidate
546
+ for (const candidate of scanResult.candidates) {
547
+ const content = fileContents.get(candidate.file);
548
+ if (!content) continue;
549
+
550
+ // Check if we have LLM results for this file/line
551
+ const llmCallsites = llmOutput?.callsitesByFile.get(candidate.file);
552
+ const llmMatch = llmCallsites?.find(c => c.line === candidate.line);
553
+
554
+ if (llmMatch) {
555
+ // Use LLM results
556
+ const typedProvider: Provider | null = llmMatch.provider as Provider | null;
557
+
558
+ callsites.push({
559
+ id: generateCallsiteId(candidate.file, candidate.line),
560
+ file: candidate.file,
561
+ line: candidate.line,
562
+ provider: typedProvider,
563
+ model: llmMatch.model,
564
+ framework: llmMatch.framework,
565
+ runtime: null,
566
+ patterns: llmMatch.patterns,
567
+ confidence: llmMatch.confidence,
568
+ });
569
+ } else {
570
+ // Fallback to regex analysis
571
+ const context = extractContext(content, candidate.line);
572
+ const provider = detectProviderRegex(context, content);
573
+ const model = detectModelRegex(context);
574
+ const framework = detectFrameworkRegex(context, content);
575
+ const patterns = detectPatternsRegex(context);
576
+
577
+ const patternCount = Object.values(patterns).filter(Boolean).length;
578
+ const confidence = calculateConfidence(!!provider, !!model, patternCount);
579
+
580
+ const typedProvider: Provider | null = provider as Provider | null ?? null;
581
+
582
+ callsites.push({
583
+ id: generateCallsiteId(candidate.file, candidate.line),
584
+ file: candidate.file,
585
+ line: candidate.line,
586
+ provider: typedProvider,
587
+ model: model ?? null,
588
+ framework: framework,
589
+ runtime: null,
590
+ patterns,
591
+ confidence,
592
+ });
593
+ }
594
+ }
595
+
596
+ // Sort by confidence descending
597
+ callsites.sort((a, b) => b.confidence - a.confidence);
598
+
599
+ return { callsites, insights: llmInsights };
600
+ }
601
+
602
+ /**
603
+ * Re-analyze a single file (for incremental updates)
604
+ */
605
+ export async function analyzeFile(
606
+ filePath: string,
607
+ content: string,
608
+ lines: number[],
609
+ options: AnalyzeOptions = {}
610
+ ): Promise<AnalyzeResult> {
611
+ const { useLLM = true, promptId } = options;
612
+ const callsites: Callsite[] = [];
613
+ const llmInsights: LLMInsight[] = [];
614
+
615
+ // Load analysis prompt (from YAML config or fallback)
616
+ let analysisPromptText = getStaticAnalysisPrompt();
617
+ if (promptId) {
618
+ const customPrompt = loadPrompt(promptId);
619
+ if (customPrompt) {
620
+ analysisPromptText = customPrompt.prompt;
621
+ }
622
+ } else {
623
+ try {
624
+ const defaultPrompt = getDefaultPrompt();
625
+ analysisPromptText = defaultPrompt.prompt;
626
+ } catch {
627
+ // Use hardcoded fallback
628
+ }
629
+ }
630
+
631
+ // Try LLM analysis (Claude Agent SDK uses env var)
632
+ let llmCallsites: LLMCallsite[] = [];
633
+
634
+ if (useLLM && process.env.ANTHROPIC_API_KEY) {
635
+ try {
636
+ const output = await analyzewithLLM(
637
+ [{ path: filePath, content, candidateLines: lines }],
638
+ analysisPromptText
639
+ );
640
+ llmCallsites = output.callsitesByFile.get(filePath) || [];
641
+ llmInsights.push(...output.insights);
642
+ } catch {
643
+ // Fall through to regex
644
+ }
645
+ }
646
+
647
+ for (const line of lines) {
648
+ const llmMatch = llmCallsites.find(c => c.line === line);
649
+
650
+ if (llmMatch) {
651
+ const typedProvider: Provider | null = llmMatch.provider as Provider | null;
652
+
653
+ callsites.push({
654
+ id: generateCallsiteId(filePath, line),
655
+ file: filePath,
656
+ line,
657
+ provider: typedProvider,
658
+ model: llmMatch.model,
659
+ framework: llmMatch.framework,
660
+ runtime: null,
661
+ patterns: llmMatch.patterns,
662
+ confidence: llmMatch.confidence,
663
+ });
664
+ } else {
665
+ // Regex fallback
666
+ const context = extractContext(content, line);
667
+ const provider = detectProviderRegex(context, content);
668
+ const model = detectModelRegex(context);
669
+ const framework = detectFrameworkRegex(context, content);
670
+ const patterns = detectPatternsRegex(context);
671
+
672
+ const patternCount = Object.values(patterns).filter(Boolean).length;
673
+ const confidence = calculateConfidence(!!provider, !!model, patternCount);
674
+
675
+ const typedProvider: Provider | null = provider as Provider | null ?? null;
676
+
677
+ callsites.push({
678
+ id: generateCallsiteId(filePath, line),
679
+ file: filePath,
680
+ line,
681
+ provider: typedProvider,
682
+ model: model ?? null,
683
+ framework: framework,
684
+ runtime: null,
685
+ patterns,
686
+ confidence,
687
+ });
688
+ }
689
+ }
690
+
691
+ return { callsites, insights: llmInsights };
692
+ }