npm - @peakinfer/cli - Versions diffs - 1.0.133 - Mend

@peakinfer/cli 1.0.133

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (367) hide show

package/.claude/settings.local.json +8 -0
package/.env.example +6 -0
package/.github/workflows/peakinfer.yml +64 -0
package/CHANGELOG.md +31 -0
package/LICENSE +190 -0
package/README.md +335 -0
package/data/inferencemax.json +274 -0
package/dist/agent-analyzer.d.ts +45 -0
package/dist/agent-analyzer.d.ts.map +1 -0
package/dist/agent-analyzer.js +374 -0
package/dist/agent-analyzer.js.map +1 -0
package/dist/agent.d.ts +76 -0
package/dist/agent.d.ts.map +1 -0
package/dist/agent.js +965 -0
package/dist/agent.js.map +1 -0
package/dist/agents/correlation-analyzer.d.ts +34 -0
package/dist/agents/correlation-analyzer.d.ts.map +1 -0
package/dist/agents/correlation-analyzer.js +261 -0
package/dist/agents/correlation-analyzer.js.map +1 -0
package/dist/agents/index.d.ts +91 -0
package/dist/agents/index.d.ts.map +1 -0
package/dist/agents/index.js +111 -0
package/dist/agents/index.js.map +1 -0
package/dist/agents/runtime-analyzer.d.ts +38 -0
package/dist/agents/runtime-analyzer.d.ts.map +1 -0
package/dist/agents/runtime-analyzer.js +244 -0
package/dist/agents/runtime-analyzer.js.map +1 -0
package/dist/analysis-types.d.ts +500 -0
package/dist/analysis-types.d.ts.map +1 -0
package/dist/analysis-types.js +11 -0
package/dist/analysis-types.js.map +1 -0
package/dist/analytics.d.ts +25 -0
package/dist/analytics.d.ts.map +1 -0
package/dist/analytics.js +94 -0
package/dist/analytics.js.map +1 -0
package/dist/analyzer.d.ts +48 -0
package/dist/analyzer.d.ts.map +1 -0
package/dist/analyzer.js +547 -0
package/dist/analyzer.js.map +1 -0
package/dist/artifacts.d.ts +44 -0
package/dist/artifacts.d.ts.map +1 -0
package/dist/artifacts.js +165 -0
package/dist/artifacts.js.map +1 -0
package/dist/benchmarks/index.d.ts +88 -0
package/dist/benchmarks/index.d.ts.map +1 -0
package/dist/benchmarks/index.js +205 -0
package/dist/benchmarks/index.js.map +1 -0
package/dist/cli.d.ts +3 -0
package/dist/cli.d.ts.map +1 -0
package/dist/cli.js +427 -0
package/dist/cli.js.map +1 -0
package/dist/commands/ci.d.ts +19 -0
package/dist/commands/ci.d.ts.map +1 -0
package/dist/commands/ci.js +253 -0
package/dist/commands/ci.js.map +1 -0
package/dist/commands/config.d.ts +16 -0
package/dist/commands/config.d.ts.map +1 -0
package/dist/commands/config.js +249 -0
package/dist/commands/config.js.map +1 -0
package/dist/commands/demo.d.ts +15 -0
package/dist/commands/demo.d.ts.map +1 -0
package/dist/commands/demo.js +106 -0
package/dist/commands/demo.js.map +1 -0
package/dist/commands/export.d.ts +14 -0
package/dist/commands/export.d.ts.map +1 -0
package/dist/commands/export.js +209 -0
package/dist/commands/export.js.map +1 -0
package/dist/commands/history.d.ts +15 -0
package/dist/commands/history.d.ts.map +1 -0
package/dist/commands/history.js +389 -0
package/dist/commands/history.js.map +1 -0
package/dist/commands/template.d.ts +14 -0
package/dist/commands/template.d.ts.map +1 -0
package/dist/commands/template.js +341 -0
package/dist/commands/template.js.map +1 -0
package/dist/commands/validate-map.d.ts +12 -0
package/dist/commands/validate-map.d.ts.map +1 -0
package/dist/commands/validate-map.js +274 -0
package/dist/commands/validate-map.js.map +1 -0
package/dist/commands/whatif.d.ts +17 -0
package/dist/commands/whatif.d.ts.map +1 -0
package/dist/commands/whatif.js +206 -0
package/dist/commands/whatif.js.map +1 -0
package/dist/comparison.d.ts +38 -0
package/dist/comparison.d.ts.map +1 -0
package/dist/comparison.js +223 -0
package/dist/comparison.js.map +1 -0
package/dist/config.d.ts +42 -0
package/dist/config.d.ts.map +1 -0
package/dist/config.js +158 -0
package/dist/config.js.map +1 -0
package/dist/connectors/helicone.d.ts +9 -0
package/dist/connectors/helicone.d.ts.map +1 -0
package/dist/connectors/helicone.js +106 -0
package/dist/connectors/helicone.js.map +1 -0
package/dist/connectors/index.d.ts +37 -0
package/dist/connectors/index.d.ts.map +1 -0
package/dist/connectors/index.js +65 -0
package/dist/connectors/index.js.map +1 -0
package/dist/connectors/langsmith.d.ts +9 -0
package/dist/connectors/langsmith.d.ts.map +1 -0
package/dist/connectors/langsmith.js +122 -0
package/dist/connectors/langsmith.js.map +1 -0
package/dist/connectors/types.d.ts +83 -0
package/dist/connectors/types.d.ts.map +1 -0
package/dist/connectors/types.js +98 -0
package/dist/connectors/types.js.map +1 -0
package/dist/cost-estimator.d.ts +46 -0
package/dist/cost-estimator.d.ts.map +1 -0
package/dist/cost-estimator.js +104 -0
package/dist/cost-estimator.js.map +1 -0
package/dist/costs.d.ts +57 -0
package/dist/costs.d.ts.map +1 -0
package/dist/costs.js +251 -0
package/dist/costs.js.map +1 -0
package/dist/counterfactuals.d.ts +29 -0
package/dist/counterfactuals.d.ts.map +1 -0
package/dist/counterfactuals.js +448 -0
package/dist/counterfactuals.js.map +1 -0
package/dist/enhancement-prompts.d.ts +41 -0
package/dist/enhancement-prompts.d.ts.map +1 -0
package/dist/enhancement-prompts.js +88 -0
package/dist/enhancement-prompts.js.map +1 -0
package/dist/envelopes.d.ts +20 -0
package/dist/envelopes.d.ts.map +1 -0
package/dist/envelopes.js +790 -0
package/dist/envelopes.js.map +1 -0
package/dist/format-normalizer.d.ts +71 -0
package/dist/format-normalizer.d.ts.map +1 -0
package/dist/format-normalizer.js +1331 -0
package/dist/format-normalizer.js.map +1 -0
package/dist/history.d.ts +79 -0
package/dist/history.d.ts.map +1 -0
package/dist/history.js +313 -0
package/dist/history.js.map +1 -0
package/dist/html.d.ts +11 -0
package/dist/html.d.ts.map +1 -0
package/dist/html.js +463 -0
package/dist/html.js.map +1 -0
package/dist/impact.d.ts +42 -0
package/dist/impact.d.ts.map +1 -0
package/dist/impact.js +443 -0
package/dist/impact.js.map +1 -0
package/dist/index.d.ts +26 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +34 -0
package/dist/index.js.map +1 -0
package/dist/insights.d.ts +5 -0
package/dist/insights.d.ts.map +1 -0
package/dist/insights.js +271 -0
package/dist/insights.js.map +1 -0
package/dist/joiner.d.ts +9 -0
package/dist/joiner.d.ts.map +1 -0
package/dist/joiner.js +247 -0
package/dist/joiner.js.map +1 -0
package/dist/orchestrator.d.ts +34 -0
package/dist/orchestrator.d.ts.map +1 -0
package/dist/orchestrator.js +827 -0
package/dist/orchestrator.js.map +1 -0
package/dist/pdf.d.ts +26 -0
package/dist/pdf.d.ts.map +1 -0
package/dist/pdf.js +84 -0
package/dist/pdf.js.map +1 -0
package/dist/prediction.d.ts +33 -0
package/dist/prediction.d.ts.map +1 -0
package/dist/prediction.js +316 -0
package/dist/prediction.js.map +1 -0
package/dist/prompts/loader.d.ts +38 -0
package/dist/prompts/loader.d.ts.map +1 -0
package/dist/prompts/loader.js +60 -0
package/dist/prompts/loader.js.map +1 -0
package/dist/renderer.d.ts +64 -0
package/dist/renderer.d.ts.map +1 -0
package/dist/renderer.js +923 -0
package/dist/renderer.js.map +1 -0
package/dist/runid.d.ts +57 -0
package/dist/runid.d.ts.map +1 -0
package/dist/runid.js +199 -0
package/dist/runid.js.map +1 -0
package/dist/runtime.d.ts +29 -0
package/dist/runtime.d.ts.map +1 -0
package/dist/runtime.js +366 -0
package/dist/runtime.js.map +1 -0
package/dist/scanner.d.ts +11 -0
package/dist/scanner.d.ts.map +1 -0
package/dist/scanner.js +426 -0
package/dist/scanner.js.map +1 -0
package/dist/templates.d.ts +120 -0
package/dist/templates.d.ts.map +1 -0
package/dist/templates.js +429 -0
package/dist/templates.js.map +1 -0
package/dist/tools/index.d.ts +153 -0
package/dist/tools/index.d.ts.map +1 -0
package/dist/tools/index.js +177 -0
package/dist/tools/index.js.map +1 -0
package/dist/types.d.ts +3647 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +703 -0
package/dist/types.js.map +1 -0
package/dist/version.d.ts +7 -0
package/dist/version.d.ts.map +1 -0
package/dist/version.js +23 -0
package/dist/version.js.map +1 -0
package/docs/demo-guide.md +423 -0
package/docs/events-format.md +295 -0
package/docs/inferencemap-spec.md +344 -0
package/docs/migration-v2.md +293 -0
package/fixtures/demo/precomputed.json +142 -0
package/fixtures/demo-project/README.md +52 -0
package/fixtures/demo-project/ai-service.ts +65 -0
package/fixtures/demo-project/sample-events.jsonl +15 -0
package/fixtures/demo-project/src/ai-service.ts +128 -0
package/fixtures/demo-project/src/llm-client.ts +155 -0
package/package.json +65 -0
package/prompts/agent-analyzer.yaml +47 -0
package/prompts/ci-gate.yaml +98 -0
package/prompts/correlation-analyzer.yaml +178 -0
package/prompts/format-normalizer.yaml +46 -0
package/prompts/peak-performance.yaml +180 -0
package/prompts/pr-comment.yaml +111 -0
package/prompts/runtime-analyzer.yaml +189 -0
package/prompts/unified-analyzer.yaml +241 -0
package/schemas/inference-map.v0.1.json +215 -0
package/scripts/benchmark.ts +394 -0
package/scripts/demo-v1.5.sh +158 -0
package/scripts/sync-from-site.sh +197 -0
package/scripts/validate-sync.sh +178 -0
package/src/agent-analyzer.ts +481 -0
package/src/agent.ts +1232 -0
package/src/agents/correlation-analyzer.ts +353 -0
package/src/agents/index.ts +235 -0
package/src/agents/runtime-analyzer.ts +343 -0
package/src/analysis-types.ts +558 -0
package/src/analytics.ts +100 -0
package/src/analyzer.ts +692 -0
package/src/artifacts.ts +218 -0
package/src/benchmarks/index.ts +309 -0
package/src/cli.ts +503 -0
package/src/commands/ci.ts +336 -0
package/src/commands/config.ts +288 -0
package/src/commands/demo.ts +175 -0
package/src/commands/export.ts +297 -0
package/src/commands/history.ts +425 -0
package/src/commands/template.ts +385 -0
package/src/commands/validate-map.ts +324 -0
package/src/commands/whatif.ts +272 -0
package/src/comparison.ts +283 -0
package/src/config.ts +188 -0
package/src/connectors/helicone.ts +164 -0
package/src/connectors/index.ts +93 -0
package/src/connectors/langsmith.ts +179 -0
package/src/connectors/types.ts +180 -0
package/src/cost-estimator.ts +146 -0
package/src/costs.ts +347 -0
package/src/counterfactuals.ts +516 -0
package/src/enhancement-prompts.ts +118 -0
package/src/envelopes.ts +814 -0
package/src/format-normalizer.ts +1486 -0
package/src/history.ts +400 -0
package/src/html.ts +512 -0
package/src/impact.ts +522 -0
package/src/index.ts +83 -0
package/src/insights.ts +341 -0
package/src/joiner.ts +289 -0
package/src/orchestrator.ts +1015 -0
package/src/pdf.ts +110 -0
package/src/prediction.ts +392 -0
package/src/prompts/loader.ts +88 -0
package/src/renderer.ts +1045 -0
package/src/runid.ts +261 -0
package/src/runtime.ts +450 -0
package/src/scanner.ts +508 -0
package/src/templates.ts +561 -0
package/src/tools/index.ts +214 -0
package/src/types.ts +873 -0
package/src/version.ts +24 -0
package/templates/context-accumulation.yaml +23 -0
package/templates/cost-concentration.yaml +20 -0
package/templates/dead-code.yaml +20 -0
package/templates/latency-explainer.yaml +23 -0
package/templates/optimizations/ab-testing-framework.yaml +74 -0
package/templates/optimizations/api-gateway-optimization.yaml +81 -0
package/templates/optimizations/api-model-routing-strategy.yaml +126 -0
package/templates/optimizations/auto-scaling-optimization.yaml +85 -0
package/templates/optimizations/batch-utilization-diagnostic.yaml +142 -0
package/templates/optimizations/comprehensive-apm.yaml +76 -0
package/templates/optimizations/context-window-optimization.yaml +91 -0
package/templates/optimizations/cost-sensitive-batch-processing.yaml +77 -0
package/templates/optimizations/distributed-training-optimization.yaml +77 -0
package/templates/optimizations/document-analysis-edge.yaml +77 -0
package/templates/optimizations/document-pipeline-optimization.yaml +78 -0
package/templates/optimizations/domain-specific-distillation.yaml +78 -0
package/templates/optimizations/error-handling-optimization.yaml +76 -0
package/templates/optimizations/gptq-4bit-quantization.yaml +96 -0
package/templates/optimizations/long-context-memory-management.yaml +78 -0
package/templates/optimizations/max-tokens-optimization.yaml +76 -0
package/templates/optimizations/memory-bandwidth-optimization.yaml +73 -0
package/templates/optimizations/multi-framework-resilience.yaml +75 -0
package/templates/optimizations/multi-tenant-optimization.yaml +75 -0
package/templates/optimizations/prompt-caching-optimization.yaml +143 -0
package/templates/optimizations/pytorch-to-onnx-migration.yaml +109 -0
package/templates/optimizations/quality-monitoring.yaml +74 -0
package/templates/optimizations/realtime-budget-controls.yaml +74 -0
package/templates/optimizations/realtime-latency-optimization.yaml +74 -0
package/templates/optimizations/sglang-concurrency-optimization.yaml +78 -0
package/templates/optimizations/smart-model-routing.yaml +96 -0
package/templates/optimizations/streaming-batch-selection.yaml +167 -0
package/templates/optimizations/system-prompt-optimization.yaml +75 -0
package/templates/optimizations/tensorrt-llm-performance.yaml +77 -0
package/templates/optimizations/vllm-high-throughput-optimization.yaml +93 -0
package/templates/optimizations/vllm-migration-memory-bound.yaml +78 -0
package/templates/overpowered-extraction.yaml +32 -0
package/templates/overpowered-model.yaml +31 -0
package/templates/prompt-bloat.yaml +24 -0
package/templates/retry-explosion.yaml +28 -0
package/templates/schema/insight.schema.json +113 -0
package/templates/schema/optimization.schema.json +180 -0
package/templates/streaming-drift.yaml +30 -0
package/templates/throughput-gap.yaml +21 -0
package/templates/token-underutilization.yaml +28 -0
package/templates/untested-fallback.yaml +21 -0
package/tests/accuracy/drift-detection.test.ts +184 -0
package/tests/accuracy/false-positives.test.ts +166 -0
package/tests/accuracy/templates.test.ts +205 -0
package/tests/action/commands.test.ts +125 -0
package/tests/action/comments.test.ts +347 -0
package/tests/cli.test.ts +203 -0
package/tests/comparison.test.ts +309 -0
package/tests/correlation-analyzer.test.ts +534 -0
package/tests/counterfactuals.test.ts +347 -0
package/tests/fixtures/events/missing-id.jsonl +1 -0
package/tests/fixtures/events/missing-input.jsonl +1 -0
package/tests/fixtures/events/missing-latency.jsonl +1 -0
package/tests/fixtures/events/missing-model.jsonl +1 -0
package/tests/fixtures/events/missing-output.jsonl +1 -0
package/tests/fixtures/events/missing-provider.jsonl +1 -0
package/tests/fixtures/events/missing-ts.jsonl +1 -0
package/tests/fixtures/events/valid.csv +3 -0
package/tests/fixtures/events/valid.json +1 -0
package/tests/fixtures/events/valid.jsonl +2 -0
package/tests/fixtures/events/with-callsite.jsonl +1 -0
package/tests/fixtures/events/with-intent.jsonl +1 -0
package/tests/fixtures/events/wrong-type.jsonl +1 -0
package/tests/fixtures/repos/empty/.gitkeep +0 -0
package/tests/fixtures/repos/hybrid-router/router.py +35 -0
package/tests/fixtures/repos/saas-anthropic/agent.ts +27 -0
package/tests/fixtures/repos/saas-openai/assistant.js +33 -0
package/tests/fixtures/repos/saas-openai/client.py +26 -0
package/tests/fixtures/repos/self-hosted-vllm/inference.py +22 -0
package/tests/github-action.test.ts +292 -0
package/tests/insights.test.ts +878 -0
package/tests/joiner.test.ts +168 -0
package/tests/performance/action-latency.test.ts +132 -0
package/tests/performance/benchmark.test.ts +189 -0
package/tests/performance/cli-latency.test.ts +102 -0
package/tests/pr-comment.test.ts +313 -0
package/tests/prediction.test.ts +296 -0
package/tests/runtime-analyzer.test.ts +375 -0
package/tests/runtime.test.ts +205 -0
package/tests/scanner.test.ts +122 -0
package/tests/template-conformance.test.ts +526 -0
package/tests/unit/cost-calculator.test.ts +303 -0
package/tests/unit/credits.test.ts +180 -0
package/tests/unit/inference-map.test.ts +276 -0
package/tests/unit/schema.test.ts +300 -0
package/tsconfig.json +20 -0
package/vitest.config.ts +14 -0

package/tests/pr-comment.test.ts ADDED Viewed

@@ -0,0 +1,313 @@
+/**
+ * PR Comment Tests
+ * Per Test Cases v1.9.3 - PR/CI Integration Tests
+ */
+import { describe, test, expect } from 'vitest';
+// Types for PR comment generation
+interface InferencePoint { // Test-local shape describing one inference point in an analysis result.
+  id: string; // identifier; fixtures in this file use values like 'ip-1'
+  file: string; // file path; fixtures use e.g. 'src/chat.ts'
+  line: number; // line number paired with `file`
+  provider: string; // provider name; fixtures use 'anthropic' and 'openai'
+  model: string; // model name; fixtures use e.g. 'gpt-4'
+}
+interface Issue { // Test-local shape describing one reported issue.
+  id: string; // identifier; fixtures in this file use values like 'issue-1'
+  severity: 'critical' | 'high' | 'medium' | 'low'; // generatePRComment only lists 'critical' and 'high' entries
+  category: string; // fixtures use 'cost'; not read by the helpers in this file
+  title: string; // printed after the upper-cased severity in the full comment
+  description: string; // printed as a bullet under the issue
+  file: string; // printed together with `line` as `file:line`
+  line: number; // line number paired with `file`
+}
+interface AnalysisResult { // Input consumed by generatePRComment, generateCompactComment and shouldBlockPR.
+  inferencePoints: InferencePoint[]; // not read by the helpers in this file; only summary.totalInferencePoints is printed
+  issues: Issue[]; // source of the per-issue lines in the full PR comment
+  summary: { // counters read directly by the helpers; they are not recomputed from `issues`
+    totalInferencePoints: number; // printed in both comment formats
+    criticalIssues: number; // consulted by every blocking threshold
+    highIssues: number; // consulted by the 'high' and 'medium' thresholds
+    mediumIssues: number; // only consulted by shouldBlockPR when the threshold is 'medium'
+    lowIssues: number; // not read by any helper in this file
+  };
+}
+// PR Comment generator (to be implemented in src/pr-comment.ts)
+/**
+ * Render an analysis result as a Markdown pull-request comment.
+ *
+ * Layout: a `## PeakInfer Analysis` header, the inference-point count from
+ * `result.summary`, up to five critical/high issues (critical first), a
+ * "No issues found" line when `result.issues` is empty, and a branded footer.
+ *
+ * The issue section is gated on the summary counters (`criticalIssues` /
+ * `highIssues`); the listed entries come from `result.issues`. The
+ * `### Issues Found` heading is only written when at least one entry is
+ * actually listed, so inconsistent input never yields an empty section.
+ *
+ * @param result - Analysis result to render.
+ * @returns The comment body, lines joined with `\n`.
+ */
+function generatePRComment(result: AnalysisResult): string {
+  const lines: string[] = [];
+  // Header
+  lines.push('## PeakInfer Analysis');
+  lines.push('');
+  // Summary
+  lines.push(`Found **${result.summary.totalInferencePoints}** inference points`);
+  lines.push('');
+  // Issues by severity
+  if (result.summary.criticalIssues > 0 || result.summary.highIssues > 0) {
+    const critical = result.issues.filter(i => i.severity === 'critical');
+    const high = result.issues.filter(i => i.severity === 'high');
+    // Critical entries come first; the comment is capped at five entries.
+    const shown = [...critical, ...high].slice(0, 5);
+    if (shown.length > 0) {
+      lines.push('### Issues Found');
+      lines.push('');
+    }
+    for (const issue of shown) {
+      const emoji = issue.severity === 'critical' ? ':red_circle:' : ':orange_circle:';
+      lines.push(`${emoji} **${issue.severity.toUpperCase()}**: ${issue.title}`);
+      lines.push(`   - ${issue.file}:${issue.line}`);
+      lines.push(`   - ${issue.description}`);
+      lines.push('');
+    }
+  }
+  // No issues case
+  if (result.issues.length === 0) {
+    lines.push(':white_check_mark: No issues found');
+    // A blank line is required here: a text line directly followed by `---`
+    // is parsed as a setext heading, which would render this line as an H2.
+    lines.push('');
+  }
+  // Footer
+  lines.push('---');
+  lines.push('*Generated by [PeakInfer](https://peakinfer.dev)*');
+  return lines.join('\n');
+}
+/**
+ * Build the single-line status variant of the PR comment.
+ *
+ * Uses only the summary counters: a check-mark line when the combined
+ * critical + high count is zero, otherwise a warning line with that count.
+ *
+ * @param result - Analysis result whose summary is reported.
+ * @returns A one-line status string.
+ */
+function generateCompactComment(result: AnalysisResult): string {
+  const { totalInferencePoints, criticalIssues, highIssues } = result.summary;
+  const blocking = criticalIssues + highIssues;
+  if (blocking !== 0) {
+    return `:warning: PeakInfer: ${totalInferencePoints} inference points, ${blocking} critical/high issues`;
+  }
+  return `:white_check_mark: PeakInfer: ${totalInferencePoints} inference points, no critical issues`;
+}
+/**
+ * Decide whether a PR should be blocked for the given severity threshold.
+ *
+ * Only the summary counters are inspected. A threshold blocks on its own
+ * severity and every more severe one; any value other than 'critical' or
+ * 'high' is handled like 'medium'.
+ *
+ * @param result - Analysis result whose summary counters are checked.
+ * @param threshold - Least severe level that should block the PR.
+ * @returns `true` when a counter at or above the threshold is positive.
+ */
+function shouldBlockPR(result: AnalysisResult, threshold: 'critical' | 'high' | 'medium'): boolean {
+  const { criticalIssues, highIssues, mediumIssues } = result.summary;
+  switch (threshold) {
+    case 'critical':
+      return criticalIssues > 0;
+    case 'high':
+      return criticalIssues > 0 || highIssues > 0;
+    default:
+      return criticalIssues > 0 || highIssues > 0 || mediumIssues > 0;
+  }
+}
+describe('PR Comment Generation', () => { // Covers the full Markdown comment produced by generatePRComment.
+  test('Generates markdown comment with issues', () => { // one critical issue: header, count, severity label, title and location must all appear
+    const result: AnalysisResult = {
+      inferencePoints: [
+        { id: 'ip-1', file: 'src/chat.ts', line: 42, provider: 'anthropic', model: 'claude-sonnet-4-20250514' },
+      ],
+      issues: [
+        {
+          id: 'issue-1',
+          severity: 'critical',
+          category: 'cost',
+          title: 'Expensive model for simple task',
+          description: 'Using claude-opus for chat completion',
+          file: 'src/chat.ts',
+          line: 42,
+        },
+      ],
+      summary: {
+        totalInferencePoints: 1,
+        criticalIssues: 1,
+        highIssues: 0,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    const comment = generatePRComment(result);
+    expect(comment).toContain('## PeakInfer Analysis');
+    expect(comment).toContain('1 inference points'); // the generator does not singularize "points"
+    expect(comment).toContain('CRITICAL');
+    expect(comment).toContain('Expensive model');
+    expect(comment).toContain('src/chat.ts:42');
+  });
+  test('Generates clean comment when no issues', () => { // empty issue list: success line present, no severity labels
+    const result: AnalysisResult = {
+      inferencePoints: [
+        { id: 'ip-1', file: 'src/chat.ts', line: 42, provider: 'anthropic', model: 'claude-sonnet-4-20250514' },
+      ],
+      issues: [],
+      summary: {
+        totalInferencePoints: 1,
+        criticalIssues: 0,
+        highIssues: 0,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    const comment = generatePRComment(result);
+    expect(comment).toContain('No issues found');
+    expect(comment).not.toContain('CRITICAL');
+  });
+  test('Limits issues to top 5', () => { // ten high issues in, at most five listed
+    const issues: Issue[] = Array.from({ length: 10 }, (_, i) => ({
+      id: `issue-${i}`,
+      severity: 'high' as const,
+      category: 'cost',
+      title: `Issue ${i}`,
+      description: 'Test issue',
+      file: 'src/chat.ts',
+      line: i + 1,
+    }));
+    const result: AnalysisResult = {
+      inferencePoints: [],
+      issues,
+      summary: {
+        totalInferencePoints: 0,
+        criticalIssues: 0,
+        highIssues: 10,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    const comment = generatePRComment(result);
+    // Should only show 5 issues max
+    const highCount = (comment.match(/HIGH/g) || []).length; // each listed issue contributes exactly one upper-cased "HIGH"
+    expect(highCount).toBeLessThanOrEqual(5); // NOTE(review): upper bound only — this would also pass if no issues were listed; toBe(5) would be stricter
+  });
+  test('Includes PeakInfer branding', () => { // footer link is present even for an empty result
+    const result: AnalysisResult = {
+      inferencePoints: [],
+      issues: [],
+      summary: {
+        totalInferencePoints: 0,
+        criticalIssues: 0,
+        highIssues: 0,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    const comment = generatePRComment(result);
+    expect(comment).toContain('PeakInfer');
+    expect(comment).toContain('peakinfer.dev');
+  });
+});
+describe('Compact Comment', () => { // Covers the one-line status produced by generateCompactComment.
+  test('Shows success for no critical issues', () => { // zero critical + high counters yields the check-mark variant
+    const result: AnalysisResult = {
+      inferencePoints: [{ id: 'ip-1', file: 'test.ts', line: 1, provider: 'openai', model: 'gpt-4' }],
+      issues: [],
+      summary: {
+        totalInferencePoints: 1,
+        criticalIssues: 0,
+        highIssues: 0,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    const comment = generateCompactComment(result);
+    expect(comment).toContain(':white_check_mark:');
+    expect(comment).toContain('no critical issues');
+  });
+  test('Shows warning for critical/high issues', () => { // a non-zero combined count yields the warning variant with that count
+    const result: AnalysisResult = {
+      inferencePoints: [],
+      issues: [
+        { id: 'i-1', severity: 'critical', category: 'cost', title: 'Test', description: 'Test', file: 'test.ts', line: 1 },
+      ],
+      summary: {
+        totalInferencePoints: 1,
+        criticalIssues: 1,
+        highIssues: 0,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    const comment = generateCompactComment(result);
+    expect(comment).toContain(':warning:');
+    expect(comment).toContain('1 critical/high issues');
+  });
+});
+describe('PR Blocking Logic', () => { // Covers shouldBlockPR; fixtures set only summary counters and leave `issues` empty.
+  test('Blocks on critical when threshold is critical', () => {
+    const result: AnalysisResult = {
+      inferencePoints: [],
+      issues: [],
+      summary: {
+        totalInferencePoints: 0,
+        criticalIssues: 1,
+        highIssues: 0,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    expect(shouldBlockPR(result, 'critical')).toBe(true);
+  });
+  test('Does not block on high when threshold is critical', () => { // high issues alone are below the 'critical' threshold
+    const result: AnalysisResult = {
+      inferencePoints: [],
+      issues: [],
+      summary: {
+        totalInferencePoints: 0,
+        criticalIssues: 0,
+        highIssues: 5,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    expect(shouldBlockPR(result, 'critical')).toBe(false);
+  });
+  test('Blocks on high when threshold is high', () => {
+    const result: AnalysisResult = {
+      inferencePoints: [],
+      issues: [],
+      summary: {
+        totalInferencePoints: 0,
+        criticalIssues: 0,
+        highIssues: 1,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    expect(shouldBlockPR(result, 'high')).toBe(true);
+  });
+  test('Does not block when no issues', () => { // all counters zero: no threshold blocks
+    const result: AnalysisResult = {
+      inferencePoints: [],
+      issues: [],
+      summary: {
+        totalInferencePoints: 5,
+        criticalIssues: 0,
+        highIssues: 0,
+        mediumIssues: 0,
+        lowIssues: 0,
+      },
+    };
+    expect(shouldBlockPR(result, 'critical')).toBe(false);
+    expect(shouldBlockPR(result, 'high')).toBe(false);
+    expect(shouldBlockPR(result, 'medium')).toBe(false); // NOTE(review): no test exercises a positive 'medium' block
+  });
+});

package/tests/prediction.test.ts ADDED Viewed

@@ -0,0 +1,296 @@
+import { describe, it, expect } from 'vitest';
+import {
+  generatePredictions,
+  formatPredictionSummary,
+  hasHighRiskPredictions,
+} from '../src/prediction.js';
+import type { Callsite, InferenceMap } from '../src/types.js';
+// =============================================================================
+// TEST FIXTURES
+// =============================================================================
+/**
+ * Build a Callsite fixture with default field values.
+ *
+ * The id combines the current timestamp with a short random base-36
+ * suffix, so it differs between calls. Any field supplied in `overrides`
+ * replaces the corresponding default, including `id`.
+ *
+ * @param overrides - Fields to replace in the default callsite.
+ * @returns The merged callsite object.
+ */
+function createCallsite(overrides: Partial<Callsite> = {}): Callsite {
+  const stamp = Date.now();
+  const suffix = Math.random().toString(36).slice(2, 6);
+  const defaults: Callsite = {
+    id: `cs_${stamp}_${suffix}`,
+    file: 'src/agent.ts',
+    line: 42,
+    col: 10,
+    provider: 'openai',
+    model: 'gpt-4o',
+    framework: null,
+    runtime: null,
+    patterns: {},
+    confidence: 0.9,
+  };
+  // Spread order matters: overrides win over defaults.
+  return { ...defaults, ...overrides };
+}
+/**
+ * Wrap callsites in an InferenceMap fixture.
+ *
+ * The map uses version '0.1', no frameworks, and a scan result rooted at
+ * '/test' with no files and an all-zero summary. The `callsites` array is
+ * stored as passed, not copied.
+ *
+ * @param callsites - Callsites to place in the map.
+ * @returns The inference map fixture.
+ */
+function createInferenceMap(callsites: Callsite[]): InferenceMap {
+  const scanResult: InferenceMap['scanResult'] = {
+    root: '/test',
+    files: [],
+    summary: { totalFiles: 0, totalLoc: 0, languages: [], totalCandidates: 0 },
+  };
+  return { version: '0.1', callsites, frameworks: {}, scanResult };
+}
+// =============================================================================
+// TESTS
+// =============================================================================
+describe('prediction', () => { // Suite for the helpers imported from ../src/prediction.js, driven by the fixture builders in this file.
+  describe('generatePredictions', () => { // shape of the result: `predictions` array plus a `summary` object
+    it('should generate predictions for callsites', () => { // one prediction per callsite
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'gpt-4o' }),
+        createCallsite({ file: 'src/b.ts', line: 20, model: 'gpt-4o-mini' }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      expect(result.predictions.length).toBe(2);
+      expect(result.summary.totalPoints).toBe(2);
+    });
+    it('should assign risk levels based on latency', () => {
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'claude-3-opus' }), // high latency
+        createCallsite({ file: 'src/b.ts', line: 20, model: 'gemini-1.5-flash' }), // low latency
+      ]);
+      const result = generatePredictions(inferenceMap);
+      const opusPrediction = result.predictions.find(p => p.model?.includes('opus')); // predictions are looked up by model-name substring
+      const flashPrediction = result.predictions.find(p => p.model?.includes('flash'));
+      expect(opusPrediction?.risk).toBe('high');
+      expect(flashPrediction?.risk).toBe('low');
+    });
+    it('should include prediction factors', () => { // a streaming pattern must surface as a factor with 'positive' impact
+      const inferenceMap = createInferenceMap([
+        createCallsite({
+          file: 'src/a.ts',
+          line: 10,
+          model: 'gpt-4o',
+          patterns: { streaming: true },
+        }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      expect(result.predictions[0].factors.length).toBeGreaterThan(0);
+      const streamingFactor = result.predictions[0].factors.find(f =>
+        f.name.toLowerCase().includes('streaming')
+      );
+      expect(streamingFactor).toBeDefined();
+      expect(streamingFactor?.impact).toBe('positive');
+    });
+    it('should reduce latency for patterns like batching and caching', () => { // same callsite with and without patterns; only p95 is compared
+      const baseInferenceMap = createInferenceMap([
+        createCallsite({
+          file: 'src/a.ts',
+          line: 10,
+          model: 'gpt-4o',
+          patterns: {},
+        }),
+      ]);
+      const optimizedInferenceMap = createInferenceMap([
+        createCallsite({
+          file: 'src/a.ts',
+          line: 10,
+          model: 'gpt-4o',
+          patterns: { batching: true, caching: true },
+        }),
+      ]);
+      const baseResult = generatePredictions(baseInferenceMap);
+      const optimizedResult = generatePredictions(optimizedInferenceMap);
+      expect(optimizedResult.predictions[0].predictedLatency.p95)
+        .toBeLessThan(baseResult.predictions[0].predictedLatency.p95);
+    });
+    it('should calculate correct summary statistics', () => {
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'gpt-4' }), // high
+        createCallsite({ file: 'src/b.ts', line: 20, model: 'gpt-4o' }), // medium
+        createCallsite({ file: 'src/c.ts', line: 30, model: 'gpt-4o-mini' }), // low
+      ]);
+      const result = generatePredictions(inferenceMap);
+      expect(result.summary.totalPoints).toBe(3);
+      expect(result.summary.highRiskCount).toBeGreaterThanOrEqual(0); // NOTE(review): holds for any non-negative count; does not check the high/medium/low mix annotated on the fixtures
+      expect(result.summary.averageP95).toBeGreaterThan(0);
+      expect(result.summary.worstP95).toBeGreaterThanOrEqual(result.summary.averageP95);
+    });
+    it('should check budget when targetP95 is specified', () => { // same map against a generous and a tight p95 target
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'gpt-4' }), // p95 ~5000ms
+      ]);
+      const withinBudget = generatePredictions(inferenceMap, 0, { targetP95: 10000 }); // meaning of the second argument (0) is not visible here — TODO confirm against src/prediction
+      const overBudget = generatePredictions(inferenceMap, 0, { targetP95: 1000 });
+      expect(withinBudget.summary.budgetExceeded).toBe(false);
+      expect(overBudget.summary.budgetExceeded).toBe(true);
+    });
+    it('should handle empty inference map', () => { // no callsites: empty predictions and zeroed summary values
+      const inferenceMap = createInferenceMap([]);
+      const result = generatePredictions(inferenceMap);
+      expect(result.predictions.length).toBe(0);
+      expect(result.summary.totalPoints).toBe(0);
+      expect(result.summary.averageP95).toBe(0);
+    });
+    it('should handle unknown models with medium confidence when model is set', () => {
+      const inferenceMap = createInferenceMap([
+        createCallsite({
+          file: 'src/a.ts',
+          line: 10,
+          model: 'custom-fine-tuned-model',
+        }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      expect(result.predictions.length).toBe(1);
+      // When model is set (even unknown), confidence is medium; low only when no model
+      expect(result.predictions[0].confidence).toBe('medium');
+    });
+    it('should include location in predictions', () => { // location is expected in `file:line` form
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/agent.ts', line: 42 }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      expect(result.predictions[0].location).toBe('src/agent.ts:42');
+    });
+  });
+  describe('formatPredictionSummary', () => { // checks substrings of the formatted summary text only
+    it('should format summary with risk counts', () => {
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'gpt-4' }),
+        createCallsite({ file: 'src/b.ts', line: 20, model: 'gpt-4o-mini' }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      const summary = formatPredictionSummary(result);
+      expect(summary).toContain('inference points');
+      expect(summary).toContain('p95');
+    });
+    it('should show budget status when target specified', () => { // tight target so the summary must report the overrun
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'gpt-4' }),
+      ]);
+      const result = generatePredictions(inferenceMap, 0, { targetP95: 1000 });
+      const summary = formatPredictionSummary(result);
+      expect(summary).toContain('Budget exceeded');
+    });
+  });
+  describe('hasHighRiskPredictions', () => { // boolean helper applied to a generatePredictions result
+    it('should return true when high-risk predictions exist', () => {
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'claude-3-opus' }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      expect(hasHighRiskPredictions(result)).toBe(true);
+    });
+    it('should return false when no high-risk predictions', () => {
+      const inferenceMap = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'gemini-1.5-flash' }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      expect(hasHighRiskPredictions(result)).toBe(false);
+    });
+    it('should return false for empty predictions', () => {
+      const inferenceMap = createInferenceMap([]);
+      const result = generatePredictions(inferenceMap);
+      expect(hasHighRiskPredictions(result)).toBe(false);
+    });
+  });
+  describe('model latency estimates', () => { // relative ordering of predicted p95 between models; no absolute values asserted
+    it('should estimate higher latency for Claude Opus vs Haiku', () => {
+      const opus = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'claude-3-opus' }),
+      ]);
+      const haiku = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'claude-3-haiku' }),
+      ]);
+      const opusResult = generatePredictions(opus);
+      const haikuResult = generatePredictions(haiku);
+      // Opus should have higher latency than Haiku
+      expect(opusResult.predictions[0].predictedLatency.p95)
+        .toBeGreaterThan(haikuResult.predictions[0].predictedLatency.p95);
+    });
+    it('should estimate higher latency for o1 models', () => { // o1-preview is compared against gpt-4
+      const o1 = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'o1-preview' }),
+      ]);
+      const gpt4 = createInferenceMap([
+        createCallsite({ file: 'src/a.ts', line: 10, model: 'gpt-4' }),
+      ]);
+      const o1Result = generatePredictions(o1);
+      const gpt4Result = generatePredictions(gpt4);
+      expect(o1Result.predictions[0].predictedLatency.p95)
+        .toBeGreaterThan(gpt4Result.predictions[0].predictedLatency.p95);
+    });
+  });
+  describe('self-hosted providers', () => { // provider 'vllm' must produce a "self-hosted" factor with 'positive' impact
+    it('should identify self-hosted providers as positive factor', () => {
+      const inferenceMap = createInferenceMap([
+        createCallsite({
+          file: 'src/a.ts',
+          line: 10,
+          provider: 'vllm',
+          model: 'llama-3.1-70b',
+        }),
+      ]);
+      const result = generatePredictions(inferenceMap);
+      const selfHostedFactor = result.predictions[0].factors.find(f =>
+        f.name.toLowerCase().includes('self-hosted')
+      );
+      expect(selfHostedFactor).toBeDefined();
+      expect(selfHostedFactor?.impact).toBe('positive');
+    });
+  });
+});