@peakinfer/cli 1.0.133

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (367)
  1. package/.claude/settings.local.json +8 -0
  2. package/.env.example +6 -0
  3. package/.github/workflows/peakinfer.yml +64 -0
  4. package/CHANGELOG.md +31 -0
  5. package/LICENSE +190 -0
  6. package/README.md +335 -0
  7. package/data/inferencemax.json +274 -0
  8. package/dist/agent-analyzer.d.ts +45 -0
  9. package/dist/agent-analyzer.d.ts.map +1 -0
  10. package/dist/agent-analyzer.js +374 -0
  11. package/dist/agent-analyzer.js.map +1 -0
  12. package/dist/agent.d.ts +76 -0
  13. package/dist/agent.d.ts.map +1 -0
  14. package/dist/agent.js +965 -0
  15. package/dist/agent.js.map +1 -0
  16. package/dist/agents/correlation-analyzer.d.ts +34 -0
  17. package/dist/agents/correlation-analyzer.d.ts.map +1 -0
  18. package/dist/agents/correlation-analyzer.js +261 -0
  19. package/dist/agents/correlation-analyzer.js.map +1 -0
  20. package/dist/agents/index.d.ts +91 -0
  21. package/dist/agents/index.d.ts.map +1 -0
  22. package/dist/agents/index.js +111 -0
  23. package/dist/agents/index.js.map +1 -0
  24. package/dist/agents/runtime-analyzer.d.ts +38 -0
  25. package/dist/agents/runtime-analyzer.d.ts.map +1 -0
  26. package/dist/agents/runtime-analyzer.js +244 -0
  27. package/dist/agents/runtime-analyzer.js.map +1 -0
  28. package/dist/analysis-types.d.ts +500 -0
  29. package/dist/analysis-types.d.ts.map +1 -0
  30. package/dist/analysis-types.js +11 -0
  31. package/dist/analysis-types.js.map +1 -0
  32. package/dist/analytics.d.ts +25 -0
  33. package/dist/analytics.d.ts.map +1 -0
  34. package/dist/analytics.js +94 -0
  35. package/dist/analytics.js.map +1 -0
  36. package/dist/analyzer.d.ts +48 -0
  37. package/dist/analyzer.d.ts.map +1 -0
  38. package/dist/analyzer.js +547 -0
  39. package/dist/analyzer.js.map +1 -0
  40. package/dist/artifacts.d.ts +44 -0
  41. package/dist/artifacts.d.ts.map +1 -0
  42. package/dist/artifacts.js +165 -0
  43. package/dist/artifacts.js.map +1 -0
  44. package/dist/benchmarks/index.d.ts +88 -0
  45. package/dist/benchmarks/index.d.ts.map +1 -0
  46. package/dist/benchmarks/index.js +205 -0
  47. package/dist/benchmarks/index.js.map +1 -0
  48. package/dist/cli.d.ts +3 -0
  49. package/dist/cli.d.ts.map +1 -0
  50. package/dist/cli.js +427 -0
  51. package/dist/cli.js.map +1 -0
  52. package/dist/commands/ci.d.ts +19 -0
  53. package/dist/commands/ci.d.ts.map +1 -0
  54. package/dist/commands/ci.js +253 -0
  55. package/dist/commands/ci.js.map +1 -0
  56. package/dist/commands/config.d.ts +16 -0
  57. package/dist/commands/config.d.ts.map +1 -0
  58. package/dist/commands/config.js +249 -0
  59. package/dist/commands/config.js.map +1 -0
  60. package/dist/commands/demo.d.ts +15 -0
  61. package/dist/commands/demo.d.ts.map +1 -0
  62. package/dist/commands/demo.js +106 -0
  63. package/dist/commands/demo.js.map +1 -0
  64. package/dist/commands/export.d.ts +14 -0
  65. package/dist/commands/export.d.ts.map +1 -0
  66. package/dist/commands/export.js +209 -0
  67. package/dist/commands/export.js.map +1 -0
  68. package/dist/commands/history.d.ts +15 -0
  69. package/dist/commands/history.d.ts.map +1 -0
  70. package/dist/commands/history.js +389 -0
  71. package/dist/commands/history.js.map +1 -0
  72. package/dist/commands/template.d.ts +14 -0
  73. package/dist/commands/template.d.ts.map +1 -0
  74. package/dist/commands/template.js +341 -0
  75. package/dist/commands/template.js.map +1 -0
  76. package/dist/commands/validate-map.d.ts +12 -0
  77. package/dist/commands/validate-map.d.ts.map +1 -0
  78. package/dist/commands/validate-map.js +274 -0
  79. package/dist/commands/validate-map.js.map +1 -0
  80. package/dist/commands/whatif.d.ts +17 -0
  81. package/dist/commands/whatif.d.ts.map +1 -0
  82. package/dist/commands/whatif.js +206 -0
  83. package/dist/commands/whatif.js.map +1 -0
  84. package/dist/comparison.d.ts +38 -0
  85. package/dist/comparison.d.ts.map +1 -0
  86. package/dist/comparison.js +223 -0
  87. package/dist/comparison.js.map +1 -0
  88. package/dist/config.d.ts +42 -0
  89. package/dist/config.d.ts.map +1 -0
  90. package/dist/config.js +158 -0
  91. package/dist/config.js.map +1 -0
  92. package/dist/connectors/helicone.d.ts +9 -0
  93. package/dist/connectors/helicone.d.ts.map +1 -0
  94. package/dist/connectors/helicone.js +106 -0
  95. package/dist/connectors/helicone.js.map +1 -0
  96. package/dist/connectors/index.d.ts +37 -0
  97. package/dist/connectors/index.d.ts.map +1 -0
  98. package/dist/connectors/index.js +65 -0
  99. package/dist/connectors/index.js.map +1 -0
  100. package/dist/connectors/langsmith.d.ts +9 -0
  101. package/dist/connectors/langsmith.d.ts.map +1 -0
  102. package/dist/connectors/langsmith.js +122 -0
  103. package/dist/connectors/langsmith.js.map +1 -0
  104. package/dist/connectors/types.d.ts +83 -0
  105. package/dist/connectors/types.d.ts.map +1 -0
  106. package/dist/connectors/types.js +98 -0
  107. package/dist/connectors/types.js.map +1 -0
  108. package/dist/cost-estimator.d.ts +46 -0
  109. package/dist/cost-estimator.d.ts.map +1 -0
  110. package/dist/cost-estimator.js +104 -0
  111. package/dist/cost-estimator.js.map +1 -0
  112. package/dist/costs.d.ts +57 -0
  113. package/dist/costs.d.ts.map +1 -0
  114. package/dist/costs.js +251 -0
  115. package/dist/costs.js.map +1 -0
  116. package/dist/counterfactuals.d.ts +29 -0
  117. package/dist/counterfactuals.d.ts.map +1 -0
  118. package/dist/counterfactuals.js +448 -0
  119. package/dist/counterfactuals.js.map +1 -0
  120. package/dist/enhancement-prompts.d.ts +41 -0
  121. package/dist/enhancement-prompts.d.ts.map +1 -0
  122. package/dist/enhancement-prompts.js +88 -0
  123. package/dist/enhancement-prompts.js.map +1 -0
  124. package/dist/envelopes.d.ts +20 -0
  125. package/dist/envelopes.d.ts.map +1 -0
  126. package/dist/envelopes.js +790 -0
  127. package/dist/envelopes.js.map +1 -0
  128. package/dist/format-normalizer.d.ts +71 -0
  129. package/dist/format-normalizer.d.ts.map +1 -0
  130. package/dist/format-normalizer.js +1331 -0
  131. package/dist/format-normalizer.js.map +1 -0
  132. package/dist/history.d.ts +79 -0
  133. package/dist/history.d.ts.map +1 -0
  134. package/dist/history.js +313 -0
  135. package/dist/history.js.map +1 -0
  136. package/dist/html.d.ts +11 -0
  137. package/dist/html.d.ts.map +1 -0
  138. package/dist/html.js +463 -0
  139. package/dist/html.js.map +1 -0
  140. package/dist/impact.d.ts +42 -0
  141. package/dist/impact.d.ts.map +1 -0
  142. package/dist/impact.js +443 -0
  143. package/dist/impact.js.map +1 -0
  144. package/dist/index.d.ts +26 -0
  145. package/dist/index.d.ts.map +1 -0
  146. package/dist/index.js +34 -0
  147. package/dist/index.js.map +1 -0
  148. package/dist/insights.d.ts +5 -0
  149. package/dist/insights.d.ts.map +1 -0
  150. package/dist/insights.js +271 -0
  151. package/dist/insights.js.map +1 -0
  152. package/dist/joiner.d.ts +9 -0
  153. package/dist/joiner.d.ts.map +1 -0
  154. package/dist/joiner.js +247 -0
  155. package/dist/joiner.js.map +1 -0
  156. package/dist/orchestrator.d.ts +34 -0
  157. package/dist/orchestrator.d.ts.map +1 -0
  158. package/dist/orchestrator.js +827 -0
  159. package/dist/orchestrator.js.map +1 -0
  160. package/dist/pdf.d.ts +26 -0
  161. package/dist/pdf.d.ts.map +1 -0
  162. package/dist/pdf.js +84 -0
  163. package/dist/pdf.js.map +1 -0
  164. package/dist/prediction.d.ts +33 -0
  165. package/dist/prediction.d.ts.map +1 -0
  166. package/dist/prediction.js +316 -0
  167. package/dist/prediction.js.map +1 -0
  168. package/dist/prompts/loader.d.ts +38 -0
  169. package/dist/prompts/loader.d.ts.map +1 -0
  170. package/dist/prompts/loader.js +60 -0
  171. package/dist/prompts/loader.js.map +1 -0
  172. package/dist/renderer.d.ts +64 -0
  173. package/dist/renderer.d.ts.map +1 -0
  174. package/dist/renderer.js +923 -0
  175. package/dist/renderer.js.map +1 -0
  176. package/dist/runid.d.ts +57 -0
  177. package/dist/runid.d.ts.map +1 -0
  178. package/dist/runid.js +199 -0
  179. package/dist/runid.js.map +1 -0
  180. package/dist/runtime.d.ts +29 -0
  181. package/dist/runtime.d.ts.map +1 -0
  182. package/dist/runtime.js +366 -0
  183. package/dist/runtime.js.map +1 -0
  184. package/dist/scanner.d.ts +11 -0
  185. package/dist/scanner.d.ts.map +1 -0
  186. package/dist/scanner.js +426 -0
  187. package/dist/scanner.js.map +1 -0
  188. package/dist/templates.d.ts +120 -0
  189. package/dist/templates.d.ts.map +1 -0
  190. package/dist/templates.js +429 -0
  191. package/dist/templates.js.map +1 -0
  192. package/dist/tools/index.d.ts +153 -0
  193. package/dist/tools/index.d.ts.map +1 -0
  194. package/dist/tools/index.js +177 -0
  195. package/dist/tools/index.js.map +1 -0
  196. package/dist/types.d.ts +3647 -0
  197. package/dist/types.d.ts.map +1 -0
  198. package/dist/types.js +703 -0
  199. package/dist/types.js.map +1 -0
  200. package/dist/version.d.ts +7 -0
  201. package/dist/version.d.ts.map +1 -0
  202. package/dist/version.js +23 -0
  203. package/dist/version.js.map +1 -0
  204. package/docs/demo-guide.md +423 -0
  205. package/docs/events-format.md +295 -0
  206. package/docs/inferencemap-spec.md +344 -0
  207. package/docs/migration-v2.md +293 -0
  208. package/fixtures/demo/precomputed.json +142 -0
  209. package/fixtures/demo-project/README.md +52 -0
  210. package/fixtures/demo-project/ai-service.ts +65 -0
  211. package/fixtures/demo-project/sample-events.jsonl +15 -0
  212. package/fixtures/demo-project/src/ai-service.ts +128 -0
  213. package/fixtures/demo-project/src/llm-client.ts +155 -0
  214. package/package.json +65 -0
  215. package/prompts/agent-analyzer.yaml +47 -0
  216. package/prompts/ci-gate.yaml +98 -0
  217. package/prompts/correlation-analyzer.yaml +178 -0
  218. package/prompts/format-normalizer.yaml +46 -0
  219. package/prompts/peak-performance.yaml +180 -0
  220. package/prompts/pr-comment.yaml +111 -0
  221. package/prompts/runtime-analyzer.yaml +189 -0
  222. package/prompts/unified-analyzer.yaml +241 -0
  223. package/schemas/inference-map.v0.1.json +215 -0
  224. package/scripts/benchmark.ts +394 -0
  225. package/scripts/demo-v1.5.sh +158 -0
  226. package/scripts/sync-from-site.sh +197 -0
  227. package/scripts/validate-sync.sh +178 -0
  228. package/src/agent-analyzer.ts +481 -0
  229. package/src/agent.ts +1232 -0
  230. package/src/agents/correlation-analyzer.ts +353 -0
  231. package/src/agents/index.ts +235 -0
  232. package/src/agents/runtime-analyzer.ts +343 -0
  233. package/src/analysis-types.ts +558 -0
  234. package/src/analytics.ts +100 -0
  235. package/src/analyzer.ts +692 -0
  236. package/src/artifacts.ts +218 -0
  237. package/src/benchmarks/index.ts +309 -0
  238. package/src/cli.ts +503 -0
  239. package/src/commands/ci.ts +336 -0
  240. package/src/commands/config.ts +288 -0
  241. package/src/commands/demo.ts +175 -0
  242. package/src/commands/export.ts +297 -0
  243. package/src/commands/history.ts +425 -0
  244. package/src/commands/template.ts +385 -0
  245. package/src/commands/validate-map.ts +324 -0
  246. package/src/commands/whatif.ts +272 -0
  247. package/src/comparison.ts +283 -0
  248. package/src/config.ts +188 -0
  249. package/src/connectors/helicone.ts +164 -0
  250. package/src/connectors/index.ts +93 -0
  251. package/src/connectors/langsmith.ts +179 -0
  252. package/src/connectors/types.ts +180 -0
  253. package/src/cost-estimator.ts +146 -0
  254. package/src/costs.ts +347 -0
  255. package/src/counterfactuals.ts +516 -0
  256. package/src/enhancement-prompts.ts +118 -0
  257. package/src/envelopes.ts +814 -0
  258. package/src/format-normalizer.ts +1486 -0
  259. package/src/history.ts +400 -0
  260. package/src/html.ts +512 -0
  261. package/src/impact.ts +522 -0
  262. package/src/index.ts +83 -0
  263. package/src/insights.ts +341 -0
  264. package/src/joiner.ts +289 -0
  265. package/src/orchestrator.ts +1015 -0
  266. package/src/pdf.ts +110 -0
  267. package/src/prediction.ts +392 -0
  268. package/src/prompts/loader.ts +88 -0
  269. package/src/renderer.ts +1045 -0
  270. package/src/runid.ts +261 -0
  271. package/src/runtime.ts +450 -0
  272. package/src/scanner.ts +508 -0
  273. package/src/templates.ts +561 -0
  274. package/src/tools/index.ts +214 -0
  275. package/src/types.ts +873 -0
  276. package/src/version.ts +24 -0
  277. package/templates/context-accumulation.yaml +23 -0
  278. package/templates/cost-concentration.yaml +20 -0
  279. package/templates/dead-code.yaml +20 -0
  280. package/templates/latency-explainer.yaml +23 -0
  281. package/templates/optimizations/ab-testing-framework.yaml +74 -0
  282. package/templates/optimizations/api-gateway-optimization.yaml +81 -0
  283. package/templates/optimizations/api-model-routing-strategy.yaml +126 -0
  284. package/templates/optimizations/auto-scaling-optimization.yaml +85 -0
  285. package/templates/optimizations/batch-utilization-diagnostic.yaml +142 -0
  286. package/templates/optimizations/comprehensive-apm.yaml +76 -0
  287. package/templates/optimizations/context-window-optimization.yaml +91 -0
  288. package/templates/optimizations/cost-sensitive-batch-processing.yaml +77 -0
  289. package/templates/optimizations/distributed-training-optimization.yaml +77 -0
  290. package/templates/optimizations/document-analysis-edge.yaml +77 -0
  291. package/templates/optimizations/document-pipeline-optimization.yaml +78 -0
  292. package/templates/optimizations/domain-specific-distillation.yaml +78 -0
  293. package/templates/optimizations/error-handling-optimization.yaml +76 -0
  294. package/templates/optimizations/gptq-4bit-quantization.yaml +96 -0
  295. package/templates/optimizations/long-context-memory-management.yaml +78 -0
  296. package/templates/optimizations/max-tokens-optimization.yaml +76 -0
  297. package/templates/optimizations/memory-bandwidth-optimization.yaml +73 -0
  298. package/templates/optimizations/multi-framework-resilience.yaml +75 -0
  299. package/templates/optimizations/multi-tenant-optimization.yaml +75 -0
  300. package/templates/optimizations/prompt-caching-optimization.yaml +143 -0
  301. package/templates/optimizations/pytorch-to-onnx-migration.yaml +109 -0
  302. package/templates/optimizations/quality-monitoring.yaml +74 -0
  303. package/templates/optimizations/realtime-budget-controls.yaml +74 -0
  304. package/templates/optimizations/realtime-latency-optimization.yaml +74 -0
  305. package/templates/optimizations/sglang-concurrency-optimization.yaml +78 -0
  306. package/templates/optimizations/smart-model-routing.yaml +96 -0
  307. package/templates/optimizations/streaming-batch-selection.yaml +167 -0
  308. package/templates/optimizations/system-prompt-optimization.yaml +75 -0
  309. package/templates/optimizations/tensorrt-llm-performance.yaml +77 -0
  310. package/templates/optimizations/vllm-high-throughput-optimization.yaml +93 -0
  311. package/templates/optimizations/vllm-migration-memory-bound.yaml +78 -0
  312. package/templates/overpowered-extraction.yaml +32 -0
  313. package/templates/overpowered-model.yaml +31 -0
  314. package/templates/prompt-bloat.yaml +24 -0
  315. package/templates/retry-explosion.yaml +28 -0
  316. package/templates/schema/insight.schema.json +113 -0
  317. package/templates/schema/optimization.schema.json +180 -0
  318. package/templates/streaming-drift.yaml +30 -0
  319. package/templates/throughput-gap.yaml +21 -0
  320. package/templates/token-underutilization.yaml +28 -0
  321. package/templates/untested-fallback.yaml +21 -0
  322. package/tests/accuracy/drift-detection.test.ts +184 -0
  323. package/tests/accuracy/false-positives.test.ts +166 -0
  324. package/tests/accuracy/templates.test.ts +205 -0
  325. package/tests/action/commands.test.ts +125 -0
  326. package/tests/action/comments.test.ts +347 -0
  327. package/tests/cli.test.ts +203 -0
  328. package/tests/comparison.test.ts +309 -0
  329. package/tests/correlation-analyzer.test.ts +534 -0
  330. package/tests/counterfactuals.test.ts +347 -0
  331. package/tests/fixtures/events/missing-id.jsonl +1 -0
  332. package/tests/fixtures/events/missing-input.jsonl +1 -0
  333. package/tests/fixtures/events/missing-latency.jsonl +1 -0
  334. package/tests/fixtures/events/missing-model.jsonl +1 -0
  335. package/tests/fixtures/events/missing-output.jsonl +1 -0
  336. package/tests/fixtures/events/missing-provider.jsonl +1 -0
  337. package/tests/fixtures/events/missing-ts.jsonl +1 -0
  338. package/tests/fixtures/events/valid.csv +3 -0
  339. package/tests/fixtures/events/valid.json +1 -0
  340. package/tests/fixtures/events/valid.jsonl +2 -0
  341. package/tests/fixtures/events/with-callsite.jsonl +1 -0
  342. package/tests/fixtures/events/with-intent.jsonl +1 -0
  343. package/tests/fixtures/events/wrong-type.jsonl +1 -0
  344. package/tests/fixtures/repos/empty/.gitkeep +0 -0
  345. package/tests/fixtures/repos/hybrid-router/router.py +35 -0
  346. package/tests/fixtures/repos/saas-anthropic/agent.ts +27 -0
  347. package/tests/fixtures/repos/saas-openai/assistant.js +33 -0
  348. package/tests/fixtures/repos/saas-openai/client.py +26 -0
  349. package/tests/fixtures/repos/self-hosted-vllm/inference.py +22 -0
  350. package/tests/github-action.test.ts +292 -0
  351. package/tests/insights.test.ts +878 -0
  352. package/tests/joiner.test.ts +168 -0
  353. package/tests/performance/action-latency.test.ts +132 -0
  354. package/tests/performance/benchmark.test.ts +189 -0
  355. package/tests/performance/cli-latency.test.ts +102 -0
  356. package/tests/pr-comment.test.ts +313 -0
  357. package/tests/prediction.test.ts +296 -0
  358. package/tests/runtime-analyzer.test.ts +375 -0
  359. package/tests/runtime.test.ts +205 -0
  360. package/tests/scanner.test.ts +122 -0
  361. package/tests/template-conformance.test.ts +526 -0
  362. package/tests/unit/cost-calculator.test.ts +303 -0
  363. package/tests/unit/credits.test.ts +180 -0
  364. package/tests/unit/inference-map.test.ts +276 -0
  365. package/tests/unit/schema.test.ts +300 -0
  366. package/tsconfig.json +20 -0
  367. package/vitest.config.ts +14 -0
package/src/html.ts ADDED
@@ -0,0 +1,512 @@
1
+ import type { InferenceMap, Insight, JoinedOutput, RuntimeSummary } from './types.js';
2
+ import { generateImpactSummary, type ImpactSummary } from './impact.js';
3
+ import { VERSION } from './version.js';
4
+
5
+ // =============================================================================
6
+ // TYPES
7
+ // =============================================================================
8
+
9
/**
 * Input bundle consumed by `generateHTML` to build a report.
 */
export interface HTMLData {
  /** Inference map of the project; supplies the callsite table, summary counts and project path. */
  inferenceMap: InferenceMap;

  /** Insights rendered in the summary and findings sections. */
  insights: Insight[];

  /** Optional code/runtime join result; when present it is handed to the drift section. */
  joined?: JoinedOutput;

  /** Optional runtime statistics; when present the runtime section is rendered. */
  runtime?: RuntimeSummary;

  /**
   * Optional impact summary.
   * NOTE(review): `generateHTML` in this file does not read this field; the
   * summary section recomputes it via `generateImpactSummary` — confirm intent.
   */
  impactSummary?: ImpactSummary;
}
16
+
17
+ // =============================================================================
18
+ // STYLES
19
+ // =============================================================================
20
+
21
// Inline stylesheet for the generated report. generateHTML interpolates this
// string verbatim into the document's <style> element.
+ const STYLES = `
22
+ :root {
23
+ --critical: #dc2626;
24
+ --warning: #d97706;
25
+ --info: #2563eb;
26
+ --bg: #fafafa;
27
+ --text: #1a1a1a;
28
+ --muted: #6b7280;
29
+ --border: #e5e7eb;
30
+ }
31
+
32
+ * { box-sizing: border-box; margin: 0; padding: 0; }
33
+
34
+ body {
35
+ font-family: system-ui, -apple-system, sans-serif;
36
+ max-width: 1200px;
37
+ margin: 0 auto;
38
+ padding: 2rem;
39
+ background: var(--bg);
40
+ color: var(--text);
41
+ line-height: 1.6;
42
+ }
43
+
44
+ header {
45
+ margin-bottom: 2rem;
46
+ padding-bottom: 1rem;
47
+ border-bottom: 1px solid var(--border);
48
+ }
49
+
50
+ h1 { font-size: 1.5rem; font-weight: 600; }
51
+ h2 { font-size: 1.25rem; font-weight: 600; margin: 1.5rem 0 1rem; }
52
+ h3 { font-size: 1rem; font-weight: 600; margin: 1rem 0 0.5rem; }
53
+
54
+ .meta { color: var(--muted); font-size: 0.875rem; margin-top: 0.5rem; }
55
+ .meta-grid { display: grid; grid-template-columns: auto 1fr; gap: 0.25rem 1rem; margin-top: 0.75rem; }
56
+ .meta-label { color: var(--muted); font-size: 0.8rem; }
57
+ .meta-value { font-family: ui-monospace, monospace; font-size: 0.8rem; word-break: break-all; }
58
+ .project-name { font-size: 1.1rem; font-weight: 500; margin-top: 0.5rem; color: var(--text); }
59
+
60
+ section { margin-bottom: 2rem; }
61
+
62
+ .finding {
63
+ border-left: 4px solid;
64
+ padding: 1rem;
65
+ margin: 1rem 0;
66
+ background: white;
67
+ border-radius: 0 4px 4px 0;
68
+ }
69
+
70
+ .finding.critical { border-color: var(--critical); }
71
+ .finding.warning { border-color: var(--warning); }
72
+ .finding.info { border-color: var(--info); }
73
+
74
+ .finding h3 { margin: 0 0 0.5rem; }
75
+ .finding p { color: var(--muted); margin: 0; }
76
+ .finding code {
77
+ display: block;
78
+ margin-top: 0.5rem;
79
+ font-size: 0.875rem;
80
+ color: var(--muted);
81
+ font-family: ui-monospace, monospace;
82
+ }
83
+
84
+ .stats {
85
+ display: grid;
86
+ grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
87
+ gap: 1rem;
88
+ }
89
+
90
+ .stat {
91
+ background: white;
92
+ padding: 1rem;
93
+ border-radius: 4px;
94
+ border: 1px solid var(--border);
95
+ }
96
+
97
+ .stat-label { font-size: 0.875rem; color: var(--muted); }
98
+ .stat-value { font-size: 1.5rem; font-weight: 600; }
99
+
100
+ table {
101
+ width: 100%;
102
+ border-collapse: collapse;
103
+ font-size: 0.875rem;
104
+ background: white;
105
+ border-radius: 4px;
106
+ overflow: hidden;
107
+ }
108
+
109
+ th, td {
110
+ text-align: left;
111
+ padding: 0.75rem;
112
+ border-bottom: 1px solid var(--border);
113
+ }
114
+
115
+ th { background: var(--bg); font-weight: 600; }
116
+ tr:last-child td { border-bottom: none; }
117
+
118
+ details { margin: 1rem 0; }
119
+ summary { cursor: pointer; font-weight: 500; }
120
+
121
+ footer {
122
+ margin-top: 3rem;
123
+ padding-top: 1rem;
124
+ border-top: 1px solid var(--border);
125
+ color: var(--muted);
126
+ font-size: 0.875rem;
127
+ }
128
+
129
+ footer a { color: var(--info); text-decoration: none; }
130
+ footer a:hover { text-decoration: underline; }
131
+
132
+ .badge {
133
+ display: inline-block;
134
+ padding: 0.125rem 0.5rem;
135
+ border-radius: 9999px;
136
+ font-size: 0.75rem;
137
+ font-weight: 500;
138
+ }
139
+
140
+ .badge.streaming { background: #dbeafe; color: #1d4ed8; }
141
+ .badge.batching { background: #dcfce7; color: #15803d; }
142
+ .badge.retries { background: #fef3c7; color: #b45309; }
143
+ .badge.caching { background: #f3e8ff; color: #7e22ce; }
144
+ .badge.fallback { background: #fee2e2; color: #dc2626; }
145
+
146
+ .summary-line { font-size: 1.25rem; margin: 0.5rem 0; }
147
+ .potential { font-size: 1.5rem; margin: 1rem 0; }
148
+ .potential strong { color: #15803d; }
149
+
150
+ .layer-table { max-width: 500px; margin: 1rem 0; }
151
+ .layer-table td:first-child { width: 40px; }
152
+
153
+ .quick-wins { margin: 1rem 0; padding-left: 1.5rem; }
154
+ .quick-wins li { margin: 0.5rem 0; }
155
+
156
+ .impact-tag {
157
+ font-size: 0.75rem;
158
+ color: var(--muted);
159
+ font-weight: normal;
160
+ }
161
+
162
+ .location-list {
163
+ margin: 0.5rem 0;
164
+ padding-left: 1.5rem;
165
+ font-size: 0.8rem;
166
+ }
167
+
168
+ .location-list li {
169
+ margin: 0.25rem 0;
170
+ }
171
+
172
+ .location-list code {
173
+ display: inline;
174
+ margin: 0;
175
+ color: var(--text);
176
+ }
177
+
178
+ .finding details {
179
+ margin-top: 0.5rem;
180
+ }
181
+
182
+ .finding details summary {
183
+ font-size: 0.875rem;
184
+ color: var(--muted);
185
+ cursor: pointer;
186
+ }
187
+
188
+ .finding p {
189
+ font-size: 0.875rem;
190
+ }
191
+ `;
192
+
193
+ // =============================================================================
194
+ // HELPERS
195
+ // =============================================================================
196
+
197
/**
 * Escape a string for safe interpolation into HTML text or a quoted attribute.
 *
 * Replaces `&`, `<`, `>`, `"` and `'` with their entity forms.
 *
 * @param str - Raw text to embed in the report.
 * @returns The text with HTML-significant characters replaced by entities.
 */
function escapeHtml(str: string): string {
  return str
    // Ampersand must go first; otherwise the entities produced below would
    // themselves be re-escaped.
    .replace(/&/g, '&amp;')
    .replace(/</g, '&lt;')
    .replace(/>/g, '&gt;')
    .replace(/"/g, '&quot;')
    .replace(/'/g, '&#39;');
}
204
+
205
/**
 * Format a count compactly: millions as `"1.2M"`, thousands as `"3.4K"`,
 * anything smaller via `toLocaleString()`.
 *
 * @param n - The number to format.
 * @returns The abbreviated display string.
 */
function formatNumber(n: number): string {
  // Values from 999,950 up would round to "1000.0K" with one decimal place,
  // so they are promoted to the millions bucket and shown as "1.0M".
  const MILLIONS_ROLLOVER = 999_950;

  if (n >= MILLIONS_ROLLOVER) return `${(n / 1_000_000).toFixed(1)}M`;
  if (n >= 1_000) return `${(n / 1_000).toFixed(1)}K`;
  return n.toLocaleString();
}
210
+
211
/**
 * Build one badge `<span>` per pattern flag that is truthy.
 *
 * @param patterns - Map of pattern name to an on/off flag.
 * @returns The badges joined by a single space; empty string when none are set.
 */
function renderPatterns(patterns: Record<string, boolean | undefined>): string {
  const badges: string[] = [];

  for (const name of Object.keys(patterns)) {
    if (!patterns[name]) continue;
    // The pattern name doubles as the CSS modifier class on the badge.
    badges.push(`<span class="badge ${name}">${name}</span>`);
  }

  return badges.join(' ');
}
217
+
218
+ // =============================================================================
219
+ // SECTIONS
220
+ // =============================================================================
221
+
222
/**
 * Render the "Potential Performance Improvement" section.
 *
 * Computes an impact summary from the insights, then emits the headline
 * percentages, a per-layer ranking table and up to three quick wins.
 *
 * @param insights - Insights to summarize.
 * @param callsiteCount - Number of inference points shown in the summary line.
 * @returns HTML for the `<section id="summary">` element.
 */
function renderSummary(insights: Insight[], callsiteCount: number): string {
  const summary = generateImpactSummary(insights);
  const { costReductionPercent, latencyReductionPercent, throughputGainPercent } = summary.totalPotentialImpact;

  // Only dimensions with a positive estimate are shown.
  const potentialParts: string[] = [];
  if (costReductionPercent > 0) potentialParts.push(`<strong>-${costReductionPercent}%</strong> cost`);
  if (latencyReductionPercent > 0) potentialParts.push(`<strong>-${latencyReductionPercent}%</strong> latency`);
  if (throughputGainPercent > 0) potentialParts.push(`<strong>+${throughputGainPercent}%</strong> throughput`);

  const layerRows = summary.stackRanking.map((rank, i) => {
    // Guard the division so a layer with no insights shows 0 instead of NaN/Infinity.
    const avgImpact = rank.insightCount > 0
      ? Math.round(rank.totalImpactPercent / rank.insightCount)
      : 0;
    return `<tr><td>${i + 1}</td><td>${escapeHtml(rank.layer)}</td><td>~${avgImpact}%</td><td>${rank.insightCount}</td></tr>`;
  }).join('');

  // Deduplicate quick wins by templateId + headline, then keep the first three.
  const seen = new Set<string>();
  const uniqueQuickWins = summary.quickWins.filter(insight => {
    const key = `${insight.templateId || ''}:${insight.headline}`;
    if (seen.has(key)) return false;
    seen.add(key);
    return true;
  }).slice(0, 3);

  const quickWins = uniqueQuickWins.map(insight => {
    const pct = insight.impact?.estimatedImpactPercent || 0;
    const type = insight.impact?.impactType || '';
    const typeLabel = type === 'cost' ? 'cost reduction' : type === 'latency' ? 'latency reduction' : type;
    // Prefer the impact assumptions text when present; otherwise fall back to the headline.
    const recommendation = insight.impact?.assumptions || insight.headline;
    return `<li><strong>${escapeHtml(recommendation)}</strong> <span class="impact-tag">(${pct}% ${escapeHtml(typeLabel)})</span></li>`;
  }).join('');

  return `
<section id="summary">
<h2>Potential Performance Improvement</h2>
<p class="summary-line">${insights.length} findings across ${callsiteCount} inference points</p>
${potentialParts.length > 0 ? `<p class="potential">${potentialParts.join(' &nbsp;|&nbsp; ')}</p>` : ''}

${summary.stackRanking.length > 0 ? `
<h3>By Layer</h3>
<table class="layer-table">
<thead><tr><th>#</th><th>Layer</th><th>Avg Impact</th><th>Items</th></tr></thead>
<tbody>${layerRows}</tbody>
</table>
` : ''}

${uniqueQuickWins.length > 0 ? `
<h3>Quick Wins</h3>
<ul class="quick-wins">${quickWins}</ul>
` : ''}
</section>
`;
}
275
+
276
/**
 * Render the "Findings" section.
 *
 * Insights are grouped by recommendation text (impact assumptions, or the
 * headline when there are none) so the report shows one entry per
 * recommendation with a collapsible list of locations, rather than one entry
 * per callsite. Groups are ordered by estimated impact, highest first.
 *
 * @param insights - Insights to render.
 * @returns HTML for the `<section id="findings">` element.
 */
function renderFindings(insights: Insight[]): string {
  if (insights.length === 0) {
    return `
<section id="findings">
<h2>Findings</h2>
<p>No issues detected. Your inference setup looks good.</p>
</section>
`;
  }

  const grouped = new Map<string, {
    recommendation: string;
    severity: string;
    layer: string;
    impactType: string;
    impactPercent: number;
    locations: string[];
  }>();

  for (const insight of insights) {
    const recommendation = insight.impact?.assumptions || insight.headline;

    // The first insight seen for a recommendation fixes the group's severity
    // and impact figures; later ones only contribute their location.
    let group = grouped.get(recommendation);
    if (!group) {
      group = {
        recommendation,
        severity: insight.severity,
        layer: insight.impact?.layer || '',
        impactType: insight.impact?.impactType || 'improvement',
        impactPercent: insight.impact?.estimatedImpactPercent || 0,
        locations: [],
      };
      grouped.set(recommendation, group);
    }
    if (insight.location) {
      group.locations.push(insight.location);
    }
  }

  // Sort by impact (highest first).
  const sortedGroups = Array.from(grouped.values()).sort((a, b) => b.impactPercent - a.impactPercent);

  const items = sortedGroups.map(group => {
    const typeLabel = group.impactType === 'cost' ? 'cost reduction'
      : group.impactType === 'latency' ? 'latency reduction'
      : group.impactType;
    // The impact tag is only shown when the insight carries a layer.
    const impactTag = group.layer
      ? `<span class="impact-tag">[${escapeHtml(group.layer)}] ${group.impactPercent}% ${escapeHtml(typeLabel)}</span>`
      : '';
    const locationCount = group.locations.length;
    const locationList = group.locations.map(loc => `<li><code>${escapeHtml(loc)}</code></li>`).join('');

    return `
<div class="finding ${escapeHtml(group.severity)}">
<h3>${escapeHtml(group.recommendation)} ${impactTag}</h3>
<p>${locationCount} inference point${locationCount !== 1 ? 's' : ''}</p>
${locationCount > 0 ? `
<details>
<summary>Show locations</summary>
<ul class="location-list">${locationList}</ul>
</details>
` : ''}
</div>
`;
  }).join('');

  return `
<section id="findings">
<h2>Findings</h2>
${items}
</section>
`;
}
352
+
353
/**
 * Render the collapsible "InferenceMap" table, one row per callsite.
 *
 * @param map - Inference map whose `callsites` fill the table and whose
 *   `summary.totalCallsites` labels the disclosure summary.
 * @returns HTML for the `<section id="inferencemap">` element.
 */
function renderInferenceMap(map: InferenceMap): string {
  // Every text cell is escaped; a missing provider or model is shown as "-".
  const rows = map.callsites.map(cs => `
<tr>
<td>${escapeHtml(cs.file)}</td>
<td>${cs.line}</td>
<td>${escapeHtml(cs.provider || '-')}</td>
<td>${escapeHtml(cs.model || '-')}</td>
<td>${renderPatterns(cs.patterns)}</td>
</tr>
`).join('');

  return `
<section id="inferencemap">
<h2>InferenceMap</h2>
<details>
<summary>${map.summary.totalCallsites} inference points</summary>
<table>
<thead>
<tr>
<th>File</th>
<th>Line</th>
<th>Provider</th>
<th>Model</th>
<th>Patterns</th>
</tr>
</thead>
<tbody>
${rows}
</tbody>
</table>
</details>
</section>
`;
}
387
+
388
/**
 * Render the "Runtime" section: four stat cards showing the total event count
 * and the global p50 / p95 / p99 latency values.
 *
 * @param runtime - Runtime summary to display.
 * @returns HTML for the `<section id="runtime">` element.
 */
function renderRuntime(runtime: RuntimeSummary): string {
  const totalEvents = formatNumber(runtime.totalEvents);
  const latency = runtime.global;

  // Label/value pairs in display order.
  const stats: Array<[string, string]> = [
    ['Total Events', totalEvents],
    ['Latency p50', `${latency.p50}ms`],
    ['Latency p95', `${latency.p95}ms`],
    ['Latency p99', `${latency.p99}ms`],
  ];

  const cards = stats.map(([label, value]) => [
    '<div class="stat">',
    `<div class="stat-label">${label}</div>`,
    `<div class="stat-value">${value}</div>`,
    '</div>',
  ].join('\n'));

  // The empty first and last entries produce the leading and trailing newline.
  return [
    '',
    '<section id="runtime">',
    '<h2>Runtime</h2>',
    '<div class="stats">',
    ...cards,
    '</div>',
    '</section>',
    '',
  ].join('\n');
}
413
+
414
/**
 * Render the "Drift" section listing callsites seen only in code and
 * provider/model pairs seen only at runtime.
 *
 * @param joined - Join result supplying `drift`, `codeOnly` and `runtimeOnly`.
 * @returns HTML for the `<section id="drift">` element, or an empty string
 *   when `joined.drift` is empty.
 */
function renderDrift(joined: JoinedOutput): string {
  // NOTE(review): the section is gated on `joined.drift`, while the lists
  // below are built from `codeOnly` / `runtimeOnly` — confirm this is intended.
  if (joined.drift.length === 0) return '';

  // Provider and model are escaped like the file name; "?" marks a missing value.
  const codeOnlyItems = joined.codeOnly.map(cs =>
    `<li>${escapeHtml(cs.file)}:${cs.line} — ${escapeHtml(cs.provider || '?')}/${escapeHtml(cs.model || '?')}</li>`
  ).join('');

  // Collapse runtime-only events into one line per provider/model with a count.
  const runtimeByKey = new Map<string, number>();
  for (const evt of joined.runtimeOnly) {
    const key = `${evt.provider}/${evt.model}`;
    runtimeByKey.set(key, (runtimeByKey.get(key) || 0) + 1);
  }

  const runtimeOnlyItems = Array.from(runtimeByKey.entries())
    .map(([key, count]) => `<li>${escapeHtml(key)} — ${count} events</li>`)
    .join('');

  return `
<section id="drift">
<h2>Drift</h2>
${joined.codeOnly.length > 0 ? `
<h3>Code-only (${joined.codeOnly.length})</h3>
<ul>${codeOnlyItems}</ul>
` : ''}
${joined.runtimeOnly.length > 0 ? `
<h3>Runtime-only (${runtimeByKey.size})</h3>
<ul>${runtimeOnlyItems}</ul>
` : ''}
</section>
`;
}
445
+
446
+ // =============================================================================
447
+ // PUBLIC API
448
+ // =============================================================================
449
+
450
/**
 * Build the complete standalone HTML report.
 *
 * The document has a header (project name, path, generation time), a project
 * overview, the summary, findings and inference-map sections, and, when the
 * corresponding data is supplied, the runtime and drift sections.
 *
 * @param data - Report inputs; `runtime` and `joined` are optional.
 * @returns The full HTML document as a string.
 */
export function generateHTML(data: HTMLData): string {
  const { inferenceMap, insights, joined, runtime } = data;
  const now = new Date();
  // ISO timestamp trimmed to seconds, e.g. "2024-01-31 12:34:56 UTC".
  const timestamp = `${now.toISOString().replace('T', ' ').substring(0, 19)} UTC`;
  const callsiteCount = inferenceMap.summary.totalCallsites;

  // Use absolute path if available, otherwise fall back to root.
  const absolutePath = inferenceMap.metadata?.absolutePath || inferenceMap.root;
  // Split on both separators so a Windows path ("C:\\work\\app") yields its
  // last segment instead of the whole path.
  const projectName = absolutePath.split(/[\\/]/).filter(Boolean).pop() || 'Unknown Project';

  // Build project overview.
  const providers = inferenceMap.summary.providers;
  const models = inferenceMap.summary.models;
  const patterns = Object.entries(inferenceMap.summary.patterns)
    .filter(([, count]) => count > 0)
    .map(([name, count]) => `${name} (${count})`)
    .join(', ') || 'none detected';

  return `<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>PeakInfer Report — ${escapeHtml(projectName)}</title>
<style>${STYLES}</style>
</head>
<body>
<header>
<h1>PeakInfer Report</h1>
<p class="project-name">${escapeHtml(projectName)}</p>
<div class="meta-grid">
<span class="meta-label">Path</span>
<span class="meta-value">${escapeHtml(absolutePath)}</span>
<span class="meta-label">Generated</span>
<span class="meta-value">${timestamp}</span>
</div>
</header>

<section id="overview">
<h2>Project Overview</h2>
<p><strong>${callsiteCount}</strong> inference points found across <strong>${providers.length}</strong> providers and <strong>${models.length}</strong> models.</p>
<div class="meta-grid" style="margin-top: 1rem;">
<span class="meta-label">Providers</span>
<span class="meta-value">${escapeHtml(providers.join(', '))}</span>
<span class="meta-label">Models</span>
<span class="meta-value">${escapeHtml(models.slice(0, 5).join(', '))}${models.length > 5 ? ` +${models.length - 5} more` : ''}</span>
<span class="meta-label">Patterns</span>
<span class="meta-value">${escapeHtml(patterns)}</span>
</div>
</section>

${renderSummary(insights, callsiteCount)}
${renderFindings(insights)}
${renderInferenceMap(inferenceMap)}
${runtime ? renderRuntime(runtime) : ''}
${joined ? renderDrift(joined) : ''}

<footer>
<p>Generated by PeakInfer v${VERSION} | <a href="https://github.com/Kalmantic/peakinfer">GitHub</a></p>
</footer>
</body>
</html>`;
}