npm - perf-skill - Versions diffs - 0.0.1 → 0.2.0 - Mend

perf-skill 0.0.1 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (116) hide show

package/LICENSE +21 -0
package/README.md +414 -0
package/SKILL.md +238 -0
package/dist/cli/main.d.ts +6 -0
package/dist/cli/main.d.ts.map +1 -0
package/dist/cli/main.js +353 -0
package/dist/cli/main.js.map +1 -0
package/dist/cli/options.d.ts +37 -0
package/dist/cli/options.d.ts.map +1 -0
package/dist/cli/options.js +54 -0
package/dist/cli/options.js.map +1 -0
package/dist/convert/converter.d.ts +39 -0
package/dist/convert/converter.d.ts.map +1 -0
package/dist/convert/converter.js +99 -0
package/dist/convert/converter.js.map +1 -0
package/dist/convert/extract.d.ts +32 -0
package/dist/convert/extract.d.ts.map +1 -0
package/dist/convert/extract.js +235 -0
package/dist/convert/extract.js.map +1 -0
package/dist/convert/index.d.ts +7 -0
package/dist/convert/index.d.ts.map +1 -0
package/dist/convert/index.js +7 -0
package/dist/convert/index.js.map +1 -0
package/dist/convert/sanitize.d.ts +60 -0
package/dist/convert/sanitize.d.ts.map +1 -0
package/dist/convert/sanitize.js +169 -0
package/dist/convert/sanitize.js.map +1 -0
package/dist/diff/engine.d.ts +76 -0
package/dist/diff/engine.d.ts.map +1 -0
package/dist/diff/engine.js +386 -0
package/dist/diff/engine.js.map +1 -0
package/dist/diff/index.d.ts +6 -0
package/dist/diff/index.d.ts.map +1 -0
package/dist/diff/index.js +6 -0
package/dist/diff/index.js.map +1 -0
package/dist/diff/markdown.d.ts +16 -0
package/dist/diff/markdown.d.ts.map +1 -0
package/dist/diff/markdown.js +342 -0
package/dist/diff/markdown.js.map +1 -0
package/dist/index.d.ts +52 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +247 -0
package/dist/index.js.map +1 -0
package/dist/llm/client.d.ts +39 -0
package/dist/llm/client.d.ts.map +1 -0
package/dist/llm/client.js +270 -0
package/dist/llm/client.js.map +1 -0
package/dist/llm/index.d.ts +8 -0
package/dist/llm/index.d.ts.map +1 -0
package/dist/llm/index.js +8 -0
package/dist/llm/index.js.map +1 -0
package/dist/llm/prompt.d.ts +32 -0
package/dist/llm/prompt.d.ts.map +1 -0
package/dist/llm/prompt.js +146 -0
package/dist/llm/prompt.js.map +1 -0
package/dist/llm/schema.d.ts +150 -0
package/dist/llm/schema.d.ts.map +1 -0
package/dist/llm/schema.js +131 -0
package/dist/llm/schema.js.map +1 -0
package/dist/llm/validate.d.ts +33 -0
package/dist/llm/validate.d.ts.map +1 -0
package/dist/llm/validate.js +241 -0
package/dist/llm/validate.js.map +1 -0
package/dist/profile/duration.d.ts +2 -0
package/dist/profile/duration.d.ts.map +1 -0
package/dist/profile/duration.js +24 -0
package/dist/profile/duration.js.map +1 -0
package/dist/profile/preload.d.ts +2 -0
package/dist/profile/preload.d.ts.map +1 -0
package/dist/profile/preload.js +100 -0
package/dist/profile/preload.js.map +1 -0
package/dist/profile/runner.d.ts +22 -0
package/dist/profile/runner.d.ts.map +1 -0
package/dist/profile/runner.js +88 -0
package/dist/profile/runner.js.map +1 -0
package/dist/server/http.d.ts +27 -0
package/dist/server/http.d.ts.map +1 -0
package/dist/server/http.js +285 -0
package/dist/server/http.js.map +1 -0
package/dist/server/utils.d.ts +15 -0
package/dist/server/utils.d.ts.map +1 -0
package/dist/server/utils.js +71 -0
package/dist/server/utils.js.map +1 -0
package/dist/skill/handler.d.ts +77 -0
package/dist/skill/handler.d.ts.map +1 -0
package/dist/skill/handler.js +91 -0
package/dist/skill/handler.js.map +1 -0
package/dist/skill/index.d.ts +6 -0
package/dist/skill/index.d.ts.map +1 -0
package/dist/skill/index.js +6 -0
package/dist/skill/index.js.map +1 -0
package/dist/skill/manifest.d.ts +17 -0
package/dist/skill/manifest.d.ts.map +1 -0
package/dist/skill/manifest.js +231 -0
package/dist/skill/manifest.js.map +1 -0
package/dist/types.d.ts +260 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +5 -0
package/dist/types.js.map +1 -0
package/dist/utils/fs.d.ts +52 -0
package/dist/utils/fs.d.ts.map +1 -0
package/dist/utils/fs.js +106 -0
package/dist/utils/fs.js.map +1 -0
package/dist/utils/index.d.ts +7 -0
package/dist/utils/index.d.ts.map +1 -0
package/dist/utils/index.js +7 -0
package/dist/utils/index.js.map +1 -0
package/dist/utils/limits.d.ts +38 -0
package/dist/utils/limits.d.ts.map +1 -0
package/dist/utils/limits.js +86 -0
package/dist/utils/limits.js.map +1 -0
package/dist/utils/logger.d.ts +21 -0
package/dist/utils/logger.d.ts.map +1 -0
package/dist/utils/logger.js +82 -0
package/dist/utils/logger.js.map +1 -0
package/package.json +70 -6

package/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 skillsland
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

package/README.md ADDED Viewed

@@ -0,0 +1,414 @@
+# perf-skill
+![Node CI](https://github.com/skillsland/perf-skill/workflows/Node%20CI/badge.svg)
+[![npm version](https://badge.fury.io/js/perf-skill.svg)](http://badge.fury.io/js/perf-skill)
+![license](https://img.shields.io/npm/l/perf-skill)
+AI‑assisted pprof toolkit for CPU/heap profiles: convert .pb.gz/.pprof to structured Markdown, compare profiles for regressions, and optionally generate evidence‑backed recommendations.
+## Features
+- **Convert**: Transform pprof profiles to structured Markdown
+- **Analyze**: Get AI-powered optimization recommendations
+- **Diff**: Compare two profiles to find regressions
+- **Multi-format**: Library, CLI, and HTTP API
+## Installation
+```bash
+npm install perf-skill
+```
+Or run directly with npx:
+```bash
+npx perf-skill analyze profile.pb.gz
+```
+## Quick Start
+### CLI Usage
+```bash
+# Convert profile to markdown (fast, no LLM)
+perf-skill convert cpu.pb.gz -o report.md
+# Full analysis with AI recommendations
+perf-skill analyze cpu.pb.gz --mode analyze
+# Profile a Node entry (CPU, 10s) and analyze
+perf-skill run slow.mjs --duration 10s
+# CPU + Heap profiling (separate reports)
+perf-skill run slow.mjs --heap --output cpu.md --heap-output heap.md
+# Compare two profiles
+perf-skill diff base.pb.gz current.pb.gz -o diff.md
+# Start HTTP server
+perf-skill server --port 3000
+```
+### Programmatic Usage
+```typescript
+import { analyze, diff } from "perf-skill";
+// Convert only (no LLM)
+const result = await analyze("cpu.pb.gz", { mode: "convert-only" });
+console.log(result.markdown);
+console.log(result.hotspots);
+// Full analysis with AI recommendations
+const fullResult = await analyze("cpu.pb.gz", {
+  mode: "analyze",
+  context: {
+    serviceName: "api-server",
+    scenario: "load test",
+    targetSLO: "p99 < 100ms",
+  },
+});
+console.log(fullResult.recommendations);
+// Compare two profiles
+const diffResult = await diff("base.pb.gz", "current.pb.gz", {
+  normalize: "scale-to-base-total",
+});
+console.log(diffResult.regressions);
+console.log(diffResult.improvements);
+```
+### HTTP API
+```bash
+# Start server
+perf-skill server
+# Start server with security overrides
+perf-skill server --no-cors --no-helmet --rate-limit --rate-limit-max 120 --rate-limit-window-ms 60000
+# Analyze profile
+curl -X POST http://localhost:3000/v1/pprof/analyze \
+  -F "file=@cpu.pb.gz"
+# Compare profiles
+curl -X POST http://localhost:3000/v1/pprof/diff \
+  -F "base=@base.pb.gz" \
+  -F "current=@current.pb.gz"
+```
+## CLI Options
+### `perf-skill analyze <profile.pb.gz>`
+| Option                 | Description                                      | Default    |
+| ---------------------- | ------------------------------------------------ | ---------- |
+| `-f, --format`         | Output format: `summary`, `detailed`, `adaptive` | `adaptive` |
+| `-t, --type`           | Profile type: `cpu`, `heap`, `auto`              | `auto`     |
+| `-o, --output`         | Output markdown file                             | stdout     |
+| `-j, --json`           | Output JSON results file                         | -          |
+| `-m, --mode`           | `convert-only` or `analyze`                      | `analyze`  |
+| `-s, --source-dir`     | Source directory for code context                | -          |
+| `--max-hotspots`       | Maximum hotspots to show                         | `10`       |
+| `--llm-provider`       | LLM provider: `openai`, `anthropic`, etc.        | `openai`   |
+| `--llm-model`          | LLM model name                                   | `gpt-5.2`  |
+| `--service`            | Service name for context                         | -          |
+| `--scenario`           | Scenario description                             | -          |
+| `--redact/--no-redact` | Redact sensitive information                     | `true`     |
+### `perf-skill run <entry> [entryArgs...]`
+| Option                  | Description                                      | Default                     |
+| ----------------------- | ------------------------------------------------ | --------------------------- |
+| `-d, --duration`        | CPU profile duration (e.g. `10s`, `5000ms`)      | `10s`                       |
+| `--profile-out`         | Profile output file                              | `cpu.pb.gz`                 |
+| `--heap`                | Also capture a heap profile                      | `false`                     |
+| `--heap-profile-out`    | Heap profile output file                         | `heap.pb.gz`                |
+| `--heap-interval-bytes` | Heap sampling interval (bytes)                   | `524288`                    |
+| `--heap-stack-depth`    | Heap sampling stack depth                        | `64`                        |
+| `--heap-output`         | Heap markdown output file                        | `heap.md` (if heap enabled) |
+| `--heap-json`           | Heap JSON output file                            | -                           |
+| `-f, --format`          | Output format: `summary`, `detailed`, `adaptive` | `adaptive`                  |
+| `-t, --type`            | Profile type: `cpu`, `heap`, `auto`              | `auto`                      |
+| `-o, --output`          | Output markdown file                             | stdout                      |
+| `-j, --json`            | Output JSON results file                         | -                           |
+| `-m, --mode`            | `convert-only` or `analyze`                      | `analyze`                   |
+| `-s, --source-dir`      | Source directory for code context                | -                           |
+| `--max-hotspots`        | Maximum hotspots to show                         | `10`                        |
+| `--llm-provider`        | LLM provider: `openai`, `anthropic`, etc.        | `openai`                    |
+| `--llm-model`           | LLM model name                                   | `gpt-5.2`                   |
+| `--service`             | Service name for context                         | -                           |
+| `--scenario`            | Scenario description                             | -                           |
+| `--redact/--no-redact`  | Redact sensitive information                     | `true`                      |
+When `--heap` is enabled and `--output` is omitted, `perf-skill` writes `cpu.md` and `heap.md` instead of printing to stdout.
+### `perf-skill profile <entry> [entryArgs...]`
+| Option                  | Description                                 | Default      |
+| ----------------------- | ------------------------------------------- | ------------ |
+| `-d, --duration`        | CPU profile duration (e.g. `10s`, `5000ms`) | `10s`        |
+| `-o, --output`          | Profile output file                         | `cpu.pb.gz`  |
+| `--heap`                | Also capture a heap profile                 | `false`      |
+| `--heap-profile-out`    | Heap profile output file                    | `heap.pb.gz` |
+| `--heap-interval-bytes` | Heap sampling interval (bytes)              | `524288`     |
+| `--heap-stack-depth`    | Heap sampling stack depth                   | `64`         |
+### `perf-skill diff <base.pb.gz> <current.pb.gz>`
+| Option                     | Description                                      | Default               |
+| -------------------------- | ------------------------------------------------ | --------------------- |
+| `-f, --format`             | `diff-summary`, `diff-detailed`, `diff-adaptive` | `diff-adaptive`       |
+| `-n, --normalize`          | `none`, `scale-to-base-total`, `per-second`      | `scale-to-base-total` |
+| `--max-regressions`        | Maximum regressions to show                      | `10`                  |
+| `--max-improvements`       | Maximum improvements to show                     | `5`                   |
+| `--max-decompressed-bytes` | Maximum decompressed profile size (bytes)        | -                     |
+## Output Formats
+### Summary
+Compact format for quick triage:
+```markdown
+# PPROF Analysis: CPU
+**Duration:** 30s | **Samples:** 45,231
+## Top Hotspots
+| Rank | Function         | Self% | Cum%  | Location         |
+| ---- | ---------------- | ----- | ----- | ---------------- |
+| 1    | `JSON.parse`     | 23.4% | 23.4% | `<native>`       |
+| 2    | `processRequest` | 15.2% | 67.8% | `handler.ts:142` |
+```
+### Detailed
+Full context with call trees and source code.
+### Adaptive (Default)
+Summary with drill-down sections and anchor links for navigation.
+## AI Recommendations
+When using `--mode analyze`, the tool generates structured recommendations:
+```typescript
+interface Recommendation {
+  title: string; // Short action title
+  rationale: string; // Evidence-based explanation
+  steps: string[]; // Concrete action steps
+  expectedImpact: "high" | "medium" | "low";
+  risk: "high" | "medium" | "low";
+  confidence: number; // 0-1 based on evidence quality
+}
+```
+All recommendations must reference evidence from the profile (function names, percentages, locations).
+## Profile Diff
+Compare two profiles to identify performance regressions:
+```typescript
+const result = await diff("base.pb.gz", "current.pb.gz");
+// Top regressions (got slower)
+for (const reg of result.regressions) {
+  console.log(`${reg.function}: +${reg.deltaSelfPct.toFixed(1)}%`);
+}
+// Top improvements (got faster)
+for (const imp of result.improvements) {
+  console.log(`${imp.function}: ${imp.deltaSelfPct.toFixed(1)}%`);
+}
+```
+### Normalization Modes
+- **none**: Direct comparison (current - base)
+- **scale-to-base-total**: Scale current to match base total (compare structure)
+- **per-second**: Normalize by duration (compare rate)
+## Collecting Profiles
+### Node.js with @datadog/pprof
+```typescript
+import * as pprof from "@datadog/pprof";
+import { writeFileSync } from "fs";
+import { gzipSync } from "zlib";
+// CPU profiling
+pprof.time.start({ durationMillis: 30000 });
+// ... run workload ...
+const profile = await pprof.time.stop();
+writeFileSync("cpu.pb.gz", gzipSync(profile.encode()));
+// Heap profiling
+pprof.heap.start(512 * 1024, 64);
+// ... run workload ...
+const heapProfile = await pprof.heap.profile();
+writeFileSync("heap.pb.gz", gzipSync(heapProfile.encode()));
+```
+## Configuration
+### Environment Variables
+| Variable               | Description                                     |
+| ---------------------- | ----------------------------------------------- |
+| `OPENAI_API_KEY`       | OpenAI API key for analysis                     |
+| `ANTHROPIC_API_KEY`    | Anthropic API key                               |
+| `LLM_PROVIDER`         | Default LLM provider                            |
+| `LLM_MODEL`            | Default LLM model                               |
+| `LLM_BASE_URL`         | Custom LLM API endpoint                         |
+| `LLM_TIMEOUT_MS`       | LLM request timeout in ms                       |
+| `LLM_MAX_RETRIES`      | LLM retry count for transient failures          |
+| `LLM_RETRY_DELAY_MS`   | Base retry delay in ms                          |
+| `LOG_LEVEL`            | Logging level: `debug`, `info`, `warn`, `error` |
+| `LOG_FORMAT`           | Log format: `text`, `json`                      |
+| `CORS_ENABLED`         | Enable CORS (`true`/`false`)                    |
+| `CORS_ORIGIN`          | CORS origin(s), comma-separated or `*`          |
+| `HELMET_ENABLED`       | Enable Helmet (`true`/`false`)                  |
+| `RATE_LIMIT_ENABLED`   | Enable rate limiting (`true`/`false`)           |
+| `RATE_LIMIT_MAX`       | Rate limit max requests per window              |
+| `RATE_LIMIT_WINDOW_MS` | Rate limit window size in ms                    |
+Example:
+```bash
+export LLM_TIMEOUT_MS=30000
+export LLM_MAX_RETRIES=2
+export LLM_RETRY_DELAY_MS=500
+```
+### Resource Limits
+```typescript
+const result = await analyze("large-profile.pb.gz", {
+  limits: {
+    maxProfileBytes: 100 * 1024 * 1024, // 100MB
+    maxDecompressedBytes: 200 * 1024 * 1024, // 200MB uncompressed
+    maxMarkdownChars: 500_000, // 500k chars
+    maxSourceLinesPerFile: 100, // lines per snippet
+    timeoutMs: 120_000, // 2 minutes
+  },
+});
+```
+## Security
+### Redaction
+By default, the tool redacts:
+- AWS access keys
+- Bearer tokens
+- Private keys
+- API keys and secrets
+- Absolute paths (normalized to relative)
+Disable with `--no-redact` or `redact: false`.
+### Server Mode
+In HTTP server mode:
+- Source code inclusion is disabled by default
+- File size limits are enforced
+- Only `.pb.gz` files are accepted
+Security defaults (configurable via env or server options):
+- CORS enabled (set `CORS_ENABLED=false` to disable)
+- Helmet enabled (set `HELMET_ENABLED=false` to disable)
+- Rate limiting enabled (default 60 req/min, set `RATE_LIMIT_ENABLED=false` or `RATE_LIMIT_MAX=0` to disable)
+Server CLI flags (override env defaults):
+- `--cors/--no-cors`
+- `--cors-origin <origin>` (comma-separated or `*`)
+- `--helmet/--no-helmet`
+- `--rate-limit/--no-rate-limit`
+- `--rate-limit-max <n>`
+- `--rate-limit-window-ms <ms>`
+ServerOptions (programmatic):
+```typescript
+const server = await createServer({
+  enableCors: true,
+  corsOrigin: "https://example.com",
+  enableHelmet: true,
+  enableRateLimit: true,
+  rateLimitMax: 60,
+  rateLimitWindowMs: 60_000,
+});
+```
+## Requirements
+- Node.js >= 22.6.0
+- For AI analysis: API key for OpenAI, Anthropic, or compatible provider
+- CPU profiling uses bundled `@datadog/pprof` (native module) on supported platforms
+## Architecture
+```
+perf-skill/
+├── src/
+│   ├── index.ts          # Main exports
+│   ├── types.ts          # TypeScript types
+│   ├── convert/          # pprof-to-md wrapper
+│   │   ├── converter.ts  # Core conversion
+│   │   ├── sanitize.ts   # Redaction & limits
+│   │   └── extract.ts    # Hotspot parsing
+│   ├── llm/              # LLM integration
+│   │   ├── client.ts     # OpenAI/Anthropic clients
+│   │   ├── prompt.ts     # Prompt templates
+│   │   ├── schema.ts     # Zod schemas
+│   │   └── validate.ts   # Output validation
+│   ├── diff/             # Profile comparison
+│   │   ├── engine.ts     # Pure TS diff engine
+│   │   └── markdown.ts   # Diff report generation
+│   ├── cli/              # CLI implementation
+│   ├── server/           # HTTP API
+│   └── skill/            # Agent integration
+│       ├── handler.ts    # Skill handlers
+│       └── manifest.ts   # Tool schema
+├── SKILL.md              # Claude Code skill file
+└── package.json
+```
+## API Reference
+### `analyze(profile, options): Promise<AnalyzeResult>`
+Analyze a single profile.
+### `diff(baseProfile, currentProfile, options): Promise<DiffResult>`
+Compare two profiles.
+### `convertProfileToMarkdown(buffer, options): Promise<ConvertResult>`
+Low-level conversion function.
+### `createLLMClient(config): LLMClient`
+Create an LLM client for custom integrations.
+## License
+MIT
+## Updating Prompt Fixtures
+If you change prompt templates and need to refresh fixtures:
+```bash
+npm run update-prompts
+```

package/SKILL.md ADDED Viewed

@@ -0,0 +1,238 @@
+---
+name: perf-skill
+description: Analyze pprof CPU and heap profiles with AI-powered recommendations, or profile a Node.js entry file and generate a full report. Use when the user has a .pb.gz profile file or wants to profile a Node.js script and get optimization suggestions.
+argument-hint: [profile.pb.gz|entry.js] [options]
+allowed-tools: Bash(node *), Bash(npx *), Read, Glob
+---
+# perf-skill: Performance Profile Analysis Skill
+Analyze pprof profiles (.pb.gz) to identify performance bottlenecks and generate actionable optimization recommendations.
+## Quick Start
+### Analyze a Single Profile
+```bash
+# Quick conversion to markdown (no LLM)
+npx perf-skill convert $ARGUMENTS
+# Full analysis with AI recommendations
+npx perf-skill analyze $ARGUMENTS --mode analyze
+# Output to file
+npx perf-skill analyze $ARGUMENTS -o analysis.md -j results.json
+```
+### Profile a Node Entry and Analyze (One Command)
+```bash
+# Default CPU profiling (10s) + analysis
+npx perf-skill run slow.mjs
+# Customize duration and output
+npx perf-skill run slow.mjs --duration 10s -o analysis.md
+# CPU + Heap profiling (separate reports)
+npx perf-skill run slow.mjs --heap --output cpu.md --heap-output heap.md
+```
+### Compare Two Profiles (Diff)
+```bash
+# Compare base vs current profile
+npx perf-skill diff base.pb.gz current.pb.gz
+# With specific format
+npx perf-skill diff base.pb.gz current.pb.gz --format diff-detailed
+```
+## When to Use This Skill
+Use `perf-skill` when:
+- User provides a `.pb.gz` pprof profile file
+- User provides a Node.js entry file (`.js/.mjs/.cjs`) and wants an end-to-end performance report
+- User asks "why is my app slow?" with a profile attached
+- User wants to compare performance before/after a change
+- User needs help interpreting profile data
+- User asks about CPU or memory hotspots
+## Routing
+- If the argument ends with `.pb`, `.pb.gz`, or `.pprof`, run `analyze` or `diff` directly.
+- If the argument ends with `.js`, `.mjs`, or `.cjs`, run `perf-skill run <entry>` to generate a CPU profile and analyze it.
+- If the user asks for both CPU and heap (including misspellings like "heep" or terms like "memory"/"heap"), add `--heap` and save separate reports (`--output` + `--heap-output`).
+## Available Commands
+### `analyze` (default)
+Analyze a single profile with optional AI recommendations.
+```bash
+perf-skill analyze profile.pb.gz [options]
+```
+**Options:**
+- `-f, --format <format>`: Output format (`summary`, `detailed`, `adaptive`)
+- `-t, --type <type>`: Profile type (`cpu`, `heap`, `auto`)
+- `-o, --output <file>`: Save markdown to file
+- `-j, --json <file>`: Save JSON results to file
+- `-m, --mode <mode>`: `convert-only` (no LLM) or `analyze` (with LLM)
+- `-s, --source-dir <path>`: Include source code context
+- `--max-hotspots <n>`: Limit hotspots shown (default: 10)
+- `--service <name>`: Service name for context
+- `--scenario <desc>`: Scenario description
+### `diff`
+Compare two profiles to find performance regressions.
+```bash
+perf-skill diff base.pb.gz current.pb.gz [options]
+```
+**Options:**
+- `-f, --format <format>`: `diff-summary`, `diff-detailed`, `diff-adaptive`
+- `-n, --normalize <mode>`: `none`, `scale-to-base-total`, `per-second`
+- `--max-regressions <n>`: Limit regressions shown (default: 10)
+- `--max-improvements <n>`: Limit improvements shown (default: 5)
+### `convert`
+Convert profile to markdown without AI analysis (faster).
+```bash
+perf-skill convert profile.pb.gz -o report.md
+```
+### `run`
+Profile a Node entry file (CPU) and analyze the resulting profile.
+```bash
+perf-skill run entry.js [entryArgs...]
+```
+**Options:**
+- `-d, --duration <duration>`: Profiling duration (default: `10s`)
+- `--profile-out <file>`: Profile output file (default: `cpu.pb.gz`)
+- `--heap`: Also capture heap profile
+- `--heap-profile-out <file>`: Heap profile output file (default: `heap.pb.gz`)
+- `--heap-output <file>`: Heap markdown output file (default: derived from CPU output or `heap.md`)
+- `--heap-json <file>`: Heap JSON output file (optional)
+- `--heap-interval-bytes <n>`: Heap sampling interval (bytes, default: `524288`)
+- `--heap-stack-depth <n>`: Heap sampling stack depth (default: `64`)
+- All `analyze` options (`--format`, `--mode`, `--output`, etc.)
+When `--heap` is enabled and `--output` is omitted, the CLI writes `cpu.md` and `heap.md` instead of printing to stdout.
+### `profile`
+Generate a CPU profile for a Node entry file without analysis.
+```bash
+perf-skill profile entry.js [entryArgs...]
+```
+**Options:**
+- `-d, --duration <duration>`: Profiling duration (default: `10s`)
+- `-o, --output <file>`: Profile output file (default: `cpu.pb.gz`)
+- `--heap`: Also capture heap profile
+- `--heap-profile-out <file>`: Heap profile output file (default: `heap.pb.gz`)
+- `--heap-interval-bytes <n>`: Heap sampling interval (bytes, default: `524288`)
+- `--heap-stack-depth <n>`: Heap sampling stack depth (default: `64`)
+## Programmatic Usage
+```typescript
+import { analyze, diff } from 'perf-skill';
+// Analyze with AI
+const result = await analyze('cpu.pb.gz', {
+  mode: 'analyze',
+  context: { serviceName: 'api-server' }
+});
+console.log(result.markdown);
+console.log(result.recommendations);
+// Compare profiles
+const diffResult = await diff('base.pb.gz', 'current.pb.gz');
+console.log(diffResult.regressions);
+```
+## Understanding the Output
+### Hotspots
+Functions ranked by CPU time or memory allocation:
+- **Self%**: Time spent in this function only
+- **Cum%**: Time spent in this function + its callees
+- **Location**: Source file and line number
+### Recommendations (AI mode)
+Each recommendation includes:
+- **Title**: What to do
+- **Rationale**: Why (with evidence from the profile)
+- **Steps**: How to implement
+- **Impact/Risk/Confidence**: Prioritization info
+### Diff Analysis
+When comparing profiles:
+- **Regressions**: Functions that got slower
+- **Improvements**: Functions that got faster
+- **Call Path Δ**: Which paths contributed to the change
+## Collecting Profiles
+### Node.js with @datadog/pprof
+```typescript
+import * as pprof from '@datadog/pprof';
+import { writeFileSync } from 'fs';
+import { gzipSync } from 'zlib';
+// CPU profiling (30 seconds)
+pprof.time.start({ durationMillis: 30000 });
+// ... run your workload ...
+const profile = await pprof.time.stop();
+writeFileSync('cpu.pb.gz', gzipSync(profile.encode()));
+// Heap profiling
+pprof.heap.start(512 * 1024, 64);
+// ... run your workload ...
+const heapProfile = await pprof.heap.profile();
+writeFileSync('heap.pb.gz', gzipSync(heapProfile.encode()));
+```
+## Tips
+1. **Start with `--format summary`** for quick triage
+2. **Use `--mode convert-only`** when you just need the markdown
+3. **Compare profiles** to find the cause of regressions
+4. **Provide context** (`--service`, `--scenario`) for better AI recommendations
+5. **High self%** = function is doing expensive work directly
+6. **High cum%** = function is on a hot path (may be calling slow functions)
+## Requirements
+- Node.js >= 22.6.0
+- For AI analysis: Set `OPENAI_API_KEY` or configure LLM provider
+- CPU profiling uses bundled `@datadog/pprof` (native module); supported on common platforms
+## Troubleshooting
+### "No symbols found"
+The profile may be from a production build without debug info. The analysis still works but function names may be mangled.
+### "Native code dominates"
+If native functions (like `JSON.parse`) are top hotspots, consider:
+- Using streaming parsers for large JSON
+- Caching parsed results
+- Using binary formats like Protocol Buffers
+### "Low sample count"
+Run the profiler longer to get more samples for statistical significance.

package/dist/cli/main.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+#!/usr/bin/env node
+/**
+ * perf-skill CLI - Analyze pprof profiles with AI assistance
+ */
+export {};
+//# sourceMappingURL=main.d.ts.map

package/dist/cli/main.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"main.d.ts","sourceRoot":"","sources":["../../src/cli/main.ts"],"names":[],"mappings":";AACA;;GAEG"}