npm - firecrawl-cli - Versions diffs - 1.9.3 → 1.9.5 - Mend

firecrawl-cli 1.9.3 → 1.9.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62) hide show

package/dist/commands/experimental/workflows/demo.js ADDED Viewed

@@ -0,0 +1,190 @@
+"use strict";
+/**
+ * Workflow: Demo Walkthrough
+ *
+ * Uses Firecrawl's cloud browser to walk through a product's key flows --
+ * signup, onboarding, pricing, docs -- step by step. Captures every screen,
+ * documents interactions, and produces a structured walkthrough report.
+ */
+// Module-interop helpers used by the dynamic `__importStar(require(...))` call further down.
+// Each helper reuses a definition already present on `this` before falling back to its own.
+//
+// __createBinding(o, m, k, k2): exposes m[k] on o under the name k2 (k2 defaults to k).
+// When Object.create exists it goes through Object.defineProperty, substituting an
+// enumerable getter when m has no usable descriptor for k; otherwise it assigns directly.
+var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    var desc = Object.getOwnPropertyDescriptor(m, k);
+    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
+      desc = { enumerable: true, get: function() { return m[k]; } };
+    }
+    Object.defineProperty(o, k2, desc);
+}) : (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    o[k2] = m[k];
+}));
+// __setModuleDefault(o, v): stores v as the enumerable "default" property of o.
+var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
+    Object.defineProperty(o, "default", { enumerable: true, value: v });
+}) : function(o, v) {
+    o["default"] = v;
+});
+// __importStar(mod): returns mod untouched when it is flagged __esModule; otherwise builds a
+// new object that re-exports every own key of mod except "default" and sets "default" to mod.
+var __importStar = (this && this.__importStar) || (function () {
+    // ownKeys replaces itself on first call with Object.getOwnPropertyNames, or with a
+    // for-in/hasOwnProperty fallback when that function is unavailable.
+    var ownKeys = function(o) {
+        ownKeys = Object.getOwnPropertyNames || function (o) {
+            var ar = [];
+            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
+            return ar;
+        };
+        return ownKeys(o);
+    };
+    return function (mod) {
+        if (mod && mod.__esModule) return mod;
+        var result = {};
+        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
+        __setModuleDefault(result, mod);
+        return result;
+    };
+})();
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.register = register;
+const backends_1 = require("../backends");
+const shared_1 = require("../shared");
+// ─── Input gathering ────────────────────────────────────────────────────────
+async function gatherInputs(prefill) {
+    const { input, select } = await Promise.resolve().then(() => __importStar(require('@inquirer/prompts')));
+    const rawUrl = prefill?.url ||
+        (await input({
+            message: 'What product do you want to walk through?',
+            validate: shared_1.validateUrl,
+        }));
+    const focus = await select({
+        message: 'What flows should the agent explore?',
+        choices: [
+            { name: 'Full product walkthrough (all key flows)', value: 'full' },
+            { name: 'Signup and onboarding flow', value: 'signup' },
+            { name: 'Pricing and plans', value: 'pricing' },
+            { name: 'Documentation and developer experience', value: 'docs' },
+            { name: 'Dashboard and core product', value: 'dashboard' },
+        ],
+    });
+    const context = await input({
+        message: 'Anything specific to look for? (leave blank to skip)',
+        default: '',
+    });
+    const output = await select({
+        message: 'How should the walkthrough be delivered?',
+        choices: [
+            { name: 'Print to terminal', value: 'terminal' },
+            { name: 'Save as Markdown file', value: 'markdown' },
+        ],
+    });
+    return { url: (0, shared_1.normalizeUrl)(rawUrl), focus, context, output };
+}
+// ─── System prompt ──────────────────────────────────────────────────────────
+/**
+ * Builds the system prompt for the demo walkthrough agent.
+ *
+ * @param opts Object with `focus` (one of the keys of `focusInstructions` below) and
+ *             `output` ('markdown' selects the save-to-file instructions; any other value
+ *             selects the print-to-terminal instructions).
+ * @returns The prompt text, with the shared QA tools block, the agent assignments for the
+ *          chosen focus, the shared subagent instructions and the output instructions
+ *          interpolated into a fixed report template.
+ */
+function buildSystemPrompt(opts) {
+    // Delivery instructions: only 'markdown' writes a file; everything else prints.
+    const outputInstructions = opts.output === 'markdown'
+        ? 'Save the walkthrough to a file called `demo-walkthrough.md` in the current directory. Tell the user the file path when done.'
+        : 'Print the full walkthrough to the terminal in well-formatted markdown.';
+    // Agent assignments keyed by focus value. A focus that is not a key here would be
+    // interpolated into the prompt as the text "undefined".
+    const focusInstructions = {
+        full: `Spawn these parallel agents, each walking a different flow:
+1. **Homepage & Marketing Agent** -- Open the homepage. Click through marketing pages (features, about, use cases). Document the messaging, value prop, key claims, and CTAs. Note what's above the fold vs below.
+2. **Signup & Onboarding Agent** -- Find the signup/get-started flow. Walk through every step of signup and onboarding. Document each screen, what's required, friction points, and the first-run experience. Do NOT submit real credentials -- just document the flow.
+3. **Pricing & Plans Agent** -- Navigate to pricing. Click to expand tiers, toggle monthly/annual, check feature comparisons. Document every plan, price, and feature. Look for hidden costs or confusing language.
+4. **Docs & Developer Experience Agent** -- Navigate to docs. Walk through the quickstart guide. Check navigation, code examples, search functionality. Document the developer onboarding experience.`,
+        signup: `Spawn these parallel agents to thoroughly explore the signup and onboarding experience:
+1. **Signup Discovery Agent** -- Find every signup entry point (header CTA, pricing page, landing pages). Document how many clicks to get to signup from different starting points.
+2. **Signup Flow Agent** -- Walk through the signup form step by step. Document every field, validation message, and screen transition. Note required vs optional fields. Do NOT submit real credentials.
+3. **Onboarding Agent** -- After signup screens, document the onboarding flow: welcome screens, setup wizards, tutorials, first-run experience. Walk through every step.
+4. **Social Proof Agent** -- Look for trust signals during signup: testimonials, logos, security badges, terms. Document what reassurance the user gets during the flow.`,
+        pricing: `Spawn these parallel agents to deeply analyze the pricing experience:
+1. **Pricing Page Agent** -- Navigate to the pricing page. Snapshot the full layout. Toggle between monthly/annual. Click to expand feature lists. Document every plan name, price, and feature.
+2. **Feature Comparison Agent** -- Find the feature comparison table or matrix. Click through each tier's detail page. Document what's included and excluded at each level.
+3. **Pricing Discovery Agent** -- Check multiple entry points to pricing (nav, footer, CTAs). Look for different pricing shown to different segments. Check if pricing changes based on region or plan selection.
+4. **Competitor Pricing Agent** -- Search for and scrape competitor pricing pages. Build a side-by-side comparison of pricing tiers and features.`,
+        docs: `Spawn these parallel agents to walk through the documentation experience:
+1. **Quickstart Agent** -- Find and follow the quickstart guide from start to finish. Try every step. Document the experience: was it clear? Were code examples correct? How long would it take a new developer?
+2. **Navigation Agent** -- Explore the doc structure. Click through the sidebar, use search, check breadcrumbs. Document the information architecture and how easy it is to find things.
+3. **Code Examples Agent** -- Find code examples across the docs. Check multiple languages/SDKs. Document which are available, their quality, and whether they look copy-pasteable.
+4. **API Reference Agent** -- Find the API reference. Walk through endpoints, check request/response examples, look for interactive "try it" features. Document completeness and usability.`,
+        dashboard: `Spawn these parallel agents to explore the core product experience:
+1. **Entry Point Agent** -- Find the login/dashboard entry. Document what the user sees on first login. Walk through the main navigation. Map out the product sections.
+2. **Core Flow Agent** -- Identify the primary user action (create something, configure something). Walk through it step by step. Document each screen and interaction.
+3. **Settings & Config Agent** -- Explore settings, integrations, API keys, team management. Document what's configurable and how.
+4. **Help & Support Agent** -- Find help resources within the product: tooltips, help center links, chat widgets, documentation links. Document what support is available in-context.`,
+    };
+    // Fixed template: role, strategy, agent assignments, then the required report structure.
+    return `You are a product demo team lead powered by Firecrawl. You walk through a product's key flows using cloud browser automation, documenting every screen and interaction.
+${shared_1.QA_TOOLS_BLOCK}
+## Your Strategy
+You are a **team lead**. Your job is to:
+1. **Open the site first** -- Run \`firecrawl browser "open <url>"\` yourself to get the initial page state and understand the site structure.
+2. **Spawn parallel subagents** -- Each agent walks through a different flow using \`firecrawl browser\`. They click, scroll, type, and snapshot their way through the product.
+3. **Collect results** -- Each agent reports back a step-by-step walkthrough of their flow.
+4. **Synthesize** -- Merge all walkthroughs into one structured report.
+## Agent Assignments
+${focusInstructions[opts.focus]}
+${shared_1.SUBAGENT_INSTRUCTIONS}
+- Tell each agent to use \`firecrawl browser\` commands to navigate interactively
+- Each agent should describe every screen they see: layout, content, CTAs, forms
+- Agents should \`firecrawl browser "snapshot"\` at each step to see interactive elements
+- Agents should note the user experience: what's clear, what's confusing, what's missing
+## Output Format
+${outputInstructions}
+Structure the walkthrough as:
+### Product Overview
+One paragraph summary of what the product does based on exploring it.
+### Flow Walkthroughs
+For each flow explored:
+#### [Flow Name]
+Step-by-step walkthrough:
+1. **[Screen/Page Name]** -- What's on screen, key elements, what the user would do next
+2. **[Next Screen]** -- What changed, new elements, user actions available
+...
+Key observations:
+- What works well
+- What's confusing or could be improved
+- Notable UX patterns
+### Key Findings
+- First impression and overall UX quality
+- Standout features or patterns
+- Friction points or usability issues
+- How the product compares to typical products in the space
+### Recommendations
+What could be improved, from a user experience perspective.
+### Pages Visited
+Full list of every URL the agents navigated to.
+---
+Be specific and descriptive. Don't just say "the pricing page looks good" -- describe what's on it, how it's organized, and what makes it effective or not.
+Start by opening the site, then immediately fan out your agents to walk through different flows in parallel.`;
+}
+// ─── Command registration ───────────────────────────────────────────────────
+function register(parentCmd, backend) {
+    const config = backends_1.BACKENDS[backend];
+    parentCmd
+        .command('demo')
+        .description("Walk through a product's key flows using cloud browser")
+        .argument('[url]', 'Product URL to explore')
+        .option('-y, --yes', 'Auto-approve all tool permissions')
+        .action(async (url, options) => {
+        const inputs = await gatherInputs(url ? { url } : undefined);
+        const skipPermissions = options.yes || (await (0, shared_1.askPermissionMode)(backend));
+        console.log(`\nLaunching ${config.displayName}...\n`);
+        (0, backends_1.launchAgent)(backend, buildSystemPrompt({ focus: inputs.focus, output: inputs.output }), (0, shared_1.buildMessage)([`Walk through ${inputs.url}`, inputs.context]), skipPermissions);
+    });
+}
+//# sourceMappingURL=demo.js.map

package/dist/commands/experimental/workflows/demo.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"demo.js","sourceRoot":"","sources":["../../../../src/commands/experimental/workflows/demo.ts"],"names":[],"mappings":";AAAA;;;;;;GAMG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AA0KH,4BAqBC;AA5LD,0CAAkE;AAClE,sCAOmB;AAWnB,+EAA+E;AAE/E,KAAK,UAAU,YAAY,CAAC,OAA0B;IACpD,MAAM,EAAE,KAAK,EAAE,MAAM,EAAE,GAAG,wDAAa,mBAAmB,GAAC,CAAC;IAE5D,MAAM,MAAM,GACV,OAAO,EAAE,GAAG;QACZ,CAAC,MAAM,KAAK,CAAC;YACX,OAAO,EAAE,2CAA2C;YACpD,QAAQ,EAAE,oBAAW;SACtB,CAAC,CAAC,CAAC;IAEN,MAAM,KAAK,GAAG,MAAM,MAAM,CAAC;QACzB,OAAO,EAAE,sCAAsC;QAC/C,OAAO,EAAE;YACP,EAAE,IAAI,EAAE,0CAA0C,EAAE,KAAK,EAAE,MAAM,EAAE;YACnE,EAAE,IAAI,EAAE,4BAA4B,EAAE,KAAK,EAAE,QAAQ,EAAE;YACvD,EAAE,IAAI,EAAE,mBAAmB,EAAE,KAAK,EAAE,SAAS,EAAE;YAC/C,EAAE,IAAI,EAAE,wCAAwC,EAAE,KAAK,EAAE,MAAM,EAAE;YACjE,EAAE,IAAI,EAAE,4BAA4B,EAAE,KAAK,EAAE,WAAW,EAAE;SAC3D;KACF,CAAC,CAAC;IAEH,MAAM,OAAO,GAAG,MAAM,KAAK,CAAC;QAC1B,OAAO,EAAE,sDAAsD;QAC/D,OAAO,EAAE,EAAE;KACZ,CAAC,CAAC;IAEH,MAAM,MAAM,GAAG,MAAM,MAAM,CAAC;QAC1B,OAAO,EAAE,0CAA0C;QACnD,OAAO,EAAE;YACP,EAAE,IAAI,EAAE,mBAAmB,EAAE,KAAK,EAAE,UAAU,EAAE;YAChD,EAAE,IAAI,EAAE,uBAAuB,EAAE,KAAK,EAAE,UAAU,EAAE;SACrD;KACF,CAAC,CAAC;IAEH,OAAO,EAAE,GAAG,EAAE,IAAA,qBAAY,EAAC,MAAM,CAAC,EAAE,KAAK,EAAE,OAAO,EAAE,MAAM,EAAE,CAAC;AAC/D,CAAC;AAED,+EAA+E;AAE/E,SAAS,iBAAiB,CAAC,IAAuC;IAChE,MAAM,kBAAkB,GACtB,IAAI,CAAC,MAAM,KAAK,UAAU;QACxB,CAAC,CAAC,8HAA8H;QAChI,CAAC,CAAC,wEAAwE,CAAC;IAE/E,MAAM,iBAAiB,GAA2B;QAChD,IAAI,EAAE;;;;sMAI4L;QAElM,MAAM,EAAE;;;;yKAI6J;QAErK,OAAO,EAAE;;;;kJAIqI;QAE9I,IAAI,EAAE;;;;4LAIkL;QAExL,SAAS,EAAE;;;;sLAIuK;KACnL,CAAC;IAEF,OAAO;;EAEP,uBAAc;;;;;;;;;;;;;EAad,iBAAiB,CAAC,IAAI,CAAC,KAAK,CAAC;;EAE7B,8BAAqB;;;;;;;;;EASrB,kBAAkB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;6GAsCyF,CAAC;AAC9G,CAAC;AAED,+EAA+E;AAE/E,SAAgB,QAAQ,CAAC,SAAkB,EAAE,OAAgB;IAC3D,MAAM,MAAM,GAAG,mBAAQ,CAAC,OAAO,CAAC,CAAC;IAEjC,SAAS;SACN,OAAO,CAAC,MAAM,CAAC;SACf,WAAW,CAAC,wDAAwD,CAAC;SACrE,QAAQ,CAAC,OAAO,EAAE,wBAAwB,CAAC;SAC3C,MAAM,CAAC,WAAW,EAAE,mCAAmC,CAAC;SACxD,MAAM,CAAC,KAAK,EAAE,GAAG,EAAE,OAAO,EAAE,EAAE;QAC7B,MAAM,MAAM,GAA
G,MAAM,YAAY,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,GAAG,EAAE,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC;QAE7D,MAAM,eAAe,GAAG,OAAO,CAAC,GAAG,IAAI,CAAC,MAAM,IAAA,0BAAiB,EAAC,OAAO,CAAC,CAAC,CAAC;QAC1E,OAAO,CAAC,GAAG,CAAC,eAAe,MAAM,CAAC,WAAW,OAAO,CAAC,CAAC;QAEtD,IAAA,sBAAW,EACT,OAAO,EACP,iBAAiB,CAAC,EAAE,KAAK,EAAE,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,CAAC,EACjE,IAAA,qBAAY,EAAC,CAAC,gBAAgB,MAAM,CAAC,GAAG,EAAE,EAAE,MAAM,CAAC,OAAO,CAAC,CAAC,EAC5D,eAAe,CAChB,CAAC;IACJ,CAAC,CAAC,CAAC;AACP,CAAC"}

package/dist/commands/experimental/workflows/knowledge-base.d.ts ADDED Viewed

@@ -0,0 +1,11 @@
+/**
+ * Workflow: Knowledge Base
+ *
+ * A single command that adapts based on the user's goal: local reference docs,
+ * RAG-ready chunks, fine-tuning datasets, or full doc site mirrors. All output
+ * follows the `.firecrawl/<hostname>/<path>/index.md` convention.
+ */
+import { Command } from 'commander';
+import { type Backend } from '../backends';
+/**
+ * Adds the `knowledge-base` workflow subcommand to `parentCmd`.
+ *
+ * @param parentCmd - Commander command the subcommand is attached to.
+ * @param backend - Backend (see `../backends`) used when the workflow launches its agent.
+ */
+export declare function register(parentCmd: Command, backend: Backend): void;
+//# sourceMappingURL=knowledge-base.d.ts.map

package/dist/commands/experimental/workflows/knowledge-base.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"knowledge-base.d.ts","sourceRoot":"","sources":["../../../../src/commands/experimental/workflows/knowledge-base.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,EAAE,OAAO,EAAE,MAAM,WAAW,CAAC;AACpC,OAAO,EAAE,KAAK,OAAO,EAAyB,MAAM,aAAa,CAAC;AAwTlE,wBAAgB,QAAQ,CAAC,SAAS,EAAE,OAAO,EAAE,OAAO,EAAE,OAAO,GAAG,IAAI,CAgCnE"}

package/dist/commands/experimental/workflows/knowledge-base.js ADDED Viewed

@@ -0,0 +1,319 @@
+"use strict";
+/**
+ * Workflow: Knowledge Base
+ *
+ * A single command that adapts based on the user's goal: local reference docs,
+ * RAG-ready chunks, fine-tuning datasets, or full doc site mirrors. All output
+ * follows the `.firecrawl/<hostname>/<path>/index.md` convention.
+ */
+// Module-interop helpers used by the dynamic `__importStar(require(...))` call further down.
+// Each helper reuses a definition already present on `this` before falling back to its own.
+//
+// __createBinding(o, m, k, k2): exposes m[k] on o under the name k2 (k2 defaults to k).
+// When Object.create exists it goes through Object.defineProperty, substituting an
+// enumerable getter when m has no usable descriptor for k; otherwise it assigns directly.
+var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    var desc = Object.getOwnPropertyDescriptor(m, k);
+    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
+      desc = { enumerable: true, get: function() { return m[k]; } };
+    }
+    Object.defineProperty(o, k2, desc);
+}) : (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    o[k2] = m[k];
+}));
+// __setModuleDefault(o, v): stores v as the enumerable "default" property of o.
+var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
+    Object.defineProperty(o, "default", { enumerable: true, value: v });
+}) : function(o, v) {
+    o["default"] = v;
+});
+// __importStar(mod): returns mod untouched when it is flagged __esModule; otherwise builds a
+// new object that re-exports every own key of mod except "default" and sets "default" to mod.
+var __importStar = (this && this.__importStar) || (function () {
+    // ownKeys replaces itself on first call with Object.getOwnPropertyNames, or with a
+    // for-in/hasOwnProperty fallback when that function is unavailable.
+    var ownKeys = function(o) {
+        ownKeys = Object.getOwnPropertyNames || function (o) {
+            var ar = [];
+            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
+            return ar;
+        };
+        return ownKeys(o);
+    };
+    return function (mod) {
+        if (mod && mod.__esModule) return mod;
+        var result = {};
+        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
+        __setModuleDefault(result, mod);
+        return result;
+    };
+})();
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.register = register;
+const backends_1 = require("../backends");
+const shared_1 = require("../shared");
+// ─── Input gathering ────────────────────────────────────────────────────────
+async function gatherInputs(prefill) {
+    const { input, select } = await Promise.resolve().then(() => __importStar(require('@inquirer/prompts')));
+    const rawSource = prefill?.source ||
+        (await input({
+            message: 'What do you want to build a knowledge base from? (URL or topic)',
+            validate: (0, shared_1.validateRequired)('URL or topic'),
+        }));
+    const goal = await select({
+        message: 'What are you building this for?',
+        choices: [
+            {
+                name: 'Local reference (organized markdown files)',
+                value: 'reference',
+            },
+            {
+                name: 'RAG / embedding pipeline (chunked, with metadata)',
+                value: 'rag',
+            },
+            { name: 'Fine-tuning dataset (JSONL training data)', value: 'train' },
+            { name: 'Documentation scrape (mirror a doc site)', value: 'docs' },
+        ],
+    });
+    let trainFormat = '';
+    let trainExamples = '';
+    if (goal === 'train') {
+        trainFormat = (await select({
+            message: 'Training data format?',
+            choices: [
+                { name: 'OpenAI JSONL (messages array)', value: 'openai' },
+                { name: 'Alpaca (instruction/input/output)', value: 'alpaca' },
+                { name: 'ShareGPT (conversations)', value: 'sharegpt' },
+            ],
+        }));
+        trainExamples = await input({
+            message: 'Roughly how many training examples?',
+            default: '100',
+        });
+    }
+    const depth = await select({
+        message: 'How thorough?',
+        choices: [
+            { name: 'Quick (5-10 sources)', value: 'quick' },
+            { name: 'Thorough (15-25 sources)', value: 'thorough' },
+            { name: 'Exhaustive (25+ sources)', value: 'exhaustive' },
+        ],
+    });
+    const context = await input({
+        message: 'Any specific focus or instructions? (leave blank to skip)',
+        default: '',
+    });
+    const outputDir = await input({
+        message: 'Output directory?',
+        default: '.firecrawl/',
+    });
+    return {
+        source: (0, shared_1.normalizeSource)(rawSource),
+        goal,
+        depth,
+        context,
+        outputDir,
+        trainFormat,
+        trainExamples,
+    };
+}
+// ─── System prompt ──────────────────────────────────────────────────────────
+// Prompt section describing where scraped pages are saved: one `index.md` per page under
+// `.firecrawl/<hostname>/<path>/`, with `www.` stripped from hostnames. The `.firecrawl/`
+// root is written literally in this text.
+const FILE_CONVENTION = `## File Organization
+**IMPORTANT:** Follow the same structure as \`firecrawl download\`. Save all files under \`.firecrawl/\` using nested directories that mirror each URL's hostname and path:
+\`\`\`
+.firecrawl/
+  <hostname>/
+    <path>/
+      index.md          # Page content as clean markdown
+\`\`\`
+For example, \`https://docs.stripe.com/api/charges\` becomes:
+\`\`\`
+.firecrawl/docs.stripe.com/api/charges/index.md
+\`\`\`
+Strip \`www.\` from hostnames. Each page gets its own directory with an \`index.md\` inside it.`;
+function buildGoalInstructions(opts) {
+    switch (opts.goal) {
+        case 'reference':
+            return `${FILE_CONVENTION}
+Also create these at the root of \`${opts.outputDir}\`:
+- \`index.md\` -- Table of contents with links to all scraped pages
+- \`sources.json\` -- All URLs scraped with metadata (title, type, url)
+Each markdown file should have frontmatter:
+\`\`\`yaml
+---
+title: "Page Title"
+url: "https://..."
+source: "Source Name"
+type: "docs | article | tutorial | reference | discussion"
+---
+\`\`\`
+Focus on clean, readable markdown. Preserve code examples and formatting.`;
+        case 'rag':
+            return `${FILE_CONVENTION}
+After scraping, chunk each page into embedding-ready pieces (500-1500 tokens). Save chunks alongside the source:
+\`\`\`
+.firecrawl/<hostname>/<path>/
+  index.md              # Full page content
+  chunks/
+    001.md              # Chunk 1
+    002.md              # Chunk 2
+\`\`\`
+Each chunk file should have frontmatter:
+\`\`\`yaml
+---
+title: "Page Title"
+url: "https://..."
+chunk: 1
+total_chunks: 5
+section: "Section Name"
+---
+\`\`\`
+Also create \`${opts.outputDir}/manifest.json\` listing every chunk with its metadata for easy ingestion into a vector store.`;
+        case 'train':
+            return `${FILE_CONVENTION}
+Scrape source pages into the \`.firecrawl/\` directory structure first, then generate training data from the scraped content.
+## Training Data Format
+${opts.trainFormat === 'openai'
+                ? `OpenAI fine-tuning JSONL. Each line:
+\`\`\`json
+{"messages": [{"role": "system", "content": "..."}, {"role": "user", "content": "..."}, {"role": "assistant", "content": "..."}]}
+\`\`\``
+                : opts.trainFormat === 'alpaca'
+                    ? `Alpaca format JSONL. Each line:
+\`\`\`json
+{"instruction": "...", "input": "...", "output": "..."}
+\`\`\``
+                    : `ShareGPT conversation JSONL. Each line:
+\`\`\`json
+{"conversations": [{"from": "human", "value": "..."}, {"from": "gpt", "value": "..."}]}
+\`\`\``}
+Target ~${opts.trainExamples} examples.
+Save the dataset to \`training-data.jsonl\` in the current directory.
+Also save \`training-metadata.json\` with:
+- Total examples generated
+- Sources used (URLs)
+- Topic coverage breakdown
+- Format used
+### Quality Guidelines
+- Each example should be self-contained and accurate
+- Vary the instruction style (questions, commands, scenarios)
+- Include code examples where relevant
+- Remove boilerplate, navigation, and ads from scraped content
+- Cite the source URL in a metadata field for traceability
+- Deduplicate similar examples`;
+        case 'docs':
+            return `${FILE_CONVENTION}
+Also create \`${opts.outputDir}/index.md\` as a table of contents linking to all scraped pages, organized by section.
+Each markdown file should have frontmatter:
+\`\`\`yaml
+---
+title: "Page Title"
+url: "https://..."
+section: "Section Name"
+---
+\`\`\`
+Be thorough. Scrape every page, preserve all code examples. This content will be used as LLM context, so accuracy matters.`;
+        default:
+            return FILE_CONVENTION;
+    }
+}
+function buildAgentStrategy(goal) {
+    switch (goal) {
+        case 'docs':
+            return `## Agent Assignments
+Spawn agents based on the doc structure:
+1. **Section Agent** (one per major section) -- Scrape all pages in the section. Save each page as clean markdown. Preserve code examples and formatting.
+Start by mapping the site with \`firecrawl map\` to discover all pages, then divide by section.`;
+        case 'train':
+            return `## Agent Assignments
+Spawn agents by source type:
+1. **Documentation Agent** -- Scrape official docs. Generate instruction/response pairs from doc sections (e.g., "How do I X?" with the answer from docs).
+2. **Tutorial Agent** -- Scrape tutorials and how-to articles. Generate step-by-step instruction pairs.
+3. **Q&A Agent** -- Scrape Stack Overflow, GitHub discussions, forums. Extract real question/answer pairs.
+4. **Reference Agent** -- Scrape reference material. Generate factual Q&A pairs.`;
+        default:
+            return `## Agent Assignments
+Spawn agents by source type:
+1. **Official Docs Agent** -- Find and scrape official documentation, reference material, specs.
+2. **Articles & Tutorials Agent** -- Find and scrape the best articles, blog posts, tutorials.
+3. **Community & Discussions Agent** -- Find and scrape relevant forum posts, Stack Overflow answers, GitHub discussions.
+4. **Reference Agent** -- Wikipedia, glossaries, standards documents, whitepapers.
+Adjust agents based on what sources exist for the topic.`;
+    }
+}
+function buildSystemPrompt(opts) {
+    const depthInstructions = {
+        quick: 'Find and scrape 5-10 of the best sources.',
+        thorough: 'Find and scrape 15-25 sources covering different perspectives.',
+        exhaustive: 'Find and scrape 25+ sources including primary docs, articles, tutorials, and reference material.',
+    };
+    return `You are a knowledge base team lead powered by Firecrawl. You scrape web content and organize it into structured, LLM-ready formats.
+${shared_1.FIRECRAWL_TOOLS_BLOCK}
+## Depth
+${depthInstructions[opts.depth]}
+## Your Strategy
+You are a **team lead**. Your job is to:
+1. **Find the best sources** -- ${opts.goal === 'docs' ? 'Map the documentation site to discover all pages.' : 'Search broadly to identify the most valuable sources on the topic.'}
+2. **Spawn parallel subagents** -- Divide the work across agents. Each scrapes their assigned sources.
+3. **Collect and organize** -- Build the final output structure from all agent results.
+${buildAgentStrategy(opts.goal)}
+${shared_1.SUBAGENT_INSTRUCTIONS}
+${buildGoalInstructions(opts)}
+---
+Tell the user the output path when done.
+Start immediately.`;
+}
+// ─── Command registration ───────────────────────────────────────────────────
+function register(parentCmd, backend) {
+    const config = backends_1.BACKENDS[backend];
+    parentCmd
+        .command('knowledge-base')
+        .description('Build a knowledge base from web content (docs, RAG, fine-tuning)')
+        .argument('[source]', 'URL or topic to build from')
+        .option('-y, --yes', 'Auto-approve all tool permissions')
+        .action(async (source, options) => {
+        const inputs = await gatherInputs(source ? { source } : undefined);
+        const skipPermissions = options.yes || (await (0, shared_1.askPermissionMode)(backend));
+        console.log(`\nLaunching ${config.displayName}...\n`);
+        (0, backends_1.launchAgent)(backend, buildSystemPrompt({
+            goal: inputs.goal,
+            depth: inputs.depth,
+            outputDir: inputs.outputDir,
+            trainFormat: inputs.trainFormat,
+            trainExamples: inputs.trainExamples,
+        }), (0, shared_1.buildMessage)([
+            `Build a knowledge base from: ${inputs.source}`,
+            inputs.context,
+        ]), skipPermissions);
+    });
+}
+//# sourceMappingURL=knowledge-base.js.map

package/dist/commands/experimental/workflows/knowledge-base.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"knowledge-base.js","sourceRoot":"","sources":["../../../../src/commands/experimental/workflows/knowledge-base.ts"],"names":[],"mappings":";AAAA;;;;;;GAMG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AA2TH,4BAgCC;AAxVD,0CAAkE;AAClE,sCAOmB;AAcnB,+EAA+E;AAE/E,KAAK,UAAU,YAAY,CAAC,OAA6B;IACvD,MAAM,EAAE,KAAK,EAAE,MAAM,EAAE,GAAG,wDAAa,mBAAmB,GAAC,CAAC;IAE5D,MAAM,SAAS,GACb,OAAO,EAAE,MAAM;QACf,CAAC,MAAM,KAAK,CAAC;YACX,OAAO,EACL,iEAAiE;YACnE,QAAQ,EAAE,IAAA,yBAAgB,EAAC,cAAc,CAAC;SAC3C,CAAC,CAAC,CAAC;IAEN,MAAM,IAAI,GAAG,MAAM,MAAM,CAAC;QACxB,OAAO,EAAE,iCAAiC;QAC1C,OAAO,EAAE;YACP;gBACE,IAAI,EAAE,4CAA4C;gBAClD,KAAK,EAAE,WAAW;aACnB;YACD;gBACE,IAAI,EAAE,mDAAmD;gBACzD,KAAK,EAAE,KAAK;aACb;YACD,EAAE,IAAI,EAAE,2CAA2C,EAAE,KAAK,EAAE,OAAO,EAAE;YACrE,EAAE,IAAI,EAAE,0CAA0C,EAAE,KAAK,EAAE,MAAM,EAAE;SACpE;KACF,CAAC,CAAC;IAEH,IAAI,WAAW,GAAG,EAAE,CAAC;IACrB,IAAI,aAAa,GAAG,EAAE,CAAC;IAEvB,IAAI,IAAI,KAAK,OAAO,EAAE,CAAC;QACrB,WAAW,GAAG,CAAC,MAAM,MAAM,CAAC;YAC1B,OAAO,EAAE,uBAAuB;YAChC,OAAO,EAAE;gBACP,EAAE,IAAI,EAAE,+BAA+B,EAAE,KAAK,EAAE,QAAQ,EAAE;gBAC1D,EAAE,IAAI,EAAE,mCAAmC,EAAE,KAAK,EAAE,QAAQ,EAAE;gBAC9D,EAAE,IAAI,EAAE,0BAA0B,EAAE,KAAK,EAAE,UAAU,EAAE;aACxD;SACF,CAAC,CAAW,CAAC;QAEd,aAAa,GAAG,MAAM,KAAK,CAAC;YAC1B,OAAO,EAAE,qCAAqC;YAC9C,OAAO,EAAE,KAAK;SACf,CAAC,CAAC;IACL,CAAC;IAED,MAAM,KAAK,GAAG,MAAM,MAAM,CAAC;QACzB,OAAO,EAAE,eAAe;QACxB,OAAO,EAAE;YACP,EAAE,IAAI,EAAE,sBAAsB,EAAE,KAAK,EAAE,OAAO,EAAE;YAChD,EAAE,IAAI,EAAE,0BAA0B,EAAE,KAAK,EAAE,UAAU,EAAE;YACvD,EAAE,IAAI,EAAE,0BAA0B,EAAE,KAAK,EAAE,YAAY,EAAE;SAC1D;KACF,CAAC,CAAC;IAEH,MAAM,OAAO,GAAG,MAAM,KAAK,CAAC;QAC1B,OAAO,EAAE,2DAA2D;QACpE,OAAO,EAAE,EAAE;KACZ,CAAC,CAAC;IAEH,MAAM,SAAS,GAAG,MAAM,KAAK,CAAC;QAC5B,OAAO,EAAE,mBAAmB;QAC5B,OAAO,EAAE,aAAa;KACvB,CAAC,CAAC;IAEH,OAAO;QACL,MAAM,EAAE,IAAA,wBAAe,EAAC,SAAS,CAAC;QAClC,IAAI;QACJ,KAAK;QACL,OAAO;QACP,SAAS;QACT,WAAW;QACX,aAAa;KACd,CAAC;AACJ,CAAC;AAED,+EAA+E;AAE/E,MAAM,eAAe,GAAG;;;;;;;;;;;;;;;;gGAgBwE,CAAC;AAEjG,SAAS,qBAAqB,CAAC,IAK9B;IACC,QAAQ,IAAI,CAAC,IAAI,EAAE,CAAC;QAClB,KAAK,WAAW;YACd,OAAO,GA
AG,eAAe;;qCAEM,IAAI,CAAC,SAAS;;;;;;;;;;;;;;0EAcuB,CAAC;QAEvE,KAAK,KAAK;YACR,OAAO,GAAG,eAAe;;;;;;;;;;;;;;;;;;;;;;gBAsBf,IAAI,CAAC,SAAS,gGAAgG,CAAC;QAE3H,KAAK,OAAO;YACV,OAAO,GAAG,eAAe;;;;;;EAO7B,IAAI,CAAC,WAAW,KAAK,QAAQ;gBAC3B,CAAC,CAAC;;;OAGC;gBACH,CAAC,CAAC,IAAI,CAAC,WAAW,KAAK,QAAQ;oBAC7B,CAAC,CAAC;;;OAGD;oBACD,CAAC,CAAC;;;OAIR;;UAEU,IAAI,CAAC,aAAa;;;;;;;;;;;;;;;;;+BAiBG,CAAC;QAE5B,KAAK,MAAM;YACT,OAAO,GAAG,eAAe;;gBAEf,IAAI,CAAC,SAAS;;;;;;;;;;;2HAW6F,CAAC;QAExH;YACE,OAAO,eAAe,CAAC;IAC3B,CAAC;AACH,CAAC;AAED,SAAS,kBAAkB,CAAC,IAAY;IACtC,QAAQ,IAAI,EAAE,CAAC;QACb,KAAK,MAAM;YACT,OAAO;;;;;gGAKmF,CAAC;QAE7F,KAAK,OAAO;YACV,OAAO;;;;;;iFAMoE,CAAC;QAE9E;YACE,OAAO;;;;;;;;yDAQ4C,CAAC;IACxD,CAAC;AACH,CAAC;AAED,SAAS,iBAAiB,CAAC,IAM1B;IACC,MAAM,iBAAiB,GAA2B;QAChD,KAAK,EAAE,2CAA2C;QAClD,QAAQ,EAAE,gEAAgE;QAC1E,UAAU,EACR,kGAAkG;KACrG,CAAC;IAEF,OAAO;;EAEP,8BAAqB;;;;EAIrB,iBAAiB,CAAC,IAAI,CAAC,KAAK,CAAC;;;;;;kCAMG,IAAI,CAAC,IAAI,KAAK,MAAM,CAAC,CAAC,CAAC,mDAAmD,CAAC,CAAC,CAAC,oEAAoE;;;;EAIjL,kBAAkB,CAAC,IAAI,CAAC,IAAI,CAAC;;EAE7B,8BAAqB;;EAErB,qBAAqB,CAAC,IAAI,CAAC;;;;;;mBAMV,CAAC;AACpB,CAAC;AAED,+EAA+E;AAE/E,SAAgB,QAAQ,CAAC,SAAkB,EAAE,OAAgB;IAC3D,MAAM,MAAM,GAAG,mBAAQ,CAAC,OAAO,CAAC,CAAC;IAEjC,SAAS;SACN,OAAO,CAAC,gBAAgB,CAAC;SACzB,WAAW,CACV,kEAAkE,CACnE;SACA,QAAQ,CAAC,UAAU,EAAE,4BAA4B,CAAC;SAClD,MAAM,CAAC,WAAW,EAAE,mCAAmC,CAAC;SACxD,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,EAAE,EAAE;QAChC,MAAM,MAAM,GAAG,MAAM,YAAY,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,MAAM,EAAE,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC;QAEnE,MAAM,eAAe,GAAG,OAAO,CAAC,GAAG,IAAI,CAAC,MAAM,IAAA,0BAAiB,EAAC,OAAO,CAAC,CAAC,CAAC;QAC1E,OAAO,CAAC,GAAG,CAAC,eAAe,MAAM,CAAC,WAAW,OAAO,CAAC,CAAC;QAEtD,IAAA,sBAAW,EACT,OAAO,EACP,iBAAiB,CAAC;YAChB,IAAI,EAAE,MAAM,CAAC,IAAI;YACjB,KAAK,EAAE,MAAM,CAAC,KAAK;YACnB,SAAS,EAAE,MAAM,CAAC,SAAS;YAC3B,WAAW,EAAE,MAAM,CAAC,WAAW;YAC/B,aAAa,EAAE,MAAM,CAAC,aAAa;SACpC,CAAC,EACF,IAAA,qBAAY,EAAC;YACX,gCAAgC,MAAM,CAAC,MAAM,EAAE;YAC/C,MAAM,CAAC,OAAO;SACf,CAAC,EACF,eAAe,CAChB,CAAC;IACJ,CAAC,CAAC,CAAC;AACP,CAAC"}

package/dist/commands/experimental/workflows/lead-research.d.ts ADDED Viewed

@@ -0,0 +1,11 @@
+/**
+ * Workflow: Lead Research
+ *
+ * Spawns parallel agents to research a company, recent news/activity, and
+ * optionally a specific person -- all at once. Results are synthesized into
+ * a brief with talking points and pain points.
+ */
+import { Command } from 'commander';
+import { type Backend } from '../backends';
+/**
+ * Registration entry point for the lead-research workflow.
+ *
+ * NOTE(review): the implementation is not shown alongside this declaration; presumably it
+ * attaches a workflow subcommand to `parentCmd` -- confirm in lead-research.js.
+ *
+ * @param parentCmd - Commander command passed in by the caller.
+ * @param backend - Backend value, as declared in `../backends`.
+ */
+export declare function register(parentCmd: Command, backend: Backend): void;
+//# sourceMappingURL=lead-research.d.ts.map

package/dist/commands/experimental/workflows/lead-research.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"lead-research.d.ts","sourceRoot":"","sources":["../../../../src/commands/experimental/workflows/lead-research.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,EAAE,OAAO,EAAE,MAAM,WAAW,CAAC;AACpC,OAAO,EAAE,KAAK,OAAO,EAAyB,MAAM,aAAa,CAAC;AAkHlE,wBAAgB,QAAQ,CAAC,SAAS,EAAE,OAAO,EAAE,OAAO,EAAE,OAAO,GAAG,IAAI,CAyBnE"}