npm - firecrawl-mcp - Versions diffs - 3.1.13 → 3.3.0 - Mend

firecrawl-mcp 3.1.13 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2)

package/dist/index.js +70 -39
package/package.json +1 -1

package/dist/index.js CHANGED

@@ -79,8 +79,9 @@ const server = new FastMCP({
             return { firecrawlApiKey: apiKey };
         }
         else {
-            if (!process.env.FIRECRAWL_API_KEY) {
-                console.error('Firecrawl API key is required');
+            // For self-hosted instances, API key is optional if FIRECRAWL_API_URL is provided
+            if (!process.env.FIRECRAWL_API_KEY && !process.env.FIRECRAWL_API_URL) {
+                console.error('Either FIRECRAWL_API_KEY or FIRECRAWL_API_URL must be provided');
                 process.exit(1);
             }
             return { firecrawlApiKey: process.env.FIRECRAWL_API_KEY };
@@ -95,25 +96,45 @@ const server = new FastMCP({
     },
 });
 function createClient(apiKey) {
-    return new FirecrawlApp({
-        apiKey,
+    const config = {
         ...(process.env.FIRECRAWL_API_URL && {
             apiUrl: process.env.FIRECRAWL_API_URL,
         }),
-    });
+    };
+    // Only add apiKey if it's provided (required for cloud, optional for self-hosted)
+    if (apiKey) {
+        config.apiKey = apiKey;
+    }
+    return new FirecrawlApp(config);
 }
 const ORIGIN = 'mcp-fastmcp';
+// Safe mode is enabled by default for cloud service to comply with ChatGPT safety requirements
+const SAFE_MODE = process.env.CLOUD_SERVICE === 'true';
 function getClient(session) {
-    if (!session || !session.firecrawlApiKey) {
-        throw new Error('Unauthorized');
+    // For cloud service, API key is required
+    if (process.env.CLOUD_SERVICE === 'true') {
+        if (!session || !session.firecrawlApiKey) {
+            throw new Error('Unauthorized');
+        }
+        return createClient(session.firecrawlApiKey);
+    }
+    // For self-hosted instances, API key is optional if FIRECRAWL_API_URL is provided
+    if (!process.env.FIRECRAWL_API_URL && (!session || !session.firecrawlApiKey)) {
+        throw new Error('Unauthorized: API key is required when not using a self-hosted instance');
     }
-    return createClient(session.firecrawlApiKey);
+    return createClient(session?.firecrawlApiKey);
 }
 function asText(data) {
     return JSON.stringify(data, null, 2);
 }
 // scrape tool (v2 semantics, minimal args)
 // Centralized scrape params (used by scrape, and referenced in search/crawl scrapeOptions)
+// Define safe action types
+const safeActionTypes = ['wait', 'screenshot', 'scroll', 'scrape'];
+const otherActions = ['click', 'write', 'press', 'executeJavascript', 'generatePDF'];
+const allActionTypes = [...safeActionTypes, ...otherActions];
+// Use appropriate action types based on safe mode
+const allowedActionTypes = SAFE_MODE ? safeActionTypes : allActionTypes;
 const scrapeParamsSchema = z.object({
     url: z.string().url(),
     formats: z
@@ -146,28 +167,20 @@ const scrapeParamsSchema = z.object({
     includeTags: z.array(z.string()).optional(),
     excludeTags: z.array(z.string()).optional(),
     waitFor: z.number().optional(),
-    actions: z
-        .array(z.object({
-        type: z.enum([
-            'wait',
-            'click',
-            'screenshot',
-            'write',
-            'press',
-            'scroll',
-            'scrape',
-            'executeJavascript',
-            'generatePDF',
-        ]),
-        selector: z.string().optional(),
-        milliseconds: z.number().optional(),
-        text: z.string().optional(),
-        key: z.string().optional(),
-        direction: z.enum(['up', 'down']).optional(),
-        script: z.string().optional(),
-        fullPage: z.boolean().optional(),
-    }))
-        .optional(),
+    ...(SAFE_MODE ? {} : {
+        actions: z
+            .array(z.object({
+            type: z.enum(allowedActionTypes),
+            selector: z.string().optional(),
+            milliseconds: z.number().optional(),
+            text: z.string().optional(),
+            key: z.string().optional(),
+            direction: z.enum(['up', 'down']).optional(),
+            script: z.string().optional(),
+            fullPage: z.boolean().optional(),
+        }))
+            .optional(),
+    }),
     mobile: z.boolean().optional(),
     skipTlsVerification: z.boolean().optional(),
     removeBase64Images: z.boolean().optional(),
@@ -203,6 +216,7 @@ This is the most powerful, fastest and most reliable scraper tool, if available
 \`\`\`
 **Performance:** Add maxAge parameter for 500% faster scrapes using cached data.
 **Returns:** Markdown, HTML, or other formats as specified.
+${SAFE_MODE ? '**Safe Mode:** Read-only content extraction. Interactive actions (click, write, executeJavascript) are disabled for security.' : ''}
 `,
     parameters: scrapeParamsSchema,
     execute: async (args, { session, log }) => {
@@ -256,6 +270,20 @@ server.addTool({
     description: `
 Search the web and optionally extract content from search results. This is the most powerful web search tool available, and if available you should always default to using this tool for any web search needs.
+The query also supports search operators, that you can use if needed to refine the search:
+| Operator | Functionality | Examples |
+---|-|-|
+| \`"\"\` | Non-fuzzy matches a string of text | \`"Firecrawl"\`
+| \`-\` | Excludes certain keywords or negates other operators | \`-bad\`, \`-site:firecrawl.dev\`
+| \`site:\` | Only returns results from a specified website | \`site:firecrawl.dev\`
+| \`inurl:\` | Only returns results that include a word in the URL | \`inurl:firecrawl\`
+| \`allinurl:\` | Only returns results that include multiple words in the URL | \`allinurl:git firecrawl\`
+| \`intitle:\` | Only returns results that include a word in the title of the page | \`intitle:Firecrawl\`
+| \`allintitle:\` | Only returns results that include multiple words in the title of the page | \`allintitle:firecrawl playground\`
+| \`related:\` | Only returns results that are related to a specific domain | \`related:firecrawl.dev\`
+| \`imagesize:\` | Only returns images with exact dimensions | \`imagesize:1920x1080\`
+| \`larger:\` | Only returns images larger than specified dimensions | \`larger:1920x1080\`
 **Best for:** Finding specific information across multiple websites, when you don't know which website has the information; when you need the most relevant content for a query.
 **Not recommended for:** When you need to search the filesystem. When you already know which website to scrape (use scrape); when you need comprehensive coverage of a single website (use map or crawl.
 **Common mistakes:** Using crawl or map for open-ended questions (use search instead).
@@ -346,6 +374,7 @@ server.addTool({
  }
  \`\`\`
  **Returns:** Operation ID for status checking; use firecrawl_check_crawl_status to check progress.
+ ${SAFE_MODE ? '**Safe Mode:** Read-only crawling. Webhooks and interactive actions are disabled for security.' : ''}
  `,
     parameters: z.object({
         url: z.string(),
@@ -360,15 +389,17 @@ server.addTool({
         crawlEntireDomain: z.boolean().optional(),
         delay: z.number().optional(),
         maxConcurrency: z.number().optional(),
-        webhook: z
-            .union([
-            z.string(),
-            z.object({
-                url: z.string(),
-                headers: z.record(z.string(), z.string()).optional(),
-            }),
-        ])
-            .optional(),
+        ...(SAFE_MODE ? {} : {
+            webhook: z
+                .union([
+                z.string(),
+                z.object({
+                    url: z.string(),
+                    headers: z.record(z.string(), z.string()).optional(),
+                }),
+            ])
+                .optional(),
+        }),
         deduplicateSimilarURLs: z.boolean().optional(),
         ignoreQueryParameters: z.boolean().optional(),
         scrapeOptions: scrapeParamsSchema.omit({ url: true }).partial().optional(),

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "firecrawl-mcp",
-  "version": "3.1.13",
+  "version": "3.3.0",
   "description": "MCP server for Firecrawl web scraping integration. Supports both cloud and self-hosted instances. Features include web scraping, search, batch processing, structured data extraction, and LLM-powered content analysis.",
   "type": "module",
   "bin": {