@mendable/firecrawl 1.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/tsconfig.json ADDED
@@ -0,0 +1,111 @@
1
+ {
2
+ "compilerOptions": {
3
+ /* Visit https://aka.ms/tsconfig to read more about this file */
4
+
5
+ /* Projects */
6
+ // "incremental": true, /* Save .tsbuildinfo files to allow for incremental compilation of projects. */
7
+ // "composite": true, /* Enable constraints that allow a TypeScript project to be used with project references. */
8
+ // "tsBuildInfoFile": "./.tsbuildinfo", /* Specify the path to .tsbuildinfo incremental compilation file. */
9
+ // "disableSourceOfProjectReferenceRedirect": true, /* Disable preferring source files instead of declaration files when referencing composite projects. */
10
+ // "disableSolutionSearching": true, /* Opt a project out of multi-project reference checking when editing. */
11
+ // "disableReferencedProjectLoad": true, /* Reduce the number of projects loaded automatically by TypeScript. */
12
+
13
+ /* Language and Environment */
14
+ "target": "es2020", /* Set the JavaScript language version for emitted JavaScript and include compatible library declarations. */
15
+ // "lib": [], /* Specify a set of bundled library declaration files that describe the target runtime environment. */
16
+ // "jsx": "preserve", /* Specify what JSX code is generated. */
17
+ // "experimentalDecorators": true, /* Enable experimental support for legacy experimental decorators. */
18
+ // "emitDecoratorMetadata": true, /* Emit design-type metadata for decorated declarations in source files. */
19
+ // "jsxFactory": "", /* Specify the JSX factory function used when targeting React JSX emit, e.g. 'React.createElement' or 'h'. */
20
+ // "jsxFragmentFactory": "", /* Specify the JSX Fragment reference used for fragments when targeting React JSX emit e.g. 'React.Fragment' or 'Fragment'. */
21
+ // "jsxImportSource": "", /* Specify module specifier used to import the JSX factory functions when using 'jsx: react-jsx*'. */
22
+ // "reactNamespace": "", /* Specify the object invoked for 'createElement'. This only applies when targeting 'react' JSX emit. */
23
+ // "noLib": true, /* Disable including any library files, including the default lib.d.ts. */
24
+ // "useDefineForClassFields": true, /* Emit ECMAScript-standard-compliant class fields. */
25
+ // "moduleDetection": "auto", /* Control what method is used to detect module-format JS files. */
26
+
27
+ /* Modules */
28
+ "module": "commonjs", /* Specify what module code is generated. */
29
+ "rootDir": "./src", /* Specify the root folder within your source files. */
30
+ "moduleResolution": "node", /* Specify how TypeScript looks up a file from a given module specifier. */
31
+ // "baseUrl": "./", /* Specify the base directory to resolve non-relative module names. */
32
+ // "paths": {}, /* Specify a set of entries that re-map imports to additional lookup locations. */
33
+ // "rootDirs": [], /* Allow multiple folders to be treated as one when resolving modules. */
34
+ // "typeRoots": [], /* Specify multiple folders that act like './node_modules/@types'. */
35
+ // "types": [], /* Specify type package names to be included without being referenced in a source file. */
36
+ // "allowUmdGlobalAccess": true, /* Allow accessing UMD globals from modules. */
37
+ // "moduleSuffixes": [], /* List of file name suffixes to search when resolving a module. */
38
+ // "allowImportingTsExtensions": true, /* Allow imports to include TypeScript file extensions. Requires '--moduleResolution bundler' and either '--noEmit' or '--emitDeclarationOnly' to be set. */
39
+ // "resolvePackageJsonExports": true, /* Use the package.json 'exports' field when resolving package imports. */
40
+ // "resolvePackageJsonImports": true, /* Use the package.json 'imports' field when resolving imports. */
41
+ // "customConditions": [], /* Conditions to set in addition to the resolver-specific defaults when resolving imports. */
42
+ // "resolveJsonModule": true, /* Enable importing .json files. */
43
+ // "allowArbitraryExtensions": true, /* Enable importing files with any extension, provided a declaration file is present. */
44
+ // "noResolve": true, /* Disallow 'import's, 'require's or '<reference>'s from expanding the number of files TypeScript should add to a project. */
45
+
46
+ /* JavaScript Support */
47
+ // "allowJs": true, /* Allow JavaScript files to be a part of your program. Use the 'checkJS' option to get errors from these files. */
48
+ // "checkJs": true, /* Enable error reporting in type-checked JavaScript files. */
49
+ // "maxNodeModuleJsDepth": 1, /* Specify the maximum folder depth used for checking JavaScript files from 'node_modules'. Only applicable with 'allowJs'. */
50
+
51
+ /* Emit */
52
+ "declaration": true, /* Generate .d.ts files from TypeScript and JavaScript files in your project. */
53
+ // "declarationMap": true, /* Create sourcemaps for d.ts files. */
54
+ // "emitDeclarationOnly": true, /* Only output d.ts files and not JavaScript files. */
55
+ // "sourceMap": true, /* Create source map files for emitted JavaScript files. */
56
+ // "inlineSourceMap": true, /* Include sourcemap files inside the emitted JavaScript. */
57
+ // "outFile": "./", /* Specify a file that bundles all outputs into one JavaScript file. If 'declaration' is true, also designates a file that bundles all .d.ts output. */
58
+ "outDir": "./build", /* Specify an output folder for all emitted files. */
59
+ // "removeComments": true, /* Disable emitting comments. */
60
+ // "noEmit": true, /* Disable emitting files from a compilation. */
61
+ // "importHelpers": true, /* Allow importing helper functions from tslib once per project, instead of including them per-file. */
62
+ // "importsNotUsedAsValues": "remove", /* Specify emit/checking behavior for imports that are only used for types. */
63
+ // "downlevelIteration": true, /* Emit more compliant, but verbose and less performant JavaScript for iteration. */
64
+ // "sourceRoot": "", /* Specify the root path for debuggers to find the reference source code. */
65
+ // "mapRoot": "", /* Specify the location where debugger should locate map files instead of generated locations. */
66
+ // "inlineSources": true, /* Include source code in the sourcemaps inside the emitted JavaScript. */
67
+ // "emitBOM": true, /* Emit a UTF-8 Byte Order Mark (BOM) in the beginning of output files. */
68
+ // "newLine": "crlf", /* Set the newline character for emitting files. */
69
+ // "stripInternal": true, /* Disable emitting declarations that have '@internal' in their JSDoc comments. */
70
+ // "noEmitHelpers": true, /* Disable generating custom helper functions like '__extends' in compiled output. */
71
+ // "noEmitOnError": true, /* Disable emitting files if any type checking errors are reported. */
72
+ // "preserveConstEnums": true, /* Disable erasing 'const enum' declarations in generated code. */
73
+ "declarationDir": "./types", /* Specify the output directory for generated declaration files. */
74
+ // "preserveValueImports": true, /* Preserve unused imported values in the JavaScript output that would otherwise be removed. */
75
+
76
+ /* Interop Constraints */
77
+ // "isolatedModules": true, /* Ensure that each file can be safely transpiled without relying on other imports. */
78
+ // "verbatimModuleSyntax": true, /* Do not transform or elide any imports or exports not marked as type-only, ensuring they are written in the output file's format based on the 'module' setting. */
79
+ // "allowSyntheticDefaultImports": true, /* Allow 'import x from y' when a module doesn't have a default export. */
80
+ "esModuleInterop": true, /* Emit additional JavaScript to ease support for importing CommonJS modules. This enables 'allowSyntheticDefaultImports' for type compatibility. */
81
+ // "preserveSymlinks": true, /* Disable resolving symlinks to their realpath. This correlates to the same flag in node. */
82
+ "forceConsistentCasingInFileNames": true, /* Ensure that casing is correct in imports. */
83
+
84
+ /* Type Checking */
85
+ "strict": true, /* Enable all strict type-checking options. */
86
+ // "noImplicitAny": true, /* Enable error reporting for expressions and declarations with an implied 'any' type. */
87
+ // "strictNullChecks": true, /* When type checking, take into account 'null' and 'undefined'. */
88
+ // "strictFunctionTypes": true, /* When assigning functions, check to ensure parameters and the return values are subtype-compatible. */
89
+ // "strictBindCallApply": true, /* Check that the arguments for 'bind', 'call', and 'apply' methods match the original function. */
90
+ // "strictPropertyInitialization": true, /* Check for class properties that are declared but not set in the constructor. */
91
+ // "noImplicitThis": true, /* Enable error reporting when 'this' is given the type 'any'. */
92
+ // "useUnknownInCatchVariables": true, /* Default catch clause variables as 'unknown' instead of 'any'. */
93
+ // "alwaysStrict": true, /* Ensure 'use strict' is always emitted. */
94
+ // "noUnusedLocals": true, /* Enable error reporting when local variables aren't read. */
95
+ // "noUnusedParameters": true, /* Raise an error when a function parameter isn't read. */
96
+ // "exactOptionalPropertyTypes": true, /* Interpret optional property types as written, rather than adding 'undefined'. */
97
+ // "noImplicitReturns": true, /* Enable error reporting for codepaths that do not explicitly return in a function. */
98
+ // "noFallthroughCasesInSwitch": true, /* Enable error reporting for fallthrough cases in switch statements. */
99
+ // "noUncheckedIndexedAccess": true, /* Add 'undefined' to a type when accessed using an index. */
100
+ // "noImplicitOverride": true, /* Ensure overriding members in derived classes are marked with an override modifier. */
101
+ // "noPropertyAccessFromIndexSignature": true, /* Enforces using indexed accessors for keys declared using an indexed type. */
102
+ // "allowUnusedLabels": true, /* Disable error reporting for unused labels. */
103
+ // "allowUnreachableCode": true, /* Disable error reporting for unreachable code. */
104
+
105
+ /* Completeness */
106
+ // "skipDefaultLibCheck": true, /* Skip type checking .d.ts files that are included with TypeScript. */
107
+ "skipLibCheck": true /* Skip type checking all .d.ts files. */
108
+ },
109
+ "include": ["src/**/*"],
110
+ "exclude": ["node_modules", "dist", "**/__tests__/*"]
111
+ }
@@ -0,0 +1,260 @@
1
+ import { AxiosResponse, AxiosRequestHeaders } from "axios";
2
+ import { z } from "zod";
3
+ import { TypedEventTarget } from "typescript-event-target";
4
+ /**
5
+ * Configuration options accepted by the FirecrawlApp constructor.
6
+ * @param apiKey - Optional API key for authentication; may be omitted or explicitly null.
7
+ * @param apiUrl - Optional base URL of the API; defaults to 'https://api.firecrawl.dev'.
8
+ */
9
+ export interface FirecrawlAppConfig {
10
+ apiKey?: string | null;
11
+ apiUrl?: string | null;
12
+ }
13
+ /**
14
+ * Metadata for a Firecrawl document.
15
+ * Every named field is optional; the index signature at the end also admits arbitrary extra keys.
16
+ */
17
+ export interface FirecrawlDocumentMetadata {
18
+ title?: string;
19
+ description?: string;
20
+ language?: string;
21
+ keywords?: string;
22
+ robots?: string;
23
+ ogTitle?: string;
24
+ ogDescription?: string;
25
+ ogUrl?: string;
26
+ ogImage?: string;
27
+ ogAudio?: string;
28
+ ogDeterminer?: string;
29
+ ogLocale?: string;
30
+ ogLocaleAlternate?: string[]; // the only array-valued named field
31
+ ogSiteName?: string;
32
+ ogVideo?: string;
33
+ dctermsCreated?: string;
34
+ dcDateCreated?: string;
35
+ dcDate?: string;
36
+ dctermsType?: string;
37
+ dcType?: string;
38
+ dctermsAudience?: string;
39
+ dctermsSubject?: string;
40
+ dcSubject?: string;
41
+ dcDescription?: string;
42
+ dctermsKeywords?: string;
43
+ modifiedTime?: string;
44
+ publishedTime?: string;
45
+ articleTag?: string;
46
+ articleSection?: string;
47
+ sourceURL?: string;
48
+ statusCode?: number; // the only numeric named field
49
+ error?: string;
50
+ [key: string]: any; // open-ended: any other string key is accepted and is untyped (any)
51
+ }
52
+ /**
53
+ * Document interface for Firecrawl.
54
+ * Represents a document retrieved or processed by Firecrawl; every field is optional.
55
+ */
56
+ export interface FirecrawlDocument {
57
+ url?: string;
58
+ markdown?: string;
59
+ html?: string;
60
+ rawHtml?: string;
61
+ links?: string[];
62
+ extract?: Record<any, any>; // untyped key/value payload; narrow it before use
63
+ screenshot?: string; // NOTE(review): presumably a URL or encoded image — confirm against the API
64
+ metadata?: FirecrawlDocumentMetadata;
65
+ }
66
+ /**
67
+ * Parameters for scraping operations (second argument of scrapeUrl; also nested as CrawlParams.scrapeOptions).
68
+ * `formats` is the only required field. Use "screenshot@fullPage" for full-page screenshots.
69
+ */
70
+ export interface ScrapeParams {
71
+ formats: ("markdown" | "html" | "rawHtml" | "content" | "links" | "screenshot" | "screenshot@fullPage" | "extract" | "full@scrennshot")[]; // "full@scrennshot" is a misspelling kept only so existing callers still compile; prefer "screenshot@fullPage"
72
+ headers?: Record<string, string>;
73
+ includeTags?: string[];
74
+ excludeTags?: string[];
75
+ onlyMainContent?: boolean;
76
+ extract?: {
77
+ prompt?: string;
78
+ schema?: z.ZodSchema | any; // the `| any` arm means this accepts any value, not only zod schemas
79
+ systemPrompt?: string;
80
+ };
81
+ waitFor?: number; // NOTE(review): unit is not stated in this declaration — confirm against the API docs
82
+ timeout?: number; // NOTE(review): unit is not stated in this declaration — confirm against the API docs
83
+ }
84
+ /**
85
+ * Response interface for scraping operations.
86
+ * A FirecrawlDocument plus a literal `success: true` flag and optional warning/error text.
87
+ */
88
+ export interface ScrapeResponse extends FirecrawlDocument {
89
+ success: true; // literal true: discriminates this shape from ErrorResponse (success: false)
90
+ warning?: string;
91
+ error?: string;
92
+ }
93
+ /**
94
+ * Parameters for crawling operations (optional second argument of crawlUrl, asyncCrawlUrl and crawlUrlAndWatch).
95
+ * All fields are optional; scrapeOptions nests a full ScrapeParams object.
96
+ */
97
+ export interface CrawlParams {
98
+ includePaths?: string[];
99
+ excludePaths?: string[];
100
+ maxDepth?: number;
101
+ limit?: number;
102
+ allowBackwardLinks?: boolean;
103
+ allowExternalLinks?: boolean;
104
+ ignoreSitemap?: boolean;
105
+ scrapeOptions?: ScrapeParams; // when supplied, ScrapeParams.formats is required by its own type
106
+ webhook?: string;
107
+ }
108
+ /**
109
+ * Response interface for crawling operations.
110
+ * Defines the structure of the response received after initiating a crawl (the success arm of asyncCrawlUrl's result).
111
+ */
112
+ export interface CrawlResponse {
113
+ id?: string; // optional in the type, so callers must check it before passing it on
114
+ url?: string;
115
+ success: true; // literal true: discriminates this shape from ErrorResponse (success: false)
116
+ error?: string;
117
+ }
118
+ /**
119
+ * Response interface for job status checks.
120
+ * Success arm of the results of crawlUrl and checkCrawlStatus, and the direct result of monitorJobStatus.
121
+ */
122
+ export interface CrawlStatusResponse {
123
+ success: true; // literal true: discriminates this shape from ErrorResponse (success: false)
124
+ total: number;
125
+ completed: number;
126
+ creditsUsed: number;
127
+ expiresAt: Date; // NOTE(review): declared as Date — confirm the runtime value is not an unparsed string
128
+ status: "scraping" | "completed" | "failed";
129
+ next: string; // NOTE(review): required here; presumably a continuation URL — confirm it is always present
130
+ data?: FirecrawlDocument[];
131
+ error?: string;
132
+ }
133
+ /**
134
+ * Parameters for mapping operations.
135
+ * Options object accepted as the optional second argument of mapUrl; all fields are optional.
136
+ */
137
+ export interface MapParams {
138
+ search?: string;
139
+ ignoreSitemap?: boolean;
140
+ includeSubdomains?: boolean;
141
+ limit?: number;
142
+ }
143
+ /**
144
+ * Response interface for mapping operations.
145
+ * Success arm of mapUrl's result; note that `links` is optional even when success is true.
146
+ */
147
+ export interface MapResponse {
148
+ success: true; // literal true: discriminates this shape from ErrorResponse (success: false)
149
+ links?: string[];
150
+ error?: string;
151
+ }
152
+ /**
153
+ * Error response interface.
154
+ * Failure arm of the unions returned by scrapeUrl, crawlUrl, asyncCrawlUrl, checkCrawlStatus and mapUrl.
155
+ */
156
+ export interface ErrorResponse {
157
+ success: false; // literal false: narrow on this field to tell failures from the success shapes
158
+ error: string; // always present on failures (required, unlike the optional error on success shapes)
159
+ }
160
+ /**
161
+ * Main class for interacting with the Firecrawl API.
162
+ * Provides methods for scraping, crawling, and mapping web content; search is declared but documented below as unsupported in version 1.
163
+ */
164
+ export default class FirecrawlApp {
165
+ apiKey: string;
166
+ apiUrl: string;
167
+ /**
168
+ * Initializes a new instance of the FirecrawlApp class.
169
+ * @param config - Configuration options (destructured into apiKey and apiUrl) for the FirecrawlApp instance.
170
+ */
171
+ constructor({ apiKey, apiUrl }: FirecrawlAppConfig);
172
+ /**
173
+ * Scrapes a URL using the Firecrawl API.
174
+ * @param url - The URL to scrape.
175
+ * @param params - Additional parameters for the scrape request.
176
+ * @returns The response from the scrape operation; check `success` to tell ScrapeResponse from ErrorResponse.
177
+ */
178
+ scrapeUrl(url: string, params?: ScrapeParams): Promise<ScrapeResponse | ErrorResponse>;
179
+ /**
180
+ * This method is intended to search for a query using the Firecrawl API. However, it is not supported in version 1 of the API.
181
+ * @param query - The search query string.
182
+ * @param params - Additional parameters for the search.
183
+ * @returns Throws an error advising to use version 0 of the API.
184
+ */
185
+ search(query: string, params?: any): Promise<any>;
186
+ /**
187
+ * Initiates a crawl job for a URL using the Firecrawl API.
188
+ * @param url - The URL to crawl.
189
+ * @param params - Additional parameters for the crawl request.
190
+ * @param pollInterval - Time in seconds for job status checks.
191
+ * @param idempotencyKey - Optional idempotency key for the request.
192
+ * @returns The response from the crawl operation; check `success` to tell CrawlStatusResponse from ErrorResponse.
193
+ */
194
+ crawlUrl(url: string, params?: CrawlParams, pollInterval?: number, idempotencyKey?: string): Promise<CrawlStatusResponse | ErrorResponse>;
195
+ asyncCrawlUrl(url: string, params?: CrawlParams, idempotencyKey?: string): Promise<CrawlResponse | ErrorResponse>; // undocumented upstream; takes no pollInterval and resolves to CrawlResponse (id/url) rather than a status — presumably starts a crawl without waiting; confirm
196
+ /**
197
+ * Checks the status of a crawl job using the Firecrawl API.
198
+ * @param id - The ID of the crawl operation (optional in the signature).
199
+ * @returns The response containing the job status.
200
+ */
201
+ checkCrawlStatus(id?: string): Promise<CrawlStatusResponse | ErrorResponse>;
202
+ crawlUrlAndWatch(url: string, params?: CrawlParams, idempotencyKey?: string): Promise<CrawlWatcher>; // undocumented upstream; resolves to a CrawlWatcher, with no ErrorResponse arm in the return type
203
+ mapUrl(url: string, params?: MapParams): Promise<MapResponse | ErrorResponse>; // undocumented upstream; check `success` to tell MapResponse from ErrorResponse
204
+ /**
205
+ * Prepares the headers for an API request.
206
+ * @param idempotencyKey - Optional key to ensure idempotency.
207
+ * @returns The prepared headers.
208
+ */
209
+ prepareHeaders(idempotencyKey?: string): AxiosRequestHeaders;
210
+ /**
211
+ * Sends a POST request to the specified URL.
212
+ * @param url - The URL to send the request to.
213
+ * @param data - The data to send in the request.
214
+ * @param headers - The headers for the request.
215
+ * @returns The response from the POST request.
216
+ */
217
+ postRequest(url: string, data: any, headers: AxiosRequestHeaders): Promise<AxiosResponse>;
218
+ /**
219
+ * Sends a GET request to the specified URL.
220
+ * @param url - The URL to send the request to.
221
+ * @param headers - The headers for the request.
222
+ * @returns The response from the GET request.
223
+ */
224
+ getRequest(url: string, headers: AxiosRequestHeaders): Promise<AxiosResponse>;
225
+ /**
226
+ * Monitors the status of a crawl job until completion or failure.
227
+ * @param id - The ID of the crawl operation.
228
+ * @param headers - The headers for the request.
229
+ * @param checkInterval - Interval in seconds for job status checks.
230
+ * @remarks The declared signature takes exactly these three arguments; it has no status-check URL parameter.
231
+ * @returns The final job status or data.
232
+ */
233
+ monitorJobStatus(id: string, headers: AxiosRequestHeaders, checkInterval: number): Promise<CrawlStatusResponse>;
234
+ /**
235
+ * Handles errors from API responses.
236
+ * @param response - The response from the API.
237
+ * @param action - The action being performed when the error occurred.
238
+ */
239
+ handleError(response: AxiosResponse, action: string): void;
240
+ }
241
+ interface CrawlWatcherEvents { // not exported; event-name to event-type map passed as the type argument of TypedEventTarget by CrawlWatcher
242
+ document: CustomEvent<FirecrawlDocument>; // detail is a single FirecrawlDocument
243
+ done: CustomEvent<{
244
+ status: CrawlStatusResponse["status"];
245
+ data: FirecrawlDocument[];
246
+ }>;
247
+ error: CustomEvent<{ // same detail shape as "done", plus a required error string
248
+ status: CrawlStatusResponse["status"];
249
+ data: FirecrawlDocument[];
250
+ error: string;
251
+ }>;
252
+ }
253
+ export declare class CrawlWatcher extends TypedEventTarget<CrawlWatcherEvents> { // typed event target exposing the "document", "done" and "error" events; FirecrawlApp.crawlUrlAndWatch resolves to one
254
+ private ws; // private and untyped in this declaration; presumably the underlying socket — confirm in the implementation
255
+ data: FirecrawlDocument[];
256
+ status: CrawlStatusResponse["status"]; // one of "scraping" | "completed" | "failed"
257
+ constructor(id: string, app: FirecrawlApp);
258
+ close(): void;
259
+ }
260
+ export {};