@democratize-quality/mcp-server 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48) hide show
  1. package/LICENSE +15 -0
  2. package/README.md +423 -0
  3. package/browserControl.js +113 -0
  4. package/cli.js +187 -0
  5. package/docs/api/tool-reference.md +317 -0
  6. package/docs/api_tools_usage.md +477 -0
  7. package/docs/development/adding-tools.md +274 -0
  8. package/docs/development/configuration.md +332 -0
  9. package/docs/examples/authentication.md +124 -0
  10. package/docs/examples/basic-automation.md +105 -0
  11. package/docs/getting-started.md +214 -0
  12. package/docs/index.md +61 -0
  13. package/mcpServer.js +280 -0
  14. package/package.json +83 -0
  15. package/run-server.js +140 -0
  16. package/src/config/environments/api-only.js +53 -0
  17. package/src/config/environments/development.js +54 -0
  18. package/src/config/environments/production.js +69 -0
  19. package/src/config/index.js +341 -0
  20. package/src/config/server.js +41 -0
  21. package/src/config/tools/api.js +67 -0
  22. package/src/config/tools/browser.js +90 -0
  23. package/src/config/tools/default.js +32 -0
  24. package/src/services/browserService.js +325 -0
  25. package/src/tools/api/api-request.js +641 -0
  26. package/src/tools/api/api-session-report.js +1262 -0
  27. package/src/tools/api/api-session-status.js +395 -0
  28. package/src/tools/base/ToolBase.js +230 -0
  29. package/src/tools/base/ToolRegistry.js +269 -0
  30. package/src/tools/browser/advanced/browser-console.js +384 -0
  31. package/src/tools/browser/advanced/browser-dialog.js +319 -0
  32. package/src/tools/browser/advanced/browser-evaluate.js +337 -0
  33. package/src/tools/browser/advanced/browser-file.js +480 -0
  34. package/src/tools/browser/advanced/browser-keyboard.js +343 -0
  35. package/src/tools/browser/advanced/browser-mouse.js +332 -0
  36. package/src/tools/browser/advanced/browser-network.js +421 -0
  37. package/src/tools/browser/advanced/browser-pdf.js +407 -0
  38. package/src/tools/browser/advanced/browser-tabs.js +497 -0
  39. package/src/tools/browser/advanced/browser-wait.js +378 -0
  40. package/src/tools/browser/click.js +168 -0
  41. package/src/tools/browser/close.js +60 -0
  42. package/src/tools/browser/dom.js +70 -0
  43. package/src/tools/browser/launch.js +67 -0
  44. package/src/tools/browser/navigate.js +270 -0
  45. package/src/tools/browser/screenshot.js +351 -0
  46. package/src/tools/browser/type.js +174 -0
  47. package/src/tools/index.js +95 -0
  48. package/src/utils/browserHelpers.js +83 -0
@@ -0,0 +1,325 @@
1
+ const CDP = require('chrome-remote-interface');
2
+ //const launchChrome = require('chrome-launcher').launch;
3
+ const fs = require('fs');
4
+ const path = require('path');
5
+ const { findNodeBySelector, getElementClickCoordinates } = require('../utils/browserHelpers'); // Import helpers
6
+ const config = require('../config');
7
+
8
+ // A private in-memory store for our browser instances within the service
9
+ // Each key will be a unique browserId, value will be { chromeInstance, cdpClient, userDataDir }
10
+ const activeBrowsers = {};
11
+
12
+ /**
13
+ * Ensures a user data directory exists.
14
+ * @param {string} dirPath - The absolute path to the user data directory.
15
+ */
16
+ function ensureUserDataDir(dirPath) {
17
+ if (!fs.existsSync(dirPath)) {
18
+ fs.mkdirSync(dirPath, { recursive: true });
19
+ console.log(`[BrowserService] Created user data directory: ${dirPath}`);
20
+ } else {
21
+ console.log(`[BrowserService] Using existing user data directory: ${dirPath}`);
22
+ }
23
+ }
24
+
25
+ /**
26
+ * Retrieves a browser instance by ID.
27
+ * @param {string} browserId - The ID of the browser instance.
28
+ * @returns {object|null} - The browser instance object or null if not found.
29
+ */
30
+ function getBrowserInstance(browserId) {
31
+ return activeBrowsers[browserId];
32
+ }
33
+
34
+ /**
35
+ * Launches a new Chrome instance.
36
+ * @param {boolean} headless - Whether to run Chrome in headless mode.
37
+ * @param {number} port - The port for remote debugging.
38
+ * @param {string|null} userDataDir - Path to the user data directory for persistent profiles.
39
+ * @returns {Promise<object>} - Object containing browserId, port, and resolvedUserDataDir.
40
+ */
41
+ async function launchBrowser(headless, port, userDataDir) {
42
+ let chrome;
43
+ let client;
44
+ const { launch: launchChrome } = await import('chrome-launcher');
45
+ let resolvedUserDataDir = null;
46
+
47
+ try {
48
+ if (userDataDir) {
49
+ resolvedUserDataDir = path.resolve(process.cwd(), userDataDir);
50
+ ensureUserDataDir(resolvedUserDataDir);
51
+ }
52
+
53
+ console.log(`[BrowserService] Launching Chrome (headless: ${headless}, userDataDir: ${resolvedUserDataDir || 'temporary'})...`);
54
+
55
+ const launchOptions = {
56
+ port: port,
57
+ userDataDir: resolvedUserDataDir, // Set userDataDir if provided
58
+ chromeFlags: [
59
+ headless ? '--headless=new' : '',
60
+ '--disable-gpu',
61
+ '--disable-setuid-sandbox',
62
+ '--no-sandbox'
63
+ ].filter(Boolean)
64
+ };
65
+
66
+ chrome = await launchChrome(launchOptions);
67
+
68
+ // Generate browserId: profile-name if userDataDir is used, otherwise a unique timestamped ID
69
+ const browserId = userDataDir ? `profile-${path.basename(resolvedUserDataDir)}` : `browser-${Date.now()}-${Math.random().toString(36).substring(2, 9)}`;
70
+
71
+ if (activeBrowsers[browserId]) {
72
+ console.warn(`[BrowserService] Warning: Browser ID '${browserId}' already exists. Overwriting.`);
73
+ // In a real scenario, you might want more sophisticated handling here,
74
+ // e.g., error if ID exists, or try to attach to existing.
75
+ // For now, we're assuming a new launch means a fresh start or overwrite.
76
+ try { // Attempt to clean up old instance if it exists
77
+ if (activeBrowsers[browserId].cdpClient) activeBrowsers[browserId].cdpClient.close();
78
+ if (activeBrowsers[browserId].chromeInstance) await activeBrowsers[browserId].chromeInstance.kill();
79
+ } catch (cleanupErr) {
80
+ console.error(`[BrowserService] Error cleaning up old instance for ${browserId}:`, cleanupErr.message);
81
+ }
82
+ }
83
+
84
+ activeBrowsers[browserId] = { chromeInstance: chrome, cdpClient: null, userDataDir: resolvedUserDataDir };
85
+ console.log(`[BrowserService] Chrome launched on port ${chrome.port} with ID: ${browserId}`);
86
+
87
+ client = await CDP({ port: chrome.port });
88
+ activeBrowsers[browserId].cdpClient = client;
89
+
90
+ const { Page, Runtime, DOM, Network, Security, Input } = client; // Enable Input domain here
91
+ await Page.enable();
92
+ await Runtime.enable();
93
+ await DOM.enable();
94
+ await Network.enable();
95
+ await Security.enable();
96
+ //await Input.enable(); // Enable Input domain
97
+
98
+ console.log(`[BrowserService] CDP client connected and domains enabled for ${browserId}.`);
99
+
100
+ return { browserId, port: chrome.port, userDataDir: resolvedUserDataDir };
101
+
102
+ } catch (error) {
103
+ console.error(`[BrowserService] Error launching browser:`, error);
104
+ if (chrome && !client) { // If chrome launched but CDP connection failed
105
+ try {
106
+ await chrome.kill();
107
+ console.log(`[BrowserService] Partially launched Chrome instance killed due to error.`);
108
+ } catch (killError) {
109
+ console.error(`[BrowserService] Error killing partially launched Chrome:`, killError);
110
+ }
111
+ }
112
+ throw error; // Re-throw to be caught by the route handler
113
+ }
114
+ }
115
+
116
+ /**
117
+ * Navigates a specific browser instance to a URL.
118
+ * @param {string} browserId - The ID of the browser instance.
119
+ * @param {string} url - The URL to navigate to.
120
+ * @returns {Promise<void>}
121
+ */
122
+ async function navigateBrowser(browserId, url) {
123
+ const instance = getBrowserInstance(browserId);
124
+ if (!instance) throw new Error(`Browser instance with ID '${browserId}' not found.`);
125
+
126
+ const { cdpClient } = instance;
127
+ console.log(`[BrowserService] Browser ${browserId} navigating to: ${url}`);
128
+ await cdpClient.Page.navigate({ url: url });
129
+ await cdpClient.Page.loadEventFired(); // Wait for page to load
130
+ console.log(`[BrowserService] Browser ${browserId} successfully navigated to ${url}.`);
131
+ }
132
+
133
+ /**
134
+ * Takes a screenshot of a specific browser page and can save it to disk.
135
+ * @param {string} browserId - The ID of the browser instance.
136
+ * @param {string} [fileName='screenshot.png'] - Optional: The name of the file to save the screenshot as.
137
+ * @param {boolean} [saveToDisk=true] - Optional: Whether to save the screenshot to disk.
138
+ * @returns {Promise<string>} - Base64 encoded screenshot data.
139
+ */
140
+ async function takeScreenshot(browserId, fileName = 'screenshot.png', saveToDisk = true) { // Added fileName and saveToDisk params
141
+ const instance = getBrowserInstance(browserId);
142
+ if (!instance) throw new Error(`Browser instance with ID '${browserId}' not found.`);
143
+
144
+ const { cdpClient } = instance;
145
+ console.log(`[BrowserService] Taking screenshot for browser ${browserId}...`);
146
+ const screenshot = await cdpClient.Page.captureScreenshot({ format: 'png', quality: 80 });
147
+
148
+ if (saveToDisk) {
149
+ const screenshotBuffer = Buffer.from(screenshot.data, 'base64');
150
+ // Ensure the output directory exists
151
+ if (!fs.existsSync(config.OUTPUT_DIR)) {
152
+ fs.mkdirSync(config.OUTPUT_DIR, { recursive: true });
153
+ }
154
+ const filePath = path.join(config.OUTPUT_DIR, fileName);
155
+ fs.writeFileSync(filePath, screenshotBuffer);
156
+ console.log(`[BrowserService] Screenshot saved to ${filePath}`);
157
+ }
158
+
159
+ console.log(`[BrowserService] Screenshot captured for browser ${browserId}.`);
160
+ return screenshot.data; // Always return base64 data to the caller (e.g., AI agent)
161
+ }
162
+
163
+ /**
164
+ * Gets the current DOM content of a specific browser page.
165
+ * @param {string} browserId - The ID of the browser instance.
166
+ * @returns {Promise<string>} - The outer HTML of the document.
167
+ */
168
+ async function getDomContent(browserId) {
169
+ const instance = getBrowserInstance(browserId);
170
+ if (!instance) throw new Error(`Browser instance with ID '${browserId}' not found.`);
171
+
172
+ const { cdpClient } = instance;
173
+ console.log(`[BrowserService] Getting DOM for browser ${browserId}...`);
174
+ const documentNode = await cdpClient.DOM.getDocument({ depth: -1 });
175
+ const outerHTML = await cdpClient.DOM.getOuterHTML({ nodeId: documentNode.root.nodeId });
176
+ console.log(`[BrowserService] DOM content retrieved for browser ${browserId}.`);
177
+ return outerHTML.outerHTML;
178
+ }
179
+
180
+ /**
181
+ * Clicks an element identified by a locator.
182
+ * @param {string} browserId - The ID of the browser instance.
183
+ * @param {object} locator - { type: 'css'|'xpath', value: 'selector' }
184
+ * @returns {Promise<object>} - Coordinates of the click.
185
+ */
186
+ async function clickElement(browserId, locator) {
187
+ const instance = getBrowserInstance(browserId);
188
+ if (!instance) throw new Error(`Browser instance with ID '${browserId}' not found.`);
189
+
190
+ const { cdpClient } = instance;
191
+ const { Input } = cdpClient;
192
+
193
+ console.log(`[BrowserService] Browser ${browserId}: Attempting to click element with locator:`, locator);
194
+
195
+ const nodeId = await findNodeBySelector(cdpClient, locator.type, locator.value);
196
+ if (!nodeId) {
197
+ throw new Error(`Element not found for locator: ${JSON.stringify(locator)}`);
198
+ }
199
+
200
+ const coords = await getElementClickCoordinates(cdpClient, nodeId);
201
+ if (!coords) {
202
+ throw new Error(`Could not determine click coordinates for element: ${JSON.stringify(locator)}`);
203
+ }
204
+
205
+ await Input.dispatchMouseEvent({
206
+ type: 'mousePressed',
207
+ button: 'left',
208
+ x: coords.x,
209
+ y: coords.y,
210
+ clickCount: 1
211
+ });
212
+ await Input.dispatchMouseEvent({
213
+ type: 'mouseReleased',
214
+ button: 'left',
215
+ x: coords.x,
216
+ y: coords.y,
217
+ clickCount: 1
218
+ });
219
+
220
+ console.log(`[BrowserService] Browser ${browserId}: Clicked element at x: ${coords.x}, y: ${coords.y}`);
221
+ return coords;
222
+ }
223
+
224
+ /**
225
+ * Types text into an element identified by a locator.
226
+ * @param {string} browserId - The ID of the browser instance.
227
+ * @param {object} locator - { type: 'css'|'xpath', value: 'selector' }
228
+ * @param {string} text - The text to type.
229
+ * @returns {Promise<void>}
230
+ */
231
+ async function typeIntoElement(browserId, locator, text) {
232
+ const instance = getBrowserInstance(browserId);
233
+ if (!instance) throw new Error(`Browser instance with ID '${browserId}' not found.`);
234
+
235
+ const { cdpClient } = instance;
236
+ const { DOM, Input } = cdpClient;
237
+
238
+ console.log(`[BrowserService] Browser ${browserId}: Attempting to type "${text}" into element with locator:`, locator);
239
+
240
+ const nodeId = await findNodeBySelector(cdpClient, locator.type, locator.value);
241
+ if (!nodeId) {
242
+ throw new Error(`Element not found for locator: ${JSON.stringify(locator)}`);
243
+ }
244
+
245
+ await DOM.focus({ nodeId: nodeId });
246
+ await new Promise(resolve => setTimeout(resolve, 50)); // Small delay for focus
247
+
248
+ // Clear existing text: Cmd/Ctrl+A then Backspace
249
+ await Input.dispatchKeyEvent({ type: 'keyDown', text: 'a', modifiers: (process.platform === 'darwin' ? 4 : 2) }); // 4 for Meta (Cmd), 2 for Control
250
+ await Input.dispatchKeyEvent({ type: 'keyUp', text: 'a', modifiers: (process.platform === 'darwin' ? 4 : 2) });
251
+ await Input.dispatchKeyEvent({ type: 'keyDown', key: 'Backspace' });
252
+ await Input.dispatchKeyEvent({ type: 'keyUp', key: 'Backspace' });
253
+ await new Promise(resolve => setTimeout(resolve, 50)); // Small delay for clear
254
+
255
+ for (const char of text) {
256
+ await Input.dispatchKeyEvent({ type: 'keyDown', text: char, key: char });
257
+ await Input.dispatchKeyEvent({ type: 'keyUp', text: char, key: char });
258
+ await new Promise(resolve => setTimeout(resolve, 10)); // Small delay for realism
259
+ }
260
+
261
+ console.log(`[BrowserService] Browser ${browserId}: Typed "${text}" into element.`);
262
+ }
263
+
264
+ /**
265
+ * Closes a specific browser instance.
266
+ * @param {string} browserId - The ID of the browser instance.
267
+ * @returns {Promise<void>}
268
+ */
269
+ async function closeBrowser(browserId) {
270
+ const instance = getBrowserInstance(browserId);
271
+ if (!instance) throw new Error(`Browser instance with ID '${browserId}' not found.`);
272
+
273
+ const { chromeInstance, cdpClient, userDataDir } = instance;
274
+
275
+ console.log(`[BrowserService] Closing browser ${browserId} (profile: ${userDataDir || 'temporary'})...`);
276
+ if (cdpClient) {
277
+ try {
278
+ cdpClient.close();
279
+ console.log(`[BrowserService] CDP client disconnected for ${browserId}.`);
280
+ } catch (err) {
281
+ console.warn(`[BrowserService] Error during CDP client close for ${browserId}:`, err.message);
282
+ }
283
+ }
284
+ if (chromeInstance) {
285
+ try {
286
+ await chromeInstance.kill();
287
+ console.log(`[BrowserService] Chrome instance ${browserId} killed.`);
288
+ } catch (err) {
289
+ console.warn(`[BrowserService] Error during Chrome instance kill for ${browserId}:`, err.message);
290
+ }
291
+ }
292
+ delete activeBrowsers[browserId]; // Remove from our store
293
+ console.log(`[BrowserService] Browser ${browserId} removed from active list.`);
294
+ }
295
+
296
+ /**
297
+ * Shuts down all active browser instances. Used for graceful server shutdown.
298
+ * @returns {Promise<void>}
299
+ */
300
+ async function shutdownAllBrowsers() {
301
+ const browserIds = Object.keys(activeBrowsers);
302
+ if (browserIds.length === 0) {
303
+ console.log('[BrowserService] No active browsers to shut down.');
304
+ return;
305
+ }
306
+ console.log(`[BrowserService] Shutting down ${browserIds.length} active browser(s)...`);
307
+ await Promise.all(browserIds.map(id => closeBrowser(id).catch(err => {
308
+ console.error(`[BrowserService] Failed to gracefully close browser ${id}:`, err.message);
309
+ // Continue with other shutdowns even if one fails
310
+ })));
311
+ console.log('[BrowserService] All active browsers shut down.');
312
+ }
313
+
314
+
315
+ module.exports = {
316
+ launchBrowser,
317
+ navigateBrowser,
318
+ getBrowserInstance,
319
+ takeScreenshot,
320
+ getDomContent,
321
+ clickElement,
322
+ typeIntoElement,
323
+ closeBrowser,
324
+ shutdownAllBrowsers // Export for server.js to use
325
+ };