npm - @hypothesi/tauri-mcp-server - Versions diffs - 0.7.0 → 0.8.0 - Mend

@hypothesi/tauri-mcp-server 0.7.0 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

package/README.md +31 -24
package/dist/driver/scripts/aria-api-loader.js +29 -0
package/dist/driver/scripts/aria-api.bundle.js +1295 -0
package/dist/driver/scripts/dom-snapshot.js +536 -0
package/dist/driver/scripts/find-element.js +10 -2
package/dist/driver/scripts/focus.js +17 -4
package/dist/driver/scripts/get-styles.js +23 -4
package/dist/driver/scripts/index.js +1 -0
package/dist/driver/scripts/interact.js +20 -9
package/dist/driver/scripts/wait-for.js +15 -2
package/dist/driver/session-manager.js +2 -2
package/dist/driver/webview-executor.js +5 -5
package/dist/driver/webview-interactions.js +39 -3
package/dist/prompts-registry.js +5 -5
package/dist/tools-registry.js +65 -35
package/package.json +8 -2

package/dist/driver/scripts/interact.js CHANGED

@@ -4,7 +4,7 @@
  *
  * @param {Object} params
  * @param {string} params.action - The action to perform
- * @param {string|null} params.selector - CSS selector for the element
+ * @param {string|null} params.selector - CSS selector or ref ID (e.g., "ref=e3") for the element
  * @param {number|null} params.x - X coordinate
  * @param {number|null} params.y - Y coordinate
  * @param {number} params.duration - Duration for long-press
@@ -14,24 +14,35 @@
 (function(params) {
    const { action, selector, x, y, duration, scrollX, scrollY } = params;
+   // Resolve element from CSS selector or ref ID (e.g., "ref=e3" or "e3")
+   function resolveElement(selectorOrRef) {
+      if (!selectorOrRef) return null;
+      var refMatch = selectorOrRef.match(/^(?:ref=)?(e\d+)$/);
+      if (refMatch) {
+         var refId = refMatch[1],
+             refMap = window.__MCP_ARIA_REFS_REVERSE__;
+         if (!refMap) throw new Error('Ref "' + refId + '" not found. Run webview_dom_snapshot first to index elements.');
+         var el = refMap.get(refId);
+         if (!el) throw new Error('Ref "' + refId + '" not found. The DOM may have changed since the snapshot.');
+         return el;
+      }
+      var el = document.querySelector(selectorOrRef);
+      if (!el) throw new Error('Element not found: ' + selectorOrRef);
+      return el;
+   }
    let element = null;
    let targetX, targetY;
    // For scroll action, we don't necessarily need a selector or coordinates
    if (action === 'scroll') {
       if (selector) {
-         element = document.querySelector(selector);
-         if (!element) {
-            throw new Error(`Element not found: ${selector}`);
-         }
+         element = resolveElement(selector);
       }
    } else {
       // For other actions, we need either selector or coordinates
       if (selector) {
-         element = document.querySelector(selector);
-         if (!element) {
-            throw new Error(`Element not found: ${selector}`);
-         }
+         element = resolveElement(selector);
          const rect = element.getBoundingClientRect();
          targetX = rect.left + rect.width / 2;
          targetY = rect.top + rect.height / 2;

package/dist/driver/scripts/wait-for.js CHANGED

@@ -3,13 +3,26 @@
  *
  * @param {Object} params
  * @param {string} params.type - What to wait for: 'selector', 'text', 'ipc-event'
- * @param {string} params.value - Selector, text, or event name to wait for
+ * @param {string} params.value - Selector/ref ID, text, or event name to wait for
  * @param {number} params.timeout - Timeout in milliseconds
  */
 (async function(params) {
    const { type, value, timeout } = params;
    const startTime = Date.now();
+   // Resolve element from CSS selector or ref ID (e.g., "ref=e3" or "e3")
+   function resolveElement(selectorOrRef) {
+      if (!selectorOrRef) return null;
+      var refMatch = selectorOrRef.match(/^(?:ref=)?(e\d+)$/);
+      if (refMatch) {
+         var refId = refMatch[1],
+             refMap = window.__MCP_ARIA_REFS_REVERSE__;
+         if (!refMap) return null; // For wait-for, return null instead of throwing
+         return refMap.get(refId) || null;
+      }
+      return document.querySelector(selectorOrRef);
+   }
    return new Promise((resolve, reject) => {
       function check() {
          if (Date.now() - startTime > timeout) {
@@ -18,7 +31,7 @@
          }
          if (type === 'selector') {
-            const element = document.querySelector(value);
+            const element = resolveElement(value);
             if (element) {
                resolve(`Element found: ${value}`);
                return;

package/dist/driver/session-manager.js CHANGED

@@ -75,7 +75,7 @@ function getAppDiscovery(host) {
  */
 export function resolveTargetApp(portOrIdentifier) {
     if (activeSessions.size === 0) {
-        throw new Error('No active session. Call tauri_driver_session with action "start" first to connect to a Tauri app.');
+        throw new Error('No active session. Call driver_session with action "start" first to connect to a Tauri app.');
     }
     // Single app - return it
     if (activeSessions.size === 1) {
@@ -127,7 +127,7 @@ function formatAppNotFoundError(identifier) {
         .join('\n');
     return (`App "${identifier}" not found.\n\n` +
         `Connected apps:\n${appList}\n\n` +
-        'Use tauri_driver_session with action "status" to list all connected apps.');
+        'Use driver_session with action "status" to list all connected apps.');
 }
 /**
  * Promote the next default app when the current default is removed.

package/dist/driver/webview-executor.js CHANGED

@@ -23,13 +23,13 @@ const driverLogger = createMcpLogger('DRIVER');
  * This is called automatically by all tool functions.
  *
  * Initialization includes:
- * - Verifying an active session exists (via tauri_driver_session)
+ * - Verifying an active session exists (via driver_session)
  * - Connecting to the plugin WebSocket using session config
  * - Console capture is already initialized by bridge.js in the Tauri app
  *
  * This function is idempotent - calling it multiple times is safe.
  *
- * @throws Error if no session is active (tauri_driver_session must be called first)
+ * @throws Error if no session is active (driver_session must be called first)
  */
 export async function ensureReady() {
     if (isInitialized) {
@@ -37,7 +37,7 @@ export async function ensureReady() {
     }
     // Require an active session to prevent connecting to wrong app
     if (!hasActiveSession()) {
-        throw new Error('No active session. Call tauri_driver_session with action "start" first to connect to a Tauri app.');
+        throw new Error('No active session. Call driver_session with action "start" first to connect to a Tauri app.');
     }
     // Get default session for initial connection
     const session = getDefaultSession();
@@ -289,7 +289,7 @@ async function prepareHtml2canvasScript(format, quality) {
  * @returns Screenshot result with image content
  */
 export async function captureScreenshot(options = {}) {
-    const { format = 'png', quality = 90, windowId, appIdentifier, maxWidth } = options;
+    const { format = 'jpeg', quality = 80, windowId, appIdentifier, maxWidth } = options;
     // Primary implementation: Use native platform-specific APIs
     // - macOS: WKWebView takeSnapshot
     // - Windows: WebView2 CapturePreview
@@ -425,6 +425,6 @@ export const GetConsoleLogsSchema = z.object({
     since: z.string().optional().describe('ISO timestamp to filter logs since'),
 });
 export const CaptureScreenshotSchema = z.object({
-    format: z.enum(['png', 'jpeg']).optional().default('png').describe('Image format'),
+    format: z.enum(['png', 'jpeg']).optional().default('jpeg').describe('Image format'),
     quality: z.number().min(0).max(100).optional().describe('JPEG quality (0-100)'),
 });

package/dist/driver/webview-interactions.js CHANGED

@@ -33,8 +33,8 @@ export const InteractSchema = WindowTargetSchema.extend({
     toY: z.number().optional().describe('Ending Y coordinate for swipe'),
 });
 export const ScreenshotSchema = WindowTargetSchema.extend({
-    format: z.enum(['png', 'jpeg']).optional().default('png').describe('Image format'),
-    quality: z.number().min(0).max(100).optional().describe('JPEG quality (0-100, only for jpeg format)'),
+    format: z.enum(['png', 'jpeg']).optional().default('jpeg').describe('Image format'),
+    quality: z.number().min(0).max(100).optional().default(80).describe('JPEG quality (0-100, only for jpeg format)'),
     filePath: z.string().optional().describe('File path to save the screenshot to instead of returning as base64'),
     maxWidth: z.number().int().positive().optional().describe('Maximum width in pixels. Images wider than this will be scaled down proportionally. ' +
         'Can also be set via TAURI_MCP_SCREENSHOT_MAX_WIDTH environment variable.'),
@@ -75,6 +75,10 @@ export const GetConsoleLogsSchema = WindowTargetSchema.extend({
     filter: z.string().optional().describe('Regex or keyword to filter logs'),
     since: z.string().optional().describe('ISO timestamp to filter logs since'),
 });
+export const DomSnapshotSchema = WindowTargetSchema.extend({
+    type: z.enum(['accessibility', 'structure']).describe('Snapshot type'),
+    selector: z.string().optional().describe('CSS selector to scope the snapshot. If omitted, snapshots entire document.'),
+});
 // ============================================================================
 // Implementation Functions
 // ============================================================================
@@ -123,7 +127,7 @@ async function performSwipe(options) {
     }
 }
 export async function screenshot(options = {}) {
-    const { quality, format = 'png', windowId, filePath, appIdentifier, maxWidth } = options;
+    const { quality, format = 'jpeg', windowId, filePath, appIdentifier, maxWidth } = options;
     // Use the native screenshot function from webview-executor
     const result = await captureScreenshot({ format, quality, windowId, appIdentifier, maxWidth });
     // If filePath is provided, write to file instead of returning base64
@@ -265,3 +269,35 @@ export async function getConsoleLogs(options = {}) {
         throw new Error(`Failed to get console logs: ${message}`);
     }
 }
+/**
+ * Generate a structured DOM snapshot for AI consumption.
+ * Uses aria-api for comprehensive, spec-compliant accessibility computation.
+ */
+export async function domSnapshot(options) {
+    const { type, selector, windowId, appIdentifier } = options;
+    // Only load aria-api for accessibility snapshots
+    if (type === 'accessibility') {
+        await ensureAriaApiLoaded(windowId);
+    }
+    // Then execute the snapshot script
+    const script = buildScript(SCRIPTS.domSnapshot, { type, selector: selector ?? null });
+    try {
+        return await executeInWebview(script, windowId, appIdentifier);
+    }
+    catch (error) {
+        const message = error instanceof Error ? error.message : String(error);
+        throw new Error(`DOM snapshot failed: ${message}`);
+    }
+}
+/**
+ * Ensure aria-api library is loaded in the webview.
+ * Uses the script manager to inject the library if not already present.
+ */
+async function ensureAriaApiLoaded(windowId) {
+    const { getAriaApiSource, ARIA_API_SCRIPT_ID: ariaApiScriptId } = await import('./scripts/aria-api-loader.js');
+    const { registerScript, isScriptRegistered } = await import('./script-manager.js');
+    if (await isScriptRegistered(ariaApiScriptId)) {
+        return;
+    }
+    await registerScript(ariaApiScriptId, 'inline', getAriaApiSource(), windowId);
+}

package/dist/prompts-registry.js CHANGED

@@ -7,9 +7,9 @@ const FIX_WEBVIEW_ERRORS_PROMPT = `I need help finding and fixing JavaScript err
 Please follow these steps:
-1. **Start a session** - Use \`tauri_driver_session\` with action "start" to connect to the running Tauri app
+1. **Start a session** - Use \`driver_session\` with action "start" to connect to the running Tauri app
-2. **Get console logs** - Use \`tauri_read_logs\` with source "console" to retrieve JavaScript errors or warnings
+2. **Get console logs** - Use \`read_logs\` with source "console" to retrieve JavaScript errors or warnings
 3. **Analyze the errors** - Look at the error messages, stack traces, and identify:
    - What type of error it is (TypeError, ReferenceError, SyntaxError, etc.)
@@ -20,7 +20,7 @@ Please follow these steps:
 5. **Propose a fix** - Explain what's wrong and suggest a concrete fix for each error found
-6. **Stop the session** - Use \`tauri_driver_session\` with action "stop" to clean up
+6. **Stop the session** - Use \`driver_session\` with action "stop" to clean up
 If no errors are found, let me know the app is running cleanly.
@@ -83,8 +83,8 @@ Only after I say yes should you make any modifications.
 Once changes are approved and made:
 1. Run the Tauri app in development mode (\`cargo tauri dev\`)
-2. Use \`tauri_driver_session\` with action "start" to connect
-3. Use \`tauri_driver_session\` with action "status" to verify
+2. Use \`driver_session\` with action "start" to connect
+3. Use \`driver_session\` with action "status" to verify
 ## Notes

package/dist/tools-registry.js CHANGED

@@ -7,7 +7,7 @@ import { listDevices, ListDevicesSchema } from './manager/mobile.js';
 import { manageDriverSession, ManageDriverSessionSchema, } from './driver/session-manager.js';
 import { readLogs, ReadLogsSchema } from './monitor/logs.js';
 import { executeIPCCommand, manageIPCMonitoring, getIPCEvents, emitTestEvent, getBackendState, manageWindow, ExecuteIPCCommandSchema, ManageIPCMonitoringSchema, GetIPCEventsSchema, EmitTestEventSchema, GetBackendStateSchema, ManageWindowSchema, } from './driver/plugin-commands.js';
-import { interact, screenshot, keyboard, waitFor, getStyles, executeJavaScript, findElement, InteractSchema, ScreenshotSchema, KeyboardSchema, WaitForSchema, GetStylesSchema, ExecuteJavaScriptSchema, FindElementSchema, } from './driver/webview-interactions.js';
+import { interact, screenshot, keyboard, waitFor, getStyles, executeJavaScript, findElement, domSnapshot, InteractSchema, ScreenshotSchema, KeyboardSchema, WaitForSchema, GetStylesSchema, ExecuteJavaScriptSchema, FindElementSchema, DomSnapshotSchema, } from './driver/webview-interactions.js';
 import { PLUGIN_VERSION_CARGO } from './version.js';
 /**
  * Standard multi-app description for webview tools.
@@ -84,8 +84,8 @@ Only after the user says yes should you make any modifications.
 Once changes are approved and made:
 1. Run the Tauri app in development mode (\`cargo tauri dev\`)
-2. Use \`tauri_driver_session\` with action "start" to connect
-3. Use \`tauri_driver_session\` with action "status" to verify
+2. Use \`driver_session\` with action "start" to connect
+3. Use \`driver_session\` with action "status" to verify
 ## Notes
@@ -100,9 +100,9 @@ Once changes are approved and made:
 export const TOOLS = [
     // Setup & Configuration Tools
     {
-        name: 'tauri_get_setup_instructions',
+        name: 'get_setup_instructions',
         description: 'Get instructions for setting up or updating the MCP Bridge plugin in a Tauri project. ' +
-            'Call this tool when: (1) tauri_driver_session fails to connect, (2) you detect the plugin ' +
+            'Call this tool when: (1) driver_session fails to connect, (2) you detect the plugin ' +
             'is not installed or outdated, or (3) the user asks about setup. ' +
             'Returns step-by-step guidance that you should follow to help the user configure their project. ' +
             'IMPORTANT: The instructions require you to examine the project first and ask for permission ' +
@@ -122,7 +122,7 @@ export const TOOLS = [
     },
     // Mobile Development Tools
     {
-        name: 'tauri_list_devices',
+        name: 'list_devices',
         description: '[Tauri Mobile Apps Only] List Android emulators/devices and iOS simulators. ' +
             'Use for Tauri mobile development (tauri android dev, tauri ios dev). ' +
             'Not needed for desktop-only Tauri apps or web projects.',
@@ -140,7 +140,7 @@ export const TOOLS = [
     },
     // UI Automation Tools
     {
-        name: 'tauri_driver_session',
+        name: 'driver_session',
         description: '[Tauri Apps Only] Start/stop automation session to connect to a RUNNING Tauri app. ' +
             'Supports multiple concurrent app connections - each app runs on a unique port. ' +
             'The most recently connected app becomes the "default" app used when no appIdentifier is specified. ' +
@@ -148,7 +148,7 @@ export const TOOLS = [
             'or array format with "isDefault" indicator when multiple apps connected. ' +
             'Action "stop" without appIdentifier stops ALL sessions; with appIdentifier stops only that app. ' +
             'The identifier field (e.g., "com.example.myapp") uniquely identifies each app. ' +
-            'REQUIRED before using other tauri_webview_* or tauri_plugin_* tools. ' +
+            'REQUIRED before using other webview_* or ipc_* tools. ' +
             'Connects via WebSocket to the MCP Bridge plugin in the Tauri app. ' +
             'For browser automation, use Chrome DevTools MCP instead. ' +
             'For Electron apps, this tool will NOT work.',
@@ -167,9 +167,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_webview_find_element',
+        name: 'webview_find_element',
         description: '[Tauri Apps Only] Find DOM elements in a running Tauri app\'s webview. ' +
-            'Requires active tauri_driver_session. ' +
+            'Requires active driver_session. ' +
             MULTI_APP_DESC + ' ' +
             'For browser pages or documentation sites, use Chrome DevTools MCP instead.',
         category: TOOL_CATEGORIES.UI_AUTOMATION,
@@ -190,10 +190,10 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_read_logs',
+        name: 'read_logs',
         description: '[Tauri Apps Only] Read logs from various sources: "console" for webview JS logs, ' +
             '"android" for logcat, "ios" for simulator logs, "system" for desktop logs. ' +
-            'Requires active tauri_driver_session for console logs. ' +
+            'Requires active driver_session for console logs. ' +
             'Use for debugging Tauri app issues at any level.',
         category: TOOL_CATEGORIES.UI_AUTOMATION,
         schema: ReadLogsSchema,
@@ -209,10 +209,10 @@ export const TOOLS = [
     },
     // WebView Interaction Tools
     {
-        name: 'tauri_webview_interact',
+        name: 'webview_interact',
         description: '[Tauri Apps Only] Click, scroll, swipe, focus, or perform gestures in a Tauri app webview. ' +
             'Supported actions: click, double-click, long-press, scroll, swipe, focus. ' +
-            'Requires active tauri_driver_session. ' +
+            'Requires active driver_session. ' +
             'For browser interaction, use Chrome DevTools MCP instead.',
         category: TOOL_CATEGORIES.UI_AUTOMATION,
         schema: InteractSchema,
@@ -228,9 +228,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_webview_screenshot',
+        name: 'webview_screenshot',
         description: '[Tauri Apps Only] Screenshot a running Tauri app\'s webview. ' +
-            'Requires active tauri_driver_session. Captures only visible viewport. ' +
+            'Requires active driver_session. Captures only visible viewport. ' +
             MULTI_APP_DESC + ' ' +
             'For browser screenshots, use Chrome DevTools MCP instead. ' +
             'For Electron apps, this will NOT work.',
@@ -260,9 +260,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_webview_keyboard',
+        name: 'webview_keyboard',
         description: '[Tauri Apps Only] Type text or send keyboard events in a Tauri app. ' +
-            'Requires active tauri_driver_session. ' +
+            'Requires active driver_session. ' +
             MULTI_APP_DESC + ' ' +
             'For browser keyboard input, use Chrome DevTools MCP instead.',
         category: TOOL_CATEGORIES.UI_AUTOMATION,
@@ -294,9 +294,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_webview_wait_for',
+        name: 'webview_wait_for',
         description: '[Tauri Apps Only] Wait for elements, text, or IPC events in a Tauri app. ' +
-            'Requires active tauri_driver_session. ' +
+            'Requires active driver_session. ' +
             MULTI_APP_DESC + ' ' +
             'For browser waits, use Chrome DevTools MCP instead.',
         category: TOOL_CATEGORIES.UI_AUTOMATION,
@@ -318,9 +318,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_webview_get_styles',
+        name: 'webview_get_styles',
         description: '[Tauri Apps Only] Get computed CSS styles from elements in a Tauri app. ' +
-            'Requires active tauri_driver_session. ' +
+            'Requires active driver_session. ' +
             MULTI_APP_DESC + ' ' +
             'For browser style inspection, use Chrome DevTools MCP instead.',
         category: TOOL_CATEGORIES.UI_AUTOMATION,
@@ -342,9 +342,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_webview_execute_js',
+        name: 'webview_execute_js',
         description: '[Tauri Apps Only] Execute JavaScript in a Tauri app\'s webview context. ' +
-            'Requires active tauri_driver_session. Has access to window.__TAURI__. ' +
+            'Requires active driver_session. Has access to window.__TAURI__. ' +
             'If you need a return value, it must be JSON-serializable. ' +
             'For functions that return values, use an IIFE: "(() => { return 5; })()" not "() => { return 5; }". ' +
             MULTI_APP_DESC + ' ' +
@@ -367,11 +367,41 @@ export const TOOLS = [
             });
         },
     },
+    {
+        name: 'webview_dom_snapshot',
+        description: '[Tauri Apps Only] Get a structured DOM snapshot of a Tauri app\'s webview. ' +
+            'Supports different snapshot types for AI consumption. ' +
+            'The "accessibility" type returns a YAML representation of the accessibility tree ' +
+            'similar to Playwright\'s aria snapshots, including roles, names, states, and element refs. ' +
+            'Use this for understanding UI semantics, finding interactive elements, or accessibility testing. ' +
+            'The "structure" type returns a YAML representation of the DOM hierarchy ' +
+            'with element tag names, IDs, CSS classes, and data-testid attributes (if present). ' +
+            'Use this for understanding page layout, debugging CSS selectors, or locating elements by class/ID. ' +
+            'Use the optional selector parameter to scope the snapshot to a subtree. ' +
+            'Requires active driver_session. ' +
+            MULTI_APP_DESC,
+        category: TOOL_CATEGORIES.UI_AUTOMATION,
+        schema: DomSnapshotSchema,
+        annotations: {
+            title: 'DOM Snapshot',
+            readOnlyHint: true,
+            openWorldHint: false,
+        },
+        handler: async (args) => {
+            const parsed = DomSnapshotSchema.parse(args);
+            return await domSnapshot({
+                type: parsed.type,
+                selector: parsed.selector,
+                windowId: parsed.windowId,
+                appIdentifier: parsed.appIdentifier,
+            });
+        },
+    },
     // IPC & Plugin Tools
     {
-        name: 'tauri_ipc_execute_command',
+        name: 'ipc_execute_command',
         description: '[Tauri Apps Only] Execute Tauri IPC commands (invoke Rust backend functions). ' +
-            'Requires active tauri_driver_session. This is Tauri-specific IPC, not browser APIs. ' +
+            'Requires active driver_session. This is Tauri-specific IPC, not browser APIs. ' +
             'For Electron IPC or browser APIs, use appropriate tools for those frameworks.',
         category: TOOL_CATEGORIES.IPC_PLUGIN,
         schema: ExecuteIPCCommandSchema,
@@ -391,9 +421,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_ipc_monitor',
+        name: 'ipc_monitor',
         description: '[Tauri Apps Only] Monitor Tauri IPC calls between frontend and Rust backend. ' +
-            'Requires active tauri_driver_session. Captures invoke() calls and responses. ' +
+            'Requires active driver_session. Captures invoke() calls and responses. ' +
             'This is Tauri-specific; for browser network monitoring, use Chrome DevTools MCP.',
         category: TOOL_CATEGORIES.IPC_PLUGIN,
         schema: ManageIPCMonitoringSchema,
@@ -410,7 +440,7 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_ipc_get_captured',
+        name: 'ipc_get_captured',
         description: '[Tauri Apps Only] Get captured Tauri IPC traffic (requires ipc_monitor started). ' +
             'Shows captured commands (invoke calls) and events with arguments and responses. ' +
             'For browser network requests, use Chrome DevTools MCP instead.',
@@ -427,9 +457,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_ipc_emit_event',
+        name: 'ipc_emit_event',
         description: '[Tauri Apps Only] Emit a Tauri event to test event handlers. ' +
-            'Requires active tauri_driver_session. Events are Tauri-specific (not DOM events). ' +
+            'Requires active driver_session. Events are Tauri-specific (not DOM events). ' +
             'For browser DOM events, use Chrome DevTools MCP instead.',
         category: TOOL_CATEGORIES.IPC_PLUGIN,
         schema: EmitTestEventSchema,
@@ -445,9 +475,9 @@ export const TOOLS = [
         },
     },
     {
-        name: 'tauri_ipc_get_backend_state',
+        name: 'ipc_get_backend_state',
         description: '[Tauri Apps Only] Get Tauri backend state: app metadata, Tauri version, environment. ' +
-            'Requires active tauri_driver_session. ' +
+            'Requires active driver_session. ' +
             'Use to verify you\'re connected to a Tauri app and get app info.',
         category: TOOL_CATEGORIES.IPC_PLUGIN,
         schema: GetBackendStateSchema,
@@ -463,12 +493,12 @@ export const TOOLS = [
     },
     // Window Management Tools
     {
-        name: 'tauri_manage_window',
+        name: 'manage_window',
         description: '[Tauri Apps Only] Manage Tauri windows. Actions: ' +
             '"list" - List all windows with labels, titles, URLs, and state. ' +
             '"info" - Get detailed info for a window (size, position, title, focus, visibility). ' +
             '"resize" - Resize a window (requires width/height, uses logical pixels by default). ' +
-            'Requires active tauri_driver_session. ' +
+            'Requires active driver_session. ' +
             'For browser windows, use Chrome DevTools MCP instead.',
         category: TOOL_CATEGORIES.UI_AUTOMATION,
         schema: ManageWindowSchema,

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@hypothesi/tauri-mcp-server",
-  "version": "0.7.0",
+  "version": "0.8.0",
   "mcpName": "io.github.hypothesi/mcp-server-tauri",
   "description": "A Model Context Protocol server for use with Tauri v2 applications",
   "type": "module",
@@ -8,6 +8,7 @@
     "mcp-server-tauri": "./dist/index.js"
   },
   "scripts": {
+    "prebuild": "tsx scripts/bundle-aria-api.ts",
     "build": "tsc && cp -r src/driver/scripts/*.js dist/driver/scripts/ && chmod +x dist/index.js",
     "start": "node dist/index.js",
     "test": "vitest run",
@@ -35,14 +36,18 @@
     "model-context-protocol",
     "tauri",
     "automation",
+    "screenshot",
+    "verification",
     "testing",
     "debugging",
     "cursor",
     "windsurf",
-    "vscode"
+    "vscode",
+    "claude-code"
   ],
   "dependencies": {
     "@modelcontextprotocol/sdk": "0.6.1",
+    "aria-api": "0.8.0",
     "execa": "9.6.0",
     "html2canvas": "1.4.1",
     "ws": "8.18.3",
@@ -53,6 +58,7 @@
     "@types/html2canvas": "0.5.35",
     "@types/node": "22.19.1",
     "@types/ws": "8.18.1",
+    "esbuild": "0.25.12",
     "vitest": "4.0.13"
   },
   "publishConfig": {